diff --git "a/checkpoint-36000/trainer_state.json" "b/checkpoint-36000/trainer_state.json" deleted file mode 100644--- "a/checkpoint-36000/trainer_state.json" +++ /dev/null @@ -1,43378 +0,0 @@ -{ - "best_metric": 0.05467037484049797, - "best_model_checkpoint": "wav2vec2-base-pemlsb-la/checkpoint-34000", - "epoch": 0.9989178390077416, - "global_step": 36000, - "is_hyper_param_search": false, - "is_local_process_zero": true, - "is_world_process_zero": true, - "log_history": [ - { - "epoch": 0.0, - "learning_rate": 5.0000000000000004e-08, - "loss": 0.2249, - "step": 5 - }, - { - "epoch": 0.0, - "learning_rate": 1.0000000000000001e-07, - "loss": 0.2536, - "step": 10 - }, - { - "epoch": 0.0, - "learning_rate": 1.5000000000000002e-07, - "loss": 0.1986, - "step": 15 - }, - { - "epoch": 0.0, - "learning_rate": 2.0000000000000002e-07, - "loss": 0.2285, - "step": 20 - }, - { - "epoch": 0.0, - "learning_rate": 2.5000000000000004e-07, - "loss": 0.1936, - "step": 25 - }, - { - "epoch": 0.0, - "learning_rate": 3.0000000000000004e-07, - "loss": 0.0825, - "step": 30 - }, - { - "epoch": 0.0, - "learning_rate": 3.5000000000000004e-07, - "loss": 0.1878, - "step": 35 - }, - { - "epoch": 0.0, - "learning_rate": 4.0000000000000003e-07, - "loss": 0.1953, - "step": 40 - }, - { - "epoch": 0.0, - "learning_rate": 4.5000000000000003e-07, - "loss": 0.3766, - "step": 45 - }, - { - "epoch": 0.0, - "learning_rate": 5.000000000000001e-07, - "loss": 0.5279, - "step": 50 - }, - { - "epoch": 0.0, - "learning_rate": 5.5e-07, - "loss": 0.2282, - "step": 55 - }, - { - "epoch": 0.0, - "learning_rate": 6.000000000000001e-07, - "loss": 0.1752, - "step": 60 - }, - { - "epoch": 0.0, - "learning_rate": 6.5e-07, - "loss": 0.2045, - "step": 65 - }, - { - "epoch": 0.0, - "learning_rate": 7.000000000000001e-07, - "loss": 0.2753, - "step": 70 - }, - { - "epoch": 0.0, - "learning_rate": 7.5e-07, - "loss": 0.0828, - "step": 75 - }, - { - "epoch": 0.0, - "learning_rate": 8.000000000000001e-07, - "loss": 0.1613, - "step": 80 - }, - { - "epoch": 0.0, - "learning_rate": 8.400000000000001e-07, - "loss": 0.2658, - "step": 85 - }, - { - "epoch": 0.0, - "learning_rate": 8.900000000000001e-07, - "loss": 0.1503, - "step": 90 - }, - { - "epoch": 0.0, - "learning_rate": 9.400000000000001e-07, - "loss": 0.2618, - "step": 95 - }, - { - "epoch": 0.0, - "learning_rate": 9.9e-07, - "loss": 0.2933, - "step": 100 - }, - { - "epoch": 0.0, - "learning_rate": 1.04e-06, - "loss": 0.1629, - "step": 105 - }, - { - "epoch": 0.0, - "learning_rate": 1.0900000000000002e-06, - "loss": 0.1351, - "step": 110 - }, - { - "epoch": 0.0, - "learning_rate": 1.14e-06, - "loss": 0.1777, - "step": 115 - }, - { - "epoch": 0.0, - "learning_rate": 1.19e-06, - "loss": 0.1647, - "step": 120 - }, - { - "epoch": 0.0, - "learning_rate": 1.2400000000000002e-06, - "loss": 0.107, - "step": 125 - }, - { - "epoch": 0.0, - "learning_rate": 1.2900000000000001e-06, - "loss": 0.2022, - "step": 130 - }, - { - "epoch": 0.0, - "learning_rate": 1.34e-06, - "loss": 0.562, - "step": 135 - }, - { - "epoch": 0.0, - "learning_rate": 1.3900000000000002e-06, - "loss": 0.2811, - "step": 140 - }, - { - "epoch": 0.0, - "learning_rate": 1.44e-06, - "loss": 0.2064, - "step": 145 - }, - { - "epoch": 0.0, - "learning_rate": 1.48e-06, - "loss": 0.4073, - "step": 150 - }, - { - "epoch": 0.0, - "learning_rate": 1.5300000000000002e-06, - "loss": 0.1724, - "step": 155 - }, - { - "epoch": 0.0, - "learning_rate": 1.5800000000000001e-06, - "loss": 0.2262, - "step": 160 - }, - { - "epoch": 0.0, - "learning_rate": 1.6300000000000003e-06, - "loss": 0.3025, - "step": 165 - }, - { - "epoch": 0.0, - "learning_rate": 1.6800000000000002e-06, - "loss": 0.3449, - "step": 170 - }, - { - "epoch": 0.0, - "learning_rate": 1.73e-06, - "loss": 0.089, - "step": 175 - }, - { - "epoch": 0.0, - "learning_rate": 1.7800000000000001e-06, - "loss": 0.2062, - "step": 180 - }, - { - "epoch": 0.01, - "learning_rate": 1.83e-06, - "loss": 0.1239, - "step": 185 - }, - { - "epoch": 0.01, - "learning_rate": 1.8800000000000002e-06, - "loss": 0.215, - "step": 190 - }, - { - "epoch": 0.01, - "learning_rate": 1.93e-06, - "loss": 0.2719, - "step": 195 - }, - { - "epoch": 0.01, - "learning_rate": 1.98e-06, - "loss": 0.5067, - "step": 200 - }, - { - "epoch": 0.01, - "learning_rate": 2.0300000000000005e-06, - "loss": 0.2739, - "step": 205 - }, - { - "epoch": 0.01, - "learning_rate": 2.08e-06, - "loss": 0.1794, - "step": 210 - }, - { - "epoch": 0.01, - "learning_rate": 2.13e-06, - "loss": 0.2751, - "step": 215 - }, - { - "epoch": 0.01, - "learning_rate": 2.1800000000000003e-06, - "loss": 0.185, - "step": 220 - }, - { - "epoch": 0.01, - "learning_rate": 2.2300000000000002e-06, - "loss": 0.0968, - "step": 225 - }, - { - "epoch": 0.01, - "learning_rate": 2.28e-06, - "loss": 0.2331, - "step": 230 - }, - { - "epoch": 0.01, - "learning_rate": 2.33e-06, - "loss": 0.1052, - "step": 235 - }, - { - "epoch": 0.01, - "learning_rate": 2.38e-06, - "loss": 0.3041, - "step": 240 - }, - { - "epoch": 0.01, - "learning_rate": 2.43e-06, - "loss": 0.3321, - "step": 245 - }, - { - "epoch": 0.01, - "learning_rate": 2.4800000000000004e-06, - "loss": 0.6221, - "step": 250 - }, - { - "epoch": 0.01, - "learning_rate": 2.5300000000000003e-06, - "loss": 0.1997, - "step": 255 - }, - { - "epoch": 0.01, - "learning_rate": 2.5800000000000003e-06, - "loss": 0.1825, - "step": 260 - }, - { - "epoch": 0.01, - "learning_rate": 2.6300000000000002e-06, - "loss": 0.2278, - "step": 265 - }, - { - "epoch": 0.01, - "learning_rate": 2.68e-06, - "loss": 0.2432, - "step": 270 - }, - { - "epoch": 0.01, - "learning_rate": 2.7300000000000005e-06, - "loss": 0.1503, - "step": 275 - }, - { - "epoch": 0.01, - "learning_rate": 2.7800000000000005e-06, - "loss": 0.1733, - "step": 280 - }, - { - "epoch": 0.01, - "learning_rate": 2.83e-06, - "loss": 0.0788, - "step": 285 - }, - { - "epoch": 0.01, - "learning_rate": 2.88e-06, - "loss": 0.2403, - "step": 290 - }, - { - "epoch": 0.01, - "learning_rate": 2.93e-06, - "loss": 0.1724, - "step": 295 - }, - { - "epoch": 0.01, - "learning_rate": 2.9800000000000003e-06, - "loss": 0.5096, - "step": 300 - }, - { - "epoch": 0.01, - "learning_rate": 3.0300000000000002e-06, - "loss": 0.2124, - "step": 305 - }, - { - "epoch": 0.01, - "learning_rate": 3.08e-06, - "loss": 0.2383, - "step": 310 - }, - { - "epoch": 0.01, - "learning_rate": 3.13e-06, - "loss": 0.1581, - "step": 315 - }, - { - "epoch": 0.01, - "learning_rate": 3.1800000000000005e-06, - "loss": 0.2122, - "step": 320 - }, - { - "epoch": 0.01, - "learning_rate": 3.2300000000000004e-06, - "loss": 0.2645, - "step": 325 - }, - { - "epoch": 0.01, - "learning_rate": 3.2800000000000004e-06, - "loss": 0.1838, - "step": 330 - }, - { - "epoch": 0.01, - "learning_rate": 3.3300000000000003e-06, - "loss": 0.1749, - "step": 335 - }, - { - "epoch": 0.01, - "learning_rate": 3.3800000000000007e-06, - "loss": 0.1447, - "step": 340 - }, - { - "epoch": 0.01, - "learning_rate": 3.4300000000000006e-06, - "loss": 0.2553, - "step": 345 - }, - { - "epoch": 0.01, - "learning_rate": 3.48e-06, - "loss": 0.5503, - "step": 350 - }, - { - "epoch": 0.01, - "learning_rate": 3.53e-06, - "loss": 0.2164, - "step": 355 - }, - { - "epoch": 0.01, - "learning_rate": 3.58e-06, - "loss": 0.1653, - "step": 360 - }, - { - "epoch": 0.01, - "learning_rate": 3.6300000000000004e-06, - "loss": 0.1861, - "step": 365 - }, - { - "epoch": 0.01, - "learning_rate": 3.6800000000000003e-06, - "loss": 0.2385, - "step": 370 - }, - { - "epoch": 0.01, - "learning_rate": 3.7300000000000003e-06, - "loss": 0.2468, - "step": 375 - }, - { - "epoch": 0.01, - "learning_rate": 3.7800000000000002e-06, - "loss": 0.1379, - "step": 380 - }, - { - "epoch": 0.01, - "learning_rate": 3.830000000000001e-06, - "loss": 0.0878, - "step": 385 - }, - { - "epoch": 0.01, - "learning_rate": 3.88e-06, - "loss": 0.2242, - "step": 390 - }, - { - "epoch": 0.01, - "learning_rate": 3.9300000000000005e-06, - "loss": 0.3307, - "step": 395 - }, - { - "epoch": 0.01, - "learning_rate": 3.980000000000001e-06, - "loss": 0.4413, - "step": 400 - }, - { - "epoch": 0.01, - "learning_rate": 4.03e-06, - "loss": 0.1462, - "step": 405 - }, - { - "epoch": 0.01, - "learning_rate": 4.08e-06, - "loss": 0.205, - "step": 410 - }, - { - "epoch": 0.01, - "learning_rate": 4.13e-06, - "loss": 0.2098, - "step": 415 - }, - { - "epoch": 0.01, - "learning_rate": 4.18e-06, - "loss": 0.191, - "step": 420 - }, - { - "epoch": 0.01, - "learning_rate": 4.23e-06, - "loss": 0.0629, - "step": 425 - }, - { - "epoch": 0.01, - "learning_rate": 4.2800000000000005e-06, - "loss": 0.1265, - "step": 430 - }, - { - "epoch": 0.01, - "learning_rate": 4.33e-06, - "loss": 0.2014, - "step": 435 - }, - { - "epoch": 0.01, - "learning_rate": 4.38e-06, - "loss": 0.3309, - "step": 440 - }, - { - "epoch": 0.01, - "learning_rate": 4.430000000000001e-06, - "loss": 0.3537, - "step": 445 - }, - { - "epoch": 0.01, - "learning_rate": 4.48e-06, - "loss": 0.4845, - "step": 450 - }, - { - "epoch": 0.01, - "learning_rate": 4.530000000000001e-06, - "loss": 0.2915, - "step": 455 - }, - { - "epoch": 0.01, - "learning_rate": 4.58e-06, - "loss": 0.233, - "step": 460 - }, - { - "epoch": 0.01, - "learning_rate": 4.6300000000000006e-06, - "loss": 0.1498, - "step": 465 - }, - { - "epoch": 0.01, - "learning_rate": 4.680000000000001e-06, - "loss": 0.1597, - "step": 470 - }, - { - "epoch": 0.01, - "learning_rate": 4.7300000000000005e-06, - "loss": 0.182, - "step": 475 - }, - { - "epoch": 0.01, - "learning_rate": 4.78e-06, - "loss": 0.2874, - "step": 480 - }, - { - "epoch": 0.01, - "learning_rate": 4.83e-06, - "loss": 0.1666, - "step": 485 - }, - { - "epoch": 0.01, - "learning_rate": 4.880000000000001e-06, - "loss": 0.3407, - "step": 490 - }, - { - "epoch": 0.01, - "learning_rate": 4.93e-06, - "loss": 0.2495, - "step": 495 - }, - { - "epoch": 0.01, - "learning_rate": 4.980000000000001e-06, - "loss": 0.443, - "step": 500 - }, - { - "epoch": 0.01, - "learning_rate": 5.03e-06, - "loss": 0.1806, - "step": 505 - }, - { - "epoch": 0.01, - "learning_rate": 5.0800000000000005e-06, - "loss": 0.217, - "step": 510 - }, - { - "epoch": 0.01, - "learning_rate": 5.130000000000001e-06, - "loss": 0.1761, - "step": 515 - }, - { - "epoch": 0.01, - "learning_rate": 5.18e-06, - "loss": 0.305, - "step": 520 - }, - { - "epoch": 0.01, - "learning_rate": 5.230000000000001e-06, - "loss": 0.1023, - "step": 525 - }, - { - "epoch": 0.01, - "learning_rate": 5.28e-06, - "loss": 0.0879, - "step": 530 - }, - { - "epoch": 0.01, - "learning_rate": 5.330000000000001e-06, - "loss": 0.1694, - "step": 535 - }, - { - "epoch": 0.01, - "learning_rate": 5.380000000000001e-06, - "loss": 0.1529, - "step": 540 - }, - { - "epoch": 0.02, - "learning_rate": 5.4300000000000005e-06, - "loss": 0.3211, - "step": 545 - }, - { - "epoch": 0.02, - "learning_rate": 5.470000000000001e-06, - "loss": 0.6838, - "step": 550 - }, - { - "epoch": 0.02, - "learning_rate": 5.5200000000000005e-06, - "loss": 0.2006, - "step": 555 - }, - { - "epoch": 0.02, - "learning_rate": 5.570000000000001e-06, - "loss": 0.1613, - "step": 560 - }, - { - "epoch": 0.02, - "learning_rate": 5.620000000000001e-06, - "loss": 0.2125, - "step": 565 - }, - { - "epoch": 0.02, - "learning_rate": 5.67e-06, - "loss": 0.2194, - "step": 570 - }, - { - "epoch": 0.02, - "learning_rate": 5.72e-06, - "loss": 0.2017, - "step": 575 - }, - { - "epoch": 0.02, - "learning_rate": 5.77e-06, - "loss": 0.0922, - "step": 580 - }, - { - "epoch": 0.02, - "learning_rate": 5.82e-06, - "loss": 0.1526, - "step": 585 - }, - { - "epoch": 0.02, - "learning_rate": 5.8700000000000005e-06, - "loss": 0.2183, - "step": 590 - }, - { - "epoch": 0.02, - "learning_rate": 5.92e-06, - "loss": 0.197, - "step": 595 - }, - { - "epoch": 0.02, - "learning_rate": 5.9700000000000004e-06, - "loss": 0.5106, - "step": 600 - }, - { - "epoch": 0.02, - "learning_rate": 6.02e-06, - "loss": 0.2169, - "step": 605 - }, - { - "epoch": 0.02, - "learning_rate": 6.07e-06, - "loss": 0.1802, - "step": 610 - }, - { - "epoch": 0.02, - "learning_rate": 6.120000000000001e-06, - "loss": 0.2202, - "step": 615 - }, - { - "epoch": 0.02, - "learning_rate": 6.17e-06, - "loss": 0.2362, - "step": 620 - }, - { - "epoch": 0.02, - "learning_rate": 6.220000000000001e-06, - "loss": 0.1626, - "step": 625 - }, - { - "epoch": 0.02, - "learning_rate": 6.27e-06, - "loss": 0.1174, - "step": 630 - }, - { - "epoch": 0.02, - "learning_rate": 6.3200000000000005e-06, - "loss": 0.1051, - "step": 635 - }, - { - "epoch": 0.02, - "learning_rate": 6.370000000000001e-06, - "loss": 0.1218, - "step": 640 - }, - { - "epoch": 0.02, - "learning_rate": 6.42e-06, - "loss": 0.2457, - "step": 645 - }, - { - "epoch": 0.02, - "learning_rate": 6.470000000000001e-06, - "loss": 0.3494, - "step": 650 - }, - { - "epoch": 0.02, - "learning_rate": 6.520000000000001e-06, - "loss": 0.2136, - "step": 655 - }, - { - "epoch": 0.02, - "learning_rate": 6.570000000000001e-06, - "loss": 0.2451, - "step": 660 - }, - { - "epoch": 0.02, - "learning_rate": 6.620000000000001e-06, - "loss": 0.2849, - "step": 665 - }, - { - "epoch": 0.02, - "learning_rate": 6.6700000000000005e-06, - "loss": 0.2196, - "step": 670 - }, - { - "epoch": 0.02, - "learning_rate": 6.720000000000001e-06, - "loss": 0.2496, - "step": 675 - }, - { - "epoch": 0.02, - "learning_rate": 6.770000000000001e-06, - "loss": 0.0549, - "step": 680 - }, - { - "epoch": 0.02, - "learning_rate": 6.820000000000001e-06, - "loss": 0.0748, - "step": 685 - }, - { - "epoch": 0.02, - "learning_rate": 6.870000000000001e-06, - "loss": 0.2986, - "step": 690 - }, - { - "epoch": 0.02, - "learning_rate": 6.92e-06, - "loss": 0.2527, - "step": 695 - }, - { - "epoch": 0.02, - "learning_rate": 6.97e-06, - "loss": 0.5124, - "step": 700 - }, - { - "epoch": 0.02, - "learning_rate": 7.0200000000000006e-06, - "loss": 0.2632, - "step": 705 - }, - { - "epoch": 0.02, - "learning_rate": 7.07e-06, - "loss": 0.204, - "step": 710 - }, - { - "epoch": 0.02, - "learning_rate": 7.1200000000000004e-06, - "loss": 0.1899, - "step": 715 - }, - { - "epoch": 0.02, - "learning_rate": 7.17e-06, - "loss": 0.2731, - "step": 720 - }, - { - "epoch": 0.02, - "learning_rate": 7.22e-06, - "loss": 0.2023, - "step": 725 - }, - { - "epoch": 0.02, - "learning_rate": 7.270000000000001e-06, - "loss": 0.1433, - "step": 730 - }, - { - "epoch": 0.02, - "learning_rate": 7.32e-06, - "loss": 0.1118, - "step": 735 - }, - { - "epoch": 0.02, - "learning_rate": 7.370000000000001e-06, - "loss": 0.2098, - "step": 740 - }, - { - "epoch": 0.02, - "learning_rate": 7.420000000000001e-06, - "loss": 0.1431, - "step": 745 - }, - { - "epoch": 0.02, - "learning_rate": 7.4700000000000005e-06, - "loss": 0.3622, - "step": 750 - }, - { - "epoch": 0.02, - "learning_rate": 7.520000000000001e-06, - "loss": 0.1973, - "step": 755 - }, - { - "epoch": 0.02, - "learning_rate": 7.57e-06, - "loss": 0.1582, - "step": 760 - }, - { - "epoch": 0.02, - "learning_rate": 7.620000000000001e-06, - "loss": 0.2339, - "step": 765 - }, - { - "epoch": 0.02, - "learning_rate": 7.670000000000001e-06, - "loss": 0.2483, - "step": 770 - }, - { - "epoch": 0.02, - "learning_rate": 7.72e-06, - "loss": 0.0592, - "step": 775 - }, - { - "epoch": 0.02, - "learning_rate": 7.77e-06, - "loss": 0.1738, - "step": 780 - }, - { - "epoch": 0.02, - "learning_rate": 7.820000000000001e-06, - "loss": 0.1896, - "step": 785 - }, - { - "epoch": 0.02, - "learning_rate": 7.870000000000001e-06, - "loss": 0.2247, - "step": 790 - }, - { - "epoch": 0.02, - "learning_rate": 7.92e-06, - "loss": 0.4066, - "step": 795 - }, - { - "epoch": 0.02, - "learning_rate": 7.970000000000002e-06, - "loss": 0.6385, - "step": 800 - }, - { - "epoch": 0.02, - "learning_rate": 8.020000000000001e-06, - "loss": 0.1883, - "step": 805 - }, - { - "epoch": 0.02, - "learning_rate": 8.07e-06, - "loss": 0.2734, - "step": 810 - }, - { - "epoch": 0.02, - "learning_rate": 8.120000000000002e-06, - "loss": 0.2096, - "step": 815 - }, - { - "epoch": 0.02, - "learning_rate": 8.17e-06, - "loss": 0.1888, - "step": 820 - }, - { - "epoch": 0.02, - "learning_rate": 8.220000000000001e-06, - "loss": 0.1583, - "step": 825 - }, - { - "epoch": 0.02, - "learning_rate": 8.27e-06, - "loss": 0.097, - "step": 830 - }, - { - "epoch": 0.02, - "learning_rate": 8.32e-06, - "loss": 0.1855, - "step": 835 - }, - { - "epoch": 0.02, - "learning_rate": 8.370000000000001e-06, - "loss": 0.1659, - "step": 840 - }, - { - "epoch": 0.02, - "learning_rate": 8.42e-06, - "loss": 0.3064, - "step": 845 - }, - { - "epoch": 0.02, - "learning_rate": 8.47e-06, - "loss": 0.5692, - "step": 850 - }, - { - "epoch": 0.02, - "learning_rate": 8.52e-06, - "loss": 0.1638, - "step": 855 - }, - { - "epoch": 0.02, - "learning_rate": 8.570000000000001e-06, - "loss": 0.2457, - "step": 860 - }, - { - "epoch": 0.02, - "learning_rate": 8.62e-06, - "loss": 0.2183, - "step": 865 - }, - { - "epoch": 0.02, - "learning_rate": 8.67e-06, - "loss": 0.2386, - "step": 870 - }, - { - "epoch": 0.02, - "learning_rate": 8.720000000000001e-06, - "loss": 0.1225, - "step": 875 - }, - { - "epoch": 0.02, - "learning_rate": 8.77e-06, - "loss": 0.2076, - "step": 880 - }, - { - "epoch": 0.02, - "learning_rate": 8.82e-06, - "loss": 0.2056, - "step": 885 - }, - { - "epoch": 0.02, - "learning_rate": 8.870000000000001e-06, - "loss": 0.3954, - "step": 890 - }, - { - "epoch": 0.02, - "learning_rate": 8.920000000000001e-06, - "loss": 0.1682, - "step": 895 - }, - { - "epoch": 0.02, - "learning_rate": 8.97e-06, - "loss": 0.6697, - "step": 900 - }, - { - "epoch": 0.03, - "learning_rate": 9.020000000000002e-06, - "loss": 0.1666, - "step": 905 - }, - { - "epoch": 0.03, - "learning_rate": 9.070000000000001e-06, - "loss": 0.2045, - "step": 910 - }, - { - "epoch": 0.03, - "learning_rate": 9.12e-06, - "loss": 0.2174, - "step": 915 - }, - { - "epoch": 0.03, - "learning_rate": 9.17e-06, - "loss": 0.2384, - "step": 920 - }, - { - "epoch": 0.03, - "learning_rate": 9.220000000000002e-06, - "loss": 0.2176, - "step": 925 - }, - { - "epoch": 0.03, - "learning_rate": 9.270000000000001e-06, - "loss": 0.136, - "step": 930 - }, - { - "epoch": 0.03, - "learning_rate": 9.32e-06, - "loss": 0.2383, - "step": 935 - }, - { - "epoch": 0.03, - "learning_rate": 9.370000000000002e-06, - "loss": 0.1341, - "step": 940 - }, - { - "epoch": 0.03, - "learning_rate": 9.42e-06, - "loss": 0.2451, - "step": 945 - }, - { - "epoch": 0.03, - "learning_rate": 9.47e-06, - "loss": 0.9591, - "step": 950 - }, - { - "epoch": 0.03, - "learning_rate": 9.52e-06, - "loss": 0.1867, - "step": 955 - }, - { - "epoch": 0.03, - "learning_rate": 9.57e-06, - "loss": 0.1873, - "step": 960 - }, - { - "epoch": 0.03, - "learning_rate": 9.620000000000001e-06, - "loss": 0.1948, - "step": 965 - }, - { - "epoch": 0.03, - "learning_rate": 9.67e-06, - "loss": 0.2792, - "step": 970 - }, - { - "epoch": 0.03, - "learning_rate": 9.72e-06, - "loss": 0.3987, - "step": 975 - }, - { - "epoch": 0.03, - "learning_rate": 9.770000000000001e-06, - "loss": 0.039, - "step": 980 - }, - { - "epoch": 0.03, - "learning_rate": 9.820000000000001e-06, - "loss": 0.2448, - "step": 985 - }, - { - "epoch": 0.03, - "learning_rate": 9.87e-06, - "loss": 0.1216, - "step": 990 - }, - { - "epoch": 0.03, - "learning_rate": 9.920000000000002e-06, - "loss": 0.249, - "step": 995 - }, - { - "epoch": 0.03, - "learning_rate": 9.970000000000001e-06, - "loss": 0.433, - "step": 1000 - }, - { - "epoch": 0.03, - "learning_rate": 9.999429207454551e-06, - "loss": 0.1561, - "step": 1005 - }, - { - "epoch": 0.03, - "learning_rate": 9.998002226090927e-06, - "loss": 0.1989, - "step": 1010 - }, - { - "epoch": 0.03, - "learning_rate": 9.996575244727305e-06, - "loss": 0.1724, - "step": 1015 - }, - { - "epoch": 0.03, - "learning_rate": 9.995148263363682e-06, - "loss": 0.1805, - "step": 1020 - }, - { - "epoch": 0.03, - "learning_rate": 9.993721282000058e-06, - "loss": 0.1212, - "step": 1025 - }, - { - "epoch": 0.03, - "learning_rate": 9.992294300636434e-06, - "loss": 0.1385, - "step": 1030 - }, - { - "epoch": 0.03, - "learning_rate": 9.99086731927281e-06, - "loss": 0.1, - "step": 1035 - }, - { - "epoch": 0.03, - "learning_rate": 9.989440337909187e-06, - "loss": 0.1665, - "step": 1040 - }, - { - "epoch": 0.03, - "learning_rate": 9.988013356545563e-06, - "loss": 0.3426, - "step": 1045 - }, - { - "epoch": 0.03, - "learning_rate": 9.986586375181941e-06, - "loss": 0.5495, - "step": 1050 - }, - { - "epoch": 0.03, - "learning_rate": 9.985159393818318e-06, - "loss": 0.1594, - "step": 1055 - }, - { - "epoch": 0.03, - "learning_rate": 9.983732412454694e-06, - "loss": 0.1865, - "step": 1060 - }, - { - "epoch": 0.03, - "learning_rate": 9.98230543109107e-06, - "loss": 0.2308, - "step": 1065 - }, - { - "epoch": 0.03, - "learning_rate": 9.980878449727447e-06, - "loss": 0.1686, - "step": 1070 - }, - { - "epoch": 0.03, - "learning_rate": 9.979451468363825e-06, - "loss": 0.2432, - "step": 1075 - }, - { - "epoch": 0.03, - "learning_rate": 9.978024487000201e-06, - "loss": 0.1348, - "step": 1080 - }, - { - "epoch": 0.03, - "learning_rate": 9.976597505636578e-06, - "loss": 0.1699, - "step": 1085 - }, - { - "epoch": 0.03, - "learning_rate": 9.975170524272954e-06, - "loss": 0.1712, - "step": 1090 - }, - { - "epoch": 0.03, - "learning_rate": 9.97374354290933e-06, - "loss": 0.298, - "step": 1095 - }, - { - "epoch": 0.03, - "learning_rate": 9.972316561545707e-06, - "loss": 0.5211, - "step": 1100 - }, - { - "epoch": 0.03, - "learning_rate": 9.970889580182085e-06, - "loss": 0.2375, - "step": 1105 - }, - { - "epoch": 0.03, - "learning_rate": 9.969462598818461e-06, - "loss": 0.2803, - "step": 1110 - }, - { - "epoch": 0.03, - "learning_rate": 9.968035617454837e-06, - "loss": 0.2163, - "step": 1115 - }, - { - "epoch": 0.03, - "learning_rate": 9.966608636091214e-06, - "loss": 0.2415, - "step": 1120 - }, - { - "epoch": 0.03, - "learning_rate": 9.96518165472759e-06, - "loss": 0.2971, - "step": 1125 - }, - { - "epoch": 0.03, - "learning_rate": 9.963754673363966e-06, - "loss": 0.0985, - "step": 1130 - }, - { - "epoch": 0.03, - "learning_rate": 9.962327692000343e-06, - "loss": 0.1321, - "step": 1135 - }, - { - "epoch": 0.03, - "learning_rate": 9.960900710636719e-06, - "loss": 0.1606, - "step": 1140 - }, - { - "epoch": 0.03, - "learning_rate": 9.959473729273097e-06, - "loss": 0.2521, - "step": 1145 - }, - { - "epoch": 0.03, - "learning_rate": 9.958046747909473e-06, - "loss": 0.6916, - "step": 1150 - }, - { - "epoch": 0.03, - "learning_rate": 9.95661976654585e-06, - "loss": 0.1813, - "step": 1155 - }, - { - "epoch": 0.03, - "learning_rate": 9.955192785182226e-06, - "loss": 0.2017, - "step": 1160 - }, - { - "epoch": 0.03, - "learning_rate": 9.953765803818602e-06, - "loss": 0.2034, - "step": 1165 - }, - { - "epoch": 0.03, - "learning_rate": 9.95233882245498e-06, - "loss": 0.1885, - "step": 1170 - }, - { - "epoch": 0.03, - "learning_rate": 9.950911841091357e-06, - "loss": 0.2131, - "step": 1175 - }, - { - "epoch": 0.03, - "learning_rate": 9.949484859727733e-06, - "loss": 0.0847, - "step": 1180 - }, - { - "epoch": 0.03, - "learning_rate": 9.94805787836411e-06, - "loss": 0.1071, - "step": 1185 - }, - { - "epoch": 0.03, - "learning_rate": 9.946630897000486e-06, - "loss": 0.2301, - "step": 1190 - }, - { - "epoch": 0.03, - "learning_rate": 9.945203915636864e-06, - "loss": 0.1886, - "step": 1195 - }, - { - "epoch": 0.03, - "learning_rate": 9.94377693427324e-06, - "loss": 0.4755, - "step": 1200 - }, - { - "epoch": 0.03, - "learning_rate": 9.942349952909616e-06, - "loss": 0.1931, - "step": 1205 - }, - { - "epoch": 0.03, - "learning_rate": 9.941208367818717e-06, - "loss": 3.617, - "step": 1210 - }, - { - "epoch": 0.03, - "learning_rate": 9.939781386455095e-06, - "loss": 0.2011, - "step": 1215 - }, - { - "epoch": 0.03, - "learning_rate": 9.938354405091471e-06, - "loss": 0.1695, - "step": 1220 - }, - { - "epoch": 0.03, - "learning_rate": 9.936927423727848e-06, - "loss": 0.2074, - "step": 1225 - }, - { - "epoch": 0.03, - "learning_rate": 9.935500442364224e-06, - "loss": 0.1075, - "step": 1230 - }, - { - "epoch": 0.03, - "learning_rate": 9.9340734610006e-06, - "loss": 0.1331, - "step": 1235 - }, - { - "epoch": 0.03, - "learning_rate": 9.932646479636977e-06, - "loss": 0.2502, - "step": 1240 - }, - { - "epoch": 0.03, - "learning_rate": 9.931219498273353e-06, - "loss": 0.2703, - "step": 1245 - }, - { - "epoch": 0.03, - "learning_rate": 9.92979251690973e-06, - "loss": 0.386, - "step": 1250 - }, - { - "epoch": 0.03, - "learning_rate": 9.928365535546106e-06, - "loss": 0.2368, - "step": 1255 - }, - { - "epoch": 0.03, - "learning_rate": 9.926938554182484e-06, - "loss": 0.2148, - "step": 1260 - }, - { - "epoch": 0.04, - "learning_rate": 9.92551157281886e-06, - "loss": 0.2385, - "step": 1265 - }, - { - "epoch": 0.04, - "learning_rate": 9.924084591455236e-06, - "loss": 0.1964, - "step": 1270 - }, - { - "epoch": 0.04, - "learning_rate": 9.922657610091613e-06, - "loss": 0.1165, - "step": 1275 - }, - { - "epoch": 0.04, - "learning_rate": 9.921230628727989e-06, - "loss": 0.1667, - "step": 1280 - }, - { - "epoch": 0.04, - "learning_rate": 9.919803647364367e-06, - "loss": 0.2257, - "step": 1285 - }, - { - "epoch": 0.04, - "learning_rate": 9.918376666000743e-06, - "loss": 0.2837, - "step": 1290 - }, - { - "epoch": 0.04, - "learning_rate": 9.91694968463712e-06, - "loss": 0.5581, - "step": 1295 - }, - { - "epoch": 0.04, - "learning_rate": 9.915522703273496e-06, - "loss": 0.731, - "step": 1300 - }, - { - "epoch": 0.04, - "learning_rate": 9.914095721909872e-06, - "loss": 0.2324, - "step": 1305 - }, - { - "epoch": 0.04, - "learning_rate": 9.91266874054625e-06, - "loss": 0.2118, - "step": 1310 - }, - { - "epoch": 0.04, - "learning_rate": 9.911241759182627e-06, - "loss": 0.2389, - "step": 1315 - }, - { - "epoch": 0.04, - "learning_rate": 9.909814777819003e-06, - "loss": 0.2752, - "step": 1320 - }, - { - "epoch": 0.04, - "learning_rate": 9.90838779645538e-06, - "loss": 0.2481, - "step": 1325 - }, - { - "epoch": 0.04, - "learning_rate": 9.906960815091756e-06, - "loss": 0.0591, - "step": 1330 - }, - { - "epoch": 0.04, - "learning_rate": 9.905533833728132e-06, - "loss": 0.1931, - "step": 1335 - }, - { - "epoch": 0.04, - "learning_rate": 9.904106852364508e-06, - "loss": 0.2633, - "step": 1340 - }, - { - "epoch": 0.04, - "learning_rate": 9.902679871000885e-06, - "loss": 0.4182, - "step": 1345 - }, - { - "epoch": 0.04, - "learning_rate": 9.901252889637261e-06, - "loss": 0.4839, - "step": 1350 - }, - { - "epoch": 0.04, - "learning_rate": 9.899825908273639e-06, - "loss": 0.2509, - "step": 1355 - }, - { - "epoch": 0.04, - "learning_rate": 9.898398926910015e-06, - "loss": 0.251, - "step": 1360 - }, - { - "epoch": 0.04, - "learning_rate": 9.896971945546392e-06, - "loss": 0.1829, - "step": 1365 - }, - { - "epoch": 0.04, - "learning_rate": 9.895544964182768e-06, - "loss": 0.2305, - "step": 1370 - }, - { - "epoch": 0.04, - "learning_rate": 9.894117982819144e-06, - "loss": 0.2734, - "step": 1375 - }, - { - "epoch": 0.04, - "learning_rate": 9.892691001455522e-06, - "loss": 0.1588, - "step": 1380 - }, - { - "epoch": 0.04, - "learning_rate": 9.891264020091899e-06, - "loss": 0.1621, - "step": 1385 - }, - { - "epoch": 0.04, - "learning_rate": 9.889837038728275e-06, - "loss": 0.3336, - "step": 1390 - }, - { - "epoch": 0.04, - "learning_rate": 9.888410057364652e-06, - "loss": 0.26, - "step": 1395 - }, - { - "epoch": 0.04, - "learning_rate": 9.886983076001028e-06, - "loss": 0.3407, - "step": 1400 - }, - { - "epoch": 0.04, - "learning_rate": 9.885556094637406e-06, - "loss": 0.2269, - "step": 1405 - }, - { - "epoch": 0.04, - "learning_rate": 9.884129113273782e-06, - "loss": 0.2338, - "step": 1410 - }, - { - "epoch": 0.04, - "learning_rate": 9.882702131910159e-06, - "loss": 0.175, - "step": 1415 - }, - { - "epoch": 0.04, - "learning_rate": 9.881275150546535e-06, - "loss": 0.2675, - "step": 1420 - }, - { - "epoch": 0.04, - "learning_rate": 9.879848169182911e-06, - "loss": 0.2215, - "step": 1425 - }, - { - "epoch": 0.04, - "learning_rate": 9.878421187819288e-06, - "loss": 0.1028, - "step": 1430 - }, - { - "epoch": 0.04, - "learning_rate": 9.876994206455664e-06, - "loss": 0.1014, - "step": 1435 - }, - { - "epoch": 0.04, - "learning_rate": 9.87556722509204e-06, - "loss": 0.195, - "step": 1440 - }, - { - "epoch": 0.04, - "learning_rate": 9.874140243728417e-06, - "loss": 0.3388, - "step": 1445 - }, - { - "epoch": 0.04, - "learning_rate": 9.872713262364795e-06, - "loss": 0.3025, - "step": 1450 - }, - { - "epoch": 0.04, - "learning_rate": 9.871286281001171e-06, - "loss": 0.1817, - "step": 1455 - }, - { - "epoch": 0.04, - "learning_rate": 9.869859299637547e-06, - "loss": 0.2523, - "step": 1460 - }, - { - "epoch": 0.04, - "learning_rate": 9.868432318273924e-06, - "loss": 0.1917, - "step": 1465 - }, - { - "epoch": 0.04, - "learning_rate": 9.8670053369103e-06, - "loss": 0.2508, - "step": 1470 - }, - { - "epoch": 0.04, - "learning_rate": 9.865578355546678e-06, - "loss": 0.0938, - "step": 1475 - }, - { - "epoch": 0.04, - "learning_rate": 9.864151374183054e-06, - "loss": 0.1335, - "step": 1480 - }, - { - "epoch": 0.04, - "learning_rate": 9.86272439281943e-06, - "loss": 0.2164, - "step": 1485 - }, - { - "epoch": 0.04, - "learning_rate": 9.861297411455807e-06, - "loss": 0.2721, - "step": 1490 - }, - { - "epoch": 0.04, - "learning_rate": 9.859870430092183e-06, - "loss": 0.3324, - "step": 1495 - }, - { - "epoch": 0.04, - "learning_rate": 9.858443448728561e-06, - "loss": 0.6563, - "step": 1500 - }, - { - "epoch": 0.04, - "learning_rate": 9.857016467364938e-06, - "loss": 0.205, - "step": 1505 - }, - { - "epoch": 0.04, - "learning_rate": 9.855589486001314e-06, - "loss": 0.1993, - "step": 1510 - }, - { - "epoch": 0.04, - "learning_rate": 9.85416250463769e-06, - "loss": 0.1924, - "step": 1515 - }, - { - "epoch": 0.04, - "learning_rate": 9.852735523274067e-06, - "loss": 0.2587, - "step": 1520 - }, - { - "epoch": 0.04, - "learning_rate": 9.851308541910443e-06, - "loss": 0.1098, - "step": 1525 - }, - { - "epoch": 0.04, - "learning_rate": 9.84988156054682e-06, - "loss": 0.0455, - "step": 1530 - }, - { - "epoch": 0.04, - "learning_rate": 9.848454579183196e-06, - "loss": 0.1789, - "step": 1535 - }, - { - "epoch": 0.04, - "learning_rate": 9.847027597819572e-06, - "loss": 0.1117, - "step": 1540 - }, - { - "epoch": 0.04, - "learning_rate": 9.84560061645595e-06, - "loss": 0.2805, - "step": 1545 - }, - { - "epoch": 0.04, - "learning_rate": 9.844173635092326e-06, - "loss": 0.4923, - "step": 1550 - }, - { - "epoch": 0.04, - "learning_rate": 9.842746653728703e-06, - "loss": 0.2292, - "step": 1555 - }, - { - "epoch": 0.04, - "learning_rate": 9.841319672365079e-06, - "loss": 0.2311, - "step": 1560 - }, - { - "epoch": 0.04, - "learning_rate": 9.839892691001455e-06, - "loss": 0.2332, - "step": 1565 - }, - { - "epoch": 0.04, - "learning_rate": 9.838465709637834e-06, - "loss": 0.1955, - "step": 1570 - }, - { - "epoch": 0.04, - "learning_rate": 9.83703872827421e-06, - "loss": 0.1574, - "step": 1575 - }, - { - "epoch": 0.04, - "learning_rate": 9.835611746910586e-06, - "loss": 0.1634, - "step": 1580 - }, - { - "epoch": 0.04, - "learning_rate": 9.834184765546963e-06, - "loss": 0.3306, - "step": 1585 - }, - { - "epoch": 0.04, - "learning_rate": 9.832757784183339e-06, - "loss": 0.235, - "step": 1590 - }, - { - "epoch": 0.04, - "learning_rate": 9.831330802819717e-06, - "loss": 0.3012, - "step": 1595 - }, - { - "epoch": 0.04, - "learning_rate": 9.829903821456093e-06, - "loss": 0.4106, - "step": 1600 - }, - { - "epoch": 0.04, - "learning_rate": 9.82847684009247e-06, - "loss": 0.2449, - "step": 1605 - }, - { - "epoch": 0.04, - "learning_rate": 9.827049858728846e-06, - "loss": 0.2571, - "step": 1610 - }, - { - "epoch": 0.04, - "learning_rate": 9.825622877365222e-06, - "loss": 0.2535, - "step": 1615 - }, - { - "epoch": 0.04, - "learning_rate": 9.824195896001599e-06, - "loss": 0.2197, - "step": 1620 - }, - { - "epoch": 0.05, - "learning_rate": 9.822768914637975e-06, - "loss": 0.0862, - "step": 1625 - }, - { - "epoch": 0.05, - "learning_rate": 9.821341933274351e-06, - "loss": 0.1091, - "step": 1630 - }, - { - "epoch": 0.05, - "learning_rate": 9.819914951910728e-06, - "loss": 0.1436, - "step": 1635 - }, - { - "epoch": 0.05, - "learning_rate": 9.818487970547106e-06, - "loss": 0.2528, - "step": 1640 - }, - { - "epoch": 0.05, - "learning_rate": 9.817060989183482e-06, - "loss": 0.3583, - "step": 1645 - }, - { - "epoch": 0.05, - "learning_rate": 9.815634007819858e-06, - "loss": 0.4629, - "step": 1650 - }, - { - "epoch": 0.05, - "learning_rate": 9.814207026456235e-06, - "loss": 0.2162, - "step": 1655 - }, - { - "epoch": 0.05, - "learning_rate": 9.812780045092611e-06, - "loss": 0.2192, - "step": 1660 - }, - { - "epoch": 0.05, - "learning_rate": 9.811353063728989e-06, - "loss": 0.157, - "step": 1665 - }, - { - "epoch": 0.05, - "learning_rate": 9.809926082365365e-06, - "loss": 0.208, - "step": 1670 - }, - { - "epoch": 0.05, - "learning_rate": 9.808499101001742e-06, - "loss": 0.2118, - "step": 1675 - }, - { - "epoch": 0.05, - "learning_rate": 9.807072119638118e-06, - "loss": 0.1081, - "step": 1680 - }, - { - "epoch": 0.05, - "learning_rate": 9.805645138274496e-06, - "loss": 0.198, - "step": 1685 - }, - { - "epoch": 0.05, - "learning_rate": 9.804218156910872e-06, - "loss": 0.2535, - "step": 1690 - }, - { - "epoch": 0.05, - "learning_rate": 9.802791175547249e-06, - "loss": 0.3795, - "step": 1695 - }, - { - "epoch": 0.05, - "learning_rate": 9.801364194183625e-06, - "loss": 0.4864, - "step": 1700 - }, - { - "epoch": 0.05, - "learning_rate": 9.799937212820001e-06, - "loss": 0.1615, - "step": 1705 - }, - { - "epoch": 0.05, - "learning_rate": 9.798510231456378e-06, - "loss": 0.2312, - "step": 1710 - }, - { - "epoch": 0.05, - "learning_rate": 9.797083250092754e-06, - "loss": 0.2066, - "step": 1715 - }, - { - "epoch": 0.05, - "learning_rate": 9.79565626872913e-06, - "loss": 0.2505, - "step": 1720 - }, - { - "epoch": 0.05, - "learning_rate": 9.794229287365507e-06, - "loss": 0.0999, - "step": 1725 - }, - { - "epoch": 0.05, - "learning_rate": 9.792802306001883e-06, - "loss": 0.1156, - "step": 1730 - }, - { - "epoch": 0.05, - "learning_rate": 9.791375324638261e-06, - "loss": 0.0962, - "step": 1735 - }, - { - "epoch": 0.05, - "learning_rate": 9.789948343274638e-06, - "loss": 0.2936, - "step": 1740 - }, - { - "epoch": 0.05, - "learning_rate": 9.788521361911014e-06, - "loss": 0.3334, - "step": 1745 - }, - { - "epoch": 0.05, - "learning_rate": 9.78709438054739e-06, - "loss": 0.5398, - "step": 1750 - }, - { - "epoch": 0.05, - "learning_rate": 9.785667399183767e-06, - "loss": 0.2475, - "step": 1755 - }, - { - "epoch": 0.05, - "learning_rate": 9.784240417820145e-06, - "loss": 0.1535, - "step": 1760 - }, - { - "epoch": 0.05, - "learning_rate": 9.782813436456521e-06, - "loss": 0.1862, - "step": 1765 - }, - { - "epoch": 0.05, - "learning_rate": 9.781386455092897e-06, - "loss": 0.2029, - "step": 1770 - }, - { - "epoch": 0.05, - "learning_rate": 9.779959473729274e-06, - "loss": 0.1054, - "step": 1775 - }, - { - "epoch": 0.05, - "learning_rate": 9.778532492365652e-06, - "loss": 0.166, - "step": 1780 - }, - { - "epoch": 0.05, - "learning_rate": 9.777105511002028e-06, - "loss": 0.2208, - "step": 1785 - }, - { - "epoch": 0.05, - "learning_rate": 9.775678529638404e-06, - "loss": 0.1572, - "step": 1790 - }, - { - "epoch": 0.05, - "learning_rate": 9.77425154827478e-06, - "loss": 0.2488, - "step": 1795 - }, - { - "epoch": 0.05, - "learning_rate": 9.772824566911157e-06, - "loss": 0.2578, - "step": 1800 - }, - { - "epoch": 0.05, - "learning_rate": 9.771397585547533e-06, - "loss": 0.2531, - "step": 1805 - }, - { - "epoch": 0.05, - "learning_rate": 9.76997060418391e-06, - "loss": 0.2395, - "step": 1810 - }, - { - "epoch": 0.05, - "learning_rate": 9.768543622820286e-06, - "loss": 0.2433, - "step": 1815 - }, - { - "epoch": 0.05, - "learning_rate": 9.767116641456664e-06, - "loss": 0.2235, - "step": 1820 - }, - { - "epoch": 0.05, - "learning_rate": 9.76568966009304e-06, - "loss": 0.2172, - "step": 1825 - }, - { - "epoch": 0.05, - "learning_rate": 9.764262678729417e-06, - "loss": 0.1271, - "step": 1830 - }, - { - "epoch": 0.05, - "learning_rate": 9.762835697365793e-06, - "loss": 0.439, - "step": 1835 - }, - { - "epoch": 0.05, - "learning_rate": 9.76140871600217e-06, - "loss": 0.1604, - "step": 1840 - }, - { - "epoch": 0.05, - "learning_rate": 9.759981734638546e-06, - "loss": 0.3628, - "step": 1845 - }, - { - "epoch": 0.05, - "learning_rate": 9.758554753274922e-06, - "loss": 0.4847, - "step": 1850 - }, - { - "epoch": 0.05, - "learning_rate": 9.7571277719113e-06, - "loss": 0.1674, - "step": 1855 - }, - { - "epoch": 0.05, - "learning_rate": 9.755700790547676e-06, - "loss": 0.2104, - "step": 1860 - }, - { - "epoch": 0.05, - "learning_rate": 9.754273809184053e-06, - "loss": 0.2227, - "step": 1865 - }, - { - "epoch": 0.05, - "learning_rate": 9.752846827820429e-06, - "loss": 0.163, - "step": 1870 - }, - { - "epoch": 0.05, - "learning_rate": 9.751419846456807e-06, - "loss": 0.2878, - "step": 1875 - }, - { - "epoch": 0.05, - "learning_rate": 9.749992865093183e-06, - "loss": 0.1738, - "step": 1880 - }, - { - "epoch": 0.05, - "learning_rate": 9.74856588372956e-06, - "loss": 0.109, - "step": 1885 - }, - { - "epoch": 0.05, - "learning_rate": 9.747138902365936e-06, - "loss": 0.2777, - "step": 1890 - }, - { - "epoch": 0.05, - "learning_rate": 9.745711921002312e-06, - "loss": 0.08, - "step": 1895 - }, - { - "epoch": 0.05, - "learning_rate": 9.744284939638689e-06, - "loss": 0.537, - "step": 1900 - }, - { - "epoch": 0.05, - "learning_rate": 9.742857958275065e-06, - "loss": 0.2149, - "step": 1905 - }, - { - "epoch": 0.05, - "learning_rate": 9.741430976911443e-06, - "loss": 0.2135, - "step": 1910 - }, - { - "epoch": 0.05, - "learning_rate": 9.74000399554782e-06, - "loss": 0.2176, - "step": 1915 - }, - { - "epoch": 0.05, - "learning_rate": 9.738577014184196e-06, - "loss": 0.2804, - "step": 1920 - }, - { - "epoch": 0.05, - "learning_rate": 9.737150032820572e-06, - "loss": 0.1747, - "step": 1925 - }, - { - "epoch": 0.05, - "learning_rate": 9.735723051456949e-06, - "loss": 0.1037, - "step": 1930 - }, - { - "epoch": 0.05, - "learning_rate": 9.734296070093325e-06, - "loss": 0.1026, - "step": 1935 - }, - { - "epoch": 0.05, - "learning_rate": 9.732869088729701e-06, - "loss": 0.1829, - "step": 1940 - }, - { - "epoch": 0.05, - "learning_rate": 9.731442107366078e-06, - "loss": 0.4844, - "step": 1945 - }, - { - "epoch": 0.05, - "learning_rate": 9.730015126002456e-06, - "loss": 0.3903, - "step": 1950 - }, - { - "epoch": 0.05, - "learning_rate": 9.728588144638832e-06, - "loss": 0.5092, - "step": 1955 - }, - { - "epoch": 0.05, - "learning_rate": 9.727161163275208e-06, - "loss": 0.1894, - "step": 1960 - }, - { - "epoch": 0.05, - "learning_rate": 9.725734181911585e-06, - "loss": 0.2359, - "step": 1965 - }, - { - "epoch": 0.05, - "learning_rate": 9.724307200547963e-06, - "loss": 0.2379, - "step": 1970 - }, - { - "epoch": 0.05, - "learning_rate": 9.722880219184339e-06, - "loss": 0.2554, - "step": 1975 - }, - { - "epoch": 0.05, - "learning_rate": 9.721453237820715e-06, - "loss": 0.1861, - "step": 1980 - }, - { - "epoch": 0.06, - "learning_rate": 9.720026256457092e-06, - "loss": 0.192, - "step": 1985 - }, - { - "epoch": 0.06, - "learning_rate": 9.718599275093468e-06, - "loss": 0.3486, - "step": 1990 - }, - { - "epoch": 0.06, - "learning_rate": 9.717172293729844e-06, - "loss": 0.2169, - "step": 1995 - }, - { - "epoch": 0.06, - "learning_rate": 9.715745312366222e-06, - "loss": 0.4418, - "step": 2000 - }, - { - "epoch": 0.06, - "eval_loss": 0.08974172174930573, - "eval_runtime": 2327.969, - "eval_samples_per_second": 6.881, - "eval_steps_per_second": 1.72, - "eval_wer": 0.26016949152542374, - "step": 2000 - }, - { - "epoch": 0.06, - "learning_rate": 9.714318331002599e-06, - "loss": 0.202, - "step": 2005 - }, - { - "epoch": 0.06, - "learning_rate": 9.712891349638975e-06, - "loss": 0.4201, - "step": 2010 - }, - { - "epoch": 0.06, - "learning_rate": 9.711464368275351e-06, - "loss": 0.2236, - "step": 2015 - }, - { - "epoch": 0.06, - "learning_rate": 9.710037386911728e-06, - "loss": 0.1821, - "step": 2020 - }, - { - "epoch": 0.06, - "learning_rate": 9.708610405548104e-06, - "loss": 0.2104, - "step": 2025 - }, - { - "epoch": 0.06, - "learning_rate": 9.70718342418448e-06, - "loss": 0.102, - "step": 2030 - }, - { - "epoch": 0.06, - "learning_rate": 9.705756442820857e-06, - "loss": 0.1826, - "step": 2035 - }, - { - "epoch": 0.06, - "learning_rate": 9.704329461457233e-06, - "loss": 0.288, - "step": 2040 - }, - { - "epoch": 0.06, - "learning_rate": 9.702902480093611e-06, - "loss": 0.5527, - "step": 2045 - }, - { - "epoch": 0.06, - "learning_rate": 9.701475498729987e-06, - "loss": 0.4803, - "step": 2050 - }, - { - "epoch": 0.06, - "learning_rate": 9.700048517366364e-06, - "loss": 0.2576, - "step": 2055 - }, - { - "epoch": 0.06, - "learning_rate": 9.69862153600274e-06, - "loss": 0.2127, - "step": 2060 - }, - { - "epoch": 0.06, - "learning_rate": 9.697194554639118e-06, - "loss": 0.2714, - "step": 2065 - }, - { - "epoch": 0.06, - "learning_rate": 9.695767573275494e-06, - "loss": 0.1932, - "step": 2070 - }, - { - "epoch": 0.06, - "learning_rate": 9.69434059191187e-06, - "loss": 0.1743, - "step": 2075 - }, - { - "epoch": 0.06, - "learning_rate": 9.692913610548247e-06, - "loss": 0.2139, - "step": 2080 - }, - { - "epoch": 0.06, - "learning_rate": 9.691486629184624e-06, - "loss": 0.2656, - "step": 2085 - }, - { - "epoch": 0.06, - "learning_rate": 9.690059647821002e-06, - "loss": 0.4477, - "step": 2090 - }, - { - "epoch": 0.06, - "learning_rate": 9.688632666457378e-06, - "loss": 0.215, - "step": 2095 - }, - { - "epoch": 0.06, - "learning_rate": 9.687205685093754e-06, - "loss": 0.3432, - "step": 2100 - }, - { - "epoch": 0.06, - "learning_rate": 9.68577870373013e-06, - "loss": 0.229, - "step": 2105 - }, - { - "epoch": 0.06, - "learning_rate": 9.684351722366507e-06, - "loss": 0.2255, - "step": 2110 - }, - { - "epoch": 0.06, - "learning_rate": 9.682924741002883e-06, - "loss": 0.1953, - "step": 2115 - }, - { - "epoch": 0.06, - "learning_rate": 9.68149775963926e-06, - "loss": 0.1701, - "step": 2120 - }, - { - "epoch": 0.06, - "learning_rate": 9.680070778275636e-06, - "loss": 0.2611, - "step": 2125 - }, - { - "epoch": 0.06, - "learning_rate": 9.678643796912012e-06, - "loss": 0.1288, - "step": 2130 - }, - { - "epoch": 0.06, - "learning_rate": 9.677216815548389e-06, - "loss": 0.0965, - "step": 2135 - }, - { - "epoch": 0.06, - "learning_rate": 9.675789834184767e-06, - "loss": 0.2093, - "step": 2140 - }, - { - "epoch": 0.06, - "learning_rate": 9.674362852821143e-06, - "loss": 0.2346, - "step": 2145 - }, - { - "epoch": 0.06, - "learning_rate": 9.67293587145752e-06, - "loss": 0.6203, - "step": 2150 - }, - { - "epoch": 0.06, - "learning_rate": 9.671508890093896e-06, - "loss": 0.2262, - "step": 2155 - }, - { - "epoch": 0.06, - "learning_rate": 9.670081908730274e-06, - "loss": 0.4529, - "step": 2160 - }, - { - "epoch": 0.06, - "learning_rate": 9.66865492736665e-06, - "loss": 0.235, - "step": 2165 - }, - { - "epoch": 0.06, - "learning_rate": 9.667227946003026e-06, - "loss": 0.1584, - "step": 2170 - }, - { - "epoch": 0.06, - "learning_rate": 9.665800964639403e-06, - "loss": 0.2514, - "step": 2175 - }, - { - "epoch": 0.06, - "learning_rate": 9.664373983275779e-06, - "loss": 0.0816, - "step": 2180 - }, - { - "epoch": 0.06, - "learning_rate": 9.662947001912157e-06, - "loss": 0.0859, - "step": 2185 - }, - { - "epoch": 0.06, - "learning_rate": 9.661520020548533e-06, - "loss": 0.1528, - "step": 2190 - }, - { - "epoch": 0.06, - "learning_rate": 9.66009303918491e-06, - "loss": 0.3267, - "step": 2195 - }, - { - "epoch": 0.06, - "learning_rate": 9.658666057821286e-06, - "loss": 0.3738, - "step": 2200 - }, - { - "epoch": 0.06, - "learning_rate": 9.657239076457662e-06, - "loss": 0.214, - "step": 2205 - }, - { - "epoch": 0.06, - "learning_rate": 9.655812095094039e-06, - "loss": 0.2082, - "step": 2210 - }, - { - "epoch": 0.06, - "learning_rate": 9.654385113730415e-06, - "loss": 0.179, - "step": 2215 - }, - { - "epoch": 0.06, - "learning_rate": 9.652958132366791e-06, - "loss": 0.1861, - "step": 2220 - }, - { - "epoch": 0.06, - "learning_rate": 9.651531151003168e-06, - "loss": 0.1895, - "step": 2225 - }, - { - "epoch": 0.06, - "learning_rate": 9.650104169639544e-06, - "loss": 0.0996, - "step": 2230 - }, - { - "epoch": 0.06, - "learning_rate": 9.648677188275922e-06, - "loss": 0.0948, - "step": 2235 - }, - { - "epoch": 0.06, - "learning_rate": 9.647250206912298e-06, - "loss": 0.1832, - "step": 2240 - }, - { - "epoch": 0.06, - "learning_rate": 9.645823225548675e-06, - "loss": 0.2559, - "step": 2245 - }, - { - "epoch": 0.06, - "learning_rate": 9.644396244185051e-06, - "loss": 0.6217, - "step": 2250 - }, - { - "epoch": 0.06, - "learning_rate": 9.64296926282143e-06, - "loss": 0.2921, - "step": 2255 - }, - { - "epoch": 0.06, - "learning_rate": 9.641542281457806e-06, - "loss": 0.146, - "step": 2260 - }, - { - "epoch": 0.06, - "learning_rate": 9.640115300094182e-06, - "loss": 0.2137, - "step": 2265 - }, - { - "epoch": 0.06, - "learning_rate": 9.638688318730558e-06, - "loss": 0.41, - "step": 2270 - }, - { - "epoch": 0.06, - "learning_rate": 9.637261337366935e-06, - "loss": 0.2422, - "step": 2275 - }, - { - "epoch": 0.06, - "learning_rate": 9.635834356003313e-06, - "loss": 0.1457, - "step": 2280 - }, - { - "epoch": 0.06, - "learning_rate": 9.634407374639689e-06, - "loss": 0.1725, - "step": 2285 - }, - { - "epoch": 0.06, - "learning_rate": 9.632980393276065e-06, - "loss": 0.1379, - "step": 2290 - }, - { - "epoch": 0.06, - "learning_rate": 9.631553411912442e-06, - "loss": 0.2867, - "step": 2295 - }, - { - "epoch": 0.06, - "learning_rate": 9.630126430548818e-06, - "loss": 0.4942, - "step": 2300 - }, - { - "epoch": 0.06, - "learning_rate": 9.628699449185194e-06, - "loss": 0.2345, - "step": 2305 - }, - { - "epoch": 0.06, - "learning_rate": 9.62727246782157e-06, - "loss": 0.1619, - "step": 2310 - }, - { - "epoch": 0.06, - "learning_rate": 9.625845486457947e-06, - "loss": 0.1986, - "step": 2315 - }, - { - "epoch": 0.06, - "learning_rate": 9.624418505094323e-06, - "loss": 0.2719, - "step": 2320 - }, - { - "epoch": 0.06, - "learning_rate": 9.6229915237307e-06, - "loss": 0.2429, - "step": 2325 - }, - { - "epoch": 0.06, - "learning_rate": 9.621564542367078e-06, - "loss": 0.2239, - "step": 2330 - }, - { - "epoch": 0.06, - "learning_rate": 9.620137561003454e-06, - "loss": 0.1842, - "step": 2335 - }, - { - "epoch": 0.06, - "learning_rate": 9.61871057963983e-06, - "loss": 0.2596, - "step": 2340 - }, - { - "epoch": 0.07, - "learning_rate": 9.617283598276207e-06, - "loss": 0.3677, - "step": 2345 - }, - { - "epoch": 0.07, - "learning_rate": 9.615856616912585e-06, - "loss": 0.5166, - "step": 2350 - }, - { - "epoch": 0.07, - "learning_rate": 9.614429635548961e-06, - "loss": 0.1937, - "step": 2355 - }, - { - "epoch": 0.07, - "learning_rate": 9.613002654185337e-06, - "loss": 0.1555, - "step": 2360 - }, - { - "epoch": 0.07, - "learning_rate": 9.611575672821714e-06, - "loss": 0.1997, - "step": 2365 - }, - { - "epoch": 0.07, - "learning_rate": 9.61014869145809e-06, - "loss": 0.2785, - "step": 2370 - }, - { - "epoch": 0.07, - "learning_rate": 9.608721710094468e-06, - "loss": 0.1963, - "step": 2375 - }, - { - "epoch": 0.07, - "learning_rate": 9.607294728730844e-06, - "loss": 0.2269, - "step": 2380 - }, - { - "epoch": 0.07, - "learning_rate": 9.60586774736722e-06, - "loss": 0.1675, - "step": 2385 - }, - { - "epoch": 0.07, - "learning_rate": 9.604440766003597e-06, - "loss": 0.1251, - "step": 2390 - }, - { - "epoch": 0.07, - "learning_rate": 9.603013784639973e-06, - "loss": 0.4726, - "step": 2395 - }, - { - "epoch": 0.07, - "learning_rate": 9.60158680327635e-06, - "loss": 0.6281, - "step": 2400 - }, - { - "epoch": 0.07, - "learning_rate": 9.600159821912726e-06, - "loss": 0.2328, - "step": 2405 - }, - { - "epoch": 0.07, - "learning_rate": 9.598732840549102e-06, - "loss": 0.2014, - "step": 2410 - }, - { - "epoch": 0.07, - "learning_rate": 9.597305859185479e-06, - "loss": 0.2418, - "step": 2415 - }, - { - "epoch": 0.07, - "learning_rate": 9.595878877821855e-06, - "loss": 0.2288, - "step": 2420 - }, - { - "epoch": 0.07, - "learning_rate": 9.594451896458233e-06, - "loss": 0.2354, - "step": 2425 - }, - { - "epoch": 0.07, - "learning_rate": 9.59302491509461e-06, - "loss": 0.1047, - "step": 2430 - }, - { - "epoch": 0.07, - "learning_rate": 9.591597933730986e-06, - "loss": 0.1122, - "step": 2435 - }, - { - "epoch": 0.07, - "learning_rate": 9.590170952367362e-06, - "loss": 0.4132, - "step": 2440 - }, - { - "epoch": 0.07, - "learning_rate": 9.58874397100374e-06, - "loss": 0.2479, - "step": 2445 - }, - { - "epoch": 0.07, - "learning_rate": 9.587316989640117e-06, - "loss": 0.3581, - "step": 2450 - }, - { - "epoch": 0.07, - "learning_rate": 9.585890008276493e-06, - "loss": 0.214, - "step": 2455 - }, - { - "epoch": 0.07, - "learning_rate": 9.58446302691287e-06, - "loss": 0.2046, - "step": 2460 - }, - { - "epoch": 0.07, - "learning_rate": 9.583036045549246e-06, - "loss": 0.1714, - "step": 2465 - }, - { - "epoch": 0.07, - "learning_rate": 9.581609064185624e-06, - "loss": 0.2386, - "step": 2470 - }, - { - "epoch": 0.07, - "learning_rate": 9.580182082822e-06, - "loss": 0.0804, - "step": 2475 - }, - { - "epoch": 0.07, - "learning_rate": 9.578755101458376e-06, - "loss": 0.2579, - "step": 2480 - }, - { - "epoch": 0.07, - "learning_rate": 9.577328120094753e-06, - "loss": 0.2384, - "step": 2485 - }, - { - "epoch": 0.07, - "learning_rate": 9.575901138731129e-06, - "loss": 0.2612, - "step": 2490 - }, - { - "epoch": 0.07, - "learning_rate": 9.574474157367505e-06, - "loss": 0.245, - "step": 2495 - }, - { - "epoch": 0.07, - "learning_rate": 9.573047176003882e-06, - "loss": 0.5089, - "step": 2500 - }, - { - "epoch": 0.07, - "learning_rate": 9.571620194640258e-06, - "loss": 0.2194, - "step": 2505 - }, - { - "epoch": 0.07, - "learning_rate": 9.570193213276634e-06, - "loss": 0.1558, - "step": 2510 - }, - { - "epoch": 0.07, - "learning_rate": 9.56876623191301e-06, - "loss": 0.1905, - "step": 2515 - }, - { - "epoch": 0.07, - "learning_rate": 9.567339250549389e-06, - "loss": 0.2005, - "step": 2520 - }, - { - "epoch": 0.07, - "learning_rate": 9.565912269185765e-06, - "loss": 0.0812, - "step": 2525 - }, - { - "epoch": 0.07, - "learning_rate": 9.564485287822141e-06, - "loss": 0.1355, - "step": 2530 - }, - { - "epoch": 0.07, - "learning_rate": 9.563058306458518e-06, - "loss": 0.2427, - "step": 2535 - }, - { - "epoch": 0.07, - "learning_rate": 9.561631325094896e-06, - "loss": 0.2012, - "step": 2540 - }, - { - "epoch": 0.07, - "learning_rate": 9.560204343731272e-06, - "loss": 0.2796, - "step": 2545 - }, - { - "epoch": 0.07, - "learning_rate": 9.558777362367648e-06, - "loss": 0.5535, - "step": 2550 - }, - { - "epoch": 0.07, - "learning_rate": 9.557350381004025e-06, - "loss": 0.1669, - "step": 2555 - }, - { - "epoch": 0.07, - "learning_rate": 9.555923399640401e-06, - "loss": 0.2318, - "step": 2560 - }, - { - "epoch": 0.07, - "learning_rate": 9.554496418276779e-06, - "loss": 0.2368, - "step": 2565 - }, - { - "epoch": 0.07, - "learning_rate": 9.553069436913155e-06, - "loss": 0.2134, - "step": 2570 - }, - { - "epoch": 0.07, - "learning_rate": 9.551642455549532e-06, - "loss": 0.1166, - "step": 2575 - }, - { - "epoch": 0.07, - "learning_rate": 9.550215474185908e-06, - "loss": 0.0954, - "step": 2580 - }, - { - "epoch": 0.07, - "learning_rate": 9.548788492822284e-06, - "loss": 0.1802, - "step": 2585 - }, - { - "epoch": 0.07, - "learning_rate": 9.54736151145866e-06, - "loss": 0.2293, - "step": 2590 - }, - { - "epoch": 0.07, - "learning_rate": 9.545934530095037e-06, - "loss": 0.275, - "step": 2595 - }, - { - "epoch": 0.07, - "learning_rate": 9.544507548731413e-06, - "loss": 0.3557, - "step": 2600 - }, - { - "epoch": 0.07, - "learning_rate": 9.54308056736779e-06, - "loss": 0.1596, - "step": 2605 - }, - { - "epoch": 0.07, - "learning_rate": 9.541653586004168e-06, - "loss": 0.1963, - "step": 2610 - }, - { - "epoch": 0.07, - "learning_rate": 9.540226604640544e-06, - "loss": 0.2286, - "step": 2615 - }, - { - "epoch": 0.07, - "learning_rate": 9.53879962327692e-06, - "loss": 0.2489, - "step": 2620 - }, - { - "epoch": 0.07, - "learning_rate": 9.537372641913297e-06, - "loss": 0.2016, - "step": 2625 - }, - { - "epoch": 0.07, - "learning_rate": 9.535945660549673e-06, - "loss": 0.1457, - "step": 2630 - }, - { - "epoch": 0.07, - "learning_rate": 9.534518679186051e-06, - "loss": 0.1496, - "step": 2635 - }, - { - "epoch": 0.07, - "learning_rate": 9.533091697822428e-06, - "loss": 0.219, - "step": 2640 - }, - { - "epoch": 0.07, - "learning_rate": 9.531664716458804e-06, - "loss": 0.2844, - "step": 2645 - }, - { - "epoch": 0.07, - "learning_rate": 9.53023773509518e-06, - "loss": 0.5178, - "step": 2650 - }, - { - "epoch": 0.07, - "learning_rate": 9.528810753731557e-06, - "loss": 0.2695, - "step": 2655 - }, - { - "epoch": 0.07, - "learning_rate": 9.527383772367935e-06, - "loss": 0.1573, - "step": 2660 - }, - { - "epoch": 0.07, - "learning_rate": 9.525956791004311e-06, - "loss": 0.1983, - "step": 2665 - }, - { - "epoch": 0.07, - "learning_rate": 9.524529809640687e-06, - "loss": 0.2395, - "step": 2670 - }, - { - "epoch": 0.07, - "learning_rate": 9.523102828277064e-06, - "loss": 0.2201, - "step": 2675 - }, - { - "epoch": 0.07, - "learning_rate": 9.52167584691344e-06, - "loss": 0.1012, - "step": 2680 - }, - { - "epoch": 0.07, - "learning_rate": 9.520248865549816e-06, - "loss": 0.247, - "step": 2685 - }, - { - "epoch": 0.07, - "learning_rate": 9.518821884186193e-06, - "loss": 0.2196, - "step": 2690 - }, - { - "epoch": 0.07, - "learning_rate": 9.517394902822569e-06, - "loss": 0.2505, - "step": 2695 - }, - { - "epoch": 0.07, - "learning_rate": 9.515967921458947e-06, - "loss": 0.4629, - "step": 2700 - }, - { - "epoch": 0.08, - "learning_rate": 9.514540940095323e-06, - "loss": 0.2163, - "step": 2705 - }, - { - "epoch": 0.08, - "learning_rate": 9.5131139587317e-06, - "loss": 0.212, - "step": 2710 - }, - { - "epoch": 0.08, - "learning_rate": 9.511686977368076e-06, - "loss": 0.2412, - "step": 2715 - }, - { - "epoch": 0.08, - "learning_rate": 9.510259996004452e-06, - "loss": 0.1869, - "step": 2720 - }, - { - "epoch": 0.08, - "learning_rate": 9.508833014640829e-06, - "loss": 0.2049, - "step": 2725 - }, - { - "epoch": 0.08, - "learning_rate": 9.507406033277207e-06, - "loss": 0.1012, - "step": 2730 - }, - { - "epoch": 0.08, - "learning_rate": 9.505979051913583e-06, - "loss": 0.1866, - "step": 2735 - }, - { - "epoch": 0.08, - "learning_rate": 9.50455207054996e-06, - "loss": 0.1811, - "step": 2740 - }, - { - "epoch": 0.08, - "learning_rate": 9.503125089186336e-06, - "loss": 0.4811, - "step": 2745 - }, - { - "epoch": 0.08, - "learning_rate": 9.501698107822712e-06, - "loss": 0.6059, - "step": 2750 - }, - { - "epoch": 0.08, - "learning_rate": 9.50027112645909e-06, - "loss": 0.2447, - "step": 2755 - }, - { - "epoch": 0.08, - "learning_rate": 9.498844145095466e-06, - "loss": 0.1582, - "step": 2760 - }, - { - "epoch": 0.08, - "learning_rate": 9.497417163731843e-06, - "loss": 0.1435, - "step": 2765 - }, - { - "epoch": 0.08, - "learning_rate": 9.49599018236822e-06, - "loss": 0.258, - "step": 2770 - }, - { - "epoch": 0.08, - "learning_rate": 9.494563201004596e-06, - "loss": 0.1405, - "step": 2775 - }, - { - "epoch": 0.08, - "learning_rate": 9.493136219640972e-06, - "loss": 0.122, - "step": 2780 - }, - { - "epoch": 0.08, - "learning_rate": 9.491709238277348e-06, - "loss": 0.1433, - "step": 2785 - }, - { - "epoch": 0.08, - "learning_rate": 9.490282256913726e-06, - "loss": 0.141, - "step": 2790 - }, - { - "epoch": 0.08, - "learning_rate": 9.488855275550103e-06, - "loss": 0.2074, - "step": 2795 - }, - { - "epoch": 0.08, - "learning_rate": 9.487428294186479e-06, - "loss": 0.3473, - "step": 2800 - }, - { - "epoch": 0.08, - "learning_rate": 9.486001312822855e-06, - "loss": 0.2921, - "step": 2805 - }, - { - "epoch": 0.08, - "learning_rate": 9.484574331459232e-06, - "loss": 0.2629, - "step": 2810 - }, - { - "epoch": 0.08, - "learning_rate": 9.483147350095608e-06, - "loss": 0.1963, - "step": 2815 - }, - { - "epoch": 0.08, - "learning_rate": 9.481720368731984e-06, - "loss": 0.184, - "step": 2820 - }, - { - "epoch": 0.08, - "learning_rate": 9.480293387368362e-06, - "loss": 0.1284, - "step": 2825 - }, - { - "epoch": 0.08, - "learning_rate": 9.478866406004739e-06, - "loss": 0.153, - "step": 2830 - }, - { - "epoch": 0.08, - "learning_rate": 9.477439424641115e-06, - "loss": 0.1785, - "step": 2835 - }, - { - "epoch": 0.08, - "learning_rate": 9.476012443277491e-06, - "loss": 0.1201, - "step": 2840 - }, - { - "epoch": 0.08, - "learning_rate": 9.474585461913868e-06, - "loss": 0.6185, - "step": 2845 - }, - { - "epoch": 0.08, - "learning_rate": 9.473158480550246e-06, - "loss": 0.3666, - "step": 2850 - }, - { - "epoch": 0.08, - "learning_rate": 9.471731499186622e-06, - "loss": 0.1744, - "step": 2855 - }, - { - "epoch": 0.08, - "learning_rate": 9.470304517822998e-06, - "loss": 0.205, - "step": 2860 - }, - { - "epoch": 0.08, - "learning_rate": 9.468877536459375e-06, - "loss": 0.1366, - "step": 2865 - }, - { - "epoch": 0.08, - "learning_rate": 9.467450555095751e-06, - "loss": 0.2189, - "step": 2870 - }, - { - "epoch": 0.08, - "learning_rate": 9.466023573732129e-06, - "loss": 0.1519, - "step": 2875 - }, - { - "epoch": 0.08, - "learning_rate": 9.464596592368505e-06, - "loss": 0.1423, - "step": 2880 - }, - { - "epoch": 0.08, - "learning_rate": 9.463169611004882e-06, - "loss": 0.2421, - "step": 2885 - }, - { - "epoch": 0.08, - "learning_rate": 9.461742629641258e-06, - "loss": 0.2549, - "step": 2890 - }, - { - "epoch": 0.08, - "learning_rate": 9.460315648277634e-06, - "loss": 0.1883, - "step": 2895 - }, - { - "epoch": 0.08, - "learning_rate": 9.45888866691401e-06, - "loss": 0.2442, - "step": 2900 - }, - { - "epoch": 0.08, - "learning_rate": 9.457461685550387e-06, - "loss": 0.261, - "step": 2905 - }, - { - "epoch": 0.08, - "learning_rate": 9.456034704186763e-06, - "loss": 0.201, - "step": 2910 - }, - { - "epoch": 0.08, - "learning_rate": 9.45460772282314e-06, - "loss": 0.2201, - "step": 2915 - }, - { - "epoch": 0.08, - "learning_rate": 9.453180741459518e-06, - "loss": 0.17, - "step": 2920 - }, - { - "epoch": 0.08, - "learning_rate": 9.451753760095894e-06, - "loss": 0.1684, - "step": 2925 - }, - { - "epoch": 0.08, - "learning_rate": 9.45032677873227e-06, - "loss": 0.1543, - "step": 2930 - }, - { - "epoch": 0.08, - "learning_rate": 9.448899797368647e-06, - "loss": 0.1616, - "step": 2935 - }, - { - "epoch": 0.08, - "learning_rate": 9.447472816005023e-06, - "loss": 0.2266, - "step": 2940 - }, - { - "epoch": 0.08, - "learning_rate": 9.446045834641401e-06, - "loss": 0.2079, - "step": 2945 - }, - { - "epoch": 0.08, - "learning_rate": 9.444618853277778e-06, - "loss": 0.5384, - "step": 2950 - }, - { - "epoch": 0.08, - "learning_rate": 9.443191871914154e-06, - "loss": 0.2111, - "step": 2955 - }, - { - "epoch": 0.08, - "learning_rate": 9.44176489055053e-06, - "loss": 0.1835, - "step": 2960 - }, - { - "epoch": 0.08, - "learning_rate": 9.440337909186907e-06, - "loss": 0.2175, - "step": 2965 - }, - { - "epoch": 0.08, - "learning_rate": 9.438910927823285e-06, - "loss": 0.2433, - "step": 2970 - }, - { - "epoch": 0.08, - "learning_rate": 9.437483946459661e-06, - "loss": 0.1842, - "step": 2975 - }, - { - "epoch": 0.08, - "learning_rate": 9.436056965096037e-06, - "loss": 0.1738, - "step": 2980 - }, - { - "epoch": 0.08, - "learning_rate": 9.434629983732414e-06, - "loss": 0.1602, - "step": 2985 - }, - { - "epoch": 0.08, - "learning_rate": 9.43320300236879e-06, - "loss": 0.3211, - "step": 2990 - }, - { - "epoch": 0.08, - "learning_rate": 9.431776021005166e-06, - "loss": 0.2437, - "step": 2995 - }, - { - "epoch": 0.08, - "learning_rate": 9.430349039641543e-06, - "loss": 0.5782, - "step": 3000 - }, - { - "epoch": 0.08, - "learning_rate": 9.428922058277919e-06, - "loss": 0.2063, - "step": 3005 - }, - { - "epoch": 0.08, - "learning_rate": 9.427495076914295e-06, - "loss": 0.2657, - "step": 3010 - }, - { - "epoch": 0.08, - "learning_rate": 9.426068095550673e-06, - "loss": 0.2458, - "step": 3015 - }, - { - "epoch": 0.08, - "learning_rate": 9.42464111418705e-06, - "loss": 0.1792, - "step": 3020 - }, - { - "epoch": 0.08, - "learning_rate": 9.423214132823426e-06, - "loss": 0.215, - "step": 3025 - }, - { - "epoch": 0.08, - "learning_rate": 9.421787151459802e-06, - "loss": 0.1876, - "step": 3030 - }, - { - "epoch": 0.08, - "learning_rate": 9.420360170096179e-06, - "loss": 0.2164, - "step": 3035 - }, - { - "epoch": 0.08, - "learning_rate": 9.418933188732557e-06, - "loss": 0.3034, - "step": 3040 - }, - { - "epoch": 0.08, - "learning_rate": 9.417506207368933e-06, - "loss": 0.3196, - "step": 3045 - }, - { - "epoch": 0.08, - "learning_rate": 9.41607922600531e-06, - "loss": 0.3141, - "step": 3050 - }, - { - "epoch": 0.08, - "learning_rate": 9.414652244641686e-06, - "loss": 0.1715, - "step": 3055 - }, - { - "epoch": 0.08, - "learning_rate": 9.413225263278062e-06, - "loss": 0.2603, - "step": 3060 - }, - { - "epoch": 0.09, - "learning_rate": 9.41179828191444e-06, - "loss": 0.207, - "step": 3065 - }, - { - "epoch": 0.09, - "learning_rate": 9.410371300550816e-06, - "loss": 0.2695, - "step": 3070 - }, - { - "epoch": 0.09, - "learning_rate": 9.408944319187193e-06, - "loss": 0.2754, - "step": 3075 - }, - { - "epoch": 0.09, - "learning_rate": 9.407517337823569e-06, - "loss": 0.1798, - "step": 3080 - }, - { - "epoch": 0.09, - "learning_rate": 9.406090356459945e-06, - "loss": 0.1376, - "step": 3085 - }, - { - "epoch": 0.09, - "learning_rate": 9.404663375096322e-06, - "loss": 0.2561, - "step": 3090 - }, - { - "epoch": 0.09, - "learning_rate": 9.403236393732698e-06, - "loss": 0.4096, - "step": 3095 - }, - { - "epoch": 0.09, - "learning_rate": 9.401809412369074e-06, - "loss": 0.6031, - "step": 3100 - }, - { - "epoch": 0.09, - "learning_rate": 9.40038243100545e-06, - "loss": 0.1809, - "step": 3105 - }, - { - "epoch": 0.09, - "learning_rate": 9.398955449641829e-06, - "loss": 0.1677, - "step": 3110 - }, - { - "epoch": 0.09, - "learning_rate": 9.397528468278205e-06, - "loss": 0.2089, - "step": 3115 - }, - { - "epoch": 0.09, - "learning_rate": 9.396101486914582e-06, - "loss": 0.1739, - "step": 3120 - }, - { - "epoch": 0.09, - "learning_rate": 9.394674505550958e-06, - "loss": 0.1027, - "step": 3125 - }, - { - "epoch": 0.09, - "learning_rate": 9.393247524187334e-06, - "loss": 0.277, - "step": 3130 - }, - { - "epoch": 0.09, - "learning_rate": 9.391820542823712e-06, - "loss": 0.2017, - "step": 3135 - }, - { - "epoch": 0.09, - "learning_rate": 9.390393561460089e-06, - "loss": 0.1102, - "step": 3140 - }, - { - "epoch": 0.09, - "learning_rate": 9.388966580096465e-06, - "loss": 0.2556, - "step": 3145 - }, - { - "epoch": 0.09, - "learning_rate": 9.387539598732841e-06, - "loss": 0.3088, - "step": 3150 - }, - { - "epoch": 0.09, - "learning_rate": 9.386112617369218e-06, - "loss": 0.2412, - "step": 3155 - }, - { - "epoch": 0.09, - "learning_rate": 9.384685636005596e-06, - "loss": 0.1554, - "step": 3160 - }, - { - "epoch": 0.09, - "learning_rate": 9.383258654641972e-06, - "loss": 0.2364, - "step": 3165 - }, - { - "epoch": 0.09, - "learning_rate": 9.381831673278348e-06, - "loss": 0.1928, - "step": 3170 - }, - { - "epoch": 0.09, - "learning_rate": 9.380404691914725e-06, - "loss": 0.2412, - "step": 3175 - }, - { - "epoch": 0.09, - "learning_rate": 9.378977710551101e-06, - "loss": 0.0616, - "step": 3180 - }, - { - "epoch": 0.09, - "learning_rate": 9.377550729187477e-06, - "loss": 0.1695, - "step": 3185 - }, - { - "epoch": 0.09, - "learning_rate": 9.376123747823854e-06, - "loss": 0.2261, - "step": 3190 - }, - { - "epoch": 0.09, - "learning_rate": 9.37469676646023e-06, - "loss": 0.3939, - "step": 3195 - }, - { - "epoch": 0.09, - "learning_rate": 9.373269785096606e-06, - "loss": 0.3573, - "step": 3200 - }, - { - "epoch": 0.09, - "learning_rate": 9.371842803732984e-06, - "loss": 0.1546, - "step": 3205 - }, - { - "epoch": 0.09, - "learning_rate": 9.37041582236936e-06, - "loss": 0.1995, - "step": 3210 - }, - { - "epoch": 0.09, - "learning_rate": 9.368988841005737e-06, - "loss": 0.1817, - "step": 3215 - }, - { - "epoch": 0.09, - "learning_rate": 9.367561859642113e-06, - "loss": 0.2167, - "step": 3220 - }, - { - "epoch": 0.09, - "learning_rate": 9.36613487827849e-06, - "loss": 0.0847, - "step": 3225 - }, - { - "epoch": 0.09, - "learning_rate": 9.364707896914868e-06, - "loss": 0.3077, - "step": 3230 - }, - { - "epoch": 0.09, - "learning_rate": 9.363280915551244e-06, - "loss": 0.1731, - "step": 3235 - }, - { - "epoch": 0.09, - "learning_rate": 9.36185393418762e-06, - "loss": 0.2065, - "step": 3240 - }, - { - "epoch": 0.09, - "learning_rate": 9.360426952823997e-06, - "loss": 0.2309, - "step": 3245 - }, - { - "epoch": 0.09, - "learning_rate": 9.358999971460373e-06, - "loss": 0.4587, - "step": 3250 - }, - { - "epoch": 0.09, - "learning_rate": 9.357572990096751e-06, - "loss": 0.1917, - "step": 3255 - }, - { - "epoch": 0.09, - "learning_rate": 9.356146008733127e-06, - "loss": 0.2364, - "step": 3260 - }, - { - "epoch": 0.09, - "learning_rate": 9.354719027369504e-06, - "loss": 0.2863, - "step": 3265 - }, - { - "epoch": 0.09, - "learning_rate": 9.35329204600588e-06, - "loss": 0.2016, - "step": 3270 - }, - { - "epoch": 0.09, - "learning_rate": 9.351865064642256e-06, - "loss": 0.0938, - "step": 3275 - }, - { - "epoch": 0.09, - "learning_rate": 9.350438083278633e-06, - "loss": 0.1143, - "step": 3280 - }, - { - "epoch": 0.09, - "learning_rate": 9.34901110191501e-06, - "loss": 0.1648, - "step": 3285 - }, - { - "epoch": 0.09, - "learning_rate": 9.347584120551385e-06, - "loss": 0.1564, - "step": 3290 - }, - { - "epoch": 0.09, - "learning_rate": 9.346157139187762e-06, - "loss": 0.2529, - "step": 3295 - }, - { - "epoch": 0.09, - "learning_rate": 9.34473015782414e-06, - "loss": 0.2956, - "step": 3300 - }, - { - "epoch": 0.09, - "learning_rate": 9.343303176460516e-06, - "loss": 0.2099, - "step": 3305 - }, - { - "epoch": 0.09, - "learning_rate": 9.341876195096893e-06, - "loss": 0.2067, - "step": 3310 - }, - { - "epoch": 0.09, - "learning_rate": 9.340449213733269e-06, - "loss": 0.1962, - "step": 3315 - }, - { - "epoch": 0.09, - "learning_rate": 9.339022232369645e-06, - "loss": 0.2011, - "step": 3320 - }, - { - "epoch": 0.09, - "learning_rate": 9.337595251006023e-06, - "loss": 0.2443, - "step": 3325 - }, - { - "epoch": 0.09, - "learning_rate": 9.3361682696424e-06, - "loss": 0.1325, - "step": 3330 - }, - { - "epoch": 0.09, - "learning_rate": 9.334741288278776e-06, - "loss": 0.0892, - "step": 3335 - }, - { - "epoch": 0.09, - "learning_rate": 9.333314306915152e-06, - "loss": 0.2842, - "step": 3340 - }, - { - "epoch": 0.09, - "learning_rate": 9.331887325551529e-06, - "loss": 0.3977, - "step": 3345 - }, - { - "epoch": 0.09, - "learning_rate": 9.330460344187907e-06, - "loss": 0.5102, - "step": 3350 - }, - { - "epoch": 0.09, - "learning_rate": 9.329033362824283e-06, - "loss": 0.2043, - "step": 3355 - }, - { - "epoch": 0.09, - "learning_rate": 9.32760638146066e-06, - "loss": 0.2347, - "step": 3360 - }, - { - "epoch": 0.09, - "learning_rate": 9.326179400097036e-06, - "loss": 0.1802, - "step": 3365 - }, - { - "epoch": 0.09, - "learning_rate": 9.324752418733412e-06, - "loss": 0.2627, - "step": 3370 - }, - { - "epoch": 0.09, - "learning_rate": 9.323325437369788e-06, - "loss": 0.2043, - "step": 3375 - }, - { - "epoch": 0.09, - "learning_rate": 9.321898456006165e-06, - "loss": 0.175, - "step": 3380 - }, - { - "epoch": 0.09, - "learning_rate": 9.320471474642541e-06, - "loss": 0.1667, - "step": 3385 - }, - { - "epoch": 0.09, - "learning_rate": 9.319044493278917e-06, - "loss": 0.1856, - "step": 3390 - }, - { - "epoch": 0.09, - "learning_rate": 9.317617511915295e-06, - "loss": 0.1524, - "step": 3395 - }, - { - "epoch": 0.09, - "learning_rate": 9.316190530551672e-06, - "loss": 0.5217, - "step": 3400 - }, - { - "epoch": 0.09, - "learning_rate": 9.314763549188048e-06, - "loss": 0.1621, - "step": 3405 - }, - { - "epoch": 0.09, - "learning_rate": 9.313336567824424e-06, - "loss": 0.2443, - "step": 3410 - }, - { - "epoch": 0.09, - "learning_rate": 9.3119095864608e-06, - "loss": 0.1285, - "step": 3415 - }, - { - "epoch": 0.09, - "learning_rate": 9.310482605097179e-06, - "loss": 0.2026, - "step": 3420 - }, - { - "epoch": 0.1, - "learning_rate": 9.309055623733555e-06, - "loss": 0.1533, - "step": 3425 - }, - { - "epoch": 0.1, - "learning_rate": 9.307628642369931e-06, - "loss": 0.1703, - "step": 3430 - }, - { - "epoch": 0.1, - "learning_rate": 9.306201661006308e-06, - "loss": 0.173, - "step": 3435 - }, - { - "epoch": 0.1, - "learning_rate": 9.304774679642684e-06, - "loss": 0.2034, - "step": 3440 - }, - { - "epoch": 0.1, - "learning_rate": 9.303347698279062e-06, - "loss": 0.3843, - "step": 3445 - }, - { - "epoch": 0.1, - "learning_rate": 9.301920716915438e-06, - "loss": 0.6026, - "step": 3450 - }, - { - "epoch": 0.1, - "learning_rate": 9.300493735551815e-06, - "loss": 0.2296, - "step": 3455 - }, - { - "epoch": 0.1, - "learning_rate": 9.299066754188191e-06, - "loss": 0.2542, - "step": 3460 - }, - { - "epoch": 0.1, - "learning_rate": 9.297639772824568e-06, - "loss": 0.2546, - "step": 3465 - }, - { - "epoch": 0.1, - "learning_rate": 9.296212791460944e-06, - "loss": 0.1721, - "step": 3470 - }, - { - "epoch": 0.1, - "learning_rate": 9.29478581009732e-06, - "loss": 0.1002, - "step": 3475 - }, - { - "epoch": 0.1, - "learning_rate": 9.293358828733697e-06, - "loss": 0.1049, - "step": 3480 - }, - { - "epoch": 0.1, - "learning_rate": 9.291931847370073e-06, - "loss": 0.1701, - "step": 3485 - }, - { - "epoch": 0.1, - "learning_rate": 9.290504866006451e-06, - "loss": 0.1776, - "step": 3490 - }, - { - "epoch": 0.1, - "learning_rate": 9.289077884642827e-06, - "loss": 0.3081, - "step": 3495 - }, - { - "epoch": 0.1, - "learning_rate": 9.287650903279204e-06, - "loss": 0.4832, - "step": 3500 - }, - { - "epoch": 0.1, - "learning_rate": 9.28622392191558e-06, - "loss": 0.1629, - "step": 3505 - }, - { - "epoch": 0.1, - "learning_rate": 9.284796940551956e-06, - "loss": 0.1529, - "step": 3510 - }, - { - "epoch": 0.1, - "learning_rate": 9.283369959188334e-06, - "loss": 0.2222, - "step": 3515 - }, - { - "epoch": 0.1, - "learning_rate": 9.28194297782471e-06, - "loss": 0.247, - "step": 3520 - }, - { - "epoch": 0.1, - "learning_rate": 9.280515996461087e-06, - "loss": 0.1803, - "step": 3525 - }, - { - "epoch": 0.1, - "learning_rate": 9.279089015097463e-06, - "loss": 0.1257, - "step": 3530 - }, - { - "epoch": 0.1, - "learning_rate": 9.27766203373384e-06, - "loss": 0.249, - "step": 3535 - }, - { - "epoch": 0.1, - "learning_rate": 9.276235052370218e-06, - "loss": 0.1671, - "step": 3540 - }, - { - "epoch": 0.1, - "learning_rate": 9.274808071006594e-06, - "loss": 0.3034, - "step": 3545 - }, - { - "epoch": 0.1, - "learning_rate": 9.27338108964297e-06, - "loss": 0.7076, - "step": 3550 - }, - { - "epoch": 0.1, - "learning_rate": 9.271954108279347e-06, - "loss": 0.198, - "step": 3555 - }, - { - "epoch": 0.1, - "learning_rate": 9.270527126915723e-06, - "loss": 0.2329, - "step": 3560 - }, - { - "epoch": 0.1, - "learning_rate": 9.2691001455521e-06, - "loss": 0.2115, - "step": 3565 - }, - { - "epoch": 0.1, - "learning_rate": 9.267673164188476e-06, - "loss": 0.241, - "step": 3570 - }, - { - "epoch": 0.1, - "learning_rate": 9.266246182824852e-06, - "loss": 0.1814, - "step": 3575 - }, - { - "epoch": 0.1, - "learning_rate": 9.26481920146123e-06, - "loss": 0.1618, - "step": 3580 - }, - { - "epoch": 0.1, - "learning_rate": 9.263392220097606e-06, - "loss": 0.1482, - "step": 3585 - }, - { - "epoch": 0.1, - "learning_rate": 9.261965238733983e-06, - "loss": 0.3956, - "step": 3590 - }, - { - "epoch": 0.1, - "learning_rate": 9.260538257370359e-06, - "loss": 0.3081, - "step": 3595 - }, - { - "epoch": 0.1, - "learning_rate": 9.259111276006735e-06, - "loss": 0.7055, - "step": 3600 - }, - { - "epoch": 0.1, - "learning_rate": 9.257684294643112e-06, - "loss": 0.1578, - "step": 3605 - }, - { - "epoch": 0.1, - "learning_rate": 9.25625731327949e-06, - "loss": 0.2141, - "step": 3610 - }, - { - "epoch": 0.1, - "learning_rate": 9.254830331915866e-06, - "loss": 0.2331, - "step": 3615 - }, - { - "epoch": 0.1, - "learning_rate": 9.253403350552242e-06, - "loss": 0.1813, - "step": 3620 - }, - { - "epoch": 0.1, - "learning_rate": 9.251976369188619e-06, - "loss": 0.1458, - "step": 3625 - }, - { - "epoch": 0.1, - "learning_rate": 9.250549387824995e-06, - "loss": 0.1256, - "step": 3630 - }, - { - "epoch": 0.1, - "learning_rate": 9.249122406461373e-06, - "loss": 0.1983, - "step": 3635 - }, - { - "epoch": 0.1, - "learning_rate": 9.24769542509775e-06, - "loss": 0.1667, - "step": 3640 - }, - { - "epoch": 0.1, - "learning_rate": 9.246268443734126e-06, - "loss": 0.4398, - "step": 3645 - }, - { - "epoch": 0.1, - "learning_rate": 9.244841462370502e-06, - "loss": 0.5002, - "step": 3650 - }, - { - "epoch": 0.1, - "learning_rate": 9.243414481006879e-06, - "loss": 0.192, - "step": 3655 - }, - { - "epoch": 0.1, - "learning_rate": 9.241987499643255e-06, - "loss": 0.2471, - "step": 3660 - }, - { - "epoch": 0.1, - "learning_rate": 9.240560518279633e-06, - "loss": 0.2014, - "step": 3665 - }, - { - "epoch": 0.1, - "learning_rate": 9.23913353691601e-06, - "loss": 0.2114, - "step": 3670 - }, - { - "epoch": 0.1, - "learning_rate": 9.237706555552386e-06, - "loss": 0.2025, - "step": 3675 - }, - { - "epoch": 0.1, - "learning_rate": 9.236279574188762e-06, - "loss": 0.0411, - "step": 3680 - }, - { - "epoch": 0.1, - "learning_rate": 9.234852592825138e-06, - "loss": 0.206, - "step": 3685 - }, - { - "epoch": 0.1, - "learning_rate": 9.233425611461515e-06, - "loss": 0.1223, - "step": 3690 - }, - { - "epoch": 0.1, - "learning_rate": 9.231998630097891e-06, - "loss": 0.2817, - "step": 3695 - }, - { - "epoch": 0.1, - "learning_rate": 9.230571648734267e-06, - "loss": 0.4316, - "step": 3700 - }, - { - "epoch": 0.1, - "learning_rate": 9.229144667370645e-06, - "loss": 0.2052, - "step": 3705 - }, - { - "epoch": 0.1, - "learning_rate": 9.227717686007022e-06, - "loss": 0.2416, - "step": 3710 - }, - { - "epoch": 0.1, - "learning_rate": 9.226290704643398e-06, - "loss": 0.1811, - "step": 3715 - }, - { - "epoch": 0.1, - "learning_rate": 9.224863723279774e-06, - "loss": 0.1848, - "step": 3720 - }, - { - "epoch": 0.1, - "learning_rate": 9.22343674191615e-06, - "loss": 0.0785, - "step": 3725 - }, - { - "epoch": 0.1, - "learning_rate": 9.222009760552529e-06, - "loss": 0.1411, - "step": 3730 - }, - { - "epoch": 0.1, - "learning_rate": 9.220582779188905e-06, - "loss": 0.0565, - "step": 3735 - }, - { - "epoch": 0.1, - "learning_rate": 9.219155797825281e-06, - "loss": 0.3228, - "step": 3740 - }, - { - "epoch": 0.1, - "learning_rate": 9.217728816461658e-06, - "loss": 0.3325, - "step": 3745 - }, - { - "epoch": 0.1, - "learning_rate": 9.216301835098034e-06, - "loss": 0.2787, - "step": 3750 - }, - { - "epoch": 0.1, - "learning_rate": 9.214874853734412e-06, - "loss": 0.1688, - "step": 3755 - }, - { - "epoch": 0.1, - "learning_rate": 9.213447872370788e-06, - "loss": 0.2905, - "step": 3760 - }, - { - "epoch": 0.1, - "learning_rate": 9.212020891007165e-06, - "loss": 0.2357, - "step": 3765 - }, - { - "epoch": 0.1, - "learning_rate": 9.210593909643541e-06, - "loss": 0.2019, - "step": 3770 - }, - { - "epoch": 0.1, - "learning_rate": 9.209166928279917e-06, - "loss": 0.2344, - "step": 3775 - }, - { - "epoch": 0.1, - "learning_rate": 9.207739946916294e-06, - "loss": 0.0983, - "step": 3780 - }, - { - "epoch": 0.11, - "learning_rate": 9.20631296555267e-06, - "loss": 0.0607, - "step": 3785 - }, - { - "epoch": 0.11, - "learning_rate": 9.204885984189046e-06, - "loss": 0.1757, - "step": 3790 - }, - { - "epoch": 0.11, - "learning_rate": 9.203459002825423e-06, - "loss": 0.2125, - "step": 3795 - }, - { - "epoch": 0.11, - "learning_rate": 9.2020320214618e-06, - "loss": 0.6506, - "step": 3800 - }, - { - "epoch": 0.11, - "learning_rate": 9.200605040098177e-06, - "loss": 0.208, - "step": 3805 - }, - { - "epoch": 0.11, - "learning_rate": 9.199178058734554e-06, - "loss": 0.1704, - "step": 3810 - }, - { - "epoch": 0.11, - "learning_rate": 9.19775107737093e-06, - "loss": 0.1661, - "step": 3815 - }, - { - "epoch": 0.11, - "learning_rate": 9.196324096007306e-06, - "loss": 0.3135, - "step": 3820 - }, - { - "epoch": 0.11, - "learning_rate": 9.194897114643684e-06, - "loss": 0.2682, - "step": 3825 - }, - { - "epoch": 0.11, - "learning_rate": 9.19347013328006e-06, - "loss": 0.0732, - "step": 3830 - }, - { - "epoch": 0.11, - "learning_rate": 9.192043151916437e-06, - "loss": 0.1708, - "step": 3835 - }, - { - "epoch": 0.11, - "learning_rate": 9.190616170552813e-06, - "loss": 0.1189, - "step": 3840 - }, - { - "epoch": 0.11, - "learning_rate": 9.189189189189191e-06, - "loss": 0.2076, - "step": 3845 - }, - { - "epoch": 0.11, - "learning_rate": 9.187762207825568e-06, - "loss": 0.5824, - "step": 3850 - }, - { - "epoch": 0.11, - "learning_rate": 9.186335226461944e-06, - "loss": 0.2316, - "step": 3855 - }, - { - "epoch": 0.11, - "learning_rate": 9.18490824509832e-06, - "loss": 0.239, - "step": 3860 - }, - { - "epoch": 0.11, - "learning_rate": 9.183481263734697e-06, - "loss": 0.2332, - "step": 3865 - }, - { - "epoch": 0.11, - "learning_rate": 9.182054282371073e-06, - "loss": 0.2173, - "step": 3870 - }, - { - "epoch": 0.11, - "learning_rate": 9.18062730100745e-06, - "loss": 0.0937, - "step": 3875 - }, - { - "epoch": 0.11, - "learning_rate": 9.179200319643826e-06, - "loss": 0.2231, - "step": 3880 - }, - { - "epoch": 0.11, - "learning_rate": 9.177773338280202e-06, - "loss": 0.3681, - "step": 3885 - }, - { - "epoch": 0.11, - "learning_rate": 9.176346356916578e-06, - "loss": 0.3334, - "step": 3890 - }, - { - "epoch": 0.11, - "learning_rate": 9.174919375552956e-06, - "loss": 0.3968, - "step": 3895 - }, - { - "epoch": 0.11, - "learning_rate": 9.173492394189333e-06, - "loss": 0.5548, - "step": 3900 - }, - { - "epoch": 0.11, - "learning_rate": 9.172065412825709e-06, - "loss": 0.146, - "step": 3905 - }, - { - "epoch": 0.11, - "learning_rate": 9.170638431462085e-06, - "loss": 0.2168, - "step": 3910 - }, - { - "epoch": 0.11, - "learning_rate": 9.169211450098462e-06, - "loss": 0.2161, - "step": 3915 - }, - { - "epoch": 0.11, - "learning_rate": 9.16778446873484e-06, - "loss": 0.1638, - "step": 3920 - }, - { - "epoch": 0.11, - "learning_rate": 9.166357487371216e-06, - "loss": 0.168, - "step": 3925 - }, - { - "epoch": 0.11, - "learning_rate": 9.164930506007592e-06, - "loss": 0.0929, - "step": 3930 - }, - { - "epoch": 0.11, - "learning_rate": 9.163503524643969e-06, - "loss": 0.2191, - "step": 3935 - }, - { - "epoch": 0.11, - "learning_rate": 9.162076543280347e-06, - "loss": 0.1826, - "step": 3940 - }, - { - "epoch": 0.11, - "learning_rate": 9.160649561916723e-06, - "loss": 0.4173, - "step": 3945 - }, - { - "epoch": 0.11, - "learning_rate": 9.1592225805531e-06, - "loss": 0.5063, - "step": 3950 - }, - { - "epoch": 0.11, - "learning_rate": 9.157795599189476e-06, - "loss": 0.2068, - "step": 3955 - }, - { - "epoch": 0.11, - "learning_rate": 9.156368617825852e-06, - "loss": 0.1955, - "step": 3960 - }, - { - "epoch": 0.11, - "learning_rate": 9.154941636462228e-06, - "loss": 0.2014, - "step": 3965 - }, - { - "epoch": 0.11, - "learning_rate": 9.153514655098605e-06, - "loss": 0.2034, - "step": 3970 - }, - { - "epoch": 0.11, - "learning_rate": 9.152087673734981e-06, - "loss": 0.2596, - "step": 3975 - }, - { - "epoch": 0.11, - "learning_rate": 9.150660692371357e-06, - "loss": 0.0777, - "step": 3980 - }, - { - "epoch": 0.11, - "learning_rate": 9.149233711007734e-06, - "loss": 0.1958, - "step": 3985 - }, - { - "epoch": 0.11, - "learning_rate": 9.147806729644112e-06, - "loss": 0.1974, - "step": 3990 - }, - { - "epoch": 0.11, - "learning_rate": 9.146379748280488e-06, - "loss": 0.2286, - "step": 3995 - }, - { - "epoch": 0.11, - "learning_rate": 9.144952766916865e-06, - "loss": 0.4232, - "step": 4000 - }, - { - "epoch": 0.11, - "eval_loss": 0.08065038919448853, - "eval_runtime": 2611.7113, - "eval_samples_per_second": 6.133, - "eval_steps_per_second": 1.533, - "eval_wer": 0.2415795167688424, - "step": 4000 - }, - { - "epoch": 0.11, - "learning_rate": 9.143525785553241e-06, - "loss": 0.2607, - "step": 4005 - }, - { - "epoch": 0.11, - "learning_rate": 9.142098804189617e-06, - "loss": 0.2374, - "step": 4010 - }, - { - "epoch": 0.11, - "learning_rate": 9.140671822825995e-06, - "loss": 0.2258, - "step": 4015 - }, - { - "epoch": 0.11, - "learning_rate": 9.139244841462372e-06, - "loss": 0.2825, - "step": 4020 - }, - { - "epoch": 0.11, - "learning_rate": 9.137817860098748e-06, - "loss": 0.2166, - "step": 4025 - }, - { - "epoch": 0.11, - "learning_rate": 9.136390878735124e-06, - "loss": 0.1085, - "step": 4030 - }, - { - "epoch": 0.11, - "learning_rate": 9.134963897371502e-06, - "loss": 0.244, - "step": 4035 - }, - { - "epoch": 0.11, - "learning_rate": 9.133536916007879e-06, - "loss": 0.2392, - "step": 4040 - }, - { - "epoch": 0.11, - "learning_rate": 9.132109934644255e-06, - "loss": 0.3185, - "step": 4045 - }, - { - "epoch": 0.11, - "learning_rate": 9.130682953280631e-06, - "loss": 0.4469, - "step": 4050 - }, - { - "epoch": 0.11, - "learning_rate": 9.129255971917008e-06, - "loss": 0.2549, - "step": 4055 - }, - { - "epoch": 0.11, - "learning_rate": 9.127828990553384e-06, - "loss": 0.1936, - "step": 4060 - }, - { - "epoch": 0.11, - "learning_rate": 9.12640200918976e-06, - "loss": 0.2288, - "step": 4065 - }, - { - "epoch": 0.11, - "learning_rate": 9.124975027826137e-06, - "loss": 0.2042, - "step": 4070 - }, - { - "epoch": 0.11, - "learning_rate": 9.123548046462513e-06, - "loss": 0.207, - "step": 4075 - }, - { - "epoch": 0.11, - "learning_rate": 9.12212106509889e-06, - "loss": 0.0934, - "step": 4080 - }, - { - "epoch": 0.11, - "learning_rate": 9.120694083735267e-06, - "loss": 0.2389, - "step": 4085 - }, - { - "epoch": 0.11, - "learning_rate": 9.119267102371644e-06, - "loss": 0.1741, - "step": 4090 - }, - { - "epoch": 0.11, - "learning_rate": 9.11784012100802e-06, - "loss": 0.2289, - "step": 4095 - }, - { - "epoch": 0.11, - "learning_rate": 9.116413139644396e-06, - "loss": 0.7276, - "step": 4100 - }, - { - "epoch": 0.11, - "learning_rate": 9.114986158280773e-06, - "loss": 0.2186, - "step": 4105 - }, - { - "epoch": 0.11, - "learning_rate": 9.11355917691715e-06, - "loss": 0.1656, - "step": 4110 - }, - { - "epoch": 0.11, - "learning_rate": 9.112132195553527e-06, - "loss": 0.1967, - "step": 4115 - }, - { - "epoch": 0.11, - "learning_rate": 9.110705214189903e-06, - "loss": 0.3377, - "step": 4120 - }, - { - "epoch": 0.11, - "learning_rate": 9.10927823282628e-06, - "loss": 0.1491, - "step": 4125 - }, - { - "epoch": 0.11, - "learning_rate": 9.107851251462658e-06, - "loss": 0.0329, - "step": 4130 - }, - { - "epoch": 0.11, - "learning_rate": 9.106424270099034e-06, - "loss": 0.0635, - "step": 4135 - }, - { - "epoch": 0.11, - "learning_rate": 9.10499728873541e-06, - "loss": 0.2521, - "step": 4140 - }, - { - "epoch": 0.12, - "learning_rate": 9.103570307371787e-06, - "loss": 0.4768, - "step": 4145 - }, - { - "epoch": 0.12, - "learning_rate": 9.102143326008163e-06, - "loss": 0.4017, - "step": 4150 - }, - { - "epoch": 0.12, - "learning_rate": 9.10071634464454e-06, - "loss": 0.1938, - "step": 4155 - }, - { - "epoch": 0.12, - "learning_rate": 9.099289363280916e-06, - "loss": 0.1638, - "step": 4160 - }, - { - "epoch": 0.12, - "learning_rate": 9.097862381917292e-06, - "loss": 0.2338, - "step": 4165 - }, - { - "epoch": 0.12, - "learning_rate": 9.096435400553669e-06, - "loss": 0.199, - "step": 4170 - }, - { - "epoch": 0.12, - "learning_rate": 9.095008419190045e-06, - "loss": 0.0978, - "step": 4175 - }, - { - "epoch": 0.12, - "learning_rate": 9.093581437826423e-06, - "loss": 0.1591, - "step": 4180 - }, - { - "epoch": 0.12, - "learning_rate": 9.0921544564628e-06, - "loss": 0.1114, - "step": 4185 - }, - { - "epoch": 0.12, - "learning_rate": 9.090727475099176e-06, - "loss": 0.2239, - "step": 4190 - }, - { - "epoch": 0.12, - "learning_rate": 9.089300493735552e-06, - "loss": 0.285, - "step": 4195 - }, - { - "epoch": 0.12, - "learning_rate": 9.08787351237193e-06, - "loss": 0.5391, - "step": 4200 - }, - { - "epoch": 0.12, - "learning_rate": 9.086446531008306e-06, - "loss": 0.2093, - "step": 4205 - }, - { - "epoch": 0.12, - "learning_rate": 9.085019549644683e-06, - "loss": 0.1986, - "step": 4210 - }, - { - "epoch": 0.12, - "learning_rate": 9.083592568281059e-06, - "loss": 0.2044, - "step": 4215 - }, - { - "epoch": 0.12, - "learning_rate": 9.082165586917435e-06, - "loss": 0.2003, - "step": 4220 - }, - { - "epoch": 0.12, - "learning_rate": 9.080738605553813e-06, - "loss": 0.2496, - "step": 4225 - }, - { - "epoch": 0.12, - "learning_rate": 9.07931162419019e-06, - "loss": 0.1269, - "step": 4230 - }, - { - "epoch": 0.12, - "learning_rate": 9.077884642826566e-06, - "loss": 0.0929, - "step": 4235 - }, - { - "epoch": 0.12, - "learning_rate": 9.076457661462942e-06, - "loss": 0.124, - "step": 4240 - }, - { - "epoch": 0.12, - "learning_rate": 9.075030680099319e-06, - "loss": 0.3424, - "step": 4245 - }, - { - "epoch": 0.12, - "learning_rate": 9.073603698735695e-06, - "loss": 0.4852, - "step": 4250 - }, - { - "epoch": 0.12, - "learning_rate": 9.072176717372071e-06, - "loss": 0.1921, - "step": 4255 - }, - { - "epoch": 0.12, - "learning_rate": 9.070749736008448e-06, - "loss": 0.2314, - "step": 4260 - }, - { - "epoch": 0.12, - "learning_rate": 9.069322754644824e-06, - "loss": 0.1731, - "step": 4265 - }, - { - "epoch": 0.12, - "learning_rate": 9.0678957732812e-06, - "loss": 0.2128, - "step": 4270 - }, - { - "epoch": 0.12, - "learning_rate": 9.066468791917578e-06, - "loss": 0.2346, - "step": 4275 - }, - { - "epoch": 0.12, - "learning_rate": 9.065041810553955e-06, - "loss": 0.0798, - "step": 4280 - }, - { - "epoch": 0.12, - "learning_rate": 9.063614829190331e-06, - "loss": 0.034, - "step": 4285 - }, - { - "epoch": 0.12, - "learning_rate": 9.062187847826707e-06, - "loss": 0.341, - "step": 4290 - }, - { - "epoch": 0.12, - "learning_rate": 9.060760866463085e-06, - "loss": 0.3448, - "step": 4295 - }, - { - "epoch": 0.12, - "learning_rate": 9.059333885099462e-06, - "loss": 0.5544, - "step": 4300 - }, - { - "epoch": 0.12, - "learning_rate": 9.057906903735838e-06, - "loss": 0.2297, - "step": 4305 - }, - { - "epoch": 0.12, - "learning_rate": 9.056479922372214e-06, - "loss": 0.1696, - "step": 4310 - }, - { - "epoch": 0.12, - "learning_rate": 9.05505294100859e-06, - "loss": 0.2084, - "step": 4315 - }, - { - "epoch": 0.12, - "learning_rate": 9.053625959644969e-06, - "loss": 0.221, - "step": 4320 - }, - { - "epoch": 0.12, - "learning_rate": 9.052198978281345e-06, - "loss": 0.1946, - "step": 4325 - }, - { - "epoch": 0.12, - "learning_rate": 9.050771996917722e-06, - "loss": 0.1071, - "step": 4330 - }, - { - "epoch": 0.12, - "learning_rate": 9.049345015554098e-06, - "loss": 0.1961, - "step": 4335 - }, - { - "epoch": 0.12, - "learning_rate": 9.047918034190474e-06, - "loss": 0.3092, - "step": 4340 - }, - { - "epoch": 0.12, - "learning_rate": 9.04649105282685e-06, - "loss": 0.4163, - "step": 4345 - }, - { - "epoch": 0.12, - "learning_rate": 9.045064071463227e-06, - "loss": 0.6229, - "step": 4350 - }, - { - "epoch": 0.12, - "learning_rate": 9.043637090099603e-06, - "loss": 0.2903, - "step": 4355 - }, - { - "epoch": 0.12, - "learning_rate": 9.04221010873598e-06, - "loss": 0.1842, - "step": 4360 - }, - { - "epoch": 0.12, - "learning_rate": 9.040783127372358e-06, - "loss": 0.1753, - "step": 4365 - }, - { - "epoch": 0.12, - "learning_rate": 9.039356146008734e-06, - "loss": 0.1974, - "step": 4370 - }, - { - "epoch": 0.12, - "learning_rate": 9.03792916464511e-06, - "loss": 0.1202, - "step": 4375 - }, - { - "epoch": 0.12, - "learning_rate": 9.036502183281487e-06, - "loss": 0.0612, - "step": 4380 - }, - { - "epoch": 0.12, - "learning_rate": 9.035075201917863e-06, - "loss": 0.1177, - "step": 4385 - }, - { - "epoch": 0.12, - "learning_rate": 9.033648220554241e-06, - "loss": 0.2192, - "step": 4390 - }, - { - "epoch": 0.12, - "learning_rate": 9.032221239190617e-06, - "loss": 0.4009, - "step": 4395 - }, - { - "epoch": 0.12, - "learning_rate": 9.030794257826994e-06, - "loss": 0.7506, - "step": 4400 - }, - { - "epoch": 0.12, - "learning_rate": 9.02936727646337e-06, - "loss": 0.1961, - "step": 4405 - }, - { - "epoch": 0.12, - "learning_rate": 9.027940295099746e-06, - "loss": 0.1984, - "step": 4410 - }, - { - "epoch": 0.12, - "learning_rate": 9.026513313736124e-06, - "loss": 0.1924, - "step": 4415 - }, - { - "epoch": 0.12, - "learning_rate": 9.0250863323725e-06, - "loss": 0.1851, - "step": 4420 - }, - { - "epoch": 0.12, - "learning_rate": 9.023659351008877e-06, - "loss": 0.1969, - "step": 4425 - }, - { - "epoch": 0.12, - "learning_rate": 9.022232369645253e-06, - "loss": 0.1534, - "step": 4430 - }, - { - "epoch": 0.12, - "learning_rate": 9.02080538828163e-06, - "loss": 0.2427, - "step": 4435 - }, - { - "epoch": 0.12, - "learning_rate": 9.019378406918006e-06, - "loss": 0.2435, - "step": 4440 - }, - { - "epoch": 0.12, - "learning_rate": 9.017951425554382e-06, - "loss": 0.2561, - "step": 4445 - }, - { - "epoch": 0.12, - "learning_rate": 9.016524444190759e-06, - "loss": 0.284, - "step": 4450 - }, - { - "epoch": 0.12, - "learning_rate": 9.015097462827137e-06, - "loss": 0.1331, - "step": 4455 - }, - { - "epoch": 0.12, - "learning_rate": 9.013670481463513e-06, - "loss": 0.2267, - "step": 4460 - }, - { - "epoch": 0.12, - "learning_rate": 9.01224350009989e-06, - "loss": 0.1998, - "step": 4465 - }, - { - "epoch": 0.12, - "learning_rate": 9.010816518736266e-06, - "loss": 0.2609, - "step": 4470 - }, - { - "epoch": 0.12, - "learning_rate": 9.009389537372642e-06, - "loss": 0.1334, - "step": 4475 - }, - { - "epoch": 0.12, - "learning_rate": 9.007962556009018e-06, - "loss": 0.0818, - "step": 4480 - }, - { - "epoch": 0.12, - "learning_rate": 9.006535574645396e-06, - "loss": 0.1239, - "step": 4485 - }, - { - "epoch": 0.12, - "learning_rate": 9.005108593281773e-06, - "loss": 0.3317, - "step": 4490 - }, - { - "epoch": 0.12, - "learning_rate": 9.00368161191815e-06, - "loss": 0.216, - "step": 4495 - }, - { - "epoch": 0.12, - "learning_rate": 9.002254630554526e-06, - "loss": 0.5137, - "step": 4500 - }, - { - "epoch": 0.13, - "learning_rate": 9.000827649190902e-06, - "loss": 0.2356, - "step": 4505 - }, - { - "epoch": 0.13, - "learning_rate": 8.99940066782728e-06, - "loss": 0.1811, - "step": 4510 - }, - { - "epoch": 0.13, - "learning_rate": 8.997973686463656e-06, - "loss": 0.2463, - "step": 4515 - }, - { - "epoch": 0.13, - "learning_rate": 8.996546705100033e-06, - "loss": 0.2877, - "step": 4520 - }, - { - "epoch": 0.13, - "learning_rate": 8.995119723736409e-06, - "loss": 0.2499, - "step": 4525 - }, - { - "epoch": 0.13, - "learning_rate": 8.993692742372785e-06, - "loss": 0.2056, - "step": 4530 - }, - { - "epoch": 0.13, - "learning_rate": 8.992265761009162e-06, - "loss": 0.0899, - "step": 4535 - }, - { - "epoch": 0.13, - "learning_rate": 8.990838779645538e-06, - "loss": 0.2066, - "step": 4540 - }, - { - "epoch": 0.13, - "learning_rate": 8.989411798281916e-06, - "loss": 0.1908, - "step": 4545 - }, - { - "epoch": 0.13, - "learning_rate": 8.987984816918292e-06, - "loss": 0.324, - "step": 4550 - }, - { - "epoch": 0.13, - "learning_rate": 8.986557835554669e-06, - "loss": 0.1409, - "step": 4555 - }, - { - "epoch": 0.13, - "learning_rate": 8.985130854191045e-06, - "loss": 0.2014, - "step": 4560 - }, - { - "epoch": 0.13, - "learning_rate": 8.983703872827421e-06, - "loss": 0.1857, - "step": 4565 - }, - { - "epoch": 0.13, - "learning_rate": 8.982276891463798e-06, - "loss": 0.2537, - "step": 4570 - }, - { - "epoch": 0.13, - "learning_rate": 8.980849910100174e-06, - "loss": 0.2109, - "step": 4575 - }, - { - "epoch": 0.13, - "learning_rate": 8.979422928736552e-06, - "loss": 0.1228, - "step": 4580 - }, - { - "epoch": 0.13, - "learning_rate": 8.977995947372928e-06, - "loss": 0.1489, - "step": 4585 - }, - { - "epoch": 0.13, - "learning_rate": 8.976568966009305e-06, - "loss": 0.1028, - "step": 4590 - }, - { - "epoch": 0.13, - "learning_rate": 8.975141984645681e-06, - "loss": 0.3634, - "step": 4595 - }, - { - "epoch": 0.13, - "learning_rate": 8.973715003282057e-06, - "loss": 0.5033, - "step": 4600 - }, - { - "epoch": 0.13, - "learning_rate": 8.972288021918435e-06, - "loss": 0.1769, - "step": 4605 - }, - { - "epoch": 0.13, - "learning_rate": 8.970861040554812e-06, - "loss": 0.2308, - "step": 4610 - }, - { - "epoch": 0.13, - "learning_rate": 8.969434059191188e-06, - "loss": 0.1799, - "step": 4615 - }, - { - "epoch": 0.13, - "learning_rate": 8.968007077827564e-06, - "loss": 0.2012, - "step": 4620 - }, - { - "epoch": 0.13, - "learning_rate": 8.96658009646394e-06, - "loss": 0.2702, - "step": 4625 - }, - { - "epoch": 0.13, - "learning_rate": 8.965153115100317e-06, - "loss": 0.1508, - "step": 4630 - }, - { - "epoch": 0.13, - "learning_rate": 8.963726133736695e-06, - "loss": 0.1771, - "step": 4635 - }, - { - "epoch": 0.13, - "learning_rate": 8.962299152373071e-06, - "loss": 0.0945, - "step": 4640 - }, - { - "epoch": 0.13, - "learning_rate": 8.960872171009448e-06, - "loss": 0.2389, - "step": 4645 - }, - { - "epoch": 0.13, - "learning_rate": 8.959445189645824e-06, - "loss": 0.5115, - "step": 4650 - }, - { - "epoch": 0.13, - "learning_rate": 8.9580182082822e-06, - "loss": 0.2057, - "step": 4655 - }, - { - "epoch": 0.13, - "learning_rate": 8.956591226918577e-06, - "loss": 0.1715, - "step": 4660 - }, - { - "epoch": 0.13, - "learning_rate": 8.955164245554953e-06, - "loss": 0.1947, - "step": 4665 - }, - { - "epoch": 0.13, - "learning_rate": 8.95373726419133e-06, - "loss": 0.19, - "step": 4670 - }, - { - "epoch": 0.13, - "learning_rate": 8.952310282827708e-06, - "loss": 0.257, - "step": 4675 - }, - { - "epoch": 0.13, - "learning_rate": 8.950883301464084e-06, - "loss": 0.15, - "step": 4680 - }, - { - "epoch": 0.13, - "learning_rate": 8.94945632010046e-06, - "loss": 0.1584, - "step": 4685 - }, - { - "epoch": 0.13, - "learning_rate": 8.948029338736837e-06, - "loss": 0.1429, - "step": 4690 - }, - { - "epoch": 0.13, - "learning_rate": 8.946602357373213e-06, - "loss": 0.2701, - "step": 4695 - }, - { - "epoch": 0.13, - "learning_rate": 8.945175376009591e-06, - "loss": 0.3097, - "step": 4700 - }, - { - "epoch": 0.13, - "learning_rate": 8.943748394645967e-06, - "loss": 0.2693, - "step": 4705 - }, - { - "epoch": 0.13, - "learning_rate": 8.942321413282344e-06, - "loss": 0.1758, - "step": 4710 - }, - { - "epoch": 0.13, - "learning_rate": 8.94089443191872e-06, - "loss": 0.2927, - "step": 4715 - }, - { - "epoch": 0.13, - "learning_rate": 8.939467450555096e-06, - "loss": 0.2062, - "step": 4720 - }, - { - "epoch": 0.13, - "learning_rate": 8.938040469191474e-06, - "loss": 0.1183, - "step": 4725 - }, - { - "epoch": 0.13, - "learning_rate": 8.93661348782785e-06, - "loss": 0.1886, - "step": 4730 - }, - { - "epoch": 0.13, - "learning_rate": 8.935186506464227e-06, - "loss": 0.0822, - "step": 4735 - }, - { - "epoch": 0.13, - "learning_rate": 8.933759525100603e-06, - "loss": 0.2749, - "step": 4740 - }, - { - "epoch": 0.13, - "learning_rate": 8.93233254373698e-06, - "loss": 0.2977, - "step": 4745 - }, - { - "epoch": 0.13, - "learning_rate": 8.930905562373356e-06, - "loss": 0.4549, - "step": 4750 - }, - { - "epoch": 0.13, - "learning_rate": 8.929478581009732e-06, - "loss": 0.1402, - "step": 4755 - }, - { - "epoch": 0.13, - "learning_rate": 8.928051599646109e-06, - "loss": 0.1788, - "step": 4760 - }, - { - "epoch": 0.13, - "learning_rate": 8.926624618282485e-06, - "loss": 0.1905, - "step": 4765 - }, - { - "epoch": 0.13, - "learning_rate": 8.925197636918863e-06, - "loss": 0.2435, - "step": 4770 - }, - { - "epoch": 0.13, - "learning_rate": 8.92377065555524e-06, - "loss": 0.0795, - "step": 4775 - }, - { - "epoch": 0.13, - "learning_rate": 8.922343674191616e-06, - "loss": 0.1603, - "step": 4780 - }, - { - "epoch": 0.13, - "learning_rate": 8.920916692827992e-06, - "loss": 0.1377, - "step": 4785 - }, - { - "epoch": 0.13, - "learning_rate": 8.919489711464368e-06, - "loss": 0.2565, - "step": 4790 - }, - { - "epoch": 0.13, - "learning_rate": 8.918062730100746e-06, - "loss": 0.3557, - "step": 4795 - }, - { - "epoch": 0.13, - "learning_rate": 8.916635748737123e-06, - "loss": 0.4561, - "step": 4800 - }, - { - "epoch": 0.13, - "learning_rate": 8.915208767373499e-06, - "loss": 0.1781, - "step": 4805 - }, - { - "epoch": 0.13, - "learning_rate": 8.913781786009875e-06, - "loss": 0.1467, - "step": 4810 - }, - { - "epoch": 0.13, - "learning_rate": 8.912354804646252e-06, - "loss": 0.1543, - "step": 4815 - }, - { - "epoch": 0.13, - "learning_rate": 8.91092782328263e-06, - "loss": 0.2281, - "step": 4820 - }, - { - "epoch": 0.13, - "learning_rate": 8.909500841919006e-06, - "loss": 0.1932, - "step": 4825 - }, - { - "epoch": 0.13, - "learning_rate": 8.908073860555382e-06, - "loss": 0.1857, - "step": 4830 - }, - { - "epoch": 0.13, - "learning_rate": 8.906646879191759e-06, - "loss": 0.1831, - "step": 4835 - }, - { - "epoch": 0.13, - "learning_rate": 8.905219897828135e-06, - "loss": 0.207, - "step": 4840 - }, - { - "epoch": 0.13, - "learning_rate": 8.903792916464512e-06, - "loss": 0.2404, - "step": 4845 - }, - { - "epoch": 0.13, - "learning_rate": 8.902365935100888e-06, - "loss": 0.4327, - "step": 4850 - }, - { - "epoch": 0.13, - "learning_rate": 8.900938953737264e-06, - "loss": 0.16, - "step": 4855 - }, - { - "epoch": 0.13, - "learning_rate": 8.89951197237364e-06, - "loss": 0.1548, - "step": 4860 - }, - { - "epoch": 0.13, - "learning_rate": 8.898084991010019e-06, - "loss": 0.2546, - "step": 4865 - }, - { - "epoch": 0.14, - "learning_rate": 8.896658009646395e-06, - "loss": 0.2301, - "step": 4870 - }, - { - "epoch": 0.14, - "learning_rate": 8.895231028282771e-06, - "loss": 0.1885, - "step": 4875 - }, - { - "epoch": 0.14, - "learning_rate": 8.893804046919148e-06, - "loss": 0.1039, - "step": 4880 - }, - { - "epoch": 0.14, - "learning_rate": 8.892377065555524e-06, - "loss": 0.1215, - "step": 4885 - }, - { - "epoch": 0.14, - "learning_rate": 8.890950084191902e-06, - "loss": 0.2017, - "step": 4890 - }, - { - "epoch": 0.14, - "learning_rate": 8.889523102828278e-06, - "loss": 0.2429, - "step": 4895 - }, - { - "epoch": 0.14, - "learning_rate": 8.888096121464655e-06, - "loss": 0.4522, - "step": 4900 - }, - { - "epoch": 0.14, - "learning_rate": 8.886669140101031e-06, - "loss": 0.2326, - "step": 4905 - }, - { - "epoch": 0.14, - "learning_rate": 8.885242158737407e-06, - "loss": 0.2617, - "step": 4910 - }, - { - "epoch": 0.14, - "learning_rate": 8.883815177373785e-06, - "loss": 0.1861, - "step": 4915 - }, - { - "epoch": 0.14, - "learning_rate": 8.882388196010162e-06, - "loss": 0.2249, - "step": 4920 - }, - { - "epoch": 0.14, - "learning_rate": 8.880961214646538e-06, - "loss": 0.1508, - "step": 4925 - }, - { - "epoch": 0.14, - "learning_rate": 8.879534233282914e-06, - "loss": 0.1548, - "step": 4930 - }, - { - "epoch": 0.14, - "learning_rate": 8.87810725191929e-06, - "loss": 0.1668, - "step": 4935 - }, - { - "epoch": 0.14, - "learning_rate": 8.876680270555667e-06, - "loss": 0.1921, - "step": 4940 - }, - { - "epoch": 0.14, - "learning_rate": 8.875253289192043e-06, - "loss": 0.1872, - "step": 4945 - }, - { - "epoch": 0.14, - "learning_rate": 8.87382630782842e-06, - "loss": 0.5628, - "step": 4950 - }, - { - "epoch": 0.14, - "learning_rate": 8.872399326464796e-06, - "loss": 0.2048, - "step": 4955 - }, - { - "epoch": 0.14, - "learning_rate": 8.870972345101174e-06, - "loss": 0.1782, - "step": 4960 - }, - { - "epoch": 0.14, - "learning_rate": 8.86954536373755e-06, - "loss": 0.1839, - "step": 4965 - }, - { - "epoch": 0.14, - "learning_rate": 8.868118382373927e-06, - "loss": 0.2331, - "step": 4970 - }, - { - "epoch": 0.14, - "learning_rate": 8.866691401010303e-06, - "loss": 0.0948, - "step": 4975 - }, - { - "epoch": 0.14, - "learning_rate": 8.86526441964668e-06, - "loss": 0.071, - "step": 4980 - }, - { - "epoch": 0.14, - "learning_rate": 8.863837438283057e-06, - "loss": 0.2554, - "step": 4985 - }, - { - "epoch": 0.14, - "learning_rate": 8.862410456919434e-06, - "loss": 0.3874, - "step": 4990 - }, - { - "epoch": 0.14, - "learning_rate": 8.86098347555581e-06, - "loss": 0.3417, - "step": 4995 - }, - { - "epoch": 0.14, - "learning_rate": 8.859556494192186e-06, - "loss": 0.4399, - "step": 5000 - }, - { - "epoch": 0.14, - "learning_rate": 8.858129512828563e-06, - "loss": 0.1944, - "step": 5005 - }, - { - "epoch": 0.14, - "learning_rate": 8.856702531464941e-06, - "loss": 0.2096, - "step": 5010 - }, - { - "epoch": 0.14, - "learning_rate": 8.855275550101317e-06, - "loss": 0.2665, - "step": 5015 - }, - { - "epoch": 0.14, - "learning_rate": 8.853848568737694e-06, - "loss": 0.2119, - "step": 5020 - }, - { - "epoch": 0.14, - "learning_rate": 8.85242158737407e-06, - "loss": 0.1429, - "step": 5025 - }, - { - "epoch": 0.14, - "learning_rate": 8.850994606010446e-06, - "loss": 0.1091, - "step": 5030 - }, - { - "epoch": 0.14, - "learning_rate": 8.849567624646823e-06, - "loss": 0.1028, - "step": 5035 - }, - { - "epoch": 0.14, - "learning_rate": 8.848140643283199e-06, - "loss": 0.23, - "step": 5040 - }, - { - "epoch": 0.14, - "learning_rate": 8.846713661919575e-06, - "loss": 0.324, - "step": 5045 - }, - { - "epoch": 0.14, - "learning_rate": 8.845286680555952e-06, - "loss": 0.3115, - "step": 5050 - }, - { - "epoch": 0.14, - "learning_rate": 8.84385969919233e-06, - "loss": 0.1982, - "step": 5055 - }, - { - "epoch": 0.14, - "learning_rate": 8.842432717828706e-06, - "loss": 0.1659, - "step": 5060 - }, - { - "epoch": 0.14, - "learning_rate": 8.841005736465082e-06, - "loss": 0.1552, - "step": 5065 - }, - { - "epoch": 0.14, - "learning_rate": 8.839578755101459e-06, - "loss": 0.2341, - "step": 5070 - }, - { - "epoch": 0.14, - "learning_rate": 8.838151773737835e-06, - "loss": 0.2016, - "step": 5075 - }, - { - "epoch": 0.14, - "learning_rate": 8.836724792374213e-06, - "loss": 0.1199, - "step": 5080 - }, - { - "epoch": 0.14, - "learning_rate": 8.83529781101059e-06, - "loss": 0.0833, - "step": 5085 - }, - { - "epoch": 0.14, - "learning_rate": 8.833870829646966e-06, - "loss": 0.1925, - "step": 5090 - }, - { - "epoch": 0.14, - "learning_rate": 8.832443848283342e-06, - "loss": 0.2766, - "step": 5095 - }, - { - "epoch": 0.14, - "learning_rate": 8.831016866919718e-06, - "loss": 0.5481, - "step": 5100 - }, - { - "epoch": 0.14, - "learning_rate": 8.829589885556096e-06, - "loss": 0.192, - "step": 5105 - }, - { - "epoch": 0.14, - "learning_rate": 8.828162904192473e-06, - "loss": 0.1816, - "step": 5110 - }, - { - "epoch": 0.14, - "learning_rate": 8.826735922828849e-06, - "loss": 0.1952, - "step": 5115 - }, - { - "epoch": 0.14, - "learning_rate": 8.825308941465225e-06, - "loss": 0.1743, - "step": 5120 - }, - { - "epoch": 0.14, - "learning_rate": 8.823881960101602e-06, - "loss": 0.1717, - "step": 5125 - }, - { - "epoch": 0.14, - "learning_rate": 8.822454978737978e-06, - "loss": 0.0976, - "step": 5130 - }, - { - "epoch": 0.14, - "learning_rate": 8.821027997374354e-06, - "loss": 0.2031, - "step": 5135 - }, - { - "epoch": 0.14, - "learning_rate": 8.81960101601073e-06, - "loss": 0.1639, - "step": 5140 - }, - { - "epoch": 0.14, - "learning_rate": 8.818174034647107e-06, - "loss": 0.3788, - "step": 5145 - }, - { - "epoch": 0.14, - "learning_rate": 8.816747053283485e-06, - "loss": 0.6995, - "step": 5150 - }, - { - "epoch": 0.14, - "learning_rate": 8.815320071919861e-06, - "loss": 0.3716, - "step": 5155 - }, - { - "epoch": 0.14, - "learning_rate": 8.813893090556238e-06, - "loss": 0.1552, - "step": 5160 - }, - { - "epoch": 0.14, - "learning_rate": 8.812466109192614e-06, - "loss": 0.1855, - "step": 5165 - }, - { - "epoch": 0.14, - "learning_rate": 8.81103912782899e-06, - "loss": 0.1795, - "step": 5170 - }, - { - "epoch": 0.14, - "learning_rate": 8.809612146465368e-06, - "loss": 0.0744, - "step": 5175 - }, - { - "epoch": 0.14, - "learning_rate": 8.808185165101745e-06, - "loss": 0.1431, - "step": 5180 - }, - { - "epoch": 0.14, - "learning_rate": 8.806758183738121e-06, - "loss": 0.2072, - "step": 5185 - }, - { - "epoch": 0.14, - "learning_rate": 8.805331202374498e-06, - "loss": 0.1924, - "step": 5190 - }, - { - "epoch": 0.14, - "learning_rate": 8.803904221010874e-06, - "loss": 0.223, - "step": 5195 - }, - { - "epoch": 0.14, - "learning_rate": 8.802477239647252e-06, - "loss": 0.5766, - "step": 5200 - }, - { - "epoch": 0.14, - "learning_rate": 8.801050258283628e-06, - "loss": 0.1885, - "step": 5205 - }, - { - "epoch": 0.14, - "learning_rate": 8.799623276920005e-06, - "loss": 0.1874, - "step": 5210 - }, - { - "epoch": 0.14, - "learning_rate": 8.798196295556381e-06, - "loss": 0.1505, - "step": 5215 - }, - { - "epoch": 0.14, - "learning_rate": 8.796769314192757e-06, - "loss": 0.1784, - "step": 5220 - }, - { - "epoch": 0.14, - "learning_rate": 8.795342332829134e-06, - "loss": 0.18, - "step": 5225 - }, - { - "epoch": 0.15, - "learning_rate": 8.79391535146551e-06, - "loss": 0.1108, - "step": 5230 - }, - { - "epoch": 0.15, - "learning_rate": 8.792488370101886e-06, - "loss": 0.1662, - "step": 5235 - }, - { - "epoch": 0.15, - "learning_rate": 8.791061388738263e-06, - "loss": 0.1483, - "step": 5240 - }, - { - "epoch": 0.15, - "learning_rate": 8.78963440737464e-06, - "loss": 0.3551, - "step": 5245 - }, - { - "epoch": 0.15, - "learning_rate": 8.788207426011017e-06, - "loss": 0.262, - "step": 5250 - }, - { - "epoch": 0.15, - "learning_rate": 8.786780444647393e-06, - "loss": 0.1899, - "step": 5255 - }, - { - "epoch": 0.15, - "learning_rate": 8.78535346328377e-06, - "loss": 0.2994, - "step": 5260 - }, - { - "epoch": 0.15, - "learning_rate": 8.783926481920146e-06, - "loss": 0.1549, - "step": 5265 - }, - { - "epoch": 0.15, - "learning_rate": 8.782499500556524e-06, - "loss": 0.2618, - "step": 5270 - }, - { - "epoch": 0.15, - "learning_rate": 8.7810725191929e-06, - "loss": 0.2002, - "step": 5275 - }, - { - "epoch": 0.15, - "learning_rate": 8.779645537829277e-06, - "loss": 0.0888, - "step": 5280 - }, - { - "epoch": 0.15, - "learning_rate": 8.778218556465653e-06, - "loss": 0.2511, - "step": 5285 - }, - { - "epoch": 0.15, - "learning_rate": 8.77679157510203e-06, - "loss": 0.3803, - "step": 5290 - }, - { - "epoch": 0.15, - "learning_rate": 8.775364593738407e-06, - "loss": 0.5372, - "step": 5295 - }, - { - "epoch": 0.15, - "learning_rate": 8.773937612374784e-06, - "loss": 0.5779, - "step": 5300 - }, - { - "epoch": 0.15, - "learning_rate": 8.77251063101116e-06, - "loss": 0.215, - "step": 5305 - }, - { - "epoch": 0.15, - "learning_rate": 8.771083649647536e-06, - "loss": 0.259, - "step": 5310 - }, - { - "epoch": 0.15, - "learning_rate": 8.769656668283913e-06, - "loss": 0.1478, - "step": 5315 - }, - { - "epoch": 0.15, - "learning_rate": 8.768229686920289e-06, - "loss": 0.1971, - "step": 5320 - }, - { - "epoch": 0.15, - "learning_rate": 8.766802705556665e-06, - "loss": 0.2074, - "step": 5325 - }, - { - "epoch": 0.15, - "learning_rate": 8.765375724193042e-06, - "loss": 0.1503, - "step": 5330 - }, - { - "epoch": 0.15, - "learning_rate": 8.76394874282942e-06, - "loss": 0.1515, - "step": 5335 - }, - { - "epoch": 0.15, - "learning_rate": 8.762521761465796e-06, - "loss": 0.3774, - "step": 5340 - }, - { - "epoch": 0.15, - "learning_rate": 8.761094780102172e-06, - "loss": 0.2298, - "step": 5345 - }, - { - "epoch": 0.15, - "learning_rate": 8.759667798738549e-06, - "loss": 0.556, - "step": 5350 - }, - { - "epoch": 0.15, - "learning_rate": 8.758240817374925e-06, - "loss": 0.2015, - "step": 5355 - }, - { - "epoch": 0.15, - "learning_rate": 8.756813836011301e-06, - "loss": 0.148, - "step": 5360 - }, - { - "epoch": 0.15, - "learning_rate": 8.75538685464768e-06, - "loss": 0.2125, - "step": 5365 - }, - { - "epoch": 0.15, - "learning_rate": 8.753959873284056e-06, - "loss": 0.2282, - "step": 5370 - }, - { - "epoch": 0.15, - "learning_rate": 8.752532891920432e-06, - "loss": 0.2395, - "step": 5375 - }, - { - "epoch": 0.15, - "learning_rate": 8.751105910556809e-06, - "loss": 0.0962, - "step": 5380 - }, - { - "epoch": 0.15, - "learning_rate": 8.749678929193185e-06, - "loss": 0.1118, - "step": 5385 - }, - { - "epoch": 0.15, - "learning_rate": 8.748251947829563e-06, - "loss": 0.2768, - "step": 5390 - }, - { - "epoch": 0.15, - "learning_rate": 8.74682496646594e-06, - "loss": 0.3651, - "step": 5395 - }, - { - "epoch": 0.15, - "learning_rate": 8.745397985102316e-06, - "loss": 0.5803, - "step": 5400 - }, - { - "epoch": 0.15, - "learning_rate": 8.743971003738692e-06, - "loss": 0.1585, - "step": 5405 - }, - { - "epoch": 0.15, - "learning_rate": 8.742544022375068e-06, - "loss": 0.2192, - "step": 5410 - }, - { - "epoch": 0.15, - "learning_rate": 8.741117041011445e-06, - "loss": 0.2076, - "step": 5415 - }, - { - "epoch": 0.15, - "learning_rate": 8.739690059647823e-06, - "loss": 0.2241, - "step": 5420 - }, - { - "epoch": 0.15, - "learning_rate": 8.738263078284199e-06, - "loss": 0.1996, - "step": 5425 - }, - { - "epoch": 0.15, - "learning_rate": 8.736836096920575e-06, - "loss": 0.1283, - "step": 5430 - }, - { - "epoch": 0.15, - "learning_rate": 8.735409115556952e-06, - "loss": 0.2356, - "step": 5435 - }, - { - "epoch": 0.15, - "learning_rate": 8.733982134193328e-06, - "loss": 0.1745, - "step": 5440 - }, - { - "epoch": 0.15, - "learning_rate": 8.732555152829704e-06, - "loss": 0.2165, - "step": 5445 - }, - { - "epoch": 0.15, - "learning_rate": 8.73112817146608e-06, - "loss": 0.6278, - "step": 5450 - }, - { - "epoch": 0.15, - "learning_rate": 8.729701190102457e-06, - "loss": 0.1927, - "step": 5455 - }, - { - "epoch": 0.15, - "learning_rate": 8.728274208738835e-06, - "loss": 0.2593, - "step": 5460 - }, - { - "epoch": 0.15, - "learning_rate": 8.726847227375211e-06, - "loss": 0.1807, - "step": 5465 - }, - { - "epoch": 0.15, - "learning_rate": 8.725420246011588e-06, - "loss": 0.1971, - "step": 5470 - }, - { - "epoch": 0.15, - "learning_rate": 8.723993264647964e-06, - "loss": 0.1768, - "step": 5475 - }, - { - "epoch": 0.15, - "learning_rate": 8.72256628328434e-06, - "loss": 0.1762, - "step": 5480 - }, - { - "epoch": 0.15, - "learning_rate": 8.721139301920718e-06, - "loss": 0.1797, - "step": 5485 - }, - { - "epoch": 0.15, - "learning_rate": 8.719712320557095e-06, - "loss": 0.1995, - "step": 5490 - }, - { - "epoch": 0.15, - "learning_rate": 8.718285339193471e-06, - "loss": 0.2537, - "step": 5495 - }, - { - "epoch": 0.15, - "learning_rate": 8.716858357829847e-06, - "loss": 0.4993, - "step": 5500 - }, - { - "epoch": 0.15, - "learning_rate": 8.715431376466224e-06, - "loss": 0.1784, - "step": 5505 - }, - { - "epoch": 0.15, - "learning_rate": 8.714004395102602e-06, - "loss": 0.2367, - "step": 5510 - }, - { - "epoch": 0.15, - "learning_rate": 8.712577413738978e-06, - "loss": 0.1833, - "step": 5515 - }, - { - "epoch": 0.15, - "learning_rate": 8.711150432375354e-06, - "loss": 0.2138, - "step": 5520 - }, - { - "epoch": 0.15, - "learning_rate": 8.70972345101173e-06, - "loss": 0.1933, - "step": 5525 - }, - { - "epoch": 0.15, - "learning_rate": 8.708296469648107e-06, - "loss": 0.1948, - "step": 5530 - }, - { - "epoch": 0.15, - "learning_rate": 8.706869488284484e-06, - "loss": 0.0868, - "step": 5535 - }, - { - "epoch": 0.15, - "learning_rate": 8.70544250692086e-06, - "loss": 0.2228, - "step": 5540 - }, - { - "epoch": 0.15, - "learning_rate": 8.704015525557236e-06, - "loss": 0.263, - "step": 5545 - }, - { - "epoch": 0.15, - "learning_rate": 8.702588544193613e-06, - "loss": 0.4862, - "step": 5550 - }, - { - "epoch": 0.15, - "learning_rate": 8.70116156282999e-06, - "loss": 0.2016, - "step": 5555 - }, - { - "epoch": 0.15, - "learning_rate": 8.699734581466367e-06, - "loss": 0.1936, - "step": 5560 - }, - { - "epoch": 0.15, - "learning_rate": 8.698307600102743e-06, - "loss": 0.2058, - "step": 5565 - }, - { - "epoch": 0.15, - "learning_rate": 8.69688061873912e-06, - "loss": 0.4567, - "step": 5570 - }, - { - "epoch": 0.15, - "learning_rate": 8.695453637375496e-06, - "loss": 0.1977, - "step": 5575 - }, - { - "epoch": 0.15, - "learning_rate": 8.694026656011874e-06, - "loss": 0.0746, - "step": 5580 - }, - { - "epoch": 0.15, - "learning_rate": 8.69259967464825e-06, - "loss": 0.2863, - "step": 5585 - }, - { - "epoch": 0.16, - "learning_rate": 8.691172693284627e-06, - "loss": 0.1975, - "step": 5590 - }, - { - "epoch": 0.16, - "learning_rate": 8.689745711921003e-06, - "loss": 0.3318, - "step": 5595 - }, - { - "epoch": 0.16, - "learning_rate": 8.688318730557381e-06, - "loss": 0.283, - "step": 5600 - }, - { - "epoch": 0.16, - "learning_rate": 8.686891749193757e-06, - "loss": 0.173, - "step": 5605 - }, - { - "epoch": 0.16, - "learning_rate": 8.685464767830134e-06, - "loss": 0.1533, - "step": 5610 - }, - { - "epoch": 0.16, - "learning_rate": 8.68403778646651e-06, - "loss": 0.1697, - "step": 5615 - }, - { - "epoch": 0.16, - "learning_rate": 8.682610805102886e-06, - "loss": 0.1507, - "step": 5620 - }, - { - "epoch": 0.16, - "learning_rate": 8.681183823739263e-06, - "loss": 0.1705, - "step": 5625 - }, - { - "epoch": 0.16, - "learning_rate": 8.679756842375639e-06, - "loss": 0.0738, - "step": 5630 - }, - { - "epoch": 0.16, - "learning_rate": 8.678329861012015e-06, - "loss": 0.1915, - "step": 5635 - }, - { - "epoch": 0.16, - "learning_rate": 8.676902879648392e-06, - "loss": 0.2064, - "step": 5640 - }, - { - "epoch": 0.16, - "learning_rate": 8.675475898284768e-06, - "loss": 0.1501, - "step": 5645 - }, - { - "epoch": 0.16, - "learning_rate": 8.674048916921146e-06, - "loss": 0.4604, - "step": 5650 - }, - { - "epoch": 0.16, - "learning_rate": 8.672621935557522e-06, - "loss": 0.1099, - "step": 5655 - }, - { - "epoch": 0.16, - "learning_rate": 8.671194954193899e-06, - "loss": 0.1849, - "step": 5660 - }, - { - "epoch": 0.16, - "learning_rate": 8.669767972830275e-06, - "loss": 0.2311, - "step": 5665 - }, - { - "epoch": 0.16, - "learning_rate": 8.668340991466651e-06, - "loss": 0.1917, - "step": 5670 - }, - { - "epoch": 0.16, - "learning_rate": 8.66691401010303e-06, - "loss": 0.2114, - "step": 5675 - }, - { - "epoch": 0.16, - "learning_rate": 8.665487028739406e-06, - "loss": 0.0909, - "step": 5680 - }, - { - "epoch": 0.16, - "learning_rate": 8.664060047375782e-06, - "loss": 0.2297, - "step": 5685 - }, - { - "epoch": 0.16, - "learning_rate": 8.662633066012158e-06, - "loss": 0.1691, - "step": 5690 - }, - { - "epoch": 0.16, - "learning_rate": 8.661206084648537e-06, - "loss": 0.3327, - "step": 5695 - }, - { - "epoch": 0.16, - "learning_rate": 8.659779103284913e-06, - "loss": 0.772, - "step": 5700 - }, - { - "epoch": 0.16, - "learning_rate": 8.65835212192129e-06, - "loss": 0.1924, - "step": 5705 - }, - { - "epoch": 0.16, - "learning_rate": 8.656925140557666e-06, - "loss": 0.2268, - "step": 5710 - }, - { - "epoch": 0.16, - "learning_rate": 8.655498159194042e-06, - "loss": 0.2013, - "step": 5715 - }, - { - "epoch": 0.16, - "learning_rate": 8.654071177830418e-06, - "loss": 0.2103, - "step": 5720 - }, - { - "epoch": 0.16, - "learning_rate": 8.652644196466795e-06, - "loss": 0.2448, - "step": 5725 - }, - { - "epoch": 0.16, - "learning_rate": 8.651217215103171e-06, - "loss": 0.099, - "step": 5730 - }, - { - "epoch": 0.16, - "learning_rate": 8.649790233739547e-06, - "loss": 0.1983, - "step": 5735 - }, - { - "epoch": 0.16, - "learning_rate": 8.648363252375924e-06, - "loss": 0.0715, - "step": 5740 - }, - { - "epoch": 0.16, - "learning_rate": 8.646936271012302e-06, - "loss": 0.2699, - "step": 5745 - }, - { - "epoch": 0.16, - "learning_rate": 8.645509289648678e-06, - "loss": 0.4508, - "step": 5750 - }, - { - "epoch": 0.16, - "learning_rate": 8.644082308285054e-06, - "loss": 0.1935, - "step": 5755 - }, - { - "epoch": 0.16, - "learning_rate": 8.64265532692143e-06, - "loss": 0.1979, - "step": 5760 - }, - { - "epoch": 0.16, - "learning_rate": 8.641228345557807e-06, - "loss": 0.1516, - "step": 5765 - }, - { - "epoch": 0.16, - "learning_rate": 8.639801364194185e-06, - "loss": 0.1582, - "step": 5770 - }, - { - "epoch": 0.16, - "learning_rate": 8.638374382830561e-06, - "loss": 0.1515, - "step": 5775 - }, - { - "epoch": 0.16, - "learning_rate": 8.636947401466938e-06, - "loss": 0.0538, - "step": 5780 - }, - { - "epoch": 0.16, - "learning_rate": 8.635520420103314e-06, - "loss": 0.1432, - "step": 5785 - }, - { - "epoch": 0.16, - "learning_rate": 8.634093438739692e-06, - "loss": 0.266, - "step": 5790 - }, - { - "epoch": 0.16, - "learning_rate": 8.632666457376068e-06, - "loss": 0.5542, - "step": 5795 - }, - { - "epoch": 0.16, - "learning_rate": 8.631239476012445e-06, - "loss": 0.2882, - "step": 5800 - }, - { - "epoch": 0.16, - "learning_rate": 8.629812494648821e-06, - "loss": 0.2182, - "step": 5805 - }, - { - "epoch": 0.16, - "learning_rate": 8.628385513285197e-06, - "loss": 0.2666, - "step": 5810 - }, - { - "epoch": 0.16, - "learning_rate": 8.626958531921574e-06, - "loss": 0.1588, - "step": 5815 - }, - { - "epoch": 0.16, - "learning_rate": 8.62553155055795e-06, - "loss": 0.241, - "step": 5820 - }, - { - "epoch": 0.16, - "learning_rate": 8.624104569194326e-06, - "loss": 0.0942, - "step": 5825 - }, - { - "epoch": 0.16, - "learning_rate": 8.622677587830703e-06, - "loss": 0.0784, - "step": 5830 - }, - { - "epoch": 0.16, - "learning_rate": 8.621250606467079e-06, - "loss": 0.1611, - "step": 5835 - }, - { - "epoch": 0.16, - "learning_rate": 8.619823625103457e-06, - "loss": 0.1319, - "step": 5840 - }, - { - "epoch": 0.16, - "learning_rate": 8.618396643739833e-06, - "loss": 0.4533, - "step": 5845 - }, - { - "epoch": 0.16, - "learning_rate": 8.61696966237621e-06, - "loss": 0.4332, - "step": 5850 - }, - { - "epoch": 0.16, - "learning_rate": 8.615542681012586e-06, - "loss": 0.1972, - "step": 5855 - }, - { - "epoch": 0.16, - "learning_rate": 8.614115699648962e-06, - "loss": 0.2395, - "step": 5860 - }, - { - "epoch": 0.16, - "learning_rate": 8.61268871828534e-06, - "loss": 0.2174, - "step": 5865 - }, - { - "epoch": 0.16, - "learning_rate": 8.611261736921717e-06, - "loss": 0.2569, - "step": 5870 - }, - { - "epoch": 0.16, - "learning_rate": 8.609834755558093e-06, - "loss": 0.1612, - "step": 5875 - }, - { - "epoch": 0.16, - "learning_rate": 8.60840777419447e-06, - "loss": 0.1016, - "step": 5880 - }, - { - "epoch": 0.16, - "learning_rate": 8.606980792830848e-06, - "loss": 0.1382, - "step": 5885 - }, - { - "epoch": 0.16, - "learning_rate": 8.605553811467224e-06, - "loss": 0.2932, - "step": 5890 - }, - { - "epoch": 0.16, - "learning_rate": 8.6041268301036e-06, - "loss": 0.3552, - "step": 5895 - }, - { - "epoch": 0.16, - "learning_rate": 8.602699848739977e-06, - "loss": 0.6778, - "step": 5900 - }, - { - "epoch": 0.16, - "learning_rate": 8.601272867376353e-06, - "loss": 0.1395, - "step": 5905 - }, - { - "epoch": 0.16, - "learning_rate": 8.59984588601273e-06, - "loss": 0.1618, - "step": 5910 - }, - { - "epoch": 0.16, - "learning_rate": 8.598418904649106e-06, - "loss": 0.2916, - "step": 5915 - }, - { - "epoch": 0.16, - "learning_rate": 8.596991923285482e-06, - "loss": 0.2307, - "step": 5920 - }, - { - "epoch": 0.16, - "learning_rate": 8.595564941921858e-06, - "loss": 0.1712, - "step": 5925 - }, - { - "epoch": 0.16, - "learning_rate": 8.594137960558235e-06, - "loss": 0.1044, - "step": 5930 - }, - { - "epoch": 0.16, - "learning_rate": 8.592710979194613e-06, - "loss": 0.1749, - "step": 5935 - }, - { - "epoch": 0.16, - "learning_rate": 8.591283997830989e-06, - "loss": 0.2064, - "step": 5940 - }, - { - "epoch": 0.16, - "learning_rate": 8.589857016467365e-06, - "loss": 0.2992, - "step": 5945 - }, - { - "epoch": 0.17, - "learning_rate": 8.588430035103742e-06, - "loss": 0.3827, - "step": 5950 - }, - { - "epoch": 0.17, - "learning_rate": 8.587003053740118e-06, - "loss": 0.2054, - "step": 5955 - }, - { - "epoch": 0.17, - "learning_rate": 8.585576072376496e-06, - "loss": 0.1882, - "step": 5960 - }, - { - "epoch": 0.17, - "learning_rate": 8.584149091012872e-06, - "loss": 0.1752, - "step": 5965 - }, - { - "epoch": 0.17, - "learning_rate": 8.582722109649249e-06, - "loss": 0.2178, - "step": 5970 - }, - { - "epoch": 0.17, - "learning_rate": 8.581295128285625e-06, - "loss": 0.1532, - "step": 5975 - }, - { - "epoch": 0.17, - "learning_rate": 8.579868146922003e-06, - "loss": 0.162, - "step": 5980 - }, - { - "epoch": 0.17, - "learning_rate": 8.57844116555838e-06, - "loss": 0.2166, - "step": 5985 - }, - { - "epoch": 0.17, - "learning_rate": 8.577014184194756e-06, - "loss": 0.2177, - "step": 5990 - }, - { - "epoch": 0.17, - "learning_rate": 8.575587202831132e-06, - "loss": 0.2964, - "step": 5995 - }, - { - "epoch": 0.17, - "learning_rate": 8.574160221467508e-06, - "loss": 0.3765, - "step": 6000 - }, - { - "epoch": 0.17, - "eval_loss": 0.0795619785785675, - "eval_runtime": 3436.6447, - "eval_samples_per_second": 4.661, - "eval_steps_per_second": 1.165, - "eval_wer": 0.2294266137756942, - "step": 6000 - }, - { - "epoch": 0.17, - "learning_rate": 8.572733240103885e-06, - "loss": 0.1503, - "step": 6005 - }, - { - "epoch": 0.17, - "learning_rate": 8.571306258740261e-06, - "loss": 0.2646, - "step": 6010 - }, - { - "epoch": 0.17, - "learning_rate": 8.569879277376637e-06, - "loss": 0.2817, - "step": 6015 - }, - { - "epoch": 0.17, - "learning_rate": 8.568452296013014e-06, - "loss": 0.2402, - "step": 6020 - }, - { - "epoch": 0.17, - "learning_rate": 8.56702531464939e-06, - "loss": 0.1246, - "step": 6025 - }, - { - "epoch": 0.17, - "learning_rate": 8.565598333285768e-06, - "loss": 0.1411, - "step": 6030 - }, - { - "epoch": 0.17, - "learning_rate": 8.564171351922144e-06, - "loss": 0.2098, - "step": 6035 - }, - { - "epoch": 0.17, - "learning_rate": 8.56274437055852e-06, - "loss": 0.1542, - "step": 6040 - }, - { - "epoch": 0.17, - "learning_rate": 8.561317389194897e-06, - "loss": 0.4184, - "step": 6045 - }, - { - "epoch": 0.17, - "learning_rate": 8.559890407831273e-06, - "loss": 0.4777, - "step": 6050 - }, - { - "epoch": 0.17, - "learning_rate": 8.558463426467652e-06, - "loss": 0.1435, - "step": 6055 - }, - { - "epoch": 0.17, - "learning_rate": 8.557036445104028e-06, - "loss": 0.1859, - "step": 6060 - }, - { - "epoch": 0.17, - "learning_rate": 8.555609463740404e-06, - "loss": 0.1865, - "step": 6065 - }, - { - "epoch": 0.17, - "learning_rate": 8.55418248237678e-06, - "loss": 0.2156, - "step": 6070 - }, - { - "epoch": 0.17, - "learning_rate": 8.552755501013159e-06, - "loss": 0.1261, - "step": 6075 - }, - { - "epoch": 0.17, - "learning_rate": 8.551328519649535e-06, - "loss": 0.2086, - "step": 6080 - }, - { - "epoch": 0.17, - "learning_rate": 8.549901538285911e-06, - "loss": 0.0838, - "step": 6085 - }, - { - "epoch": 0.17, - "learning_rate": 8.548474556922288e-06, - "loss": 0.2231, - "step": 6090 - }, - { - "epoch": 0.17, - "learning_rate": 8.547047575558664e-06, - "loss": 0.2857, - "step": 6095 - }, - { - "epoch": 0.17, - "learning_rate": 8.545905990467766e-06, - "loss": 0.4935, - "step": 6100 - }, - { - "epoch": 0.17, - "learning_rate": 8.544479009104142e-06, - "loss": 0.2334, - "step": 6105 - }, - { - "epoch": 0.17, - "learning_rate": 8.543052027740519e-06, - "loss": 0.2609, - "step": 6110 - }, - { - "epoch": 0.17, - "learning_rate": 8.541625046376895e-06, - "loss": 0.2063, - "step": 6115 - }, - { - "epoch": 0.17, - "learning_rate": 8.540198065013271e-06, - "loss": 0.1624, - "step": 6120 - }, - { - "epoch": 0.17, - "learning_rate": 8.538771083649648e-06, - "loss": 0.2474, - "step": 6125 - }, - { - "epoch": 0.17, - "learning_rate": 8.537344102286024e-06, - "loss": 0.1688, - "step": 6130 - }, - { - "epoch": 0.17, - "learning_rate": 8.5359171209224e-06, - "loss": 0.102, - "step": 6135 - }, - { - "epoch": 0.17, - "learning_rate": 8.534490139558778e-06, - "loss": 0.1941, - "step": 6140 - }, - { - "epoch": 0.17, - "learning_rate": 8.533063158195155e-06, - "loss": 0.2409, - "step": 6145 - }, - { - "epoch": 0.17, - "learning_rate": 8.531636176831531e-06, - "loss": 0.5918, - "step": 6150 - }, - { - "epoch": 0.17, - "learning_rate": 8.530209195467907e-06, - "loss": 0.6058, - "step": 6155 - }, - { - "epoch": 0.17, - "learning_rate": 8.528782214104284e-06, - "loss": 0.2429, - "step": 6160 - }, - { - "epoch": 0.17, - "learning_rate": 8.52735523274066e-06, - "loss": 0.2443, - "step": 6165 - }, - { - "epoch": 0.17, - "learning_rate": 8.525928251377038e-06, - "loss": 0.198, - "step": 6170 - }, - { - "epoch": 0.17, - "learning_rate": 8.524501270013414e-06, - "loss": 0.1545, - "step": 6175 - }, - { - "epoch": 0.17, - "learning_rate": 8.52307428864979e-06, - "loss": 0.1433, - "step": 6180 - }, - { - "epoch": 0.17, - "learning_rate": 8.521647307286167e-06, - "loss": 0.0983, - "step": 6185 - }, - { - "epoch": 0.17, - "learning_rate": 8.520220325922545e-06, - "loss": 0.1364, - "step": 6190 - }, - { - "epoch": 0.17, - "learning_rate": 8.518793344558922e-06, - "loss": 0.1471, - "step": 6195 - }, - { - "epoch": 0.17, - "learning_rate": 8.517366363195298e-06, - "loss": 0.5086, - "step": 6200 - }, - { - "epoch": 0.17, - "learning_rate": 8.515939381831674e-06, - "loss": 0.1766, - "step": 6205 - }, - { - "epoch": 0.17, - "learning_rate": 8.51451240046805e-06, - "loss": 0.2234, - "step": 6210 - }, - { - "epoch": 0.17, - "learning_rate": 8.513085419104427e-06, - "loss": 0.2427, - "step": 6215 - }, - { - "epoch": 0.17, - "learning_rate": 8.511658437740803e-06, - "loss": 0.2137, - "step": 6220 - }, - { - "epoch": 0.17, - "learning_rate": 8.51023145637718e-06, - "loss": 0.0814, - "step": 6225 - }, - { - "epoch": 0.17, - "learning_rate": 8.508804475013558e-06, - "loss": 0.2149, - "step": 6230 - }, - { - "epoch": 0.17, - "learning_rate": 8.507377493649934e-06, - "loss": 0.1671, - "step": 6235 - }, - { - "epoch": 0.17, - "learning_rate": 8.50595051228631e-06, - "loss": 0.2632, - "step": 6240 - }, - { - "epoch": 0.17, - "learning_rate": 8.504523530922687e-06, - "loss": 0.3538, - "step": 6245 - }, - { - "epoch": 0.17, - "learning_rate": 8.503096549559063e-06, - "loss": 0.5223, - "step": 6250 - }, - { - "epoch": 0.17, - "learning_rate": 8.50166956819544e-06, - "loss": 0.1936, - "step": 6255 - }, - { - "epoch": 0.17, - "learning_rate": 8.500242586831816e-06, - "loss": 0.1584, - "step": 6260 - }, - { - "epoch": 0.17, - "learning_rate": 8.498815605468194e-06, - "loss": 0.1398, - "step": 6265 - }, - { - "epoch": 0.17, - "learning_rate": 8.49738862410457e-06, - "loss": 0.1843, - "step": 6270 - }, - { - "epoch": 0.17, - "learning_rate": 8.495961642740946e-06, - "loss": 0.1717, - "step": 6275 - }, - { - "epoch": 0.17, - "learning_rate": 8.494534661377323e-06, - "loss": 0.0737, - "step": 6280 - }, - { - "epoch": 0.17, - "learning_rate": 8.4931076800137e-06, - "loss": 0.0921, - "step": 6285 - }, - { - "epoch": 0.17, - "learning_rate": 8.491680698650077e-06, - "loss": 0.2542, - "step": 6290 - }, - { - "epoch": 0.17, - "learning_rate": 8.490253717286453e-06, - "loss": 0.2339, - "step": 6295 - }, - { - "epoch": 0.17, - "learning_rate": 8.48882673592283e-06, - "loss": 0.5075, - "step": 6300 - }, - { - "epoch": 0.17, - "learning_rate": 8.487399754559206e-06, - "loss": 0.1163, - "step": 6305 - }, - { - "epoch": 0.18, - "learning_rate": 8.485972773195582e-06, - "loss": 0.1872, - "step": 6310 - }, - { - "epoch": 0.18, - "learning_rate": 8.484545791831959e-06, - "loss": 0.1719, - "step": 6315 - }, - { - "epoch": 0.18, - "learning_rate": 8.483118810468337e-06, - "loss": 0.2333, - "step": 6320 - }, - { - "epoch": 0.18, - "learning_rate": 8.481691829104713e-06, - "loss": 0.1895, - "step": 6325 - }, - { - "epoch": 0.18, - "learning_rate": 8.48026484774109e-06, - "loss": 0.0974, - "step": 6330 - }, - { - "epoch": 0.18, - "learning_rate": 8.478837866377466e-06, - "loss": 0.1817, - "step": 6335 - }, - { - "epoch": 0.18, - "learning_rate": 8.477410885013842e-06, - "loss": 0.2273, - "step": 6340 - }, - { - "epoch": 0.18, - "learning_rate": 8.475983903650218e-06, - "loss": 0.3048, - "step": 6345 - }, - { - "epoch": 0.18, - "learning_rate": 8.474556922286595e-06, - "loss": 0.4877, - "step": 6350 - }, - { - "epoch": 0.18, - "learning_rate": 8.473129940922971e-06, - "loss": 0.1744, - "step": 6355 - }, - { - "epoch": 0.18, - "learning_rate": 8.47170295955935e-06, - "loss": 0.138, - "step": 6360 - }, - { - "epoch": 0.18, - "learning_rate": 8.470275978195726e-06, - "loss": 0.108, - "step": 6365 - }, - { - "epoch": 0.18, - "learning_rate": 8.468848996832102e-06, - "loss": 0.1577, - "step": 6370 - }, - { - "epoch": 0.18, - "learning_rate": 8.467422015468478e-06, - "loss": 0.2492, - "step": 6375 - }, - { - "epoch": 0.18, - "learning_rate": 8.465995034104856e-06, - "loss": 0.0848, - "step": 6380 - }, - { - "epoch": 0.18, - "learning_rate": 8.464568052741233e-06, - "loss": 0.1697, - "step": 6385 - }, - { - "epoch": 0.18, - "learning_rate": 8.463141071377609e-06, - "loss": 0.3038, - "step": 6390 - }, - { - "epoch": 0.18, - "learning_rate": 8.461714090013985e-06, - "loss": 0.4789, - "step": 6395 - }, - { - "epoch": 0.18, - "learning_rate": 8.460287108650362e-06, - "loss": 0.5222, - "step": 6400 - }, - { - "epoch": 0.18, - "learning_rate": 8.45886012728674e-06, - "loss": 0.1689, - "step": 6405 - }, - { - "epoch": 0.18, - "learning_rate": 8.457433145923116e-06, - "loss": 0.1895, - "step": 6410 - }, - { - "epoch": 0.18, - "learning_rate": 8.456006164559492e-06, - "loss": 0.3185, - "step": 6415 - }, - { - "epoch": 0.18, - "learning_rate": 8.454579183195869e-06, - "loss": 0.2007, - "step": 6420 - }, - { - "epoch": 0.18, - "learning_rate": 8.453152201832245e-06, - "loss": 0.0862, - "step": 6425 - }, - { - "epoch": 0.18, - "learning_rate": 8.451725220468621e-06, - "loss": 0.1575, - "step": 6430 - }, - { - "epoch": 0.18, - "learning_rate": 8.450298239104998e-06, - "loss": 0.1323, - "step": 6435 - }, - { - "epoch": 0.18, - "learning_rate": 8.448871257741374e-06, - "loss": 0.205, - "step": 6440 - }, - { - "epoch": 0.18, - "learning_rate": 8.44744427637775e-06, - "loss": 0.4507, - "step": 6445 - }, - { - "epoch": 0.18, - "learning_rate": 8.446017295014127e-06, - "loss": 0.6509, - "step": 6450 - }, - { - "epoch": 0.18, - "learning_rate": 8.444590313650505e-06, - "loss": 0.1532, - "step": 6455 - }, - { - "epoch": 0.18, - "learning_rate": 8.443163332286881e-06, - "loss": 0.1993, - "step": 6460 - }, - { - "epoch": 0.18, - "learning_rate": 8.441736350923257e-06, - "loss": 0.2075, - "step": 6465 - }, - { - "epoch": 0.18, - "learning_rate": 8.440309369559634e-06, - "loss": 0.2406, - "step": 6470 - }, - { - "epoch": 0.18, - "learning_rate": 8.438882388196012e-06, - "loss": 0.1678, - "step": 6475 - }, - { - "epoch": 0.18, - "learning_rate": 8.437455406832388e-06, - "loss": 0.0898, - "step": 6480 - }, - { - "epoch": 0.18, - "learning_rate": 8.436028425468764e-06, - "loss": 0.0728, - "step": 6485 - }, - { - "epoch": 0.18, - "learning_rate": 8.43460144410514e-06, - "loss": 0.178, - "step": 6490 - }, - { - "epoch": 0.18, - "learning_rate": 8.433174462741517e-06, - "loss": 0.328, - "step": 6495 - }, - { - "epoch": 0.18, - "learning_rate": 8.431747481377895e-06, - "loss": 0.5988, - "step": 6500 - }, - { - "epoch": 0.18, - "learning_rate": 8.430320500014271e-06, - "loss": 0.2281, - "step": 6505 - }, - { - "epoch": 0.18, - "learning_rate": 8.428893518650648e-06, - "loss": 0.1533, - "step": 6510 - }, - { - "epoch": 0.18, - "learning_rate": 8.427466537287024e-06, - "loss": 0.1882, - "step": 6515 - }, - { - "epoch": 0.18, - "learning_rate": 8.4260395559234e-06, - "loss": 0.1461, - "step": 6520 - }, - { - "epoch": 0.18, - "learning_rate": 8.424612574559777e-06, - "loss": 0.1125, - "step": 6525 - }, - { - "epoch": 0.18, - "learning_rate": 8.423185593196153e-06, - "loss": 0.2008, - "step": 6530 - }, - { - "epoch": 0.18, - "learning_rate": 8.42175861183253e-06, - "loss": 0.1642, - "step": 6535 - }, - { - "epoch": 0.18, - "learning_rate": 8.420331630468906e-06, - "loss": 0.3273, - "step": 6540 - }, - { - "epoch": 0.18, - "learning_rate": 8.418904649105282e-06, - "loss": 0.1172, - "step": 6545 - }, - { - "epoch": 0.18, - "learning_rate": 8.41747766774166e-06, - "loss": 0.5899, - "step": 6550 - }, - { - "epoch": 0.18, - "learning_rate": 8.416050686378037e-06, - "loss": 0.226, - "step": 6555 - }, - { - "epoch": 0.18, - "learning_rate": 8.414623705014413e-06, - "loss": 0.1787, - "step": 6560 - }, - { - "epoch": 0.18, - "learning_rate": 8.41319672365079e-06, - "loss": 0.1932, - "step": 6565 - }, - { - "epoch": 0.18, - "learning_rate": 8.411769742287167e-06, - "loss": 0.3157, - "step": 6570 - }, - { - "epoch": 0.18, - "learning_rate": 8.410342760923544e-06, - "loss": 0.1779, - "step": 6575 - }, - { - "epoch": 0.18, - "learning_rate": 8.40891577955992e-06, - "loss": 0.0548, - "step": 6580 - }, - { - "epoch": 0.18, - "learning_rate": 8.407488798196296e-06, - "loss": 0.2249, - "step": 6585 - }, - { - "epoch": 0.18, - "learning_rate": 8.406061816832673e-06, - "loss": 0.3006, - "step": 6590 - }, - { - "epoch": 0.18, - "learning_rate": 8.40463483546905e-06, - "loss": 0.4068, - "step": 6595 - }, - { - "epoch": 0.18, - "learning_rate": 8.403207854105427e-06, - "loss": 0.4126, - "step": 6600 - }, - { - "epoch": 0.18, - "learning_rate": 8.401780872741803e-06, - "loss": 0.2776, - "step": 6605 - }, - { - "epoch": 0.18, - "learning_rate": 8.40035389137818e-06, - "loss": 0.2043, - "step": 6610 - }, - { - "epoch": 0.18, - "learning_rate": 8.398926910014556e-06, - "loss": 0.202, - "step": 6615 - }, - { - "epoch": 0.18, - "learning_rate": 8.397499928650932e-06, - "loss": 0.2153, - "step": 6620 - }, - { - "epoch": 0.18, - "learning_rate": 8.396072947287309e-06, - "loss": 0.1042, - "step": 6625 - }, - { - "epoch": 0.18, - "learning_rate": 8.394645965923685e-06, - "loss": 0.1125, - "step": 6630 - }, - { - "epoch": 0.18, - "learning_rate": 8.393218984560061e-06, - "loss": 0.2851, - "step": 6635 - }, - { - "epoch": 0.18, - "learning_rate": 8.39179200319644e-06, - "loss": 0.2376, - "step": 6640 - }, - { - "epoch": 0.18, - "learning_rate": 8.390365021832816e-06, - "loss": 0.3222, - "step": 6645 - }, - { - "epoch": 0.18, - "learning_rate": 8.388938040469192e-06, - "loss": 0.4322, - "step": 6650 - }, - { - "epoch": 0.18, - "learning_rate": 8.387511059105568e-06, - "loss": 0.1321, - "step": 6655 - }, - { - "epoch": 0.18, - "learning_rate": 8.386084077741945e-06, - "loss": 0.2256, - "step": 6660 - }, - { - "epoch": 0.18, - "learning_rate": 8.384657096378323e-06, - "loss": 0.1782, - "step": 6665 - }, - { - "epoch": 0.19, - "learning_rate": 8.383230115014699e-06, - "loss": 0.1718, - "step": 6670 - }, - { - "epoch": 0.19, - "learning_rate": 8.381803133651075e-06, - "loss": 0.241, - "step": 6675 - }, - { - "epoch": 0.19, - "learning_rate": 8.380376152287452e-06, - "loss": 0.2157, - "step": 6680 - }, - { - "epoch": 0.19, - "learning_rate": 8.378949170923828e-06, - "loss": 0.2164, - "step": 6685 - }, - { - "epoch": 0.19, - "learning_rate": 8.377522189560206e-06, - "loss": 0.1748, - "step": 6690 - }, - { - "epoch": 0.19, - "learning_rate": 8.376095208196583e-06, - "loss": 0.1148, - "step": 6695 - }, - { - "epoch": 0.19, - "learning_rate": 8.374668226832959e-06, - "loss": 0.3105, - "step": 6700 - }, - { - "epoch": 0.19, - "learning_rate": 8.373241245469335e-06, - "loss": 0.2214, - "step": 6705 - }, - { - "epoch": 0.19, - "learning_rate": 8.371814264105712e-06, - "loss": 0.1674, - "step": 6710 - }, - { - "epoch": 0.19, - "learning_rate": 8.370387282742088e-06, - "loss": 0.1968, - "step": 6715 - }, - { - "epoch": 0.19, - "learning_rate": 8.368960301378464e-06, - "loss": 0.2137, - "step": 6720 - }, - { - "epoch": 0.19, - "learning_rate": 8.36753332001484e-06, - "loss": 0.1645, - "step": 6725 - }, - { - "epoch": 0.19, - "learning_rate": 8.366106338651217e-06, - "loss": 0.1292, - "step": 6730 - }, - { - "epoch": 0.19, - "learning_rate": 8.364679357287595e-06, - "loss": 0.1719, - "step": 6735 - }, - { - "epoch": 0.19, - "learning_rate": 8.363252375923971e-06, - "loss": 0.2621, - "step": 6740 - }, - { - "epoch": 0.19, - "learning_rate": 8.361825394560348e-06, - "loss": 0.5572, - "step": 6745 - }, - { - "epoch": 0.19, - "learning_rate": 8.360398413196724e-06, - "loss": 0.4367, - "step": 6750 - }, - { - "epoch": 0.19, - "learning_rate": 8.3589714318331e-06, - "loss": 0.1601, - "step": 6755 - }, - { - "epoch": 0.19, - "learning_rate": 8.357544450469478e-06, - "loss": 0.2053, - "step": 6760 - }, - { - "epoch": 0.19, - "learning_rate": 8.356117469105855e-06, - "loss": 0.1942, - "step": 6765 - }, - { - "epoch": 0.19, - "learning_rate": 8.354690487742231e-06, - "loss": 0.1708, - "step": 6770 - }, - { - "epoch": 0.19, - "learning_rate": 8.353263506378607e-06, - "loss": 0.2491, - "step": 6775 - }, - { - "epoch": 0.19, - "learning_rate": 8.351836525014984e-06, - "loss": 0.1236, - "step": 6780 - }, - { - "epoch": 0.19, - "learning_rate": 8.350409543651362e-06, - "loss": 0.2253, - "step": 6785 - }, - { - "epoch": 0.19, - "learning_rate": 8.348982562287738e-06, - "loss": 0.2409, - "step": 6790 - }, - { - "epoch": 0.19, - "learning_rate": 8.347555580924114e-06, - "loss": 0.2078, - "step": 6795 - }, - { - "epoch": 0.19, - "learning_rate": 8.34612859956049e-06, - "loss": 0.4089, - "step": 6800 - }, - { - "epoch": 0.19, - "learning_rate": 8.344701618196867e-06, - "loss": 0.1342, - "step": 6805 - }, - { - "epoch": 0.19, - "learning_rate": 8.343274636833243e-06, - "loss": 0.1629, - "step": 6810 - }, - { - "epoch": 0.19, - "learning_rate": 8.34184765546962e-06, - "loss": 0.149, - "step": 6815 - }, - { - "epoch": 0.19, - "learning_rate": 8.340420674105996e-06, - "loss": 0.1979, - "step": 6820 - }, - { - "epoch": 0.19, - "learning_rate": 8.338993692742372e-06, - "loss": 0.1371, - "step": 6825 - }, - { - "epoch": 0.19, - "learning_rate": 8.33756671137875e-06, - "loss": 0.1345, - "step": 6830 - }, - { - "epoch": 0.19, - "learning_rate": 8.336139730015127e-06, - "loss": 0.3031, - "step": 6835 - }, - { - "epoch": 0.19, - "learning_rate": 8.334712748651503e-06, - "loss": 0.0934, - "step": 6840 - }, - { - "epoch": 0.19, - "learning_rate": 8.33328576728788e-06, - "loss": 0.3847, - "step": 6845 - }, - { - "epoch": 0.19, - "learning_rate": 8.331858785924256e-06, - "loss": 0.4262, - "step": 6850 - }, - { - "epoch": 0.19, - "learning_rate": 8.330431804560634e-06, - "loss": 0.2704, - "step": 6855 - }, - { - "epoch": 0.19, - "learning_rate": 8.32900482319701e-06, - "loss": 0.174, - "step": 6860 - }, - { - "epoch": 0.19, - "learning_rate": 8.327577841833386e-06, - "loss": 0.203, - "step": 6865 - }, - { - "epoch": 0.19, - "learning_rate": 8.326150860469763e-06, - "loss": 0.1766, - "step": 6870 - }, - { - "epoch": 0.19, - "learning_rate": 8.32472387910614e-06, - "loss": 0.1113, - "step": 6875 - }, - { - "epoch": 0.19, - "learning_rate": 8.323296897742517e-06, - "loss": 0.1789, - "step": 6880 - }, - { - "epoch": 0.19, - "learning_rate": 8.321869916378894e-06, - "loss": 0.1672, - "step": 6885 - }, - { - "epoch": 0.19, - "learning_rate": 8.32044293501527e-06, - "loss": 0.2633, - "step": 6890 - }, - { - "epoch": 0.19, - "learning_rate": 8.319015953651646e-06, - "loss": 0.3725, - "step": 6895 - }, - { - "epoch": 0.19, - "learning_rate": 8.317588972288023e-06, - "loss": 0.3129, - "step": 6900 - }, - { - "epoch": 0.19, - "learning_rate": 8.316161990924399e-06, - "loss": 0.2139, - "step": 6905 - }, - { - "epoch": 0.19, - "learning_rate": 8.314735009560775e-06, - "loss": 0.3623, - "step": 6910 - }, - { - "epoch": 0.19, - "learning_rate": 8.313308028197152e-06, - "loss": 0.1442, - "step": 6915 - }, - { - "epoch": 0.19, - "learning_rate": 8.311881046833528e-06, - "loss": 0.1482, - "step": 6920 - }, - { - "epoch": 0.19, - "learning_rate": 8.310454065469906e-06, - "loss": 0.2105, - "step": 6925 - }, - { - "epoch": 0.19, - "learning_rate": 8.309027084106282e-06, - "loss": 0.1828, - "step": 6930 - }, - { - "epoch": 0.19, - "learning_rate": 8.307600102742659e-06, - "loss": 0.1349, - "step": 6935 - }, - { - "epoch": 0.19, - "learning_rate": 8.306173121379035e-06, - "loss": 0.2098, - "step": 6940 - }, - { - "epoch": 0.19, - "learning_rate": 8.304746140015411e-06, - "loss": 0.3807, - "step": 6945 - }, - { - "epoch": 0.19, - "learning_rate": 8.30331915865179e-06, - "loss": 0.5789, - "step": 6950 - }, - { - "epoch": 0.19, - "learning_rate": 8.301892177288166e-06, - "loss": 0.1509, - "step": 6955 - }, - { - "epoch": 0.19, - "learning_rate": 8.300465195924542e-06, - "loss": 0.1647, - "step": 6960 - }, - { - "epoch": 0.19, - "learning_rate": 8.299038214560918e-06, - "loss": 0.1773, - "step": 6965 - }, - { - "epoch": 0.19, - "learning_rate": 8.297611233197295e-06, - "loss": 0.1803, - "step": 6970 - }, - { - "epoch": 0.19, - "learning_rate": 8.296184251833673e-06, - "loss": 0.2572, - "step": 6975 - }, - { - "epoch": 0.19, - "learning_rate": 8.294757270470049e-06, - "loss": 0.0578, - "step": 6980 - }, - { - "epoch": 0.19, - "learning_rate": 8.293330289106425e-06, - "loss": 0.194, - "step": 6985 - }, - { - "epoch": 0.19, - "learning_rate": 8.291903307742802e-06, - "loss": 0.2055, - "step": 6990 - }, - { - "epoch": 0.19, - "learning_rate": 8.290476326379178e-06, - "loss": 0.3183, - "step": 6995 - }, - { - "epoch": 0.19, - "learning_rate": 8.289049345015554e-06, - "loss": 0.5604, - "step": 7000 - }, - { - "epoch": 0.19, - "learning_rate": 8.28762236365193e-06, - "loss": 0.1832, - "step": 7005 - }, - { - "epoch": 0.19, - "learning_rate": 8.286195382288307e-06, - "loss": 0.229, - "step": 7010 - }, - { - "epoch": 0.19, - "learning_rate": 8.284768400924683e-06, - "loss": 0.1836, - "step": 7015 - }, - { - "epoch": 0.19, - "learning_rate": 8.283341419561061e-06, - "loss": 0.2354, - "step": 7020 - }, - { - "epoch": 0.19, - "learning_rate": 8.281914438197438e-06, - "loss": 0.1575, - "step": 7025 - }, - { - "epoch": 0.2, - "learning_rate": 8.280487456833814e-06, - "loss": 0.047, - "step": 7030 - }, - { - "epoch": 0.2, - "learning_rate": 8.27906047547019e-06, - "loss": 0.0861, - "step": 7035 - }, - { - "epoch": 0.2, - "learning_rate": 8.277633494106567e-06, - "loss": 0.2914, - "step": 7040 - }, - { - "epoch": 0.2, - "learning_rate": 8.276206512742945e-06, - "loss": 0.1699, - "step": 7045 - }, - { - "epoch": 0.2, - "learning_rate": 8.274779531379321e-06, - "loss": 0.3493, - "step": 7050 - }, - { - "epoch": 0.2, - "learning_rate": 8.273352550015698e-06, - "loss": 0.1849, - "step": 7055 - }, - { - "epoch": 0.2, - "learning_rate": 8.271925568652074e-06, - "loss": 0.1878, - "step": 7060 - }, - { - "epoch": 0.2, - "learning_rate": 8.27049858728845e-06, - "loss": 0.1817, - "step": 7065 - }, - { - "epoch": 0.2, - "learning_rate": 8.269071605924828e-06, - "loss": 0.1612, - "step": 7070 - }, - { - "epoch": 0.2, - "learning_rate": 8.267644624561205e-06, - "loss": 0.1838, - "step": 7075 - }, - { - "epoch": 0.2, - "learning_rate": 8.266217643197581e-06, - "loss": 0.1406, - "step": 7080 - }, - { - "epoch": 0.2, - "learning_rate": 8.264790661833957e-06, - "loss": 0.2158, - "step": 7085 - }, - { - "epoch": 0.2, - "learning_rate": 8.263363680470334e-06, - "loss": 0.3149, - "step": 7090 - }, - { - "epoch": 0.2, - "learning_rate": 8.26193669910671e-06, - "loss": 0.3768, - "step": 7095 - }, - { - "epoch": 0.2, - "learning_rate": 8.260509717743086e-06, - "loss": 0.4874, - "step": 7100 - }, - { - "epoch": 0.2, - "learning_rate": 8.259082736379464e-06, - "loss": 0.1532, - "step": 7105 - }, - { - "epoch": 0.2, - "learning_rate": 8.25765575501584e-06, - "loss": 0.1728, - "step": 7110 - }, - { - "epoch": 0.2, - "learning_rate": 8.256228773652217e-06, - "loss": 0.162, - "step": 7115 - }, - { - "epoch": 0.2, - "learning_rate": 8.254801792288593e-06, - "loss": 0.2831, - "step": 7120 - }, - { - "epoch": 0.2, - "learning_rate": 8.25337481092497e-06, - "loss": 0.1868, - "step": 7125 - }, - { - "epoch": 0.2, - "learning_rate": 8.251947829561346e-06, - "loss": 0.0658, - "step": 7130 - }, - { - "epoch": 0.2, - "learning_rate": 8.250520848197722e-06, - "loss": 0.2732, - "step": 7135 - }, - { - "epoch": 0.2, - "learning_rate": 8.2490938668341e-06, - "loss": 0.1974, - "step": 7140 - }, - { - "epoch": 0.2, - "learning_rate": 8.247666885470477e-06, - "loss": 0.21, - "step": 7145 - }, - { - "epoch": 0.2, - "learning_rate": 8.246239904106853e-06, - "loss": 0.3657, - "step": 7150 - }, - { - "epoch": 0.2, - "learning_rate": 8.24481292274323e-06, - "loss": 0.1833, - "step": 7155 - }, - { - "epoch": 0.2, - "learning_rate": 8.243385941379606e-06, - "loss": 0.1515, - "step": 7160 - }, - { - "epoch": 0.2, - "learning_rate": 8.241958960015984e-06, - "loss": 0.2312, - "step": 7165 - }, - { - "epoch": 0.2, - "learning_rate": 8.24053197865236e-06, - "loss": 0.1856, - "step": 7170 - }, - { - "epoch": 0.2, - "learning_rate": 8.239104997288736e-06, - "loss": 0.2191, - "step": 7175 - }, - { - "epoch": 0.2, - "learning_rate": 8.237678015925113e-06, - "loss": 0.1461, - "step": 7180 - }, - { - "epoch": 0.2, - "learning_rate": 8.236251034561489e-06, - "loss": 0.1361, - "step": 7185 - }, - { - "epoch": 0.2, - "learning_rate": 8.234824053197865e-06, - "loss": 0.1592, - "step": 7190 - }, - { - "epoch": 0.2, - "learning_rate": 8.233397071834243e-06, - "loss": 0.1711, - "step": 7195 - }, - { - "epoch": 0.2, - "learning_rate": 8.23197009047062e-06, - "loss": 0.4492, - "step": 7200 - }, - { - "epoch": 0.2, - "learning_rate": 8.230543109106996e-06, - "loss": 0.2174, - "step": 7205 - }, - { - "epoch": 0.2, - "learning_rate": 8.229116127743372e-06, - "loss": 0.1999, - "step": 7210 - }, - { - "epoch": 0.2, - "learning_rate": 8.227689146379749e-06, - "loss": 0.1429, - "step": 7215 - }, - { - "epoch": 0.2, - "learning_rate": 8.226262165016125e-06, - "loss": 0.2191, - "step": 7220 - }, - { - "epoch": 0.2, - "learning_rate": 8.224835183652502e-06, - "loss": 0.171, - "step": 7225 - }, - { - "epoch": 0.2, - "learning_rate": 8.223408202288878e-06, - "loss": 0.1044, - "step": 7230 - }, - { - "epoch": 0.2, - "learning_rate": 8.221981220925256e-06, - "loss": 0.1673, - "step": 7235 - }, - { - "epoch": 0.2, - "learning_rate": 8.220554239561632e-06, - "loss": 0.1706, - "step": 7240 - }, - { - "epoch": 0.2, - "learning_rate": 8.219127258198009e-06, - "loss": 0.178, - "step": 7245 - }, - { - "epoch": 0.2, - "learning_rate": 8.217700276834385e-06, - "loss": 0.6589, - "step": 7250 - }, - { - "epoch": 0.2, - "learning_rate": 8.216273295470761e-06, - "loss": 0.1911, - "step": 7255 - }, - { - "epoch": 0.2, - "learning_rate": 8.21484631410714e-06, - "loss": 0.1498, - "step": 7260 - }, - { - "epoch": 0.2, - "learning_rate": 8.213419332743516e-06, - "loss": 0.1801, - "step": 7265 - }, - { - "epoch": 0.2, - "learning_rate": 8.211992351379892e-06, - "loss": 0.1972, - "step": 7270 - }, - { - "epoch": 0.2, - "learning_rate": 8.210565370016268e-06, - "loss": 0.1474, - "step": 7275 - }, - { - "epoch": 0.2, - "learning_rate": 8.209138388652645e-06, - "loss": 0.1972, - "step": 7280 - }, - { - "epoch": 0.2, - "learning_rate": 8.207711407289023e-06, - "loss": 0.2453, - "step": 7285 - }, - { - "epoch": 0.2, - "learning_rate": 8.206284425925399e-06, - "loss": 0.2086, - "step": 7290 - }, - { - "epoch": 0.2, - "learning_rate": 8.204857444561775e-06, - "loss": 0.1912, - "step": 7295 - }, - { - "epoch": 0.2, - "learning_rate": 8.203430463198152e-06, - "loss": 0.3786, - "step": 7300 - }, - { - "epoch": 0.2, - "learning_rate": 8.202003481834528e-06, - "loss": 0.2067, - "step": 7305 - }, - { - "epoch": 0.2, - "learning_rate": 8.200576500470904e-06, - "loss": 0.2041, - "step": 7310 - }, - { - "epoch": 0.2, - "learning_rate": 8.19914951910728e-06, - "loss": 0.244, - "step": 7315 - }, - { - "epoch": 0.2, - "learning_rate": 8.197722537743657e-06, - "loss": 0.2493, - "step": 7320 - }, - { - "epoch": 0.2, - "learning_rate": 8.196295556380033e-06, - "loss": 0.0708, - "step": 7325 - }, - { - "epoch": 0.2, - "learning_rate": 8.194868575016411e-06, - "loss": 0.0863, - "step": 7330 - }, - { - "epoch": 0.2, - "learning_rate": 8.193441593652788e-06, - "loss": 0.1413, - "step": 7335 - }, - { - "epoch": 0.2, - "learning_rate": 8.192014612289164e-06, - "loss": 0.1141, - "step": 7340 - }, - { - "epoch": 0.2, - "learning_rate": 8.19058763092554e-06, - "loss": 0.4008, - "step": 7345 - }, - { - "epoch": 0.2, - "learning_rate": 8.189160649561917e-06, - "loss": 0.5528, - "step": 7350 - }, - { - "epoch": 0.2, - "learning_rate": 8.187733668198295e-06, - "loss": 0.1992, - "step": 7355 - }, - { - "epoch": 0.2, - "learning_rate": 8.186306686834671e-06, - "loss": 0.1314, - "step": 7360 - }, - { - "epoch": 0.2, - "learning_rate": 8.184879705471047e-06, - "loss": 0.1417, - "step": 7365 - }, - { - "epoch": 0.2, - "learning_rate": 8.183452724107424e-06, - "loss": 0.1609, - "step": 7370 - }, - { - "epoch": 0.2, - "learning_rate": 8.1820257427438e-06, - "loss": 0.1983, - "step": 7375 - }, - { - "epoch": 0.2, - "learning_rate": 8.180598761380178e-06, - "loss": 0.1147, - "step": 7380 - }, - { - "epoch": 0.2, - "learning_rate": 8.179171780016555e-06, - "loss": 0.1589, - "step": 7385 - }, - { - "epoch": 0.21, - "learning_rate": 8.17774479865293e-06, - "loss": 0.1664, - "step": 7390 - }, - { - "epoch": 0.21, - "learning_rate": 8.176317817289307e-06, - "loss": 0.4555, - "step": 7395 - }, - { - "epoch": 0.21, - "learning_rate": 8.174890835925684e-06, - "loss": 0.5475, - "step": 7400 - }, - { - "epoch": 0.21, - "learning_rate": 8.17346385456206e-06, - "loss": 0.1252, - "step": 7405 - }, - { - "epoch": 0.21, - "learning_rate": 8.172036873198436e-06, - "loss": 0.21, - "step": 7410 - }, - { - "epoch": 0.21, - "learning_rate": 8.170609891834813e-06, - "loss": 0.202, - "step": 7415 - }, - { - "epoch": 0.21, - "learning_rate": 8.169182910471189e-06, - "loss": 0.2249, - "step": 7420 - }, - { - "epoch": 0.21, - "learning_rate": 8.167755929107567e-06, - "loss": 0.2559, - "step": 7425 - }, - { - "epoch": 0.21, - "learning_rate": 8.166328947743943e-06, - "loss": 0.1324, - "step": 7430 - }, - { - "epoch": 0.21, - "learning_rate": 8.16490196638032e-06, - "loss": 0.2564, - "step": 7435 - }, - { - "epoch": 0.21, - "learning_rate": 8.163474985016696e-06, - "loss": 0.2318, - "step": 7440 - }, - { - "epoch": 0.21, - "learning_rate": 8.162048003653072e-06, - "loss": 0.2666, - "step": 7445 - }, - { - "epoch": 0.21, - "learning_rate": 8.16062102228945e-06, - "loss": 0.3466, - "step": 7450 - }, - { - "epoch": 0.21, - "learning_rate": 8.159194040925827e-06, - "loss": 0.2163, - "step": 7455 - }, - { - "epoch": 0.21, - "learning_rate": 8.157767059562203e-06, - "loss": 0.2175, - "step": 7460 - }, - { - "epoch": 0.21, - "learning_rate": 8.15634007819858e-06, - "loss": 0.2092, - "step": 7465 - }, - { - "epoch": 0.21, - "learning_rate": 8.154913096834956e-06, - "loss": 0.2197, - "step": 7470 - }, - { - "epoch": 0.21, - "learning_rate": 8.153486115471334e-06, - "loss": 0.0569, - "step": 7475 - }, - { - "epoch": 0.21, - "learning_rate": 8.15205913410771e-06, - "loss": 0.0812, - "step": 7480 - }, - { - "epoch": 0.21, - "learning_rate": 8.150632152744086e-06, - "loss": 0.1031, - "step": 7485 - }, - { - "epoch": 0.21, - "learning_rate": 8.149205171380463e-06, - "loss": 0.3571, - "step": 7490 - }, - { - "epoch": 0.21, - "learning_rate": 8.147778190016839e-06, - "loss": 0.1208, - "step": 7495 - }, - { - "epoch": 0.21, - "learning_rate": 8.146351208653215e-06, - "loss": 0.2976, - "step": 7500 - }, - { - "epoch": 0.21, - "learning_rate": 8.144924227289592e-06, - "loss": 0.1949, - "step": 7505 - }, - { - "epoch": 0.21, - "learning_rate": 8.143497245925968e-06, - "loss": 0.246, - "step": 7510 - }, - { - "epoch": 0.21, - "learning_rate": 8.142070264562344e-06, - "loss": 0.1885, - "step": 7515 - }, - { - "epoch": 0.21, - "learning_rate": 8.140643283198722e-06, - "loss": 0.2733, - "step": 7520 - }, - { - "epoch": 0.21, - "learning_rate": 8.139216301835099e-06, - "loss": 0.0634, - "step": 7525 - }, - { - "epoch": 0.21, - "learning_rate": 8.137789320471475e-06, - "loss": 0.1103, - "step": 7530 - }, - { - "epoch": 0.21, - "learning_rate": 8.136362339107851e-06, - "loss": 0.0912, - "step": 7535 - }, - { - "epoch": 0.21, - "learning_rate": 8.134935357744228e-06, - "loss": 0.2565, - "step": 7540 - }, - { - "epoch": 0.21, - "learning_rate": 8.133508376380606e-06, - "loss": 0.3867, - "step": 7545 - }, - { - "epoch": 0.21, - "learning_rate": 8.132081395016982e-06, - "loss": 0.4726, - "step": 7550 - }, - { - "epoch": 0.21, - "learning_rate": 8.130654413653358e-06, - "loss": 0.4183, - "step": 7555 - }, - { - "epoch": 0.21, - "learning_rate": 8.129227432289735e-06, - "loss": 0.1844, - "step": 7560 - }, - { - "epoch": 0.21, - "learning_rate": 8.127800450926111e-06, - "loss": 0.1948, - "step": 7565 - }, - { - "epoch": 0.21, - "learning_rate": 8.12637346956249e-06, - "loss": 0.2435, - "step": 7570 - }, - { - "epoch": 0.21, - "learning_rate": 8.124946488198866e-06, - "loss": 0.2355, - "step": 7575 - }, - { - "epoch": 0.21, - "learning_rate": 8.123519506835242e-06, - "loss": 0.1969, - "step": 7580 - }, - { - "epoch": 0.21, - "learning_rate": 8.122092525471618e-06, - "loss": 0.1432, - "step": 7585 - }, - { - "epoch": 0.21, - "learning_rate": 8.120665544107995e-06, - "loss": 0.2547, - "step": 7590 - }, - { - "epoch": 0.21, - "learning_rate": 8.119238562744371e-06, - "loss": 0.3437, - "step": 7595 - }, - { - "epoch": 0.21, - "learning_rate": 8.117811581380747e-06, - "loss": 0.6044, - "step": 7600 - }, - { - "epoch": 0.21, - "learning_rate": 8.116384600017124e-06, - "loss": 0.2163, - "step": 7605 - }, - { - "epoch": 0.21, - "learning_rate": 8.1149576186535e-06, - "loss": 0.1687, - "step": 7610 - }, - { - "epoch": 0.21, - "learning_rate": 8.113530637289878e-06, - "loss": 0.1551, - "step": 7615 - }, - { - "epoch": 0.21, - "learning_rate": 8.112103655926254e-06, - "loss": 0.2271, - "step": 7620 - }, - { - "epoch": 0.21, - "learning_rate": 8.11067667456263e-06, - "loss": 0.1671, - "step": 7625 - }, - { - "epoch": 0.21, - "learning_rate": 8.109249693199007e-06, - "loss": 0.0885, - "step": 7630 - }, - { - "epoch": 0.21, - "learning_rate": 8.107822711835383e-06, - "loss": 0.1219, - "step": 7635 - }, - { - "epoch": 0.21, - "learning_rate": 8.106395730471761e-06, - "loss": 0.1902, - "step": 7640 - }, - { - "epoch": 0.21, - "learning_rate": 8.104968749108138e-06, - "loss": 0.2712, - "step": 7645 - }, - { - "epoch": 0.21, - "learning_rate": 8.103541767744514e-06, - "loss": 0.4752, - "step": 7650 - }, - { - "epoch": 0.21, - "learning_rate": 8.10211478638089e-06, - "loss": 0.1733, - "step": 7655 - }, - { - "epoch": 0.21, - "learning_rate": 8.100687805017267e-06, - "loss": 0.1289, - "step": 7660 - }, - { - "epoch": 0.21, - "learning_rate": 8.099260823653645e-06, - "loss": 0.2383, - "step": 7665 - }, - { - "epoch": 0.21, - "learning_rate": 8.097833842290021e-06, - "loss": 0.1959, - "step": 7670 - }, - { - "epoch": 0.21, - "learning_rate": 8.096406860926397e-06, - "loss": 0.1568, - "step": 7675 - }, - { - "epoch": 0.21, - "learning_rate": 8.094979879562774e-06, - "loss": 0.1829, - "step": 7680 - }, - { - "epoch": 0.21, - "learning_rate": 8.09355289819915e-06, - "loss": 0.1501, - "step": 7685 - }, - { - "epoch": 0.21, - "learning_rate": 8.092125916835526e-06, - "loss": 0.2989, - "step": 7690 - }, - { - "epoch": 0.21, - "learning_rate": 8.090698935471903e-06, - "loss": 0.2442, - "step": 7695 - }, - { - "epoch": 0.21, - "learning_rate": 8.089271954108279e-06, - "loss": 0.8114, - "step": 7700 - }, - { - "epoch": 0.21, - "learning_rate": 8.087844972744655e-06, - "loss": 0.1299, - "step": 7705 - }, - { - "epoch": 0.21, - "learning_rate": 8.086417991381033e-06, - "loss": 0.2395, - "step": 7710 - }, - { - "epoch": 0.21, - "learning_rate": 8.08499101001741e-06, - "loss": 0.1642, - "step": 7715 - }, - { - "epoch": 0.21, - "learning_rate": 8.083564028653786e-06, - "loss": 0.1507, - "step": 7720 - }, - { - "epoch": 0.21, - "learning_rate": 8.082137047290162e-06, - "loss": 0.1931, - "step": 7725 - }, - { - "epoch": 0.21, - "learning_rate": 8.080710065926539e-06, - "loss": 0.079, - "step": 7730 - }, - { - "epoch": 0.21, - "learning_rate": 8.079283084562917e-06, - "loss": 0.0929, - "step": 7735 - }, - { - "epoch": 0.21, - "learning_rate": 8.077856103199293e-06, - "loss": 0.1381, - "step": 7740 - }, - { - "epoch": 0.21, - "learning_rate": 8.07642912183567e-06, - "loss": 0.3335, - "step": 7745 - }, - { - "epoch": 0.22, - "learning_rate": 8.075002140472046e-06, - "loss": 0.3351, - "step": 7750 - }, - { - "epoch": 0.22, - "learning_rate": 8.073575159108422e-06, - "loss": 0.1355, - "step": 7755 - }, - { - "epoch": 0.22, - "learning_rate": 8.0721481777448e-06, - "loss": 0.1426, - "step": 7760 - }, - { - "epoch": 0.22, - "learning_rate": 8.070721196381177e-06, - "loss": 0.1558, - "step": 7765 - }, - { - "epoch": 0.22, - "learning_rate": 8.069294215017553e-06, - "loss": 0.1551, - "step": 7770 - }, - { - "epoch": 0.22, - "learning_rate": 8.06786723365393e-06, - "loss": 0.2197, - "step": 7775 - }, - { - "epoch": 0.22, - "learning_rate": 8.066440252290306e-06, - "loss": 0.0977, - "step": 7780 - }, - { - "epoch": 0.22, - "learning_rate": 8.065013270926682e-06, - "loss": 0.168, - "step": 7785 - }, - { - "epoch": 0.22, - "learning_rate": 8.063586289563058e-06, - "loss": 0.1557, - "step": 7790 - }, - { - "epoch": 0.22, - "learning_rate": 8.062159308199435e-06, - "loss": 0.1372, - "step": 7795 - }, - { - "epoch": 0.22, - "learning_rate": 8.060732326835811e-06, - "loss": 0.384, - "step": 7800 - }, - { - "epoch": 0.22, - "learning_rate": 8.059305345472189e-06, - "loss": 0.1653, - "step": 7805 - }, - { - "epoch": 0.22, - "learning_rate": 8.057878364108565e-06, - "loss": 0.1789, - "step": 7810 - }, - { - "epoch": 0.22, - "learning_rate": 8.056451382744942e-06, - "loss": 0.2406, - "step": 7815 - }, - { - "epoch": 0.22, - "learning_rate": 8.055024401381318e-06, - "loss": 0.1819, - "step": 7820 - }, - { - "epoch": 0.22, - "learning_rate": 8.053597420017694e-06, - "loss": 0.1301, - "step": 7825 - }, - { - "epoch": 0.22, - "learning_rate": 8.052170438654072e-06, - "loss": 0.1108, - "step": 7830 - }, - { - "epoch": 0.22, - "learning_rate": 8.050743457290449e-06, - "loss": 0.0467, - "step": 7835 - }, - { - "epoch": 0.22, - "learning_rate": 8.049316475926825e-06, - "loss": 0.3237, - "step": 7840 - }, - { - "epoch": 0.22, - "learning_rate": 8.047889494563201e-06, - "loss": 0.2159, - "step": 7845 - }, - { - "epoch": 0.22, - "learning_rate": 8.046462513199578e-06, - "loss": 0.4882, - "step": 7850 - }, - { - "epoch": 0.22, - "learning_rate": 8.045035531835956e-06, - "loss": 0.1892, - "step": 7855 - }, - { - "epoch": 0.22, - "learning_rate": 8.043608550472332e-06, - "loss": 0.1517, - "step": 7860 - }, - { - "epoch": 0.22, - "learning_rate": 8.042181569108708e-06, - "loss": 0.17, - "step": 7865 - }, - { - "epoch": 0.22, - "learning_rate": 8.040754587745085e-06, - "loss": 0.2468, - "step": 7870 - }, - { - "epoch": 0.22, - "learning_rate": 8.039327606381461e-06, - "loss": 0.1442, - "step": 7875 - }, - { - "epoch": 0.22, - "learning_rate": 8.037900625017837e-06, - "loss": 0.121, - "step": 7880 - }, - { - "epoch": 0.22, - "learning_rate": 8.036473643654214e-06, - "loss": 0.1657, - "step": 7885 - }, - { - "epoch": 0.22, - "learning_rate": 8.03504666229059e-06, - "loss": 0.1207, - "step": 7890 - }, - { - "epoch": 0.22, - "learning_rate": 8.033619680926968e-06, - "loss": 0.3081, - "step": 7895 - }, - { - "epoch": 0.22, - "learning_rate": 8.032192699563344e-06, - "loss": 0.4598, - "step": 7900 - }, - { - "epoch": 0.22, - "learning_rate": 8.03076571819972e-06, - "loss": 0.2183, - "step": 7905 - }, - { - "epoch": 0.22, - "learning_rate": 8.029338736836097e-06, - "loss": 0.2336, - "step": 7910 - }, - { - "epoch": 0.22, - "learning_rate": 8.027911755472474e-06, - "loss": 0.1913, - "step": 7915 - }, - { - "epoch": 0.22, - "learning_rate": 8.02648477410885e-06, - "loss": 0.2144, - "step": 7920 - }, - { - "epoch": 0.22, - "learning_rate": 8.025057792745228e-06, - "loss": 0.1693, - "step": 7925 - }, - { - "epoch": 0.22, - "learning_rate": 8.023630811381604e-06, - "loss": 0.3176, - "step": 7930 - }, - { - "epoch": 0.22, - "learning_rate": 8.02220383001798e-06, - "loss": 0.2124, - "step": 7935 - }, - { - "epoch": 0.22, - "learning_rate": 8.020776848654357e-06, - "loss": 0.1698, - "step": 7940 - }, - { - "epoch": 0.22, - "learning_rate": 8.019349867290735e-06, - "loss": 0.1724, - "step": 7945 - }, - { - "epoch": 0.22, - "learning_rate": 8.017922885927111e-06, - "loss": 0.2481, - "step": 7950 - }, - { - "epoch": 0.22, - "learning_rate": 8.016495904563488e-06, - "loss": 0.1423, - "step": 7955 - }, - { - "epoch": 0.22, - "learning_rate": 8.015068923199864e-06, - "loss": 0.2494, - "step": 7960 - }, - { - "epoch": 0.22, - "learning_rate": 8.01364194183624e-06, - "loss": 0.2003, - "step": 7965 - }, - { - "epoch": 0.22, - "learning_rate": 8.012214960472617e-06, - "loss": 0.195, - "step": 7970 - }, - { - "epoch": 0.22, - "learning_rate": 8.010787979108993e-06, - "loss": 0.143, - "step": 7975 - }, - { - "epoch": 0.22, - "learning_rate": 8.00936099774537e-06, - "loss": 0.0434, - "step": 7980 - }, - { - "epoch": 0.22, - "learning_rate": 8.007934016381747e-06, - "loss": 0.2307, - "step": 7985 - }, - { - "epoch": 0.22, - "learning_rate": 8.006507035018124e-06, - "loss": 0.2078, - "step": 7990 - }, - { - "epoch": 0.22, - "learning_rate": 8.0050800536545e-06, - "loss": 0.316, - "step": 7995 - }, - { - "epoch": 0.22, - "learning_rate": 8.003653072290876e-06, - "loss": 0.2622, - "step": 8000 - }, - { - "epoch": 0.22, - "eval_loss": 0.08057957142591476, - "eval_runtime": 3022.947, - "eval_samples_per_second": 5.299, - "eval_steps_per_second": 1.325, - "eval_wer": 0.22843490804183195, - "step": 8000 - }, - { - "epoch": 0.22, - "learning_rate": 8.002226090927253e-06, - "loss": 0.2346, - "step": 8005 - }, - { - "epoch": 0.22, - "learning_rate": 8.000799109563629e-06, - "loss": 0.1882, - "step": 8010 - }, - { - "epoch": 0.22, - "learning_rate": 7.999372128200005e-06, - "loss": 0.1467, - "step": 8015 - }, - { - "epoch": 0.22, - "learning_rate": 7.997945146836383e-06, - "loss": 0.2359, - "step": 8020 - }, - { - "epoch": 0.22, - "learning_rate": 7.99651816547276e-06, - "loss": 0.1228, - "step": 8025 - }, - { - "epoch": 0.22, - "learning_rate": 7.995091184109136e-06, - "loss": 0.0632, - "step": 8030 - }, - { - "epoch": 0.22, - "learning_rate": 7.993664202745512e-06, - "loss": 0.1376, - "step": 8035 - }, - { - "epoch": 0.22, - "learning_rate": 7.99223722138189e-06, - "loss": 0.362, - "step": 8040 - }, - { - "epoch": 0.22, - "learning_rate": 7.990810240018267e-06, - "loss": 0.5213, - "step": 8045 - }, - { - "epoch": 0.22, - "learning_rate": 7.989383258654643e-06, - "loss": 0.5246, - "step": 8050 - }, - { - "epoch": 0.22, - "learning_rate": 7.98795627729102e-06, - "loss": 0.161, - "step": 8055 - }, - { - "epoch": 0.22, - "learning_rate": 7.986529295927396e-06, - "loss": 0.2175, - "step": 8060 - }, - { - "epoch": 0.22, - "learning_rate": 7.985102314563772e-06, - "loss": 0.1384, - "step": 8065 - }, - { - "epoch": 0.22, - "learning_rate": 7.983675333200148e-06, - "loss": 0.1738, - "step": 8070 - }, - { - "epoch": 0.22, - "learning_rate": 7.982248351836527e-06, - "loss": 0.2637, - "step": 8075 - }, - { - "epoch": 0.22, - "learning_rate": 7.980821370472903e-06, - "loss": 0.1429, - "step": 8080 - }, - { - "epoch": 0.22, - "learning_rate": 7.97939438910928e-06, - "loss": 0.189, - "step": 8085 - }, - { - "epoch": 0.22, - "learning_rate": 7.977967407745656e-06, - "loss": 0.1426, - "step": 8090 - }, - { - "epoch": 0.22, - "learning_rate": 7.976540426382032e-06, - "loss": 0.2112, - "step": 8095 - }, - { - "epoch": 0.22, - "learning_rate": 7.975113445018408e-06, - "loss": 0.2782, - "step": 8100 - }, - { - "epoch": 0.22, - "learning_rate": 7.973686463654785e-06, - "loss": 0.1385, - "step": 8105 - }, - { - "epoch": 0.23, - "learning_rate": 7.972259482291161e-06, - "loss": 0.2095, - "step": 8110 - }, - { - "epoch": 0.23, - "learning_rate": 7.970832500927539e-06, - "loss": 0.1658, - "step": 8115 - }, - { - "epoch": 0.23, - "learning_rate": 7.969405519563915e-06, - "loss": 0.1805, - "step": 8120 - }, - { - "epoch": 0.23, - "learning_rate": 7.967978538200292e-06, - "loss": 0.224, - "step": 8125 - }, - { - "epoch": 0.23, - "learning_rate": 7.966551556836668e-06, - "loss": 0.1345, - "step": 8130 - }, - { - "epoch": 0.23, - "learning_rate": 7.965124575473046e-06, - "loss": 0.091, - "step": 8135 - }, - { - "epoch": 0.23, - "learning_rate": 7.963697594109422e-06, - "loss": 0.1689, - "step": 8140 - }, - { - "epoch": 0.23, - "learning_rate": 7.962270612745799e-06, - "loss": 0.3499, - "step": 8145 - }, - { - "epoch": 0.23, - "learning_rate": 7.960843631382175e-06, - "loss": 0.3034, - "step": 8150 - }, - { - "epoch": 0.23, - "learning_rate": 7.959416650018551e-06, - "loss": 0.2078, - "step": 8155 - }, - { - "epoch": 0.23, - "learning_rate": 7.95798966865493e-06, - "loss": 0.1228, - "step": 8160 - }, - { - "epoch": 0.23, - "learning_rate": 7.956562687291306e-06, - "loss": 0.1752, - "step": 8165 - }, - { - "epoch": 0.23, - "learning_rate": 7.955135705927682e-06, - "loss": 0.1979, - "step": 8170 - }, - { - "epoch": 0.23, - "learning_rate": 7.953708724564058e-06, - "loss": 0.2338, - "step": 8175 - }, - { - "epoch": 0.23, - "learning_rate": 7.952281743200435e-06, - "loss": 0.161, - "step": 8180 - }, - { - "epoch": 0.23, - "learning_rate": 7.950854761836811e-06, - "loss": 0.1555, - "step": 8185 - }, - { - "epoch": 0.23, - "learning_rate": 7.949427780473187e-06, - "loss": 0.1691, - "step": 8190 - }, - { - "epoch": 0.23, - "learning_rate": 7.948000799109564e-06, - "loss": 0.2433, - "step": 8195 - }, - { - "epoch": 0.23, - "learning_rate": 7.94657381774594e-06, - "loss": 0.35, - "step": 8200 - }, - { - "epoch": 0.23, - "learning_rate": 7.945146836382316e-06, - "loss": 0.183, - "step": 8205 - }, - { - "epoch": 0.23, - "learning_rate": 7.943719855018694e-06, - "loss": 0.1599, - "step": 8210 - }, - { - "epoch": 0.23, - "learning_rate": 7.94229287365507e-06, - "loss": 0.1263, - "step": 8215 - }, - { - "epoch": 0.23, - "learning_rate": 7.940865892291447e-06, - "loss": 0.2152, - "step": 8220 - }, - { - "epoch": 0.23, - "learning_rate": 7.939438910927823e-06, - "loss": 0.1271, - "step": 8225 - }, - { - "epoch": 0.23, - "learning_rate": 7.938011929564201e-06, - "loss": 0.0165, - "step": 8230 - }, - { - "epoch": 0.23, - "learning_rate": 7.936584948200578e-06, - "loss": 0.1579, - "step": 8235 - }, - { - "epoch": 0.23, - "learning_rate": 7.935157966836954e-06, - "loss": 0.3127, - "step": 8240 - }, - { - "epoch": 0.23, - "learning_rate": 7.93373098547333e-06, - "loss": 0.1991, - "step": 8245 - }, - { - "epoch": 0.23, - "learning_rate": 7.932304004109707e-06, - "loss": 0.5045, - "step": 8250 - }, - { - "epoch": 0.23, - "learning_rate": 7.930877022746085e-06, - "loss": 0.1249, - "step": 8255 - }, - { - "epoch": 0.23, - "learning_rate": 7.929450041382461e-06, - "loss": 0.1456, - "step": 8260 - }, - { - "epoch": 0.23, - "learning_rate": 7.928023060018838e-06, - "loss": 0.163, - "step": 8265 - }, - { - "epoch": 0.23, - "learning_rate": 7.926596078655214e-06, - "loss": 0.2551, - "step": 8270 - }, - { - "epoch": 0.23, - "learning_rate": 7.92516909729159e-06, - "loss": 0.0672, - "step": 8275 - }, - { - "epoch": 0.23, - "learning_rate": 7.923742115927967e-06, - "loss": 0.1371, - "step": 8280 - }, - { - "epoch": 0.23, - "learning_rate": 7.922315134564343e-06, - "loss": 0.1814, - "step": 8285 - }, - { - "epoch": 0.23, - "learning_rate": 7.92088815320072e-06, - "loss": 0.2584, - "step": 8290 - }, - { - "epoch": 0.23, - "learning_rate": 7.919461171837096e-06, - "loss": 0.3287, - "step": 8295 - }, - { - "epoch": 0.23, - "learning_rate": 7.918319586746198e-06, - "loss": 0.4046, - "step": 8300 - }, - { - "epoch": 0.23, - "learning_rate": 7.916892605382574e-06, - "loss": 0.1849, - "step": 8305 - }, - { - "epoch": 0.23, - "learning_rate": 7.91546562401895e-06, - "loss": 0.1787, - "step": 8310 - }, - { - "epoch": 0.23, - "learning_rate": 7.914038642655327e-06, - "loss": 0.233, - "step": 8315 - }, - { - "epoch": 0.23, - "learning_rate": 7.912611661291703e-06, - "loss": 0.1461, - "step": 8320 - }, - { - "epoch": 0.23, - "learning_rate": 7.911184679928081e-06, - "loss": 0.0856, - "step": 8325 - }, - { - "epoch": 0.23, - "learning_rate": 7.909757698564457e-06, - "loss": 0.2195, - "step": 8330 - }, - { - "epoch": 0.23, - "learning_rate": 7.908330717200834e-06, - "loss": 0.1154, - "step": 8335 - }, - { - "epoch": 0.23, - "learning_rate": 7.90690373583721e-06, - "loss": 0.2593, - "step": 8340 - }, - { - "epoch": 0.23, - "learning_rate": 7.905476754473588e-06, - "loss": 0.1829, - "step": 8345 - }, - { - "epoch": 0.23, - "learning_rate": 7.904049773109964e-06, - "loss": 0.5558, - "step": 8350 - }, - { - "epoch": 0.23, - "learning_rate": 7.90262279174634e-06, - "loss": 0.1854, - "step": 8355 - }, - { - "epoch": 0.23, - "learning_rate": 7.901195810382717e-06, - "loss": 0.2554, - "step": 8360 - }, - { - "epoch": 0.23, - "learning_rate": 7.899768829019093e-06, - "loss": 0.2087, - "step": 8365 - }, - { - "epoch": 0.23, - "learning_rate": 7.898341847655471e-06, - "loss": 0.18, - "step": 8370 - }, - { - "epoch": 0.23, - "learning_rate": 7.896914866291848e-06, - "loss": 0.2436, - "step": 8375 - }, - { - "epoch": 0.23, - "learning_rate": 7.895487884928224e-06, - "loss": 0.0874, - "step": 8380 - }, - { - "epoch": 0.23, - "learning_rate": 7.8940609035646e-06, - "loss": 0.1586, - "step": 8385 - }, - { - "epoch": 0.23, - "learning_rate": 7.892633922200977e-06, - "loss": 0.2233, - "step": 8390 - }, - { - "epoch": 0.23, - "learning_rate": 7.891206940837353e-06, - "loss": 0.3407, - "step": 8395 - }, - { - "epoch": 0.23, - "learning_rate": 7.88977995947373e-06, - "loss": 0.3159, - "step": 8400 - }, - { - "epoch": 0.23, - "learning_rate": 7.888352978110106e-06, - "loss": 0.1739, - "step": 8405 - }, - { - "epoch": 0.23, - "learning_rate": 7.886925996746482e-06, - "loss": 0.1841, - "step": 8410 - }, - { - "epoch": 0.23, - "learning_rate": 7.885499015382859e-06, - "loss": 0.1759, - "step": 8415 - }, - { - "epoch": 0.23, - "learning_rate": 7.884072034019237e-06, - "loss": 0.2541, - "step": 8420 - }, - { - "epoch": 0.23, - "learning_rate": 7.882645052655613e-06, - "loss": 0.0824, - "step": 8425 - }, - { - "epoch": 0.23, - "learning_rate": 7.88121807129199e-06, - "loss": 0.0575, - "step": 8430 - }, - { - "epoch": 0.23, - "learning_rate": 7.879791089928366e-06, - "loss": 0.1388, - "step": 8435 - }, - { - "epoch": 0.23, - "learning_rate": 7.878364108564744e-06, - "loss": 0.1756, - "step": 8440 - }, - { - "epoch": 0.23, - "learning_rate": 7.87693712720112e-06, - "loss": 0.2056, - "step": 8445 - }, - { - "epoch": 0.23, - "learning_rate": 7.875510145837496e-06, - "loss": 0.6129, - "step": 8450 - }, - { - "epoch": 0.23, - "learning_rate": 7.874083164473873e-06, - "loss": 0.1343, - "step": 8455 - }, - { - "epoch": 0.23, - "learning_rate": 7.872656183110249e-06, - "loss": 0.1692, - "step": 8460 - }, - { - "epoch": 0.23, - "learning_rate": 7.871229201746627e-06, - "loss": 0.193, - "step": 8465 - }, - { - "epoch": 0.24, - "learning_rate": 7.869802220383003e-06, - "loss": 0.1887, - "step": 8470 - }, - { - "epoch": 0.24, - "learning_rate": 7.86837523901938e-06, - "loss": 0.1236, - "step": 8475 - }, - { - "epoch": 0.24, - "learning_rate": 7.866948257655756e-06, - "loss": 0.1449, - "step": 8480 - }, - { - "epoch": 0.24, - "learning_rate": 7.865521276292132e-06, - "loss": 0.1807, - "step": 8485 - }, - { - "epoch": 0.24, - "learning_rate": 7.864094294928509e-06, - "loss": 0.0956, - "step": 8490 - }, - { - "epoch": 0.24, - "learning_rate": 7.862667313564885e-06, - "loss": 0.2542, - "step": 8495 - }, - { - "epoch": 0.24, - "learning_rate": 7.861240332201261e-06, - "loss": 0.4587, - "step": 8500 - }, - { - "epoch": 0.24, - "learning_rate": 7.859813350837638e-06, - "loss": 0.2121, - "step": 8505 - }, - { - "epoch": 0.24, - "learning_rate": 7.858386369474014e-06, - "loss": 0.3679, - "step": 8510 - }, - { - "epoch": 0.24, - "learning_rate": 7.856959388110392e-06, - "loss": 0.1392, - "step": 8515 - }, - { - "epoch": 0.24, - "learning_rate": 7.855532406746768e-06, - "loss": 0.1165, - "step": 8520 - }, - { - "epoch": 0.24, - "learning_rate": 7.854105425383145e-06, - "loss": 0.204, - "step": 8525 - }, - { - "epoch": 0.24, - "learning_rate": 7.852678444019521e-06, - "loss": 0.1654, - "step": 8530 - }, - { - "epoch": 0.24, - "learning_rate": 7.851251462655899e-06, - "loss": 0.1839, - "step": 8535 - }, - { - "epoch": 0.24, - "learning_rate": 7.849824481292275e-06, - "loss": 0.1727, - "step": 8540 - }, - { - "epoch": 0.24, - "learning_rate": 7.848397499928652e-06, - "loss": 0.2335, - "step": 8545 - }, - { - "epoch": 0.24, - "learning_rate": 7.846970518565028e-06, - "loss": 0.4425, - "step": 8550 - }, - { - "epoch": 0.24, - "learning_rate": 7.845543537201404e-06, - "loss": 0.1648, - "step": 8555 - }, - { - "epoch": 0.24, - "learning_rate": 7.844116555837783e-06, - "loss": 0.1482, - "step": 8560 - }, - { - "epoch": 0.24, - "learning_rate": 7.842689574474159e-06, - "loss": 0.1983, - "step": 8565 - }, - { - "epoch": 0.24, - "learning_rate": 7.841262593110535e-06, - "loss": 0.2705, - "step": 8570 - }, - { - "epoch": 0.24, - "learning_rate": 7.839835611746912e-06, - "loss": 0.1826, - "step": 8575 - }, - { - "epoch": 0.24, - "learning_rate": 7.838408630383288e-06, - "loss": 0.1382, - "step": 8580 - }, - { - "epoch": 0.24, - "learning_rate": 7.836981649019664e-06, - "loss": 0.2028, - "step": 8585 - }, - { - "epoch": 0.24, - "learning_rate": 7.83555466765604e-06, - "loss": 0.098, - "step": 8590 - }, - { - "epoch": 0.24, - "learning_rate": 7.834127686292417e-06, - "loss": 0.2188, - "step": 8595 - }, - { - "epoch": 0.24, - "learning_rate": 7.832700704928793e-06, - "loss": 0.6639, - "step": 8600 - }, - { - "epoch": 0.24, - "learning_rate": 7.83127372356517e-06, - "loss": 0.1766, - "step": 8605 - }, - { - "epoch": 0.24, - "learning_rate": 7.829846742201548e-06, - "loss": 0.1344, - "step": 8610 - }, - { - "epoch": 0.24, - "learning_rate": 7.828419760837924e-06, - "loss": 0.1565, - "step": 8615 - }, - { - "epoch": 0.24, - "learning_rate": 7.8269927794743e-06, - "loss": 0.2745, - "step": 8620 - }, - { - "epoch": 0.24, - "learning_rate": 7.825565798110677e-06, - "loss": 0.2157, - "step": 8625 - }, - { - "epoch": 0.24, - "learning_rate": 7.824138816747055e-06, - "loss": 0.095, - "step": 8630 - }, - { - "epoch": 0.24, - "learning_rate": 7.822711835383431e-06, - "loss": 0.1851, - "step": 8635 - }, - { - "epoch": 0.24, - "learning_rate": 7.821284854019807e-06, - "loss": 0.2995, - "step": 8640 - }, - { - "epoch": 0.24, - "learning_rate": 7.819857872656184e-06, - "loss": 0.3037, - "step": 8645 - }, - { - "epoch": 0.24, - "learning_rate": 7.81843089129256e-06, - "loss": 0.3917, - "step": 8650 - }, - { - "epoch": 0.24, - "learning_rate": 7.817003909928938e-06, - "loss": 0.1416, - "step": 8655 - }, - { - "epoch": 0.24, - "learning_rate": 7.815576928565314e-06, - "loss": 0.2278, - "step": 8660 - }, - { - "epoch": 0.24, - "learning_rate": 7.81414994720169e-06, - "loss": 0.2162, - "step": 8665 - }, - { - "epoch": 0.24, - "learning_rate": 7.812722965838067e-06, - "loss": 0.2055, - "step": 8670 - }, - { - "epoch": 0.24, - "learning_rate": 7.811295984474443e-06, - "loss": 0.0889, - "step": 8675 - }, - { - "epoch": 0.24, - "learning_rate": 7.80986900311082e-06, - "loss": 0.1144, - "step": 8680 - }, - { - "epoch": 0.24, - "learning_rate": 7.808442021747196e-06, - "loss": 0.2463, - "step": 8685 - }, - { - "epoch": 0.24, - "learning_rate": 7.807015040383572e-06, - "loss": 0.3082, - "step": 8690 - }, - { - "epoch": 0.24, - "learning_rate": 7.805588059019949e-06, - "loss": 0.1998, - "step": 8695 - }, - { - "epoch": 0.24, - "learning_rate": 7.804161077656325e-06, - "loss": 0.288, - "step": 8700 - }, - { - "epoch": 0.24, - "learning_rate": 7.802734096292703e-06, - "loss": 0.1421, - "step": 8705 - }, - { - "epoch": 0.24, - "learning_rate": 7.80130711492908e-06, - "loss": 0.1546, - "step": 8710 - }, - { - "epoch": 0.24, - "learning_rate": 7.799880133565456e-06, - "loss": 0.2216, - "step": 8715 - }, - { - "epoch": 0.24, - "learning_rate": 7.798453152201832e-06, - "loss": 0.2045, - "step": 8720 - }, - { - "epoch": 0.24, - "learning_rate": 7.79702617083821e-06, - "loss": 0.2076, - "step": 8725 - }, - { - "epoch": 0.24, - "learning_rate": 7.795599189474586e-06, - "loss": 0.0846, - "step": 8730 - }, - { - "epoch": 0.24, - "learning_rate": 7.794172208110963e-06, - "loss": 0.2256, - "step": 8735 - }, - { - "epoch": 0.24, - "learning_rate": 7.79274522674734e-06, - "loss": 0.1954, - "step": 8740 - }, - { - "epoch": 0.24, - "learning_rate": 7.791318245383716e-06, - "loss": 0.0833, - "step": 8745 - }, - { - "epoch": 0.24, - "learning_rate": 7.789891264020094e-06, - "loss": 0.6029, - "step": 8750 - }, - { - "epoch": 0.24, - "learning_rate": 7.78846428265647e-06, - "loss": 0.1641, - "step": 8755 - }, - { - "epoch": 0.24, - "learning_rate": 7.787037301292846e-06, - "loss": 0.2114, - "step": 8760 - }, - { - "epoch": 0.24, - "learning_rate": 7.785610319929223e-06, - "loss": 0.1914, - "step": 8765 - }, - { - "epoch": 0.24, - "learning_rate": 7.784183338565599e-06, - "loss": 0.2398, - "step": 8770 - }, - { - "epoch": 0.24, - "learning_rate": 7.782756357201975e-06, - "loss": 0.1619, - "step": 8775 - }, - { - "epoch": 0.24, - "learning_rate": 7.781329375838352e-06, - "loss": 0.1529, - "step": 8780 - }, - { - "epoch": 0.24, - "learning_rate": 7.779902394474728e-06, - "loss": 0.2231, - "step": 8785 - }, - { - "epoch": 0.24, - "learning_rate": 7.778475413111104e-06, - "loss": 0.1318, - "step": 8790 - }, - { - "epoch": 0.24, - "learning_rate": 7.777048431747482e-06, - "loss": 0.1566, - "step": 8795 - }, - { - "epoch": 0.24, - "learning_rate": 7.775621450383859e-06, - "loss": 0.3991, - "step": 8800 - }, - { - "epoch": 0.24, - "learning_rate": 7.774194469020235e-06, - "loss": 0.146, - "step": 8805 - }, - { - "epoch": 0.24, - "learning_rate": 7.772767487656611e-06, - "loss": 0.2099, - "step": 8810 - }, - { - "epoch": 0.24, - "learning_rate": 7.771340506292988e-06, - "loss": 0.2104, - "step": 8815 - }, - { - "epoch": 0.24, - "learning_rate": 7.769913524929366e-06, - "loss": 0.1561, - "step": 8820 - }, - { - "epoch": 0.24, - "learning_rate": 7.768486543565742e-06, - "loss": 0.1779, - "step": 8825 - }, - { - "epoch": 0.25, - "learning_rate": 7.767059562202118e-06, - "loss": 0.1237, - "step": 8830 - }, - { - "epoch": 0.25, - "learning_rate": 7.765632580838495e-06, - "loss": 0.212, - "step": 8835 - }, - { - "epoch": 0.25, - "learning_rate": 7.764205599474871e-06, - "loss": 0.2135, - "step": 8840 - }, - { - "epoch": 0.25, - "learning_rate": 7.762778618111249e-06, - "loss": 0.3727, - "step": 8845 - }, - { - "epoch": 0.25, - "learning_rate": 7.761351636747625e-06, - "loss": 0.9279, - "step": 8850 - }, - { - "epoch": 0.25, - "learning_rate": 7.759924655384002e-06, - "loss": 0.1871, - "step": 8855 - }, - { - "epoch": 0.25, - "learning_rate": 7.758497674020378e-06, - "loss": 0.2423, - "step": 8860 - }, - { - "epoch": 0.25, - "learning_rate": 7.757070692656754e-06, - "loss": 0.1663, - "step": 8865 - }, - { - "epoch": 0.25, - "learning_rate": 7.75564371129313e-06, - "loss": 0.252, - "step": 8870 - }, - { - "epoch": 0.25, - "learning_rate": 7.754216729929507e-06, - "loss": 0.0367, - "step": 8875 - }, - { - "epoch": 0.25, - "learning_rate": 7.752789748565885e-06, - "loss": 0.0966, - "step": 8880 - }, - { - "epoch": 0.25, - "learning_rate": 7.751362767202261e-06, - "loss": 0.186, - "step": 8885 - }, - { - "epoch": 0.25, - "learning_rate": 7.749935785838638e-06, - "loss": 0.3719, - "step": 8890 - }, - { - "epoch": 0.25, - "learning_rate": 7.748508804475014e-06, - "loss": 0.5401, - "step": 8895 - }, - { - "epoch": 0.25, - "learning_rate": 7.74708182311139e-06, - "loss": 0.5217, - "step": 8900 - }, - { - "epoch": 0.25, - "learning_rate": 7.745654841747767e-06, - "loss": 0.1836, - "step": 8905 - }, - { - "epoch": 0.25, - "learning_rate": 7.744227860384143e-06, - "loss": 0.199, - "step": 8910 - }, - { - "epoch": 0.25, - "learning_rate": 7.742800879020521e-06, - "loss": 0.2465, - "step": 8915 - }, - { - "epoch": 0.25, - "learning_rate": 7.741373897656898e-06, - "loss": 0.2377, - "step": 8920 - }, - { - "epoch": 0.25, - "learning_rate": 7.739946916293274e-06, - "loss": 0.2297, - "step": 8925 - }, - { - "epoch": 0.25, - "learning_rate": 7.73851993492965e-06, - "loss": 0.072, - "step": 8930 - }, - { - "epoch": 0.25, - "learning_rate": 7.737092953566027e-06, - "loss": 0.1414, - "step": 8935 - }, - { - "epoch": 0.25, - "learning_rate": 7.735665972202405e-06, - "loss": 0.1911, - "step": 8940 - }, - { - "epoch": 0.25, - "learning_rate": 7.734238990838781e-06, - "loss": 0.2331, - "step": 8945 - }, - { - "epoch": 0.25, - "learning_rate": 7.732812009475157e-06, - "loss": 0.5353, - "step": 8950 - }, - { - "epoch": 0.25, - "learning_rate": 7.731385028111534e-06, - "loss": 0.2056, - "step": 8955 - }, - { - "epoch": 0.25, - "learning_rate": 7.72995804674791e-06, - "loss": 0.1993, - "step": 8960 - }, - { - "epoch": 0.25, - "learning_rate": 7.728531065384286e-06, - "loss": 0.2409, - "step": 8965 - }, - { - "epoch": 0.25, - "learning_rate": 7.727104084020664e-06, - "loss": 0.2607, - "step": 8970 - }, - { - "epoch": 0.25, - "learning_rate": 7.72567710265704e-06, - "loss": 0.202, - "step": 8975 - }, - { - "epoch": 0.25, - "learning_rate": 7.724250121293417e-06, - "loss": 0.098, - "step": 8980 - }, - { - "epoch": 0.25, - "learning_rate": 7.722823139929793e-06, - "loss": 0.1181, - "step": 8985 - }, - { - "epoch": 0.25, - "learning_rate": 7.72139615856617e-06, - "loss": 0.1399, - "step": 8990 - }, - { - "epoch": 0.25, - "learning_rate": 7.719969177202546e-06, - "loss": 0.3393, - "step": 8995 - }, - { - "epoch": 0.25, - "learning_rate": 7.718542195838922e-06, - "loss": 0.2566, - "step": 9000 - }, - { - "epoch": 0.25, - "learning_rate": 7.717115214475299e-06, - "loss": 0.1742, - "step": 9005 - }, - { - "epoch": 0.25, - "learning_rate": 7.715688233111677e-06, - "loss": 0.1669, - "step": 9010 - }, - { - "epoch": 0.25, - "learning_rate": 7.714261251748053e-06, - "loss": 0.1532, - "step": 9015 - }, - { - "epoch": 0.25, - "learning_rate": 7.71283427038443e-06, - "loss": 0.1997, - "step": 9020 - }, - { - "epoch": 0.25, - "learning_rate": 7.711407289020806e-06, - "loss": 0.102, - "step": 9025 - }, - { - "epoch": 0.25, - "learning_rate": 7.709980307657182e-06, - "loss": 0.1047, - "step": 9030 - }, - { - "epoch": 0.25, - "learning_rate": 7.70855332629356e-06, - "loss": 0.1207, - "step": 9035 - }, - { - "epoch": 0.25, - "learning_rate": 7.707126344929936e-06, - "loss": 0.1498, - "step": 9040 - }, - { - "epoch": 0.25, - "learning_rate": 7.705699363566313e-06, - "loss": 0.3169, - "step": 9045 - }, - { - "epoch": 0.25, - "learning_rate": 7.704272382202689e-06, - "loss": 0.5967, - "step": 9050 - }, - { - "epoch": 0.25, - "learning_rate": 7.702845400839065e-06, - "loss": 0.1251, - "step": 9055 - }, - { - "epoch": 0.25, - "learning_rate": 7.701418419475443e-06, - "loss": 0.1762, - "step": 9060 - }, - { - "epoch": 0.25, - "learning_rate": 7.69999143811182e-06, - "loss": 0.2053, - "step": 9065 - }, - { - "epoch": 0.25, - "learning_rate": 7.698564456748196e-06, - "loss": 0.223, - "step": 9070 - }, - { - "epoch": 0.25, - "learning_rate": 7.697137475384573e-06, - "loss": 0.1064, - "step": 9075 - }, - { - "epoch": 0.25, - "learning_rate": 7.695710494020949e-06, - "loss": 0.1265, - "step": 9080 - }, - { - "epoch": 0.25, - "learning_rate": 7.694283512657325e-06, - "loss": 0.0834, - "step": 9085 - }, - { - "epoch": 0.25, - "learning_rate": 7.692856531293702e-06, - "loss": 0.3055, - "step": 9090 - }, - { - "epoch": 0.25, - "learning_rate": 7.691429549930078e-06, - "loss": 0.3791, - "step": 9095 - }, - { - "epoch": 0.25, - "learning_rate": 7.690002568566454e-06, - "loss": 0.7226, - "step": 9100 - }, - { - "epoch": 0.25, - "learning_rate": 7.688575587202832e-06, - "loss": 0.2248, - "step": 9105 - }, - { - "epoch": 0.25, - "learning_rate": 7.687148605839209e-06, - "loss": 0.167, - "step": 9110 - }, - { - "epoch": 0.25, - "learning_rate": 7.685721624475585e-06, - "loss": 0.157, - "step": 9115 - }, - { - "epoch": 0.25, - "learning_rate": 7.684294643111961e-06, - "loss": 0.1776, - "step": 9120 - }, - { - "epoch": 0.25, - "learning_rate": 7.682867661748338e-06, - "loss": 0.1557, - "step": 9125 - }, - { - "epoch": 0.25, - "learning_rate": 7.681440680384716e-06, - "loss": 0.1552, - "step": 9130 - }, - { - "epoch": 0.25, - "learning_rate": 7.680013699021092e-06, - "loss": 0.1635, - "step": 9135 - }, - { - "epoch": 0.25, - "learning_rate": 7.678586717657468e-06, - "loss": 0.2556, - "step": 9140 - }, - { - "epoch": 0.25, - "learning_rate": 7.677159736293845e-06, - "loss": 0.3, - "step": 9145 - }, - { - "epoch": 0.25, - "learning_rate": 7.675732754930221e-06, - "loss": 0.4252, - "step": 9150 - }, - { - "epoch": 0.25, - "learning_rate": 7.674305773566599e-06, - "loss": 0.1934, - "step": 9155 - }, - { - "epoch": 0.25, - "learning_rate": 7.672878792202975e-06, - "loss": 0.1446, - "step": 9160 - }, - { - "epoch": 0.25, - "learning_rate": 7.671451810839352e-06, - "loss": 0.1904, - "step": 9165 - }, - { - "epoch": 0.25, - "learning_rate": 7.670024829475728e-06, - "loss": 0.2697, - "step": 9170 - }, - { - "epoch": 0.25, - "learning_rate": 7.668597848112104e-06, - "loss": 0.1665, - "step": 9175 - }, - { - "epoch": 0.25, - "learning_rate": 7.66717086674848e-06, - "loss": 0.0452, - "step": 9180 - }, - { - "epoch": 0.25, - "learning_rate": 7.665743885384857e-06, - "loss": 0.213, - "step": 9185 - }, - { - "epoch": 0.26, - "learning_rate": 7.664316904021233e-06, - "loss": 0.2696, - "step": 9190 - }, - { - "epoch": 0.26, - "learning_rate": 7.66288992265761e-06, - "loss": 0.254, - "step": 9195 - }, - { - "epoch": 0.26, - "learning_rate": 7.661462941293988e-06, - "loss": 0.34, - "step": 9200 - }, - { - "epoch": 0.26, - "learning_rate": 7.660035959930364e-06, - "loss": 0.2095, - "step": 9205 - }, - { - "epoch": 0.26, - "learning_rate": 7.65860897856674e-06, - "loss": 0.1563, - "step": 9210 - }, - { - "epoch": 0.26, - "learning_rate": 7.657181997203117e-06, - "loss": 0.1154, - "step": 9215 - }, - { - "epoch": 0.26, - "learning_rate": 7.655755015839493e-06, - "loss": 0.1982, - "step": 9220 - }, - { - "epoch": 0.26, - "learning_rate": 7.654328034475871e-06, - "loss": 0.1001, - "step": 9225 - }, - { - "epoch": 0.26, - "learning_rate": 7.652901053112247e-06, - "loss": 0.1257, - "step": 9230 - }, - { - "epoch": 0.26, - "learning_rate": 7.651474071748624e-06, - "loss": 0.1364, - "step": 9235 - }, - { - "epoch": 0.26, - "learning_rate": 7.650047090385e-06, - "loss": 0.1823, - "step": 9240 - }, - { - "epoch": 0.26, - "learning_rate": 7.648620109021376e-06, - "loss": 0.3176, - "step": 9245 - }, - { - "epoch": 0.26, - "learning_rate": 7.647193127657755e-06, - "loss": 0.411, - "step": 9250 - }, - { - "epoch": 0.26, - "learning_rate": 7.645766146294131e-06, - "loss": 0.168, - "step": 9255 - }, - { - "epoch": 0.26, - "learning_rate": 7.644339164930507e-06, - "loss": 0.2204, - "step": 9260 - }, - { - "epoch": 0.26, - "learning_rate": 7.642912183566884e-06, - "loss": 0.2458, - "step": 9265 - }, - { - "epoch": 0.26, - "learning_rate": 7.64148520220326e-06, - "loss": 0.1735, - "step": 9270 - }, - { - "epoch": 0.26, - "learning_rate": 7.640058220839636e-06, - "loss": 0.0257, - "step": 9275 - }, - { - "epoch": 0.26, - "learning_rate": 7.638631239476013e-06, - "loss": 0.2665, - "step": 9280 - }, - { - "epoch": 0.26, - "learning_rate": 7.637204258112389e-06, - "loss": 0.1184, - "step": 9285 - }, - { - "epoch": 0.26, - "learning_rate": 7.635777276748765e-06, - "loss": 0.1373, - "step": 9290 - }, - { - "epoch": 0.26, - "learning_rate": 7.634350295385143e-06, - "loss": 0.1819, - "step": 9295 - }, - { - "epoch": 0.26, - "learning_rate": 7.63292331402152e-06, - "loss": 0.226, - "step": 9300 - }, - { - "epoch": 0.26, - "learning_rate": 7.631496332657896e-06, - "loss": 0.1845, - "step": 9305 - }, - { - "epoch": 0.26, - "learning_rate": 7.630069351294272e-06, - "loss": 0.1571, - "step": 9310 - }, - { - "epoch": 0.26, - "learning_rate": 7.628642369930649e-06, - "loss": 0.1804, - "step": 9315 - }, - { - "epoch": 0.26, - "learning_rate": 7.627215388567027e-06, - "loss": 0.2218, - "step": 9320 - }, - { - "epoch": 0.26, - "learning_rate": 7.625788407203403e-06, - "loss": 0.1621, - "step": 9325 - }, - { - "epoch": 0.26, - "learning_rate": 7.624361425839779e-06, - "loss": 0.1616, - "step": 9330 - }, - { - "epoch": 0.26, - "learning_rate": 7.622934444476156e-06, - "loss": 0.1291, - "step": 9335 - }, - { - "epoch": 0.26, - "learning_rate": 7.621507463112532e-06, - "loss": 0.0476, - "step": 9340 - }, - { - "epoch": 0.26, - "learning_rate": 7.620080481748909e-06, - "loss": 0.1954, - "step": 9345 - }, - { - "epoch": 0.26, - "learning_rate": 7.6186535003852855e-06, - "loss": 0.4141, - "step": 9350 - }, - { - "epoch": 0.26, - "learning_rate": 7.617226519021662e-06, - "loss": 0.1552, - "step": 9355 - }, - { - "epoch": 0.26, - "learning_rate": 7.615799537658038e-06, - "loss": 0.1397, - "step": 9360 - }, - { - "epoch": 0.26, - "learning_rate": 7.614372556294416e-06, - "loss": 0.1373, - "step": 9365 - }, - { - "epoch": 0.26, - "learning_rate": 7.6129455749307926e-06, - "loss": 0.1499, - "step": 9370 - }, - { - "epoch": 0.26, - "learning_rate": 7.611518593567169e-06, - "loss": 0.1765, - "step": 9375 - }, - { - "epoch": 0.26, - "learning_rate": 7.610091612203545e-06, - "loss": 0.0806, - "step": 9380 - }, - { - "epoch": 0.26, - "learning_rate": 7.608664630839922e-06, - "loss": 0.0987, - "step": 9385 - }, - { - "epoch": 0.26, - "learning_rate": 7.607237649476299e-06, - "loss": 0.2782, - "step": 9390 - }, - { - "epoch": 0.26, - "learning_rate": 7.605810668112675e-06, - "loss": 0.4899, - "step": 9395 - }, - { - "epoch": 0.26, - "learning_rate": 7.6043836867490515e-06, - "loss": 0.4337, - "step": 9400 - }, - { - "epoch": 0.26, - "learning_rate": 7.602956705385428e-06, - "loss": 0.192, - "step": 9405 - }, - { - "epoch": 0.26, - "learning_rate": 7.601529724021804e-06, - "loss": 0.1428, - "step": 9410 - }, - { - "epoch": 0.26, - "learning_rate": 7.600102742658182e-06, - "loss": 0.2142, - "step": 9415 - }, - { - "epoch": 0.26, - "learning_rate": 7.5986757612945585e-06, - "loss": 0.2392, - "step": 9420 - }, - { - "epoch": 0.26, - "learning_rate": 7.597248779930935e-06, - "loss": 0.1141, - "step": 9425 - }, - { - "epoch": 0.26, - "learning_rate": 7.595821798567311e-06, - "loss": 0.0959, - "step": 9430 - }, - { - "epoch": 0.26, - "learning_rate": 7.5943948172036875e-06, - "loss": 0.3744, - "step": 9435 - }, - { - "epoch": 0.26, - "learning_rate": 7.592967835840065e-06, - "loss": 0.2595, - "step": 9440 - }, - { - "epoch": 0.26, - "learning_rate": 7.591540854476441e-06, - "loss": 0.1794, - "step": 9445 - }, - { - "epoch": 0.26, - "learning_rate": 7.590113873112817e-06, - "loss": 0.4224, - "step": 9450 - }, - { - "epoch": 0.26, - "learning_rate": 7.588686891749194e-06, - "loss": 0.2906, - "step": 9455 - }, - { - "epoch": 0.26, - "learning_rate": 7.587259910385572e-06, - "loss": 0.1409, - "step": 9460 - }, - { - "epoch": 0.26, - "learning_rate": 7.585832929021948e-06, - "loss": 0.1964, - "step": 9465 - }, - { - "epoch": 0.26, - "learning_rate": 7.5844059476583244e-06, - "loss": 0.2423, - "step": 9470 - }, - { - "epoch": 0.26, - "learning_rate": 7.582978966294701e-06, - "loss": 0.0667, - "step": 9475 - }, - { - "epoch": 0.26, - "learning_rate": 7.581551984931077e-06, - "loss": 0.1139, - "step": 9480 - }, - { - "epoch": 0.26, - "learning_rate": 7.580125003567454e-06, - "loss": 0.2279, - "step": 9485 - }, - { - "epoch": 0.26, - "learning_rate": 7.578698022203831e-06, - "loss": 0.3152, - "step": 9490 - }, - { - "epoch": 0.26, - "learning_rate": 7.577271040840207e-06, - "loss": 0.265, - "step": 9495 - }, - { - "epoch": 0.26, - "learning_rate": 7.575844059476583e-06, - "loss": 0.482, - "step": 9500 - }, - { - "epoch": 0.26, - "learning_rate": 7.57441707811296e-06, - "loss": 0.159, - "step": 9505 - }, - { - "epoch": 0.26, - "learning_rate": 7.572990096749338e-06, - "loss": 0.1347, - "step": 9510 - }, - { - "epoch": 0.26, - "learning_rate": 7.571563115385714e-06, - "loss": 0.1418, - "step": 9515 - }, - { - "epoch": 0.26, - "learning_rate": 7.57013613402209e-06, - "loss": 0.1773, - "step": 9520 - }, - { - "epoch": 0.26, - "learning_rate": 7.568709152658467e-06, - "loss": 0.0984, - "step": 9525 - }, - { - "epoch": 0.26, - "learning_rate": 7.567282171294843e-06, - "loss": 0.0493, - "step": 9530 - }, - { - "epoch": 0.26, - "learning_rate": 7.56585518993122e-06, - "loss": 0.3436, - "step": 9535 - }, - { - "epoch": 0.26, - "learning_rate": 7.5644282085675966e-06, - "loss": 0.2792, - "step": 9540 - }, - { - "epoch": 0.26, - "learning_rate": 7.563001227203973e-06, - "loss": 0.2537, - "step": 9545 - }, - { - "epoch": 0.26, - "learning_rate": 7.561574245840349e-06, - "loss": 0.2774, - "step": 9550 - }, - { - "epoch": 0.27, - "learning_rate": 7.560147264476727e-06, - "loss": 0.0976, - "step": 9555 - }, - { - "epoch": 0.27, - "learning_rate": 7.558720283113104e-06, - "loss": 0.2648, - "step": 9560 - }, - { - "epoch": 0.27, - "learning_rate": 7.55729330174948e-06, - "loss": 0.2325, - "step": 9565 - }, - { - "epoch": 0.27, - "learning_rate": 7.555866320385856e-06, - "loss": 0.2104, - "step": 9570 - }, - { - "epoch": 0.27, - "learning_rate": 7.554439339022233e-06, - "loss": 0.1456, - "step": 9575 - }, - { - "epoch": 0.27, - "learning_rate": 7.55301235765861e-06, - "loss": 0.1227, - "step": 9580 - }, - { - "epoch": 0.27, - "learning_rate": 7.551585376294986e-06, - "loss": 0.1161, - "step": 9585 - }, - { - "epoch": 0.27, - "learning_rate": 7.5501583949313625e-06, - "loss": 0.2457, - "step": 9590 - }, - { - "epoch": 0.27, - "learning_rate": 7.548731413567739e-06, - "loss": 0.3123, - "step": 9595 - }, - { - "epoch": 0.27, - "learning_rate": 7.547304432204115e-06, - "loss": 0.4145, - "step": 9600 - }, - { - "epoch": 0.27, - "learning_rate": 7.545877450840493e-06, - "loss": 0.1799, - "step": 9605 - }, - { - "epoch": 0.27, - "learning_rate": 7.5444504694768695e-06, - "loss": 0.1297, - "step": 9610 - }, - { - "epoch": 0.27, - "learning_rate": 7.543023488113246e-06, - "loss": 0.1053, - "step": 9615 - }, - { - "epoch": 0.27, - "learning_rate": 7.541596506749622e-06, - "loss": 0.2045, - "step": 9620 - }, - { - "epoch": 0.27, - "learning_rate": 7.5401695253859985e-06, - "loss": 0.1469, - "step": 9625 - }, - { - "epoch": 0.27, - "learning_rate": 7.538742544022376e-06, - "loss": 0.1846, - "step": 9630 - }, - { - "epoch": 0.27, - "learning_rate": 7.537315562658752e-06, - "loss": 0.1, - "step": 9635 - }, - { - "epoch": 0.27, - "learning_rate": 7.535888581295128e-06, - "loss": 0.1658, - "step": 9640 - }, - { - "epoch": 0.27, - "learning_rate": 7.534461599931505e-06, - "loss": 0.1718, - "step": 9645 - }, - { - "epoch": 0.27, - "learning_rate": 7.533034618567883e-06, - "loss": 0.263, - "step": 9650 - }, - { - "epoch": 0.27, - "learning_rate": 7.531607637204259e-06, - "loss": 0.1255, - "step": 9655 - }, - { - "epoch": 0.27, - "learning_rate": 7.5301806558406355e-06, - "loss": 0.2833, - "step": 9660 - }, - { - "epoch": 0.27, - "learning_rate": 7.528753674477012e-06, - "loss": 0.1569, - "step": 9665 - }, - { - "epoch": 0.27, - "learning_rate": 7.527326693113388e-06, - "loss": 0.153, - "step": 9670 - }, - { - "epoch": 0.27, - "learning_rate": 7.525899711749765e-06, - "loss": 0.237, - "step": 9675 - }, - { - "epoch": 0.27, - "learning_rate": 7.524472730386142e-06, - "loss": 0.0772, - "step": 9680 - }, - { - "epoch": 0.27, - "learning_rate": 7.523045749022518e-06, - "loss": 0.1243, - "step": 9685 - }, - { - "epoch": 0.27, - "learning_rate": 7.521618767658894e-06, - "loss": 0.1303, - "step": 9690 - }, - { - "epoch": 0.27, - "learning_rate": 7.5201917862952715e-06, - "loss": 0.2455, - "step": 9695 - }, - { - "epoch": 0.27, - "learning_rate": 7.518764804931649e-06, - "loss": 0.4695, - "step": 9700 - }, - { - "epoch": 0.27, - "learning_rate": 7.517337823568025e-06, - "loss": 0.1337, - "step": 9705 - }, - { - "epoch": 0.27, - "learning_rate": 7.515910842204401e-06, - "loss": 0.1306, - "step": 9710 - }, - { - "epoch": 0.27, - "learning_rate": 7.514483860840778e-06, - "loss": 0.1741, - "step": 9715 - }, - { - "epoch": 0.27, - "learning_rate": 7.513056879477154e-06, - "loss": 0.203, - "step": 9720 - }, - { - "epoch": 0.27, - "learning_rate": 7.511629898113531e-06, - "loss": 0.1038, - "step": 9725 - }, - { - "epoch": 0.27, - "learning_rate": 7.510202916749908e-06, - "loss": 0.1263, - "step": 9730 - }, - { - "epoch": 0.27, - "learning_rate": 7.508775935386285e-06, - "loss": 0.1612, - "step": 9735 - }, - { - "epoch": 0.27, - "learning_rate": 7.507348954022661e-06, - "loss": 0.2431, - "step": 9740 - }, - { - "epoch": 0.27, - "learning_rate": 7.505921972659038e-06, - "loss": 0.1577, - "step": 9745 - }, - { - "epoch": 0.27, - "learning_rate": 7.504494991295415e-06, - "loss": 0.3567, - "step": 9750 - }, - { - "epoch": 0.27, - "learning_rate": 7.503068009931791e-06, - "loss": 0.2375, - "step": 9755 - }, - { - "epoch": 0.27, - "learning_rate": 7.501641028568167e-06, - "loss": 0.1828, - "step": 9760 - }, - { - "epoch": 0.27, - "learning_rate": 7.500214047204544e-06, - "loss": 0.1248, - "step": 9765 - }, - { - "epoch": 0.27, - "learning_rate": 7.498787065840921e-06, - "loss": 0.2088, - "step": 9770 - }, - { - "epoch": 0.27, - "learning_rate": 7.497360084477297e-06, - "loss": 0.1981, - "step": 9775 - }, - { - "epoch": 0.27, - "learning_rate": 7.495933103113674e-06, - "loss": 0.139, - "step": 9780 - }, - { - "epoch": 0.27, - "learning_rate": 7.494506121750051e-06, - "loss": 0.1037, - "step": 9785 - }, - { - "epoch": 0.27, - "learning_rate": 7.493079140386427e-06, - "loss": 0.1607, - "step": 9790 - }, - { - "epoch": 0.27, - "learning_rate": 7.491652159022804e-06, - "loss": 0.3597, - "step": 9795 - }, - { - "epoch": 0.27, - "learning_rate": 7.4902251776591806e-06, - "loss": 0.2919, - "step": 9800 - }, - { - "epoch": 0.27, - "learning_rate": 7.488798196295557e-06, - "loss": 0.1854, - "step": 9805 - }, - { - "epoch": 0.27, - "learning_rate": 7.487371214931933e-06, - "loss": 0.1637, - "step": 9810 - }, - { - "epoch": 0.27, - "learning_rate": 7.48594423356831e-06, - "loss": 0.2263, - "step": 9815 - }, - { - "epoch": 0.27, - "learning_rate": 7.484517252204687e-06, - "loss": 0.1544, - "step": 9820 - }, - { - "epoch": 0.27, - "learning_rate": 7.483090270841064e-06, - "loss": 0.2028, - "step": 9825 - }, - { - "epoch": 0.27, - "learning_rate": 7.48166328947744e-06, - "loss": 0.12, - "step": 9830 - }, - { - "epoch": 0.27, - "learning_rate": 7.480236308113817e-06, - "loss": 0.1801, - "step": 9835 - }, - { - "epoch": 0.27, - "learning_rate": 7.478809326750194e-06, - "loss": 0.2422, - "step": 9840 - }, - { - "epoch": 0.27, - "learning_rate": 7.47738234538657e-06, - "loss": 0.1783, - "step": 9845 - }, - { - "epoch": 0.27, - "learning_rate": 7.4759553640229465e-06, - "loss": 0.6002, - "step": 9850 - }, - { - "epoch": 0.27, - "learning_rate": 7.474528382659323e-06, - "loss": 0.176, - "step": 9855 - }, - { - "epoch": 0.27, - "learning_rate": 7.473101401295699e-06, - "loss": 0.1873, - "step": 9860 - }, - { - "epoch": 0.27, - "learning_rate": 7.471674419932076e-06, - "loss": 0.2043, - "step": 9865 - }, - { - "epoch": 0.27, - "learning_rate": 7.4702474385684535e-06, - "loss": 0.1526, - "step": 9870 - }, - { - "epoch": 0.27, - "learning_rate": 7.46882045720483e-06, - "loss": 0.202, - "step": 9875 - }, - { - "epoch": 0.27, - "learning_rate": 7.467393475841206e-06, - "loss": 0.155, - "step": 9880 - }, - { - "epoch": 0.27, - "learning_rate": 7.4659664944775826e-06, - "loss": 0.1549, - "step": 9885 - }, - { - "epoch": 0.27, - "learning_rate": 7.46453951311396e-06, - "loss": 0.2724, - "step": 9890 - }, - { - "epoch": 0.27, - "learning_rate": 7.463112531750336e-06, - "loss": 0.2492, - "step": 9895 - }, - { - "epoch": 0.27, - "learning_rate": 7.461685550386712e-06, - "loss": 0.397, - "step": 9900 - }, - { - "epoch": 0.27, - "learning_rate": 7.460258569023089e-06, - "loss": 0.2147, - "step": 9905 - }, - { - "epoch": 0.27, - "learning_rate": 7.458831587659465e-06, - "loss": 0.1992, - "step": 9910 - }, - { - "epoch": 0.28, - "learning_rate": 7.457404606295843e-06, - "loss": 0.1494, - "step": 9915 - }, - { - "epoch": 0.28, - "learning_rate": 7.4559776249322195e-06, - "loss": 0.2049, - "step": 9920 - }, - { - "epoch": 0.28, - "learning_rate": 7.454550643568596e-06, - "loss": 0.1952, - "step": 9925 - }, - { - "epoch": 0.28, - "learning_rate": 7.453123662204972e-06, - "loss": 0.0743, - "step": 9930 - }, - { - "epoch": 0.28, - "learning_rate": 7.451696680841349e-06, - "loss": 0.1328, - "step": 9935 - }, - { - "epoch": 0.28, - "learning_rate": 7.450269699477726e-06, - "loss": 0.2897, - "step": 9940 - }, - { - "epoch": 0.28, - "learning_rate": 7.448842718114102e-06, - "loss": 0.2717, - "step": 9945 - }, - { - "epoch": 0.28, - "learning_rate": 7.447415736750478e-06, - "loss": 0.3851, - "step": 9950 - }, - { - "epoch": 0.28, - "learning_rate": 7.445988755386855e-06, - "loss": 0.2401, - "step": 9955 - }, - { - "epoch": 0.28, - "learning_rate": 7.444561774023233e-06, - "loss": 0.2105, - "step": 9960 - }, - { - "epoch": 0.28, - "learning_rate": 7.443134792659609e-06, - "loss": 0.1656, - "step": 9965 - }, - { - "epoch": 0.28, - "learning_rate": 7.441707811295985e-06, - "loss": 0.2268, - "step": 9970 - }, - { - "epoch": 0.28, - "learning_rate": 7.440280829932362e-06, - "loss": 0.1913, - "step": 9975 - }, - { - "epoch": 0.28, - "learning_rate": 7.438853848568738e-06, - "loss": 0.0646, - "step": 9980 - }, - { - "epoch": 0.28, - "learning_rate": 7.437426867205115e-06, - "loss": 0.143, - "step": 9985 - }, - { - "epoch": 0.28, - "learning_rate": 7.435999885841492e-06, - "loss": 0.1793, - "step": 9990 - }, - { - "epoch": 0.28, - "learning_rate": 7.434572904477868e-06, - "loss": 0.1764, - "step": 9995 - }, - { - "epoch": 0.28, - "learning_rate": 7.433145923114244e-06, - "loss": 0.2205, - "step": 10000 - }, - { - "epoch": 0.28, - "eval_loss": 0.07491611689329147, - "eval_runtime": 2332.1386, - "eval_samples_per_second": 6.868, - "eval_steps_per_second": 1.717, - "eval_wer": 0.2068698160836639, - "step": 10000 - }, - { - "epoch": 0.28, - "learning_rate": 7.431718941750621e-06, - "loss": 0.2567, - "step": 10005 - }, - { - "epoch": 0.28, - "learning_rate": 7.430291960386999e-06, - "loss": 0.1234, - "step": 10010 - }, - { - "epoch": 0.28, - "learning_rate": 7.428864979023375e-06, - "loss": 0.1736, - "step": 10015 - }, - { - "epoch": 0.28, - "learning_rate": 7.427437997659751e-06, - "loss": 0.2017, - "step": 10020 - }, - { - "epoch": 0.28, - "learning_rate": 7.426011016296128e-06, - "loss": 0.1199, - "step": 10025 - }, - { - "epoch": 0.28, - "learning_rate": 7.424584034932505e-06, - "loss": 0.0675, - "step": 10030 - }, - { - "epoch": 0.28, - "learning_rate": 7.423157053568881e-06, - "loss": 0.1714, - "step": 10035 - }, - { - "epoch": 0.28, - "learning_rate": 7.4217300722052575e-06, - "loss": 0.1121, - "step": 10040 - }, - { - "epoch": 0.28, - "learning_rate": 7.420303090841634e-06, - "loss": 0.2543, - "step": 10045 - }, - { - "epoch": 0.28, - "learning_rate": 7.41887610947801e-06, - "loss": 0.7649, - "step": 10050 - }, - { - "epoch": 0.28, - "learning_rate": 7.417449128114388e-06, - "loss": 0.1539, - "step": 10055 - }, - { - "epoch": 0.28, - "learning_rate": 7.4160221467507646e-06, - "loss": 0.1907, - "step": 10060 - }, - { - "epoch": 0.28, - "learning_rate": 7.414595165387141e-06, - "loss": 0.1908, - "step": 10065 - }, - { - "epoch": 0.28, - "learning_rate": 7.413168184023517e-06, - "loss": 0.2002, - "step": 10070 - }, - { - "epoch": 0.28, - "learning_rate": 7.411741202659894e-06, - "loss": 0.1605, - "step": 10075 - }, - { - "epoch": 0.28, - "learning_rate": 7.410314221296271e-06, - "loss": 0.1371, - "step": 10080 - }, - { - "epoch": 0.28, - "learning_rate": 7.408887239932647e-06, - "loss": 0.227, - "step": 10085 - }, - { - "epoch": 0.28, - "learning_rate": 7.4074602585690235e-06, - "loss": 0.3145, - "step": 10090 - }, - { - "epoch": 0.28, - "learning_rate": 7.4060332772054e-06, - "loss": 0.3825, - "step": 10095 - }, - { - "epoch": 0.28, - "learning_rate": 7.404606295841776e-06, - "loss": 0.4545, - "step": 10100 - }, - { - "epoch": 0.28, - "learning_rate": 7.403179314478154e-06, - "loss": 0.1605, - "step": 10105 - }, - { - "epoch": 0.28, - "learning_rate": 7.4017523331145305e-06, - "loss": 0.1218, - "step": 10110 - }, - { - "epoch": 0.28, - "learning_rate": 7.400325351750907e-06, - "loss": 0.1969, - "step": 10115 - }, - { - "epoch": 0.28, - "learning_rate": 7.398898370387283e-06, - "loss": 0.159, - "step": 10120 - }, - { - "epoch": 0.28, - "learning_rate": 7.39747138902366e-06, - "loss": 0.2698, - "step": 10125 - }, - { - "epoch": 0.28, - "learning_rate": 7.396044407660037e-06, - "loss": 0.1793, - "step": 10130 - }, - { - "epoch": 0.28, - "learning_rate": 7.394617426296413e-06, - "loss": 0.1331, - "step": 10135 - }, - { - "epoch": 0.28, - "learning_rate": 7.393190444932789e-06, - "loss": 0.2675, - "step": 10140 - }, - { - "epoch": 0.28, - "learning_rate": 7.391763463569166e-06, - "loss": 0.3275, - "step": 10145 - }, - { - "epoch": 0.28, - "learning_rate": 7.390336482205544e-06, - "loss": 0.3463, - "step": 10150 - }, - { - "epoch": 0.28, - "learning_rate": 7.38890950084192e-06, - "loss": 0.1608, - "step": 10155 - }, - { - "epoch": 0.28, - "learning_rate": 7.3874825194782964e-06, - "loss": 0.1301, - "step": 10160 - }, - { - "epoch": 0.28, - "learning_rate": 7.386055538114673e-06, - "loss": 0.1259, - "step": 10165 - }, - { - "epoch": 0.28, - "learning_rate": 7.384628556751049e-06, - "loss": 0.2146, - "step": 10170 - }, - { - "epoch": 0.28, - "learning_rate": 7.383201575387426e-06, - "loss": 0.1014, - "step": 10175 - }, - { - "epoch": 0.28, - "learning_rate": 7.381774594023803e-06, - "loss": 0.1242, - "step": 10180 - }, - { - "epoch": 0.28, - "learning_rate": 7.380347612660179e-06, - "loss": 0.0413, - "step": 10185 - }, - { - "epoch": 0.28, - "learning_rate": 7.378920631296555e-06, - "loss": 0.2255, - "step": 10190 - }, - { - "epoch": 0.28, - "learning_rate": 7.377493649932932e-06, - "loss": 0.291, - "step": 10195 - }, - { - "epoch": 0.28, - "learning_rate": 7.37606666856931e-06, - "loss": 0.7039, - "step": 10200 - }, - { - "epoch": 0.28, - "learning_rate": 7.374639687205686e-06, - "loss": 0.1755, - "step": 10205 - }, - { - "epoch": 0.28, - "learning_rate": 7.373212705842062e-06, - "loss": 0.248, - "step": 10210 - }, - { - "epoch": 0.28, - "learning_rate": 7.371785724478439e-06, - "loss": 0.1566, - "step": 10215 - }, - { - "epoch": 0.28, - "learning_rate": 7.370358743114816e-06, - "loss": 0.1532, - "step": 10220 - }, - { - "epoch": 0.28, - "learning_rate": 7.368931761751192e-06, - "loss": 0.0946, - "step": 10225 - }, - { - "epoch": 0.28, - "learning_rate": 7.3675047803875686e-06, - "loss": 0.1811, - "step": 10230 - }, - { - "epoch": 0.28, - "learning_rate": 7.366077799023945e-06, - "loss": 0.2768, - "step": 10235 - }, - { - "epoch": 0.28, - "learning_rate": 7.364650817660321e-06, - "loss": 0.2201, - "step": 10240 - }, - { - "epoch": 0.28, - "learning_rate": 7.363223836296699e-06, - "loss": 0.238, - "step": 10245 - }, - { - "epoch": 0.28, - "learning_rate": 7.361796854933076e-06, - "loss": 0.4387, - "step": 10250 - }, - { - "epoch": 0.28, - "learning_rate": 7.360369873569452e-06, - "loss": 0.1397, - "step": 10255 - }, - { - "epoch": 0.28, - "learning_rate": 7.358942892205828e-06, - "loss": 0.1958, - "step": 10260 - }, - { - "epoch": 0.28, - "learning_rate": 7.357515910842205e-06, - "loss": 0.1626, - "step": 10265 - }, - { - "epoch": 0.28, - "learning_rate": 7.356088929478582e-06, - "loss": 0.2076, - "step": 10270 - }, - { - "epoch": 0.29, - "learning_rate": 7.354661948114958e-06, - "loss": 0.2224, - "step": 10275 - }, - { - "epoch": 0.29, - "learning_rate": 7.3532349667513345e-06, - "loss": 0.0584, - "step": 10280 - }, - { - "epoch": 0.29, - "learning_rate": 7.351807985387711e-06, - "loss": 0.1163, - "step": 10285 - }, - { - "epoch": 0.29, - "learning_rate": 7.350381004024087e-06, - "loss": 0.3164, - "step": 10290 - }, - { - "epoch": 0.29, - "learning_rate": 7.348954022660465e-06, - "loss": 0.2504, - "step": 10295 - }, - { - "epoch": 0.29, - "learning_rate": 7.3475270412968415e-06, - "loss": 0.3822, - "step": 10300 - }, - { - "epoch": 0.29, - "learning_rate": 7.346100059933218e-06, - "loss": 0.1097, - "step": 10305 - }, - { - "epoch": 0.29, - "learning_rate": 7.344673078569594e-06, - "loss": 0.2248, - "step": 10310 - }, - { - "epoch": 0.29, - "learning_rate": 7.343246097205971e-06, - "loss": 0.1898, - "step": 10315 - }, - { - "epoch": 0.29, - "learning_rate": 7.341819115842348e-06, - "loss": 0.2194, - "step": 10320 - }, - { - "epoch": 0.29, - "learning_rate": 7.340392134478724e-06, - "loss": 0.0948, - "step": 10325 - }, - { - "epoch": 0.29, - "learning_rate": 7.3389651531151e-06, - "loss": 0.16, - "step": 10330 - }, - { - "epoch": 0.29, - "learning_rate": 7.337538171751477e-06, - "loss": 0.1801, - "step": 10335 - }, - { - "epoch": 0.29, - "learning_rate": 7.336111190387855e-06, - "loss": 0.2755, - "step": 10340 - }, - { - "epoch": 0.29, - "learning_rate": 7.334684209024231e-06, - "loss": 0.3869, - "step": 10345 - }, - { - "epoch": 0.29, - "learning_rate": 7.3332572276606075e-06, - "loss": 0.3723, - "step": 10350 - }, - { - "epoch": 0.29, - "learning_rate": 7.331830246296984e-06, - "loss": 0.1728, - "step": 10355 - }, - { - "epoch": 0.29, - "learning_rate": 7.33040326493336e-06, - "loss": 0.1652, - "step": 10360 - }, - { - "epoch": 0.29, - "learning_rate": 7.328976283569737e-06, - "loss": 0.2152, - "step": 10365 - }, - { - "epoch": 0.29, - "learning_rate": 7.327549302206114e-06, - "loss": 0.2127, - "step": 10370 - }, - { - "epoch": 0.29, - "learning_rate": 7.32612232084249e-06, - "loss": 0.0725, - "step": 10375 - }, - { - "epoch": 0.29, - "learning_rate": 7.324695339478866e-06, - "loss": 0.1122, - "step": 10380 - }, - { - "epoch": 0.29, - "learning_rate": 7.323268358115243e-06, - "loss": 0.098, - "step": 10385 - }, - { - "epoch": 0.29, - "learning_rate": 7.321841376751621e-06, - "loss": 0.1685, - "step": 10390 - }, - { - "epoch": 0.29, - "learning_rate": 7.320414395387997e-06, - "loss": 0.2073, - "step": 10395 - }, - { - "epoch": 0.29, - "learning_rate": 7.318987414024373e-06, - "loss": 0.3399, - "step": 10400 - }, - { - "epoch": 0.29, - "learning_rate": 7.31756043266075e-06, - "loss": 0.1522, - "step": 10405 - }, - { - "epoch": 0.29, - "learning_rate": 7.316133451297127e-06, - "loss": 0.2102, - "step": 10410 - }, - { - "epoch": 0.29, - "learning_rate": 7.314706469933503e-06, - "loss": 0.2329, - "step": 10415 - }, - { - "epoch": 0.29, - "learning_rate": 7.31327948856988e-06, - "loss": 0.227, - "step": 10420 - }, - { - "epoch": 0.29, - "learning_rate": 7.312137903478981e-06, - "loss": 1.2355, - "step": 10425 - }, - { - "epoch": 0.29, - "learning_rate": 7.310710922115358e-06, - "loss": 0.1112, - "step": 10430 - }, - { - "epoch": 0.29, - "learning_rate": 7.309283940751734e-06, - "loss": 0.1159, - "step": 10435 - }, - { - "epoch": 0.29, - "learning_rate": 7.307856959388111e-06, - "loss": 0.1421, - "step": 10440 - }, - { - "epoch": 0.29, - "learning_rate": 7.306429978024487e-06, - "loss": 0.36, - "step": 10445 - }, - { - "epoch": 0.29, - "learning_rate": 7.305002996660863e-06, - "loss": 0.415, - "step": 10450 - }, - { - "epoch": 0.29, - "learning_rate": 7.303576015297241e-06, - "loss": 0.3397, - "step": 10455 - }, - { - "epoch": 0.29, - "learning_rate": 7.302149033933618e-06, - "loss": 0.1816, - "step": 10460 - }, - { - "epoch": 0.29, - "learning_rate": 7.300722052569994e-06, - "loss": 0.1479, - "step": 10465 - }, - { - "epoch": 0.29, - "learning_rate": 7.29929507120637e-06, - "loss": 0.176, - "step": 10470 - }, - { - "epoch": 0.29, - "learning_rate": 7.297868089842747e-06, - "loss": 0.1749, - "step": 10475 - }, - { - "epoch": 0.29, - "learning_rate": 7.296441108479124e-06, - "loss": 0.0827, - "step": 10480 - }, - { - "epoch": 0.29, - "learning_rate": 7.2950141271155e-06, - "loss": 0.1076, - "step": 10485 - }, - { - "epoch": 0.29, - "learning_rate": 7.293587145751877e-06, - "loss": 0.2105, - "step": 10490 - }, - { - "epoch": 0.29, - "learning_rate": 7.292160164388253e-06, - "loss": 0.3473, - "step": 10495 - }, - { - "epoch": 0.29, - "learning_rate": 7.290733183024631e-06, - "loss": 0.6358, - "step": 10500 - }, - { - "epoch": 0.29, - "learning_rate": 7.289306201661007e-06, - "loss": 0.1205, - "step": 10505 - }, - { - "epoch": 0.29, - "learning_rate": 7.287879220297384e-06, - "loss": 0.1851, - "step": 10510 - }, - { - "epoch": 0.29, - "learning_rate": 7.28645223893376e-06, - "loss": 0.1954, - "step": 10515 - }, - { - "epoch": 0.29, - "learning_rate": 7.285025257570136e-06, - "loss": 0.2525, - "step": 10520 - }, - { - "epoch": 0.29, - "learning_rate": 7.2835982762065135e-06, - "loss": 0.2418, - "step": 10525 - }, - { - "epoch": 0.29, - "learning_rate": 7.28217129484289e-06, - "loss": 0.0711, - "step": 10530 - }, - { - "epoch": 0.29, - "learning_rate": 7.280744313479266e-06, - "loss": 0.1908, - "step": 10535 - }, - { - "epoch": 0.29, - "learning_rate": 7.2793173321156425e-06, - "loss": 0.2853, - "step": 10540 - }, - { - "epoch": 0.29, - "learning_rate": 7.27789035075202e-06, - "loss": 0.3841, - "step": 10545 - }, - { - "epoch": 0.29, - "learning_rate": 7.276463369388397e-06, - "loss": 0.6, - "step": 10550 - }, - { - "epoch": 0.29, - "learning_rate": 7.275036388024773e-06, - "loss": 0.11, - "step": 10555 - }, - { - "epoch": 0.29, - "learning_rate": 7.27360940666115e-06, - "loss": 0.1714, - "step": 10560 - }, - { - "epoch": 0.29, - "learning_rate": 7.272182425297526e-06, - "loss": 0.0995, - "step": 10565 - }, - { - "epoch": 0.29, - "learning_rate": 7.270755443933902e-06, - "loss": 0.1887, - "step": 10570 - }, - { - "epoch": 0.29, - "learning_rate": 7.2693284625702795e-06, - "loss": 0.1676, - "step": 10575 - }, - { - "epoch": 0.29, - "learning_rate": 7.267901481206656e-06, - "loss": 0.1543, - "step": 10580 - }, - { - "epoch": 0.29, - "learning_rate": 7.266474499843032e-06, - "loss": 0.0817, - "step": 10585 - }, - { - "epoch": 0.29, - "learning_rate": 7.265047518479409e-06, - "loss": 0.1569, - "step": 10590 - }, - { - "epoch": 0.29, - "learning_rate": 7.2636205371157865e-06, - "loss": 0.2467, - "step": 10595 - }, - { - "epoch": 0.29, - "learning_rate": 7.262193555752163e-06, - "loss": 0.3902, - "step": 10600 - }, - { - "epoch": 0.29, - "learning_rate": 7.260766574388539e-06, - "loss": 0.1886, - "step": 10605 - }, - { - "epoch": 0.29, - "learning_rate": 7.2593395930249155e-06, - "loss": 0.2343, - "step": 10610 - }, - { - "epoch": 0.29, - "learning_rate": 7.257912611661292e-06, - "loss": 0.1152, - "step": 10615 - }, - { - "epoch": 0.29, - "learning_rate": 7.256485630297669e-06, - "loss": 0.2069, - "step": 10620 - }, - { - "epoch": 0.29, - "learning_rate": 7.255058648934045e-06, - "loss": 0.1517, - "step": 10625 - }, - { - "epoch": 0.29, - "learning_rate": 7.253631667570422e-06, - "loss": 0.1141, - "step": 10630 - }, - { - "epoch": 0.3, - "learning_rate": 7.252204686206799e-06, - "loss": 0.1, - "step": 10635 - }, - { - "epoch": 0.3, - "learning_rate": 7.250777704843175e-06, - "loss": 0.2799, - "step": 10640 - }, - { - "epoch": 0.3, - "learning_rate": 7.2493507234795524e-06, - "loss": 0.3713, - "step": 10645 - }, - { - "epoch": 0.3, - "learning_rate": 7.247923742115929e-06, - "loss": 0.2662, - "step": 10650 - }, - { - "epoch": 0.3, - "learning_rate": 7.246496760752305e-06, - "loss": 0.1017, - "step": 10655 - }, - { - "epoch": 0.3, - "learning_rate": 7.2450697793886815e-06, - "loss": 0.1982, - "step": 10660 - }, - { - "epoch": 0.3, - "learning_rate": 7.243642798025058e-06, - "loss": 0.183, - "step": 10665 - }, - { - "epoch": 0.3, - "learning_rate": 7.242215816661435e-06, - "loss": 0.1771, - "step": 10670 - }, - { - "epoch": 0.3, - "learning_rate": 7.240788835297811e-06, - "loss": 0.155, - "step": 10675 - }, - { - "epoch": 0.3, - "learning_rate": 7.2393618539341885e-06, - "loss": 0.077, - "step": 10680 - }, - { - "epoch": 0.3, - "learning_rate": 7.237934872570565e-06, - "loss": 0.0747, - "step": 10685 - }, - { - "epoch": 0.3, - "learning_rate": 7.236507891206942e-06, - "loss": 0.4591, - "step": 10690 - }, - { - "epoch": 0.3, - "learning_rate": 7.235080909843318e-06, - "loss": 0.3071, - "step": 10695 - }, - { - "epoch": 0.3, - "learning_rate": 7.233653928479695e-06, - "loss": 0.4575, - "step": 10700 - }, - { - "epoch": 0.3, - "learning_rate": 7.232226947116071e-06, - "loss": 0.5442, - "step": 10705 - }, - { - "epoch": 0.3, - "learning_rate": 7.230799965752447e-06, - "loss": 0.2193, - "step": 10710 - }, - { - "epoch": 0.3, - "learning_rate": 7.2293729843888246e-06, - "loss": 0.225, - "step": 10715 - }, - { - "epoch": 0.3, - "learning_rate": 7.227946003025202e-06, - "loss": 0.3045, - "step": 10720 - }, - { - "epoch": 0.3, - "learning_rate": 7.226519021661578e-06, - "loss": 0.1232, - "step": 10725 - }, - { - "epoch": 0.3, - "learning_rate": 7.2250920402979544e-06, - "loss": 0.1332, - "step": 10730 - }, - { - "epoch": 0.3, - "learning_rate": 7.223665058934331e-06, - "loss": 0.0676, - "step": 10735 - }, - { - "epoch": 0.3, - "learning_rate": 7.222238077570708e-06, - "loss": 0.2668, - "step": 10740 - }, - { - "epoch": 0.3, - "learning_rate": 7.220811096207084e-06, - "loss": 0.3183, - "step": 10745 - }, - { - "epoch": 0.3, - "learning_rate": 7.219384114843461e-06, - "loss": 0.3311, - "step": 10750 - }, - { - "epoch": 0.3, - "learning_rate": 7.217957133479837e-06, - "loss": 0.1576, - "step": 10755 - }, - { - "epoch": 0.3, - "learning_rate": 7.216530152116213e-06, - "loss": 0.1797, - "step": 10760 - }, - { - "epoch": 0.3, - "learning_rate": 7.215103170752591e-06, - "loss": 0.1971, - "step": 10765 - }, - { - "epoch": 0.3, - "learning_rate": 7.213676189388968e-06, - "loss": 0.231, - "step": 10770 - }, - { - "epoch": 0.3, - "learning_rate": 7.212249208025344e-06, - "loss": 0.1203, - "step": 10775 - }, - { - "epoch": 0.3, - "learning_rate": 7.21082222666172e-06, - "loss": 0.1624, - "step": 10780 - }, - { - "epoch": 0.3, - "learning_rate": 7.2093952452980975e-06, - "loss": 0.1252, - "step": 10785 - }, - { - "epoch": 0.3, - "learning_rate": 7.207968263934474e-06, - "loss": 0.1593, - "step": 10790 - }, - { - "epoch": 0.3, - "learning_rate": 7.20654128257085e-06, - "loss": 0.1432, - "step": 10795 - }, - { - "epoch": 0.3, - "learning_rate": 7.2051143012072266e-06, - "loss": 0.4471, - "step": 10800 - }, - { - "epoch": 0.3, - "learning_rate": 7.203687319843603e-06, - "loss": 0.154, - "step": 10805 - }, - { - "epoch": 0.3, - "learning_rate": 7.202260338479981e-06, - "loss": 0.2305, - "step": 10810 - }, - { - "epoch": 0.3, - "learning_rate": 7.200833357116357e-06, - "loss": 0.2097, - "step": 10815 - }, - { - "epoch": 0.3, - "learning_rate": 7.199406375752734e-06, - "loss": 0.13, - "step": 10820 - }, - { - "epoch": 0.3, - "learning_rate": 7.19797939438911e-06, - "loss": 0.1908, - "step": 10825 - }, - { - "epoch": 0.3, - "learning_rate": 7.196552413025486e-06, - "loss": 0.0708, - "step": 10830 - }, - { - "epoch": 0.3, - "learning_rate": 7.1951254316618635e-06, - "loss": 0.172, - "step": 10835 - }, - { - "epoch": 0.3, - "learning_rate": 7.19369845029824e-06, - "loss": 0.2536, - "step": 10840 - }, - { - "epoch": 0.3, - "learning_rate": 7.192271468934616e-06, - "loss": 0.1223, - "step": 10845 - }, - { - "epoch": 0.3, - "learning_rate": 7.1908444875709925e-06, - "loss": 0.533, - "step": 10850 - }, - { - "epoch": 0.3, - "learning_rate": 7.189417506207369e-06, - "loss": 0.1416, - "step": 10855 - }, - { - "epoch": 0.3, - "learning_rate": 7.187990524843747e-06, - "loss": 0.1807, - "step": 10860 - }, - { - "epoch": 0.3, - "learning_rate": 7.186563543480123e-06, - "loss": 0.2, - "step": 10865 - }, - { - "epoch": 0.3, - "learning_rate": 7.1851365621164995e-06, - "loss": 0.1764, - "step": 10870 - }, - { - "epoch": 0.3, - "learning_rate": 7.183709580752876e-06, - "loss": 0.1812, - "step": 10875 - }, - { - "epoch": 0.3, - "learning_rate": 7.182282599389253e-06, - "loss": 0.0932, - "step": 10880 - }, - { - "epoch": 0.3, - "learning_rate": 7.180855618025629e-06, - "loss": 0.2631, - "step": 10885 - }, - { - "epoch": 0.3, - "learning_rate": 7.179428636662006e-06, - "loss": 0.0859, - "step": 10890 - }, - { - "epoch": 0.3, - "learning_rate": 7.178001655298382e-06, - "loss": 0.1994, - "step": 10895 - }, - { - "epoch": 0.3, - "learning_rate": 7.176574673934758e-06, - "loss": 0.3887, - "step": 10900 - }, - { - "epoch": 0.3, - "learning_rate": 7.1751476925711364e-06, - "loss": 0.1399, - "step": 10905 - }, - { - "epoch": 0.3, - "learning_rate": 7.173720711207513e-06, - "loss": 0.2339, - "step": 10910 - }, - { - "epoch": 0.3, - "learning_rate": 7.172293729843889e-06, - "loss": 0.2061, - "step": 10915 - }, - { - "epoch": 0.3, - "learning_rate": 7.1708667484802655e-06, - "loss": 0.1486, - "step": 10920 - }, - { - "epoch": 0.3, - "learning_rate": 7.169439767116642e-06, - "loss": 0.1816, - "step": 10925 - }, - { - "epoch": 0.3, - "learning_rate": 7.168012785753019e-06, - "loss": 0.13, - "step": 10930 - }, - { - "epoch": 0.3, - "learning_rate": 7.166585804389395e-06, - "loss": 0.155, - "step": 10935 - }, - { - "epoch": 0.3, - "learning_rate": 7.165158823025772e-06, - "loss": 0.1147, - "step": 10940 - }, - { - "epoch": 0.3, - "learning_rate": 7.163731841662148e-06, - "loss": 0.2045, - "step": 10945 - }, - { - "epoch": 0.3, - "learning_rate": 7.162304860298524e-06, - "loss": 0.2344, - "step": 10950 - }, - { - "epoch": 0.3, - "learning_rate": 7.160877878934902e-06, - "loss": 0.301, - "step": 10955 - }, - { - "epoch": 0.3, - "learning_rate": 7.159450897571279e-06, - "loss": 0.213, - "step": 10960 - }, - { - "epoch": 0.3, - "learning_rate": 7.158023916207655e-06, - "loss": 0.1779, - "step": 10965 - }, - { - "epoch": 0.3, - "learning_rate": 7.156596934844031e-06, - "loss": 0.2003, - "step": 10970 - }, - { - "epoch": 0.3, - "learning_rate": 7.1551699534804086e-06, - "loss": 0.1772, - "step": 10975 - }, - { - "epoch": 0.3, - "learning_rate": 7.153742972116785e-06, - "loss": 0.0908, - "step": 10980 - }, - { - "epoch": 0.3, - "learning_rate": 7.152315990753161e-06, - "loss": 0.1826, - "step": 10985 - }, - { - "epoch": 0.3, - "learning_rate": 7.150889009389538e-06, - "loss": 0.2637, - "step": 10990 - }, - { - "epoch": 0.31, - "learning_rate": 7.149462028025914e-06, - "loss": 0.4362, - "step": 10995 - }, - { - "epoch": 0.31, - "learning_rate": 7.148035046662292e-06, - "loss": 0.5842, - "step": 11000 - }, - { - "epoch": 0.31, - "learning_rate": 7.146608065298668e-06, - "loss": 0.1434, - "step": 11005 - }, - { - "epoch": 0.31, - "learning_rate": 7.145181083935045e-06, - "loss": 0.106, - "step": 11010 - }, - { - "epoch": 0.31, - "learning_rate": 7.143754102571421e-06, - "loss": 0.1779, - "step": 11015 - }, - { - "epoch": 0.31, - "learning_rate": 7.142327121207797e-06, - "loss": 0.219, - "step": 11020 - }, - { - "epoch": 0.31, - "learning_rate": 7.1409001398441745e-06, - "loss": 0.1088, - "step": 11025 - }, - { - "epoch": 0.31, - "learning_rate": 7.139473158480551e-06, - "loss": 0.0586, - "step": 11030 - }, - { - "epoch": 0.31, - "learning_rate": 7.138046177116927e-06, - "loss": 0.2313, - "step": 11035 - }, - { - "epoch": 0.31, - "learning_rate": 7.1366191957533035e-06, - "loss": 0.2773, - "step": 11040 - }, - { - "epoch": 0.31, - "learning_rate": 7.135477610662406e-06, - "loss": 1.0288, - "step": 11045 - }, - { - "epoch": 0.31, - "learning_rate": 7.134050629298782e-06, - "loss": 0.2824, - "step": 11050 - }, - { - "epoch": 0.31, - "learning_rate": 7.132623647935158e-06, - "loss": 0.1649, - "step": 11055 - }, - { - "epoch": 0.31, - "learning_rate": 7.131196666571535e-06, - "loss": 0.1973, - "step": 11060 - }, - { - "epoch": 0.31, - "learning_rate": 7.129769685207911e-06, - "loss": 0.1333, - "step": 11065 - }, - { - "epoch": 0.31, - "learning_rate": 7.128342703844289e-06, - "loss": 0.16, - "step": 11070 - }, - { - "epoch": 0.31, - "learning_rate": 7.126915722480665e-06, - "loss": 0.1792, - "step": 11075 - }, - { - "epoch": 0.31, - "learning_rate": 7.125488741117042e-06, - "loss": 0.1677, - "step": 11080 - }, - { - "epoch": 0.31, - "learning_rate": 7.124061759753418e-06, - "loss": 0.0933, - "step": 11085 - }, - { - "epoch": 0.31, - "learning_rate": 7.122634778389795e-06, - "loss": 0.0849, - "step": 11090 - }, - { - "epoch": 0.31, - "learning_rate": 7.1212077970261715e-06, - "loss": 0.2138, - "step": 11095 - }, - { - "epoch": 0.31, - "learning_rate": 7.119780815662548e-06, - "loss": 0.4769, - "step": 11100 - }, - { - "epoch": 0.31, - "learning_rate": 7.118353834298924e-06, - "loss": 0.1347, - "step": 11105 - }, - { - "epoch": 0.31, - "learning_rate": 7.1169268529353005e-06, - "loss": 0.1429, - "step": 11110 - }, - { - "epoch": 0.31, - "learning_rate": 7.115499871571679e-06, - "loss": 0.1614, - "step": 11115 - }, - { - "epoch": 0.31, - "learning_rate": 7.114072890208055e-06, - "loss": 0.1527, - "step": 11120 - }, - { - "epoch": 0.31, - "learning_rate": 7.112645908844431e-06, - "loss": 0.1226, - "step": 11125 - }, - { - "epoch": 0.31, - "learning_rate": 7.111218927480808e-06, - "loss": 0.1522, - "step": 11130 - }, - { - "epoch": 0.31, - "learning_rate": 7.109791946117184e-06, - "loss": 0.2053, - "step": 11135 - }, - { - "epoch": 0.31, - "learning_rate": 7.108364964753561e-06, - "loss": 0.2242, - "step": 11140 - }, - { - "epoch": 0.31, - "learning_rate": 7.1069379833899375e-06, - "loss": 0.2609, - "step": 11145 - }, - { - "epoch": 0.31, - "learning_rate": 7.105511002026314e-06, - "loss": 0.2835, - "step": 11150 - }, - { - "epoch": 0.31, - "learning_rate": 7.10408402066269e-06, - "loss": 0.1587, - "step": 11155 - }, - { - "epoch": 0.31, - "learning_rate": 7.1026570392990665e-06, - "loss": 0.1726, - "step": 11160 - }, - { - "epoch": 0.31, - "learning_rate": 7.1012300579354445e-06, - "loss": 0.1555, - "step": 11165 - }, - { - "epoch": 0.31, - "learning_rate": 7.099803076571821e-06, - "loss": 0.2174, - "step": 11170 - }, - { - "epoch": 0.31, - "learning_rate": 7.098376095208197e-06, - "loss": 0.2005, - "step": 11175 - }, - { - "epoch": 0.31, - "learning_rate": 7.0969491138445735e-06, - "loss": 0.0682, - "step": 11180 - }, - { - "epoch": 0.31, - "learning_rate": 7.095522132480951e-06, - "loss": 0.0635, - "step": 11185 - }, - { - "epoch": 0.31, - "learning_rate": 7.094095151117327e-06, - "loss": 0.1272, - "step": 11190 - }, - { - "epoch": 0.31, - "learning_rate": 7.092668169753703e-06, - "loss": 0.1967, - "step": 11195 - }, - { - "epoch": 0.31, - "learning_rate": 7.09124118839008e-06, - "loss": 0.3992, - "step": 11200 - }, - { - "epoch": 0.31, - "learning_rate": 7.089814207026456e-06, - "loss": 0.1422, - "step": 11205 - }, - { - "epoch": 0.31, - "learning_rate": 7.088387225662834e-06, - "loss": 0.1684, - "step": 11210 - }, - { - "epoch": 0.31, - "learning_rate": 7.0869602442992104e-06, - "loss": 0.1779, - "step": 11215 - }, - { - "epoch": 0.31, - "learning_rate": 7.085533262935587e-06, - "loss": 0.1859, - "step": 11220 - }, - { - "epoch": 0.31, - "learning_rate": 7.084106281571963e-06, - "loss": 0.1575, - "step": 11225 - }, - { - "epoch": 0.31, - "learning_rate": 7.0826793002083395e-06, - "loss": 0.0327, - "step": 11230 - }, - { - "epoch": 0.31, - "learning_rate": 7.081252318844717e-06, - "loss": 0.1897, - "step": 11235 - }, - { - "epoch": 0.31, - "learning_rate": 7.079825337481093e-06, - "loss": 0.2325, - "step": 11240 - }, - { - "epoch": 0.31, - "learning_rate": 7.078398356117469e-06, - "loss": 0.2526, - "step": 11245 - }, - { - "epoch": 0.31, - "learning_rate": 7.076971374753846e-06, - "loss": 0.3376, - "step": 11250 - }, - { - "epoch": 0.31, - "learning_rate": 7.075544393390222e-06, - "loss": 0.1749, - "step": 11255 - }, - { - "epoch": 0.31, - "learning_rate": 7.0741174120266e-06, - "loss": 0.1364, - "step": 11260 - }, - { - "epoch": 0.31, - "learning_rate": 7.072690430662976e-06, - "loss": 0.1842, - "step": 11265 - }, - { - "epoch": 0.31, - "learning_rate": 7.071263449299353e-06, - "loss": 0.2257, - "step": 11270 - }, - { - "epoch": 0.31, - "learning_rate": 7.069836467935729e-06, - "loss": 0.2042, - "step": 11275 - }, - { - "epoch": 0.31, - "learning_rate": 7.068409486572106e-06, - "loss": 0.196, - "step": 11280 - }, - { - "epoch": 0.31, - "learning_rate": 7.0669825052084826e-06, - "loss": 0.2094, - "step": 11285 - }, - { - "epoch": 0.31, - "learning_rate": 7.065555523844859e-06, - "loss": 0.1393, - "step": 11290 - }, - { - "epoch": 0.31, - "learning_rate": 7.064128542481235e-06, - "loss": 0.284, - "step": 11295 - }, - { - "epoch": 0.31, - "learning_rate": 7.062701561117612e-06, - "loss": 0.5269, - "step": 11300 - }, - { - "epoch": 0.31, - "learning_rate": 7.06127457975399e-06, - "loss": 0.1672, - "step": 11305 - }, - { - "epoch": 0.31, - "learning_rate": 7.059847598390366e-06, - "loss": 0.1597, - "step": 11310 - }, - { - "epoch": 0.31, - "learning_rate": 7.058420617026742e-06, - "loss": 0.2241, - "step": 11315 - }, - { - "epoch": 0.31, - "learning_rate": 7.056993635663119e-06, - "loss": 0.1999, - "step": 11320 - }, - { - "epoch": 0.31, - "learning_rate": 7.055566654299495e-06, - "loss": 0.1571, - "step": 11325 - }, - { - "epoch": 0.31, - "learning_rate": 7.054139672935872e-06, - "loss": 0.2032, - "step": 11330 - }, - { - "epoch": 0.31, - "learning_rate": 7.0527126915722485e-06, - "loss": 0.1385, - "step": 11335 - }, - { - "epoch": 0.31, - "learning_rate": 7.051285710208625e-06, - "loss": 0.2935, - "step": 11340 - }, - { - "epoch": 0.31, - "learning_rate": 7.049858728845001e-06, - "loss": 0.3487, - "step": 11345 - }, - { - "epoch": 0.31, - "learning_rate": 7.0484317474813775e-06, - "loss": 0.6493, - "step": 11350 - }, - { - "epoch": 0.32, - "learning_rate": 7.0470047661177555e-06, - "loss": 0.1724, - "step": 11355 - }, - { - "epoch": 0.32, - "learning_rate": 7.045577784754132e-06, - "loss": 0.2007, - "step": 11360 - }, - { - "epoch": 0.32, - "learning_rate": 7.044150803390508e-06, - "loss": 0.1461, - "step": 11365 - }, - { - "epoch": 0.32, - "learning_rate": 7.0427238220268846e-06, - "loss": 0.2509, - "step": 11370 - }, - { - "epoch": 0.32, - "learning_rate": 7.041296840663262e-06, - "loss": 0.1743, - "step": 11375 - }, - { - "epoch": 0.32, - "learning_rate": 7.039869859299638e-06, - "loss": 0.1169, - "step": 11380 - }, - { - "epoch": 0.32, - "learning_rate": 7.038442877936014e-06, - "loss": 0.1445, - "step": 11385 - }, - { - "epoch": 0.32, - "learning_rate": 7.037015896572391e-06, - "loss": 0.232, - "step": 11390 - }, - { - "epoch": 0.32, - "learning_rate": 7.035588915208768e-06, - "loss": 0.3013, - "step": 11395 - }, - { - "epoch": 0.32, - "learning_rate": 7.034161933845145e-06, - "loss": 0.5159, - "step": 11400 - }, - { - "epoch": 0.32, - "learning_rate": 7.0327349524815215e-06, - "loss": 0.1103, - "step": 11405 - }, - { - "epoch": 0.32, - "learning_rate": 7.031307971117898e-06, - "loss": 0.18, - "step": 11410 - }, - { - "epoch": 0.32, - "learning_rate": 7.029880989754274e-06, - "loss": 0.1824, - "step": 11415 - }, - { - "epoch": 0.32, - "learning_rate": 7.0284540083906505e-06, - "loss": 0.1726, - "step": 11420 - }, - { - "epoch": 0.32, - "learning_rate": 7.027027027027028e-06, - "loss": 0.1194, - "step": 11425 - }, - { - "epoch": 0.32, - "learning_rate": 7.025600045663404e-06, - "loss": 0.1098, - "step": 11430 - }, - { - "epoch": 0.32, - "learning_rate": 7.02417306429978e-06, - "loss": 0.2506, - "step": 11435 - }, - { - "epoch": 0.32, - "learning_rate": 7.0227460829361575e-06, - "loss": 0.1701, - "step": 11440 - }, - { - "epoch": 0.32, - "learning_rate": 7.021319101572534e-06, - "loss": 0.2646, - "step": 11445 - }, - { - "epoch": 0.32, - "learning_rate": 7.019892120208911e-06, - "loss": 0.4503, - "step": 11450 - }, - { - "epoch": 0.32, - "learning_rate": 7.018465138845287e-06, - "loss": 0.1358, - "step": 11455 - }, - { - "epoch": 0.32, - "learning_rate": 7.017038157481664e-06, - "loss": 0.1648, - "step": 11460 - }, - { - "epoch": 0.32, - "learning_rate": 7.01561117611804e-06, - "loss": 0.1177, - "step": 11465 - }, - { - "epoch": 0.32, - "learning_rate": 7.014184194754417e-06, - "loss": 0.2052, - "step": 11470 - }, - { - "epoch": 0.32, - "learning_rate": 7.012757213390794e-06, - "loss": 0.047, - "step": 11475 - }, - { - "epoch": 0.32, - "learning_rate": 7.01133023202717e-06, - "loss": 0.1613, - "step": 11480 - }, - { - "epoch": 0.32, - "learning_rate": 7.009903250663547e-06, - "loss": 0.1665, - "step": 11485 - }, - { - "epoch": 0.32, - "learning_rate": 7.0084762692999235e-06, - "loss": 0.1467, - "step": 11490 - }, - { - "epoch": 0.32, - "learning_rate": 7.007049287936301e-06, - "loss": 0.317, - "step": 11495 - }, - { - "epoch": 0.32, - "learning_rate": 7.005622306572677e-06, - "loss": 0.5236, - "step": 11500 - }, - { - "epoch": 0.32, - "learning_rate": 7.004195325209053e-06, - "loss": 0.1651, - "step": 11505 - }, - { - "epoch": 0.32, - "learning_rate": 7.00276834384543e-06, - "loss": 0.1625, - "step": 11510 - }, - { - "epoch": 0.32, - "learning_rate": 7.001341362481806e-06, - "loss": 0.2025, - "step": 11515 - }, - { - "epoch": 0.32, - "learning_rate": 6.999914381118183e-06, - "loss": 0.1807, - "step": 11520 - }, - { - "epoch": 0.32, - "learning_rate": 6.9984873997545595e-06, - "loss": 0.2067, - "step": 11525 - }, - { - "epoch": 0.32, - "learning_rate": 6.997060418390937e-06, - "loss": 0.0538, - "step": 11530 - }, - { - "epoch": 0.32, - "learning_rate": 6.995633437027313e-06, - "loss": 0.1535, - "step": 11535 - }, - { - "epoch": 0.32, - "learning_rate": 6.994206455663689e-06, - "loss": 0.2358, - "step": 11540 - }, - { - "epoch": 0.32, - "learning_rate": 6.9927794743000666e-06, - "loss": 0.1317, - "step": 11545 - }, - { - "epoch": 0.32, - "learning_rate": 6.991352492936443e-06, - "loss": 0.3778, - "step": 11550 - }, - { - "epoch": 0.32, - "learning_rate": 6.989925511572819e-06, - "loss": 0.2059, - "step": 11555 - }, - { - "epoch": 0.32, - "learning_rate": 6.988498530209196e-06, - "loss": 0.1814, - "step": 11560 - }, - { - "epoch": 0.32, - "learning_rate": 6.987071548845573e-06, - "loss": 0.1676, - "step": 11565 - }, - { - "epoch": 0.32, - "learning_rate": 6.985644567481949e-06, - "loss": 0.1986, - "step": 11570 - }, - { - "epoch": 0.32, - "learning_rate": 6.984217586118326e-06, - "loss": 0.1007, - "step": 11575 - }, - { - "epoch": 0.32, - "learning_rate": 6.982790604754703e-06, - "loss": 0.1667, - "step": 11580 - }, - { - "epoch": 0.32, - "learning_rate": 6.981363623391079e-06, - "loss": 0.1611, - "step": 11585 - }, - { - "epoch": 0.32, - "learning_rate": 6.979936642027456e-06, - "loss": 0.2181, - "step": 11590 - }, - { - "epoch": 0.32, - "learning_rate": 6.9785096606638325e-06, - "loss": 0.2542, - "step": 11595 - }, - { - "epoch": 0.32, - "learning_rate": 6.977082679300209e-06, - "loss": 0.4274, - "step": 11600 - }, - { - "epoch": 0.32, - "learning_rate": 6.975655697936585e-06, - "loss": 0.1906, - "step": 11605 - }, - { - "epoch": 0.32, - "learning_rate": 6.9742287165729615e-06, - "loss": 0.1839, - "step": 11610 - }, - { - "epoch": 0.32, - "learning_rate": 6.972801735209339e-06, - "loss": 0.1624, - "step": 11615 - }, - { - "epoch": 0.32, - "learning_rate": 6.971374753845716e-06, - "loss": 0.2312, - "step": 11620 - }, - { - "epoch": 0.32, - "learning_rate": 6.969947772482092e-06, - "loss": 0.1718, - "step": 11625 - }, - { - "epoch": 0.32, - "learning_rate": 6.9685207911184686e-06, - "loss": 0.0537, - "step": 11630 - }, - { - "epoch": 0.32, - "learning_rate": 6.967093809754845e-06, - "loss": 0.1676, - "step": 11635 - }, - { - "epoch": 0.32, - "learning_rate": 6.965666828391222e-06, - "loss": 0.1831, - "step": 11640 - }, - { - "epoch": 0.32, - "learning_rate": 6.9642398470275984e-06, - "loss": 0.3179, - "step": 11645 - }, - { - "epoch": 0.32, - "learning_rate": 6.962812865663975e-06, - "loss": 0.3606, - "step": 11650 - }, - { - "epoch": 0.32, - "learning_rate": 6.961385884300351e-06, - "loss": 0.1715, - "step": 11655 - }, - { - "epoch": 0.32, - "learning_rate": 6.959958902936728e-06, - "loss": 0.1673, - "step": 11660 - }, - { - "epoch": 0.32, - "learning_rate": 6.9585319215731055e-06, - "loss": 0.154, - "step": 11665 - }, - { - "epoch": 0.32, - "learning_rate": 6.957104940209482e-06, - "loss": 0.187, - "step": 11670 - }, - { - "epoch": 0.32, - "learning_rate": 6.955677958845858e-06, - "loss": 0.1616, - "step": 11675 - }, - { - "epoch": 0.32, - "learning_rate": 6.9542509774822345e-06, - "loss": 0.15, - "step": 11680 - }, - { - "epoch": 0.32, - "learning_rate": 6.952823996118612e-06, - "loss": 0.2719, - "step": 11685 - }, - { - "epoch": 0.32, - "learning_rate": 6.951397014754988e-06, - "loss": 0.1173, - "step": 11690 - }, - { - "epoch": 0.32, - "learning_rate": 6.949970033391364e-06, - "loss": 0.2932, - "step": 11695 - }, - { - "epoch": 0.32, - "learning_rate": 6.948543052027741e-06, - "loss": 0.6715, - "step": 11700 - }, - { - "epoch": 0.32, - "learning_rate": 6.947116070664117e-06, - "loss": 0.148, - "step": 11705 - }, - { - "epoch": 0.32, - "learning_rate": 6.945689089300495e-06, - "loss": 0.1502, - "step": 11710 - }, - { - "epoch": 0.33, - "learning_rate": 6.944262107936871e-06, - "loss": 0.2129, - "step": 11715 - }, - { - "epoch": 0.33, - "learning_rate": 6.942835126573248e-06, - "loss": 0.1811, - "step": 11720 - }, - { - "epoch": 0.33, - "learning_rate": 6.941408145209624e-06, - "loss": 0.2013, - "step": 11725 - }, - { - "epoch": 0.33, - "learning_rate": 6.939981163846001e-06, - "loss": 0.0523, - "step": 11730 - }, - { - "epoch": 0.33, - "learning_rate": 6.938554182482378e-06, - "loss": 0.1874, - "step": 11735 - }, - { - "epoch": 0.33, - "learning_rate": 6.937127201118754e-06, - "loss": 0.0713, - "step": 11740 - }, - { - "epoch": 0.33, - "learning_rate": 6.93570021975513e-06, - "loss": 0.2806, - "step": 11745 - }, - { - "epoch": 0.33, - "learning_rate": 6.934273238391507e-06, - "loss": 0.2965, - "step": 11750 - }, - { - "epoch": 0.33, - "learning_rate": 6.932846257027885e-06, - "loss": 0.1685, - "step": 11755 - }, - { - "epoch": 0.33, - "learning_rate": 6.931419275664261e-06, - "loss": 0.1686, - "step": 11760 - }, - { - "epoch": 0.33, - "learning_rate": 6.929992294300637e-06, - "loss": 0.1532, - "step": 11765 - }, - { - "epoch": 0.33, - "learning_rate": 6.928565312937014e-06, - "loss": 0.1886, - "step": 11770 - }, - { - "epoch": 0.33, - "learning_rate": 6.92713833157339e-06, - "loss": 0.1128, - "step": 11775 - }, - { - "epoch": 0.33, - "learning_rate": 6.925711350209767e-06, - "loss": 0.0301, - "step": 11780 - }, - { - "epoch": 0.33, - "learning_rate": 6.9242843688461435e-06, - "loss": 0.1901, - "step": 11785 - }, - { - "epoch": 0.33, - "learning_rate": 6.92285738748252e-06, - "loss": 0.2202, - "step": 11790 - }, - { - "epoch": 0.33, - "learning_rate": 6.921430406118896e-06, - "loss": 0.3021, - "step": 11795 - }, - { - "epoch": 0.33, - "learning_rate": 6.9200034247552726e-06, - "loss": 0.5823, - "step": 11800 - }, - { - "epoch": 0.33, - "learning_rate": 6.918576443391651e-06, - "loss": 0.4491, - "step": 11805 - }, - { - "epoch": 0.33, - "learning_rate": 6.917149462028027e-06, - "loss": 0.1753, - "step": 11810 - }, - { - "epoch": 0.33, - "learning_rate": 6.915722480664403e-06, - "loss": 0.1456, - "step": 11815 - }, - { - "epoch": 0.33, - "learning_rate": 6.91429549930078e-06, - "loss": 0.1782, - "step": 11820 - }, - { - "epoch": 0.33, - "learning_rate": 6.912868517937157e-06, - "loss": 0.0875, - "step": 11825 - }, - { - "epoch": 0.33, - "learning_rate": 6.911441536573533e-06, - "loss": 0.0452, - "step": 11830 - }, - { - "epoch": 0.33, - "learning_rate": 6.9100145552099095e-06, - "loss": 0.2525, - "step": 11835 - }, - { - "epoch": 0.33, - "learning_rate": 6.908587573846286e-06, - "loss": 0.2504, - "step": 11840 - }, - { - "epoch": 0.33, - "learning_rate": 6.907160592482662e-06, - "loss": 0.2647, - "step": 11845 - }, - { - "epoch": 0.33, - "learning_rate": 6.90573361111904e-06, - "loss": 0.4513, - "step": 11850 - }, - { - "epoch": 0.33, - "learning_rate": 6.9043066297554165e-06, - "loss": 0.1579, - "step": 11855 - }, - { - "epoch": 0.33, - "learning_rate": 6.902879648391793e-06, - "loss": 0.2213, - "step": 11860 - }, - { - "epoch": 0.33, - "learning_rate": 6.901452667028169e-06, - "loss": 0.2816, - "step": 11865 - }, - { - "epoch": 0.33, - "learning_rate": 6.9000256856645455e-06, - "loss": 0.1949, - "step": 11870 - }, - { - "epoch": 0.33, - "learning_rate": 6.898598704300923e-06, - "loss": 0.1781, - "step": 11875 - }, - { - "epoch": 0.33, - "learning_rate": 6.897171722937299e-06, - "loss": 0.1304, - "step": 11880 - }, - { - "epoch": 0.33, - "learning_rate": 6.895744741573675e-06, - "loss": 0.1648, - "step": 11885 - }, - { - "epoch": 0.33, - "learning_rate": 6.894317760210052e-06, - "loss": 0.1741, - "step": 11890 - }, - { - "epoch": 0.33, - "learning_rate": 6.892890778846428e-06, - "loss": 0.1889, - "step": 11895 - }, - { - "epoch": 0.33, - "learning_rate": 6.891463797482806e-06, - "loss": 0.5496, - "step": 11900 - }, - { - "epoch": 0.33, - "learning_rate": 6.8900368161191824e-06, - "loss": 0.2701, - "step": 11905 - }, - { - "epoch": 0.33, - "learning_rate": 6.888609834755559e-06, - "loss": 0.2145, - "step": 11910 - }, - { - "epoch": 0.33, - "learning_rate": 6.887182853391935e-06, - "loss": 0.2208, - "step": 11915 - }, - { - "epoch": 0.33, - "learning_rate": 6.885755872028312e-06, - "loss": 0.1022, - "step": 11920 - }, - { - "epoch": 0.33, - "learning_rate": 6.884328890664689e-06, - "loss": 0.1382, - "step": 11925 - }, - { - "epoch": 0.33, - "learning_rate": 6.882901909301065e-06, - "loss": 0.1889, - "step": 11930 - }, - { - "epoch": 0.33, - "learning_rate": 6.881474927937441e-06, - "loss": 0.1475, - "step": 11935 - }, - { - "epoch": 0.33, - "learning_rate": 6.880047946573818e-06, - "loss": 0.2216, - "step": 11940 - }, - { - "epoch": 0.33, - "learning_rate": 6.878620965210196e-06, - "loss": 0.233, - "step": 11945 - }, - { - "epoch": 0.33, - "learning_rate": 6.877193983846572e-06, - "loss": 0.5957, - "step": 11950 - }, - { - "epoch": 0.33, - "learning_rate": 6.875767002482948e-06, - "loss": 0.1498, - "step": 11955 - }, - { - "epoch": 0.33, - "learning_rate": 6.874340021119325e-06, - "loss": 0.1514, - "step": 11960 - }, - { - "epoch": 0.33, - "learning_rate": 6.872913039755701e-06, - "loss": 0.1007, - "step": 11965 - }, - { - "epoch": 0.33, - "learning_rate": 6.871486058392078e-06, - "loss": 0.1524, - "step": 11970 - }, - { - "epoch": 0.33, - "learning_rate": 6.8700590770284546e-06, - "loss": 0.2239, - "step": 11975 - }, - { - "epoch": 0.33, - "learning_rate": 6.868632095664831e-06, - "loss": 0.097, - "step": 11980 - }, - { - "epoch": 0.33, - "learning_rate": 6.867205114301207e-06, - "loss": 0.1536, - "step": 11985 - }, - { - "epoch": 0.33, - "learning_rate": 6.865778132937584e-06, - "loss": 0.2596, - "step": 11990 - }, - { - "epoch": 0.33, - "learning_rate": 6.864351151573962e-06, - "loss": 0.2747, - "step": 11995 - }, - { - "epoch": 0.33, - "learning_rate": 6.862924170210338e-06, - "loss": 0.3562, - "step": 12000 - }, - { - "epoch": 0.33, - "eval_loss": 0.07923547923564911, - "eval_runtime": 2106.0892, - "eval_samples_per_second": 7.606, - "eval_steps_per_second": 1.902, - "eval_wer": 0.22589253516047603, - "step": 12000 - }, - { - "epoch": 0.33, - "learning_rate": 6.861497188846714e-06, - "loss": 0.1722, - "step": 12005 - }, - { - "epoch": 0.33, - "learning_rate": 6.860070207483091e-06, - "loss": 0.169, - "step": 12010 - }, - { - "epoch": 0.33, - "learning_rate": 6.858643226119468e-06, - "loss": 0.1367, - "step": 12015 - }, - { - "epoch": 0.33, - "learning_rate": 6.857216244755844e-06, - "loss": 0.1788, - "step": 12020 - }, - { - "epoch": 0.33, - "learning_rate": 6.8557892633922205e-06, - "loss": 0.1067, - "step": 12025 - }, - { - "epoch": 0.33, - "learning_rate": 6.854362282028597e-06, - "loss": 0.086, - "step": 12030 - }, - { - "epoch": 0.33, - "learning_rate": 6.852935300664973e-06, - "loss": 0.154, - "step": 12035 - }, - { - "epoch": 0.33, - "learning_rate": 6.851508319301351e-06, - "loss": 0.2277, - "step": 12040 - }, - { - "epoch": 0.33, - "learning_rate": 6.8500813379377275e-06, - "loss": 0.2513, - "step": 12045 - }, - { - "epoch": 0.33, - "learning_rate": 6.848654356574104e-06, - "loss": 0.2739, - "step": 12050 - }, - { - "epoch": 0.33, - "learning_rate": 6.84722737521048e-06, - "loss": 0.1541, - "step": 12055 - }, - { - "epoch": 0.33, - "learning_rate": 6.8458003938468566e-06, - "loss": 0.1395, - "step": 12060 - }, - { - "epoch": 0.33, - "learning_rate": 6.844373412483234e-06, - "loss": 0.1674, - "step": 12065 - }, - { - "epoch": 0.33, - "learning_rate": 6.84294643111961e-06, - "loss": 0.2734, - "step": 12070 - }, - { - "epoch": 0.34, - "learning_rate": 6.841519449755986e-06, - "loss": 0.0343, - "step": 12075 - }, - { - "epoch": 0.34, - "learning_rate": 6.840092468392363e-06, - "loss": 0.0648, - "step": 12080 - }, - { - "epoch": 0.34, - "learning_rate": 6.838665487028739e-06, - "loss": 0.0999, - "step": 12085 - }, - { - "epoch": 0.34, - "learning_rate": 6.837238505665117e-06, - "loss": 0.1609, - "step": 12090 - }, - { - "epoch": 0.34, - "learning_rate": 6.8358115243014935e-06, - "loss": 0.2068, - "step": 12095 - }, - { - "epoch": 0.34, - "learning_rate": 6.83438454293787e-06, - "loss": 0.5631, - "step": 12100 - }, - { - "epoch": 0.34, - "learning_rate": 6.832957561574246e-06, - "loss": 0.2012, - "step": 12105 - }, - { - "epoch": 0.34, - "learning_rate": 6.831530580210623e-06, - "loss": 0.1435, - "step": 12110 - }, - { - "epoch": 0.34, - "learning_rate": 6.830103598847e-06, - "loss": 0.1954, - "step": 12115 - }, - { - "epoch": 0.34, - "learning_rate": 6.828676617483376e-06, - "loss": 0.1535, - "step": 12120 - }, - { - "epoch": 0.34, - "learning_rate": 6.827249636119752e-06, - "loss": 0.1071, - "step": 12125 - }, - { - "epoch": 0.34, - "learning_rate": 6.825822654756129e-06, - "loss": 0.0774, - "step": 12130 - }, - { - "epoch": 0.34, - "learning_rate": 6.824395673392507e-06, - "loss": 0.1752, - "step": 12135 - }, - { - "epoch": 0.34, - "learning_rate": 6.822968692028883e-06, - "loss": 0.111, - "step": 12140 - }, - { - "epoch": 0.34, - "learning_rate": 6.821541710665259e-06, - "loss": 0.2101, - "step": 12145 - }, - { - "epoch": 0.34, - "learning_rate": 6.820114729301636e-06, - "loss": 0.6161, - "step": 12150 - }, - { - "epoch": 0.34, - "learning_rate": 6.818687747938012e-06, - "loss": 0.1055, - "step": 12155 - }, - { - "epoch": 0.34, - "learning_rate": 6.817260766574389e-06, - "loss": 0.1056, - "step": 12160 - }, - { - "epoch": 0.34, - "learning_rate": 6.815833785210766e-06, - "loss": 0.1723, - "step": 12165 - }, - { - "epoch": 0.34, - "learning_rate": 6.814406803847142e-06, - "loss": 0.1849, - "step": 12170 - }, - { - "epoch": 0.34, - "learning_rate": 6.812979822483518e-06, - "loss": 0.1547, - "step": 12175 - }, - { - "epoch": 0.34, - "learning_rate": 6.811552841119895e-06, - "loss": 0.0779, - "step": 12180 - }, - { - "epoch": 0.34, - "learning_rate": 6.810125859756273e-06, - "loss": 0.0533, - "step": 12185 - }, - { - "epoch": 0.34, - "learning_rate": 6.808698878392649e-06, - "loss": 0.1573, - "step": 12190 - }, - { - "epoch": 0.34, - "learning_rate": 6.807271897029025e-06, - "loss": 0.2096, - "step": 12195 - }, - { - "epoch": 0.34, - "learning_rate": 6.805844915665402e-06, - "loss": 0.4607, - "step": 12200 - }, - { - "epoch": 0.34, - "learning_rate": 6.804417934301779e-06, - "loss": 0.1499, - "step": 12205 - }, - { - "epoch": 0.34, - "learning_rate": 6.802990952938155e-06, - "loss": 0.196, - "step": 12210 - }, - { - "epoch": 0.34, - "learning_rate": 6.8015639715745315e-06, - "loss": 0.2675, - "step": 12215 - }, - { - "epoch": 0.34, - "learning_rate": 6.800136990210908e-06, - "loss": 0.1761, - "step": 12220 - }, - { - "epoch": 0.34, - "learning_rate": 6.798710008847284e-06, - "loss": 0.1389, - "step": 12225 - }, - { - "epoch": 0.34, - "learning_rate": 6.797283027483662e-06, - "loss": 0.0576, - "step": 12230 - }, - { - "epoch": 0.34, - "learning_rate": 6.7958560461200386e-06, - "loss": 0.2832, - "step": 12235 - }, - { - "epoch": 0.34, - "learning_rate": 6.794429064756415e-06, - "loss": 0.1552, - "step": 12240 - }, - { - "epoch": 0.34, - "learning_rate": 6.793002083392791e-06, - "loss": 0.2106, - "step": 12245 - }, - { - "epoch": 0.34, - "learning_rate": 6.791575102029168e-06, - "loss": 0.3959, - "step": 12250 - }, - { - "epoch": 0.34, - "learning_rate": 6.790148120665545e-06, - "loss": 0.1223, - "step": 12255 - }, - { - "epoch": 0.34, - "learning_rate": 6.788721139301921e-06, - "loss": 0.1802, - "step": 12260 - }, - { - "epoch": 0.34, - "learning_rate": 6.7872941579382975e-06, - "loss": 0.1227, - "step": 12265 - }, - { - "epoch": 0.34, - "learning_rate": 6.785867176574674e-06, - "loss": 0.1722, - "step": 12270 - }, - { - "epoch": 0.34, - "learning_rate": 6.784440195211051e-06, - "loss": 0.1879, - "step": 12275 - }, - { - "epoch": 0.34, - "learning_rate": 6.783013213847428e-06, - "loss": 0.1466, - "step": 12280 - }, - { - "epoch": 0.34, - "learning_rate": 6.7815862324838045e-06, - "loss": 0.0777, - "step": 12285 - }, - { - "epoch": 0.34, - "learning_rate": 6.780159251120181e-06, - "loss": 0.0767, - "step": 12290 - }, - { - "epoch": 0.34, - "learning_rate": 6.778732269756557e-06, - "loss": 0.209, - "step": 12295 - }, - { - "epoch": 0.34, - "learning_rate": 6.777305288392934e-06, - "loss": 0.4856, - "step": 12300 - }, - { - "epoch": 0.34, - "learning_rate": 6.775878307029311e-06, - "loss": 0.2182, - "step": 12305 - }, - { - "epoch": 0.34, - "learning_rate": 6.774451325665687e-06, - "loss": 0.193, - "step": 12310 - }, - { - "epoch": 0.34, - "learning_rate": 6.773024344302063e-06, - "loss": 0.1729, - "step": 12315 - }, - { - "epoch": 0.34, - "learning_rate": 6.7715973629384406e-06, - "loss": 0.1722, - "step": 12320 - }, - { - "epoch": 0.34, - "learning_rate": 6.770170381574818e-06, - "loss": 0.1712, - "step": 12325 - }, - { - "epoch": 0.34, - "learning_rate": 6.768743400211194e-06, - "loss": 0.1361, - "step": 12330 - }, - { - "epoch": 0.34, - "learning_rate": 6.7673164188475704e-06, - "loss": 0.0951, - "step": 12335 - }, - { - "epoch": 0.34, - "learning_rate": 6.765889437483947e-06, - "loss": 0.1864, - "step": 12340 - }, - { - "epoch": 0.34, - "learning_rate": 6.764462456120323e-06, - "loss": 0.3715, - "step": 12345 - }, - { - "epoch": 0.34, - "learning_rate": 6.7630354747567e-06, - "loss": 0.4201, - "step": 12350 - }, - { - "epoch": 0.34, - "learning_rate": 6.761608493393077e-06, - "loss": 0.1058, - "step": 12355 - }, - { - "epoch": 0.34, - "learning_rate": 6.760181512029453e-06, - "loss": 0.1139, - "step": 12360 - }, - { - "epoch": 0.34, - "learning_rate": 6.75875453066583e-06, - "loss": 0.1212, - "step": 12365 - }, - { - "epoch": 0.34, - "learning_rate": 6.7573275493022065e-06, - "loss": 0.1982, - "step": 12370 - }, - { - "epoch": 0.34, - "learning_rate": 6.755900567938584e-06, - "loss": 0.2394, - "step": 12375 - }, - { - "epoch": 0.34, - "learning_rate": 6.75447358657496e-06, - "loss": 0.3017, - "step": 12380 - }, - { - "epoch": 0.34, - "learning_rate": 6.753046605211336e-06, - "loss": 0.1209, - "step": 12385 - }, - { - "epoch": 0.34, - "learning_rate": 6.751619623847713e-06, - "loss": 0.284, - "step": 12390 - }, - { - "epoch": 0.34, - "learning_rate": 6.75019264248409e-06, - "loss": 0.1577, - "step": 12395 - }, - { - "epoch": 0.34, - "learning_rate": 6.748765661120466e-06, - "loss": 0.3294, - "step": 12400 - }, - { - "epoch": 0.34, - "learning_rate": 6.7473386797568426e-06, - "loss": 0.1664, - "step": 12405 - }, - { - "epoch": 0.34, - "learning_rate": 6.74591169839322e-06, - "loss": 0.1291, - "step": 12410 - }, - { - "epoch": 0.34, - "learning_rate": 6.744484717029596e-06, - "loss": 0.1548, - "step": 12415 - }, - { - "epoch": 0.34, - "learning_rate": 6.743057735665973e-06, - "loss": 0.1263, - "step": 12420 - }, - { - "epoch": 0.34, - "learning_rate": 6.74163075430235e-06, - "loss": 0.1347, - "step": 12425 - }, - { - "epoch": 0.34, - "learning_rate": 6.740203772938726e-06, - "loss": 0.0752, - "step": 12430 - }, - { - "epoch": 0.35, - "learning_rate": 6.738776791575102e-06, - "loss": 0.1343, - "step": 12435 - }, - { - "epoch": 0.35, - "learning_rate": 6.737349810211479e-06, - "loss": 0.3127, - "step": 12440 - }, - { - "epoch": 0.35, - "learning_rate": 6.735922828847856e-06, - "loss": 0.2375, - "step": 12445 - }, - { - "epoch": 0.35, - "learning_rate": 6.734495847484233e-06, - "loss": 0.4197, - "step": 12450 - }, - { - "epoch": 0.35, - "learning_rate": 6.733068866120609e-06, - "loss": 0.1688, - "step": 12455 - }, - { - "epoch": 0.35, - "learning_rate": 6.731641884756986e-06, - "loss": 0.1575, - "step": 12460 - }, - { - "epoch": 0.35, - "learning_rate": 6.730214903393362e-06, - "loss": 0.1481, - "step": 12465 - }, - { - "epoch": 0.35, - "learning_rate": 6.728787922029739e-06, - "loss": 0.1359, - "step": 12470 - }, - { - "epoch": 0.35, - "learning_rate": 6.7273609406661155e-06, - "loss": 0.1666, - "step": 12475 - }, - { - "epoch": 0.35, - "learning_rate": 6.725933959302492e-06, - "loss": 0.1549, - "step": 12480 - }, - { - "epoch": 0.35, - "learning_rate": 6.724506977938868e-06, - "loss": 0.2111, - "step": 12485 - }, - { - "epoch": 0.35, - "learning_rate": 6.723079996575245e-06, - "loss": 0.0749, - "step": 12490 - }, - { - "epoch": 0.35, - "learning_rate": 6.721653015211623e-06, - "loss": 0.3546, - "step": 12495 - }, - { - "epoch": 0.35, - "learning_rate": 6.720226033847999e-06, - "loss": 0.533, - "step": 12500 - }, - { - "epoch": 0.35, - "learning_rate": 6.718799052484375e-06, - "loss": 0.2164, - "step": 12505 - }, - { - "epoch": 0.35, - "learning_rate": 6.717372071120752e-06, - "loss": 0.178, - "step": 12510 - }, - { - "epoch": 0.35, - "learning_rate": 6.715945089757129e-06, - "loss": 0.1629, - "step": 12515 - }, - { - "epoch": 0.35, - "learning_rate": 6.714518108393505e-06, - "loss": 0.156, - "step": 12520 - }, - { - "epoch": 0.35, - "learning_rate": 6.7130911270298815e-06, - "loss": 0.1892, - "step": 12525 - }, - { - "epoch": 0.35, - "learning_rate": 6.711664145666258e-06, - "loss": 0.1118, - "step": 12530 - }, - { - "epoch": 0.35, - "learning_rate": 6.710237164302634e-06, - "loss": 0.1347, - "step": 12535 - }, - { - "epoch": 0.35, - "learning_rate": 6.708810182939012e-06, - "loss": 0.2332, - "step": 12540 - }, - { - "epoch": 0.35, - "learning_rate": 6.7073832015753885e-06, - "loss": 0.3007, - "step": 12545 - }, - { - "epoch": 0.35, - "learning_rate": 6.705956220211765e-06, - "loss": 0.3231, - "step": 12550 - }, - { - "epoch": 0.35, - "learning_rate": 6.704529238848141e-06, - "loss": 0.1384, - "step": 12555 - }, - { - "epoch": 0.35, - "learning_rate": 6.7031022574845175e-06, - "loss": 0.1172, - "step": 12560 - }, - { - "epoch": 0.35, - "learning_rate": 6.701675276120895e-06, - "loss": 0.2045, - "step": 12565 - }, - { - "epoch": 0.35, - "learning_rate": 6.700248294757271e-06, - "loss": 0.188, - "step": 12570 - }, - { - "epoch": 0.35, - "learning_rate": 6.698821313393647e-06, - "loss": 0.1805, - "step": 12575 - }, - { - "epoch": 0.35, - "learning_rate": 6.697394332030024e-06, - "loss": 0.1306, - "step": 12580 - }, - { - "epoch": 0.35, - "learning_rate": 6.695967350666402e-06, - "loss": 0.2015, - "step": 12585 - }, - { - "epoch": 0.35, - "learning_rate": 6.694540369302778e-06, - "loss": 0.318, - "step": 12590 - }, - { - "epoch": 0.35, - "learning_rate": 6.6931133879391544e-06, - "loss": 0.22, - "step": 12595 - }, - { - "epoch": 0.35, - "learning_rate": 6.691686406575531e-06, - "loss": 0.4261, - "step": 12600 - }, - { - "epoch": 0.35, - "learning_rate": 6.690259425211907e-06, - "loss": 0.1451, - "step": 12605 - }, - { - "epoch": 0.35, - "learning_rate": 6.688832443848284e-06, - "loss": 0.2177, - "step": 12610 - }, - { - "epoch": 0.35, - "learning_rate": 6.687405462484661e-06, - "loss": 0.1622, - "step": 12615 - }, - { - "epoch": 0.35, - "learning_rate": 6.685978481121037e-06, - "loss": 0.1724, - "step": 12620 - }, - { - "epoch": 0.35, - "learning_rate": 6.684551499757413e-06, - "loss": 0.0654, - "step": 12625 - }, - { - "epoch": 0.35, - "learning_rate": 6.68312451839379e-06, - "loss": 0.056, - "step": 12630 - }, - { - "epoch": 0.35, - "learning_rate": 6.681697537030168e-06, - "loss": 0.1806, - "step": 12635 - }, - { - "epoch": 0.35, - "learning_rate": 6.680270555666544e-06, - "loss": 0.1486, - "step": 12640 - }, - { - "epoch": 0.35, - "learning_rate": 6.67884357430292e-06, - "loss": 0.4049, - "step": 12645 - }, - { - "epoch": 0.35, - "learning_rate": 6.677416592939297e-06, - "loss": 0.2504, - "step": 12650 - }, - { - "epoch": 0.35, - "learning_rate": 6.675989611575673e-06, - "loss": 0.2093, - "step": 12655 - }, - { - "epoch": 0.35, - "learning_rate": 6.67456263021205e-06, - "loss": 0.1685, - "step": 12660 - }, - { - "epoch": 0.35, - "learning_rate": 6.6731356488484266e-06, - "loss": 0.1728, - "step": 12665 - }, - { - "epoch": 0.35, - "learning_rate": 6.671708667484803e-06, - "loss": 0.1841, - "step": 12670 - }, - { - "epoch": 0.35, - "learning_rate": 6.670281686121179e-06, - "loss": 0.056, - "step": 12675 - }, - { - "epoch": 0.35, - "learning_rate": 6.668854704757557e-06, - "loss": 0.1487, - "step": 12680 - }, - { - "epoch": 0.35, - "learning_rate": 6.667427723393934e-06, - "loss": 0.1941, - "step": 12685 - }, - { - "epoch": 0.35, - "learning_rate": 6.66600074203031e-06, - "loss": 0.1175, - "step": 12690 - }, - { - "epoch": 0.35, - "learning_rate": 6.664573760666686e-06, - "loss": 0.3037, - "step": 12695 - }, - { - "epoch": 0.35, - "learning_rate": 6.663146779303063e-06, - "loss": 0.5031, - "step": 12700 - }, - { - "epoch": 0.35, - "learning_rate": 6.66171979793944e-06, - "loss": 0.1533, - "step": 12705 - }, - { - "epoch": 0.35, - "learning_rate": 6.660292816575816e-06, - "loss": 0.1927, - "step": 12710 - }, - { - "epoch": 0.35, - "learning_rate": 6.6588658352121925e-06, - "loss": 0.1464, - "step": 12715 - }, - { - "epoch": 0.35, - "learning_rate": 6.657438853848569e-06, - "loss": 0.1705, - "step": 12720 - }, - { - "epoch": 0.35, - "learning_rate": 6.656011872484945e-06, - "loss": 0.153, - "step": 12725 - }, - { - "epoch": 0.35, - "learning_rate": 6.654584891121323e-06, - "loss": 0.075, - "step": 12730 - }, - { - "epoch": 0.35, - "learning_rate": 6.6531579097576995e-06, - "loss": 0.1802, - "step": 12735 - }, - { - "epoch": 0.35, - "learning_rate": 6.651730928394076e-06, - "loss": 0.1223, - "step": 12740 - }, - { - "epoch": 0.35, - "learning_rate": 6.650303947030452e-06, - "loss": 0.1696, - "step": 12745 - }, - { - "epoch": 0.35, - "learning_rate": 6.6488769656668286e-06, - "loss": 0.2838, - "step": 12750 - }, - { - "epoch": 0.35, - "learning_rate": 6.647449984303206e-06, - "loss": 0.1788, - "step": 12755 - }, - { - "epoch": 0.35, - "learning_rate": 6.646023002939582e-06, - "loss": 0.1858, - "step": 12760 - }, - { - "epoch": 0.35, - "learning_rate": 6.644596021575958e-06, - "loss": 0.1803, - "step": 12765 - }, - { - "epoch": 0.35, - "learning_rate": 6.643169040212335e-06, - "loss": 0.2407, - "step": 12770 - }, - { - "epoch": 0.35, - "learning_rate": 6.641742058848713e-06, - "loss": 0.1448, - "step": 12775 - }, - { - "epoch": 0.35, - "learning_rate": 6.640315077485089e-06, - "loss": 0.0726, - "step": 12780 - }, - { - "epoch": 0.35, - "learning_rate": 6.6388880961214655e-06, - "loss": 0.149, - "step": 12785 - }, - { - "epoch": 0.35, - "learning_rate": 6.637461114757842e-06, - "loss": 0.1544, - "step": 12790 - }, - { - "epoch": 0.36, - "learning_rate": 6.636034133394218e-06, - "loss": 0.2843, - "step": 12795 - }, - { - "epoch": 0.36, - "learning_rate": 6.634607152030595e-06, - "loss": 0.4658, - "step": 12800 - }, - { - "epoch": 0.36, - "learning_rate": 6.633180170666972e-06, - "loss": 0.1841, - "step": 12805 - }, - { - "epoch": 0.36, - "learning_rate": 6.631753189303348e-06, - "loss": 0.1337, - "step": 12810 - }, - { - "epoch": 0.36, - "learning_rate": 6.630326207939724e-06, - "loss": 0.1977, - "step": 12815 - }, - { - "epoch": 0.36, - "learning_rate": 6.628899226576101e-06, - "loss": 0.1626, - "step": 12820 - }, - { - "epoch": 0.36, - "learning_rate": 6.627472245212479e-06, - "loss": 0.1412, - "step": 12825 - }, - { - "epoch": 0.36, - "learning_rate": 6.626045263848855e-06, - "loss": 0.0621, - "step": 12830 - }, - { - "epoch": 0.36, - "learning_rate": 6.624618282485231e-06, - "loss": 0.1898, - "step": 12835 - }, - { - "epoch": 0.36, - "learning_rate": 6.623191301121608e-06, - "loss": 0.2279, - "step": 12840 - }, - { - "epoch": 0.36, - "learning_rate": 6.621764319757984e-06, - "loss": 0.1943, - "step": 12845 - }, - { - "epoch": 0.36, - "learning_rate": 6.620337338394361e-06, - "loss": 0.3011, - "step": 12850 - }, - { - "epoch": 0.36, - "learning_rate": 6.618910357030738e-06, - "loss": 0.1656, - "step": 12855 - }, - { - "epoch": 0.36, - "learning_rate": 6.617483375667114e-06, - "loss": 0.1859, - "step": 12860 - }, - { - "epoch": 0.36, - "learning_rate": 6.61605639430349e-06, - "loss": 0.166, - "step": 12865 - }, - { - "epoch": 0.36, - "learning_rate": 6.614629412939868e-06, - "loss": 0.1987, - "step": 12870 - }, - { - "epoch": 0.36, - "learning_rate": 6.613202431576245e-06, - "loss": 0.1146, - "step": 12875 - }, - { - "epoch": 0.36, - "learning_rate": 6.611775450212621e-06, - "loss": 0.0917, - "step": 12880 - }, - { - "epoch": 0.36, - "learning_rate": 6.610348468848997e-06, - "loss": 0.1346, - "step": 12885 - }, - { - "epoch": 0.36, - "learning_rate": 6.608921487485374e-06, - "loss": 0.172, - "step": 12890 - }, - { - "epoch": 0.36, - "learning_rate": 6.607494506121751e-06, - "loss": 0.2051, - "step": 12895 - }, - { - "epoch": 0.36, - "learning_rate": 6.606067524758127e-06, - "loss": 0.3892, - "step": 12900 - }, - { - "epoch": 0.36, - "learning_rate": 6.6046405433945035e-06, - "loss": 0.1457, - "step": 12905 - }, - { - "epoch": 0.36, - "learning_rate": 6.60321356203088e-06, - "loss": 0.1606, - "step": 12910 - }, - { - "epoch": 0.36, - "learning_rate": 6.601786580667256e-06, - "loss": 0.1592, - "step": 12915 - }, - { - "epoch": 0.36, - "learning_rate": 6.600359599303634e-06, - "loss": 0.1946, - "step": 12920 - }, - { - "epoch": 0.36, - "learning_rate": 6.598932617940011e-06, - "loss": 0.1297, - "step": 12925 - }, - { - "epoch": 0.36, - "learning_rate": 6.597505636576387e-06, - "loss": 0.1505, - "step": 12930 - }, - { - "epoch": 0.36, - "learning_rate": 6.596078655212763e-06, - "loss": 0.1718, - "step": 12935 - }, - { - "epoch": 0.36, - "learning_rate": 6.5946516738491404e-06, - "loss": 0.4016, - "step": 12940 - }, - { - "epoch": 0.36, - "learning_rate": 6.593224692485517e-06, - "loss": 0.2401, - "step": 12945 - }, - { - "epoch": 0.36, - "learning_rate": 6.591797711121893e-06, - "loss": 0.3069, - "step": 12950 - }, - { - "epoch": 0.36, - "learning_rate": 6.5903707297582695e-06, - "loss": 0.228, - "step": 12955 - }, - { - "epoch": 0.36, - "learning_rate": 6.588943748394646e-06, - "loss": 0.1626, - "step": 12960 - }, - { - "epoch": 0.36, - "learning_rate": 6.587516767031024e-06, - "loss": 0.1761, - "step": 12965 - }, - { - "epoch": 0.36, - "learning_rate": 6.5860897856674e-06, - "loss": 0.1507, - "step": 12970 - }, - { - "epoch": 0.36, - "learning_rate": 6.5846628043037765e-06, - "loss": 0.1849, - "step": 12975 - }, - { - "epoch": 0.36, - "learning_rate": 6.583235822940153e-06, - "loss": 0.1138, - "step": 12980 - }, - { - "epoch": 0.36, - "learning_rate": 6.581808841576529e-06, - "loss": 0.2012, - "step": 12985 - }, - { - "epoch": 0.36, - "learning_rate": 6.580381860212906e-06, - "loss": 0.163, - "step": 12990 - }, - { - "epoch": 0.36, - "learning_rate": 6.578954878849283e-06, - "loss": 0.2199, - "step": 12995 - }, - { - "epoch": 0.36, - "learning_rate": 6.577527897485659e-06, - "loss": 0.525, - "step": 13000 - }, - { - "epoch": 0.36, - "learning_rate": 6.576100916122035e-06, - "loss": 0.1355, - "step": 13005 - }, - { - "epoch": 0.36, - "learning_rate": 6.574673934758412e-06, - "loss": 0.0978, - "step": 13010 - }, - { - "epoch": 0.36, - "learning_rate": 6.57324695339479e-06, - "loss": 0.1562, - "step": 13015 - }, - { - "epoch": 0.36, - "learning_rate": 6.571819972031166e-06, - "loss": 0.2119, - "step": 13020 - }, - { - "epoch": 0.36, - "learning_rate": 6.5703929906675424e-06, - "loss": 0.0624, - "step": 13025 - }, - { - "epoch": 0.36, - "learning_rate": 6.568966009303919e-06, - "loss": 0.0974, - "step": 13030 - }, - { - "epoch": 0.36, - "learning_rate": 6.567539027940296e-06, - "loss": 0.2115, - "step": 13035 - }, - { - "epoch": 0.36, - "learning_rate": 6.566112046576672e-06, - "loss": 0.1932, - "step": 13040 - }, - { - "epoch": 0.36, - "learning_rate": 6.564685065213049e-06, - "loss": 0.3689, - "step": 13045 - }, - { - "epoch": 0.36, - "learning_rate": 6.563258083849425e-06, - "loss": 0.4729, - "step": 13050 - }, - { - "epoch": 0.36, - "learning_rate": 6.561831102485801e-06, - "loss": 0.1639, - "step": 13055 - }, - { - "epoch": 0.36, - "learning_rate": 6.560404121122179e-06, - "loss": 0.1029, - "step": 13060 - }, - { - "epoch": 0.36, - "learning_rate": 6.558977139758556e-06, - "loss": 0.1764, - "step": 13065 - }, - { - "epoch": 0.36, - "learning_rate": 6.557550158394932e-06, - "loss": 0.2053, - "step": 13070 - }, - { - "epoch": 0.36, - "learning_rate": 6.556123177031308e-06, - "loss": 0.1633, - "step": 13075 - }, - { - "epoch": 0.36, - "learning_rate": 6.554696195667685e-06, - "loss": 0.2154, - "step": 13080 - }, - { - "epoch": 0.36, - "learning_rate": 6.553269214304062e-06, - "loss": 0.1189, - "step": 13085 - }, - { - "epoch": 0.36, - "learning_rate": 6.551842232940438e-06, - "loss": 0.1119, - "step": 13090 - }, - { - "epoch": 0.36, - "learning_rate": 6.5504152515768146e-06, - "loss": 0.298, - "step": 13095 - }, - { - "epoch": 0.36, - "learning_rate": 6.548988270213191e-06, - "loss": 0.3527, - "step": 13100 - }, - { - "epoch": 0.36, - "learning_rate": 6.547561288849567e-06, - "loss": 0.2411, - "step": 13105 - }, - { - "epoch": 0.36, - "learning_rate": 6.546134307485945e-06, - "loss": 0.1694, - "step": 13110 - }, - { - "epoch": 0.36, - "learning_rate": 6.544707326122322e-06, - "loss": 0.129, - "step": 13115 - }, - { - "epoch": 0.36, - "learning_rate": 6.543280344758698e-06, - "loss": 0.2187, - "step": 13120 - }, - { - "epoch": 0.36, - "learning_rate": 6.541853363395074e-06, - "loss": 0.1709, - "step": 13125 - }, - { - "epoch": 0.36, - "learning_rate": 6.5404263820314515e-06, - "loss": 0.1164, - "step": 13130 - }, - { - "epoch": 0.36, - "learning_rate": 6.538999400667828e-06, - "loss": 0.0528, - "step": 13135 - }, - { - "epoch": 0.36, - "learning_rate": 6.537572419304204e-06, - "loss": 0.1298, - "step": 13140 - }, - { - "epoch": 0.36, - "learning_rate": 6.5361454379405805e-06, - "loss": 0.2292, - "step": 13145 - }, - { - "epoch": 0.36, - "learning_rate": 6.534718456576957e-06, - "loss": 0.2503, - "step": 13150 - }, - { - "epoch": 0.37, - "learning_rate": 6.533291475213335e-06, - "loss": 0.1328, - "step": 13155 - }, - { - "epoch": 0.37, - "learning_rate": 6.531864493849711e-06, - "loss": 0.1546, - "step": 13160 - }, - { - "epoch": 0.37, - "learning_rate": 6.5304375124860875e-06, - "loss": 0.202, - "step": 13165 - }, - { - "epoch": 0.37, - "learning_rate": 6.529010531122464e-06, - "loss": 0.2743, - "step": 13170 - }, - { - "epoch": 0.37, - "learning_rate": 6.52758354975884e-06, - "loss": 0.0807, - "step": 13175 - }, - { - "epoch": 0.37, - "learning_rate": 6.526156568395217e-06, - "loss": 0.0131, - "step": 13180 - }, - { - "epoch": 0.37, - "learning_rate": 6.524729587031594e-06, - "loss": 0.0778, - "step": 13185 - }, - { - "epoch": 0.37, - "learning_rate": 6.52330260566797e-06, - "loss": 0.1794, - "step": 13190 - }, - { - "epoch": 0.37, - "learning_rate": 6.521875624304347e-06, - "loss": 0.3173, - "step": 13195 - }, - { - "epoch": 0.37, - "learning_rate": 6.520448642940724e-06, - "loss": 0.3544, - "step": 13200 - }, - { - "epoch": 0.37, - "learning_rate": 6.519021661577101e-06, - "loss": 0.2196, - "step": 13205 - }, - { - "epoch": 0.37, - "learning_rate": 6.517594680213477e-06, - "loss": 0.1745, - "step": 13210 - }, - { - "epoch": 0.37, - "learning_rate": 6.5161676988498535e-06, - "loss": 0.1374, - "step": 13215 - }, - { - "epoch": 0.37, - "learning_rate": 6.51474071748623e-06, - "loss": 0.2678, - "step": 13220 - }, - { - "epoch": 0.37, - "learning_rate": 6.513313736122607e-06, - "loss": 0.1534, - "step": 13225 - }, - { - "epoch": 0.37, - "learning_rate": 6.511886754758983e-06, - "loss": 0.0927, - "step": 13230 - }, - { - "epoch": 0.37, - "learning_rate": 6.51045977339536e-06, - "loss": 0.1013, - "step": 13235 - }, - { - "epoch": 0.37, - "learning_rate": 6.509032792031737e-06, - "loss": 0.2501, - "step": 13240 - }, - { - "epoch": 0.37, - "learning_rate": 6.507605810668113e-06, - "loss": 0.2229, - "step": 13245 - }, - { - "epoch": 0.37, - "learning_rate": 6.50617882930449e-06, - "loss": 0.2752, - "step": 13250 - }, - { - "epoch": 0.37, - "learning_rate": 6.504751847940867e-06, - "loss": 0.1636, - "step": 13255 - }, - { - "epoch": 0.37, - "learning_rate": 6.503324866577243e-06, - "loss": 0.136, - "step": 13260 - }, - { - "epoch": 0.37, - "learning_rate": 6.501897885213619e-06, - "loss": 0.14, - "step": 13265 - }, - { - "epoch": 0.37, - "learning_rate": 6.500470903849996e-06, - "loss": 0.1113, - "step": 13270 - }, - { - "epoch": 0.37, - "learning_rate": 6.499043922486373e-06, - "loss": 0.165, - "step": 13275 - }, - { - "epoch": 0.37, - "learning_rate": 6.497616941122749e-06, - "loss": 0.0431, - "step": 13280 - }, - { - "epoch": 0.37, - "learning_rate": 6.4961899597591264e-06, - "loss": 0.0915, - "step": 13285 - }, - { - "epoch": 0.37, - "learning_rate": 6.494762978395503e-06, - "loss": 0.0957, - "step": 13290 - }, - { - "epoch": 0.37, - "learning_rate": 6.493335997031879e-06, - "loss": 0.3148, - "step": 13295 - }, - { - "epoch": 0.37, - "learning_rate": 6.491909015668256e-06, - "loss": 0.2711, - "step": 13300 - }, - { - "epoch": 0.37, - "learning_rate": 6.490482034304633e-06, - "loss": 0.2059, - "step": 13305 - }, - { - "epoch": 0.37, - "learning_rate": 6.489055052941009e-06, - "loss": 0.1473, - "step": 13310 - }, - { - "epoch": 0.37, - "learning_rate": 6.487628071577385e-06, - "loss": 0.2038, - "step": 13315 - }, - { - "epoch": 0.37, - "learning_rate": 6.4862010902137625e-06, - "loss": 0.2306, - "step": 13320 - }, - { - "epoch": 0.37, - "learning_rate": 6.484774108850139e-06, - "loss": 0.1228, - "step": 13325 - }, - { - "epoch": 0.37, - "learning_rate": 6.483347127486516e-06, - "loss": 0.0809, - "step": 13330 - }, - { - "epoch": 0.37, - "learning_rate": 6.481920146122892e-06, - "loss": 0.1194, - "step": 13335 - }, - { - "epoch": 0.37, - "learning_rate": 6.480493164759269e-06, - "loss": 0.3542, - "step": 13340 - }, - { - "epoch": 0.37, - "learning_rate": 6.479066183395646e-06, - "loss": 0.3603, - "step": 13345 - }, - { - "epoch": 0.37, - "learning_rate": 6.477639202032022e-06, - "loss": 0.4615, - "step": 13350 - }, - { - "epoch": 0.37, - "learning_rate": 6.4762122206683986e-06, - "loss": 0.2122, - "step": 13355 - }, - { - "epoch": 0.37, - "learning_rate": 6.474785239304775e-06, - "loss": 0.1875, - "step": 13360 - }, - { - "epoch": 0.37, - "learning_rate": 6.473358257941151e-06, - "loss": 0.1534, - "step": 13365 - }, - { - "epoch": 0.37, - "learning_rate": 6.4719312765775284e-06, - "loss": 0.1891, - "step": 13370 - }, - { - "epoch": 0.37, - "learning_rate": 6.470504295213906e-06, - "loss": 0.2287, - "step": 13375 - }, - { - "epoch": 0.37, - "learning_rate": 6.469077313850282e-06, - "loss": 0.1701, - "step": 13380 - }, - { - "epoch": 0.37, - "learning_rate": 6.467650332486658e-06, - "loss": 0.0908, - "step": 13385 - }, - { - "epoch": 0.37, - "learning_rate": 6.466223351123035e-06, - "loss": 0.1964, - "step": 13390 - }, - { - "epoch": 0.37, - "learning_rate": 6.464796369759412e-06, - "loss": 0.2054, - "step": 13395 - }, - { - "epoch": 0.37, - "learning_rate": 6.463369388395788e-06, - "loss": 0.5634, - "step": 13400 - }, - { - "epoch": 0.37, - "learning_rate": 6.4619424070321645e-06, - "loss": 0.1152, - "step": 13405 - }, - { - "epoch": 0.37, - "learning_rate": 6.460515425668541e-06, - "loss": 0.2444, - "step": 13410 - }, - { - "epoch": 0.37, - "learning_rate": 6.459088444304918e-06, - "loss": 0.1514, - "step": 13415 - }, - { - "epoch": 0.37, - "learning_rate": 6.457661462941295e-06, - "loss": 0.1599, - "step": 13420 - }, - { - "epoch": 0.37, - "learning_rate": 6.4562344815776715e-06, - "loss": 0.188, - "step": 13425 - }, - { - "epoch": 0.37, - "learning_rate": 6.454807500214048e-06, - "loss": 0.0559, - "step": 13430 - }, - { - "epoch": 0.37, - "learning_rate": 6.453380518850424e-06, - "loss": 0.022, - "step": 13435 - }, - { - "epoch": 0.37, - "learning_rate": 6.451953537486801e-06, - "loss": 0.1629, - "step": 13440 - }, - { - "epoch": 0.37, - "learning_rate": 6.450526556123178e-06, - "loss": 0.295, - "step": 13445 - }, - { - "epoch": 0.37, - "learning_rate": 6.449099574759554e-06, - "loss": 0.6125, - "step": 13450 - }, - { - "epoch": 0.37, - "learning_rate": 6.4476725933959304e-06, - "loss": 0.184, - "step": 13455 - }, - { - "epoch": 0.37, - "learning_rate": 6.446245612032307e-06, - "loss": 0.2965, - "step": 13460 - }, - { - "epoch": 0.37, - "learning_rate": 6.444818630668685e-06, - "loss": 0.1644, - "step": 13465 - }, - { - "epoch": 0.37, - "learning_rate": 6.443391649305061e-06, - "loss": 0.1635, - "step": 13470 - }, - { - "epoch": 0.37, - "learning_rate": 6.4419646679414375e-06, - "loss": 0.1359, - "step": 13475 - }, - { - "epoch": 0.37, - "learning_rate": 6.440537686577814e-06, - "loss": 0.1287, - "step": 13480 - }, - { - "epoch": 0.37, - "learning_rate": 6.43911070521419e-06, - "loss": 0.1645, - "step": 13485 - }, - { - "epoch": 0.37, - "learning_rate": 6.437683723850567e-06, - "loss": 0.1742, - "step": 13490 - }, - { - "epoch": 0.37, - "learning_rate": 6.436256742486944e-06, - "loss": 0.1094, - "step": 13495 - }, - { - "epoch": 0.37, - "learning_rate": 6.43482976112332e-06, - "loss": 0.3841, - "step": 13500 - }, - { - "epoch": 0.37, - "learning_rate": 6.433402779759696e-06, - "loss": 0.1358, - "step": 13505 - }, - { - "epoch": 0.37, - "learning_rate": 6.431975798396074e-06, - "loss": 0.1486, - "step": 13510 - }, - { - "epoch": 0.38, - "learning_rate": 6.430548817032451e-06, - "loss": 0.1687, - "step": 13515 - }, - { - "epoch": 0.38, - "learning_rate": 6.429121835668827e-06, - "loss": 0.2705, - "step": 13520 - }, - { - "epoch": 0.38, - "learning_rate": 6.427694854305203e-06, - "loss": 0.0766, - "step": 13525 - }, - { - "epoch": 0.38, - "learning_rate": 6.42626787294158e-06, - "loss": 0.1227, - "step": 13530 - }, - { - "epoch": 0.38, - "learning_rate": 6.424840891577957e-06, - "loss": 0.1874, - "step": 13535 - }, - { - "epoch": 0.38, - "learning_rate": 6.423413910214333e-06, - "loss": 0.1504, - "step": 13540 - }, - { - "epoch": 0.38, - "learning_rate": 6.42198692885071e-06, - "loss": 0.1187, - "step": 13545 - }, - { - "epoch": 0.38, - "learning_rate": 6.420559947487086e-06, - "loss": 0.3289, - "step": 13550 - }, - { - "epoch": 0.38, - "learning_rate": 6.419132966123462e-06, - "loss": 0.1386, - "step": 13555 - }, - { - "epoch": 0.38, - "learning_rate": 6.41770598475984e-06, - "loss": 0.1542, - "step": 13560 - }, - { - "epoch": 0.38, - "learning_rate": 6.416279003396217e-06, - "loss": 0.16, - "step": 13565 - }, - { - "epoch": 0.38, - "learning_rate": 6.414852022032593e-06, - "loss": 0.2421, - "step": 13570 - }, - { - "epoch": 0.38, - "learning_rate": 6.413425040668969e-06, - "loss": 0.1571, - "step": 13575 - }, - { - "epoch": 0.38, - "learning_rate": 6.411998059305346e-06, - "loss": 0.0579, - "step": 13580 - }, - { - "epoch": 0.38, - "learning_rate": 6.410571077941723e-06, - "loss": 0.1032, - "step": 13585 - }, - { - "epoch": 0.38, - "learning_rate": 6.409144096578099e-06, - "loss": 0.0885, - "step": 13590 - }, - { - "epoch": 0.38, - "learning_rate": 6.4077171152144755e-06, - "loss": 0.2286, - "step": 13595 - }, - { - "epoch": 0.38, - "learning_rate": 6.406290133850852e-06, - "loss": 0.6907, - "step": 13600 - }, - { - "epoch": 0.38, - "learning_rate": 6.40486315248723e-06, - "loss": 0.1718, - "step": 13605 - }, - { - "epoch": 0.38, - "learning_rate": 6.403436171123606e-06, - "loss": 0.1999, - "step": 13610 - }, - { - "epoch": 0.38, - "learning_rate": 6.402009189759983e-06, - "loss": 0.2339, - "step": 13615 - }, - { - "epoch": 0.38, - "learning_rate": 6.400582208396359e-06, - "loss": 0.1723, - "step": 13620 - }, - { - "epoch": 0.38, - "learning_rate": 6.399155227032735e-06, - "loss": 0.0938, - "step": 13625 - }, - { - "epoch": 0.38, - "learning_rate": 6.3977282456691124e-06, - "loss": 0.0504, - "step": 13630 - }, - { - "epoch": 0.38, - "learning_rate": 6.396301264305489e-06, - "loss": 0.1868, - "step": 13635 - }, - { - "epoch": 0.38, - "learning_rate": 6.394874282941865e-06, - "loss": 0.2351, - "step": 13640 - }, - { - "epoch": 0.38, - "learning_rate": 6.3934473015782415e-06, - "loss": 0.3668, - "step": 13645 - }, - { - "epoch": 0.38, - "learning_rate": 6.392020320214618e-06, - "loss": 0.6481, - "step": 13650 - }, - { - "epoch": 0.38, - "learning_rate": 6.390593338850996e-06, - "loss": 0.1458, - "step": 13655 - }, - { - "epoch": 0.38, - "learning_rate": 6.389166357487372e-06, - "loss": 0.2637, - "step": 13660 - }, - { - "epoch": 0.38, - "learning_rate": 6.3877393761237485e-06, - "loss": 0.2027, - "step": 13665 - }, - { - "epoch": 0.38, - "learning_rate": 6.386312394760125e-06, - "loss": 0.2086, - "step": 13670 - }, - { - "epoch": 0.38, - "learning_rate": 6.384885413396501e-06, - "loss": 0.0929, - "step": 13675 - }, - { - "epoch": 0.38, - "learning_rate": 6.383458432032878e-06, - "loss": 0.0966, - "step": 13680 - }, - { - "epoch": 0.38, - "learning_rate": 6.382031450669255e-06, - "loss": 0.2651, - "step": 13685 - }, - { - "epoch": 0.38, - "learning_rate": 6.380604469305631e-06, - "loss": 0.2294, - "step": 13690 - }, - { - "epoch": 0.38, - "learning_rate": 6.379177487942007e-06, - "loss": 0.406, - "step": 13695 - }, - { - "epoch": 0.38, - "learning_rate": 6.377750506578385e-06, - "loss": 0.4792, - "step": 13700 - }, - { - "epoch": 0.38, - "learning_rate": 6.376323525214762e-06, - "loss": 0.1531, - "step": 13705 - }, - { - "epoch": 0.38, - "learning_rate": 6.374896543851138e-06, - "loss": 0.1431, - "step": 13710 - }, - { - "epoch": 0.38, - "learning_rate": 6.3734695624875144e-06, - "loss": 0.1865, - "step": 13715 - }, - { - "epoch": 0.38, - "learning_rate": 6.372042581123891e-06, - "loss": 0.1561, - "step": 13720 - }, - { - "epoch": 0.38, - "learning_rate": 6.370615599760268e-06, - "loss": 0.1485, - "step": 13725 - }, - { - "epoch": 0.38, - "learning_rate": 6.369188618396644e-06, - "loss": 0.0859, - "step": 13730 - }, - { - "epoch": 0.38, - "learning_rate": 6.367761637033021e-06, - "loss": 0.2794, - "step": 13735 - }, - { - "epoch": 0.38, - "learning_rate": 6.366334655669397e-06, - "loss": 0.2333, - "step": 13740 - }, - { - "epoch": 0.38, - "learning_rate": 6.364907674305773e-06, - "loss": 0.3636, - "step": 13745 - }, - { - "epoch": 0.38, - "learning_rate": 6.363480692942151e-06, - "loss": 0.5979, - "step": 13750 - }, - { - "epoch": 0.38, - "learning_rate": 6.362053711578528e-06, - "loss": 0.1171, - "step": 13755 - }, - { - "epoch": 0.38, - "learning_rate": 6.360626730214904e-06, - "loss": 0.1514, - "step": 13760 - }, - { - "epoch": 0.38, - "learning_rate": 6.35919974885128e-06, - "loss": 0.1609, - "step": 13765 - }, - { - "epoch": 0.38, - "learning_rate": 6.357772767487657e-06, - "loss": 0.1385, - "step": 13770 - }, - { - "epoch": 0.38, - "learning_rate": 6.356345786124034e-06, - "loss": 0.0788, - "step": 13775 - }, - { - "epoch": 0.38, - "learning_rate": 6.35491880476041e-06, - "loss": 0.1974, - "step": 13780 - }, - { - "epoch": 0.38, - "learning_rate": 6.3534918233967866e-06, - "loss": 0.1626, - "step": 13785 - }, - { - "epoch": 0.38, - "learning_rate": 6.352064842033163e-06, - "loss": 0.3104, - "step": 13790 - }, - { - "epoch": 0.38, - "learning_rate": 6.350637860669541e-06, - "loss": 0.2074, - "step": 13795 - }, - { - "epoch": 0.38, - "learning_rate": 6.349210879305917e-06, - "loss": 0.2424, - "step": 13800 - }, - { - "epoch": 0.38, - "learning_rate": 6.347783897942294e-06, - "loss": 0.1079, - "step": 13805 - }, - { - "epoch": 0.38, - "learning_rate": 6.34635691657867e-06, - "loss": 0.1808, - "step": 13810 - }, - { - "epoch": 0.38, - "learning_rate": 6.344929935215046e-06, - "loss": 0.1682, - "step": 13815 - }, - { - "epoch": 0.38, - "learning_rate": 6.3435029538514235e-06, - "loss": 0.2335, - "step": 13820 - }, - { - "epoch": 0.38, - "learning_rate": 6.3420759724878e-06, - "loss": 0.2089, - "step": 13825 - }, - { - "epoch": 0.38, - "learning_rate": 6.340648991124176e-06, - "loss": 0.1013, - "step": 13830 - }, - { - "epoch": 0.38, - "learning_rate": 6.3392220097605525e-06, - "loss": 0.1075, - "step": 13835 - }, - { - "epoch": 0.38, - "learning_rate": 6.337795028396929e-06, - "loss": 0.204, - "step": 13840 - }, - { - "epoch": 0.38, - "learning_rate": 6.336368047033307e-06, - "loss": 0.1115, - "step": 13845 - }, - { - "epoch": 0.38, - "learning_rate": 6.334941065669683e-06, - "loss": 0.2524, - "step": 13850 - }, - { - "epoch": 0.38, - "learning_rate": 6.3335140843060595e-06, - "loss": 0.1643, - "step": 13855 - }, - { - "epoch": 0.38, - "learning_rate": 6.332087102942436e-06, - "loss": 0.1864, - "step": 13860 - }, - { - "epoch": 0.38, - "learning_rate": 6.330660121578812e-06, - "loss": 0.1753, - "step": 13865 - }, - { - "epoch": 0.38, - "learning_rate": 6.329233140215189e-06, - "loss": 0.2333, - "step": 13870 - }, - { - "epoch": 0.38, - "learning_rate": 6.327806158851566e-06, - "loss": 0.2355, - "step": 13875 - }, - { - "epoch": 0.39, - "learning_rate": 6.326379177487942e-06, - "loss": 0.0981, - "step": 13880 - }, - { - "epoch": 0.39, - "learning_rate": 6.324952196124318e-06, - "loss": 0.1081, - "step": 13885 - }, - { - "epoch": 0.39, - "learning_rate": 6.3235252147606964e-06, - "loss": 0.2217, - "step": 13890 - }, - { - "epoch": 0.39, - "learning_rate": 6.322098233397073e-06, - "loss": 0.2834, - "step": 13895 - }, - { - "epoch": 0.39, - "learning_rate": 6.320671252033449e-06, - "loss": 0.3532, - "step": 13900 - }, - { - "epoch": 0.39, - "learning_rate": 6.3192442706698255e-06, - "loss": 0.1661, - "step": 13905 - }, - { - "epoch": 0.39, - "learning_rate": 6.317817289306202e-06, - "loss": 0.1203, - "step": 13910 - }, - { - "epoch": 0.39, - "learning_rate": 6.316390307942579e-06, - "loss": 0.2317, - "step": 13915 - }, - { - "epoch": 0.39, - "learning_rate": 6.314963326578955e-06, - "loss": 0.216, - "step": 13920 - }, - { - "epoch": 0.39, - "learning_rate": 6.313536345215332e-06, - "loss": 0.1415, - "step": 13925 - }, - { - "epoch": 0.39, - "learning_rate": 6.312109363851708e-06, - "loss": 0.2143, - "step": 13930 - }, - { - "epoch": 0.39, - "learning_rate": 6.310682382488084e-06, - "loss": 0.0619, - "step": 13935 - }, - { - "epoch": 0.39, - "learning_rate": 6.309255401124462e-06, - "loss": 0.2325, - "step": 13940 - }, - { - "epoch": 0.39, - "learning_rate": 6.307828419760839e-06, - "loss": 0.1864, - "step": 13945 - }, - { - "epoch": 0.39, - "learning_rate": 6.306401438397215e-06, - "loss": 0.4923, - "step": 13950 - }, - { - "epoch": 0.39, - "learning_rate": 6.304974457033591e-06, - "loss": 0.167, - "step": 13955 - }, - { - "epoch": 0.39, - "learning_rate": 6.303547475669968e-06, - "loss": 0.2789, - "step": 13960 - }, - { - "epoch": 0.39, - "learning_rate": 6.302120494306345e-06, - "loss": 0.3597, - "step": 13965 - }, - { - "epoch": 0.39, - "learning_rate": 6.300693512942721e-06, - "loss": 0.2088, - "step": 13970 - }, - { - "epoch": 0.39, - "learning_rate": 6.299266531579098e-06, - "loss": 0.2258, - "step": 13975 - }, - { - "epoch": 0.39, - "learning_rate": 6.297839550215474e-06, - "loss": 0.0746, - "step": 13980 - }, - { - "epoch": 0.39, - "learning_rate": 6.296412568851852e-06, - "loss": 0.1711, - "step": 13985 - }, - { - "epoch": 0.39, - "learning_rate": 6.294985587488228e-06, - "loss": 0.1465, - "step": 13990 - }, - { - "epoch": 0.39, - "learning_rate": 6.293558606124605e-06, - "loss": 0.277, - "step": 13995 - }, - { - "epoch": 0.39, - "learning_rate": 6.292131624760981e-06, - "loss": 0.3886, - "step": 14000 - }, - { - "epoch": 0.39, - "eval_loss": 0.06621355563402176, - "eval_runtime": 2033.5992, - "eval_samples_per_second": 7.877, - "eval_steps_per_second": 1.969, - "eval_wer": 0.19680851063829788, - "step": 14000 - }, - { - "epoch": 0.39, - "learning_rate": 6.290704643397357e-06, - "loss": 0.1386, - "step": 14005 - }, - { - "epoch": 0.39, - "learning_rate": 6.2892776620337345e-06, - "loss": 0.2327, - "step": 14010 - }, - { - "epoch": 0.39, - "learning_rate": 6.287850680670111e-06, - "loss": 0.2392, - "step": 14015 - }, - { - "epoch": 0.39, - "learning_rate": 6.286423699306487e-06, - "loss": 0.2466, - "step": 14020 - }, - { - "epoch": 0.39, - "learning_rate": 6.2849967179428635e-06, - "loss": 0.1271, - "step": 14025 - }, - { - "epoch": 0.39, - "learning_rate": 6.283569736579241e-06, - "loss": 0.092, - "step": 14030 - }, - { - "epoch": 0.39, - "learning_rate": 6.282142755215618e-06, - "loss": 0.1979, - "step": 14035 - }, - { - "epoch": 0.39, - "learning_rate": 6.280715773851994e-06, - "loss": 0.1962, - "step": 14040 - }, - { - "epoch": 0.39, - "learning_rate": 6.2792887924883706e-06, - "loss": 0.3097, - "step": 14045 - }, - { - "epoch": 0.39, - "learning_rate": 6.277861811124747e-06, - "loss": 0.4639, - "step": 14050 - }, - { - "epoch": 0.39, - "learning_rate": 6.276434829761123e-06, - "loss": 0.1918, - "step": 14055 - }, - { - "epoch": 0.39, - "learning_rate": 6.2750078483975004e-06, - "loss": 0.2204, - "step": 14060 - }, - { - "epoch": 0.39, - "learning_rate": 6.273580867033877e-06, - "loss": 0.1276, - "step": 14065 - }, - { - "epoch": 0.39, - "learning_rate": 6.272153885670253e-06, - "loss": 0.125, - "step": 14070 - }, - { - "epoch": 0.39, - "learning_rate": 6.27072690430663e-06, - "loss": 0.1187, - "step": 14075 - }, - { - "epoch": 0.39, - "learning_rate": 6.2692999229430075e-06, - "loss": 0.1567, - "step": 14080 - }, - { - "epoch": 0.39, - "learning_rate": 6.267872941579384e-06, - "loss": 0.1703, - "step": 14085 - }, - { - "epoch": 0.39, - "learning_rate": 6.26644596021576e-06, - "loss": 0.2286, - "step": 14090 - }, - { - "epoch": 0.39, - "learning_rate": 6.2650189788521365e-06, - "loss": 0.2252, - "step": 14095 - }, - { - "epoch": 0.39, - "learning_rate": 6.263591997488513e-06, - "loss": 0.5425, - "step": 14100 - }, - { - "epoch": 0.39, - "learning_rate": 6.26216501612489e-06, - "loss": 0.1377, - "step": 14105 - }, - { - "epoch": 0.39, - "learning_rate": 6.260738034761266e-06, - "loss": 0.2165, - "step": 14110 - }, - { - "epoch": 0.39, - "learning_rate": 6.259311053397643e-06, - "loss": 0.1183, - "step": 14115 - }, - { - "epoch": 0.39, - "learning_rate": 6.25788407203402e-06, - "loss": 0.1774, - "step": 14120 - }, - { - "epoch": 0.39, - "learning_rate": 6.256457090670396e-06, - "loss": 0.196, - "step": 14125 - }, - { - "epoch": 0.39, - "learning_rate": 6.255030109306773e-06, - "loss": 0.0132, - "step": 14130 - }, - { - "epoch": 0.39, - "learning_rate": 6.25360312794315e-06, - "loss": 0.1714, - "step": 14135 - }, - { - "epoch": 0.39, - "learning_rate": 6.252176146579526e-06, - "loss": 0.2184, - "step": 14140 - }, - { - "epoch": 0.39, - "learning_rate": 6.2507491652159024e-06, - "loss": 0.2794, - "step": 14145 - }, - { - "epoch": 0.39, - "learning_rate": 6.24932218385228e-06, - "loss": 0.3971, - "step": 14150 - }, - { - "epoch": 0.39, - "learning_rate": 6.247895202488656e-06, - "loss": 0.1343, - "step": 14155 - }, - { - "epoch": 0.39, - "learning_rate": 6.246468221125032e-06, - "loss": 0.1995, - "step": 14160 - }, - { - "epoch": 0.39, - "learning_rate": 6.2450412397614095e-06, - "loss": 0.1216, - "step": 14165 - }, - { - "epoch": 0.39, - "learning_rate": 6.243614258397786e-06, - "loss": 0.2421, - "step": 14170 - }, - { - "epoch": 0.39, - "learning_rate": 6.242187277034163e-06, - "loss": 0.1313, - "step": 14175 - }, - { - "epoch": 0.39, - "learning_rate": 6.240760295670539e-06, - "loss": 0.1285, - "step": 14180 - }, - { - "epoch": 0.39, - "learning_rate": 6.239333314306916e-06, - "loss": 0.2933, - "step": 14185 - }, - { - "epoch": 0.39, - "learning_rate": 6.237906332943292e-06, - "loss": 0.1455, - "step": 14190 - }, - { - "epoch": 0.39, - "learning_rate": 6.236479351579668e-06, - "loss": 0.2936, - "step": 14195 - }, - { - "epoch": 0.39, - "learning_rate": 6.2350523702160455e-06, - "loss": 0.6418, - "step": 14200 - }, - { - "epoch": 0.39, - "learning_rate": 6.233625388852422e-06, - "loss": 0.1547, - "step": 14205 - }, - { - "epoch": 0.39, - "learning_rate": 6.232198407488799e-06, - "loss": 0.1088, - "step": 14210 - }, - { - "epoch": 0.39, - "learning_rate": 6.230771426125175e-06, - "loss": 0.1535, - "step": 14215 - }, - { - "epoch": 0.39, - "learning_rate": 6.229344444761552e-06, - "loss": 0.1816, - "step": 14220 - }, - { - "epoch": 0.39, - "learning_rate": 6.227917463397929e-06, - "loss": 0.2131, - "step": 14225 - }, - { - "epoch": 0.39, - "learning_rate": 6.226490482034305e-06, - "loss": 0.0358, - "step": 14230 - }, - { - "epoch": 0.39, - "learning_rate": 6.225063500670682e-06, - "loss": 0.116, - "step": 14235 - }, - { - "epoch": 0.4, - "learning_rate": 6.223636519307058e-06, - "loss": 0.0447, - "step": 14240 - }, - { - "epoch": 0.4, - "learning_rate": 6.222209537943435e-06, - "loss": 0.2341, - "step": 14245 - }, - { - "epoch": 0.4, - "learning_rate": 6.220782556579812e-06, - "loss": 0.2686, - "step": 14250 - }, - { - "epoch": 0.4, - "learning_rate": 6.219355575216189e-06, - "loss": 0.1419, - "step": 14255 - }, - { - "epoch": 0.4, - "learning_rate": 6.217928593852565e-06, - "loss": 0.1696, - "step": 14260 - }, - { - "epoch": 0.4, - "learning_rate": 6.216501612488941e-06, - "loss": 0.2146, - "step": 14265 - }, - { - "epoch": 0.4, - "learning_rate": 6.2150746311253185e-06, - "loss": 0.1784, - "step": 14270 - }, - { - "epoch": 0.4, - "learning_rate": 6.213647649761695e-06, - "loss": 0.1043, - "step": 14275 - }, - { - "epoch": 0.4, - "learning_rate": 6.212220668398071e-06, - "loss": 0.1636, - "step": 14280 - }, - { - "epoch": 0.4, - "learning_rate": 6.2107936870344475e-06, - "loss": 0.0623, - "step": 14285 - }, - { - "epoch": 0.4, - "learning_rate": 6.209366705670824e-06, - "loss": 0.2764, - "step": 14290 - }, - { - "epoch": 0.4, - "learning_rate": 6.207939724307202e-06, - "loss": 0.3821, - "step": 14295 - }, - { - "epoch": 0.4, - "learning_rate": 6.206512742943578e-06, - "loss": 0.3635, - "step": 14300 - }, - { - "epoch": 0.4, - "learning_rate": 6.205085761579955e-06, - "loss": 0.1758, - "step": 14305 - }, - { - "epoch": 0.4, - "learning_rate": 6.203658780216331e-06, - "loss": 0.2334, - "step": 14310 - }, - { - "epoch": 0.4, - "learning_rate": 6.202231798852707e-06, - "loss": 0.2056, - "step": 14315 - }, - { - "epoch": 0.4, - "learning_rate": 6.2008048174890844e-06, - "loss": 0.205, - "step": 14320 - }, - { - "epoch": 0.4, - "learning_rate": 6.199377836125461e-06, - "loss": 0.0321, - "step": 14325 - }, - { - "epoch": 0.4, - "learning_rate": 6.197950854761837e-06, - "loss": 0.1652, - "step": 14330 - }, - { - "epoch": 0.4, - "learning_rate": 6.1965238733982135e-06, - "loss": 0.0713, - "step": 14335 - }, - { - "epoch": 0.4, - "learning_rate": 6.1950968920345915e-06, - "loss": 0.2637, - "step": 14340 - }, - { - "epoch": 0.4, - "learning_rate": 6.193669910670968e-06, - "loss": 0.1655, - "step": 14345 - }, - { - "epoch": 0.4, - "learning_rate": 6.192242929307344e-06, - "loss": 0.5425, - "step": 14350 - }, - { - "epoch": 0.4, - "learning_rate": 6.1908159479437205e-06, - "loss": 0.1133, - "step": 14355 - }, - { - "epoch": 0.4, - "learning_rate": 6.189388966580097e-06, - "loss": 0.1184, - "step": 14360 - }, - { - "epoch": 0.4, - "learning_rate": 6.187961985216474e-06, - "loss": 0.1982, - "step": 14365 - }, - { - "epoch": 0.4, - "learning_rate": 6.18653500385285e-06, - "loss": 0.1289, - "step": 14370 - }, - { - "epoch": 0.4, - "learning_rate": 6.185108022489227e-06, - "loss": 0.158, - "step": 14375 - }, - { - "epoch": 0.4, - "learning_rate": 6.183681041125603e-06, - "loss": 0.0574, - "step": 14380 - }, - { - "epoch": 0.4, - "learning_rate": 6.182254059761979e-06, - "loss": 0.1613, - "step": 14385 - }, - { - "epoch": 0.4, - "learning_rate": 6.180827078398357e-06, - "loss": 0.0882, - "step": 14390 - }, - { - "epoch": 0.4, - "learning_rate": 6.179400097034734e-06, - "loss": 0.285, - "step": 14395 - }, - { - "epoch": 0.4, - "learning_rate": 6.17797311567111e-06, - "loss": 0.4831, - "step": 14400 - }, - { - "epoch": 0.4, - "learning_rate": 6.1765461343074864e-06, - "loss": 0.1271, - "step": 14405 - }, - { - "epoch": 0.4, - "learning_rate": 6.175119152943863e-06, - "loss": 0.1416, - "step": 14410 - }, - { - "epoch": 0.4, - "learning_rate": 6.17369217158024e-06, - "loss": 0.2117, - "step": 14415 - }, - { - "epoch": 0.4, - "learning_rate": 6.172265190216616e-06, - "loss": 0.217, - "step": 14420 - }, - { - "epoch": 0.4, - "learning_rate": 6.170838208852993e-06, - "loss": 0.1049, - "step": 14425 - }, - { - "epoch": 0.4, - "learning_rate": 6.169411227489369e-06, - "loss": 0.0806, - "step": 14430 - }, - { - "epoch": 0.4, - "learning_rate": 6.167984246125747e-06, - "loss": 0.165, - "step": 14435 - }, - { - "epoch": 0.4, - "learning_rate": 6.166557264762123e-06, - "loss": 0.2446, - "step": 14440 - }, - { - "epoch": 0.4, - "learning_rate": 6.1651302833985e-06, - "loss": 0.3714, - "step": 14445 - }, - { - "epoch": 0.4, - "learning_rate": 6.163703302034876e-06, - "loss": 0.4461, - "step": 14450 - }, - { - "epoch": 0.4, - "learning_rate": 6.162276320671252e-06, - "loss": 0.1162, - "step": 14455 - }, - { - "epoch": 0.4, - "learning_rate": 6.1608493393076295e-06, - "loss": 0.148, - "step": 14460 - }, - { - "epoch": 0.4, - "learning_rate": 6.159422357944006e-06, - "loss": 0.1423, - "step": 14465 - }, - { - "epoch": 0.4, - "learning_rate": 6.157995376580382e-06, - "loss": 0.2353, - "step": 14470 - }, - { - "epoch": 0.4, - "learning_rate": 6.1565683952167586e-06, - "loss": 0.212, - "step": 14475 - }, - { - "epoch": 0.4, - "learning_rate": 6.155141413853135e-06, - "loss": 0.1511, - "step": 14480 - }, - { - "epoch": 0.4, - "learning_rate": 6.153714432489513e-06, - "loss": 0.1371, - "step": 14485 - }, - { - "epoch": 0.4, - "learning_rate": 6.152287451125889e-06, - "loss": 0.189, - "step": 14490 - }, - { - "epoch": 0.4, - "learning_rate": 6.150860469762266e-06, - "loss": 0.2548, - "step": 14495 - }, - { - "epoch": 0.4, - "learning_rate": 6.149433488398642e-06, - "loss": 0.5477, - "step": 14500 - }, - { - "epoch": 0.4, - "learning_rate": 6.148006507035018e-06, - "loss": 0.1403, - "step": 14505 - }, - { - "epoch": 0.4, - "learning_rate": 6.1465795256713955e-06, - "loss": 0.1262, - "step": 14510 - }, - { - "epoch": 0.4, - "learning_rate": 6.145152544307772e-06, - "loss": 0.1666, - "step": 14515 - }, - { - "epoch": 0.4, - "learning_rate": 6.143725562944148e-06, - "loss": 0.1582, - "step": 14520 - }, - { - "epoch": 0.4, - "learning_rate": 6.1422985815805245e-06, - "loss": 0.0996, - "step": 14525 - }, - { - "epoch": 0.4, - "learning_rate": 6.1408716002169025e-06, - "loss": 0.0793, - "step": 14530 - }, - { - "epoch": 0.4, - "learning_rate": 6.139444618853279e-06, - "loss": 0.1115, - "step": 14535 - }, - { - "epoch": 0.4, - "learning_rate": 6.138017637489655e-06, - "loss": 0.1565, - "step": 14540 - }, - { - "epoch": 0.4, - "learning_rate": 6.1365906561260315e-06, - "loss": 0.3243, - "step": 14545 - }, - { - "epoch": 0.4, - "learning_rate": 6.135163674762408e-06, - "loss": 0.4306, - "step": 14550 - }, - { - "epoch": 0.4, - "learning_rate": 6.133736693398785e-06, - "loss": 0.1278, - "step": 14555 - }, - { - "epoch": 0.4, - "learning_rate": 6.132309712035161e-06, - "loss": 0.1131, - "step": 14560 - }, - { - "epoch": 0.4, - "learning_rate": 6.130882730671538e-06, - "loss": 0.1418, - "step": 14565 - }, - { - "epoch": 0.4, - "learning_rate": 6.129455749307914e-06, - "loss": 0.195, - "step": 14570 - }, - { - "epoch": 0.4, - "learning_rate": 6.12802876794429e-06, - "loss": 0.1337, - "step": 14575 - }, - { - "epoch": 0.4, - "learning_rate": 6.1266017865806685e-06, - "loss": 0.1816, - "step": 14580 - }, - { - "epoch": 0.4, - "learning_rate": 6.125174805217045e-06, - "loss": 0.0926, - "step": 14585 - }, - { - "epoch": 0.4, - "learning_rate": 6.123747823853421e-06, - "loss": 0.1594, - "step": 14590 - }, - { - "epoch": 0.4, - "learning_rate": 6.1223208424897975e-06, - "loss": 0.2272, - "step": 14595 - }, - { - "epoch": 0.41, - "learning_rate": 6.120893861126174e-06, - "loss": 0.5619, - "step": 14600 - }, - { - "epoch": 0.41, - "learning_rate": 6.119466879762551e-06, - "loss": 0.1702, - "step": 14605 - }, - { - "epoch": 0.41, - "learning_rate": 6.118039898398927e-06, - "loss": 0.1968, - "step": 14610 - }, - { - "epoch": 0.41, - "learning_rate": 6.116612917035304e-06, - "loss": 0.15, - "step": 14615 - }, - { - "epoch": 0.41, - "learning_rate": 6.11518593567168e-06, - "loss": 0.1767, - "step": 14620 - }, - { - "epoch": 0.41, - "learning_rate": 6.113758954308058e-06, - "loss": 0.1723, - "step": 14625 - }, - { - "epoch": 0.41, - "learning_rate": 6.112331972944434e-06, - "loss": 0.1547, - "step": 14630 - }, - { - "epoch": 0.41, - "learning_rate": 6.110904991580811e-06, - "loss": 0.1129, - "step": 14635 - }, - { - "epoch": 0.41, - "learning_rate": 6.109478010217187e-06, - "loss": 0.1855, - "step": 14640 - }, - { - "epoch": 0.41, - "learning_rate": 6.108051028853563e-06, - "loss": 0.2278, - "step": 14645 - }, - { - "epoch": 0.41, - "learning_rate": 6.106624047489941e-06, - "loss": 0.4278, - "step": 14650 - }, - { - "epoch": 0.41, - "learning_rate": 6.105197066126317e-06, - "loss": 0.1545, - "step": 14655 - }, - { - "epoch": 0.41, - "learning_rate": 6.103770084762693e-06, - "loss": 0.1949, - "step": 14660 - }, - { - "epoch": 0.41, - "learning_rate": 6.10234310339907e-06, - "loss": 0.1673, - "step": 14665 - }, - { - "epoch": 0.41, - "learning_rate": 6.100916122035446e-06, - "loss": 0.2014, - "step": 14670 - }, - { - "epoch": 0.41, - "learning_rate": 6.099489140671824e-06, - "loss": 0.1868, - "step": 14675 - }, - { - "epoch": 0.41, - "learning_rate": 6.0980621593082e-06, - "loss": 0.0941, - "step": 14680 - }, - { - "epoch": 0.41, - "learning_rate": 6.096635177944577e-06, - "loss": 0.1168, - "step": 14685 - }, - { - "epoch": 0.41, - "learning_rate": 6.095208196580953e-06, - "loss": 0.1158, - "step": 14690 - }, - { - "epoch": 0.41, - "learning_rate": 6.093781215217329e-06, - "loss": 0.3806, - "step": 14695 - }, - { - "epoch": 0.41, - "learning_rate": 6.0923542338537065e-06, - "loss": 0.4403, - "step": 14700 - }, - { - "epoch": 0.41, - "learning_rate": 6.090927252490083e-06, - "loss": 0.147, - "step": 14705 - }, - { - "epoch": 0.41, - "learning_rate": 6.089500271126459e-06, - "loss": 0.1279, - "step": 14710 - }, - { - "epoch": 0.41, - "learning_rate": 6.0880732897628355e-06, - "loss": 0.1222, - "step": 14715 - }, - { - "epoch": 0.41, - "learning_rate": 6.0866463083992136e-06, - "loss": 0.2057, - "step": 14720 - }, - { - "epoch": 0.41, - "learning_rate": 6.08521932703559e-06, - "loss": 0.1129, - "step": 14725 - }, - { - "epoch": 0.41, - "learning_rate": 6.083792345671966e-06, - "loss": 0.2365, - "step": 14730 - }, - { - "epoch": 0.41, - "learning_rate": 6.0823653643083426e-06, - "loss": 0.1269, - "step": 14735 - }, - { - "epoch": 0.41, - "learning_rate": 6.080938382944719e-06, - "loss": 0.1231, - "step": 14740 - }, - { - "epoch": 0.41, - "learning_rate": 6.079511401581096e-06, - "loss": 0.2604, - "step": 14745 - }, - { - "epoch": 0.41, - "learning_rate": 6.0780844202174724e-06, - "loss": 0.4422, - "step": 14750 - }, - { - "epoch": 0.41, - "learning_rate": 6.076657438853849e-06, - "loss": 0.174, - "step": 14755 - }, - { - "epoch": 0.41, - "learning_rate": 6.075230457490225e-06, - "loss": 0.113, - "step": 14760 - }, - { - "epoch": 0.41, - "learning_rate": 6.0738034761266015e-06, - "loss": 0.2471, - "step": 14765 - }, - { - "epoch": 0.41, - "learning_rate": 6.0723764947629795e-06, - "loss": 0.1751, - "step": 14770 - }, - { - "epoch": 0.41, - "learning_rate": 6.070949513399356e-06, - "loss": 0.1614, - "step": 14775 - }, - { - "epoch": 0.41, - "learning_rate": 6.069522532035732e-06, - "loss": 0.1217, - "step": 14780 - }, - { - "epoch": 0.41, - "learning_rate": 6.0680955506721085e-06, - "loss": 0.1163, - "step": 14785 - }, - { - "epoch": 0.41, - "learning_rate": 6.066668569308485e-06, - "loss": 0.089, - "step": 14790 - }, - { - "epoch": 0.41, - "learning_rate": 6.065241587944862e-06, - "loss": 0.1482, - "step": 14795 - }, - { - "epoch": 0.41, - "learning_rate": 6.063814606581238e-06, - "loss": 0.4254, - "step": 14800 - }, - { - "epoch": 0.41, - "learning_rate": 6.062387625217615e-06, - "loss": 0.148, - "step": 14805 - }, - { - "epoch": 0.41, - "learning_rate": 6.060960643853991e-06, - "loss": 0.1652, - "step": 14810 - }, - { - "epoch": 0.41, - "learning_rate": 6.059533662490369e-06, - "loss": 0.173, - "step": 14815 - }, - { - "epoch": 0.41, - "learning_rate": 6.058106681126745e-06, - "loss": 0.1958, - "step": 14820 - }, - { - "epoch": 0.41, - "learning_rate": 6.056679699763122e-06, - "loss": 0.1786, - "step": 14825 - }, - { - "epoch": 0.41, - "learning_rate": 6.055252718399498e-06, - "loss": 0.1066, - "step": 14830 - }, - { - "epoch": 0.41, - "learning_rate": 6.0538257370358744e-06, - "loss": 0.0715, - "step": 14835 - }, - { - "epoch": 0.41, - "learning_rate": 6.052398755672252e-06, - "loss": 0.1148, - "step": 14840 - }, - { - "epoch": 0.41, - "learning_rate": 6.050971774308628e-06, - "loss": 0.2405, - "step": 14845 - }, - { - "epoch": 0.41, - "learning_rate": 6.049544792945004e-06, - "loss": 0.2661, - "step": 14850 - }, - { - "epoch": 0.41, - "learning_rate": 6.048117811581381e-06, - "loss": 0.1637, - "step": 14855 - }, - { - "epoch": 0.41, - "learning_rate": 6.046690830217757e-06, - "loss": 0.1238, - "step": 14860 - }, - { - "epoch": 0.41, - "learning_rate": 6.045263848854135e-06, - "loss": 0.2242, - "step": 14865 - }, - { - "epoch": 0.41, - "learning_rate": 6.043836867490511e-06, - "loss": 0.2049, - "step": 14870 - }, - { - "epoch": 0.41, - "learning_rate": 6.042409886126888e-06, - "loss": 0.0851, - "step": 14875 - }, - { - "epoch": 0.41, - "learning_rate": 6.040982904763264e-06, - "loss": 0.0644, - "step": 14880 - }, - { - "epoch": 0.41, - "learning_rate": 6.03955592339964e-06, - "loss": 0.0894, - "step": 14885 - }, - { - "epoch": 0.41, - "learning_rate": 6.0381289420360175e-06, - "loss": 0.2002, - "step": 14890 - }, - { - "epoch": 0.41, - "learning_rate": 6.036701960672394e-06, - "loss": 0.2101, - "step": 14895 - }, - { - "epoch": 0.41, - "learning_rate": 6.03527497930877e-06, - "loss": 0.3475, - "step": 14900 - }, - { - "epoch": 0.41, - "learning_rate": 6.0338479979451466e-06, - "loss": 0.1352, - "step": 14905 - }, - { - "epoch": 0.41, - "learning_rate": 6.032421016581525e-06, - "loss": 0.1464, - "step": 14910 - }, - { - "epoch": 0.41, - "learning_rate": 6.030994035217901e-06, - "loss": 0.1251, - "step": 14915 - }, - { - "epoch": 0.41, - "learning_rate": 6.029567053854277e-06, - "loss": 0.1559, - "step": 14920 - }, - { - "epoch": 0.41, - "learning_rate": 6.028140072490654e-06, - "loss": 0.1228, - "step": 14925 - }, - { - "epoch": 0.41, - "learning_rate": 6.02671309112703e-06, - "loss": 0.1002, - "step": 14930 - }, - { - "epoch": 0.41, - "learning_rate": 6.025286109763407e-06, - "loss": 0.1621, - "step": 14935 - }, - { - "epoch": 0.41, - "learning_rate": 6.0238591283997835e-06, - "loss": 0.1759, - "step": 14940 - }, - { - "epoch": 0.41, - "learning_rate": 6.02243214703616e-06, - "loss": 0.3777, - "step": 14945 - }, - { - "epoch": 0.41, - "learning_rate": 6.021005165672536e-06, - "loss": 0.2646, - "step": 14950 - }, - { - "epoch": 0.41, - "learning_rate": 6.019578184308913e-06, - "loss": 0.1493, - "step": 14955 - }, - { - "epoch": 0.42, - "learning_rate": 6.0181512029452905e-06, - "loss": 0.1904, - "step": 14960 - }, - { - "epoch": 0.42, - "learning_rate": 6.016724221581667e-06, - "loss": 0.1436, - "step": 14965 - }, - { - "epoch": 0.42, - "learning_rate": 6.015297240218043e-06, - "loss": 0.1792, - "step": 14970 - }, - { - "epoch": 0.42, - "learning_rate": 6.0138702588544195e-06, - "loss": 0.1413, - "step": 14975 - }, - { - "epoch": 0.42, - "learning_rate": 6.012443277490796e-06, - "loss": 0.0761, - "step": 14980 - }, - { - "epoch": 0.42, - "learning_rate": 6.011016296127173e-06, - "loss": 0.1626, - "step": 14985 - }, - { - "epoch": 0.42, - "learning_rate": 6.009589314763549e-06, - "loss": 0.1427, - "step": 14990 - }, - { - "epoch": 0.42, - "learning_rate": 6.008162333399927e-06, - "loss": 0.1857, - "step": 14995 - }, - { - "epoch": 0.42, - "learning_rate": 6.006735352036303e-06, - "loss": 0.3772, - "step": 15000 - }, - { - "epoch": 0.42, - "learning_rate": 6.00530837067268e-06, - "loss": 0.1449, - "step": 15005 - }, - { - "epoch": 0.42, - "learning_rate": 6.0038813893090564e-06, - "loss": 0.1873, - "step": 15010 - }, - { - "epoch": 0.42, - "learning_rate": 6.002454407945433e-06, - "loss": 0.1683, - "step": 15015 - }, - { - "epoch": 0.42, - "learning_rate": 6.001027426581809e-06, - "loss": 0.1978, - "step": 15020 - }, - { - "epoch": 0.42, - "learning_rate": 5.9996004452181855e-06, - "loss": 0.1495, - "step": 15025 - }, - { - "epoch": 0.42, - "learning_rate": 5.998173463854563e-06, - "loss": 0.1911, - "step": 15030 - }, - { - "epoch": 0.42, - "learning_rate": 5.996746482490939e-06, - "loss": 0.0522, - "step": 15035 - }, - { - "epoch": 0.42, - "learning_rate": 5.995319501127316e-06, - "loss": 0.1913, - "step": 15040 - }, - { - "epoch": 0.42, - "learning_rate": 5.9938925197636925e-06, - "loss": 0.0795, - "step": 15045 - }, - { - "epoch": 0.42, - "learning_rate": 5.992465538400069e-06, - "loss": 0.6079, - "step": 15050 - }, - { - "epoch": 0.42, - "learning_rate": 5.991038557036446e-06, - "loss": 0.1595, - "step": 15055 - }, - { - "epoch": 0.42, - "learning_rate": 5.989611575672822e-06, - "loss": 0.1979, - "step": 15060 - }, - { - "epoch": 0.42, - "learning_rate": 5.988184594309199e-06, - "loss": 0.1023, - "step": 15065 - }, - { - "epoch": 0.42, - "learning_rate": 5.986757612945575e-06, - "loss": 0.1596, - "step": 15070 - }, - { - "epoch": 0.42, - "learning_rate": 5.985330631581951e-06, - "loss": 0.1979, - "step": 15075 - }, - { - "epoch": 0.42, - "learning_rate": 5.9839036502183286e-06, - "loss": 0.0847, - "step": 15080 - }, - { - "epoch": 0.42, - "learning_rate": 5.982476668854706e-06, - "loss": 0.1253, - "step": 15085 - }, - { - "epoch": 0.42, - "learning_rate": 5.981049687491082e-06, - "loss": 0.1647, - "step": 15090 - }, - { - "epoch": 0.42, - "learning_rate": 5.9796227061274584e-06, - "loss": 0.1517, - "step": 15095 - }, - { - "epoch": 0.42, - "learning_rate": 5.978195724763836e-06, - "loss": 0.5746, - "step": 15100 - }, - { - "epoch": 0.42, - "learning_rate": 5.976768743400212e-06, - "loss": 0.3669, - "step": 15105 - }, - { - "epoch": 0.42, - "learning_rate": 5.975341762036588e-06, - "loss": 0.1328, - "step": 15110 - }, - { - "epoch": 0.42, - "learning_rate": 5.973914780672965e-06, - "loss": 0.1376, - "step": 15115 - }, - { - "epoch": 0.42, - "learning_rate": 5.972487799309341e-06, - "loss": 0.1686, - "step": 15120 - }, - { - "epoch": 0.42, - "learning_rate": 5.971060817945718e-06, - "loss": 0.0865, - "step": 15125 - }, - { - "epoch": 0.42, - "learning_rate": 5.969633836582095e-06, - "loss": 0.1565, - "step": 15130 - }, - { - "epoch": 0.42, - "learning_rate": 5.968206855218472e-06, - "loss": 0.1184, - "step": 15135 - }, - { - "epoch": 0.42, - "learning_rate": 5.966779873854848e-06, - "loss": 0.0771, - "step": 15140 - }, - { - "epoch": 0.42, - "learning_rate": 5.965352892491224e-06, - "loss": 0.4435, - "step": 15145 - }, - { - "epoch": 0.42, - "learning_rate": 5.9639259111276015e-06, - "loss": 0.4307, - "step": 15150 - }, - { - "epoch": 0.42, - "learning_rate": 5.962498929763978e-06, - "loss": 0.0955, - "step": 15155 - }, - { - "epoch": 0.42, - "learning_rate": 5.961071948400354e-06, - "loss": 0.13, - "step": 15160 - }, - { - "epoch": 0.42, - "learning_rate": 5.9596449670367306e-06, - "loss": 0.1701, - "step": 15165 - }, - { - "epoch": 0.42, - "learning_rate": 5.958217985673107e-06, - "loss": 0.2054, - "step": 15170 - }, - { - "epoch": 0.42, - "learning_rate": 5.956791004309485e-06, - "loss": 0.1288, - "step": 15175 - }, - { - "epoch": 0.42, - "learning_rate": 5.955364022945861e-06, - "loss": 0.1721, - "step": 15180 - }, - { - "epoch": 0.42, - "learning_rate": 5.953937041582238e-06, - "loss": 0.0594, - "step": 15185 - }, - { - "epoch": 0.42, - "learning_rate": 5.952510060218614e-06, - "loss": 0.2867, - "step": 15190 - }, - { - "epoch": 0.42, - "learning_rate": 5.951083078854991e-06, - "loss": 0.4329, - "step": 15195 - }, - { - "epoch": 0.42, - "learning_rate": 5.9496560974913675e-06, - "loss": 0.4032, - "step": 15200 - }, - { - "epoch": 0.42, - "learning_rate": 5.948229116127744e-06, - "loss": 0.1789, - "step": 15205 - }, - { - "epoch": 0.42, - "learning_rate": 5.94680213476412e-06, - "loss": 0.1517, - "step": 15210 - }, - { - "epoch": 0.42, - "learning_rate": 5.9453751534004965e-06, - "loss": 0.1671, - "step": 15215 - }, - { - "epoch": 0.42, - "learning_rate": 5.9439481720368745e-06, - "loss": 0.1864, - "step": 15220 - }, - { - "epoch": 0.42, - "learning_rate": 5.942521190673251e-06, - "loss": 0.1615, - "step": 15225 - }, - { - "epoch": 0.42, - "learning_rate": 5.941094209309627e-06, - "loss": 0.054, - "step": 15230 - }, - { - "epoch": 0.42, - "learning_rate": 5.9396672279460035e-06, - "loss": 0.1439, - "step": 15235 - }, - { - "epoch": 0.42, - "learning_rate": 5.93824024658238e-06, - "loss": 0.1283, - "step": 15240 - }, - { - "epoch": 0.42, - "learning_rate": 5.936813265218757e-06, - "loss": 0.2536, - "step": 15245 - }, - { - "epoch": 0.42, - "learning_rate": 5.935386283855133e-06, - "loss": 0.2707, - "step": 15250 - }, - { - "epoch": 0.42, - "learning_rate": 5.93395930249151e-06, - "loss": 0.2927, - "step": 15255 - }, - { - "epoch": 0.42, - "learning_rate": 5.932532321127886e-06, - "loss": 0.1679, - "step": 15260 - }, - { - "epoch": 0.42, - "learning_rate": 5.931105339764262e-06, - "loss": 0.2068, - "step": 15265 - }, - { - "epoch": 0.42, - "learning_rate": 5.9296783584006405e-06, - "loss": 0.1637, - "step": 15270 - }, - { - "epoch": 0.42, - "learning_rate": 5.928251377037017e-06, - "loss": 0.0461, - "step": 15275 - }, - { - "epoch": 0.42, - "learning_rate": 5.926824395673393e-06, - "loss": 0.0905, - "step": 15280 - }, - { - "epoch": 0.42, - "learning_rate": 5.9253974143097695e-06, - "loss": 0.2088, - "step": 15285 - }, - { - "epoch": 0.42, - "learning_rate": 5.923970432946147e-06, - "loss": 0.1959, - "step": 15290 - }, - { - "epoch": 0.42, - "learning_rate": 5.922543451582523e-06, - "loss": 0.3654, - "step": 15295 - }, - { - "epoch": 0.42, - "learning_rate": 5.921116470218899e-06, - "loss": 0.4821, - "step": 15300 - }, - { - "epoch": 0.42, - "learning_rate": 5.919689488855276e-06, - "loss": 0.1287, - "step": 15305 - }, - { - "epoch": 0.42, - "learning_rate": 5.918262507491652e-06, - "loss": 0.1532, - "step": 15310 - }, - { - "epoch": 0.42, - "learning_rate": 5.91683552612803e-06, - "loss": 0.1781, - "step": 15315 - }, - { - "epoch": 0.43, - "learning_rate": 5.915408544764406e-06, - "loss": 0.1431, - "step": 15320 - }, - { - "epoch": 0.43, - "learning_rate": 5.913981563400783e-06, - "loss": 0.1377, - "step": 15325 - }, - { - "epoch": 0.43, - "learning_rate": 5.912554582037159e-06, - "loss": 0.1645, - "step": 15330 - }, - { - "epoch": 0.43, - "learning_rate": 5.911127600673535e-06, - "loss": 0.119, - "step": 15335 - }, - { - "epoch": 0.43, - "learning_rate": 5.909700619309913e-06, - "loss": 0.187, - "step": 15340 - }, - { - "epoch": 0.43, - "learning_rate": 5.908273637946289e-06, - "loss": 0.2611, - "step": 15345 - }, - { - "epoch": 0.43, - "learning_rate": 5.906846656582665e-06, - "loss": 0.4396, - "step": 15350 - }, - { - "epoch": 0.43, - "learning_rate": 5.905419675219042e-06, - "loss": 0.1585, - "step": 15355 - }, - { - "epoch": 0.43, - "learning_rate": 5.903992693855418e-06, - "loss": 0.1651, - "step": 15360 - }, - { - "epoch": 0.43, - "learning_rate": 5.902565712491796e-06, - "loss": 0.266, - "step": 15365 - }, - { - "epoch": 0.43, - "learning_rate": 5.901138731128172e-06, - "loss": 0.1742, - "step": 15370 - }, - { - "epoch": 0.43, - "learning_rate": 5.899711749764549e-06, - "loss": 0.1705, - "step": 15375 - }, - { - "epoch": 0.43, - "learning_rate": 5.898284768400925e-06, - "loss": 0.0397, - "step": 15380 - }, - { - "epoch": 0.43, - "learning_rate": 5.896857787037302e-06, - "loss": 0.2106, - "step": 15385 - }, - { - "epoch": 0.43, - "learning_rate": 5.8954308056736785e-06, - "loss": 0.1104, - "step": 15390 - }, - { - "epoch": 0.43, - "learning_rate": 5.894003824310055e-06, - "loss": 0.25, - "step": 15395 - }, - { - "epoch": 0.43, - "learning_rate": 5.892576842946431e-06, - "loss": 0.1658, - "step": 15400 - }, - { - "epoch": 0.43, - "learning_rate": 5.8911498615828075e-06, - "loss": 0.2023, - "step": 15405 - }, - { - "epoch": 0.43, - "learning_rate": 5.8897228802191856e-06, - "loss": 0.1889, - "step": 15410 - }, - { - "epoch": 0.43, - "learning_rate": 5.888295898855562e-06, - "loss": 0.1971, - "step": 15415 - }, - { - "epoch": 0.43, - "learning_rate": 5.886868917491938e-06, - "loss": 0.186, - "step": 15420 - }, - { - "epoch": 0.43, - "learning_rate": 5.8854419361283146e-06, - "loss": 0.1272, - "step": 15425 - }, - { - "epoch": 0.43, - "learning_rate": 5.884014954764691e-06, - "loss": 0.0889, - "step": 15430 - }, - { - "epoch": 0.43, - "learning_rate": 5.882587973401068e-06, - "loss": 0.0736, - "step": 15435 - }, - { - "epoch": 0.43, - "learning_rate": 5.8811609920374444e-06, - "loss": 0.2415, - "step": 15440 - }, - { - "epoch": 0.43, - "learning_rate": 5.879734010673821e-06, - "loss": 0.2244, - "step": 15445 - }, - { - "epoch": 0.43, - "learning_rate": 5.878307029310197e-06, - "loss": 0.3602, - "step": 15450 - }, - { - "epoch": 0.43, - "learning_rate": 5.876880047946575e-06, - "loss": 0.1511, - "step": 15455 - }, - { - "epoch": 0.43, - "learning_rate": 5.8754530665829515e-06, - "loss": 0.1409, - "step": 15460 - }, - { - "epoch": 0.43, - "learning_rate": 5.874026085219328e-06, - "loss": 0.1107, - "step": 15465 - }, - { - "epoch": 0.43, - "learning_rate": 5.872599103855704e-06, - "loss": 0.1823, - "step": 15470 - }, - { - "epoch": 0.43, - "learning_rate": 5.8711721224920805e-06, - "loss": 0.0253, - "step": 15475 - }, - { - "epoch": 0.43, - "learning_rate": 5.869745141128458e-06, - "loss": 0.2005, - "step": 15480 - }, - { - "epoch": 0.43, - "learning_rate": 5.868318159764834e-06, - "loss": 0.2155, - "step": 15485 - }, - { - "epoch": 0.43, - "learning_rate": 5.86689117840121e-06, - "loss": 0.1663, - "step": 15490 - }, - { - "epoch": 0.43, - "learning_rate": 5.865464197037587e-06, - "loss": 0.1827, - "step": 15495 - }, - { - "epoch": 0.43, - "learning_rate": 5.864037215673963e-06, - "loss": 0.5004, - "step": 15500 - }, - { - "epoch": 0.43, - "learning_rate": 5.862610234310341e-06, - "loss": 0.1969, - "step": 15505 - }, - { - "epoch": 0.43, - "learning_rate": 5.861183252946717e-06, - "loss": 0.167, - "step": 15510 - }, - { - "epoch": 0.43, - "learning_rate": 5.859756271583094e-06, - "loss": 0.1858, - "step": 15515 - }, - { - "epoch": 0.43, - "learning_rate": 5.85832929021947e-06, - "loss": 0.1566, - "step": 15520 - }, - { - "epoch": 0.43, - "learning_rate": 5.8569023088558464e-06, - "loss": 0.1181, - "step": 15525 - }, - { - "epoch": 0.43, - "learning_rate": 5.855475327492224e-06, - "loss": 0.139, - "step": 15530 - }, - { - "epoch": 0.43, - "learning_rate": 5.8540483461286e-06, - "loss": 0.1463, - "step": 15535 - }, - { - "epoch": 0.43, - "learning_rate": 5.852621364764976e-06, - "loss": 0.1682, - "step": 15540 - }, - { - "epoch": 0.43, - "learning_rate": 5.851194383401353e-06, - "loss": 0.3414, - "step": 15545 - }, - { - "epoch": 0.43, - "learning_rate": 5.849767402037731e-06, - "loss": 0.4187, - "step": 15550 - }, - { - "epoch": 0.43, - "learning_rate": 5.848340420674107e-06, - "loss": 0.1858, - "step": 15555 - }, - { - "epoch": 0.43, - "learning_rate": 5.846913439310483e-06, - "loss": 0.1252, - "step": 15560 - }, - { - "epoch": 0.43, - "learning_rate": 5.84548645794686e-06, - "loss": 0.1411, - "step": 15565 - }, - { - "epoch": 0.43, - "learning_rate": 5.844059476583236e-06, - "loss": 0.1414, - "step": 15570 - }, - { - "epoch": 0.43, - "learning_rate": 5.842632495219613e-06, - "loss": 0.1748, - "step": 15575 - }, - { - "epoch": 0.43, - "learning_rate": 5.8412055138559895e-06, - "loss": 0.0769, - "step": 15580 - }, - { - "epoch": 0.43, - "learning_rate": 5.839778532492366e-06, - "loss": 0.0694, - "step": 15585 - }, - { - "epoch": 0.43, - "learning_rate": 5.838351551128742e-06, - "loss": 0.194, - "step": 15590 - }, - { - "epoch": 0.43, - "learning_rate": 5.8369245697651186e-06, - "loss": 0.2519, - "step": 15595 - }, - { - "epoch": 0.43, - "learning_rate": 5.835497588401497e-06, - "loss": 0.288, - "step": 15600 - }, - { - "epoch": 0.43, - "learning_rate": 5.834070607037873e-06, - "loss": 0.1731, - "step": 15605 - }, - { - "epoch": 0.43, - "learning_rate": 5.832643625674249e-06, - "loss": 0.1078, - "step": 15610 - }, - { - "epoch": 0.43, - "learning_rate": 5.831216644310626e-06, - "loss": 0.1198, - "step": 15615 - }, - { - "epoch": 0.43, - "learning_rate": 5.829789662947002e-06, - "loss": 0.2483, - "step": 15620 - }, - { - "epoch": 0.43, - "learning_rate": 5.828362681583379e-06, - "loss": 0.0385, - "step": 15625 - }, - { - "epoch": 0.43, - "learning_rate": 5.8269357002197555e-06, - "loss": 0.1998, - "step": 15630 - }, - { - "epoch": 0.43, - "learning_rate": 5.825508718856132e-06, - "loss": 0.3765, - "step": 15635 - }, - { - "epoch": 0.43, - "learning_rate": 5.824081737492508e-06, - "loss": 0.1923, - "step": 15640 - }, - { - "epoch": 0.43, - "learning_rate": 5.822654756128886e-06, - "loss": 0.1936, - "step": 15645 - }, - { - "epoch": 0.43, - "learning_rate": 5.8212277747652625e-06, - "loss": 0.406, - "step": 15650 - }, - { - "epoch": 0.43, - "learning_rate": 5.819800793401639e-06, - "loss": 0.1442, - "step": 15655 - }, - { - "epoch": 0.43, - "learning_rate": 5.818373812038015e-06, - "loss": 0.105, - "step": 15660 - }, - { - "epoch": 0.43, - "learning_rate": 5.8169468306743915e-06, - "loss": 0.1852, - "step": 15665 - }, - { - "epoch": 0.43, - "learning_rate": 5.815519849310769e-06, - "loss": 0.1685, - "step": 15670 - }, - { - "epoch": 0.43, - "learning_rate": 5.814092867947145e-06, - "loss": 0.2012, - "step": 15675 - }, - { - "epoch": 0.44, - "learning_rate": 5.812665886583521e-06, - "loss": 0.108, - "step": 15680 - }, - { - "epoch": 0.44, - "learning_rate": 5.811238905219898e-06, - "loss": 0.1475, - "step": 15685 - }, - { - "epoch": 0.44, - "learning_rate": 5.809811923856274e-06, - "loss": 0.0816, - "step": 15690 - }, - { - "epoch": 0.44, - "learning_rate": 5.808384942492652e-06, - "loss": 0.3827, - "step": 15695 - }, - { - "epoch": 0.44, - "learning_rate": 5.8069579611290284e-06, - "loss": 0.5066, - "step": 15700 - }, - { - "epoch": 0.44, - "learning_rate": 5.805530979765405e-06, - "loss": 0.1954, - "step": 15705 - }, - { - "epoch": 0.44, - "learning_rate": 5.804103998401781e-06, - "loss": 0.1015, - "step": 15710 - }, - { - "epoch": 0.44, - "learning_rate": 5.8026770170381575e-06, - "loss": 0.1712, - "step": 15715 - }, - { - "epoch": 0.44, - "learning_rate": 5.801250035674535e-06, - "loss": 0.1948, - "step": 15720 - }, - { - "epoch": 0.44, - "learning_rate": 5.799823054310911e-06, - "loss": 0.19, - "step": 15725 - }, - { - "epoch": 0.44, - "learning_rate": 5.798396072947287e-06, - "loss": 0.072, - "step": 15730 - }, - { - "epoch": 0.44, - "learning_rate": 5.796969091583664e-06, - "loss": 0.1734, - "step": 15735 - }, - { - "epoch": 0.44, - "learning_rate": 5.795542110220042e-06, - "loss": 0.0767, - "step": 15740 - }, - { - "epoch": 0.44, - "learning_rate": 5.794115128856418e-06, - "loss": 0.1765, - "step": 15745 - }, - { - "epoch": 0.44, - "learning_rate": 5.792688147492794e-06, - "loss": 0.4795, - "step": 15750 - }, - { - "epoch": 0.44, - "learning_rate": 5.791261166129171e-06, - "loss": 0.174, - "step": 15755 - }, - { - "epoch": 0.44, - "learning_rate": 5.789834184765547e-06, - "loss": 0.1905, - "step": 15760 - }, - { - "epoch": 0.44, - "learning_rate": 5.788407203401924e-06, - "loss": 0.1317, - "step": 15765 - }, - { - "epoch": 0.44, - "learning_rate": 5.7869802220383006e-06, - "loss": 0.1573, - "step": 15770 - }, - { - "epoch": 0.44, - "learning_rate": 5.785553240674677e-06, - "loss": 0.1188, - "step": 15775 - }, - { - "epoch": 0.44, - "learning_rate": 5.784126259311053e-06, - "loss": 0.1563, - "step": 15780 - }, - { - "epoch": 0.44, - "learning_rate": 5.7826992779474304e-06, - "loss": 0.0544, - "step": 15785 - }, - { - "epoch": 0.44, - "learning_rate": 5.781272296583808e-06, - "loss": 0.2061, - "step": 15790 - }, - { - "epoch": 0.44, - "learning_rate": 5.779845315220184e-06, - "loss": 0.2543, - "step": 15795 - }, - { - "epoch": 0.44, - "learning_rate": 5.77841833385656e-06, - "loss": 0.4642, - "step": 15800 - }, - { - "epoch": 0.44, - "learning_rate": 5.776991352492937e-06, - "loss": 0.2213, - "step": 15805 - }, - { - "epoch": 0.44, - "learning_rate": 5.775564371129313e-06, - "loss": 0.1508, - "step": 15810 - }, - { - "epoch": 0.44, - "learning_rate": 5.77413738976569e-06, - "loss": 0.1495, - "step": 15815 - }, - { - "epoch": 0.44, - "learning_rate": 5.7727104084020665e-06, - "loss": 0.1711, - "step": 15820 - }, - { - "epoch": 0.44, - "learning_rate": 5.771283427038443e-06, - "loss": 0.063, - "step": 15825 - }, - { - "epoch": 0.44, - "learning_rate": 5.76985644567482e-06, - "loss": 0.0513, - "step": 15830 - }, - { - "epoch": 0.44, - "learning_rate": 5.768429464311197e-06, - "loss": 0.3326, - "step": 15835 - }, - { - "epoch": 0.44, - "learning_rate": 5.7670024829475735e-06, - "loss": 0.1372, - "step": 15840 - }, - { - "epoch": 0.44, - "learning_rate": 5.76557550158395e-06, - "loss": 0.2871, - "step": 15845 - }, - { - "epoch": 0.44, - "learning_rate": 5.764148520220326e-06, - "loss": 0.5247, - "step": 15850 - }, - { - "epoch": 0.44, - "learning_rate": 5.7627215388567026e-06, - "loss": 0.1836, - "step": 15855 - }, - { - "epoch": 0.44, - "learning_rate": 5.76129455749308e-06, - "loss": 0.142, - "step": 15860 - }, - { - "epoch": 0.44, - "learning_rate": 5.759867576129456e-06, - "loss": 0.2079, - "step": 15865 - }, - { - "epoch": 0.44, - "learning_rate": 5.7584405947658324e-06, - "loss": 0.1359, - "step": 15870 - }, - { - "epoch": 0.44, - "learning_rate": 5.75701361340221e-06, - "loss": 0.1529, - "step": 15875 - }, - { - "epoch": 0.44, - "learning_rate": 5.755586632038586e-06, - "loss": 0.1607, - "step": 15880 - }, - { - "epoch": 0.44, - "learning_rate": 5.754159650674963e-06, - "loss": 0.179, - "step": 15885 - }, - { - "epoch": 0.44, - "learning_rate": 5.7527326693113395e-06, - "loss": 0.1321, - "step": 15890 - }, - { - "epoch": 0.44, - "learning_rate": 5.751305687947716e-06, - "loss": 0.2263, - "step": 15895 - }, - { - "epoch": 0.44, - "learning_rate": 5.749878706584092e-06, - "loss": 0.2971, - "step": 15900 - }, - { - "epoch": 0.44, - "learning_rate": 5.7484517252204685e-06, - "loss": 0.1456, - "step": 15905 - }, - { - "epoch": 0.44, - "learning_rate": 5.747024743856846e-06, - "loss": 0.2264, - "step": 15910 - }, - { - "epoch": 0.44, - "learning_rate": 5.745597762493222e-06, - "loss": 0.1319, - "step": 15915 - }, - { - "epoch": 0.44, - "learning_rate": 5.744170781129599e-06, - "loss": 0.1284, - "step": 15920 - }, - { - "epoch": 0.44, - "learning_rate": 5.7427437997659755e-06, - "loss": 0.1671, - "step": 15925 - }, - { - "epoch": 0.44, - "learning_rate": 5.741316818402353e-06, - "loss": 0.1931, - "step": 15930 - }, - { - "epoch": 0.44, - "learning_rate": 5.739889837038729e-06, - "loss": 0.3126, - "step": 15935 - }, - { - "epoch": 0.44, - "learning_rate": 5.738462855675105e-06, - "loss": 0.3046, - "step": 15940 - }, - { - "epoch": 0.44, - "learning_rate": 5.737035874311482e-06, - "loss": 0.3687, - "step": 15945 - }, - { - "epoch": 0.44, - "learning_rate": 5.735608892947858e-06, - "loss": 0.4295, - "step": 15950 - }, - { - "epoch": 0.44, - "learning_rate": 5.734181911584235e-06, - "loss": 0.1389, - "step": 15955 - }, - { - "epoch": 0.44, - "learning_rate": 5.732754930220612e-06, - "loss": 0.2207, - "step": 15960 - }, - { - "epoch": 0.44, - "learning_rate": 5.731327948856989e-06, - "loss": 0.1332, - "step": 15965 - }, - { - "epoch": 0.44, - "learning_rate": 5.729900967493365e-06, - "loss": 0.1509, - "step": 15970 - }, - { - "epoch": 0.44, - "learning_rate": 5.7284739861297415e-06, - "loss": 0.1135, - "step": 15975 - }, - { - "epoch": 0.44, - "learning_rate": 5.727047004766119e-06, - "loss": 0.138, - "step": 15980 - }, - { - "epoch": 0.44, - "learning_rate": 5.725620023402495e-06, - "loss": 0.1944, - "step": 15985 - }, - { - "epoch": 0.44, - "learning_rate": 5.724193042038871e-06, - "loss": 0.1586, - "step": 15990 - }, - { - "epoch": 0.44, - "learning_rate": 5.722766060675248e-06, - "loss": 0.1768, - "step": 15995 - }, - { - "epoch": 0.44, - "learning_rate": 5.721339079311624e-06, - "loss": 0.5374, - "step": 16000 - }, - { - "epoch": 0.44, - "eval_loss": 0.0686265304684639, - "eval_runtime": 1948.2008, - "eval_samples_per_second": 8.222, - "eval_steps_per_second": 2.056, - "eval_wer": 0.185971871619185, - "step": 16000 - }, - { - "epoch": 0.44, - "learning_rate": 5.719912097948002e-06, - "loss": 0.1114, - "step": 16005 - }, - { - "epoch": 0.44, - "learning_rate": 5.718485116584378e-06, - "loss": 0.2, - "step": 16010 - }, - { - "epoch": 0.44, - "learning_rate": 5.717058135220755e-06, - "loss": 0.1075, - "step": 16015 - }, - { - "epoch": 0.44, - "learning_rate": 5.715631153857131e-06, - "loss": 0.1529, - "step": 16020 - }, - { - "epoch": 0.44, - "learning_rate": 5.714204172493508e-06, - "loss": 0.0363, - "step": 16025 - }, - { - "epoch": 0.44, - "learning_rate": 5.712777191129885e-06, - "loss": 0.2312, - "step": 16030 - }, - { - "epoch": 0.44, - "learning_rate": 5.711350209766261e-06, - "loss": 0.056, - "step": 16035 - }, - { - "epoch": 0.45, - "learning_rate": 5.709923228402637e-06, - "loss": 0.1475, - "step": 16040 - }, - { - "epoch": 0.45, - "learning_rate": 5.708496247039014e-06, - "loss": 0.2889, - "step": 16045 - }, - { - "epoch": 0.45, - "learning_rate": 5.707069265675392e-06, - "loss": 0.5634, - "step": 16050 - }, - { - "epoch": 0.45, - "learning_rate": 5.705642284311768e-06, - "loss": 0.1819, - "step": 16055 - }, - { - "epoch": 0.45, - "learning_rate": 5.704215302948144e-06, - "loss": 0.1169, - "step": 16060 - }, - { - "epoch": 0.45, - "learning_rate": 5.702788321584521e-06, - "loss": 0.2161, - "step": 16065 - }, - { - "epoch": 0.45, - "learning_rate": 5.701361340220897e-06, - "loss": 0.2054, - "step": 16070 - }, - { - "epoch": 0.45, - "learning_rate": 5.699934358857274e-06, - "loss": 0.1147, - "step": 16075 - }, - { - "epoch": 0.45, - "learning_rate": 5.6985073774936505e-06, - "loss": 0.1058, - "step": 16080 - }, - { - "epoch": 0.45, - "learning_rate": 5.697080396130027e-06, - "loss": 0.1971, - "step": 16085 - }, - { - "epoch": 0.45, - "learning_rate": 5.695653414766403e-06, - "loss": 0.1929, - "step": 16090 - }, - { - "epoch": 0.45, - "learning_rate": 5.6942264334027795e-06, - "loss": 0.2481, - "step": 16095 - }, - { - "epoch": 0.45, - "learning_rate": 5.6927994520391576e-06, - "loss": 0.6187, - "step": 16100 - }, - { - "epoch": 0.45, - "learning_rate": 5.691372470675534e-06, - "loss": 0.1115, - "step": 16105 - }, - { - "epoch": 0.45, - "learning_rate": 5.68994548931191e-06, - "loss": 0.1638, - "step": 16110 - }, - { - "epoch": 0.45, - "learning_rate": 5.6885185079482866e-06, - "loss": 0.1671, - "step": 16115 - }, - { - "epoch": 0.45, - "learning_rate": 5.687091526584664e-06, - "loss": 0.1476, - "step": 16120 - }, - { - "epoch": 0.45, - "learning_rate": 5.68566454522104e-06, - "loss": 0.1183, - "step": 16125 - }, - { - "epoch": 0.45, - "learning_rate": 5.6842375638574164e-06, - "loss": 0.0607, - "step": 16130 - }, - { - "epoch": 0.45, - "learning_rate": 5.682810582493793e-06, - "loss": 0.097, - "step": 16135 - }, - { - "epoch": 0.45, - "learning_rate": 5.681383601130169e-06, - "loss": 0.1784, - "step": 16140 - }, - { - "epoch": 0.45, - "learning_rate": 5.679956619766547e-06, - "loss": 0.2754, - "step": 16145 - }, - { - "epoch": 0.45, - "learning_rate": 5.6785296384029235e-06, - "loss": 0.4347, - "step": 16150 - }, - { - "epoch": 0.45, - "learning_rate": 5.6771026570393e-06, - "loss": 0.2081, - "step": 16155 - }, - { - "epoch": 0.45, - "learning_rate": 5.675675675675676e-06, - "loss": 0.1189, - "step": 16160 - }, - { - "epoch": 0.45, - "learning_rate": 5.6742486943120525e-06, - "loss": 0.1428, - "step": 16165 - }, - { - "epoch": 0.45, - "learning_rate": 5.67282171294843e-06, - "loss": 0.1191, - "step": 16170 - }, - { - "epoch": 0.45, - "learning_rate": 5.671394731584806e-06, - "loss": 0.1557, - "step": 16175 - }, - { - "epoch": 0.45, - "learning_rate": 5.669967750221182e-06, - "loss": 0.0787, - "step": 16180 - }, - { - "epoch": 0.45, - "learning_rate": 5.668540768857559e-06, - "loss": 0.0814, - "step": 16185 - }, - { - "epoch": 0.45, - "learning_rate": 5.667113787493935e-06, - "loss": 0.4326, - "step": 16190 - }, - { - "epoch": 0.45, - "learning_rate": 5.665686806130313e-06, - "loss": 0.3891, - "step": 16195 - }, - { - "epoch": 0.45, - "learning_rate": 5.664259824766689e-06, - "loss": 0.3938, - "step": 16200 - }, - { - "epoch": 0.45, - "learning_rate": 5.662832843403066e-06, - "loss": 0.0934, - "step": 16205 - }, - { - "epoch": 0.45, - "learning_rate": 5.661405862039442e-06, - "loss": 0.1079, - "step": 16210 - }, - { - "epoch": 0.45, - "learning_rate": 5.659978880675819e-06, - "loss": 0.1906, - "step": 16215 - }, - { - "epoch": 0.45, - "learning_rate": 5.658551899312196e-06, - "loss": 0.1347, - "step": 16220 - }, - { - "epoch": 0.45, - "learning_rate": 5.657124917948572e-06, - "loss": 0.1073, - "step": 16225 - }, - { - "epoch": 0.45, - "learning_rate": 5.655697936584948e-06, - "loss": 0.0906, - "step": 16230 - }, - { - "epoch": 0.45, - "learning_rate": 5.654270955221325e-06, - "loss": 0.0965, - "step": 16235 - }, - { - "epoch": 0.45, - "learning_rate": 5.652843973857703e-06, - "loss": 0.1537, - "step": 16240 - }, - { - "epoch": 0.45, - "learning_rate": 5.651416992494079e-06, - "loss": 0.1443, - "step": 16245 - }, - { - "epoch": 0.45, - "learning_rate": 5.649990011130455e-06, - "loss": 0.3198, - "step": 16250 - }, - { - "epoch": 0.45, - "learning_rate": 5.648563029766832e-06, - "loss": 0.1844, - "step": 16255 - }, - { - "epoch": 0.45, - "learning_rate": 5.647136048403208e-06, - "loss": 0.1468, - "step": 16260 - }, - { - "epoch": 0.45, - "learning_rate": 5.645709067039585e-06, - "loss": 0.2023, - "step": 16265 - }, - { - "epoch": 0.45, - "learning_rate": 5.6442820856759615e-06, - "loss": 0.1989, - "step": 16270 - }, - { - "epoch": 0.45, - "learning_rate": 5.642855104312338e-06, - "loss": 0.0832, - "step": 16275 - }, - { - "epoch": 0.45, - "learning_rate": 5.641428122948714e-06, - "loss": 0.0124, - "step": 16280 - }, - { - "epoch": 0.45, - "learning_rate": 5.6400011415850906e-06, - "loss": 0.1311, - "step": 16285 - }, - { - "epoch": 0.45, - "learning_rate": 5.638574160221469e-06, - "loss": 0.1941, - "step": 16290 - }, - { - "epoch": 0.45, - "learning_rate": 5.637147178857845e-06, - "loss": 0.0791, - "step": 16295 - }, - { - "epoch": 0.45, - "learning_rate": 5.635720197494221e-06, - "loss": 0.3192, - "step": 16300 - }, - { - "epoch": 0.45, - "learning_rate": 5.634293216130598e-06, - "loss": 0.1634, - "step": 16305 - }, - { - "epoch": 0.45, - "learning_rate": 5.632866234766975e-06, - "loss": 0.2161, - "step": 16310 - }, - { - "epoch": 0.45, - "learning_rate": 5.631439253403351e-06, - "loss": 0.1839, - "step": 16315 - }, - { - "epoch": 0.45, - "learning_rate": 5.6300122720397275e-06, - "loss": 0.1424, - "step": 16320 - }, - { - "epoch": 0.45, - "learning_rate": 5.628585290676104e-06, - "loss": 0.1061, - "step": 16325 - }, - { - "epoch": 0.45, - "learning_rate": 5.62715830931248e-06, - "loss": 0.0574, - "step": 16330 - }, - { - "epoch": 0.45, - "learning_rate": 5.625731327948858e-06, - "loss": 0.1294, - "step": 16335 - }, - { - "epoch": 0.45, - "learning_rate": 5.6243043465852345e-06, - "loss": 0.1222, - "step": 16340 - }, - { - "epoch": 0.45, - "learning_rate": 5.622877365221611e-06, - "loss": 0.2917, - "step": 16345 - }, - { - "epoch": 0.45, - "learning_rate": 5.621450383857987e-06, - "loss": 0.2507, - "step": 16350 - }, - { - "epoch": 0.45, - "learning_rate": 5.6200234024943635e-06, - "loss": 0.1206, - "step": 16355 - }, - { - "epoch": 0.45, - "learning_rate": 5.618596421130741e-06, - "loss": 0.1327, - "step": 16360 - }, - { - "epoch": 0.45, - "learning_rate": 5.617169439767117e-06, - "loss": 0.1302, - "step": 16365 - }, - { - "epoch": 0.45, - "learning_rate": 5.615742458403493e-06, - "loss": 0.1795, - "step": 16370 - }, - { - "epoch": 0.45, - "learning_rate": 5.61431547703987e-06, - "loss": 0.1121, - "step": 16375 - }, - { - "epoch": 0.45, - "learning_rate": 5.612888495676246e-06, - "loss": 0.1555, - "step": 16380 - }, - { - "epoch": 0.45, - "learning_rate": 5.611461514312624e-06, - "loss": 0.0623, - "step": 16385 - }, - { - "epoch": 0.45, - "learning_rate": 5.6100345329490004e-06, - "loss": 0.1516, - "step": 16390 - }, - { - "epoch": 0.45, - "learning_rate": 5.608607551585377e-06, - "loss": 0.2326, - "step": 16395 - }, - { - "epoch": 0.46, - "learning_rate": 5.607180570221753e-06, - "loss": 0.4471, - "step": 16400 - }, - { - "epoch": 0.46, - "learning_rate": 5.60575358885813e-06, - "loss": 0.149, - "step": 16405 - }, - { - "epoch": 0.46, - "learning_rate": 5.604326607494507e-06, - "loss": 0.1888, - "step": 16410 - }, - { - "epoch": 0.46, - "learning_rate": 5.602899626130883e-06, - "loss": 0.2294, - "step": 16415 - }, - { - "epoch": 0.46, - "learning_rate": 5.601472644767259e-06, - "loss": 0.1127, - "step": 16420 - }, - { - "epoch": 0.46, - "learning_rate": 5.600045663403636e-06, - "loss": 0.0707, - "step": 16425 - }, - { - "epoch": 0.46, - "learning_rate": 5.598618682040014e-06, - "loss": 0.0558, - "step": 16430 - }, - { - "epoch": 0.46, - "learning_rate": 5.59719170067639e-06, - "loss": 0.134, - "step": 16435 - }, - { - "epoch": 0.46, - "learning_rate": 5.595764719312766e-06, - "loss": 0.1683, - "step": 16440 - }, - { - "epoch": 0.46, - "learning_rate": 5.594337737949143e-06, - "loss": 0.3001, - "step": 16445 - }, - { - "epoch": 0.46, - "learning_rate": 5.592910756585519e-06, - "loss": 0.445, - "step": 16450 - }, - { - "epoch": 0.46, - "learning_rate": 5.591483775221896e-06, - "loss": 0.1413, - "step": 16455 - }, - { - "epoch": 0.46, - "learning_rate": 5.5900567938582726e-06, - "loss": 0.0874, - "step": 16460 - }, - { - "epoch": 0.46, - "learning_rate": 5.588629812494649e-06, - "loss": 0.1695, - "step": 16465 - }, - { - "epoch": 0.46, - "learning_rate": 5.587202831131025e-06, - "loss": 0.1552, - "step": 16470 - }, - { - "epoch": 0.46, - "learning_rate": 5.585775849767402e-06, - "loss": 0.171, - "step": 16475 - }, - { - "epoch": 0.46, - "learning_rate": 5.58434886840378e-06, - "loss": 0.0791, - "step": 16480 - }, - { - "epoch": 0.46, - "learning_rate": 5.582921887040156e-06, - "loss": 0.1119, - "step": 16485 - }, - { - "epoch": 0.46, - "learning_rate": 5.581494905676532e-06, - "loss": 0.2402, - "step": 16490 - }, - { - "epoch": 0.46, - "learning_rate": 5.580067924312909e-06, - "loss": 0.2793, - "step": 16495 - }, - { - "epoch": 0.46, - "learning_rate": 5.578640942949286e-06, - "loss": 0.5294, - "step": 16500 - }, - { - "epoch": 0.46, - "learning_rate": 5.577213961585662e-06, - "loss": 0.1235, - "step": 16505 - }, - { - "epoch": 0.46, - "learning_rate": 5.5757869802220385e-06, - "loss": 0.1802, - "step": 16510 - }, - { - "epoch": 0.46, - "learning_rate": 5.574359998858415e-06, - "loss": 0.112, - "step": 16515 - }, - { - "epoch": 0.46, - "learning_rate": 5.572933017494791e-06, - "loss": 0.1402, - "step": 16520 - }, - { - "epoch": 0.46, - "learning_rate": 5.571506036131169e-06, - "loss": 0.2075, - "step": 16525 - }, - { - "epoch": 0.46, - "learning_rate": 5.57036445104027e-06, - "loss": 0.9067, - "step": 16530 - }, - { - "epoch": 0.46, - "learning_rate": 5.568937469676646e-06, - "loss": 0.0746, - "step": 16535 - }, - { - "epoch": 0.46, - "learning_rate": 5.567510488313022e-06, - "loss": 0.3122, - "step": 16540 - }, - { - "epoch": 0.46, - "learning_rate": 5.5660835069494e-06, - "loss": 0.3623, - "step": 16545 - }, - { - "epoch": 0.46, - "learning_rate": 5.564656525585777e-06, - "loss": 0.4181, - "step": 16550 - }, - { - "epoch": 0.46, - "learning_rate": 5.563229544222153e-06, - "loss": 0.2052, - "step": 16555 - }, - { - "epoch": 0.46, - "learning_rate": 5.561802562858529e-06, - "loss": 0.1638, - "step": 16560 - }, - { - "epoch": 0.46, - "learning_rate": 5.560375581494906e-06, - "loss": 0.1692, - "step": 16565 - }, - { - "epoch": 0.46, - "learning_rate": 5.558948600131283e-06, - "loss": 0.1753, - "step": 16570 - }, - { - "epoch": 0.46, - "learning_rate": 5.557521618767659e-06, - "loss": 0.1365, - "step": 16575 - }, - { - "epoch": 0.46, - "learning_rate": 5.5560946374040355e-06, - "loss": 0.11, - "step": 16580 - }, - { - "epoch": 0.46, - "learning_rate": 5.554667656040412e-06, - "loss": 0.0666, - "step": 16585 - }, - { - "epoch": 0.46, - "learning_rate": 5.553240674676788e-06, - "loss": 0.1271, - "step": 16590 - }, - { - "epoch": 0.46, - "learning_rate": 5.551813693313166e-06, - "loss": 0.2357, - "step": 16595 - }, - { - "epoch": 0.46, - "learning_rate": 5.550386711949543e-06, - "loss": 0.5136, - "step": 16600 - }, - { - "epoch": 0.46, - "learning_rate": 5.548959730585919e-06, - "loss": 0.0782, - "step": 16605 - }, - { - "epoch": 0.46, - "learning_rate": 5.547532749222295e-06, - "loss": 0.1825, - "step": 16610 - }, - { - "epoch": 0.46, - "learning_rate": 5.5461057678586724e-06, - "loss": 0.2018, - "step": 16615 - }, - { - "epoch": 0.46, - "learning_rate": 5.544678786495049e-06, - "loss": 0.1425, - "step": 16620 - }, - { - "epoch": 0.46, - "learning_rate": 5.543251805131425e-06, - "loss": 0.0838, - "step": 16625 - }, - { - "epoch": 0.46, - "learning_rate": 5.5418248237678015e-06, - "loss": 0.1659, - "step": 16630 - }, - { - "epoch": 0.46, - "learning_rate": 5.540397842404178e-06, - "loss": 0.112, - "step": 16635 - }, - { - "epoch": 0.46, - "learning_rate": 5.538970861040556e-06, - "loss": 0.3056, - "step": 16640 - }, - { - "epoch": 0.46, - "learning_rate": 5.537543879676932e-06, - "loss": 0.303, - "step": 16645 - }, - { - "epoch": 0.46, - "learning_rate": 5.5361168983133085e-06, - "loss": 0.4717, - "step": 16650 - }, - { - "epoch": 0.46, - "learning_rate": 5.534689916949685e-06, - "loss": 0.2241, - "step": 16655 - }, - { - "epoch": 0.46, - "learning_rate": 5.533262935586061e-06, - "loss": 0.1074, - "step": 16660 - }, - { - "epoch": 0.46, - "learning_rate": 5.531835954222438e-06, - "loss": 0.1684, - "step": 16665 - }, - { - "epoch": 0.46, - "learning_rate": 5.530408972858815e-06, - "loss": 0.1234, - "step": 16670 - }, - { - "epoch": 0.46, - "learning_rate": 5.528981991495191e-06, - "loss": 0.1283, - "step": 16675 - }, - { - "epoch": 0.46, - "learning_rate": 5.527555010131567e-06, - "loss": 0.0778, - "step": 16680 - }, - { - "epoch": 0.46, - "learning_rate": 5.526128028767945e-06, - "loss": 0.1442, - "step": 16685 - }, - { - "epoch": 0.46, - "learning_rate": 5.524701047404322e-06, - "loss": 0.1708, - "step": 16690 - }, - { - "epoch": 0.46, - "learning_rate": 5.523274066040698e-06, - "loss": 0.3219, - "step": 16695 - }, - { - "epoch": 0.46, - "learning_rate": 5.5218470846770744e-06, - "loss": 0.3452, - "step": 16700 - }, - { - "epoch": 0.46, - "learning_rate": 5.520420103313451e-06, - "loss": 0.1205, - "step": 16705 - }, - { - "epoch": 0.46, - "learning_rate": 5.518993121949828e-06, - "loss": 0.1505, - "step": 16710 - }, - { - "epoch": 0.46, - "learning_rate": 5.517566140586204e-06, - "loss": 0.1963, - "step": 16715 - }, - { - "epoch": 0.46, - "learning_rate": 5.516139159222581e-06, - "loss": 0.1394, - "step": 16720 - }, - { - "epoch": 0.46, - "learning_rate": 5.514712177858958e-06, - "loss": 0.1005, - "step": 16725 - }, - { - "epoch": 0.46, - "learning_rate": 5.513285196495334e-06, - "loss": 0.0825, - "step": 16730 - }, - { - "epoch": 0.46, - "learning_rate": 5.511858215131711e-06, - "loss": 0.1205, - "step": 16735 - }, - { - "epoch": 0.46, - "learning_rate": 5.510431233768088e-06, - "loss": 0.2447, - "step": 16740 - }, - { - "epoch": 0.46, - "learning_rate": 5.509004252404464e-06, - "loss": 0.152, - "step": 16745 - }, - { - "epoch": 0.46, - "learning_rate": 5.50757727104084e-06, - "loss": 0.3954, - "step": 16750 - }, - { - "epoch": 0.46, - "learning_rate": 5.506150289677217e-06, - "loss": 0.1702, - "step": 16755 - }, - { - "epoch": 0.47, - "learning_rate": 5.504723308313594e-06, - "loss": 0.1558, - "step": 16760 - }, - { - "epoch": 0.47, - "learning_rate": 5.50329632694997e-06, - "loss": 0.1411, - "step": 16765 - }, - { - "epoch": 0.47, - "learning_rate": 5.501869345586347e-06, - "loss": 0.3309, - "step": 16770 - }, - { - "epoch": 0.47, - "learning_rate": 5.500442364222724e-06, - "loss": 0.1496, - "step": 16775 - }, - { - "epoch": 0.47, - "learning_rate": 5.499015382859101e-06, - "loss": 0.2113, - "step": 16780 - }, - { - "epoch": 0.47, - "learning_rate": 5.497588401495477e-06, - "loss": 0.1642, - "step": 16785 - }, - { - "epoch": 0.47, - "learning_rate": 5.496161420131854e-06, - "loss": 0.0975, - "step": 16790 - }, - { - "epoch": 0.47, - "learning_rate": 5.49473443876823e-06, - "loss": 0.1134, - "step": 16795 - }, - { - "epoch": 0.47, - "learning_rate": 5.493307457404606e-06, - "loss": 0.3543, - "step": 16800 - }, - { - "epoch": 0.47, - "learning_rate": 5.4918804760409835e-06, - "loss": 0.129, - "step": 16805 - }, - { - "epoch": 0.47, - "learning_rate": 5.49045349467736e-06, - "loss": 0.1279, - "step": 16810 - }, - { - "epoch": 0.47, - "learning_rate": 5.489026513313737e-06, - "loss": 0.1819, - "step": 16815 - }, - { - "epoch": 0.47, - "learning_rate": 5.487599531950113e-06, - "loss": 0.1646, - "step": 16820 - }, - { - "epoch": 0.47, - "learning_rate": 5.48617255058649e-06, - "loss": 0.1626, - "step": 16825 - }, - { - "epoch": 0.47, - "learning_rate": 5.484745569222867e-06, - "loss": 0.0615, - "step": 16830 - }, - { - "epoch": 0.47, - "learning_rate": 5.483318587859243e-06, - "loss": 0.0538, - "step": 16835 - }, - { - "epoch": 0.47, - "learning_rate": 5.4818916064956195e-06, - "loss": 0.2278, - "step": 16840 - }, - { - "epoch": 0.47, - "learning_rate": 5.480464625131996e-06, - "loss": 0.2573, - "step": 16845 - }, - { - "epoch": 0.47, - "learning_rate": 5.479037643768372e-06, - "loss": 0.3704, - "step": 16850 - }, - { - "epoch": 0.47, - "learning_rate": 5.477610662404749e-06, - "loss": 0.2063, - "step": 16855 - }, - { - "epoch": 0.47, - "learning_rate": 5.476183681041127e-06, - "loss": 0.1791, - "step": 16860 - }, - { - "epoch": 0.47, - "learning_rate": 5.474756699677503e-06, - "loss": 0.1397, - "step": 16865 - }, - { - "epoch": 0.47, - "learning_rate": 5.473329718313879e-06, - "loss": 0.2235, - "step": 16870 - }, - { - "epoch": 0.47, - "learning_rate": 5.4719027369502565e-06, - "loss": 0.1106, - "step": 16875 - }, - { - "epoch": 0.47, - "learning_rate": 5.470475755586633e-06, - "loss": 0.0626, - "step": 16880 - }, - { - "epoch": 0.47, - "learning_rate": 5.469048774223009e-06, - "loss": 0.0783, - "step": 16885 - }, - { - "epoch": 0.47, - "learning_rate": 5.4676217928593855e-06, - "loss": 0.1718, - "step": 16890 - }, - { - "epoch": 0.47, - "learning_rate": 5.466194811495762e-06, - "loss": 0.319, - "step": 16895 - }, - { - "epoch": 0.47, - "learning_rate": 5.464767830132139e-06, - "loss": 0.4389, - "step": 16900 - }, - { - "epoch": 0.47, - "learning_rate": 5.463340848768516e-06, - "loss": 0.1144, - "step": 16905 - }, - { - "epoch": 0.47, - "learning_rate": 5.4619138674048925e-06, - "loss": 0.1494, - "step": 16910 - }, - { - "epoch": 0.47, - "learning_rate": 5.460486886041269e-06, - "loss": 0.1487, - "step": 16915 - }, - { - "epoch": 0.47, - "learning_rate": 5.459059904677645e-06, - "loss": 0.1755, - "step": 16920 - }, - { - "epoch": 0.47, - "learning_rate": 5.457632923314022e-06, - "loss": 0.1109, - "step": 16925 - }, - { - "epoch": 0.47, - "learning_rate": 5.456205941950399e-06, - "loss": 0.0623, - "step": 16930 - }, - { - "epoch": 0.47, - "learning_rate": 5.454778960586775e-06, - "loss": 0.059, - "step": 16935 - }, - { - "epoch": 0.47, - "learning_rate": 5.453351979223151e-06, - "loss": 0.1484, - "step": 16940 - }, - { - "epoch": 0.47, - "learning_rate": 5.451924997859528e-06, - "loss": 0.2676, - "step": 16945 - }, - { - "epoch": 0.47, - "learning_rate": 5.450498016495906e-06, - "loss": 0.4759, - "step": 16950 - }, - { - "epoch": 0.47, - "learning_rate": 5.449071035132282e-06, - "loss": 0.1805, - "step": 16955 - }, - { - "epoch": 0.47, - "learning_rate": 5.4476440537686584e-06, - "loss": 0.1408, - "step": 16960 - }, - { - "epoch": 0.47, - "learning_rate": 5.446217072405035e-06, - "loss": 0.1618, - "step": 16965 - }, - { - "epoch": 0.47, - "learning_rate": 5.444790091041412e-06, - "loss": 0.2413, - "step": 16970 - }, - { - "epoch": 0.47, - "learning_rate": 5.443363109677788e-06, - "loss": 0.2339, - "step": 16975 - }, - { - "epoch": 0.47, - "learning_rate": 5.441936128314165e-06, - "loss": 0.1131, - "step": 16980 - }, - { - "epoch": 0.47, - "learning_rate": 5.440509146950541e-06, - "loss": 0.1233, - "step": 16985 - }, - { - "epoch": 0.47, - "learning_rate": 5.439082165586917e-06, - "loss": 0.2213, - "step": 16990 - }, - { - "epoch": 0.47, - "learning_rate": 5.437655184223295e-06, - "loss": 0.2989, - "step": 16995 - }, - { - "epoch": 0.47, - "learning_rate": 5.436228202859672e-06, - "loss": 0.2412, - "step": 17000 - }, - { - "epoch": 0.47, - "learning_rate": 5.434801221496048e-06, - "loss": 0.1614, - "step": 17005 - }, - { - "epoch": 0.47, - "learning_rate": 5.433374240132424e-06, - "loss": 0.2254, - "step": 17010 - }, - { - "epoch": 0.47, - "learning_rate": 5.431947258768801e-06, - "loss": 0.1363, - "step": 17015 - }, - { - "epoch": 0.47, - "learning_rate": 5.430520277405178e-06, - "loss": 0.1185, - "step": 17020 - }, - { - "epoch": 0.47, - "learning_rate": 5.429093296041554e-06, - "loss": 0.1609, - "step": 17025 - }, - { - "epoch": 0.47, - "learning_rate": 5.4276663146779306e-06, - "loss": 0.0382, - "step": 17030 - }, - { - "epoch": 0.47, - "learning_rate": 5.426239333314307e-06, - "loss": 0.0805, - "step": 17035 - }, - { - "epoch": 0.47, - "learning_rate": 5.424812351950683e-06, - "loss": 0.2417, - "step": 17040 - }, - { - "epoch": 0.47, - "learning_rate": 5.423385370587061e-06, - "loss": 0.1484, - "step": 17045 - }, - { - "epoch": 0.47, - "learning_rate": 5.421958389223438e-06, - "loss": 0.3142, - "step": 17050 - }, - { - "epoch": 0.47, - "learning_rate": 5.420531407859814e-06, - "loss": 0.1211, - "step": 17055 - }, - { - "epoch": 0.47, - "learning_rate": 5.41910442649619e-06, - "loss": 0.2209, - "step": 17060 - }, - { - "epoch": 0.47, - "learning_rate": 5.4176774451325675e-06, - "loss": 0.1553, - "step": 17065 - }, - { - "epoch": 0.47, - "learning_rate": 5.416250463768944e-06, - "loss": 0.1036, - "step": 17070 - }, - { - "epoch": 0.47, - "learning_rate": 5.41482348240532e-06, - "loss": 0.1512, - "step": 17075 - }, - { - "epoch": 0.47, - "learning_rate": 5.4133965010416965e-06, - "loss": 0.1245, - "step": 17080 - }, - { - "epoch": 0.47, - "learning_rate": 5.411969519678073e-06, - "loss": 0.1974, - "step": 17085 - }, - { - "epoch": 0.47, - "learning_rate": 5.410542538314451e-06, - "loss": 0.0876, - "step": 17090 - }, - { - "epoch": 0.47, - "learning_rate": 5.409115556950827e-06, - "loss": 0.2816, - "step": 17095 - }, - { - "epoch": 0.47, - "learning_rate": 5.4076885755872036e-06, - "loss": 0.5595, - "step": 17100 - }, - { - "epoch": 0.47, - "learning_rate": 5.40626159422358e-06, - "loss": 0.1111, - "step": 17105 - }, - { - "epoch": 0.47, - "learning_rate": 5.404834612859956e-06, - "loss": 0.1536, - "step": 17110 - }, - { - "epoch": 0.47, - "learning_rate": 5.403407631496333e-06, - "loss": 0.1523, - "step": 17115 - }, - { - "epoch": 0.48, - "learning_rate": 5.40198065013271e-06, - "loss": 0.1873, - "step": 17120 - }, - { - "epoch": 0.48, - "learning_rate": 5.400553668769086e-06, - "loss": 0.116, - "step": 17125 - }, - { - "epoch": 0.48, - "learning_rate": 5.3991266874054624e-06, - "loss": 0.2162, - "step": 17130 - }, - { - "epoch": 0.48, - "learning_rate": 5.397699706041839e-06, - "loss": 0.1174, - "step": 17135 - }, - { - "epoch": 0.48, - "learning_rate": 5.396272724678217e-06, - "loss": 0.1295, - "step": 17140 - }, - { - "epoch": 0.48, - "learning_rate": 5.394845743314593e-06, - "loss": 0.4878, - "step": 17145 - }, - { - "epoch": 0.48, - "learning_rate": 5.3934187619509695e-06, - "loss": 0.4039, - "step": 17150 - }, - { - "epoch": 0.48, - "learning_rate": 5.391991780587346e-06, - "loss": 0.1392, - "step": 17155 - }, - { - "epoch": 0.48, - "learning_rate": 5.390564799223723e-06, - "loss": 0.1637, - "step": 17160 - }, - { - "epoch": 0.48, - "learning_rate": 5.389137817860099e-06, - "loss": 0.2175, - "step": 17165 - }, - { - "epoch": 0.48, - "learning_rate": 5.387710836496476e-06, - "loss": 0.184, - "step": 17170 - }, - { - "epoch": 0.48, - "learning_rate": 5.386283855132852e-06, - "loss": 0.1522, - "step": 17175 - }, - { - "epoch": 0.48, - "learning_rate": 5.384856873769228e-06, - "loss": 0.0885, - "step": 17180 - }, - { - "epoch": 0.48, - "learning_rate": 5.383429892405606e-06, - "loss": 0.1185, - "step": 17185 - }, - { - "epoch": 0.48, - "learning_rate": 5.382002911041983e-06, - "loss": 0.1916, - "step": 17190 - }, - { - "epoch": 0.48, - "learning_rate": 5.380575929678359e-06, - "loss": 0.2418, - "step": 17195 - }, - { - "epoch": 0.48, - "learning_rate": 5.379148948314735e-06, - "loss": 0.4827, - "step": 17200 - }, - { - "epoch": 0.48, - "learning_rate": 5.377721966951112e-06, - "loss": 0.1402, - "step": 17205 - }, - { - "epoch": 0.48, - "learning_rate": 5.376294985587489e-06, - "loss": 0.2107, - "step": 17210 - }, - { - "epoch": 0.48, - "learning_rate": 5.374868004223865e-06, - "loss": 0.1448, - "step": 17215 - }, - { - "epoch": 0.48, - "learning_rate": 5.373441022860242e-06, - "loss": 0.2342, - "step": 17220 - }, - { - "epoch": 0.48, - "learning_rate": 5.372014041496618e-06, - "loss": 0.0894, - "step": 17225 - }, - { - "epoch": 0.48, - "learning_rate": 5.370587060132994e-06, - "loss": 0.187, - "step": 17230 - }, - { - "epoch": 0.48, - "learning_rate": 5.369160078769372e-06, - "loss": 0.1241, - "step": 17235 - }, - { - "epoch": 0.48, - "learning_rate": 5.367733097405749e-06, - "loss": 0.1505, - "step": 17240 - }, - { - "epoch": 0.48, - "learning_rate": 5.366306116042125e-06, - "loss": 0.3462, - "step": 17245 - }, - { - "epoch": 0.48, - "learning_rate": 5.364879134678501e-06, - "loss": 0.346, - "step": 17250 - }, - { - "epoch": 0.48, - "learning_rate": 5.3634521533148785e-06, - "loss": 0.2012, - "step": 17255 - }, - { - "epoch": 0.48, - "learning_rate": 5.362025171951255e-06, - "loss": 0.1905, - "step": 17260 - }, - { - "epoch": 0.48, - "learning_rate": 5.360598190587631e-06, - "loss": 0.1316, - "step": 17265 - }, - { - "epoch": 0.48, - "learning_rate": 5.3591712092240075e-06, - "loss": 0.1953, - "step": 17270 - }, - { - "epoch": 0.48, - "learning_rate": 5.357744227860384e-06, - "loss": 0.1508, - "step": 17275 - }, - { - "epoch": 0.48, - "learning_rate": 5.356317246496762e-06, - "loss": 0.0538, - "step": 17280 - }, - { - "epoch": 0.48, - "learning_rate": 5.354890265133138e-06, - "loss": 0.1284, - "step": 17285 - }, - { - "epoch": 0.48, - "learning_rate": 5.353463283769515e-06, - "loss": 0.2855, - "step": 17290 - }, - { - "epoch": 0.48, - "learning_rate": 5.352036302405891e-06, - "loss": 0.215, - "step": 17295 - }, - { - "epoch": 0.48, - "learning_rate": 5.350609321042267e-06, - "loss": 0.2805, - "step": 17300 - }, - { - "epoch": 0.48, - "learning_rate": 5.3491823396786444e-06, - "loss": 0.2176, - "step": 17305 - }, - { - "epoch": 0.48, - "learning_rate": 5.347755358315021e-06, - "loss": 0.1513, - "step": 17310 - }, - { - "epoch": 0.48, - "learning_rate": 5.346328376951397e-06, - "loss": 0.1399, - "step": 17315 - }, - { - "epoch": 0.48, - "learning_rate": 5.3449013955877735e-06, - "loss": 0.1568, - "step": 17320 - }, - { - "epoch": 0.48, - "learning_rate": 5.34347441422415e-06, - "loss": 0.1231, - "step": 17325 - }, - { - "epoch": 0.48, - "learning_rate": 5.342047432860528e-06, - "loss": 0.0907, - "step": 17330 - }, - { - "epoch": 0.48, - "learning_rate": 5.340620451496904e-06, - "loss": 0.0697, - "step": 17335 - }, - { - "epoch": 0.48, - "learning_rate": 5.3391934701332805e-06, - "loss": 0.1351, - "step": 17340 - }, - { - "epoch": 0.48, - "learning_rate": 5.337766488769657e-06, - "loss": 0.3501, - "step": 17345 - }, - { - "epoch": 0.48, - "learning_rate": 5.336339507406034e-06, - "loss": 0.3423, - "step": 17350 - }, - { - "epoch": 0.48, - "learning_rate": 5.33491252604241e-06, - "loss": 0.1806, - "step": 17355 - }, - { - "epoch": 0.48, - "learning_rate": 5.333485544678787e-06, - "loss": 0.2168, - "step": 17360 - }, - { - "epoch": 0.48, - "learning_rate": 5.332058563315163e-06, - "loss": 0.2062, - "step": 17365 - }, - { - "epoch": 0.48, - "learning_rate": 5.330631581951539e-06, - "loss": 0.1623, - "step": 17370 - }, - { - "epoch": 0.48, - "learning_rate": 5.329204600587917e-06, - "loss": 0.1093, - "step": 17375 - }, - { - "epoch": 0.48, - "learning_rate": 5.327777619224294e-06, - "loss": 0.0914, - "step": 17380 - }, - { - "epoch": 0.48, - "learning_rate": 5.32635063786067e-06, - "loss": 0.0801, - "step": 17385 - }, - { - "epoch": 0.48, - "learning_rate": 5.3249236564970464e-06, - "loss": 0.18, - "step": 17390 - }, - { - "epoch": 0.48, - "learning_rate": 5.323496675133423e-06, - "loss": 0.3545, - "step": 17395 - }, - { - "epoch": 0.48, - "learning_rate": 5.3220696937698e-06, - "loss": 0.2112, - "step": 17400 - }, - { - "epoch": 0.48, - "learning_rate": 5.320642712406176e-06, - "loss": 0.1072, - "step": 17405 - }, - { - "epoch": 0.48, - "learning_rate": 5.319215731042553e-06, - "loss": 0.1603, - "step": 17410 - }, - { - "epoch": 0.48, - "learning_rate": 5.317788749678929e-06, - "loss": 0.1775, - "step": 17415 - }, - { - "epoch": 0.48, - "learning_rate": 5.316361768315305e-06, - "loss": 0.1867, - "step": 17420 - }, - { - "epoch": 0.48, - "learning_rate": 5.314934786951683e-06, - "loss": 0.1381, - "step": 17425 - }, - { - "epoch": 0.48, - "learning_rate": 5.31350780558806e-06, - "loss": 0.1061, - "step": 17430 - }, - { - "epoch": 0.48, - "learning_rate": 5.312080824224436e-06, - "loss": 0.1987, - "step": 17435 - }, - { - "epoch": 0.48, - "learning_rate": 5.310653842860812e-06, - "loss": 0.2463, - "step": 17440 - }, - { - "epoch": 0.48, - "learning_rate": 5.3092268614971896e-06, - "loss": 0.2434, - "step": 17445 - }, - { - "epoch": 0.48, - "learning_rate": 5.307799880133566e-06, - "loss": 0.406, - "step": 17450 - }, - { - "epoch": 0.48, - "learning_rate": 5.306372898769942e-06, - "loss": 0.1069, - "step": 17455 - }, - { - "epoch": 0.48, - "learning_rate": 5.3049459174063186e-06, - "loss": 0.1613, - "step": 17460 - }, - { - "epoch": 0.48, - "learning_rate": 5.303518936042695e-06, - "loss": 0.2305, - "step": 17465 - }, - { - "epoch": 0.48, - "learning_rate": 5.302091954679073e-06, - "loss": 0.2166, - "step": 17470 - }, - { - "epoch": 0.48, - "learning_rate": 5.300664973315449e-06, - "loss": 0.1284, - "step": 17475 - }, - { - "epoch": 0.49, - "learning_rate": 5.299237991951826e-06, - "loss": 0.0405, - "step": 17480 - }, - { - "epoch": 0.49, - "learning_rate": 5.297811010588202e-06, - "loss": 0.1256, - "step": 17485 - }, - { - "epoch": 0.49, - "learning_rate": 5.296384029224578e-06, - "loss": 0.1613, - "step": 17490 - }, - { - "epoch": 0.49, - "learning_rate": 5.2949570478609555e-06, - "loss": 0.1741, - "step": 17495 - }, - { - "epoch": 0.49, - "learning_rate": 5.293530066497332e-06, - "loss": 0.4977, - "step": 17500 - }, - { - "epoch": 0.49, - "learning_rate": 5.292103085133708e-06, - "loss": 0.1077, - "step": 17505 - }, - { - "epoch": 0.49, - "learning_rate": 5.2906761037700845e-06, - "loss": 0.1564, - "step": 17510 - }, - { - "epoch": 0.49, - "learning_rate": 5.289249122406462e-06, - "loss": 0.1938, - "step": 17515 - }, - { - "epoch": 0.49, - "learning_rate": 5.287822141042839e-06, - "loss": 0.1949, - "step": 17520 - }, - { - "epoch": 0.49, - "learning_rate": 5.286395159679215e-06, - "loss": 0.2227, - "step": 17525 - }, - { - "epoch": 0.49, - "learning_rate": 5.2849681783155915e-06, - "loss": 0.0831, - "step": 17530 - }, - { - "epoch": 0.49, - "learning_rate": 5.283541196951968e-06, - "loss": 0.1108, - "step": 17535 - }, - { - "epoch": 0.49, - "learning_rate": 5.282114215588345e-06, - "loss": 0.0977, - "step": 17540 - }, - { - "epoch": 0.49, - "learning_rate": 5.280687234224721e-06, - "loss": 0.1692, - "step": 17545 - }, - { - "epoch": 0.49, - "learning_rate": 5.279260252861098e-06, - "loss": 0.3128, - "step": 17550 - }, - { - "epoch": 0.49, - "learning_rate": 5.277833271497474e-06, - "loss": 0.1295, - "step": 17555 - }, - { - "epoch": 0.49, - "learning_rate": 5.276406290133851e-06, - "loss": 0.1572, - "step": 17560 - }, - { - "epoch": 0.49, - "learning_rate": 5.2749793087702285e-06, - "loss": 0.1622, - "step": 17565 - }, - { - "epoch": 0.49, - "learning_rate": 5.273552327406605e-06, - "loss": 0.1761, - "step": 17570 - }, - { - "epoch": 0.49, - "learning_rate": 5.272125346042981e-06, - "loss": 0.0468, - "step": 17575 - }, - { - "epoch": 0.49, - "learning_rate": 5.2706983646793575e-06, - "loss": 0.0853, - "step": 17580 - }, - { - "epoch": 0.49, - "learning_rate": 5.269271383315734e-06, - "loss": 0.196, - "step": 17585 - }, - { - "epoch": 0.49, - "learning_rate": 5.267844401952111e-06, - "loss": 0.2446, - "step": 17590 - }, - { - "epoch": 0.49, - "learning_rate": 5.266417420588487e-06, - "loss": 0.2089, - "step": 17595 - }, - { - "epoch": 0.49, - "learning_rate": 5.264990439224864e-06, - "loss": 0.8299, - "step": 17600 - }, - { - "epoch": 0.49, - "learning_rate": 5.263563457861241e-06, - "loss": 0.1186, - "step": 17605 - }, - { - "epoch": 0.49, - "learning_rate": 5.262136476497617e-06, - "loss": 0.2162, - "step": 17610 - }, - { - "epoch": 0.49, - "learning_rate": 5.260709495133994e-06, - "loss": 0.1515, - "step": 17615 - }, - { - "epoch": 0.49, - "learning_rate": 5.259282513770371e-06, - "loss": 0.1404, - "step": 17620 - }, - { - "epoch": 0.49, - "learning_rate": 5.257855532406747e-06, - "loss": 0.0805, - "step": 17625 - }, - { - "epoch": 0.49, - "learning_rate": 5.256428551043123e-06, - "loss": 0.1446, - "step": 17630 - }, - { - "epoch": 0.49, - "learning_rate": 5.255001569679501e-06, - "loss": 0.1575, - "step": 17635 - }, - { - "epoch": 0.49, - "learning_rate": 5.253574588315877e-06, - "loss": 0.1792, - "step": 17640 - }, - { - "epoch": 0.49, - "learning_rate": 5.252147606952253e-06, - "loss": 0.2785, - "step": 17645 - }, - { - "epoch": 0.49, - "learning_rate": 5.2507206255886304e-06, - "loss": 0.3261, - "step": 17650 - }, - { - "epoch": 0.49, - "learning_rate": 5.249293644225007e-06, - "loss": 0.1054, - "step": 17655 - }, - { - "epoch": 0.49, - "learning_rate": 5.247866662861384e-06, - "loss": 0.1029, - "step": 17660 - }, - { - "epoch": 0.49, - "learning_rate": 5.24643968149776e-06, - "loss": 0.1423, - "step": 17665 - }, - { - "epoch": 0.49, - "learning_rate": 5.245012700134137e-06, - "loss": 0.1382, - "step": 17670 - }, - { - "epoch": 0.49, - "learning_rate": 5.243585718770513e-06, - "loss": 0.1093, - "step": 17675 - }, - { - "epoch": 0.49, - "learning_rate": 5.242158737406889e-06, - "loss": 0.2346, - "step": 17680 - }, - { - "epoch": 0.49, - "learning_rate": 5.2407317560432665e-06, - "loss": 0.1895, - "step": 17685 - }, - { - "epoch": 0.49, - "learning_rate": 5.239304774679643e-06, - "loss": 0.268, - "step": 17690 - }, - { - "epoch": 0.49, - "learning_rate": 5.23787779331602e-06, - "loss": 0.2064, - "step": 17695 - }, - { - "epoch": 0.49, - "learning_rate": 5.236450811952396e-06, - "loss": 0.4262, - "step": 17700 - }, - { - "epoch": 0.49, - "learning_rate": 5.235023830588773e-06, - "loss": 0.1548, - "step": 17705 - }, - { - "epoch": 0.49, - "learning_rate": 5.23359684922515e-06, - "loss": 0.3673, - "step": 17710 - }, - { - "epoch": 0.49, - "learning_rate": 5.232169867861526e-06, - "loss": 0.1372, - "step": 17715 - }, - { - "epoch": 0.49, - "learning_rate": 5.2307428864979026e-06, - "loss": 0.2551, - "step": 17720 - }, - { - "epoch": 0.49, - "learning_rate": 5.229315905134279e-06, - "loss": 0.2321, - "step": 17725 - }, - { - "epoch": 0.49, - "learning_rate": 5.227888923770656e-06, - "loss": 0.0697, - "step": 17730 - }, - { - "epoch": 0.49, - "learning_rate": 5.226461942407033e-06, - "loss": 0.0874, - "step": 17735 - }, - { - "epoch": 0.49, - "learning_rate": 5.22503496104341e-06, - "loss": 0.1746, - "step": 17740 - }, - { - "epoch": 0.49, - "learning_rate": 5.223607979679786e-06, - "loss": 0.2093, - "step": 17745 - }, - { - "epoch": 0.49, - "learning_rate": 5.222180998316162e-06, - "loss": 0.4258, - "step": 17750 - }, - { - "epoch": 0.49, - "learning_rate": 5.2207540169525395e-06, - "loss": 0.157, - "step": 17755 - }, - { - "epoch": 0.49, - "learning_rate": 5.219327035588916e-06, - "loss": 0.1516, - "step": 17760 - }, - { - "epoch": 0.49, - "learning_rate": 5.217900054225292e-06, - "loss": 0.1675, - "step": 17765 - }, - { - "epoch": 0.49, - "learning_rate": 5.2164730728616685e-06, - "loss": 0.2068, - "step": 17770 - }, - { - "epoch": 0.49, - "learning_rate": 5.215046091498045e-06, - "loss": 0.1738, - "step": 17775 - }, - { - "epoch": 0.49, - "learning_rate": 5.213619110134423e-06, - "loss": 0.0531, - "step": 17780 - }, - { - "epoch": 0.49, - "learning_rate": 5.212192128770799e-06, - "loss": 0.1019, - "step": 17785 - }, - { - "epoch": 0.49, - "learning_rate": 5.2107651474071756e-06, - "loss": 0.2422, - "step": 17790 - }, - { - "epoch": 0.49, - "learning_rate": 5.209338166043552e-06, - "loss": 0.2592, - "step": 17795 - }, - { - "epoch": 0.49, - "learning_rate": 5.207911184679928e-06, - "loss": 0.4477, - "step": 17800 - }, - { - "epoch": 0.49, - "learning_rate": 5.206484203316305e-06, - "loss": 0.1812, - "step": 17805 - }, - { - "epoch": 0.49, - "learning_rate": 5.205057221952682e-06, - "loss": 0.1483, - "step": 17810 - }, - { - "epoch": 0.49, - "learning_rate": 5.203630240589058e-06, - "loss": 0.1255, - "step": 17815 - }, - { - "epoch": 0.49, - "learning_rate": 5.2022032592254344e-06, - "loss": 0.1468, - "step": 17820 - }, - { - "epoch": 0.49, - "learning_rate": 5.2007762778618125e-06, - "loss": 0.0766, - "step": 17825 - }, - { - "epoch": 0.49, - "learning_rate": 5.199349296498189e-06, - "loss": 0.0317, - "step": 17830 - }, - { - "epoch": 0.49, - "learning_rate": 5.197922315134565e-06, - "loss": 0.1377, - "step": 17835 - }, - { - "epoch": 0.5, - "learning_rate": 5.1964953337709415e-06, - "loss": 0.1483, - "step": 17840 - }, - { - "epoch": 0.5, - "learning_rate": 5.195068352407318e-06, - "loss": 0.2709, - "step": 17845 - }, - { - "epoch": 0.5, - "learning_rate": 5.193641371043695e-06, - "loss": 0.3546, - "step": 17850 - }, - { - "epoch": 0.5, - "learning_rate": 5.192214389680071e-06, - "loss": 0.1371, - "step": 17855 - }, - { - "epoch": 0.5, - "learning_rate": 5.190787408316448e-06, - "loss": 0.1574, - "step": 17860 - }, - { - "epoch": 0.5, - "learning_rate": 5.189360426952824e-06, - "loss": 0.1483, - "step": 17865 - }, - { - "epoch": 0.5, - "learning_rate": 5.1879334455892e-06, - "loss": 0.1485, - "step": 17870 - }, - { - "epoch": 0.5, - "learning_rate": 5.186506464225578e-06, - "loss": 0.1632, - "step": 17875 - }, - { - "epoch": 0.5, - "learning_rate": 5.185079482861955e-06, - "loss": 0.1516, - "step": 17880 - }, - { - "epoch": 0.5, - "learning_rate": 5.183652501498331e-06, - "loss": 0.1936, - "step": 17885 - }, - { - "epoch": 0.5, - "learning_rate": 5.182225520134707e-06, - "loss": 0.3391, - "step": 17890 - }, - { - "epoch": 0.5, - "learning_rate": 5.180798538771084e-06, - "loss": 0.2453, - "step": 17895 - }, - { - "epoch": 0.5, - "learning_rate": 5.179371557407461e-06, - "loss": 0.4235, - "step": 17900 - }, - { - "epoch": 0.5, - "learning_rate": 5.177944576043837e-06, - "loss": 0.1901, - "step": 17905 - }, - { - "epoch": 0.5, - "learning_rate": 5.176517594680214e-06, - "loss": 0.1267, - "step": 17910 - }, - { - "epoch": 0.5, - "learning_rate": 5.17509061331659e-06, - "loss": 0.1892, - "step": 17915 - }, - { - "epoch": 0.5, - "learning_rate": 5.173663631952968e-06, - "loss": 0.2079, - "step": 17920 - }, - { - "epoch": 0.5, - "learning_rate": 5.172236650589344e-06, - "loss": 0.1089, - "step": 17925 - }, - { - "epoch": 0.5, - "learning_rate": 5.170809669225721e-06, - "loss": 0.0372, - "step": 17930 - }, - { - "epoch": 0.5, - "learning_rate": 5.169382687862097e-06, - "loss": 0.0917, - "step": 17935 - }, - { - "epoch": 0.5, - "learning_rate": 5.167955706498473e-06, - "loss": 0.1767, - "step": 17940 - }, - { - "epoch": 0.5, - "learning_rate": 5.1665287251348505e-06, - "loss": 0.2681, - "step": 17945 - }, - { - "epoch": 0.5, - "learning_rate": 5.165101743771227e-06, - "loss": 0.6623, - "step": 17950 - }, - { - "epoch": 0.5, - "learning_rate": 5.163674762407603e-06, - "loss": 0.1652, - "step": 17955 - }, - { - "epoch": 0.5, - "learning_rate": 5.1622477810439795e-06, - "loss": 0.1949, - "step": 17960 - }, - { - "epoch": 0.5, - "learning_rate": 5.160820799680356e-06, - "loss": 0.1519, - "step": 17965 - }, - { - "epoch": 0.5, - "learning_rate": 5.159393818316734e-06, - "loss": 0.1855, - "step": 17970 - }, - { - "epoch": 0.5, - "learning_rate": 5.15796683695311e-06, - "loss": 0.1434, - "step": 17975 - }, - { - "epoch": 0.5, - "learning_rate": 5.156539855589487e-06, - "loss": 0.1216, - "step": 17980 - }, - { - "epoch": 0.5, - "learning_rate": 5.155112874225863e-06, - "loss": 0.2063, - "step": 17985 - }, - { - "epoch": 0.5, - "learning_rate": 5.15368589286224e-06, - "loss": 0.1467, - "step": 17990 - }, - { - "epoch": 0.5, - "learning_rate": 5.1522589114986164e-06, - "loss": 0.1407, - "step": 17995 - }, - { - "epoch": 0.5, - "learning_rate": 5.150831930134993e-06, - "loss": 0.5262, - "step": 18000 - }, - { - "epoch": 0.5, - "eval_loss": 0.06189865618944168, - "eval_runtime": 1891.1772, - "eval_samples_per_second": 8.47, - "eval_steps_per_second": 2.118, - "eval_wer": 0.17731698521456907, - "step": 18000 - }, - { - "epoch": 0.5, - "learning_rate": 5.149404948771369e-06, - "loss": 0.1568, - "step": 18005 - }, - { - "epoch": 0.5, - "learning_rate": 5.1479779674077455e-06, - "loss": 0.1248, - "step": 18010 - }, - { - "epoch": 0.5, - "learning_rate": 5.1465509860441235e-06, - "loss": 0.207, - "step": 18015 - }, - { - "epoch": 0.5, - "learning_rate": 5.1451240046805e-06, - "loss": 0.1563, - "step": 18020 - }, - { - "epoch": 0.5, - "learning_rate": 5.143697023316876e-06, - "loss": 0.1114, - "step": 18025 - }, - { - "epoch": 0.5, - "learning_rate": 5.1422700419532525e-06, - "loss": 0.0905, - "step": 18030 - }, - { - "epoch": 0.5, - "learning_rate": 5.140843060589629e-06, - "loss": 0.1048, - "step": 18035 - }, - { - "epoch": 0.5, - "learning_rate": 5.139416079226006e-06, - "loss": 0.1992, - "step": 18040 - }, - { - "epoch": 0.5, - "learning_rate": 5.137989097862382e-06, - "loss": 0.1553, - "step": 18045 - }, - { - "epoch": 0.5, - "learning_rate": 5.136562116498759e-06, - "loss": 0.4436, - "step": 18050 - }, - { - "epoch": 0.5, - "learning_rate": 5.135135135135135e-06, - "loss": 0.1276, - "step": 18055 - }, - { - "epoch": 0.5, - "learning_rate": 5.133708153771511e-06, - "loss": 0.1311, - "step": 18060 - }, - { - "epoch": 0.5, - "learning_rate": 5.132281172407889e-06, - "loss": 0.1655, - "step": 18065 - }, - { - "epoch": 0.5, - "learning_rate": 5.130854191044266e-06, - "loss": 0.1517, - "step": 18070 - }, - { - "epoch": 0.5, - "learning_rate": 5.129427209680642e-06, - "loss": 0.0479, - "step": 18075 - }, - { - "epoch": 0.5, - "learning_rate": 5.1280002283170184e-06, - "loss": 0.0382, - "step": 18080 - }, - { - "epoch": 0.5, - "learning_rate": 5.126573246953396e-06, - "loss": 0.1758, - "step": 18085 - }, - { - "epoch": 0.5, - "learning_rate": 5.125146265589772e-06, - "loss": 0.2523, - "step": 18090 - }, - { - "epoch": 0.5, - "learning_rate": 5.123719284226148e-06, - "loss": 0.223, - "step": 18095 - }, - { - "epoch": 0.5, - "learning_rate": 5.122292302862525e-06, - "loss": 0.3482, - "step": 18100 - }, - { - "epoch": 0.5, - "learning_rate": 5.120865321498901e-06, - "loss": 0.0802, - "step": 18105 - }, - { - "epoch": 0.5, - "learning_rate": 5.119438340135279e-06, - "loss": 0.1132, - "step": 18110 - }, - { - "epoch": 0.5, - "learning_rate": 5.118011358771655e-06, - "loss": 0.1595, - "step": 18115 - }, - { - "epoch": 0.5, - "learning_rate": 5.116584377408032e-06, - "loss": 0.1813, - "step": 18120 - }, - { - "epoch": 0.5, - "learning_rate": 5.115157396044408e-06, - "loss": 0.0865, - "step": 18125 - }, - { - "epoch": 0.5, - "learning_rate": 5.113730414680784e-06, - "loss": 0.0802, - "step": 18130 - }, - { - "epoch": 0.5, - "learning_rate": 5.1123034333171616e-06, - "loss": 0.0854, - "step": 18135 - }, - { - "epoch": 0.5, - "learning_rate": 5.110876451953538e-06, - "loss": 0.1714, - "step": 18140 - }, - { - "epoch": 0.5, - "learning_rate": 5.109449470589914e-06, - "loss": 0.2229, - "step": 18145 - }, - { - "epoch": 0.5, - "learning_rate": 5.1080224892262906e-06, - "loss": 0.1786, - "step": 18150 - }, - { - "epoch": 0.5, - "learning_rate": 5.106595507862667e-06, - "loss": 0.153, - "step": 18155 - }, - { - "epoch": 0.5, - "learning_rate": 5.105168526499045e-06, - "loss": 0.175, - "step": 18160 - }, - { - "epoch": 0.5, - "learning_rate": 5.103741545135421e-06, - "loss": 0.201, - "step": 18165 - }, - { - "epoch": 0.5, - "learning_rate": 5.102314563771798e-06, - "loss": 0.1102, - "step": 18170 - }, - { - "epoch": 0.5, - "learning_rate": 5.100887582408174e-06, - "loss": 0.195, - "step": 18175 - }, - { - "epoch": 0.5, - "learning_rate": 5.099460601044551e-06, - "loss": 0.0287, - "step": 18180 - }, - { - "epoch": 0.5, - "learning_rate": 5.0980336196809275e-06, - "loss": 0.0427, - "step": 18185 - }, - { - "epoch": 0.5, - "learning_rate": 5.096606638317304e-06, - "loss": 0.2079, - "step": 18190 - }, - { - "epoch": 0.5, - "learning_rate": 5.09517965695368e-06, - "loss": 0.204, - "step": 18195 - }, - { - "epoch": 0.51, - "learning_rate": 5.0937526755900565e-06, - "loss": 0.3059, - "step": 18200 - }, - { - "epoch": 0.51, - "learning_rate": 5.0923256942264345e-06, - "loss": 0.1668, - "step": 18205 - }, - { - "epoch": 0.51, - "learning_rate": 5.090898712862811e-06, - "loss": 0.2312, - "step": 18210 - }, - { - "epoch": 0.51, - "learning_rate": 5.089471731499187e-06, - "loss": 0.1517, - "step": 18215 - }, - { - "epoch": 0.51, - "learning_rate": 5.0880447501355635e-06, - "loss": 0.1628, - "step": 18220 - }, - { - "epoch": 0.51, - "learning_rate": 5.08661776877194e-06, - "loss": 0.0852, - "step": 18225 - }, - { - "epoch": 0.51, - "learning_rate": 5.085190787408317e-06, - "loss": 0.0657, - "step": 18230 - }, - { - "epoch": 0.51, - "learning_rate": 5.083763806044693e-06, - "loss": 0.12, - "step": 18235 - }, - { - "epoch": 0.51, - "learning_rate": 5.08233682468107e-06, - "loss": 0.1348, - "step": 18240 - }, - { - "epoch": 0.51, - "learning_rate": 5.080909843317446e-06, - "loss": 0.219, - "step": 18245 - }, - { - "epoch": 0.51, - "learning_rate": 5.079482861953822e-06, - "loss": 0.5334, - "step": 18250 - }, - { - "epoch": 0.51, - "learning_rate": 5.0780558805902005e-06, - "loss": 0.1511, - "step": 18255 - }, - { - "epoch": 0.51, - "learning_rate": 5.076628899226577e-06, - "loss": 0.1443, - "step": 18260 - }, - { - "epoch": 0.51, - "learning_rate": 5.075201917862953e-06, - "loss": 0.1843, - "step": 18265 - }, - { - "epoch": 0.51, - "learning_rate": 5.0737749364993295e-06, - "loss": 0.1302, - "step": 18270 - }, - { - "epoch": 0.51, - "learning_rate": 5.072347955135707e-06, - "loss": 0.0972, - "step": 18275 - }, - { - "epoch": 0.51, - "learning_rate": 5.070920973772083e-06, - "loss": 0.2034, - "step": 18280 - }, - { - "epoch": 0.51, - "learning_rate": 5.069493992408459e-06, - "loss": 0.125, - "step": 18285 - }, - { - "epoch": 0.51, - "learning_rate": 5.068067011044836e-06, - "loss": 0.1517, - "step": 18290 - }, - { - "epoch": 0.51, - "learning_rate": 5.066640029681212e-06, - "loss": 0.2896, - "step": 18295 - }, - { - "epoch": 0.51, - "learning_rate": 5.06521304831759e-06, - "loss": 0.297, - "step": 18300 - }, - { - "epoch": 0.51, - "learning_rate": 5.063786066953966e-06, - "loss": 0.1865, - "step": 18305 - }, - { - "epoch": 0.51, - "learning_rate": 5.062359085590343e-06, - "loss": 0.1178, - "step": 18310 - }, - { - "epoch": 0.51, - "learning_rate": 5.060932104226719e-06, - "loss": 0.181, - "step": 18315 - }, - { - "epoch": 0.51, - "learning_rate": 5.059505122863095e-06, - "loss": 0.1583, - "step": 18320 - }, - { - "epoch": 0.51, - "learning_rate": 5.058078141499473e-06, - "loss": 0.2078, - "step": 18325 - }, - { - "epoch": 0.51, - "learning_rate": 5.056651160135849e-06, - "loss": 0.0346, - "step": 18330 - }, - { - "epoch": 0.51, - "learning_rate": 5.055224178772225e-06, - "loss": 0.142, - "step": 18335 - }, - { - "epoch": 0.51, - "learning_rate": 5.053797197408602e-06, - "loss": 0.0779, - "step": 18340 - }, - { - "epoch": 0.51, - "learning_rate": 5.052370216044978e-06, - "loss": 0.2198, - "step": 18345 - }, - { - "epoch": 0.51, - "learning_rate": 5.050943234681356e-06, - "loss": 0.4314, - "step": 18350 - }, - { - "epoch": 0.51, - "learning_rate": 5.049516253317732e-06, - "loss": 0.1005, - "step": 18355 - }, - { - "epoch": 0.51, - "learning_rate": 5.048089271954109e-06, - "loss": 0.0979, - "step": 18360 - }, - { - "epoch": 0.51, - "learning_rate": 5.046662290590485e-06, - "loss": 0.2008, - "step": 18365 - }, - { - "epoch": 0.51, - "learning_rate": 5.045235309226862e-06, - "loss": 0.1816, - "step": 18370 - }, - { - "epoch": 0.51, - "learning_rate": 5.0438083278632385e-06, - "loss": 0.0629, - "step": 18375 - }, - { - "epoch": 0.51, - "learning_rate": 5.042381346499615e-06, - "loss": 0.1564, - "step": 18380 - }, - { - "epoch": 0.51, - "learning_rate": 5.040954365135991e-06, - "loss": 0.1654, - "step": 18385 - }, - { - "epoch": 0.51, - "learning_rate": 5.0395273837723675e-06, - "loss": 0.2169, - "step": 18390 - }, - { - "epoch": 0.51, - "learning_rate": 5.0381004024087456e-06, - "loss": 0.2023, - "step": 18395 - }, - { - "epoch": 0.51, - "learning_rate": 5.036673421045122e-06, - "loss": 0.4018, - "step": 18400 - }, - { - "epoch": 0.51, - "learning_rate": 5.035246439681498e-06, - "loss": 0.1353, - "step": 18405 - }, - { - "epoch": 0.51, - "learning_rate": 5.0338194583178746e-06, - "loss": 0.1655, - "step": 18410 - }, - { - "epoch": 0.51, - "learning_rate": 5.032392476954251e-06, - "loss": 0.297, - "step": 18415 - }, - { - "epoch": 0.51, - "learning_rate": 5.030965495590628e-06, - "loss": 0.2271, - "step": 18420 - }, - { - "epoch": 0.51, - "learning_rate": 5.0295385142270044e-06, - "loss": 0.1084, - "step": 18425 - }, - { - "epoch": 0.51, - "learning_rate": 5.028111532863381e-06, - "loss": 0.1346, - "step": 18430 - }, - { - "epoch": 0.51, - "learning_rate": 5.026684551499757e-06, - "loss": 0.1331, - "step": 18435 - }, - { - "epoch": 0.51, - "learning_rate": 5.025257570136134e-06, - "loss": 0.162, - "step": 18440 - }, - { - "epoch": 0.51, - "learning_rate": 5.0238305887725115e-06, - "loss": 0.1401, - "step": 18445 - }, - { - "epoch": 0.51, - "learning_rate": 5.022403607408888e-06, - "loss": 0.4347, - "step": 18450 - }, - { - "epoch": 0.51, - "learning_rate": 5.020976626045264e-06, - "loss": 0.107, - "step": 18455 - }, - { - "epoch": 0.51, - "learning_rate": 5.0195496446816405e-06, - "loss": 0.1016, - "step": 18460 - }, - { - "epoch": 0.51, - "learning_rate": 5.018122663318018e-06, - "loss": 0.1409, - "step": 18465 - }, - { - "epoch": 0.51, - "learning_rate": 5.016695681954394e-06, - "loss": 0.1334, - "step": 18470 - }, - { - "epoch": 0.51, - "learning_rate": 5.01526870059077e-06, - "loss": 0.1433, - "step": 18475 - }, - { - "epoch": 0.51, - "learning_rate": 5.0138417192271476e-06, - "loss": 0.0913, - "step": 18480 - }, - { - "epoch": 0.51, - "learning_rate": 5.012414737863524e-06, - "loss": 0.0915, - "step": 18485 - }, - { - "epoch": 0.51, - "learning_rate": 5.010987756499901e-06, - "loss": 0.2491, - "step": 18490 - }, - { - "epoch": 0.51, - "learning_rate": 5.009560775136277e-06, - "loss": 0.1918, - "step": 18495 - }, - { - "epoch": 0.51, - "learning_rate": 5.008133793772654e-06, - "loss": 0.4121, - "step": 18500 - }, - { - "epoch": 0.51, - "learning_rate": 5.00670681240903e-06, - "loss": 0.1865, - "step": 18505 - }, - { - "epoch": 0.51, - "learning_rate": 5.0052798310454064e-06, - "loss": 0.1793, - "step": 18510 - }, - { - "epoch": 0.51, - "learning_rate": 5.003852849681784e-06, - "loss": 0.1419, - "step": 18515 - }, - { - "epoch": 0.51, - "learning_rate": 5.00242586831816e-06, - "loss": 0.1374, - "step": 18520 - }, - { - "epoch": 0.51, - "learning_rate": 5.000998886954537e-06, - "loss": 0.0294, - "step": 18525 - }, - { - "epoch": 0.51, - "learning_rate": 4.9995719055909135e-06, - "loss": 0.0931, - "step": 18530 - }, - { - "epoch": 0.51, - "learning_rate": 4.99814492422729e-06, - "loss": 0.2111, - "step": 18535 - }, - { - "epoch": 0.51, - "learning_rate": 4.996717942863666e-06, - "loss": 0.2355, - "step": 18540 - }, - { - "epoch": 0.51, - "learning_rate": 4.995290961500043e-06, - "loss": 0.2988, - "step": 18545 - }, - { - "epoch": 0.51, - "learning_rate": 4.99386398013642e-06, - "loss": 0.4671, - "step": 18550 - }, - { - "epoch": 0.51, - "learning_rate": 4.992436998772797e-06, - "loss": 0.0891, - "step": 18555 - }, - { - "epoch": 0.51, - "learning_rate": 4.991010017409173e-06, - "loss": 0.1915, - "step": 18560 - }, - { - "epoch": 0.52, - "learning_rate": 4.9895830360455495e-06, - "loss": 0.177, - "step": 18565 - }, - { - "epoch": 0.52, - "learning_rate": 4.988156054681927e-06, - "loss": 0.1975, - "step": 18570 - }, - { - "epoch": 0.52, - "learning_rate": 4.986729073318303e-06, - "loss": 0.2193, - "step": 18575 - }, - { - "epoch": 0.52, - "learning_rate": 4.985302091954679e-06, - "loss": 0.1107, - "step": 18580 - }, - { - "epoch": 0.52, - "learning_rate": 4.983875110591056e-06, - "loss": 0.1263, - "step": 18585 - }, - { - "epoch": 0.52, - "learning_rate": 4.982448129227433e-06, - "loss": 0.1766, - "step": 18590 - }, - { - "epoch": 0.52, - "learning_rate": 4.981021147863809e-06, - "loss": 0.1956, - "step": 18595 - }, - { - "epoch": 0.52, - "learning_rate": 4.979594166500186e-06, - "loss": 0.3, - "step": 18600 - }, - { - "epoch": 0.52, - "learning_rate": 4.978167185136563e-06, - "loss": 0.1515, - "step": 18605 - }, - { - "epoch": 0.52, - "learning_rate": 4.976740203772939e-06, - "loss": 0.1442, - "step": 18610 - }, - { - "epoch": 0.52, - "learning_rate": 4.975313222409316e-06, - "loss": 0.1284, - "step": 18615 - }, - { - "epoch": 0.52, - "learning_rate": 4.973886241045693e-06, - "loss": 0.1416, - "step": 18620 - }, - { - "epoch": 0.52, - "learning_rate": 4.972459259682069e-06, - "loss": 0.1804, - "step": 18625 - }, - { - "epoch": 0.52, - "learning_rate": 4.971032278318445e-06, - "loss": 0.0842, - "step": 18630 - }, - { - "epoch": 0.52, - "learning_rate": 4.969605296954822e-06, - "loss": 0.1027, - "step": 18635 - }, - { - "epoch": 0.52, - "learning_rate": 4.968178315591199e-06, - "loss": 0.1315, - "step": 18640 - }, - { - "epoch": 0.52, - "learning_rate": 4.966751334227575e-06, - "loss": 0.3734, - "step": 18645 - }, - { - "epoch": 0.52, - "learning_rate": 4.965324352863952e-06, - "loss": 0.4681, - "step": 18650 - }, - { - "epoch": 0.52, - "learning_rate": 4.963897371500329e-06, - "loss": 0.1777, - "step": 18655 - }, - { - "epoch": 0.52, - "learning_rate": 4.962470390136705e-06, - "loss": 0.2419, - "step": 18660 - }, - { - "epoch": 0.52, - "learning_rate": 4.961043408773082e-06, - "loss": 0.1455, - "step": 18665 - }, - { - "epoch": 0.52, - "learning_rate": 4.959616427409459e-06, - "loss": 0.1937, - "step": 18670 - }, - { - "epoch": 0.52, - "learning_rate": 4.958189446045835e-06, - "loss": 0.1785, - "step": 18675 - }, - { - "epoch": 0.52, - "learning_rate": 4.956762464682211e-06, - "loss": 0.0755, - "step": 18680 - }, - { - "epoch": 0.52, - "learning_rate": 4.9553354833185884e-06, - "loss": 0.1912, - "step": 18685 - }, - { - "epoch": 0.52, - "learning_rate": 4.953908501954965e-06, - "loss": 0.1188, - "step": 18690 - }, - { - "epoch": 0.52, - "learning_rate": 4.952481520591341e-06, - "loss": 0.1998, - "step": 18695 - }, - { - "epoch": 0.52, - "learning_rate": 4.951054539227718e-06, - "loss": 0.2255, - "step": 18700 - }, - { - "epoch": 0.52, - "learning_rate": 4.949627557864095e-06, - "loss": 0.0936, - "step": 18705 - }, - { - "epoch": 0.52, - "learning_rate": 4.948200576500472e-06, - "loss": 0.0934, - "step": 18710 - }, - { - "epoch": 0.52, - "learning_rate": 4.946773595136848e-06, - "loss": 0.1606, - "step": 18715 - }, - { - "epoch": 0.52, - "learning_rate": 4.9453466137732245e-06, - "loss": 0.1571, - "step": 18720 - }, - { - "epoch": 0.52, - "learning_rate": 4.943919632409601e-06, - "loss": 0.0658, - "step": 18725 - }, - { - "epoch": 0.52, - "learning_rate": 4.942492651045977e-06, - "loss": 0.069, - "step": 18730 - }, - { - "epoch": 0.52, - "learning_rate": 4.941065669682354e-06, - "loss": 0.1073, - "step": 18735 - }, - { - "epoch": 0.52, - "learning_rate": 4.939638688318731e-06, - "loss": 0.0662, - "step": 18740 - }, - { - "epoch": 0.52, - "learning_rate": 4.938211706955108e-06, - "loss": 0.338, - "step": 18745 - }, - { - "epoch": 0.52, - "learning_rate": 4.936784725591484e-06, - "loss": 0.2188, - "step": 18750 - }, - { - "epoch": 0.52, - "learning_rate": 4.935357744227861e-06, - "loss": 0.1863, - "step": 18755 - }, - { - "epoch": 0.52, - "learning_rate": 4.933930762864238e-06, - "loss": 0.2082, - "step": 18760 - }, - { - "epoch": 0.52, - "learning_rate": 4.932503781500614e-06, - "loss": 0.1422, - "step": 18765 - }, - { - "epoch": 0.52, - "learning_rate": 4.9310768001369904e-06, - "loss": 0.2215, - "step": 18770 - }, - { - "epoch": 0.52, - "learning_rate": 4.929649818773367e-06, - "loss": 0.0921, - "step": 18775 - }, - { - "epoch": 0.52, - "learning_rate": 4.928222837409744e-06, - "loss": 0.098, - "step": 18780 - }, - { - "epoch": 0.52, - "learning_rate": 4.92679585604612e-06, - "loss": 0.0824, - "step": 18785 - }, - { - "epoch": 0.52, - "learning_rate": 4.925368874682497e-06, - "loss": 0.1358, - "step": 18790 - }, - { - "epoch": 0.52, - "learning_rate": 4.923941893318874e-06, - "loss": 0.1977, - "step": 18795 - }, - { - "epoch": 0.52, - "learning_rate": 4.92251491195525e-06, - "loss": 0.4446, - "step": 18800 - }, - { - "epoch": 0.52, - "learning_rate": 4.921087930591627e-06, - "loss": 0.1165, - "step": 18805 - }, - { - "epoch": 0.52, - "learning_rate": 4.919660949228004e-06, - "loss": 0.1562, - "step": 18810 - }, - { - "epoch": 0.52, - "learning_rate": 4.91823396786438e-06, - "loss": 0.0988, - "step": 18815 - }, - { - "epoch": 0.52, - "learning_rate": 4.916806986500756e-06, - "loss": 0.167, - "step": 18820 - }, - { - "epoch": 0.52, - "learning_rate": 4.915380005137133e-06, - "loss": 0.0711, - "step": 18825 - }, - { - "epoch": 0.52, - "learning_rate": 4.91395302377351e-06, - "loss": 0.1165, - "step": 18830 - }, - { - "epoch": 0.52, - "learning_rate": 4.912526042409886e-06, - "loss": 0.0943, - "step": 18835 - }, - { - "epoch": 0.52, - "learning_rate": 4.911099061046263e-06, - "loss": 0.231, - "step": 18840 - }, - { - "epoch": 0.52, - "learning_rate": 4.90967207968264e-06, - "loss": 0.2684, - "step": 18845 - }, - { - "epoch": 0.52, - "learning_rate": 4.908245098319017e-06, - "loss": 0.3325, - "step": 18850 - }, - { - "epoch": 0.52, - "learning_rate": 4.906818116955393e-06, - "loss": 0.1257, - "step": 18855 - }, - { - "epoch": 0.52, - "learning_rate": 4.90539113559177e-06, - "loss": 0.1308, - "step": 18860 - }, - { - "epoch": 0.52, - "learning_rate": 4.903964154228146e-06, - "loss": 0.1406, - "step": 18865 - }, - { - "epoch": 0.52, - "learning_rate": 4.902537172864522e-06, - "loss": 0.1921, - "step": 18870 - }, - { - "epoch": 0.52, - "learning_rate": 4.9011101915008995e-06, - "loss": 0.1859, - "step": 18875 - }, - { - "epoch": 0.52, - "learning_rate": 4.899683210137276e-06, - "loss": 0.1193, - "step": 18880 - }, - { - "epoch": 0.52, - "learning_rate": 4.898256228773652e-06, - "loss": 0.0525, - "step": 18885 - }, - { - "epoch": 0.52, - "learning_rate": 4.896829247410029e-06, - "loss": 0.148, - "step": 18890 - }, - { - "epoch": 0.52, - "learning_rate": 4.895402266046406e-06, - "loss": 0.2575, - "step": 18895 - }, - { - "epoch": 0.52, - "learning_rate": 4.893975284682783e-06, - "loss": 0.3488, - "step": 18900 - }, - { - "epoch": 0.52, - "learning_rate": 4.892548303319159e-06, - "loss": 0.1078, - "step": 18905 - }, - { - "epoch": 0.52, - "learning_rate": 4.8911213219555355e-06, - "loss": 0.1403, - "step": 18910 - }, - { - "epoch": 0.52, - "learning_rate": 4.889694340591912e-06, - "loss": 0.151, - "step": 18915 - }, - { - "epoch": 0.52, - "learning_rate": 4.888267359228289e-06, - "loss": 0.1313, - "step": 18920 - }, - { - "epoch": 0.53, - "learning_rate": 4.886840377864665e-06, - "loss": 0.1577, - "step": 18925 - }, - { - "epoch": 0.53, - "learning_rate": 4.885413396501042e-06, - "loss": 0.0513, - "step": 18930 - }, - { - "epoch": 0.53, - "learning_rate": 4.883986415137419e-06, - "loss": 0.0805, - "step": 18935 - }, - { - "epoch": 0.53, - "learning_rate": 4.882559433773795e-06, - "loss": 0.1599, - "step": 18940 - }, - { - "epoch": 0.53, - "learning_rate": 4.8811324524101725e-06, - "loss": 0.1188, - "step": 18945 - }, - { - "epoch": 0.53, - "learning_rate": 4.879705471046549e-06, - "loss": 0.2917, - "step": 18950 - }, - { - "epoch": 0.53, - "learning_rate": 4.878278489682925e-06, - "loss": 0.1129, - "step": 18955 - }, - { - "epoch": 0.53, - "learning_rate": 4.8768515083193015e-06, - "loss": 0.1425, - "step": 18960 - }, - { - "epoch": 0.53, - "learning_rate": 4.875424526955679e-06, - "loss": 0.1773, - "step": 18965 - }, - { - "epoch": 0.53, - "learning_rate": 4.873997545592055e-06, - "loss": 0.1527, - "step": 18970 - }, - { - "epoch": 0.53, - "learning_rate": 4.872570564228431e-06, - "loss": 0.2487, - "step": 18975 - }, - { - "epoch": 0.53, - "learning_rate": 4.871143582864808e-06, - "loss": 0.1026, - "step": 18980 - }, - { - "epoch": 0.53, - "learning_rate": 4.869716601501185e-06, - "loss": 0.1377, - "step": 18985 - }, - { - "epoch": 0.53, - "learning_rate": 4.868289620137561e-06, - "loss": 0.1255, - "step": 18990 - }, - { - "epoch": 0.53, - "learning_rate": 4.866862638773938e-06, - "loss": 0.3781, - "step": 18995 - }, - { - "epoch": 0.53, - "learning_rate": 4.865435657410315e-06, - "loss": 0.3524, - "step": 19000 - }, - { - "epoch": 0.53, - "learning_rate": 4.864008676046691e-06, - "loss": 0.1394, - "step": 19005 - }, - { - "epoch": 0.53, - "learning_rate": 4.862581694683068e-06, - "loss": 0.1842, - "step": 19010 - }, - { - "epoch": 0.53, - "learning_rate": 4.861154713319445e-06, - "loss": 0.1438, - "step": 19015 - }, - { - "epoch": 0.53, - "learning_rate": 4.859727731955821e-06, - "loss": 0.1551, - "step": 19020 - }, - { - "epoch": 0.53, - "learning_rate": 4.858300750592197e-06, - "loss": 0.131, - "step": 19025 - }, - { - "epoch": 0.53, - "learning_rate": 4.8568737692285744e-06, - "loss": 0.1145, - "step": 19030 - }, - { - "epoch": 0.53, - "learning_rate": 4.855446787864951e-06, - "loss": 0.0724, - "step": 19035 - }, - { - "epoch": 0.53, - "learning_rate": 4.854019806501328e-06, - "loss": 0.1353, - "step": 19040 - }, - { - "epoch": 0.53, - "learning_rate": 4.852592825137704e-06, - "loss": 0.2609, - "step": 19045 - }, - { - "epoch": 0.53, - "learning_rate": 4.851165843774081e-06, - "loss": 0.3902, - "step": 19050 - }, - { - "epoch": 0.53, - "learning_rate": 4.849738862410458e-06, - "loss": 0.137, - "step": 19055 - }, - { - "epoch": 0.53, - "learning_rate": 4.848311881046834e-06, - "loss": 0.141, - "step": 19060 - }, - { - "epoch": 0.53, - "learning_rate": 4.8468848996832105e-06, - "loss": 0.1448, - "step": 19065 - }, - { - "epoch": 0.53, - "learning_rate": 4.845457918319587e-06, - "loss": 0.1721, - "step": 19070 - }, - { - "epoch": 0.53, - "learning_rate": 4.844030936955963e-06, - "loss": 0.1683, - "step": 19075 - }, - { - "epoch": 0.53, - "learning_rate": 4.84260395559234e-06, - "loss": 0.2113, - "step": 19080 - }, - { - "epoch": 0.53, - "learning_rate": 4.841176974228717e-06, - "loss": 0.158, - "step": 19085 - }, - { - "epoch": 0.53, - "learning_rate": 4.839749992865094e-06, - "loss": 0.3753, - "step": 19090 - }, - { - "epoch": 0.53, - "learning_rate": 4.83832301150147e-06, - "loss": 0.1677, - "step": 19095 - }, - { - "epoch": 0.53, - "learning_rate": 4.8368960301378474e-06, - "loss": 0.5716, - "step": 19100 - }, - { - "epoch": 0.53, - "learning_rate": 4.835469048774224e-06, - "loss": 0.1239, - "step": 19105 - }, - { - "epoch": 0.53, - "learning_rate": 4.8340420674106e-06, - "loss": 0.1726, - "step": 19110 - }, - { - "epoch": 0.53, - "learning_rate": 4.8326150860469764e-06, - "loss": 0.1212, - "step": 19115 - }, - { - "epoch": 0.53, - "learning_rate": 4.831188104683353e-06, - "loss": 0.2156, - "step": 19120 - }, - { - "epoch": 0.53, - "learning_rate": 4.82976112331973e-06, - "loss": 0.1658, - "step": 19125 - }, - { - "epoch": 0.53, - "learning_rate": 4.828334141956106e-06, - "loss": 0.0955, - "step": 19130 - }, - { - "epoch": 0.53, - "learning_rate": 4.8269071605924835e-06, - "loss": 0.1119, - "step": 19135 - }, - { - "epoch": 0.53, - "learning_rate": 4.82548017922886e-06, - "loss": 0.1332, - "step": 19140 - }, - { - "epoch": 0.53, - "learning_rate": 4.824053197865236e-06, - "loss": 0.3604, - "step": 19145 - }, - { - "epoch": 0.53, - "learning_rate": 4.822626216501613e-06, - "loss": 0.3792, - "step": 19150 - }, - { - "epoch": 0.53, - "learning_rate": 4.82119923513799e-06, - "loss": 0.1281, - "step": 19155 - }, - { - "epoch": 0.53, - "learning_rate": 4.819772253774366e-06, - "loss": 0.176, - "step": 19160 - }, - { - "epoch": 0.53, - "learning_rate": 4.818345272410742e-06, - "loss": 0.137, - "step": 19165 - }, - { - "epoch": 0.53, - "learning_rate": 4.816918291047119e-06, - "loss": 0.1358, - "step": 19170 - }, - { - "epoch": 0.53, - "learning_rate": 4.815491309683496e-06, - "loss": 0.2131, - "step": 19175 - }, - { - "epoch": 0.53, - "learning_rate": 4.814064328319872e-06, - "loss": 0.1543, - "step": 19180 - }, - { - "epoch": 0.53, - "learning_rate": 4.812637346956249e-06, - "loss": 0.1545, - "step": 19185 - }, - { - "epoch": 0.53, - "learning_rate": 4.811210365592626e-06, - "loss": 0.2762, - "step": 19190 - }, - { - "epoch": 0.53, - "learning_rate": 4.809783384229003e-06, - "loss": 0.21, - "step": 19195 - }, - { - "epoch": 0.53, - "learning_rate": 4.808356402865379e-06, - "loss": 0.2492, - "step": 19200 - }, - { - "epoch": 0.53, - "learning_rate": 4.806929421501756e-06, - "loss": 0.1531, - "step": 19205 - }, - { - "epoch": 0.53, - "learning_rate": 4.805502440138132e-06, - "loss": 0.0952, - "step": 19210 - }, - { - "epoch": 0.53, - "learning_rate": 4.804075458774508e-06, - "loss": 0.1695, - "step": 19215 - }, - { - "epoch": 0.53, - "learning_rate": 4.8026484774108855e-06, - "loss": 0.2047, - "step": 19220 - }, - { - "epoch": 0.53, - "learning_rate": 4.801221496047262e-06, - "loss": 0.1026, - "step": 19225 - }, - { - "epoch": 0.53, - "learning_rate": 4.799794514683639e-06, - "loss": 0.0705, - "step": 19230 - }, - { - "epoch": 0.53, - "learning_rate": 4.798367533320015e-06, - "loss": 0.1268, - "step": 19235 - }, - { - "epoch": 0.53, - "learning_rate": 4.796940551956392e-06, - "loss": 0.2088, - "step": 19240 - }, - { - "epoch": 0.53, - "learning_rate": 4.795513570592769e-06, - "loss": 0.2085, - "step": 19245 - }, - { - "epoch": 0.53, - "learning_rate": 4.794086589229145e-06, - "loss": 0.5394, - "step": 19250 - }, - { - "epoch": 0.53, - "learning_rate": 4.7926596078655215e-06, - "loss": 0.1162, - "step": 19255 - }, - { - "epoch": 0.53, - "learning_rate": 4.791232626501898e-06, - "loss": 0.1291, - "step": 19260 - }, - { - "epoch": 0.53, - "learning_rate": 4.789805645138274e-06, - "loss": 0.1823, - "step": 19265 - }, - { - "epoch": 0.53, - "learning_rate": 4.788378663774651e-06, - "loss": 0.2043, - "step": 19270 - }, - { - "epoch": 0.53, - "learning_rate": 4.786951682411028e-06, - "loss": 0.0934, - "step": 19275 - }, - { - "epoch": 0.53, - "learning_rate": 4.785524701047405e-06, - "loss": 0.1623, - "step": 19280 - }, - { - "epoch": 0.54, - "learning_rate": 4.784097719683781e-06, - "loss": 0.1179, - "step": 19285 - }, - { - "epoch": 0.54, - "learning_rate": 4.7826707383201585e-06, - "loss": 0.1375, - "step": 19290 - }, - { - "epoch": 0.54, - "learning_rate": 4.781243756956535e-06, - "loss": 0.3264, - "step": 19295 - }, - { - "epoch": 0.54, - "learning_rate": 4.779816775592911e-06, - "loss": 0.3038, - "step": 19300 - }, - { - "epoch": 0.54, - "learning_rate": 4.7783897942292875e-06, - "loss": 0.2116, - "step": 19305 - }, - { - "epoch": 0.54, - "learning_rate": 4.776962812865664e-06, - "loss": 0.1304, - "step": 19310 - }, - { - "epoch": 0.54, - "learning_rate": 4.775535831502041e-06, - "loss": 0.2129, - "step": 19315 - }, - { - "epoch": 0.54, - "learning_rate": 4.774108850138417e-06, - "loss": 0.1695, - "step": 19320 - }, - { - "epoch": 0.54, - "learning_rate": 4.7726818687747945e-06, - "loss": 0.1732, - "step": 19325 - }, - { - "epoch": 0.54, - "learning_rate": 4.771254887411171e-06, - "loss": 0.0737, - "step": 19330 - }, - { - "epoch": 0.54, - "learning_rate": 4.769827906047547e-06, - "loss": 0.0705, - "step": 19335 - }, - { - "epoch": 0.54, - "learning_rate": 4.768400924683924e-06, - "loss": 0.2558, - "step": 19340 - }, - { - "epoch": 0.54, - "learning_rate": 4.766973943320301e-06, - "loss": 0.1931, - "step": 19345 - }, - { - "epoch": 0.54, - "learning_rate": 4.765546961956677e-06, - "loss": 0.4469, - "step": 19350 - }, - { - "epoch": 0.54, - "learning_rate": 4.764119980593053e-06, - "loss": 0.1145, - "step": 19355 - }, - { - "epoch": 0.54, - "learning_rate": 4.762692999229431e-06, - "loss": 0.1274, - "step": 19360 - }, - { - "epoch": 0.54, - "learning_rate": 4.761266017865807e-06, - "loss": 0.1393, - "step": 19365 - }, - { - "epoch": 0.54, - "learning_rate": 4.759839036502183e-06, - "loss": 0.1389, - "step": 19370 - }, - { - "epoch": 0.54, - "learning_rate": 4.7584120551385604e-06, - "loss": 0.0456, - "step": 19375 - }, - { - "epoch": 0.54, - "learning_rate": 4.756985073774937e-06, - "loss": 0.1148, - "step": 19380 - }, - { - "epoch": 0.54, - "learning_rate": 4.755558092411314e-06, - "loss": 0.1288, - "step": 19385 - }, - { - "epoch": 0.54, - "learning_rate": 4.75413111104769e-06, - "loss": 0.1497, - "step": 19390 - }, - { - "epoch": 0.54, - "learning_rate": 4.752704129684067e-06, - "loss": 0.2034, - "step": 19395 - }, - { - "epoch": 0.54, - "learning_rate": 4.751277148320443e-06, - "loss": 0.4643, - "step": 19400 - }, - { - "epoch": 0.54, - "learning_rate": 4.74985016695682e-06, - "loss": 0.0889, - "step": 19405 - }, - { - "epoch": 0.54, - "learning_rate": 4.7484231855931965e-06, - "loss": 0.1055, - "step": 19410 - }, - { - "epoch": 0.54, - "learning_rate": 4.746996204229573e-06, - "loss": 0.2563, - "step": 19415 - }, - { - "epoch": 0.54, - "learning_rate": 4.74556922286595e-06, - "loss": 0.1439, - "step": 19420 - }, - { - "epoch": 0.54, - "learning_rate": 4.744142241502326e-06, - "loss": 0.098, - "step": 19425 - }, - { - "epoch": 0.54, - "learning_rate": 4.742715260138703e-06, - "loss": 0.1248, - "step": 19430 - }, - { - "epoch": 0.54, - "learning_rate": 4.74128827877508e-06, - "loss": 0.1136, - "step": 19435 - }, - { - "epoch": 0.54, - "learning_rate": 4.739861297411456e-06, - "loss": 0.134, - "step": 19440 - }, - { - "epoch": 0.54, - "learning_rate": 4.738434316047833e-06, - "loss": 0.2237, - "step": 19445 - }, - { - "epoch": 0.54, - "learning_rate": 4.73700733468421e-06, - "loss": 0.3613, - "step": 19450 - }, - { - "epoch": 0.54, - "learning_rate": 4.735580353320586e-06, - "loss": 0.1377, - "step": 19455 - }, - { - "epoch": 0.54, - "learning_rate": 4.7341533719569624e-06, - "loss": 0.1604, - "step": 19460 - }, - { - "epoch": 0.54, - "learning_rate": 4.732726390593339e-06, - "loss": 0.1725, - "step": 19465 - }, - { - "epoch": 0.54, - "learning_rate": 4.731299409229716e-06, - "loss": 0.1327, - "step": 19470 - }, - { - "epoch": 0.54, - "learning_rate": 4.729872427866092e-06, - "loss": 0.2093, - "step": 19475 - }, - { - "epoch": 0.54, - "learning_rate": 4.7284454465024695e-06, - "loss": 0.0596, - "step": 19480 - }, - { - "epoch": 0.54, - "learning_rate": 4.727018465138846e-06, - "loss": 0.1679, - "step": 19485 - }, - { - "epoch": 0.54, - "learning_rate": 4.725591483775222e-06, - "loss": 0.1075, - "step": 19490 - }, - { - "epoch": 0.54, - "learning_rate": 4.724164502411599e-06, - "loss": 0.0746, - "step": 19495 - }, - { - "epoch": 0.54, - "learning_rate": 4.722737521047976e-06, - "loss": 0.5567, - "step": 19500 - }, - { - "epoch": 0.54, - "learning_rate": 4.721310539684352e-06, - "loss": 0.1269, - "step": 19505 - }, - { - "epoch": 0.54, - "learning_rate": 4.719883558320728e-06, - "loss": 0.0943, - "step": 19510 - }, - { - "epoch": 0.54, - "learning_rate": 4.7184565769571056e-06, - "loss": 0.1285, - "step": 19515 - }, - { - "epoch": 0.54, - "learning_rate": 4.717029595593482e-06, - "loss": 0.1681, - "step": 19520 - }, - { - "epoch": 0.54, - "learning_rate": 4.715602614229858e-06, - "loss": 0.108, - "step": 19525 - }, - { - "epoch": 0.54, - "learning_rate": 4.714175632866235e-06, - "loss": 0.0724, - "step": 19530 - }, - { - "epoch": 0.54, - "learning_rate": 4.712748651502612e-06, - "loss": 0.171, - "step": 19535 - }, - { - "epoch": 0.54, - "learning_rate": 4.711321670138989e-06, - "loss": 0.2208, - "step": 19540 - }, - { - "epoch": 0.54, - "learning_rate": 4.709894688775365e-06, - "loss": 0.2565, - "step": 19545 - }, - { - "epoch": 0.54, - "learning_rate": 4.708467707411742e-06, - "loss": 0.5097, - "step": 19550 - }, - { - "epoch": 0.54, - "learning_rate": 4.707040726048118e-06, - "loss": 0.1562, - "step": 19555 - }, - { - "epoch": 0.54, - "learning_rate": 4.705613744684494e-06, - "loss": 0.134, - "step": 19560 - }, - { - "epoch": 0.54, - "learning_rate": 4.7041867633208715e-06, - "loss": 0.1897, - "step": 19565 - }, - { - "epoch": 0.54, - "learning_rate": 4.702759781957248e-06, - "loss": 0.1167, - "step": 19570 - }, - { - "epoch": 0.54, - "learning_rate": 4.701332800593625e-06, - "loss": 0.1494, - "step": 19575 - }, - { - "epoch": 0.54, - "learning_rate": 4.699905819230001e-06, - "loss": 0.08, - "step": 19580 - }, - { - "epoch": 0.54, - "learning_rate": 4.698478837866378e-06, - "loss": 0.1657, - "step": 19585 - }, - { - "epoch": 0.54, - "learning_rate": 4.697051856502755e-06, - "loss": 0.1345, - "step": 19590 - }, - { - "epoch": 0.54, - "learning_rate": 4.695624875139131e-06, - "loss": 0.4074, - "step": 19595 - }, - { - "epoch": 0.54, - "learning_rate": 4.6941978937755075e-06, - "loss": 0.5657, - "step": 19600 - }, - { - "epoch": 0.54, - "learning_rate": 4.692770912411884e-06, - "loss": 0.1583, - "step": 19605 - }, - { - "epoch": 0.54, - "learning_rate": 4.691343931048261e-06, - "loss": 0.1803, - "step": 19610 - }, - { - "epoch": 0.54, - "learning_rate": 4.689916949684637e-06, - "loss": 0.1114, - "step": 19615 - }, - { - "epoch": 0.54, - "learning_rate": 4.688489968321014e-06, - "loss": 0.1527, - "step": 19620 - }, - { - "epoch": 0.54, - "learning_rate": 4.687062986957391e-06, - "loss": 0.1877, - "step": 19625 - }, - { - "epoch": 0.54, - "learning_rate": 4.685636005593767e-06, - "loss": 0.0716, - "step": 19630 - }, - { - "epoch": 0.54, - "learning_rate": 4.6842090242301445e-06, - "loss": 0.204, - "step": 19635 - }, - { - "epoch": 0.54, - "learning_rate": 4.682782042866521e-06, - "loss": 0.1118, - "step": 19640 - }, - { - "epoch": 0.55, - "learning_rate": 4.681355061502897e-06, - "loss": 0.1386, - "step": 19645 - }, - { - "epoch": 0.55, - "learning_rate": 4.6799280801392735e-06, - "loss": 0.4537, - "step": 19650 - }, - { - "epoch": 0.55, - "learning_rate": 4.67850109877565e-06, - "loss": 0.1359, - "step": 19655 - }, - { - "epoch": 0.55, - "learning_rate": 4.677074117412027e-06, - "loss": 0.1826, - "step": 19660 - }, - { - "epoch": 0.55, - "learning_rate": 4.675647136048403e-06, - "loss": 0.1137, - "step": 19665 - }, - { - "epoch": 0.55, - "learning_rate": 4.6742201546847805e-06, - "loss": 0.1227, - "step": 19670 - }, - { - "epoch": 0.55, - "learning_rate": 4.672793173321157e-06, - "loss": 0.1025, - "step": 19675 - }, - { - "epoch": 0.55, - "learning_rate": 4.671366191957533e-06, - "loss": 0.1241, - "step": 19680 - }, - { - "epoch": 0.55, - "learning_rate": 4.66993921059391e-06, - "loss": 0.1798, - "step": 19685 - }, - { - "epoch": 0.55, - "learning_rate": 4.668512229230287e-06, - "loss": 0.2408, - "step": 19690 - }, - { - "epoch": 0.55, - "learning_rate": 4.667085247866663e-06, - "loss": 0.1606, - "step": 19695 - }, - { - "epoch": 0.55, - "learning_rate": 4.665658266503039e-06, - "loss": 0.3169, - "step": 19700 - }, - { - "epoch": 0.55, - "learning_rate": 4.664231285139417e-06, - "loss": 0.1612, - "step": 19705 - }, - { - "epoch": 0.55, - "learning_rate": 4.662804303775793e-06, - "loss": 0.1583, - "step": 19710 - }, - { - "epoch": 0.55, - "learning_rate": 4.661377322412169e-06, - "loss": 0.096, - "step": 19715 - }, - { - "epoch": 0.55, - "learning_rate": 4.6599503410485464e-06, - "loss": 0.153, - "step": 19720 - }, - { - "epoch": 0.55, - "learning_rate": 4.658523359684923e-06, - "loss": 0.1391, - "step": 19725 - }, - { - "epoch": 0.55, - "learning_rate": 4.6570963783213e-06, - "loss": 0.0755, - "step": 19730 - }, - { - "epoch": 0.55, - "learning_rate": 4.655669396957676e-06, - "loss": 0.3471, - "step": 19735 - }, - { - "epoch": 0.55, - "learning_rate": 4.654242415594053e-06, - "loss": 0.328, - "step": 19740 - }, - { - "epoch": 0.55, - "learning_rate": 4.652815434230429e-06, - "loss": 0.2589, - "step": 19745 - }, - { - "epoch": 0.55, - "learning_rate": 4.651388452866805e-06, - "loss": 0.5256, - "step": 19750 - }, - { - "epoch": 0.55, - "learning_rate": 4.6499614715031825e-06, - "loss": 0.1261, - "step": 19755 - }, - { - "epoch": 0.55, - "learning_rate": 4.648534490139559e-06, - "loss": 0.1566, - "step": 19760 - }, - { - "epoch": 0.55, - "learning_rate": 4.647107508775936e-06, - "loss": 0.1264, - "step": 19765 - }, - { - "epoch": 0.55, - "learning_rate": 4.645680527412312e-06, - "loss": 0.1441, - "step": 19770 - }, - { - "epoch": 0.55, - "learning_rate": 4.644253546048689e-06, - "loss": 0.0962, - "step": 19775 - }, - { - "epoch": 0.55, - "learning_rate": 4.642826564685066e-06, - "loss": 0.1559, - "step": 19780 - }, - { - "epoch": 0.55, - "learning_rate": 4.641399583321442e-06, - "loss": 0.3271, - "step": 19785 - }, - { - "epoch": 0.55, - "learning_rate": 4.639972601957819e-06, - "loss": 0.2518, - "step": 19790 - }, - { - "epoch": 0.55, - "learning_rate": 4.638545620594195e-06, - "loss": 0.2339, - "step": 19795 - }, - { - "epoch": 0.55, - "learning_rate": 4.637118639230572e-06, - "loss": 0.3957, - "step": 19800 - }, - { - "epoch": 0.55, - "learning_rate": 4.6356916578669484e-06, - "loss": 0.1017, - "step": 19805 - }, - { - "epoch": 0.55, - "learning_rate": 4.634264676503325e-06, - "loss": 0.1268, - "step": 19810 - }, - { - "epoch": 0.55, - "learning_rate": 4.632837695139702e-06, - "loss": 0.1723, - "step": 19815 - }, - { - "epoch": 0.55, - "learning_rate": 4.631410713776078e-06, - "loss": 0.2455, - "step": 19820 - }, - { - "epoch": 0.55, - "learning_rate": 4.6299837324124555e-06, - "loss": 0.1241, - "step": 19825 - }, - { - "epoch": 0.55, - "learning_rate": 4.628556751048832e-06, - "loss": 0.0737, - "step": 19830 - }, - { - "epoch": 0.55, - "learning_rate": 4.627129769685208e-06, - "loss": 0.0642, - "step": 19835 - }, - { - "epoch": 0.55, - "learning_rate": 4.6257027883215845e-06, - "loss": 0.0967, - "step": 19840 - }, - { - "epoch": 0.55, - "learning_rate": 4.624275806957962e-06, - "loss": 0.2759, - "step": 19845 - }, - { - "epoch": 0.55, - "learning_rate": 4.622848825594338e-06, - "loss": 0.3172, - "step": 19850 - }, - { - "epoch": 0.55, - "learning_rate": 4.621421844230714e-06, - "loss": 0.1524, - "step": 19855 - }, - { - "epoch": 0.55, - "learning_rate": 4.6199948628670916e-06, - "loss": 0.1349, - "step": 19860 - }, - { - "epoch": 0.55, - "learning_rate": 4.618567881503468e-06, - "loss": 0.1402, - "step": 19865 - }, - { - "epoch": 0.55, - "learning_rate": 4.617140900139844e-06, - "loss": 0.1438, - "step": 19870 - }, - { - "epoch": 0.55, - "learning_rate": 4.615713918776221e-06, - "loss": 0.0545, - "step": 19875 - }, - { - "epoch": 0.55, - "learning_rate": 4.614286937412598e-06, - "loss": 0.1018, - "step": 19880 - }, - { - "epoch": 0.55, - "learning_rate": 4.612859956048975e-06, - "loss": 0.0954, - "step": 19885 - }, - { - "epoch": 0.55, - "learning_rate": 4.611432974685351e-06, - "loss": 0.1953, - "step": 19890 - }, - { - "epoch": 0.55, - "learning_rate": 4.610005993321728e-06, - "loss": 0.3253, - "step": 19895 - }, - { - "epoch": 0.55, - "learning_rate": 4.608579011958104e-06, - "loss": 0.3014, - "step": 19900 - }, - { - "epoch": 0.55, - "learning_rate": 4.60715203059448e-06, - "loss": 0.1242, - "step": 19905 - }, - { - "epoch": 0.55, - "learning_rate": 4.6057250492308575e-06, - "loss": 0.1286, - "step": 19910 - }, - { - "epoch": 0.55, - "learning_rate": 4.604298067867234e-06, - "loss": 0.1293, - "step": 19915 - }, - { - "epoch": 0.55, - "learning_rate": 4.602871086503611e-06, - "loss": 0.1594, - "step": 19920 - }, - { - "epoch": 0.55, - "learning_rate": 4.601444105139987e-06, - "loss": 0.1248, - "step": 19925 - }, - { - "epoch": 0.55, - "learning_rate": 4.6000171237763645e-06, - "loss": 0.0895, - "step": 19930 - }, - { - "epoch": 0.55, - "learning_rate": 4.598590142412741e-06, - "loss": 0.1539, - "step": 19935 - }, - { - "epoch": 0.55, - "learning_rate": 4.597163161049117e-06, - "loss": 0.166, - "step": 19940 - }, - { - "epoch": 0.55, - "learning_rate": 4.5957361796854935e-06, - "loss": 0.1508, - "step": 19945 - }, - { - "epoch": 0.55, - "learning_rate": 4.59430919832187e-06, - "loss": 0.3545, - "step": 19950 - }, - { - "epoch": 0.55, - "learning_rate": 4.592882216958247e-06, - "loss": 0.1807, - "step": 19955 - }, - { - "epoch": 0.55, - "learning_rate": 4.591455235594623e-06, - "loss": 0.2103, - "step": 19960 - }, - { - "epoch": 0.55, - "learning_rate": 4.590028254231e-06, - "loss": 0.2293, - "step": 19965 - }, - { - "epoch": 0.55, - "learning_rate": 4.588601272867377e-06, - "loss": 0.1707, - "step": 19970 - }, - { - "epoch": 0.55, - "learning_rate": 4.587174291503753e-06, - "loss": 0.0613, - "step": 19975 - }, - { - "epoch": 0.55, - "learning_rate": 4.5857473101401305e-06, - "loss": 0.091, - "step": 19980 - }, - { - "epoch": 0.55, - "learning_rate": 4.584320328776507e-06, - "loss": 0.1545, - "step": 19985 - }, - { - "epoch": 0.55, - "learning_rate": 4.582893347412883e-06, - "loss": 0.1857, - "step": 19990 - }, - { - "epoch": 0.55, - "learning_rate": 4.5814663660492595e-06, - "loss": 0.1609, - "step": 19995 - }, - { - "epoch": 0.55, - "learning_rate": 4.580039384685636e-06, - "loss": 0.4993, - "step": 20000 - }, - { - "epoch": 0.55, - "eval_loss": 0.0669386014342308, - "eval_runtime": 1938.2183, - "eval_samples_per_second": 8.264, - "eval_steps_per_second": 2.066, - "eval_wer": 0.18878470970068517, - "step": 20000 - }, - { - "epoch": 0.56, - "learning_rate": 4.578612403322013e-06, - "loss": 0.1699, - "step": 20005 - }, - { - "epoch": 0.56, - "learning_rate": 4.577185421958389e-06, - "loss": 0.1706, - "step": 20010 - }, - { - "epoch": 0.56, - "learning_rate": 4.5757584405947665e-06, - "loss": 0.1171, - "step": 20015 - }, - { - "epoch": 0.56, - "learning_rate": 4.574331459231143e-06, - "loss": 0.2332, - "step": 20020 - }, - { - "epoch": 0.56, - "learning_rate": 4.57290447786752e-06, - "loss": 0.0381, - "step": 20025 - }, - { - "epoch": 0.56, - "learning_rate": 4.571477496503896e-06, - "loss": 0.1741, - "step": 20030 - }, - { - "epoch": 0.56, - "learning_rate": 4.570050515140273e-06, - "loss": 0.0784, - "step": 20035 - }, - { - "epoch": 0.56, - "learning_rate": 4.568623533776649e-06, - "loss": 0.1647, - "step": 20040 - }, - { - "epoch": 0.56, - "learning_rate": 4.567196552413025e-06, - "loss": 0.1712, - "step": 20045 - }, - { - "epoch": 0.56, - "learning_rate": 4.565769571049403e-06, - "loss": 0.3781, - "step": 20050 - }, - { - "epoch": 0.56, - "learning_rate": 4.564342589685779e-06, - "loss": 0.128, - "step": 20055 - }, - { - "epoch": 0.56, - "learning_rate": 4.562915608322155e-06, - "loss": 0.1474, - "step": 20060 - }, - { - "epoch": 0.56, - "learning_rate": 4.5614886269585325e-06, - "loss": 0.1729, - "step": 20065 - }, - { - "epoch": 0.56, - "learning_rate": 4.560061645594909e-06, - "loss": 0.112, - "step": 20070 - }, - { - "epoch": 0.56, - "learning_rate": 4.558634664231286e-06, - "loss": 0.1977, - "step": 20075 - }, - { - "epoch": 0.56, - "learning_rate": 4.557207682867662e-06, - "loss": 0.0751, - "step": 20080 - }, - { - "epoch": 0.56, - "learning_rate": 4.555780701504039e-06, - "loss": 0.1949, - "step": 20085 - }, - { - "epoch": 0.56, - "learning_rate": 4.554353720140415e-06, - "loss": 0.048, - "step": 20090 - }, - { - "epoch": 0.56, - "learning_rate": 4.552926738776791e-06, - "loss": 0.2332, - "step": 20095 - }, - { - "epoch": 0.56, - "learning_rate": 4.5514997574131685e-06, - "loss": 0.2679, - "step": 20100 - }, - { - "epoch": 0.56, - "learning_rate": 4.550072776049545e-06, - "loss": 0.1536, - "step": 20105 - }, - { - "epoch": 0.56, - "learning_rate": 4.548645794685922e-06, - "loss": 0.1591, - "step": 20110 - }, - { - "epoch": 0.56, - "learning_rate": 4.547218813322298e-06, - "loss": 0.154, - "step": 20115 - }, - { - "epoch": 0.56, - "learning_rate": 4.5457918319586756e-06, - "loss": 0.1012, - "step": 20120 - }, - { - "epoch": 0.56, - "learning_rate": 4.544364850595052e-06, - "loss": 0.1548, - "step": 20125 - }, - { - "epoch": 0.56, - "learning_rate": 4.542937869231428e-06, - "loss": 0.0512, - "step": 20130 - }, - { - "epoch": 0.56, - "learning_rate": 4.541510887867805e-06, - "loss": 0.0681, - "step": 20135 - }, - { - "epoch": 0.56, - "learning_rate": 4.540083906504181e-06, - "loss": 0.0874, - "step": 20140 - }, - { - "epoch": 0.56, - "learning_rate": 4.538656925140558e-06, - "loss": 0.1211, - "step": 20145 - }, - { - "epoch": 0.56, - "learning_rate": 4.5372299437769344e-06, - "loss": 0.4391, - "step": 20150 - }, - { - "epoch": 0.56, - "learning_rate": 4.535802962413312e-06, - "loss": 0.1699, - "step": 20155 - }, - { - "epoch": 0.56, - "learning_rate": 4.534375981049688e-06, - "loss": 0.1564, - "step": 20160 - }, - { - "epoch": 0.56, - "learning_rate": 4.532948999686064e-06, - "loss": 0.1292, - "step": 20165 - }, - { - "epoch": 0.56, - "learning_rate": 4.5315220183224415e-06, - "loss": 0.2075, - "step": 20170 - }, - { - "epoch": 0.56, - "learning_rate": 4.530095036958818e-06, - "loss": 0.1313, - "step": 20175 - }, - { - "epoch": 0.56, - "learning_rate": 4.528668055595194e-06, - "loss": 0.2009, - "step": 20180 - }, - { - "epoch": 0.56, - "learning_rate": 4.5272410742315705e-06, - "loss": 0.0512, - "step": 20185 - }, - { - "epoch": 0.56, - "learning_rate": 4.525814092867947e-06, - "loss": 0.1592, - "step": 20190 - }, - { - "epoch": 0.56, - "learning_rate": 4.524387111504324e-06, - "loss": 0.3646, - "step": 20195 - }, - { - "epoch": 0.56, - "learning_rate": 4.5229601301407e-06, - "loss": 0.3226, - "step": 20200 - }, - { - "epoch": 0.56, - "learning_rate": 4.5215331487770776e-06, - "loss": 0.1047, - "step": 20205 - }, - { - "epoch": 0.56, - "learning_rate": 4.520106167413454e-06, - "loss": 0.1136, - "step": 20210 - }, - { - "epoch": 0.56, - "learning_rate": 4.518679186049831e-06, - "loss": 0.1991, - "step": 20215 - }, - { - "epoch": 0.56, - "learning_rate": 4.517252204686207e-06, - "loss": 0.1289, - "step": 20220 - }, - { - "epoch": 0.56, - "learning_rate": 4.515825223322584e-06, - "loss": 0.1628, - "step": 20225 - }, - { - "epoch": 0.56, - "learning_rate": 4.51439824195896e-06, - "loss": 0.0617, - "step": 20230 - }, - { - "epoch": 0.56, - "learning_rate": 4.5129712605953364e-06, - "loss": 0.0902, - "step": 20235 - }, - { - "epoch": 0.56, - "learning_rate": 4.511544279231714e-06, - "loss": 0.1425, - "step": 20240 - }, - { - "epoch": 0.56, - "learning_rate": 4.51011729786809e-06, - "loss": 0.1862, - "step": 20245 - }, - { - "epoch": 0.56, - "learning_rate": 4.508690316504467e-06, - "loss": 0.39, - "step": 20250 - }, - { - "epoch": 0.56, - "learning_rate": 4.5072633351408435e-06, - "loss": 0.1516, - "step": 20255 - }, - { - "epoch": 0.56, - "learning_rate": 4.50583635377722e-06, - "loss": 0.1834, - "step": 20260 - }, - { - "epoch": 0.56, - "learning_rate": 4.504409372413597e-06, - "loss": 0.1808, - "step": 20265 - }, - { - "epoch": 0.56, - "learning_rate": 4.502982391049973e-06, - "loss": 0.1624, - "step": 20270 - }, - { - "epoch": 0.56, - "learning_rate": 4.50155540968635e-06, - "loss": 0.0985, - "step": 20275 - }, - { - "epoch": 0.56, - "learning_rate": 4.500128428322727e-06, - "loss": 0.102, - "step": 20280 - }, - { - "epoch": 0.56, - "learning_rate": 4.498701446959103e-06, - "loss": 0.116, - "step": 20285 - }, - { - "epoch": 0.56, - "learning_rate": 4.4972744655954795e-06, - "loss": 0.1095, - "step": 20290 - }, - { - "epoch": 0.56, - "learning_rate": 4.495847484231856e-06, - "loss": 0.2776, - "step": 20295 - }, - { - "epoch": 0.56, - "learning_rate": 4.494420502868233e-06, - "loss": 0.2438, - "step": 20300 - }, - { - "epoch": 0.56, - "learning_rate": 4.492993521504609e-06, - "loss": 0.1154, - "step": 20305 - }, - { - "epoch": 0.56, - "learning_rate": 4.491566540140987e-06, - "loss": 0.169, - "step": 20310 - }, - { - "epoch": 0.56, - "learning_rate": 4.490139558777363e-06, - "loss": 0.1826, - "step": 20315 - }, - { - "epoch": 0.56, - "learning_rate": 4.488712577413739e-06, - "loss": 0.1493, - "step": 20320 - }, - { - "epoch": 0.56, - "learning_rate": 4.4872855960501165e-06, - "loss": 0.1289, - "step": 20325 - }, - { - "epoch": 0.56, - "learning_rate": 4.485858614686493e-06, - "loss": 0.0935, - "step": 20330 - }, - { - "epoch": 0.56, - "learning_rate": 4.484431633322869e-06, - "loss": 0.0403, - "step": 20335 - }, - { - "epoch": 0.56, - "learning_rate": 4.4830046519592455e-06, - "loss": 0.1808, - "step": 20340 - }, - { - "epoch": 0.56, - "learning_rate": 4.481577670595623e-06, - "loss": 0.0966, - "step": 20345 - }, - { - "epoch": 0.56, - "learning_rate": 4.480150689231999e-06, - "loss": 0.411, - "step": 20350 - }, - { - "epoch": 0.56, - "learning_rate": 4.478723707868375e-06, - "loss": 0.0877, - "step": 20355 - }, - { - "epoch": 0.56, - "learning_rate": 4.4772967265047525e-06, - "loss": 0.1105, - "step": 20360 - }, - { - "epoch": 0.57, - "learning_rate": 4.475869745141129e-06, - "loss": 0.1447, - "step": 20365 - }, - { - "epoch": 0.57, - "learning_rate": 4.474442763777506e-06, - "loss": 0.179, - "step": 20370 - }, - { - "epoch": 0.57, - "learning_rate": 4.473015782413882e-06, - "loss": 0.1692, - "step": 20375 - }, - { - "epoch": 0.57, - "learning_rate": 4.471588801050259e-06, - "loss": 0.1855, - "step": 20380 - }, - { - "epoch": 0.57, - "learning_rate": 4.470161819686635e-06, - "loss": 0.1729, - "step": 20385 - }, - { - "epoch": 0.57, - "learning_rate": 4.468734838323011e-06, - "loss": 0.1352, - "step": 20390 - }, - { - "epoch": 0.57, - "learning_rate": 4.467307856959389e-06, - "loss": 0.3104, - "step": 20395 - }, - { - "epoch": 0.57, - "learning_rate": 4.465880875595765e-06, - "loss": 0.3898, - "step": 20400 - }, - { - "epoch": 0.57, - "learning_rate": 4.464453894232142e-06, - "loss": 0.1416, - "step": 20405 - }, - { - "epoch": 0.57, - "learning_rate": 4.4630269128685185e-06, - "loss": 0.1073, - "step": 20410 - }, - { - "epoch": 0.57, - "learning_rate": 4.461599931504895e-06, - "loss": 0.1166, - "step": 20415 - }, - { - "epoch": 0.57, - "learning_rate": 4.460172950141272e-06, - "loss": 0.1951, - "step": 20420 - }, - { - "epoch": 0.57, - "learning_rate": 4.458745968777648e-06, - "loss": 0.2497, - "step": 20425 - }, - { - "epoch": 0.57, - "learning_rate": 4.457318987414025e-06, - "loss": 0.2005, - "step": 20430 - }, - { - "epoch": 0.57, - "learning_rate": 4.455892006050401e-06, - "loss": 0.1289, - "step": 20435 - }, - { - "epoch": 0.57, - "learning_rate": 4.454465024686778e-06, - "loss": 0.1432, - "step": 20440 - }, - { - "epoch": 0.57, - "learning_rate": 4.4530380433231545e-06, - "loss": 0.2041, - "step": 20445 - }, - { - "epoch": 0.57, - "learning_rate": 4.451611061959531e-06, - "loss": 0.3785, - "step": 20450 - }, - { - "epoch": 0.57, - "learning_rate": 4.450184080595908e-06, - "loss": 0.1748, - "step": 20455 - }, - { - "epoch": 0.57, - "learning_rate": 4.448757099232284e-06, - "loss": 0.1515, - "step": 20460 - }, - { - "epoch": 0.57, - "learning_rate": 4.4473301178686616e-06, - "loss": 0.1289, - "step": 20465 - }, - { - "epoch": 0.57, - "learning_rate": 4.445903136505038e-06, - "loss": 0.1449, - "step": 20470 - }, - { - "epoch": 0.57, - "learning_rate": 4.444476155141414e-06, - "loss": 0.159, - "step": 20475 - }, - { - "epoch": 0.57, - "learning_rate": 4.443049173777791e-06, - "loss": 0.0797, - "step": 20480 - }, - { - "epoch": 0.57, - "learning_rate": 4.441622192414167e-06, - "loss": 0.1511, - "step": 20485 - }, - { - "epoch": 0.57, - "learning_rate": 4.440195211050544e-06, - "loss": 0.1973, - "step": 20490 - }, - { - "epoch": 0.57, - "learning_rate": 4.4387682296869204e-06, - "loss": 0.2574, - "step": 20495 - }, - { - "epoch": 0.57, - "learning_rate": 4.437341248323298e-06, - "loss": 0.3839, - "step": 20500 - }, - { - "epoch": 0.57, - "learning_rate": 4.435914266959674e-06, - "loss": 0.1251, - "step": 20505 - }, - { - "epoch": 0.57, - "learning_rate": 4.43448728559605e-06, - "loss": 0.2167, - "step": 20510 - }, - { - "epoch": 0.57, - "learning_rate": 4.4330603042324275e-06, - "loss": 0.1524, - "step": 20515 - }, - { - "epoch": 0.57, - "learning_rate": 4.431633322868804e-06, - "loss": 0.1234, - "step": 20520 - }, - { - "epoch": 0.57, - "learning_rate": 4.43020634150518e-06, - "loss": 0.1171, - "step": 20525 - }, - { - "epoch": 0.57, - "learning_rate": 4.4287793601415565e-06, - "loss": 0.084, - "step": 20530 - }, - { - "epoch": 0.57, - "learning_rate": 4.427352378777934e-06, - "loss": 0.1054, - "step": 20535 - }, - { - "epoch": 0.57, - "learning_rate": 4.42592539741431e-06, - "loss": 0.1512, - "step": 20540 - }, - { - "epoch": 0.57, - "learning_rate": 4.424498416050686e-06, - "loss": 0.2869, - "step": 20545 - }, - { - "epoch": 0.57, - "learning_rate": 4.4230714346870636e-06, - "loss": 0.4615, - "step": 20550 - }, - { - "epoch": 0.57, - "learning_rate": 4.42164445332344e-06, - "loss": 0.1295, - "step": 20555 - }, - { - "epoch": 0.57, - "learning_rate": 4.420217471959817e-06, - "loss": 0.1585, - "step": 20560 - }, - { - "epoch": 0.57, - "learning_rate": 4.418790490596193e-06, - "loss": 0.1597, - "step": 20565 - }, - { - "epoch": 0.57, - "learning_rate": 4.41736350923257e-06, - "loss": 0.1442, - "step": 20570 - }, - { - "epoch": 0.57, - "learning_rate": 4.415936527868946e-06, - "loss": 0.1386, - "step": 20575 - }, - { - "epoch": 0.57, - "learning_rate": 4.4145095465053224e-06, - "loss": 0.1077, - "step": 20580 - }, - { - "epoch": 0.57, - "learning_rate": 4.4130825651417e-06, - "loss": 0.1364, - "step": 20585 - }, - { - "epoch": 0.57, - "learning_rate": 4.411655583778076e-06, - "loss": 0.1187, - "step": 20590 - }, - { - "epoch": 0.57, - "learning_rate": 4.410228602414453e-06, - "loss": 0.2429, - "step": 20595 - }, - { - "epoch": 0.57, - "learning_rate": 4.4088016210508295e-06, - "loss": 0.3807, - "step": 20600 - }, - { - "epoch": 0.57, - "learning_rate": 4.407374639687206e-06, - "loss": 0.1403, - "step": 20605 - }, - { - "epoch": 0.57, - "learning_rate": 4.405947658323583e-06, - "loss": 0.1602, - "step": 20610 - }, - { - "epoch": 0.57, - "learning_rate": 4.404520676959959e-06, - "loss": 0.1603, - "step": 20615 - }, - { - "epoch": 0.57, - "learning_rate": 4.403093695596336e-06, - "loss": 0.1754, - "step": 20620 - }, - { - "epoch": 0.57, - "learning_rate": 4.401666714232712e-06, - "loss": 0.2135, - "step": 20625 - }, - { - "epoch": 0.57, - "learning_rate": 4.400239732869089e-06, - "loss": 0.0698, - "step": 20630 - }, - { - "epoch": 0.57, - "learning_rate": 4.3988127515054655e-06, - "loss": 0.0483, - "step": 20635 - }, - { - "epoch": 0.57, - "learning_rate": 4.397385770141842e-06, - "loss": 0.1518, - "step": 20640 - }, - { - "epoch": 0.57, - "learning_rate": 4.395958788778219e-06, - "loss": 0.334, - "step": 20645 - }, - { - "epoch": 0.57, - "learning_rate": 4.394531807414595e-06, - "loss": 0.4927, - "step": 20650 - }, - { - "epoch": 0.57, - "learning_rate": 4.393104826050973e-06, - "loss": 0.0987, - "step": 20655 - }, - { - "epoch": 0.57, - "learning_rate": 4.391677844687349e-06, - "loss": 0.1963, - "step": 20660 - }, - { - "epoch": 0.57, - "learning_rate": 4.390250863323725e-06, - "loss": 0.1392, - "step": 20665 - }, - { - "epoch": 0.57, - "learning_rate": 4.388823881960102e-06, - "loss": 0.1584, - "step": 20670 - }, - { - "epoch": 0.57, - "learning_rate": 4.387396900596479e-06, - "loss": 0.0979, - "step": 20675 - }, - { - "epoch": 0.57, - "learning_rate": 4.385969919232855e-06, - "loss": 0.0659, - "step": 20680 - }, - { - "epoch": 0.57, - "learning_rate": 4.3845429378692315e-06, - "loss": 0.1128, - "step": 20685 - }, - { - "epoch": 0.57, - "learning_rate": 4.383115956505609e-06, - "loss": 0.1779, - "step": 20690 - }, - { - "epoch": 0.57, - "learning_rate": 4.381688975141985e-06, - "loss": 0.2824, - "step": 20695 - }, - { - "epoch": 0.57, - "learning_rate": 4.380261993778361e-06, - "loss": 0.2393, - "step": 20700 - }, - { - "epoch": 0.57, - "learning_rate": 4.3788350124147385e-06, - "loss": 0.1658, - "step": 20705 - }, - { - "epoch": 0.57, - "learning_rate": 4.377408031051115e-06, - "loss": 0.0941, - "step": 20710 - }, - { - "epoch": 0.57, - "learning_rate": 4.375981049687491e-06, - "loss": 0.1224, - "step": 20715 - }, - { - "epoch": 0.57, - "learning_rate": 4.374554068323868e-06, - "loss": 0.2027, - "step": 20720 - }, - { - "epoch": 0.58, - "learning_rate": 4.373127086960245e-06, - "loss": 0.0874, - "step": 20725 - }, - { - "epoch": 0.58, - "learning_rate": 4.371700105596621e-06, - "loss": 0.035, - "step": 20730 - }, - { - "epoch": 0.58, - "learning_rate": 4.370273124232997e-06, - "loss": 0.1263, - "step": 20735 - }, - { - "epoch": 0.58, - "learning_rate": 4.368846142869375e-06, - "loss": 0.1757, - "step": 20740 - }, - { - "epoch": 0.58, - "learning_rate": 4.367419161505751e-06, - "loss": 0.2759, - "step": 20745 - }, - { - "epoch": 0.58, - "learning_rate": 4.365992180142128e-06, - "loss": 0.5597, - "step": 20750 - }, - { - "epoch": 0.58, - "learning_rate": 4.3645651987785045e-06, - "loss": 0.1479, - "step": 20755 - }, - { - "epoch": 0.58, - "learning_rate": 4.363138217414881e-06, - "loss": 0.1397, - "step": 20760 - }, - { - "epoch": 0.58, - "learning_rate": 4.361711236051258e-06, - "loss": 0.1465, - "step": 20765 - }, - { - "epoch": 0.58, - "learning_rate": 4.360284254687634e-06, - "loss": 0.1723, - "step": 20770 - }, - { - "epoch": 0.58, - "learning_rate": 4.358857273324011e-06, - "loss": 0.1158, - "step": 20775 - }, - { - "epoch": 0.58, - "learning_rate": 4.357430291960387e-06, - "loss": 0.0537, - "step": 20780 - }, - { - "epoch": 0.58, - "learning_rate": 4.356003310596764e-06, - "loss": 0.0526, - "step": 20785 - }, - { - "epoch": 0.58, - "learning_rate": 4.3545763292331405e-06, - "loss": 0.2546, - "step": 20790 - }, - { - "epoch": 0.58, - "learning_rate": 4.353149347869517e-06, - "loss": 0.26, - "step": 20795 - }, - { - "epoch": 0.58, - "learning_rate": 4.351722366505894e-06, - "loss": 0.7419, - "step": 20800 - }, - { - "epoch": 0.58, - "learning_rate": 4.35029538514227e-06, - "loss": 0.186, - "step": 20805 - }, - { - "epoch": 0.58, - "learning_rate": 4.3488684037786476e-06, - "loss": 0.1095, - "step": 20810 - }, - { - "epoch": 0.58, - "learning_rate": 4.347441422415024e-06, - "loss": 0.1813, - "step": 20815 - }, - { - "epoch": 0.58, - "learning_rate": 4.3460144410514e-06, - "loss": 0.169, - "step": 20820 - }, - { - "epoch": 0.58, - "learning_rate": 4.344587459687777e-06, - "loss": 0.2242, - "step": 20825 - }, - { - "epoch": 0.58, - "learning_rate": 4.343160478324153e-06, - "loss": 0.1274, - "step": 20830 - }, - { - "epoch": 0.58, - "learning_rate": 4.34173349696053e-06, - "loss": 0.1351, - "step": 20835 - }, - { - "epoch": 0.58, - "learning_rate": 4.3403065155969064e-06, - "loss": 0.1285, - "step": 20840 - }, - { - "epoch": 0.58, - "learning_rate": 4.338879534233284e-06, - "loss": 0.202, - "step": 20845 - }, - { - "epoch": 0.58, - "learning_rate": 4.33745255286966e-06, - "loss": 0.4036, - "step": 20850 - }, - { - "epoch": 0.58, - "learning_rate": 4.336025571506037e-06, - "loss": 0.1037, - "step": 20855 - }, - { - "epoch": 0.58, - "learning_rate": 4.3345985901424135e-06, - "loss": 0.1949, - "step": 20860 - }, - { - "epoch": 0.58, - "learning_rate": 4.33317160877879e-06, - "loss": 0.1631, - "step": 20865 - }, - { - "epoch": 0.58, - "learning_rate": 4.331744627415166e-06, - "loss": 0.1696, - "step": 20870 - }, - { - "epoch": 0.58, - "learning_rate": 4.3303176460515425e-06, - "loss": 0.1076, - "step": 20875 - }, - { - "epoch": 0.58, - "learning_rate": 4.32889066468792e-06, - "loss": 0.093, - "step": 20880 - }, - { - "epoch": 0.58, - "learning_rate": 4.327463683324296e-06, - "loss": 0.0859, - "step": 20885 - }, - { - "epoch": 0.58, - "learning_rate": 4.326036701960672e-06, - "loss": 0.1325, - "step": 20890 - }, - { - "epoch": 0.58, - "learning_rate": 4.3246097205970496e-06, - "loss": 0.1415, - "step": 20895 - }, - { - "epoch": 0.58, - "learning_rate": 4.323182739233426e-06, - "loss": 0.2313, - "step": 20900 - }, - { - "epoch": 0.58, - "learning_rate": 4.321755757869803e-06, - "loss": 0.068, - "step": 20905 - }, - { - "epoch": 0.58, - "learning_rate": 4.320328776506179e-06, - "loss": 0.2165, - "step": 20910 - }, - { - "epoch": 0.58, - "learning_rate": 4.318901795142556e-06, - "loss": 0.1739, - "step": 20915 - }, - { - "epoch": 0.58, - "learning_rate": 4.317474813778932e-06, - "loss": 0.2026, - "step": 20920 - }, - { - "epoch": 0.58, - "learning_rate": 4.3160478324153084e-06, - "loss": 0.0622, - "step": 20925 - }, - { - "epoch": 0.58, - "learning_rate": 4.314620851051686e-06, - "loss": 0.1017, - "step": 20930 - }, - { - "epoch": 0.58, - "learning_rate": 4.313193869688062e-06, - "loss": 0.1367, - "step": 20935 - }, - { - "epoch": 0.58, - "learning_rate": 4.311766888324439e-06, - "loss": 0.2419, - "step": 20940 - }, - { - "epoch": 0.58, - "learning_rate": 4.3103399069608155e-06, - "loss": 0.2738, - "step": 20945 - }, - { - "epoch": 0.58, - "learning_rate": 4.308912925597193e-06, - "loss": 0.3316, - "step": 20950 - }, - { - "epoch": 0.58, - "learning_rate": 4.307485944233569e-06, - "loss": 0.1736, - "step": 20955 - }, - { - "epoch": 0.58, - "learning_rate": 4.306058962869945e-06, - "loss": 0.1284, - "step": 20960 - }, - { - "epoch": 0.58, - "learning_rate": 4.304631981506322e-06, - "loss": 0.1507, - "step": 20965 - }, - { - "epoch": 0.58, - "learning_rate": 4.303205000142698e-06, - "loss": 0.2268, - "step": 20970 - }, - { - "epoch": 0.58, - "learning_rate": 4.301778018779075e-06, - "loss": 0.0751, - "step": 20975 - }, - { - "epoch": 0.58, - "learning_rate": 4.3003510374154515e-06, - "loss": 0.153, - "step": 20980 - }, - { - "epoch": 0.58, - "learning_rate": 4.298924056051828e-06, - "loss": 0.1526, - "step": 20985 - }, - { - "epoch": 0.58, - "learning_rate": 4.297497074688205e-06, - "loss": 0.3756, - "step": 20990 - }, - { - "epoch": 0.58, - "learning_rate": 4.296070093324581e-06, - "loss": 0.1955, - "step": 20995 - }, - { - "epoch": 0.58, - "learning_rate": 4.294928508233683e-06, - "loss": 0.2918, - "step": 21000 - }, - { - "epoch": 0.58, - "learning_rate": 4.293501526870059e-06, - "loss": 0.1349, - "step": 21005 - }, - { - "epoch": 0.58, - "learning_rate": 4.292074545506436e-06, - "loss": 0.1168, - "step": 21010 - }, - { - "epoch": 0.58, - "learning_rate": 4.2906475641428125e-06, - "loss": 0.1455, - "step": 21015 - }, - { - "epoch": 0.58, - "learning_rate": 4.28922058277919e-06, - "loss": 0.2116, - "step": 21020 - }, - { - "epoch": 0.58, - "learning_rate": 4.287793601415566e-06, - "loss": 0.0509, - "step": 21025 - }, - { - "epoch": 0.58, - "learning_rate": 4.286366620051942e-06, - "loss": 0.093, - "step": 21030 - }, - { - "epoch": 0.58, - "learning_rate": 4.284939638688319e-06, - "loss": 0.1425, - "step": 21035 - }, - { - "epoch": 0.58, - "learning_rate": 4.283512657324695e-06, - "loss": 0.2013, - "step": 21040 - }, - { - "epoch": 0.58, - "learning_rate": 4.282085675961072e-06, - "loss": 0.4366, - "step": 21045 - }, - { - "epoch": 0.58, - "learning_rate": 4.280658694597449e-06, - "loss": 0.2633, - "step": 21050 - }, - { - "epoch": 0.58, - "learning_rate": 4.279231713233826e-06, - "loss": 0.1191, - "step": 21055 - }, - { - "epoch": 0.58, - "learning_rate": 4.277804731870202e-06, - "loss": 0.1401, - "step": 21060 - }, - { - "epoch": 0.58, - "learning_rate": 4.276377750506579e-06, - "loss": 0.1819, - "step": 21065 - }, - { - "epoch": 0.58, - "learning_rate": 4.274950769142956e-06, - "loss": 0.1411, - "step": 21070 - }, - { - "epoch": 0.58, - "learning_rate": 4.273523787779332e-06, - "loss": 0.1296, - "step": 21075 - }, - { - "epoch": 0.58, - "learning_rate": 4.272096806415708e-06, - "loss": 0.1174, - "step": 21080 - }, - { - "epoch": 0.59, - "learning_rate": 4.270669825052085e-06, - "loss": 0.2018, - "step": 21085 - }, - { - "epoch": 0.59, - "learning_rate": 4.269242843688462e-06, - "loss": 0.1544, - "step": 21090 - }, - { - "epoch": 0.59, - "learning_rate": 4.267815862324838e-06, - "loss": 0.4319, - "step": 21095 - }, - { - "epoch": 0.59, - "learning_rate": 4.2663888809612145e-06, - "loss": 0.5075, - "step": 21100 - }, - { - "epoch": 0.59, - "learning_rate": 4.264961899597592e-06, - "loss": 0.0764, - "step": 21105 - }, - { - "epoch": 0.59, - "learning_rate": 4.263534918233968e-06, - "loss": 0.1584, - "step": 21110 - }, - { - "epoch": 0.59, - "learning_rate": 4.262107936870345e-06, - "loss": 0.1203, - "step": 21115 - }, - { - "epoch": 0.59, - "learning_rate": 4.2606809555067216e-06, - "loss": 0.1413, - "step": 21120 - }, - { - "epoch": 0.59, - "learning_rate": 4.259253974143098e-06, - "loss": 0.0478, - "step": 21125 - }, - { - "epoch": 0.59, - "learning_rate": 4.257826992779474e-06, - "loss": 0.0766, - "step": 21130 - }, - { - "epoch": 0.59, - "learning_rate": 4.256400011415851e-06, - "loss": 0.084, - "step": 21135 - }, - { - "epoch": 0.59, - "learning_rate": 4.254973030052228e-06, - "loss": 0.1812, - "step": 21140 - }, - { - "epoch": 0.59, - "learning_rate": 4.253546048688604e-06, - "loss": 0.1909, - "step": 21145 - }, - { - "epoch": 0.59, - "learning_rate": 4.252119067324981e-06, - "loss": 0.4103, - "step": 21150 - }, - { - "epoch": 0.59, - "learning_rate": 4.250692085961358e-06, - "loss": 0.1331, - "step": 21155 - }, - { - "epoch": 0.59, - "learning_rate": 4.249265104597735e-06, - "loss": 0.1468, - "step": 21160 - }, - { - "epoch": 0.59, - "learning_rate": 4.247838123234111e-06, - "loss": 0.1293, - "step": 21165 - }, - { - "epoch": 0.59, - "learning_rate": 4.2464111418704875e-06, - "loss": 0.1586, - "step": 21170 - }, - { - "epoch": 0.59, - "learning_rate": 4.244984160506864e-06, - "loss": 0.1686, - "step": 21175 - }, - { - "epoch": 0.59, - "learning_rate": 4.243557179143241e-06, - "loss": 0.0373, - "step": 21180 - }, - { - "epoch": 0.59, - "learning_rate": 4.242130197779617e-06, - "loss": 0.1762, - "step": 21185 - }, - { - "epoch": 0.59, - "learning_rate": 4.240703216415994e-06, - "loss": 0.1562, - "step": 21190 - }, - { - "epoch": 0.59, - "learning_rate": 4.23927623505237e-06, - "loss": 0.1351, - "step": 21195 - }, - { - "epoch": 0.59, - "learning_rate": 4.237849253688747e-06, - "loss": 0.2875, - "step": 21200 - }, - { - "epoch": 0.59, - "learning_rate": 4.2364222723251235e-06, - "loss": 0.1819, - "step": 21205 - }, - { - "epoch": 0.59, - "learning_rate": 4.234995290961501e-06, - "loss": 0.1727, - "step": 21210 - }, - { - "epoch": 0.59, - "learning_rate": 4.233568309597877e-06, - "loss": 0.18, - "step": 21215 - }, - { - "epoch": 0.59, - "learning_rate": 4.232141328234253e-06, - "loss": 0.2093, - "step": 21220 - }, - { - "epoch": 0.59, - "learning_rate": 4.230714346870631e-06, - "loss": 0.0974, - "step": 21225 - }, - { - "epoch": 0.59, - "learning_rate": 4.229287365507007e-06, - "loss": 0.1422, - "step": 21230 - }, - { - "epoch": 0.59, - "learning_rate": 4.227860384143383e-06, - "loss": 0.0592, - "step": 21235 - }, - { - "epoch": 0.59, - "learning_rate": 4.22643340277976e-06, - "loss": 0.0948, - "step": 21240 - }, - { - "epoch": 0.59, - "learning_rate": 4.225006421416137e-06, - "loss": 0.1492, - "step": 21245 - }, - { - "epoch": 0.59, - "learning_rate": 4.223579440052513e-06, - "loss": 0.4271, - "step": 21250 - }, - { - "epoch": 0.59, - "learning_rate": 4.22215245868889e-06, - "loss": 0.1395, - "step": 21255 - }, - { - "epoch": 0.59, - "learning_rate": 4.220725477325267e-06, - "loss": 0.1376, - "step": 21260 - }, - { - "epoch": 0.59, - "learning_rate": 4.219298495961643e-06, - "loss": 0.1993, - "step": 21265 - }, - { - "epoch": 0.59, - "learning_rate": 4.21787151459802e-06, - "loss": 0.159, - "step": 21270 - }, - { - "epoch": 0.59, - "learning_rate": 4.2164445332343965e-06, - "loss": 0.1568, - "step": 21275 - }, - { - "epoch": 0.59, - "learning_rate": 4.215017551870773e-06, - "loss": 0.0631, - "step": 21280 - }, - { - "epoch": 0.59, - "learning_rate": 4.213590570507149e-06, - "loss": 0.0991, - "step": 21285 - }, - { - "epoch": 0.59, - "learning_rate": 4.2121635891435255e-06, - "loss": 0.093, - "step": 21290 - }, - { - "epoch": 0.59, - "learning_rate": 4.210736607779903e-06, - "loss": 0.1594, - "step": 21295 - }, - { - "epoch": 0.59, - "learning_rate": 4.209309626416279e-06, - "loss": 0.4936, - "step": 21300 - }, - { - "epoch": 0.59, - "learning_rate": 4.207882645052656e-06, - "loss": 0.2851, - "step": 21305 - }, - { - "epoch": 0.59, - "learning_rate": 4.206455663689033e-06, - "loss": 0.1734, - "step": 21310 - }, - { - "epoch": 0.59, - "learning_rate": 4.20502868232541e-06, - "loss": 0.1556, - "step": 21315 - }, - { - "epoch": 0.59, - "learning_rate": 4.203601700961786e-06, - "loss": 0.1751, - "step": 21320 - }, - { - "epoch": 0.59, - "learning_rate": 4.2021747195981625e-06, - "loss": 0.1749, - "step": 21325 - }, - { - "epoch": 0.59, - "learning_rate": 4.200747738234539e-06, - "loss": 0.0951, - "step": 21330 - }, - { - "epoch": 0.59, - "learning_rate": 4.199320756870915e-06, - "loss": 0.0707, - "step": 21335 - }, - { - "epoch": 0.59, - "learning_rate": 4.197893775507292e-06, - "loss": 0.2316, - "step": 21340 - }, - { - "epoch": 0.59, - "learning_rate": 4.196466794143669e-06, - "loss": 0.1699, - "step": 21345 - }, - { - "epoch": 0.59, - "learning_rate": 4.195039812780046e-06, - "loss": 0.5433, - "step": 21350 - }, - { - "epoch": 0.59, - "learning_rate": 4.193612831416422e-06, - "loss": 0.1202, - "step": 21355 - }, - { - "epoch": 0.59, - "learning_rate": 4.1921858500527985e-06, - "loss": 0.1348, - "step": 21360 - }, - { - "epoch": 0.59, - "learning_rate": 4.190758868689176e-06, - "loss": 0.1644, - "step": 21365 - }, - { - "epoch": 0.59, - "learning_rate": 4.189331887325552e-06, - "loss": 0.1987, - "step": 21370 - }, - { - "epoch": 0.59, - "learning_rate": 4.187904905961928e-06, - "loss": 0.0504, - "step": 21375 - }, - { - "epoch": 0.59, - "learning_rate": 4.186477924598305e-06, - "loss": 0.1044, - "step": 21380 - }, - { - "epoch": 0.59, - "learning_rate": 4.185050943234682e-06, - "loss": 0.1106, - "step": 21385 - }, - { - "epoch": 0.59, - "learning_rate": 4.183623961871058e-06, - "loss": 0.2073, - "step": 21390 - }, - { - "epoch": 0.59, - "learning_rate": 4.182196980507435e-06, - "loss": 0.1753, - "step": 21395 - }, - { - "epoch": 0.59, - "learning_rate": 4.180769999143812e-06, - "loss": 0.4103, - "step": 21400 - }, - { - "epoch": 0.59, - "learning_rate": 4.179343017780188e-06, - "loss": 0.1441, - "step": 21405 - }, - { - "epoch": 0.59, - "learning_rate": 4.177916036416565e-06, - "loss": 0.1364, - "step": 21410 - }, - { - "epoch": 0.59, - "learning_rate": 4.176489055052942e-06, - "loss": 0.1536, - "step": 21415 - }, - { - "epoch": 0.59, - "learning_rate": 4.175062073689318e-06, - "loss": 0.1332, - "step": 21420 - }, - { - "epoch": 0.59, - "learning_rate": 4.173635092325694e-06, - "loss": 0.1466, - "step": 21425 - }, - { - "epoch": 0.59, - "learning_rate": 4.172208110962071e-06, - "loss": 0.1344, - "step": 21430 - }, - { - "epoch": 0.59, - "learning_rate": 4.170781129598448e-06, - "loss": 0.1798, - "step": 21435 - }, - { - "epoch": 0.59, - "learning_rate": 4.169354148234824e-06, - "loss": 0.1823, - "step": 21440 - }, - { - "epoch": 0.6, - "learning_rate": 4.167927166871201e-06, - "loss": 0.1012, - "step": 21445 - }, - { - "epoch": 0.6, - "learning_rate": 4.166500185507578e-06, - "loss": 0.3861, - "step": 21450 - }, - { - "epoch": 0.6, - "learning_rate": 4.165073204143954e-06, - "loss": 0.1132, - "step": 21455 - }, - { - "epoch": 0.6, - "learning_rate": 4.163646222780331e-06, - "loss": 0.1297, - "step": 21460 - }, - { - "epoch": 0.6, - "learning_rate": 4.1622192414167076e-06, - "loss": 0.1917, - "step": 21465 - }, - { - "epoch": 0.6, - "learning_rate": 4.160792260053084e-06, - "loss": 0.1914, - "step": 21470 - }, - { - "epoch": 0.6, - "learning_rate": 4.15936527868946e-06, - "loss": 0.0978, - "step": 21475 - }, - { - "epoch": 0.6, - "learning_rate": 4.157938297325837e-06, - "loss": 0.1377, - "step": 21480 - }, - { - "epoch": 0.6, - "learning_rate": 4.156511315962214e-06, - "loss": 0.1585, - "step": 21485 - }, - { - "epoch": 0.6, - "learning_rate": 4.15508433459859e-06, - "loss": 0.1966, - "step": 21490 - }, - { - "epoch": 0.6, - "learning_rate": 4.153657353234967e-06, - "loss": 0.2469, - "step": 21495 - }, - { - "epoch": 0.6, - "learning_rate": 4.152230371871344e-06, - "loss": 0.2976, - "step": 21500 - }, - { - "epoch": 0.6, - "learning_rate": 4.150803390507721e-06, - "loss": 0.1127, - "step": 21505 - }, - { - "epoch": 0.6, - "learning_rate": 4.149376409144097e-06, - "loss": 0.1079, - "step": 21510 - }, - { - "epoch": 0.6, - "learning_rate": 4.1479494277804735e-06, - "loss": 0.1243, - "step": 21515 - }, - { - "epoch": 0.6, - "learning_rate": 4.14652244641685e-06, - "loss": 0.1525, - "step": 21520 - }, - { - "epoch": 0.6, - "learning_rate": 4.145095465053226e-06, - "loss": 0.1036, - "step": 21525 - }, - { - "epoch": 0.6, - "learning_rate": 4.143668483689603e-06, - "loss": 0.1125, - "step": 21530 - }, - { - "epoch": 0.6, - "learning_rate": 4.14224150232598e-06, - "loss": 0.0137, - "step": 21535 - }, - { - "epoch": 0.6, - "learning_rate": 4.140814520962357e-06, - "loss": 0.168, - "step": 21540 - }, - { - "epoch": 0.6, - "learning_rate": 4.139387539598733e-06, - "loss": 0.3707, - "step": 21545 - }, - { - "epoch": 0.6, - "learning_rate": 4.1379605582351095e-06, - "loss": 0.5945, - "step": 21550 - }, - { - "epoch": 0.6, - "learning_rate": 4.136533576871487e-06, - "loss": 0.1056, - "step": 21555 - }, - { - "epoch": 0.6, - "learning_rate": 4.135106595507863e-06, - "loss": 0.148, - "step": 21560 - }, - { - "epoch": 0.6, - "learning_rate": 4.133679614144239e-06, - "loss": 0.1136, - "step": 21565 - }, - { - "epoch": 0.6, - "learning_rate": 4.132252632780616e-06, - "loss": 0.1784, - "step": 21570 - }, - { - "epoch": 0.6, - "learning_rate": 4.130825651416993e-06, - "loss": 0.0645, - "step": 21575 - }, - { - "epoch": 0.6, - "learning_rate": 4.129398670053369e-06, - "loss": 0.0799, - "step": 21580 - }, - { - "epoch": 0.6, - "learning_rate": 4.127971688689746e-06, - "loss": 0.0947, - "step": 21585 - }, - { - "epoch": 0.6, - "learning_rate": 4.126544707326123e-06, - "loss": 0.0839, - "step": 21590 - }, - { - "epoch": 0.6, - "learning_rate": 4.125117725962499e-06, - "loss": 0.1737, - "step": 21595 - }, - { - "epoch": 0.6, - "learning_rate": 4.123690744598876e-06, - "loss": 0.2954, - "step": 21600 - }, - { - "epoch": 0.6, - "learning_rate": 4.122263763235253e-06, - "loss": 0.1737, - "step": 21605 - }, - { - "epoch": 0.6, - "learning_rate": 4.120836781871629e-06, - "loss": 0.1259, - "step": 21610 - }, - { - "epoch": 0.6, - "learning_rate": 4.119409800508006e-06, - "loss": 0.1646, - "step": 21615 - }, - { - "epoch": 0.6, - "learning_rate": 4.1179828191443825e-06, - "loss": 0.1515, - "step": 21620 - }, - { - "epoch": 0.6, - "learning_rate": 4.116555837780759e-06, - "loss": 0.085, - "step": 21625 - }, - { - "epoch": 0.6, - "learning_rate": 4.115128856417135e-06, - "loss": 0.0497, - "step": 21630 - }, - { - "epoch": 0.6, - "learning_rate": 4.113701875053512e-06, - "loss": 0.1347, - "step": 21635 - }, - { - "epoch": 0.6, - "learning_rate": 4.112274893689889e-06, - "loss": 0.1324, - "step": 21640 - }, - { - "epoch": 0.6, - "learning_rate": 4.110847912326265e-06, - "loss": 0.1714, - "step": 21645 - }, - { - "epoch": 0.6, - "learning_rate": 4.109420930962642e-06, - "loss": 0.21, - "step": 21650 - }, - { - "epoch": 0.6, - "learning_rate": 4.107993949599019e-06, - "loss": 0.1229, - "step": 21655 - }, - { - "epoch": 0.6, - "learning_rate": 4.106566968235396e-06, - "loss": 0.1586, - "step": 21660 - }, - { - "epoch": 0.6, - "learning_rate": 4.105139986871772e-06, - "loss": 0.1512, - "step": 21665 - }, - { - "epoch": 0.6, - "learning_rate": 4.1037130055081485e-06, - "loss": 0.1363, - "step": 21670 - }, - { - "epoch": 0.6, - "learning_rate": 4.102286024144525e-06, - "loss": 0.1104, - "step": 21675 - }, - { - "epoch": 0.6, - "learning_rate": 4.100859042780901e-06, - "loss": 0.0787, - "step": 21680 - }, - { - "epoch": 0.6, - "learning_rate": 4.099432061417278e-06, - "loss": 0.2136, - "step": 21685 - }, - { - "epoch": 0.6, - "learning_rate": 4.098005080053655e-06, - "loss": 0.0721, - "step": 21690 - }, - { - "epoch": 0.6, - "learning_rate": 4.096578098690032e-06, - "loss": 0.2246, - "step": 21695 - }, - { - "epoch": 0.6, - "learning_rate": 4.095151117326408e-06, - "loss": 0.2887, - "step": 21700 - }, - { - "epoch": 0.6, - "learning_rate": 4.0937241359627845e-06, - "loss": 0.098, - "step": 21705 - }, - { - "epoch": 0.6, - "learning_rate": 4.092297154599162e-06, - "loss": 0.1688, - "step": 21710 - }, - { - "epoch": 0.6, - "learning_rate": 4.090870173235538e-06, - "loss": 0.1673, - "step": 21715 - }, - { - "epoch": 0.6, - "learning_rate": 4.089443191871914e-06, - "loss": 0.1548, - "step": 21720 - }, - { - "epoch": 0.6, - "learning_rate": 4.088016210508291e-06, - "loss": 0.1483, - "step": 21725 - }, - { - "epoch": 0.6, - "learning_rate": 4.086589229144668e-06, - "loss": 0.1353, - "step": 21730 - }, - { - "epoch": 0.6, - "learning_rate": 4.085162247781044e-06, - "loss": 0.1639, - "step": 21735 - }, - { - "epoch": 0.6, - "learning_rate": 4.083735266417421e-06, - "loss": 0.1349, - "step": 21740 - }, - { - "epoch": 0.6, - "learning_rate": 4.082308285053798e-06, - "loss": 0.1502, - "step": 21745 - }, - { - "epoch": 0.6, - "learning_rate": 4.080881303690174e-06, - "loss": 0.2666, - "step": 21750 - }, - { - "epoch": 0.6, - "learning_rate": 4.079454322326551e-06, - "loss": 0.0917, - "step": 21755 - }, - { - "epoch": 0.6, - "learning_rate": 4.078027340962928e-06, - "loss": 0.1191, - "step": 21760 - }, - { - "epoch": 0.6, - "learning_rate": 4.076600359599304e-06, - "loss": 0.1464, - "step": 21765 - }, - { - "epoch": 0.6, - "learning_rate": 4.07517337823568e-06, - "loss": 0.118, - "step": 21770 - }, - { - "epoch": 0.6, - "learning_rate": 4.073746396872057e-06, - "loss": 0.1638, - "step": 21775 - }, - { - "epoch": 0.6, - "learning_rate": 4.072319415508434e-06, - "loss": 0.0496, - "step": 21780 - }, - { - "epoch": 0.6, - "learning_rate": 4.07089243414481e-06, - "loss": 0.1049, - "step": 21785 - }, - { - "epoch": 0.6, - "learning_rate": 4.069465452781187e-06, - "loss": 0.164, - "step": 21790 - }, - { - "epoch": 0.6, - "learning_rate": 4.068038471417564e-06, - "loss": 0.1524, - "step": 21795 - }, - { - "epoch": 0.6, - "learning_rate": 4.06661149005394e-06, - "loss": 0.2877, - "step": 21800 - }, - { - "epoch": 0.61, - "learning_rate": 4.065184508690317e-06, - "loss": 0.1462, - "step": 21805 - }, - { - "epoch": 0.61, - "learning_rate": 4.0637575273266936e-06, - "loss": 0.1615, - "step": 21810 - }, - { - "epoch": 0.61, - "learning_rate": 4.06233054596307e-06, - "loss": 0.1057, - "step": 21815 - }, - { - "epoch": 0.61, - "learning_rate": 4.060903564599446e-06, - "loss": 0.146, - "step": 21820 - }, - { - "epoch": 0.61, - "learning_rate": 4.059476583235823e-06, - "loss": 0.1112, - "step": 21825 - }, - { - "epoch": 0.61, - "learning_rate": 4.0580496018722e-06, - "loss": 0.0587, - "step": 21830 - }, - { - "epoch": 0.61, - "learning_rate": 4.056622620508576e-06, - "loss": 0.0971, - "step": 21835 - }, - { - "epoch": 0.61, - "learning_rate": 4.055195639144953e-06, - "loss": 0.2333, - "step": 21840 - }, - { - "epoch": 0.61, - "learning_rate": 4.05376865778133e-06, - "loss": 0.1488, - "step": 21845 - }, - { - "epoch": 0.61, - "learning_rate": 4.052341676417707e-06, - "loss": 0.7283, - "step": 21850 - }, - { - "epoch": 0.61, - "learning_rate": 4.050914695054083e-06, - "loss": 0.0987, - "step": 21855 - }, - { - "epoch": 0.61, - "learning_rate": 4.0494877136904595e-06, - "loss": 0.1239, - "step": 21860 - }, - { - "epoch": 0.61, - "learning_rate": 4.048060732326836e-06, - "loss": 0.0952, - "step": 21865 - }, - { - "epoch": 0.61, - "learning_rate": 4.046633750963212e-06, - "loss": 0.136, - "step": 21870 - }, - { - "epoch": 0.61, - "learning_rate": 4.045206769599589e-06, - "loss": 0.1609, - "step": 21875 - }, - { - "epoch": 0.61, - "learning_rate": 4.043779788235966e-06, - "loss": 0.063, - "step": 21880 - }, - { - "epoch": 0.61, - "learning_rate": 4.042352806872343e-06, - "loss": 0.1227, - "step": 21885 - }, - { - "epoch": 0.61, - "learning_rate": 4.040925825508719e-06, - "loss": 0.1381, - "step": 21890 - }, - { - "epoch": 0.61, - "learning_rate": 4.0394988441450955e-06, - "loss": 0.2777, - "step": 21895 - }, - { - "epoch": 0.61, - "learning_rate": 4.038071862781473e-06, - "loss": 0.5384, - "step": 21900 - }, - { - "epoch": 0.61, - "learning_rate": 4.036644881417849e-06, - "loss": 0.1427, - "step": 21905 - }, - { - "epoch": 0.61, - "learning_rate": 4.035217900054225e-06, - "loss": 0.1222, - "step": 21910 - }, - { - "epoch": 0.61, - "learning_rate": 4.033790918690602e-06, - "loss": 0.1591, - "step": 21915 - }, - { - "epoch": 0.61, - "learning_rate": 4.032363937326979e-06, - "loss": 0.0948, - "step": 21920 - }, - { - "epoch": 0.61, - "learning_rate": 4.030936955963355e-06, - "loss": 0.1851, - "step": 21925 - }, - { - "epoch": 0.61, - "learning_rate": 4.029509974599732e-06, - "loss": 0.0329, - "step": 21930 - }, - { - "epoch": 0.61, - "learning_rate": 4.028082993236109e-06, - "loss": 0.1093, - "step": 21935 - }, - { - "epoch": 0.61, - "learning_rate": 4.026656011872485e-06, - "loss": 0.3272, - "step": 21940 - }, - { - "epoch": 0.61, - "learning_rate": 4.025229030508862e-06, - "loss": 0.306, - "step": 21945 - }, - { - "epoch": 0.61, - "learning_rate": 4.023802049145239e-06, - "loss": 0.5171, - "step": 21950 - }, - { - "epoch": 0.61, - "learning_rate": 4.022375067781615e-06, - "loss": 0.1122, - "step": 21955 - }, - { - "epoch": 0.61, - "learning_rate": 4.020948086417991e-06, - "loss": 0.0891, - "step": 21960 - }, - { - "epoch": 0.61, - "learning_rate": 4.019521105054368e-06, - "loss": 0.1444, - "step": 21965 - }, - { - "epoch": 0.61, - "learning_rate": 4.018094123690745e-06, - "loss": 0.1775, - "step": 21970 - }, - { - "epoch": 0.61, - "learning_rate": 4.016667142327121e-06, - "loss": 0.1363, - "step": 21975 - }, - { - "epoch": 0.61, - "learning_rate": 4.015240160963498e-06, - "loss": 0.0984, - "step": 21980 - }, - { - "epoch": 0.61, - "learning_rate": 4.013813179599875e-06, - "loss": 0.1114, - "step": 21985 - }, - { - "epoch": 0.61, - "learning_rate": 4.012386198236252e-06, - "loss": 0.1603, - "step": 21990 - }, - { - "epoch": 0.61, - "learning_rate": 4.010959216872628e-06, - "loss": 0.1489, - "step": 21995 - }, - { - "epoch": 0.61, - "learning_rate": 4.009532235509005e-06, - "loss": 0.3808, - "step": 22000 - }, - { - "epoch": 0.61, - "eval_loss": 0.059859082102775574, - "eval_runtime": 1843.3789, - "eval_samples_per_second": 8.689, - "eval_steps_per_second": 2.173, - "eval_wer": 0.16849981968986658, - "step": 22000 - }, - { - "epoch": 0.61, - "learning_rate": 4.008105254145381e-06, - "loss": 0.0803, - "step": 22005 - }, - { - "epoch": 0.61, - "learning_rate": 4.006678272781758e-06, - "loss": 0.1432, - "step": 22010 - }, - { - "epoch": 0.61, - "learning_rate": 4.0052512914181345e-06, - "loss": 0.1594, - "step": 22015 - }, - { - "epoch": 0.61, - "learning_rate": 4.003824310054511e-06, - "loss": 0.2076, - "step": 22020 - }, - { - "epoch": 0.61, - "learning_rate": 4.002397328690887e-06, - "loss": 0.0678, - "step": 22025 - }, - { - "epoch": 0.61, - "learning_rate": 4.000970347327264e-06, - "loss": 0.0397, - "step": 22030 - }, - { - "epoch": 0.61, - "learning_rate": 3.999543365963641e-06, - "loss": 0.1157, - "step": 22035 - }, - { - "epoch": 0.61, - "learning_rate": 3.998116384600018e-06, - "loss": 0.1655, - "step": 22040 - }, - { - "epoch": 0.61, - "learning_rate": 3.996689403236394e-06, - "loss": 0.0887, - "step": 22045 - }, - { - "epoch": 0.61, - "learning_rate": 3.9952624218727705e-06, - "loss": 0.3724, - "step": 22050 - }, - { - "epoch": 0.61, - "learning_rate": 3.993835440509148e-06, - "loss": 0.0935, - "step": 22055 - }, - { - "epoch": 0.61, - "learning_rate": 3.992408459145524e-06, - "loss": 0.1776, - "step": 22060 - }, - { - "epoch": 0.61, - "learning_rate": 3.9909814777819e-06, - "loss": 0.1447, - "step": 22065 - }, - { - "epoch": 0.61, - "learning_rate": 3.989554496418277e-06, - "loss": 0.1518, - "step": 22070 - }, - { - "epoch": 0.61, - "learning_rate": 3.988127515054654e-06, - "loss": 0.1164, - "step": 22075 - }, - { - "epoch": 0.61, - "learning_rate": 3.98670053369103e-06, - "loss": 0.1649, - "step": 22080 - }, - { - "epoch": 0.61, - "learning_rate": 3.9852735523274074e-06, - "loss": 0.0446, - "step": 22085 - }, - { - "epoch": 0.61, - "learning_rate": 3.983846570963784e-06, - "loss": 0.2027, - "step": 22090 - }, - { - "epoch": 0.61, - "learning_rate": 3.98241958960016e-06, - "loss": 0.185, - "step": 22095 - }, - { - "epoch": 0.61, - "learning_rate": 3.980992608236537e-06, - "loss": 0.2873, - "step": 22100 - }, - { - "epoch": 0.61, - "learning_rate": 3.979565626872914e-06, - "loss": 0.1553, - "step": 22105 - }, - { - "epoch": 0.61, - "learning_rate": 3.97813864550929e-06, - "loss": 0.156, - "step": 22110 - }, - { - "epoch": 0.61, - "learning_rate": 3.976711664145666e-06, - "loss": 0.1238, - "step": 22115 - }, - { - "epoch": 0.61, - "learning_rate": 3.975284682782043e-06, - "loss": 0.1911, - "step": 22120 - }, - { - "epoch": 0.61, - "learning_rate": 3.97385770141842e-06, - "loss": 0.0836, - "step": 22125 - }, - { - "epoch": 0.61, - "learning_rate": 3.972430720054796e-06, - "loss": 0.1757, - "step": 22130 - }, - { - "epoch": 0.61, - "learning_rate": 3.971003738691173e-06, - "loss": 0.093, - "step": 22135 - }, - { - "epoch": 0.61, - "learning_rate": 3.96957675732755e-06, - "loss": 0.1251, - "step": 22140 - }, - { - "epoch": 0.61, - "learning_rate": 3.968149775963927e-06, - "loss": 0.1767, - "step": 22145 - }, - { - "epoch": 0.61, - "learning_rate": 3.966722794600303e-06, - "loss": 0.3181, - "step": 22150 - }, - { - "epoch": 0.61, - "learning_rate": 3.9652958132366796e-06, - "loss": 0.1479, - "step": 22155 - }, - { - "epoch": 0.61, - "learning_rate": 3.963868831873056e-06, - "loss": 0.1128, - "step": 22160 - }, - { - "epoch": 0.62, - "learning_rate": 3.962441850509432e-06, - "loss": 0.1561, - "step": 22165 - }, - { - "epoch": 0.62, - "learning_rate": 3.961014869145809e-06, - "loss": 0.2144, - "step": 22170 - }, - { - "epoch": 0.62, - "learning_rate": 3.959587887782186e-06, - "loss": 0.0875, - "step": 22175 - }, - { - "epoch": 0.62, - "learning_rate": 3.958160906418563e-06, - "loss": 0.1531, - "step": 22180 - }, - { - "epoch": 0.62, - "learning_rate": 3.956733925054939e-06, - "loss": 0.1169, - "step": 22185 - }, - { - "epoch": 0.62, - "learning_rate": 3.955306943691316e-06, - "loss": 0.1518, - "step": 22190 - }, - { - "epoch": 0.62, - "learning_rate": 3.953879962327693e-06, - "loss": 0.1385, - "step": 22195 - }, - { - "epoch": 0.62, - "learning_rate": 3.952452980964069e-06, - "loss": 0.3973, - "step": 22200 - }, - { - "epoch": 0.62, - "learning_rate": 3.9510259996004455e-06, - "loss": 0.1574, - "step": 22205 - }, - { - "epoch": 0.62, - "learning_rate": 3.949599018236822e-06, - "loss": 0.2186, - "step": 22210 - }, - { - "epoch": 0.62, - "learning_rate": 3.948172036873198e-06, - "loss": 0.1752, - "step": 22215 - }, - { - "epoch": 0.62, - "learning_rate": 3.946745055509575e-06, - "loss": 0.1642, - "step": 22220 - }, - { - "epoch": 0.62, - "learning_rate": 3.945318074145952e-06, - "loss": 0.1781, - "step": 22225 - }, - { - "epoch": 0.62, - "learning_rate": 3.943891092782329e-06, - "loss": 0.0601, - "step": 22230 - }, - { - "epoch": 0.62, - "learning_rate": 3.942464111418705e-06, - "loss": 0.0634, - "step": 22235 - }, - { - "epoch": 0.62, - "learning_rate": 3.941037130055082e-06, - "loss": 0.1057, - "step": 22240 - }, - { - "epoch": 0.62, - "learning_rate": 3.939610148691459e-06, - "loss": 0.2088, - "step": 22245 - }, - { - "epoch": 0.62, - "learning_rate": 3.938183167327835e-06, - "loss": 0.2691, - "step": 22250 - }, - { - "epoch": 0.62, - "learning_rate": 3.936756185964211e-06, - "loss": 0.1449, - "step": 22255 - }, - { - "epoch": 0.62, - "learning_rate": 3.935329204600588e-06, - "loss": 0.105, - "step": 22260 - }, - { - "epoch": 0.62, - "learning_rate": 3.933902223236965e-06, - "loss": 0.1411, - "step": 22265 - }, - { - "epoch": 0.62, - "learning_rate": 3.932475241873341e-06, - "loss": 0.1517, - "step": 22270 - }, - { - "epoch": 0.62, - "learning_rate": 3.9310482605097185e-06, - "loss": 0.1313, - "step": 22275 - }, - { - "epoch": 0.62, - "learning_rate": 3.929621279146095e-06, - "loss": 0.1082, - "step": 22280 - }, - { - "epoch": 0.62, - "learning_rate": 3.928194297782471e-06, - "loss": 0.1042, - "step": 22285 - }, - { - "epoch": 0.62, - "learning_rate": 3.926767316418848e-06, - "loss": 0.0742, - "step": 22290 - }, - { - "epoch": 0.62, - "learning_rate": 3.925340335055225e-06, - "loss": 0.1411, - "step": 22295 - }, - { - "epoch": 0.62, - "learning_rate": 3.924198749964326e-06, - "loss": 0.3382, - "step": 22300 - }, - { - "epoch": 0.62, - "learning_rate": 3.922771768600702e-06, - "loss": 0.1718, - "step": 22305 - }, - { - "epoch": 0.62, - "learning_rate": 3.9213447872370794e-06, - "loss": 0.1203, - "step": 22310 - }, - { - "epoch": 0.62, - "learning_rate": 3.919917805873456e-06, - "loss": 0.1173, - "step": 22315 - }, - { - "epoch": 0.62, - "learning_rate": 3.918490824509832e-06, - "loss": 0.1667, - "step": 22320 - }, - { - "epoch": 0.62, - "learning_rate": 3.9170638431462084e-06, - "loss": 0.147, - "step": 22325 - }, - { - "epoch": 0.62, - "learning_rate": 3.915636861782585e-06, - "loss": 0.0457, - "step": 22330 - }, - { - "epoch": 0.62, - "learning_rate": 3.914209880418962e-06, - "loss": 0.0543, - "step": 22335 - }, - { - "epoch": 0.62, - "learning_rate": 3.912782899055338e-06, - "loss": 0.1849, - "step": 22340 - }, - { - "epoch": 0.62, - "learning_rate": 3.9113559176917155e-06, - "loss": 0.1187, - "step": 22345 - }, - { - "epoch": 0.62, - "learning_rate": 3.909928936328092e-06, - "loss": 0.5127, - "step": 22350 - }, - { - "epoch": 0.62, - "learning_rate": 3.908501954964469e-06, - "loss": 0.1292, - "step": 22355 - }, - { - "epoch": 0.62, - "learning_rate": 3.907074973600845e-06, - "loss": 0.0939, - "step": 22360 - }, - { - "epoch": 0.62, - "learning_rate": 3.905647992237222e-06, - "loss": 0.1346, - "step": 22365 - }, - { - "epoch": 0.62, - "learning_rate": 3.904221010873598e-06, - "loss": 0.1726, - "step": 22370 - }, - { - "epoch": 0.62, - "learning_rate": 3.902794029509974e-06, - "loss": 0.1197, - "step": 22375 - }, - { - "epoch": 0.62, - "learning_rate": 3.9013670481463516e-06, - "loss": 0.0341, - "step": 22380 - }, - { - "epoch": 0.62, - "learning_rate": 3.899940066782728e-06, - "loss": 0.1054, - "step": 22385 - }, - { - "epoch": 0.62, - "learning_rate": 3.898513085419105e-06, - "loss": 0.2072, - "step": 22390 - }, - { - "epoch": 0.62, - "learning_rate": 3.897086104055481e-06, - "loss": 0.2113, - "step": 22395 - }, - { - "epoch": 0.62, - "learning_rate": 3.895659122691858e-06, - "loss": 0.3128, - "step": 22400 - }, - { - "epoch": 0.62, - "learning_rate": 3.894232141328235e-06, - "loss": 0.1308, - "step": 22405 - }, - { - "epoch": 0.62, - "learning_rate": 3.892805159964611e-06, - "loss": 0.186, - "step": 22410 - }, - { - "epoch": 0.62, - "learning_rate": 3.891378178600988e-06, - "loss": 0.1807, - "step": 22415 - }, - { - "epoch": 0.62, - "learning_rate": 3.889951197237364e-06, - "loss": 0.1598, - "step": 22420 - }, - { - "epoch": 0.62, - "learning_rate": 3.888524215873741e-06, - "loss": 0.0927, - "step": 22425 - }, - { - "epoch": 0.62, - "learning_rate": 3.8870972345101175e-06, - "loss": 0.0842, - "step": 22430 - }, - { - "epoch": 0.62, - "learning_rate": 3.885670253146494e-06, - "loss": 0.2275, - "step": 22435 - }, - { - "epoch": 0.62, - "learning_rate": 3.884243271782871e-06, - "loss": 0.1117, - "step": 22440 - }, - { - "epoch": 0.62, - "learning_rate": 3.882816290419247e-06, - "loss": 0.3245, - "step": 22445 - }, - { - "epoch": 0.62, - "learning_rate": 3.8813893090556245e-06, - "loss": 0.5859, - "step": 22450 - }, - { - "epoch": 0.62, - "learning_rate": 3.879962327692001e-06, - "loss": 0.1725, - "step": 22455 - }, - { - "epoch": 0.62, - "learning_rate": 3.878535346328377e-06, - "loss": 0.1432, - "step": 22460 - }, - { - "epoch": 0.62, - "learning_rate": 3.8771083649647535e-06, - "loss": 0.2215, - "step": 22465 - }, - { - "epoch": 0.62, - "learning_rate": 3.875681383601131e-06, - "loss": 0.1653, - "step": 22470 - }, - { - "epoch": 0.62, - "learning_rate": 3.874254402237507e-06, - "loss": 0.1194, - "step": 22475 - }, - { - "epoch": 0.62, - "learning_rate": 3.872827420873883e-06, - "loss": 0.1344, - "step": 22480 - }, - { - "epoch": 0.62, - "learning_rate": 3.871400439510261e-06, - "loss": 0.256, - "step": 22485 - }, - { - "epoch": 0.62, - "learning_rate": 3.869973458146637e-06, - "loss": 0.0864, - "step": 22490 - }, - { - "epoch": 0.62, - "learning_rate": 3.868546476783013e-06, - "loss": 0.4852, - "step": 22495 - }, - { - "epoch": 0.62, - "learning_rate": 3.8671194954193905e-06, - "loss": 0.4037, - "step": 22500 - }, - { - "epoch": 0.62, - "learning_rate": 3.865692514055767e-06, - "loss": 0.1035, - "step": 22505 - }, - { - "epoch": 0.62, - "learning_rate": 3.864265532692143e-06, - "loss": 0.1562, - "step": 22510 - }, - { - "epoch": 0.62, - "learning_rate": 3.86283855132852e-06, - "loss": 0.1622, - "step": 22515 - }, - { - "epoch": 0.62, - "learning_rate": 3.861411569964897e-06, - "loss": 0.1827, - "step": 22520 - }, - { - "epoch": 0.63, - "learning_rate": 3.859984588601273e-06, - "loss": 0.1404, - "step": 22525 - }, - { - "epoch": 0.63, - "learning_rate": 3.858557607237649e-06, - "loss": 0.1047, - "step": 22530 - }, - { - "epoch": 0.63, - "learning_rate": 3.8571306258740265e-06, - "loss": 0.1108, - "step": 22535 - }, - { - "epoch": 0.63, - "learning_rate": 3.855703644510403e-06, - "loss": 0.1106, - "step": 22540 - }, - { - "epoch": 0.63, - "learning_rate": 3.85427666314678e-06, - "loss": 0.1454, - "step": 22545 - }, - { - "epoch": 0.63, - "learning_rate": 3.852849681783156e-06, - "loss": 0.4207, - "step": 22550 - }, - { - "epoch": 0.63, - "learning_rate": 3.851422700419533e-06, - "loss": 0.1075, - "step": 22555 - }, - { - "epoch": 0.63, - "learning_rate": 3.84999571905591e-06, - "loss": 0.1428, - "step": 22560 - }, - { - "epoch": 0.63, - "learning_rate": 3.848568737692286e-06, - "loss": 0.1541, - "step": 22565 - }, - { - "epoch": 0.63, - "learning_rate": 3.847141756328663e-06, - "loss": 0.2013, - "step": 22570 - }, - { - "epoch": 0.63, - "learning_rate": 3.845714774965039e-06, - "loss": 0.136, - "step": 22575 - }, - { - "epoch": 0.63, - "learning_rate": 3.844287793601416e-06, - "loss": 0.1132, - "step": 22580 - }, - { - "epoch": 0.63, - "learning_rate": 3.8428608122377925e-06, - "loss": 0.1936, - "step": 22585 - }, - { - "epoch": 0.63, - "learning_rate": 3.841433830874169e-06, - "loss": 0.2513, - "step": 22590 - }, - { - "epoch": 0.63, - "learning_rate": 3.840006849510546e-06, - "loss": 0.367, - "step": 22595 - }, - { - "epoch": 0.63, - "learning_rate": 3.838579868146922e-06, - "loss": 0.2205, - "step": 22600 - }, - { - "epoch": 0.63, - "learning_rate": 3.8371528867832995e-06, - "loss": 0.1057, - "step": 22605 - }, - { - "epoch": 0.63, - "learning_rate": 3.835725905419676e-06, - "loss": 0.1495, - "step": 22610 - }, - { - "epoch": 0.63, - "learning_rate": 3.834298924056052e-06, - "loss": 0.1303, - "step": 22615 - }, - { - "epoch": 0.63, - "learning_rate": 3.8328719426924285e-06, - "loss": 0.1811, - "step": 22620 - }, - { - "epoch": 0.63, - "learning_rate": 3.831444961328805e-06, - "loss": 0.0864, - "step": 22625 - }, - { - "epoch": 0.63, - "learning_rate": 3.830017979965182e-06, - "loss": 0.0427, - "step": 22630 - }, - { - "epoch": 0.63, - "learning_rate": 3.828590998601558e-06, - "loss": 0.1305, - "step": 22635 - }, - { - "epoch": 0.63, - "learning_rate": 3.8271640172379356e-06, - "loss": 0.1432, - "step": 22640 - }, - { - "epoch": 0.63, - "learning_rate": 3.825737035874312e-06, - "loss": 0.1697, - "step": 22645 - }, - { - "epoch": 0.63, - "learning_rate": 3.824310054510688e-06, - "loss": 0.386, - "step": 22650 - }, - { - "epoch": 0.63, - "learning_rate": 3.8228830731470654e-06, - "loss": 0.1587, - "step": 22655 - }, - { - "epoch": 0.63, - "learning_rate": 3.821456091783442e-06, - "loss": 0.1269, - "step": 22660 - }, - { - "epoch": 0.63, - "learning_rate": 3.820029110419818e-06, - "loss": 0.1869, - "step": 22665 - }, - { - "epoch": 0.63, - "learning_rate": 3.8186021290561944e-06, - "loss": 0.1689, - "step": 22670 - }, - { - "epoch": 0.63, - "learning_rate": 3.817175147692572e-06, - "loss": 0.157, - "step": 22675 - }, - { - "epoch": 0.63, - "learning_rate": 3.815748166328948e-06, - "loss": 0.0621, - "step": 22680 - }, - { - "epoch": 0.63, - "learning_rate": 3.8143211849653243e-06, - "loss": 0.1575, - "step": 22685 - }, - { - "epoch": 0.63, - "learning_rate": 3.8128942036017015e-06, - "loss": 0.1115, - "step": 22690 - }, - { - "epoch": 0.63, - "learning_rate": 3.811467222238078e-06, - "loss": 0.1717, - "step": 22695 - }, - { - "epoch": 0.63, - "learning_rate": 3.8100402408744546e-06, - "loss": 0.3862, - "step": 22700 - }, - { - "epoch": 0.63, - "learning_rate": 3.808613259510831e-06, - "loss": 0.141, - "step": 22705 - }, - { - "epoch": 0.63, - "learning_rate": 3.807186278147208e-06, - "loss": 0.0854, - "step": 22710 - }, - { - "epoch": 0.63, - "learning_rate": 3.8057592967835845e-06, - "loss": 0.1455, - "step": 22715 - }, - { - "epoch": 0.63, - "learning_rate": 3.804332315419961e-06, - "loss": 0.1458, - "step": 22720 - }, - { - "epoch": 0.63, - "learning_rate": 3.8029053340563376e-06, - "loss": 0.0959, - "step": 22725 - }, - { - "epoch": 0.63, - "learning_rate": 3.801478352692714e-06, - "loss": 0.1955, - "step": 22730 - }, - { - "epoch": 0.63, - "learning_rate": 3.800051371329091e-06, - "loss": 0.0662, - "step": 22735 - }, - { - "epoch": 0.63, - "learning_rate": 3.7986243899654674e-06, - "loss": 0.169, - "step": 22740 - }, - { - "epoch": 0.63, - "learning_rate": 3.7971974086018438e-06, - "loss": 0.1332, - "step": 22745 - }, - { - "epoch": 0.63, - "learning_rate": 3.7957704272382205e-06, - "loss": 0.4515, - "step": 22750 - }, - { - "epoch": 0.63, - "learning_rate": 3.794343445874597e-06, - "loss": 0.0705, - "step": 22755 - }, - { - "epoch": 0.63, - "learning_rate": 3.792916464510974e-06, - "loss": 0.2404, - "step": 22760 - }, - { - "epoch": 0.63, - "learning_rate": 3.7914894831473504e-06, - "loss": 0.0873, - "step": 22765 - }, - { - "epoch": 0.63, - "learning_rate": 3.790062501783727e-06, - "loss": 0.1521, - "step": 22770 - }, - { - "epoch": 0.63, - "learning_rate": 3.7886355204201035e-06, - "loss": 0.0806, - "step": 22775 - }, - { - "epoch": 0.63, - "learning_rate": 3.78720853905648e-06, - "loss": 0.1339, - "step": 22780 - }, - { - "epoch": 0.63, - "learning_rate": 3.785781557692857e-06, - "loss": 0.1963, - "step": 22785 - }, - { - "epoch": 0.63, - "learning_rate": 3.7843545763292333e-06, - "loss": 0.1837, - "step": 22790 - }, - { - "epoch": 0.63, - "learning_rate": 3.78292759496561e-06, - "loss": 0.1914, - "step": 22795 - }, - { - "epoch": 0.63, - "learning_rate": 3.7815006136019864e-06, - "loss": 0.3424, - "step": 22800 - }, - { - "epoch": 0.63, - "learning_rate": 3.7800736322383636e-06, - "loss": 0.1903, - "step": 22805 - }, - { - "epoch": 0.63, - "learning_rate": 3.77864665087474e-06, - "loss": 0.1242, - "step": 22810 - }, - { - "epoch": 0.63, - "learning_rate": 3.7772196695111163e-06, - "loss": 0.1694, - "step": 22815 - }, - { - "epoch": 0.63, - "learning_rate": 3.775792688147493e-06, - "loss": 0.1367, - "step": 22820 - }, - { - "epoch": 0.63, - "learning_rate": 3.7743657067838694e-06, - "loss": 0.0764, - "step": 22825 - }, - { - "epoch": 0.63, - "learning_rate": 3.7729387254202466e-06, - "loss": 0.0922, - "step": 22830 - }, - { - "epoch": 0.63, - "learning_rate": 3.771511744056623e-06, - "loss": 0.0857, - "step": 22835 - }, - { - "epoch": 0.63, - "learning_rate": 3.7700847626929993e-06, - "loss": 0.1124, - "step": 22840 - }, - { - "epoch": 0.63, - "learning_rate": 3.768657781329376e-06, - "loss": 0.2392, - "step": 22845 - }, - { - "epoch": 0.63, - "learning_rate": 3.7672307999657524e-06, - "loss": 0.6366, - "step": 22850 - }, - { - "epoch": 0.63, - "learning_rate": 3.7658038186021296e-06, - "loss": 0.1192, - "step": 22855 - }, - { - "epoch": 0.63, - "learning_rate": 3.764376837238506e-06, - "loss": 0.1585, - "step": 22860 - }, - { - "epoch": 0.63, - "learning_rate": 3.7629498558748827e-06, - "loss": 0.1129, - "step": 22865 - }, - { - "epoch": 0.63, - "learning_rate": 3.761522874511259e-06, - "loss": 0.1819, - "step": 22870 - }, - { - "epoch": 0.63, - "learning_rate": 3.7600958931476358e-06, - "loss": 0.1054, - "step": 22875 - }, - { - "epoch": 0.63, - "learning_rate": 3.7586689117840125e-06, - "loss": 0.1105, - "step": 22880 - }, - { - "epoch": 0.64, - "learning_rate": 3.757241930420389e-06, - "loss": 0.0801, - "step": 22885 - }, - { - "epoch": 0.64, - "learning_rate": 3.7558149490567656e-06, - "loss": 0.0801, - "step": 22890 - }, - { - "epoch": 0.64, - "learning_rate": 3.7543879676931424e-06, - "loss": 0.1595, - "step": 22895 - }, - { - "epoch": 0.64, - "learning_rate": 3.752960986329519e-06, - "loss": 0.604, - "step": 22900 - }, - { - "epoch": 0.64, - "learning_rate": 3.7515340049658955e-06, - "loss": 0.093, - "step": 22905 - }, - { - "epoch": 0.64, - "learning_rate": 3.750107023602272e-06, - "loss": 0.187, - "step": 22910 - }, - { - "epoch": 0.64, - "learning_rate": 3.7486800422386486e-06, - "loss": 0.1357, - "step": 22915 - }, - { - "epoch": 0.64, - "learning_rate": 3.7472530608750254e-06, - "loss": 0.1621, - "step": 22920 - }, - { - "epoch": 0.64, - "learning_rate": 3.745826079511402e-06, - "loss": 0.0294, - "step": 22925 - }, - { - "epoch": 0.64, - "learning_rate": 3.7443990981477785e-06, - "loss": 0.0212, - "step": 22930 - }, - { - "epoch": 0.64, - "learning_rate": 3.742972116784155e-06, - "loss": 0.1594, - "step": 22935 - }, - { - "epoch": 0.64, - "learning_rate": 3.741545135420532e-06, - "loss": 0.1677, - "step": 22940 - }, - { - "epoch": 0.64, - "learning_rate": 3.7401181540569083e-06, - "loss": 0.1924, - "step": 22945 - }, - { - "epoch": 0.64, - "learning_rate": 3.738691172693285e-06, - "loss": 0.4647, - "step": 22950 - }, - { - "epoch": 0.64, - "learning_rate": 3.7372641913296614e-06, - "loss": 0.0777, - "step": 22955 - }, - { - "epoch": 0.64, - "learning_rate": 3.735837209966038e-06, - "loss": 0.1238, - "step": 22960 - }, - { - "epoch": 0.64, - "learning_rate": 3.734410228602415e-06, - "loss": 0.1013, - "step": 22965 - }, - { - "epoch": 0.64, - "learning_rate": 3.7329832472387913e-06, - "loss": 0.1405, - "step": 22970 - }, - { - "epoch": 0.64, - "learning_rate": 3.731556265875168e-06, - "loss": 0.1518, - "step": 22975 - }, - { - "epoch": 0.64, - "learning_rate": 3.7301292845115444e-06, - "loss": 0.0388, - "step": 22980 - }, - { - "epoch": 0.64, - "learning_rate": 3.7287023031479216e-06, - "loss": 0.0532, - "step": 22985 - }, - { - "epoch": 0.64, - "learning_rate": 3.727275321784298e-06, - "loss": 0.1454, - "step": 22990 - }, - { - "epoch": 0.64, - "learning_rate": 3.7258483404206747e-06, - "loss": 0.3034, - "step": 22995 - }, - { - "epoch": 0.64, - "learning_rate": 3.724421359057051e-06, - "loss": 0.447, - "step": 23000 - }, - { - "epoch": 0.64, - "learning_rate": 3.7229943776934273e-06, - "loss": 0.1081, - "step": 23005 - }, - { - "epoch": 0.64, - "learning_rate": 3.7215673963298045e-06, - "loss": 0.1586, - "step": 23010 - }, - { - "epoch": 0.64, - "learning_rate": 3.720140414966181e-06, - "loss": 0.1271, - "step": 23015 - }, - { - "epoch": 0.64, - "learning_rate": 3.7187134336025576e-06, - "loss": 0.128, - "step": 23020 - }, - { - "epoch": 0.64, - "learning_rate": 3.717286452238934e-06, - "loss": 0.081, - "step": 23025 - }, - { - "epoch": 0.64, - "learning_rate": 3.7158594708753103e-06, - "loss": 0.1812, - "step": 23030 - }, - { - "epoch": 0.64, - "learning_rate": 3.7144324895116875e-06, - "loss": 0.1127, - "step": 23035 - }, - { - "epoch": 0.64, - "learning_rate": 3.713005508148064e-06, - "loss": 0.2226, - "step": 23040 - }, - { - "epoch": 0.64, - "learning_rate": 3.7115785267844406e-06, - "loss": 0.3506, - "step": 23045 - }, - { - "epoch": 0.64, - "learning_rate": 3.710151545420817e-06, - "loss": 0.221, - "step": 23050 - }, - { - "epoch": 0.64, - "learning_rate": 3.708724564057194e-06, - "loss": 0.1317, - "step": 23055 - }, - { - "epoch": 0.64, - "learning_rate": 3.7072975826935705e-06, - "loss": 0.0892, - "step": 23060 - }, - { - "epoch": 0.64, - "learning_rate": 3.705870601329947e-06, - "loss": 0.149, - "step": 23065 - }, - { - "epoch": 0.64, - "learning_rate": 3.7044436199663236e-06, - "loss": 0.1818, - "step": 23070 - }, - { - "epoch": 0.64, - "learning_rate": 3.7030166386027e-06, - "loss": 0.0497, - "step": 23075 - }, - { - "epoch": 0.64, - "learning_rate": 3.701589657239077e-06, - "loss": 0.0308, - "step": 23080 - }, - { - "epoch": 0.64, - "learning_rate": 3.7001626758754534e-06, - "loss": 0.2085, - "step": 23085 - }, - { - "epoch": 0.64, - "learning_rate": 3.69873569451183e-06, - "loss": 0.2694, - "step": 23090 - }, - { - "epoch": 0.64, - "learning_rate": 3.6973087131482065e-06, - "loss": 0.232, - "step": 23095 - }, - { - "epoch": 0.64, - "learning_rate": 3.695881731784583e-06, - "loss": 0.3407, - "step": 23100 - }, - { - "epoch": 0.64, - "learning_rate": 3.69445475042096e-06, - "loss": 0.1512, - "step": 23105 - }, - { - "epoch": 0.64, - "learning_rate": 3.6930277690573364e-06, - "loss": 0.0969, - "step": 23110 - }, - { - "epoch": 0.64, - "learning_rate": 3.691600787693713e-06, - "loss": 0.1553, - "step": 23115 - }, - { - "epoch": 0.64, - "learning_rate": 3.6901738063300895e-06, - "loss": 0.2289, - "step": 23120 - }, - { - "epoch": 0.64, - "learning_rate": 3.688746824966466e-06, - "loss": 0.096, - "step": 23125 - }, - { - "epoch": 0.64, - "learning_rate": 3.687319843602843e-06, - "loss": 0.0663, - "step": 23130 - }, - { - "epoch": 0.64, - "learning_rate": 3.6858928622392193e-06, - "loss": 0.1077, - "step": 23135 - }, - { - "epoch": 0.64, - "learning_rate": 3.684465880875596e-06, - "loss": 0.0969, - "step": 23140 - }, - { - "epoch": 0.64, - "learning_rate": 3.6830388995119724e-06, - "loss": 0.3644, - "step": 23145 - }, - { - "epoch": 0.64, - "learning_rate": 3.6816119181483496e-06, - "loss": 0.568, - "step": 23150 - }, - { - "epoch": 0.64, - "learning_rate": 3.680184936784726e-06, - "loss": 0.121, - "step": 23155 - }, - { - "epoch": 0.64, - "learning_rate": 3.6787579554211023e-06, - "loss": 0.1523, - "step": 23160 - }, - { - "epoch": 0.64, - "learning_rate": 3.677330974057479e-06, - "loss": 0.1514, - "step": 23165 - }, - { - "epoch": 0.64, - "learning_rate": 3.6759039926938554e-06, - "loss": 0.1478, - "step": 23170 - }, - { - "epoch": 0.64, - "learning_rate": 3.6744770113302326e-06, - "loss": 0.0865, - "step": 23175 - }, - { - "epoch": 0.64, - "learning_rate": 3.673050029966609e-06, - "loss": 0.0337, - "step": 23180 - }, - { - "epoch": 0.64, - "learning_rate": 3.6716230486029857e-06, - "loss": 0.0987, - "step": 23185 - }, - { - "epoch": 0.64, - "learning_rate": 3.670196067239362e-06, - "loss": 0.1177, - "step": 23190 - }, - { - "epoch": 0.64, - "learning_rate": 3.6687690858757384e-06, - "loss": 0.2375, - "step": 23195 - }, - { - "epoch": 0.64, - "learning_rate": 3.6673421045121156e-06, - "loss": 0.3224, - "step": 23200 - }, - { - "epoch": 0.64, - "learning_rate": 3.665915123148492e-06, - "loss": 0.1336, - "step": 23205 - }, - { - "epoch": 0.64, - "learning_rate": 3.6644881417848687e-06, - "loss": 0.1603, - "step": 23210 - }, - { - "epoch": 0.64, - "learning_rate": 3.663061160421245e-06, - "loss": 0.1432, - "step": 23215 - }, - { - "epoch": 0.64, - "learning_rate": 3.6616341790576213e-06, - "loss": 0.1694, - "step": 23220 - }, - { - "epoch": 0.64, - "learning_rate": 3.6602071976939985e-06, - "loss": 0.1676, - "step": 23225 - }, - { - "epoch": 0.64, - "learning_rate": 3.658780216330375e-06, - "loss": 0.0683, - "step": 23230 - }, - { - "epoch": 0.64, - "learning_rate": 3.6573532349667516e-06, - "loss": 0.1797, - "step": 23235 - }, - { - "epoch": 0.64, - "learning_rate": 3.655926253603128e-06, - "loss": 0.1551, - "step": 23240 - }, - { - "epoch": 0.64, - "learning_rate": 3.654499272239505e-06, - "loss": 0.3179, - "step": 23245 - }, - { - "epoch": 0.65, - "learning_rate": 3.6530722908758815e-06, - "loss": 0.4787, - "step": 23250 - }, - { - "epoch": 0.65, - "learning_rate": 3.651645309512258e-06, - "loss": 0.1608, - "step": 23255 - }, - { - "epoch": 0.65, - "learning_rate": 3.6502183281486346e-06, - "loss": 0.1087, - "step": 23260 - }, - { - "epoch": 0.65, - "learning_rate": 3.648791346785011e-06, - "loss": 0.1297, - "step": 23265 - }, - { - "epoch": 0.65, - "learning_rate": 3.647364365421388e-06, - "loss": 0.1842, - "step": 23270 - }, - { - "epoch": 0.65, - "learning_rate": 3.6459373840577645e-06, - "loss": 0.0747, - "step": 23275 - }, - { - "epoch": 0.65, - "learning_rate": 3.6445104026941412e-06, - "loss": 0.2023, - "step": 23280 - }, - { - "epoch": 0.65, - "learning_rate": 3.6430834213305176e-06, - "loss": 0.1042, - "step": 23285 - }, - { - "epoch": 0.65, - "learning_rate": 3.6416564399668943e-06, - "loss": 0.1426, - "step": 23290 - }, - { - "epoch": 0.65, - "learning_rate": 3.640229458603271e-06, - "loss": 0.3445, - "step": 23295 - }, - { - "epoch": 0.65, - "learning_rate": 3.6388024772396474e-06, - "loss": 0.6512, - "step": 23300 - }, - { - "epoch": 0.65, - "learning_rate": 3.637375495876024e-06, - "loss": 0.1894, - "step": 23305 - }, - { - "epoch": 0.65, - "learning_rate": 3.6359485145124005e-06, - "loss": 0.1087, - "step": 23310 - }, - { - "epoch": 0.65, - "learning_rate": 3.6345215331487777e-06, - "loss": 0.144, - "step": 23315 - }, - { - "epoch": 0.65, - "learning_rate": 3.633094551785154e-06, - "loss": 0.1743, - "step": 23320 - }, - { - "epoch": 0.65, - "learning_rate": 3.6316675704215304e-06, - "loss": 0.1719, - "step": 23325 - }, - { - "epoch": 0.65, - "learning_rate": 3.630240589057907e-06, - "loss": 0.0125, - "step": 23330 - }, - { - "epoch": 0.65, - "learning_rate": 3.628813607694284e-06, - "loss": 0.1268, - "step": 23335 - }, - { - "epoch": 0.65, - "learning_rate": 3.6273866263306607e-06, - "loss": 0.1219, - "step": 23340 - }, - { - "epoch": 0.65, - "learning_rate": 3.625959644967037e-06, - "loss": 0.1726, - "step": 23345 - }, - { - "epoch": 0.65, - "learning_rate": 3.6245326636034133e-06, - "loss": 0.2476, - "step": 23350 - }, - { - "epoch": 0.65, - "learning_rate": 3.62310568223979e-06, - "loss": 0.1386, - "step": 23355 - }, - { - "epoch": 0.65, - "learning_rate": 3.621678700876167e-06, - "loss": 0.1267, - "step": 23360 - }, - { - "epoch": 0.65, - "learning_rate": 3.6202517195125436e-06, - "loss": 0.1364, - "step": 23365 - }, - { - "epoch": 0.65, - "learning_rate": 3.61882473814892e-06, - "loss": 0.1671, - "step": 23370 - }, - { - "epoch": 0.65, - "learning_rate": 3.6173977567852967e-06, - "loss": 0.1315, - "step": 23375 - }, - { - "epoch": 0.65, - "learning_rate": 3.6159707754216735e-06, - "loss": 0.1379, - "step": 23380 - }, - { - "epoch": 0.65, - "learning_rate": 3.61454379405805e-06, - "loss": 0.0916, - "step": 23385 - }, - { - "epoch": 0.65, - "learning_rate": 3.6131168126944266e-06, - "loss": 0.1413, - "step": 23390 - }, - { - "epoch": 0.65, - "learning_rate": 3.611689831330803e-06, - "loss": 0.1736, - "step": 23395 - }, - { - "epoch": 0.65, - "learning_rate": 3.6102628499671797e-06, - "loss": 0.373, - "step": 23400 - }, - { - "epoch": 0.65, - "learning_rate": 3.6088358686035565e-06, - "loss": 0.1233, - "step": 23405 - }, - { - "epoch": 0.65, - "learning_rate": 3.6074088872399332e-06, - "loss": 0.1222, - "step": 23410 - }, - { - "epoch": 0.65, - "learning_rate": 3.6059819058763096e-06, - "loss": 0.1344, - "step": 23415 - }, - { - "epoch": 0.65, - "learning_rate": 3.604554924512686e-06, - "loss": 0.1504, - "step": 23420 - }, - { - "epoch": 0.65, - "learning_rate": 3.603127943149063e-06, - "loss": 0.2086, - "step": 23425 - }, - { - "epoch": 0.65, - "learning_rate": 3.6017009617854394e-06, - "loss": 0.0836, - "step": 23430 - }, - { - "epoch": 0.65, - "learning_rate": 3.600273980421816e-06, - "loss": 0.1385, - "step": 23435 - }, - { - "epoch": 0.65, - "learning_rate": 3.5988469990581925e-06, - "loss": 0.1634, - "step": 23440 - }, - { - "epoch": 0.65, - "learning_rate": 3.597420017694569e-06, - "loss": 0.2463, - "step": 23445 - }, - { - "epoch": 0.65, - "learning_rate": 3.595993036330946e-06, - "loss": 0.3586, - "step": 23450 - }, - { - "epoch": 0.65, - "learning_rate": 3.5945660549673224e-06, - "loss": 0.1436, - "step": 23455 - }, - { - "epoch": 0.65, - "learning_rate": 3.593139073603699e-06, - "loss": 0.1569, - "step": 23460 - }, - { - "epoch": 0.65, - "learning_rate": 3.5917120922400755e-06, - "loss": 0.1627, - "step": 23465 - }, - { - "epoch": 0.65, - "learning_rate": 3.5902851108764527e-06, - "loss": 0.2061, - "step": 23470 - }, - { - "epoch": 0.65, - "learning_rate": 3.588858129512829e-06, - "loss": 0.127, - "step": 23475 - }, - { - "epoch": 0.65, - "learning_rate": 3.5874311481492053e-06, - "loss": 0.0794, - "step": 23480 - }, - { - "epoch": 0.65, - "learning_rate": 3.586004166785582e-06, - "loss": 0.0913, - "step": 23485 - }, - { - "epoch": 0.65, - "learning_rate": 3.5845771854219584e-06, - "loss": 0.1909, - "step": 23490 - }, - { - "epoch": 0.65, - "learning_rate": 3.5831502040583356e-06, - "loss": 0.3552, - "step": 23495 - }, - { - "epoch": 0.65, - "learning_rate": 3.581723222694712e-06, - "loss": 0.2849, - "step": 23500 - }, - { - "epoch": 0.65, - "learning_rate": 3.5802962413310887e-06, - "loss": 0.1741, - "step": 23505 - }, - { - "epoch": 0.65, - "learning_rate": 3.578869259967465e-06, - "loss": 0.1317, - "step": 23510 - }, - { - "epoch": 0.65, - "learning_rate": 3.5774422786038414e-06, - "loss": 0.1657, - "step": 23515 - }, - { - "epoch": 0.65, - "learning_rate": 3.5760152972402186e-06, - "loss": 0.1563, - "step": 23520 - }, - { - "epoch": 0.65, - "learning_rate": 3.574588315876595e-06, - "loss": 0.1125, - "step": 23525 - }, - { - "epoch": 0.65, - "learning_rate": 3.5731613345129717e-06, - "loss": 0.1364, - "step": 23530 - }, - { - "epoch": 0.65, - "learning_rate": 3.571734353149348e-06, - "loss": 0.216, - "step": 23535 - }, - { - "epoch": 0.65, - "learning_rate": 3.5703073717857244e-06, - "loss": 0.172, - "step": 23540 - }, - { - "epoch": 0.65, - "learning_rate": 3.5688803904221016e-06, - "loss": 0.2617, - "step": 23545 - }, - { - "epoch": 0.65, - "learning_rate": 3.567453409058478e-06, - "loss": 0.372, - "step": 23550 - }, - { - "epoch": 0.65, - "learning_rate": 3.5660264276948547e-06, - "loss": 0.1688, - "step": 23555 - }, - { - "epoch": 0.65, - "learning_rate": 3.564599446331231e-06, - "loss": 0.1386, - "step": 23560 - }, - { - "epoch": 0.65, - "learning_rate": 3.563172464967608e-06, - "loss": 0.1018, - "step": 23565 - }, - { - "epoch": 0.65, - "learning_rate": 3.5617454836039845e-06, - "loss": 0.1901, - "step": 23570 - }, - { - "epoch": 0.65, - "learning_rate": 3.560318502240361e-06, - "loss": 0.1043, - "step": 23575 - }, - { - "epoch": 0.65, - "learning_rate": 3.5588915208767376e-06, - "loss": 0.0829, - "step": 23580 - }, - { - "epoch": 0.65, - "learning_rate": 3.557464539513114e-06, - "loss": 0.1622, - "step": 23585 - }, - { - "epoch": 0.65, - "learning_rate": 3.556037558149491e-06, - "loss": 0.1634, - "step": 23590 - }, - { - "epoch": 0.65, - "learning_rate": 3.5546105767858675e-06, - "loss": 0.3626, - "step": 23595 - }, - { - "epoch": 0.65, - "learning_rate": 3.5531835954222443e-06, - "loss": 0.3029, - "step": 23600 - }, - { - "epoch": 0.65, - "learning_rate": 3.5517566140586206e-06, - "loss": 0.1306, - "step": 23605 - }, - { - "epoch": 0.66, - "learning_rate": 3.550329632694997e-06, - "loss": 0.1171, - "step": 23610 - }, - { - "epoch": 0.66, - "learning_rate": 3.548902651331374e-06, - "loss": 0.1345, - "step": 23615 - }, - { - "epoch": 0.66, - "learning_rate": 3.5474756699677505e-06, - "loss": 0.1034, - "step": 23620 - }, - { - "epoch": 0.66, - "learning_rate": 3.5460486886041272e-06, - "loss": 0.0366, - "step": 23625 - }, - { - "epoch": 0.66, - "learning_rate": 3.5446217072405036e-06, - "loss": 0.0737, - "step": 23630 - }, - { - "epoch": 0.66, - "learning_rate": 3.54319472587688e-06, - "loss": 0.1304, - "step": 23635 - }, - { - "epoch": 0.66, - "learning_rate": 3.541767744513257e-06, - "loss": 0.1246, - "step": 23640 - }, - { - "epoch": 0.66, - "learning_rate": 3.5403407631496334e-06, - "loss": 0.306, - "step": 23645 - }, - { - "epoch": 0.66, - "learning_rate": 3.53891378178601e-06, - "loss": 0.4532, - "step": 23650 - }, - { - "epoch": 0.66, - "learning_rate": 3.5374868004223865e-06, - "loss": 0.284, - "step": 23655 - }, - { - "epoch": 0.66, - "learning_rate": 3.5360598190587637e-06, - "loss": 0.1246, - "step": 23660 - }, - { - "epoch": 0.66, - "learning_rate": 3.53463283769514e-06, - "loss": 0.1596, - "step": 23665 - }, - { - "epoch": 0.66, - "learning_rate": 3.5332058563315164e-06, - "loss": 0.1537, - "step": 23670 - }, - { - "epoch": 0.66, - "learning_rate": 3.531778874967893e-06, - "loss": 0.0664, - "step": 23675 - }, - { - "epoch": 0.66, - "learning_rate": 3.5303518936042695e-06, - "loss": 0.2958, - "step": 23680 - }, - { - "epoch": 0.66, - "learning_rate": 3.5289249122406467e-06, - "loss": 0.0775, - "step": 23685 - }, - { - "epoch": 0.66, - "learning_rate": 3.527497930877023e-06, - "loss": 0.1909, - "step": 23690 - }, - { - "epoch": 0.66, - "learning_rate": 3.5260709495133998e-06, - "loss": 0.5231, - "step": 23695 - }, - { - "epoch": 0.66, - "learning_rate": 3.524643968149776e-06, - "loss": 0.3175, - "step": 23700 - }, - { - "epoch": 0.66, - "learning_rate": 3.5232169867861524e-06, - "loss": 0.1515, - "step": 23705 - }, - { - "epoch": 0.66, - "learning_rate": 3.5217900054225296e-06, - "loss": 0.1724, - "step": 23710 - }, - { - "epoch": 0.66, - "learning_rate": 3.520363024058906e-06, - "loss": 0.133, - "step": 23715 - }, - { - "epoch": 0.66, - "learning_rate": 3.5189360426952827e-06, - "loss": 0.1605, - "step": 23720 - }, - { - "epoch": 0.66, - "learning_rate": 3.517509061331659e-06, - "loss": 0.1722, - "step": 23725 - }, - { - "epoch": 0.66, - "learning_rate": 3.516082079968036e-06, - "loss": 0.0575, - "step": 23730 - }, - { - "epoch": 0.66, - "learning_rate": 3.5146550986044126e-06, - "loss": 0.0801, - "step": 23735 - }, - { - "epoch": 0.66, - "learning_rate": 3.513228117240789e-06, - "loss": 0.2827, - "step": 23740 - }, - { - "epoch": 0.66, - "learning_rate": 3.5118011358771657e-06, - "loss": 0.1989, - "step": 23745 - }, - { - "epoch": 0.66, - "learning_rate": 3.510374154513542e-06, - "loss": 0.3007, - "step": 23750 - }, - { - "epoch": 0.66, - "learning_rate": 3.5089471731499192e-06, - "loss": 0.0585, - "step": 23755 - }, - { - "epoch": 0.66, - "learning_rate": 3.5075201917862956e-06, - "loss": 0.1668, - "step": 23760 - }, - { - "epoch": 0.66, - "learning_rate": 3.506093210422672e-06, - "loss": 0.1849, - "step": 23765 - }, - { - "epoch": 0.66, - "learning_rate": 3.5046662290590487e-06, - "loss": 0.1545, - "step": 23770 - }, - { - "epoch": 0.66, - "learning_rate": 3.5032392476954254e-06, - "loss": 0.0453, - "step": 23775 - }, - { - "epoch": 0.66, - "learning_rate": 3.501812266331802e-06, - "loss": 0.091, - "step": 23780 - }, - { - "epoch": 0.66, - "learning_rate": 3.5003852849681785e-06, - "loss": 0.1137, - "step": 23785 - }, - { - "epoch": 0.66, - "learning_rate": 3.4989583036045553e-06, - "loss": 0.1104, - "step": 23790 - }, - { - "epoch": 0.66, - "learning_rate": 3.497531322240932e-06, - "loss": 0.1074, - "step": 23795 - }, - { - "epoch": 0.66, - "learning_rate": 3.4961043408773084e-06, - "loss": 0.5004, - "step": 23800 - }, - { - "epoch": 0.66, - "learning_rate": 3.494677359513685e-06, - "loss": 0.0985, - "step": 23805 - }, - { - "epoch": 0.66, - "learning_rate": 3.4932503781500615e-06, - "loss": 0.1606, - "step": 23810 - }, - { - "epoch": 0.66, - "learning_rate": 3.4918233967864382e-06, - "loss": 0.1426, - "step": 23815 - }, - { - "epoch": 0.66, - "learning_rate": 3.490396415422815e-06, - "loss": 0.1338, - "step": 23820 - }, - { - "epoch": 0.66, - "learning_rate": 3.4889694340591913e-06, - "loss": 0.1647, - "step": 23825 - }, - { - "epoch": 0.66, - "learning_rate": 3.487542452695568e-06, - "loss": 0.0531, - "step": 23830 - }, - { - "epoch": 0.66, - "learning_rate": 3.4861154713319444e-06, - "loss": 0.061, - "step": 23835 - }, - { - "epoch": 0.66, - "learning_rate": 3.4846884899683216e-06, - "loss": 0.1268, - "step": 23840 - }, - { - "epoch": 0.66, - "learning_rate": 3.483261508604698e-06, - "loss": 0.166, - "step": 23845 - }, - { - "epoch": 0.66, - "learning_rate": 3.4818345272410747e-06, - "loss": 0.5046, - "step": 23850 - }, - { - "epoch": 0.66, - "learning_rate": 3.480407545877451e-06, - "loss": 0.1384, - "step": 23855 - }, - { - "epoch": 0.66, - "learning_rate": 3.4789805645138274e-06, - "loss": 0.1635, - "step": 23860 - }, - { - "epoch": 0.66, - "learning_rate": 3.4775535831502046e-06, - "loss": 0.1346, - "step": 23865 - }, - { - "epoch": 0.66, - "learning_rate": 3.476126601786581e-06, - "loss": 0.1902, - "step": 23870 - }, - { - "epoch": 0.66, - "learning_rate": 3.4746996204229577e-06, - "loss": 0.0762, - "step": 23875 - }, - { - "epoch": 0.66, - "learning_rate": 3.473272639059334e-06, - "loss": 0.027, - "step": 23880 - }, - { - "epoch": 0.66, - "learning_rate": 3.4718456576957112e-06, - "loss": 0.3273, - "step": 23885 - }, - { - "epoch": 0.66, - "learning_rate": 3.4704186763320876e-06, - "loss": 0.1416, - "step": 23890 - }, - { - "epoch": 0.66, - "learning_rate": 3.468991694968464e-06, - "loss": 0.4064, - "step": 23895 - }, - { - "epoch": 0.66, - "learning_rate": 3.4675647136048407e-06, - "loss": 0.4853, - "step": 23900 - }, - { - "epoch": 0.66, - "learning_rate": 3.466137732241217e-06, - "loss": 0.1373, - "step": 23905 - }, - { - "epoch": 0.66, - "learning_rate": 3.464710750877594e-06, - "loss": 0.1968, - "step": 23910 - }, - { - "epoch": 0.66, - "learning_rate": 3.4632837695139705e-06, - "loss": 0.1565, - "step": 23915 - }, - { - "epoch": 0.66, - "learning_rate": 3.4618567881503473e-06, - "loss": 0.206, - "step": 23920 - }, - { - "epoch": 0.66, - "learning_rate": 3.4604298067867236e-06, - "loss": 0.1417, - "step": 23925 - }, - { - "epoch": 0.66, - "learning_rate": 3.4590028254231e-06, - "loss": 0.1064, - "step": 23930 - }, - { - "epoch": 0.66, - "learning_rate": 3.457575844059477e-06, - "loss": 0.0539, - "step": 23935 - }, - { - "epoch": 0.66, - "learning_rate": 3.4561488626958535e-06, - "loss": 0.1214, - "step": 23940 - }, - { - "epoch": 0.66, - "learning_rate": 3.4547218813322303e-06, - "loss": 0.0785, - "step": 23945 - }, - { - "epoch": 0.66, - "learning_rate": 3.4532948999686066e-06, - "loss": 0.375, - "step": 23950 - }, - { - "epoch": 0.66, - "learning_rate": 3.451867918604983e-06, - "loss": 0.1294, - "step": 23955 - }, - { - "epoch": 0.66, - "learning_rate": 3.45044093724136e-06, - "loss": 0.1702, - "step": 23960 - }, - { - "epoch": 0.66, - "learning_rate": 3.4490139558777365e-06, - "loss": 0.1358, - "step": 23965 - }, - { - "epoch": 0.67, - "learning_rate": 3.4475869745141132e-06, - "loss": 0.1221, - "step": 23970 - }, - { - "epoch": 0.67, - "learning_rate": 3.4461599931504896e-06, - "loss": 0.1358, - "step": 23975 - }, - { - "epoch": 0.67, - "learning_rate": 3.4447330117868667e-06, - "loss": 0.1159, - "step": 23980 - }, - { - "epoch": 0.67, - "learning_rate": 3.443306030423243e-06, - "loss": 0.0946, - "step": 23985 - }, - { - "epoch": 0.67, - "learning_rate": 3.4418790490596194e-06, - "loss": 0.0759, - "step": 23990 - }, - { - "epoch": 0.67, - "learning_rate": 3.440452067695996e-06, - "loss": 0.2981, - "step": 23995 - }, - { - "epoch": 0.67, - "learning_rate": 3.4390250863323725e-06, - "loss": 0.521, - "step": 24000 - }, - { - "epoch": 0.67, - "eval_loss": 0.061234455555677414, - "eval_runtime": 1558.3951, - "eval_samples_per_second": 10.279, - "eval_steps_per_second": 2.57, - "eval_wer": 0.1717273710782546, - "step": 24000 - }, - { - "epoch": 0.67, - "learning_rate": 3.4375981049687497e-06, - "loss": 0.1503, - "step": 24005 - }, - { - "epoch": 0.67, - "learning_rate": 3.436171123605126e-06, - "loss": 0.1167, - "step": 24010 - }, - { - "epoch": 0.67, - "learning_rate": 3.434744142241503e-06, - "loss": 0.1155, - "step": 24015 - }, - { - "epoch": 0.67, - "learning_rate": 3.433317160877879e-06, - "loss": 0.133, - "step": 24020 - }, - { - "epoch": 0.67, - "learning_rate": 3.4318901795142555e-06, - "loss": 0.1115, - "step": 24025 - }, - { - "epoch": 0.67, - "learning_rate": 3.4304631981506327e-06, - "loss": 0.1889, - "step": 24030 - }, - { - "epoch": 0.67, - "learning_rate": 3.429036216787009e-06, - "loss": 0.0863, - "step": 24035 - }, - { - "epoch": 0.67, - "learning_rate": 3.4276092354233858e-06, - "loss": 0.3958, - "step": 24040 - }, - { - "epoch": 0.67, - "learning_rate": 3.426182254059762e-06, - "loss": 0.3577, - "step": 24045 - }, - { - "epoch": 0.67, - "learning_rate": 3.4247552726961384e-06, - "loss": 0.49, - "step": 24050 - }, - { - "epoch": 0.67, - "learning_rate": 3.4233282913325156e-06, - "loss": 0.1459, - "step": 24055 - }, - { - "epoch": 0.67, - "learning_rate": 3.421901309968892e-06, - "loss": 0.1008, - "step": 24060 - }, - { - "epoch": 0.67, - "learning_rate": 3.4204743286052687e-06, - "loss": 0.1263, - "step": 24065 - }, - { - "epoch": 0.67, - "learning_rate": 3.419047347241645e-06, - "loss": 0.152, - "step": 24070 - }, - { - "epoch": 0.67, - "learning_rate": 3.4176203658780223e-06, - "loss": 0.1596, - "step": 24075 - }, - { - "epoch": 0.67, - "learning_rate": 3.4161933845143986e-06, - "loss": 0.0835, - "step": 24080 - }, - { - "epoch": 0.67, - "learning_rate": 3.414766403150775e-06, - "loss": 0.1273, - "step": 24085 - }, - { - "epoch": 0.67, - "learning_rate": 3.4133394217871517e-06, - "loss": 0.1407, - "step": 24090 - }, - { - "epoch": 0.67, - "learning_rate": 3.411912440423528e-06, - "loss": 0.2252, - "step": 24095 - }, - { - "epoch": 0.67, - "learning_rate": 3.4104854590599052e-06, - "loss": 0.2954, - "step": 24100 - }, - { - "epoch": 0.67, - "learning_rate": 3.4090584776962816e-06, - "loss": 0.2298, - "step": 24105 - }, - { - "epoch": 0.67, - "learning_rate": 3.4076314963326583e-06, - "loss": 0.0906, - "step": 24110 - }, - { - "epoch": 0.67, - "learning_rate": 3.4062045149690347e-06, - "loss": 0.1589, - "step": 24115 - }, - { - "epoch": 0.67, - "learning_rate": 3.404777533605411e-06, - "loss": 0.173, - "step": 24120 - }, - { - "epoch": 0.67, - "learning_rate": 3.403350552241788e-06, - "loss": 0.113, - "step": 24125 - }, - { - "epoch": 0.67, - "learning_rate": 3.4019235708781645e-06, - "loss": 0.1035, - "step": 24130 - }, - { - "epoch": 0.67, - "learning_rate": 3.4004965895145413e-06, - "loss": 0.1338, - "step": 24135 - }, - { - "epoch": 0.67, - "learning_rate": 3.3990696081509176e-06, - "loss": 0.17, - "step": 24140 - }, - { - "epoch": 0.67, - "learning_rate": 3.397642626787294e-06, - "loss": 0.0888, - "step": 24145 - }, - { - "epoch": 0.67, - "learning_rate": 3.396215645423671e-06, - "loss": 0.2657, - "step": 24150 - }, - { - "epoch": 0.67, - "learning_rate": 3.3947886640600475e-06, - "loss": 0.1518, - "step": 24155 - }, - { - "epoch": 0.67, - "learning_rate": 3.3933616826964242e-06, - "loss": 0.1659, - "step": 24160 - }, - { - "epoch": 0.67, - "learning_rate": 3.3919347013328006e-06, - "loss": 0.148, - "step": 24165 - }, - { - "epoch": 0.67, - "learning_rate": 3.3905077199691778e-06, - "loss": 0.2036, - "step": 24170 - }, - { - "epoch": 0.67, - "learning_rate": 3.389080738605554e-06, - "loss": 0.1084, - "step": 24175 - }, - { - "epoch": 0.67, - "learning_rate": 3.3876537572419305e-06, - "loss": 0.1029, - "step": 24180 - }, - { - "epoch": 0.67, - "learning_rate": 3.3862267758783072e-06, - "loss": 0.0879, - "step": 24185 - }, - { - "epoch": 0.67, - "learning_rate": 3.384799794514684e-06, - "loss": 0.2674, - "step": 24190 - }, - { - "epoch": 0.67, - "learning_rate": 3.3833728131510607e-06, - "loss": 0.2432, - "step": 24195 - }, - { - "epoch": 0.67, - "learning_rate": 3.381945831787437e-06, - "loss": 0.6116, - "step": 24200 - }, - { - "epoch": 0.67, - "learning_rate": 3.380518850423814e-06, - "loss": 0.1596, - "step": 24205 - }, - { - "epoch": 0.67, - "learning_rate": 3.37909186906019e-06, - "loss": 0.1456, - "step": 24210 - }, - { - "epoch": 0.67, - "learning_rate": 3.377664887696567e-06, - "loss": 0.1003, - "step": 24215 - }, - { - "epoch": 0.67, - "learning_rate": 3.3762379063329437e-06, - "loss": 0.177, - "step": 24220 - }, - { - "epoch": 0.67, - "learning_rate": 3.37481092496932e-06, - "loss": 0.1047, - "step": 24225 - }, - { - "epoch": 0.67, - "learning_rate": 3.373383943605697e-06, - "loss": 0.0667, - "step": 24230 - }, - { - "epoch": 0.67, - "learning_rate": 3.3719569622420736e-06, - "loss": 0.1686, - "step": 24235 - }, - { - "epoch": 0.67, - "learning_rate": 3.37052998087845e-06, - "loss": 0.0855, - "step": 24240 - }, - { - "epoch": 0.67, - "learning_rate": 3.3691029995148267e-06, - "loss": 0.1652, - "step": 24245 - }, - { - "epoch": 0.67, - "learning_rate": 3.367676018151203e-06, - "loss": 0.3478, - "step": 24250 - }, - { - "epoch": 0.67, - "learning_rate": 3.3662490367875798e-06, - "loss": 0.0967, - "step": 24255 - }, - { - "epoch": 0.67, - "learning_rate": 3.3648220554239565e-06, - "loss": 0.1227, - "step": 24260 - }, - { - "epoch": 0.67, - "learning_rate": 3.3633950740603333e-06, - "loss": 0.1537, - "step": 24265 - }, - { - "epoch": 0.67, - "learning_rate": 3.3619680926967096e-06, - "loss": 0.1587, - "step": 24270 - }, - { - "epoch": 0.67, - "learning_rate": 3.360541111333086e-06, - "loss": 0.0498, - "step": 24275 - }, - { - "epoch": 0.67, - "learning_rate": 3.359114129969463e-06, - "loss": 0.0124, - "step": 24280 - }, - { - "epoch": 0.67, - "learning_rate": 3.3576871486058395e-06, - "loss": 0.0995, - "step": 24285 - }, - { - "epoch": 0.67, - "learning_rate": 3.3562601672422163e-06, - "loss": 0.17, - "step": 24290 - }, - { - "epoch": 0.67, - "learning_rate": 3.3548331858785926e-06, - "loss": 0.2525, - "step": 24295 - }, - { - "epoch": 0.67, - "learning_rate": 3.3534062045149694e-06, - "loss": 0.3695, - "step": 24300 - }, - { - "epoch": 0.67, - "learning_rate": 3.351979223151346e-06, - "loss": 0.1427, - "step": 24305 - }, - { - "epoch": 0.67, - "learning_rate": 3.3505522417877225e-06, - "loss": 0.123, - "step": 24310 - }, - { - "epoch": 0.67, - "learning_rate": 3.3491252604240992e-06, - "loss": 0.1756, - "step": 24315 - }, - { - "epoch": 0.67, - "learning_rate": 3.3476982790604756e-06, - "loss": 0.2576, - "step": 24320 - }, - { - "epoch": 0.67, - "learning_rate": 3.3462712976968527e-06, - "loss": 0.1732, - "step": 24325 - }, - { - "epoch": 0.68, - "learning_rate": 3.344844316333229e-06, - "loss": 0.082, - "step": 24330 - }, - { - "epoch": 0.68, - "learning_rate": 3.3434173349696054e-06, - "loss": 0.0868, - "step": 24335 - }, - { - "epoch": 0.68, - "learning_rate": 3.341990353605982e-06, - "loss": 0.2351, - "step": 24340 - }, - { - "epoch": 0.68, - "learning_rate": 3.3405633722423585e-06, - "loss": 0.1013, - "step": 24345 - }, - { - "epoch": 0.68, - "learning_rate": 3.3391363908787357e-06, - "loss": 0.2214, - "step": 24350 - }, - { - "epoch": 0.68, - "learning_rate": 3.337709409515112e-06, - "loss": 0.1216, - "step": 24355 - }, - { - "epoch": 0.68, - "learning_rate": 3.336282428151489e-06, - "loss": 0.1518, - "step": 24360 - }, - { - "epoch": 0.68, - "learning_rate": 3.334855446787865e-06, - "loss": 0.1282, - "step": 24365 - }, - { - "epoch": 0.68, - "learning_rate": 3.3334284654242415e-06, - "loss": 0.2552, - "step": 24370 - }, - { - "epoch": 0.68, - "learning_rate": 3.3320014840606187e-06, - "loss": 0.1445, - "step": 24375 - }, - { - "epoch": 0.68, - "learning_rate": 3.330574502696995e-06, - "loss": 0.1411, - "step": 24380 - }, - { - "epoch": 0.68, - "learning_rate": 3.3291475213333718e-06, - "loss": 0.1767, - "step": 24385 - }, - { - "epoch": 0.68, - "learning_rate": 3.327720539969748e-06, - "loss": 0.1734, - "step": 24390 - }, - { - "epoch": 0.68, - "learning_rate": 3.3262935586061253e-06, - "loss": 0.2567, - "step": 24395 - }, - { - "epoch": 0.68, - "learning_rate": 3.3248665772425016e-06, - "loss": 0.3992, - "step": 24400 - }, - { - "epoch": 0.68, - "learning_rate": 3.323439595878878e-06, - "loss": 0.1647, - "step": 24405 - }, - { - "epoch": 0.68, - "learning_rate": 3.3220126145152547e-06, - "loss": 0.1232, - "step": 24410 - }, - { - "epoch": 0.68, - "learning_rate": 3.320585633151631e-06, - "loss": 0.1844, - "step": 24415 - }, - { - "epoch": 0.68, - "learning_rate": 3.3191586517880083e-06, - "loss": 0.1531, - "step": 24420 - }, - { - "epoch": 0.68, - "learning_rate": 3.3177316704243846e-06, - "loss": 0.0488, - "step": 24425 - }, - { - "epoch": 0.68, - "learning_rate": 3.316304689060761e-06, - "loss": 0.1118, - "step": 24430 - }, - { - "epoch": 0.68, - "learning_rate": 3.3148777076971377e-06, - "loss": 0.2331, - "step": 24435 - }, - { - "epoch": 0.68, - "learning_rate": 3.313450726333514e-06, - "loss": 0.2966, - "step": 24440 - }, - { - "epoch": 0.68, - "learning_rate": 3.3120237449698912e-06, - "loss": 0.2844, - "step": 24445 - }, - { - "epoch": 0.68, - "learning_rate": 3.3105967636062676e-06, - "loss": 0.6628, - "step": 24450 - }, - { - "epoch": 0.68, - "learning_rate": 3.3091697822426443e-06, - "loss": 0.1269, - "step": 24455 - }, - { - "epoch": 0.68, - "learning_rate": 3.3077428008790207e-06, - "loss": 0.1566, - "step": 24460 - }, - { - "epoch": 0.68, - "learning_rate": 3.306315819515397e-06, - "loss": 0.2109, - "step": 24465 - }, - { - "epoch": 0.68, - "learning_rate": 3.304888838151774e-06, - "loss": 0.2047, - "step": 24470 - }, - { - "epoch": 0.68, - "learning_rate": 3.3034618567881505e-06, - "loss": 0.1145, - "step": 24475 - }, - { - "epoch": 0.68, - "learning_rate": 3.3020348754245273e-06, - "loss": 0.0569, - "step": 24480 - }, - { - "epoch": 0.68, - "learning_rate": 3.3006078940609036e-06, - "loss": 0.1161, - "step": 24485 - }, - { - "epoch": 0.68, - "learning_rate": 3.299180912697281e-06, - "loss": 0.2084, - "step": 24490 - }, - { - "epoch": 0.68, - "learning_rate": 3.297753931333657e-06, - "loss": 0.2207, - "step": 24495 - }, - { - "epoch": 0.68, - "learning_rate": 3.2963269499700335e-06, - "loss": 0.6217, - "step": 24500 - }, - { - "epoch": 0.68, - "learning_rate": 3.2948999686064102e-06, - "loss": 0.093, - "step": 24505 - }, - { - "epoch": 0.68, - "learning_rate": 3.2934729872427866e-06, - "loss": 0.0841, - "step": 24510 - }, - { - "epoch": 0.68, - "learning_rate": 3.2920460058791638e-06, - "loss": 0.2002, - "step": 24515 - }, - { - "epoch": 0.68, - "learning_rate": 3.29061902451554e-06, - "loss": 0.1339, - "step": 24520 - }, - { - "epoch": 0.68, - "learning_rate": 3.289192043151917e-06, - "loss": 0.1352, - "step": 24525 - }, - { - "epoch": 0.68, - "learning_rate": 3.2877650617882932e-06, - "loss": 0.1269, - "step": 24530 - }, - { - "epoch": 0.68, - "learning_rate": 3.2863380804246696e-06, - "loss": 0.0433, - "step": 24535 - }, - { - "epoch": 0.68, - "learning_rate": 3.2849110990610467e-06, - "loss": 0.2801, - "step": 24540 - }, - { - "epoch": 0.68, - "learning_rate": 3.283484117697423e-06, - "loss": 0.2385, - "step": 24545 - }, - { - "epoch": 0.68, - "learning_rate": 3.2820571363338e-06, - "loss": 0.2845, - "step": 24550 - }, - { - "epoch": 0.68, - "learning_rate": 3.280630154970176e-06, - "loss": 0.0912, - "step": 24555 - }, - { - "epoch": 0.68, - "learning_rate": 3.2792031736065525e-06, - "loss": 0.1496, - "step": 24560 - }, - { - "epoch": 0.68, - "learning_rate": 3.2777761922429297e-06, - "loss": 0.2442, - "step": 24565 - }, - { - "epoch": 0.68, - "learning_rate": 3.276349210879306e-06, - "loss": 0.1874, - "step": 24570 - }, - { - "epoch": 0.68, - "learning_rate": 3.274922229515683e-06, - "loss": 0.1175, - "step": 24575 - }, - { - "epoch": 0.68, - "learning_rate": 3.273495248152059e-06, - "loss": 0.0182, - "step": 24580 - }, - { - "epoch": 0.68, - "learning_rate": 3.2720682667884363e-06, - "loss": 0.2497, - "step": 24585 - }, - { - "epoch": 0.68, - "learning_rate": 3.2706412854248127e-06, - "loss": 0.1674, - "step": 24590 - }, - { - "epoch": 0.68, - "learning_rate": 3.269214304061189e-06, - "loss": 0.1815, - "step": 24595 - }, - { - "epoch": 0.68, - "learning_rate": 3.2677873226975658e-06, - "loss": 0.37, - "step": 24600 - }, - { - "epoch": 0.68, - "learning_rate": 3.266360341333942e-06, - "loss": 0.1292, - "step": 24605 - }, - { - "epoch": 0.68, - "learning_rate": 3.2649333599703193e-06, - "loss": 0.1061, - "step": 24610 - }, - { - "epoch": 0.68, - "learning_rate": 3.2635063786066956e-06, - "loss": 0.1565, - "step": 24615 - }, - { - "epoch": 0.68, - "learning_rate": 3.2620793972430724e-06, - "loss": 0.1779, - "step": 24620 - }, - { - "epoch": 0.68, - "learning_rate": 3.2606524158794487e-06, - "loss": 0.1077, - "step": 24625 - }, - { - "epoch": 0.68, - "learning_rate": 3.2592254345158255e-06, - "loss": 0.0938, - "step": 24630 - }, - { - "epoch": 0.68, - "learning_rate": 3.2577984531522023e-06, - "loss": 0.1082, - "step": 24635 - }, - { - "epoch": 0.68, - "learning_rate": 3.2563714717885786e-06, - "loss": 0.0819, - "step": 24640 - }, - { - "epoch": 0.68, - "learning_rate": 3.2549444904249554e-06, - "loss": 0.4498, - "step": 24645 - }, - { - "epoch": 0.68, - "learning_rate": 3.2535175090613317e-06, - "loss": 0.6766, - "step": 24650 - }, - { - "epoch": 0.68, - "learning_rate": 3.2520905276977085e-06, - "loss": 0.1111, - "step": 24655 - }, - { - "epoch": 0.68, - "learning_rate": 3.2506635463340852e-06, - "loss": 0.1768, - "step": 24660 - }, - { - "epoch": 0.68, - "learning_rate": 3.2492365649704616e-06, - "loss": 0.1568, - "step": 24665 - }, - { - "epoch": 0.68, - "learning_rate": 3.2478095836068383e-06, - "loss": 0.1591, - "step": 24670 - }, - { - "epoch": 0.68, - "learning_rate": 3.246382602243215e-06, - "loss": 0.1138, - "step": 24675 - }, - { - "epoch": 0.68, - "learning_rate": 3.244955620879592e-06, - "loss": 0.1041, - "step": 24680 - }, - { - "epoch": 0.68, - "learning_rate": 3.243528639515968e-06, - "loss": 0.0842, - "step": 24685 - }, - { - "epoch": 0.69, - "learning_rate": 3.2421016581523445e-06, - "loss": 0.181, - "step": 24690 - }, - { - "epoch": 0.69, - "learning_rate": 3.2406746767887217e-06, - "loss": 0.1652, - "step": 24695 - }, - { - "epoch": 0.69, - "learning_rate": 3.239247695425098e-06, - "loss": 0.4201, - "step": 24700 - }, - { - "epoch": 0.69, - "learning_rate": 3.237820714061475e-06, - "loss": 0.1204, - "step": 24705 - }, - { - "epoch": 0.69, - "learning_rate": 3.236393732697851e-06, - "loss": 0.1886, - "step": 24710 - }, - { - "epoch": 0.69, - "learning_rate": 3.234966751334228e-06, - "loss": 0.1273, - "step": 24715 - }, - { - "epoch": 0.69, - "learning_rate": 3.2335397699706047e-06, - "loss": 0.168, - "step": 24720 - }, - { - "epoch": 0.69, - "learning_rate": 3.232112788606981e-06, - "loss": 0.2194, - "step": 24725 - }, - { - "epoch": 0.69, - "learning_rate": 3.2306858072433578e-06, - "loss": 0.1397, - "step": 24730 - }, - { - "epoch": 0.69, - "learning_rate": 3.229258825879734e-06, - "loss": 0.1028, - "step": 24735 - }, - { - "epoch": 0.69, - "learning_rate": 3.2278318445161113e-06, - "loss": 0.2445, - "step": 24740 - }, - { - "epoch": 0.69, - "learning_rate": 3.2264048631524876e-06, - "loss": 0.1483, - "step": 24745 - }, - { - "epoch": 0.69, - "learning_rate": 3.224977881788864e-06, - "loss": 0.4142, - "step": 24750 - }, - { - "epoch": 0.69, - "learning_rate": 3.2235509004252407e-06, - "loss": 0.1048, - "step": 24755 - }, - { - "epoch": 0.69, - "learning_rate": 3.222123919061617e-06, - "loss": 0.1253, - "step": 24760 - }, - { - "epoch": 0.69, - "learning_rate": 3.2206969376979943e-06, - "loss": 0.1067, - "step": 24765 - }, - { - "epoch": 0.69, - "learning_rate": 3.2192699563343706e-06, - "loss": 0.1786, - "step": 24770 - }, - { - "epoch": 0.69, - "learning_rate": 3.2178429749707474e-06, - "loss": 0.1778, - "step": 24775 - }, - { - "epoch": 0.69, - "learning_rate": 3.2164159936071237e-06, - "loss": 0.1355, - "step": 24780 - }, - { - "epoch": 0.69, - "learning_rate": 3.2149890122435e-06, - "loss": 0.1129, - "step": 24785 - }, - { - "epoch": 0.69, - "learning_rate": 3.2135620308798772e-06, - "loss": 0.1761, - "step": 24790 - }, - { - "epoch": 0.69, - "learning_rate": 3.2121350495162536e-06, - "loss": 0.2162, - "step": 24795 - }, - { - "epoch": 0.69, - "learning_rate": 3.2107080681526303e-06, - "loss": 0.4048, - "step": 24800 - }, - { - "epoch": 0.69, - "learning_rate": 3.2092810867890067e-06, - "loss": 0.1602, - "step": 24805 - }, - { - "epoch": 0.69, - "learning_rate": 3.207854105425384e-06, - "loss": 0.1191, - "step": 24810 - }, - { - "epoch": 0.69, - "learning_rate": 3.20642712406176e-06, - "loss": 0.1368, - "step": 24815 - }, - { - "epoch": 0.69, - "learning_rate": 3.2050001426981365e-06, - "loss": 0.1553, - "step": 24820 - }, - { - "epoch": 0.69, - "learning_rate": 3.2035731613345133e-06, - "loss": 0.0768, - "step": 24825 - }, - { - "epoch": 0.69, - "learning_rate": 3.2021461799708896e-06, - "loss": 0.0305, - "step": 24830 - }, - { - "epoch": 0.69, - "learning_rate": 3.200719198607267e-06, - "loss": 0.2172, - "step": 24835 - }, - { - "epoch": 0.69, - "learning_rate": 3.199292217243643e-06, - "loss": 0.2116, - "step": 24840 - }, - { - "epoch": 0.69, - "learning_rate": 3.1978652358800195e-06, - "loss": 0.1883, - "step": 24845 - }, - { - "epoch": 0.69, - "learning_rate": 3.1964382545163963e-06, - "loss": 0.3431, - "step": 24850 - }, - { - "epoch": 0.69, - "learning_rate": 3.1950112731527726e-06, - "loss": 0.1449, - "step": 24855 - }, - { - "epoch": 0.69, - "learning_rate": 3.1935842917891498e-06, - "loss": 0.1767, - "step": 24860 - }, - { - "epoch": 0.69, - "learning_rate": 3.192157310425526e-06, - "loss": 0.1833, - "step": 24865 - }, - { - "epoch": 0.69, - "learning_rate": 3.190730329061903e-06, - "loss": 0.163, - "step": 24870 - }, - { - "epoch": 0.69, - "learning_rate": 3.1893033476982792e-06, - "loss": 0.1874, - "step": 24875 - }, - { - "epoch": 0.69, - "learning_rate": 3.1878763663346556e-06, - "loss": 0.1119, - "step": 24880 - }, - { - "epoch": 0.69, - "learning_rate": 3.1864493849710327e-06, - "loss": 0.1364, - "step": 24885 - }, - { - "epoch": 0.69, - "learning_rate": 3.185022403607409e-06, - "loss": 0.1162, - "step": 24890 - }, - { - "epoch": 0.69, - "learning_rate": 3.183595422243786e-06, - "loss": 0.2754, - "step": 24895 - }, - { - "epoch": 0.69, - "learning_rate": 3.182168440880162e-06, - "loss": 0.4152, - "step": 24900 - }, - { - "epoch": 0.69, - "learning_rate": 3.1807414595165394e-06, - "loss": 0.0828, - "step": 24905 - }, - { - "epoch": 0.69, - "learning_rate": 3.1793144781529157e-06, - "loss": 0.1073, - "step": 24910 - }, - { - "epoch": 0.69, - "learning_rate": 3.177887496789292e-06, - "loss": 0.0854, - "step": 24915 - }, - { - "epoch": 0.69, - "learning_rate": 3.176460515425669e-06, - "loss": 0.1355, - "step": 24920 - }, - { - "epoch": 0.69, - "learning_rate": 3.175033534062045e-06, - "loss": 0.1573, - "step": 24925 - }, - { - "epoch": 0.69, - "learning_rate": 3.1736065526984223e-06, - "loss": 0.1358, - "step": 24930 - }, - { - "epoch": 0.69, - "learning_rate": 3.1721795713347987e-06, - "loss": 0.0669, - "step": 24935 - }, - { - "epoch": 0.69, - "learning_rate": 3.170752589971175e-06, - "loss": 0.1749, - "step": 24940 - }, - { - "epoch": 0.69, - "learning_rate": 3.1693256086075518e-06, - "loss": 0.1238, - "step": 24945 - }, - { - "epoch": 0.69, - "learning_rate": 3.1681840235166534e-06, - "loss": 0.5303, - "step": 24950 - }, - { - "epoch": 0.69, - "learning_rate": 3.1667570421530298e-06, - "loss": 0.1184, - "step": 24955 - }, - { - "epoch": 0.69, - "learning_rate": 3.165330060789406e-06, - "loss": 0.2232, - "step": 24960 - }, - { - "epoch": 0.69, - "learning_rate": 3.163903079425783e-06, - "loss": 0.1473, - "step": 24965 - }, - { - "epoch": 0.69, - "learning_rate": 3.162476098062159e-06, - "loss": 0.2284, - "step": 24970 - }, - { - "epoch": 0.69, - "learning_rate": 3.1610491166985364e-06, - "loss": 0.1185, - "step": 24975 - }, - { - "epoch": 0.69, - "learning_rate": 3.1596221353349127e-06, - "loss": 0.111, - "step": 24980 - }, - { - "epoch": 0.69, - "learning_rate": 3.1581951539712895e-06, - "loss": 0.1202, - "step": 24985 - }, - { - "epoch": 0.69, - "learning_rate": 3.156768172607666e-06, - "loss": 0.125, - "step": 24990 - }, - { - "epoch": 0.69, - "learning_rate": 3.155341191244042e-06, - "loss": 0.2482, - "step": 24995 - }, - { - "epoch": 0.69, - "learning_rate": 3.1539142098804194e-06, - "loss": 0.3502, - "step": 25000 - }, - { - "epoch": 0.69, - "learning_rate": 3.1524872285167957e-06, - "loss": 0.1993, - "step": 25005 - }, - { - "epoch": 0.69, - "learning_rate": 3.1510602471531725e-06, - "loss": 0.0801, - "step": 25010 - }, - { - "epoch": 0.69, - "learning_rate": 3.149633265789549e-06, - "loss": 0.166, - "step": 25015 - }, - { - "epoch": 0.69, - "learning_rate": 3.148206284425926e-06, - "loss": 0.2255, - "step": 25020 - }, - { - "epoch": 0.69, - "learning_rate": 3.1467793030623023e-06, - "loss": 0.131, - "step": 25025 - }, - { - "epoch": 0.69, - "learning_rate": 3.1453523216986787e-06, - "loss": 0.0902, - "step": 25030 - }, - { - "epoch": 0.69, - "learning_rate": 3.1439253403350554e-06, - "loss": 0.0461, - "step": 25035 - }, - { - "epoch": 0.69, - "learning_rate": 3.1424983589714318e-06, - "loss": 0.2501, - "step": 25040 - }, - { - "epoch": 0.69, - "learning_rate": 3.141071377607809e-06, - "loss": 0.184, - "step": 25045 - }, - { - "epoch": 0.7, - "learning_rate": 3.1396443962441853e-06, - "loss": 0.4096, - "step": 25050 - }, - { - "epoch": 0.7, - "learning_rate": 3.1382174148805616e-06, - "loss": 0.1553, - "step": 25055 - }, - { - "epoch": 0.7, - "learning_rate": 3.1367904335169384e-06, - "loss": 0.1454, - "step": 25060 - }, - { - "epoch": 0.7, - "learning_rate": 3.135363452153315e-06, - "loss": 0.114, - "step": 25065 - }, - { - "epoch": 0.7, - "learning_rate": 3.133936470789692e-06, - "loss": 0.1724, - "step": 25070 - }, - { - "epoch": 0.7, - "learning_rate": 3.1325094894260682e-06, - "loss": 0.028, - "step": 25075 - }, - { - "epoch": 0.7, - "learning_rate": 3.131082508062445e-06, - "loss": 0.1044, - "step": 25080 - }, - { - "epoch": 0.7, - "learning_rate": 3.1296555266988213e-06, - "loss": 0.0878, - "step": 25085 - }, - { - "epoch": 0.7, - "learning_rate": 3.128228545335198e-06, - "loss": 0.274, - "step": 25090 - }, - { - "epoch": 0.7, - "learning_rate": 3.126801563971575e-06, - "loss": 0.2244, - "step": 25095 - }, - { - "epoch": 0.7, - "learning_rate": 3.1253745826079512e-06, - "loss": 0.6099, - "step": 25100 - }, - { - "epoch": 0.7, - "learning_rate": 3.123947601244328e-06, - "loss": 0.1223, - "step": 25105 - }, - { - "epoch": 0.7, - "learning_rate": 3.1225206198807047e-06, - "loss": 0.1702, - "step": 25110 - }, - { - "epoch": 0.7, - "learning_rate": 3.1210936385170815e-06, - "loss": 0.1585, - "step": 25115 - }, - { - "epoch": 0.7, - "learning_rate": 3.119666657153458e-06, - "loss": 0.2234, - "step": 25120 - }, - { - "epoch": 0.7, - "learning_rate": 3.118239675789834e-06, - "loss": 0.1095, - "step": 25125 - }, - { - "epoch": 0.7, - "learning_rate": 3.116812694426211e-06, - "loss": 0.108, - "step": 25130 - }, - { - "epoch": 0.7, - "learning_rate": 3.1153857130625877e-06, - "loss": 0.1036, - "step": 25135 - }, - { - "epoch": 0.7, - "learning_rate": 3.1139587316989645e-06, - "loss": 0.3185, - "step": 25140 - }, - { - "epoch": 0.7, - "learning_rate": 3.112531750335341e-06, - "loss": 0.2863, - "step": 25145 - }, - { - "epoch": 0.7, - "learning_rate": 3.1111047689717176e-06, - "loss": 0.3655, - "step": 25150 - }, - { - "epoch": 0.7, - "learning_rate": 3.1096777876080943e-06, - "loss": 0.0881, - "step": 25155 - }, - { - "epoch": 0.7, - "learning_rate": 3.1082508062444707e-06, - "loss": 0.1322, - "step": 25160 - }, - { - "epoch": 0.7, - "learning_rate": 3.1068238248808474e-06, - "loss": 0.1561, - "step": 25165 - }, - { - "epoch": 0.7, - "learning_rate": 3.1053968435172238e-06, - "loss": 0.1948, - "step": 25170 - }, - { - "epoch": 0.7, - "learning_rate": 3.103969862153601e-06, - "loss": 0.1177, - "step": 25175 - }, - { - "epoch": 0.7, - "learning_rate": 3.1025428807899773e-06, - "loss": 0.1238, - "step": 25180 - }, - { - "epoch": 0.7, - "learning_rate": 3.1011158994263536e-06, - "loss": 0.1788, - "step": 25185 - }, - { - "epoch": 0.7, - "learning_rate": 3.0996889180627304e-06, - "loss": 0.0869, - "step": 25190 - }, - { - "epoch": 0.7, - "learning_rate": 3.0982619366991067e-06, - "loss": 0.1081, - "step": 25195 - }, - { - "epoch": 0.7, - "learning_rate": 3.096834955335484e-06, - "loss": 0.4041, - "step": 25200 - }, - { - "epoch": 0.7, - "learning_rate": 3.0954079739718603e-06, - "loss": 0.1634, - "step": 25205 - }, - { - "epoch": 0.7, - "learning_rate": 3.093980992608237e-06, - "loss": 0.1709, - "step": 25210 - }, - { - "epoch": 0.7, - "learning_rate": 3.0925540112446134e-06, - "loss": 0.1343, - "step": 25215 - }, - { - "epoch": 0.7, - "learning_rate": 3.0911270298809897e-06, - "loss": 0.153, - "step": 25220 - }, - { - "epoch": 0.7, - "learning_rate": 3.089700048517367e-06, - "loss": 0.0494, - "step": 25225 - }, - { - "epoch": 0.7, - "learning_rate": 3.0882730671537432e-06, - "loss": 0.1105, - "step": 25230 - }, - { - "epoch": 0.7, - "learning_rate": 3.08684608579012e-06, - "loss": 0.041, - "step": 25235 - }, - { - "epoch": 0.7, - "learning_rate": 3.0854191044264963e-06, - "loss": 0.1833, - "step": 25240 - }, - { - "epoch": 0.7, - "learning_rate": 3.0839921230628735e-06, - "loss": 0.1466, - "step": 25245 - }, - { - "epoch": 0.7, - "learning_rate": 3.08256514169925e-06, - "loss": 0.44, - "step": 25250 - }, - { - "epoch": 0.7, - "learning_rate": 3.081138160335626e-06, - "loss": 0.1542, - "step": 25255 - }, - { - "epoch": 0.7, - "learning_rate": 3.079711178972003e-06, - "loss": 0.1108, - "step": 25260 - }, - { - "epoch": 0.7, - "learning_rate": 3.0782841976083793e-06, - "loss": 0.1412, - "step": 25265 - }, - { - "epoch": 0.7, - "learning_rate": 3.0768572162447565e-06, - "loss": 0.1025, - "step": 25270 - }, - { - "epoch": 0.7, - "learning_rate": 3.075430234881133e-06, - "loss": 0.0943, - "step": 25275 - }, - { - "epoch": 0.7, - "learning_rate": 3.074003253517509e-06, - "loss": 0.0713, - "step": 25280 - }, - { - "epoch": 0.7, - "learning_rate": 3.072576272153886e-06, - "loss": 0.0824, - "step": 25285 - }, - { - "epoch": 0.7, - "learning_rate": 3.0711492907902622e-06, - "loss": 0.0725, - "step": 25290 - }, - { - "epoch": 0.7, - "learning_rate": 3.0697223094266394e-06, - "loss": 0.3779, - "step": 25295 - }, - { - "epoch": 0.7, - "learning_rate": 3.0682953280630158e-06, - "loss": 0.3996, - "step": 25300 - }, - { - "epoch": 0.7, - "learning_rate": 3.0668683466993925e-06, - "loss": 0.1536, - "step": 25305 - }, - { - "epoch": 0.7, - "learning_rate": 3.065441365335769e-06, - "loss": 0.1816, - "step": 25310 - }, - { - "epoch": 0.7, - "learning_rate": 3.064014383972145e-06, - "loss": 0.1062, - "step": 25315 - }, - { - "epoch": 0.7, - "learning_rate": 3.0625874026085224e-06, - "loss": 0.2004, - "step": 25320 - }, - { - "epoch": 0.7, - "learning_rate": 3.0611604212448987e-06, - "loss": 0.1371, - "step": 25325 - }, - { - "epoch": 0.7, - "learning_rate": 3.0597334398812755e-06, - "loss": 0.0809, - "step": 25330 - }, - { - "epoch": 0.7, - "learning_rate": 3.058306458517652e-06, - "loss": 0.1249, - "step": 25335 - }, - { - "epoch": 0.7, - "learning_rate": 3.056879477154029e-06, - "loss": 0.2874, - "step": 25340 - }, - { - "epoch": 0.7, - "learning_rate": 3.0554524957904054e-06, - "loss": 0.2563, - "step": 25345 - }, - { - "epoch": 0.7, - "learning_rate": 3.0540255144267817e-06, - "loss": 0.3192, - "step": 25350 - }, - { - "epoch": 0.7, - "learning_rate": 3.0525985330631585e-06, - "loss": 0.2538, - "step": 25355 - }, - { - "epoch": 0.7, - "learning_rate": 3.051171551699535e-06, - "loss": 0.157, - "step": 25360 - }, - { - "epoch": 0.7, - "learning_rate": 3.049744570335912e-06, - "loss": 0.1524, - "step": 25365 - }, - { - "epoch": 0.7, - "learning_rate": 3.0483175889722883e-06, - "loss": 0.1248, - "step": 25370 - }, - { - "epoch": 0.7, - "learning_rate": 3.0468906076086647e-06, - "loss": 0.1673, - "step": 25375 - }, - { - "epoch": 0.7, - "learning_rate": 3.0454636262450414e-06, - "loss": 0.0247, - "step": 25380 - }, - { - "epoch": 0.7, - "learning_rate": 3.0440366448814178e-06, - "loss": 0.2293, - "step": 25385 - }, - { - "epoch": 0.7, - "learning_rate": 3.042609663517795e-06, - "loss": 0.184, - "step": 25390 - }, - { - "epoch": 0.7, - "learning_rate": 3.0411826821541713e-06, - "loss": 0.1514, - "step": 25395 - }, - { - "epoch": 0.7, - "learning_rate": 3.039755700790548e-06, - "loss": 0.383, - "step": 25400 - }, - { - "epoch": 0.7, - "learning_rate": 3.0383287194269244e-06, - "loss": 0.0815, - "step": 25405 - }, - { - "epoch": 0.71, - "learning_rate": 3.0369017380633007e-06, - "loss": 0.1618, - "step": 25410 - }, - { - "epoch": 0.71, - "learning_rate": 3.035474756699678e-06, - "loss": 0.1624, - "step": 25415 - }, - { - "epoch": 0.71, - "learning_rate": 3.0340477753360542e-06, - "loss": 0.1379, - "step": 25420 - }, - { - "epoch": 0.71, - "learning_rate": 3.032620793972431e-06, - "loss": 0.0769, - "step": 25425 - }, - { - "epoch": 0.71, - "learning_rate": 3.0311938126088074e-06, - "loss": 0.0432, - "step": 25430 - }, - { - "epoch": 0.71, - "learning_rate": 3.0297668312451845e-06, - "loss": 0.1571, - "step": 25435 - }, - { - "epoch": 0.71, - "learning_rate": 3.028339849881561e-06, - "loss": 0.1198, - "step": 25440 - }, - { - "epoch": 0.71, - "learning_rate": 3.0269128685179372e-06, - "loss": 0.1957, - "step": 25445 - }, - { - "epoch": 0.71, - "learning_rate": 3.025485887154314e-06, - "loss": 0.292, - "step": 25450 - }, - { - "epoch": 0.71, - "learning_rate": 3.0240589057906903e-06, - "loss": 0.108, - "step": 25455 - }, - { - "epoch": 0.71, - "learning_rate": 3.0226319244270675e-06, - "loss": 0.1, - "step": 25460 - }, - { - "epoch": 0.71, - "learning_rate": 3.021204943063444e-06, - "loss": 0.1045, - "step": 25465 - }, - { - "epoch": 0.71, - "learning_rate": 3.01977796169982e-06, - "loss": 0.1527, - "step": 25470 - }, - { - "epoch": 0.71, - "learning_rate": 3.018350980336197e-06, - "loss": 0.1147, - "step": 25475 - }, - { - "epoch": 0.71, - "learning_rate": 3.0169239989725733e-06, - "loss": 0.043, - "step": 25480 - }, - { - "epoch": 0.71, - "learning_rate": 3.0154970176089505e-06, - "loss": 0.0107, - "step": 25485 - }, - { - "epoch": 0.71, - "learning_rate": 3.014070036245327e-06, - "loss": 0.1393, - "step": 25490 - }, - { - "epoch": 0.71, - "learning_rate": 3.0126430548817036e-06, - "loss": 0.2449, - "step": 25495 - }, - { - "epoch": 0.71, - "learning_rate": 3.01121607351808e-06, - "loss": 0.3843, - "step": 25500 - }, - { - "epoch": 0.71, - "learning_rate": 3.0097890921544567e-06, - "loss": 0.0952, - "step": 25505 - }, - { - "epoch": 0.71, - "learning_rate": 3.0083621107908334e-06, - "loss": 0.1409, - "step": 25510 - }, - { - "epoch": 0.71, - "learning_rate": 3.0069351294272098e-06, - "loss": 0.1487, - "step": 25515 - }, - { - "epoch": 0.71, - "learning_rate": 3.0055081480635865e-06, - "loss": 0.151, - "step": 25520 - }, - { - "epoch": 0.71, - "learning_rate": 3.0040811666999633e-06, - "loss": 0.1024, - "step": 25525 - }, - { - "epoch": 0.71, - "learning_rate": 3.00265418533634e-06, - "loss": 0.1171, - "step": 25530 - }, - { - "epoch": 0.71, - "learning_rate": 3.0012272039727164e-06, - "loss": 0.1517, - "step": 25535 - }, - { - "epoch": 0.71, - "learning_rate": 2.9998002226090927e-06, - "loss": 0.3867, - "step": 25540 - }, - { - "epoch": 0.71, - "learning_rate": 2.9983732412454695e-06, - "loss": 0.2584, - "step": 25545 - }, - { - "epoch": 0.71, - "learning_rate": 2.9969462598818463e-06, - "loss": 0.4842, - "step": 25550 - }, - { - "epoch": 0.71, - "learning_rate": 2.995519278518223e-06, - "loss": 0.1562, - "step": 25555 - }, - { - "epoch": 0.71, - "learning_rate": 2.9940922971545994e-06, - "loss": 0.1135, - "step": 25560 - }, - { - "epoch": 0.71, - "learning_rate": 2.9926653157909757e-06, - "loss": 0.1413, - "step": 25565 - }, - { - "epoch": 0.71, - "learning_rate": 2.991238334427353e-06, - "loss": 0.1179, - "step": 25570 - }, - { - "epoch": 0.71, - "learning_rate": 2.9898113530637292e-06, - "loss": 0.1406, - "step": 25575 - }, - { - "epoch": 0.71, - "learning_rate": 2.988384371700106e-06, - "loss": 0.1572, - "step": 25580 - }, - { - "epoch": 0.71, - "learning_rate": 2.9869573903364823e-06, - "loss": 0.1412, - "step": 25585 - }, - { - "epoch": 0.71, - "learning_rate": 2.985530408972859e-06, - "loss": 0.266, - "step": 25590 - }, - { - "epoch": 0.71, - "learning_rate": 2.984103427609236e-06, - "loss": 0.3005, - "step": 25595 - }, - { - "epoch": 0.71, - "learning_rate": 2.982676446245612e-06, - "loss": 0.549, - "step": 25600 - }, - { - "epoch": 0.71, - "learning_rate": 2.981249464881989e-06, - "loss": 0.0852, - "step": 25605 - }, - { - "epoch": 0.71, - "learning_rate": 2.9798224835183653e-06, - "loss": 0.1306, - "step": 25610 - }, - { - "epoch": 0.71, - "learning_rate": 2.9783955021547425e-06, - "loss": 0.0573, - "step": 25615 - }, - { - "epoch": 0.71, - "learning_rate": 2.976968520791119e-06, - "loss": 0.1642, - "step": 25620 - }, - { - "epoch": 0.71, - "learning_rate": 2.9755415394274956e-06, - "loss": 0.1541, - "step": 25625 - }, - { - "epoch": 0.71, - "learning_rate": 2.974114558063872e-06, - "loss": 0.0305, - "step": 25630 - }, - { - "epoch": 0.71, - "learning_rate": 2.9726875767002482e-06, - "loss": 0.2669, - "step": 25635 - }, - { - "epoch": 0.71, - "learning_rate": 2.9712605953366254e-06, - "loss": 0.2604, - "step": 25640 - }, - { - "epoch": 0.71, - "learning_rate": 2.9698336139730018e-06, - "loss": 0.1894, - "step": 25645 - }, - { - "epoch": 0.71, - "learning_rate": 2.9684066326093785e-06, - "loss": 0.5792, - "step": 25650 - }, - { - "epoch": 0.71, - "learning_rate": 2.966979651245755e-06, - "loss": 0.1189, - "step": 25655 - }, - { - "epoch": 0.71, - "learning_rate": 2.965552669882131e-06, - "loss": 0.1772, - "step": 25660 - }, - { - "epoch": 0.71, - "learning_rate": 2.9641256885185084e-06, - "loss": 0.1495, - "step": 25665 - }, - { - "epoch": 0.71, - "learning_rate": 2.9626987071548847e-06, - "loss": 0.1614, - "step": 25670 - }, - { - "epoch": 0.71, - "learning_rate": 2.9612717257912615e-06, - "loss": 0.0493, - "step": 25675 - }, - { - "epoch": 0.71, - "learning_rate": 2.959844744427638e-06, - "loss": 0.0841, - "step": 25680 - }, - { - "epoch": 0.71, - "learning_rate": 2.958417763064015e-06, - "loss": 0.1262, - "step": 25685 - }, - { - "epoch": 0.71, - "learning_rate": 2.9569907817003914e-06, - "loss": 0.2289, - "step": 25690 - }, - { - "epoch": 0.71, - "learning_rate": 2.9555638003367677e-06, - "loss": 0.1331, - "step": 25695 - }, - { - "epoch": 0.71, - "learning_rate": 2.9541368189731445e-06, - "loss": 0.2359, - "step": 25700 - }, - { - "epoch": 0.71, - "learning_rate": 2.952709837609521e-06, - "loss": 0.0779, - "step": 25705 - }, - { - "epoch": 0.71, - "learning_rate": 2.951282856245898e-06, - "loss": 0.115, - "step": 25710 - }, - { - "epoch": 0.71, - "learning_rate": 2.9498558748822743e-06, - "loss": 0.1122, - "step": 25715 - }, - { - "epoch": 0.71, - "learning_rate": 2.948428893518651e-06, - "loss": 0.1536, - "step": 25720 - }, - { - "epoch": 0.71, - "learning_rate": 2.9470019121550274e-06, - "loss": 0.1202, - "step": 25725 - }, - { - "epoch": 0.71, - "learning_rate": 2.9455749307914038e-06, - "loss": 0.0517, - "step": 25730 - }, - { - "epoch": 0.71, - "learning_rate": 2.944147949427781e-06, - "loss": 0.1488, - "step": 25735 - }, - { - "epoch": 0.71, - "learning_rate": 2.9427209680641573e-06, - "loss": 0.2269, - "step": 25740 - }, - { - "epoch": 0.71, - "learning_rate": 2.941293986700534e-06, - "loss": 0.353, - "step": 25745 - }, - { - "epoch": 0.71, - "learning_rate": 2.9398670053369104e-06, - "loss": 0.2729, - "step": 25750 - }, - { - "epoch": 0.71, - "learning_rate": 2.9384400239732876e-06, - "loss": 0.1162, - "step": 25755 - }, - { - "epoch": 0.71, - "learning_rate": 2.937013042609664e-06, - "loss": 0.09, - "step": 25760 - }, - { - "epoch": 0.71, - "learning_rate": 2.9355860612460403e-06, - "loss": 0.125, - "step": 25765 - }, - { - "epoch": 0.72, - "learning_rate": 2.934159079882417e-06, - "loss": 0.1344, - "step": 25770 - }, - { - "epoch": 0.72, - "learning_rate": 2.9327320985187934e-06, - "loss": 0.1441, - "step": 25775 - }, - { - "epoch": 0.72, - "learning_rate": 2.9313051171551705e-06, - "loss": 0.075, - "step": 25780 - }, - { - "epoch": 0.72, - "learning_rate": 2.929878135791547e-06, - "loss": 0.1001, - "step": 25785 - }, - { - "epoch": 0.72, - "learning_rate": 2.9284511544279232e-06, - "loss": 0.2468, - "step": 25790 - }, - { - "epoch": 0.72, - "learning_rate": 2.9270241730643e-06, - "loss": 0.2485, - "step": 25795 - }, - { - "epoch": 0.72, - "learning_rate": 2.9255971917006763e-06, - "loss": 0.4041, - "step": 25800 - }, - { - "epoch": 0.72, - "learning_rate": 2.9241702103370535e-06, - "loss": 0.1131, - "step": 25805 - }, - { - "epoch": 0.72, - "learning_rate": 2.92274322897343e-06, - "loss": 0.1758, - "step": 25810 - }, - { - "epoch": 0.72, - "learning_rate": 2.9213162476098066e-06, - "loss": 0.1028, - "step": 25815 - }, - { - "epoch": 0.72, - "learning_rate": 2.919889266246183e-06, - "loss": 0.1707, - "step": 25820 - }, - { - "epoch": 0.72, - "learning_rate": 2.9184622848825593e-06, - "loss": 0.0508, - "step": 25825 - }, - { - "epoch": 0.72, - "learning_rate": 2.9170353035189365e-06, - "loss": 0.1092, - "step": 25830 - }, - { - "epoch": 0.72, - "learning_rate": 2.915608322155313e-06, - "loss": 0.1646, - "step": 25835 - }, - { - "epoch": 0.72, - "learning_rate": 2.9141813407916896e-06, - "loss": 0.2093, - "step": 25840 - }, - { - "epoch": 0.72, - "learning_rate": 2.912754359428066e-06, - "loss": 0.256, - "step": 25845 - }, - { - "epoch": 0.72, - "learning_rate": 2.911327378064443e-06, - "loss": 0.1588, - "step": 25850 - }, - { - "epoch": 0.72, - "learning_rate": 2.9099003967008194e-06, - "loss": 0.1443, - "step": 25855 - }, - { - "epoch": 0.72, - "learning_rate": 2.9084734153371958e-06, - "loss": 0.1734, - "step": 25860 - }, - { - "epoch": 0.72, - "learning_rate": 2.9070464339735725e-06, - "loss": 0.1045, - "step": 25865 - }, - { - "epoch": 0.72, - "learning_rate": 2.905619452609949e-06, - "loss": 0.2762, - "step": 25870 - }, - { - "epoch": 0.72, - "learning_rate": 2.904192471246326e-06, - "loss": 0.0354, - "step": 25875 - }, - { - "epoch": 0.72, - "learning_rate": 2.9027654898827024e-06, - "loss": 0.1832, - "step": 25880 - }, - { - "epoch": 0.72, - "learning_rate": 2.9013385085190787e-06, - "loss": 0.0922, - "step": 25885 - }, - { - "epoch": 0.72, - "learning_rate": 2.8999115271554555e-06, - "loss": 0.111, - "step": 25890 - }, - { - "epoch": 0.72, - "learning_rate": 2.898484545791832e-06, - "loss": 0.1338, - "step": 25895 - }, - { - "epoch": 0.72, - "learning_rate": 2.897057564428209e-06, - "loss": 0.4749, - "step": 25900 - }, - { - "epoch": 0.72, - "learning_rate": 2.8956305830645854e-06, - "loss": 0.1815, - "step": 25905 - }, - { - "epoch": 0.72, - "learning_rate": 2.894203601700962e-06, - "loss": 0.1365, - "step": 25910 - }, - { - "epoch": 0.72, - "learning_rate": 2.8927766203373385e-06, - "loss": 0.1343, - "step": 25915 - }, - { - "epoch": 0.72, - "learning_rate": 2.8913496389737152e-06, - "loss": 0.1013, - "step": 25920 - }, - { - "epoch": 0.72, - "learning_rate": 2.889922657610092e-06, - "loss": 0.12, - "step": 25925 - }, - { - "epoch": 0.72, - "learning_rate": 2.8884956762464683e-06, - "loss": 0.1476, - "step": 25930 - }, - { - "epoch": 0.72, - "learning_rate": 2.887068694882845e-06, - "loss": 0.1328, - "step": 25935 - }, - { - "epoch": 0.72, - "learning_rate": 2.8856417135192214e-06, - "loss": 0.1709, - "step": 25940 - }, - { - "epoch": 0.72, - "learning_rate": 2.8842147321555986e-06, - "loss": 0.123, - "step": 25945 - }, - { - "epoch": 0.72, - "learning_rate": 2.882787750791975e-06, - "loss": 0.5435, - "step": 25950 - }, - { - "epoch": 0.72, - "learning_rate": 2.8813607694283513e-06, - "loss": 0.117, - "step": 25955 - }, - { - "epoch": 0.72, - "learning_rate": 2.879933788064728e-06, - "loss": 0.1596, - "step": 25960 - }, - { - "epoch": 0.72, - "learning_rate": 2.878506806701105e-06, - "loss": 0.1398, - "step": 25965 - }, - { - "epoch": 0.72, - "learning_rate": 2.8770798253374816e-06, - "loss": 0.2197, - "step": 25970 - }, - { - "epoch": 0.72, - "learning_rate": 2.875652843973858e-06, - "loss": 0.1027, - "step": 25975 - }, - { - "epoch": 0.72, - "learning_rate": 2.8742258626102342e-06, - "loss": 0.043, - "step": 25980 - }, - { - "epoch": 0.72, - "learning_rate": 2.872798881246611e-06, - "loss": 0.0459, - "step": 25985 - }, - { - "epoch": 0.72, - "learning_rate": 2.8713718998829878e-06, - "loss": 0.0957, - "step": 25990 - }, - { - "epoch": 0.72, - "learning_rate": 2.8699449185193645e-06, - "loss": 0.2356, - "step": 25995 - }, - { - "epoch": 0.72, - "learning_rate": 2.868517937155741e-06, - "loss": 0.284, - "step": 26000 - }, - { - "epoch": 0.72, - "eval_loss": 0.05732240900397301, - "eval_runtime": 1599.5138, - "eval_samples_per_second": 10.014, - "eval_steps_per_second": 2.504, - "eval_wer": 0.16871619184998196, - "step": 26000 - }, - { - "epoch": 0.72, - "learning_rate": 2.8670909557921176e-06, - "loss": 0.1305, - "step": 26005 - }, - { - "epoch": 0.72, - "learning_rate": 2.8656639744284944e-06, - "loss": 0.2248, - "step": 26010 - }, - { - "epoch": 0.72, - "learning_rate": 2.8642369930648707e-06, - "loss": 0.1827, - "step": 26015 - }, - { - "epoch": 0.72, - "learning_rate": 2.8628100117012475e-06, - "loss": 0.1403, - "step": 26020 - }, - { - "epoch": 0.72, - "learning_rate": 2.861383030337624e-06, - "loss": 0.2165, - "step": 26025 - }, - { - "epoch": 0.72, - "learning_rate": 2.859956048974001e-06, - "loss": 0.0734, - "step": 26030 - }, - { - "epoch": 0.72, - "learning_rate": 2.8585290676103774e-06, - "loss": 0.1511, - "step": 26035 - }, - { - "epoch": 0.72, - "learning_rate": 2.857102086246754e-06, - "loss": 0.2121, - "step": 26040 - }, - { - "epoch": 0.72, - "learning_rate": 2.8556751048831305e-06, - "loss": 0.1674, - "step": 26045 - }, - { - "epoch": 0.72, - "learning_rate": 2.854248123519507e-06, - "loss": 0.3052, - "step": 26050 - }, - { - "epoch": 0.72, - "learning_rate": 2.852821142155884e-06, - "loss": 0.1277, - "step": 26055 - }, - { - "epoch": 0.72, - "learning_rate": 2.8513941607922603e-06, - "loss": 0.1229, - "step": 26060 - }, - { - "epoch": 0.72, - "learning_rate": 2.849967179428637e-06, - "loss": 0.1208, - "step": 26065 - }, - { - "epoch": 0.72, - "learning_rate": 2.8485401980650134e-06, - "loss": 0.17, - "step": 26070 - }, - { - "epoch": 0.72, - "learning_rate": 2.8471132167013898e-06, - "loss": 0.1901, - "step": 26075 - }, - { - "epoch": 0.72, - "learning_rate": 2.845686235337767e-06, - "loss": 0.1311, - "step": 26080 - }, - { - "epoch": 0.72, - "learning_rate": 2.8442592539741433e-06, - "loss": 0.0815, - "step": 26085 - }, - { - "epoch": 0.72, - "learning_rate": 2.84283227261052e-06, - "loss": 0.1416, - "step": 26090 - }, - { - "epoch": 0.72, - "learning_rate": 2.8414052912468964e-06, - "loss": 0.1607, - "step": 26095 - }, - { - "epoch": 0.72, - "learning_rate": 2.8399783098832736e-06, - "loss": 0.5613, - "step": 26100 - }, - { - "epoch": 0.72, - "learning_rate": 2.83855132851965e-06, - "loss": 0.1265, - "step": 26105 - }, - { - "epoch": 0.72, - "learning_rate": 2.8371243471560263e-06, - "loss": 0.1373, - "step": 26110 - }, - { - "epoch": 0.72, - "learning_rate": 2.835697365792403e-06, - "loss": 0.158, - "step": 26115 - }, - { - "epoch": 0.72, - "learning_rate": 2.8342703844287794e-06, - "loss": 0.1546, - "step": 26120 - }, - { - "epoch": 0.72, - "learning_rate": 2.8328434030651565e-06, - "loss": 0.1494, - "step": 26125 - }, - { - "epoch": 0.73, - "learning_rate": 2.831416421701533e-06, - "loss": 0.0512, - "step": 26130 - }, - { - "epoch": 0.73, - "learning_rate": 2.8299894403379096e-06, - "loss": 0.0766, - "step": 26135 - }, - { - "epoch": 0.73, - "learning_rate": 2.828562458974286e-06, - "loss": 0.2311, - "step": 26140 - }, - { - "epoch": 0.73, - "learning_rate": 2.8271354776106623e-06, - "loss": 0.1519, - "step": 26145 - }, - { - "epoch": 0.73, - "learning_rate": 2.8257084962470395e-06, - "loss": 0.5217, - "step": 26150 - }, - { - "epoch": 0.73, - "learning_rate": 2.824281514883416e-06, - "loss": 0.1174, - "step": 26155 - }, - { - "epoch": 0.73, - "learning_rate": 2.8228545335197926e-06, - "loss": 0.1366, - "step": 26160 - }, - { - "epoch": 0.73, - "learning_rate": 2.821427552156169e-06, - "loss": 0.249, - "step": 26165 - }, - { - "epoch": 0.73, - "learning_rate": 2.8200005707925453e-06, - "loss": 0.1411, - "step": 26170 - }, - { - "epoch": 0.73, - "learning_rate": 2.8185735894289225e-06, - "loss": 0.0867, - "step": 26175 - }, - { - "epoch": 0.73, - "learning_rate": 2.817146608065299e-06, - "loss": 0.0346, - "step": 26180 - }, - { - "epoch": 0.73, - "learning_rate": 2.8157196267016756e-06, - "loss": 0.0907, - "step": 26185 - }, - { - "epoch": 0.73, - "learning_rate": 2.814292645338052e-06, - "loss": 0.2065, - "step": 26190 - }, - { - "epoch": 0.73, - "learning_rate": 2.812865663974429e-06, - "loss": 0.1469, - "step": 26195 - }, - { - "epoch": 0.73, - "learning_rate": 2.8114386826108054e-06, - "loss": 0.4471, - "step": 26200 - }, - { - "epoch": 0.73, - "learning_rate": 2.8100117012471818e-06, - "loss": 0.1199, - "step": 26205 - }, - { - "epoch": 0.73, - "learning_rate": 2.8085847198835585e-06, - "loss": 0.1215, - "step": 26210 - }, - { - "epoch": 0.73, - "learning_rate": 2.807157738519935e-06, - "loss": 0.1368, - "step": 26215 - }, - { - "epoch": 0.73, - "learning_rate": 2.805730757156312e-06, - "loss": 0.1158, - "step": 26220 - }, - { - "epoch": 0.73, - "learning_rate": 2.8043037757926884e-06, - "loss": 0.1989, - "step": 26225 - }, - { - "epoch": 0.73, - "learning_rate": 2.802876794429065e-06, - "loss": 0.2644, - "step": 26230 - }, - { - "epoch": 0.73, - "learning_rate": 2.8014498130654415e-06, - "loss": 0.1495, - "step": 26235 - }, - { - "epoch": 0.73, - "learning_rate": 2.800022831701818e-06, - "loss": 0.0975, - "step": 26240 - }, - { - "epoch": 0.73, - "learning_rate": 2.798595850338195e-06, - "loss": 0.1118, - "step": 26245 - }, - { - "epoch": 0.73, - "learning_rate": 2.7971688689745714e-06, - "loss": 0.4682, - "step": 26250 - }, - { - "epoch": 0.73, - "learning_rate": 2.795741887610948e-06, - "loss": 0.17, - "step": 26255 - }, - { - "epoch": 0.73, - "learning_rate": 2.7943149062473245e-06, - "loss": 0.1316, - "step": 26260 - }, - { - "epoch": 0.73, - "learning_rate": 2.792887924883701e-06, - "loss": 0.1506, - "step": 26265 - }, - { - "epoch": 0.73, - "learning_rate": 2.791460943520078e-06, - "loss": 0.211, - "step": 26270 - }, - { - "epoch": 0.73, - "learning_rate": 2.7900339621564543e-06, - "loss": 0.1409, - "step": 26275 - }, - { - "epoch": 0.73, - "learning_rate": 2.788606980792831e-06, - "loss": 0.034, - "step": 26280 - }, - { - "epoch": 0.73, - "learning_rate": 2.7871799994292074e-06, - "loss": 0.1001, - "step": 26285 - }, - { - "epoch": 0.73, - "learning_rate": 2.7857530180655846e-06, - "loss": 0.0589, - "step": 26290 - }, - { - "epoch": 0.73, - "learning_rate": 2.784326036701961e-06, - "loss": 0.2897, - "step": 26295 - }, - { - "epoch": 0.73, - "learning_rate": 2.7828990553383373e-06, - "loss": 0.2913, - "step": 26300 - }, - { - "epoch": 0.73, - "learning_rate": 2.781472073974714e-06, - "loss": 0.1237, - "step": 26305 - }, - { - "epoch": 0.73, - "learning_rate": 2.7800450926110904e-06, - "loss": 0.1621, - "step": 26310 - }, - { - "epoch": 0.73, - "learning_rate": 2.7786181112474676e-06, - "loss": 0.1255, - "step": 26315 - }, - { - "epoch": 0.73, - "learning_rate": 2.777191129883844e-06, - "loss": 0.1752, - "step": 26320 - }, - { - "epoch": 0.73, - "learning_rate": 2.7757641485202207e-06, - "loss": 0.1037, - "step": 26325 - }, - { - "epoch": 0.73, - "learning_rate": 2.774337167156597e-06, - "loss": 0.101, - "step": 26330 - }, - { - "epoch": 0.73, - "learning_rate": 2.7729101857929733e-06, - "loss": 0.2034, - "step": 26335 - }, - { - "epoch": 0.73, - "learning_rate": 2.7714832044293505e-06, - "loss": 0.1355, - "step": 26340 - }, - { - "epoch": 0.73, - "learning_rate": 2.770056223065727e-06, - "loss": 0.2262, - "step": 26345 - }, - { - "epoch": 0.73, - "learning_rate": 2.7686292417021036e-06, - "loss": 0.2849, - "step": 26350 - }, - { - "epoch": 0.73, - "learning_rate": 2.76720226033848e-06, - "loss": 0.0806, - "step": 26355 - }, - { - "epoch": 0.73, - "learning_rate": 2.765775278974857e-06, - "loss": 0.1381, - "step": 26360 - }, - { - "epoch": 0.73, - "learning_rate": 2.7643482976112335e-06, - "loss": 0.1695, - "step": 26365 - }, - { - "epoch": 0.73, - "learning_rate": 2.76292131624761e-06, - "loss": 0.1678, - "step": 26370 - }, - { - "epoch": 0.73, - "learning_rate": 2.7614943348839866e-06, - "loss": 0.1797, - "step": 26375 - }, - { - "epoch": 0.73, - "learning_rate": 2.760067353520363e-06, - "loss": 0.1025, - "step": 26380 - }, - { - "epoch": 0.73, - "learning_rate": 2.75864037215674e-06, - "loss": 0.2294, - "step": 26385 - }, - { - "epoch": 0.73, - "learning_rate": 2.7572133907931165e-06, - "loss": 0.2152, - "step": 26390 - }, - { - "epoch": 0.73, - "learning_rate": 2.755786409429493e-06, - "loss": 0.1731, - "step": 26395 - }, - { - "epoch": 0.73, - "learning_rate": 2.7543594280658696e-06, - "loss": 0.3767, - "step": 26400 - }, - { - "epoch": 0.73, - "learning_rate": 2.7529324467022463e-06, - "loss": 0.0844, - "step": 26405 - }, - { - "epoch": 0.73, - "learning_rate": 2.751505465338623e-06, - "loss": 0.1569, - "step": 26410 - }, - { - "epoch": 0.73, - "learning_rate": 2.7500784839749994e-06, - "loss": 0.2803, - "step": 26415 - }, - { - "epoch": 0.73, - "learning_rate": 2.748651502611376e-06, - "loss": 0.1608, - "step": 26420 - }, - { - "epoch": 0.73, - "learning_rate": 2.747224521247753e-06, - "loss": 0.1184, - "step": 26425 - }, - { - "epoch": 0.73, - "learning_rate": 2.7457975398841293e-06, - "loss": 0.0333, - "step": 26430 - }, - { - "epoch": 0.73, - "learning_rate": 2.744370558520506e-06, - "loss": 0.0804, - "step": 26435 - }, - { - "epoch": 0.73, - "learning_rate": 2.7429435771568824e-06, - "loss": 0.2207, - "step": 26440 - }, - { - "epoch": 0.73, - "learning_rate": 2.741516595793259e-06, - "loss": 0.231, - "step": 26445 - }, - { - "epoch": 0.73, - "learning_rate": 2.740089614429636e-06, - "loss": 0.4283, - "step": 26450 - }, - { - "epoch": 0.73, - "learning_rate": 2.7386626330660127e-06, - "loss": 0.1311, - "step": 26455 - }, - { - "epoch": 0.73, - "learning_rate": 2.737235651702389e-06, - "loss": 0.1237, - "step": 26460 - }, - { - "epoch": 0.73, - "learning_rate": 2.7358086703387654e-06, - "loss": 0.1065, - "step": 26465 - }, - { - "epoch": 0.73, - "learning_rate": 2.7343816889751425e-06, - "loss": 0.2122, - "step": 26470 - }, - { - "epoch": 0.73, - "learning_rate": 2.732954707611519e-06, - "loss": 0.0672, - "step": 26475 - }, - { - "epoch": 0.73, - "learning_rate": 2.7315277262478956e-06, - "loss": 0.18, - "step": 26480 - }, - { - "epoch": 0.73, - "learning_rate": 2.730100744884272e-06, - "loss": 0.276, - "step": 26485 - }, - { - "epoch": 0.74, - "learning_rate": 2.7286737635206483e-06, - "loss": 0.2462, - "step": 26490 - }, - { - "epoch": 0.74, - "learning_rate": 2.7272467821570255e-06, - "loss": 0.0714, - "step": 26495 - }, - { - "epoch": 0.74, - "learning_rate": 2.725819800793402e-06, - "loss": 0.2961, - "step": 26500 - }, - { - "epoch": 0.74, - "learning_rate": 2.7243928194297786e-06, - "loss": 0.1474, - "step": 26505 - }, - { - "epoch": 0.74, - "learning_rate": 2.722965838066155e-06, - "loss": 0.118, - "step": 26510 - }, - { - "epoch": 0.74, - "learning_rate": 2.721538856702532e-06, - "loss": 0.1449, - "step": 26515 - }, - { - "epoch": 0.74, - "learning_rate": 2.7201118753389085e-06, - "loss": 0.1919, - "step": 26520 - }, - { - "epoch": 0.74, - "learning_rate": 2.718684893975285e-06, - "loss": 0.1371, - "step": 26525 - }, - { - "epoch": 0.74, - "learning_rate": 2.7172579126116616e-06, - "loss": 0.1795, - "step": 26530 - }, - { - "epoch": 0.74, - "learning_rate": 2.715830931248038e-06, - "loss": 0.0662, - "step": 26535 - }, - { - "epoch": 0.74, - "learning_rate": 2.714403949884415e-06, - "loss": 0.0727, - "step": 26540 - }, - { - "epoch": 0.74, - "learning_rate": 2.7129769685207914e-06, - "loss": 0.218, - "step": 26545 - }, - { - "epoch": 0.74, - "learning_rate": 2.711549987157168e-06, - "loss": 0.2782, - "step": 26550 - }, - { - "epoch": 0.74, - "learning_rate": 2.7101230057935445e-06, - "loss": 0.0953, - "step": 26555 - }, - { - "epoch": 0.74, - "learning_rate": 2.708696024429921e-06, - "loss": 0.1086, - "step": 26560 - }, - { - "epoch": 0.74, - "learning_rate": 2.707269043066298e-06, - "loss": 0.129, - "step": 26565 - }, - { - "epoch": 0.74, - "learning_rate": 2.7058420617026744e-06, - "loss": 0.1382, - "step": 26570 - }, - { - "epoch": 0.74, - "learning_rate": 2.704415080339051e-06, - "loss": 0.1681, - "step": 26575 - }, - { - "epoch": 0.74, - "learning_rate": 2.7029880989754275e-06, - "loss": 0.0586, - "step": 26580 - }, - { - "epoch": 0.74, - "learning_rate": 2.701561117611804e-06, - "loss": 0.0819, - "step": 26585 - }, - { - "epoch": 0.74, - "learning_rate": 2.700134136248181e-06, - "loss": 0.0729, - "step": 26590 - }, - { - "epoch": 0.74, - "learning_rate": 2.6987071548845574e-06, - "loss": 0.1718, - "step": 26595 - }, - { - "epoch": 0.74, - "learning_rate": 2.697280173520934e-06, - "loss": 0.7693, - "step": 26600 - }, - { - "epoch": 0.74, - "learning_rate": 2.6958531921573105e-06, - "loss": 0.1223, - "step": 26605 - }, - { - "epoch": 0.74, - "learning_rate": 2.6944262107936876e-06, - "loss": 0.1018, - "step": 26610 - }, - { - "epoch": 0.74, - "learning_rate": 2.692999229430064e-06, - "loss": 0.1375, - "step": 26615 - }, - { - "epoch": 0.74, - "learning_rate": 2.6915722480664403e-06, - "loss": 0.1235, - "step": 26620 - }, - { - "epoch": 0.74, - "learning_rate": 2.690145266702817e-06, - "loss": 0.0849, - "step": 26625 - }, - { - "epoch": 0.74, - "learning_rate": 2.6887182853391934e-06, - "loss": 0.185, - "step": 26630 - }, - { - "epoch": 0.74, - "learning_rate": 2.6872913039755706e-06, - "loss": 0.0632, - "step": 26635 - }, - { - "epoch": 0.74, - "learning_rate": 2.685864322611947e-06, - "loss": 0.1054, - "step": 26640 - }, - { - "epoch": 0.74, - "learning_rate": 2.6844373412483237e-06, - "loss": 0.1819, - "step": 26645 - }, - { - "epoch": 0.74, - "learning_rate": 2.6830103598847e-06, - "loss": 0.1812, - "step": 26650 - }, - { - "epoch": 0.74, - "learning_rate": 2.6815833785210764e-06, - "loss": 0.1602, - "step": 26655 - }, - { - "epoch": 0.74, - "learning_rate": 2.6801563971574536e-06, - "loss": 0.147, - "step": 26660 - }, - { - "epoch": 0.74, - "learning_rate": 2.67872941579383e-06, - "loss": 0.1197, - "step": 26665 - }, - { - "epoch": 0.74, - "learning_rate": 2.6773024344302067e-06, - "loss": 0.1357, - "step": 26670 - }, - { - "epoch": 0.74, - "learning_rate": 2.675875453066583e-06, - "loss": 0.1372, - "step": 26675 - }, - { - "epoch": 0.74, - "learning_rate": 2.6744484717029593e-06, - "loss": 0.0134, - "step": 26680 - }, - { - "epoch": 0.74, - "learning_rate": 2.6730214903393365e-06, - "loss": 0.0678, - "step": 26685 - }, - { - "epoch": 0.74, - "learning_rate": 2.671594508975713e-06, - "loss": 0.0896, - "step": 26690 - }, - { - "epoch": 0.74, - "learning_rate": 2.6701675276120896e-06, - "loss": 0.2949, - "step": 26695 - }, - { - "epoch": 0.74, - "learning_rate": 2.668740546248466e-06, - "loss": 0.4508, - "step": 26700 - }, - { - "epoch": 0.74, - "learning_rate": 2.667313564884843e-06, - "loss": 0.1432, - "step": 26705 - }, - { - "epoch": 0.74, - "learning_rate": 2.6658865835212195e-06, - "loss": 0.156, - "step": 26710 - }, - { - "epoch": 0.74, - "learning_rate": 2.664459602157596e-06, - "loss": 0.1392, - "step": 26715 - }, - { - "epoch": 0.74, - "learning_rate": 2.6630326207939726e-06, - "loss": 0.1732, - "step": 26720 - }, - { - "epoch": 0.74, - "learning_rate": 2.661605639430349e-06, - "loss": 0.0862, - "step": 26725 - }, - { - "epoch": 0.74, - "learning_rate": 2.660178658066726e-06, - "loss": 0.0326, - "step": 26730 - }, - { - "epoch": 0.74, - "learning_rate": 2.6587516767031025e-06, - "loss": 0.0985, - "step": 26735 - }, - { - "epoch": 0.74, - "learning_rate": 2.6573246953394792e-06, - "loss": 0.1581, - "step": 26740 - }, - { - "epoch": 0.74, - "learning_rate": 2.6558977139758556e-06, - "loss": 0.1858, - "step": 26745 - }, - { - "epoch": 0.74, - "learning_rate": 2.654470732612232e-06, - "loss": 0.4903, - "step": 26750 - }, - { - "epoch": 0.74, - "learning_rate": 2.653043751248609e-06, - "loss": 0.1636, - "step": 26755 - }, - { - "epoch": 0.74, - "learning_rate": 2.6516167698849854e-06, - "loss": 0.1551, - "step": 26760 - }, - { - "epoch": 0.74, - "learning_rate": 2.650189788521362e-06, - "loss": 0.1687, - "step": 26765 - }, - { - "epoch": 0.74, - "learning_rate": 2.6487628071577385e-06, - "loss": 0.1462, - "step": 26770 - }, - { - "epoch": 0.74, - "learning_rate": 2.6473358257941153e-06, - "loss": 0.1929, - "step": 26775 - }, - { - "epoch": 0.74, - "learning_rate": 2.645908844430492e-06, - "loss": 0.1037, - "step": 26780 - }, - { - "epoch": 0.74, - "learning_rate": 2.6444818630668684e-06, - "loss": 0.2719, - "step": 26785 - }, - { - "epoch": 0.74, - "learning_rate": 2.643054881703245e-06, - "loss": 0.1249, - "step": 26790 - }, - { - "epoch": 0.74, - "learning_rate": 2.6416279003396215e-06, - "loss": 0.1853, - "step": 26795 - }, - { - "epoch": 0.74, - "learning_rate": 2.6402009189759987e-06, - "loss": 0.4481, - "step": 26800 - }, - { - "epoch": 0.74, - "learning_rate": 2.638773937612375e-06, - "loss": 0.1416, - "step": 26805 - }, - { - "epoch": 0.74, - "learning_rate": 2.6373469562487514e-06, - "loss": 0.1283, - "step": 26810 - }, - { - "epoch": 0.74, - "learning_rate": 2.635919974885128e-06, - "loss": 0.1811, - "step": 26815 - }, - { - "epoch": 0.74, - "learning_rate": 2.634492993521505e-06, - "loss": 0.1281, - "step": 26820 - }, - { - "epoch": 0.74, - "learning_rate": 2.6330660121578816e-06, - "loss": 0.1362, - "step": 26825 - }, - { - "epoch": 0.74, - "learning_rate": 2.631639030794258e-06, - "loss": 0.0721, - "step": 26830 - }, - { - "epoch": 0.74, - "learning_rate": 2.6302120494306347e-06, - "loss": 0.0757, - "step": 26835 - }, - { - "epoch": 0.74, - "learning_rate": 2.628785068067011e-06, - "loss": 0.2048, - "step": 26840 - }, - { - "epoch": 0.74, - "learning_rate": 2.627358086703388e-06, - "loss": 0.0996, - "step": 26845 - }, - { - "epoch": 0.75, - "learning_rate": 2.6259311053397646e-06, - "loss": 0.3021, - "step": 26850 - }, - { - "epoch": 0.75, - "learning_rate": 2.624504123976141e-06, - "loss": 0.1129, - "step": 26855 - }, - { - "epoch": 0.75, - "learning_rate": 2.6230771426125177e-06, - "loss": 0.1188, - "step": 26860 - }, - { - "epoch": 0.75, - "learning_rate": 2.6216501612488945e-06, - "loss": 0.1518, - "step": 26865 - }, - { - "epoch": 0.75, - "learning_rate": 2.620223179885271e-06, - "loss": 0.2, - "step": 26870 - }, - { - "epoch": 0.75, - "learning_rate": 2.6187961985216476e-06, - "loss": 0.0576, - "step": 26875 - }, - { - "epoch": 0.75, - "learning_rate": 2.617369217158024e-06, - "loss": 0.0494, - "step": 26880 - }, - { - "epoch": 0.75, - "learning_rate": 2.6159422357944007e-06, - "loss": 0.2218, - "step": 26885 - }, - { - "epoch": 0.75, - "learning_rate": 2.6145152544307774e-06, - "loss": 0.1026, - "step": 26890 - }, - { - "epoch": 0.75, - "learning_rate": 2.613088273067154e-06, - "loss": 0.144, - "step": 26895 - }, - { - "epoch": 0.75, - "learning_rate": 2.6116612917035305e-06, - "loss": 0.445, - "step": 26900 - }, - { - "epoch": 0.75, - "learning_rate": 2.610234310339907e-06, - "loss": 0.1412, - "step": 26905 - }, - { - "epoch": 0.75, - "learning_rate": 2.608807328976284e-06, - "loss": 0.1615, - "step": 26910 - }, - { - "epoch": 0.75, - "learning_rate": 2.6073803476126604e-06, - "loss": 0.096, - "step": 26915 - }, - { - "epoch": 0.75, - "learning_rate": 2.605953366249037e-06, - "loss": 0.1041, - "step": 26920 - }, - { - "epoch": 0.75, - "learning_rate": 2.6045263848854135e-06, - "loss": 0.1171, - "step": 26925 - }, - { - "epoch": 0.75, - "learning_rate": 2.6030994035217907e-06, - "loss": 0.0616, - "step": 26930 - }, - { - "epoch": 0.75, - "learning_rate": 2.601672422158167e-06, - "loss": 0.1357, - "step": 26935 - }, - { - "epoch": 0.75, - "learning_rate": 2.6002454407945434e-06, - "loss": 0.121, - "step": 26940 - }, - { - "epoch": 0.75, - "learning_rate": 2.59881845943092e-06, - "loss": 0.3521, - "step": 26945 - }, - { - "epoch": 0.75, - "learning_rate": 2.5973914780672965e-06, - "loss": 0.2587, - "step": 26950 - }, - { - "epoch": 0.75, - "learning_rate": 2.5959644967036736e-06, - "loss": 0.0782, - "step": 26955 - }, - { - "epoch": 0.75, - "learning_rate": 2.59453751534005e-06, - "loss": 0.1999, - "step": 26960 - }, - { - "epoch": 0.75, - "learning_rate": 2.5931105339764263e-06, - "loss": 0.1359, - "step": 26965 - }, - { - "epoch": 0.75, - "learning_rate": 2.591683552612803e-06, - "loss": 0.1388, - "step": 26970 - }, - { - "epoch": 0.75, - "learning_rate": 2.5902565712491794e-06, - "loss": 0.1563, - "step": 26975 - }, - { - "epoch": 0.75, - "learning_rate": 2.5888295898855566e-06, - "loss": 0.092, - "step": 26980 - }, - { - "epoch": 0.75, - "learning_rate": 2.587402608521933e-06, - "loss": 0.0767, - "step": 26985 - }, - { - "epoch": 0.75, - "learning_rate": 2.5859756271583097e-06, - "loss": 0.1331, - "step": 26990 - }, - { - "epoch": 0.75, - "learning_rate": 2.584548645794686e-06, - "loss": 0.1713, - "step": 26995 - }, - { - "epoch": 0.75, - "learning_rate": 2.5831216644310624e-06, - "loss": 0.2481, - "step": 27000 - }, - { - "epoch": 0.75, - "learning_rate": 2.5816946830674396e-06, - "loss": 0.151, - "step": 27005 - }, - { - "epoch": 0.75, - "learning_rate": 2.580267701703816e-06, - "loss": 0.1115, - "step": 27010 - }, - { - "epoch": 0.75, - "learning_rate": 2.5788407203401927e-06, - "loss": 0.1995, - "step": 27015 - }, - { - "epoch": 0.75, - "learning_rate": 2.577413738976569e-06, - "loss": 0.0765, - "step": 27020 - }, - { - "epoch": 0.75, - "learning_rate": 2.575986757612946e-06, - "loss": 0.0888, - "step": 27025 - }, - { - "epoch": 0.75, - "learning_rate": 2.5745597762493225e-06, - "loss": 0.0971, - "step": 27030 - }, - { - "epoch": 0.75, - "learning_rate": 2.573132794885699e-06, - "loss": 0.103, - "step": 27035 - }, - { - "epoch": 0.75, - "learning_rate": 2.5717058135220756e-06, - "loss": 0.1728, - "step": 27040 - }, - { - "epoch": 0.75, - "learning_rate": 2.570278832158452e-06, - "loss": 0.1494, - "step": 27045 - }, - { - "epoch": 0.75, - "learning_rate": 2.568851850794829e-06, - "loss": 0.2001, - "step": 27050 - }, - { - "epoch": 0.75, - "learning_rate": 2.5674248694312055e-06, - "loss": 0.138, - "step": 27055 - }, - { - "epoch": 0.75, - "learning_rate": 2.5659978880675823e-06, - "loss": 0.1154, - "step": 27060 - }, - { - "epoch": 0.75, - "learning_rate": 2.5645709067039586e-06, - "loss": 0.1979, - "step": 27065 - }, - { - "epoch": 0.75, - "learning_rate": 2.563143925340335e-06, - "loss": 0.1417, - "step": 27070 - }, - { - "epoch": 0.75, - "learning_rate": 2.561716943976712e-06, - "loss": 0.061, - "step": 27075 - }, - { - "epoch": 0.75, - "learning_rate": 2.5602899626130885e-06, - "loss": 0.061, - "step": 27080 - }, - { - "epoch": 0.75, - "learning_rate": 2.5588629812494652e-06, - "loss": 0.1333, - "step": 27085 - }, - { - "epoch": 0.75, - "learning_rate": 2.5574359998858416e-06, - "loss": 0.4135, - "step": 27090 - }, - { - "epoch": 0.75, - "learning_rate": 2.556009018522218e-06, - "loss": 0.3602, - "step": 27095 - }, - { - "epoch": 0.75, - "learning_rate": 2.554582037158595e-06, - "loss": 0.6737, - "step": 27100 - }, - { - "epoch": 0.75, - "learning_rate": 2.5531550557949714e-06, - "loss": 0.136, - "step": 27105 - }, - { - "epoch": 0.75, - "learning_rate": 2.551728074431348e-06, - "loss": 0.1231, - "step": 27110 - }, - { - "epoch": 0.75, - "learning_rate": 2.5503010930677245e-06, - "loss": 0.1484, - "step": 27115 - }, - { - "epoch": 0.75, - "learning_rate": 2.5488741117041017e-06, - "loss": 0.1621, - "step": 27120 - }, - { - "epoch": 0.75, - "learning_rate": 2.547447130340478e-06, - "loss": 0.1258, - "step": 27125 - }, - { - "epoch": 0.75, - "learning_rate": 2.5460201489768544e-06, - "loss": 0.0405, - "step": 27130 - }, - { - "epoch": 0.75, - "learning_rate": 2.544593167613231e-06, - "loss": 0.1641, - "step": 27135 - }, - { - "epoch": 0.75, - "learning_rate": 2.5431661862496075e-06, - "loss": 0.1708, - "step": 27140 - }, - { - "epoch": 0.75, - "learning_rate": 2.5417392048859847e-06, - "loss": 0.1728, - "step": 27145 - }, - { - "epoch": 0.75, - "learning_rate": 2.540312223522361e-06, - "loss": 0.5788, - "step": 27150 - }, - { - "epoch": 0.75, - "learning_rate": 2.5388852421587378e-06, - "loss": 0.1277, - "step": 27155 - }, - { - "epoch": 0.75, - "learning_rate": 2.537458260795114e-06, - "loss": 0.1229, - "step": 27160 - }, - { - "epoch": 0.75, - "learning_rate": 2.5360312794314905e-06, - "loss": 0.1463, - "step": 27165 - }, - { - "epoch": 0.75, - "learning_rate": 2.5346042980678676e-06, - "loss": 0.2008, - "step": 27170 - }, - { - "epoch": 0.75, - "learning_rate": 2.533177316704244e-06, - "loss": 0.115, - "step": 27175 - }, - { - "epoch": 0.75, - "learning_rate": 2.5317503353406207e-06, - "loss": 0.1009, - "step": 27180 - }, - { - "epoch": 0.75, - "learning_rate": 2.530323353976997e-06, - "loss": 0.1141, - "step": 27185 - }, - { - "epoch": 0.75, - "learning_rate": 2.5288963726133734e-06, - "loss": 0.1155, - "step": 27190 - }, - { - "epoch": 0.75, - "learning_rate": 2.5274693912497506e-06, - "loss": 0.3133, - "step": 27195 - }, - { - "epoch": 0.75, - "learning_rate": 2.526042409886127e-06, - "loss": 0.4243, - "step": 27200 - }, - { - "epoch": 0.75, - "learning_rate": 2.5246154285225037e-06, - "loss": 0.1038, - "step": 27205 - }, - { - "epoch": 0.76, - "learning_rate": 2.52318844715888e-06, - "loss": 0.1554, - "step": 27210 - }, - { - "epoch": 0.76, - "learning_rate": 2.5217614657952572e-06, - "loss": 0.1083, - "step": 27215 - }, - { - "epoch": 0.76, - "learning_rate": 2.5203344844316336e-06, - "loss": 0.1736, - "step": 27220 - }, - { - "epoch": 0.76, - "learning_rate": 2.51890750306801e-06, - "loss": 0.0624, - "step": 27225 - }, - { - "epoch": 0.76, - "learning_rate": 2.5174805217043867e-06, - "loss": 0.0619, - "step": 27230 - }, - { - "epoch": 0.76, - "learning_rate": 2.516053540340763e-06, - "loss": 0.1438, - "step": 27235 - }, - { - "epoch": 0.76, - "learning_rate": 2.51462655897714e-06, - "loss": 0.1014, - "step": 27240 - }, - { - "epoch": 0.76, - "learning_rate": 2.5131995776135165e-06, - "loss": 0.2204, - "step": 27245 - }, - { - "epoch": 0.76, - "learning_rate": 2.5117725962498933e-06, - "loss": 0.3898, - "step": 27250 - }, - { - "epoch": 0.76, - "learning_rate": 2.5103456148862696e-06, - "loss": 0.1691, - "step": 27255 - }, - { - "epoch": 0.76, - "learning_rate": 2.5089186335226464e-06, - "loss": 0.1972, - "step": 27260 - }, - { - "epoch": 0.76, - "learning_rate": 2.507491652159023e-06, - "loss": 0.1593, - "step": 27265 - }, - { - "epoch": 0.76, - "learning_rate": 2.5060646707953995e-06, - "loss": 0.1196, - "step": 27270 - }, - { - "epoch": 0.76, - "learning_rate": 2.5046376894317763e-06, - "loss": 0.1242, - "step": 27275 - }, - { - "epoch": 0.76, - "learning_rate": 2.5032107080681526e-06, - "loss": 0.0395, - "step": 27280 - }, - { - "epoch": 0.76, - "learning_rate": 2.5017837267045294e-06, - "loss": 0.2878, - "step": 27285 - }, - { - "epoch": 0.76, - "learning_rate": 2.500356745340906e-06, - "loss": 0.1655, - "step": 27290 - }, - { - "epoch": 0.76, - "learning_rate": 2.498929763977283e-06, - "loss": 0.3432, - "step": 27295 - }, - { - "epoch": 0.76, - "learning_rate": 2.4975027826136592e-06, - "loss": 0.2969, - "step": 27300 - }, - { - "epoch": 0.76, - "learning_rate": 2.496075801250036e-06, - "loss": 0.158, - "step": 27305 - }, - { - "epoch": 0.76, - "learning_rate": 2.4946488198864123e-06, - "loss": 0.1344, - "step": 27310 - }, - { - "epoch": 0.76, - "learning_rate": 2.493221838522789e-06, - "loss": 0.1479, - "step": 27315 - }, - { - "epoch": 0.76, - "learning_rate": 2.491794857159166e-06, - "loss": 0.1574, - "step": 27320 - }, - { - "epoch": 0.76, - "learning_rate": 2.4903678757955426e-06, - "loss": 0.1102, - "step": 27325 - }, - { - "epoch": 0.76, - "learning_rate": 2.488940894431919e-06, - "loss": 0.0472, - "step": 27330 - }, - { - "epoch": 0.76, - "learning_rate": 2.4875139130682953e-06, - "loss": 0.1569, - "step": 27335 - }, - { - "epoch": 0.76, - "learning_rate": 2.486086931704672e-06, - "loss": 0.1781, - "step": 27340 - }, - { - "epoch": 0.76, - "learning_rate": 2.484659950341049e-06, - "loss": 0.2265, - "step": 27345 - }, - { - "epoch": 0.76, - "learning_rate": 2.4832329689774256e-06, - "loss": 0.2439, - "step": 27350 - }, - { - "epoch": 0.76, - "learning_rate": 2.481805987613802e-06, - "loss": 0.068, - "step": 27355 - }, - { - "epoch": 0.76, - "learning_rate": 2.4803790062501787e-06, - "loss": 0.2212, - "step": 27360 - }, - { - "epoch": 0.76, - "learning_rate": 2.478952024886555e-06, - "loss": 0.1199, - "step": 27365 - }, - { - "epoch": 0.76, - "learning_rate": 2.4775250435229318e-06, - "loss": 0.1074, - "step": 27370 - }, - { - "epoch": 0.76, - "learning_rate": 2.4760980621593085e-06, - "loss": 0.1394, - "step": 27375 - }, - { - "epoch": 0.76, - "learning_rate": 2.474671080795685e-06, - "loss": 0.0687, - "step": 27380 - }, - { - "epoch": 0.76, - "learning_rate": 2.4732440994320616e-06, - "loss": 0.0813, - "step": 27385 - }, - { - "epoch": 0.76, - "learning_rate": 2.4718171180684384e-06, - "loss": 0.1012, - "step": 27390 - }, - { - "epoch": 0.76, - "learning_rate": 2.4703901367048147e-06, - "loss": 0.1528, - "step": 27395 - }, - { - "epoch": 0.76, - "learning_rate": 2.4689631553411915e-06, - "loss": 0.475, - "step": 27400 - }, - { - "epoch": 0.76, - "learning_rate": 2.467536173977568e-06, - "loss": 0.1211, - "step": 27405 - }, - { - "epoch": 0.76, - "learning_rate": 2.4661091926139446e-06, - "loss": 0.1699, - "step": 27410 - }, - { - "epoch": 0.76, - "learning_rate": 2.4646822112503214e-06, - "loss": 0.1281, - "step": 27415 - }, - { - "epoch": 0.76, - "learning_rate": 2.463255229886698e-06, - "loss": 0.1253, - "step": 27420 - }, - { - "epoch": 0.76, - "learning_rate": 2.4618282485230745e-06, - "loss": 0.2102, - "step": 27425 - }, - { - "epoch": 0.76, - "learning_rate": 2.460401267159451e-06, - "loss": 0.0762, - "step": 27430 - }, - { - "epoch": 0.76, - "learning_rate": 2.4589742857958276e-06, - "loss": 0.1024, - "step": 27435 - }, - { - "epoch": 0.76, - "learning_rate": 2.4575473044322043e-06, - "loss": 0.1654, - "step": 27440 - }, - { - "epoch": 0.76, - "learning_rate": 2.456120323068581e-06, - "loss": 0.2602, - "step": 27445 - }, - { - "epoch": 0.76, - "learning_rate": 2.4546933417049574e-06, - "loss": 0.525, - "step": 27450 - }, - { - "epoch": 0.76, - "learning_rate": 2.453266360341334e-06, - "loss": 0.1613, - "step": 27455 - }, - { - "epoch": 0.76, - "learning_rate": 2.4518393789777105e-06, - "loss": 0.1533, - "step": 27460 - }, - { - "epoch": 0.76, - "learning_rate": 2.4504123976140873e-06, - "loss": 0.1351, - "step": 27465 - }, - { - "epoch": 0.76, - "learning_rate": 2.448985416250464e-06, - "loss": 0.1482, - "step": 27470 - }, - { - "epoch": 0.76, - "learning_rate": 2.4475584348868404e-06, - "loss": 0.1441, - "step": 27475 - }, - { - "epoch": 0.76, - "learning_rate": 2.446131453523217e-06, - "loss": 0.0479, - "step": 27480 - }, - { - "epoch": 0.76, - "learning_rate": 2.444704472159594e-06, - "loss": 0.0756, - "step": 27485 - }, - { - "epoch": 0.76, - "learning_rate": 2.4432774907959707e-06, - "loss": 0.1747, - "step": 27490 - }, - { - "epoch": 0.76, - "learning_rate": 2.441850509432347e-06, - "loss": 0.186, - "step": 27495 - }, - { - "epoch": 0.76, - "learning_rate": 2.4404235280687238e-06, - "loss": 0.2346, - "step": 27500 - }, - { - "epoch": 0.76, - "learning_rate": 2.4389965467051e-06, - "loss": 0.1429, - "step": 27505 - }, - { - "epoch": 0.76, - "learning_rate": 2.437569565341477e-06, - "loss": 0.1096, - "step": 27510 - }, - { - "epoch": 0.76, - "learning_rate": 2.4361425839778536e-06, - "loss": 0.1442, - "step": 27515 - }, - { - "epoch": 0.76, - "learning_rate": 2.43471560261423e-06, - "loss": 0.106, - "step": 27520 - }, - { - "epoch": 0.76, - "learning_rate": 2.4332886212506067e-06, - "loss": 0.1568, - "step": 27525 - }, - { - "epoch": 0.76, - "learning_rate": 2.431861639886983e-06, - "loss": 0.096, - "step": 27530 - }, - { - "epoch": 0.76, - "learning_rate": 2.43043465852336e-06, - "loss": 0.0707, - "step": 27535 - }, - { - "epoch": 0.76, - "learning_rate": 2.4290076771597366e-06, - "loss": 0.2006, - "step": 27540 - }, - { - "epoch": 0.76, - "learning_rate": 2.4275806957961134e-06, - "loss": 0.2437, - "step": 27545 - }, - { - "epoch": 0.76, - "learning_rate": 2.4261537144324897e-06, - "loss": 0.2953, - "step": 27550 - }, - { - "epoch": 0.76, - "learning_rate": 2.424726733068866e-06, - "loss": 0.1089, - "step": 27555 - }, - { - "epoch": 0.76, - "learning_rate": 2.423299751705243e-06, - "loss": 0.1225, - "step": 27560 - }, - { - "epoch": 0.76, - "learning_rate": 2.4218727703416196e-06, - "loss": 0.1321, - "step": 27565 - }, - { - "epoch": 0.77, - "learning_rate": 2.4204457889779963e-06, - "loss": 0.1517, - "step": 27570 - }, - { - "epoch": 0.77, - "learning_rate": 2.4190188076143727e-06, - "loss": 0.1099, - "step": 27575 - }, - { - "epoch": 0.77, - "learning_rate": 2.4175918262507494e-06, - "loss": 0.1013, - "step": 27580 - }, - { - "epoch": 0.77, - "learning_rate": 2.416164844887126e-06, - "loss": 0.0818, - "step": 27585 - }, - { - "epoch": 0.77, - "learning_rate": 2.4147378635235025e-06, - "loss": 0.1875, - "step": 27590 - }, - { - "epoch": 0.77, - "learning_rate": 2.4133108821598793e-06, - "loss": 0.1188, - "step": 27595 - }, - { - "epoch": 0.77, - "learning_rate": 2.4118839007962556e-06, - "loss": 0.3558, - "step": 27600 - }, - { - "epoch": 0.77, - "learning_rate": 2.4104569194326324e-06, - "loss": 0.1315, - "step": 27605 - }, - { - "epoch": 0.77, - "learning_rate": 2.409029938069009e-06, - "loss": 0.1606, - "step": 27610 - }, - { - "epoch": 0.77, - "learning_rate": 2.407602956705386e-06, - "loss": 0.1286, - "step": 27615 - }, - { - "epoch": 0.77, - "learning_rate": 2.4061759753417623e-06, - "loss": 0.12, - "step": 27620 - }, - { - "epoch": 0.77, - "learning_rate": 2.4047489939781386e-06, - "loss": 0.027, - "step": 27625 - }, - { - "epoch": 0.77, - "learning_rate": 2.4033220126145154e-06, - "loss": 0.1582, - "step": 27630 - }, - { - "epoch": 0.77, - "learning_rate": 2.401895031250892e-06, - "loss": 0.0792, - "step": 27635 - }, - { - "epoch": 0.77, - "learning_rate": 2.400468049887269e-06, - "loss": 0.1332, - "step": 27640 - }, - { - "epoch": 0.77, - "learning_rate": 2.3990410685236452e-06, - "loss": 0.1546, - "step": 27645 - }, - { - "epoch": 0.77, - "learning_rate": 2.3976140871600216e-06, - "loss": 0.5325, - "step": 27650 - }, - { - "epoch": 0.77, - "learning_rate": 2.3961871057963983e-06, - "loss": 0.1191, - "step": 27655 - }, - { - "epoch": 0.77, - "learning_rate": 2.394760124432775e-06, - "loss": 0.1728, - "step": 27660 - }, - { - "epoch": 0.77, - "learning_rate": 2.393333143069152e-06, - "loss": 0.1316, - "step": 27665 - }, - { - "epoch": 0.77, - "learning_rate": 2.391906161705528e-06, - "loss": 0.1639, - "step": 27670 - }, - { - "epoch": 0.77, - "learning_rate": 2.390479180341905e-06, - "loss": 0.0454, - "step": 27675 - }, - { - "epoch": 0.77, - "learning_rate": 2.3890521989782817e-06, - "loss": 0.1234, - "step": 27680 - }, - { - "epoch": 0.77, - "learning_rate": 2.387625217614658e-06, - "loss": 0.1786, - "step": 27685 - }, - { - "epoch": 0.77, - "learning_rate": 2.386198236251035e-06, - "loss": 0.1624, - "step": 27690 - }, - { - "epoch": 0.77, - "learning_rate": 2.384771254887411e-06, - "loss": 0.193, - "step": 27695 - }, - { - "epoch": 0.77, - "learning_rate": 2.383344273523788e-06, - "loss": 0.3262, - "step": 27700 - }, - { - "epoch": 0.77, - "learning_rate": 2.3819172921601647e-06, - "loss": 0.1204, - "step": 27705 - }, - { - "epoch": 0.77, - "learning_rate": 2.3804903107965414e-06, - "loss": 0.063, - "step": 27710 - }, - { - "epoch": 0.77, - "learning_rate": 2.3790633294329178e-06, - "loss": 0.144, - "step": 27715 - }, - { - "epoch": 0.77, - "learning_rate": 2.3776363480692945e-06, - "loss": 0.1995, - "step": 27720 - }, - { - "epoch": 0.77, - "learning_rate": 2.376209366705671e-06, - "loss": 0.211, - "step": 27725 - }, - { - "epoch": 0.77, - "learning_rate": 2.3747823853420476e-06, - "loss": 0.09, - "step": 27730 - }, - { - "epoch": 0.77, - "learning_rate": 2.3733554039784244e-06, - "loss": 0.0303, - "step": 27735 - }, - { - "epoch": 0.77, - "learning_rate": 2.3719284226148007e-06, - "loss": 0.1759, - "step": 27740 - }, - { - "epoch": 0.77, - "learning_rate": 2.3705014412511775e-06, - "loss": 0.1973, - "step": 27745 - }, - { - "epoch": 0.77, - "learning_rate": 2.369074459887554e-06, - "loss": 0.422, - "step": 27750 - }, - { - "epoch": 0.77, - "learning_rate": 2.3676474785239306e-06, - "loss": 0.1344, - "step": 27755 - }, - { - "epoch": 0.77, - "learning_rate": 2.3662204971603074e-06, - "loss": 0.1056, - "step": 27760 - }, - { - "epoch": 0.77, - "learning_rate": 2.364793515796684e-06, - "loss": 0.1137, - "step": 27765 - }, - { - "epoch": 0.77, - "learning_rate": 2.3633665344330605e-06, - "loss": 0.0922, - "step": 27770 - }, - { - "epoch": 0.77, - "learning_rate": 2.3619395530694372e-06, - "loss": 0.1029, - "step": 27775 - }, - { - "epoch": 0.77, - "learning_rate": 2.3605125717058136e-06, - "loss": 0.1035, - "step": 27780 - }, - { - "epoch": 0.77, - "learning_rate": 2.3590855903421903e-06, - "loss": 0.1228, - "step": 27785 - }, - { - "epoch": 0.77, - "learning_rate": 2.357658608978567e-06, - "loss": 0.1267, - "step": 27790 - }, - { - "epoch": 0.77, - "learning_rate": 2.3562316276149434e-06, - "loss": 0.3028, - "step": 27795 - }, - { - "epoch": 0.77, - "learning_rate": 2.35480464625132e-06, - "loss": 0.3352, - "step": 27800 - }, - { - "epoch": 0.77, - "learning_rate": 2.353377664887697e-06, - "loss": 0.113, - "step": 27805 - }, - { - "epoch": 0.77, - "learning_rate": 2.3519506835240733e-06, - "loss": 0.1714, - "step": 27810 - }, - { - "epoch": 0.77, - "learning_rate": 2.35052370216045e-06, - "loss": 0.1211, - "step": 27815 - }, - { - "epoch": 0.77, - "learning_rate": 2.3490967207968264e-06, - "loss": 0.1798, - "step": 27820 - }, - { - "epoch": 0.77, - "learning_rate": 2.347669739433203e-06, - "loss": 0.1656, - "step": 27825 - }, - { - "epoch": 0.77, - "learning_rate": 2.34624275806958e-06, - "loss": 0.101, - "step": 27830 - }, - { - "epoch": 0.77, - "learning_rate": 2.3448157767059567e-06, - "loss": 0.0754, - "step": 27835 - }, - { - "epoch": 0.77, - "learning_rate": 2.343388795342333e-06, - "loss": 0.1488, - "step": 27840 - }, - { - "epoch": 0.77, - "learning_rate": 2.3419618139787094e-06, - "loss": 0.2053, - "step": 27845 - }, - { - "epoch": 0.77, - "learning_rate": 2.340534832615086e-06, - "loss": 0.3365, - "step": 27850 - }, - { - "epoch": 0.77, - "learning_rate": 2.339107851251463e-06, - "loss": 0.1392, - "step": 27855 - }, - { - "epoch": 0.77, - "learning_rate": 2.3376808698878396e-06, - "loss": 0.1091, - "step": 27860 - }, - { - "epoch": 0.77, - "learning_rate": 2.336253888524216e-06, - "loss": 0.1421, - "step": 27865 - }, - { - "epoch": 0.77, - "learning_rate": 2.3348269071605927e-06, - "loss": 0.1185, - "step": 27870 - }, - { - "epoch": 0.77, - "learning_rate": 2.333399925796969e-06, - "loss": 0.0654, - "step": 27875 - }, - { - "epoch": 0.77, - "learning_rate": 2.331972944433346e-06, - "loss": 0.1035, - "step": 27880 - }, - { - "epoch": 0.77, - "learning_rate": 2.3305459630697226e-06, - "loss": 0.1693, - "step": 27885 - }, - { - "epoch": 0.77, - "learning_rate": 2.329118981706099e-06, - "loss": 0.0753, - "step": 27890 - }, - { - "epoch": 0.77, - "learning_rate": 2.3276920003424757e-06, - "loss": 0.1208, - "step": 27895 - }, - { - "epoch": 0.77, - "learning_rate": 2.3262650189788525e-06, - "loss": 0.4328, - "step": 27900 - }, - { - "epoch": 0.77, - "learning_rate": 2.324838037615229e-06, - "loss": 0.0933, - "step": 27905 - }, - { - "epoch": 0.77, - "learning_rate": 2.3234110562516056e-06, - "loss": 0.1772, - "step": 27910 - }, - { - "epoch": 0.77, - "learning_rate": 2.321984074887982e-06, - "loss": 0.1042, - "step": 27915 - }, - { - "epoch": 0.77, - "learning_rate": 2.3205570935243587e-06, - "loss": 0.1693, - "step": 27920 - }, - { - "epoch": 0.77, - "learning_rate": 2.3191301121607354e-06, - "loss": 0.1167, - "step": 27925 - }, - { - "epoch": 0.77, - "learning_rate": 2.317703130797112e-06, - "loss": 0.0532, - "step": 27930 - }, - { - "epoch": 0.78, - "learning_rate": 2.3162761494334885e-06, - "loss": 0.0951, - "step": 27935 - }, - { - "epoch": 0.78, - "learning_rate": 2.3148491680698653e-06, - "loss": 0.086, - "step": 27940 - }, - { - "epoch": 0.78, - "learning_rate": 2.3134221867062416e-06, - "loss": 0.2343, - "step": 27945 - }, - { - "epoch": 0.78, - "learning_rate": 2.3119952053426184e-06, - "loss": 0.5699, - "step": 27950 - }, - { - "epoch": 0.78, - "learning_rate": 2.310568223978995e-06, - "loss": 0.2167, - "step": 27955 - }, - { - "epoch": 0.78, - "learning_rate": 2.3091412426153715e-06, - "loss": 0.1388, - "step": 27960 - }, - { - "epoch": 0.78, - "learning_rate": 2.3077142612517483e-06, - "loss": 0.1511, - "step": 27965 - }, - { - "epoch": 0.78, - "learning_rate": 2.3062872798881246e-06, - "loss": 0.1833, - "step": 27970 - }, - { - "epoch": 0.78, - "learning_rate": 2.3048602985245014e-06, - "loss": 0.1014, - "step": 27975 - }, - { - "epoch": 0.78, - "learning_rate": 2.303433317160878e-06, - "loss": 0.0743, - "step": 27980 - }, - { - "epoch": 0.78, - "learning_rate": 2.302006335797255e-06, - "loss": 0.097, - "step": 27985 - }, - { - "epoch": 0.78, - "learning_rate": 2.3005793544336312e-06, - "loss": 0.1605, - "step": 27990 - }, - { - "epoch": 0.78, - "learning_rate": 2.299152373070008e-06, - "loss": 0.2227, - "step": 27995 - }, - { - "epoch": 0.78, - "learning_rate": 2.2977253917063843e-06, - "loss": 0.1816, - "step": 28000 - }, - { - "epoch": 0.78, - "eval_loss": 0.05539175495505333, - "eval_runtime": 1838.9691, - "eval_samples_per_second": 8.71, - "eval_steps_per_second": 2.178, - "eval_wer": 0.16172015867291742, - "step": 28000 - }, - { - "epoch": 0.78, - "learning_rate": 2.296298410342761e-06, - "loss": 0.1441, - "step": 28005 - }, - { - "epoch": 0.78, - "learning_rate": 2.294871428979138e-06, - "loss": 0.1065, - "step": 28010 - }, - { - "epoch": 0.78, - "learning_rate": 2.293444447615514e-06, - "loss": 0.1141, - "step": 28015 - }, - { - "epoch": 0.78, - "learning_rate": 2.292017466251891e-06, - "loss": 0.3045, - "step": 28020 - }, - { - "epoch": 0.78, - "learning_rate": 2.2905904848882677e-06, - "loss": 0.1289, - "step": 28025 - }, - { - "epoch": 0.78, - "learning_rate": 2.2891635035246445e-06, - "loss": 0.1346, - "step": 28030 - }, - { - "epoch": 0.78, - "learning_rate": 2.287736522161021e-06, - "loss": 0.0897, - "step": 28035 - }, - { - "epoch": 0.78, - "learning_rate": 2.286309540797397e-06, - "loss": 0.1108, - "step": 28040 - }, - { - "epoch": 0.78, - "learning_rate": 2.284882559433774e-06, - "loss": 0.1147, - "step": 28045 - }, - { - "epoch": 0.78, - "learning_rate": 2.2834555780701507e-06, - "loss": 0.3611, - "step": 28050 - }, - { - "epoch": 0.78, - "learning_rate": 2.2820285967065274e-06, - "loss": 0.1684, - "step": 28055 - }, - { - "epoch": 0.78, - "learning_rate": 2.2806016153429038e-06, - "loss": 0.1289, - "step": 28060 - }, - { - "epoch": 0.78, - "learning_rate": 2.27917463397928e-06, - "loss": 0.2035, - "step": 28065 - }, - { - "epoch": 0.78, - "learning_rate": 2.277747652615657e-06, - "loss": 0.1857, - "step": 28070 - }, - { - "epoch": 0.78, - "learning_rate": 2.2763206712520336e-06, - "loss": 0.0604, - "step": 28075 - }, - { - "epoch": 0.78, - "learning_rate": 2.2748936898884104e-06, - "loss": 0.0587, - "step": 28080 - }, - { - "epoch": 0.78, - "learning_rate": 2.2734667085247867e-06, - "loss": 0.1677, - "step": 28085 - }, - { - "epoch": 0.78, - "learning_rate": 2.2720397271611635e-06, - "loss": 0.1768, - "step": 28090 - }, - { - "epoch": 0.78, - "learning_rate": 2.2706127457975403e-06, - "loss": 0.2347, - "step": 28095 - }, - { - "epoch": 0.78, - "learning_rate": 2.2691857644339166e-06, - "loss": 0.5117, - "step": 28100 - }, - { - "epoch": 0.78, - "learning_rate": 2.2677587830702934e-06, - "loss": 0.1398, - "step": 28105 - }, - { - "epoch": 0.78, - "learning_rate": 2.2663318017066697e-06, - "loss": 0.0991, - "step": 28110 - }, - { - "epoch": 0.78, - "learning_rate": 2.2649048203430465e-06, - "loss": 0.1617, - "step": 28115 - }, - { - "epoch": 0.78, - "learning_rate": 2.2634778389794232e-06, - "loss": 0.1641, - "step": 28120 - }, - { - "epoch": 0.78, - "learning_rate": 2.2620508576158e-06, - "loss": 0.1207, - "step": 28125 - }, - { - "epoch": 0.78, - "learning_rate": 2.2606238762521763e-06, - "loss": 0.0788, - "step": 28130 - }, - { - "epoch": 0.78, - "learning_rate": 2.2591968948885527e-06, - "loss": 0.2249, - "step": 28135 - }, - { - "epoch": 0.78, - "learning_rate": 2.2577699135249294e-06, - "loss": 0.2089, - "step": 28140 - }, - { - "epoch": 0.78, - "learning_rate": 2.256342932161306e-06, - "loss": 0.1748, - "step": 28145 - }, - { - "epoch": 0.78, - "learning_rate": 2.254915950797683e-06, - "loss": 0.3743, - "step": 28150 - }, - { - "epoch": 0.78, - "learning_rate": 2.2534889694340593e-06, - "loss": 0.1678, - "step": 28155 - }, - { - "epoch": 0.78, - "learning_rate": 2.252061988070436e-06, - "loss": 0.1129, - "step": 28160 - }, - { - "epoch": 0.78, - "learning_rate": 2.2506350067068124e-06, - "loss": 0.1907, - "step": 28165 - }, - { - "epoch": 0.78, - "learning_rate": 2.249208025343189e-06, - "loss": 0.1486, - "step": 28170 - }, - { - "epoch": 0.78, - "learning_rate": 2.247781043979566e-06, - "loss": 0.0594, - "step": 28175 - }, - { - "epoch": 0.78, - "learning_rate": 2.2463540626159423e-06, - "loss": 0.0934, - "step": 28180 - }, - { - "epoch": 0.78, - "learning_rate": 2.244927081252319e-06, - "loss": 0.0663, - "step": 28185 - }, - { - "epoch": 0.78, - "learning_rate": 2.2435000998886958e-06, - "loss": 0.0894, - "step": 28190 - }, - { - "epoch": 0.78, - "learning_rate": 2.242073118525072e-06, - "loss": 0.3374, - "step": 28195 - }, - { - "epoch": 0.78, - "learning_rate": 2.240646137161449e-06, - "loss": 0.3275, - "step": 28200 - }, - { - "epoch": 0.78, - "learning_rate": 2.2392191557978256e-06, - "loss": 0.077, - "step": 28205 - }, - { - "epoch": 0.78, - "learning_rate": 2.237792174434202e-06, - "loss": 0.1487, - "step": 28210 - }, - { - "epoch": 0.78, - "learning_rate": 2.2363651930705787e-06, - "loss": 0.1179, - "step": 28215 - }, - { - "epoch": 0.78, - "learning_rate": 2.2349382117069555e-06, - "loss": 0.1686, - "step": 28220 - }, - { - "epoch": 0.78, - "learning_rate": 2.233511230343332e-06, - "loss": 0.2046, - "step": 28225 - }, - { - "epoch": 0.78, - "learning_rate": 2.2320842489797086e-06, - "loss": 0.1222, - "step": 28230 - }, - { - "epoch": 0.78, - "learning_rate": 2.230657267616085e-06, - "loss": 0.0498, - "step": 28235 - }, - { - "epoch": 0.78, - "learning_rate": 2.2292302862524617e-06, - "loss": 0.1486, - "step": 28240 - }, - { - "epoch": 0.78, - "learning_rate": 2.2278033048888385e-06, - "loss": 0.2174, - "step": 28245 - }, - { - "epoch": 0.78, - "learning_rate": 2.2263763235252152e-06, - "loss": 0.5739, - "step": 28250 - }, - { - "epoch": 0.78, - "learning_rate": 2.2249493421615916e-06, - "loss": 0.1467, - "step": 28255 - }, - { - "epoch": 0.78, - "learning_rate": 2.223522360797968e-06, - "loss": 0.168, - "step": 28260 - }, - { - "epoch": 0.78, - "learning_rate": 2.2220953794343447e-06, - "loss": 0.1441, - "step": 28265 - }, - { - "epoch": 0.78, - "learning_rate": 2.2206683980707214e-06, - "loss": 0.2266, - "step": 28270 - }, - { - "epoch": 0.78, - "learning_rate": 2.219241416707098e-06, - "loss": 0.2335, - "step": 28275 - }, - { - "epoch": 0.78, - "learning_rate": 2.2178144353434745e-06, - "loss": 0.1233, - "step": 28280 - }, - { - "epoch": 0.78, - "learning_rate": 2.2163874539798513e-06, - "loss": 0.0237, - "step": 28285 - }, - { - "epoch": 0.78, - "learning_rate": 2.2149604726162276e-06, - "loss": 0.1866, - "step": 28290 - }, - { - "epoch": 0.79, - "learning_rate": 2.2135334912526044e-06, - "loss": 0.2368, - "step": 28295 - }, - { - "epoch": 0.79, - "learning_rate": 2.212106509888981e-06, - "loss": 0.466, - "step": 28300 - }, - { - "epoch": 0.79, - "learning_rate": 2.2106795285253575e-06, - "loss": 0.2206, - "step": 28305 - }, - { - "epoch": 0.79, - "learning_rate": 2.2092525471617343e-06, - "loss": 0.1756, - "step": 28310 - }, - { - "epoch": 0.79, - "learning_rate": 2.207825565798111e-06, - "loss": 0.1234, - "step": 28315 - }, - { - "epoch": 0.79, - "learning_rate": 2.2063985844344874e-06, - "loss": 0.1879, - "step": 28320 - }, - { - "epoch": 0.79, - "learning_rate": 2.204971603070864e-06, - "loss": 0.0889, - "step": 28325 - }, - { - "epoch": 0.79, - "learning_rate": 2.2035446217072405e-06, - "loss": 0.0262, - "step": 28330 - }, - { - "epoch": 0.79, - "learning_rate": 2.2021176403436172e-06, - "loss": 0.0909, - "step": 28335 - }, - { - "epoch": 0.79, - "learning_rate": 2.200690658979994e-06, - "loss": 0.2125, - "step": 28340 - }, - { - "epoch": 0.79, - "learning_rate": 2.1992636776163707e-06, - "loss": 0.1656, - "step": 28345 - }, - { - "epoch": 0.79, - "learning_rate": 2.197836696252747e-06, - "loss": 0.3062, - "step": 28350 - }, - { - "epoch": 0.79, - "learning_rate": 2.1964097148891234e-06, - "loss": 0.1637, - "step": 28355 - }, - { - "epoch": 0.79, - "learning_rate": 2.1949827335255e-06, - "loss": 0.1259, - "step": 28360 - }, - { - "epoch": 0.79, - "learning_rate": 2.193555752161877e-06, - "loss": 0.162, - "step": 28365 - }, - { - "epoch": 0.79, - "learning_rate": 2.1921287707982537e-06, - "loss": 0.1843, - "step": 28370 - }, - { - "epoch": 0.79, - "learning_rate": 2.19070178943463e-06, - "loss": 0.084, - "step": 28375 - }, - { - "epoch": 0.79, - "learning_rate": 2.189274808071007e-06, - "loss": 0.048, - "step": 28380 - }, - { - "epoch": 0.79, - "learning_rate": 2.187847826707383e-06, - "loss": 0.2166, - "step": 28385 - }, - { - "epoch": 0.79, - "learning_rate": 2.18642084534376e-06, - "loss": 0.1625, - "step": 28390 - }, - { - "epoch": 0.79, - "learning_rate": 2.1849938639801367e-06, - "loss": 0.1636, - "step": 28395 - }, - { - "epoch": 0.79, - "learning_rate": 2.1835668826165134e-06, - "loss": 0.5252, - "step": 28400 - }, - { - "epoch": 0.79, - "learning_rate": 2.1821399012528898e-06, - "loss": 0.1424, - "step": 28405 - }, - { - "epoch": 0.79, - "learning_rate": 2.1807129198892665e-06, - "loss": 0.1969, - "step": 28410 - }, - { - "epoch": 0.79, - "learning_rate": 2.179285938525643e-06, - "loss": 0.115, - "step": 28415 - }, - { - "epoch": 0.79, - "learning_rate": 2.1778589571620196e-06, - "loss": 0.1032, - "step": 28420 - }, - { - "epoch": 0.79, - "learning_rate": 2.1764319757983964e-06, - "loss": 0.0824, - "step": 28425 - }, - { - "epoch": 0.79, - "learning_rate": 2.1750049944347727e-06, - "loss": 0.0057, - "step": 28430 - }, - { - "epoch": 0.79, - "learning_rate": 2.1735780130711495e-06, - "loss": 0.152, - "step": 28435 - }, - { - "epoch": 0.79, - "learning_rate": 2.1721510317075263e-06, - "loss": 0.1678, - "step": 28440 - }, - { - "epoch": 0.79, - "learning_rate": 2.170724050343903e-06, - "loss": 0.3145, - "step": 28445 - }, - { - "epoch": 0.79, - "learning_rate": 2.1692970689802794e-06, - "loss": 0.3238, - "step": 28450 - }, - { - "epoch": 0.79, - "learning_rate": 2.1678700876166557e-06, - "loss": 0.1323, - "step": 28455 - }, - { - "epoch": 0.79, - "learning_rate": 2.1664431062530325e-06, - "loss": 0.1021, - "step": 28460 - }, - { - "epoch": 0.79, - "learning_rate": 2.1650161248894092e-06, - "loss": 0.1061, - "step": 28465 - }, - { - "epoch": 0.79, - "learning_rate": 2.163589143525786e-06, - "loss": 0.2099, - "step": 28470 - }, - { - "epoch": 0.79, - "learning_rate": 2.1621621621621623e-06, - "loss": 0.2323, - "step": 28475 - }, - { - "epoch": 0.79, - "learning_rate": 2.1607351807985387e-06, - "loss": 0.0497, - "step": 28480 - }, - { - "epoch": 0.79, - "learning_rate": 2.1593081994349154e-06, - "loss": 0.1263, - "step": 28485 - }, - { - "epoch": 0.79, - "learning_rate": 2.157881218071292e-06, - "loss": 0.1116, - "step": 28490 - }, - { - "epoch": 0.79, - "learning_rate": 2.156454236707669e-06, - "loss": 0.1851, - "step": 28495 - }, - { - "epoch": 0.79, - "learning_rate": 2.1550272553440453e-06, - "loss": 0.337, - "step": 28500 - }, - { - "epoch": 0.79, - "learning_rate": 2.153600273980422e-06, - "loss": 0.13, - "step": 28505 - }, - { - "epoch": 0.79, - "learning_rate": 2.1521732926167984e-06, - "loss": 0.0929, - "step": 28510 - }, - { - "epoch": 0.79, - "learning_rate": 2.150746311253175e-06, - "loss": 0.1028, - "step": 28515 - }, - { - "epoch": 0.79, - "learning_rate": 2.149319329889552e-06, - "loss": 0.1104, - "step": 28520 - }, - { - "epoch": 0.79, - "learning_rate": 2.1478923485259283e-06, - "loss": 0.1081, - "step": 28525 - }, - { - "epoch": 0.79, - "learning_rate": 2.146465367162305e-06, - "loss": 0.1647, - "step": 28530 - }, - { - "epoch": 0.79, - "learning_rate": 2.1450383857986818e-06, - "loss": 0.0791, - "step": 28535 - }, - { - "epoch": 0.79, - "learning_rate": 2.1436114044350585e-06, - "loss": 0.2013, - "step": 28540 - }, - { - "epoch": 0.79, - "learning_rate": 2.142184423071435e-06, - "loss": 0.0707, - "step": 28545 - }, - { - "epoch": 0.79, - "learning_rate": 2.1407574417078112e-06, - "loss": 0.4112, - "step": 28550 - }, - { - "epoch": 0.79, - "learning_rate": 2.139330460344188e-06, - "loss": 0.1367, - "step": 28555 - }, - { - "epoch": 0.79, - "learning_rate": 2.1379034789805647e-06, - "loss": 0.1587, - "step": 28560 - }, - { - "epoch": 0.79, - "learning_rate": 2.1364764976169415e-06, - "loss": 0.1337, - "step": 28565 - }, - { - "epoch": 0.79, - "learning_rate": 2.135049516253318e-06, - "loss": 0.1745, - "step": 28570 - }, - { - "epoch": 0.79, - "learning_rate": 2.1336225348896946e-06, - "loss": 0.0903, - "step": 28575 - }, - { - "epoch": 0.79, - "learning_rate": 2.132195553526071e-06, - "loss": 0.0845, - "step": 28580 - }, - { - "epoch": 0.79, - "learning_rate": 2.1307685721624477e-06, - "loss": 0.0549, - "step": 28585 - }, - { - "epoch": 0.79, - "learning_rate": 2.1293415907988245e-06, - "loss": 0.1265, - "step": 28590 - }, - { - "epoch": 0.79, - "learning_rate": 2.127914609435201e-06, - "loss": 0.2066, - "step": 28595 - }, - { - "epoch": 0.79, - "learning_rate": 2.1264876280715776e-06, - "loss": 0.4262, - "step": 28600 - }, - { - "epoch": 0.79, - "learning_rate": 2.125060646707954e-06, - "loss": 0.0848, - "step": 28605 - }, - { - "epoch": 0.79, - "learning_rate": 2.1236336653443307e-06, - "loss": 0.1373, - "step": 28610 - }, - { - "epoch": 0.79, - "learning_rate": 2.1222066839807074e-06, - "loss": 0.1562, - "step": 28615 - }, - { - "epoch": 0.79, - "learning_rate": 2.120779702617084e-06, - "loss": 0.1411, - "step": 28620 - }, - { - "epoch": 0.79, - "learning_rate": 2.1193527212534605e-06, - "loss": 0.1259, - "step": 28625 - }, - { - "epoch": 0.79, - "learning_rate": 2.1179257398898373e-06, - "loss": 0.0769, - "step": 28630 - }, - { - "epoch": 0.79, - "learning_rate": 2.116498758526214e-06, - "loss": 0.1427, - "step": 28635 - }, - { - "epoch": 0.79, - "learning_rate": 2.1150717771625904e-06, - "loss": 0.127, - "step": 28640 - }, - { - "epoch": 0.79, - "learning_rate": 2.113644795798967e-06, - "loss": 0.3177, - "step": 28645 - }, - { - "epoch": 0.79, - "learning_rate": 2.1122178144353435e-06, - "loss": 0.2704, - "step": 28650 - }, - { - "epoch": 0.8, - "learning_rate": 2.1107908330717203e-06, - "loss": 0.1654, - "step": 28655 - }, - { - "epoch": 0.8, - "learning_rate": 2.109363851708097e-06, - "loss": 0.1295, - "step": 28660 - }, - { - "epoch": 0.8, - "learning_rate": 2.1079368703444738e-06, - "loss": 0.1461, - "step": 28665 - }, - { - "epoch": 0.8, - "learning_rate": 2.10650988898085e-06, - "loss": 0.1282, - "step": 28670 - }, - { - "epoch": 0.8, - "learning_rate": 2.1050829076172265e-06, - "loss": 0.0971, - "step": 28675 - }, - { - "epoch": 0.8, - "learning_rate": 2.1036559262536032e-06, - "loss": 0.0834, - "step": 28680 - }, - { - "epoch": 0.8, - "learning_rate": 2.10222894488998e-06, - "loss": 0.1027, - "step": 28685 - }, - { - "epoch": 0.8, - "learning_rate": 2.1008019635263567e-06, - "loss": 0.1586, - "step": 28690 - }, - { - "epoch": 0.8, - "learning_rate": 2.099374982162733e-06, - "loss": 0.3027, - "step": 28695 - }, - { - "epoch": 0.8, - "learning_rate": 2.09794800079911e-06, - "loss": 0.2732, - "step": 28700 - }, - { - "epoch": 0.8, - "learning_rate": 2.096521019435486e-06, - "loss": 0.0897, - "step": 28705 - }, - { - "epoch": 0.8, - "learning_rate": 2.095094038071863e-06, - "loss": 0.1643, - "step": 28710 - }, - { - "epoch": 0.8, - "learning_rate": 2.0936670567082397e-06, - "loss": 0.1752, - "step": 28715 - }, - { - "epoch": 0.8, - "learning_rate": 2.092240075344616e-06, - "loss": 0.1947, - "step": 28720 - }, - { - "epoch": 0.8, - "learning_rate": 2.090813093980993e-06, - "loss": 0.206, - "step": 28725 - }, - { - "epoch": 0.8, - "learning_rate": 2.0893861126173696e-06, - "loss": 0.0614, - "step": 28730 - }, - { - "epoch": 0.8, - "learning_rate": 2.087959131253746e-06, - "loss": 0.1007, - "step": 28735 - }, - { - "epoch": 0.8, - "learning_rate": 2.0865321498901227e-06, - "loss": 0.2373, - "step": 28740 - }, - { - "epoch": 0.8, - "learning_rate": 2.085390564799224e-06, - "loss": 0.8765, - "step": 28745 - }, - { - "epoch": 0.8, - "learning_rate": 2.0839635834356007e-06, - "loss": 0.4749, - "step": 28750 - }, - { - "epoch": 0.8, - "learning_rate": 2.082536602071977e-06, - "loss": 0.1613, - "step": 28755 - }, - { - "epoch": 0.8, - "learning_rate": 2.0811096207083538e-06, - "loss": 0.1467, - "step": 28760 - }, - { - "epoch": 0.8, - "learning_rate": 2.07968263934473e-06, - "loss": 0.1365, - "step": 28765 - }, - { - "epoch": 0.8, - "learning_rate": 2.078255657981107e-06, - "loss": 0.1313, - "step": 28770 - }, - { - "epoch": 0.8, - "learning_rate": 2.0768286766174836e-06, - "loss": 0.1381, - "step": 28775 - }, - { - "epoch": 0.8, - "learning_rate": 2.0754016952538604e-06, - "loss": 0.1045, - "step": 28780 - }, - { - "epoch": 0.8, - "learning_rate": 2.0739747138902367e-06, - "loss": 0.1228, - "step": 28785 - }, - { - "epoch": 0.8, - "learning_rate": 2.072547732526613e-06, - "loss": 0.1446, - "step": 28790 - }, - { - "epoch": 0.8, - "learning_rate": 2.07112075116299e-06, - "loss": 0.186, - "step": 28795 - }, - { - "epoch": 0.8, - "learning_rate": 2.0696937697993666e-06, - "loss": 0.3615, - "step": 28800 - }, - { - "epoch": 0.8, - "learning_rate": 2.0682667884357434e-06, - "loss": 0.1192, - "step": 28805 - }, - { - "epoch": 0.8, - "learning_rate": 2.0668398070721197e-06, - "loss": 0.1187, - "step": 28810 - }, - { - "epoch": 0.8, - "learning_rate": 2.0654128257084965e-06, - "loss": 0.15, - "step": 28815 - }, - { - "epoch": 0.8, - "learning_rate": 2.063985844344873e-06, - "loss": 0.123, - "step": 28820 - }, - { - "epoch": 0.8, - "learning_rate": 2.0625588629812496e-06, - "loss": 0.1635, - "step": 28825 - }, - { - "epoch": 0.8, - "learning_rate": 2.0611318816176263e-06, - "loss": 0.1189, - "step": 28830 - }, - { - "epoch": 0.8, - "learning_rate": 2.059704900254003e-06, - "loss": 0.0586, - "step": 28835 - }, - { - "epoch": 0.8, - "learning_rate": 2.0582779188903794e-06, - "loss": 0.0981, - "step": 28840 - }, - { - "epoch": 0.8, - "learning_rate": 2.056850937526756e-06, - "loss": 0.0877, - "step": 28845 - }, - { - "epoch": 0.8, - "learning_rate": 2.0554239561631325e-06, - "loss": 0.4166, - "step": 28850 - }, - { - "epoch": 0.8, - "learning_rate": 2.0539969747995093e-06, - "loss": 0.1074, - "step": 28855 - }, - { - "epoch": 0.8, - "learning_rate": 2.052569993435886e-06, - "loss": 0.1494, - "step": 28860 - }, - { - "epoch": 0.8, - "learning_rate": 2.0511430120722624e-06, - "loss": 0.1262, - "step": 28865 - }, - { - "epoch": 0.8, - "learning_rate": 2.049716030708639e-06, - "loss": 0.1526, - "step": 28870 - }, - { - "epoch": 0.8, - "learning_rate": 2.048289049345016e-06, - "loss": 0.1377, - "step": 28875 - }, - { - "epoch": 0.8, - "learning_rate": 2.0468620679813923e-06, - "loss": 0.0577, - "step": 28880 - }, - { - "epoch": 0.8, - "learning_rate": 2.045435086617769e-06, - "loss": 0.0924, - "step": 28885 - }, - { - "epoch": 0.8, - "learning_rate": 2.0440081052541454e-06, - "loss": 0.1076, - "step": 28890 - }, - { - "epoch": 0.8, - "learning_rate": 2.042581123890522e-06, - "loss": 0.1331, - "step": 28895 - }, - { - "epoch": 0.8, - "learning_rate": 2.041154142526899e-06, - "loss": 0.2208, - "step": 28900 - }, - { - "epoch": 0.8, - "learning_rate": 2.0397271611632756e-06, - "loss": 0.0929, - "step": 28905 - }, - { - "epoch": 0.8, - "learning_rate": 2.038300179799652e-06, - "loss": 0.1111, - "step": 28910 - }, - { - "epoch": 0.8, - "learning_rate": 2.0368731984360283e-06, - "loss": 0.1567, - "step": 28915 - }, - { - "epoch": 0.8, - "learning_rate": 2.035446217072405e-06, - "loss": 0.1782, - "step": 28920 - }, - { - "epoch": 0.8, - "learning_rate": 2.034019235708782e-06, - "loss": 0.1117, - "step": 28925 - }, - { - "epoch": 0.8, - "learning_rate": 2.0325922543451586e-06, - "loss": 0.0977, - "step": 28930 - }, - { - "epoch": 0.8, - "learning_rate": 2.031165272981535e-06, - "loss": 0.105, - "step": 28935 - }, - { - "epoch": 0.8, - "learning_rate": 2.0297382916179117e-06, - "loss": 0.328, - "step": 28940 - }, - { - "epoch": 0.8, - "learning_rate": 2.028311310254288e-06, - "loss": 0.1402, - "step": 28945 - }, - { - "epoch": 0.8, - "learning_rate": 2.026884328890665e-06, - "loss": 0.2992, - "step": 28950 - }, - { - "epoch": 0.8, - "learning_rate": 2.0254573475270416e-06, - "loss": 0.1506, - "step": 28955 - }, - { - "epoch": 0.8, - "learning_rate": 2.024030366163418e-06, - "loss": 0.1239, - "step": 28960 - }, - { - "epoch": 0.8, - "learning_rate": 2.0226033847997947e-06, - "loss": 0.1656, - "step": 28965 - }, - { - "epoch": 0.8, - "learning_rate": 2.0211764034361714e-06, - "loss": 0.11, - "step": 28970 - }, - { - "epoch": 0.8, - "learning_rate": 2.0197494220725478e-06, - "loss": 0.1406, - "step": 28975 - }, - { - "epoch": 0.8, - "learning_rate": 2.0183224407089245e-06, - "loss": 0.1073, - "step": 28980 - }, - { - "epoch": 0.8, - "learning_rate": 2.016895459345301e-06, - "loss": 0.1071, - "step": 28985 - }, - { - "epoch": 0.8, - "learning_rate": 2.0154684779816776e-06, - "loss": 0.2867, - "step": 28990 - }, - { - "epoch": 0.8, - "learning_rate": 2.0140414966180544e-06, - "loss": 0.2095, - "step": 28995 - }, - { - "epoch": 0.8, - "learning_rate": 2.012614515254431e-06, - "loss": 0.412, - "step": 29000 - }, - { - "epoch": 0.8, - "learning_rate": 2.0111875338908075e-06, - "loss": 0.0761, - "step": 29005 - }, - { - "epoch": 0.8, - "learning_rate": 2.009760552527184e-06, - "loss": 0.167, - "step": 29010 - }, - { - "epoch": 0.81, - "learning_rate": 2.0083335711635606e-06, - "loss": 0.1434, - "step": 29015 - }, - { - "epoch": 0.81, - "learning_rate": 2.0069065897999374e-06, - "loss": 0.1703, - "step": 29020 - }, - { - "epoch": 0.81, - "learning_rate": 2.005479608436314e-06, - "loss": 0.1315, - "step": 29025 - }, - { - "epoch": 0.81, - "learning_rate": 2.0040526270726905e-06, - "loss": 0.0482, - "step": 29030 - }, - { - "epoch": 0.81, - "learning_rate": 2.0026256457090672e-06, - "loss": 0.0902, - "step": 29035 - }, - { - "epoch": 0.81, - "learning_rate": 2.0011986643454436e-06, - "loss": 0.13, - "step": 29040 - }, - { - "epoch": 0.81, - "learning_rate": 1.9997716829818203e-06, - "loss": 0.1629, - "step": 29045 - }, - { - "epoch": 0.81, - "learning_rate": 1.998344701618197e-06, - "loss": 0.306, - "step": 29050 - }, - { - "epoch": 0.81, - "learning_rate": 1.996917720254574e-06, - "loss": 0.1238, - "step": 29055 - }, - { - "epoch": 0.81, - "learning_rate": 1.99549073889095e-06, - "loss": 0.1279, - "step": 29060 - }, - { - "epoch": 0.81, - "learning_rate": 1.994063757527327e-06, - "loss": 0.1375, - "step": 29065 - }, - { - "epoch": 0.81, - "learning_rate": 1.9926367761637037e-06, - "loss": 0.1839, - "step": 29070 - }, - { - "epoch": 0.81, - "learning_rate": 1.99120979480008e-06, - "loss": 0.1504, - "step": 29075 - }, - { - "epoch": 0.81, - "learning_rate": 1.989782813436457e-06, - "loss": 0.0427, - "step": 29080 - }, - { - "epoch": 0.81, - "learning_rate": 1.988355832072833e-06, - "loss": 0.1892, - "step": 29085 - }, - { - "epoch": 0.81, - "learning_rate": 1.98692885070921e-06, - "loss": 0.1265, - "step": 29090 - }, - { - "epoch": 0.81, - "learning_rate": 1.9855018693455867e-06, - "loss": 0.1475, - "step": 29095 - }, - { - "epoch": 0.81, - "learning_rate": 1.9840748879819634e-06, - "loss": 0.1996, - "step": 29100 - }, - { - "epoch": 0.81, - "learning_rate": 1.9826479066183398e-06, - "loss": 0.1312, - "step": 29105 - }, - { - "epoch": 0.81, - "learning_rate": 1.981220925254716e-06, - "loss": 0.1338, - "step": 29110 - }, - { - "epoch": 0.81, - "learning_rate": 1.979793943891093e-06, - "loss": 0.1202, - "step": 29115 - }, - { - "epoch": 0.81, - "learning_rate": 1.9783669625274696e-06, - "loss": 0.1662, - "step": 29120 - }, - { - "epoch": 0.81, - "learning_rate": 1.9769399811638464e-06, - "loss": 0.176, - "step": 29125 - }, - { - "epoch": 0.81, - "learning_rate": 1.9755129998002227e-06, - "loss": 0.0265, - "step": 29130 - }, - { - "epoch": 0.81, - "learning_rate": 1.974086018436599e-06, - "loss": 0.0414, - "step": 29135 - }, - { - "epoch": 0.81, - "learning_rate": 1.972659037072976e-06, - "loss": 0.1461, - "step": 29140 - }, - { - "epoch": 0.81, - "learning_rate": 1.9712320557093526e-06, - "loss": 0.2434, - "step": 29145 - }, - { - "epoch": 0.81, - "learning_rate": 1.9698050743457294e-06, - "loss": 0.2549, - "step": 29150 - }, - { - "epoch": 0.81, - "learning_rate": 1.9683780929821057e-06, - "loss": 0.1046, - "step": 29155 - }, - { - "epoch": 0.81, - "learning_rate": 1.9669511116184825e-06, - "loss": 0.1638, - "step": 29160 - }, - { - "epoch": 0.81, - "learning_rate": 1.9655241302548592e-06, - "loss": 0.2054, - "step": 29165 - }, - { - "epoch": 0.81, - "learning_rate": 1.9640971488912356e-06, - "loss": 0.1687, - "step": 29170 - }, - { - "epoch": 0.81, - "learning_rate": 1.9626701675276123e-06, - "loss": 0.182, - "step": 29175 - }, - { - "epoch": 0.81, - "learning_rate": 1.9612431861639887e-06, - "loss": 0.0696, - "step": 29180 - }, - { - "epoch": 0.81, - "learning_rate": 1.9598162048003654e-06, - "loss": 0.0819, - "step": 29185 - }, - { - "epoch": 0.81, - "learning_rate": 1.958389223436742e-06, - "loss": 0.0868, - "step": 29190 - }, - { - "epoch": 0.81, - "learning_rate": 1.956962242073119e-06, - "loss": 0.1614, - "step": 29195 - }, - { - "epoch": 0.81, - "learning_rate": 1.9555352607094953e-06, - "loss": 0.2675, - "step": 29200 - }, - { - "epoch": 0.81, - "learning_rate": 1.9541082793458716e-06, - "loss": 0.1194, - "step": 29205 - }, - { - "epoch": 0.81, - "learning_rate": 1.9526812979822484e-06, - "loss": 0.1698, - "step": 29210 - }, - { - "epoch": 0.81, - "learning_rate": 1.951254316618625e-06, - "loss": 0.1408, - "step": 29215 - }, - { - "epoch": 0.81, - "learning_rate": 1.949827335255002e-06, - "loss": 0.1261, - "step": 29220 - }, - { - "epoch": 0.81, - "learning_rate": 1.9484003538913783e-06, - "loss": 0.0789, - "step": 29225 - }, - { - "epoch": 0.81, - "learning_rate": 1.946973372527755e-06, - "loss": 0.1169, - "step": 29230 - }, - { - "epoch": 0.81, - "learning_rate": 1.9455463911641314e-06, - "loss": 0.0752, - "step": 29235 - }, - { - "epoch": 0.81, - "learning_rate": 1.944119409800508e-06, - "loss": 0.1521, - "step": 29240 - }, - { - "epoch": 0.81, - "learning_rate": 1.942692428436885e-06, - "loss": 0.1285, - "step": 29245 - }, - { - "epoch": 0.81, - "learning_rate": 1.9412654470732612e-06, - "loss": 0.3726, - "step": 29250 - }, - { - "epoch": 0.81, - "learning_rate": 1.939838465709638e-06, - "loss": 0.1007, - "step": 29255 - }, - { - "epoch": 0.81, - "learning_rate": 1.9384114843460147e-06, - "loss": 0.1351, - "step": 29260 - }, - { - "epoch": 0.81, - "learning_rate": 1.936984502982391e-06, - "loss": 0.1856, - "step": 29265 - }, - { - "epoch": 0.81, - "learning_rate": 1.935557521618768e-06, - "loss": 0.1899, - "step": 29270 - }, - { - "epoch": 0.81, - "learning_rate": 1.9341305402551446e-06, - "loss": 0.1647, - "step": 29275 - }, - { - "epoch": 0.81, - "learning_rate": 1.932703558891521e-06, - "loss": 0.1379, - "step": 29280 - }, - { - "epoch": 0.81, - "learning_rate": 1.9312765775278977e-06, - "loss": 0.1229, - "step": 29285 - }, - { - "epoch": 0.81, - "learning_rate": 1.9298495961642745e-06, - "loss": 0.1981, - "step": 29290 - }, - { - "epoch": 0.81, - "learning_rate": 1.928422614800651e-06, - "loss": 0.1811, - "step": 29295 - }, - { - "epoch": 0.81, - "learning_rate": 1.9269956334370276e-06, - "loss": 0.3038, - "step": 29300 - }, - { - "epoch": 0.81, - "learning_rate": 1.925568652073404e-06, - "loss": 0.0714, - "step": 29305 - }, - { - "epoch": 0.81, - "learning_rate": 1.9241416707097807e-06, - "loss": 0.1724, - "step": 29310 - }, - { - "epoch": 0.81, - "learning_rate": 1.9227146893461574e-06, - "loss": 0.1529, - "step": 29315 - }, - { - "epoch": 0.81, - "learning_rate": 1.921287707982534e-06, - "loss": 0.1615, - "step": 29320 - }, - { - "epoch": 0.81, - "learning_rate": 1.9198607266189105e-06, - "loss": 0.1092, - "step": 29325 - }, - { - "epoch": 0.81, - "learning_rate": 1.918433745255287e-06, - "loss": 0.0957, - "step": 29330 - }, - { - "epoch": 0.81, - "learning_rate": 1.9170067638916636e-06, - "loss": 0.1288, - "step": 29335 - }, - { - "epoch": 0.81, - "learning_rate": 1.9155797825280404e-06, - "loss": 0.1648, - "step": 29340 - }, - { - "epoch": 0.81, - "learning_rate": 1.914152801164417e-06, - "loss": 0.1914, - "step": 29345 - }, - { - "epoch": 0.81, - "learning_rate": 1.9127258198007935e-06, - "loss": 0.3363, - "step": 29350 - }, - { - "epoch": 0.81, - "learning_rate": 1.9112988384371703e-06, - "loss": 0.1357, - "step": 29355 - }, - { - "epoch": 0.81, - "learning_rate": 1.9098718570735466e-06, - "loss": 0.1336, - "step": 29360 - }, - { - "epoch": 0.81, - "learning_rate": 1.9084448757099234e-06, - "loss": 0.1413, - "step": 29365 - }, - { - "epoch": 0.81, - "learning_rate": 1.9070178943463e-06, - "loss": 0.1587, - "step": 29370 - }, - { - "epoch": 0.82, - "learning_rate": 1.9055909129826767e-06, - "loss": 0.2068, - "step": 29375 - }, - { - "epoch": 0.82, - "learning_rate": 1.9041639316190532e-06, - "loss": 0.0638, - "step": 29380 - }, - { - "epoch": 0.82, - "learning_rate": 1.90273695025543e-06, - "loss": 0.3071, - "step": 29385 - }, - { - "epoch": 0.82, - "learning_rate": 1.9013099688918063e-06, - "loss": 0.0693, - "step": 29390 - }, - { - "epoch": 0.82, - "learning_rate": 1.8998829875281829e-06, - "loss": 0.1451, - "step": 29395 - }, - { - "epoch": 0.82, - "learning_rate": 1.8984560061645596e-06, - "loss": 0.2641, - "step": 29400 - }, - { - "epoch": 0.82, - "learning_rate": 1.8970290248009362e-06, - "loss": 0.1411, - "step": 29405 - }, - { - "epoch": 0.82, - "learning_rate": 1.895602043437313e-06, - "loss": 0.1326, - "step": 29410 - }, - { - "epoch": 0.82, - "learning_rate": 1.8941750620736895e-06, - "loss": 0.1322, - "step": 29415 - }, - { - "epoch": 0.82, - "learning_rate": 1.8927480807100663e-06, - "loss": 0.1163, - "step": 29420 - }, - { - "epoch": 0.82, - "learning_rate": 1.8913210993464426e-06, - "loss": 0.1126, - "step": 29425 - }, - { - "epoch": 0.82, - "learning_rate": 1.8898941179828192e-06, - "loss": 0.0469, - "step": 29430 - }, - { - "epoch": 0.82, - "learning_rate": 1.888467136619196e-06, - "loss": 0.0579, - "step": 29435 - }, - { - "epoch": 0.82, - "learning_rate": 1.8870401552555725e-06, - "loss": 0.1405, - "step": 29440 - }, - { - "epoch": 0.82, - "learning_rate": 1.8856131738919492e-06, - "loss": 0.3488, - "step": 29445 - }, - { - "epoch": 0.82, - "learning_rate": 1.8841861925283258e-06, - "loss": 0.4339, - "step": 29450 - }, - { - "epoch": 0.82, - "learning_rate": 1.8827592111647023e-06, - "loss": 0.2233, - "step": 29455 - }, - { - "epoch": 0.82, - "learning_rate": 1.8813322298010789e-06, - "loss": 0.153, - "step": 29460 - }, - { - "epoch": 0.82, - "learning_rate": 1.8799052484374554e-06, - "loss": 0.1254, - "step": 29465 - }, - { - "epoch": 0.82, - "learning_rate": 1.8784782670738322e-06, - "loss": 0.1401, - "step": 29470 - }, - { - "epoch": 0.82, - "learning_rate": 1.8770512857102087e-06, - "loss": 0.0785, - "step": 29475 - }, - { - "epoch": 0.82, - "learning_rate": 1.8756243043465855e-06, - "loss": 0.1434, - "step": 29480 - }, - { - "epoch": 0.82, - "learning_rate": 1.8741973229829618e-06, - "loss": 0.1638, - "step": 29485 - }, - { - "epoch": 0.82, - "learning_rate": 1.8727703416193386e-06, - "loss": 0.254, - "step": 29490 - }, - { - "epoch": 0.82, - "learning_rate": 1.8713433602557152e-06, - "loss": 0.1793, - "step": 29495 - }, - { - "epoch": 0.82, - "learning_rate": 1.869916378892092e-06, - "loss": 0.4827, - "step": 29500 - }, - { - "epoch": 0.82, - "learning_rate": 1.8684893975284685e-06, - "loss": 0.1294, - "step": 29505 - }, - { - "epoch": 0.82, - "learning_rate": 1.8670624161648452e-06, - "loss": 0.1245, - "step": 29510 - }, - { - "epoch": 0.82, - "learning_rate": 1.8656354348012218e-06, - "loss": 0.2984, - "step": 29515 - }, - { - "epoch": 0.82, - "learning_rate": 1.8642084534375981e-06, - "loss": 0.1426, - "step": 29520 - }, - { - "epoch": 0.82, - "learning_rate": 1.8627814720739749e-06, - "loss": 0.0468, - "step": 29525 - }, - { - "epoch": 0.82, - "learning_rate": 1.8613544907103514e-06, - "loss": 0.0844, - "step": 29530 - }, - { - "epoch": 0.82, - "learning_rate": 1.8599275093467282e-06, - "loss": 0.0907, - "step": 29535 - }, - { - "epoch": 0.82, - "learning_rate": 1.8585005279831047e-06, - "loss": 0.1162, - "step": 29540 - }, - { - "epoch": 0.82, - "learning_rate": 1.8570735466194815e-06, - "loss": 0.2419, - "step": 29545 - }, - { - "epoch": 0.82, - "learning_rate": 1.8556465652558578e-06, - "loss": 0.3571, - "step": 29550 - }, - { - "epoch": 0.82, - "learning_rate": 1.8542195838922344e-06, - "loss": 0.1416, - "step": 29555 - }, - { - "epoch": 0.82, - "learning_rate": 1.8527926025286112e-06, - "loss": 0.1364, - "step": 29560 - }, - { - "epoch": 0.82, - "learning_rate": 1.8513656211649877e-06, - "loss": 0.1309, - "step": 29565 - }, - { - "epoch": 0.82, - "learning_rate": 1.8499386398013645e-06, - "loss": 0.1941, - "step": 29570 - }, - { - "epoch": 0.82, - "learning_rate": 1.848511658437741e-06, - "loss": 0.162, - "step": 29575 - }, - { - "epoch": 0.82, - "learning_rate": 1.8470846770741174e-06, - "loss": 0.0987, - "step": 29580 - }, - { - "epoch": 0.82, - "learning_rate": 1.8456576957104941e-06, - "loss": 0.1344, - "step": 29585 - }, - { - "epoch": 0.82, - "learning_rate": 1.8442307143468707e-06, - "loss": 0.1251, - "step": 29590 - }, - { - "epoch": 0.82, - "learning_rate": 1.8428037329832474e-06, - "loss": 0.1892, - "step": 29595 - }, - { - "epoch": 0.82, - "learning_rate": 1.841376751619624e-06, - "loss": 0.5304, - "step": 29600 - }, - { - "epoch": 0.82, - "learning_rate": 1.8399497702560007e-06, - "loss": 0.144, - "step": 29605 - }, - { - "epoch": 0.82, - "learning_rate": 1.8385227888923773e-06, - "loss": 0.1337, - "step": 29610 - }, - { - "epoch": 0.82, - "learning_rate": 1.8370958075287536e-06, - "loss": 0.1263, - "step": 29615 - }, - { - "epoch": 0.82, - "learning_rate": 1.8356688261651304e-06, - "loss": 0.1888, - "step": 29620 - }, - { - "epoch": 0.82, - "learning_rate": 1.834241844801507e-06, - "loss": 0.1318, - "step": 29625 - }, - { - "epoch": 0.82, - "learning_rate": 1.8328148634378837e-06, - "loss": 0.1316, - "step": 29630 - }, - { - "epoch": 0.82, - "learning_rate": 1.8313878820742603e-06, - "loss": 0.0733, - "step": 29635 - }, - { - "epoch": 0.82, - "learning_rate": 1.829960900710637e-06, - "loss": 0.1689, - "step": 29640 - }, - { - "epoch": 0.82, - "learning_rate": 1.8285339193470134e-06, - "loss": 0.1285, - "step": 29645 - }, - { - "epoch": 0.82, - "learning_rate": 1.82710693798339e-06, - "loss": 0.4993, - "step": 29650 - }, - { - "epoch": 0.82, - "learning_rate": 1.8256799566197667e-06, - "loss": 0.1109, - "step": 29655 - }, - { - "epoch": 0.82, - "learning_rate": 1.8242529752561432e-06, - "loss": 0.1775, - "step": 29660 - }, - { - "epoch": 0.82, - "learning_rate": 1.82282599389252e-06, - "loss": 0.1561, - "step": 29665 - }, - { - "epoch": 0.82, - "learning_rate": 1.8213990125288965e-06, - "loss": 0.0936, - "step": 29670 - }, - { - "epoch": 0.82, - "learning_rate": 1.8199720311652733e-06, - "loss": 0.0657, - "step": 29675 - }, - { - "epoch": 0.82, - "learning_rate": 1.8185450498016496e-06, - "loss": 0.0613, - "step": 29680 - }, - { - "epoch": 0.82, - "learning_rate": 1.8171180684380262e-06, - "loss": 0.088, - "step": 29685 - }, - { - "epoch": 0.82, - "learning_rate": 1.815691087074403e-06, - "loss": 0.0859, - "step": 29690 - }, - { - "epoch": 0.82, - "learning_rate": 1.8142641057107795e-06, - "loss": 0.203, - "step": 29695 - }, - { - "epoch": 0.82, - "learning_rate": 1.8128371243471563e-06, - "loss": 0.3191, - "step": 29700 - }, - { - "epoch": 0.82, - "learning_rate": 1.8114101429835328e-06, - "loss": 0.1306, - "step": 29705 - }, - { - "epoch": 0.82, - "learning_rate": 1.8099831616199094e-06, - "loss": 0.1267, - "step": 29710 - }, - { - "epoch": 0.82, - "learning_rate": 1.808556180256286e-06, - "loss": 0.1168, - "step": 29715 - }, - { - "epoch": 0.82, - "learning_rate": 1.8071291988926627e-06, - "loss": 0.1634, - "step": 29720 - }, - { - "epoch": 0.82, - "learning_rate": 1.8057022175290392e-06, - "loss": 0.1051, - "step": 29725 - }, - { - "epoch": 0.82, - "learning_rate": 1.804275236165416e-06, - "loss": 0.0556, - "step": 29730 - }, - { - "epoch": 0.83, - "learning_rate": 1.8028482548017925e-06, - "loss": 0.0653, - "step": 29735 - }, - { - "epoch": 0.83, - "learning_rate": 1.8014212734381689e-06, - "loss": 0.2693, - "step": 29740 - }, - { - "epoch": 0.83, - "learning_rate": 1.7999942920745456e-06, - "loss": 0.1349, - "step": 29745 - }, - { - "epoch": 0.83, - "learning_rate": 1.7985673107109222e-06, - "loss": 0.3507, - "step": 29750 - }, - { - "epoch": 0.83, - "learning_rate": 1.797140329347299e-06, - "loss": 0.1368, - "step": 29755 - }, - { - "epoch": 0.83, - "learning_rate": 1.7957133479836755e-06, - "loss": 0.1215, - "step": 29760 - }, - { - "epoch": 0.83, - "learning_rate": 1.7942863666200523e-06, - "loss": 0.1801, - "step": 29765 - }, - { - "epoch": 0.83, - "learning_rate": 1.7928593852564288e-06, - "loss": 0.1228, - "step": 29770 - }, - { - "epoch": 0.83, - "learning_rate": 1.7914324038928052e-06, - "loss": 0.0795, - "step": 29775 - }, - { - "epoch": 0.83, - "learning_rate": 1.790005422529182e-06, - "loss": 0.0496, - "step": 29780 - }, - { - "epoch": 0.83, - "learning_rate": 1.7885784411655585e-06, - "loss": 0.141, - "step": 29785 - }, - { - "epoch": 0.83, - "learning_rate": 1.7871514598019352e-06, - "loss": 0.1736, - "step": 29790 - }, - { - "epoch": 0.83, - "learning_rate": 1.7857244784383118e-06, - "loss": 0.163, - "step": 29795 - }, - { - "epoch": 0.83, - "learning_rate": 1.7842974970746885e-06, - "loss": 0.1673, - "step": 29800 - }, - { - "epoch": 0.83, - "learning_rate": 1.7828705157110649e-06, - "loss": 0.1442, - "step": 29805 - }, - { - "epoch": 0.83, - "learning_rate": 1.7814435343474414e-06, - "loss": 0.1148, - "step": 29810 - }, - { - "epoch": 0.83, - "learning_rate": 1.7800165529838182e-06, - "loss": 0.1531, - "step": 29815 - }, - { - "epoch": 0.83, - "learning_rate": 1.7785895716201947e-06, - "loss": 0.1766, - "step": 29820 - }, - { - "epoch": 0.83, - "learning_rate": 1.7771625902565715e-06, - "loss": 0.1422, - "step": 29825 - }, - { - "epoch": 0.83, - "learning_rate": 1.775735608892948e-06, - "loss": 0.0921, - "step": 29830 - }, - { - "epoch": 0.83, - "learning_rate": 1.7743086275293244e-06, - "loss": 0.0602, - "step": 29835 - }, - { - "epoch": 0.83, - "learning_rate": 1.7728816461657012e-06, - "loss": 0.1568, - "step": 29840 - }, - { - "epoch": 0.83, - "learning_rate": 1.7714546648020777e-06, - "loss": 0.2646, - "step": 29845 - }, - { - "epoch": 0.83, - "learning_rate": 1.7700276834384545e-06, - "loss": 0.37, - "step": 29850 - }, - { - "epoch": 0.83, - "learning_rate": 1.768600702074831e-06, - "loss": 0.1707, - "step": 29855 - }, - { - "epoch": 0.83, - "learning_rate": 1.7671737207112078e-06, - "loss": 0.158, - "step": 29860 - }, - { - "epoch": 0.83, - "learning_rate": 1.7657467393475843e-06, - "loss": 0.1415, - "step": 29865 - }, - { - "epoch": 0.83, - "learning_rate": 1.7643197579839607e-06, - "loss": 0.195, - "step": 29870 - }, - { - "epoch": 0.83, - "learning_rate": 1.7628927766203374e-06, - "loss": 0.1228, - "step": 29875 - }, - { - "epoch": 0.83, - "learning_rate": 1.761465795256714e-06, - "loss": 0.0604, - "step": 29880 - }, - { - "epoch": 0.83, - "learning_rate": 1.7600388138930907e-06, - "loss": 0.0835, - "step": 29885 - }, - { - "epoch": 0.83, - "learning_rate": 1.7586118325294673e-06, - "loss": 0.1226, - "step": 29890 - }, - { - "epoch": 0.83, - "learning_rate": 1.757184851165844e-06, - "loss": 0.202, - "step": 29895 - }, - { - "epoch": 0.83, - "learning_rate": 1.7557578698022204e-06, - "loss": 0.2161, - "step": 29900 - }, - { - "epoch": 0.83, - "learning_rate": 1.7543308884385972e-06, - "loss": 0.0818, - "step": 29905 - }, - { - "epoch": 0.83, - "learning_rate": 1.7529039070749737e-06, - "loss": 0.1051, - "step": 29910 - }, - { - "epoch": 0.83, - "learning_rate": 1.7514769257113503e-06, - "loss": 0.1467, - "step": 29915 - }, - { - "epoch": 0.83, - "learning_rate": 1.750049944347727e-06, - "loss": 0.1323, - "step": 29920 - }, - { - "epoch": 0.83, - "learning_rate": 1.7486229629841036e-06, - "loss": 0.1149, - "step": 29925 - }, - { - "epoch": 0.83, - "learning_rate": 1.7471959816204801e-06, - "loss": 0.0566, - "step": 29930 - }, - { - "epoch": 0.83, - "learning_rate": 1.7457690002568567e-06, - "loss": 0.1111, - "step": 29935 - }, - { - "epoch": 0.83, - "learning_rate": 1.7443420188932334e-06, - "loss": 0.165, - "step": 29940 - }, - { - "epoch": 0.83, - "learning_rate": 1.74291503752961e-06, - "loss": 0.2132, - "step": 29945 - }, - { - "epoch": 0.83, - "learning_rate": 1.7414880561659867e-06, - "loss": 0.3464, - "step": 29950 - }, - { - "epoch": 0.83, - "learning_rate": 1.7400610748023633e-06, - "loss": 0.1466, - "step": 29955 - }, - { - "epoch": 0.83, - "learning_rate": 1.73863409343874e-06, - "loss": 0.1953, - "step": 29960 - }, - { - "epoch": 0.83, - "learning_rate": 1.7372071120751164e-06, - "loss": 0.174, - "step": 29965 - }, - { - "epoch": 0.83, - "learning_rate": 1.735780130711493e-06, - "loss": 0.1493, - "step": 29970 - }, - { - "epoch": 0.83, - "learning_rate": 1.7343531493478697e-06, - "loss": 0.062, - "step": 29975 - }, - { - "epoch": 0.83, - "learning_rate": 1.7329261679842463e-06, - "loss": 0.0588, - "step": 29980 - }, - { - "epoch": 0.83, - "learning_rate": 1.731499186620623e-06, - "loss": 0.084, - "step": 29985 - }, - { - "epoch": 0.83, - "learning_rate": 1.7300722052569996e-06, - "loss": 0.1432, - "step": 29990 - }, - { - "epoch": 0.83, - "learning_rate": 1.728645223893376e-06, - "loss": 0.14, - "step": 29995 - }, - { - "epoch": 0.83, - "learning_rate": 1.7272182425297527e-06, - "loss": 0.6414, - "step": 30000 - }, - { - "epoch": 0.83, - "eval_loss": 0.05838534235954285, - "eval_runtime": 1928.5758, - "eval_samples_per_second": 8.306, - "eval_steps_per_second": 2.077, - "eval_wer": 0.16357735304724125, - "step": 30000 - }, - { - "epoch": 0.83, - "learning_rate": 1.7257912611661292e-06, - "loss": 0.1612, - "step": 30005 - }, - { - "epoch": 0.83, - "learning_rate": 1.724364279802506e-06, - "loss": 0.1507, - "step": 30010 - }, - { - "epoch": 0.83, - "learning_rate": 1.7229372984388825e-06, - "loss": 0.1451, - "step": 30015 - }, - { - "epoch": 0.83, - "learning_rate": 1.7215103170752593e-06, - "loss": 0.1457, - "step": 30020 - }, - { - "epoch": 0.83, - "learning_rate": 1.7200833357116359e-06, - "loss": 0.1106, - "step": 30025 - }, - { - "epoch": 0.83, - "learning_rate": 1.7186563543480122e-06, - "loss": 0.1255, - "step": 30030 - }, - { - "epoch": 0.83, - "learning_rate": 1.717229372984389e-06, - "loss": 0.061, - "step": 30035 - }, - { - "epoch": 0.83, - "learning_rate": 1.7158023916207655e-06, - "loss": 0.1902, - "step": 30040 - }, - { - "epoch": 0.83, - "learning_rate": 1.7143754102571423e-06, - "loss": 0.1521, - "step": 30045 - }, - { - "epoch": 0.83, - "learning_rate": 1.7129484288935188e-06, - "loss": 0.3394, - "step": 30050 - }, - { - "epoch": 0.83, - "learning_rate": 1.7115214475298956e-06, - "loss": 0.1139, - "step": 30055 - }, - { - "epoch": 0.83, - "learning_rate": 1.710094466166272e-06, - "loss": 0.1206, - "step": 30060 - }, - { - "epoch": 0.83, - "learning_rate": 1.7086674848026485e-06, - "loss": 0.163, - "step": 30065 - }, - { - "epoch": 0.83, - "learning_rate": 1.7072405034390252e-06, - "loss": 0.1296, - "step": 30070 - }, - { - "epoch": 0.83, - "learning_rate": 1.7058135220754018e-06, - "loss": 0.0688, - "step": 30075 - }, - { - "epoch": 0.83, - "learning_rate": 1.7043865407117785e-06, - "loss": 0.2041, - "step": 30080 - }, - { - "epoch": 0.83, - "learning_rate": 1.702959559348155e-06, - "loss": 0.1542, - "step": 30085 - }, - { - "epoch": 0.83, - "learning_rate": 1.7015325779845314e-06, - "loss": 0.0918, - "step": 30090 - }, - { - "epoch": 0.84, - "learning_rate": 1.7001055966209082e-06, - "loss": 0.1101, - "step": 30095 - }, - { - "epoch": 0.84, - "learning_rate": 1.6986786152572847e-06, - "loss": 0.5718, - "step": 30100 - }, - { - "epoch": 0.84, - "learning_rate": 1.6972516338936615e-06, - "loss": 0.141, - "step": 30105 - }, - { - "epoch": 0.84, - "learning_rate": 1.695824652530038e-06, - "loss": 0.1428, - "step": 30110 - }, - { - "epoch": 0.84, - "learning_rate": 1.6943976711664148e-06, - "loss": 0.1814, - "step": 30115 - }, - { - "epoch": 0.84, - "learning_rate": 1.6929706898027914e-06, - "loss": 0.1347, - "step": 30120 - }, - { - "epoch": 0.84, - "learning_rate": 1.691543708439168e-06, - "loss": 0.0723, - "step": 30125 - }, - { - "epoch": 0.84, - "learning_rate": 1.6901167270755445e-06, - "loss": 0.1598, - "step": 30130 - }, - { - "epoch": 0.84, - "learning_rate": 1.6886897457119212e-06, - "loss": 0.1219, - "step": 30135 - }, - { - "epoch": 0.84, - "learning_rate": 1.6872627643482978e-06, - "loss": 0.2055, - "step": 30140 - }, - { - "epoch": 0.84, - "learning_rate": 1.6858357829846743e-06, - "loss": 0.2999, - "step": 30145 - }, - { - "epoch": 0.84, - "learning_rate": 1.684408801621051e-06, - "loss": 0.5244, - "step": 30150 - }, - { - "epoch": 0.84, - "learning_rate": 1.6829818202574274e-06, - "loss": 0.2096, - "step": 30155 - }, - { - "epoch": 0.84, - "learning_rate": 1.6815548388938042e-06, - "loss": 0.1008, - "step": 30160 - }, - { - "epoch": 0.84, - "learning_rate": 1.6801278575301807e-06, - "loss": 0.1061, - "step": 30165 - }, - { - "epoch": 0.84, - "learning_rate": 1.6787008761665575e-06, - "loss": 0.14, - "step": 30170 - }, - { - "epoch": 0.84, - "learning_rate": 1.677273894802934e-06, - "loss": 0.1069, - "step": 30175 - }, - { - "epoch": 0.84, - "learning_rate": 1.6758469134393108e-06, - "loss": 0.0708, - "step": 30180 - }, - { - "epoch": 0.84, - "learning_rate": 1.6744199320756872e-06, - "loss": 0.0701, - "step": 30185 - }, - { - "epoch": 0.84, - "learning_rate": 1.6729929507120637e-06, - "loss": 0.1315, - "step": 30190 - }, - { - "epoch": 0.84, - "learning_rate": 1.6715659693484405e-06, - "loss": 0.2271, - "step": 30195 - }, - { - "epoch": 0.84, - "learning_rate": 1.670138987984817e-06, - "loss": 0.5044, - "step": 30200 - }, - { - "epoch": 0.84, - "learning_rate": 1.6687120066211938e-06, - "loss": 0.1734, - "step": 30205 - }, - { - "epoch": 0.84, - "learning_rate": 1.6672850252575703e-06, - "loss": 0.0858, - "step": 30210 - }, - { - "epoch": 0.84, - "learning_rate": 1.665858043893947e-06, - "loss": 0.1001, - "step": 30215 - }, - { - "epoch": 0.84, - "learning_rate": 1.6644310625303234e-06, - "loss": 0.1547, - "step": 30220 - }, - { - "epoch": 0.84, - "learning_rate": 1.6630040811667e-06, - "loss": 0.1222, - "step": 30225 - }, - { - "epoch": 0.84, - "learning_rate": 1.6615770998030767e-06, - "loss": 0.0436, - "step": 30230 - }, - { - "epoch": 0.84, - "learning_rate": 1.6601501184394533e-06, - "loss": 0.0757, - "step": 30235 - }, - { - "epoch": 0.84, - "learning_rate": 1.65872313707583e-06, - "loss": 0.2041, - "step": 30240 - }, - { - "epoch": 0.84, - "learning_rate": 1.6572961557122066e-06, - "loss": 0.2425, - "step": 30245 - }, - { - "epoch": 0.84, - "learning_rate": 1.655869174348583e-06, - "loss": 0.3683, - "step": 30250 - }, - { - "epoch": 0.84, - "learning_rate": 1.6544421929849597e-06, - "loss": 0.0863, - "step": 30255 - }, - { - "epoch": 0.84, - "learning_rate": 1.6530152116213363e-06, - "loss": 0.1347, - "step": 30260 - }, - { - "epoch": 0.84, - "learning_rate": 1.651588230257713e-06, - "loss": 0.1001, - "step": 30265 - }, - { - "epoch": 0.84, - "learning_rate": 1.6501612488940896e-06, - "loss": 0.098, - "step": 30270 - }, - { - "epoch": 0.84, - "learning_rate": 1.6487342675304663e-06, - "loss": 0.0426, - "step": 30275 - }, - { - "epoch": 0.84, - "learning_rate": 1.6473072861668429e-06, - "loss": 0.0671, - "step": 30280 - }, - { - "epoch": 0.84, - "learning_rate": 1.6458803048032192e-06, - "loss": 0.2194, - "step": 30285 - }, - { - "epoch": 0.84, - "learning_rate": 1.644453323439596e-06, - "loss": 0.0606, - "step": 30290 - }, - { - "epoch": 0.84, - "learning_rate": 1.6430263420759725e-06, - "loss": 0.1529, - "step": 30295 - }, - { - "epoch": 0.84, - "learning_rate": 1.6415993607123493e-06, - "loss": 0.3677, - "step": 30300 - }, - { - "epoch": 0.84, - "learning_rate": 1.6401723793487258e-06, - "loss": 0.0818, - "step": 30305 - }, - { - "epoch": 0.84, - "learning_rate": 1.6387453979851026e-06, - "loss": 0.0956, - "step": 30310 - }, - { - "epoch": 0.84, - "learning_rate": 1.637318416621479e-06, - "loss": 0.1368, - "step": 30315 - }, - { - "epoch": 0.84, - "learning_rate": 1.6358914352578555e-06, - "loss": 0.1383, - "step": 30320 - }, - { - "epoch": 0.84, - "learning_rate": 1.6344644538942323e-06, - "loss": 0.1168, - "step": 30325 - }, - { - "epoch": 0.84, - "learning_rate": 1.6330374725306088e-06, - "loss": 0.109, - "step": 30330 - }, - { - "epoch": 0.84, - "learning_rate": 1.6316104911669856e-06, - "loss": 0.3013, - "step": 30335 - }, - { - "epoch": 0.84, - "learning_rate": 1.6301835098033621e-06, - "loss": 0.3281, - "step": 30340 - }, - { - "epoch": 0.84, - "learning_rate": 1.6287565284397387e-06, - "loss": 0.2898, - "step": 30345 - }, - { - "epoch": 0.84, - "learning_rate": 1.6273295470761152e-06, - "loss": 0.383, - "step": 30350 - }, - { - "epoch": 0.84, - "learning_rate": 1.625902565712492e-06, - "loss": 0.1322, - "step": 30355 - }, - { - "epoch": 0.84, - "learning_rate": 1.6244755843488685e-06, - "loss": 0.1253, - "step": 30360 - }, - { - "epoch": 0.84, - "learning_rate": 1.623048602985245e-06, - "loss": 0.1888, - "step": 30365 - }, - { - "epoch": 0.84, - "learning_rate": 1.6216216216216219e-06, - "loss": 0.1797, - "step": 30370 - }, - { - "epoch": 0.84, - "learning_rate": 1.6201946402579984e-06, - "loss": 0.0675, - "step": 30375 - }, - { - "epoch": 0.84, - "learning_rate": 1.618767658894375e-06, - "loss": 0.2116, - "step": 30380 - }, - { - "epoch": 0.84, - "learning_rate": 1.6173406775307515e-06, - "loss": 0.1694, - "step": 30385 - }, - { - "epoch": 0.84, - "learning_rate": 1.6159136961671283e-06, - "loss": 0.2422, - "step": 30390 - }, - { - "epoch": 0.84, - "learning_rate": 1.6144867148035048e-06, - "loss": 0.1664, - "step": 30395 - }, - { - "epoch": 0.84, - "learning_rate": 1.6130597334398816e-06, - "loss": 0.2869, - "step": 30400 - }, - { - "epoch": 0.84, - "learning_rate": 1.6116327520762581e-06, - "loss": 0.1527, - "step": 30405 - }, - { - "epoch": 0.84, - "learning_rate": 1.6102057707126345e-06, - "loss": 0.1121, - "step": 30410 - }, - { - "epoch": 0.84, - "learning_rate": 1.6087787893490112e-06, - "loss": 0.1529, - "step": 30415 - }, - { - "epoch": 0.84, - "learning_rate": 1.6073518079853878e-06, - "loss": 0.1104, - "step": 30420 - }, - { - "epoch": 0.84, - "learning_rate": 1.6059248266217645e-06, - "loss": 0.0833, - "step": 30425 - }, - { - "epoch": 0.84, - "learning_rate": 1.604497845258141e-06, - "loss": 0.1159, - "step": 30430 - }, - { - "epoch": 0.84, - "learning_rate": 1.6030708638945179e-06, - "loss": 0.042, - "step": 30435 - }, - { - "epoch": 0.84, - "learning_rate": 1.6016438825308942e-06, - "loss": 0.2316, - "step": 30440 - }, - { - "epoch": 0.84, - "learning_rate": 1.6002169011672707e-06, - "loss": 0.2693, - "step": 30445 - }, - { - "epoch": 0.84, - "learning_rate": 1.5987899198036475e-06, - "loss": 0.439, - "step": 30450 - }, - { - "epoch": 0.85, - "learning_rate": 1.597362938440024e-06, - "loss": 0.1224, - "step": 30455 - }, - { - "epoch": 0.85, - "learning_rate": 1.5959359570764008e-06, - "loss": 0.1079, - "step": 30460 - }, - { - "epoch": 0.85, - "learning_rate": 1.5945089757127774e-06, - "loss": 0.2648, - "step": 30465 - }, - { - "epoch": 0.85, - "learning_rate": 1.5930819943491541e-06, - "loss": 0.1247, - "step": 30470 - }, - { - "epoch": 0.85, - "learning_rate": 1.5916550129855305e-06, - "loss": 0.1804, - "step": 30475 - }, - { - "epoch": 0.85, - "learning_rate": 1.590228031621907e-06, - "loss": 0.0743, - "step": 30480 - }, - { - "epoch": 0.85, - "learning_rate": 1.5888010502582838e-06, - "loss": 0.0926, - "step": 30485 - }, - { - "epoch": 0.85, - "learning_rate": 1.5873740688946603e-06, - "loss": 0.117, - "step": 30490 - }, - { - "epoch": 0.85, - "learning_rate": 1.585947087531037e-06, - "loss": 0.1502, - "step": 30495 - }, - { - "epoch": 0.85, - "learning_rate": 1.5845201061674136e-06, - "loss": 0.6149, - "step": 30500 - }, - { - "epoch": 0.85, - "learning_rate": 1.58309312480379e-06, - "loss": 0.1727, - "step": 30505 - }, - { - "epoch": 0.85, - "learning_rate": 1.5816661434401667e-06, - "loss": 0.118, - "step": 30510 - }, - { - "epoch": 0.85, - "learning_rate": 1.5802391620765433e-06, - "loss": 0.1302, - "step": 30515 - }, - { - "epoch": 0.85, - "learning_rate": 1.57881218071292e-06, - "loss": 0.2098, - "step": 30520 - }, - { - "epoch": 0.85, - "learning_rate": 1.5773851993492966e-06, - "loss": 0.115, - "step": 30525 - }, - { - "epoch": 0.85, - "learning_rate": 1.5759582179856734e-06, - "loss": 0.0751, - "step": 30530 - }, - { - "epoch": 0.85, - "learning_rate": 1.5745312366220497e-06, - "loss": 0.1084, - "step": 30535 - }, - { - "epoch": 0.85, - "learning_rate": 1.5731042552584263e-06, - "loss": 0.1145, - "step": 30540 - }, - { - "epoch": 0.85, - "learning_rate": 1.571677273894803e-06, - "loss": 0.1338, - "step": 30545 - }, - { - "epoch": 0.85, - "learning_rate": 1.5702502925311796e-06, - "loss": 0.4143, - "step": 30550 - }, - { - "epoch": 0.85, - "learning_rate": 1.5688233111675563e-06, - "loss": 0.08, - "step": 30555 - }, - { - "epoch": 0.85, - "learning_rate": 1.5673963298039329e-06, - "loss": 0.1183, - "step": 30560 - }, - { - "epoch": 0.85, - "learning_rate": 1.5659693484403096e-06, - "loss": 0.1822, - "step": 30565 - }, - { - "epoch": 0.85, - "learning_rate": 1.564542367076686e-06, - "loss": 0.1639, - "step": 30570 - }, - { - "epoch": 0.85, - "learning_rate": 1.5631153857130627e-06, - "loss": 0.0777, - "step": 30575 - }, - { - "epoch": 0.85, - "learning_rate": 1.5616884043494393e-06, - "loss": 0.094, - "step": 30580 - }, - { - "epoch": 0.85, - "learning_rate": 1.560261422985816e-06, - "loss": 0.0695, - "step": 30585 - }, - { - "epoch": 0.85, - "learning_rate": 1.5588344416221926e-06, - "loss": 0.1541, - "step": 30590 - }, - { - "epoch": 0.85, - "learning_rate": 1.5574074602585692e-06, - "loss": 0.1856, - "step": 30595 - }, - { - "epoch": 0.85, - "learning_rate": 1.5559804788949457e-06, - "loss": 0.6199, - "step": 30600 - }, - { - "epoch": 0.85, - "learning_rate": 1.5545534975313223e-06, - "loss": 0.1189, - "step": 30605 - }, - { - "epoch": 0.85, - "learning_rate": 1.553126516167699e-06, - "loss": 0.1934, - "step": 30610 - }, - { - "epoch": 0.85, - "learning_rate": 1.5516995348040756e-06, - "loss": 0.2187, - "step": 30615 - }, - { - "epoch": 0.85, - "learning_rate": 1.5502725534404523e-06, - "loss": 0.122, - "step": 30620 - }, - { - "epoch": 0.85, - "learning_rate": 1.5488455720768289e-06, - "loss": 0.1632, - "step": 30625 - }, - { - "epoch": 0.85, - "learning_rate": 1.5474185907132056e-06, - "loss": 0.0978, - "step": 30630 - }, - { - "epoch": 0.85, - "learning_rate": 1.545991609349582e-06, - "loss": 0.1313, - "step": 30635 - }, - { - "epoch": 0.85, - "learning_rate": 1.5445646279859585e-06, - "loss": 0.1484, - "step": 30640 - }, - { - "epoch": 0.85, - "learning_rate": 1.5431376466223353e-06, - "loss": 0.089, - "step": 30645 - }, - { - "epoch": 0.85, - "learning_rate": 1.5417106652587119e-06, - "loss": 0.2633, - "step": 30650 - }, - { - "epoch": 0.85, - "learning_rate": 1.5402836838950886e-06, - "loss": 0.1022, - "step": 30655 - }, - { - "epoch": 0.85, - "learning_rate": 1.5388567025314652e-06, - "loss": 0.1222, - "step": 30660 - }, - { - "epoch": 0.85, - "learning_rate": 1.5374297211678415e-06, - "loss": 0.1354, - "step": 30665 - }, - { - "epoch": 0.85, - "learning_rate": 1.5360027398042183e-06, - "loss": 0.1546, - "step": 30670 - }, - { - "epoch": 0.85, - "learning_rate": 1.5345757584405948e-06, - "loss": 0.0776, - "step": 30675 - }, - { - "epoch": 0.85, - "learning_rate": 1.5331487770769716e-06, - "loss": 0.1215, - "step": 30680 - }, - { - "epoch": 0.85, - "learning_rate": 1.5317217957133481e-06, - "loss": 0.0722, - "step": 30685 - }, - { - "epoch": 0.85, - "learning_rate": 1.5302948143497249e-06, - "loss": 0.2274, - "step": 30690 - }, - { - "epoch": 0.85, - "learning_rate": 1.5288678329861012e-06, - "loss": 0.4315, - "step": 30695 - }, - { - "epoch": 0.85, - "learning_rate": 1.5274408516224778e-06, - "loss": 0.4468, - "step": 30700 - }, - { - "epoch": 0.85, - "learning_rate": 1.5260138702588545e-06, - "loss": 0.1523, - "step": 30705 - }, - { - "epoch": 0.85, - "learning_rate": 1.524586888895231e-06, - "loss": 0.172, - "step": 30710 - }, - { - "epoch": 0.85, - "learning_rate": 1.5231599075316079e-06, - "loss": 0.1838, - "step": 30715 - }, - { - "epoch": 0.85, - "learning_rate": 1.5217329261679844e-06, - "loss": 0.154, - "step": 30720 - }, - { - "epoch": 0.85, - "learning_rate": 1.5203059448043612e-06, - "loss": 0.0943, - "step": 30725 - }, - { - "epoch": 0.85, - "learning_rate": 1.5188789634407375e-06, - "loss": 0.1492, - "step": 30730 - }, - { - "epoch": 0.85, - "learning_rate": 1.517451982077114e-06, - "loss": 0.1907, - "step": 30735 - }, - { - "epoch": 0.85, - "learning_rate": 1.5160250007134908e-06, - "loss": 0.1713, - "step": 30740 - }, - { - "epoch": 0.85, - "learning_rate": 1.5145980193498674e-06, - "loss": 0.2305, - "step": 30745 - }, - { - "epoch": 0.85, - "learning_rate": 1.5131710379862441e-06, - "loss": 0.3482, - "step": 30750 - }, - { - "epoch": 0.85, - "learning_rate": 1.5117440566226207e-06, - "loss": 0.0889, - "step": 30755 - }, - { - "epoch": 0.85, - "learning_rate": 1.510317075258997e-06, - "loss": 0.1548, - "step": 30760 - }, - { - "epoch": 0.85, - "learning_rate": 1.5088900938953738e-06, - "loss": 0.1263, - "step": 30765 - }, - { - "epoch": 0.85, - "learning_rate": 1.5074631125317503e-06, - "loss": 0.2411, - "step": 30770 - }, - { - "epoch": 0.85, - "learning_rate": 1.506036131168127e-06, - "loss": 0.0851, - "step": 30775 - }, - { - "epoch": 0.85, - "learning_rate": 1.5046091498045036e-06, - "loss": 0.0612, - "step": 30780 - }, - { - "epoch": 0.85, - "learning_rate": 1.5031821684408804e-06, - "loss": 0.1413, - "step": 30785 - }, - { - "epoch": 0.85, - "learning_rate": 1.5017551870772567e-06, - "loss": 0.1998, - "step": 30790 - }, - { - "epoch": 0.85, - "learning_rate": 1.5003282057136335e-06, - "loss": 0.2209, - "step": 30795 - }, - { - "epoch": 0.85, - "learning_rate": 1.49890122435001e-06, - "loss": 0.4875, - "step": 30800 - }, - { - "epoch": 0.85, - "learning_rate": 1.4974742429863868e-06, - "loss": 0.1209, - "step": 30805 - }, - { - "epoch": 0.85, - "learning_rate": 1.4960472616227634e-06, - "loss": 0.1503, - "step": 30810 - }, - { - "epoch": 0.86, - "learning_rate": 1.49462028025914e-06, - "loss": 0.1309, - "step": 30815 - }, - { - "epoch": 0.86, - "learning_rate": 1.4931932988955167e-06, - "loss": 0.1346, - "step": 30820 - }, - { - "epoch": 0.86, - "learning_rate": 1.491766317531893e-06, - "loss": 0.2226, - "step": 30825 - }, - { - "epoch": 0.86, - "learning_rate": 1.4903393361682698e-06, - "loss": 0.0535, - "step": 30830 - }, - { - "epoch": 0.86, - "learning_rate": 1.4889123548046463e-06, - "loss": 0.0537, - "step": 30835 - }, - { - "epoch": 0.86, - "learning_rate": 1.487485373441023e-06, - "loss": 0.0843, - "step": 30840 - }, - { - "epoch": 0.86, - "learning_rate": 1.4860583920773996e-06, - "loss": 0.2167, - "step": 30845 - }, - { - "epoch": 0.86, - "learning_rate": 1.4846314107137764e-06, - "loss": 0.5243, - "step": 30850 - }, - { - "epoch": 0.86, - "learning_rate": 1.4832044293501527e-06, - "loss": 0.1337, - "step": 30855 - }, - { - "epoch": 0.86, - "learning_rate": 1.4817774479865293e-06, - "loss": 0.2129, - "step": 30860 - }, - { - "epoch": 0.86, - "learning_rate": 1.480350466622906e-06, - "loss": 0.1939, - "step": 30865 - }, - { - "epoch": 0.86, - "learning_rate": 1.4789234852592826e-06, - "loss": 0.1159, - "step": 30870 - }, - { - "epoch": 0.86, - "learning_rate": 1.4774965038956594e-06, - "loss": 0.1603, - "step": 30875 - }, - { - "epoch": 0.86, - "learning_rate": 1.476069522532036e-06, - "loss": 0.0404, - "step": 30880 - }, - { - "epoch": 0.86, - "learning_rate": 1.4746425411684123e-06, - "loss": 0.0998, - "step": 30885 - }, - { - "epoch": 0.86, - "learning_rate": 1.473215559804789e-06, - "loss": 0.2034, - "step": 30890 - }, - { - "epoch": 0.86, - "learning_rate": 1.4717885784411656e-06, - "loss": 0.1779, - "step": 30895 - }, - { - "epoch": 0.86, - "learning_rate": 1.4703615970775423e-06, - "loss": 0.3657, - "step": 30900 - }, - { - "epoch": 0.86, - "learning_rate": 1.4689346157139189e-06, - "loss": 0.1614, - "step": 30905 - }, - { - "epoch": 0.86, - "learning_rate": 1.4675076343502956e-06, - "loss": 0.1086, - "step": 30910 - }, - { - "epoch": 0.86, - "learning_rate": 1.4660806529866722e-06, - "loss": 0.133, - "step": 30915 - }, - { - "epoch": 0.86, - "learning_rate": 1.4646536716230485e-06, - "loss": 0.1572, - "step": 30920 - }, - { - "epoch": 0.86, - "learning_rate": 1.4632266902594253e-06, - "loss": 0.1444, - "step": 30925 - }, - { - "epoch": 0.86, - "learning_rate": 1.4617997088958018e-06, - "loss": 0.0483, - "step": 30930 - }, - { - "epoch": 0.86, - "learning_rate": 1.4603727275321786e-06, - "loss": 0.1232, - "step": 30935 - }, - { - "epoch": 0.86, - "learning_rate": 1.4589457461685552e-06, - "loss": 0.0518, - "step": 30940 - }, - { - "epoch": 0.86, - "learning_rate": 1.457518764804932e-06, - "loss": 0.1726, - "step": 30945 - }, - { - "epoch": 0.86, - "learning_rate": 1.4560917834413083e-06, - "loss": 0.2552, - "step": 30950 - }, - { - "epoch": 0.86, - "learning_rate": 1.4546648020776848e-06, - "loss": 0.0978, - "step": 30955 - }, - { - "epoch": 0.86, - "learning_rate": 1.4532378207140616e-06, - "loss": 0.1388, - "step": 30960 - }, - { - "epoch": 0.86, - "learning_rate": 1.4518108393504381e-06, - "loss": 0.1976, - "step": 30965 - }, - { - "epoch": 0.86, - "learning_rate": 1.4503838579868149e-06, - "loss": 0.1231, - "step": 30970 - }, - { - "epoch": 0.86, - "learning_rate": 1.4489568766231914e-06, - "loss": 0.1281, - "step": 30975 - }, - { - "epoch": 0.86, - "learning_rate": 1.4475298952595682e-06, - "loss": 0.0442, - "step": 30980 - }, - { - "epoch": 0.86, - "learning_rate": 1.4461029138959445e-06, - "loss": 0.1627, - "step": 30985 - }, - { - "epoch": 0.86, - "learning_rate": 1.444675932532321e-06, - "loss": 0.2215, - "step": 30990 - }, - { - "epoch": 0.86, - "learning_rate": 1.4432489511686979e-06, - "loss": 0.1335, - "step": 30995 - }, - { - "epoch": 0.86, - "learning_rate": 1.4418219698050744e-06, - "loss": 0.5371, - "step": 31000 - }, - { - "epoch": 0.86, - "learning_rate": 1.4403949884414512e-06, - "loss": 0.1816, - "step": 31005 - }, - { - "epoch": 0.86, - "learning_rate": 1.4389680070778277e-06, - "loss": 0.143, - "step": 31010 - }, - { - "epoch": 0.86, - "learning_rate": 1.4375410257142043e-06, - "loss": 0.153, - "step": 31015 - }, - { - "epoch": 0.86, - "learning_rate": 1.4361140443505808e-06, - "loss": 0.16, - "step": 31020 - }, - { - "epoch": 0.86, - "learning_rate": 1.4346870629869576e-06, - "loss": 0.066, - "step": 31025 - }, - { - "epoch": 0.86, - "learning_rate": 1.4332600816233341e-06, - "loss": 0.0365, - "step": 31030 - }, - { - "epoch": 0.86, - "learning_rate": 1.4318331002597109e-06, - "loss": 0.0748, - "step": 31035 - }, - { - "epoch": 0.86, - "learning_rate": 1.4304061188960874e-06, - "loss": 0.1075, - "step": 31040 - }, - { - "epoch": 0.86, - "learning_rate": 1.4289791375324638e-06, - "loss": 0.2343, - "step": 31045 - }, - { - "epoch": 0.86, - "learning_rate": 1.4275521561688405e-06, - "loss": 0.2463, - "step": 31050 - }, - { - "epoch": 0.86, - "learning_rate": 1.426125174805217e-06, - "loss": 0.1182, - "step": 31055 - }, - { - "epoch": 0.86, - "learning_rate": 1.4246981934415939e-06, - "loss": 0.1763, - "step": 31060 - }, - { - "epoch": 0.86, - "learning_rate": 1.4232712120779704e-06, - "loss": 0.1413, - "step": 31065 - }, - { - "epoch": 0.86, - "learning_rate": 1.4218442307143472e-06, - "loss": 0.1772, - "step": 31070 - }, - { - "epoch": 0.86, - "learning_rate": 1.4204172493507237e-06, - "loss": 0.067, - "step": 31075 - }, - { - "epoch": 0.86, - "learning_rate": 1.4189902679871e-06, - "loss": 0.1534, - "step": 31080 - }, - { - "epoch": 0.86, - "learning_rate": 1.4175632866234768e-06, - "loss": 0.1724, - "step": 31085 - }, - { - "epoch": 0.86, - "learning_rate": 1.4161363052598534e-06, - "loss": 0.2235, - "step": 31090 - }, - { - "epoch": 0.86, - "learning_rate": 1.4147093238962301e-06, - "loss": 0.1799, - "step": 31095 - }, - { - "epoch": 0.86, - "learning_rate": 1.4132823425326067e-06, - "loss": 0.4721, - "step": 31100 - }, - { - "epoch": 0.86, - "learning_rate": 1.4118553611689834e-06, - "loss": 0.1463, - "step": 31105 - }, - { - "epoch": 0.86, - "learning_rate": 1.4104283798053598e-06, - "loss": 0.1202, - "step": 31110 - }, - { - "epoch": 0.86, - "learning_rate": 1.4090013984417363e-06, - "loss": 0.1882, - "step": 31115 - }, - { - "epoch": 0.86, - "learning_rate": 1.407574417078113e-06, - "loss": 0.2152, - "step": 31120 - }, - { - "epoch": 0.86, - "learning_rate": 1.4061474357144896e-06, - "loss": 0.1173, - "step": 31125 - }, - { - "epoch": 0.86, - "learning_rate": 1.4047204543508664e-06, - "loss": 0.1154, - "step": 31130 - }, - { - "epoch": 0.86, - "learning_rate": 1.403293472987243e-06, - "loss": 0.0957, - "step": 31135 - }, - { - "epoch": 0.86, - "learning_rate": 1.4018664916236193e-06, - "loss": 0.0875, - "step": 31140 - }, - { - "epoch": 0.86, - "learning_rate": 1.400439510259996e-06, - "loss": 0.2762, - "step": 31145 - }, - { - "epoch": 0.86, - "learning_rate": 1.3990125288963726e-06, - "loss": 0.232, - "step": 31150 - }, - { - "epoch": 0.86, - "learning_rate": 1.3975855475327494e-06, - "loss": 0.0594, - "step": 31155 - }, - { - "epoch": 0.86, - "learning_rate": 1.396158566169126e-06, - "loss": 0.1108, - "step": 31160 - }, - { - "epoch": 0.86, - "learning_rate": 1.3947315848055027e-06, - "loss": 0.1318, - "step": 31165 - }, - { - "epoch": 0.86, - "learning_rate": 1.3933046034418792e-06, - "loss": 0.1815, - "step": 31170 - }, - { - "epoch": 0.87, - "learning_rate": 1.3918776220782556e-06, - "loss": 0.1016, - "step": 31175 - }, - { - "epoch": 0.87, - "learning_rate": 1.3904506407146323e-06, - "loss": 0.0792, - "step": 31180 - }, - { - "epoch": 0.87, - "learning_rate": 1.3890236593510089e-06, - "loss": 0.1084, - "step": 31185 - }, - { - "epoch": 0.87, - "learning_rate": 1.3875966779873856e-06, - "loss": 0.1061, - "step": 31190 - }, - { - "epoch": 0.87, - "learning_rate": 1.3861696966237622e-06, - "loss": 0.251, - "step": 31195 - }, - { - "epoch": 0.87, - "learning_rate": 1.384742715260139e-06, - "loss": 0.4001, - "step": 31200 - }, - { - "epoch": 0.87, - "learning_rate": 1.3833157338965153e-06, - "loss": 0.1066, - "step": 31205 - }, - { - "epoch": 0.87, - "learning_rate": 1.3818887525328918e-06, - "loss": 0.1573, - "step": 31210 - }, - { - "epoch": 0.87, - "learning_rate": 1.3804617711692686e-06, - "loss": 0.1168, - "step": 31215 - }, - { - "epoch": 0.87, - "learning_rate": 1.3790347898056452e-06, - "loss": 0.1735, - "step": 31220 - }, - { - "epoch": 0.87, - "learning_rate": 1.377607808442022e-06, - "loss": 0.0906, - "step": 31225 - }, - { - "epoch": 0.87, - "learning_rate": 1.3761808270783985e-06, - "loss": 0.0829, - "step": 31230 - }, - { - "epoch": 0.87, - "learning_rate": 1.3747538457147752e-06, - "loss": 0.0907, - "step": 31235 - }, - { - "epoch": 0.87, - "learning_rate": 1.3733268643511516e-06, - "loss": 0.1583, - "step": 31240 - }, - { - "epoch": 0.87, - "learning_rate": 1.3718998829875283e-06, - "loss": 0.1788, - "step": 31245 - }, - { - "epoch": 0.87, - "learning_rate": 1.3704729016239049e-06, - "loss": 0.3387, - "step": 31250 - }, - { - "epoch": 0.87, - "learning_rate": 1.3690459202602816e-06, - "loss": 0.1139, - "step": 31255 - }, - { - "epoch": 0.87, - "learning_rate": 1.3676189388966582e-06, - "loss": 0.1146, - "step": 31260 - }, - { - "epoch": 0.87, - "learning_rate": 1.3661919575330347e-06, - "loss": 0.1633, - "step": 31265 - }, - { - "epoch": 0.87, - "learning_rate": 1.3647649761694113e-06, - "loss": 0.137, - "step": 31270 - }, - { - "epoch": 0.87, - "learning_rate": 1.3633379948057878e-06, - "loss": 0.1519, - "step": 31275 - }, - { - "epoch": 0.87, - "learning_rate": 1.3619110134421646e-06, - "loss": 0.1357, - "step": 31280 - }, - { - "epoch": 0.87, - "learning_rate": 1.3604840320785412e-06, - "loss": 0.1447, - "step": 31285 - }, - { - "epoch": 0.87, - "learning_rate": 1.359057050714918e-06, - "loss": 0.1816, - "step": 31290 - }, - { - "epoch": 0.87, - "learning_rate": 1.3576300693512945e-06, - "loss": 0.3118, - "step": 31295 - }, - { - "epoch": 0.87, - "learning_rate": 1.3562030879876708e-06, - "loss": 0.3088, - "step": 31300 - }, - { - "epoch": 0.87, - "learning_rate": 1.3547761066240476e-06, - "loss": 0.1523, - "step": 31305 - }, - { - "epoch": 0.87, - "learning_rate": 1.3533491252604241e-06, - "loss": 0.1324, - "step": 31310 - }, - { - "epoch": 0.87, - "learning_rate": 1.3519221438968009e-06, - "loss": 0.185, - "step": 31315 - }, - { - "epoch": 0.87, - "learning_rate": 1.3504951625331774e-06, - "loss": 0.1934, - "step": 31320 - }, - { - "epoch": 0.87, - "learning_rate": 1.3490681811695542e-06, - "loss": 0.0723, - "step": 31325 - }, - { - "epoch": 0.87, - "learning_rate": 1.3476411998059308e-06, - "loss": 0.0841, - "step": 31330 - }, - { - "epoch": 0.87, - "learning_rate": 1.346214218442307e-06, - "loss": 0.0896, - "step": 31335 - }, - { - "epoch": 0.87, - "learning_rate": 1.3447872370786839e-06, - "loss": 0.0524, - "step": 31340 - }, - { - "epoch": 0.87, - "learning_rate": 1.3433602557150604e-06, - "loss": 0.2578, - "step": 31345 - }, - { - "epoch": 0.87, - "learning_rate": 1.3419332743514372e-06, - "loss": 0.304, - "step": 31350 - }, - { - "epoch": 0.87, - "learning_rate": 1.3405062929878137e-06, - "loss": 0.1347, - "step": 31355 - }, - { - "epoch": 0.87, - "learning_rate": 1.3390793116241905e-06, - "loss": 0.0809, - "step": 31360 - }, - { - "epoch": 0.87, - "learning_rate": 1.3376523302605668e-06, - "loss": 0.1255, - "step": 31365 - }, - { - "epoch": 0.87, - "learning_rate": 1.3362253488969434e-06, - "loss": 0.1806, - "step": 31370 - }, - { - "epoch": 0.87, - "learning_rate": 1.3347983675333201e-06, - "loss": 0.1287, - "step": 31375 - }, - { - "epoch": 0.87, - "learning_rate": 1.3333713861696967e-06, - "loss": 0.0332, - "step": 31380 - }, - { - "epoch": 0.87, - "learning_rate": 1.3319444048060734e-06, - "loss": 0.0514, - "step": 31385 - }, - { - "epoch": 0.87, - "learning_rate": 1.33051742344245e-06, - "loss": 0.1219, - "step": 31390 - }, - { - "epoch": 0.87, - "learning_rate": 1.3290904420788263e-06, - "loss": 0.1158, - "step": 31395 - }, - { - "epoch": 0.87, - "learning_rate": 1.327663460715203e-06, - "loss": 0.3232, - "step": 31400 - }, - { - "epoch": 0.87, - "learning_rate": 1.3262364793515796e-06, - "loss": 0.1389, - "step": 31405 - }, - { - "epoch": 0.87, - "learning_rate": 1.3248094979879564e-06, - "loss": 0.1863, - "step": 31410 - }, - { - "epoch": 0.87, - "learning_rate": 1.323382516624333e-06, - "loss": 0.1359, - "step": 31415 - }, - { - "epoch": 0.87, - "learning_rate": 1.3219555352607097e-06, - "loss": 0.0884, - "step": 31420 - }, - { - "epoch": 0.87, - "learning_rate": 1.3205285538970863e-06, - "loss": 0.2151, - "step": 31425 - }, - { - "epoch": 0.87, - "learning_rate": 1.3191015725334628e-06, - "loss": 0.0598, - "step": 31430 - }, - { - "epoch": 0.87, - "learning_rate": 1.3176745911698394e-06, - "loss": 0.0646, - "step": 31435 - }, - { - "epoch": 0.87, - "learning_rate": 1.316247609806216e-06, - "loss": 0.166, - "step": 31440 - }, - { - "epoch": 0.87, - "learning_rate": 1.3148206284425927e-06, - "loss": 0.1687, - "step": 31445 - }, - { - "epoch": 0.87, - "learning_rate": 1.3133936470789692e-06, - "loss": 0.2897, - "step": 31450 - }, - { - "epoch": 0.87, - "learning_rate": 1.311966665715346e-06, - "loss": 0.1198, - "step": 31455 - }, - { - "epoch": 0.87, - "learning_rate": 1.3105396843517223e-06, - "loss": 0.1161, - "step": 31460 - }, - { - "epoch": 0.87, - "learning_rate": 1.309112702988099e-06, - "loss": 0.1257, - "step": 31465 - }, - { - "epoch": 0.87, - "learning_rate": 1.3076857216244756e-06, - "loss": 0.1707, - "step": 31470 - }, - { - "epoch": 0.87, - "learning_rate": 1.3062587402608524e-06, - "loss": 0.1482, - "step": 31475 - }, - { - "epoch": 0.87, - "learning_rate": 1.304831758897229e-06, - "loss": 0.1203, - "step": 31480 - }, - { - "epoch": 0.87, - "learning_rate": 1.3034047775336057e-06, - "loss": 0.1097, - "step": 31485 - }, - { - "epoch": 0.87, - "learning_rate": 1.301977796169982e-06, - "loss": 0.1457, - "step": 31490 - }, - { - "epoch": 0.87, - "learning_rate": 1.3005508148063586e-06, - "loss": 0.1297, - "step": 31495 - }, - { - "epoch": 0.87, - "learning_rate": 1.2991238334427354e-06, - "loss": 0.5984, - "step": 31500 - }, - { - "epoch": 0.87, - "learning_rate": 1.297696852079112e-06, - "loss": 0.1224, - "step": 31505 - }, - { - "epoch": 0.87, - "learning_rate": 1.2962698707154887e-06, - "loss": 0.1312, - "step": 31510 - }, - { - "epoch": 0.87, - "learning_rate": 1.2948428893518652e-06, - "loss": 0.1565, - "step": 31515 - }, - { - "epoch": 0.87, - "learning_rate": 1.293415907988242e-06, - "loss": 0.1429, - "step": 31520 - }, - { - "epoch": 0.87, - "learning_rate": 1.2919889266246183e-06, - "loss": 0.1364, - "step": 31525 - }, - { - "epoch": 0.87, - "learning_rate": 1.2905619452609949e-06, - "loss": 0.0708, - "step": 31530 - }, - { - "epoch": 0.88, - "learning_rate": 1.2891349638973716e-06, - "loss": 0.1318, - "step": 31535 - }, - { - "epoch": 0.88, - "learning_rate": 1.2877079825337482e-06, - "loss": 0.1534, - "step": 31540 - }, - { - "epoch": 0.88, - "learning_rate": 1.286281001170125e-06, - "loss": 0.218, - "step": 31545 - }, - { - "epoch": 0.88, - "learning_rate": 1.2848540198065015e-06, - "loss": 0.2157, - "step": 31550 - }, - { - "epoch": 0.88, - "learning_rate": 1.2834270384428778e-06, - "loss": 0.1351, - "step": 31555 - }, - { - "epoch": 0.88, - "learning_rate": 1.2820000570792546e-06, - "loss": 0.0787, - "step": 31560 - }, - { - "epoch": 0.88, - "learning_rate": 1.2805730757156312e-06, - "loss": 0.13, - "step": 31565 - }, - { - "epoch": 0.88, - "learning_rate": 1.279146094352008e-06, - "loss": 0.0911, - "step": 31570 - }, - { - "epoch": 0.88, - "learning_rate": 1.2777191129883845e-06, - "loss": 0.0631, - "step": 31575 - }, - { - "epoch": 0.88, - "learning_rate": 1.2762921316247612e-06, - "loss": 0.1197, - "step": 31580 - }, - { - "epoch": 0.88, - "learning_rate": 1.2748651502611378e-06, - "loss": 0.0612, - "step": 31585 - }, - { - "epoch": 0.88, - "learning_rate": 1.2734381688975141e-06, - "loss": 0.1578, - "step": 31590 - }, - { - "epoch": 0.88, - "learning_rate": 1.2720111875338909e-06, - "loss": 0.2743, - "step": 31595 - }, - { - "epoch": 0.88, - "learning_rate": 1.2705842061702674e-06, - "loss": 0.2193, - "step": 31600 - }, - { - "epoch": 0.88, - "learning_rate": 1.2691572248066442e-06, - "loss": 0.1699, - "step": 31605 - }, - { - "epoch": 0.88, - "learning_rate": 1.2677302434430207e-06, - "loss": 0.1013, - "step": 31610 - }, - { - "epoch": 0.88, - "learning_rate": 1.2663032620793975e-06, - "loss": 0.1239, - "step": 31615 - }, - { - "epoch": 0.88, - "learning_rate": 1.2648762807157738e-06, - "loss": 0.1823, - "step": 31620 - }, - { - "epoch": 0.88, - "learning_rate": 1.2634492993521504e-06, - "loss": 0.1302, - "step": 31625 - }, - { - "epoch": 0.88, - "learning_rate": 1.2620223179885272e-06, - "loss": 0.0766, - "step": 31630 - }, - { - "epoch": 0.88, - "learning_rate": 1.2605953366249037e-06, - "loss": 0.0278, - "step": 31635 - }, - { - "epoch": 0.88, - "learning_rate": 1.2591683552612805e-06, - "loss": 0.1773, - "step": 31640 - }, - { - "epoch": 0.88, - "learning_rate": 1.257741373897657e-06, - "loss": 0.1424, - "step": 31645 - }, - { - "epoch": 0.88, - "learning_rate": 1.2563143925340336e-06, - "loss": 0.2133, - "step": 31650 - }, - { - "epoch": 0.88, - "learning_rate": 1.2548874111704101e-06, - "loss": 0.1234, - "step": 31655 - }, - { - "epoch": 0.88, - "learning_rate": 1.2534604298067869e-06, - "loss": 0.1191, - "step": 31660 - }, - { - "epoch": 0.88, - "learning_rate": 1.2520334484431634e-06, - "loss": 0.1727, - "step": 31665 - }, - { - "epoch": 0.88, - "learning_rate": 1.25060646707954e-06, - "loss": 0.1757, - "step": 31670 - }, - { - "epoch": 0.88, - "learning_rate": 1.2491794857159165e-06, - "loss": 0.1101, - "step": 31675 - }, - { - "epoch": 0.88, - "learning_rate": 1.2477525043522933e-06, - "loss": 0.0878, - "step": 31680 - }, - { - "epoch": 0.88, - "learning_rate": 1.2463255229886699e-06, - "loss": 0.217, - "step": 31685 - }, - { - "epoch": 0.88, - "learning_rate": 1.2448985416250464e-06, - "loss": 0.2261, - "step": 31690 - }, - { - "epoch": 0.88, - "learning_rate": 1.2434715602614232e-06, - "loss": 0.1033, - "step": 31695 - }, - { - "epoch": 0.88, - "learning_rate": 1.2420445788977997e-06, - "loss": 0.5031, - "step": 31700 - }, - { - "epoch": 0.88, - "learning_rate": 1.2406175975341763e-06, - "loss": 0.136, - "step": 31705 - }, - { - "epoch": 0.88, - "learning_rate": 1.2391906161705528e-06, - "loss": 0.128, - "step": 31710 - }, - { - "epoch": 0.88, - "learning_rate": 1.2377636348069296e-06, - "loss": 0.122, - "step": 31715 - }, - { - "epoch": 0.88, - "learning_rate": 1.2363366534433061e-06, - "loss": 0.2872, - "step": 31720 - }, - { - "epoch": 0.88, - "learning_rate": 1.2349096720796827e-06, - "loss": 0.0875, - "step": 31725 - }, - { - "epoch": 0.88, - "learning_rate": 1.2334826907160594e-06, - "loss": 0.0886, - "step": 31730 - }, - { - "epoch": 0.88, - "learning_rate": 1.232055709352436e-06, - "loss": 0.2008, - "step": 31735 - }, - { - "epoch": 0.88, - "learning_rate": 1.2306287279888125e-06, - "loss": 0.2025, - "step": 31740 - }, - { - "epoch": 0.88, - "learning_rate": 1.229201746625189e-06, - "loss": 0.2424, - "step": 31745 - }, - { - "epoch": 0.88, - "learning_rate": 1.2277747652615659e-06, - "loss": 0.423, - "step": 31750 - }, - { - "epoch": 0.88, - "learning_rate": 1.2263477838979424e-06, - "loss": 0.124, - "step": 31755 - }, - { - "epoch": 0.88, - "learning_rate": 1.224920802534319e-06, - "loss": 0.1409, - "step": 31760 - }, - { - "epoch": 0.88, - "learning_rate": 1.2234938211706957e-06, - "loss": 0.1322, - "step": 31765 - }, - { - "epoch": 0.88, - "learning_rate": 1.2220668398070723e-06, - "loss": 0.1554, - "step": 31770 - }, - { - "epoch": 0.88, - "learning_rate": 1.2206398584434488e-06, - "loss": 0.1138, - "step": 31775 - }, - { - "epoch": 0.88, - "learning_rate": 1.2192128770798254e-06, - "loss": 0.1026, - "step": 31780 - }, - { - "epoch": 0.88, - "learning_rate": 1.217785895716202e-06, - "loss": 0.0916, - "step": 31785 - }, - { - "epoch": 0.88, - "learning_rate": 1.2163589143525787e-06, - "loss": 0.1633, - "step": 31790 - }, - { - "epoch": 0.88, - "learning_rate": 1.2149319329889552e-06, - "loss": 0.1434, - "step": 31795 - }, - { - "epoch": 0.88, - "learning_rate": 1.213504951625332e-06, - "loss": 0.2791, - "step": 31800 - }, - { - "epoch": 0.88, - "learning_rate": 1.2120779702617085e-06, - "loss": 0.1665, - "step": 31805 - }, - { - "epoch": 0.88, - "learning_rate": 1.210650988898085e-06, - "loss": 0.171, - "step": 31810 - }, - { - "epoch": 0.88, - "learning_rate": 1.2092240075344619e-06, - "loss": 0.1433, - "step": 31815 - }, - { - "epoch": 0.88, - "learning_rate": 1.2077970261708382e-06, - "loss": 0.1034, - "step": 31820 - }, - { - "epoch": 0.88, - "learning_rate": 1.206370044807215e-06, - "loss": 0.0952, - "step": 31825 - }, - { - "epoch": 0.88, - "learning_rate": 1.2049430634435915e-06, - "loss": 0.0653, - "step": 31830 - }, - { - "epoch": 0.88, - "learning_rate": 1.203516082079968e-06, - "loss": 0.0148, - "step": 31835 - }, - { - "epoch": 0.88, - "learning_rate": 1.2020891007163448e-06, - "loss": 0.1245, - "step": 31840 - }, - { - "epoch": 0.88, - "learning_rate": 1.2006621193527214e-06, - "loss": 0.1621, - "step": 31845 - }, - { - "epoch": 0.88, - "learning_rate": 1.199235137989098e-06, - "loss": 0.2584, - "step": 31850 - }, - { - "epoch": 0.88, - "learning_rate": 1.1978081566254745e-06, - "loss": 0.1122, - "step": 31855 - }, - { - "epoch": 0.88, - "learning_rate": 1.1963811752618512e-06, - "loss": 0.0627, - "step": 31860 - }, - { - "epoch": 0.88, - "learning_rate": 1.1949541938982278e-06, - "loss": 0.1209, - "step": 31865 - }, - { - "epoch": 0.88, - "learning_rate": 1.1935272125346043e-06, - "loss": 0.095, - "step": 31870 - }, - { - "epoch": 0.88, - "learning_rate": 1.192100231170981e-06, - "loss": 0.1409, - "step": 31875 - }, - { - "epoch": 0.88, - "learning_rate": 1.1906732498073576e-06, - "loss": 0.1354, - "step": 31880 - }, - { - "epoch": 0.88, - "learning_rate": 1.1892462684437342e-06, - "loss": 0.1059, - "step": 31885 - }, - { - "epoch": 0.88, - "learning_rate": 1.1878192870801107e-06, - "loss": 0.2424, - "step": 31890 - }, - { - "epoch": 0.89, - "learning_rate": 1.1863923057164875e-06, - "loss": 0.2392, - "step": 31895 - }, - { - "epoch": 0.89, - "learning_rate": 1.184965324352864e-06, - "loss": 0.4215, - "step": 31900 - }, - { - "epoch": 0.89, - "learning_rate": 1.1835383429892406e-06, - "loss": 0.1059, - "step": 31905 - }, - { - "epoch": 0.89, - "learning_rate": 1.1821113616256174e-06, - "loss": 0.153, - "step": 31910 - }, - { - "epoch": 0.89, - "learning_rate": 1.180684380261994e-06, - "loss": 0.1594, - "step": 31915 - }, - { - "epoch": 0.89, - "learning_rate": 1.1792573988983705e-06, - "loss": 0.197, - "step": 31920 - }, - { - "epoch": 0.89, - "learning_rate": 1.1778304175347472e-06, - "loss": 0.1146, - "step": 31925 - }, - { - "epoch": 0.89, - "learning_rate": 1.1764034361711236e-06, - "loss": 0.0842, - "step": 31930 - }, - { - "epoch": 0.89, - "learning_rate": 1.1749764548075003e-06, - "loss": 0.0934, - "step": 31935 - }, - { - "epoch": 0.89, - "learning_rate": 1.1735494734438769e-06, - "loss": 0.1809, - "step": 31940 - }, - { - "epoch": 0.89, - "learning_rate": 1.1721224920802534e-06, - "loss": 0.2709, - "step": 31945 - }, - { - "epoch": 0.89, - "learning_rate": 1.1706955107166302e-06, - "loss": 0.2268, - "step": 31950 - }, - { - "epoch": 0.89, - "learning_rate": 1.1692685293530067e-06, - "loss": 0.1638, - "step": 31955 - }, - { - "epoch": 0.89, - "learning_rate": 1.1678415479893833e-06, - "loss": 0.2125, - "step": 31960 - }, - { - "epoch": 0.89, - "learning_rate": 1.1664145666257599e-06, - "loss": 0.1602, - "step": 31965 - }, - { - "epoch": 0.89, - "learning_rate": 1.1649875852621366e-06, - "loss": 0.1404, - "step": 31970 - }, - { - "epoch": 0.89, - "learning_rate": 1.1635606038985132e-06, - "loss": 0.1611, - "step": 31975 - }, - { - "epoch": 0.89, - "learning_rate": 1.1621336225348897e-06, - "loss": 0.0797, - "step": 31980 - }, - { - "epoch": 0.89, - "learning_rate": 1.1607066411712665e-06, - "loss": 0.1523, - "step": 31985 - }, - { - "epoch": 0.89, - "learning_rate": 1.159279659807643e-06, - "loss": 0.0897, - "step": 31990 - }, - { - "epoch": 0.89, - "learning_rate": 1.1578526784440196e-06, - "loss": 0.272, - "step": 31995 - }, - { - "epoch": 0.89, - "learning_rate": 1.1564256970803961e-06, - "loss": 0.2478, - "step": 32000 - }, - { - "epoch": 0.89, - "eval_loss": 0.05729741230607033, - "eval_runtime": 1893.4584, - "eval_samples_per_second": 8.46, - "eval_steps_per_second": 2.115, - "eval_wer": 0.16078254597908404, - "step": 32000 - }, - { - "epoch": 0.89, - "learning_rate": 1.1549987157167729e-06, - "loss": 0.117, - "step": 32005 - }, - { - "epoch": 0.89, - "learning_rate": 1.1535717343531494e-06, - "loss": 0.1405, - "step": 32010 - }, - { - "epoch": 0.89, - "learning_rate": 1.152144752989526e-06, - "loss": 0.1392, - "step": 32015 - }, - { - "epoch": 0.89, - "learning_rate": 1.1507177716259028e-06, - "loss": 0.1713, - "step": 32020 - }, - { - "epoch": 0.89, - "learning_rate": 1.1492907902622793e-06, - "loss": 0.0718, - "step": 32025 - }, - { - "epoch": 0.89, - "learning_rate": 1.1478638088986559e-06, - "loss": 0.1474, - "step": 32030 - }, - { - "epoch": 0.89, - "learning_rate": 1.1464368275350326e-06, - "loss": 0.0845, - "step": 32035 - }, - { - "epoch": 0.89, - "learning_rate": 1.145009846171409e-06, - "loss": 0.1377, - "step": 32040 - }, - { - "epoch": 0.89, - "learning_rate": 1.1435828648077857e-06, - "loss": 0.1113, - "step": 32045 - }, - { - "epoch": 0.89, - "learning_rate": 1.1421558834441623e-06, - "loss": 0.5476, - "step": 32050 - }, - { - "epoch": 0.89, - "learning_rate": 1.1407289020805388e-06, - "loss": 0.1391, - "step": 32055 - }, - { - "epoch": 0.89, - "learning_rate": 1.1393019207169156e-06, - "loss": 0.1375, - "step": 32060 - }, - { - "epoch": 0.89, - "learning_rate": 1.1378749393532921e-06, - "loss": 0.1473, - "step": 32065 - }, - { - "epoch": 0.89, - "learning_rate": 1.1364479579896689e-06, - "loss": 0.1647, - "step": 32070 - }, - { - "epoch": 0.89, - "learning_rate": 1.1350209766260452e-06, - "loss": 0.1695, - "step": 32075 - }, - { - "epoch": 0.89, - "learning_rate": 1.133593995262422e-06, - "loss": 0.0699, - "step": 32080 - }, - { - "epoch": 0.89, - "learning_rate": 1.1321670138987985e-06, - "loss": 0.1329, - "step": 32085 - }, - { - "epoch": 0.89, - "learning_rate": 1.130740032535175e-06, - "loss": 0.1167, - "step": 32090 - }, - { - "epoch": 0.89, - "learning_rate": 1.1293130511715519e-06, - "loss": 0.3794, - "step": 32095 - }, - { - "epoch": 0.89, - "learning_rate": 1.1278860698079284e-06, - "loss": 0.2516, - "step": 32100 - }, - { - "epoch": 0.89, - "learning_rate": 1.126459088444305e-06, - "loss": 0.161, - "step": 32105 - }, - { - "epoch": 0.89, - "learning_rate": 1.1250321070806817e-06, - "loss": 0.1521, - "step": 32110 - }, - { - "epoch": 0.89, - "learning_rate": 1.1236051257170583e-06, - "loss": 0.1331, - "step": 32115 - }, - { - "epoch": 0.89, - "learning_rate": 1.1221781443534348e-06, - "loss": 0.1449, - "step": 32120 - }, - { - "epoch": 0.89, - "learning_rate": 1.1207511629898114e-06, - "loss": 0.1729, - "step": 32125 - }, - { - "epoch": 0.89, - "learning_rate": 1.1193241816261881e-06, - "loss": 0.0596, - "step": 32130 - }, - { - "epoch": 0.89, - "learning_rate": 1.1178972002625647e-06, - "loss": 0.1664, - "step": 32135 - }, - { - "epoch": 0.89, - "learning_rate": 1.1164702188989412e-06, - "loss": 0.1217, - "step": 32140 - }, - { - "epoch": 0.89, - "learning_rate": 1.115043237535318e-06, - "loss": 0.238, - "step": 32145 - }, - { - "epoch": 0.89, - "learning_rate": 1.1136162561716945e-06, - "loss": 0.3408, - "step": 32150 - }, - { - "epoch": 0.89, - "learning_rate": 1.112189274808071e-06, - "loss": 0.135, - "step": 32155 - }, - { - "epoch": 0.89, - "learning_rate": 1.1107622934444476e-06, - "loss": 0.1022, - "step": 32160 - }, - { - "epoch": 0.89, - "learning_rate": 1.1093353120808244e-06, - "loss": 0.1174, - "step": 32165 - }, - { - "epoch": 0.89, - "learning_rate": 1.107908330717201e-06, - "loss": 0.1456, - "step": 32170 - }, - { - "epoch": 0.89, - "learning_rate": 1.1064813493535775e-06, - "loss": 0.1333, - "step": 32175 - }, - { - "epoch": 0.89, - "learning_rate": 1.1050543679899543e-06, - "loss": 0.0945, - "step": 32180 - }, - { - "epoch": 0.89, - "learning_rate": 1.1036273866263306e-06, - "loss": 0.1796, - "step": 32185 - }, - { - "epoch": 0.89, - "learning_rate": 1.1022004052627074e-06, - "loss": 0.1358, - "step": 32190 - }, - { - "epoch": 0.89, - "learning_rate": 1.100773423899084e-06, - "loss": 0.1462, - "step": 32195 - }, - { - "epoch": 0.89, - "learning_rate": 1.0993464425354605e-06, - "loss": 0.349, - "step": 32200 - }, - { - "epoch": 0.89, - "learning_rate": 1.0979194611718372e-06, - "loss": 0.0936, - "step": 32205 - }, - { - "epoch": 0.89, - "learning_rate": 1.0964924798082138e-06, - "loss": 0.1575, - "step": 32210 - }, - { - "epoch": 0.89, - "learning_rate": 1.0950654984445903e-06, - "loss": 0.0929, - "step": 32215 - }, - { - "epoch": 0.89, - "learning_rate": 1.093638517080967e-06, - "loss": 0.1964, - "step": 32220 - }, - { - "epoch": 0.89, - "learning_rate": 1.0922115357173436e-06, - "loss": 0.0948, - "step": 32225 - }, - { - "epoch": 0.89, - "learning_rate": 1.0907845543537202e-06, - "loss": 0.0401, - "step": 32230 - }, - { - "epoch": 0.89, - "learning_rate": 1.0893575729900967e-06, - "loss": 0.2228, - "step": 32235 - }, - { - "epoch": 0.89, - "learning_rate": 1.0879305916264735e-06, - "loss": 0.2275, - "step": 32240 - }, - { - "epoch": 0.89, - "learning_rate": 1.08650361026285e-06, - "loss": 0.1291, - "step": 32245 - }, - { - "epoch": 0.89, - "learning_rate": 1.0850766288992266e-06, - "loss": 0.2682, - "step": 32250 - }, - { - "epoch": 0.9, - "learning_rate": 1.0836496475356034e-06, - "loss": 0.1324, - "step": 32255 - }, - { - "epoch": 0.9, - "learning_rate": 1.08222266617198e-06, - "loss": 0.2206, - "step": 32260 - }, - { - "epoch": 0.9, - "learning_rate": 1.0807956848083565e-06, - "loss": 0.1372, - "step": 32265 - }, - { - "epoch": 0.9, - "learning_rate": 1.079368703444733e-06, - "loss": 0.1072, - "step": 32270 - }, - { - "epoch": 0.9, - "learning_rate": 1.0779417220811098e-06, - "loss": 0.2071, - "step": 32275 - }, - { - "epoch": 0.9, - "learning_rate": 1.0765147407174863e-06, - "loss": 0.0434, - "step": 32280 - }, - { - "epoch": 0.9, - "learning_rate": 1.0750877593538629e-06, - "loss": 0.0655, - "step": 32285 - }, - { - "epoch": 0.9, - "learning_rate": 1.0736607779902396e-06, - "loss": 0.1538, - "step": 32290 - }, - { - "epoch": 0.9, - "learning_rate": 1.072233796626616e-06, - "loss": 0.2186, - "step": 32295 - }, - { - "epoch": 0.9, - "learning_rate": 1.0708068152629928e-06, - "loss": 0.3193, - "step": 32300 - }, - { - "epoch": 0.9, - "learning_rate": 1.0693798338993693e-06, - "loss": 0.1266, - "step": 32305 - }, - { - "epoch": 0.9, - "learning_rate": 1.0679528525357459e-06, - "loss": 0.1263, - "step": 32310 - }, - { - "epoch": 0.9, - "learning_rate": 1.0665258711721226e-06, - "loss": 0.121, - "step": 32315 - }, - { - "epoch": 0.9, - "learning_rate": 1.0650988898084992e-06, - "loss": 0.1924, - "step": 32320 - }, - { - "epoch": 0.9, - "learning_rate": 1.063671908444876e-06, - "loss": 0.0982, - "step": 32325 - }, - { - "epoch": 0.9, - "learning_rate": 1.0622449270812525e-06, - "loss": 0.0966, - "step": 32330 - }, - { - "epoch": 0.9, - "learning_rate": 1.060817945717629e-06, - "loss": 0.079, - "step": 32335 - }, - { - "epoch": 0.9, - "learning_rate": 1.0593909643540056e-06, - "loss": 0.2549, - "step": 32340 - }, - { - "epoch": 0.9, - "learning_rate": 1.0579639829903821e-06, - "loss": 0.2105, - "step": 32345 - }, - { - "epoch": 0.9, - "learning_rate": 1.0565370016267589e-06, - "loss": 0.2951, - "step": 32350 - }, - { - "epoch": 0.9, - "learning_rate": 1.0551100202631354e-06, - "loss": 0.0777, - "step": 32355 - }, - { - "epoch": 0.9, - "learning_rate": 1.053683038899512e-06, - "loss": 0.108, - "step": 32360 - }, - { - "epoch": 0.9, - "learning_rate": 1.0522560575358888e-06, - "loss": 0.144, - "step": 32365 - }, - { - "epoch": 0.9, - "learning_rate": 1.0508290761722653e-06, - "loss": 0.1481, - "step": 32370 - }, - { - "epoch": 0.9, - "learning_rate": 1.0494020948086419e-06, - "loss": 0.2673, - "step": 32375 - }, - { - "epoch": 0.9, - "learning_rate": 1.0479751134450184e-06, - "loss": 0.1464, - "step": 32380 - }, - { - "epoch": 0.9, - "learning_rate": 1.0465481320813952e-06, - "loss": 0.0679, - "step": 32385 - }, - { - "epoch": 0.9, - "learning_rate": 1.0451211507177717e-06, - "loss": 0.0727, - "step": 32390 - }, - { - "epoch": 0.9, - "learning_rate": 1.0436941693541483e-06, - "loss": 0.1183, - "step": 32395 - }, - { - "epoch": 0.9, - "learning_rate": 1.042267187990525e-06, - "loss": 0.3782, - "step": 32400 - }, - { - "epoch": 0.9, - "learning_rate": 1.0408402066269016e-06, - "loss": 0.1716, - "step": 32405 - }, - { - "epoch": 0.9, - "learning_rate": 1.0394132252632781e-06, - "loss": 0.1466, - "step": 32410 - }, - { - "epoch": 0.9, - "learning_rate": 1.0379862438996547e-06, - "loss": 0.131, - "step": 32415 - }, - { - "epoch": 0.9, - "learning_rate": 1.0365592625360314e-06, - "loss": 0.172, - "step": 32420 - }, - { - "epoch": 0.9, - "learning_rate": 1.035132281172408e-06, - "loss": 0.2046, - "step": 32425 - }, - { - "epoch": 0.9, - "learning_rate": 1.0337052998087845e-06, - "loss": 0.134, - "step": 32430 - }, - { - "epoch": 0.9, - "learning_rate": 1.0322783184451613e-06, - "loss": 0.1269, - "step": 32435 - }, - { - "epoch": 0.9, - "learning_rate": 1.0308513370815379e-06, - "loss": 0.1931, - "step": 32440 - }, - { - "epoch": 0.9, - "learning_rate": 1.0294243557179144e-06, - "loss": 0.3455, - "step": 32445 - }, - { - "epoch": 0.9, - "learning_rate": 1.027997374354291e-06, - "loss": 0.4596, - "step": 32450 - }, - { - "epoch": 0.9, - "learning_rate": 1.0265703929906675e-06, - "loss": 0.1474, - "step": 32455 - }, - { - "epoch": 0.9, - "learning_rate": 1.0251434116270443e-06, - "loss": 0.1049, - "step": 32460 - }, - { - "epoch": 0.9, - "learning_rate": 1.0237164302634208e-06, - "loss": 0.1086, - "step": 32465 - }, - { - "epoch": 0.9, - "learning_rate": 1.0222894488997974e-06, - "loss": 0.1306, - "step": 32470 - }, - { - "epoch": 0.9, - "learning_rate": 1.0208624675361741e-06, - "loss": 0.1247, - "step": 32475 - }, - { - "epoch": 0.9, - "learning_rate": 1.0194354861725507e-06, - "loss": 0.1273, - "step": 32480 - }, - { - "epoch": 0.9, - "learning_rate": 1.0180085048089272e-06, - "loss": 0.1708, - "step": 32485 - }, - { - "epoch": 0.9, - "learning_rate": 1.0165815234453038e-06, - "loss": 0.1291, - "step": 32490 - }, - { - "epoch": 0.9, - "learning_rate": 1.0151545420816805e-06, - "loss": 0.1723, - "step": 32495 - }, - { - "epoch": 0.9, - "learning_rate": 1.013727560718057e-06, - "loss": 0.4103, - "step": 32500 - }, - { - "epoch": 0.9, - "learning_rate": 1.0123005793544336e-06, - "loss": 0.1288, - "step": 32505 - }, - { - "epoch": 0.9, - "learning_rate": 1.0108735979908104e-06, - "loss": 0.117, - "step": 32510 - }, - { - "epoch": 0.9, - "learning_rate": 1.009446616627187e-06, - "loss": 0.2106, - "step": 32515 - }, - { - "epoch": 0.9, - "learning_rate": 1.0080196352635635e-06, - "loss": 0.1813, - "step": 32520 - }, - { - "epoch": 0.9, - "learning_rate": 1.00659265389994e-06, - "loss": 0.2038, - "step": 32525 - }, - { - "epoch": 0.9, - "learning_rate": 1.0051656725363168e-06, - "loss": 0.04, - "step": 32530 - }, - { - "epoch": 0.9, - "learning_rate": 1.0037386911726934e-06, - "loss": 0.0859, - "step": 32535 - }, - { - "epoch": 0.9, - "learning_rate": 1.00231170980907e-06, - "loss": 0.1195, - "step": 32540 - }, - { - "epoch": 0.9, - "learning_rate": 1.0008847284454467e-06, - "loss": 0.3733, - "step": 32545 - }, - { - "epoch": 0.9, - "learning_rate": 9.994577470818232e-07, - "loss": 0.4709, - "step": 32550 - }, - { - "epoch": 0.9, - "learning_rate": 9.980307657181998e-07, - "loss": 0.1486, - "step": 32555 - }, - { - "epoch": 0.9, - "learning_rate": 9.966037843545765e-07, - "loss": 0.2014, - "step": 32560 - }, - { - "epoch": 0.9, - "learning_rate": 9.951768029909529e-07, - "loss": 0.129, - "step": 32565 - }, - { - "epoch": 0.9, - "learning_rate": 9.937498216273296e-07, - "loss": 0.1603, - "step": 32570 - }, - { - "epoch": 0.9, - "learning_rate": 9.923228402637062e-07, - "loss": 0.1285, - "step": 32575 - }, - { - "epoch": 0.9, - "learning_rate": 9.90895858900083e-07, - "loss": 0.132, - "step": 32580 - }, - { - "epoch": 0.9, - "learning_rate": 9.894688775364595e-07, - "loss": 0.0625, - "step": 32585 - }, - { - "epoch": 0.9, - "learning_rate": 9.88041896172836e-07, - "loss": 0.3227, - "step": 32590 - }, - { - "epoch": 0.9, - "learning_rate": 9.866149148092128e-07, - "loss": 0.2231, - "step": 32595 - }, - { - "epoch": 0.9, - "learning_rate": 9.851879334455892e-07, - "loss": 0.2693, - "step": 32600 - }, - { - "epoch": 0.9, - "learning_rate": 9.83760952081966e-07, - "loss": 0.1329, - "step": 32605 - }, - { - "epoch": 0.9, - "learning_rate": 9.823339707183425e-07, - "loss": 0.0944, - "step": 32610 - }, - { - "epoch": 0.9, - "learning_rate": 9.80906989354719e-07, - "loss": 0.1512, - "step": 32615 - }, - { - "epoch": 0.91, - "learning_rate": 9.794800079910958e-07, - "loss": 0.1565, - "step": 32620 - }, - { - "epoch": 0.91, - "learning_rate": 9.780530266274723e-07, - "loss": 0.0535, - "step": 32625 - }, - { - "epoch": 0.91, - "learning_rate": 9.766260452638489e-07, - "loss": 0.0325, - "step": 32630 - }, - { - "epoch": 0.91, - "learning_rate": 9.751990639002254e-07, - "loss": 0.139, - "step": 32635 - }, - { - "epoch": 0.91, - "learning_rate": 9.737720825366022e-07, - "loss": 0.1512, - "step": 32640 - }, - { - "epoch": 0.91, - "learning_rate": 9.723451011729788e-07, - "loss": 0.2666, - "step": 32645 - }, - { - "epoch": 0.91, - "learning_rate": 9.709181198093553e-07, - "loss": 0.3004, - "step": 32650 - }, - { - "epoch": 0.91, - "learning_rate": 9.69491138445732e-07, - "loss": 0.1139, - "step": 32655 - }, - { - "epoch": 0.91, - "learning_rate": 9.680641570821086e-07, - "loss": 0.125, - "step": 32660 - }, - { - "epoch": 0.91, - "learning_rate": 9.666371757184852e-07, - "loss": 0.1188, - "step": 32665 - }, - { - "epoch": 0.91, - "learning_rate": 9.65210194354862e-07, - "loss": 0.1088, - "step": 32670 - }, - { - "epoch": 0.91, - "learning_rate": 9.637832129912385e-07, - "loss": 0.1492, - "step": 32675 - }, - { - "epoch": 0.91, - "learning_rate": 9.62356231627615e-07, - "loss": 0.0954, - "step": 32680 - }, - { - "epoch": 0.91, - "learning_rate": 9.609292502639916e-07, - "loss": 0.1257, - "step": 32685 - }, - { - "epoch": 0.91, - "learning_rate": 9.595022689003683e-07, - "loss": 0.1355, - "step": 32690 - }, - { - "epoch": 0.91, - "learning_rate": 9.580752875367449e-07, - "loss": 0.3235, - "step": 32695 - }, - { - "epoch": 0.91, - "learning_rate": 9.566483061731214e-07, - "loss": 0.2797, - "step": 32700 - }, - { - "epoch": 0.91, - "learning_rate": 9.552213248094982e-07, - "loss": 0.1561, - "step": 32705 - }, - { - "epoch": 0.91, - "learning_rate": 9.537943434458745e-07, - "loss": 0.1145, - "step": 32710 - }, - { - "epoch": 0.91, - "learning_rate": 9.523673620822513e-07, - "loss": 0.1294, - "step": 32715 - }, - { - "epoch": 0.91, - "learning_rate": 9.50940380718628e-07, - "loss": 0.2222, - "step": 32720 - }, - { - "epoch": 0.91, - "learning_rate": 9.495133993550044e-07, - "loss": 0.061, - "step": 32725 - }, - { - "epoch": 0.91, - "learning_rate": 9.480864179913811e-07, - "loss": 0.0274, - "step": 32730 - }, - { - "epoch": 0.91, - "learning_rate": 9.466594366277577e-07, - "loss": 0.0451, - "step": 32735 - }, - { - "epoch": 0.91, - "learning_rate": 9.452324552641343e-07, - "loss": 0.2271, - "step": 32740 - }, - { - "epoch": 0.91, - "learning_rate": 9.438054739005109e-07, - "loss": 0.197, - "step": 32745 - }, - { - "epoch": 0.91, - "learning_rate": 9.423784925368876e-07, - "loss": 0.3383, - "step": 32750 - }, - { - "epoch": 0.91, - "learning_rate": 9.409515111732642e-07, - "loss": 0.1195, - "step": 32755 - }, - { - "epoch": 0.91, - "learning_rate": 9.395245298096408e-07, - "loss": 0.1709, - "step": 32760 - }, - { - "epoch": 0.91, - "learning_rate": 9.380975484460173e-07, - "loss": 0.108, - "step": 32765 - }, - { - "epoch": 0.91, - "learning_rate": 9.36670567082394e-07, - "loss": 0.1488, - "step": 32770 - }, - { - "epoch": 0.91, - "learning_rate": 9.352435857187705e-07, - "loss": 0.2289, - "step": 32775 - }, - { - "epoch": 0.91, - "learning_rate": 9.338166043551472e-07, - "loss": 0.05, - "step": 32780 - }, - { - "epoch": 0.91, - "learning_rate": 9.323896229915239e-07, - "loss": 0.0459, - "step": 32785 - }, - { - "epoch": 0.91, - "learning_rate": 9.309626416279004e-07, - "loss": 0.1959, - "step": 32790 - }, - { - "epoch": 0.91, - "learning_rate": 9.295356602642771e-07, - "loss": 0.4017, - "step": 32795 - }, - { - "epoch": 0.91, - "learning_rate": 9.281086789006537e-07, - "loss": 0.2562, - "step": 32800 - }, - { - "epoch": 0.91, - "learning_rate": 9.266816975370302e-07, - "loss": 0.1345, - "step": 32805 - }, - { - "epoch": 0.91, - "learning_rate": 9.252547161734068e-07, - "loss": 0.1602, - "step": 32810 - }, - { - "epoch": 0.91, - "learning_rate": 9.238277348097835e-07, - "loss": 0.1423, - "step": 32815 - }, - { - "epoch": 0.91, - "learning_rate": 9.2240075344616e-07, - "loss": 0.0745, - "step": 32820 - }, - { - "epoch": 0.91, - "learning_rate": 9.209737720825367e-07, - "loss": 0.0695, - "step": 32825 - }, - { - "epoch": 0.91, - "learning_rate": 9.195467907189133e-07, - "loss": 0.1367, - "step": 32830 - }, - { - "epoch": 0.91, - "learning_rate": 9.181198093552898e-07, - "loss": 0.1857, - "step": 32835 - }, - { - "epoch": 0.91, - "learning_rate": 9.169782242643911e-07, - "loss": 0.2616, - "step": 32840 - }, - { - "epoch": 0.91, - "learning_rate": 9.155512429007678e-07, - "loss": 0.2157, - "step": 32845 - }, - { - "epoch": 0.91, - "learning_rate": 9.141242615371444e-07, - "loss": 0.2924, - "step": 32850 - }, - { - "epoch": 0.91, - "learning_rate": 9.126972801735211e-07, - "loss": 0.2066, - "step": 32855 - }, - { - "epoch": 0.91, - "learning_rate": 9.112702988098975e-07, - "loss": 0.1573, - "step": 32860 - }, - { - "epoch": 0.91, - "learning_rate": 9.098433174462742e-07, - "loss": 0.1145, - "step": 32865 - }, - { - "epoch": 0.91, - "learning_rate": 9.084163360826509e-07, - "loss": 0.1879, - "step": 32870 - }, - { - "epoch": 0.91, - "learning_rate": 9.069893547190274e-07, - "loss": 0.17, - "step": 32875 - }, - { - "epoch": 0.91, - "learning_rate": 9.055623733554041e-07, - "loss": 0.0442, - "step": 32880 - }, - { - "epoch": 0.91, - "learning_rate": 9.041353919917807e-07, - "loss": 0.0631, - "step": 32885 - }, - { - "epoch": 0.91, - "learning_rate": 9.027084106281573e-07, - "loss": 0.2354, - "step": 32890 - }, - { - "epoch": 0.91, - "learning_rate": 9.012814292645339e-07, - "loss": 0.1421, - "step": 32895 - }, - { - "epoch": 0.91, - "learning_rate": 8.998544479009106e-07, - "loss": 0.2422, - "step": 32900 - }, - { - "epoch": 0.91, - "learning_rate": 8.98427466537287e-07, - "loss": 0.1385, - "step": 32905 - }, - { - "epoch": 0.91, - "learning_rate": 8.970004851736637e-07, - "loss": 0.1083, - "step": 32910 - }, - { - "epoch": 0.91, - "learning_rate": 8.955735038100403e-07, - "loss": 0.1864, - "step": 32915 - }, - { - "epoch": 0.91, - "learning_rate": 8.941465224464169e-07, - "loss": 0.149, - "step": 32920 - }, - { - "epoch": 0.91, - "learning_rate": 8.927195410827935e-07, - "loss": 0.2301, - "step": 32925 - }, - { - "epoch": 0.91, - "learning_rate": 8.912925597191702e-07, - "loss": 0.029, - "step": 32930 - }, - { - "epoch": 0.91, - "learning_rate": 8.898655783555466e-07, - "loss": 0.1289, - "step": 32935 - }, - { - "epoch": 0.91, - "learning_rate": 8.884385969919233e-07, - "loss": 0.1008, - "step": 32940 - }, - { - "epoch": 0.91, - "learning_rate": 8.870116156283e-07, - "loss": 0.1501, - "step": 32945 - }, - { - "epoch": 0.91, - "learning_rate": 8.855846342646766e-07, - "loss": 0.4542, - "step": 32950 - }, - { - "epoch": 0.91, - "learning_rate": 8.841576529010532e-07, - "loss": 0.1106, - "step": 32955 - }, - { - "epoch": 0.91, - "learning_rate": 8.827306715374298e-07, - "loss": 0.1505, - "step": 32960 - }, - { - "epoch": 0.91, - "learning_rate": 8.813036901738065e-07, - "loss": 0.1458, - "step": 32965 - }, - { - "epoch": 0.91, - "learning_rate": 8.798767088101829e-07, - "loss": 0.2285, - "step": 32970 - }, - { - "epoch": 0.91, - "learning_rate": 8.784497274465596e-07, - "loss": 0.1022, - "step": 32975 - }, - { - "epoch": 0.92, - "learning_rate": 8.770227460829362e-07, - "loss": 0.0422, - "step": 32980 - }, - { - "epoch": 0.92, - "learning_rate": 8.755957647193128e-07, - "loss": 0.0593, - "step": 32985 - }, - { - "epoch": 0.92, - "learning_rate": 8.741687833556894e-07, - "loss": 0.2012, - "step": 32990 - }, - { - "epoch": 0.92, - "learning_rate": 8.727418019920661e-07, - "loss": 0.1078, - "step": 32995 - }, - { - "epoch": 0.92, - "learning_rate": 8.713148206284426e-07, - "loss": 0.245, - "step": 33000 - }, - { - "epoch": 0.92, - "learning_rate": 8.698878392648193e-07, - "loss": 0.1325, - "step": 33005 - }, - { - "epoch": 0.92, - "learning_rate": 8.68460857901196e-07, - "loss": 0.093, - "step": 33010 - }, - { - "epoch": 0.92, - "learning_rate": 8.670338765375724e-07, - "loss": 0.1878, - "step": 33015 - }, - { - "epoch": 0.92, - "learning_rate": 8.656068951739491e-07, - "loss": 0.119, - "step": 33020 - }, - { - "epoch": 0.92, - "learning_rate": 8.641799138103257e-07, - "loss": 0.1321, - "step": 33025 - }, - { - "epoch": 0.92, - "learning_rate": 8.627529324467024e-07, - "loss": 0.1079, - "step": 33030 - }, - { - "epoch": 0.92, - "learning_rate": 8.613259510830789e-07, - "loss": 0.1126, - "step": 33035 - }, - { - "epoch": 0.92, - "learning_rate": 8.598989697194556e-07, - "loss": 0.1239, - "step": 33040 - }, - { - "epoch": 0.92, - "learning_rate": 8.584719883558322e-07, - "loss": 0.2793, - "step": 33045 - }, - { - "epoch": 0.92, - "learning_rate": 8.570450069922087e-07, - "loss": 0.5398, - "step": 33050 - }, - { - "epoch": 0.92, - "learning_rate": 8.556180256285853e-07, - "loss": 0.1289, - "step": 33055 - }, - { - "epoch": 0.92, - "learning_rate": 8.54191044264962e-07, - "loss": 0.1211, - "step": 33060 - }, - { - "epoch": 0.92, - "learning_rate": 8.527640629013385e-07, - "loss": 0.1767, - "step": 33065 - }, - { - "epoch": 0.92, - "learning_rate": 8.513370815377152e-07, - "loss": 0.182, - "step": 33070 - }, - { - "epoch": 0.92, - "learning_rate": 8.499101001740919e-07, - "loss": 0.0843, - "step": 33075 - }, - { - "epoch": 0.92, - "learning_rate": 8.484831188104683e-07, - "loss": 0.218, - "step": 33080 - }, - { - "epoch": 0.92, - "learning_rate": 8.47056137446845e-07, - "loss": 0.1083, - "step": 33085 - }, - { - "epoch": 0.92, - "learning_rate": 8.456291560832216e-07, - "loss": 0.2618, - "step": 33090 - }, - { - "epoch": 0.92, - "learning_rate": 8.442021747195982e-07, - "loss": 0.2359, - "step": 33095 - }, - { - "epoch": 0.92, - "learning_rate": 8.427751933559748e-07, - "loss": 0.2874, - "step": 33100 - }, - { - "epoch": 0.92, - "learning_rate": 8.413482119923515e-07, - "loss": 0.1613, - "step": 33105 - }, - { - "epoch": 0.92, - "learning_rate": 8.39921230628728e-07, - "loss": 0.1171, - "step": 33110 - }, - { - "epoch": 0.92, - "learning_rate": 8.384942492651047e-07, - "loss": 0.1422, - "step": 33115 - }, - { - "epoch": 0.92, - "learning_rate": 8.370672679014813e-07, - "loss": 0.1607, - "step": 33120 - }, - { - "epoch": 0.92, - "learning_rate": 8.35640286537858e-07, - "loss": 0.0315, - "step": 33125 - }, - { - "epoch": 0.92, - "learning_rate": 8.342133051742344e-07, - "loss": 0.0461, - "step": 33130 - }, - { - "epoch": 0.92, - "learning_rate": 8.327863238106111e-07, - "loss": 0.0458, - "step": 33135 - }, - { - "epoch": 0.92, - "learning_rate": 8.313593424469878e-07, - "loss": 0.2426, - "step": 33140 - }, - { - "epoch": 0.92, - "learning_rate": 8.299323610833643e-07, - "loss": 0.2135, - "step": 33145 - }, - { - "epoch": 0.92, - "learning_rate": 8.28505379719741e-07, - "loss": 0.2423, - "step": 33150 - }, - { - "epoch": 0.92, - "learning_rate": 8.270783983561176e-07, - "loss": 0.1246, - "step": 33155 - }, - { - "epoch": 0.92, - "learning_rate": 8.256514169924941e-07, - "loss": 0.1177, - "step": 33160 - }, - { - "epoch": 0.92, - "learning_rate": 8.242244356288707e-07, - "loss": 0.1109, - "step": 33165 - }, - { - "epoch": 0.92, - "learning_rate": 8.227974542652474e-07, - "loss": 0.1596, - "step": 33170 - }, - { - "epoch": 0.92, - "learning_rate": 8.213704729016239e-07, - "loss": 0.0513, - "step": 33175 - }, - { - "epoch": 0.92, - "learning_rate": 8.199434915380006e-07, - "loss": 0.0563, - "step": 33180 - }, - { - "epoch": 0.92, - "learning_rate": 8.185165101743772e-07, - "loss": 0.1136, - "step": 33185 - }, - { - "epoch": 0.92, - "learning_rate": 8.170895288107538e-07, - "loss": 0.2111, - "step": 33190 - }, - { - "epoch": 0.92, - "learning_rate": 8.156625474471303e-07, - "loss": 0.3876, - "step": 33195 - }, - { - "epoch": 0.92, - "learning_rate": 8.14235566083507e-07, - "loss": 0.3911, - "step": 33200 - }, - { - "epoch": 0.92, - "learning_rate": 8.128085847198836e-07, - "loss": 0.0825, - "step": 33205 - }, - { - "epoch": 0.92, - "learning_rate": 8.113816033562602e-07, - "loss": 0.1268, - "step": 33210 - }, - { - "epoch": 0.92, - "learning_rate": 8.099546219926369e-07, - "loss": 0.1564, - "step": 33215 - }, - { - "epoch": 0.92, - "learning_rate": 8.085276406290135e-07, - "loss": 0.203, - "step": 33220 - }, - { - "epoch": 0.92, - "learning_rate": 8.071006592653901e-07, - "loss": 0.1381, - "step": 33225 - }, - { - "epoch": 0.92, - "learning_rate": 8.056736779017667e-07, - "loss": 0.0553, - "step": 33230 - }, - { - "epoch": 0.92, - "learning_rate": 8.042466965381434e-07, - "loss": 0.1891, - "step": 33235 - }, - { - "epoch": 0.92, - "learning_rate": 8.028197151745198e-07, - "loss": 0.119, - "step": 33240 - }, - { - "epoch": 0.92, - "learning_rate": 8.013927338108965e-07, - "loss": 0.2053, - "step": 33245 - }, - { - "epoch": 0.92, - "learning_rate": 7.999657524472731e-07, - "loss": 0.2148, - "step": 33250 - }, - { - "epoch": 0.92, - "learning_rate": 7.985387710836497e-07, - "loss": 0.0989, - "step": 33255 - }, - { - "epoch": 0.92, - "learning_rate": 7.971117897200263e-07, - "loss": 0.1083, - "step": 33260 - }, - { - "epoch": 0.92, - "learning_rate": 7.95684808356403e-07, - "loss": 0.1214, - "step": 33265 - }, - { - "epoch": 0.92, - "learning_rate": 7.942578269927794e-07, - "loss": 0.1139, - "step": 33270 - }, - { - "epoch": 0.92, - "learning_rate": 7.928308456291561e-07, - "loss": 0.1189, - "step": 33275 - }, - { - "epoch": 0.92, - "learning_rate": 7.914038642655328e-07, - "loss": 0.112, - "step": 33280 - }, - { - "epoch": 0.92, - "learning_rate": 7.899768829019093e-07, - "loss": 0.2058, - "step": 33285 - }, - { - "epoch": 0.92, - "learning_rate": 7.88549901538286e-07, - "loss": 0.1444, - "step": 33290 - }, - { - "epoch": 0.92, - "learning_rate": 7.871229201746626e-07, - "loss": 0.2797, - "step": 33295 - }, - { - "epoch": 0.92, - "learning_rate": 7.856959388110393e-07, - "loss": 0.1918, - "step": 33300 - }, - { - "epoch": 0.92, - "learning_rate": 7.842689574474157e-07, - "loss": 0.0939, - "step": 33305 - }, - { - "epoch": 0.92, - "learning_rate": 7.828419760837924e-07, - "loss": 0.1664, - "step": 33310 - }, - { - "epoch": 0.92, - "learning_rate": 7.81414994720169e-07, - "loss": 0.0634, - "step": 33315 - }, - { - "epoch": 0.92, - "learning_rate": 7.799880133565456e-07, - "loss": 0.1292, - "step": 33320 - }, - { - "epoch": 0.92, - "learning_rate": 7.785610319929222e-07, - "loss": 0.1139, - "step": 33325 - }, - { - "epoch": 0.92, - "learning_rate": 7.771340506292989e-07, - "loss": 0.0575, - "step": 33330 - }, - { - "epoch": 0.92, - "learning_rate": 7.757070692656754e-07, - "loss": 0.0883, - "step": 33335 - }, - { - "epoch": 0.93, - "learning_rate": 7.742800879020521e-07, - "loss": 0.0945, - "step": 33340 - }, - { - "epoch": 0.93, - "learning_rate": 7.728531065384288e-07, - "loss": 0.4529, - "step": 33345 - }, - { - "epoch": 0.93, - "learning_rate": 7.714261251748052e-07, - "loss": 0.2622, - "step": 33350 - }, - { - "epoch": 0.93, - "learning_rate": 7.699991438111819e-07, - "loss": 0.1283, - "step": 33355 - }, - { - "epoch": 0.93, - "learning_rate": 7.685721624475585e-07, - "loss": 0.1511, - "step": 33360 - }, - { - "epoch": 0.93, - "learning_rate": 7.671451810839351e-07, - "loss": 0.1189, - "step": 33365 - }, - { - "epoch": 0.93, - "learning_rate": 7.657181997203117e-07, - "loss": 0.1398, - "step": 33370 - }, - { - "epoch": 0.93, - "learning_rate": 7.642912183566884e-07, - "loss": 0.0603, - "step": 33375 - }, - { - "epoch": 0.93, - "learning_rate": 7.62864236993065e-07, - "loss": 0.1477, - "step": 33380 - }, - { - "epoch": 0.93, - "learning_rate": 7.614372556294415e-07, - "loss": 0.1919, - "step": 33385 - }, - { - "epoch": 0.93, - "learning_rate": 7.600102742658181e-07, - "loss": 0.0869, - "step": 33390 - }, - { - "epoch": 0.93, - "learning_rate": 7.585832929021948e-07, - "loss": 0.3016, - "step": 33395 - }, - { - "epoch": 0.93, - "learning_rate": 7.571563115385713e-07, - "loss": 0.1987, - "step": 33400 - }, - { - "epoch": 0.93, - "learning_rate": 7.55729330174948e-07, - "loss": 0.1416, - "step": 33405 - }, - { - "epoch": 0.93, - "learning_rate": 7.543023488113247e-07, - "loss": 0.1149, - "step": 33410 - }, - { - "epoch": 0.93, - "learning_rate": 7.528753674477012e-07, - "loss": 0.1641, - "step": 33415 - }, - { - "epoch": 0.93, - "learning_rate": 7.514483860840778e-07, - "loss": 0.0868, - "step": 33420 - }, - { - "epoch": 0.93, - "learning_rate": 7.500214047204544e-07, - "loss": 0.0629, - "step": 33425 - }, - { - "epoch": 0.93, - "learning_rate": 7.48594423356831e-07, - "loss": 0.0216, - "step": 33430 - }, - { - "epoch": 0.93, - "learning_rate": 7.471674419932076e-07, - "loss": 0.1032, - "step": 33435 - }, - { - "epoch": 0.93, - "learning_rate": 7.457404606295843e-07, - "loss": 0.1709, - "step": 33440 - }, - { - "epoch": 0.93, - "learning_rate": 7.443134792659608e-07, - "loss": 0.175, - "step": 33445 - }, - { - "epoch": 0.93, - "learning_rate": 7.428864979023375e-07, - "loss": 0.309, - "step": 33450 - }, - { - "epoch": 0.93, - "learning_rate": 7.414595165387141e-07, - "loss": 0.0988, - "step": 33455 - }, - { - "epoch": 0.93, - "learning_rate": 7.400325351750906e-07, - "loss": 0.1871, - "step": 33460 - }, - { - "epoch": 0.93, - "learning_rate": 7.386055538114672e-07, - "loss": 0.0989, - "step": 33465 - }, - { - "epoch": 0.93, - "learning_rate": 7.371785724478439e-07, - "loss": 0.1144, - "step": 33470 - }, - { - "epoch": 0.93, - "learning_rate": 7.357515910842205e-07, - "loss": 0.1737, - "step": 33475 - }, - { - "epoch": 0.93, - "learning_rate": 7.343246097205971e-07, - "loss": 0.1028, - "step": 33480 - }, - { - "epoch": 0.93, - "learning_rate": 7.328976283569738e-07, - "loss": 0.1129, - "step": 33485 - }, - { - "epoch": 0.93, - "learning_rate": 7.314706469933504e-07, - "loss": 0.17, - "step": 33490 - }, - { - "epoch": 0.93, - "learning_rate": 7.300436656297269e-07, - "loss": 0.1031, - "step": 33495 - }, - { - "epoch": 0.93, - "learning_rate": 7.286166842661035e-07, - "loss": 0.2834, - "step": 33500 - }, - { - "epoch": 0.93, - "learning_rate": 7.271897029024802e-07, - "loss": 0.0981, - "step": 33505 - }, - { - "epoch": 0.93, - "learning_rate": 7.257627215388567e-07, - "loss": 0.0891, - "step": 33510 - }, - { - "epoch": 0.93, - "learning_rate": 7.243357401752334e-07, - "loss": 0.1161, - "step": 33515 - }, - { - "epoch": 0.93, - "learning_rate": 7.2290875881161e-07, - "loss": 0.1518, - "step": 33520 - }, - { - "epoch": 0.93, - "learning_rate": 7.214817774479866e-07, - "loss": 0.1283, - "step": 33525 - }, - { - "epoch": 0.93, - "learning_rate": 7.200547960843631e-07, - "loss": 0.0354, - "step": 33530 - }, - { - "epoch": 0.93, - "learning_rate": 7.186278147207398e-07, - "loss": 0.0688, - "step": 33535 - }, - { - "epoch": 0.93, - "learning_rate": 7.172008333571163e-07, - "loss": 0.0727, - "step": 33540 - }, - { - "epoch": 0.93, - "learning_rate": 7.15773851993493e-07, - "loss": 0.0814, - "step": 33545 - }, - { - "epoch": 0.93, - "learning_rate": 7.143468706298696e-07, - "loss": 0.5167, - "step": 33550 - }, - { - "epoch": 0.93, - "learning_rate": 7.129198892662463e-07, - "loss": 0.1586, - "step": 33555 - }, - { - "epoch": 0.93, - "learning_rate": 7.114929079026229e-07, - "loss": 0.1507, - "step": 33560 - }, - { - "epoch": 0.93, - "learning_rate": 7.100659265389995e-07, - "loss": 0.0854, - "step": 33565 - }, - { - "epoch": 0.93, - "learning_rate": 7.086389451753762e-07, - "loss": 0.1534, - "step": 33570 - }, - { - "epoch": 0.93, - "learning_rate": 7.072119638117526e-07, - "loss": 0.0691, - "step": 33575 - }, - { - "epoch": 0.93, - "learning_rate": 7.057849824481293e-07, - "loss": 0.0863, - "step": 33580 - }, - { - "epoch": 0.93, - "learning_rate": 7.043580010845059e-07, - "loss": 0.216, - "step": 33585 - }, - { - "epoch": 0.93, - "learning_rate": 7.029310197208825e-07, - "loss": 0.2592, - "step": 33590 - }, - { - "epoch": 0.93, - "learning_rate": 7.015040383572591e-07, - "loss": 0.2099, - "step": 33595 - }, - { - "epoch": 0.93, - "learning_rate": 7.000770569936358e-07, - "loss": 0.4863, - "step": 33600 - }, - { - "epoch": 0.93, - "learning_rate": 6.986500756300122e-07, - "loss": 0.1039, - "step": 33605 - }, - { - "epoch": 0.93, - "learning_rate": 6.972230942663889e-07, - "loss": 0.1078, - "step": 33610 - }, - { - "epoch": 0.93, - "learning_rate": 6.957961129027655e-07, - "loss": 0.1677, - "step": 33615 - }, - { - "epoch": 0.93, - "learning_rate": 6.943691315391421e-07, - "loss": 0.1357, - "step": 33620 - }, - { - "epoch": 0.93, - "learning_rate": 6.929421501755188e-07, - "loss": 0.1395, - "step": 33625 - }, - { - "epoch": 0.93, - "learning_rate": 6.915151688118954e-07, - "loss": 0.0897, - "step": 33630 - }, - { - "epoch": 0.93, - "learning_rate": 6.900881874482721e-07, - "loss": 0.127, - "step": 33635 - }, - { - "epoch": 0.93, - "learning_rate": 6.886612060846486e-07, - "loss": 0.112, - "step": 33640 - }, - { - "epoch": 0.93, - "learning_rate": 6.872342247210252e-07, - "loss": 0.2524, - "step": 33645 - }, - { - "epoch": 0.93, - "learning_rate": 6.858072433574018e-07, - "loss": 0.3926, - "step": 33650 - }, - { - "epoch": 0.93, - "learning_rate": 6.843802619937784e-07, - "loss": 0.1851, - "step": 33655 - }, - { - "epoch": 0.93, - "learning_rate": 6.82953280630155e-07, - "loss": 0.1679, - "step": 33660 - }, - { - "epoch": 0.93, - "learning_rate": 6.815262992665317e-07, - "loss": 0.118, - "step": 33665 - }, - { - "epoch": 0.93, - "learning_rate": 6.800993179029082e-07, - "loss": 0.151, - "step": 33670 - }, - { - "epoch": 0.93, - "learning_rate": 6.786723365392849e-07, - "loss": 0.1039, - "step": 33675 - }, - { - "epoch": 0.93, - "learning_rate": 6.772453551756615e-07, - "loss": 0.0517, - "step": 33680 - }, - { - "epoch": 0.93, - "learning_rate": 6.75818373812038e-07, - "loss": 0.0684, - "step": 33685 - }, - { - "epoch": 0.93, - "learning_rate": 6.743913924484146e-07, - "loss": 0.2406, - "step": 33690 - }, - { - "epoch": 0.93, - "learning_rate": 6.729644110847913e-07, - "loss": 0.22, - "step": 33695 - }, - { - "epoch": 0.94, - "learning_rate": 6.715374297211679e-07, - "loss": 0.3595, - "step": 33700 - }, - { - "epoch": 0.94, - "learning_rate": 6.701104483575445e-07, - "loss": 0.0667, - "step": 33705 - }, - { - "epoch": 0.94, - "learning_rate": 6.686834669939212e-07, - "loss": 0.118, - "step": 33710 - }, - { - "epoch": 0.94, - "learning_rate": 6.672564856302976e-07, - "loss": 0.1186, - "step": 33715 - }, - { - "epoch": 0.94, - "learning_rate": 6.658295042666743e-07, - "loss": 0.2361, - "step": 33720 - }, - { - "epoch": 0.94, - "learning_rate": 6.644025229030509e-07, - "loss": 0.082, - "step": 33725 - }, - { - "epoch": 0.94, - "learning_rate": 6.629755415394276e-07, - "loss": 0.0234, - "step": 33730 - }, - { - "epoch": 0.94, - "learning_rate": 6.615485601758041e-07, - "loss": 0.2071, - "step": 33735 - }, - { - "epoch": 0.94, - "learning_rate": 6.601215788121808e-07, - "loss": 0.1544, - "step": 33740 - }, - { - "epoch": 0.94, - "learning_rate": 6.586945974485574e-07, - "loss": 0.2061, - "step": 33745 - }, - { - "epoch": 0.94, - "learning_rate": 6.57267616084934e-07, - "loss": 0.4038, - "step": 33750 - }, - { - "epoch": 0.94, - "learning_rate": 6.558406347213105e-07, - "loss": 0.1776, - "step": 33755 - }, - { - "epoch": 0.94, - "learning_rate": 6.544136533576872e-07, - "loss": 0.0942, - "step": 33760 - }, - { - "epoch": 0.94, - "learning_rate": 6.529866719940638e-07, - "loss": 0.1116, - "step": 33765 - }, - { - "epoch": 0.94, - "learning_rate": 6.515596906304404e-07, - "loss": 0.1359, - "step": 33770 - }, - { - "epoch": 0.94, - "learning_rate": 6.501327092668171e-07, - "loss": 0.2254, - "step": 33775 - }, - { - "epoch": 0.94, - "learning_rate": 6.487057279031936e-07, - "loss": 0.0678, - "step": 33780 - }, - { - "epoch": 0.94, - "learning_rate": 6.472787465395703e-07, - "loss": 0.1444, - "step": 33785 - }, - { - "epoch": 0.94, - "learning_rate": 6.458517651759469e-07, - "loss": 0.1639, - "step": 33790 - }, - { - "epoch": 0.94, - "learning_rate": 6.444247838123234e-07, - "loss": 0.2531, - "step": 33795 - }, - { - "epoch": 0.94, - "learning_rate": 6.429978024487e-07, - "loss": 0.3698, - "step": 33800 - }, - { - "epoch": 0.94, - "learning_rate": 6.415708210850767e-07, - "loss": 0.2081, - "step": 33805 - }, - { - "epoch": 0.94, - "learning_rate": 6.401438397214533e-07, - "loss": 0.1877, - "step": 33810 - }, - { - "epoch": 0.94, - "learning_rate": 6.387168583578299e-07, - "loss": 0.1325, - "step": 33815 - }, - { - "epoch": 0.94, - "learning_rate": 6.372898769942065e-07, - "loss": 0.1665, - "step": 33820 - }, - { - "epoch": 0.94, - "learning_rate": 6.358628956305832e-07, - "loss": 0.0933, - "step": 33825 - }, - { - "epoch": 0.94, - "learning_rate": 6.344359142669596e-07, - "loss": 0.1967, - "step": 33830 - }, - { - "epoch": 0.94, - "learning_rate": 6.330089329033363e-07, - "loss": 0.1324, - "step": 33835 - }, - { - "epoch": 0.94, - "learning_rate": 6.31581951539713e-07, - "loss": 0.2487, - "step": 33840 - }, - { - "epoch": 0.94, - "learning_rate": 6.301549701760895e-07, - "loss": 0.2832, - "step": 33845 - }, - { - "epoch": 0.94, - "learning_rate": 6.287279888124662e-07, - "loss": 0.2227, - "step": 33850 - }, - { - "epoch": 0.94, - "learning_rate": 6.273010074488428e-07, - "loss": 0.1731, - "step": 33855 - }, - { - "epoch": 0.94, - "learning_rate": 6.258740260852194e-07, - "loss": 0.1842, - "step": 33860 - }, - { - "epoch": 0.94, - "learning_rate": 6.24447044721596e-07, - "loss": 0.1187, - "step": 33865 - }, - { - "epoch": 0.94, - "learning_rate": 6.230200633579726e-07, - "loss": 0.1944, - "step": 33870 - }, - { - "epoch": 0.94, - "learning_rate": 6.215930819943492e-07, - "loss": 0.0547, - "step": 33875 - }, - { - "epoch": 0.94, - "learning_rate": 6.201661006307258e-07, - "loss": 0.162, - "step": 33880 - }, - { - "epoch": 0.94, - "learning_rate": 6.187391192671024e-07, - "loss": 0.1699, - "step": 33885 - }, - { - "epoch": 0.94, - "learning_rate": 6.17312137903479e-07, - "loss": 0.1574, - "step": 33890 - }, - { - "epoch": 0.94, - "learning_rate": 6.158851565398557e-07, - "loss": 0.3172, - "step": 33895 - }, - { - "epoch": 0.94, - "learning_rate": 6.144581751762323e-07, - "loss": 0.1541, - "step": 33900 - }, - { - "epoch": 0.94, - "learning_rate": 6.130311938126089e-07, - "loss": 0.1386, - "step": 33905 - }, - { - "epoch": 0.94, - "learning_rate": 6.116042124489854e-07, - "loss": 0.1226, - "step": 33910 - }, - { - "epoch": 0.94, - "learning_rate": 6.101772310853621e-07, - "loss": 0.1656, - "step": 33915 - }, - { - "epoch": 0.94, - "learning_rate": 6.087502497217387e-07, - "loss": 0.1377, - "step": 33920 - }, - { - "epoch": 0.94, - "learning_rate": 6.073232683581153e-07, - "loss": 0.1143, - "step": 33925 - }, - { - "epoch": 0.94, - "learning_rate": 6.058962869944919e-07, - "loss": 0.119, - "step": 33930 - }, - { - "epoch": 0.94, - "learning_rate": 6.044693056308685e-07, - "loss": 0.1434, - "step": 33935 - }, - { - "epoch": 0.94, - "learning_rate": 6.030423242672451e-07, - "loss": 0.199, - "step": 33940 - }, - { - "epoch": 0.94, - "learning_rate": 6.016153429036217e-07, - "loss": 0.2497, - "step": 33945 - }, - { - "epoch": 0.94, - "learning_rate": 6.001883615399983e-07, - "loss": 0.2519, - "step": 33950 - }, - { - "epoch": 0.94, - "learning_rate": 5.98761380176375e-07, - "loss": 0.0983, - "step": 33955 - }, - { - "epoch": 0.94, - "learning_rate": 5.973343988127515e-07, - "loss": 0.1828, - "step": 33960 - }, - { - "epoch": 0.94, - "learning_rate": 5.959074174491282e-07, - "loss": 0.1122, - "step": 33965 - }, - { - "epoch": 0.94, - "learning_rate": 5.944804360855048e-07, - "loss": 0.179, - "step": 33970 - }, - { - "epoch": 0.94, - "learning_rate": 5.930534547218814e-07, - "loss": 0.084, - "step": 33975 - }, - { - "epoch": 0.94, - "learning_rate": 5.916264733582581e-07, - "loss": 0.0931, - "step": 33980 - }, - { - "epoch": 0.94, - "learning_rate": 5.901994919946346e-07, - "loss": 0.035, - "step": 33985 - }, - { - "epoch": 0.94, - "learning_rate": 5.887725106310112e-07, - "loss": 0.2044, - "step": 33990 - }, - { - "epoch": 0.94, - "learning_rate": 5.873455292673878e-07, - "loss": 0.1952, - "step": 33995 - }, - { - "epoch": 0.94, - "learning_rate": 5.859185479037644e-07, - "loss": 0.372, - "step": 34000 - }, - { - "epoch": 0.94, - "eval_loss": 0.05467037484049797, - "eval_runtime": 1883.2508, - "eval_samples_per_second": 8.506, - "eval_steps_per_second": 2.127, - "eval_wer": 0.1568698160836639, - "step": 34000 - }, - { - "epoch": 0.94, - "learning_rate": 5.84491566540141e-07, - "loss": 0.1497, - "step": 34005 - }, - { - "epoch": 0.94, - "learning_rate": 5.830645851765177e-07, - "loss": 0.0938, - "step": 34010 - }, - { - "epoch": 0.94, - "learning_rate": 5.816376038128942e-07, - "loss": 0.1519, - "step": 34015 - }, - { - "epoch": 0.94, - "learning_rate": 5.802106224492709e-07, - "loss": 0.1306, - "step": 34020 - }, - { - "epoch": 0.94, - "learning_rate": 5.787836410856474e-07, - "loss": 0.1581, - "step": 34025 - }, - { - "epoch": 0.94, - "learning_rate": 5.773566597220241e-07, - "loss": 0.1854, - "step": 34030 - }, - { - "epoch": 0.94, - "learning_rate": 5.759296783584008e-07, - "loss": 0.1341, - "step": 34035 - }, - { - "epoch": 0.94, - "learning_rate": 5.745026969947773e-07, - "loss": 0.1319, - "step": 34040 - }, - { - "epoch": 0.94, - "learning_rate": 5.730757156311539e-07, - "loss": 0.112, - "step": 34045 - }, - { - "epoch": 0.94, - "learning_rate": 5.716487342675305e-07, - "loss": 0.4464, - "step": 34050 - }, - { - "epoch": 0.94, - "learning_rate": 5.702217529039071e-07, - "loss": 0.0791, - "step": 34055 - }, - { - "epoch": 0.95, - "learning_rate": 5.687947715402837e-07, - "loss": 0.1547, - "step": 34060 - }, - { - "epoch": 0.95, - "learning_rate": 5.673677901766604e-07, - "loss": 0.1451, - "step": 34065 - }, - { - "epoch": 0.95, - "learning_rate": 5.659408088130369e-07, - "loss": 0.1407, - "step": 34070 - }, - { - "epoch": 0.95, - "learning_rate": 5.645138274494136e-07, - "loss": 0.0622, - "step": 34075 - }, - { - "epoch": 0.95, - "learning_rate": 5.630868460857901e-07, - "loss": 0.0915, - "step": 34080 - }, - { - "epoch": 0.95, - "learning_rate": 5.616598647221668e-07, - "loss": 0.1956, - "step": 34085 - }, - { - "epoch": 0.95, - "learning_rate": 5.602328833585434e-07, - "loss": 0.2255, - "step": 34090 - }, - { - "epoch": 0.95, - "learning_rate": 5.5880590199492e-07, - "loss": 0.212, - "step": 34095 - }, - { - "epoch": 0.95, - "learning_rate": 5.573789206312967e-07, - "loss": 0.2122, - "step": 34100 - }, - { - "epoch": 0.95, - "learning_rate": 5.559519392676732e-07, - "loss": 0.1178, - "step": 34105 - }, - { - "epoch": 0.95, - "learning_rate": 5.545249579040498e-07, - "loss": 0.1361, - "step": 34110 - }, - { - "epoch": 0.95, - "learning_rate": 5.530979765404264e-07, - "loss": 0.2336, - "step": 34115 - }, - { - "epoch": 0.95, - "learning_rate": 5.516709951768031e-07, - "loss": 0.1697, - "step": 34120 - }, - { - "epoch": 0.95, - "learning_rate": 5.502440138131796e-07, - "loss": 0.1405, - "step": 34125 - }, - { - "epoch": 0.95, - "learning_rate": 5.488170324495563e-07, - "loss": 0.0917, - "step": 34130 - }, - { - "epoch": 0.95, - "learning_rate": 5.473900510859328e-07, - "loss": 0.0833, - "step": 34135 - }, - { - "epoch": 0.95, - "learning_rate": 5.459630697223095e-07, - "loss": 0.1232, - "step": 34140 - }, - { - "epoch": 0.95, - "learning_rate": 5.445360883586861e-07, - "loss": 0.1445, - "step": 34145 - }, - { - "epoch": 0.95, - "learning_rate": 5.431091069950627e-07, - "loss": 0.2142, - "step": 34150 - }, - { - "epoch": 0.95, - "learning_rate": 5.416821256314393e-07, - "loss": 0.2708, - "step": 34155 - }, - { - "epoch": 0.95, - "learning_rate": 5.402551442678159e-07, - "loss": 0.1244, - "step": 34160 - }, - { - "epoch": 0.95, - "learning_rate": 5.388281629041924e-07, - "loss": 0.1725, - "step": 34165 - }, - { - "epoch": 0.95, - "learning_rate": 5.374011815405691e-07, - "loss": 0.1629, - "step": 34170 - }, - { - "epoch": 0.95, - "learning_rate": 5.359742001769458e-07, - "loss": 0.1498, - "step": 34175 - }, - { - "epoch": 0.95, - "learning_rate": 5.345472188133224e-07, - "loss": 0.0467, - "step": 34180 - }, - { - "epoch": 0.95, - "learning_rate": 5.33120237449699e-07, - "loss": 0.1044, - "step": 34185 - }, - { - "epoch": 0.95, - "learning_rate": 5.316932560860755e-07, - "loss": 0.2158, - "step": 34190 - }, - { - "epoch": 0.95, - "learning_rate": 5.302662747224522e-07, - "loss": 0.1713, - "step": 34195 - }, - { - "epoch": 0.95, - "learning_rate": 5.288392933588288e-07, - "loss": 0.2982, - "step": 34200 - }, - { - "epoch": 0.95, - "learning_rate": 5.274123119952054e-07, - "loss": 0.0977, - "step": 34205 - }, - { - "epoch": 0.95, - "learning_rate": 5.25985330631582e-07, - "loss": 0.1338, - "step": 34210 - }, - { - "epoch": 0.95, - "learning_rate": 5.245583492679586e-07, - "loss": 0.1383, - "step": 34215 - }, - { - "epoch": 0.95, - "learning_rate": 5.231313679043352e-07, - "loss": 0.17, - "step": 34220 - }, - { - "epoch": 0.95, - "learning_rate": 5.217043865407118e-07, - "loss": 0.156, - "step": 34225 - }, - { - "epoch": 0.95, - "learning_rate": 5.202774051770884e-07, - "loss": 0.1594, - "step": 34230 - }, - { - "epoch": 0.95, - "learning_rate": 5.188504238134651e-07, - "loss": 0.2174, - "step": 34235 - }, - { - "epoch": 0.95, - "learning_rate": 5.174234424498417e-07, - "loss": 0.215, - "step": 34240 - }, - { - "epoch": 0.95, - "learning_rate": 5.159964610862182e-07, - "loss": 0.2561, - "step": 34245 - }, - { - "epoch": 0.95, - "learning_rate": 5.145694797225949e-07, - "loss": 0.3894, - "step": 34250 - }, - { - "epoch": 0.95, - "learning_rate": 5.131424983589715e-07, - "loss": 0.1347, - "step": 34255 - }, - { - "epoch": 0.95, - "learning_rate": 5.117155169953481e-07, - "loss": 0.0987, - "step": 34260 - }, - { - "epoch": 0.95, - "learning_rate": 5.102885356317247e-07, - "loss": 0.1218, - "step": 34265 - }, - { - "epoch": 0.95, - "learning_rate": 5.088615542681013e-07, - "loss": 0.2163, - "step": 34270 - }, - { - "epoch": 0.95, - "learning_rate": 5.074345729044779e-07, - "loss": 0.1458, - "step": 34275 - }, - { - "epoch": 0.95, - "learning_rate": 5.060075915408545e-07, - "loss": 0.0558, - "step": 34280 - }, - { - "epoch": 0.95, - "learning_rate": 5.045806101772311e-07, - "loss": 0.2161, - "step": 34285 - }, - { - "epoch": 0.95, - "learning_rate": 5.031536288136078e-07, - "loss": 0.3511, - "step": 34290 - }, - { - "epoch": 0.95, - "learning_rate": 5.017266474499843e-07, - "loss": 0.2886, - "step": 34295 - }, - { - "epoch": 0.95, - "learning_rate": 5.002996660863609e-07, - "loss": 0.2923, - "step": 34300 - }, - { - "epoch": 0.95, - "learning_rate": 4.988726847227375e-07, - "loss": 0.0922, - "step": 34305 - }, - { - "epoch": 0.95, - "learning_rate": 4.974457033591142e-07, - "loss": 0.1362, - "step": 34310 - }, - { - "epoch": 0.95, - "learning_rate": 4.960187219954909e-07, - "loss": 0.1991, - "step": 34315 - }, - { - "epoch": 0.95, - "learning_rate": 4.945917406318674e-07, - "loss": 0.1168, - "step": 34320 - }, - { - "epoch": 0.95, - "learning_rate": 4.93164759268244e-07, - "loss": 0.1358, - "step": 34325 - }, - { - "epoch": 0.95, - "learning_rate": 4.917377779046206e-07, - "loss": 0.2186, - "step": 34330 - }, - { - "epoch": 0.95, - "learning_rate": 4.903107965409972e-07, - "loss": 0.1316, - "step": 34335 - }, - { - "epoch": 0.95, - "learning_rate": 4.888838151773738e-07, - "loss": 0.1039, - "step": 34340 - }, - { - "epoch": 0.95, - "learning_rate": 4.874568338137505e-07, - "loss": 0.3293, - "step": 34345 - }, - { - "epoch": 0.95, - "learning_rate": 4.86029852450127e-07, - "loss": 0.4838, - "step": 34350 - }, - { - "epoch": 0.95, - "learning_rate": 4.846028710865037e-07, - "loss": 0.141, - "step": 34355 - }, - { - "epoch": 0.95, - "learning_rate": 4.831758897228802e-07, - "loss": 0.1439, - "step": 34360 - }, - { - "epoch": 0.95, - "learning_rate": 4.817489083592569e-07, - "loss": 0.1556, - "step": 34365 - }, - { - "epoch": 0.95, - "learning_rate": 4.803219269956335e-07, - "loss": 0.1648, - "step": 34370 - }, - { - "epoch": 0.95, - "learning_rate": 4.788949456320101e-07, - "loss": 0.2439, - "step": 34375 - }, - { - "epoch": 0.95, - "learning_rate": 4.774679642683867e-07, - "loss": 0.1302, - "step": 34380 - }, - { - "epoch": 0.95, - "learning_rate": 4.760409829047633e-07, - "loss": 0.112, - "step": 34385 - }, - { - "epoch": 0.95, - "learning_rate": 4.746140015411399e-07, - "loss": 0.0683, - "step": 34390 - }, - { - "epoch": 0.95, - "learning_rate": 4.7318702017751657e-07, - "loss": 0.1355, - "step": 34395 - }, - { - "epoch": 0.95, - "learning_rate": 4.717600388138931e-07, - "loss": 0.3024, - "step": 34400 - }, - { - "epoch": 0.95, - "learning_rate": 4.703330574502697e-07, - "loss": 0.1625, - "step": 34405 - }, - { - "epoch": 0.95, - "learning_rate": 4.689060760866464e-07, - "loss": 0.0693, - "step": 34410 - }, - { - "epoch": 0.95, - "learning_rate": 4.67479094723023e-07, - "loss": 0.1088, - "step": 34415 - }, - { - "epoch": 0.96, - "learning_rate": 4.6605211335939953e-07, - "loss": 0.1668, - "step": 34420 - }, - { - "epoch": 0.96, - "learning_rate": 4.646251319957762e-07, - "loss": 0.1632, - "step": 34425 - }, - { - "epoch": 0.96, - "learning_rate": 4.631981506321528e-07, - "loss": 0.0736, - "step": 34430 - }, - { - "epoch": 0.96, - "learning_rate": 4.6177116926852934e-07, - "loss": 0.0816, - "step": 34435 - }, - { - "epoch": 0.96, - "learning_rate": 4.60344187904906e-07, - "loss": 0.1986, - "step": 34440 - }, - { - "epoch": 0.96, - "learning_rate": 4.589172065412826e-07, - "loss": 0.2765, - "step": 34445 - }, - { - "epoch": 0.96, - "learning_rate": 4.5749022517765926e-07, - "loss": 0.2922, - "step": 34450 - }, - { - "epoch": 0.96, - "learning_rate": 4.560632438140358e-07, - "loss": 0.1496, - "step": 34455 - }, - { - "epoch": 0.96, - "learning_rate": 4.546362624504124e-07, - "loss": 0.1196, - "step": 34460 - }, - { - "epoch": 0.96, - "learning_rate": 4.5320928108678907e-07, - "loss": 0.1497, - "step": 34465 - }, - { - "epoch": 0.96, - "learning_rate": 4.5178229972316567e-07, - "loss": 0.1215, - "step": 34470 - }, - { - "epoch": 0.96, - "learning_rate": 4.503553183595422e-07, - "loss": 0.1484, - "step": 34475 - }, - { - "epoch": 0.96, - "learning_rate": 4.489283369959189e-07, - "loss": 0.0978, - "step": 34480 - }, - { - "epoch": 0.96, - "learning_rate": 4.475013556322955e-07, - "loss": 0.068, - "step": 34485 - }, - { - "epoch": 0.96, - "learning_rate": 4.4607437426867214e-07, - "loss": 0.07, - "step": 34490 - }, - { - "epoch": 0.96, - "learning_rate": 4.446473929050487e-07, - "loss": 0.2794, - "step": 34495 - }, - { - "epoch": 0.96, - "learning_rate": 4.432204115414253e-07, - "loss": 0.4696, - "step": 34500 - }, - { - "epoch": 0.96, - "learning_rate": 4.4179343017780195e-07, - "loss": 0.1744, - "step": 34505 - }, - { - "epoch": 0.96, - "learning_rate": 4.403664488141785e-07, - "loss": 0.1074, - "step": 34510 - }, - { - "epoch": 0.96, - "learning_rate": 4.389394674505551e-07, - "loss": 0.1396, - "step": 34515 - }, - { - "epoch": 0.96, - "learning_rate": 4.3751248608693176e-07, - "loss": 0.1238, - "step": 34520 - }, - { - "epoch": 0.96, - "learning_rate": 4.3608550472330836e-07, - "loss": 0.0882, - "step": 34525 - }, - { - "epoch": 0.96, - "learning_rate": 4.34658523359685e-07, - "loss": 0.0838, - "step": 34530 - }, - { - "epoch": 0.96, - "learning_rate": 4.3323154199606157e-07, - "loss": 0.143, - "step": 34535 - }, - { - "epoch": 0.96, - "learning_rate": 4.3180456063243817e-07, - "loss": 0.3865, - "step": 34540 - }, - { - "epoch": 0.96, - "learning_rate": 4.303775792688148e-07, - "loss": 0.1572, - "step": 34545 - }, - { - "epoch": 0.96, - "learning_rate": 4.289505979051914e-07, - "loss": 0.2699, - "step": 34550 - }, - { - "epoch": 0.96, - "learning_rate": 4.27523616541568e-07, - "loss": 0.1138, - "step": 34555 - }, - { - "epoch": 0.96, - "learning_rate": 4.2609663517794464e-07, - "loss": 0.1457, - "step": 34560 - }, - { - "epoch": 0.96, - "learning_rate": 4.246696538143212e-07, - "loss": 0.1412, - "step": 34565 - }, - { - "epoch": 0.96, - "learning_rate": 4.2324267245069784e-07, - "loss": 0.1349, - "step": 34570 - }, - { - "epoch": 0.96, - "learning_rate": 4.2181569108707445e-07, - "loss": 0.0811, - "step": 34575 - }, - { - "epoch": 0.96, - "learning_rate": 4.2038870972345105e-07, - "loss": 0.0344, - "step": 34580 - }, - { - "epoch": 0.96, - "learning_rate": 4.189617283598277e-07, - "loss": 0.1733, - "step": 34585 - }, - { - "epoch": 0.96, - "learning_rate": 4.1753474699620426e-07, - "loss": 0.1684, - "step": 34590 - }, - { - "epoch": 0.96, - "learning_rate": 4.1610776563258086e-07, - "loss": 0.3173, - "step": 34595 - }, - { - "epoch": 0.96, - "learning_rate": 4.146807842689575e-07, - "loss": 0.366, - "step": 34600 - }, - { - "epoch": 0.96, - "learning_rate": 4.1325380290533407e-07, - "loss": 0.2108, - "step": 34605 - }, - { - "epoch": 0.96, - "learning_rate": 4.118268215417107e-07, - "loss": 0.1436, - "step": 34610 - }, - { - "epoch": 0.96, - "learning_rate": 4.103998401780873e-07, - "loss": 0.1333, - "step": 34615 - }, - { - "epoch": 0.96, - "learning_rate": 4.089728588144639e-07, - "loss": 0.1779, - "step": 34620 - }, - { - "epoch": 0.96, - "learning_rate": 4.0754587745084053e-07, - "loss": 0.1584, - "step": 34625 - }, - { - "epoch": 0.96, - "learning_rate": 4.0611889608721713e-07, - "loss": 0.0484, - "step": 34630 - }, - { - "epoch": 0.96, - "learning_rate": 4.0469191472359374e-07, - "loss": 0.1154, - "step": 34635 - }, - { - "epoch": 0.96, - "learning_rate": 4.032649333599704e-07, - "loss": 0.1999, - "step": 34640 - }, - { - "epoch": 0.96, - "learning_rate": 4.0183795199634694e-07, - "loss": 0.1535, - "step": 34645 - }, - { - "epoch": 0.96, - "learning_rate": 4.0041097063272355e-07, - "loss": 0.4743, - "step": 34650 - }, - { - "epoch": 0.96, - "learning_rate": 3.989839892691002e-07, - "loss": 0.112, - "step": 34655 - }, - { - "epoch": 0.96, - "learning_rate": 3.9755700790547675e-07, - "loss": 0.1344, - "step": 34660 - }, - { - "epoch": 0.96, - "learning_rate": 3.961300265418534e-07, - "loss": 0.1642, - "step": 34665 - }, - { - "epoch": 0.96, - "learning_rate": 3.9470304517823e-07, - "loss": 0.1568, - "step": 34670 - }, - { - "epoch": 0.96, - "learning_rate": 3.9327606381460656e-07, - "loss": 0.0745, - "step": 34675 - }, - { - "epoch": 0.96, - "learning_rate": 3.918490824509832e-07, - "loss": 0.0574, - "step": 34680 - }, - { - "epoch": 0.96, - "learning_rate": 3.904221010873598e-07, - "loss": 0.1727, - "step": 34685 - }, - { - "epoch": 0.96, - "learning_rate": 3.8899511972373643e-07, - "loss": 0.195, - "step": 34690 - }, - { - "epoch": 0.96, - "learning_rate": 3.875681383601131e-07, - "loss": 0.1001, - "step": 34695 - }, - { - "epoch": 0.96, - "learning_rate": 3.8614115699648963e-07, - "loss": 0.2735, - "step": 34700 - }, - { - "epoch": 0.96, - "learning_rate": 3.847141756328663e-07, - "loss": 0.1598, - "step": 34705 - }, - { - "epoch": 0.96, - "learning_rate": 3.832871942692429e-07, - "loss": 0.1469, - "step": 34710 - }, - { - "epoch": 0.96, - "learning_rate": 3.8186021290561944e-07, - "loss": 0.0894, - "step": 34715 - }, - { - "epoch": 0.96, - "learning_rate": 3.804332315419961e-07, - "loss": 0.1188, - "step": 34720 - }, - { - "epoch": 0.96, - "learning_rate": 3.790062501783727e-07, - "loss": 0.0872, - "step": 34725 - }, - { - "epoch": 0.96, - "learning_rate": 3.7757926881474925e-07, - "loss": 0.07, - "step": 34730 - }, - { - "epoch": 0.96, - "learning_rate": 3.761522874511259e-07, - "loss": 0.0319, - "step": 34735 - }, - { - "epoch": 0.96, - "learning_rate": 3.747253060875025e-07, - "loss": 0.1835, - "step": 34740 - }, - { - "epoch": 0.96, - "learning_rate": 3.7329832472387917e-07, - "loss": 0.2409, - "step": 34745 - }, - { - "epoch": 0.96, - "learning_rate": 3.718713433602558e-07, - "loss": 0.4132, - "step": 34750 - }, - { - "epoch": 0.96, - "learning_rate": 3.704443619966323e-07, - "loss": 0.0954, - "step": 34755 - }, - { - "epoch": 0.96, - "learning_rate": 3.69017380633009e-07, - "loss": 0.1412, - "step": 34760 - }, - { - "epoch": 0.96, - "learning_rate": 3.675903992693856e-07, - "loss": 0.121, - "step": 34765 - }, - { - "epoch": 0.96, - "learning_rate": 3.6616341790576213e-07, - "loss": 0.1002, - "step": 34770 - }, - { - "epoch": 0.96, - "learning_rate": 3.647364365421388e-07, - "loss": 0.1016, - "step": 34775 - }, - { - "epoch": 0.97, - "learning_rate": 3.633094551785154e-07, - "loss": 0.0578, - "step": 34780 - }, - { - "epoch": 0.97, - "learning_rate": 3.6188247381489205e-07, - "loss": 0.1585, - "step": 34785 - }, - { - "epoch": 0.97, - "learning_rate": 3.604554924512686e-07, - "loss": 0.1897, - "step": 34790 - }, - { - "epoch": 0.97, - "learning_rate": 3.590285110876452e-07, - "loss": 0.1645, - "step": 34795 - }, - { - "epoch": 0.97, - "learning_rate": 3.5760152972402186e-07, - "loss": 0.2441, - "step": 34800 - }, - { - "epoch": 0.97, - "learning_rate": 3.5617454836039846e-07, - "loss": 0.1414, - "step": 34805 - }, - { - "epoch": 0.97, - "learning_rate": 3.54747566996775e-07, - "loss": 0.1433, - "step": 34810 - }, - { - "epoch": 0.97, - "learning_rate": 3.5332058563315167e-07, - "loss": 0.1351, - "step": 34815 - }, - { - "epoch": 0.97, - "learning_rate": 3.5189360426952827e-07, - "loss": 0.1397, - "step": 34820 - }, - { - "epoch": 0.97, - "learning_rate": 3.504666229059048e-07, - "loss": 0.125, - "step": 34825 - }, - { - "epoch": 0.97, - "learning_rate": 3.490396415422815e-07, - "loss": 0.0434, - "step": 34830 - }, - { - "epoch": 0.97, - "learning_rate": 3.476126601786581e-07, - "loss": 0.082, - "step": 34835 - }, - { - "epoch": 0.97, - "learning_rate": 3.4618567881503474e-07, - "loss": 0.1364, - "step": 34840 - }, - { - "epoch": 0.97, - "learning_rate": 3.447586974514113e-07, - "loss": 0.2254, - "step": 34845 - }, - { - "epoch": 0.97, - "learning_rate": 3.433317160877879e-07, - "loss": 0.3636, - "step": 34850 - }, - { - "epoch": 0.97, - "learning_rate": 3.4190473472416455e-07, - "loss": 0.1336, - "step": 34855 - }, - { - "epoch": 0.97, - "learning_rate": 3.4047775336054115e-07, - "loss": 0.1011, - "step": 34860 - }, - { - "epoch": 0.97, - "learning_rate": 3.390507719969177e-07, - "loss": 0.1526, - "step": 34865 - }, - { - "epoch": 0.97, - "learning_rate": 3.3762379063329436e-07, - "loss": 0.1421, - "step": 34870 - }, - { - "epoch": 0.97, - "learning_rate": 3.3619680926967096e-07, - "loss": 0.1655, - "step": 34875 - }, - { - "epoch": 0.97, - "learning_rate": 3.347698279060476e-07, - "loss": 0.0904, - "step": 34880 - }, - { - "epoch": 0.97, - "learning_rate": 3.3334284654242417e-07, - "loss": 0.1185, - "step": 34885 - }, - { - "epoch": 0.97, - "learning_rate": 3.3191586517880077e-07, - "loss": 0.5719, - "step": 34890 - }, - { - "epoch": 0.97, - "learning_rate": 3.3048888381517743e-07, - "loss": 0.2122, - "step": 34895 - }, - { - "epoch": 0.97, - "learning_rate": 3.29061902451554e-07, - "loss": 0.2588, - "step": 34900 - }, - { - "epoch": 0.97, - "learning_rate": 3.276349210879306e-07, - "loss": 0.0989, - "step": 34905 - }, - { - "epoch": 0.97, - "learning_rate": 3.2620793972430724e-07, - "loss": 0.1128, - "step": 34910 - }, - { - "epoch": 0.97, - "learning_rate": 3.2478095836068384e-07, - "loss": 0.194, - "step": 34915 - }, - { - "epoch": 0.97, - "learning_rate": 3.233539769970605e-07, - "loss": 0.1925, - "step": 34920 - }, - { - "epoch": 0.97, - "learning_rate": 3.2192699563343705e-07, - "loss": 0.0354, - "step": 34925 - }, - { - "epoch": 0.97, - "learning_rate": 3.2050001426981365e-07, - "loss": 0.1624, - "step": 34930 - }, - { - "epoch": 0.97, - "learning_rate": 3.190730329061903e-07, - "loss": 0.1294, - "step": 34935 - }, - { - "epoch": 0.97, - "learning_rate": 3.1764605154256686e-07, - "loss": 0.0661, - "step": 34940 - }, - { - "epoch": 0.97, - "learning_rate": 3.1621907017894346e-07, - "loss": 0.2772, - "step": 34945 - }, - { - "epoch": 0.97, - "learning_rate": 3.147920888153201e-07, - "loss": 0.4215, - "step": 34950 - }, - { - "epoch": 0.97, - "learning_rate": 3.133651074516967e-07, - "loss": 0.0999, - "step": 34955 - }, - { - "epoch": 0.97, - "learning_rate": 3.119381260880733e-07, - "loss": 0.1122, - "step": 34960 - }, - { - "epoch": 0.97, - "learning_rate": 3.1051114472444993e-07, - "loss": 0.1662, - "step": 34965 - }, - { - "epoch": 0.97, - "learning_rate": 3.0908416336082653e-07, - "loss": 0.1567, - "step": 34970 - }, - { - "epoch": 0.97, - "learning_rate": 3.0765718199720314e-07, - "loss": 0.0603, - "step": 34975 - }, - { - "epoch": 0.97, - "learning_rate": 3.0623020063357974e-07, - "loss": 0.1126, - "step": 34980 - }, - { - "epoch": 0.97, - "learning_rate": 3.0480321926995634e-07, - "loss": 0.1242, - "step": 34985 - }, - { - "epoch": 0.97, - "learning_rate": 3.03376237906333e-07, - "loss": 0.2789, - "step": 34990 - }, - { - "epoch": 0.97, - "learning_rate": 3.0194925654270955e-07, - "loss": 0.2336, - "step": 34995 - }, - { - "epoch": 0.97, - "learning_rate": 3.005222751790862e-07, - "loss": 0.292, - "step": 35000 - }, - { - "epoch": 0.97, - "learning_rate": 2.990952938154628e-07, - "loss": 0.0991, - "step": 35005 - }, - { - "epoch": 0.97, - "learning_rate": 2.976683124518394e-07, - "loss": 0.0919, - "step": 35010 - }, - { - "epoch": 0.97, - "learning_rate": 2.96241331088216e-07, - "loss": 0.1113, - "step": 35015 - }, - { - "epoch": 0.97, - "learning_rate": 2.948143497245926e-07, - "loss": 0.2276, - "step": 35020 - }, - { - "epoch": 0.97, - "learning_rate": 2.933873683609692e-07, - "loss": 0.1697, - "step": 35025 - }, - { - "epoch": 0.97, - "learning_rate": 2.919603869973458e-07, - "loss": 0.1605, - "step": 35030 - }, - { - "epoch": 0.97, - "learning_rate": 2.9053340563372243e-07, - "loss": 0.0764, - "step": 35035 - }, - { - "epoch": 0.97, - "learning_rate": 2.8910642427009903e-07, - "loss": 0.1852, - "step": 35040 - }, - { - "epoch": 0.97, - "learning_rate": 2.876794429064757e-07, - "loss": 0.0919, - "step": 35045 - }, - { - "epoch": 0.97, - "learning_rate": 2.8625246154285224e-07, - "loss": 0.2574, - "step": 35050 - }, - { - "epoch": 0.97, - "learning_rate": 2.848254801792289e-07, - "loss": 0.0825, - "step": 35055 - }, - { - "epoch": 0.97, - "learning_rate": 2.833984988156055e-07, - "loss": 0.1501, - "step": 35060 - }, - { - "epoch": 0.97, - "learning_rate": 2.819715174519821e-07, - "loss": 0.1756, - "step": 35065 - }, - { - "epoch": 0.97, - "learning_rate": 2.805445360883587e-07, - "loss": 0.1294, - "step": 35070 - }, - { - "epoch": 0.97, - "learning_rate": 2.791175547247353e-07, - "loss": 0.0994, - "step": 35075 - }, - { - "epoch": 0.97, - "learning_rate": 2.776905733611119e-07, - "loss": 0.0486, - "step": 35080 - }, - { - "epoch": 0.97, - "learning_rate": 2.7626359199748857e-07, - "loss": 0.0461, - "step": 35085 - }, - { - "epoch": 0.97, - "learning_rate": 2.748366106338651e-07, - "loss": 0.128, - "step": 35090 - }, - { - "epoch": 0.97, - "learning_rate": 2.734096292702418e-07, - "loss": 0.1552, - "step": 35095 - }, - { - "epoch": 0.97, - "learning_rate": 2.719826479066184e-07, - "loss": 0.3513, - "step": 35100 - }, - { - "epoch": 0.97, - "learning_rate": 2.70555666542995e-07, - "loss": 0.1427, - "step": 35105 - }, - { - "epoch": 0.97, - "learning_rate": 2.691286851793716e-07, - "loss": 0.185, - "step": 35110 - }, - { - "epoch": 0.97, - "learning_rate": 2.679871000884729e-07, - "loss": 0.8986, - "step": 35115 - }, - { - "epoch": 0.97, - "learning_rate": 2.665601187248495e-07, - "loss": 0.1575, - "step": 35120 - }, - { - "epoch": 0.97, - "learning_rate": 2.651331373612261e-07, - "loss": 0.1109, - "step": 35125 - }, - { - "epoch": 0.97, - "learning_rate": 2.637061559976027e-07, - "loss": 0.1015, - "step": 35130 - }, - { - "epoch": 0.97, - "learning_rate": 2.622791746339793e-07, - "loss": 0.1472, - "step": 35135 - }, - { - "epoch": 0.98, - "learning_rate": 2.608521932703559e-07, - "loss": 0.1659, - "step": 35140 - }, - { - "epoch": 0.98, - "learning_rate": 2.5942521190673255e-07, - "loss": 0.2268, - "step": 35145 - }, - { - "epoch": 0.98, - "learning_rate": 2.579982305431091e-07, - "loss": 0.7038, - "step": 35150 - }, - { - "epoch": 0.98, - "learning_rate": 2.5657124917948576e-07, - "loss": 0.1293, - "step": 35155 - }, - { - "epoch": 0.98, - "learning_rate": 2.5514426781586236e-07, - "loss": 0.1241, - "step": 35160 - }, - { - "epoch": 0.98, - "learning_rate": 2.5371728645223896e-07, - "loss": 0.1475, - "step": 35165 - }, - { - "epoch": 0.98, - "learning_rate": 2.5229030508861557e-07, - "loss": 0.1089, - "step": 35170 - }, - { - "epoch": 0.98, - "learning_rate": 2.5086332372499217e-07, - "loss": 0.0438, - "step": 35175 - }, - { - "epoch": 0.98, - "learning_rate": 2.494363423613688e-07, - "loss": 0.0869, - "step": 35180 - }, - { - "epoch": 0.98, - "learning_rate": 2.4800936099774543e-07, - "loss": 0.1248, - "step": 35185 - }, - { - "epoch": 0.98, - "learning_rate": 2.46582379634122e-07, - "loss": 0.088, - "step": 35190 - }, - { - "epoch": 0.98, - "learning_rate": 2.451553982704986e-07, - "loss": 0.1219, - "step": 35195 - }, - { - "epoch": 0.98, - "learning_rate": 2.4372841690687524e-07, - "loss": 0.5478, - "step": 35200 - }, - { - "epoch": 0.98, - "learning_rate": 2.4230143554325184e-07, - "loss": 0.1223, - "step": 35205 - }, - { - "epoch": 0.98, - "learning_rate": 2.4087445417962845e-07, - "loss": 0.1074, - "step": 35210 - }, - { - "epoch": 0.98, - "learning_rate": 2.3944747281600505e-07, - "loss": 0.1491, - "step": 35215 - }, - { - "epoch": 0.98, - "learning_rate": 2.3802049145238165e-07, - "loss": 0.1427, - "step": 35220 - }, - { - "epoch": 0.98, - "learning_rate": 2.3659351008875828e-07, - "loss": 0.0811, - "step": 35225 - }, - { - "epoch": 0.98, - "learning_rate": 2.3516652872513486e-07, - "loss": 0.0861, - "step": 35230 - }, - { - "epoch": 0.98, - "learning_rate": 2.337395473615115e-07, - "loss": 0.22, - "step": 35235 - }, - { - "epoch": 0.98, - "learning_rate": 2.323125659978881e-07, - "loss": 0.1128, - "step": 35240 - }, - { - "epoch": 0.98, - "learning_rate": 2.3088558463426467e-07, - "loss": 0.2804, - "step": 35245 - }, - { - "epoch": 0.98, - "learning_rate": 2.294586032706413e-07, - "loss": 0.6717, - "step": 35250 - }, - { - "epoch": 0.98, - "learning_rate": 2.280316219070179e-07, - "loss": 0.0846, - "step": 35255 - }, - { - "epoch": 0.98, - "learning_rate": 2.2660464054339453e-07, - "loss": 0.1158, - "step": 35260 - }, - { - "epoch": 0.98, - "learning_rate": 2.251776591797711e-07, - "loss": 0.1617, - "step": 35265 - }, - { - "epoch": 0.98, - "learning_rate": 2.2375067781614774e-07, - "loss": 0.1591, - "step": 35270 - }, - { - "epoch": 0.98, - "learning_rate": 2.2232369645252434e-07, - "loss": 0.0976, - "step": 35275 - }, - { - "epoch": 0.98, - "learning_rate": 2.2089671508890097e-07, - "loss": 0.1654, - "step": 35280 - }, - { - "epoch": 0.98, - "learning_rate": 2.1946973372527755e-07, - "loss": 0.0895, - "step": 35285 - }, - { - "epoch": 0.98, - "learning_rate": 2.1804275236165418e-07, - "loss": 0.1478, - "step": 35290 - }, - { - "epoch": 0.98, - "learning_rate": 2.1661577099803078e-07, - "loss": 0.4118, - "step": 35295 - }, - { - "epoch": 0.98, - "learning_rate": 2.151887896344074e-07, - "loss": 0.487, - "step": 35300 - }, - { - "epoch": 0.98, - "learning_rate": 2.13761808270784e-07, - "loss": 0.0738, - "step": 35305 - }, - { - "epoch": 0.98, - "learning_rate": 2.123348269071606e-07, - "loss": 0.1111, - "step": 35310 - }, - { - "epoch": 0.98, - "learning_rate": 2.1090784554353722e-07, - "loss": 0.1431, - "step": 35315 - }, - { - "epoch": 0.98, - "learning_rate": 2.0948086417991385e-07, - "loss": 0.1239, - "step": 35320 - }, - { - "epoch": 0.98, - "learning_rate": 2.0805388281629043e-07, - "loss": 0.1123, - "step": 35325 - }, - { - "epoch": 0.98, - "learning_rate": 2.0662690145266703e-07, - "loss": 0.3435, - "step": 35330 - }, - { - "epoch": 0.98, - "learning_rate": 2.0519992008904366e-07, - "loss": 0.1787, - "step": 35335 - }, - { - "epoch": 0.98, - "learning_rate": 2.0377293872542027e-07, - "loss": 0.1007, - "step": 35340 - }, - { - "epoch": 0.98, - "learning_rate": 2.0234595736179687e-07, - "loss": 0.1983, - "step": 35345 - }, - { - "epoch": 0.98, - "learning_rate": 2.0091897599817347e-07, - "loss": 0.3054, - "step": 35350 - }, - { - "epoch": 0.98, - "learning_rate": 1.994919946345501e-07, - "loss": 0.0983, - "step": 35355 - }, - { - "epoch": 0.98, - "learning_rate": 1.980650132709267e-07, - "loss": 0.1992, - "step": 35360 - }, - { - "epoch": 0.98, - "learning_rate": 1.9663803190730328e-07, - "loss": 0.1044, - "step": 35365 - }, - { - "epoch": 0.98, - "learning_rate": 1.952110505436799e-07, - "loss": 0.1358, - "step": 35370 - }, - { - "epoch": 0.98, - "learning_rate": 1.9378406918005654e-07, - "loss": 0.1224, - "step": 35375 - }, - { - "epoch": 0.98, - "learning_rate": 1.9235708781643315e-07, - "loss": 0.2086, - "step": 35380 - }, - { - "epoch": 0.98, - "learning_rate": 1.9093010645280972e-07, - "loss": 0.08, - "step": 35385 - }, - { - "epoch": 0.98, - "learning_rate": 1.8950312508918635e-07, - "loss": 0.1485, - "step": 35390 - }, - { - "epoch": 0.98, - "learning_rate": 1.8807614372556296e-07, - "loss": 0.3554, - "step": 35395 - }, - { - "epoch": 0.98, - "learning_rate": 1.8664916236193959e-07, - "loss": 0.4487, - "step": 35400 - }, - { - "epoch": 0.98, - "learning_rate": 1.8522218099831616e-07, - "loss": 0.1093, - "step": 35405 - }, - { - "epoch": 0.98, - "learning_rate": 1.837951996346928e-07, - "loss": 0.1351, - "step": 35410 - }, - { - "epoch": 0.98, - "learning_rate": 1.823682182710694e-07, - "loss": 0.1125, - "step": 35415 - }, - { - "epoch": 0.98, - "learning_rate": 1.8094123690744602e-07, - "loss": 0.1658, - "step": 35420 - }, - { - "epoch": 0.98, - "learning_rate": 1.795142555438226e-07, - "loss": 0.1496, - "step": 35425 - }, - { - "epoch": 0.98, - "learning_rate": 1.7808727418019923e-07, - "loss": 0.1278, - "step": 35430 - }, - { - "epoch": 0.98, - "learning_rate": 1.7666029281657583e-07, - "loss": 0.1258, - "step": 35435 - }, - { - "epoch": 0.98, - "learning_rate": 1.752333114529524e-07, - "loss": 0.1438, - "step": 35440 - }, - { - "epoch": 0.98, - "learning_rate": 1.7380633008932904e-07, - "loss": 0.2054, - "step": 35445 - }, - { - "epoch": 0.98, - "learning_rate": 1.7237934872570564e-07, - "loss": 0.4075, - "step": 35450 - }, - { - "epoch": 0.98, - "learning_rate": 1.7095236736208227e-07, - "loss": 0.1032, - "step": 35455 - }, - { - "epoch": 0.98, - "learning_rate": 1.6952538599845885e-07, - "loss": 0.1323, - "step": 35460 - }, - { - "epoch": 0.98, - "learning_rate": 1.6809840463483548e-07, - "loss": 0.1425, - "step": 35465 - }, - { - "epoch": 0.98, - "learning_rate": 1.6667142327121208e-07, - "loss": 0.1637, - "step": 35470 - }, - { - "epoch": 0.98, - "learning_rate": 1.6524444190758871e-07, - "loss": 0.0934, - "step": 35475 - }, - { - "epoch": 0.98, - "learning_rate": 1.638174605439653e-07, - "loss": 0.1711, - "step": 35480 - }, - { - "epoch": 0.98, - "learning_rate": 1.6239047918034192e-07, - "loss": 0.0627, - "step": 35485 - }, - { - "epoch": 0.98, - "learning_rate": 1.6096349781671852e-07, - "loss": 0.1645, - "step": 35490 - }, - { - "epoch": 0.98, - "learning_rate": 1.5953651645309515e-07, - "loss": 0.2765, - "step": 35495 - }, - { - "epoch": 0.99, - "learning_rate": 1.5810953508947173e-07, - "loss": 0.3501, - "step": 35500 - }, - { - "epoch": 0.99, - "learning_rate": 1.5668255372584836e-07, - "loss": 0.209, - "step": 35505 - }, - { - "epoch": 0.99, - "learning_rate": 1.5525557236222496e-07, - "loss": 0.1304, - "step": 35510 - }, - { - "epoch": 0.99, - "learning_rate": 1.5382859099860157e-07, - "loss": 0.1425, - "step": 35515 - }, - { - "epoch": 0.99, - "learning_rate": 1.5240160963497817e-07, - "loss": 0.204, - "step": 35520 - }, - { - "epoch": 0.99, - "learning_rate": 1.5097462827135477e-07, - "loss": 0.1164, - "step": 35525 - }, - { - "epoch": 0.99, - "learning_rate": 1.495476469077314e-07, - "loss": 0.1311, - "step": 35530 - }, - { - "epoch": 0.99, - "learning_rate": 1.48120665544108e-07, - "loss": 0.0595, - "step": 35535 - }, - { - "epoch": 0.99, - "learning_rate": 1.466936841804846e-07, - "loss": 0.1267, - "step": 35540 - }, - { - "epoch": 0.99, - "learning_rate": 1.4526670281686121e-07, - "loss": 0.1321, - "step": 35545 - }, - { - "epoch": 0.99, - "learning_rate": 1.4383972145323784e-07, - "loss": 0.3876, - "step": 35550 - }, - { - "epoch": 0.99, - "learning_rate": 1.4241274008961445e-07, - "loss": 0.1327, - "step": 35555 - }, - { - "epoch": 0.99, - "learning_rate": 1.4098575872599105e-07, - "loss": 0.0863, - "step": 35560 - }, - { - "epoch": 0.99, - "learning_rate": 1.3955877736236765e-07, - "loss": 0.1759, - "step": 35565 - }, - { - "epoch": 0.99, - "learning_rate": 1.3813179599874428e-07, - "loss": 0.136, - "step": 35570 - }, - { - "epoch": 0.99, - "learning_rate": 1.367048146351209e-07, - "loss": 0.1388, - "step": 35575 - }, - { - "epoch": 0.99, - "learning_rate": 1.352778332714975e-07, - "loss": 0.0729, - "step": 35580 - }, - { - "epoch": 0.99, - "learning_rate": 1.338508519078741e-07, - "loss": 0.1155, - "step": 35585 - }, - { - "epoch": 0.99, - "learning_rate": 1.324238705442507e-07, - "loss": 0.1004, - "step": 35590 - }, - { - "epoch": 0.99, - "learning_rate": 1.309968891806273e-07, - "loss": 0.1075, - "step": 35595 - }, - { - "epoch": 0.99, - "learning_rate": 1.2956990781700393e-07, - "loss": 0.1885, - "step": 35600 - }, - { - "epoch": 0.99, - "learning_rate": 1.2814292645338053e-07, - "loss": 0.1211, - "step": 35605 - }, - { - "epoch": 0.99, - "learning_rate": 1.2671594508975714e-07, - "loss": 0.1307, - "step": 35610 - }, - { - "epoch": 0.99, - "learning_rate": 1.2528896372613374e-07, - "loss": 0.1678, - "step": 35615 - }, - { - "epoch": 0.99, - "learning_rate": 1.2386198236251037e-07, - "loss": 0.1706, - "step": 35620 - }, - { - "epoch": 0.99, - "learning_rate": 1.2243500099888697e-07, - "loss": 0.0801, - "step": 35625 - }, - { - "epoch": 0.99, - "learning_rate": 1.2100801963526358e-07, - "loss": 0.105, - "step": 35630 - }, - { - "epoch": 0.99, - "learning_rate": 1.1958103827164018e-07, - "loss": 0.0717, - "step": 35635 - }, - { - "epoch": 0.99, - "learning_rate": 1.1815405690801678e-07, - "loss": 0.3152, - "step": 35640 - }, - { - "epoch": 0.99, - "learning_rate": 1.167270755443934e-07, - "loss": 0.2692, - "step": 35645 - }, - { - "epoch": 0.99, - "learning_rate": 1.1530009418077e-07, - "loss": 0.5868, - "step": 35650 - }, - { - "epoch": 0.99, - "learning_rate": 1.1387311281714662e-07, - "loss": 0.0953, - "step": 35655 - }, - { - "epoch": 0.99, - "learning_rate": 1.1244613145352322e-07, - "loss": 0.1201, - "step": 35660 - }, - { - "epoch": 0.99, - "learning_rate": 1.1101915008989984e-07, - "loss": 0.2317, - "step": 35665 - }, - { - "epoch": 0.99, - "learning_rate": 1.0959216872627644e-07, - "loss": 0.1824, - "step": 35670 - }, - { - "epoch": 0.99, - "learning_rate": 1.0816518736265306e-07, - "loss": 0.0918, - "step": 35675 - }, - { - "epoch": 0.99, - "learning_rate": 1.0673820599902965e-07, - "loss": 0.0509, - "step": 35680 - }, - { - "epoch": 0.99, - "learning_rate": 1.0531122463540627e-07, - "loss": 0.2317, - "step": 35685 - }, - { - "epoch": 0.99, - "learning_rate": 1.0388424327178287e-07, - "loss": 0.0458, - "step": 35690 - }, - { - "epoch": 0.99, - "learning_rate": 1.0245726190815949e-07, - "loss": 0.0866, - "step": 35695 - }, - { - "epoch": 0.99, - "learning_rate": 1.0103028054453609e-07, - "loss": 0.342, - "step": 35700 - }, - { - "epoch": 0.99, - "learning_rate": 9.96032991809127e-08, - "loss": 0.1037, - "step": 35705 - }, - { - "epoch": 0.99, - "learning_rate": 9.817631781728931e-08, - "loss": 0.1197, - "step": 35710 - }, - { - "epoch": 0.99, - "learning_rate": 9.674933645366593e-08, - "loss": 0.1261, - "step": 35715 - }, - { - "epoch": 0.99, - "learning_rate": 9.532235509004253e-08, - "loss": 0.13, - "step": 35720 - }, - { - "epoch": 0.99, - "learning_rate": 9.389537372641915e-08, - "loss": 0.1034, - "step": 35725 - }, - { - "epoch": 0.99, - "learning_rate": 9.246839236279575e-08, - "loss": 0.0929, - "step": 35730 - }, - { - "epoch": 0.99, - "learning_rate": 9.104141099917237e-08, - "loss": 0.084, - "step": 35735 - }, - { - "epoch": 0.99, - "learning_rate": 8.961442963554897e-08, - "loss": 0.1509, - "step": 35740 - }, - { - "epoch": 0.99, - "learning_rate": 8.818744827192559e-08, - "loss": 0.1683, - "step": 35745 - }, - { - "epoch": 0.99, - "learning_rate": 8.676046690830218e-08, - "loss": 0.2674, - "step": 35750 - }, - { - "epoch": 0.99, - "learning_rate": 8.53334855446788e-08, - "loss": 0.1209, - "step": 35755 - }, - { - "epoch": 0.99, - "learning_rate": 8.39065041810554e-08, - "loss": 0.1556, - "step": 35760 - }, - { - "epoch": 0.99, - "learning_rate": 8.247952281743201e-08, - "loss": 0.1462, - "step": 35765 - }, - { - "epoch": 0.99, - "learning_rate": 8.105254145380862e-08, - "loss": 0.1477, - "step": 35770 - }, - { - "epoch": 0.99, - "learning_rate": 7.962556009018523e-08, - "loss": 0.0594, - "step": 35775 - }, - { - "epoch": 0.99, - "learning_rate": 7.819857872656184e-08, - "loss": 0.1337, - "step": 35780 - }, - { - "epoch": 0.99, - "learning_rate": 7.677159736293844e-08, - "loss": 0.1388, - "step": 35785 - }, - { - "epoch": 0.99, - "learning_rate": 7.534461599931506e-08, - "loss": 0.1755, - "step": 35790 - }, - { - "epoch": 0.99, - "learning_rate": 7.391763463569166e-08, - "loss": 0.3601, - "step": 35795 - }, - { - "epoch": 0.99, - "learning_rate": 7.249065327206828e-08, - "loss": 0.249, - "step": 35800 - }, - { - "epoch": 0.99, - "learning_rate": 7.106367190844488e-08, - "loss": 0.162, - "step": 35805 - }, - { - "epoch": 0.99, - "learning_rate": 6.96366905448215e-08, - "loss": 0.1262, - "step": 35810 - }, - { - "epoch": 0.99, - "learning_rate": 6.82097091811981e-08, - "loss": 0.1319, - "step": 35815 - }, - { - "epoch": 0.99, - "learning_rate": 6.67827278175747e-08, - "loss": 0.1157, - "step": 35820 - }, - { - "epoch": 0.99, - "learning_rate": 6.535574645395132e-08, - "loss": 0.1637, - "step": 35825 - }, - { - "epoch": 0.99, - "learning_rate": 6.392876509032792e-08, - "loss": 0.0901, - "step": 35830 - }, - { - "epoch": 0.99, - "learning_rate": 6.250178372670454e-08, - "loss": 0.0832, - "step": 35835 - }, - { - "epoch": 0.99, - "learning_rate": 6.107480236308114e-08, - "loss": 0.244, - "step": 35840 - }, - { - "epoch": 0.99, - "learning_rate": 5.964782099945776e-08, - "loss": 0.2451, - "step": 35845 - }, - { - "epoch": 0.99, - "learning_rate": 5.822083963583436e-08, - "loss": 0.4593, - "step": 35850 - }, - { - "epoch": 0.99, - "learning_rate": 5.679385827221097e-08, - "loss": 0.1072, - "step": 35855 - }, - { - "epoch": 1.0, - "learning_rate": 5.536687690858758e-08, - "loss": 0.1056, - "step": 35860 - }, - { - "epoch": 1.0, - "learning_rate": 5.393989554496419e-08, - "loss": 0.1076, - "step": 35865 - }, - { - "epoch": 1.0, - "learning_rate": 5.25129141813408e-08, - "loss": 0.1398, - "step": 35870 - }, - { - "epoch": 1.0, - "learning_rate": 5.1085932817717405e-08, - "loss": 0.1973, - "step": 35875 - }, - { - "epoch": 1.0, - "learning_rate": 4.9658951454094015e-08, - "loss": 0.0593, - "step": 35880 - }, - { - "epoch": 1.0, - "learning_rate": 4.8231970090470625e-08, - "loss": 0.1092, - "step": 35885 - }, - { - "epoch": 1.0, - "learning_rate": 4.6804988726847235e-08, - "loss": 0.0982, - "step": 35890 - }, - { - "epoch": 1.0, - "learning_rate": 4.5378007363223845e-08, - "loss": 0.3747, - "step": 35895 - }, - { - "epoch": 1.0, - "learning_rate": 4.3951025999600455e-08, - "loss": 0.2814, - "step": 35900 - }, - { - "epoch": 1.0, - "learning_rate": 4.2524044635977064e-08, - "loss": 0.1131, - "step": 35905 - }, - { - "epoch": 1.0, - "learning_rate": 4.109706327235367e-08, - "loss": 0.1311, - "step": 35910 - }, - { - "epoch": 1.0, - "learning_rate": 3.967008190873028e-08, - "loss": 0.1271, - "step": 35915 - }, - { - "epoch": 1.0, - "learning_rate": 3.824310054510688e-08, - "loss": 0.1759, - "step": 35920 - }, - { - "epoch": 1.0, - "learning_rate": 3.681611918148349e-08, - "loss": 0.0869, - "step": 35925 - }, - { - "epoch": 1.0, - "learning_rate": 3.53891378178601e-08, - "loss": 0.0654, - "step": 35930 - }, - { - "epoch": 1.0, - "learning_rate": 3.396215645423671e-08, - "loss": 0.1665, - "step": 35935 - }, - { - "epoch": 1.0, - "learning_rate": 3.253517509061332e-08, - "loss": 0.1279, - "step": 35940 - }, - { - "epoch": 1.0, - "learning_rate": 3.110819372698993e-08, - "loss": 0.2591, - "step": 35945 - }, - { - "epoch": 1.0, - "learning_rate": 2.9681212363366537e-08, - "loss": 0.1954, - "step": 35950 - }, - { - "epoch": 1.0, - "learning_rate": 2.8254230999743147e-08, - "loss": 0.0886, - "step": 35955 - }, - { - "epoch": 1.0, - "learning_rate": 2.6827249636119757e-08, - "loss": 0.1037, - "step": 35960 - }, - { - "epoch": 1.0, - "learning_rate": 2.5400268272496364e-08, - "loss": 0.23, - "step": 35965 - }, - { - "epoch": 1.0, - "learning_rate": 2.397328690887297e-08, - "loss": 0.1149, - "step": 35970 - }, - { - "epoch": 1.0, - "learning_rate": 2.254630554524958e-08, - "loss": 0.0986, - "step": 35975 - }, - { - "epoch": 1.0, - "learning_rate": 2.1119324181626187e-08, - "loss": 0.1273, - "step": 35980 - }, - { - "epoch": 1.0, - "learning_rate": 1.9692342818002797e-08, - "loss": 0.0634, - "step": 35985 - }, - { - "epoch": 1.0, - "learning_rate": 1.8265361454379407e-08, - "loss": 0.065, - "step": 35990 - }, - { - "epoch": 1.0, - "learning_rate": 1.6838380090756014e-08, - "loss": 0.2194, - "step": 35995 - }, - { - "epoch": 1.0, - "learning_rate": 1.5411398727132624e-08, - "loss": 0.4803, - "step": 36000 - }, - { - "epoch": 1.0, - "eval_loss": 0.05520357936620712, - "eval_runtime": 2114.1161, - "eval_samples_per_second": 7.577, - "eval_steps_per_second": 1.894, - "eval_wer": 0.15631085467003245, - "step": 36000 - } - ], - "max_steps": 36039, - "num_train_epochs": 1, - "total_flos": 4.5501417276130427e+18, - "trial_name": null, - "trial_params": null -}