[ { "loss": 0.7219, "learning_rate": 7.2e-05, "epoch": 0.05, "step": 1 }, { "loss": 0.7128, "learning_rate": 7.2e-05, "epoch": 0.11, "step": 2 }, { "loss": 0.6783, "learning_rate": 7.2e-05, "epoch": 0.16, "step": 3 }, { "loss": 0.6587, "learning_rate": 7.2e-05, "epoch": 0.21, "step": 4 }, { "loss": 0.638, "learning_rate": 7.2e-05, "epoch": 0.26, "step": 5 }, { "loss": 0.6147, "learning_rate": 7.2e-05, "epoch": 0.32, "step": 6 }, { "loss": 0.6024, "learning_rate": 7.2e-05, "epoch": 0.37, "step": 7 }, { "loss": 0.5924, "learning_rate": 7.2e-05, "epoch": 0.42, "step": 8 }, { "loss": 0.5868, "learning_rate": 7.2e-05, "epoch": 0.47, "step": 9 }, { "loss": 0.5416, "learning_rate": 7.2e-05, "epoch": 0.53, "step": 10 }, { "loss": 0.4749, "learning_rate": 7.2e-05, "epoch": 0.58, "step": 11 }, { "loss": 0.4541, "learning_rate": 7.2e-05, "epoch": 0.63, "step": 12 }, { "loss": 0.4036, "learning_rate": 7.2e-05, "epoch": 0.68, "step": 13 }, { "loss": 0.3915, "learning_rate": 7.2e-05, "epoch": 0.74, "step": 14 }, { "loss": 0.3465, "learning_rate": 7.2e-05, "epoch": 0.79, "step": 15 }, { "loss": 0.2573, "learning_rate": 7.2e-05, "epoch": 0.84, "step": 16 }, { "loss": 0.1707, "learning_rate": 7.2e-05, "epoch": 0.89, "step": 17 }, { "loss": 0.125, "learning_rate": 7.2e-05, "epoch": 0.95, "step": 18 }, { "loss": 0.0749, "learning_rate": 7.2e-05, "epoch": 1.0, "step": 19 }, { "loss": 0.0452, "learning_rate": 7.2e-05, "epoch": 1.05, "step": 20 }, { "loss": 0.0257, "learning_rate": 7.2e-05, "epoch": 1.11, "step": 21 }, { "loss": 0.0252, "learning_rate": 7.2e-05, "epoch": 1.16, "step": 22 }, { "loss": 0.0604, "learning_rate": 7.2e-05, "epoch": 1.21, "step": 23 }, { "loss": 0.0492, "learning_rate": 7.2e-05, "epoch": 1.26, "step": 24 }, { "loss": 0.0012, "learning_rate": 7.2e-05, "epoch": 1.32, "step": 25 }, { "eval_crt_2_loss": 0.008229807950556278, "eval_crt_2_score": -0.0022093479055911303, "eval_crt_2_brier_score": 0.0022093479055911303, "eval_crt_2_average_probability": 0.9935852885246277, "eval_crt_2_accuracy": 1.0, "eval_crt_2_probabilities": [ 0.9995800852775574, 0.9990842342376709, 0.9995512366294861, 0.9986786246299744, 0.9995718598365784, 0.9997767806053162, 0.8551581501960754, 0.9971579313278198, 0.9996451139450073, 0.9977812170982361, 0.999804675579071, 0.9992179870605469, 0.9997174143791199, 0.9998371601104736, 0.9993311166763306, 0.9997996687889099, 0.9997851252555847, 0.999744713306427, 0.9995379447937012, 0.9998577833175659, 0.9997304081916809, 0.9990813732147217, 0.9995477795600891, 0.9990488886833191, 0.9998594522476196, 0.9994975328445435, 0.9991641044616699, 0.9995660185813904, 0.9997511506080627, 0.9998865127563477, 0.9999109506607056, 0.9996562004089355, 0.9994305968284607, 0.9992846846580505, 0.9995037317276001, 0.9992471933364868, 0.9996359348297119, 0.999599277973175, 0.9991531372070312, 0.9997557997703552, 0.9994789958000183, 0.9998207688331604, 0.9998410940170288, 0.9997524619102478, 0.9998014569282532, 0.9998021721839905, 0.9992111921310425, 0.9998326301574707, 0.9994243383407593, 0.9990911483764648, 0.9997714161872864, 0.9993265867233276, 0.9995996356010437, 0.9998132586479187, 0.9998679161071777, 0.9991796612739563, 0.9997928738594055, 0.9997915625572205, 0.5528848171234131, 0.9991310238838196, 0.9997738003730774, 0.9996798038482666, 0.9998341798782349, 0.9998807907104492, 0.9995421171188354, 0.9997196793556213, 0.999329686164856, 0.9998488426208496, 0.9995917677879333, 0.9998519420623779, 0.9985900521278381, 0.999859094619751, 0.9980387091636658, 0.9995794892311096, 0.9995357990264893, 0.9989036321640015, 0.9994966983795166, 0.9996247291564941, 0.9990410208702087, 0.9995213747024536, 0.9994599223136902, 0.9998130202293396, 0.9993808269500732, 0.9995201826095581, 0.999403715133667, 0.9996811151504517, 0.9995848536491394, 0.9991675615310669, 0.9995501637458801, 0.9996263980865479, 0.9990099668502808, 0.999705970287323, 0.9996757507324219, 0.9992926120758057, 0.9993239641189575, 0.9999006986618042, 0.9998637437820435, 0.9997491240501404, 0.9996663331985474, 0.9997652173042297 ], "eval_crt_2_runtime": 4.2017, "eval_crt_2_samples_per_second": 23.8, "eval_crt_2_steps_per_second": 0.476, "epoch": 1.32, "step": 25 }, { "loss": 0.0008, "learning_rate": 7.2e-05, "epoch": 1.37, "step": 26 }, { "loss": 0.0227, "learning_rate": 7.2e-05, "epoch": 1.42, "step": 27 }, { "loss": 0.0022, "learning_rate": 7.2e-05, "epoch": 1.47, "step": 28 }, { "loss": 0.0011, "learning_rate": 7.2e-05, "epoch": 1.53, "step": 29 }, { "loss": 0.0224, "learning_rate": 7.2e-05, "epoch": 1.58, "step": 30 }, { "loss": 0.2158, "learning_rate": 7.2e-05, "epoch": 1.63, "step": 31 }, { "loss": 0.0488, "learning_rate": 7.2e-05, "epoch": 1.68, "step": 32 }, { "loss": 0.0002, "learning_rate": 7.2e-05, "epoch": 1.74, "step": 33 }, { "loss": 0.0207, "learning_rate": 7.2e-05, "epoch": 1.79, "step": 34 }, { "loss": 0.0214, "learning_rate": 7.2e-05, "epoch": 1.84, "step": 35 }, { "loss": 0.007, "learning_rate": 7.2e-05, "epoch": 1.89, "step": 36 }, { "loss": 0.0256, "learning_rate": 7.2e-05, "epoch": 1.95, "step": 37 }, { "loss": 0.0026, "learning_rate": 7.2e-05, "epoch": 2.0, "step": 38 }, { "loss": 0.0405, "learning_rate": 7.2e-05, "epoch": 2.05, "step": 39 }, { "loss": 0.0406, "learning_rate": 7.2e-05, "epoch": 2.11, "step": 40 }, { "loss": 0.0232, "learning_rate": 7.2e-05, "epoch": 2.16, "step": 41 }, { "loss": 0.0432, "learning_rate": 7.2e-05, "epoch": 2.21, "step": 42 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 2.26, "step": 43 }, { "loss": 0.0199, "learning_rate": 7.2e-05, "epoch": 2.32, "step": 44 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 2.37, "step": 45 }, { "loss": 0.0221, "learning_rate": 7.2e-05, "epoch": 2.42, "step": 46 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 2.47, "step": 47 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 2.53, "step": 48 }, { "loss": 0.1631, "learning_rate": 7.2e-05, "epoch": 2.58, "step": 49 }, { "loss": 0.0013, "learning_rate": 7.2e-05, "epoch": 2.63, "step": 50 }, { "eval_crt_2_loss": 0.006326997186988592, "eval_crt_2_score": -0.0017219263827428222, "eval_crt_2_brier_score": 0.0017219263827428222, "eval_crt_2_average_probability": 0.9949961304664612, "eval_crt_2_accuracy": 1.0, "eval_crt_2_probabilities": [ 0.999997615814209, 0.9999998807907104, 0.9999988079071045, 0.9999997615814209, 0.9999998807907104, 0.999998927116394, 0.903231680393219, 0.9999995231628418, 0.9999998807907104, 0.9999997615814209, 0.9999998807907104, 0.9999996423721313, 0.9999996423721313, 0.9999996423721313, 0.9999997615814209, 0.999998927116394, 0.9999996423721313, 0.9999990463256836, 0.9999959468841553, 0.9999994039535522, 0.9999998807907104, 0.9999997615814209, 0.9999996423721313, 0.9999998807907104, 0.9999997615814209, 0.9999958276748657, 0.9999998807907104, 0.9999864101409912, 0.9999998807907104, 0.9999994039535522, 0.9999996423721313, 0.9999990463256836, 0.9999997615814209, 0.9999996423721313, 0.9999980926513672, 0.9999996423721313, 0.9999998807907104, 0.9999998807907104, 0.9999995231628418, 0.9999998807907104, 0.9999990463256836, 0.9999996423721313, 0.9999997615814209, 0.9999998807907104, 0.9999988079071045, 0.9999984502792358, 0.9999997615814209, 0.9999998807907104, 0.9999997615814209, 0.9999996423721313, 0.9999996423721313, 0.9999998807907104, 0.9999977350234985, 0.9999994039535522, 0.9999997615814209, 0.9999864101409912, 0.999998927116394, 0.9999995231628418, 0.5964798331260681, 0.9999996423721313, 0.9999994039535522, 0.9999986886978149, 0.9999992847442627, 0.9999996423721313, 0.999996542930603, 0.9999998807907104, 0.9999998807907104, 0.9999994039535522, 0.9999973773956299, 0.9999996423721313, 0.9999971389770508, 0.9999997615814209, 0.9999994039535522, 0.9999980926513672, 0.9999916553497314, 0.999998927116394, 0.9999998807907104, 0.9999998807907104, 0.9999996423721313, 0.9999940395355225, 0.9999998807907104, 0.9999995231628418, 0.9999997615814209, 0.9999996423721313, 0.9999997615814209, 0.9999998807907104, 0.9999997615814209, 0.9999996423721313, 0.9999996423721313, 0.9999998807907104, 0.9999927282333374, 0.9999998807907104, 0.9999998807907104, 0.9999998807907104, 0.9999997615814209, 0.9999996423721313, 0.9999994039535522, 0.9999992847442627, 0.9999995231628418, 0.9999998807907104 ], "eval_crt_2_runtime": 4.2, "eval_crt_2_samples_per_second": 23.81, "eval_crt_2_steps_per_second": 0.476, "epoch": 2.63, "step": 50 }, { "loss": 0.0195, "learning_rate": 7.2e-05, "epoch": 2.68, "step": 51 }, { "loss": 0.001, "learning_rate": 7.2e-05, "epoch": 2.74, "step": 52 }, { "loss": 0.0006, "learning_rate": 7.2e-05, "epoch": 2.79, "step": 53 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 2.84, "step": 54 }, { "loss": 0.0192, "learning_rate": 7.2e-05, "epoch": 2.89, "step": 55 }, { "loss": 0.0682, "learning_rate": 7.2e-05, "epoch": 2.95, "step": 56 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.0, "step": 57 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.05, "step": 58 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.11, "step": 59 }, { "loss": 0.0703, "learning_rate": 7.2e-05, "epoch": 3.16, "step": 60 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.21, "step": 61 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.26, "step": 62 }, { "loss": 0.0184, "learning_rate": 7.2e-05, "epoch": 3.32, "step": 63 }, { "loss": 0.04, "learning_rate": 7.2e-05, "epoch": 3.37, "step": 64 }, { "loss": 0.0361, "learning_rate": 7.2e-05, "epoch": 3.42, "step": 65 }, { "loss": 0.0165, "learning_rate": 7.2e-05, "epoch": 3.47, "step": 66 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.53, "step": 67 }, { "loss": 0.0421, "learning_rate": 7.2e-05, "epoch": 3.58, "step": 68 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 3.63, "step": 69 }, { "loss": 0.0103, "learning_rate": 7.2e-05, "epoch": 3.68, "step": 70 }, { "loss": 0.0203, "learning_rate": 7.2e-05, "epoch": 3.74, "step": 71 }, { "loss": 0.0151, "learning_rate": 7.2e-05, "epoch": 3.79, "step": 72 }, { "loss": 0.0223, "learning_rate": 7.2e-05, "epoch": 3.84, "step": 73 }, { "loss": 0.0117, "learning_rate": 7.2e-05, "epoch": 3.89, "step": 74 }, { "loss": 0.0001, "learning_rate": 7.2e-05, "epoch": 3.95, "step": 75 }, { "eval_crt_2_loss": 0.004923115950077772, "eval_crt_2_score": -0.0013668893370777369, "eval_crt_2_brier_score": 0.0013668893370777369, "eval_crt_2_average_probability": 0.9960331916809082, "eval_crt_2_accuracy": 1.0, "eval_crt_2_probabilities": [ 0.9999960660934448, 0.9999995231628418, 0.9999983310699463, 0.9999994039535522, 0.9999997615814209, 0.9999990463256836, 0.9720984697341919, 0.9999990463256836, 0.9999998807907104, 0.9999983310699463, 0.9999998807907104, 0.9999978542327881, 0.9999997615814209, 0.9999996423721313, 0.9999997615814209, 0.9999990463256836, 0.9999995231628418, 0.9999992847442627, 0.9999959468841553, 0.9999994039535522, 0.9999998807907104, 0.9999988079071045, 0.9999997615814209, 0.9999997615814209, 0.9999997615814209, 0.9999938011169434, 0.9999997615814209, 0.9999915361404419, 0.9999998807907104, 0.9999994039535522, 0.9999996423721313, 0.9999992847442627, 0.9999991655349731, 0.9999996423721313, 0.9999992847442627, 0.9999997615814209, 0.9999998807907104, 0.9999998807907104, 0.999998927116394, 0.9999998807907104, 0.9999991655349731, 0.9999997615814209, 0.9999997615814209, 0.9999998807907104, 0.9999988079071045, 0.9999980926513672, 0.9999996423721313, 0.9999998807907104, 0.9999996423721313, 0.9999996423721313, 0.9999996423721313, 0.9999997615814209, 0.9999984502792358, 0.9999994039535522, 0.9999998807907104, 0.9999746084213257, 0.9999992847442627, 0.9999995231628418, 0.6313396692276001, 0.9999997615814209, 0.9999995231628418, 0.9999992847442627, 0.9999992847442627, 0.9999996423721313, 0.9999957084655762, 0.9999998807907104, 0.9999998807907104, 0.9999994039535522, 0.9999988079071045, 0.9999995231628418, 0.9999964237213135, 0.9999997615814209, 0.9999973773956299, 0.9999982118606567, 0.9999940395355225, 0.9999990463256836, 0.9999998807907104, 0.9999998807907104, 0.9999991655349731, 0.9999963045120239, 0.9999998807907104, 0.9999994039535522, 0.9999996423721313, 0.9999997615814209, 0.9999998807907104, 0.9999998807907104, 0.9999997615814209, 0.9999990463256836, 0.9999995231628418, 0.9999998807907104, 0.9999871253967285, 0.9999998807907104, 0.9999998807907104, 0.9999997615814209, 0.9999996423721313, 0.9999995231628418, 0.9999995231628418, 0.9999985694885254, 0.9999994039535522, 0.9999998807907104 ], "eval_crt_2_runtime": 4.2026, "eval_crt_2_samples_per_second": 23.795, "eval_crt_2_steps_per_second": 0.476, "epoch": 3.95, "step": 75 }, { "loss": 0.0001, "learning_rate": 7.2e-05, "epoch": 4.0, "step": 76 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 4.05, "step": 77 }, { "loss": 0.0105, "learning_rate": 7.2e-05, "epoch": 4.11, "step": 78 }, { "loss": 0.0002, "learning_rate": 7.2e-05, "epoch": 4.16, "step": 79 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 4.21, "step": 80 }, { "loss": 0.0001, "learning_rate": 7.2e-05, "epoch": 4.26, "step": 81 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 4.32, "step": 82 }, { "loss": 0.0214, "learning_rate": 7.2e-05, "epoch": 4.37, "step": 83 }, { "loss": 0.0105, "learning_rate": 7.2e-05, "epoch": 4.42, "step": 84 }, { "loss": 0.0001, "learning_rate": 7.2e-05, "epoch": 4.47, "step": 85 }, { "loss": 0.0116, "learning_rate": 7.2e-05, "epoch": 4.53, "step": 86 }, { "loss": 0.0168, "learning_rate": 7.2e-05, "epoch": 4.58, "step": 87 }, { "loss": 0.0329, "learning_rate": 7.2e-05, "epoch": 4.63, "step": 88 }, { "loss": 0.0118, "learning_rate": 7.2e-05, "epoch": 4.68, "step": 89 }, { "loss": 0.0498, "learning_rate": 7.2e-05, "epoch": 4.74, "step": 90 }, { "loss": 0.0033, "learning_rate": 7.2e-05, "epoch": 4.79, "step": 91 }, { "loss": 0.0124, "learning_rate": 7.2e-05, "epoch": 4.84, "step": 92 }, { "loss": 0.0268, "learning_rate": 7.2e-05, "epoch": 4.89, "step": 93 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 4.95, "step": 94 }, { "loss": 0.0225, "learning_rate": 7.2e-05, "epoch": 5.0, "step": 95 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 5.05, "step": 96 }, { "loss": 0.0059, "learning_rate": 7.2e-05, "epoch": 5.11, "step": 97 }, { "loss": 0.0, "learning_rate": 7.2e-05, "epoch": 5.16, "step": 98 }, { "loss": 0.011, "learning_rate": 7.2e-05, "epoch": 5.21, "step": 99 }, { "loss": 0.0001, "learning_rate": 7.2e-05, "epoch": 5.26, "step": 100 }, { "eval_crt_2_loss": 0.003461032873019576, "eval_crt_2_score": -0.0006671486771665514, "eval_crt_2_brier_score": 0.0006671486771665514, "eval_crt_2_average_probability": 0.9970054626464844, "eval_crt_2_accuracy": 1.0, "eval_crt_2_probabilities": [ 0.9999970197677612, 1.0, 0.9999985694885254, 1.0, 1.0, 0.9999984502792358, 0.9550073742866516, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999997615814209, 1.0, 0.9999994039535522, 1.0, 0.9999995231628418, 0.9999997615814209, 0.9999996423721313, 0.9999953508377075, 0.9999983310699463, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 0.9999942779541016, 1.0, 0.9999829530715942, 1.0, 0.9999996423721313, 0.9999997615814209, 0.9999998807907104, 0.9999998807907104, 1.0, 0.9999996423721313, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999995231628418, 0.9999998807907104, 0.9999998807907104, 1.0, 0.999998927116394, 0.9999960660934448, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 0.9999939203262329, 0.999998927116394, 1.0, 0.9999673366546631, 0.9999995231628418, 0.9999995231628418, 0.7456566691398621, 1.0, 0.9999984502792358, 0.9999994039535522, 0.9999994039535522, 0.9999996423721313, 0.9999964237213135, 1.0, 1.0, 0.9999990463256836, 0.9999996423721313, 0.9999998807907104, 0.9999982118606567, 0.9999997615814209, 0.9999998807907104, 0.9999986886978149, 0.9999911785125732, 0.9999998807907104, 1.0, 1.0, 0.9999998807907104, 0.9999972581863403, 1.0, 0.9999997615814209, 1.0, 1.0, 1.0, 1.0, 1.0, 0.9999998807907104, 1.0, 1.0, 0.9999868869781494, 1.0, 1.0, 1.0, 1.0, 0.9999995231628418, 0.9999994039535522, 0.9999985694885254, 0.9999995231628418, 1.0 ], "eval_crt_2_runtime": 4.2012, "eval_crt_2_samples_per_second": 23.803, "eval_crt_2_steps_per_second": 0.476, "epoch": 5.26, "step": 100 }, { "train_runtime": 366.2575, "train_samples_per_second": 8.737, "train_steps_per_second": 0.273, "total_flos": 0.0, "train_loss": 0.10658088955936648, "epoch": 5.26, "step": 100 } ] } ]