{ "best_metric": null, "best_model_checkpoint": null, "epoch": 10.0, "global_step": 2610, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_loss": 1.281923770904541, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 30.1615, "eval_samples_per_second": 612.602, "eval_steps_per_second": 0.829, "step": 261 }, { "epoch": 1.92, "learning_rate": 0.001616858237547893, "loss": 1.2698, "step": 500 }, { "epoch": 2.0, "eval_loss": 1.2800453901290894, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 29.8737, "eval_samples_per_second": 618.504, "eval_steps_per_second": 0.837, "step": 522 }, { "epoch": 3.0, "eval_loss": 1.2790213823318481, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 30.0127, "eval_samples_per_second": 615.639, "eval_steps_per_second": 0.833, "step": 783 }, { "epoch": 3.83, "learning_rate": 0.0012337164750957853, "loss": 1.2596, "step": 1000 }, { "epoch": 4.0, "eval_loss": 1.2786147594451904, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.1625, "eval_samples_per_second": 592.924, "eval_steps_per_second": 0.802, "step": 1044 }, { "epoch": 5.0, "eval_loss": 1.2777519226074219, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.1737, "eval_samples_per_second": 592.711, "eval_steps_per_second": 0.802, "step": 1305 }, { "epoch": 5.75, "learning_rate": 0.0008505747126436781, "loss": 1.2598, "step": 1500 }, { "epoch": 6.0, "eval_loss": 1.276727318763733, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 30.7028, "eval_samples_per_second": 601.803, "eval_steps_per_second": 0.814, "step": 1566 }, { "epoch": 7.0, "eval_loss": 1.2621368169784546, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.0027, "eval_samples_per_second": 595.981, "eval_steps_per_second": 0.806, "step": 1827 }, { "epoch": 7.66, "learning_rate": 0.00046743295019157087, "loss": 1.2464, "step": 2000 }, { "epoch": 8.0, "eval_loss": 1.2596102952957153, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.2545, "eval_samples_per_second": 591.178, "eval_steps_per_second": 0.8, "step": 2088 }, { "epoch": 9.0, "eval_loss": 1.233572006225586, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.267, "eval_samples_per_second": 590.942, "eval_steps_per_second": 0.8, "step": 2349 }, { "epoch": 9.58, "learning_rate": 8.42911877394636e-05, "loss": 1.2184, "step": 2500 }, { "epoch": 10.0, "eval_loss": 1.2309106588363647, "eval_mean_acc": 0.0, "eval_median_acc": 0.0, "eval_runtime": 31.0235, "eval_samples_per_second": 595.581, "eval_steps_per_second": 0.806, "step": 2610 }, { "epoch": 10.0, "step": 2610, "total_flos": 1.660761144e+17, "train_loss": 1.2492360374479916, "train_runtime": 3648.4025, "train_samples_per_second": 274.093, "train_steps_per_second": 0.715 } ], "max_steps": 2610, "num_train_epochs": 10, "total_flos": 1.660761144e+17, "trial_name": null, "trial_params": null }