|
{"current_steps": 5, "total_steps": 36, "loss": 10.5953, "lr": 4.765769467591625e-05, "epoch": 0.39603960396039606, "percentage": 13.89, "elapsed_time": "0:00:59", "remaining_time": "0:06:07", "throughput": 593.47, "total_tokens": 35216} |
|
{"current_steps": 10, "total_steps": 36, "loss": 2.1097, "lr": 4.1069690242163484e-05, "epoch": 0.7920792079207921, "percentage": 27.78, "elapsed_time": "0:01:59", "remaining_time": "0:05:11", "throughput": 598.49, "total_tokens": 71704} |
|
{"current_steps": 15, "total_steps": 36, "loss": 0.4752, "lr": 3.147047612756302e-05, "epoch": 1.1584158415841583, "percentage": 41.67, "elapsed_time": "0:02:53", "remaining_time": "0:04:03", "throughput": 595.11, "total_tokens": 103424} |
|
{"current_steps": 20, "total_steps": 36, "loss": 0.4311, "lr": 2.0658795558326743e-05, "epoch": 1.5544554455445545, "percentage": 55.56, "elapsed_time": "0:03:53", "remaining_time": "0:03:06", "throughput": 596.05, "total_tokens": 139184} |
|
{"current_steps": 25, "total_steps": 36, "loss": 0.4116, "lr": 1.0660589091223855e-05, "epoch": 1.9504950495049505, "percentage": 69.44, "elapsed_time": "0:04:53", "remaining_time": "0:02:09", "throughput": 597.38, "total_tokens": 175496} |
|
{"current_steps": 30, "total_steps": 36, "loss": 0.333, "lr": 3.3493649053890326e-06, "epoch": 2.3168316831683167, "percentage": 83.33, "elapsed_time": "0:05:48", "remaining_time": "0:01:09", "throughput": 596.59, "total_tokens": 207928} |
|
{"current_steps": 35, "total_steps": 36, "loss": 0.3408, "lr": 9.513254770636137e-08, "epoch": 2.7128712871287126, "percentage": 97.22, "elapsed_time": "0:06:48", "remaining_time": "0:00:11", "throughput": 596.82, "total_tokens": 243800} |
|
{"current_steps": 36, "total_steps": 36, "epoch": 2.792079207920792, "percentage": 100.0, "elapsed_time": "0:07:02", "remaining_time": "0:00:00", "throughput": 593.72, "total_tokens": 250896} |
|
|