Qwen-2.5-1.5B-Instruct-Datamix / all_results.json
andrewsiah's picture
End of training
e02586f verified
{
"eval_loss": 1.040108561515808,
"eval_runtime": 203.3075,
"eval_samples": 700,
"eval_samples_per_second": 3.443,
"eval_steps_per_second": 0.02,
"total_flos": 0.0,
"train_loss": 1.0761486015149526,
"train_runtime": 1434.8598,
"train_samples": 2000,
"train_samples_per_second": 1.394,
"train_steps_per_second": 0.005
}