smolm-autoreg-bpe-counterfactual_babylm_aann_low_variability_noun-seed_211-1e-3
/
train_results.json
{ | |
"epoch": 20.0, | |
"train_loss": 3.027271946791392, | |
"train_runtime": 83852.6874, | |
"train_samples": 595027, | |
"train_samples_per_second": 141.922, | |
"train_steps_per_second": 4.435 | |
} |