train_math_qa_1756735780 / all_results.json
rbelanec's picture
End of training
11aafe9 verified
{
"epoch": 10.0,
"eval_loss": 0.8015885949134827,
"eval_runtime": 57.0513,
"eval_samples_per_second": 52.304,
"eval_steps_per_second": 26.152,
"num_input_tokens_seen": 35721744,
"total_flos": 1.6085339872348078e+18,
"train_loss": 0.8150753764391674,
"train_runtime": 12852.7266,
"train_samples_per_second": 20.893,
"train_steps_per_second": 10.447
}