train_multirc_123_1765085968 / train_results.json
rbelanec's picture
End of training
4d9b7f1 verified
{
"epoch": 20.0,
"num_input_tokens_seen": 264547520,
"total_flos": 1.191287785737683e+19,
"train_loss": 0.07439011100779885,
"train_runtime": 56245.3932,
"train_samples_per_second": 8.718,
"train_steps_per_second": 2.18
}