train_qqp_1744902593 / all_results.json
rbelanec's picture
End of training
5cb7406 verified
raw
history blame
407 Bytes
{
"epoch": 1.9544377397210075,
"eval_loss": 0.08336079865694046,
"eval_runtime": 401.6364,
"eval_samples_per_second": 90.592,
"eval_steps_per_second": 22.65,
"num_input_tokens_seen": 51858816,
"total_flos": 2.1715238142060134e+17,
"train_loss": 0.10561876927614212,
"train_runtime": 96179.8765,
"train_samples_per_second": 6.654,
"train_steps_per_second": 0.416
}