pretrain / all_results.json
furmaniak's picture
End of training
0d2ffcc verified
raw
history blame
390 Bytes
{
"epoch": 0.7619047619047619,
"eval_loss": 1.4561185836791992,
"eval_runtime": 2.8429,
"eval_samples_per_second": 5.98,
"eval_steps_per_second": 1.055,
"perplexity": 4.289278700316188,
"total_flos": 2446118092800.0,
"train_loss": 1.5153563022613525,
"train_runtime": 280.4756,
"train_samples_per_second": 0.578,
"train_steps_per_second": 0.007
}