| { | |
| "epoch": 0.7619047619047619, | |
| "eval_loss": 1.4561185836791992, | |
| "eval_runtime": 2.8429, | |
| "eval_samples_per_second": 5.98, | |
| "eval_steps_per_second": 1.055, | |
| "perplexity": 4.289278700316188, | |
| "total_flos": 2446118092800.0, | |
| "train_loss": 1.5153563022613525, | |
| "train_runtime": 280.4756, | |
| "train_samples_per_second": 0.578, | |
| "train_steps_per_second": 0.007 | |
| } |