{ "total_flos": 1.0995762888818688e+16, "train_loss": 1.0670766773223876, "train_runtime": 40993.3469, "train_samples_per_second": 0.024, "train_steps_per_second": 0.024 }