{ "epoch": 3.0, "eval_loss": 2.212934732437134, "eval_runtime": 98.6913, "eval_samples_per_second": 7.073, "eval_steps_per_second": 7.073, "perplexity": 9.142507875313894, "total_flos": 8.691117166323302e+17, "train_loss": 2.267601152893844, "train_runtime": 8636.3508, "train_samples_per_second": 2.181, "train_steps_per_second": 0.273 }