{
    "epoch": 0.9999588580080144,
    "eval_loss": 0.10019518435001373,
    "eval_runtime": 106.3168,
    "eval_samples": 14749,
    "eval_samples_per_second": 138.727,
    "eval_steps_per_second": 17.344,
    "perplexity": 1.105386651196126,
    "total_flos": 5.63814937437143e+18,
    "train_loss": 3.3859311055856667,
    "train_runtime": 70616.0694,
    "train_samples": 2916727,
    "train_samples_per_second": 41.304,
    "train_steps_per_second": 0.161
}