{
"epoch": 3.0,
"eval_loss": 0.6613607406616211,
"eval_runtime": 13.2548,
"eval_samples": 3200,
"eval_samples_per_second": 103.962,
"eval_steps_per_second": 0.83,
"perplexity": 1.9374268770613925,
"train_loss": 0.6159939037574517,
"train_runtime": 13745.4884,
"train_samples": 344926,
"train_samples_per_second": 25.399,
"train_steps_per_second": 0.199
}