{
  "epoch": 0.9995988768551946,
  "eval_loss": 1.1075533628463745,
  "eval_runtime": 37.4732,
  "eval_samples_per_second": 5.391,
  "eval_steps_per_second": 1.361,
  "perplexity": 3.026943494933559,
  "total_flos": 6308174864842752.0,
  "train_loss": 1.1638640125146074,
  "train_runtime": 6246.6188,
  "train_samples_per_second": 3.192,
  "train_steps_per_second": 0.1
}