{ "epoch": 0.9995988768551946, "eval_loss": 1.1075533628463745, "eval_runtime": 37.4732, "eval_samples_per_second": 5.391, "eval_steps_per_second": 1.361, "perplexity": 3.026943494933559, "total_flos": 6308174864842752.0, "train_loss": 1.1638640125146074, "train_runtime": 6246.6188, "train_samples_per_second": 3.192, "train_steps_per_second": 0.1 }