{ "epoch": 2.9918166939443536, "eval_loss": 0.7127311825752258, "eval_runtime": 27.5772, "eval_samples_per_second": 607.423, "eval_steps_per_second": 9.501, "perplexity": 2.0395540531763667, "total_flos": 5.437860691102925e+16, "train_loss": 0.9607737994584881, "train_runtime": 2198.2213, "train_samples_per_second": 106.683, "train_steps_per_second": 0.416 }