{ "epoch": 6.0, "eval_loss": 2.4573256969451904, "eval_runtime": 40.2671, "eval_samples": 239, "eval_samples_per_second": 5.935, "eval_steps_per_second": 5.935, "perplexity": 11.673551145239013, "total_flos": 815647319654400.0, "train_loss": 2.3345105418791197, "train_runtime": 399646.5053, "train_samples": 24415, "train_samples_per_second": 0.367, "train_steps_per_second": 0.367 }