| { | |
| "epoch": 6.0, | |
| "eval_loss": 5.5764055252075195, | |
| "eval_runtime": 21.6138, | |
| "eval_samples": 162, | |
| "eval_samples_per_second": 7.495, | |
| "eval_steps_per_second": 7.495, | |
| "perplexity": 264.1205229267267, | |
| "total_flos": 23285119057920.0, | |
| "train_loss": 4.497406111357601, | |
| "train_runtime": 3411.1469, | |
| "train_samples": 697, | |
| "train_samples_per_second": 1.226, | |
| "train_steps_per_second": 1.226 | |
| } |