{ "achieved_tflops_per_gpu": 3.9736859436403944, "achieved_tflops_per_gpu_theoretical": 674.1930080018105, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.16928507387638092, "mfu_percent": 0.401788265282143, "mfu_percent_theoretical": 68.16916157753393, "total_flos": 2.2347755431133184e+16, "train_loss": 0.4597333984715598, "train_runtime": 702.992, "train_samples_per_second": 3.147, "train_steps_per_second": 0.199, "valid_targets_mean": 2156.8, "valid_targets_min": 1031 }