{ "achieved_tflops_per_gpu": 0.0030600983611038064, "achieved_tflops_per_gpu_theoretical": 501.4098752978288, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.1350942999124527, "mfu_percent": 0.00021626136827588736, "mfu_percent_theoretical": 35.43532687617165, "total_flos": 1404577005436928.0, "train_loss": 0.2162718369941081, "train_runtime": 28687.3337, "train_samples_per_second": 2.359, "train_steps_per_second": 0.148, "valid_targets_mean": 6305.2, "valid_targets_min": 396 }