{ "achieved_tflops_per_gpu": 1.8033590828859047, "achieved_tflops_per_gpu_theoretical": 98.24923232187187, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.11018558591604233, "mfu_percent": 0.5779997060531746, "mfu_percent_theoretical": 31.490138564702526, "total_flos": 2.0678579759758705e+18, "train_loss": 0.2535776594557861, "train_runtime": 143333.765, "train_samples_per_second": 0.464, "train_steps_per_second": 0.029, "valid_targets_mean": 5060.9, "valid_targets_min": 1241 }