{ "achieved_tflops_per_gpu": 3.494839125490133, "achieved_tflops_per_gpu_theoretical": 447.2034022926582, "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.21225425601005554, "mfu_percent": 0.24698509720778328, "mfu_percent_theoretical": 31.60448072739634, "total_flos": 6.613684893274604e+17, "train_loss": 0.5546745132177304, "train_runtime": 11827.5918, "train_samples_per_second": 4.22, "train_steps_per_second": 0.132, "valid_targets_mean": 2312.1, "valid_targets_min": 769 }