swesmith-stack-reason / all_results.json
penfever's picture
End of training
30d98b5 verified
{
"achieved_tflops_per_gpu": 2.830142988382763,
"achieved_tflops_per_gpu_theoretical": 166.00732357833525,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.14267900586128235,
"mfu_percent": 0.907097111661142,
"mfu_percent_theoretical": 53.20747550587668,
"total_flos": 3.0948342577517036e+18,
"train_loss": 0.11350778881926644,
"train_runtime": 136690.7198,
"train_samples_per_second": 0.785,
"train_steps_per_second": 0.049,
"valid_targets_mean": 6167.6,
"valid_targets_min": 3936
}