stack-swesmithseq / train_results.json
penfever's picture
Add files using upload-large-folder tool
aeed870 verified
{
"achieved_tflops_per_gpu": 4.002569748940458,
"achieved_tflops_per_gpu_theoretical": 233.76541483479863,
"epoch": 7.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.11204883456230164,
"mfu_percent": 1.282874919532198,
"mfu_percent_theoretical": 74.92481244705085,
"total_flos": 3.0947556970284974e+18,
"train_loss": 0.09641505422623421,
"train_runtime": 96649.0246,
"train_samples_per_second": 1.11,
"train_steps_per_second": 0.069,
"valid_targets_mean": 4614.6,
"valid_targets_min": 1320
}