{
  "epoch": 39.98755832037325,
  "eval_bleu": 18.257,
  "eval_gen_len": 25.2238,
  "eval_loss": 2.161628246307373,
  "eval_runtime": 21.3567,
  "eval_samples": 1001,
  "eval_samples_per_second": 46.871,
  "eval_steps_per_second": 1.498,
  "num_experts_activated": 0,
  "total_flos": 9.385287725187072e+17,
  "train_loss": 1.2382845392268715,
  "train_runtime": 18637.6228,
  "train_samples": 205756,
  "train_samples_per_second": 441.593,
  "train_steps_per_second": 3.449
}