{ "epoch": 39.98755832037325, "eval_bleu": 18.257, "eval_gen_len": 25.2238, "eval_loss": 2.161628246307373, "eval_runtime": 21.3567, "eval_samples": 1001, "eval_samples_per_second": 46.871, "eval_steps_per_second": 1.498, "num_experts_activated": 0, "total_flos": 9.385287725187072e+17, "train_loss": 1.2382845392268715, "train_runtime": 18637.6228, "train_samples": 205756, "train_samples_per_second": 441.593, "train_steps_per_second": 3.449 }