{ "epoch": 6.25, "total_flos": 4.798362622332561e+18, "train_loss": 0.6602616081237793, "train_runtime": 4840.2702, "train_samples": 2554, "train_samples_per_second": 3.306, "train_steps_per_second": 0.207 }