{ "epoch": 8.94, "eval_accuracy": 0.15909518159736963, "eval_loss": 5.773181915283203, "eval_runtime": 623.532, "eval_samples": 308356, "eval_samples_per_second": 494.531, "eval_steps_per_second": 5.153, "perplexity": 321.55928093587033, "train_loss": 6.136735617761035, "train_runtime": 197999.1773, "train_samples": 5858758, "train_samples_per_second": 2958.981, "train_steps_per_second": 30.823 }