{ "epoch": 3.98, "eval_accuracy": 0.39803375322279416, "eval_loss": 3.6018850803375244, "eval_runtime": 1041.2833, "eval_samples": 308356, "eval_samples_per_second": 296.131, "eval_steps_per_second": 3.702, "perplexity": 36.667290123118356, "train_loss": 5.310745644091381, "train_runtime": 197999.4599, "train_samples": 5858758, "train_samples_per_second": 2958.977, "train_steps_per_second": 36.987 }