{ "best_metric": 0.9119440459110474, "best_model_checkpoint": "output/fine_tuned/t5-base/MRPC/checkpoint-1035", "epoch": 10.0, "eval_steps": 500, "global_step": 1150, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.7107843137254902, "eval_combined_score": 0.767068803569332, "eval_f1": 0.8233532934131738, "eval_loss": 0.5475682020187378, "eval_runtime": 1.5083, "eval_samples_per_second": 270.506, "eval_steps_per_second": 33.813, "step": 115 }, { "epoch": 2.0, "eval_accuracy": 0.8700980392156863, "eval_combined_score": 0.8900575085721896, "eval_f1": 0.9100169779286927, "eval_loss": 0.35225751996040344, "eval_runtime": 1.5518, "eval_samples_per_second": 262.913, "eval_steps_per_second": 32.864, "step": 230 }, { "epoch": 3.0, "eval_accuracy": 0.8725490196078431, "eval_combined_score": 0.8923555908850027, "eval_f1": 0.9121621621621623, "eval_loss": 0.3623868525028229, "eval_runtime": 1.5259, "eval_samples_per_second": 267.39, "eval_steps_per_second": 33.424, "step": 345 }, { "epoch": 4.0, "eval_accuracy": 0.8774509803921569, "eval_combined_score": 0.8948658410732715, "eval_f1": 0.912280701754386, "eval_loss": 0.36461111903190613, "eval_runtime": 1.5073, "eval_samples_per_second": 270.69, "eval_steps_per_second": 33.836, "step": 460 }, { "epoch": 4.3478260869565215, "grad_norm": 4.906887054443359, "learning_rate": 2.826086956521739e-05, "loss": 0.3744, "step": 500 }, { "epoch": 5.0, "eval_accuracy": 0.8946078431372549, "eval_combined_score": 0.9099126172208014, "eval_f1": 0.9252173913043479, "eval_loss": 0.40538841485977173, "eval_runtime": 1.5339, "eval_samples_per_second": 265.981, "eval_steps_per_second": 33.248, "step": 575 }, { "epoch": 6.0, "eval_accuracy": 0.8897058823529411, "eval_combined_score": 0.9057225063938619, "eval_f1": 0.9217391304347826, "eval_loss": 0.46239176392555237, "eval_runtime": 1.5008, "eval_samples_per_second": 271.86, "eval_steps_per_second": 33.982, "step": 690 }, { "epoch": 7.0, "eval_accuracy": 0.8872549019607843, "eval_combined_score": 0.9042438893365565, "eval_f1": 0.9212328767123288, "eval_loss": 0.552967369556427, "eval_runtime": 0.8648, "eval_samples_per_second": 471.8, "eval_steps_per_second": 58.975, "step": 805 }, { "epoch": 8.0, "eval_accuracy": 0.8897058823529411, "eval_combined_score": 0.9058581404832297, "eval_f1": 0.9220103986135182, "eval_loss": 0.5404660701751709, "eval_runtime": 0.8838, "eval_samples_per_second": 461.635, "eval_steps_per_second": 57.704, "step": 920 }, { "epoch": 8.695652173913043, "grad_norm": 13.78760051727295, "learning_rate": 6.521739130434783e-06, "loss": 0.0877, "step": 1000 }, { "epoch": 9.0, "eval_accuracy": 0.8970588235294118, "eval_combined_score": 0.9119440459110474, "eval_f1": 0.926829268292683, "eval_loss": 0.5629165768623352, "eval_runtime": 0.8913, "eval_samples_per_second": 457.747, "eval_steps_per_second": 57.218, "step": 1035 }, { "epoch": 10.0, "eval_accuracy": 0.8921568627450981, "eval_combined_score": 0.9081473968897904, "eval_f1": 0.9241379310344827, "eval_loss": 0.5856015086174011, "eval_runtime": 0.8578, "eval_samples_per_second": 475.635, "eval_steps_per_second": 59.454, "step": 1150 }, { "epoch": 10.0, "step": 1150, "total_flos": 5600824300646400.0, "train_loss": 0.03282318198162577, "train_runtime": 93.6204, "train_samples_per_second": 391.795, "train_steps_per_second": 12.284 } ], "logging_steps": 500, "max_steps": 1150, "num_input_tokens_seen": 0, "num_train_epochs": 10, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 5600824300646400.0, "train_batch_size": 32, "trial_name": null, "trial_params": null }