{ "best_metric": 0.33440420560747663, "best_model_checkpoint": "/content/drive/MyDrive/wav2vec2-large-xlsr-persian-asr-shemo_lnxdx/checkpoint-1700", "epoch": 12.5, "eval_steps": 100, "global_step": 2000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.62, "learning_rate": 2.0000000000000003e-06, "loss": 1.9455, "step": 100 }, { "epoch": 0.62, "eval_loss": 1.4246947765350342, "eval_runtime": 33.9505, "eval_samples_per_second": 8.365, "eval_steps_per_second": 1.06, "eval_wer": 0.4830607476635514, "step": 100 }, { "epoch": 1.25, "learning_rate": 4.000000000000001e-06, "loss": 1.4824, "step": 200 }, { "epoch": 1.25, "eval_loss": 1.110669493675232, "eval_runtime": 35.7852, "eval_samples_per_second": 7.936, "eval_steps_per_second": 1.006, "eval_wer": 0.43311915887850466, "step": 200 }, { "epoch": 1.88, "learning_rate": 6e-06, "loss": 1.2516, "step": 300 }, { "epoch": 1.88, "eval_loss": 0.9141018390655518, "eval_runtime": 33.4012, "eval_samples_per_second": 8.503, "eval_steps_per_second": 1.078, "eval_wer": 0.4135514018691589, "step": 300 }, { "epoch": 2.5, "learning_rate": 7.980000000000002e-06, "loss": 1.0859, "step": 400 }, { "epoch": 2.5, "eval_loss": 0.8359942436218262, "eval_runtime": 33.9773, "eval_samples_per_second": 8.359, "eval_steps_per_second": 1.06, "eval_wer": 0.3974883177570093, "step": 400 }, { "epoch": 3.12, "learning_rate": 9.980000000000001e-06, "loss": 1.0357, "step": 500 }, { "epoch": 3.12, "eval_loss": 0.8096792101860046, "eval_runtime": 33.8733, "eval_samples_per_second": 8.384, "eval_steps_per_second": 1.063, "eval_wer": 0.3814252336448598, "step": 500 }, { "epoch": 3.75, "learning_rate": 9.340000000000002e-06, "loss": 1.0472, "step": 600 }, { "epoch": 3.75, "eval_loss": 0.7550356984138489, "eval_runtime": 34.119, "eval_samples_per_second": 8.324, "eval_steps_per_second": 1.055, "eval_wer": 0.37529205607476634, "step": 600 }, { "epoch": 4.38, "learning_rate": 8.673333333333334e-06, "loss": 0.9963, "step": 700 }, { "epoch": 4.38, "eval_loss": 0.7533305287361145, "eval_runtime": 36.7992, "eval_samples_per_second": 7.718, "eval_steps_per_second": 0.978, "eval_wer": 0.36360981308411217, "step": 700 }, { "epoch": 5.0, "learning_rate": 8.006666666666667e-06, "loss": 0.9767, "step": 800 }, { "epoch": 5.0, "eval_loss": 0.7423538565635681, "eval_runtime": 33.6729, "eval_samples_per_second": 8.434, "eval_steps_per_second": 1.069, "eval_wer": 0.3589369158878505, "step": 800 }, { "epoch": 5.62, "learning_rate": 7.340000000000001e-06, "loss": 0.9667, "step": 900 }, { "epoch": 5.62, "eval_loss": 0.736015796661377, "eval_runtime": 34.1214, "eval_samples_per_second": 8.323, "eval_steps_per_second": 1.055, "eval_wer": 0.3516355140186916, "step": 900 }, { "epoch": 6.25, "learning_rate": 6.680000000000001e-06, "loss": 0.9385, "step": 1000 }, { "epoch": 6.25, "eval_loss": 0.7354543209075928, "eval_runtime": 33.4234, "eval_samples_per_second": 8.497, "eval_steps_per_second": 1.077, "eval_wer": 0.348714953271028, "step": 1000 }, { "epoch": 6.88, "learning_rate": 6.013333333333335e-06, "loss": 0.9805, "step": 1100 }, { "epoch": 6.88, "eval_loss": 0.7237350940704346, "eval_runtime": 36.5425, "eval_samples_per_second": 7.772, "eval_steps_per_second": 0.985, "eval_wer": 0.3463785046728972, "step": 1100 }, { "epoch": 7.5, "learning_rate": 5.346666666666667e-06, "loss": 0.976, "step": 1200 }, { "epoch": 7.5, "eval_loss": 0.7077719569206238, "eval_runtime": 33.9188, "eval_samples_per_second": 8.373, "eval_steps_per_second": 1.061, "eval_wer": 0.3455023364485981, "step": 1200 }, { "epoch": 8.12, "learning_rate": 4.680000000000001e-06, "loss": 0.88, "step": 1300 }, { "epoch": 8.12, "eval_loss": 0.7229148745536804, "eval_runtime": 33.6191, "eval_samples_per_second": 8.448, "eval_steps_per_second": 1.071, "eval_wer": 0.34375, "step": 1300 }, { "epoch": 8.75, "learning_rate": 4.013333333333334e-06, "loss": 0.9421, "step": 1400 }, { "epoch": 8.75, "eval_loss": 0.7180063128471375, "eval_runtime": 33.4233, "eval_samples_per_second": 8.497, "eval_steps_per_second": 1.077, "eval_wer": 0.3431658878504673, "step": 1400 }, { "epoch": 9.38, "learning_rate": 3.346666666666667e-06, "loss": 0.9584, "step": 1500 }, { "epoch": 9.38, "eval_loss": 0.705901563167572, "eval_runtime": 33.1792, "eval_samples_per_second": 8.56, "eval_steps_per_second": 1.085, "eval_wer": 0.3364485981308411, "step": 1500 }, { "epoch": 10.0, "learning_rate": 2.68e-06, "loss": 0.88, "step": 1600 }, { "epoch": 10.0, "eval_loss": 0.7106391191482544, "eval_runtime": 35.2342, "eval_samples_per_second": 8.06, "eval_steps_per_second": 1.022, "eval_wer": 0.3364485981308411, "step": 1600 }, { "epoch": 10.62, "learning_rate": 2.0133333333333337e-06, "loss": 0.9113, "step": 1700 }, { "epoch": 10.62, "eval_loss": 0.7124722599983215, "eval_runtime": 34.7063, "eval_samples_per_second": 8.183, "eval_steps_per_second": 1.037, "eval_wer": 0.33440420560747663, "step": 1700 }, { "epoch": 11.25, "learning_rate": 1.3466666666666668e-06, "loss": 0.912, "step": 1800 }, { "epoch": 11.25, "eval_loss": 0.7090508937835693, "eval_runtime": 33.4477, "eval_samples_per_second": 8.491, "eval_steps_per_second": 1.076, "eval_wer": 0.3352803738317757, "step": 1800 }, { "epoch": 11.88, "learning_rate": 6.800000000000001e-07, "loss": 0.9607, "step": 1900 }, { "epoch": 11.88, "eval_loss": 0.7066251635551453, "eval_runtime": 33.4966, "eval_samples_per_second": 8.478, "eval_steps_per_second": 1.075, "eval_wer": 0.33440420560747663, "step": 1900 }, { "epoch": 12.5, "learning_rate": 1.3333333333333334e-08, "loss": 0.8974, "step": 2000 }, { "epoch": 12.5, "eval_loss": 0.7064409852027893, "eval_runtime": 33.5058, "eval_samples_per_second": 8.476, "eval_steps_per_second": 1.074, "eval_wer": 0.33440420560747663, "step": 2000 }, { "epoch": 12.5, "step": 2000, "total_flos": 9.605345431463184e+18, "train_loss": 1.0512529983520509, "train_runtime": 9036.2889, "train_samples_per_second": 3.541, "train_steps_per_second": 0.221 } ], "logging_steps": 100, "max_steps": 2000, "num_train_epochs": 13, "save_steps": 100, "total_flos": 9.605345431463184e+18, "trial_name": null, "trial_params": null }