{ "best_metric": 0.9504132231404959, "best_model_checkpoint": "videomae-base-finetuned-good-gestureUnitsV3/checkpoint-255", "epoch": 19.05, "eval_steps": 500, "global_step": 340, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.029411764705882353, "grad_norm": 9.534835815429688, "learning_rate": 1.4705882352941177e-06, "loss": 0.7047, "step": 10 }, { "epoch": 0.05, "eval_accuracy": 0.5619834710743802, "eval_accuracy_gunit": 0.575, "eval_accuracy_nothing": 0.5555555555555556, "eval_loss": 0.7023928165435791, "eval_runtime": 15.7256, "eval_samples_per_second": 7.694, "eval_steps_per_second": 1.017, "step": 17 }, { "epoch": 1.0088235294117647, "grad_norm": 5.451850414276123, "learning_rate": 2.9411764705882355e-06, "loss": 0.7083, "step": 20 }, { "epoch": 1.0382352941176471, "grad_norm": 5.070091724395752, "learning_rate": 4.411764705882353e-06, "loss": 0.6958, "step": 30 }, { "epoch": 1.05, "eval_accuracy": 0.38016528925619836, "eval_accuracy_gunit": 0.725, "eval_accuracy_nothing": 0.20987654320987653, "eval_loss": 0.7165102362632751, "eval_runtime": 15.8798, "eval_samples_per_second": 7.62, "eval_steps_per_second": 1.008, "step": 34 }, { "epoch": 2.0176470588235293, "grad_norm": 4.038697719573975, "learning_rate": 4.901960784313726e-06, "loss": 0.6585, "step": 40 }, { "epoch": 2.0470588235294116, "grad_norm": 3.2235519886016846, "learning_rate": 4.7385620915032685e-06, "loss": 0.6534, "step": 50 }, { "epoch": 2.05, "eval_accuracy": 0.371900826446281, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.13580246913580246, "eval_loss": 0.7150475382804871, "eval_runtime": 16.0184, "eval_samples_per_second": 7.554, "eval_steps_per_second": 0.999, "step": 51 }, { "epoch": 3.026470588235294, "grad_norm": 4.749432563781738, "learning_rate": 4.5751633986928105e-06, "loss": 0.655, "step": 60 }, { "epoch": 3.05, "eval_accuracy": 0.32231404958677684, "eval_accuracy_gunit": 0.975, "eval_accuracy_nothing": 0.0, "eval_loss": 0.7505635619163513, "eval_runtime": 15.7625, "eval_samples_per_second": 7.676, "eval_steps_per_second": 1.015, "step": 68 }, { "epoch": 4.0058823529411764, "grad_norm": 6.722472190856934, "learning_rate": 4.411764705882353e-06, "loss": 0.6741, "step": 70 }, { "epoch": 4.035294117647059, "grad_norm": 6.8286638259887695, "learning_rate": 4.2483660130718954e-06, "loss": 0.6545, "step": 80 }, { "epoch": 4.05, "eval_accuracy": 0.4297520661157025, "eval_accuracy_gunit": 0.95, "eval_accuracy_nothing": 0.1728395061728395, "eval_loss": 0.6991418600082397, "eval_runtime": 15.5171, "eval_samples_per_second": 7.798, "eval_steps_per_second": 1.031, "step": 85 }, { "epoch": 5.014705882352941, "grad_norm": 7.191628456115723, "learning_rate": 4.084967320261438e-06, "loss": 0.56, "step": 90 }, { "epoch": 5.044117647058823, "grad_norm": 5.416815757751465, "learning_rate": 3.92156862745098e-06, "loss": 0.6321, "step": 100 }, { "epoch": 5.05, "eval_accuracy": 0.47107438016528924, "eval_accuracy_gunit": 0.95, "eval_accuracy_nothing": 0.2345679012345679, "eval_loss": 0.6750265955924988, "eval_runtime": 15.9488, "eval_samples_per_second": 7.587, "eval_steps_per_second": 1.003, "step": 102 }, { "epoch": 6.023529411764706, "grad_norm": 4.386753559112549, "learning_rate": 3.758169934640523e-06, "loss": 0.5883, "step": 110 }, { "epoch": 6.05, "eval_accuracy": 0.743801652892562, "eval_accuracy_gunit": 0.9, "eval_accuracy_nothing": 0.6666666666666666, "eval_loss": 0.6142133474349976, "eval_runtime": 16.6481, "eval_samples_per_second": 7.268, "eval_steps_per_second": 0.961, "step": 119 }, { "epoch": 7.002941176470588, "grad_norm": 5.5603108406066895, "learning_rate": 3.5947712418300657e-06, "loss": 0.5803, "step": 120 }, { "epoch": 7.0323529411764705, "grad_norm": 3.9502112865448, "learning_rate": 3.431372549019608e-06, "loss": 0.5045, "step": 130 }, { "epoch": 7.05, "eval_accuracy": 0.8181818181818182, "eval_accuracy_gunit": 0.9, "eval_accuracy_nothing": 0.7777777777777778, "eval_loss": 0.549534022808075, "eval_runtime": 15.8267, "eval_samples_per_second": 7.645, "eval_steps_per_second": 1.011, "step": 136 }, { "epoch": 8.011764705882353, "grad_norm": 5.036988735198975, "learning_rate": 3.2679738562091506e-06, "loss": 0.578, "step": 140 }, { "epoch": 8.041176470588235, "grad_norm": 4.750277519226074, "learning_rate": 3.104575163398693e-06, "loss": 0.455, "step": 150 }, { "epoch": 8.05, "eval_accuracy": 0.71900826446281, "eval_accuracy_gunit": 0.925, "eval_accuracy_nothing": 0.6172839506172839, "eval_loss": 0.572287917137146, "eval_runtime": 16.0277, "eval_samples_per_second": 7.549, "eval_steps_per_second": 0.998, "step": 153 }, { "epoch": 9.020588235294118, "grad_norm": 4.390650749206543, "learning_rate": 2.9411764705882355e-06, "loss": 0.382, "step": 160 }, { "epoch": 9.05, "grad_norm": 12.403214454650879, "learning_rate": 2.7777777777777783e-06, "loss": 0.4191, "step": 170 }, { "epoch": 9.05, "eval_accuracy": 0.9338842975206612, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9753086419753086, "eval_loss": 0.37085020542144775, "eval_runtime": 19.423, "eval_samples_per_second": 6.23, "eval_steps_per_second": 0.824, "step": 170 }, { "epoch": 10.029411764705882, "grad_norm": 8.752729415893555, "learning_rate": 2.6143790849673208e-06, "loss": 0.365, "step": 180 }, { "epoch": 10.05, "eval_accuracy": 0.9090909090909091, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9382716049382716, "eval_loss": 0.3546590209007263, "eval_runtime": 15.5146, "eval_samples_per_second": 7.799, "eval_steps_per_second": 1.031, "step": 187 }, { "epoch": 11.008823529411766, "grad_norm": 6.302486896514893, "learning_rate": 2.450980392156863e-06, "loss": 0.3493, "step": 190 }, { "epoch": 11.038235294117648, "grad_norm": 4.457513809204102, "learning_rate": 2.2875816993464053e-06, "loss": 0.2593, "step": 200 }, { "epoch": 11.05, "eval_accuracy": 0.8925619834710744, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9135802469135802, "eval_loss": 0.36317938566207886, "eval_runtime": 15.7061, "eval_samples_per_second": 7.704, "eval_steps_per_second": 1.019, "step": 204 }, { "epoch": 12.01764705882353, "grad_norm": 11.817601203918457, "learning_rate": 2.1241830065359477e-06, "loss": 0.3111, "step": 210 }, { "epoch": 12.047058823529412, "grad_norm": 6.769512176513672, "learning_rate": 1.96078431372549e-06, "loss": 0.2225, "step": 220 }, { "epoch": 12.05, "eval_accuracy": 0.9421487603305785, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9876543209876543, "eval_loss": 0.24565516412258148, "eval_runtime": 20.1411, "eval_samples_per_second": 6.008, "eval_steps_per_second": 0.794, "step": 221 }, { "epoch": 13.026470588235295, "grad_norm": 3.0028862953186035, "learning_rate": 1.7973856209150328e-06, "loss": 0.2121, "step": 230 }, { "epoch": 13.05, "eval_accuracy": 0.9256198347107438, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9629629629629629, "eval_loss": 0.26187241077423096, "eval_runtime": 15.6231, "eval_samples_per_second": 7.745, "eval_steps_per_second": 1.024, "step": 238 }, { "epoch": 14.005882352941176, "grad_norm": 11.049546241760254, "learning_rate": 1.6339869281045753e-06, "loss": 0.1814, "step": 240 }, { "epoch": 14.035294117647059, "grad_norm": 13.598651885986328, "learning_rate": 1.4705882352941177e-06, "loss": 0.1506, "step": 250 }, { "epoch": 14.05, "eval_accuracy": 0.9504132231404959, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 1.0, "eval_loss": 0.2190253734588623, "eval_runtime": 15.7623, "eval_samples_per_second": 7.677, "eval_steps_per_second": 1.015, "step": 255 }, { "epoch": 15.014705882352942, "grad_norm": 5.206620693206787, "learning_rate": 1.3071895424836604e-06, "loss": 0.1518, "step": 260 }, { "epoch": 15.044117647058824, "grad_norm": 15.521167755126953, "learning_rate": 1.1437908496732026e-06, "loss": 0.1335, "step": 270 }, { "epoch": 15.05, "eval_accuracy": 0.9338842975206612, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9753086419753086, "eval_loss": 0.22213229537010193, "eval_runtime": 15.6243, "eval_samples_per_second": 7.744, "eval_steps_per_second": 1.024, "step": 272 }, { "epoch": 16.023529411764706, "grad_norm": 3.6706037521362305, "learning_rate": 9.80392156862745e-07, "loss": 0.1039, "step": 280 }, { "epoch": 16.05, "eval_accuracy": 0.9421487603305785, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9876543209876543, "eval_loss": 0.2107107788324356, "eval_runtime": 15.8386, "eval_samples_per_second": 7.64, "eval_steps_per_second": 1.01, "step": 289 }, { "epoch": 17.00294117647059, "grad_norm": 2.560628890991211, "learning_rate": 8.169934640522876e-07, "loss": 0.1959, "step": 290 }, { "epoch": 17.03235294117647, "grad_norm": 13.137368202209473, "learning_rate": 6.535947712418302e-07, "loss": 0.1036, "step": 300 }, { "epoch": 17.05, "eval_accuracy": 0.9421487603305785, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9876543209876543, "eval_loss": 0.20594191551208496, "eval_runtime": 15.7489, "eval_samples_per_second": 7.683, "eval_steps_per_second": 1.016, "step": 306 }, { "epoch": 18.011764705882353, "grad_norm": 105.94062805175781, "learning_rate": 4.901960784313725e-07, "loss": 0.139, "step": 310 }, { "epoch": 18.041176470588237, "grad_norm": 7.893646240234375, "learning_rate": 3.267973856209151e-07, "loss": 0.1019, "step": 320 }, { "epoch": 18.05, "eval_accuracy": 0.9421487603305785, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 0.9876543209876543, "eval_loss": 0.2062729150056839, "eval_runtime": 15.7147, "eval_samples_per_second": 7.7, "eval_steps_per_second": 1.018, "step": 323 }, { "epoch": 19.020588235294117, "grad_norm": 4.479135036468506, "learning_rate": 1.6339869281045755e-07, "loss": 0.0837, "step": 330 }, { "epoch": 19.05, "grad_norm": 84.62340545654297, "learning_rate": 0.0, "loss": 0.1181, "step": 340 }, { "epoch": 19.05, "eval_accuracy": 0.9504132231404959, "eval_accuracy_gunit": 0.85, "eval_accuracy_nothing": 1.0, "eval_loss": 0.21026436984539032, "eval_runtime": 15.8645, "eval_samples_per_second": 7.627, "eval_steps_per_second": 1.009, "step": 340 }, { "epoch": 19.05, "step": 340, "total_flos": 3.339453099784274e+18, "train_loss": 0.3907703813384561, "train_runtime": 996.3737, "train_samples_per_second": 2.73, "train_steps_per_second": 0.341 }, { "epoch": 19.05, "eval_accuracy": 0.8932038834951457, "eval_accuracy_gunit": 0.5416666666666666, "eval_accuracy_nothing": 1.0, "eval_loss": 0.34902578592300415, "eval_runtime": 14.5221, "eval_samples_per_second": 7.093, "eval_steps_per_second": 0.895, "step": 340 }, { "epoch": 19.05, "eval_accuracy": 0.8932038834951457, "eval_accuracy_gunit": 0.5416666666666666, "eval_accuracy_nothing": 1.0, "eval_loss": 0.3490257263183594, "eval_runtime": 13.7098, "eval_samples_per_second": 7.513, "eval_steps_per_second": 0.948, "step": 340 } ], "logging_steps": 10, "max_steps": 340, "num_input_tokens_seen": 0, "num_train_epochs": 9223372036854775807, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 3.339453099784274e+18, "train_batch_size": 8, "trial_name": null, "trial_params": null }