{ "best_metric": 0.08737248182296753, "best_model_checkpoint": "bert-base-uncased-Abusive_Or_Threatening_Speech/checkpoint-1531", "epoch": 2.0, "global_step": 3062, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.999346832135859e-05, "loss": 0.7907, "step": 1 }, { "epoch": 0.03, "learning_rate": 1.967341606792946e-05, "loss": 0.2498, "step": 50 }, { "epoch": 0.07, "learning_rate": 1.9346832135858918e-05, "loss": 0.1179, "step": 100 }, { "epoch": 0.1, "learning_rate": 1.9020248203788378e-05, "loss": 0.1278, "step": 150 }, { "epoch": 0.13, "learning_rate": 1.8693664271717834e-05, "loss": 0.1106, "step": 200 }, { "epoch": 0.16, "learning_rate": 1.836708033964729e-05, "loss": 0.1209, "step": 250 }, { "epoch": 0.2, "learning_rate": 1.8040496407576747e-05, "loss": 0.109, "step": 300 }, { "epoch": 0.23, "learning_rate": 1.7713912475506207e-05, "loss": 0.1062, "step": 350 }, { "epoch": 0.26, "learning_rate": 1.7387328543435663e-05, "loss": 0.096, "step": 400 }, { "epoch": 0.29, "learning_rate": 1.7060744611365123e-05, "loss": 0.1032, "step": 450 }, { "epoch": 0.33, "learning_rate": 1.673416067929458e-05, "loss": 0.0895, "step": 500 }, { "epoch": 0.36, "learning_rate": 1.640757674722404e-05, "loss": 0.087, "step": 550 }, { "epoch": 0.39, "learning_rate": 1.6080992815153496e-05, "loss": 0.1026, "step": 600 }, { "epoch": 0.42, "learning_rate": 1.5754408883082955e-05, "loss": 0.0871, "step": 650 }, { "epoch": 0.46, "learning_rate": 1.5427824951012412e-05, "loss": 0.0948, "step": 700 }, { "epoch": 0.49, "learning_rate": 1.510124101894187e-05, "loss": 0.1008, "step": 750 }, { "epoch": 0.52, "learning_rate": 1.4774657086871326e-05, "loss": 0.0696, "step": 800 }, { "epoch": 0.56, "learning_rate": 1.4448073154800786e-05, "loss": 0.1023, "step": 850 }, { "epoch": 0.59, "learning_rate": 1.4121489222730243e-05, "loss": 0.1002, "step": 900 }, { "epoch": 0.62, "learning_rate": 1.37949052906597e-05, "loss": 0.0789, "step": 950 }, { "epoch": 0.65, "learning_rate": 1.3468321358589159e-05, "loss": 0.0844, "step": 1000 }, { "epoch": 0.69, "learning_rate": 1.3141737426518617e-05, "loss": 0.099, "step": 1050 }, { "epoch": 0.72, "learning_rate": 1.2815153494448073e-05, "loss": 0.0859, "step": 1100 }, { "epoch": 0.75, "learning_rate": 1.2488569562377533e-05, "loss": 0.0806, "step": 1150 }, { "epoch": 0.78, "learning_rate": 1.216198563030699e-05, "loss": 0.0762, "step": 1200 }, { "epoch": 0.82, "learning_rate": 1.1835401698236448e-05, "loss": 0.1023, "step": 1250 }, { "epoch": 0.85, "learning_rate": 1.1508817766165906e-05, "loss": 0.0875, "step": 1300 }, { "epoch": 0.88, "learning_rate": 1.1182233834095364e-05, "loss": 0.0867, "step": 1350 }, { "epoch": 0.91, "learning_rate": 1.085564990202482e-05, "loss": 0.0875, "step": 1400 }, { "epoch": 0.95, "learning_rate": 1.052906596995428e-05, "loss": 0.1097, "step": 1450 }, { "epoch": 0.98, "learning_rate": 1.0202482037883737e-05, "loss": 0.1008, "step": 1500 }, { "epoch": 1.0, "eval_F1": 0.7590146376294181, "eval_Precision": 0.6918320859095347, "eval_Recall": 0.8406484776591538, "eval_accuracy": 0.9720213052579221, "eval_loss": 0.08737248182296753, "eval_runtime": 21370.7121, "eval_samples_per_second": 2.258, "eval_steps_per_second": 0.035, "step": 1531 }, { "epoch": 1.01, "learning_rate": 9.875898105813195e-06, "loss": 0.0676, "step": 1550 }, { "epoch": 1.05, "learning_rate": 9.549314173742653e-06, "loss": 0.0564, "step": 1600 }, { "epoch": 1.08, "learning_rate": 9.222730241672111e-06, "loss": 0.0683, "step": 1650 }, { "epoch": 1.11, "learning_rate": 8.896146309601569e-06, "loss": 0.0593, "step": 1700 }, { "epoch": 1.14, "learning_rate": 8.569562377531027e-06, "loss": 0.0628, "step": 1750 }, { "epoch": 1.18, "learning_rate": 8.242978445460484e-06, "loss": 0.0528, "step": 1800 }, { "epoch": 1.21, "learning_rate": 7.916394513389942e-06, "loss": 0.0589, "step": 1850 }, { "epoch": 1.24, "learning_rate": 7.5898105813194e-06, "loss": 0.065, "step": 1900 }, { "epoch": 1.27, "learning_rate": 7.263226649248858e-06, "loss": 0.0582, "step": 1950 }, { "epoch": 1.31, "learning_rate": 6.936642717178315e-06, "loss": 0.0542, "step": 2000 }, { "epoch": 1.34, "learning_rate": 6.6100587851077734e-06, "loss": 0.0625, "step": 2050 }, { "epoch": 1.37, "learning_rate": 6.2834748530372315e-06, "loss": 0.0701, "step": 2100 }, { "epoch": 1.4, "learning_rate": 5.956890920966689e-06, "loss": 0.0698, "step": 2150 }, { "epoch": 1.44, "learning_rate": 5.630306988896147e-06, "loss": 0.0526, "step": 2200 }, { "epoch": 1.47, "learning_rate": 5.303723056825605e-06, "loss": 0.0724, "step": 2250 }, { "epoch": 1.5, "learning_rate": 4.977139124755062e-06, "loss": 0.0616, "step": 2300 }, { "epoch": 1.53, "learning_rate": 4.6505551926845204e-06, "loss": 0.0714, "step": 2350 }, { "epoch": 1.57, "learning_rate": 4.3239712606139786e-06, "loss": 0.0648, "step": 2400 }, { "epoch": 1.6, "learning_rate": 3.997387328543436e-06, "loss": 0.0629, "step": 2450 }, { "epoch": 1.63, "learning_rate": 3.670803396472894e-06, "loss": 0.0666, "step": 2500 }, { "epoch": 1.67, "learning_rate": 3.3442194644023516e-06, "loss": 0.0666, "step": 2550 }, { "epoch": 1.7, "learning_rate": 3.0176355323318098e-06, "loss": 0.0562, "step": 2600 }, { "epoch": 1.73, "learning_rate": 2.6910516002612675e-06, "loss": 0.056, "step": 2650 }, { "epoch": 1.76, "learning_rate": 2.364467668190725e-06, "loss": 0.0625, "step": 2700 }, { "epoch": 1.8, "learning_rate": 2.0378837361201833e-06, "loss": 0.064, "step": 2750 }, { "epoch": 1.83, "learning_rate": 1.711299804049641e-06, "loss": 0.0568, "step": 2800 }, { "epoch": 1.86, "learning_rate": 1.3847158719790987e-06, "loss": 0.0605, "step": 2850 }, { "epoch": 1.89, "learning_rate": 1.0581319399085566e-06, "loss": 0.057, "step": 2900 }, { "epoch": 1.93, "learning_rate": 7.315480078380144e-07, "loss": 0.0587, "step": 2950 }, { "epoch": 1.96, "learning_rate": 4.0496407576747226e-07, "loss": 0.0654, "step": 3000 }, { "epoch": 1.99, "learning_rate": 7.838014369693013e-08, "loss": 0.0673, "step": 3050 }, { "epoch": 2.0, "eval_F1": 0.7591474245115454, "eval_Precision": 0.6891325378910029, "eval_Recall": 0.844998022933966, "eval_accuracy": 0.9718969555035128, "eval_loss": 0.09812068194150925, "eval_runtime": 21573.5728, "eval_samples_per_second": 2.237, "eval_steps_per_second": 0.035, "step": 3062 }, { "epoch": 2.0, "step": 3062, "total_flos": 2.21505180842616e+16, "train_loss": 0.08183616427017301, "train_runtime": 498162.2121, "train_samples_per_second": 0.393, "train_steps_per_second": 0.006 } ], "max_steps": 3062, "num_train_epochs": 2, "total_flos": 2.21505180842616e+16, "trial_name": null, "trial_params": null }