| { | |
| "best_metric": 0.9099219196343554, | |
| "best_model_checkpoint": "./output//roberta-large_ipc1_D_5_32_5e-6_0.01_0.06_07-08-22_05-38/checkpoint-54000", | |
| "epoch": 3.8676404571981076, | |
| "global_step": 56000, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.14, | |
| "learning_rate": 2.3020257826887664e-06, | |
| "loss": 0.2633, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.14, | |
| "eval_accuracy": 0.782186065915728, | |
| "eval_f1": 0.8434414112545581, | |
| "eval_loss": 0.12234517931938171, | |
| "eval_roc_auc": 0.8943263793686275, | |
| "eval_runtime": 707.0346, | |
| "eval_samples_per_second": 33.902, | |
| "eval_steps_per_second": 2.12, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "learning_rate": 4.604051565377533e-06, | |
| "loss": 0.1135, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.28, | |
| "eval_accuracy": 0.81543596161869, | |
| "eval_f1": 0.8686181075561606, | |
| "eval_loss": 0.09953225404024124, | |
| "eval_roc_auc": 0.9126753468236911, | |
| "eval_runtime": 707.1318, | |
| "eval_samples_per_second": 33.897, | |
| "eval_steps_per_second": 2.12, | |
| "step": 4000 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "learning_rate": 4.878326549205743e-06, | |
| "loss": 0.0975, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.41, | |
| "eval_accuracy": 0.827784730913642, | |
| "eval_f1": 0.8807810494379399, | |
| "eval_loss": 0.08744705468416214, | |
| "eval_roc_auc": 0.9195269073883311, | |
| "eval_runtime": 707.2934, | |
| "eval_samples_per_second": 33.89, | |
| "eval_steps_per_second": 2.119, | |
| "step": 6000 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "learning_rate": 4.731377937135384e-06, | |
| "loss": 0.0897, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.55, | |
| "eval_accuracy": 0.8280350438047559, | |
| "eval_f1": 0.883428263546798, | |
| "eval_loss": 0.08566972613334656, | |
| "eval_roc_auc": 0.9246573113358266, | |
| "eval_runtime": 707.7071, | |
| "eval_samples_per_second": 33.87, | |
| "eval_steps_per_second": 2.118, | |
| "step": 8000 | |
| }, | |
| { | |
| "epoch": 0.69, | |
| "learning_rate": 4.584429325065025e-06, | |
| "loss": 0.0845, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.69, | |
| "eval_accuracy": 0.8415936587400917, | |
| "eval_f1": 0.8920891085286283, | |
| "eval_loss": 0.07975932210683823, | |
| "eval_roc_auc": 0.928458970107628, | |
| "eval_runtime": 707.3951, | |
| "eval_samples_per_second": 33.885, | |
| "eval_steps_per_second": 2.119, | |
| "step": 10000 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "learning_rate": 4.437480712994666e-06, | |
| "loss": 0.0818, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.83, | |
| "eval_accuracy": 0.8427200667501042, | |
| "eval_f1": 0.8958713920350749, | |
| "eval_loss": 0.0771109014749527, | |
| "eval_roc_auc": 0.9319582466091877, | |
| "eval_runtime": 707.8327, | |
| "eval_samples_per_second": 33.864, | |
| "eval_steps_per_second": 2.118, | |
| "step": 12000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "learning_rate": 4.2905321009243076e-06, | |
| "loss": 0.0799, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 0.97, | |
| "eval_accuracy": 0.8450146015853149, | |
| "eval_f1": 0.8957159726658537, | |
| "eval_loss": 0.07565668225288391, | |
| "eval_roc_auc": 0.9295314687703254, | |
| "eval_runtime": 707.6287, | |
| "eval_samples_per_second": 33.874, | |
| "eval_steps_per_second": 2.118, | |
| "step": 14000 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "learning_rate": 4.143583488853948e-06, | |
| "loss": 0.0732, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.11, | |
| "eval_accuracy": 0.8493950771798081, | |
| "eval_f1": 0.8984909514907395, | |
| "eval_loss": 0.07519076764583588, | |
| "eval_roc_auc": 0.9326589314853615, | |
| "eval_runtime": 707.9951, | |
| "eval_samples_per_second": 33.856, | |
| "eval_steps_per_second": 2.117, | |
| "step": 16000 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "learning_rate": 3.996634876783589e-06, | |
| "loss": 0.0726, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.24, | |
| "eval_accuracy": 0.8492699207342511, | |
| "eval_f1": 0.8975535762903036, | |
| "eval_loss": 0.07450989633798599, | |
| "eval_roc_auc": 0.9289754929708756, | |
| "eval_runtime": 708.1958, | |
| "eval_samples_per_second": 33.847, | |
| "eval_steps_per_second": 2.117, | |
| "step": 18000 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "learning_rate": 3.84968626471323e-06, | |
| "loss": 0.0716, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.38, | |
| "eval_accuracy": 0.8525657071339174, | |
| "eval_f1": 0.9005084354055927, | |
| "eval_loss": 0.07325474917888641, | |
| "eval_roc_auc": 0.9340545363189772, | |
| "eval_runtime": 707.8752, | |
| "eval_samples_per_second": 33.862, | |
| "eval_steps_per_second": 2.118, | |
| "step": 20000 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "learning_rate": 3.702737652642871e-06, | |
| "loss": 0.0708, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.52, | |
| "eval_accuracy": 0.8506466416353775, | |
| "eval_f1": 0.9017078523041694, | |
| "eval_loss": 0.0716293528676033, | |
| "eval_roc_auc": 0.9380172851232347, | |
| "eval_runtime": 707.8218, | |
| "eval_samples_per_second": 33.864, | |
| "eval_steps_per_second": 2.118, | |
| "step": 22000 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "learning_rate": 3.555789040572512e-06, | |
| "loss": 0.0695, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.66, | |
| "eval_accuracy": 0.8547350855235711, | |
| "eval_f1": 0.9044931999464413, | |
| "eval_loss": 0.07056614011526108, | |
| "eval_roc_auc": 0.9387482370760931, | |
| "eval_runtime": 708.0549, | |
| "eval_samples_per_second": 33.853, | |
| "eval_steps_per_second": 2.117, | |
| "step": 24000 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "learning_rate": 3.4088404285021533e-06, | |
| "loss": 0.069, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.8, | |
| "eval_accuracy": 0.8569044639132248, | |
| "eval_f1": 0.9042787144565763, | |
| "eval_loss": 0.07104314118623734, | |
| "eval_roc_auc": 0.9356039344541693, | |
| "eval_runtime": 707.8507, | |
| "eval_samples_per_second": 33.863, | |
| "eval_steps_per_second": 2.118, | |
| "step": 26000 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "learning_rate": 3.261891816431794e-06, | |
| "loss": 0.0682, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 1.93, | |
| "eval_accuracy": 0.8599499374217772, | |
| "eval_f1": 0.9060724534406717, | |
| "eval_loss": 0.06967160105705261, | |
| "eval_roc_auc": 0.9372038441063302, | |
| "eval_runtime": 708.2055, | |
| "eval_samples_per_second": 33.846, | |
| "eval_steps_per_second": 2.117, | |
| "step": 28000 | |
| }, | |
| { | |
| "epoch": 2.07, | |
| "learning_rate": 3.1149432043614354e-06, | |
| "loss": 0.0639, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 2.07, | |
| "eval_accuracy": 0.854276178556529, | |
| "eval_f1": 0.9025946730864763, | |
| "eval_loss": 0.07231773436069489, | |
| "eval_roc_auc": 0.9380671303178707, | |
| "eval_runtime": 708.1848, | |
| "eval_samples_per_second": 33.847, | |
| "eval_steps_per_second": 2.117, | |
| "step": 30000 | |
| }, | |
| { | |
| "epoch": 2.21, | |
| "learning_rate": 2.9679945922910757e-06, | |
| "loss": 0.0595, | |
| "step": 32000 | |
| }, | |
| { | |
| "epoch": 2.21, | |
| "eval_accuracy": 0.8584897788902796, | |
| "eval_f1": 0.9064987752602572, | |
| "eval_loss": 0.07001405209302902, | |
| "eval_roc_auc": 0.9397355166673759, | |
| "eval_runtime": 708.0437, | |
| "eval_samples_per_second": 33.854, | |
| "eval_steps_per_second": 2.117, | |
| "step": 32000 | |
| }, | |
| { | |
| "epoch": 2.35, | |
| "learning_rate": 2.821045980220717e-06, | |
| "loss": 0.0609, | |
| "step": 34000 | |
| }, | |
| { | |
| "epoch": 2.35, | |
| "eval_accuracy": 0.8602002503128912, | |
| "eval_f1": 0.9077644010972264, | |
| "eval_loss": 0.06918834149837494, | |
| "eval_roc_auc": 0.9421116895582996, | |
| "eval_runtime": 707.9146, | |
| "eval_samples_per_second": 33.86, | |
| "eval_steps_per_second": 2.117, | |
| "step": 34000 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "learning_rate": 2.674097368150358e-06, | |
| "loss": 0.0612, | |
| "step": 36000 | |
| }, | |
| { | |
| "epoch": 2.49, | |
| "eval_accuracy": 0.8603671255736337, | |
| "eval_f1": 0.9078671395339969, | |
| "eval_loss": 0.06887050718069077, | |
| "eval_roc_auc": 0.9418260414584333, | |
| "eval_runtime": 708.0484, | |
| "eval_samples_per_second": 33.854, | |
| "eval_steps_per_second": 2.117, | |
| "step": 36000 | |
| }, | |
| { | |
| "epoch": 2.62, | |
| "learning_rate": 2.527148756079999e-06, | |
| "loss": 0.0607, | |
| "step": 38000 | |
| }, | |
| { | |
| "epoch": 2.62, | |
| "eval_accuracy": 0.8638715060492282, | |
| "eval_f1": 0.9094039329711531, | |
| "eval_loss": 0.0678349956870079, | |
| "eval_roc_auc": 0.941532162317987, | |
| "eval_runtime": 707.9126, | |
| "eval_samples_per_second": 33.86, | |
| "eval_steps_per_second": 2.117, | |
| "step": 38000 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "learning_rate": 2.38020014400964e-06, | |
| "loss": 0.0598, | |
| "step": 40000 | |
| }, | |
| { | |
| "epoch": 2.76, | |
| "eval_accuracy": 0.8620775969962453, | |
| "eval_f1": 0.9084244866628287, | |
| "eval_loss": 0.06894223392009735, | |
| "eval_roc_auc": 0.9398278292003405, | |
| "eval_runtime": 708.1682, | |
| "eval_samples_per_second": 33.848, | |
| "eval_steps_per_second": 2.117, | |
| "step": 40000 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "learning_rate": 2.233251531939281e-06, | |
| "loss": 0.0589, | |
| "step": 42000 | |
| }, | |
| { | |
| "epoch": 2.9, | |
| "eval_accuracy": 0.8625782227784731, | |
| "eval_f1": 0.9087424782492046, | |
| "eval_loss": 0.06813088804483414, | |
| "eval_roc_auc": 0.9405057223889542, | |
| "eval_runtime": 708.1038, | |
| "eval_samples_per_second": 33.851, | |
| "eval_steps_per_second": 2.117, | |
| "step": 42000 | |
| }, | |
| { | |
| "epoch": 3.04, | |
| "learning_rate": 2.086302919868922e-06, | |
| "loss": 0.0584, | |
| "step": 44000 | |
| }, | |
| { | |
| "epoch": 3.04, | |
| "eval_accuracy": 0.863537755527743, | |
| "eval_f1": 0.9081979164668188, | |
| "eval_loss": 0.07025768607854843, | |
| "eval_roc_auc": 0.9397884820006503, | |
| "eval_runtime": 707.4211, | |
| "eval_samples_per_second": 33.884, | |
| "eval_steps_per_second": 2.119, | |
| "step": 44000 | |
| }, | |
| { | |
| "epoch": 3.18, | |
| "learning_rate": 1.939354307798563e-06, | |
| "loss": 0.0521, | |
| "step": 46000 | |
| }, | |
| { | |
| "epoch": 3.18, | |
| "eval_accuracy": 0.8621610346266166, | |
| "eval_f1": 0.9091812742530537, | |
| "eval_loss": 0.0701606273651123, | |
| "eval_roc_auc": 0.941660515050063, | |
| "eval_runtime": 707.6705, | |
| "eval_samples_per_second": 33.872, | |
| "eval_steps_per_second": 2.118, | |
| "step": 46000 | |
| }, | |
| { | |
| "epoch": 3.32, | |
| "learning_rate": 1.792405695728204e-06, | |
| "loss": 0.0528, | |
| "step": 48000 | |
| }, | |
| { | |
| "epoch": 3.32, | |
| "eval_accuracy": 0.8632874426366292, | |
| "eval_f1": 0.9089131684876366, | |
| "eval_loss": 0.06941932439804077, | |
| "eval_roc_auc": 0.9405201937068114, | |
| "eval_runtime": 707.419, | |
| "eval_samples_per_second": 33.884, | |
| "eval_steps_per_second": 2.119, | |
| "step": 48000 | |
| }, | |
| { | |
| "epoch": 3.45, | |
| "learning_rate": 1.6454570836578452e-06, | |
| "loss": 0.0527, | |
| "step": 50000 | |
| }, | |
| { | |
| "epoch": 3.45, | |
| "eval_accuracy": 0.8617855652899458, | |
| "eval_f1": 0.9090562440419447, | |
| "eval_loss": 0.069430410861969, | |
| "eval_roc_auc": 0.9425349573751873, | |
| "eval_runtime": 707.7016, | |
| "eval_samples_per_second": 33.87, | |
| "eval_steps_per_second": 2.118, | |
| "step": 50000 | |
| }, | |
| { | |
| "epoch": 3.59, | |
| "learning_rate": 1.498508471587486e-06, | |
| "loss": 0.053, | |
| "step": 52000 | |
| }, | |
| { | |
| "epoch": 3.59, | |
| "eval_accuracy": 0.8624530663329162, | |
| "eval_f1": 0.9087446678854357, | |
| "eval_loss": 0.06918352842330933, | |
| "eval_roc_auc": 0.9427842849830317, | |
| "eval_runtime": 707.4215, | |
| "eval_samples_per_second": 33.884, | |
| "eval_steps_per_second": 2.119, | |
| "step": 52000 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "learning_rate": 1.351559859517127e-06, | |
| "loss": 0.0522, | |
| "step": 54000 | |
| }, | |
| { | |
| "epoch": 3.73, | |
| "eval_accuracy": 0.8645390070921986, | |
| "eval_f1": 0.9099219196343554, | |
| "eval_loss": 0.0693092793226242, | |
| "eval_roc_auc": 0.943445813623303, | |
| "eval_runtime": 717.1057, | |
| "eval_samples_per_second": 33.426, | |
| "eval_steps_per_second": 2.09, | |
| "step": 54000 | |
| }, | |
| { | |
| "epoch": 3.87, | |
| "learning_rate": 1.2046112474467679e-06, | |
| "loss": 0.0521, | |
| "step": 56000 | |
| }, | |
| { | |
| "epoch": 3.87, | |
| "eval_accuracy": 0.8630788485607008, | |
| "eval_f1": 0.9097205045758101, | |
| "eval_loss": 0.06953160464763641, | |
| "eval_roc_auc": 0.9436689409083443, | |
| "eval_runtime": 707.5176, | |
| "eval_samples_per_second": 33.879, | |
| "eval_steps_per_second": 2.119, | |
| "step": 56000 | |
| } | |
| ], | |
| "max_steps": 72395, | |
| "num_train_epochs": 5, | |
| "total_flos": 1.6700995925936701e+18, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |