| { |
| "best_metric": null, |
| "best_model_checkpoint": null, |
| "epoch": 2.701164294954722, |
| "global_step": 4176, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 0.03, |
| "learning_rate": 5.064655172413793e-06, |
| "loss": 1.827, |
| "step": 47 |
| }, |
| { |
| "epoch": 0.06, |
| "learning_rate": 1.0129310344827586e-05, |
| "loss": 1.288, |
| "step": 94 |
| }, |
| { |
| "epoch": 0.09, |
| "learning_rate": 1.5086206896551724e-05, |
| "loss": 1.0612, |
| "step": 141 |
| }, |
| { |
| "epoch": 0.12, |
| "learning_rate": 2.0150862068965517e-05, |
| "loss": 0.9538, |
| "step": 188 |
| }, |
| { |
| "epoch": 0.15, |
| "eval_accuracy": 0.6960748846884327, |
| "eval_b_acc": 0.4789797300032158, |
| "eval_f1": 0.683716357682452, |
| "eval_f1_anger": 0.497677504976775, |
| "eval_f1_disgust": 0.0035460992907801418, |
| "eval_f1_fear": 0.4832126398946675, |
| "eval_f1_joy": 0.685316256600382, |
| "eval_f1_neutral": 0.827884745457005, |
| "eval_f1_sadness": 0.5799599198396794, |
| "eval_f1_surprise": 0.2866323907455013, |
| "eval_loss": 0.8701004981994629, |
| "eval_prec": 0.6836877535141815, |
| "eval_prec_anger": 0.462202136400986, |
| "eval_prec_disgust": 0.25, |
| "eval_prec_fear": 0.552710843373494, |
| "eval_prec_joy": 0.7401116233923805, |
| "eval_prec_neutral": 0.796529284164859, |
| "eval_prec_sadness": 0.5281021897810219, |
| "eval_prec_surprise": 0.3562300319488818, |
| "eval_recall": 0.6960748846884327, |
| "eval_recall_anger": 0.5390512697652132, |
| "eval_recall_disgust": 0.0017857142857142857, |
| "eval_recall_fear": 0.42923976608187137, |
| "eval_recall_joy": 0.6380753138075314, |
| "eval_recall_neutral": 0.86180998873451, |
| "eval_recall_sadness": 0.6431111111111111, |
| "eval_recall_surprise": 0.23978494623655913, |
| "eval_runtime": 16.0297, |
| "eval_samples_per_second": 1379.566, |
| "eval_steps_per_second": 10.792, |
| "step": 232 |
| }, |
| { |
| "epoch": 0.15, |
| "learning_rate": 2.521551724137931e-05, |
| "loss": 0.8837, |
| "step": 235 |
| }, |
| { |
| "epoch": 0.18, |
| "learning_rate": 3.0280172413793107e-05, |
| "loss": 0.881, |
| "step": 282 |
| }, |
| { |
| "epoch": 0.21, |
| "learning_rate": 3.53448275862069e-05, |
| "loss": 0.8462, |
| "step": 329 |
| }, |
| { |
| "epoch": 0.24, |
| "learning_rate": 4.0409482758620696e-05, |
| "loss": 0.8242, |
| "step": 376 |
| }, |
| { |
| "epoch": 0.27, |
| "learning_rate": 4.5474137931034485e-05, |
| "loss": 0.7952, |
| "step": 423 |
| }, |
| { |
| "epoch": 0.3, |
| "eval_accuracy": 0.7168309668083567, |
| "eval_b_acc": 0.5241940962877409, |
| "eval_f1": 0.7025228198992769, |
| "eval_f1_anger": 0.5170962651236192, |
| "eval_f1_disgust": 0.3386727688787185, |
| "eval_f1_fear": 0.5674653215636821, |
| "eval_f1_joy": 0.6853079426298663, |
| "eval_f1_neutral": 0.8225570814375757, |
| "eval_f1_sadness": 0.6211089494163424, |
| "eval_f1_surprise": 0.37250000000000005, |
| "eval_loss": 0.8009697198867798, |
| "eval_prec": 0.7097552640353452, |
| "eval_prec_anger": 0.5731778425655977, |
| "eval_prec_disgust": 0.4713375796178344, |
| "eval_prec_fear": 0.615595075239398, |
| "eval_prec_joy": 0.8083593972135342, |
| "eval_prec_neutral": 0.7405486659150695, |
| "eval_prec_sadness": 0.6858216970998926, |
| "eval_prec_surprise": 0.44477611940298506, |
| "eval_recall": 0.7168309668083567, |
| "eval_recall_anger": 0.4710110206037374, |
| "eval_recall_disgust": 0.2642857142857143, |
| "eval_recall_fear": 0.5263157894736842, |
| "eval_recall_joy": 0.5947698744769875, |
| "eval_recall_neutral": 0.924990612091626, |
| "eval_recall_sadness": 0.5675555555555556, |
| "eval_recall_surprise": 0.3204301075268817, |
| "eval_runtime": 15.1427, |
| "eval_samples_per_second": 1460.377, |
| "eval_steps_per_second": 11.425, |
| "step": 464 |
| }, |
| { |
| "epoch": 0.3, |
| "learning_rate": 4.9940105414470535e-05, |
| "loss": 0.7998, |
| "step": 470 |
| }, |
| { |
| "epoch": 0.33, |
| "learning_rate": 4.938907522759943e-05, |
| "loss": 0.7996, |
| "step": 517 |
| }, |
| { |
| "epoch": 0.36, |
| "learning_rate": 4.882606612362243e-05, |
| "loss": 0.776, |
| "step": 564 |
| }, |
| { |
| "epoch": 0.4, |
| "learning_rate": 4.826305701964542e-05, |
| "loss": 0.8018, |
| "step": 611 |
| }, |
| { |
| "epoch": 0.43, |
| "learning_rate": 4.770004791566843e-05, |
| "loss": 0.7528, |
| "step": 658 |
| }, |
| { |
| "epoch": 0.45, |
| "eval_accuracy": 0.7260558921949896, |
| "eval_b_acc": 0.5878316350938373, |
| "eval_f1": 0.7255951803151626, |
| "eval_f1_anger": 0.5542226487523992, |
| "eval_f1_disgust": 0.3994082840236686, |
| "eval_f1_fear": 0.5798319327731093, |
| "eval_f1_joy": 0.7291770573566084, |
| "eval_f1_neutral": 0.8314359514015114, |
| "eval_f1_sadness": 0.6541166735622672, |
| "eval_f1_surprise": 0.38283828382838286, |
| "eval_loss": 0.7560049891471863, |
| "eval_prec": 0.7309376250219672, |
| "eval_prec_anger": 0.5550216242191254, |
| "eval_prec_disgust": 0.3409090909090909, |
| "eval_prec_fear": 0.7225130890052356, |
| "eval_prec_joy": 0.6968541468064824, |
| "eval_prec_neutral": 0.847571679344646, |
| "eval_prec_sadness": 0.6118421052631579, |
| "eval_prec_surprise": 0.49572649572649574, |
| "eval_recall": 0.7260558921949896, |
| "eval_recall_anger": 0.5534259702922856, |
| "eval_recall_disgust": 0.48214285714285715, |
| "eval_recall_fear": 0.4842105263157895, |
| "eval_recall_joy": 0.7646443514644351, |
| "eval_recall_neutral": 0.8159031167855801, |
| "eval_recall_sadness": 0.7026666666666667, |
| "eval_recall_surprise": 0.3118279569892473, |
| "eval_runtime": 14.7708, |
| "eval_samples_per_second": 1497.143, |
| "eval_steps_per_second": 11.712, |
| "step": 696 |
| }, |
| { |
| "epoch": 0.46, |
| "learning_rate": 4.713703881169142e-05, |
| "loss": 0.7459, |
| "step": 705 |
| }, |
| { |
| "epoch": 0.49, |
| "learning_rate": 4.657402970771442e-05, |
| "loss": 0.7599, |
| "step": 752 |
| }, |
| { |
| "epoch": 0.52, |
| "learning_rate": 4.601102060373742e-05, |
| "loss": 0.7648, |
| "step": 799 |
| }, |
| { |
| "epoch": 0.55, |
| "learning_rate": 4.544801149976042e-05, |
| "loss": 0.7436, |
| "step": 846 |
| }, |
| { |
| "epoch": 0.58, |
| "learning_rate": 4.488500239578342e-05, |
| "loss": 0.7334, |
| "step": 893 |
| }, |
| { |
| "epoch": 0.6, |
| "eval_accuracy": 0.7370444062584788, |
| "eval_b_acc": 0.5867600905079025, |
| "eval_f1": 0.7282740654207969, |
| "eval_f1_anger": 0.5218712029161603, |
| "eval_f1_disgust": 0.4505649717514124, |
| "eval_f1_fear": 0.6104060913705585, |
| "eval_f1_joy": 0.7311320754716981, |
| "eval_f1_neutral": 0.8351327433628318, |
| "eval_f1_sadness": 0.6498640968618731, |
| "eval_f1_surprise": 0.4181229773462783, |
| "eval_loss": 0.7309762835502625, |
| "eval_prec": 0.7344879537976949, |
| "eval_prec_anger": 0.7128630705394191, |
| "eval_prec_disgust": 0.3726635514018692, |
| "eval_prec_fear": 0.6671289875173371, |
| "eval_prec_joy": 0.7170152855993563, |
| "eval_prec_neutral": 0.7898393036491463, |
| "eval_prec_sadness": 0.7317751808569839, |
| "eval_prec_surprise": 0.5252032520325203, |
| "eval_recall": 0.7370444062584788, |
| "eval_recall_anger": 0.411595591758505, |
| "eval_recall_disgust": 0.5696428571428571, |
| "eval_recall_fear": 0.5625730994152047, |
| "eval_recall_joy": 0.74581589958159, |
| "eval_recall_neutral": 0.8859369132557267, |
| "eval_recall_sadness": 0.5844444444444444, |
| "eval_recall_surprise": 0.3473118279569892, |
| "eval_runtime": 14.5647, |
| "eval_samples_per_second": 1518.332, |
| "eval_steps_per_second": 11.878, |
| "step": 928 |
| }, |
| { |
| "epoch": 0.61, |
| "learning_rate": 4.432199329180642e-05, |
| "loss": 0.7493, |
| "step": 940 |
| }, |
| { |
| "epoch": 0.64, |
| "learning_rate": 4.375898418782942e-05, |
| "loss": 0.7194, |
| "step": 987 |
| }, |
| { |
| "epoch": 0.67, |
| "learning_rate": 4.319597508385242e-05, |
| "loss": 0.7158, |
| "step": 1034 |
| }, |
| { |
| "epoch": 0.7, |
| "learning_rate": 4.263296597987542e-05, |
| "loss": 0.719, |
| "step": 1081 |
| }, |
| { |
| "epoch": 0.73, |
| "learning_rate": 4.206995687589842e-05, |
| "loss": 0.7216, |
| "step": 1128 |
| }, |
| { |
| "epoch": 0.75, |
| "eval_accuracy": 0.7448222845256399, |
| "eval_b_acc": 0.6009457685058381, |
| "eval_f1": 0.7388819166581033, |
| "eval_f1_anger": 0.5746421267893661, |
| "eval_f1_disgust": 0.48046875, |
| "eval_f1_fear": 0.6597796143250689, |
| "eval_f1_joy": 0.7266451397394499, |
| "eval_f1_neutral": 0.8355743035416118, |
| "eval_f1_sadness": 0.6644859813084112, |
| "eval_f1_surprise": 0.4711696869851729, |
| "eval_loss": 0.7043296694755554, |
| "eval_prec": 0.7402960337790491, |
| "eval_prec_anger": 0.6158904109589041, |
| "eval_prec_disgust": 0.5301724137931034, |
| "eval_prec_fear": 0.8023450586264657, |
| "eval_prec_joy": 0.7767198286122352, |
| "eval_prec_neutral": 0.7853956715678176, |
| "eval_prec_sadness": 0.7004926108374384, |
| "eval_prec_surprise": 0.48148148148148145, |
| "eval_recall": 0.7448222845256399, |
| "eval_recall_anger": 0.5385721130809775, |
| "eval_recall_disgust": 0.4392857142857143, |
| "eval_recall_fear": 0.560233918128655, |
| "eval_recall_joy": 0.6826359832635983, |
| "eval_recall_neutral": 0.8926023282012767, |
| "eval_recall_sadness": 0.632, |
| "eval_recall_surprise": 0.4612903225806452, |
| "eval_runtime": 14.6801, |
| "eval_samples_per_second": 1506.393, |
| "eval_steps_per_second": 11.785, |
| "step": 1160 |
| }, |
| { |
| "epoch": 0.76, |
| "learning_rate": 4.150694777192142e-05, |
| "loss": 0.7134, |
| "step": 1175 |
| }, |
| { |
| "epoch": 0.79, |
| "learning_rate": 4.094393866794442e-05, |
| "loss": 0.7029, |
| "step": 1222 |
| }, |
| { |
| "epoch": 0.82, |
| "learning_rate": 4.0380929563967415e-05, |
| "loss": 0.6945, |
| "step": 1269 |
| }, |
| { |
| "epoch": 0.85, |
| "learning_rate": 3.981792045999042e-05, |
| "loss": 0.7033, |
| "step": 1316 |
| }, |
| { |
| "epoch": 0.88, |
| "learning_rate": 3.9254911356013415e-05, |
| "loss": 0.7259, |
| "step": 1363 |
| }, |
| { |
| "epoch": 0.9, |
| "eval_accuracy": 0.7475354978746496, |
| "eval_b_acc": 0.6082480515560814, |
| "eval_f1": 0.741168197686153, |
| "eval_f1_anger": 0.5405405405405406, |
| "eval_f1_disgust": 0.4599559147685525, |
| "eval_f1_fear": 0.6475358702432937, |
| "eval_f1_joy": 0.7468589083419156, |
| "eval_f1_neutral": 0.8421338155515371, |
| "eval_f1_sadness": 0.6752079118903124, |
| "eval_f1_surprise": 0.42070338420703385, |
| "eval_loss": 0.6962281465530396, |
| "eval_prec": 0.7432901970674257, |
| "eval_prec_anger": 0.6757728253055356, |
| "eval_prec_disgust": 0.39076154806491886, |
| "eval_prec_fear": 0.6938502673796791, |
| "eval_prec_joy": 0.7354969574036511, |
| "eval_prec_neutral": 0.8121730031391698, |
| "eval_prec_sadness": 0.683037744429286, |
| "eval_prec_surprise": 0.5493934142114385, |
| "eval_recall": 0.7475354978746496, |
| "eval_recall_anger": 0.4504072831816004, |
| "eval_recall_disgust": 0.5589285714285714, |
| "eval_recall_fear": 0.6070175438596491, |
| "eval_recall_joy": 0.7585774058577406, |
| "eval_recall_neutral": 0.8743897859556891, |
| "eval_recall_sadness": 0.6675555555555556, |
| "eval_recall_surprise": 0.34086021505376346, |
| "eval_runtime": 14.6912, |
| "eval_samples_per_second": 1505.258, |
| "eval_steps_per_second": 11.776, |
| "step": 1392 |
| }, |
| { |
| "epoch": 0.91, |
| "learning_rate": 3.8691902252036415e-05, |
| "loss": 0.7143, |
| "step": 1410 |
| }, |
| { |
| "epoch": 0.94, |
| "learning_rate": 3.812889314805942e-05, |
| "loss": 0.6903, |
| "step": 1457 |
| }, |
| { |
| "epoch": 0.97, |
| "learning_rate": 3.7565884044082415e-05, |
| "loss": 0.6812, |
| "step": 1504 |
| }, |
| { |
| "epoch": 1.0, |
| "learning_rate": 3.7002874940105415e-05, |
| "loss": 0.7182, |
| "step": 1551 |
| }, |
| { |
| "epoch": 1.03, |
| "learning_rate": 3.6439865836128415e-05, |
| "loss": 0.6362, |
| "step": 1598 |
| }, |
| { |
| "epoch": 1.05, |
| "eval_accuracy": 0.7526453830152844, |
| "eval_b_acc": 0.6055170494206373, |
| "eval_f1": 0.7483739984911967, |
| "eval_f1_anger": 0.602752507581059, |
| "eval_f1_disgust": 0.4405010438413361, |
| "eval_f1_fear": 0.6491803278688525, |
| "eval_f1_joy": 0.7437363551304709, |
| "eval_f1_neutral": 0.8435330654000731, |
| "eval_f1_sadness": 0.6785631517960602, |
| "eval_f1_surprise": 0.45454545454545453, |
| "eval_loss": 0.6771188974380493, |
| "eval_prec": 0.7472415916170276, |
| "eval_prec_anger": 0.5872727272727273, |
| "eval_prec_disgust": 0.5301507537688442, |
| "eval_prec_fear": 0.7388059701492538, |
| "eval_prec_joy": 0.739202314527795, |
| "eval_prec_neutral": 0.8213269299181786, |
| "eval_prec_sadness": 0.7089588377723971, |
| "eval_prec_surprise": 0.5300859598853869, |
| "eval_recall": 0.7526453830152844, |
| "eval_recall_anger": 0.6190704360325826, |
| "eval_recall_disgust": 0.3767857142857143, |
| "eval_recall_fear": 0.5789473684210527, |
| "eval_recall_joy": 0.748326359832636, |
| "eval_recall_neutral": 0.8669733383402178, |
| "eval_recall_sadness": 0.6506666666666666, |
| "eval_recall_surprise": 0.3978494623655914, |
| "eval_runtime": 14.8683, |
| "eval_samples_per_second": 1487.33, |
| "eval_steps_per_second": 11.636, |
| "step": 1624 |
| }, |
| { |
| "epoch": 1.06, |
| "learning_rate": 3.5876856732151415e-05, |
| "loss": 0.6432, |
| "step": 1645 |
| }, |
| { |
| "epoch": 1.09, |
| "learning_rate": 3.5313847628174415e-05, |
| "loss": 0.652, |
| "step": 1692 |
| }, |
| { |
| "epoch": 1.12, |
| "learning_rate": 3.4750838524197415e-05, |
| "loss": 0.6474, |
| "step": 1739 |
| }, |
| { |
| "epoch": 1.16, |
| "learning_rate": 3.4187829420220415e-05, |
| "loss": 0.6364, |
| "step": 1786 |
| }, |
| { |
| "epoch": 1.19, |
| "learning_rate": 3.362482031624341e-05, |
| "loss": 0.621, |
| "step": 1833 |
| }, |
| { |
| "epoch": 1.2, |
| "eval_accuracy": 0.7528262639052185, |
| "eval_b_acc": 0.6120366345893286, |
| "eval_f1": 0.7487165396015127, |
| "eval_f1_anger": 0.6196334421290485, |
| "eval_f1_disgust": 0.47378277153558057, |
| "eval_f1_fear": 0.6528640441683919, |
| "eval_f1_joy": 0.7450472872075661, |
| "eval_f1_neutral": 0.8372220697227559, |
| "eval_f1_sadness": 0.6809026935209901, |
| "eval_f1_surprise": 0.4612676056338028, |
| "eval_loss": 0.67792809009552, |
| "eval_prec": 0.749407175516463, |
| "eval_prec_anger": 0.6508438818565401, |
| "eval_prec_disgust": 0.49803149606299213, |
| "eval_prec_fear": 0.7962962962962963, |
| "eval_prec_joy": 0.7107312440645774, |
| "eval_prec_neutral": 0.8165268606103873, |
| "eval_prec_sadness": 0.7498663816141101, |
| "eval_prec_surprise": 0.5077519379844961, |
| "eval_recall": 0.7528262639052185, |
| "eval_recall_anger": 0.5912793483469094, |
| "eval_recall_disgust": 0.4517857142857143, |
| "eval_recall_fear": 0.5532163742690058, |
| "eval_recall_joy": 0.7828451882845189, |
| "eval_recall_neutral": 0.8589936162223056, |
| "eval_recall_sadness": 0.6235555555555555, |
| "eval_recall_surprise": 0.42258064516129035, |
| "eval_runtime": 14.7115, |
| "eval_samples_per_second": 1503.179, |
| "eval_steps_per_second": 11.76, |
| "step": 1856 |
| }, |
| { |
| "epoch": 1.22, |
| "learning_rate": 3.3061811212266415e-05, |
| "loss": 0.6195, |
| "step": 1880 |
| }, |
| { |
| "epoch": 1.25, |
| "learning_rate": 3.249880210828941e-05, |
| "loss": 0.6332, |
| "step": 1927 |
| }, |
| { |
| "epoch": 1.28, |
| "learning_rate": 3.1935793004312415e-05, |
| "loss": 0.6251, |
| "step": 1974 |
| }, |
| { |
| "epoch": 1.31, |
| "learning_rate": 3.1372783900335415e-05, |
| "loss": 0.63, |
| "step": 2021 |
| }, |
| { |
| "epoch": 1.34, |
| "learning_rate": 3.080977479635841e-05, |
| "loss": 0.6241, |
| "step": 2068 |
| }, |
| { |
| "epoch": 1.35, |
| "eval_accuracy": 0.7512887763407796, |
| "eval_b_acc": 0.6367091163081916, |
| "eval_f1": 0.7514440246825209, |
| "eval_f1_anger": 0.6141022752872269, |
| "eval_f1_disgust": 0.4511668107173725, |
| "eval_f1_fear": 0.6488060570762958, |
| "eval_f1_joy": 0.7509570615623384, |
| "eval_f1_neutral": 0.843150231634679, |
| "eval_f1_sadness": 0.6745293717396236, |
| "eval_f1_surprise": 0.4730290456431535, |
| "eval_loss": 0.6849319338798523, |
| "eval_prec": 0.7525985800729426, |
| "eval_prec_anger": 0.5795068027210885, |
| "eval_prec_disgust": 0.4371859296482412, |
| "eval_prec_fear": 0.6461716937354989, |
| "eval_prec_joy": 0.7428863868986694, |
| "eval_prec_neutral": 0.849171586364502, |
| "eval_prec_sadness": 0.6887447892542844, |
| "eval_prec_surprise": 0.5270805812417437, |
| "eval_recall": 0.7512887763407796, |
| "eval_recall_anger": 0.6530905606133206, |
| "eval_recall_disgust": 0.4660714285714286, |
| "eval_recall_fear": 0.6514619883040935, |
| "eval_recall_joy": 0.7592050209205021, |
| "eval_recall_neutral": 0.8372136687945926, |
| "eval_recall_sadness": 0.6608888888888889, |
| "eval_recall_surprise": 0.4290322580645161, |
| "eval_runtime": 14.591, |
| "eval_samples_per_second": 1515.587, |
| "eval_steps_per_second": 11.857, |
| "step": 2088 |
| }, |
| { |
| "epoch": 1.37, |
| "learning_rate": 3.024676569238141e-05, |
| "loss": 0.5997, |
| "step": 2115 |
| }, |
| { |
| "epoch": 1.4, |
| "learning_rate": 2.968375658840441e-05, |
| "loss": 0.6348, |
| "step": 2162 |
| }, |
| { |
| "epoch": 1.43, |
| "learning_rate": 2.9120747484427408e-05, |
| "loss": 0.6269, |
| "step": 2209 |
| }, |
| { |
| "epoch": 1.46, |
| "learning_rate": 2.855773838045041e-05, |
| "loss": 0.6411, |
| "step": 2256 |
| }, |
| { |
| "epoch": 1.49, |
| "learning_rate": 2.7994729276473408e-05, |
| "loss": 0.6188, |
| "step": 2303 |
| }, |
| { |
| "epoch": 1.5, |
| "eval_accuracy": 0.7578909288233698, |
| "eval_b_acc": 0.6158634091154939, |
| "eval_f1": 0.7533929534836733, |
| "eval_f1_anger": 0.6305133767172812, |
| "eval_f1_disgust": 0.45919477693144717, |
| "eval_f1_fear": 0.6729323308270676, |
| "eval_f1_joy": 0.7494099134539732, |
| "eval_f1_neutral": 0.84280126653008, |
| "eval_f1_sadness": 0.681602172437203, |
| "eval_f1_surprise": 0.4503664223850767, |
| "eval_loss": 0.6713131070137024, |
| "eval_prec": 0.7538941653702528, |
| "eval_prec_anger": 0.6343355965082444, |
| "eval_prec_disgust": 0.5877437325905293, |
| "eval_prec_fear": 0.7246963562753036, |
| "eval_prec_joy": 0.7071269487750557, |
| "eval_prec_neutral": 0.8361049519586105, |
| "eval_prec_sadness": 0.69432918395574, |
| "eval_prec_surprise": 0.5919439579684763, |
| "eval_recall": 0.7578909288233698, |
| "eval_recall_anger": 0.6267369429803545, |
| "eval_recall_disgust": 0.3767857142857143, |
| "eval_recall_fear": 0.6280701754385964, |
| "eval_recall_joy": 0.797071129707113, |
| "eval_recall_neutral": 0.8496057078482914, |
| "eval_recall_sadness": 0.6693333333333333, |
| "eval_recall_surprise": 0.3634408602150538, |
| "eval_runtime": 14.588, |
| "eval_samples_per_second": 1515.9, |
| "eval_steps_per_second": 11.859, |
| "step": 2320 |
| }, |
| { |
| "epoch": 1.52, |
| "learning_rate": 2.7431720172496405e-05, |
| "loss": 0.622, |
| "step": 2350 |
| }, |
| { |
| "epoch": 1.55, |
| "learning_rate": 2.6868711068519408e-05, |
| "loss": 0.6278, |
| "step": 2397 |
| }, |
| { |
| "epoch": 1.58, |
| "learning_rate": 2.6305701964542405e-05, |
| "loss": 0.6227, |
| "step": 2444 |
| }, |
| { |
| "epoch": 1.61, |
| "learning_rate": 2.5742692860565405e-05, |
| "loss": 0.6337, |
| "step": 2491 |
| }, |
| { |
| "epoch": 1.64, |
| "learning_rate": 2.5179683756588408e-05, |
| "loss": 0.6182, |
| "step": 2538 |
| }, |
| { |
| "epoch": 1.65, |
| "eval_accuracy": 0.760106719725061, |
| "eval_b_acc": 0.6198832054514857, |
| "eval_f1": 0.7565733944354605, |
| "eval_f1_anger": 0.625943396226415, |
| "eval_f1_disgust": 0.4582893347412883, |
| "eval_f1_fear": 0.6753246753246753, |
| "eval_f1_joy": 0.7498260610277309, |
| "eval_f1_neutral": 0.8475095074668398, |
| "eval_f1_sadness": 0.6851194700733381, |
| "eval_f1_surprise": 0.4700181708055723, |
| "eval_loss": 0.6608244180679321, |
| "eval_prec": 0.7566647637236428, |
| "eval_prec_anger": 0.6163492800743149, |
| "eval_prec_disgust": 0.5607235142118863, |
| "eval_prec_fear": 0.7591240875912408, |
| "eval_prec_joy": 0.7142586631319826, |
| "eval_prec_neutral": 0.8374885426214482, |
| "eval_prec_sadness": 0.7324228629236217, |
| "eval_prec_surprise": 0.5381414701803051, |
| "eval_recall": 0.760106719725061, |
| "eval_recall_anger": 0.6358409199808337, |
| "eval_recall_disgust": 0.3875, |
| "eval_recall_fear": 0.6081871345029239, |
| "eval_recall_joy": 0.7891213389121339, |
| "eval_recall_neutral": 0.8577731881336839, |
| "eval_recall_sadness": 0.6435555555555555, |
| "eval_recall_surprise": 0.4172043010752688, |
| "eval_runtime": 14.5162, |
| "eval_samples_per_second": 1523.406, |
| "eval_steps_per_second": 11.918, |
| "step": 2552 |
| }, |
| { |
| "epoch": 1.67, |
| "learning_rate": 2.4616674652611405e-05, |
| "loss": 0.6078, |
| "step": 2585 |
| }, |
| { |
| "epoch": 1.7, |
| "learning_rate": 2.4053665548634405e-05, |
| "loss": 0.6167, |
| "step": 2632 |
| }, |
| { |
| "epoch": 1.73, |
| "learning_rate": 2.3490656444657405e-05, |
| "loss": 0.6329, |
| "step": 2679 |
| }, |
| { |
| "epoch": 1.76, |
| "learning_rate": 2.29396262577863e-05, |
| "loss": 0.6153, |
| "step": 2726 |
| }, |
| { |
| "epoch": 1.79, |
| "learning_rate": 2.2376617153809296e-05, |
| "loss": 0.6392, |
| "step": 2773 |
| }, |
| { |
| "epoch": 1.8, |
| "eval_accuracy": 0.7623677308492358, |
| "eval_b_acc": 0.626106698297278, |
| "eval_f1": 0.7595959808260688, |
| "eval_f1_anger": 0.6317689530685919, |
| "eval_f1_disgust": 0.46170212765957447, |
| "eval_f1_fear": 0.6752246469833119, |
| "eval_f1_joy": 0.7548152004164499, |
| "eval_f1_neutral": 0.8505247584261871, |
| "eval_f1_sadness": 0.6872427983539094, |
| "eval_f1_surprise": 0.4615384615384616, |
| "eval_loss": 0.6541842818260193, |
| "eval_prec": 0.7593266897219236, |
| "eval_prec_anger": 0.5970149253731343, |
| "eval_prec_disgust": 0.5710526315789474, |
| "eval_prec_fear": 0.748221906116643, |
| "eval_prec_joy": 0.7512953367875648, |
| "eval_prec_neutral": 0.8379338617108499, |
| "eval_prec_sadness": 0.7076271186440678, |
| "eval_prec_surprise": 0.5131578947368421, |
| "eval_recall": 0.7623677308492358, |
| "eval_recall_anger": 0.6708193579300431, |
| "eval_recall_disgust": 0.3875, |
| "eval_recall_fear": 0.6152046783625731, |
| "eval_recall_joy": 0.7583682008368201, |
| "eval_recall_neutral": 0.8634998122418325, |
| "eval_recall_sadness": 0.668, |
| "eval_recall_surprise": 0.41935483870967744, |
| "eval_runtime": 14.6661, |
| "eval_samples_per_second": 1507.827, |
| "eval_steps_per_second": 11.796, |
| "step": 2784 |
| }, |
| { |
| "epoch": 1.82, |
| "learning_rate": 2.1813608049832296e-05, |
| "loss": 0.6221, |
| "step": 2820 |
| }, |
| { |
| "epoch": 1.85, |
| "learning_rate": 2.1250598945855296e-05, |
| "loss": 0.6109, |
| "step": 2867 |
| }, |
| { |
| "epoch": 1.88, |
| "learning_rate": 2.0687589841878296e-05, |
| "loss": 0.6029, |
| "step": 2914 |
| }, |
| { |
| "epoch": 1.92, |
| "learning_rate": 2.0124580737901292e-05, |
| "loss": 0.6243, |
| "step": 2961 |
| }, |
| { |
| "epoch": 1.95, |
| "learning_rate": 1.9561571633924296e-05, |
| "loss": 0.6158, |
| "step": 3008 |
| }, |
| { |
| "epoch": 1.95, |
| "eval_accuracy": 0.764854843085828, |
| "eval_b_acc": 0.6279403178124943, |
| "eval_f1": 0.761380516026678, |
| "eval_f1_anger": 0.6389822371579453, |
| "eval_f1_disgust": 0.4711729622266402, |
| "eval_f1_fear": 0.6765847347994824, |
| "eval_f1_joy": 0.751901635927894, |
| "eval_f1_neutral": 0.8525969275786394, |
| "eval_f1_sadness": 0.6901180282342051, |
| "eval_f1_surprise": 0.46511627906976744, |
| "eval_loss": 0.6456097960472107, |
| "eval_prec": 0.7598739530313577, |
| "eval_prec_anger": 0.6402116402116402, |
| "eval_prec_disgust": 0.531390134529148, |
| "eval_prec_fear": 0.7568740955137482, |
| "eval_prec_joy": 0.7490139090720366, |
| "eval_prec_neutral": 0.8310160427807487, |
| "eval_prec_sadness": 0.7199420569773056, |
| "eval_prec_surprise": 0.5063291139240507, |
| "eval_recall": 0.764854843085828, |
| "eval_recall_anger": 0.6377575467177767, |
| "eval_recall_disgust": 0.4232142857142857, |
| "eval_recall_fear": 0.6116959064327485, |
| "eval_recall_joy": 0.7548117154811715, |
| "eval_recall_neutral": 0.8753285767930905, |
| "eval_recall_sadness": 0.6626666666666666, |
| "eval_recall_surprise": 0.43010752688172044, |
| "eval_runtime": 14.622, |
| "eval_samples_per_second": 1512.381, |
| "eval_steps_per_second": 11.832, |
| "step": 3016 |
| }, |
| { |
| "epoch": 1.98, |
| "learning_rate": 1.8998562529947296e-05, |
| "loss": 0.5901, |
| "step": 3055 |
| }, |
| { |
| "epoch": 2.01, |
| "learning_rate": 1.8435553425970292e-05, |
| "loss": 0.5923, |
| "step": 3102 |
| }, |
| { |
| "epoch": 2.04, |
| "learning_rate": 1.7872544321993292e-05, |
| "loss": 0.5239, |
| "step": 3149 |
| }, |
| { |
| "epoch": 2.07, |
| "learning_rate": 1.7309535218016292e-05, |
| "loss": 0.5329, |
| "step": 3196 |
| }, |
| { |
| "epoch": 2.1, |
| "learning_rate": 1.6758505031145187e-05, |
| "loss": 0.554, |
| "step": 3243 |
| }, |
| { |
| "epoch": 2.1, |
| "eval_accuracy": 0.7583883512706883, |
| "eval_b_acc": 0.634571558597101, |
| "eval_f1": 0.7563700086517053, |
| "eval_f1_anger": 0.643182362808531, |
| "eval_f1_disgust": 0.4690181124880839, |
| "eval_f1_fear": 0.6795752654590881, |
| "eval_f1_joy": 0.7506092607636069, |
| "eval_f1_neutral": 0.842095468502838, |
| "eval_f1_sadness": 0.6862699699004399, |
| "eval_f1_surprise": 0.47133027522935783, |
| "eval_loss": 0.6742041707038879, |
| "eval_prec": 0.7554687165264222, |
| "eval_prec_anger": 0.6433365292425696, |
| "eval_prec_disgust": 0.5030674846625767, |
| "eval_prec_fear": 0.7292225201072386, |
| "eval_prec_joy": 0.7292817679558011, |
| "eval_prec_neutral": 0.8347168419110865, |
| "eval_prec_sadness": 0.7162880618656355, |
| "eval_prec_surprise": 0.504914004914005, |
| "eval_recall": 0.7583883512706883, |
| "eval_recall_anger": 0.6430282702443699, |
| "eval_recall_disgust": 0.4392857142857143, |
| "eval_recall_fear": 0.6362573099415205, |
| "eval_recall_joy": 0.7732217573221757, |
| "eval_recall_neutral": 0.8496057078482914, |
| "eval_recall_sadness": 0.6586666666666666, |
| "eval_recall_surprise": 0.44193548387096776, |
| "eval_runtime": 14.8261, |
| "eval_samples_per_second": 1491.559, |
| "eval_steps_per_second": 11.669, |
| "step": 3248 |
| }, |
| { |
| "epoch": 2.13, |
| "learning_rate": 1.6195495927168187e-05, |
| "loss": 0.5568, |
| "step": 3290 |
| }, |
| { |
| "epoch": 2.16, |
| "learning_rate": 1.5632486823191184e-05, |
| "loss": 0.5375, |
| "step": 3337 |
| }, |
| { |
| "epoch": 2.19, |
| "learning_rate": 1.5069477719214184e-05, |
| "loss": 0.5198, |
| "step": 3384 |
| }, |
| { |
| "epoch": 2.22, |
| "learning_rate": 1.4506468615237184e-05, |
| "loss": 0.5255, |
| "step": 3431 |
| }, |
| { |
| "epoch": 2.25, |
| "learning_rate": 1.3943459511260182e-05, |
| "loss": 0.5537, |
| "step": 3478 |
| }, |
| { |
| "epoch": 2.25, |
| "eval_accuracy": 0.7632721352989057, |
| "eval_b_acc": 0.6282518018397625, |
| "eval_f1": 0.7604673635172584, |
| "eval_f1_anger": 0.6454630495790459, |
| "eval_f1_disgust": 0.45434782608695656, |
| "eval_f1_fear": 0.6718246292714378, |
| "eval_f1_joy": 0.7522695178535405, |
| "eval_f1_neutral": 0.8484961703717542, |
| "eval_f1_sadness": 0.6950892857142857, |
| "eval_f1_surprise": 0.47641791044776116, |
| "eval_loss": 0.670791745185852, |
| "eval_prec": 0.7603587760472442, |
| "eval_prec_anger": 0.6304248515303792, |
| "eval_prec_disgust": 0.5805555555555556, |
| "eval_prec_fear": 0.7485632183908046, |
| "eval_prec_joy": 0.726334242306194, |
| "eval_prec_neutral": 0.8442379182156133, |
| "eval_prec_sadness": 0.6982062780269058, |
| "eval_prec_surprise": 0.5355704697986577, |
| "eval_recall": 0.7632721352989057, |
| "eval_recall_anger": 0.6612362242453282, |
| "eval_recall_disgust": 0.3732142857142857, |
| "eval_recall_fear": 0.6093567251461989, |
| "eval_recall_joy": 0.7801255230125523, |
| "eval_recall_neutral": 0.8527975966954563, |
| "eval_recall_sadness": 0.692, |
| "eval_recall_surprise": 0.4290322580645161, |
| "eval_runtime": 14.5517, |
| "eval_samples_per_second": 1519.68, |
| "eval_steps_per_second": 11.889, |
| "step": 3480 |
| }, |
| { |
| "epoch": 2.28, |
| "learning_rate": 1.3380450407283182e-05, |
| "loss": 0.5305, |
| "step": 3525 |
| }, |
| { |
| "epoch": 2.31, |
| "learning_rate": 1.2817441303306182e-05, |
| "loss": 0.5313, |
| "step": 3572 |
| }, |
| { |
| "epoch": 2.34, |
| "learning_rate": 1.2254432199329182e-05, |
| "loss": 0.5182, |
| "step": 3619 |
| }, |
| { |
| "epoch": 2.37, |
| "learning_rate": 1.169142309535218e-05, |
| "loss": 0.5375, |
| "step": 3666 |
| }, |
| { |
| "epoch": 2.4, |
| "eval_accuracy": 0.7605589219498959, |
| "eval_b_acc": 0.6402110359246711, |
| "eval_f1": 0.7594675823716318, |
| "eval_f1_anger": 0.6421420256111757, |
| "eval_f1_disgust": 0.4648148148148148, |
| "eval_f1_fear": 0.6746532156368222, |
| "eval_f1_joy": 0.7537328697075065, |
| "eval_f1_neutral": 0.8463990997749438, |
| "eval_f1_sadness": 0.6885171790235082, |
| "eval_f1_surprise": 0.4835924006908463, |
| "eval_loss": 0.671157717704773, |
| "eval_prec": 0.7592351302120464, |
| "eval_prec_anger": 0.6245471014492754, |
| "eval_prec_disgust": 0.4826923076923077, |
| "eval_prec_fear": 0.7318741450068399, |
| "eval_prec_joy": 0.7372949179671868, |
| "eval_prec_neutral": 0.8454477332334207, |
| "eval_prec_sadness": 0.7005519779208832, |
| "eval_prec_surprise": 0.5204460966542751, |
| "eval_recall": 0.7605589219498959, |
| "eval_recall_anger": 0.6607570675610924, |
| "eval_recall_disgust": 0.44821428571428573, |
| "eval_recall_fear": 0.6257309941520468, |
| "eval_recall_joy": 0.7709205020920502, |
| "eval_recall_neutral": 0.847352609838528, |
| "eval_recall_sadness": 0.6768888888888889, |
| "eval_recall_surprise": 0.45161290322580644, |
| "eval_runtime": 14.5753, |
| "eval_samples_per_second": 1517.225, |
| "eval_steps_per_second": 11.869, |
| "step": 3712 |
| }, |
| { |
| "epoch": 2.4, |
| "learning_rate": 1.112841399137518e-05, |
| "loss": 0.5266, |
| "step": 3713 |
| }, |
| { |
| "epoch": 2.43, |
| "learning_rate": 1.056540488739818e-05, |
| "loss": 0.5276, |
| "step": 3760 |
| }, |
| { |
| "epoch": 2.46, |
| "learning_rate": 1.000239578342118e-05, |
| "loss": 0.5432, |
| "step": 3807 |
| }, |
| { |
| "epoch": 2.49, |
| "learning_rate": 9.439386679444178e-06, |
| "loss": 0.5262, |
| "step": 3854 |
| }, |
| { |
| "epoch": 2.52, |
| "learning_rate": 8.876377575467178e-06, |
| "loss": 0.5175, |
| "step": 3901 |
| }, |
| { |
| "epoch": 2.55, |
| "eval_accuracy": 0.7625033915166862, |
| "eval_b_acc": 0.6369042077487537, |
| "eval_f1": 0.7603749093215698, |
| "eval_f1_anger": 0.6429077177248053, |
| "eval_f1_disgust": 0.46938775510204084, |
| "eval_f1_fear": 0.677336747759283, |
| "eval_f1_joy": 0.7530406101834674, |
| "eval_f1_neutral": 0.8487682904241526, |
| "eval_f1_sadness": 0.6956521739130433, |
| "eval_f1_surprise": 0.457388105456775, |
| "eval_loss": 0.66249018907547, |
| "eval_prec": 0.7600295878449174, |
| "eval_prec_anger": 0.6334883720930232, |
| "eval_prec_disgust": 0.44805194805194803, |
| "eval_prec_fear": 0.7482319660537482, |
| "eval_prec_joy": 0.7421779764323446, |
| "eval_prec_neutral": 0.8374451754385965, |
| "eval_prec_sadness": 0.7251687560270009, |
| "eval_prec_surprise": 0.5320970042796006, |
| "eval_recall": 0.7625033915166862, |
| "eval_recall_anger": 0.6526114039290848, |
| "eval_recall_disgust": 0.4928571428571429, |
| "eval_recall_fear": 0.6187134502923977, |
| "eval_recall_joy": 0.7642259414225941, |
| "eval_recall_neutral": 0.8604018024784078, |
| "eval_recall_sadness": 0.6684444444444444, |
| "eval_recall_surprise": 0.4010752688172043, |
| "eval_runtime": 14.6386, |
| "eval_samples_per_second": 1510.666, |
| "eval_steps_per_second": 11.818, |
| "step": 3944 |
| }, |
| { |
| "epoch": 2.55, |
| "learning_rate": 8.313368471490178e-06, |
| "loss": 0.5337, |
| "step": 3948 |
| }, |
| { |
| "epoch": 2.58, |
| "learning_rate": 7.750359367513177e-06, |
| "loss": 0.5148, |
| "step": 3995 |
| }, |
| { |
| "epoch": 2.61, |
| "learning_rate": 7.1873502635361775e-06, |
| "loss": 0.5234, |
| "step": 4042 |
| }, |
| { |
| "epoch": 2.64, |
| "learning_rate": 6.624341159559177e-06, |
| "loss": 0.5286, |
| "step": 4089 |
| }, |
| { |
| "epoch": 2.68, |
| "learning_rate": 6.061332055582176e-06, |
| "loss": 0.5182, |
| "step": 4136 |
| }, |
| { |
| "epoch": 2.7, |
| "eval_accuracy": 0.7631364746314552, |
| "eval_b_acc": 0.6403726819328496, |
| "eval_f1": 0.7611758530200116, |
| "eval_f1_anger": 0.6441332689521971, |
| "eval_f1_disgust": 0.4635036496350365, |
| "eval_f1_fear": 0.6658725431804646, |
| "eval_f1_joy": 0.7548551093035079, |
| "eval_f1_neutral": 0.848629209284947, |
| "eval_f1_sadness": 0.6971687429218574, |
| "eval_f1_surprise": 0.4763636363636364, |
| "eval_loss": 0.6621036529541016, |
| "eval_prec": 0.7602393679680954, |
| "eval_prec_anger": 0.6491484184914842, |
| "eval_prec_disgust": 0.47388059701492535, |
| "eval_prec_fear": 0.6783980582524272, |
| "eval_prec_joy": 0.734322453016815, |
| "eval_prec_neutral": 0.844409331722279, |
| "eval_prec_sadness": 0.7108545034642032, |
| "eval_prec_surprise": 0.5458333333333333, |
| "eval_recall": 0.7631364746314552, |
| "eval_recall_anger": 0.639195016770484, |
| "eval_recall_disgust": 0.45357142857142857, |
| "eval_recall_fear": 0.6538011695906433, |
| "eval_recall_joy": 0.7765690376569038, |
| "eval_recall_neutral": 0.8528914757791964, |
| "eval_recall_sadness": 0.684, |
| "eval_recall_surprise": 0.42258064516129035, |
| "eval_runtime": 14.5758, |
| "eval_samples_per_second": 1517.169, |
| "eval_steps_per_second": 11.869, |
| "step": 4176 |
| } |
| ], |
| "max_steps": 4638, |
| "num_train_epochs": 3, |
| "total_flos": 3.51500575835136e+16, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|