|
{ |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 2.701164294954722, |
|
"global_step": 4176, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 5.064655172413793e-06, |
|
"loss": 1.827, |
|
"step": 47 |
|
}, |
|
{ |
|
"epoch": 0.06, |
|
"learning_rate": 1.0129310344827586e-05, |
|
"loss": 1.288, |
|
"step": 94 |
|
}, |
|
{ |
|
"epoch": 0.09, |
|
"learning_rate": 1.5086206896551724e-05, |
|
"loss": 1.0612, |
|
"step": 141 |
|
}, |
|
{ |
|
"epoch": 0.12, |
|
"learning_rate": 2.0150862068965517e-05, |
|
"loss": 0.9538, |
|
"step": 188 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"eval_accuracy": 0.6960748846884327, |
|
"eval_b_acc": 0.4789797300032158, |
|
"eval_f1": 0.683716357682452, |
|
"eval_f1_anger": 0.497677504976775, |
|
"eval_f1_disgust": 0.0035460992907801418, |
|
"eval_f1_fear": 0.4832126398946675, |
|
"eval_f1_joy": 0.685316256600382, |
|
"eval_f1_neutral": 0.827884745457005, |
|
"eval_f1_sadness": 0.5799599198396794, |
|
"eval_f1_surprise": 0.2866323907455013, |
|
"eval_loss": 0.8701004981994629, |
|
"eval_prec": 0.6836877535141815, |
|
"eval_prec_anger": 0.462202136400986, |
|
"eval_prec_disgust": 0.25, |
|
"eval_prec_fear": 0.552710843373494, |
|
"eval_prec_joy": 0.7401116233923805, |
|
"eval_prec_neutral": 0.796529284164859, |
|
"eval_prec_sadness": 0.5281021897810219, |
|
"eval_prec_surprise": 0.3562300319488818, |
|
"eval_recall": 0.6960748846884327, |
|
"eval_recall_anger": 0.5390512697652132, |
|
"eval_recall_disgust": 0.0017857142857142857, |
|
"eval_recall_fear": 0.42923976608187137, |
|
"eval_recall_joy": 0.6380753138075314, |
|
"eval_recall_neutral": 0.86180998873451, |
|
"eval_recall_sadness": 0.6431111111111111, |
|
"eval_recall_surprise": 0.23978494623655913, |
|
"eval_runtime": 16.0297, |
|
"eval_samples_per_second": 1379.566, |
|
"eval_steps_per_second": 10.792, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 0.15, |
|
"learning_rate": 2.521551724137931e-05, |
|
"loss": 0.8837, |
|
"step": 235 |
|
}, |
|
{ |
|
"epoch": 0.18, |
|
"learning_rate": 3.0280172413793107e-05, |
|
"loss": 0.881, |
|
"step": 282 |
|
}, |
|
{ |
|
"epoch": 0.21, |
|
"learning_rate": 3.53448275862069e-05, |
|
"loss": 0.8462, |
|
"step": 329 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"learning_rate": 4.0409482758620696e-05, |
|
"loss": 0.8242, |
|
"step": 376 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"learning_rate": 4.5474137931034485e-05, |
|
"loss": 0.7952, |
|
"step": 423 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_accuracy": 0.7168309668083567, |
|
"eval_b_acc": 0.5241940962877409, |
|
"eval_f1": 0.7025228198992769, |
|
"eval_f1_anger": 0.5170962651236192, |
|
"eval_f1_disgust": 0.3386727688787185, |
|
"eval_f1_fear": 0.5674653215636821, |
|
"eval_f1_joy": 0.6853079426298663, |
|
"eval_f1_neutral": 0.8225570814375757, |
|
"eval_f1_sadness": 0.6211089494163424, |
|
"eval_f1_surprise": 0.37250000000000005, |
|
"eval_loss": 0.8009697198867798, |
|
"eval_prec": 0.7097552640353452, |
|
"eval_prec_anger": 0.5731778425655977, |
|
"eval_prec_disgust": 0.4713375796178344, |
|
"eval_prec_fear": 0.615595075239398, |
|
"eval_prec_joy": 0.8083593972135342, |
|
"eval_prec_neutral": 0.7405486659150695, |
|
"eval_prec_sadness": 0.6858216970998926, |
|
"eval_prec_surprise": 0.44477611940298506, |
|
"eval_recall": 0.7168309668083567, |
|
"eval_recall_anger": 0.4710110206037374, |
|
"eval_recall_disgust": 0.2642857142857143, |
|
"eval_recall_fear": 0.5263157894736842, |
|
"eval_recall_joy": 0.5947698744769875, |
|
"eval_recall_neutral": 0.924990612091626, |
|
"eval_recall_sadness": 0.5675555555555556, |
|
"eval_recall_surprise": 0.3204301075268817, |
|
"eval_runtime": 15.1427, |
|
"eval_samples_per_second": 1460.377, |
|
"eval_steps_per_second": 11.425, |
|
"step": 464 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 4.9940105414470535e-05, |
|
"loss": 0.7998, |
|
"step": 470 |
|
}, |
|
{ |
|
"epoch": 0.33, |
|
"learning_rate": 4.938907522759943e-05, |
|
"loss": 0.7996, |
|
"step": 517 |
|
}, |
|
{ |
|
"epoch": 0.36, |
|
"learning_rate": 4.882606612362243e-05, |
|
"loss": 0.776, |
|
"step": 564 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 4.826305701964542e-05, |
|
"loss": 0.8018, |
|
"step": 611 |
|
}, |
|
{ |
|
"epoch": 0.43, |
|
"learning_rate": 4.770004791566843e-05, |
|
"loss": 0.7528, |
|
"step": 658 |
|
}, |
|
{ |
|
"epoch": 0.45, |
|
"eval_accuracy": 0.7260558921949896, |
|
"eval_b_acc": 0.5878316350938373, |
|
"eval_f1": 0.7255951803151626, |
|
"eval_f1_anger": 0.5542226487523992, |
|
"eval_f1_disgust": 0.3994082840236686, |
|
"eval_f1_fear": 0.5798319327731093, |
|
"eval_f1_joy": 0.7291770573566084, |
|
"eval_f1_neutral": 0.8314359514015114, |
|
"eval_f1_sadness": 0.6541166735622672, |
|
"eval_f1_surprise": 0.38283828382838286, |
|
"eval_loss": 0.7560049891471863, |
|
"eval_prec": 0.7309376250219672, |
|
"eval_prec_anger": 0.5550216242191254, |
|
"eval_prec_disgust": 0.3409090909090909, |
|
"eval_prec_fear": 0.7225130890052356, |
|
"eval_prec_joy": 0.6968541468064824, |
|
"eval_prec_neutral": 0.847571679344646, |
|
"eval_prec_sadness": 0.6118421052631579, |
|
"eval_prec_surprise": 0.49572649572649574, |
|
"eval_recall": 0.7260558921949896, |
|
"eval_recall_anger": 0.5534259702922856, |
|
"eval_recall_disgust": 0.48214285714285715, |
|
"eval_recall_fear": 0.4842105263157895, |
|
"eval_recall_joy": 0.7646443514644351, |
|
"eval_recall_neutral": 0.8159031167855801, |
|
"eval_recall_sadness": 0.7026666666666667, |
|
"eval_recall_surprise": 0.3118279569892473, |
|
"eval_runtime": 14.7708, |
|
"eval_samples_per_second": 1497.143, |
|
"eval_steps_per_second": 11.712, |
|
"step": 696 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"learning_rate": 4.713703881169142e-05, |
|
"loss": 0.7459, |
|
"step": 705 |
|
}, |
|
{ |
|
"epoch": 0.49, |
|
"learning_rate": 4.657402970771442e-05, |
|
"loss": 0.7599, |
|
"step": 752 |
|
}, |
|
{ |
|
"epoch": 0.52, |
|
"learning_rate": 4.601102060373742e-05, |
|
"loss": 0.7648, |
|
"step": 799 |
|
}, |
|
{ |
|
"epoch": 0.55, |
|
"learning_rate": 4.544801149976042e-05, |
|
"loss": 0.7436, |
|
"step": 846 |
|
}, |
|
{ |
|
"epoch": 0.58, |
|
"learning_rate": 4.488500239578342e-05, |
|
"loss": 0.7334, |
|
"step": 893 |
|
}, |
|
{ |
|
"epoch": 0.6, |
|
"eval_accuracy": 0.7370444062584788, |
|
"eval_b_acc": 0.5867600905079025, |
|
"eval_f1": 0.7282740654207969, |
|
"eval_f1_anger": 0.5218712029161603, |
|
"eval_f1_disgust": 0.4505649717514124, |
|
"eval_f1_fear": 0.6104060913705585, |
|
"eval_f1_joy": 0.7311320754716981, |
|
"eval_f1_neutral": 0.8351327433628318, |
|
"eval_f1_sadness": 0.6498640968618731, |
|
"eval_f1_surprise": 0.4181229773462783, |
|
"eval_loss": 0.7309762835502625, |
|
"eval_prec": 0.7344879537976949, |
|
"eval_prec_anger": 0.7128630705394191, |
|
"eval_prec_disgust": 0.3726635514018692, |
|
"eval_prec_fear": 0.6671289875173371, |
|
"eval_prec_joy": 0.7170152855993563, |
|
"eval_prec_neutral": 0.7898393036491463, |
|
"eval_prec_sadness": 0.7317751808569839, |
|
"eval_prec_surprise": 0.5252032520325203, |
|
"eval_recall": 0.7370444062584788, |
|
"eval_recall_anger": 0.411595591758505, |
|
"eval_recall_disgust": 0.5696428571428571, |
|
"eval_recall_fear": 0.5625730994152047, |
|
"eval_recall_joy": 0.74581589958159, |
|
"eval_recall_neutral": 0.8859369132557267, |
|
"eval_recall_sadness": 0.5844444444444444, |
|
"eval_recall_surprise": 0.3473118279569892, |
|
"eval_runtime": 14.5647, |
|
"eval_samples_per_second": 1518.332, |
|
"eval_steps_per_second": 11.878, |
|
"step": 928 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 4.432199329180642e-05, |
|
"loss": 0.7493, |
|
"step": 940 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 4.375898418782942e-05, |
|
"loss": 0.7194, |
|
"step": 987 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"learning_rate": 4.319597508385242e-05, |
|
"loss": 0.7158, |
|
"step": 1034 |
|
}, |
|
{ |
|
"epoch": 0.7, |
|
"learning_rate": 4.263296597987542e-05, |
|
"loss": 0.719, |
|
"step": 1081 |
|
}, |
|
{ |
|
"epoch": 0.73, |
|
"learning_rate": 4.206995687589842e-05, |
|
"loss": 0.7216, |
|
"step": 1128 |
|
}, |
|
{ |
|
"epoch": 0.75, |
|
"eval_accuracy": 0.7448222845256399, |
|
"eval_b_acc": 0.6009457685058381, |
|
"eval_f1": 0.7388819166581033, |
|
"eval_f1_anger": 0.5746421267893661, |
|
"eval_f1_disgust": 0.48046875, |
|
"eval_f1_fear": 0.6597796143250689, |
|
"eval_f1_joy": 0.7266451397394499, |
|
"eval_f1_neutral": 0.8355743035416118, |
|
"eval_f1_sadness": 0.6644859813084112, |
|
"eval_f1_surprise": 0.4711696869851729, |
|
"eval_loss": 0.7043296694755554, |
|
"eval_prec": 0.7402960337790491, |
|
"eval_prec_anger": 0.6158904109589041, |
|
"eval_prec_disgust": 0.5301724137931034, |
|
"eval_prec_fear": 0.8023450586264657, |
|
"eval_prec_joy": 0.7767198286122352, |
|
"eval_prec_neutral": 0.7853956715678176, |
|
"eval_prec_sadness": 0.7004926108374384, |
|
"eval_prec_surprise": 0.48148148148148145, |
|
"eval_recall": 0.7448222845256399, |
|
"eval_recall_anger": 0.5385721130809775, |
|
"eval_recall_disgust": 0.4392857142857143, |
|
"eval_recall_fear": 0.560233918128655, |
|
"eval_recall_joy": 0.6826359832635983, |
|
"eval_recall_neutral": 0.8926023282012767, |
|
"eval_recall_sadness": 0.632, |
|
"eval_recall_surprise": 0.4612903225806452, |
|
"eval_runtime": 14.6801, |
|
"eval_samples_per_second": 1506.393, |
|
"eval_steps_per_second": 11.785, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 0.76, |
|
"learning_rate": 4.150694777192142e-05, |
|
"loss": 0.7134, |
|
"step": 1175 |
|
}, |
|
{ |
|
"epoch": 0.79, |
|
"learning_rate": 4.094393866794442e-05, |
|
"loss": 0.7029, |
|
"step": 1222 |
|
}, |
|
{ |
|
"epoch": 0.82, |
|
"learning_rate": 4.0380929563967415e-05, |
|
"loss": 0.6945, |
|
"step": 1269 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"learning_rate": 3.981792045999042e-05, |
|
"loss": 0.7033, |
|
"step": 1316 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"learning_rate": 3.9254911356013415e-05, |
|
"loss": 0.7259, |
|
"step": 1363 |
|
}, |
|
{ |
|
"epoch": 0.9, |
|
"eval_accuracy": 0.7475354978746496, |
|
"eval_b_acc": 0.6082480515560814, |
|
"eval_f1": 0.741168197686153, |
|
"eval_f1_anger": 0.5405405405405406, |
|
"eval_f1_disgust": 0.4599559147685525, |
|
"eval_f1_fear": 0.6475358702432937, |
|
"eval_f1_joy": 0.7468589083419156, |
|
"eval_f1_neutral": 0.8421338155515371, |
|
"eval_f1_sadness": 0.6752079118903124, |
|
"eval_f1_surprise": 0.42070338420703385, |
|
"eval_loss": 0.6962281465530396, |
|
"eval_prec": 0.7432901970674257, |
|
"eval_prec_anger": 0.6757728253055356, |
|
"eval_prec_disgust": 0.39076154806491886, |
|
"eval_prec_fear": 0.6938502673796791, |
|
"eval_prec_joy": 0.7354969574036511, |
|
"eval_prec_neutral": 0.8121730031391698, |
|
"eval_prec_sadness": 0.683037744429286, |
|
"eval_prec_surprise": 0.5493934142114385, |
|
"eval_recall": 0.7475354978746496, |
|
"eval_recall_anger": 0.4504072831816004, |
|
"eval_recall_disgust": 0.5589285714285714, |
|
"eval_recall_fear": 0.6070175438596491, |
|
"eval_recall_joy": 0.7585774058577406, |
|
"eval_recall_neutral": 0.8743897859556891, |
|
"eval_recall_sadness": 0.6675555555555556, |
|
"eval_recall_surprise": 0.34086021505376346, |
|
"eval_runtime": 14.6912, |
|
"eval_samples_per_second": 1505.258, |
|
"eval_steps_per_second": 11.776, |
|
"step": 1392 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"learning_rate": 3.8691902252036415e-05, |
|
"loss": 0.7143, |
|
"step": 1410 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"learning_rate": 3.812889314805942e-05, |
|
"loss": 0.6903, |
|
"step": 1457 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"learning_rate": 3.7565884044082415e-05, |
|
"loss": 0.6812, |
|
"step": 1504 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"learning_rate": 3.7002874940105415e-05, |
|
"loss": 0.7182, |
|
"step": 1551 |
|
}, |
|
{ |
|
"epoch": 1.03, |
|
"learning_rate": 3.6439865836128415e-05, |
|
"loss": 0.6362, |
|
"step": 1598 |
|
}, |
|
{ |
|
"epoch": 1.05, |
|
"eval_accuracy": 0.7526453830152844, |
|
"eval_b_acc": 0.6055170494206373, |
|
"eval_f1": 0.7483739984911967, |
|
"eval_f1_anger": 0.602752507581059, |
|
"eval_f1_disgust": 0.4405010438413361, |
|
"eval_f1_fear": 0.6491803278688525, |
|
"eval_f1_joy": 0.7437363551304709, |
|
"eval_f1_neutral": 0.8435330654000731, |
|
"eval_f1_sadness": 0.6785631517960602, |
|
"eval_f1_surprise": 0.45454545454545453, |
|
"eval_loss": 0.6771188974380493, |
|
"eval_prec": 0.7472415916170276, |
|
"eval_prec_anger": 0.5872727272727273, |
|
"eval_prec_disgust": 0.5301507537688442, |
|
"eval_prec_fear": 0.7388059701492538, |
|
"eval_prec_joy": 0.739202314527795, |
|
"eval_prec_neutral": 0.8213269299181786, |
|
"eval_prec_sadness": 0.7089588377723971, |
|
"eval_prec_surprise": 0.5300859598853869, |
|
"eval_recall": 0.7526453830152844, |
|
"eval_recall_anger": 0.6190704360325826, |
|
"eval_recall_disgust": 0.3767857142857143, |
|
"eval_recall_fear": 0.5789473684210527, |
|
"eval_recall_joy": 0.748326359832636, |
|
"eval_recall_neutral": 0.8669733383402178, |
|
"eval_recall_sadness": 0.6506666666666666, |
|
"eval_recall_surprise": 0.3978494623655914, |
|
"eval_runtime": 14.8683, |
|
"eval_samples_per_second": 1487.33, |
|
"eval_steps_per_second": 11.636, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"learning_rate": 3.5876856732151415e-05, |
|
"loss": 0.6432, |
|
"step": 1645 |
|
}, |
|
{ |
|
"epoch": 1.09, |
|
"learning_rate": 3.5313847628174415e-05, |
|
"loss": 0.652, |
|
"step": 1692 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 3.4750838524197415e-05, |
|
"loss": 0.6474, |
|
"step": 1739 |
|
}, |
|
{ |
|
"epoch": 1.16, |
|
"learning_rate": 3.4187829420220415e-05, |
|
"loss": 0.6364, |
|
"step": 1786 |
|
}, |
|
{ |
|
"epoch": 1.19, |
|
"learning_rate": 3.362482031624341e-05, |
|
"loss": 0.621, |
|
"step": 1833 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_accuracy": 0.7528262639052185, |
|
"eval_b_acc": 0.6120366345893286, |
|
"eval_f1": 0.7487165396015127, |
|
"eval_f1_anger": 0.6196334421290485, |
|
"eval_f1_disgust": 0.47378277153558057, |
|
"eval_f1_fear": 0.6528640441683919, |
|
"eval_f1_joy": 0.7450472872075661, |
|
"eval_f1_neutral": 0.8372220697227559, |
|
"eval_f1_sadness": 0.6809026935209901, |
|
"eval_f1_surprise": 0.4612676056338028, |
|
"eval_loss": 0.67792809009552, |
|
"eval_prec": 0.749407175516463, |
|
"eval_prec_anger": 0.6508438818565401, |
|
"eval_prec_disgust": 0.49803149606299213, |
|
"eval_prec_fear": 0.7962962962962963, |
|
"eval_prec_joy": 0.7107312440645774, |
|
"eval_prec_neutral": 0.8165268606103873, |
|
"eval_prec_sadness": 0.7498663816141101, |
|
"eval_prec_surprise": 0.5077519379844961, |
|
"eval_recall": 0.7528262639052185, |
|
"eval_recall_anger": 0.5912793483469094, |
|
"eval_recall_disgust": 0.4517857142857143, |
|
"eval_recall_fear": 0.5532163742690058, |
|
"eval_recall_joy": 0.7828451882845189, |
|
"eval_recall_neutral": 0.8589936162223056, |
|
"eval_recall_sadness": 0.6235555555555555, |
|
"eval_recall_surprise": 0.42258064516129035, |
|
"eval_runtime": 14.7115, |
|
"eval_samples_per_second": 1503.179, |
|
"eval_steps_per_second": 11.76, |
|
"step": 1856 |
|
}, |
|
{ |
|
"epoch": 1.22, |
|
"learning_rate": 3.3061811212266415e-05, |
|
"loss": 0.6195, |
|
"step": 1880 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 3.249880210828941e-05, |
|
"loss": 0.6332, |
|
"step": 1927 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 3.1935793004312415e-05, |
|
"loss": 0.6251, |
|
"step": 1974 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 3.1372783900335415e-05, |
|
"loss": 0.63, |
|
"step": 2021 |
|
}, |
|
{ |
|
"epoch": 1.34, |
|
"learning_rate": 3.080977479635841e-05, |
|
"loss": 0.6241, |
|
"step": 2068 |
|
}, |
|
{ |
|
"epoch": 1.35, |
|
"eval_accuracy": 0.7512887763407796, |
|
"eval_b_acc": 0.6367091163081916, |
|
"eval_f1": 0.7514440246825209, |
|
"eval_f1_anger": 0.6141022752872269, |
|
"eval_f1_disgust": 0.4511668107173725, |
|
"eval_f1_fear": 0.6488060570762958, |
|
"eval_f1_joy": 0.7509570615623384, |
|
"eval_f1_neutral": 0.843150231634679, |
|
"eval_f1_sadness": 0.6745293717396236, |
|
"eval_f1_surprise": 0.4730290456431535, |
|
"eval_loss": 0.6849319338798523, |
|
"eval_prec": 0.7525985800729426, |
|
"eval_prec_anger": 0.5795068027210885, |
|
"eval_prec_disgust": 0.4371859296482412, |
|
"eval_prec_fear": 0.6461716937354989, |
|
"eval_prec_joy": 0.7428863868986694, |
|
"eval_prec_neutral": 0.849171586364502, |
|
"eval_prec_sadness": 0.6887447892542844, |
|
"eval_prec_surprise": 0.5270805812417437, |
|
"eval_recall": 0.7512887763407796, |
|
"eval_recall_anger": 0.6530905606133206, |
|
"eval_recall_disgust": 0.4660714285714286, |
|
"eval_recall_fear": 0.6514619883040935, |
|
"eval_recall_joy": 0.7592050209205021, |
|
"eval_recall_neutral": 0.8372136687945926, |
|
"eval_recall_sadness": 0.6608888888888889, |
|
"eval_recall_surprise": 0.4290322580645161, |
|
"eval_runtime": 14.591, |
|
"eval_samples_per_second": 1515.587, |
|
"eval_steps_per_second": 11.857, |
|
"step": 2088 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"learning_rate": 3.024676569238141e-05, |
|
"loss": 0.5997, |
|
"step": 2115 |
|
}, |
|
{ |
|
"epoch": 1.4, |
|
"learning_rate": 2.968375658840441e-05, |
|
"loss": 0.6348, |
|
"step": 2162 |
|
}, |
|
{ |
|
"epoch": 1.43, |
|
"learning_rate": 2.9120747484427408e-05, |
|
"loss": 0.6269, |
|
"step": 2209 |
|
}, |
|
{ |
|
"epoch": 1.46, |
|
"learning_rate": 2.855773838045041e-05, |
|
"loss": 0.6411, |
|
"step": 2256 |
|
}, |
|
{ |
|
"epoch": 1.49, |
|
"learning_rate": 2.7994729276473408e-05, |
|
"loss": 0.6188, |
|
"step": 2303 |
|
}, |
|
{ |
|
"epoch": 1.5, |
|
"eval_accuracy": 0.7578909288233698, |
|
"eval_b_acc": 0.6158634091154939, |
|
"eval_f1": 0.7533929534836733, |
|
"eval_f1_anger": 0.6305133767172812, |
|
"eval_f1_disgust": 0.45919477693144717, |
|
"eval_f1_fear": 0.6729323308270676, |
|
"eval_f1_joy": 0.7494099134539732, |
|
"eval_f1_neutral": 0.84280126653008, |
|
"eval_f1_sadness": 0.681602172437203, |
|
"eval_f1_surprise": 0.4503664223850767, |
|
"eval_loss": 0.6713131070137024, |
|
"eval_prec": 0.7538941653702528, |
|
"eval_prec_anger": 0.6343355965082444, |
|
"eval_prec_disgust": 0.5877437325905293, |
|
"eval_prec_fear": 0.7246963562753036, |
|
"eval_prec_joy": 0.7071269487750557, |
|
"eval_prec_neutral": 0.8361049519586105, |
|
"eval_prec_sadness": 0.69432918395574, |
|
"eval_prec_surprise": 0.5919439579684763, |
|
"eval_recall": 0.7578909288233698, |
|
"eval_recall_anger": 0.6267369429803545, |
|
"eval_recall_disgust": 0.3767857142857143, |
|
"eval_recall_fear": 0.6280701754385964, |
|
"eval_recall_joy": 0.797071129707113, |
|
"eval_recall_neutral": 0.8496057078482914, |
|
"eval_recall_sadness": 0.6693333333333333, |
|
"eval_recall_surprise": 0.3634408602150538, |
|
"eval_runtime": 14.588, |
|
"eval_samples_per_second": 1515.9, |
|
"eval_steps_per_second": 11.859, |
|
"step": 2320 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"learning_rate": 2.7431720172496405e-05, |
|
"loss": 0.622, |
|
"step": 2350 |
|
}, |
|
{ |
|
"epoch": 1.55, |
|
"learning_rate": 2.6868711068519408e-05, |
|
"loss": 0.6278, |
|
"step": 2397 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 2.6305701964542405e-05, |
|
"loss": 0.6227, |
|
"step": 2444 |
|
}, |
|
{ |
|
"epoch": 1.61, |
|
"learning_rate": 2.5742692860565405e-05, |
|
"loss": 0.6337, |
|
"step": 2491 |
|
}, |
|
{ |
|
"epoch": 1.64, |
|
"learning_rate": 2.5179683756588408e-05, |
|
"loss": 0.6182, |
|
"step": 2538 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_accuracy": 0.760106719725061, |
|
"eval_b_acc": 0.6198832054514857, |
|
"eval_f1": 0.7565733944354605, |
|
"eval_f1_anger": 0.625943396226415, |
|
"eval_f1_disgust": 0.4582893347412883, |
|
"eval_f1_fear": 0.6753246753246753, |
|
"eval_f1_joy": 0.7498260610277309, |
|
"eval_f1_neutral": 0.8475095074668398, |
|
"eval_f1_sadness": 0.6851194700733381, |
|
"eval_f1_surprise": 0.4700181708055723, |
|
"eval_loss": 0.6608244180679321, |
|
"eval_prec": 0.7566647637236428, |
|
"eval_prec_anger": 0.6163492800743149, |
|
"eval_prec_disgust": 0.5607235142118863, |
|
"eval_prec_fear": 0.7591240875912408, |
|
"eval_prec_joy": 0.7142586631319826, |
|
"eval_prec_neutral": 0.8374885426214482, |
|
"eval_prec_sadness": 0.7324228629236217, |
|
"eval_prec_surprise": 0.5381414701803051, |
|
"eval_recall": 0.760106719725061, |
|
"eval_recall_anger": 0.6358409199808337, |
|
"eval_recall_disgust": 0.3875, |
|
"eval_recall_fear": 0.6081871345029239, |
|
"eval_recall_joy": 0.7891213389121339, |
|
"eval_recall_neutral": 0.8577731881336839, |
|
"eval_recall_sadness": 0.6435555555555555, |
|
"eval_recall_surprise": 0.4172043010752688, |
|
"eval_runtime": 14.5162, |
|
"eval_samples_per_second": 1523.406, |
|
"eval_steps_per_second": 11.918, |
|
"step": 2552 |
|
}, |
|
{ |
|
"epoch": 1.67, |
|
"learning_rate": 2.4616674652611405e-05, |
|
"loss": 0.6078, |
|
"step": 2585 |
|
}, |
|
{ |
|
"epoch": 1.7, |
|
"learning_rate": 2.4053665548634405e-05, |
|
"loss": 0.6167, |
|
"step": 2632 |
|
}, |
|
{ |
|
"epoch": 1.73, |
|
"learning_rate": 2.3490656444657405e-05, |
|
"loss": 0.6329, |
|
"step": 2679 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 2.29396262577863e-05, |
|
"loss": 0.6153, |
|
"step": 2726 |
|
}, |
|
{ |
|
"epoch": 1.79, |
|
"learning_rate": 2.2376617153809296e-05, |
|
"loss": 0.6392, |
|
"step": 2773 |
|
}, |
|
{ |
|
"epoch": 1.8, |
|
"eval_accuracy": 0.7623677308492358, |
|
"eval_b_acc": 0.626106698297278, |
|
"eval_f1": 0.7595959808260688, |
|
"eval_f1_anger": 0.6317689530685919, |
|
"eval_f1_disgust": 0.46170212765957447, |
|
"eval_f1_fear": 0.6752246469833119, |
|
"eval_f1_joy": 0.7548152004164499, |
|
"eval_f1_neutral": 0.8505247584261871, |
|
"eval_f1_sadness": 0.6872427983539094, |
|
"eval_f1_surprise": 0.4615384615384616, |
|
"eval_loss": 0.6541842818260193, |
|
"eval_prec": 0.7593266897219236, |
|
"eval_prec_anger": 0.5970149253731343, |
|
"eval_prec_disgust": 0.5710526315789474, |
|
"eval_prec_fear": 0.748221906116643, |
|
"eval_prec_joy": 0.7512953367875648, |
|
"eval_prec_neutral": 0.8379338617108499, |
|
"eval_prec_sadness": 0.7076271186440678, |
|
"eval_prec_surprise": 0.5131578947368421, |
|
"eval_recall": 0.7623677308492358, |
|
"eval_recall_anger": 0.6708193579300431, |
|
"eval_recall_disgust": 0.3875, |
|
"eval_recall_fear": 0.6152046783625731, |
|
"eval_recall_joy": 0.7583682008368201, |
|
"eval_recall_neutral": 0.8634998122418325, |
|
"eval_recall_sadness": 0.668, |
|
"eval_recall_surprise": 0.41935483870967744, |
|
"eval_runtime": 14.6661, |
|
"eval_samples_per_second": 1507.827, |
|
"eval_steps_per_second": 11.796, |
|
"step": 2784 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"learning_rate": 2.1813608049832296e-05, |
|
"loss": 0.6221, |
|
"step": 2820 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"learning_rate": 2.1250598945855296e-05, |
|
"loss": 0.6109, |
|
"step": 2867 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"learning_rate": 2.0687589841878296e-05, |
|
"loss": 0.6029, |
|
"step": 2914 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 2.0124580737901292e-05, |
|
"loss": 0.6243, |
|
"step": 2961 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 1.9561571633924296e-05, |
|
"loss": 0.6158, |
|
"step": 3008 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"eval_accuracy": 0.764854843085828, |
|
"eval_b_acc": 0.6279403178124943, |
|
"eval_f1": 0.761380516026678, |
|
"eval_f1_anger": 0.6389822371579453, |
|
"eval_f1_disgust": 0.4711729622266402, |
|
"eval_f1_fear": 0.6765847347994824, |
|
"eval_f1_joy": 0.751901635927894, |
|
"eval_f1_neutral": 0.8525969275786394, |
|
"eval_f1_sadness": 0.6901180282342051, |
|
"eval_f1_surprise": 0.46511627906976744, |
|
"eval_loss": 0.6456097960472107, |
|
"eval_prec": 0.7598739530313577, |
|
"eval_prec_anger": 0.6402116402116402, |
|
"eval_prec_disgust": 0.531390134529148, |
|
"eval_prec_fear": 0.7568740955137482, |
|
"eval_prec_joy": 0.7490139090720366, |
|
"eval_prec_neutral": 0.8310160427807487, |
|
"eval_prec_sadness": 0.7199420569773056, |
|
"eval_prec_surprise": 0.5063291139240507, |
|
"eval_recall": 0.764854843085828, |
|
"eval_recall_anger": 0.6377575467177767, |
|
"eval_recall_disgust": 0.4232142857142857, |
|
"eval_recall_fear": 0.6116959064327485, |
|
"eval_recall_joy": 0.7548117154811715, |
|
"eval_recall_neutral": 0.8753285767930905, |
|
"eval_recall_sadness": 0.6626666666666666, |
|
"eval_recall_surprise": 0.43010752688172044, |
|
"eval_runtime": 14.622, |
|
"eval_samples_per_second": 1512.381, |
|
"eval_steps_per_second": 11.832, |
|
"step": 3016 |
|
}, |
|
{ |
|
"epoch": 1.98, |
|
"learning_rate": 1.8998562529947296e-05, |
|
"loss": 0.5901, |
|
"step": 3055 |
|
}, |
|
{ |
|
"epoch": 2.01, |
|
"learning_rate": 1.8435553425970292e-05, |
|
"loss": 0.5923, |
|
"step": 3102 |
|
}, |
|
{ |
|
"epoch": 2.04, |
|
"learning_rate": 1.7872544321993292e-05, |
|
"loss": 0.5239, |
|
"step": 3149 |
|
}, |
|
{ |
|
"epoch": 2.07, |
|
"learning_rate": 1.7309535218016292e-05, |
|
"loss": 0.5329, |
|
"step": 3196 |
|
}, |
|
{ |
|
"epoch": 2.1, |
|
"learning_rate": 1.6758505031145187e-05, |
|
"loss": 0.554, |
|
"step": 3243 |
|
}, |
|
{ |
|
"epoch": 2.1, |
|
"eval_accuracy": 0.7583883512706883, |
|
"eval_b_acc": 0.634571558597101, |
|
"eval_f1": 0.7563700086517053, |
|
"eval_f1_anger": 0.643182362808531, |
|
"eval_f1_disgust": 0.4690181124880839, |
|
"eval_f1_fear": 0.6795752654590881, |
|
"eval_f1_joy": 0.7506092607636069, |
|
"eval_f1_neutral": 0.842095468502838, |
|
"eval_f1_sadness": 0.6862699699004399, |
|
"eval_f1_surprise": 0.47133027522935783, |
|
"eval_loss": 0.6742041707038879, |
|
"eval_prec": 0.7554687165264222, |
|
"eval_prec_anger": 0.6433365292425696, |
|
"eval_prec_disgust": 0.5030674846625767, |
|
"eval_prec_fear": 0.7292225201072386, |
|
"eval_prec_joy": 0.7292817679558011, |
|
"eval_prec_neutral": 0.8347168419110865, |
|
"eval_prec_sadness": 0.7162880618656355, |
|
"eval_prec_surprise": 0.504914004914005, |
|
"eval_recall": 0.7583883512706883, |
|
"eval_recall_anger": 0.6430282702443699, |
|
"eval_recall_disgust": 0.4392857142857143, |
|
"eval_recall_fear": 0.6362573099415205, |
|
"eval_recall_joy": 0.7732217573221757, |
|
"eval_recall_neutral": 0.8496057078482914, |
|
"eval_recall_sadness": 0.6586666666666666, |
|
"eval_recall_surprise": 0.44193548387096776, |
|
"eval_runtime": 14.8261, |
|
"eval_samples_per_second": 1491.559, |
|
"eval_steps_per_second": 11.669, |
|
"step": 3248 |
|
}, |
|
{ |
|
"epoch": 2.13, |
|
"learning_rate": 1.6195495927168187e-05, |
|
"loss": 0.5568, |
|
"step": 3290 |
|
}, |
|
{ |
|
"epoch": 2.16, |
|
"learning_rate": 1.5632486823191184e-05, |
|
"loss": 0.5375, |
|
"step": 3337 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"learning_rate": 1.5069477719214184e-05, |
|
"loss": 0.5198, |
|
"step": 3384 |
|
}, |
|
{ |
|
"epoch": 2.22, |
|
"learning_rate": 1.4506468615237184e-05, |
|
"loss": 0.5255, |
|
"step": 3431 |
|
}, |
|
{ |
|
"epoch": 2.25, |
|
"learning_rate": 1.3943459511260182e-05, |
|
"loss": 0.5537, |
|
"step": 3478 |
|
}, |
|
{ |
|
"epoch": 2.25, |
|
"eval_accuracy": 0.7632721352989057, |
|
"eval_b_acc": 0.6282518018397625, |
|
"eval_f1": 0.7604673635172584, |
|
"eval_f1_anger": 0.6454630495790459, |
|
"eval_f1_disgust": 0.45434782608695656, |
|
"eval_f1_fear": 0.6718246292714378, |
|
"eval_f1_joy": 0.7522695178535405, |
|
"eval_f1_neutral": 0.8484961703717542, |
|
"eval_f1_sadness": 0.6950892857142857, |
|
"eval_f1_surprise": 0.47641791044776116, |
|
"eval_loss": 0.670791745185852, |
|
"eval_prec": 0.7603587760472442, |
|
"eval_prec_anger": 0.6304248515303792, |
|
"eval_prec_disgust": 0.5805555555555556, |
|
"eval_prec_fear": 0.7485632183908046, |
|
"eval_prec_joy": 0.726334242306194, |
|
"eval_prec_neutral": 0.8442379182156133, |
|
"eval_prec_sadness": 0.6982062780269058, |
|
"eval_prec_surprise": 0.5355704697986577, |
|
"eval_recall": 0.7632721352989057, |
|
"eval_recall_anger": 0.6612362242453282, |
|
"eval_recall_disgust": 0.3732142857142857, |
|
"eval_recall_fear": 0.6093567251461989, |
|
"eval_recall_joy": 0.7801255230125523, |
|
"eval_recall_neutral": 0.8527975966954563, |
|
"eval_recall_sadness": 0.692, |
|
"eval_recall_surprise": 0.4290322580645161, |
|
"eval_runtime": 14.5517, |
|
"eval_samples_per_second": 1519.68, |
|
"eval_steps_per_second": 11.889, |
|
"step": 3480 |
|
}, |
|
{ |
|
"epoch": 2.28, |
|
"learning_rate": 1.3380450407283182e-05, |
|
"loss": 0.5305, |
|
"step": 3525 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"learning_rate": 1.2817441303306182e-05, |
|
"loss": 0.5313, |
|
"step": 3572 |
|
}, |
|
{ |
|
"epoch": 2.34, |
|
"learning_rate": 1.2254432199329182e-05, |
|
"loss": 0.5182, |
|
"step": 3619 |
|
}, |
|
{ |
|
"epoch": 2.37, |
|
"learning_rate": 1.169142309535218e-05, |
|
"loss": 0.5375, |
|
"step": 3666 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"eval_accuracy": 0.7605589219498959, |
|
"eval_b_acc": 0.6402110359246711, |
|
"eval_f1": 0.7594675823716318, |
|
"eval_f1_anger": 0.6421420256111757, |
|
"eval_f1_disgust": 0.4648148148148148, |
|
"eval_f1_fear": 0.6746532156368222, |
|
"eval_f1_joy": 0.7537328697075065, |
|
"eval_f1_neutral": 0.8463990997749438, |
|
"eval_f1_sadness": 0.6885171790235082, |
|
"eval_f1_surprise": 0.4835924006908463, |
|
"eval_loss": 0.671157717704773, |
|
"eval_prec": 0.7592351302120464, |
|
"eval_prec_anger": 0.6245471014492754, |
|
"eval_prec_disgust": 0.4826923076923077, |
|
"eval_prec_fear": 0.7318741450068399, |
|
"eval_prec_joy": 0.7372949179671868, |
|
"eval_prec_neutral": 0.8454477332334207, |
|
"eval_prec_sadness": 0.7005519779208832, |
|
"eval_prec_surprise": 0.5204460966542751, |
|
"eval_recall": 0.7605589219498959, |
|
"eval_recall_anger": 0.6607570675610924, |
|
"eval_recall_disgust": 0.44821428571428573, |
|
"eval_recall_fear": 0.6257309941520468, |
|
"eval_recall_joy": 0.7709205020920502, |
|
"eval_recall_neutral": 0.847352609838528, |
|
"eval_recall_sadness": 0.6768888888888889, |
|
"eval_recall_surprise": 0.45161290322580644, |
|
"eval_runtime": 14.5753, |
|
"eval_samples_per_second": 1517.225, |
|
"eval_steps_per_second": 11.869, |
|
"step": 3712 |
|
}, |
|
{ |
|
"epoch": 2.4, |
|
"learning_rate": 1.112841399137518e-05, |
|
"loss": 0.5266, |
|
"step": 3713 |
|
}, |
|
{ |
|
"epoch": 2.43, |
|
"learning_rate": 1.056540488739818e-05, |
|
"loss": 0.5276, |
|
"step": 3760 |
|
}, |
|
{ |
|
"epoch": 2.46, |
|
"learning_rate": 1.000239578342118e-05, |
|
"loss": 0.5432, |
|
"step": 3807 |
|
}, |
|
{ |
|
"epoch": 2.49, |
|
"learning_rate": 9.439386679444178e-06, |
|
"loss": 0.5262, |
|
"step": 3854 |
|
}, |
|
{ |
|
"epoch": 2.52, |
|
"learning_rate": 8.876377575467178e-06, |
|
"loss": 0.5175, |
|
"step": 3901 |
|
}, |
|
{ |
|
"epoch": 2.55, |
|
"eval_accuracy": 0.7625033915166862, |
|
"eval_b_acc": 0.6369042077487537, |
|
"eval_f1": 0.7603749093215698, |
|
"eval_f1_anger": 0.6429077177248053, |
|
"eval_f1_disgust": 0.46938775510204084, |
|
"eval_f1_fear": 0.677336747759283, |
|
"eval_f1_joy": 0.7530406101834674, |
|
"eval_f1_neutral": 0.8487682904241526, |
|
"eval_f1_sadness": 0.6956521739130433, |
|
"eval_f1_surprise": 0.457388105456775, |
|
"eval_loss": 0.66249018907547, |
|
"eval_prec": 0.7600295878449174, |
|
"eval_prec_anger": 0.6334883720930232, |
|
"eval_prec_disgust": 0.44805194805194803, |
|
"eval_prec_fear": 0.7482319660537482, |
|
"eval_prec_joy": 0.7421779764323446, |
|
"eval_prec_neutral": 0.8374451754385965, |
|
"eval_prec_sadness": 0.7251687560270009, |
|
"eval_prec_surprise": 0.5320970042796006, |
|
"eval_recall": 0.7625033915166862, |
|
"eval_recall_anger": 0.6526114039290848, |
|
"eval_recall_disgust": 0.4928571428571429, |
|
"eval_recall_fear": 0.6187134502923977, |
|
"eval_recall_joy": 0.7642259414225941, |
|
"eval_recall_neutral": 0.8604018024784078, |
|
"eval_recall_sadness": 0.6684444444444444, |
|
"eval_recall_surprise": 0.4010752688172043, |
|
"eval_runtime": 14.6386, |
|
"eval_samples_per_second": 1510.666, |
|
"eval_steps_per_second": 11.818, |
|
"step": 3944 |
|
}, |
|
{ |
|
"epoch": 2.55, |
|
"learning_rate": 8.313368471490178e-06, |
|
"loss": 0.5337, |
|
"step": 3948 |
|
}, |
|
{ |
|
"epoch": 2.58, |
|
"learning_rate": 7.750359367513177e-06, |
|
"loss": 0.5148, |
|
"step": 3995 |
|
}, |
|
{ |
|
"epoch": 2.61, |
|
"learning_rate": 7.1873502635361775e-06, |
|
"loss": 0.5234, |
|
"step": 4042 |
|
}, |
|
{ |
|
"epoch": 2.64, |
|
"learning_rate": 6.624341159559177e-06, |
|
"loss": 0.5286, |
|
"step": 4089 |
|
}, |
|
{ |
|
"epoch": 2.68, |
|
"learning_rate": 6.061332055582176e-06, |
|
"loss": 0.5182, |
|
"step": 4136 |
|
}, |
|
{ |
|
"epoch": 2.7, |
|
"eval_accuracy": 0.7631364746314552, |
|
"eval_b_acc": 0.6403726819328496, |
|
"eval_f1": 0.7611758530200116, |
|
"eval_f1_anger": 0.6441332689521971, |
|
"eval_f1_disgust": 0.4635036496350365, |
|
"eval_f1_fear": 0.6658725431804646, |
|
"eval_f1_joy": 0.7548551093035079, |
|
"eval_f1_neutral": 0.848629209284947, |
|
"eval_f1_sadness": 0.6971687429218574, |
|
"eval_f1_surprise": 0.4763636363636364, |
|
"eval_loss": 0.6621036529541016, |
|
"eval_prec": 0.7602393679680954, |
|
"eval_prec_anger": 0.6491484184914842, |
|
"eval_prec_disgust": 0.47388059701492535, |
|
"eval_prec_fear": 0.6783980582524272, |
|
"eval_prec_joy": 0.734322453016815, |
|
"eval_prec_neutral": 0.844409331722279, |
|
"eval_prec_sadness": 0.7108545034642032, |
|
"eval_prec_surprise": 0.5458333333333333, |
|
"eval_recall": 0.7631364746314552, |
|
"eval_recall_anger": 0.639195016770484, |
|
"eval_recall_disgust": 0.45357142857142857, |
|
"eval_recall_fear": 0.6538011695906433, |
|
"eval_recall_joy": 0.7765690376569038, |
|
"eval_recall_neutral": 0.8528914757791964, |
|
"eval_recall_sadness": 0.684, |
|
"eval_recall_surprise": 0.42258064516129035, |
|
"eval_runtime": 14.5758, |
|
"eval_samples_per_second": 1517.169, |
|
"eval_steps_per_second": 11.869, |
|
"step": 4176 |
|
} |
|
], |
|
"max_steps": 4638, |
|
"num_train_epochs": 3, |
|
"total_flos": 3.51500575835136e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|