| [ | |
| { | |
| "step": 100, | |
| "epoch": 0.111358574610245, | |
| "loss": 0.6139, | |
| "grad_norm": 0.6548389792442322, | |
| "learning_rate": 2.7500000000000004e-06 | |
| }, | |
| { | |
| "step": 200, | |
| "epoch": 0.22271714922049, | |
| "loss": 0.4821, | |
| "grad_norm": 1.2604601383209229, | |
| "learning_rate": 5.527777777777779e-06 | |
| }, | |
| { | |
| "step": 200, | |
| "epoch": 0.22271714922049, | |
| "eval_loss": 0.41080573201179504, | |
| "eval_f1_micro": 0.8395441892832289, | |
| "eval_f1_macro": 0.7509803650720916, | |
| "eval_f1_weighted": 0.8265873475311692, | |
| "eval_accuracy": 0.35198329853862215, | |
| "eval_subset_accuracy": 0.8395441892832289, | |
| "eval_f1_label_rado\u015b\u0107": 0.19078947368421054, | |
| "eval_f1_label_wstr\u0119t": 0.5752023860247124, | |
| "eval_f1_label_gniew": 0.6845324788814448, | |
| "eval_f1_label_przeczuwanie": 0.0, | |
| "eval_f1_label_pozytywny": 0.42994241842610365, | |
| "eval_f1_label_negatywny": 0.7949462182004439, | |
| "eval_f1_label_neutralny": 0.7492940069030436, | |
| "eval_f1_label_sarkazm": 0.0, | |
| "eval_runtime": 13.553, | |
| "eval_samples_per_second": 530.14, | |
| "eval_steps_per_second": 16.601 | |
| }, | |
| { | |
| "step": 300, | |
| "epoch": 0.33407572383073497, | |
| "loss": 0.4129, | |
| "grad_norm": 1.7567846775054932, | |
| "learning_rate": 8.305555555555557e-06 | |
| }, | |
| { | |
| "step": 400, | |
| "epoch": 0.44543429844098, | |
| "loss": 0.3769, | |
| "grad_norm": 2.582125186920166, | |
| "learning_rate": 9.99640768631301e-06 | |
| }, | |
| { | |
| "step": 400, | |
| "epoch": 0.44543429844098, | |
| "eval_loss": 0.33686527609825134, | |
| "eval_f1_micro": 0.8666144745998609, | |
| "eval_f1_macro": 0.8079475306110289, | |
| "eval_f1_weighted": 0.8619885595665887, | |
| "eval_accuracy": 0.4321503131524008, | |
| "eval_subset_accuracy": 0.8666144745998609, | |
| "eval_f1_label_rado\u015b\u0107": 0.6868131868131868, | |
| "eval_f1_label_wstr\u0119t": 0.6907111262334127, | |
| "eval_f1_label_gniew": 0.7182017543859649, | |
| "eval_f1_label_przeczuwanie": 0.534637326813366, | |
| "eval_f1_label_pozytywny": 0.7161493477282951, | |
| "eval_f1_label_negatywny": 0.8120326308633583, | |
| "eval_f1_label_neutralny": 0.7886710239651417, | |
| "eval_f1_label_sarkazm": 0.005263157894736842, | |
| "eval_runtime": 13.4667, | |
| "eval_samples_per_second": 533.539, | |
| "eval_steps_per_second": 16.708 | |
| }, | |
| { | |
| "step": 500, | |
| "epoch": 0.5567928730512249, | |
| "loss": 0.3415, | |
| "grad_norm": 2.2375481128692627, | |
| "learning_rate": 9.954431380479526e-06 | |
| }, | |
| { | |
| "step": 600, | |
| "epoch": 0.6681514476614699, | |
| "loss": 0.3359, | |
| "grad_norm": 2.377732515335083, | |
| "learning_rate": 9.86568060370307e-06 | |
| }, | |
| { | |
| "step": 600, | |
| "epoch": 0.6681514476614699, | |
| "eval_loss": 0.307725727558136, | |
| "eval_f1_micro": 0.8731384829505915, | |
| "eval_f1_macro": 0.8208003215407338, | |
| "eval_f1_weighted": 0.8701057540509732, | |
| "eval_accuracy": 0.44231036882393876, | |
| "eval_subset_accuracy": 0.8731384829505915, | |
| "eval_f1_label_rado\u015b\u0107": 0.7128842380640942, | |
| "eval_f1_label_wstr\u0119t": 0.6842447916666666, | |
| "eval_f1_label_gniew": 0.7346007604562738, | |
| "eval_f1_label_przeczuwanie": 0.6198969480776853, | |
| "eval_f1_label_pozytywny": 0.7572641931157801, | |
| "eval_f1_label_negatywny": 0.8233744855967078, | |
| "eval_f1_label_neutralny": 0.7887421820708825, | |
| "eval_f1_label_sarkazm": 0.18295543393275998, | |
| "eval_runtime": 13.3682, | |
| "eval_samples_per_second": 537.472, | |
| "eval_steps_per_second": 16.831 | |
| }, | |
| { | |
| "step": 700, | |
| "epoch": 0.779510022271715, | |
| "loss": 0.3179, | |
| "grad_norm": 2.0692615509033203, | |
| "learning_rate": 9.730993246411562e-06 | |
| }, | |
| { | |
| "step": 800, | |
| "epoch": 0.89086859688196, | |
| "loss": 0.3184, | |
| "grad_norm": 3.814361095428467, | |
| "learning_rate": 9.551640883362268e-06 | |
| }, | |
| { | |
| "step": 800, | |
| "epoch": 0.89086859688196, | |
| "eval_loss": 0.29314953088760376, | |
| "eval_f1_micro": 0.8788100208768267, | |
| "eval_f1_macro": 0.8300609729014572, | |
| "eval_f1_weighted": 0.8763999627004312, | |
| "eval_accuracy": 0.4701461377870564, | |
| "eval_subset_accuracy": 0.8788100208768267, | |
| "eval_f1_label_rado\u015b\u0107": 0.6844694307800422, | |
| "eval_f1_label_wstr\u0119t": 0.7084769124741558, | |
| "eval_f1_label_gniew": 0.7435356200527704, | |
| "eval_f1_label_przeczuwanie": 0.6724700761697497, | |
| "eval_f1_label_pozytywny": 0.7029945999018163, | |
| "eval_f1_label_negatywny": 0.8380327868852459, | |
| "eval_f1_label_neutralny": 0.8036529680365296, | |
| "eval_f1_label_sarkazm": 0.3567289117836446, | |
| "eval_runtime": 13.6772, | |
| "eval_samples_per_second": 525.325, | |
| "eval_steps_per_second": 16.451 | |
| }, | |
| { | |
| "step": 900, | |
| "epoch": 1.0022271714922049, | |
| "loss": 0.3097, | |
| "grad_norm": 2.8335301876068115, | |
| "learning_rate": 9.329316768785544e-06 | |
| }, | |
| { | |
| "step": 1000, | |
| "epoch": 1.1135857461024499, | |
| "loss": 0.2756, | |
| "grad_norm": 1.909611701965332, | |
| "learning_rate": 9.066119850479551e-06 | |
| }, | |
| { | |
| "step": 1000, | |
| "epoch": 1.1135857461024499, | |
| "eval_loss": 0.28486499190330505, | |
| "eval_f1_micro": 0.8823938761308281, | |
| "eval_f1_macro": 0.8361271998835582, | |
| "eval_f1_weighted": 0.8804578924937377, | |
| "eval_accuracy": 0.4810020876826722, | |
| "eval_subset_accuracy": 0.8823938761308281, | |
| "eval_f1_label_rado\u015b\u0107": 0.7310513447432763, | |
| "eval_f1_label_wstr\u0119t": 0.7109237794169301, | |
| "eval_f1_label_gniew": 0.7485624673288029, | |
| "eval_f1_label_przeczuwanie": 0.681491618200479, | |
| "eval_f1_label_pozytywny": 0.7727272727272727, | |
| "eval_f1_label_negatywny": 0.8409730266423961, | |
| "eval_f1_label_neutralny": 0.8091783364265227, | |
| "eval_f1_label_sarkazm": 0.3149171270718232, | |
| "eval_runtime": 14.7594, | |
| "eval_samples_per_second": 486.807, | |
| "eval_steps_per_second": 15.244 | |
| }, | |
| { | |
| "step": 1100, | |
| "epoch": 1.2249443207126949, | |
| "loss": 0.2685, | |
| "grad_norm": 4.029219150543213, | |
| "learning_rate": 8.764534953777842e-06 | |
| }, | |
| { | |
| "step": 1200, | |
| "epoch": 1.3363028953229399, | |
| "loss": 0.2622, | |
| "grad_norm": 1.7298495769500732, | |
| "learning_rate": 8.427409322471743e-06 | |
| }, | |
| { | |
| "step": 1200, | |
| "epoch": 1.3363028953229399, | |
| "eval_loss": 0.28199732303619385, | |
| "eval_f1_micro": 0.881419624217119, | |
| "eval_f1_macro": 0.8361219089623048, | |
| "eval_f1_weighted": 0.8799866455346702, | |
| "eval_accuracy": 0.4683368128044537, | |
| "eval_subset_accuracy": 0.881419624217119, | |
| "eval_f1_label_rado\u015b\u0107": 0.7399756986634265, | |
| "eval_f1_label_wstr\u0119t": 0.7199725463280714, | |
| "eval_f1_label_gniew": 0.7479035639412998, | |
| "eval_f1_label_przeczuwanie": 0.7060367454068242, | |
| "eval_f1_label_pozytywny": 0.7732656514382402, | |
| "eval_f1_label_negatywny": 0.8449914316871787, | |
| "eval_f1_label_neutralny": 0.7788461538461539, | |
| "eval_f1_label_sarkazm": 0.4, | |
| "eval_runtime": 13.3959, | |
| "eval_samples_per_second": 536.358, | |
| "eval_steps_per_second": 16.796 | |
| }, | |
| { | |
| "step": 1300, | |
| "epoch": 1.447661469933185, | |
| "loss": 0.2689, | |
| "grad_norm": 2.291908025741577, | |
| "learning_rate": 8.057925738163153e-06 | |
| }, | |
| { | |
| "step": 1400, | |
| "epoch": 1.5590200445434297, | |
| "loss": 0.2653, | |
| "grad_norm": 2.64717960357666, | |
| "learning_rate": 7.659572471826265e-06 | |
| }, | |
| { | |
| "step": 1400, | |
| "epoch": 1.5590200445434297, | |
| "eval_loss": 0.27665975689888, | |
| "eval_f1_micro": 0.8838726513569938, | |
| "eval_f1_macro": 0.8415650899916123, | |
| "eval_f1_weighted": 0.8832473603278248, | |
| "eval_accuracy": 0.48434237995824636, | |
| "eval_subset_accuracy": 0.8838726513569938, | |
| "eval_f1_label_rado\u015b\u0107": 0.7375621890547264, | |
| "eval_f1_label_wstr\u0119t": 0.7300771208226221, | |
| "eval_f1_label_gniew": 0.7580278128950695, | |
| "eval_f1_label_przeczuwanie": 0.6951871657754011, | |
| "eval_f1_label_pozytywny": 0.777292576419214, | |
| "eval_f1_label_negatywny": 0.8478637868516475, | |
| "eval_f1_label_neutralny": 0.8011984490659148, | |
| "eval_f1_label_sarkazm": 0.47809206877426513, | |
| "eval_runtime": 13.39, | |
| "eval_samples_per_second": 536.594, | |
| "eval_steps_per_second": 16.804 | |
| }, | |
| { | |
| "step": 1500, | |
| "epoch": 1.670378619153675, | |
| "loss": 0.2551, | |
| "grad_norm": 2.742314100265503, | |
| "learning_rate": 7.236110351263578e-06 | |
| }, | |
| { | |
| "step": 1600, | |
| "epoch": 1.7817371937639197, | |
| "loss": 0.253, | |
| "grad_norm": 2.0853464603424072, | |
| "learning_rate": 6.7915372553702926e-06 | |
| }, | |
| { | |
| "step": 1600, | |
| "epoch": 1.7817371937639197, | |
| "eval_loss": 0.27193114161491394, | |
| "eval_f1_micro": 0.8862908837856646, | |
| "eval_f1_macro": 0.8419394716369004, | |
| "eval_f1_weighted": 0.8845662361245985, | |
| "eval_accuracy": 0.49255393180236606, | |
| "eval_subset_accuracy": 0.8862908837856646, | |
| "eval_f1_label_rado\u015b\u0107": 0.7449786975045648, | |
| "eval_f1_label_wstr\u0119t": 0.7020958083832335, | |
| "eval_f1_label_gniew": 0.745141588006663, | |
| "eval_f1_label_przeczuwanie": 0.7135483870967742, | |
| "eval_f1_label_pozytywny": 0.7725178047758693, | |
| "eval_f1_label_negatywny": 0.8427041499330656, | |
| "eval_f1_label_neutralny": 0.8148646376324197, | |
| "eval_f1_label_sarkazm": 0.45395894428152495, | |
| "eval_runtime": 13.4458, | |
| "eval_samples_per_second": 534.368, | |
| "eval_steps_per_second": 16.734 | |
| }, | |
| { | |
| "step": 1700, | |
| "epoch": 1.893095768374165, | |
| "loss": 0.2502, | |
| "grad_norm": 2.6639328002929688, | |
| "learning_rate": 6.330050370414403e-06 | |
| }, | |
| { | |
| "step": 1800, | |
| "epoch": 2.0044543429844097, | |
| "loss": 0.2511, | |
| "grad_norm": 2.5934195518493652, | |
| "learning_rate": 5.856006564668624e-06 | |
| }, | |
| { | |
| "step": 1800, | |
| "epoch": 2.0044543429844097, | |
| "eval_loss": 0.2889347970485687, | |
| "eval_f1_micro": 0.8771746694502436, | |
| "eval_f1_macro": 0.8367166256068449, | |
| "eval_f1_weighted": 0.8780966128511206, | |
| "eval_accuracy": 0.46583159359777315, | |
| "eval_subset_accuracy": 0.8771746694502436, | |
| "eval_f1_label_rado\u015b\u0107": 0.7299448867115738, | |
| "eval_f1_label_wstr\u0119t": 0.7176891006551519, | |
| "eval_f1_label_gniew": 0.7512172501738928, | |
| "eval_f1_label_przeczuwanie": 0.7179814755669115, | |
| "eval_f1_label_pozytywny": 0.7771623348956114, | |
| "eval_f1_label_negatywny": 0.8434200743494423, | |
| "eval_f1_label_neutralny": 0.7797117724125023, | |
| "eval_f1_label_sarkazm": 0.5232903865213082, | |
| "eval_runtime": 13.5639, | |
| "eval_samples_per_second": 529.716, | |
| "eval_steps_per_second": 16.588 | |
| }, | |
| { | |
| "step": 1900, | |
| "epoch": 2.115812917594655, | |
| "loss": 0.2128, | |
| "grad_norm": 2.778862714767456, | |
| "learning_rate": 5.373881255494652e-06 | |
| }, | |
| { | |
| "step": 2000, | |
| "epoch": 2.2271714922048997, | |
| "loss": 0.2068, | |
| "grad_norm": 2.1749610900878906, | |
| "learning_rate": 4.888226157213061e-06 | |
| }, | |
| { | |
| "step": 2000, | |
| "epoch": 2.2271714922048997, | |
| "eval_loss": 0.2712438106536865, | |
| "eval_f1_micro": 0.8896659707724426, | |
| "eval_f1_macro": 0.8469364739492785, | |
| "eval_f1_weighted": 0.8881098685832289, | |
| "eval_accuracy": 0.5082811412665275, | |
| "eval_subset_accuracy": 0.8896659707724426, | |
| "eval_f1_label_rado\u015b\u0107": 0.7382636655948553, | |
| "eval_f1_label_wstr\u0119t": 0.7270175438596491, | |
| "eval_f1_label_gniew": 0.7617009895694036, | |
| "eval_f1_label_przeczuwanie": 0.7022071307300509, | |
| "eval_f1_label_pozytywny": 0.7810858143607706, | |
| "eval_f1_label_negatywny": 0.8477131847880717, | |
| "eval_f1_label_neutralny": 0.8223467369808833, | |
| "eval_f1_label_sarkazm": 0.46941176470588236, | |
| "eval_runtime": 13.4837, | |
| "eval_samples_per_second": 532.864, | |
| "eval_steps_per_second": 16.687 | |
| }, | |
| { | |
| "step": 2100, | |
| "epoch": 2.338530066815145, | |
| "loss": 0.2042, | |
| "grad_norm": 3.2917253971099854, | |
| "learning_rate": 4.403626308658459e-06 | |
| }, | |
| { | |
| "step": 2200, | |
| "epoch": 2.4498886414253898, | |
| "loss": 0.2097, | |
| "grad_norm": 2.2220280170440674, | |
| "learning_rate": 3.9246567861200166e-06 | |
| }, | |
| { | |
| "step": 2200, | |
| "epoch": 2.4498886414253898, | |
| "eval_loss": 0.2748867869377136, | |
| "eval_f1_micro": 0.8878044537230341, | |
| "eval_f1_macro": 0.8475632085047498, | |
| "eval_f1_weighted": 0.8874379181538837, | |
| "eval_accuracy": 0.4989561586638831, | |
| "eval_subset_accuracy": 0.8878044537230341, | |
| "eval_f1_label_rado\u015b\u0107": 0.7484811664641555, | |
| "eval_f1_label_wstr\u0119t": 0.7377866400797607, | |
| "eval_f1_label_gniew": 0.75792897804283, | |
| "eval_f1_label_przeczuwanie": 0.7263442475217783, | |
| "eval_f1_label_pozytywny": 0.7774578362813657, | |
| "eval_f1_label_negatywny": 0.8532080362929358, | |
| "eval_f1_label_neutralny": 0.8129346314325452, | |
| "eval_f1_label_sarkazm": 0.5211047420531527, | |
| "eval_runtime": 13.5472, | |
| "eval_samples_per_second": 530.369, | |
| "eval_steps_per_second": 16.609 | |
| }, | |
| { | |
| "step": 2300, | |
| "epoch": 2.5612472160356345, | |
| "loss": 0.202, | |
| "grad_norm": 4.778714179992676, | |
| "learning_rate": 3.4558395103377882e-06 | |
| }, | |
| { | |
| "step": 2400, | |
| "epoch": 2.6726057906458798, | |
| "loss": 0.2042, | |
| "grad_norm": 2.9350364208221436, | |
| "learning_rate": 3.0016005553371464e-06 | |
| }, | |
| { | |
| "step": 2400, | |
| "epoch": 2.6726057906458798, | |
| "eval_loss": 0.27490347623825073, | |
| "eval_f1_micro": 0.8879262352122478, | |
| "eval_f1_macro": 0.8486039951352532, | |
| "eval_f1_weighted": 0.8878859652865869, | |
| "eval_accuracy": 0.5029923451635352, | |
| "eval_subset_accuracy": 0.8879262352122478, | |
| "eval_f1_label_rado\u015b\u0107": 0.7540394973070018, | |
| "eval_f1_label_wstr\u0119t": 0.7323117052494295, | |
| "eval_f1_label_gniew": 0.7653221581980094, | |
| "eval_f1_label_przeczuwanie": 0.7192023158571889, | |
| "eval_f1_label_pozytywny": 0.7812627291242362, | |
| "eval_f1_label_negatywny": 0.8546814044213265, | |
| "eval_f1_label_neutralny": 0.8173642338291248, | |
| "eval_f1_label_sarkazm": 0.5525328330206379, | |
| "eval_runtime": 13.5014, | |
| "eval_samples_per_second": 532.167, | |
| "eval_steps_per_second": 16.665 | |
| }, | |
| { | |
| "step": 2500, | |
| "epoch": 2.7839643652561246, | |
| "loss": 0.1985, | |
| "grad_norm": 3.124579906463623, | |
| "learning_rate": 2.566228362145968e-06 | |
| }, | |
| { | |
| "step": 2600, | |
| "epoch": 2.89532293986637, | |
| "loss": 0.2071, | |
| "grad_norm": 2.5567288398742676, | |
| "learning_rate": 2.1538332518961635e-06 | |
| }, | |
| { | |
| "step": 2600, | |
| "epoch": 2.89532293986637, | |
| "eval_loss": 0.2728336453437805, | |
| "eval_f1_micro": 0.8903096729297146, | |
| "eval_f1_macro": 0.8485724561583636, | |
| "eval_f1_weighted": 0.8890469205384153, | |
| "eval_accuracy": 0.5102296450939457, | |
| "eval_subset_accuracy": 0.8903096729297146, | |
| "eval_f1_label_rado\u015b\u0107": 0.7517985611510791, | |
| "eval_f1_label_wstr\u0119t": 0.7267462902642056, | |
| "eval_f1_label_gniew": 0.7664253150978815, | |
| "eval_f1_label_przeczuwanie": 0.7165740438051651, | |
| "eval_f1_label_pozytywny": 0.7838400666389005, | |
| "eval_f1_label_negatywny": 0.8534298404342819, | |
| "eval_f1_label_neutralny": 0.8198167628096369, | |
| "eval_f1_label_sarkazm": 0.4584795321637427, | |
| "eval_runtime": 13.4, | |
| "eval_samples_per_second": 536.194, | |
| "eval_steps_per_second": 16.791 | |
| }, | |
| { | |
| "step": 2700, | |
| "epoch": 3.0066815144766146, | |
| "loss": 0.2014, | |
| "grad_norm": 3.9624898433685303, | |
| "learning_rate": 1.76830862054381e-06 | |
| }, | |
| { | |
| "step": 2800, | |
| "epoch": 3.11804008908686, | |
| "loss": 0.1767, | |
| "grad_norm": 1.9180693626403809, | |
| "learning_rate": 1.4132941815660222e-06 | |
| }, | |
| { | |
| "step": 2800, | |
| "epoch": 3.11804008908686, | |
| "eval_loss": 0.2742355167865753, | |
| "eval_f1_micro": 0.8887265135699374, | |
| "eval_f1_macro": 0.8473642910777622, | |
| "eval_f1_weighted": 0.8878169372581985, | |
| "eval_accuracy": 0.5039665970772442, | |
| "eval_subset_accuracy": 0.8887265135699374, | |
| "eval_f1_label_rado\u015b\u0107": 0.745920745920746, | |
| "eval_f1_label_wstr\u0119t": 0.7262289199856476, | |
| "eval_f1_label_gniew": 0.7623196297304655, | |
| "eval_f1_label_przeczuwanie": 0.7178329571106095, | |
| "eval_f1_label_pozytywny": 0.7777777777777778, | |
| "eval_f1_label_negatywny": 0.8542283645936163, | |
| "eval_f1_label_neutralny": 0.8082359099633571, | |
| "eval_f1_label_sarkazm": 0.5346432264736298, | |
| "eval_runtime": 16.0479, | |
| "eval_samples_per_second": 447.723, | |
| "eval_steps_per_second": 14.021 | |
| }, | |
| { | |
| "step": 2900, | |
| "epoch": 3.2293986636971046, | |
| "loss": 0.1773, | |
| "grad_norm": 2.348484992980957, | |
| "learning_rate": 1.092141603657972e-06 | |
| }, | |
| { | |
| "step": 3000, | |
| "epoch": 3.34075723830735, | |
| "loss": 0.173, | |
| "grad_norm": 2.2864317893981934, | |
| "learning_rate": 8.078828678422995e-07 | |
| }, | |
| { | |
| "step": 3000, | |
| "epoch": 3.34075723830735, | |
| "eval_loss": 0.27491486072540283, | |
| "eval_f1_micro": 0.889544189283229, | |
| "eval_f1_macro": 0.8494136493629865, | |
| "eval_f1_weighted": 0.8889910470048148, | |
| "eval_accuracy": 0.508141962421712, | |
| "eval_subset_accuracy": 0.889544189283229, | |
| "eval_f1_label_rado\u015b\u0107": 0.7475728155339806, | |
| "eval_f1_label_wstr\u0119t": 0.7339011925042589, | |
| "eval_f1_label_gniew": 0.7665431445209105, | |
| "eval_f1_label_przeczuwanie": 0.7226675216415518, | |
| "eval_f1_label_pozytywny": 0.781314592806945, | |
| "eval_f1_label_negatywny": 0.8550937245313773, | |
| "eval_f1_label_neutralny": 0.8155373032169747, | |
| "eval_f1_label_sarkazm": 0.5287713841368584, | |
| "eval_runtime": 13.5687, | |
| "eval_samples_per_second": 529.527, | |
| "eval_steps_per_second": 16.582 | |
| }, | |
| { | |
| "step": 3100, | |
| "epoch": 3.4521158129175946, | |
| "loss": 0.1756, | |
| "grad_norm": 2.671910524368286, | |
| "learning_rate": 5.632016427295134e-07 | |
| }, | |
| { | |
| "step": 3200, | |
| "epoch": 3.5634743875278394, | |
| "loss": 0.1695, | |
| "grad_norm": 3.2793824672698975, | |
| "learning_rate": 3.6040794817364335e-07 | |
| }, | |
| { | |
| "step": 3200, | |
| "epoch": 3.5634743875278394, | |
| "eval_loss": 0.27663180232048035, | |
| "eval_f1_micro": 0.889544189283229, | |
| "eval_f1_macro": 0.8495682589006989, | |
| "eval_f1_weighted": 0.8890490603152431, | |
| "eval_accuracy": 0.511482254697286, | |
| "eval_subset_accuracy": 0.889544189283229, | |
| "eval_f1_label_rado\u015b\u0107": 0.7479091995221028, | |
| "eval_f1_label_wstr\u0119t": 0.731740614334471, | |
| "eval_f1_label_gniew": 0.7687056970333421, | |
| "eval_f1_label_przeczuwanie": 0.7237728585178056, | |
| "eval_f1_label_pozytywny": 0.7816091954022989, | |
| "eval_f1_label_negatywny": 0.8545868575146389, | |
| "eval_f1_label_neutralny": 0.8166494668042655, | |
| "eval_f1_label_sarkazm": 0.527850078084331, | |
| "eval_runtime": 13.4661, | |
| "eval_samples_per_second": 533.56, | |
| "eval_steps_per_second": 16.709 | |
| }, | |
| { | |
| "step": 3300, | |
| "epoch": 3.6748329621380846, | |
| "loss": 0.167, | |
| "grad_norm": 1.78013277053833, | |
| "learning_rate": 2.0141634652200205e-07 | |
| }, | |
| { | |
| "step": 3400, | |
| "epoch": 3.78619153674833, | |
| "loss": 0.172, | |
| "grad_norm": 2.706618070602417, | |
| "learning_rate": 8.772786735407601e-08 | |
| }, | |
| { | |
| "step": 3400, | |
| "epoch": 3.78619153674833, | |
| "eval_loss": 0.2760503590106964, | |
| "eval_f1_micro": 0.8900487125956854, | |
| "eval_f1_macro": 0.8500096117258309, | |
| "eval_f1_weighted": 0.8894635900360007, | |
| "eval_accuracy": 0.5124565066109952, | |
| "eval_subset_accuracy": 0.8900487125956854, | |
| "eval_f1_label_rado\u015b\u0107": 0.7476190476190476, | |
| "eval_f1_label_wstr\u0119t": 0.7336787564766839, | |
| "eval_f1_label_gniew": 0.7693124502256438, | |
| "eval_f1_label_przeczuwanie": 0.7220240025948751, | |
| "eval_f1_label_pozytywny": 0.7813649366571311, | |
| "eval_f1_label_negatywny": 0.8553212358999509, | |
| "eval_f1_label_neutralny": 0.8172006167551824, | |
| "eval_f1_label_sarkazm": 0.5337423312883436, | |
| "eval_runtime": 13.4196, | |
| "eval_samples_per_second": 535.411, | |
| "eval_steps_per_second": 16.767 | |
| } | |
| ] |