{ "best_metric": 0.090567946434021, "best_model_checkpoint": "/home/jcanete/ft-data/all_results/pos/albeto_base_2/epochs_4_bs_16_lr_5e-5/checkpoint-2650", "epoch": 4.0, "global_step": 3580, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.06, "eval_accuracy": 0.8647261144338456, "eval_f1": 0.8347301307241961, "eval_loss": 0.5675407648086548, "eval_precision": 0.8376692621878835, "eval_recall": 0.831811552216739, "eval_runtime": 2.1288, "eval_samples_per_second": 776.962, "eval_steps_per_second": 48.854, "step": 50 }, { "epoch": 0.11, "eval_accuracy": 0.9262465901967096, "eval_f1": 0.9161967839136014, "eval_loss": 0.27364614605903625, "eval_precision": 0.9120698530867619, "eval_recall": 0.9203612315438253, "eval_runtime": 2.143, "eval_samples_per_second": 771.822, "eval_steps_per_second": 48.531, "step": 100 }, { "epoch": 0.17, "eval_accuracy": 0.939106419748903, "eval_f1": 0.93049913086665, "eval_loss": 0.2097783237695694, "eval_precision": 0.9252330910240202, "eval_recall": 0.9358254580328066, "eval_runtime": 2.134, "eval_samples_per_second": 775.068, "eval_steps_per_second": 48.735, "step": 150 }, { "epoch": 0.22, "eval_accuracy": 0.9438166076481252, "eval_f1": 0.9369849926356434, "eval_loss": 0.18860450387001038, "eval_precision": 0.9334364404259116, "eval_recall": 0.9405606281592775, "eval_runtime": 2.1394, "eval_samples_per_second": 773.12, "eval_steps_per_second": 48.612, "step": 200 }, { "epoch": 0.28, "eval_accuracy": 0.9517968180816997, "eval_f1": 0.9457094561002287, "eval_loss": 0.1621113270521164, "eval_precision": 0.9413290049288386, "eval_recall": 0.9501308665161535, "eval_runtime": 2.1281, "eval_samples_per_second": 777.203, "eval_steps_per_second": 48.869, "step": 250 }, { "epoch": 0.34, "eval_accuracy": 0.9550160112502329, "eval_f1": 0.9493230481719319, "eval_loss": 0.15087193250656128, "eval_precision": 0.9446653609511939, "eval_recall": 0.9540268925695791, "eval_runtime": 2.298, "eval_samples_per_second": 719.743, "eval_steps_per_second": 45.256, "step": 300 }, { "epoch": 0.39, "eval_accuracy": 0.9569475271513529, "eval_f1": 0.9518080688370796, "eval_loss": 0.14275319874286652, "eval_precision": 0.9488880063542494, "eval_recall": 0.9547461589179037, "eval_runtime": 2.1296, "eval_samples_per_second": 776.672, "eval_steps_per_second": 48.836, "step": 350 }, { "epoch": 0.45, "eval_accuracy": 0.9599125734907914, "eval_f1": 0.9552152672059542, "eval_loss": 0.13306136429309845, "eval_precision": 0.9514191706969001, "eval_recall": 0.9590417773870652, "eval_runtime": 2.1348, "eval_samples_per_second": 774.763, "eval_steps_per_second": 48.715, "step": 400 }, { "epoch": 0.5, "eval_accuracy": 0.9615729994408769, "eval_f1": 0.9574688383576919, "eval_loss": 0.1282903254032135, "eval_precision": 0.9542198321195404, "eval_recall": 0.960740045153943, "eval_runtime": 2.1298, "eval_samples_per_second": 776.615, "eval_steps_per_second": 48.832, "step": 450 }, { "epoch": 0.56, "learning_rate": 4.301675977653631e-05, "loss": 0.3237, "step": 500 }, { "epoch": 0.56, "eval_accuracy": 0.9627081886108334, "eval_f1": 0.9586143012241402, "eval_loss": 0.12317304313182831, "eval_precision": 0.955805823699996, "eval_recall": 0.9614393318814809, "eval_runtime": 2.1308, "eval_samples_per_second": 776.237, "eval_steps_per_second": 48.808, "step": 500 }, { "epoch": 0.61, "eval_accuracy": 0.9631487097812643, "eval_f1": 0.9595639523297063, "eval_loss": 0.12186494469642639, "eval_precision": 0.9571414372328795, "eval_recall": 0.9619987612635112, "eval_runtime": 2.1344, "eval_samples_per_second": 774.932, "eval_steps_per_second": 48.726, "step": 550 }, { "epoch": 0.67, "eval_accuracy": 0.9634875722200573, "eval_f1": 0.958921835030408, "eval_loss": 0.11784511059522629, "eval_precision": 0.9554506505871152, "eval_recall": 0.962418333300034, "eval_runtime": 2.1352, "eval_samples_per_second": 774.645, "eval_steps_per_second": 48.708, "step": 600 }, { "epoch": 0.73, "eval_accuracy": 0.9650971688043238, "eval_f1": 0.9605728341947756, "eval_loss": 0.11247887462377548, "eval_precision": 0.9576069258567967, "eval_recall": 0.9635571716848814, "eval_runtime": 2.1435, "eval_samples_per_second": 771.651, "eval_steps_per_second": 48.52, "step": 650 }, { "epoch": 0.78, "eval_accuracy": 0.964944680706867, "eval_f1": 0.9602157922501917, "eval_loss": 0.11355415731668472, "eval_precision": 0.9567399238337035, "eval_recall": 0.9637170086511758, "eval_runtime": 2.2141, "eval_samples_per_second": 747.036, "eval_steps_per_second": 46.972, "step": 700 }, { "epoch": 0.84, "eval_accuracy": 0.9651310550482032, "eval_f1": 0.9611485310065565, "eval_loss": 0.1140877828001976, "eval_precision": 0.9572532699167657, "eval_recall": 0.9650756228646781, "eval_runtime": 2.1438, "eval_samples_per_second": 771.53, "eval_steps_per_second": 48.512, "step": 750 }, { "epoch": 0.89, "eval_accuracy": 0.966927025973806, "eval_f1": 0.9630610538054083, "eval_loss": 0.10770992189645767, "eval_precision": 0.9598690086335219, "eval_recall": 0.9662744001118859, "eval_runtime": 2.2364, "eval_samples_per_second": 739.577, "eval_steps_per_second": 46.503, "step": 800 }, { "epoch": 0.95, "eval_accuracy": 0.96721505904678, "eval_f1": 0.9637699922321589, "eval_loss": 0.10767628997564316, "eval_precision": 0.9607847030558148, "eval_recall": 0.9667738906315558, "eval_runtime": 2.1375, "eval_samples_per_second": 773.803, "eval_steps_per_second": 48.655, "step": 850 }, { "epoch": 1.01, "eval_accuracy": 0.9668592534860473, "eval_f1": 0.9632716541713192, "eval_loss": 0.10464677959680557, "eval_precision": 0.9613356416532346, "eval_recall": 0.9652154802101857, "eval_runtime": 2.1343, "eval_samples_per_second": 774.949, "eval_steps_per_second": 48.727, "step": 900 }, { "epoch": 1.06, "eval_accuracy": 0.967164229680961, "eval_f1": 0.964045682196091, "eval_loss": 0.10587447881698608, "eval_precision": 0.9608788853161844, "eval_recall": 0.9672334219096521, "eval_runtime": 2.1299, "eval_samples_per_second": 776.577, "eval_steps_per_second": 48.83, "step": 950 }, { "epoch": 1.12, "learning_rate": 3.603351955307263e-05, "loss": 0.1016, "step": 1000 }, { "epoch": 1.12, "eval_accuracy": 0.9680961013876417, "eval_f1": 0.964487843762455, "eval_loss": 0.10317474603652954, "eval_precision": 0.962014748852094, "eval_recall": 0.9669736868394238, "eval_runtime": 2.136, "eval_samples_per_second": 774.328, "eval_steps_per_second": 48.688, "step": 1000 }, { "epoch": 1.17, "eval_accuracy": 0.9681638738754003, "eval_f1": 0.9649510829497678, "eval_loss": 0.10267002880573273, "eval_precision": 0.9623432625240943, "eval_recall": 0.9675730754630277, "eval_runtime": 2.1373, "eval_samples_per_second": 773.858, "eval_steps_per_second": 48.659, "step": 1050 }, { "epoch": 1.23, "eval_accuracy": 0.9678419545585469, "eval_f1": 0.9647576653820493, "eval_loss": 0.10265430808067322, "eval_precision": 0.9617217280813215, "eval_recall": 0.9678128309124693, "eval_runtime": 2.2158, "eval_samples_per_second": 746.462, "eval_steps_per_second": 46.936, "step": 1100 }, { "epoch": 1.28, "eval_accuracy": 0.9681638738754003, "eval_f1": 0.9656238468979685, "eval_loss": 0.10431361943483353, "eval_precision": 0.9639799291147306, "eval_recall": 0.9672733811512257, "eval_runtime": 2.1356, "eval_samples_per_second": 774.507, "eval_steps_per_second": 48.699, "step": 1150 }, { "epoch": 1.34, "eval_accuracy": 0.9690279730943223, "eval_f1": 0.9660102697043721, "eval_loss": 0.09999706596136093, "eval_precision": 0.9641549239710214, "eval_recall": 0.9678727697748297, "eval_runtime": 2.1302, "eval_samples_per_second": 776.464, "eval_steps_per_second": 48.822, "step": 1200 }, { "epoch": 1.4, "eval_accuracy": 0.9696887548499686, "eval_f1": 0.9667211350683513, "eval_loss": 0.09862436354160309, "eval_precision": 0.9642040824439012, "eval_recall": 0.9692513636091187, "eval_runtime": 2.1352, "eval_samples_per_second": 774.617, "eval_steps_per_second": 48.706, "step": 1250 }, { "epoch": 1.45, "eval_accuracy": 0.969722641093848, "eval_f1": 0.9668191649473233, "eval_loss": 0.09789332747459412, "eval_precision": 0.9646366203906281, "eval_recall": 0.9690116081596771, "eval_runtime": 2.1358, "eval_samples_per_second": 774.418, "eval_steps_per_second": 48.694, "step": 1300 }, { "epoch": 1.51, "eval_accuracy": 0.9700276172887616, "eval_f1": 0.9670270539584476, "eval_loss": 0.09716714918613434, "eval_precision": 0.9645952608142494, "eval_recall": 0.9694711394377735, "eval_runtime": 2.2431, "eval_samples_per_second": 737.37, "eval_steps_per_second": 46.364, "step": 1350 }, { "epoch": 1.56, "eval_accuracy": 0.9706545128005286, "eval_f1": 0.9676860072340298, "eval_loss": 0.09573524445295334, "eval_precision": 0.9652142800349846, "eval_recall": 0.9701704261653114, "eval_runtime": 2.1264, "eval_samples_per_second": 777.85, "eval_steps_per_second": 48.91, "step": 1400 }, { "epoch": 1.62, "eval_accuracy": 0.9709594889954423, "eval_f1": 0.967925205326529, "eval_loss": 0.09566310793161392, "eval_precision": 0.9657497464049167, "eval_recall": 0.970110487302951, "eval_runtime": 2.1392, "eval_samples_per_second": 773.185, "eval_steps_per_second": 48.616, "step": 1450 }, { "epoch": 1.68, "learning_rate": 2.9050279329608944e-05, "loss": 0.0743, "step": 1500 }, { "epoch": 1.68, "eval_accuracy": 0.9710950339709595, "eval_f1": 0.9684382567792472, "eval_loss": 0.09543575346469879, "eval_precision": 0.9661178716296827, "eval_recall": 0.9707698147889153, "eval_runtime": 2.1291, "eval_samples_per_second": 776.851, "eval_steps_per_second": 48.847, "step": 1500 }, { "epoch": 1.73, "eval_accuracy": 0.9710103183612613, "eval_f1": 0.9679354324432046, "eval_loss": 0.09453850984573364, "eval_precision": 0.9654534973861536, "eval_recall": 0.9704301612355397, "eval_runtime": 2.1938, "eval_samples_per_second": 753.935, "eval_steps_per_second": 47.406, "step": 1550 }, { "epoch": 1.79, "eval_accuracy": 0.9709594889954423, "eval_f1": 0.9680789552387599, "eval_loss": 0.0951261818408966, "eval_precision": 0.9660757277303568, "eval_recall": 0.9700905076821642, "eval_runtime": 2.1335, "eval_samples_per_second": 775.251, "eval_steps_per_second": 48.746, "step": 1600 }, { "epoch": 1.84, "eval_accuracy": 0.9714677826536318, "eval_f1": 0.9685327588442396, "eval_loss": 0.09292884916067123, "eval_precision": 0.9669800047797339, "eval_recall": 0.9700905076821642, "eval_runtime": 2.1353, "eval_samples_per_second": 774.607, "eval_steps_per_second": 48.706, "step": 1650 }, { "epoch": 1.9, "eval_accuracy": 0.9701292760203996, "eval_f1": 0.9677001037427181, "eval_loss": 0.09427014738321304, "eval_precision": 0.9662928063430085, "eval_recall": 0.9691115062636111, "eval_runtime": 2.1273, "eval_samples_per_second": 777.503, "eval_steps_per_second": 48.888, "step": 1700 }, { "epoch": 1.96, "eval_accuracy": 0.9717049863607868, "eval_f1": 0.9692304624404251, "eval_loss": 0.09205251187086105, "eval_precision": 0.9673785402941704, "eval_recall": 0.971089488721504, "eval_runtime": 2.1221, "eval_samples_per_second": 779.408, "eval_steps_per_second": 49.008, "step": 1750 }, { "epoch": 2.01, "eval_accuracy": 0.9717727588485454, "eval_f1": 0.9690059994817724, "eval_loss": 0.09247507154941559, "eval_precision": 0.9666938418404883, "eval_recall": 0.9713292441709457, "eval_runtime": 2.1236, "eval_samples_per_second": 778.86, "eval_steps_per_second": 48.973, "step": 1800 }, { "epoch": 2.07, "eval_accuracy": 0.9717897019704851, "eval_f1": 0.969009253350351, "eval_loss": 0.09157387167215347, "eval_precision": 0.9672153990086988, "eval_recall": 0.9708097740304888, "eval_runtime": 2.2335, "eval_samples_per_second": 740.542, "eval_steps_per_second": 46.564, "step": 1850 }, { "epoch": 2.12, "eval_accuracy": 0.9720269056776402, "eval_f1": 0.9689462039823802, "eval_loss": 0.09219598025083542, "eval_precision": 0.9666341890199042, "eval_recall": 0.9712693053085852, "eval_runtime": 2.1305, "eval_samples_per_second": 776.351, "eval_steps_per_second": 48.815, "step": 1900 }, { "epoch": 2.18, "eval_accuracy": 0.9708408871418648, "eval_f1": 0.9684567439541261, "eval_loss": 0.09351955354213715, "eval_precision": 0.9667887862376553, "eval_recall": 0.9701304669237378, "eval_runtime": 2.1221, "eval_samples_per_second": 779.416, "eval_steps_per_second": 49.008, "step": 1950 }, { "epoch": 2.23, "learning_rate": 2.206703910614525e-05, "loss": 0.0615, "step": 2000 }, { "epoch": 2.23, "eval_accuracy": 0.9721455075312178, "eval_f1": 0.9688911039122852, "eval_loss": 0.09326422959566116, "eval_precision": 0.9667422524565382, "eval_recall": 0.9710495294799305, "eval_runtime": 2.219, "eval_samples_per_second": 745.381, "eval_steps_per_second": 46.868, "step": 2000 }, { "epoch": 2.29, "eval_accuracy": 0.9722132800189763, "eval_f1": 0.96901296111665, "eval_loss": 0.09226556122303009, "eval_precision": 0.967103822961651, "eval_recall": 0.9709296517552097, "eval_runtime": 2.123, "eval_samples_per_second": 779.099, "eval_steps_per_second": 48.988, "step": 2050 }, { "epoch": 2.35, "eval_accuracy": 0.9717049863607868, "eval_f1": 0.9685824213065407, "eval_loss": 0.09270057827234268, "eval_precision": 0.9664246643460964, "eval_recall": 0.9707498351681285, "eval_runtime": 2.1288, "eval_samples_per_second": 776.969, "eval_steps_per_second": 48.854, "step": 2100 }, { "epoch": 2.4, "eval_accuracy": 0.9722302231409159, "eval_f1": 0.9689141376389098, "eval_loss": 0.09301681816577911, "eval_precision": 0.9666693182722138, "eval_recall": 0.9711694072046513, "eval_runtime": 2.1326, "eval_samples_per_second": 775.588, "eval_steps_per_second": 48.767, "step": 2150 }, { "epoch": 2.46, "eval_accuracy": 0.9719252469460022, "eval_f1": 0.9685870659661645, "eval_loss": 0.09278148412704468, "eval_precision": 0.9665923833021608, "eval_recall": 0.9705899982018341, "eval_runtime": 2.1276, "eval_samples_per_second": 777.387, "eval_steps_per_second": 48.88, "step": 2200 }, { "epoch": 2.51, "eval_accuracy": 0.9719930194337608, "eval_f1": 0.9692303088937873, "eval_loss": 0.09329798072576523, "eval_precision": 0.9676956781517626, "eval_recall": 0.9707698147889153, "eval_runtime": 2.1211, "eval_samples_per_second": 779.788, "eval_steps_per_second": 49.031, "step": 2250 }, { "epoch": 2.57, "eval_accuracy": 0.9717558157266057, "eval_f1": 0.9686011044436914, "eval_loss": 0.09375003725290298, "eval_precision": 0.9664816693521115, "eval_recall": 0.9707298555473417, "eval_runtime": 2.1294, "eval_samples_per_second": 776.741, "eval_steps_per_second": 48.84, "step": 2300 }, { "epoch": 2.63, "eval_accuracy": 0.9717558157266057, "eval_f1": 0.9686278420422816, "eval_loss": 0.0936710387468338, "eval_precision": 0.9669115451233351, "eval_recall": 0.9703502427523926, "eval_runtime": 2.1262, "eval_samples_per_second": 777.923, "eval_steps_per_second": 48.914, "step": 2350 }, { "epoch": 2.68, "eval_accuracy": 0.9719760763118213, "eval_f1": 0.9692519504359799, "eval_loss": 0.0930139347910881, "eval_precision": 0.9679772034354264, "eval_recall": 0.9705300593394738, "eval_runtime": 2.1439, "eval_samples_per_second": 771.475, "eval_steps_per_second": 48.509, "step": 2400 }, { "epoch": 2.74, "eval_accuracy": 0.9723488249944935, "eval_f1": 0.9693586650983831, "eval_loss": 0.09228159487247467, "eval_precision": 0.9672375723578206, "eval_recall": 0.97148908113724, "eval_runtime": 2.1904, "eval_samples_per_second": 755.118, "eval_steps_per_second": 47.48, "step": 2450 }, { "epoch": 2.79, "learning_rate": 1.5083798882681566e-05, "loss": 0.0476, "step": 2500 }, { "epoch": 2.79, "eval_accuracy": 0.9725690855797089, "eval_f1": 0.9697827951413127, "eval_loss": 0.09134206175804138, "eval_precision": 0.9681221750990582, "eval_recall": 0.9714491218956665, "eval_runtime": 2.129, "eval_samples_per_second": 776.908, "eval_steps_per_second": 48.85, "step": 2500 }, { "epoch": 2.85, "eval_accuracy": 0.9723996543603124, "eval_f1": 0.9693912141817385, "eval_loss": 0.09225371479988098, "eval_precision": 0.967500547296356, "eval_recall": 0.971289284929372, "eval_runtime": 2.1338, "eval_samples_per_second": 775.13, "eval_steps_per_second": 48.739, "step": 2550 }, { "epoch": 2.91, "eval_accuracy": 0.9726199149455279, "eval_f1": 0.9692855220264976, "eval_loss": 0.09092037379741669, "eval_precision": 0.9672701949860725, "eval_recall": 0.9713092645501589, "eval_runtime": 2.1425, "eval_samples_per_second": 772.0, "eval_steps_per_second": 48.542, "step": 2600 }, { "epoch": 2.96, "eval_accuracy": 0.9727893461649243, "eval_f1": 0.9692160459366775, "eval_loss": 0.090567946434021, "eval_precision": 0.967191261614373, "eval_recall": 0.9712493256877984, "eval_runtime": 2.1343, "eval_samples_per_second": 774.944, "eval_steps_per_second": 48.727, "step": 2650 }, { "epoch": 3.02, "eval_accuracy": 0.9726707443113468, "eval_f1": 0.9698335610359304, "eval_loss": 0.09072472155094147, "eval_precision": 0.9681439891689563, "eval_recall": 0.9715290403788136, "eval_runtime": 2.1224, "eval_samples_per_second": 779.321, "eval_steps_per_second": 49.002, "step": 2700 }, { "epoch": 3.07, "eval_accuracy": 0.9726707443113468, "eval_f1": 0.9696003189474732, "eval_loss": 0.09210502356290817, "eval_precision": 0.9674018974124385, "eval_recall": 0.9718087550698288, "eval_runtime": 2.138, "eval_samples_per_second": 773.607, "eval_steps_per_second": 48.643, "step": 2750 }, { "epoch": 3.13, "eval_accuracy": 0.9726876874332865, "eval_f1": 0.9699822486387298, "eval_loss": 0.09258724749088287, "eval_precision": 0.9683212870597137, "eval_recall": 0.9716489181035344, "eval_runtime": 2.133, "eval_samples_per_second": 775.419, "eval_steps_per_second": 48.757, "step": 2800 }, { "epoch": 3.18, "eval_accuracy": 0.97251825621389, "eval_f1": 0.9694595618284392, "eval_loss": 0.0923946425318718, "eval_precision": 0.9672998508204873, "eval_recall": 0.9716289384827476, "eval_runtime": 2.1344, "eval_samples_per_second": 774.911, "eval_steps_per_second": 48.725, "step": 2850 }, { "epoch": 3.24, "eval_accuracy": 0.9721624506531573, "eval_f1": 0.9694086198469933, "eval_loss": 0.09172414243221283, "eval_precision": 0.967912201728877, "eval_recall": 0.9709096721344229, "eval_runtime": 2.252, "eval_samples_per_second": 734.459, "eval_steps_per_second": 46.181, "step": 2900 }, { "epoch": 3.3, "eval_accuracy": 0.9729248911404416, "eval_f1": 0.9698389283151264, "eval_loss": 0.09304258227348328, "eval_precision": 0.967659168208127, "eval_recall": 0.9720285308984835, "eval_runtime": 2.138, "eval_samples_per_second": 773.613, "eval_steps_per_second": 48.643, "step": 2950 }, { "epoch": 3.35, "learning_rate": 8.100558659217877e-06, "loss": 0.0401, "step": 3000 }, { "epoch": 3.35, "eval_accuracy": 0.9726199149455279, "eval_f1": 0.9696093196756466, "eval_loss": 0.09338225424289703, "eval_precision": 0.9680740888269269, "eval_recall": 0.9711494275838645, "eval_runtime": 2.1217, "eval_samples_per_second": 779.556, "eval_steps_per_second": 49.017, "step": 3000 }, { "epoch": 3.41, "eval_accuracy": 0.9726029718235882, "eval_f1": 0.9700723011717777, "eval_loss": 0.0939800962805748, "eval_precision": 0.9684015610066901, "eval_recall": 0.9717488162074683, "eval_runtime": 2.1338, "eval_samples_per_second": 775.131, "eval_steps_per_second": 48.739, "step": 3050 }, { "epoch": 3.46, "eval_accuracy": 0.9725860287016486, "eval_f1": 0.9697096594081518, "eval_loss": 0.0932546854019165, "eval_precision": 0.9678375957806747, "eval_recall": 0.971588979241174, "eval_runtime": 2.1338, "eval_samples_per_second": 775.149, "eval_steps_per_second": 48.74, "step": 3100 }, { "epoch": 3.52, "eval_accuracy": 0.9730096067501398, "eval_f1": 0.970347393303478, "eval_loss": 0.09254217892885208, "eval_precision": 0.968810993825931, "eval_recall": 0.9718886735529759, "eval_runtime": 2.1334, "eval_samples_per_second": 775.292, "eval_steps_per_second": 48.749, "step": 3150 }, { "epoch": 3.58, "eval_accuracy": 0.9728740617746225, "eval_f1": 0.9700208368643012, "eval_loss": 0.0929267629981041, "eval_precision": 0.9680808724030885, "eval_recall": 0.9719685920361232, "eval_runtime": 2.1261, "eval_samples_per_second": 777.96, "eval_steps_per_second": 48.916, "step": 3200 }, { "epoch": 3.63, "eval_accuracy": 0.9730096067501398, "eval_f1": 0.970106690597268, "eval_loss": 0.09258970618247986, "eval_precision": 0.9682915663130237, "eval_recall": 0.9719286327945496, "eval_runtime": 2.1319, "eval_samples_per_second": 775.827, "eval_steps_per_second": 48.782, "step": 3250 }, { "epoch": 3.69, "eval_accuracy": 0.9729587773843208, "eval_f1": 0.9697857790803154, "eval_loss": 0.09318643063306808, "eval_precision": 0.9677117733656945, "eval_recall": 0.9718686939321892, "eval_runtime": 2.1448, "eval_samples_per_second": 771.163, "eval_steps_per_second": 48.489, "step": 3300 }, { "epoch": 3.74, "eval_accuracy": 0.9721455075312178, "eval_f1": 0.9693965087281795, "eval_loss": 0.09343180060386658, "eval_precision": 0.967967489392219, "eval_recall": 0.9708297536512757, "eval_runtime": 2.1975, "eval_samples_per_second": 752.673, "eval_steps_per_second": 47.326, "step": 3350 }, { "epoch": 3.8, "eval_accuracy": 0.9727893461649243, "eval_f1": 0.9701992699419543, "eval_loss": 0.09262708574533463, "eval_precision": 0.9686149556905307, "eval_recall": 0.971788775449042, "eval_runtime": 2.1286, "eval_samples_per_second": 777.052, "eval_steps_per_second": 48.859, "step": 3400 }, { "epoch": 3.85, "eval_accuracy": 0.9730943223598381, "eval_f1": 0.9702263436035498, "eval_loss": 0.09267932176589966, "eval_precision": 0.9684109954417882, "eval_recall": 0.9720485105192703, "eval_runtime": 2.2372, "eval_samples_per_second": 739.323, "eval_steps_per_second": 46.487, "step": 3450 }, { "epoch": 3.91, "learning_rate": 1.11731843575419e-06, "loss": 0.0345, "step": 3500 }, { "epoch": 3.91, "eval_accuracy": 0.9730773792378984, "eval_f1": 0.9700788657686671, "eval_loss": 0.09281700849533081, "eval_precision": 0.9681964733511125, "eval_recall": 0.9719685920361232, "eval_runtime": 2.1359, "eval_samples_per_second": 774.388, "eval_steps_per_second": 48.692, "step": 3500 }, { "epoch": 3.97, "eval_accuracy": 0.9729926636282001, "eval_f1": 0.9700680000797655, "eval_loss": 0.09279671311378479, "eval_precision": 0.9682144776386761, "eval_recall": 0.9719286327945496, "eval_runtime": 2.134, "eval_samples_per_second": 775.061, "eval_steps_per_second": 48.734, "step": 3550 }, { "epoch": 4.0, "step": 3580, "total_flos": 191596914718944.0, "train_loss": 0.09616074821802491, "train_runtime": 221.8255, "train_samples_per_second": 257.951, "train_steps_per_second": 16.139 } ], "max_steps": 3580, "num_train_epochs": 4, "total_flos": 191596914718944.0, "trial_name": null, "trial_params": null }