{ "best_metric": null, "best_model_checkpoint": null, "epoch": 86.0, "global_step": 2752, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, "eval_accuracy": 0.6175584724649537, "eval_f1": 0.0769764216366158, "eval_loss": 1.250605583190918, "eval_precision": 0.06442251886244922, "eval_recall": 0.09560723514211886, "eval_runtime": 3.5402, "eval_samples_per_second": 26.553, "eval_steps_per_second": 3.39, "step": 32 }, { "epoch": 2.0, "eval_accuracy": 0.6520655932770609, "eval_f1": 0.18170731707317075, "eval_loss": 1.0688396692276, "eval_precision": 0.14063237376120813, "eval_recall": 0.2566752799310939, "eval_runtime": 3.2469, "eval_samples_per_second": 28.95, "eval_steps_per_second": 3.696, "step": 64 }, { "epoch": 3.0, "eval_accuracy": 0.733239132859852, "eval_f1": 0.26462128475551294, "eval_loss": 0.8916715383529663, "eval_precision": 0.21036585365853658, "eval_recall": 0.35658914728682173, "eval_runtime": 3.5217, "eval_samples_per_second": 26.692, "eval_steps_per_second": 3.407, "step": 96 }, { "epoch": 4.0, "eval_accuracy": 0.7502695868813446, "eval_f1": 0.31227821149751595, "eval_loss": 0.8893136382102966, "eval_precision": 0.2655401327700664, "eval_recall": 0.3789836347975883, "eval_runtime": 3.1549, "eval_samples_per_second": 29.795, "eval_steps_per_second": 3.804, "step": 128 }, { "epoch": 5.0, "eval_accuracy": 0.7515338563938572, "eval_f1": 0.3259361997226075, "eval_loss": 0.8177661299705505, "eval_precision": 0.2727800348229832, "eval_recall": 0.40482342807924204, "eval_runtime": 3.1577, "eval_samples_per_second": 29.768, "eval_steps_per_second": 3.8, "step": 160 }, { "epoch": 6.0, "eval_accuracy": 0.7685271260179228, "eval_f1": 0.3471241170534813, "eval_loss": 0.818898618221283, "eval_precision": 0.2847682119205298, "eval_recall": 0.4444444444444444, "eval_runtime": 3.5275, "eval_samples_per_second": 26.648, "eval_steps_per_second": 3.402, "step": 192 }, { "epoch": 7.0, "eval_accuracy": 0.7693451827613134, "eval_f1": 0.39416058394160586, "eval_loss": 0.8939387798309326, "eval_precision": 0.34198860037998735, "eval_recall": 0.46511627906976744, "eval_runtime": 4.3875, "eval_samples_per_second": 21.424, "eval_steps_per_second": 2.735, "step": 224 }, { "epoch": 8.0, "eval_accuracy": 0.7565537500464805, "eval_f1": 0.3823943661971831, "eval_loss": 0.8892739415168762, "eval_precision": 0.323406789755807, "eval_recall": 0.46770025839793283, "eval_runtime": 3.5968, "eval_samples_per_second": 26.135, "eval_steps_per_second": 3.336, "step": 256 }, { "epoch": 9.0, "eval_accuracy": 0.7693451827613134, "eval_f1": 0.41654247391952315, "eval_loss": 0.9633013010025024, "eval_precision": 0.3670387393302692, "eval_recall": 0.48148148148148145, "eval_runtime": 3.1245, "eval_samples_per_second": 30.085, "eval_steps_per_second": 3.841, "step": 288 }, { "epoch": 10.0, "eval_accuracy": 0.765478005428922, "eval_f1": 0.3988900450919181, "eval_loss": 0.9256911873817444, "eval_precision": 0.3339140534262485, "eval_recall": 0.49526270456503013, "eval_runtime": 3.0684, "eval_samples_per_second": 30.635, "eval_steps_per_second": 3.911, "step": 320 }, { "epoch": 11.0, "eval_accuracy": 0.7651061614546536, "eval_f1": 0.4374537379718727, "eval_loss": 1.0472618341445923, "eval_precision": 0.3835171966255678, "eval_recall": 0.5090439276485789, "eval_runtime": 15.8515, "eval_samples_per_second": 5.93, "eval_steps_per_second": 0.757, "step": 352 }, { "epoch": 12.0, "eval_accuracy": 0.7513107500092961, "eval_f1": 0.4116819141449683, "eval_loss": 1.0901930332183838, "eval_precision": 0.34800713860797144, "eval_recall": 0.5038759689922481, "eval_runtime": 3.3377, "eval_samples_per_second": 28.163, "eval_steps_per_second": 3.595, "step": 384 }, { "epoch": 13.0, "eval_accuracy": 0.7735842040679731, "eval_f1": 0.4424198250728863, "eval_loss": 1.0164769887924194, "eval_precision": 0.38344914718888184, "eval_recall": 0.5228251507321274, "eval_runtime": 3.1559, "eval_samples_per_second": 29.785, "eval_steps_per_second": 3.802, "step": 416 }, { "epoch": 14.0, "eval_accuracy": 0.7737329416576805, "eval_f1": 0.46205860255447034, "eval_loss": 1.0768243074417114, "eval_precision": 0.4097268487674883, "eval_recall": 0.5297157622739018, "eval_runtime": 3.0915, "eval_samples_per_second": 30.406, "eval_steps_per_second": 3.882, "step": 448 }, { "epoch": 15.0, "eval_accuracy": 0.7817647715018778, "eval_f1": 0.4762264150943396, "eval_loss": 1.1149170398712158, "eval_precision": 0.4237743451981195, "eval_recall": 0.5434969853574505, "eval_runtime": 3.2505, "eval_samples_per_second": 28.919, "eval_steps_per_second": 3.692, "step": 480 }, { "epoch": 15.62, "learning_rate": 1.6875e-05, "loss": 0.4087, "step": 500 }, { "epoch": 16.0, "eval_accuracy": 0.7796452608485479, "eval_f1": 0.4698749526335733, "eval_loss": 1.1298694610595703, "eval_precision": 0.41948579161028415, "eval_recall": 0.5340223944875108, "eval_runtime": 3.0471, "eval_samples_per_second": 30.849, "eval_steps_per_second": 3.938, "step": 512 }, { "epoch": 17.0, "eval_accuracy": 0.7883464098464285, "eval_f1": 0.4673040152963671, "eval_loss": 1.1149996519088745, "eval_precision": 0.4202200825309491, "eval_recall": 0.5262704565030146, "eval_runtime": 3.1689, "eval_samples_per_second": 29.664, "eval_steps_per_second": 3.787, "step": 544 }, { "epoch": 18.0, "eval_accuracy": 0.7801286580150969, "eval_f1": 0.45127436281859074, "eval_loss": 1.1859441995620728, "eval_precision": 0.39946914399469147, "eval_recall": 0.5185185185185185, "eval_runtime": 7.3417, "eval_samples_per_second": 12.803, "eval_steps_per_second": 1.634, "step": 576 }, { "epoch": 19.0, "eval_accuracy": 0.7609043245454208, "eval_f1": 0.4414210128495843, "eval_loss": 1.2266000509262085, "eval_precision": 0.39326599326599326, "eval_recall": 0.5030146425495263, "eval_runtime": 3.4668, "eval_samples_per_second": 27.114, "eval_steps_per_second": 3.461, "step": 608 }, { "epoch": 20.0, "eval_accuracy": 0.7837355445655003, "eval_f1": 0.4707198806415516, "eval_loss": 1.1946580410003662, "eval_precision": 0.4151315789473684, "eval_recall": 0.5434969853574505, "eval_runtime": 3.1596, "eval_samples_per_second": 29.75, "eval_steps_per_second": 3.798, "step": 640 }, { "epoch": 21.0, "eval_accuracy": 0.7890900977949652, "eval_f1": 0.4974698326196964, "eval_loss": 1.2461358308792114, "eval_precision": 0.4538352272727273, "eval_recall": 0.5503875968992248, "eval_runtime": 3.1747, "eval_samples_per_second": 29.609, "eval_steps_per_second": 3.78, "step": 672 }, { "epoch": 22.0, "eval_accuracy": 0.7804261331945116, "eval_f1": 0.4870506378044067, "eval_loss": 1.2504911422729492, "eval_precision": 0.4417952314165498, "eval_recall": 0.5426356589147286, "eval_runtime": 3.1491, "eval_samples_per_second": 29.849, "eval_steps_per_second": 3.811, "step": 704 }, { "epoch": 23.0, "eval_accuracy": 0.7844420481166102, "eval_f1": 0.4932249322493225, "eval_loss": 1.287372350692749, "eval_precision": 0.4479606188466948, "eval_recall": 0.5486649440137812, "eval_runtime": 3.7236, "eval_samples_per_second": 25.244, "eval_steps_per_second": 3.223, "step": 736 }, { "epoch": 24.0, "eval_accuracy": 0.7877886438850259, "eval_f1": 0.49941107184923444, "eval_loss": 1.277133584022522, "eval_precision": 0.4588744588744589, "eval_recall": 0.5478036175710594, "eval_runtime": 3.2052, "eval_samples_per_second": 29.328, "eval_steps_per_second": 3.744, "step": 768 }, { "epoch": 25.0, "eval_accuracy": 0.7892760197820994, "eval_f1": 0.4747201852566576, "eval_loss": 1.2719131708145142, "eval_precision": 0.43006993006993005, "eval_recall": 0.5297157622739018, "eval_runtime": 3.0524, "eval_samples_per_second": 30.795, "eval_steps_per_second": 3.931, "step": 800 }, { "epoch": 26.0, "eval_accuracy": 0.7896478637563679, "eval_f1": 0.49407265774378584, "eval_loss": 1.2584308385849, "eval_precision": 0.4442916093535076, "eval_recall": 0.5564168819982773, "eval_runtime": 3.7701, "eval_samples_per_second": 24.933, "eval_steps_per_second": 3.183, "step": 832 }, { "epoch": 27.0, "eval_accuracy": 0.7868590339493549, "eval_f1": 0.4920077972709551, "eval_loss": 1.3040637969970703, "eval_precision": 0.4494301994301994, "eval_recall": 0.5434969853574505, "eval_runtime": 3.4169, "eval_samples_per_second": 27.51, "eval_steps_per_second": 3.512, "step": 864 }, { "epoch": 28.0, "eval_accuracy": 0.7880861190644406, "eval_f1": 0.4916158536585366, "eval_loss": 1.3579275608062744, "eval_precision": 0.4408749145591251, "eval_recall": 0.5555555555555556, "eval_runtime": 3.4487, "eval_samples_per_second": 27.256, "eval_steps_per_second": 3.48, "step": 896 }, { "epoch": 29.0, "eval_accuracy": 0.7839958353474882, "eval_f1": 0.501557632398754, "eval_loss": 1.3749990463256836, "eval_precision": 0.4577114427860697, "eval_recall": 0.5546942291128337, "eval_runtime": 3.131, "eval_samples_per_second": 30.022, "eval_steps_per_second": 3.833, "step": 928 }, { "epoch": 30.0, "eval_accuracy": 0.7871936935261964, "eval_f1": 0.4903883876029816, "eval_loss": 1.3733103275299072, "eval_precision": 0.45028818443804036, "eval_recall": 0.5383290267011197, "eval_runtime": 3.4968, "eval_samples_per_second": 26.882, "eval_steps_per_second": 3.432, "step": 960 }, { "epoch": 31.0, "eval_accuracy": 0.7819135090915852, "eval_f1": 0.5099260412611912, "eval_loss": 1.395755410194397, "eval_precision": 0.46519886363636365, "eval_recall": 0.5641688199827735, "eval_runtime": 3.2027, "eval_samples_per_second": 29.351, "eval_steps_per_second": 3.747, "step": 992 }, { "epoch": 31.25, "learning_rate": 1.375e-05, "loss": 0.0138, "step": 1000 }, { "epoch": 32.0, "eval_accuracy": 0.7822481686684267, "eval_f1": 0.49709639953542384, "eval_loss": 1.4415804147720337, "eval_precision": 0.45147679324894513, "eval_recall": 0.5529715762273901, "eval_runtime": 3.081, "eval_samples_per_second": 30.51, "eval_steps_per_second": 3.895, "step": 1024 }, { "epoch": 33.0, "eval_accuracy": 0.7877886438850259, "eval_f1": 0.49035187287173665, "eval_loss": 1.384263277053833, "eval_precision": 0.43724696356275305, "eval_recall": 0.5581395348837209, "eval_runtime": 3.7036, "eval_samples_per_second": 25.381, "eval_steps_per_second": 3.24, "step": 1056 }, { "epoch": 34.0, "eval_accuracy": 0.7796080764511211, "eval_f1": 0.490521327014218, "eval_loss": 1.4162341356277466, "eval_precision": 0.45295404814004375, "eval_recall": 0.5348837209302325, "eval_runtime": 3.1016, "eval_samples_per_second": 30.307, "eval_steps_per_second": 3.869, "step": 1088 }, { "epoch": 35.0, "eval_accuracy": 0.7906146580894656, "eval_f1": 0.5060240963855421, "eval_loss": 1.380549669265747, "eval_precision": 0.46104815864022664, "eval_recall": 0.5607235142118863, "eval_runtime": 3.5552, "eval_samples_per_second": 26.44, "eval_steps_per_second": 3.375, "step": 1120 }, { "epoch": 36.0, "eval_accuracy": 0.7868590339493549, "eval_f1": 0.4811210587777345, "eval_loss": 1.4221726655960083, "eval_precision": 0.43892045454545453, "eval_recall": 0.5322997416020672, "eval_runtime": 3.1728, "eval_samples_per_second": 29.627, "eval_steps_per_second": 3.782, "step": 1152 }, { "epoch": 37.0, "eval_accuracy": 0.7899453389357826, "eval_f1": 0.502147598594299, "eval_loss": 1.407759189605713, "eval_precision": 0.4592857142857143, "eval_recall": 0.553832902670112, "eval_runtime": 3.1234, "eval_samples_per_second": 30.096, "eval_steps_per_second": 3.842, "step": 1184 }, { "epoch": 38.0, "eval_accuracy": 0.7908377644740266, "eval_f1": 0.4872389791183295, "eval_loss": 1.4327783584594727, "eval_precision": 0.4421052631578947, "eval_recall": 0.5426356589147286, "eval_runtime": 3.409, "eval_samples_per_second": 27.574, "eval_steps_per_second": 3.52, "step": 1216 }, { "epoch": 39.0, "eval_accuracy": 0.7851113672702934, "eval_f1": 0.4913227921326649, "eval_loss": 1.4441440105438232, "eval_precision": 0.4448324022346369, "eval_recall": 0.5486649440137812, "eval_runtime": 3.2678, "eval_samples_per_second": 28.766, "eval_steps_per_second": 3.672, "step": 1248 }, { "epoch": 40.0, "eval_accuracy": 0.7912839772431488, "eval_f1": 0.5036864571206829, "eval_loss": 1.4089561700820923, "eval_precision": 0.4583333333333333, "eval_recall": 0.5590008613264428, "eval_runtime": 3.1449, "eval_samples_per_second": 29.89, "eval_steps_per_second": 3.816, "step": 1280 }, { "epoch": 41.0, "eval_accuracy": 0.7902428141151973, "eval_f1": 0.503858024691358, "eval_loss": 1.4232546091079712, "eval_precision": 0.45632424877707894, "eval_recall": 0.5624461670973299, "eval_runtime": 8.2173, "eval_samples_per_second": 11.439, "eval_steps_per_second": 1.46, "step": 1312 }, { "epoch": 42.0, "eval_accuracy": 0.7909493176663073, "eval_f1": 0.49484536082474234, "eval_loss": 1.4232605695724487, "eval_precision": 0.4444444444444444, "eval_recall": 0.5581395348837209, "eval_runtime": 3.0349, "eval_samples_per_second": 30.973, "eval_steps_per_second": 3.954, "step": 1344 }, { "epoch": 43.0, "eval_accuracy": 0.7923995091659539, "eval_f1": 0.5162324649298597, "eval_loss": 1.4146913290023804, "eval_precision": 0.4827586206896552, "eval_recall": 0.5546942291128337, "eval_runtime": 3.288, "eval_samples_per_second": 28.589, "eval_steps_per_second": 3.65, "step": 1376 }, { "epoch": 44.0, "eval_accuracy": 0.7880117502695869, "eval_f1": 0.4955684007707129, "eval_loss": 1.4241943359375, "eval_precision": 0.44839609483960946, "eval_recall": 0.553832902670112, "eval_runtime": 6.1717, "eval_samples_per_second": 15.231, "eval_steps_per_second": 1.944, "step": 1408 }, { "epoch": 45.0, "eval_accuracy": 0.7880861190644406, "eval_f1": 0.49018853405155827, "eval_loss": 1.421156644821167, "eval_precision": 0.4429763560500695, "eval_recall": 0.5486649440137812, "eval_runtime": 3.1226, "eval_samples_per_second": 30.103, "eval_steps_per_second": 3.843, "step": 1440 }, { "epoch": 46.0, "eval_accuracy": 0.7936637786784665, "eval_f1": 0.5089463220675944, "eval_loss": 1.424131989479065, "eval_precision": 0.4726735598227474, "eval_recall": 0.5512489233419466, "eval_runtime": 3.3347, "eval_samples_per_second": 28.189, "eval_steps_per_second": 3.599, "step": 1472 }, { "epoch": 46.88, "learning_rate": 1.0625e-05, "loss": 0.0034, "step": 1500 }, { "epoch": 47.0, "eval_accuracy": 0.7858550552188301, "eval_f1": 0.5065398335315101, "eval_loss": 1.443221926689148, "eval_precision": 0.46916299559471364, "eval_recall": 0.5503875968992248, "eval_runtime": 3.0632, "eval_samples_per_second": 30.687, "eval_steps_per_second": 3.917, "step": 1504 }, { "epoch": 48.0, "eval_accuracy": 0.784739523296025, "eval_f1": 0.49553398058252424, "eval_loss": 1.4684823751449585, "eval_precision": 0.4512022630834512, "eval_recall": 0.549526270456503, "eval_runtime": 3.2701, "eval_samples_per_second": 28.745, "eval_steps_per_second": 3.67, "step": 1536 }, { "epoch": 49.0, "eval_accuracy": 0.7949280481909791, "eval_f1": 0.5152113789016199, "eval_loss": 1.4661859273910522, "eval_precision": 0.4759124087591241, "eval_recall": 0.5615848406546081, "eval_runtime": 3.3592, "eval_samples_per_second": 27.983, "eval_steps_per_second": 3.572, "step": 1568 }, { "epoch": 50.0, "eval_accuracy": 0.7894619417692337, "eval_f1": 0.506033476060724, "eval_loss": 1.5200412273406982, "eval_precision": 0.4616477272727273, "eval_recall": 0.5598621877691645, "eval_runtime": 3.1539, "eval_samples_per_second": 29.805, "eval_steps_per_second": 3.805, "step": 1600 }, { "epoch": 51.0, "eval_accuracy": 0.7907262112817461, "eval_f1": 0.5102848101265823, "eval_loss": 1.49446702003479, "eval_precision": 0.4718361375274323, "eval_recall": 0.5555555555555556, "eval_runtime": 6.9973, "eval_samples_per_second": 13.434, "eval_steps_per_second": 1.715, "step": 1632 }, { "epoch": 52.0, "eval_accuracy": 0.7916558212174172, "eval_f1": 0.5182511030886483, "eval_loss": 1.5040817260742188, "eval_precision": 0.484984984984985, "eval_recall": 0.5564168819982773, "eval_runtime": 8.0818, "eval_samples_per_second": 11.631, "eval_steps_per_second": 1.485, "step": 1664 }, { "epoch": 53.0, "eval_accuracy": 0.7928829063325029, "eval_f1": 0.5159489633173845, "eval_loss": 1.5629594326019287, "eval_precision": 0.4803266518188567, "eval_recall": 0.5572782084409992, "eval_runtime": 3.423, "eval_samples_per_second": 27.462, "eval_steps_per_second": 3.506, "step": 1696 }, { "epoch": 54.0, "eval_accuracy": 0.7840702041423419, "eval_f1": 0.5010117361392149, "eval_loss": 1.5059171915054321, "eval_precision": 0.4725190839694656, "eval_recall": 0.533161068044789, "eval_runtime": 3.1466, "eval_samples_per_second": 29.874, "eval_steps_per_second": 3.814, "step": 1728 }, { "epoch": 55.0, "eval_accuracy": 0.790763395679173, "eval_f1": 0.5078616352201258, "eval_loss": 1.5826448202133179, "eval_precision": 0.4671005061460593, "eval_recall": 0.5564168819982773, "eval_runtime": 3.1003, "eval_samples_per_second": 30.319, "eval_steps_per_second": 3.871, "step": 1760 }, { "epoch": 56.0, "eval_accuracy": 0.791246792845722, "eval_f1": 0.520757758968158, "eval_loss": 1.5211557149887085, "eval_precision": 0.4893939393939394, "eval_recall": 0.5564168819982773, "eval_runtime": 3.5151, "eval_samples_per_second": 26.742, "eval_steps_per_second": 3.414, "step": 1792 }, { "epoch": 57.0, "eval_accuracy": 0.7894619417692337, "eval_f1": 0.5172550575168584, "eval_loss": 1.5194625854492188, "eval_precision": 0.47941176470588237, "eval_recall": 0.5615848406546081, "eval_runtime": 3.1721, "eval_samples_per_second": 29.634, "eval_steps_per_second": 3.783, "step": 1824 }, { "epoch": 58.0, "eval_accuracy": 0.7864871899750865, "eval_f1": 0.5015600624024961, "eval_loss": 1.5568981170654297, "eval_precision": 0.45830363506771205, "eval_recall": 0.553832902670112, "eval_runtime": 3.0367, "eval_samples_per_second": 30.954, "eval_steps_per_second": 3.952, "step": 1856 }, { "epoch": 59.0, "eval_accuracy": 0.789610679358941, "eval_f1": 0.5186953062848051, "eval_loss": 1.5378462076187134, "eval_precision": 0.4818920916481892, "eval_recall": 0.5615848406546081, "eval_runtime": 3.0368, "eval_samples_per_second": 30.954, "eval_steps_per_second": 3.952, "step": 1888 }, { "epoch": 60.0, "eval_accuracy": 0.7838842821552077, "eval_f1": 0.490257209664848, "eval_loss": 1.5430467128753662, "eval_precision": 0.44768683274021354, "eval_recall": 0.5417743324720069, "eval_runtime": 3.2599, "eval_samples_per_second": 28.835, "eval_steps_per_second": 3.681, "step": 1920 }, { "epoch": 61.0, "eval_accuracy": 0.7890529133975384, "eval_f1": 0.5021816739389131, "eval_loss": 1.5567139387130737, "eval_precision": 0.46544117647058825, "eval_recall": 0.5452196382428941, "eval_runtime": 3.4648, "eval_samples_per_second": 27.13, "eval_steps_per_second": 3.463, "step": 1952 }, { "epoch": 62.0, "eval_accuracy": 0.7909865020637341, "eval_f1": 0.5128824476650564, "eval_loss": 1.5516618490219116, "eval_precision": 0.48148148148148145, "eval_recall": 0.5486649440137812, "eval_runtime": 3.3346, "eval_samples_per_second": 28.19, "eval_steps_per_second": 3.599, "step": 1984 }, { "epoch": 62.5, "learning_rate": 7.500000000000001e-06, "loss": 0.0017, "step": 2000 }, { "epoch": 63.0, "eval_accuracy": 0.7902056297177704, "eval_f1": 0.508203281312525, "eval_loss": 1.5522751808166504, "eval_precision": 0.47458893871449925, "eval_recall": 0.5469422911283376, "eval_runtime": 3.095, "eval_samples_per_second": 30.372, "eval_steps_per_second": 3.877, "step": 2016 }, { "epoch": 64.0, "eval_accuracy": 0.787044955936489, "eval_f1": 0.4970691676436107, "eval_loss": 1.5659950971603394, "eval_precision": 0.45493562231759654, "eval_recall": 0.5478036175710594, "eval_runtime": 3.7257, "eval_samples_per_second": 25.23, "eval_steps_per_second": 3.221, "step": 2048 }, { "epoch": 65.0, "eval_accuracy": 0.791246792845722, "eval_f1": 0.5023219814241486, "eval_loss": 1.5194514989852905, "eval_precision": 0.4560787069571328, "eval_recall": 0.5590008613264428, "eval_runtime": 3.1193, "eval_samples_per_second": 30.135, "eval_steps_per_second": 3.847, "step": 2080 }, { "epoch": 66.0, "eval_accuracy": 0.7909493176663073, "eval_f1": 0.504884720593982, "eval_loss": 1.5329976081848145, "eval_precision": 0.46208869814020026, "eval_recall": 0.5564168819982773, "eval_runtime": 3.2791, "eval_samples_per_second": 28.666, "eval_steps_per_second": 3.66, "step": 2112 }, { "epoch": 67.0, "eval_accuracy": 0.7897222325512215, "eval_f1": 0.5118296529968455, "eval_loss": 1.5393718481063843, "eval_precision": 0.472, "eval_recall": 0.5590008613264428, "eval_runtime": 3.3565, "eval_samples_per_second": 28.006, "eval_steps_per_second": 3.575, "step": 2144 }, { "epoch": 68.0, "eval_accuracy": 0.7929572751273566, "eval_f1": 0.5202220459952419, "eval_loss": 1.5860378742218018, "eval_precision": 0.4819985304922851, "eval_recall": 0.5650301464254953, "eval_runtime": 3.0372, "eval_samples_per_second": 30.949, "eval_steps_per_second": 3.951, "step": 2176 }, { "epoch": 69.0, "eval_accuracy": 0.7916186368199903, "eval_f1": 0.5208667736757624, "eval_loss": 1.622610092163086, "eval_precision": 0.48760330578512395, "eval_recall": 0.5590008613264428, "eval_runtime": 3.1363, "eval_samples_per_second": 29.972, "eval_steps_per_second": 3.826, "step": 2208 }, { "epoch": 70.0, "eval_accuracy": 0.7935150410887591, "eval_f1": 0.5205158264947246, "eval_loss": 1.613077163696289, "eval_precision": 0.47639484978540775, "eval_recall": 0.5736434108527132, "eval_runtime": 3.4181, "eval_samples_per_second": 27.501, "eval_steps_per_second": 3.511, "step": 2240 }, { "epoch": 71.0, "eval_accuracy": 0.7962666864983453, "eval_f1": 0.5341365461847388, "eval_loss": 1.617754340171814, "eval_precision": 0.5003762227238525, "eval_recall": 0.5727820844099913, "eval_runtime": 3.9965, "eval_samples_per_second": 23.521, "eval_steps_per_second": 3.003, "step": 2272 }, { "epoch": 72.0, "eval_accuracy": 0.7960063957163575, "eval_f1": 0.5309876049580169, "eval_loss": 1.6110599040985107, "eval_precision": 0.4955223880597015, "eval_recall": 0.5719207579672696, "eval_runtime": 3.0526, "eval_samples_per_second": 30.794, "eval_steps_per_second": 3.931, "step": 2304 }, { "epoch": 73.0, "eval_accuracy": 0.7905774736920388, "eval_f1": 0.5087025316455697, "eval_loss": 1.5602927207946777, "eval_precision": 0.4703730797366496, "eval_recall": 0.553832902670112, "eval_runtime": 3.378, "eval_samples_per_second": 27.827, "eval_steps_per_second": 3.552, "step": 2336 }, { "epoch": 74.0, "eval_accuracy": 0.7928085375376492, "eval_f1": 0.5181962025316456, "eval_loss": 1.555016040802002, "eval_precision": 0.479151426481346, "eval_recall": 0.5641688199827735, "eval_runtime": 3.0403, "eval_samples_per_second": 30.918, "eval_steps_per_second": 3.947, "step": 2368 }, { "epoch": 75.0, "eval_accuracy": 0.7963782396906258, "eval_f1": 0.5212933753943217, "eval_loss": 1.5542960166931152, "eval_precision": 0.4807272727272727, "eval_recall": 0.5693367786391043, "eval_runtime": 3.1539, "eval_samples_per_second": 29.805, "eval_steps_per_second": 3.805, "step": 2400 }, { "epoch": 76.0, "eval_accuracy": 0.7952998921652474, "eval_f1": 0.5285996055226825, "eval_loss": 1.560102939605713, "eval_precision": 0.487627365356623, "eval_recall": 0.5770887166236004, "eval_runtime": 3.3272, "eval_samples_per_second": 28.252, "eval_steps_per_second": 3.607, "step": 2432 }, { "epoch": 77.0, "eval_accuracy": 0.7926597999479419, "eval_f1": 0.5247999999999999, "eval_loss": 1.559518575668335, "eval_precision": 0.4899178491411501, "eval_recall": 0.5650301464254953, "eval_runtime": 3.1588, "eval_samples_per_second": 29.758, "eval_steps_per_second": 3.799, "step": 2464 }, { "epoch": 78.0, "eval_accuracy": 0.7940356226527349, "eval_f1": 0.533066132264529, "eval_loss": 1.5632045269012451, "eval_precision": 0.4985007496251874, "eval_recall": 0.5727820844099913, "eval_runtime": 3.5803, "eval_samples_per_second": 26.255, "eval_steps_per_second": 3.352, "step": 2496 }, { "epoch": 78.12, "learning_rate": 4.3750000000000005e-06, "loss": 0.0011, "step": 2500 }, { "epoch": 79.0, "eval_accuracy": 0.7931431971144908, "eval_f1": 0.5266084193804608, "eval_loss": 1.5693398714065552, "eval_precision": 0.4885777450257922, "eval_recall": 0.5710594315245479, "eval_runtime": 3.2284, "eval_samples_per_second": 29.117, "eval_steps_per_second": 3.717, "step": 2528 }, { "epoch": 80.0, "eval_accuracy": 0.7927341687427956, "eval_f1": 0.5263575108997226, "eval_loss": 1.5728816986083984, "eval_precision": 0.48751835535976507, "eval_recall": 0.5719207579672696, "eval_runtime": 3.0942, "eval_samples_per_second": 30.38, "eval_steps_per_second": 3.878, "step": 2560 }, { "epoch": 81.0, "eval_accuracy": 0.7929200907299297, "eval_f1": 0.5305313243457573, "eval_loss": 1.5773258209228516, "eval_precision": 0.49155033063923587, "eval_recall": 0.5762273901808785, "eval_runtime": 3.5248, "eval_samples_per_second": 26.668, "eval_steps_per_second": 3.404, "step": 2592 }, { "epoch": 82.0, "eval_accuracy": 0.7932919347041981, "eval_f1": 0.5318382058470164, "eval_loss": 1.579202651977539, "eval_precision": 0.49700598802395207, "eval_recall": 0.5719207579672696, "eval_runtime": 3.0984, "eval_samples_per_second": 30.338, "eval_steps_per_second": 3.873, "step": 2624 }, { "epoch": 83.0, "eval_accuracy": 0.793329119101625, "eval_f1": 0.5278780585639792, "eval_loss": 1.58578622341156, "eval_precision": 0.493993993993994, "eval_recall": 0.5667527993109388, "eval_runtime": 3.0353, "eval_samples_per_second": 30.969, "eval_steps_per_second": 3.954, "step": 2656 }, { "epoch": 84.0, "eval_accuracy": 0.7925110623582344, "eval_f1": 0.528965241709948, "eval_loss": 1.584820032119751, "eval_precision": 0.4932935916542474, "eval_recall": 0.570198105081826, "eval_runtime": 3.3844, "eval_samples_per_second": 27.774, "eval_steps_per_second": 3.546, "step": 2688 }, { "epoch": 85.0, "eval_accuracy": 0.7922135871788197, "eval_f1": 0.5333866453418633, "eval_loss": 1.5820199251174927, "eval_precision": 0.49776119402985075, "eval_recall": 0.5745047372954349, "eval_runtime": 3.2337, "eval_samples_per_second": 29.069, "eval_steps_per_second": 3.711, "step": 2720 }, { "epoch": 86.0, "eval_accuracy": 0.7920648495891124, "eval_f1": 0.5324830609804703, "eval_loss": 1.5860569477081299, "eval_precision": 0.49554896142433236, "eval_recall": 0.5753660637381568, "eval_runtime": 3.1113, "eval_samples_per_second": 30.212, "eval_steps_per_second": 3.857, "step": 2752 } ], "max_steps": 3200, "num_train_epochs": 100, "total_flos": 1.8890572813041664e+16, "trial_name": null, "trial_params": null }