{ "best_metric": 0.3024933338165283, "best_model_checkpoint": "./Hubert-common_voice-ja-demo-roma-cosine-3e-4/checkpoint-4400", "epoch": 50.0, "eval_steps": 100, "global_step": 18800, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26595744680851063, "eval_cer": 1.6163371077245385, "eval_loss": 15.823559761047363, "eval_runtime": 210.3767, "eval_samples_per_second": 23.572, "eval_steps_per_second": 2.947, "eval_wer": 1.792498487598306, "step": 100 }, { "epoch": 0.5319148936170213, "eval_cer": 0.9276012616915579, "eval_loss": 6.4206719398498535, "eval_runtime": 221.1891, "eval_samples_per_second": 22.42, "eval_steps_per_second": 2.803, "eval_wer": 1.0, "step": 200 }, { "epoch": 0.7978723404255319, "eval_cer": 0.9276012616915579, "eval_loss": 5.419256210327148, "eval_runtime": 241.9799, "eval_samples_per_second": 20.493, "eval_steps_per_second": 2.562, "eval_wer": 1.0, "step": 300 }, { "epoch": 1.0638297872340425, "eval_cer": 0.9276012616915579, "eval_loss": 4.907326698303223, "eval_runtime": 261.1648, "eval_samples_per_second": 18.988, "eval_steps_per_second": 2.374, "eval_wer": 1.0, "step": 400 }, { "epoch": 1.3297872340425532, "grad_norm": 20.339691162109375, "learning_rate": 1.1903999999999998e-05, "loss": 7.456, "step": 500 }, { "epoch": 1.3297872340425532, "eval_cer": 0.9276012616915579, "eval_loss": 4.358646869659424, "eval_runtime": 256.9257, "eval_samples_per_second": 19.301, "eval_steps_per_second": 2.413, "eval_wer": 1.0, "step": 500 }, { "epoch": 1.5957446808510638, "eval_cer": 0.9276012616915579, "eval_loss": 3.8341214656829834, "eval_runtime": 284.7473, "eval_samples_per_second": 17.415, "eval_steps_per_second": 2.177, "eval_wer": 1.0, "step": 600 }, { "epoch": 1.8617021276595744, "eval_cer": 0.9276012616915579, "eval_loss": 3.4148387908935547, "eval_runtime": 301.2939, "eval_samples_per_second": 16.459, "eval_steps_per_second": 2.058, "eval_wer": 1.0, "step": 700 }, { "epoch": 2.127659574468085, "eval_cer": 0.9276012616915579, "eval_loss": 3.104691982269287, "eval_runtime": 236.1726, "eval_samples_per_second": 20.997, "eval_steps_per_second": 2.625, "eval_wer": 1.0, "step": 800 }, { "epoch": 2.393617021276596, "eval_cer": 0.9276012616915579, "eval_loss": 2.961205244064331, "eval_runtime": 231.5216, "eval_samples_per_second": 21.419, "eval_steps_per_second": 2.678, "eval_wer": 1.0, "step": 900 }, { "epoch": 2.6595744680851063, "grad_norm": 1.9079935550689697, "learning_rate": 2.3903999999999997e-05, "loss": 3.2563, "step": 1000 }, { "epoch": 2.6595744680851063, "eval_cer": 0.9276012616915579, "eval_loss": 2.902658700942993, "eval_runtime": 265.314, "eval_samples_per_second": 18.691, "eval_steps_per_second": 2.337, "eval_wer": 1.0, "step": 1000 }, { "epoch": 2.925531914893617, "eval_cer": 0.9276012616915579, "eval_loss": 2.876744031906128, "eval_runtime": 268.5469, "eval_samples_per_second": 18.466, "eval_steps_per_second": 2.309, "eval_wer": 1.0, "step": 1100 }, { "epoch": 3.1914893617021276, "eval_cer": 0.9276012616915579, "eval_loss": 2.8588435649871826, "eval_runtime": 250.7138, "eval_samples_per_second": 19.78, "eval_steps_per_second": 2.473, "eval_wer": 1.0, "step": 1200 }, { "epoch": 3.4574468085106385, "eval_cer": 0.9276012616915579, "eval_loss": 2.803792953491211, "eval_runtime": 253.4886, "eval_samples_per_second": 19.563, "eval_steps_per_second": 2.446, "eval_wer": 1.0, "step": 1300 }, { "epoch": 3.723404255319149, "eval_cer": 0.8359292858622536, "eval_loss": 1.9932550191879272, "eval_runtime": 266.0365, "eval_samples_per_second": 18.64, "eval_steps_per_second": 2.331, "eval_wer": 1.0, "step": 1400 }, { "epoch": 3.9893617021276597, "grad_norm": 4.3663716316223145, "learning_rate": 3.5903999999999994e-05, "loss": 2.5032, "step": 1500 }, { "epoch": 3.9893617021276597, "eval_cer": 0.38112231138141156, "eval_loss": 1.1380858421325684, "eval_runtime": 256.0779, "eval_samples_per_second": 19.365, "eval_steps_per_second": 2.421, "eval_wer": 0.9997983464408147, "step": 1500 }, { "epoch": 4.25531914893617, "eval_cer": 0.2746446118187823, "eval_loss": 0.8252492547035217, "eval_runtime": 240.6394, "eval_samples_per_second": 20.608, "eval_steps_per_second": 2.576, "eval_wer": 0.9983867715265174, "step": 1600 }, { "epoch": 4.5212765957446805, "eval_cer": 0.2507318827267859, "eval_loss": 0.6762787103652954, "eval_runtime": 212.2043, "eval_samples_per_second": 23.369, "eval_steps_per_second": 2.922, "eval_wer": 0.9973785037305909, "step": 1700 }, { "epoch": 4.787234042553192, "eval_cer": 0.24174213494783992, "eval_loss": 0.6010992527008057, "eval_runtime": 212.3652, "eval_samples_per_second": 23.351, "eval_steps_per_second": 2.919, "eval_wer": 0.9979834644081468, "step": 1800 }, { "epoch": 5.053191489361702, "eval_cer": 0.23079418558748002, "eval_loss": 0.5514463782310486, "eval_runtime": 209.5514, "eval_samples_per_second": 23.665, "eval_steps_per_second": 2.959, "eval_wer": 0.9975801572897761, "step": 1900 }, { "epoch": 5.319148936170213, "grad_norm": 2.237888813018799, "learning_rate": 4.7903999999999994e-05, "loss": 0.678, "step": 2000 }, { "epoch": 5.319148936170213, "eval_cer": 0.22485313488139397, "eval_loss": 0.5128617882728577, "eval_runtime": 210.7223, "eval_samples_per_second": 23.533, "eval_steps_per_second": 2.942, "eval_wer": 0.9985884250857028, "step": 2000 }, { "epoch": 5.585106382978723, "eval_cer": 0.23253350635340653, "eval_loss": 0.4957906901836395, "eval_runtime": 209.1903, "eval_samples_per_second": 23.706, "eval_steps_per_second": 2.964, "eval_wer": 0.994353700342811, "step": 2100 }, { "epoch": 5.851063829787234, "eval_cer": 0.21945146904204466, "eval_loss": 0.47169229388237, "eval_runtime": 208.7444, "eval_samples_per_second": 23.756, "eval_steps_per_second": 2.97, "eval_wer": 0.9977818108489614, "step": 2200 }, { "epoch": 6.117021276595745, "eval_cer": 0.217309563919061, "eval_loss": 0.4651758670806885, "eval_runtime": 239.8374, "eval_samples_per_second": 20.677, "eval_steps_per_second": 2.585, "eval_wer": 0.9991933857632587, "step": 2300 }, { "epoch": 6.382978723404255, "eval_cer": 0.21218149909907094, "eval_loss": 0.45553550124168396, "eval_runtime": 209.0918, "eval_samples_per_second": 23.717, "eval_steps_per_second": 2.965, "eval_wer": 0.9973785037305909, "step": 2400 }, { "epoch": 6.648936170212766, "grad_norm": 3.0910284519195557, "learning_rate": 5.9903999999999994e-05, "loss": 0.4238, "step": 2500 }, { "epoch": 6.648936170212766, "eval_cer": 0.21164211423233417, "eval_loss": 0.4360628128051758, "eval_runtime": 211.1218, "eval_samples_per_second": 23.489, "eval_steps_per_second": 2.937, "eval_wer": 0.9987900786448881, "step": 2500 }, { "epoch": 6.914893617021277, "eval_cer": 0.20628344283888417, "eval_loss": 0.4180741608142853, "eval_runtime": 210.3304, "eval_samples_per_second": 23.577, "eval_steps_per_second": 2.948, "eval_wer": 0.9989917322040734, "step": 2600 }, { "epoch": 7.180851063829787, "eval_cer": 0.2011983724647934, "eval_loss": 0.4185584485530853, "eval_runtime": 209.9592, "eval_samples_per_second": 23.619, "eval_steps_per_second": 2.953, "eval_wer": 0.9957652752571083, "step": 2700 }, { "epoch": 7.446808510638298, "eval_cer": 0.20350052961340176, "eval_loss": 0.4253988265991211, "eval_runtime": 212.3471, "eval_samples_per_second": 23.353, "eval_steps_per_second": 2.92, "eval_wer": 0.999395039322444, "step": 2800 }, { "epoch": 7.712765957446808, "eval_cer": 0.1980519607421623, "eval_loss": 0.4013788104057312, "eval_runtime": 213.4065, "eval_samples_per_second": 23.237, "eval_steps_per_second": 2.905, "eval_wer": 0.9983867715265174, "step": 2900 }, { "epoch": 7.9787234042553195, "grad_norm": 2.3959779739379883, "learning_rate": 7.1904e-05, "loss": 0.3375, "step": 3000 }, { "epoch": 7.9787234042553195, "eval_cer": 0.19799333195229962, "eval_loss": 0.38772091269493103, "eval_runtime": 212.9922, "eval_samples_per_second": 23.283, "eval_steps_per_second": 2.911, "eval_wer": 0.9975801572897761, "step": 3000 }, { "epoch": 8.24468085106383, "eval_cer": 0.19256821459700524, "eval_loss": 0.3868231475353241, "eval_runtime": 211.4945, "eval_samples_per_second": 23.447, "eval_steps_per_second": 2.932, "eval_wer": 0.9981851179673321, "step": 3100 }, { "epoch": 8.51063829787234, "eval_cer": 0.19027778320636943, "eval_loss": 0.374016672372818, "eval_runtime": 207.4949, "eval_samples_per_second": 23.899, "eval_steps_per_second": 2.988, "eval_wer": 0.9977818108489614, "step": 3200 }, { "epoch": 8.77659574468085, "eval_cer": 0.18545067950767452, "eval_loss": 0.36447063088417053, "eval_runtime": 208.0584, "eval_samples_per_second": 23.835, "eval_steps_per_second": 2.98, "eval_wer": 0.9981851179673321, "step": 3300 }, { "epoch": 9.042553191489361, "eval_cer": 0.18235117081693356, "eval_loss": 0.35864943265914917, "eval_runtime": 233.9479, "eval_samples_per_second": 21.197, "eval_steps_per_second": 2.65, "eval_wer": 0.9991933857632587, "step": 3400 }, { "epoch": 9.308510638297872, "grad_norm": 1.6243752241134644, "learning_rate": 8.390399999999999e-05, "loss": 0.2553, "step": 3500 }, { "epoch": 9.308510638297872, "eval_cer": 0.1774537125704034, "eval_loss": 0.3328181505203247, "eval_runtime": 208.1328, "eval_samples_per_second": 23.826, "eval_steps_per_second": 2.979, "eval_wer": 0.9979834644081468, "step": 3500 }, { "epoch": 9.574468085106384, "eval_cer": 0.174365929637635, "eval_loss": 0.34012970328330994, "eval_runtime": 208.9838, "eval_samples_per_second": 23.729, "eval_steps_per_second": 2.967, "eval_wer": 0.9977818108489614, "step": 3600 }, { "epoch": 9.840425531914894, "eval_cer": 0.1727282321074705, "eval_loss": 0.31242451071739197, "eval_runtime": 209.0076, "eval_samples_per_second": 23.726, "eval_steps_per_second": 2.966, "eval_wer": 0.9975801572897761, "step": 3700 }, { "epoch": 10.106382978723405, "eval_cer": 0.1708716537618186, "eval_loss": 0.322468101978302, "eval_runtime": 207.4311, "eval_samples_per_second": 23.907, "eval_steps_per_second": 2.989, "eval_wer": 0.9987900786448881, "step": 3800 }, { "epoch": 10.372340425531915, "eval_cer": 0.17599971858180866, "eval_loss": 0.3310896158218384, "eval_runtime": 206.3784, "eval_samples_per_second": 24.029, "eval_steps_per_second": 3.004, "eval_wer": 0.9973785037305909, "step": 3900 }, { "epoch": 10.638297872340425, "grad_norm": 2.6917850971221924, "learning_rate": 9.5904e-05, "loss": 0.2035, "step": 4000 }, { "epoch": 10.638297872340425, "eval_cer": 0.17048861233471568, "eval_loss": 0.3098428249359131, "eval_runtime": 207.2374, "eval_samples_per_second": 23.929, "eval_steps_per_second": 2.992, "eval_wer": 0.9979834644081468, "step": 4000 }, { "epoch": 10.904255319148936, "eval_cer": 0.1713641355966652, "eval_loss": 0.32444971799850464, "eval_runtime": 207.2878, "eval_samples_per_second": 23.923, "eval_steps_per_second": 2.991, "eval_wer": 0.9979834644081468, "step": 4100 }, { "epoch": 11.170212765957446, "eval_cer": 0.16859294812915532, "eval_loss": 0.3280084431171417, "eval_runtime": 206.6779, "eval_samples_per_second": 23.994, "eval_steps_per_second": 3.0, "eval_wer": 0.9925388183101431, "step": 4200 }, { "epoch": 11.436170212765958, "eval_cer": 0.17051206385066076, "eval_loss": 0.31342190504074097, "eval_runtime": 214.4373, "eval_samples_per_second": 23.126, "eval_steps_per_second": 2.891, "eval_wer": 0.9983867715265174, "step": 4300 }, { "epoch": 11.702127659574469, "eval_cer": 0.16671291826755835, "eval_loss": 0.3024933338165283, "eval_runtime": 208.7095, "eval_samples_per_second": 23.76, "eval_steps_per_second": 2.971, "eval_wer": 0.9987900786448881, "step": 4400 }, { "epoch": 11.96808510638298, "grad_norm": 1.652050256729126, "learning_rate": 0.00010787999999999998, "loss": 0.1772, "step": 4500 }, { "epoch": 11.96808510638298, "eval_cer": 0.16904634410409347, "eval_loss": 0.31564900279045105, "eval_runtime": 207.6579, "eval_samples_per_second": 23.881, "eval_steps_per_second": 2.986, "eval_wer": 0.9979834644081468, "step": 4500 }, { "epoch": 12.23404255319149, "eval_cer": 0.16571232025390176, "eval_loss": 0.3212853670120239, "eval_runtime": 208.1891, "eval_samples_per_second": 23.82, "eval_steps_per_second": 2.978, "eval_wer": 0.9967735430530349, "step": 4600 }, { "epoch": 12.5, "eval_cer": 0.17018374262742966, "eval_loss": 0.31842583417892456, "eval_runtime": 207.4188, "eval_samples_per_second": 23.908, "eval_steps_per_second": 2.989, "eval_wer": 0.9975801572897761, "step": 4700 }, { "epoch": 12.76595744680851, "eval_cer": 0.16590774955344406, "eval_loss": 0.3348098397254944, "eval_runtime": 206.5664, "eval_samples_per_second": 24.007, "eval_steps_per_second": 3.001, "eval_wer": 0.9989917322040734, "step": 4800 }, { "epoch": 13.03191489361702, "eval_cer": 0.16545044499251504, "eval_loss": 0.31754830479621887, "eval_runtime": 204.6212, "eval_samples_per_second": 24.235, "eval_steps_per_second": 3.03, "eval_wer": 0.9977818108489614, "step": 4900 }, { "epoch": 13.297872340425531, "grad_norm": 1.4975948333740234, "learning_rate": 0.00011988, "loss": 0.1542, "step": 5000 }, { "epoch": 13.297872340425531, "eval_cer": 0.16795975719863826, "eval_loss": 0.3414091467857361, "eval_runtime": 212.8965, "eval_samples_per_second": 23.293, "eval_steps_per_second": 2.912, "eval_wer": 0.9997983464408147, "step": 5000 }, { "epoch": 13.563829787234042, "eval_cer": 0.17008993656364937, "eval_loss": 0.3142850399017334, "eval_runtime": 206.8293, "eval_samples_per_second": 23.976, "eval_steps_per_second": 2.998, "eval_wer": 0.999395039322444, "step": 5100 }, { "epoch": 13.829787234042554, "eval_cer": 0.16879228601468846, "eval_loss": 0.3204251229763031, "eval_runtime": 205.7182, "eval_samples_per_second": 24.106, "eval_steps_per_second": 3.014, "eval_wer": 0.9985884250857028, "step": 5200 }, { "epoch": 14.095744680851064, "eval_cer": 0.16618525915879412, "eval_loss": 0.35486334562301636, "eval_runtime": 206.3465, "eval_samples_per_second": 24.032, "eval_steps_per_second": 3.005, "eval_wer": 0.9989917322040734, "step": 5300 }, { "epoch": 14.361702127659575, "eval_cer": 0.1666073864458055, "eval_loss": 0.40914931893348694, "eval_runtime": 206.0512, "eval_samples_per_second": 24.067, "eval_steps_per_second": 3.009, "eval_wer": 0.9973785037305909, "step": 5400 }, { "epoch": 14.627659574468085, "grad_norm": 2.959421157836914, "learning_rate": 0.000131856, "loss": 0.1449, "step": 5500 }, { "epoch": 14.627659574468085, "eval_cer": 0.16760407587347126, "eval_loss": 0.3907996714115143, "eval_runtime": 205.2139, "eval_samples_per_second": 24.165, "eval_steps_per_second": 3.021, "eval_wer": 0.9985884250857028, "step": 5500 }, { "epoch": 14.893617021276595, "eval_cer": 0.1662243450187026, "eval_loss": 0.3705514073371887, "eval_runtime": 205.3677, "eval_samples_per_second": 24.147, "eval_steps_per_second": 3.019, "eval_wer": 0.9983867715265174, "step": 5600 }, { "epoch": 15.159574468085106, "eval_cer": 0.164105891411664, "eval_loss": 0.3971535861492157, "eval_runtime": 205.6896, "eval_samples_per_second": 24.109, "eval_steps_per_second": 3.014, "eval_wer": 0.9971768501714056, "step": 5700 }, { "epoch": 15.425531914893616, "eval_cer": 0.1653097358968446, "eval_loss": 0.3461838662624359, "eval_runtime": 206.3509, "eval_samples_per_second": 24.032, "eval_steps_per_second": 3.005, "eval_wer": 0.9983867715265174, "step": 5800 }, { "epoch": 15.691489361702128, "eval_cer": 0.16992186736604298, "eval_loss": 0.35435542464256287, "eval_runtime": 205.3227, "eval_samples_per_second": 24.152, "eval_steps_per_second": 3.02, "eval_wer": 0.9983867715265174, "step": 5900 }, { "epoch": 15.957446808510639, "grad_norm": 1.915339469909668, "learning_rate": 0.00014385599999999999, "loss": 0.1396, "step": 6000 }, { "epoch": 15.957446808510639, "eval_cer": 0.1681590950841714, "eval_loss": 0.33965829014778137, "eval_runtime": 205.3964, "eval_samples_per_second": 24.144, "eval_steps_per_second": 3.019, "eval_wer": 0.9987900786448881, "step": 6000 }, { "epoch": 16.22340425531915, "eval_cer": 0.16804574609043688, "eval_loss": 0.3451753556728363, "eval_runtime": 205.8971, "eval_samples_per_second": 24.085, "eval_steps_per_second": 3.011, "eval_wer": 0.9983867715265174, "step": 6100 }, { "epoch": 16.48936170212766, "eval_cer": 0.16652921472598858, "eval_loss": 0.3533567488193512, "eval_runtime": 205.4803, "eval_samples_per_second": 24.134, "eval_steps_per_second": 3.017, "eval_wer": 0.9981851179673321, "step": 6200 }, { "epoch": 16.75531914893617, "eval_cer": 0.17028145727720082, "eval_loss": 0.3502165377140045, "eval_runtime": 205.7767, "eval_samples_per_second": 24.099, "eval_steps_per_second": 3.013, "eval_wer": 0.9985884250857028, "step": 6300 }, { "epoch": 17.02127659574468, "eval_cer": 0.17007430221968597, "eval_loss": 0.34754782915115356, "eval_runtime": 205.7613, "eval_samples_per_second": 24.101, "eval_steps_per_second": 3.013, "eval_wer": 0.9977818108489614, "step": 6400 }, { "epoch": 17.28723404255319, "grad_norm": 1.2938112020492554, "learning_rate": 0.00015585599999999998, "loss": 0.1293, "step": 6500 }, { "epoch": 17.28723404255319, "eval_cer": 0.1681239178102538, "eval_loss": 0.3350105881690979, "eval_runtime": 206.0245, "eval_samples_per_second": 24.07, "eval_steps_per_second": 3.009, "eval_wer": 0.9987900786448881, "step": 6500 }, { "epoch": 17.5531914893617, "eval_cer": 0.16944501987515975, "eval_loss": 0.3442031443119049, "eval_runtime": 205.3927, "eval_samples_per_second": 24.144, "eval_steps_per_second": 3.019, "eval_wer": 0.9977818108489614, "step": 6600 }, { "epoch": 17.819148936170212, "eval_cer": 0.16870629712288984, "eval_loss": 0.33415013551712036, "eval_runtime": 205.9912, "eval_samples_per_second": 24.074, "eval_steps_per_second": 3.01, "eval_wer": 0.9987900786448881, "step": 6700 }, { "epoch": 18.085106382978722, "eval_cer": 0.1696013633147936, "eval_loss": 0.3668520450592041, "eval_runtime": 205.5898, "eval_samples_per_second": 24.121, "eval_steps_per_second": 3.016, "eval_wer": 0.9985884250857028, "step": 6800 }, { "epoch": 18.351063829787233, "eval_cer": 0.16906197844805684, "eval_loss": 0.34041330218315125, "eval_runtime": 205.1961, "eval_samples_per_second": 24.167, "eval_steps_per_second": 3.022, "eval_wer": 0.9969751966122202, "step": 6900 }, { "epoch": 18.617021276595743, "grad_norm": 2.553234815597534, "learning_rate": 0.000167856, "loss": 0.1276, "step": 7000 }, { "epoch": 18.617021276595743, "eval_cer": 0.16789331123679385, "eval_loss": 0.3463904857635498, "eval_runtime": 204.7479, "eval_samples_per_second": 24.22, "eval_steps_per_second": 3.028, "eval_wer": 0.9989917322040734, "step": 7000 }, { "epoch": 18.882978723404257, "eval_cer": 0.16948801432105906, "eval_loss": 0.3496261537075043, "eval_runtime": 205.3143, "eval_samples_per_second": 24.153, "eval_steps_per_second": 3.02, "eval_wer": 0.9983867715265174, "step": 7100 }, { "epoch": 19.148936170212767, "eval_cer": 0.16978897544235422, "eval_loss": 0.3436301350593567, "eval_runtime": 205.1734, "eval_samples_per_second": 24.17, "eval_steps_per_second": 3.022, "eval_wer": 0.9967735430530349, "step": 7200 }, { "epoch": 19.414893617021278, "eval_cer": 0.16896035521229485, "eval_loss": 0.36047497391700745, "eval_runtime": 205.4789, "eval_samples_per_second": 24.134, "eval_steps_per_second": 3.017, "eval_wer": 0.9953619681387377, "step": 7300 }, { "epoch": 19.680851063829788, "eval_cer": 0.16866330267699053, "eval_loss": 0.3582172989845276, "eval_runtime": 205.1102, "eval_samples_per_second": 24.177, "eval_steps_per_second": 3.023, "eval_wer": 0.9973785037305909, "step": 7400 }, { "epoch": 19.9468085106383, "grad_norm": 1.7617504596710205, "learning_rate": 0.000179856, "loss": 0.1264, "step": 7500 }, { "epoch": 19.9468085106383, "eval_cer": 0.17402197407044054, "eval_loss": 0.3575660288333893, "eval_runtime": 204.7059, "eval_samples_per_second": 24.225, "eval_steps_per_second": 3.029, "eval_wer": 0.9981851179673321, "step": 7500 }, { "epoch": 20.21276595744681, "eval_cer": 0.17258752301180003, "eval_loss": 0.3668830990791321, "eval_runtime": 205.0195, "eval_samples_per_second": 24.188, "eval_steps_per_second": 3.024, "eval_wer": 0.9985884250857028, "step": 7600 }, { "epoch": 20.47872340425532, "eval_cer": 0.17064495577434952, "eval_loss": 0.361765593290329, "eval_runtime": 204.8268, "eval_samples_per_second": 24.211, "eval_steps_per_second": 3.027, "eval_wer": 0.9979834644081468, "step": 7700 }, { "epoch": 20.74468085106383, "eval_cer": 0.17463562207100336, "eval_loss": 0.34747639298439026, "eval_runtime": 204.8046, "eval_samples_per_second": 24.213, "eval_steps_per_second": 3.027, "eval_wer": 0.9989917322040734, "step": 7800 }, { "epoch": 21.01063829787234, "eval_cer": 0.1715165704503082, "eval_loss": 0.34254932403564453, "eval_runtime": 204.6469, "eval_samples_per_second": 24.232, "eval_steps_per_second": 3.03, "eval_wer": 0.9971768501714056, "step": 7900 }, { "epoch": 21.27659574468085, "grad_norm": 1.5520191192626953, "learning_rate": 0.000191856, "loss": 0.1219, "step": 8000 }, { "epoch": 21.27659574468085, "eval_cer": 0.1716377366160244, "eval_loss": 0.3685350716114044, "eval_runtime": 204.5671, "eval_samples_per_second": 24.241, "eval_steps_per_second": 3.031, "eval_wer": 0.9983867715265174, "step": 8000 }, { "epoch": 21.54255319148936, "eval_cer": 0.1755893170527698, "eval_loss": 0.38032132387161255, "eval_runtime": 204.7288, "eval_samples_per_second": 24.222, "eval_steps_per_second": 3.028, "eval_wer": 0.9989917322040734, "step": 8100 }, { "epoch": 21.80851063829787, "eval_cer": 0.17974805254703005, "eval_loss": 0.36628487706184387, "eval_runtime": 205.2564, "eval_samples_per_second": 24.16, "eval_steps_per_second": 3.021, "eval_wer": 0.9983867715265174, "step": 8200 }, { "epoch": 22.074468085106382, "eval_cer": 0.1709576426536172, "eval_loss": 0.3641684055328369, "eval_runtime": 205.4639, "eval_samples_per_second": 24.136, "eval_steps_per_second": 3.018, "eval_wer": 0.9977818108489614, "step": 8300 }, { "epoch": 22.340425531914892, "eval_cer": 0.17367801850324607, "eval_loss": 0.38052114844322205, "eval_runtime": 205.4218, "eval_samples_per_second": 24.141, "eval_steps_per_second": 3.018, "eval_wer": 0.9987900786448881, "step": 8400 }, { "epoch": 22.606382978723403, "grad_norm": 2.203418493270874, "learning_rate": 0.00020385599999999998, "loss": 0.1177, "step": 8500 }, { "epoch": 22.606382978723403, "eval_cer": 0.17468252510289353, "eval_loss": 0.36295458674430847, "eval_runtime": 205.462, "eval_samples_per_second": 24.136, "eval_steps_per_second": 3.018, "eval_wer": 0.9985884250857028, "step": 8500 }, { "epoch": 22.872340425531917, "eval_cer": 0.1753078988614289, "eval_loss": 0.4001345634460449, "eval_runtime": 205.3238, "eval_samples_per_second": 24.152, "eval_steps_per_second": 3.02, "eval_wer": 0.9973785037305909, "step": 8600 }, { "epoch": 23.138297872340427, "eval_cer": 0.17578865493830298, "eval_loss": 0.375848650932312, "eval_runtime": 205.2532, "eval_samples_per_second": 24.16, "eval_steps_per_second": 3.021, "eval_wer": 0.9977818108489614, "step": 8700 }, { "epoch": 23.404255319148938, "eval_cer": 0.17470988520482944, "eval_loss": 0.37709999084472656, "eval_runtime": 205.004, "eval_samples_per_second": 24.19, "eval_steps_per_second": 3.024, "eval_wer": 0.9983867715265174, "step": 8800 }, { "epoch": 23.670212765957448, "eval_cer": 0.17936501111992714, "eval_loss": 0.4001403748989105, "eval_runtime": 204.8778, "eval_samples_per_second": 24.205, "eval_steps_per_second": 3.026, "eval_wer": 0.9983867715265174, "step": 8900 }, { "epoch": 23.93617021276596, "grad_norm": 1.3760440349578857, "learning_rate": 0.000215856, "loss": 0.1241, "step": 9000 }, { "epoch": 23.93617021276596, "eval_cer": 0.17689087618772156, "eval_loss": 0.3929387629032135, "eval_runtime": 205.6986, "eval_samples_per_second": 24.108, "eval_steps_per_second": 3.014, "eval_wer": 0.9997983464408147, "step": 9000 }, { "epoch": 24.20212765957447, "eval_cer": 0.17517500693774013, "eval_loss": 0.3732432425022125, "eval_runtime": 205.6021, "eval_samples_per_second": 24.119, "eval_steps_per_second": 3.016, "eval_wer": 0.9991933857632587, "step": 9100 }, { "epoch": 24.46808510638298, "eval_cer": 0.17383045335688907, "eval_loss": 0.3813112676143646, "eval_runtime": 205.3982, "eval_samples_per_second": 24.143, "eval_steps_per_second": 3.019, "eval_wer": 0.9983867715265174, "step": 9200 }, { "epoch": 24.73404255319149, "eval_cer": 0.17939627980785391, "eval_loss": 0.41280829906463623, "eval_runtime": 219.7977, "eval_samples_per_second": 22.562, "eval_steps_per_second": 2.821, "eval_wer": 0.9989917322040734, "step": 9300 }, { "epoch": 25.0, "eval_cer": 0.17513592107783169, "eval_loss": 0.3756047785282135, "eval_runtime": 219.9345, "eval_samples_per_second": 22.548, "eval_steps_per_second": 2.819, "eval_wer": 0.9989917322040734, "step": 9400 }, { "epoch": 25.26595744680851, "grad_norm": 9.107454299926758, "learning_rate": 0.00022783199999999997, "loss": 0.121, "step": 9500 }, { "epoch": 25.26595744680851, "eval_cer": 0.17971678385910328, "eval_loss": 0.39162904024124146, "eval_runtime": 219.1957, "eval_samples_per_second": 22.624, "eval_steps_per_second": 2.829, "eval_wer": 0.9989917322040734, "step": 9500 }, { "epoch": 25.53191489361702, "eval_cer": 0.18236680516089696, "eval_loss": 0.38820743560791016, "eval_runtime": 219.4833, "eval_samples_per_second": 22.594, "eval_steps_per_second": 2.825, "eval_wer": 0.9983867715265174, "step": 9600 }, { "epoch": 25.79787234042553, "eval_cer": 0.18378562187557407, "eval_loss": 0.39170223474502563, "eval_runtime": 219.5415, "eval_samples_per_second": 22.588, "eval_steps_per_second": 2.824, "eval_wer": 0.9975801572897761, "step": 9700 }, { "epoch": 26.06382978723404, "eval_cer": 0.17702376811141032, "eval_loss": 0.3927652835845947, "eval_runtime": 219.475, "eval_samples_per_second": 22.595, "eval_steps_per_second": 2.825, "eval_wer": 0.9983867715265174, "step": 9800 }, { "epoch": 26.329787234042552, "eval_cer": 0.18011155104417875, "eval_loss": 0.3928898870944977, "eval_runtime": 219.0682, "eval_samples_per_second": 22.637, "eval_steps_per_second": 2.83, "eval_wer": 0.9995966928816293, "step": 9900 }, { "epoch": 26.595744680851062, "grad_norm": 1.6058417558670044, "learning_rate": 0.000239832, "loss": 0.1206, "step": 10000 }, { "epoch": 26.595744680851062, "eval_cer": 0.17812598936082893, "eval_loss": 0.39845964312553406, "eval_runtime": 219.0245, "eval_samples_per_second": 22.641, "eval_steps_per_second": 2.831, "eval_wer": 0.9987900786448881, "step": 10000 }, { "epoch": 26.861702127659573, "eval_cer": 0.1770628539713188, "eval_loss": 0.3799264132976532, "eval_runtime": 219.8342, "eval_samples_per_second": 22.558, "eval_steps_per_second": 2.82, "eval_wer": 0.999395039322444, "step": 10100 }, { "epoch": 27.127659574468087, "eval_cer": 0.1785715681637854, "eval_loss": 0.4022609293460846, "eval_runtime": 221.0183, "eval_samples_per_second": 22.437, "eval_steps_per_second": 2.805, "eval_wer": 0.999395039322444, "step": 10200 }, { "epoch": 27.393617021276597, "eval_cer": 0.17838395603622478, "eval_loss": 0.4000260531902313, "eval_runtime": 218.5093, "eval_samples_per_second": 22.695, "eval_steps_per_second": 2.837, "eval_wer": 0.9991933857632587, "step": 10300 }, { "epoch": 27.659574468085108, "eval_cer": 0.18251142284255825, "eval_loss": 0.37564513087272644, "eval_runtime": 218.7597, "eval_samples_per_second": 22.669, "eval_steps_per_second": 2.834, "eval_wer": 0.9975801572897761, "step": 10400 }, { "epoch": 27.925531914893618, "grad_norm": 5.426018238067627, "learning_rate": 0.00025183199999999996, "loss": 0.124, "step": 10500 }, { "epoch": 27.925531914893618, "eval_cer": 0.17786411409944225, "eval_loss": 0.39711853861808777, "eval_runtime": 219.1126, "eval_samples_per_second": 22.632, "eval_steps_per_second": 2.83, "eval_wer": 0.9985884250857028, "step": 10500 }, { "epoch": 28.19148936170213, "eval_cer": 0.178911615144989, "eval_loss": 0.42398887872695923, "eval_runtime": 216.8565, "eval_samples_per_second": 22.868, "eval_steps_per_second": 2.859, "eval_wer": 0.9995966928816293, "step": 10600 }, { "epoch": 28.45744680851064, "eval_cer": 0.17917349040637567, "eval_loss": 0.37179791927337646, "eval_runtime": 219.2208, "eval_samples_per_second": 22.621, "eval_steps_per_second": 2.828, "eval_wer": 0.9979834644081468, "step": 10700 }, { "epoch": 28.72340425531915, "eval_cer": 0.17998256770648083, "eval_loss": 0.41135987639427185, "eval_runtime": 220.5483, "eval_samples_per_second": 22.485, "eval_steps_per_second": 2.811, "eval_wer": 0.9985884250857028, "step": 10800 }, { "epoch": 28.98936170212766, "eval_cer": 0.18003337932436184, "eval_loss": 0.41742414236068726, "eval_runtime": 218.3591, "eval_samples_per_second": 22.71, "eval_steps_per_second": 2.839, "eval_wer": 0.9977818108489614, "step": 10900 }, { "epoch": 29.25531914893617, "grad_norm": 2.8614120483398438, "learning_rate": 0.000263832, "loss": 0.122, "step": 11000 }, { "epoch": 29.25531914893617, "eval_cer": 0.18530997041200406, "eval_loss": 0.4062168598175049, "eval_runtime": 220.2511, "eval_samples_per_second": 22.515, "eval_steps_per_second": 2.815, "eval_wer": 0.9987900786448881, "step": 11000 }, { "epoch": 29.52127659574468, "eval_cer": 0.1861112305401275, "eval_loss": 0.4202740788459778, "eval_runtime": 217.0728, "eval_samples_per_second": 22.845, "eval_steps_per_second": 2.856, "eval_wer": 0.9977818108489614, "step": 11100 }, { "epoch": 29.78723404255319, "eval_cer": 0.18606432750823734, "eval_loss": 0.43755000829696655, "eval_runtime": 219.2588, "eval_samples_per_second": 22.617, "eval_steps_per_second": 2.828, "eval_wer": 0.9985884250857028, "step": 11200 }, { "epoch": 30.0531914893617, "eval_cer": 0.18122940663756074, "eval_loss": 0.409412682056427, "eval_runtime": 223.5339, "eval_samples_per_second": 22.185, "eval_steps_per_second": 2.774, "eval_wer": 0.9991933857632587, "step": 11300 }, { "epoch": 30.319148936170212, "eval_cer": 0.18185868898208696, "eval_loss": 0.40995094180107117, "eval_runtime": 225.4254, "eval_samples_per_second": 21.998, "eval_steps_per_second": 2.75, "eval_wer": 0.9987900786448881, "step": 11400 }, { "epoch": 30.585106382978722, "grad_norm": 1.4252536296844482, "learning_rate": 0.000275832, "loss": 0.125, "step": 11500 }, { "epoch": 30.585106382978722, "eval_cer": 0.18692812501221434, "eval_loss": 0.39966416358947754, "eval_runtime": 219.2997, "eval_samples_per_second": 22.613, "eval_steps_per_second": 2.827, "eval_wer": 0.9981851179673321, "step": 11500 }, { "epoch": 30.851063829787233, "eval_cer": 0.18203848393766586, "eval_loss": 0.4437381625175476, "eval_runtime": 219.4853, "eval_samples_per_second": 22.594, "eval_steps_per_second": 2.825, "eval_wer": 0.9989917322040734, "step": 11600 }, { "epoch": 31.117021276595743, "eval_cer": 0.18580245224685066, "eval_loss": 0.44233861565589905, "eval_runtime": 216.9437, "eval_samples_per_second": 22.858, "eval_steps_per_second": 2.858, "eval_wer": 0.9989917322040734, "step": 11700 }, { "epoch": 31.382978723404257, "eval_cer": 0.18947652307824597, "eval_loss": 0.4216567575931549, "eval_runtime": 217.1103, "eval_samples_per_second": 22.841, "eval_steps_per_second": 2.856, "eval_wer": 0.9987900786448881, "step": 11800 }, { "epoch": 31.648936170212767, "eval_cer": 0.1966175096835218, "eval_loss": 0.4611862301826477, "eval_runtime": 226.5232, "eval_samples_per_second": 21.892, "eval_steps_per_second": 2.737, "eval_wer": 0.9991933857632587, "step": 11900 }, { "epoch": 31.914893617021278, "grad_norm": 5.578627586364746, "learning_rate": 0.00028783199999999996, "loss": 0.1294, "step": 12000 }, { "epoch": 31.914893617021278, "eval_cer": 0.18622067094787118, "eval_loss": 0.4385882318019867, "eval_runtime": 216.3818, "eval_samples_per_second": 22.918, "eval_steps_per_second": 2.865, "eval_wer": 0.9973785037305909, "step": 12000 }, { "epoch": 32.180851063829785, "eval_cer": 0.1892146478168593, "eval_loss": 0.42784062027931213, "eval_runtime": 236.4807, "eval_samples_per_second": 20.97, "eval_steps_per_second": 2.622, "eval_wer": 0.9983867715265174, "step": 12100 }, { "epoch": 32.4468085106383, "eval_cer": 0.1856109315332992, "eval_loss": 0.4187084436416626, "eval_runtime": 222.7058, "eval_samples_per_second": 22.267, "eval_steps_per_second": 2.784, "eval_wer": 0.9983867715265174, "step": 12200 }, { "epoch": 32.712765957446805, "eval_cer": 0.18286710416772525, "eval_loss": 0.4047478437423706, "eval_runtime": 222.5261, "eval_samples_per_second": 22.285, "eval_steps_per_second": 2.786, "eval_wer": 0.9985884250857028, "step": 12300 }, { "epoch": 32.97872340425532, "eval_cer": 0.18515753555836106, "eval_loss": 0.4230673015117645, "eval_runtime": 219.6428, "eval_samples_per_second": 22.578, "eval_steps_per_second": 2.823, "eval_wer": 0.9979834644081468, "step": 12400 }, { "epoch": 33.244680851063826, "grad_norm": 3.530928134918213, "learning_rate": 0.000299832, "loss": 0.1275, "step": 12500 }, { "epoch": 33.244680851063826, "eval_cer": 0.1842781037104207, "eval_loss": 0.41239944100379944, "eval_runtime": 212.9629, "eval_samples_per_second": 23.286, "eval_steps_per_second": 2.911, "eval_wer": 0.999395039322444, "step": 12500 }, { "epoch": 33.51063829787234, "eval_cer": 0.18698284521608619, "eval_loss": 0.41910141706466675, "eval_runtime": 209.3165, "eval_samples_per_second": 23.691, "eval_steps_per_second": 2.962, "eval_wer": 0.999395039322444, "step": 12600 }, { "epoch": 33.776595744680854, "eval_cer": 0.19266983783276723, "eval_loss": 0.4845859110355377, "eval_runtime": 209.6184, "eval_samples_per_second": 23.657, "eval_steps_per_second": 2.958, "eval_wer": 0.9979834644081468, "step": 12700 }, { "epoch": 34.04255319148936, "eval_cer": 0.18445399008000876, "eval_loss": 0.421185702085495, "eval_runtime": 209.5402, "eval_samples_per_second": 23.666, "eval_steps_per_second": 2.959, "eval_wer": 0.9983867715265174, "step": 12800 }, { "epoch": 34.308510638297875, "eval_cer": 0.183660547123867, "eval_loss": 0.43256160616874695, "eval_runtime": 219.5902, "eval_samples_per_second": 22.583, "eval_steps_per_second": 2.823, "eval_wer": 0.9983867715265174, "step": 12900 }, { "epoch": 34.57446808510638, "grad_norm": 1.3231768608093262, "learning_rate": 0.00029548990895071305, "loss": 0.134, "step": 13000 }, { "epoch": 34.57446808510638, "eval_cer": 0.18797171747177024, "eval_loss": 0.4103536009788513, "eval_runtime": 213.3906, "eval_samples_per_second": 23.239, "eval_steps_per_second": 2.905, "eval_wer": 0.9991933857632587, "step": 13000 }, { "epoch": 34.840425531914896, "eval_cer": 0.18773329372632863, "eval_loss": 0.3964749276638031, "eval_runtime": 219.4036, "eval_samples_per_second": 22.602, "eval_steps_per_second": 2.826, "eval_wer": 0.9977818108489614, "step": 13100 }, { "epoch": 35.1063829787234, "eval_cer": 0.18439145270415522, "eval_loss": 0.4146926701068878, "eval_runtime": 211.7608, "eval_samples_per_second": 23.418, "eval_steps_per_second": 2.928, "eval_wer": 0.999395039322444, "step": 13200 }, { "epoch": 35.37234042553192, "eval_cer": 0.18589625831063097, "eval_loss": 0.4251463711261749, "eval_runtime": 208.6917, "eval_samples_per_second": 23.762, "eval_steps_per_second": 2.971, "eval_wer": 0.9977818108489614, "step": 13300 }, { "epoch": 35.638297872340424, "eval_cer": 0.19017225138461658, "eval_loss": 0.4457683861255646, "eval_runtime": 211.8043, "eval_samples_per_second": 23.413, "eval_steps_per_second": 2.927, "eval_wer": 0.999395039322444, "step": 13400 }, { "epoch": 35.90425531914894, "grad_norm": 3.084670066833496, "learning_rate": 0.00028198284613067677, "loss": 0.1293, "step": 13500 }, { "epoch": 35.90425531914894, "eval_cer": 0.19420591212716976, "eval_loss": 0.43544086813926697, "eval_runtime": 209.3943, "eval_samples_per_second": 23.683, "eval_steps_per_second": 2.961, "eval_wer": 0.9991933857632587, "step": 13500 }, { "epoch": 36.170212765957444, "eval_cer": 0.1863222941836332, "eval_loss": 0.4197835326194763, "eval_runtime": 210.9951, "eval_samples_per_second": 23.503, "eval_steps_per_second": 2.938, "eval_wer": 0.9995966928816293, "step": 13600 }, { "epoch": 36.43617021276596, "eval_cer": 0.18905830437722546, "eval_loss": 0.4278818666934967, "eval_runtime": 214.736, "eval_samples_per_second": 23.093, "eval_steps_per_second": 2.887, "eval_wer": 0.9985884250857028, "step": 13700 }, { "epoch": 36.702127659574465, "eval_cer": 0.18459079058968836, "eval_loss": 0.4114536941051483, "eval_runtime": 212.7503, "eval_samples_per_second": 23.309, "eval_steps_per_second": 2.914, "eval_wer": 0.9975801572897761, "step": 13800 }, { "epoch": 36.96808510638298, "eval_cer": 0.18683822753442486, "eval_loss": 0.43593207001686096, "eval_runtime": 213.278, "eval_samples_per_second": 23.251, "eval_steps_per_second": 2.907, "eval_wer": 0.9985884250857028, "step": 13900 }, { "epoch": 37.234042553191486, "grad_norm": 2.2776243686676025, "learning_rate": 0.00026031324776349936, "loss": 0.1193, "step": 14000 }, { "epoch": 37.234042553191486, "eval_cer": 0.19045757816194836, "eval_loss": 0.43160808086395264, "eval_runtime": 209.1934, "eval_samples_per_second": 23.705, "eval_steps_per_second": 2.964, "eval_wer": 0.9991933857632587, "step": 14000 }, { "epoch": 37.5, "eval_cer": 0.18992991905318413, "eval_loss": 0.4389212727546692, "eval_runtime": 215.9667, "eval_samples_per_second": 22.962, "eval_steps_per_second": 2.871, "eval_wer": 0.999395039322444, "step": 14100 }, { "epoch": 37.765957446808514, "eval_cer": 0.1825231486005308, "eval_loss": 0.42151185870170593, "eval_runtime": 208.7788, "eval_samples_per_second": 23.752, "eval_steps_per_second": 2.97, "eval_wer": 0.9991933857632587, "step": 14200 }, { "epoch": 38.03191489361702, "eval_cer": 0.18895668114146344, "eval_loss": 0.47925981879234314, "eval_runtime": 211.6717, "eval_samples_per_second": 23.428, "eval_steps_per_second": 2.929, "eval_wer": 0.9991933857632587, "step": 14300 }, { "epoch": 38.297872340425535, "eval_cer": 0.1853920507178118, "eval_loss": 0.4381818473339081, "eval_runtime": 209.7616, "eval_samples_per_second": 23.641, "eval_steps_per_second": 2.956, "eval_wer": 0.9983867715265174, "step": 14400 }, { "epoch": 38.56382978723404, "grad_norm": 1.5227301120758057, "learning_rate": 0.00023182127942485896, "loss": 0.1132, "step": 14500 }, { "epoch": 38.56382978723404, "eval_cer": 0.182441068294723, "eval_loss": 0.40106824040412903, "eval_runtime": 209.0948, "eval_samples_per_second": 23.717, "eval_steps_per_second": 2.965, "eval_wer": 0.9975801572897761, "step": 14500 }, { "epoch": 38.829787234042556, "eval_cer": 0.1797675954769843, "eval_loss": 0.4283459186553955, "eval_runtime": 209.0149, "eval_samples_per_second": 23.726, "eval_steps_per_second": 2.966, "eval_wer": 0.994958661020367, "step": 14600 }, { "epoch": 39.09574468085106, "eval_cer": 0.18034997478962037, "eval_loss": 0.4303878843784332, "eval_runtime": 211.9384, "eval_samples_per_second": 23.398, "eval_steps_per_second": 2.925, "eval_wer": 0.9979834644081468, "step": 14700 }, { "epoch": 39.361702127659576, "eval_cer": 0.18114732633175296, "eval_loss": 0.40491461753845215, "eval_runtime": 210.1586, "eval_samples_per_second": 23.596, "eval_steps_per_second": 2.95, "eval_wer": 0.9983867715265174, "step": 14800 }, { "epoch": 39.62765957446808, "eval_cer": 0.1785129393739227, "eval_loss": 0.41461843252182007, "eval_runtime": 209.4294, "eval_samples_per_second": 23.679, "eval_steps_per_second": 2.96, "eval_wer": 0.9987900786448881, "step": 14900 }, { "epoch": 39.8936170212766, "grad_norm": 3.955990791320801, "learning_rate": 0.00019826903907816743, "loss": 0.0949, "step": 15000 }, { "epoch": 39.8936170212766, "eval_cer": 0.18166325968254465, "eval_loss": 0.44991689920425415, "eval_runtime": 208.9423, "eval_samples_per_second": 23.734, "eval_steps_per_second": 2.967, "eval_wer": 0.9997983464408147, "step": 15000 }, { "epoch": 40.159574468085104, "eval_cer": 0.17907968434259539, "eval_loss": 0.420516699552536, "eval_runtime": 210.185, "eval_samples_per_second": 23.593, "eval_steps_per_second": 2.95, "eval_wer": 0.9977818108489614, "step": 15100 }, { "epoch": 40.42553191489362, "eval_cer": 0.1807017475287965, "eval_loss": 0.4418542683124542, "eval_runtime": 210.2936, "eval_samples_per_second": 23.581, "eval_steps_per_second": 2.948, "eval_wer": 0.9985884250857028, "step": 15200 }, { "epoch": 40.691489361702125, "eval_cer": 0.18009591670021535, "eval_loss": 0.4282812476158142, "eval_runtime": 209.7755, "eval_samples_per_second": 23.64, "eval_steps_per_second": 2.956, "eval_wer": 0.9981851179673321, "step": 15300 }, { "epoch": 40.95744680851064, "eval_cer": 0.17690651053168496, "eval_loss": 0.4327284097671509, "eval_runtime": 210.8473, "eval_samples_per_second": 23.519, "eval_steps_per_second": 2.941, "eval_wer": 0.9995966928816293, "step": 15400 }, { "epoch": 41.223404255319146, "grad_norm": 1.6714894771575928, "learning_rate": 0.0001617315793726526, "loss": 0.0876, "step": 15500 }, { "epoch": 41.223404255319146, "eval_cer": 0.17806736057096625, "eval_loss": 0.44882500171661377, "eval_runtime": 210.3046, "eval_samples_per_second": 23.58, "eval_steps_per_second": 2.948, "eval_wer": 0.9995966928816293, "step": 15500 }, { "epoch": 41.48936170212766, "eval_cer": 0.17360766395541086, "eval_loss": 0.41944339871406555, "eval_runtime": 210.2221, "eval_samples_per_second": 23.589, "eval_steps_per_second": 2.949, "eval_wer": 0.9989917322040734, "step": 15600 }, { "epoch": 41.755319148936174, "eval_cer": 0.17544079078511768, "eval_loss": 0.4319663345813751, "eval_runtime": 209.0871, "eval_samples_per_second": 23.717, "eval_steps_per_second": 2.965, "eval_wer": 0.9991933857632587, "step": 15700 }, { "epoch": 42.02127659574468, "eval_cer": 0.1729080270630494, "eval_loss": 0.4347435235977173, "eval_runtime": 209.3479, "eval_samples_per_second": 23.688, "eval_steps_per_second": 2.962, "eval_wer": 0.9989917322040734, "step": 15800 }, { "epoch": 42.287234042553195, "eval_cer": 0.17443628418547022, "eval_loss": 0.48187553882598877, "eval_runtime": 208.6066, "eval_samples_per_second": 23.772, "eval_steps_per_second": 2.972, "eval_wer": 0.999395039322444, "step": 15900 }, { "epoch": 42.5531914893617, "grad_norm": 0.7495588660240173, "learning_rate": 0.00012446857512509515, "loss": 0.0725, "step": 16000 }, { "epoch": 42.5531914893617, "eval_cer": 0.17520236703967607, "eval_loss": 0.44911447167396545, "eval_runtime": 208.5357, "eval_samples_per_second": 23.78, "eval_steps_per_second": 2.973, "eval_wer": 0.9989917322040734, "step": 16000 }, { "epoch": 42.819148936170215, "eval_cer": 0.17413923165016593, "eval_loss": 0.45369845628738403, "eval_runtime": 210.1991, "eval_samples_per_second": 23.592, "eval_steps_per_second": 2.95, "eval_wer": 0.9985884250857028, "step": 16100 }, { "epoch": 43.08510638297872, "eval_cer": 0.17170809116385966, "eval_loss": 0.4587579071521759, "eval_runtime": 209.6677, "eval_samples_per_second": 23.652, "eval_steps_per_second": 2.957, "eval_wer": 0.9983867715265174, "step": 16200 }, { "epoch": 43.351063829787236, "eval_cer": 0.17147357600440888, "eval_loss": 0.4416778087615967, "eval_runtime": 209.0934, "eval_samples_per_second": 23.717, "eval_steps_per_second": 2.965, "eval_wer": 0.9981851179673321, "step": 16300 }, { "epoch": 43.61702127659574, "eval_cer": 0.17290411847705855, "eval_loss": 0.45538103580474854, "eval_runtime": 210.428, "eval_samples_per_second": 23.566, "eval_steps_per_second": 2.946, "eval_wer": 0.9983867715265174, "step": 16400 }, { "epoch": 43.88297872340426, "grad_norm": 1.7286139726638794, "learning_rate": 8.878457276467852e-05, "loss": 0.0615, "step": 16500 }, { "epoch": 43.88297872340426, "eval_cer": 0.17189570329142026, "eval_loss": 0.44644975662231445, "eval_runtime": 208.6857, "eval_samples_per_second": 23.763, "eval_steps_per_second": 2.971, "eval_wer": 0.9995966928816293, "step": 16500 }, { "epoch": 44.148936170212764, "eval_cer": 0.17184489167353925, "eval_loss": 0.47256070375442505, "eval_runtime": 214.9431, "eval_samples_per_second": 23.071, "eval_steps_per_second": 2.884, "eval_wer": 0.9981851179673321, "step": 16600 }, { "epoch": 44.41489361702128, "eval_cer": 0.1704495264748072, "eval_loss": 0.4455854296684265, "eval_runtime": 212.2795, "eval_samples_per_second": 23.361, "eval_steps_per_second": 2.921, "eval_wer": 0.9979834644081468, "step": 16700 }, { "epoch": 44.680851063829785, "eval_cer": 0.16927304209156255, "eval_loss": 0.42471006512641907, "eval_runtime": 208.6276, "eval_samples_per_second": 23.77, "eval_steps_per_second": 2.972, "eval_wer": 0.9979834644081468, "step": 16800 }, { "epoch": 44.9468085106383, "eval_cer": 0.1683897016576313, "eval_loss": 0.4499261975288391, "eval_runtime": 208.8575, "eval_samples_per_second": 23.743, "eval_steps_per_second": 2.969, "eval_wer": 0.9985884250857028, "step": 16900 }, { "epoch": 45.212765957446805, "grad_norm": 1.9694031476974487, "learning_rate": 5.6886464673787096e-05, "loss": 0.0524, "step": 17000 }, { "epoch": 45.212765957446805, "eval_cer": 0.16670119250958582, "eval_loss": 0.46098417043685913, "eval_runtime": 209.0801, "eval_samples_per_second": 23.718, "eval_steps_per_second": 2.965, "eval_wer": 0.9987900786448881, "step": 17000 }, { "epoch": 45.47872340425532, "eval_cer": 0.16754153849761771, "eval_loss": 0.42516496777534485, "eval_runtime": 215.2938, "eval_samples_per_second": 23.034, "eval_steps_per_second": 2.88, "eval_wer": 0.9981851179673321, "step": 17100 }, { "epoch": 45.744680851063826, "eval_cer": 0.16701778797484435, "eval_loss": 0.41850271821022034, "eval_runtime": 208.7292, "eval_samples_per_second": 23.758, "eval_steps_per_second": 2.97, "eval_wer": 0.9979834644081468, "step": 17200 }, { "epoch": 46.01063829787234, "eval_cer": 0.16651748896801605, "eval_loss": 0.4377266764640808, "eval_runtime": 208.7268, "eval_samples_per_second": 23.758, "eval_steps_per_second": 2.97, "eval_wer": 0.9979834644081468, "step": 17300 }, { "epoch": 46.276595744680854, "eval_cer": 0.16658784351585126, "eval_loss": 0.4386991262435913, "eval_runtime": 208.9381, "eval_samples_per_second": 23.734, "eval_steps_per_second": 2.967, "eval_wer": 0.9991933857632587, "step": 17400 }, { "epoch": 46.54255319148936, "grad_norm": 0.5704839825630188, "learning_rate": 3.074700298507786e-05, "loss": 0.0466, "step": 17500 }, { "epoch": 46.54255319148936, "eval_cer": 0.16593510965537997, "eval_loss": 0.4388461112976074, "eval_runtime": 208.6064, "eval_samples_per_second": 23.772, "eval_steps_per_second": 2.972, "eval_wer": 0.9985884250857028, "step": 17500 }, { "epoch": 46.808510638297875, "eval_cer": 0.16539963337463406, "eval_loss": 0.4407631754875183, "eval_runtime": 209.5029, "eval_samples_per_second": 23.67, "eval_steps_per_second": 2.959, "eval_wer": 0.9985884250857028, "step": 17600 }, { "epoch": 47.07446808510638, "eval_cer": 0.16512603235527484, "eval_loss": 0.4277360141277313, "eval_runtime": 208.9388, "eval_samples_per_second": 23.734, "eval_steps_per_second": 2.967, "eval_wer": 0.9983867715265174, "step": 17700 }, { "epoch": 47.340425531914896, "eval_cer": 0.16503222629149453, "eval_loss": 0.4244243800640106, "eval_runtime": 208.9653, "eval_samples_per_second": 23.731, "eval_steps_per_second": 2.967, "eval_wer": 0.9985884250857028, "step": 17800 }, { "epoch": 47.6063829787234, "eval_cer": 0.16441857829093168, "eval_loss": 0.42959603667259216, "eval_runtime": 209.1668, "eval_samples_per_second": 23.708, "eval_steps_per_second": 2.964, "eval_wer": 0.9977818108489614, "step": 17900 }, { "epoch": 47.87234042553192, "grad_norm": 1.8080158233642578, "learning_rate": 1.1982793882402725e-05, "loss": 0.0393, "step": 18000 }, { "epoch": 47.87234042553192, "eval_cer": 0.1648250712339797, "eval_loss": 0.43411195278167725, "eval_runtime": 215.2833, "eval_samples_per_second": 23.035, "eval_steps_per_second": 2.88, "eval_wer": 0.9983867715265174, "step": 18000 }, { "epoch": 48.138297872340424, "eval_cer": 0.16460228183250145, "eval_loss": 0.43372273445129395, "eval_runtime": 259.5957, "eval_samples_per_second": 19.103, "eval_steps_per_second": 2.388, "eval_wer": 0.9981851179673321, "step": 18100 }, { "epoch": 48.40425531914894, "eval_cer": 0.16421142323341684, "eval_loss": 0.43311166763305664, "eval_runtime": 209.0523, "eval_samples_per_second": 23.721, "eval_steps_per_second": 2.966, "eval_wer": 0.9977818108489614, "step": 18200 }, { "epoch": 48.670212765957444, "eval_cer": 0.16413716009959078, "eval_loss": 0.4280834197998047, "eval_runtime": 210.4305, "eval_samples_per_second": 23.566, "eval_steps_per_second": 2.946, "eval_wer": 0.9979834644081468, "step": 18300 }, { "epoch": 48.93617021276596, "eval_cer": 0.1640824398957189, "eval_loss": 0.42681965231895447, "eval_runtime": 261.2993, "eval_samples_per_second": 18.978, "eval_steps_per_second": 2.373, "eval_wer": 0.9981851179673321, "step": 18400 }, { "epoch": 49.202127659574465, "grad_norm": 0.8930312395095825, "learning_rate": 1.7543179002012464e-06, "loss": 0.0373, "step": 18500 }, { "epoch": 49.202127659574465, "eval_cer": 0.16407071413774638, "eval_loss": 0.42752090096473694, "eval_runtime": 209.2156, "eval_samples_per_second": 23.703, "eval_steps_per_second": 2.963, "eval_wer": 0.9981851179673321, "step": 18500 }, { "epoch": 49.46808510638298, "eval_cer": 0.16406680555175554, "eval_loss": 0.4268626868724823, "eval_runtime": 212.2555, "eval_samples_per_second": 23.363, "eval_steps_per_second": 2.921, "eval_wer": 0.9981851179673321, "step": 18600 }, { "epoch": 49.734042553191486, "eval_cer": 0.16399254241792946, "eval_loss": 0.4268469214439392, "eval_runtime": 208.7487, "eval_samples_per_second": 23.756, "eval_steps_per_second": 2.97, "eval_wer": 0.9977818108489614, "step": 18700 }, { "epoch": 50.0, "eval_cer": 0.16415279444355416, "eval_loss": 0.42705675959587097, "eval_runtime": 208.3387, "eval_samples_per_second": 23.803, "eval_steps_per_second": 2.976, "eval_wer": 0.9977818108489614, "step": 18800 }, { "epoch": 50.0, "step": 18800, "total_flos": 2.6273093616415412e+19, "train_loss": 0.4882018888757584, "train_runtime": 107059.6152, "train_samples_per_second": 5.619, "train_steps_per_second": 0.176 } ], "logging_steps": 500, "max_steps": 18800, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 400, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 2.6273093616415412e+19, "train_batch_size": 16, "trial_name": null, "trial_params": null }