{ "best_metric": 0.8816327044764588, "best_model_checkpoint": "./models/bart-base-spelling-nl-9m-3/checkpoint-696000", "epoch": 1.999998703928716, "global_step": 771562, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 0.0002999961117836285, "loss": 0.9868, "step": 10 }, { "epoch": 0.0, "learning_rate": 0.000299992223567257, "loss": 0.289, "step": 20 }, { "epoch": 0.0, "learning_rate": 0.00029998833535088557, "loss": 0.1965, "step": 30 }, { "epoch": 0.0, "learning_rate": 0.00029998444713451414, "loss": 0.1664, "step": 40 }, { "epoch": 0.0, "learning_rate": 0.00029998055891814265, "loss": 0.1631, "step": 50 }, { "epoch": 0.0, "learning_rate": 0.00029997667070177117, "loss": 0.1647, "step": 60 }, { "epoch": 0.0, "learning_rate": 0.00029997278248539974, "loss": 0.1531, "step": 70 }, { "epoch": 0.0, "learning_rate": 0.00029996889426902825, "loss": 0.1556, "step": 80 }, { "epoch": 0.0, "learning_rate": 0.00029996500605265677, "loss": 0.1376, "step": 90 }, { "epoch": 0.0, "learning_rate": 0.00029996111783628534, "loss": 0.1429, "step": 100 }, { "epoch": 0.0, "learning_rate": 0.00029995722961991385, "loss": 0.1162, "step": 110 }, { "epoch": 0.0, "learning_rate": 0.0002999533414035424, "loss": 0.1291, "step": 120 }, { "epoch": 0.0, "learning_rate": 0.00029994945318717093, "loss": 0.13, "step": 130 }, { "epoch": 0.0, "learning_rate": 0.00029994556497079945, "loss": 0.1487, "step": 140 }, { "epoch": 0.0, "learning_rate": 0.000299941676754428, "loss": 0.1119, "step": 150 }, { "epoch": 0.0, "learning_rate": 0.00029993778853805653, "loss": 0.1375, "step": 160 }, { "epoch": 0.0, "learning_rate": 0.00029993390032168505, "loss": 0.1118, "step": 170 }, { "epoch": 0.0, "learning_rate": 0.0002999300121053136, "loss": 0.1084, "step": 180 }, { "epoch": 0.0, "learning_rate": 0.0002999261238889422, "loss": 0.1184, "step": 190 }, { "epoch": 0.0, "learning_rate": 0.0002999222356725707, "loss": 0.1323, "step": 200 }, { "epoch": 0.0, "learning_rate": 0.0002999183474561992, "loss": 0.1202, "step": 210 }, { "epoch": 0.0, "learning_rate": 0.00029991445923982773, "loss": 0.1063, "step": 220 }, { "epoch": 0.0, "learning_rate": 0.0002999105710234563, "loss": 0.1167, "step": 230 }, { "epoch": 0.0, "learning_rate": 0.0002999066828070848, "loss": 0.1002, "step": 240 }, { "epoch": 0.0, "learning_rate": 0.0002999027945907134, "loss": 0.104, "step": 250 }, { "epoch": 0.0, "learning_rate": 0.0002998989063743419, "loss": 0.1216, "step": 260 }, { "epoch": 0.0, "learning_rate": 0.0002998950181579704, "loss": 0.117, "step": 270 }, { "epoch": 0.0, "learning_rate": 0.000299891129941599, "loss": 0.1064, "step": 280 }, { "epoch": 0.0, "learning_rate": 0.0002998872417252275, "loss": 0.1148, "step": 290 }, { "epoch": 0.0, "learning_rate": 0.000299883353508856, "loss": 0.0943, "step": 300 }, { "epoch": 0.0, "learning_rate": 0.0002998794652924846, "loss": 0.1039, "step": 310 }, { "epoch": 0.0, "learning_rate": 0.0002998755770761131, "loss": 0.1171, "step": 320 }, { "epoch": 0.0, "learning_rate": 0.00029987168885974166, "loss": 0.1102, "step": 330 }, { "epoch": 0.0, "learning_rate": 0.00029986780064337017, "loss": 0.1102, "step": 340 }, { "epoch": 0.0, "learning_rate": 0.0002998639124269987, "loss": 0.1167, "step": 350 }, { "epoch": 0.0, "learning_rate": 0.00029986002421062726, "loss": 0.1074, "step": 360 }, { "epoch": 0.0, "learning_rate": 0.00029985613599425577, "loss": 0.1107, "step": 370 }, { "epoch": 0.0, "learning_rate": 0.00029985224777788434, "loss": 0.1021, "step": 380 }, { "epoch": 0.0, "learning_rate": 0.00029984835956151285, "loss": 0.1011, "step": 390 }, { "epoch": 0.0, "learning_rate": 0.0002998444713451414, "loss": 0.1051, "step": 400 }, { "epoch": 0.0, "learning_rate": 0.00029984058312876994, "loss": 0.0837, "step": 410 }, { "epoch": 0.0, "learning_rate": 0.00029983669491239845, "loss": 0.0925, "step": 420 }, { "epoch": 0.0, "learning_rate": 0.00029983280669602697, "loss": 0.1086, "step": 430 }, { "epoch": 0.0, "learning_rate": 0.00029982891847965553, "loss": 0.0881, "step": 440 }, { "epoch": 0.0, "learning_rate": 0.00029982503026328405, "loss": 0.0898, "step": 450 }, { "epoch": 0.0, "learning_rate": 0.0002998211420469126, "loss": 0.1033, "step": 460 }, { "epoch": 0.0, "learning_rate": 0.00029981725383054113, "loss": 0.1079, "step": 470 }, { "epoch": 0.0, "learning_rate": 0.0002998133656141697, "loss": 0.0976, "step": 480 }, { "epoch": 0.0, "learning_rate": 0.0002998094773977982, "loss": 0.1109, "step": 490 }, { "epoch": 0.0, "learning_rate": 0.00029980558918142673, "loss": 0.1082, "step": 500 }, { "epoch": 0.0, "learning_rate": 0.00029980170096505524, "loss": 0.1971, "step": 510 }, { "epoch": 0.0, "learning_rate": 0.0002997978127486838, "loss": 0.1078, "step": 520 }, { "epoch": 0.0, "learning_rate": 0.0002997939245323124, "loss": 0.0928, "step": 530 }, { "epoch": 0.0, "learning_rate": 0.0002997900363159409, "loss": 0.1055, "step": 540 }, { "epoch": 0.0, "learning_rate": 0.0002997861480995694, "loss": 0.1023, "step": 550 }, { "epoch": 0.0, "learning_rate": 0.0002997822598831979, "loss": 0.0934, "step": 560 }, { "epoch": 0.0, "learning_rate": 0.0002997783716668265, "loss": 0.1039, "step": 570 }, { "epoch": 0.0, "learning_rate": 0.000299774483450455, "loss": 0.087, "step": 580 }, { "epoch": 0.0, "learning_rate": 0.0002997705952340836, "loss": 0.0906, "step": 590 }, { "epoch": 0.0, "learning_rate": 0.0002997667070177121, "loss": 0.0846, "step": 600 }, { "epoch": 0.0, "learning_rate": 0.00029976281880134066, "loss": 0.0917, "step": 610 }, { "epoch": 0.0, "learning_rate": 0.0002997589305849692, "loss": 0.1092, "step": 620 }, { "epoch": 0.0, "learning_rate": 0.0002997550423685977, "loss": 0.1039, "step": 630 }, { "epoch": 0.0, "learning_rate": 0.0002997511541522262, "loss": 0.1769, "step": 640 }, { "epoch": 0.0, "learning_rate": 0.0002997472659358548, "loss": 0.1353, "step": 650 }, { "epoch": 0.0, "learning_rate": 0.0002997433777194833, "loss": 0.0978, "step": 660 }, { "epoch": 0.0, "learning_rate": 0.00029973948950311186, "loss": 0.1023, "step": 670 }, { "epoch": 0.0, "learning_rate": 0.00029973560128674037, "loss": 0.0935, "step": 680 }, { "epoch": 0.0, "learning_rate": 0.00029973171307036894, "loss": 0.1242, "step": 690 }, { "epoch": 0.0, "learning_rate": 0.00029972782485399745, "loss": 0.0939, "step": 700 }, { "epoch": 0.0, "learning_rate": 0.00029972393663762597, "loss": 0.095, "step": 710 }, { "epoch": 0.0, "learning_rate": 0.0002997200484212545, "loss": 0.095, "step": 720 }, { "epoch": 0.0, "learning_rate": 0.00029971616020488305, "loss": 0.0844, "step": 730 }, { "epoch": 0.0, "learning_rate": 0.0002997122719885116, "loss": 0.1014, "step": 740 }, { "epoch": 0.0, "learning_rate": 0.00029970838377214014, "loss": 0.0894, "step": 750 }, { "epoch": 0.0, "learning_rate": 0.00029970449555576865, "loss": 0.0934, "step": 760 }, { "epoch": 0.0, "learning_rate": 0.00029970060733939716, "loss": 0.1144, "step": 770 }, { "epoch": 0.0, "learning_rate": 0.00029969671912302573, "loss": 0.0885, "step": 780 }, { "epoch": 0.0, "learning_rate": 0.00029969283090665425, "loss": 0.0893, "step": 790 }, { "epoch": 0.0, "learning_rate": 0.0002996889426902828, "loss": 0.0883, "step": 800 }, { "epoch": 0.0, "learning_rate": 0.00029968505447391133, "loss": 0.083, "step": 810 }, { "epoch": 0.0, "learning_rate": 0.0002996811662575399, "loss": 0.0868, "step": 820 }, { "epoch": 0.0, "learning_rate": 0.0002996772780411684, "loss": 0.0977, "step": 830 }, { "epoch": 0.0, "learning_rate": 0.00029967338982479693, "loss": 0.0841, "step": 840 }, { "epoch": 0.0, "learning_rate": 0.00029966950160842544, "loss": 0.0846, "step": 850 }, { "epoch": 0.0, "learning_rate": 0.000299665613392054, "loss": 0.0754, "step": 860 }, { "epoch": 0.0, "learning_rate": 0.0002996617251756826, "loss": 0.0802, "step": 870 }, { "epoch": 0.0, "learning_rate": 0.0002996578369593111, "loss": 0.0986, "step": 880 }, { "epoch": 0.0, "learning_rate": 0.0002996539487429396, "loss": 0.0845, "step": 890 }, { "epoch": 0.0, "learning_rate": 0.0002996500605265682, "loss": 0.0767, "step": 900 }, { "epoch": 0.0, "learning_rate": 0.0002996461723101967, "loss": 0.0787, "step": 910 }, { "epoch": 0.0, "learning_rate": 0.0002996422840938252, "loss": 0.0861, "step": 920 }, { "epoch": 0.0, "learning_rate": 0.0002996383958774538, "loss": 0.086, "step": 930 }, { "epoch": 0.0, "learning_rate": 0.0002996345076610823, "loss": 0.0706, "step": 940 }, { "epoch": 0.0, "learning_rate": 0.00029963061944471086, "loss": 0.0881, "step": 950 }, { "epoch": 0.0, "learning_rate": 0.0002996267312283394, "loss": 0.0731, "step": 960 }, { "epoch": 0.0, "learning_rate": 0.0002996228430119679, "loss": 0.0821, "step": 970 }, { "epoch": 0.0, "learning_rate": 0.00029961895479559646, "loss": 0.0737, "step": 980 }, { "epoch": 0.0, "learning_rate": 0.00029961506657922497, "loss": 0.0892, "step": 990 }, { "epoch": 0.0, "learning_rate": 0.0002996111783628535, "loss": 0.0694, "step": 1000 }, { "epoch": 0.0, "eval_cer": 0.8818566463859275, "eval_loss": 0.06612774729728699, "eval_runtime": 107.9329, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 1000 }, { "epoch": 0.0, "learning_rate": 0.00029960729014648206, "loss": 0.0788, "step": 1010 }, { "epoch": 0.0, "learning_rate": 0.00029960340193011057, "loss": 0.0885, "step": 1020 }, { "epoch": 0.0, "learning_rate": 0.00029959951371373914, "loss": 0.094, "step": 1030 }, { "epoch": 0.0, "learning_rate": 0.00029959562549736765, "loss": 0.0913, "step": 1040 }, { "epoch": 0.0, "learning_rate": 0.00029959173728099617, "loss": 0.0892, "step": 1050 }, { "epoch": 0.0, "learning_rate": 0.0002995878490646247, "loss": 0.078, "step": 1060 }, { "epoch": 0.0, "learning_rate": 0.00029958396084825325, "loss": 0.0822, "step": 1070 }, { "epoch": 0.0, "learning_rate": 0.0002995800726318818, "loss": 0.0802, "step": 1080 }, { "epoch": 0.0, "learning_rate": 0.00029957618441551033, "loss": 0.0878, "step": 1090 }, { "epoch": 0.0, "learning_rate": 0.00029957229619913885, "loss": 0.0858, "step": 1100 }, { "epoch": 0.0, "learning_rate": 0.0002995684079827674, "loss": 0.0799, "step": 1110 }, { "epoch": 0.0, "learning_rate": 0.00029956451976639593, "loss": 0.0817, "step": 1120 }, { "epoch": 0.0, "learning_rate": 0.00029956063155002445, "loss": 0.0783, "step": 1130 }, { "epoch": 0.0, "learning_rate": 0.000299556743333653, "loss": 0.0846, "step": 1140 }, { "epoch": 0.0, "learning_rate": 0.00029955285511728153, "loss": 0.0719, "step": 1150 }, { "epoch": 0.0, "learning_rate": 0.0002995489669009101, "loss": 0.0744, "step": 1160 }, { "epoch": 0.0, "learning_rate": 0.0002995450786845386, "loss": 0.0723, "step": 1170 }, { "epoch": 0.0, "learning_rate": 0.00029954119046816713, "loss": 0.0738, "step": 1180 }, { "epoch": 0.0, "learning_rate": 0.0002995373022517957, "loss": 0.0719, "step": 1190 }, { "epoch": 0.0, "learning_rate": 0.0002995334140354242, "loss": 0.0693, "step": 1200 }, { "epoch": 0.0, "learning_rate": 0.0002995295258190527, "loss": 0.0873, "step": 1210 }, { "epoch": 0.0, "learning_rate": 0.0002995256376026813, "loss": 0.0718, "step": 1220 }, { "epoch": 0.0, "learning_rate": 0.00029952174938630986, "loss": 0.0786, "step": 1230 }, { "epoch": 0.0, "learning_rate": 0.0002995178611699384, "loss": 0.0907, "step": 1240 }, { "epoch": 0.0, "learning_rate": 0.0002995139729535669, "loss": 0.0682, "step": 1250 }, { "epoch": 0.0, "learning_rate": 0.0002995100847371954, "loss": 0.0745, "step": 1260 }, { "epoch": 0.0, "learning_rate": 0.000299506196520824, "loss": 0.076, "step": 1270 }, { "epoch": 0.0, "learning_rate": 0.0002995023083044525, "loss": 0.0741, "step": 1280 }, { "epoch": 0.0, "learning_rate": 0.00029949842008808106, "loss": 0.0667, "step": 1290 }, { "epoch": 0.0, "learning_rate": 0.0002994945318717096, "loss": 0.0749, "step": 1300 }, { "epoch": 0.0, "learning_rate": 0.0002994906436553381, "loss": 0.0662, "step": 1310 }, { "epoch": 0.0, "learning_rate": 0.00029948675543896666, "loss": 0.0797, "step": 1320 }, { "epoch": 0.0, "learning_rate": 0.00029948286722259517, "loss": 0.0678, "step": 1330 }, { "epoch": 0.0, "learning_rate": 0.0002994789790062237, "loss": 0.0727, "step": 1340 }, { "epoch": 0.0, "learning_rate": 0.00029947509078985225, "loss": 0.0707, "step": 1350 }, { "epoch": 0.0, "learning_rate": 0.00029947120257348077, "loss": 0.0772, "step": 1360 }, { "epoch": 0.0, "learning_rate": 0.00029946731435710934, "loss": 0.0816, "step": 1370 }, { "epoch": 0.0, "learning_rate": 0.00029946342614073785, "loss": 0.0686, "step": 1380 }, { "epoch": 0.0, "learning_rate": 0.00029945953792436637, "loss": 0.0735, "step": 1390 }, { "epoch": 0.0, "learning_rate": 0.00029945564970799494, "loss": 0.0699, "step": 1400 }, { "epoch": 0.0, "learning_rate": 0.00029945176149162345, "loss": 0.0721, "step": 1410 }, { "epoch": 0.0, "learning_rate": 0.000299447873275252, "loss": 0.0639, "step": 1420 }, { "epoch": 0.0, "learning_rate": 0.00029944398505888053, "loss": 0.0736, "step": 1430 }, { "epoch": 0.0, "learning_rate": 0.0002994400968425091, "loss": 0.0691, "step": 1440 }, { "epoch": 0.0, "learning_rate": 0.0002994362086261376, "loss": 0.0772, "step": 1450 }, { "epoch": 0.0, "learning_rate": 0.00029943232040976613, "loss": 0.078, "step": 1460 }, { "epoch": 0.0, "learning_rate": 0.00029942843219339465, "loss": 0.0773, "step": 1470 }, { "epoch": 0.0, "learning_rate": 0.0002994245439770232, "loss": 0.0689, "step": 1480 }, { "epoch": 0.0, "learning_rate": 0.00029942065576065173, "loss": 0.076, "step": 1490 }, { "epoch": 0.0, "learning_rate": 0.0002994167675442803, "loss": 0.0729, "step": 1500 }, { "epoch": 0.0, "learning_rate": 0.0002994128793279088, "loss": 0.072, "step": 1510 }, { "epoch": 0.0, "learning_rate": 0.0002994089911115373, "loss": 0.0747, "step": 1520 }, { "epoch": 0.0, "learning_rate": 0.0002994051028951659, "loss": 0.0733, "step": 1530 }, { "epoch": 0.0, "learning_rate": 0.0002994012146787944, "loss": 0.0746, "step": 1540 }, { "epoch": 0.0, "learning_rate": 0.0002993973264624229, "loss": 0.076, "step": 1550 }, { "epoch": 0.0, "learning_rate": 0.0002993934382460515, "loss": 0.0692, "step": 1560 }, { "epoch": 0.0, "learning_rate": 0.00029938955002968006, "loss": 0.0668, "step": 1570 }, { "epoch": 0.0, "learning_rate": 0.0002993856618133086, "loss": 0.0786, "step": 1580 }, { "epoch": 0.0, "learning_rate": 0.0002993817735969371, "loss": 0.0709, "step": 1590 }, { "epoch": 0.0, "learning_rate": 0.0002993778853805656, "loss": 0.0715, "step": 1600 }, { "epoch": 0.0, "learning_rate": 0.0002993739971641942, "loss": 0.081, "step": 1610 }, { "epoch": 0.0, "learning_rate": 0.0002993701089478227, "loss": 0.1191, "step": 1620 }, { "epoch": 0.0, "learning_rate": 0.00029936622073145126, "loss": 0.1162, "step": 1630 }, { "epoch": 0.0, "learning_rate": 0.00029936233251507977, "loss": 0.07, "step": 1640 }, { "epoch": 0.0, "learning_rate": 0.00029935844429870834, "loss": 0.0789, "step": 1650 }, { "epoch": 0.0, "learning_rate": 0.00029935455608233686, "loss": 0.0745, "step": 1660 }, { "epoch": 0.0, "learning_rate": 0.00029935066786596537, "loss": 0.0832, "step": 1670 }, { "epoch": 0.0, "learning_rate": 0.0002993467796495939, "loss": 0.0877, "step": 1680 }, { "epoch": 0.0, "learning_rate": 0.00029934289143322245, "loss": 0.0762, "step": 1690 }, { "epoch": 0.0, "learning_rate": 0.00029933900321685097, "loss": 0.0694, "step": 1700 }, { "epoch": 0.0, "learning_rate": 0.00029933511500047954, "loss": 0.0824, "step": 1710 }, { "epoch": 0.0, "learning_rate": 0.00029933122678410805, "loss": 0.0831, "step": 1720 }, { "epoch": 0.0, "learning_rate": 0.0002993273385677366, "loss": 0.0773, "step": 1730 }, { "epoch": 0.0, "learning_rate": 0.00029932345035136513, "loss": 0.0658, "step": 1740 }, { "epoch": 0.0, "learning_rate": 0.00029931956213499365, "loss": 0.0758, "step": 1750 }, { "epoch": 0.0, "learning_rate": 0.00029931567391862216, "loss": 0.0781, "step": 1760 }, { "epoch": 0.0, "learning_rate": 0.00029931178570225073, "loss": 0.0683, "step": 1770 }, { "epoch": 0.0, "learning_rate": 0.0002993078974858793, "loss": 0.075, "step": 1780 }, { "epoch": 0.0, "learning_rate": 0.0002993040092695078, "loss": 0.0753, "step": 1790 }, { "epoch": 0.0, "learning_rate": 0.00029930012105313633, "loss": 0.0709, "step": 1800 }, { "epoch": 0.0, "learning_rate": 0.00029929623283676484, "loss": 0.0658, "step": 1810 }, { "epoch": 0.0, "learning_rate": 0.0002992923446203934, "loss": 0.0714, "step": 1820 }, { "epoch": 0.0, "learning_rate": 0.00029928845640402193, "loss": 0.0787, "step": 1830 }, { "epoch": 0.0, "learning_rate": 0.0002992845681876505, "loss": 0.078, "step": 1840 }, { "epoch": 0.0, "learning_rate": 0.000299280679971279, "loss": 0.0707, "step": 1850 }, { "epoch": 0.0, "learning_rate": 0.0002992767917549076, "loss": 0.0677, "step": 1860 }, { "epoch": 0.0, "learning_rate": 0.0002992729035385361, "loss": 0.0664, "step": 1870 }, { "epoch": 0.0, "learning_rate": 0.0002992690153221646, "loss": 0.0704, "step": 1880 }, { "epoch": 0.0, "learning_rate": 0.0002992651271057931, "loss": 0.0717, "step": 1890 }, { "epoch": 0.0, "learning_rate": 0.0002992612388894217, "loss": 0.0689, "step": 1900 }, { "epoch": 0.0, "learning_rate": 0.0002992573506730502, "loss": 0.0565, "step": 1910 }, { "epoch": 0.0, "learning_rate": 0.0002992534624566788, "loss": 0.1213, "step": 1920 }, { "epoch": 0.01, "learning_rate": 0.0002992495742403073, "loss": 0.089, "step": 1930 }, { "epoch": 0.01, "learning_rate": 0.00029924568602393586, "loss": 0.0781, "step": 1940 }, { "epoch": 0.01, "learning_rate": 0.0002992417978075644, "loss": 0.0892, "step": 1950 }, { "epoch": 0.01, "learning_rate": 0.0002992379095911929, "loss": 0.0952, "step": 1960 }, { "epoch": 0.01, "learning_rate": 0.00029923402137482146, "loss": 0.1112, "step": 1970 }, { "epoch": 0.01, "learning_rate": 0.00029923013315844997, "loss": 0.0685, "step": 1980 }, { "epoch": 0.01, "learning_rate": 0.00029922624494207854, "loss": 0.0803, "step": 1990 }, { "epoch": 0.01, "learning_rate": 0.00029922235672570705, "loss": 0.0688, "step": 2000 }, { "epoch": 0.01, "eval_cer": 0.8818524474751249, "eval_loss": 0.05534271523356438, "eval_runtime": 107.227, "eval_samples_per_second": 18.652, "eval_steps_per_second": 4.663, "step": 2000 }, { "epoch": 0.01, "learning_rate": 0.00029921846850933557, "loss": 0.0748, "step": 2010 }, { "epoch": 0.01, "learning_rate": 0.0002992145802929641, "loss": 0.0765, "step": 2020 }, { "epoch": 0.01, "learning_rate": 0.00029921069207659265, "loss": 0.0679, "step": 2030 }, { "epoch": 0.01, "learning_rate": 0.00029920680386022117, "loss": 0.0698, "step": 2040 }, { "epoch": 0.01, "learning_rate": 0.00029920291564384974, "loss": 0.0723, "step": 2050 }, { "epoch": 0.01, "learning_rate": 0.00029919902742747825, "loss": 0.0768, "step": 2060 }, { "epoch": 0.01, "learning_rate": 0.0002991951392111068, "loss": 0.0664, "step": 2070 }, { "epoch": 0.01, "learning_rate": 0.00029919125099473533, "loss": 0.0647, "step": 2080 }, { "epoch": 0.01, "learning_rate": 0.00029918736277836385, "loss": 0.0678, "step": 2090 }, { "epoch": 0.01, "learning_rate": 0.00029918347456199236, "loss": 0.0812, "step": 2100 }, { "epoch": 0.01, "learning_rate": 0.00029917958634562093, "loss": 0.0666, "step": 2110 }, { "epoch": 0.01, "learning_rate": 0.0002991756981292495, "loss": 0.0857, "step": 2120 }, { "epoch": 0.01, "learning_rate": 0.000299171809912878, "loss": 0.0785, "step": 2130 }, { "epoch": 0.01, "learning_rate": 0.00029916792169650653, "loss": 0.0821, "step": 2140 }, { "epoch": 0.01, "learning_rate": 0.0002991640334801351, "loss": 0.0761, "step": 2150 }, { "epoch": 0.01, "learning_rate": 0.0002991601452637636, "loss": 0.0778, "step": 2160 }, { "epoch": 0.01, "learning_rate": 0.0002991562570473921, "loss": 0.0631, "step": 2170 }, { "epoch": 0.01, "learning_rate": 0.0002991523688310207, "loss": 0.069, "step": 2180 }, { "epoch": 0.01, "learning_rate": 0.0002991484806146492, "loss": 0.0718, "step": 2190 }, { "epoch": 0.01, "learning_rate": 0.0002991445923982778, "loss": 0.0633, "step": 2200 }, { "epoch": 0.01, "learning_rate": 0.0002991407041819063, "loss": 0.0653, "step": 2210 }, { "epoch": 0.01, "learning_rate": 0.0002991368159655348, "loss": 0.0659, "step": 2220 }, { "epoch": 0.01, "learning_rate": 0.0002991329277491634, "loss": 0.0608, "step": 2230 }, { "epoch": 0.01, "learning_rate": 0.0002991290395327919, "loss": 0.0725, "step": 2240 }, { "epoch": 0.01, "learning_rate": 0.0002991251513164204, "loss": 0.0751, "step": 2250 }, { "epoch": 0.01, "learning_rate": 0.000299121263100049, "loss": 0.0726, "step": 2260 }, { "epoch": 0.01, "learning_rate": 0.0002991173748836775, "loss": 0.0653, "step": 2270 }, { "epoch": 0.01, "learning_rate": 0.00029911348666730606, "loss": 0.0627, "step": 2280 }, { "epoch": 0.01, "learning_rate": 0.00029910959845093457, "loss": 0.0625, "step": 2290 }, { "epoch": 0.01, "learning_rate": 0.0002991057102345631, "loss": 0.0615, "step": 2300 }, { "epoch": 0.01, "learning_rate": 0.0002991018220181916, "loss": 0.0675, "step": 2310 }, { "epoch": 0.01, "learning_rate": 0.00029909793380182017, "loss": 0.0709, "step": 2320 }, { "epoch": 0.01, "learning_rate": 0.00029909404558544874, "loss": 0.0631, "step": 2330 }, { "epoch": 0.01, "learning_rate": 0.00029909015736907725, "loss": 0.0617, "step": 2340 }, { "epoch": 0.01, "learning_rate": 0.00029908626915270577, "loss": 0.0762, "step": 2350 }, { "epoch": 0.01, "learning_rate": 0.00029908238093633434, "loss": 0.0659, "step": 2360 }, { "epoch": 0.01, "learning_rate": 0.00029907849271996285, "loss": 0.0766, "step": 2370 }, { "epoch": 0.01, "learning_rate": 0.00029907460450359137, "loss": 0.0633, "step": 2380 }, { "epoch": 0.01, "learning_rate": 0.00029907071628721993, "loss": 0.0548, "step": 2390 }, { "epoch": 0.01, "learning_rate": 0.00029906682807084845, "loss": 0.0632, "step": 2400 }, { "epoch": 0.01, "learning_rate": 0.000299062939854477, "loss": 0.0565, "step": 2410 }, { "epoch": 0.01, "learning_rate": 0.00029905905163810553, "loss": 0.0635, "step": 2420 }, { "epoch": 0.01, "learning_rate": 0.00029905516342173405, "loss": 0.066, "step": 2430 }, { "epoch": 0.01, "learning_rate": 0.0002990512752053626, "loss": 0.064, "step": 2440 }, { "epoch": 0.01, "learning_rate": 0.00029904738698899113, "loss": 0.0639, "step": 2450 }, { "epoch": 0.01, "learning_rate": 0.0002990434987726197, "loss": 0.0619, "step": 2460 }, { "epoch": 0.01, "learning_rate": 0.0002990396105562482, "loss": 0.068, "step": 2470 }, { "epoch": 0.01, "learning_rate": 0.0002990357223398768, "loss": 0.0636, "step": 2480 }, { "epoch": 0.01, "learning_rate": 0.0002990318341235053, "loss": 0.0596, "step": 2490 }, { "epoch": 0.01, "learning_rate": 0.0002990279459071338, "loss": 0.0689, "step": 2500 }, { "epoch": 0.01, "learning_rate": 0.0002990240576907623, "loss": 0.0664, "step": 2510 }, { "epoch": 0.01, "learning_rate": 0.0002990201694743909, "loss": 0.0642, "step": 2520 }, { "epoch": 0.01, "learning_rate": 0.0002990162812580194, "loss": 0.0769, "step": 2530 }, { "epoch": 0.01, "learning_rate": 0.000299012393041648, "loss": 0.0666, "step": 2540 }, { "epoch": 0.01, "learning_rate": 0.0002990085048252765, "loss": 0.0638, "step": 2550 }, { "epoch": 0.01, "learning_rate": 0.000299004616608905, "loss": 0.0627, "step": 2560 }, { "epoch": 0.01, "learning_rate": 0.0002990007283925336, "loss": 0.0687, "step": 2570 }, { "epoch": 0.01, "learning_rate": 0.0002989968401761621, "loss": 0.0614, "step": 2580 }, { "epoch": 0.01, "learning_rate": 0.0002989929519597906, "loss": 0.0713, "step": 2590 }, { "epoch": 0.01, "learning_rate": 0.0002989890637434192, "loss": 0.0697, "step": 2600 }, { "epoch": 0.01, "learning_rate": 0.00029898517552704774, "loss": 0.067, "step": 2610 }, { "epoch": 0.01, "learning_rate": 0.00029898128731067626, "loss": 0.0678, "step": 2620 }, { "epoch": 0.01, "learning_rate": 0.00029897739909430477, "loss": 0.0588, "step": 2630 }, { "epoch": 0.01, "learning_rate": 0.0002989735108779333, "loss": 0.0673, "step": 2640 }, { "epoch": 0.01, "learning_rate": 0.00029896962266156185, "loss": 0.0685, "step": 2650 }, { "epoch": 0.01, "learning_rate": 0.00029896573444519037, "loss": 0.0745, "step": 2660 }, { "epoch": 0.01, "learning_rate": 0.00029896184622881894, "loss": 0.0798, "step": 2670 }, { "epoch": 0.01, "learning_rate": 0.00029895795801244745, "loss": 0.0744, "step": 2680 }, { "epoch": 0.01, "learning_rate": 0.000298954069796076, "loss": 0.0809, "step": 2690 }, { "epoch": 0.01, "learning_rate": 0.00029895018157970454, "loss": 0.0668, "step": 2700 }, { "epoch": 0.01, "learning_rate": 0.00029894629336333305, "loss": 0.0775, "step": 2710 }, { "epoch": 0.01, "learning_rate": 0.00029894240514696156, "loss": 0.0732, "step": 2720 }, { "epoch": 0.01, "learning_rate": 0.00029893851693059013, "loss": 0.0708, "step": 2730 }, { "epoch": 0.01, "learning_rate": 0.00029893462871421865, "loss": 0.0628, "step": 2740 }, { "epoch": 0.01, "learning_rate": 0.0002989307404978472, "loss": 0.0631, "step": 2750 }, { "epoch": 0.01, "learning_rate": 0.00029892685228147573, "loss": 0.095, "step": 2760 }, { "epoch": 0.01, "learning_rate": 0.00029892296406510425, "loss": 0.0681, "step": 2770 }, { "epoch": 0.01, "learning_rate": 0.0002989190758487328, "loss": 0.0627, "step": 2780 }, { "epoch": 0.01, "learning_rate": 0.00029891518763236133, "loss": 0.0694, "step": 2790 }, { "epoch": 0.01, "learning_rate": 0.00029891129941598984, "loss": 0.0673, "step": 2800 }, { "epoch": 0.01, "learning_rate": 0.0002989074111996184, "loss": 0.0654, "step": 2810 }, { "epoch": 0.01, "learning_rate": 0.000298903522983247, "loss": 0.0688, "step": 2820 }, { "epoch": 0.01, "learning_rate": 0.0002988996347668755, "loss": 0.0673, "step": 2830 }, { "epoch": 0.01, "learning_rate": 0.000298895746550504, "loss": 0.0678, "step": 2840 }, { "epoch": 0.01, "learning_rate": 0.0002988918583341325, "loss": 0.0686, "step": 2850 }, { "epoch": 0.01, "learning_rate": 0.0002988879701177611, "loss": 0.0708, "step": 2860 }, { "epoch": 0.01, "learning_rate": 0.0002988840819013896, "loss": 0.0866, "step": 2870 }, { "epoch": 0.01, "learning_rate": 0.0002988801936850182, "loss": 0.0746, "step": 2880 }, { "epoch": 0.01, "learning_rate": 0.0002988763054686467, "loss": 0.0657, "step": 2890 }, { "epoch": 0.01, "learning_rate": 0.00029887241725227526, "loss": 0.0715, "step": 2900 }, { "epoch": 0.01, "learning_rate": 0.0002988685290359038, "loss": 0.0641, "step": 2910 }, { "epoch": 0.01, "learning_rate": 0.0002988646408195323, "loss": 0.07, "step": 2920 }, { "epoch": 0.01, "learning_rate": 0.0002988607526031608, "loss": 0.0689, "step": 2930 }, { "epoch": 0.01, "learning_rate": 0.00029885686438678937, "loss": 0.0578, "step": 2940 }, { "epoch": 0.01, "learning_rate": 0.0002988529761704179, "loss": 0.0586, "step": 2950 }, { "epoch": 0.01, "learning_rate": 0.00029884908795404646, "loss": 0.0629, "step": 2960 }, { "epoch": 0.01, "learning_rate": 0.00029884519973767497, "loss": 0.0664, "step": 2970 }, { "epoch": 0.01, "learning_rate": 0.0002988413115213035, "loss": 0.0581, "step": 2980 }, { "epoch": 0.01, "learning_rate": 0.00029883742330493205, "loss": 0.1604, "step": 2990 }, { "epoch": 0.01, "learning_rate": 0.00029883353508856057, "loss": 0.1397, "step": 3000 }, { "epoch": 0.01, "eval_cer": 0.8836117911013883, "eval_loss": 0.06463418900966644, "eval_runtime": 107.8405, "eval_samples_per_second": 18.546, "eval_steps_per_second": 4.636, "step": 3000 }, { "epoch": 0.01, "learning_rate": 0.00029882964687218914, "loss": 0.0778, "step": 3010 }, { "epoch": 0.01, "learning_rate": 0.00029882575865581765, "loss": 0.0669, "step": 3020 }, { "epoch": 0.01, "learning_rate": 0.0002988218704394462, "loss": 0.0723, "step": 3030 }, { "epoch": 0.01, "learning_rate": 0.00029881798222307473, "loss": 0.0695, "step": 3040 }, { "epoch": 0.01, "learning_rate": 0.00029881409400670325, "loss": 0.0611, "step": 3050 }, { "epoch": 0.01, "learning_rate": 0.00029881020579033176, "loss": 0.0761, "step": 3060 }, { "epoch": 0.01, "learning_rate": 0.00029880631757396033, "loss": 0.0636, "step": 3070 }, { "epoch": 0.01, "learning_rate": 0.00029880242935758885, "loss": 0.0658, "step": 3080 }, { "epoch": 0.01, "learning_rate": 0.0002987985411412174, "loss": 0.0685, "step": 3090 }, { "epoch": 0.01, "learning_rate": 0.00029879465292484593, "loss": 0.081, "step": 3100 }, { "epoch": 0.01, "learning_rate": 0.0002987907647084745, "loss": 0.0649, "step": 3110 }, { "epoch": 0.01, "learning_rate": 0.000298786876492103, "loss": 0.0634, "step": 3120 }, { "epoch": 0.01, "learning_rate": 0.00029878298827573153, "loss": 0.0747, "step": 3130 }, { "epoch": 0.01, "learning_rate": 0.00029877910005936004, "loss": 0.0699, "step": 3140 }, { "epoch": 0.01, "learning_rate": 0.0002987752118429886, "loss": 0.0661, "step": 3150 }, { "epoch": 0.01, "learning_rate": 0.0002987713236266172, "loss": 0.0721, "step": 3160 }, { "epoch": 0.01, "learning_rate": 0.0002987674354102457, "loss": 0.0964, "step": 3170 }, { "epoch": 0.01, "learning_rate": 0.0002987635471938742, "loss": 0.0708, "step": 3180 }, { "epoch": 0.01, "learning_rate": 0.0002987596589775028, "loss": 0.0742, "step": 3190 }, { "epoch": 0.01, "learning_rate": 0.0002987557707611313, "loss": 0.0671, "step": 3200 }, { "epoch": 0.01, "learning_rate": 0.0002987518825447598, "loss": 0.066, "step": 3210 }, { "epoch": 0.01, "learning_rate": 0.0002987479943283884, "loss": 0.0803, "step": 3220 }, { "epoch": 0.01, "learning_rate": 0.0002987441061120169, "loss": 0.0708, "step": 3230 }, { "epoch": 0.01, "learning_rate": 0.00029874021789564546, "loss": 0.052, "step": 3240 }, { "epoch": 0.01, "learning_rate": 0.000298736329679274, "loss": 0.0742, "step": 3250 }, { "epoch": 0.01, "learning_rate": 0.0002987324414629025, "loss": 0.0673, "step": 3260 }, { "epoch": 0.01, "learning_rate": 0.000298728553246531, "loss": 0.0646, "step": 3270 }, { "epoch": 0.01, "learning_rate": 0.00029872466503015957, "loss": 0.0643, "step": 3280 }, { "epoch": 0.01, "learning_rate": 0.0002987207768137881, "loss": 0.0731, "step": 3290 }, { "epoch": 0.01, "learning_rate": 0.00029871688859741665, "loss": 0.0835, "step": 3300 }, { "epoch": 0.01, "learning_rate": 0.00029871300038104517, "loss": 0.0708, "step": 3310 }, { "epoch": 0.01, "learning_rate": 0.00029870911216467374, "loss": 0.0607, "step": 3320 }, { "epoch": 0.01, "learning_rate": 0.00029870522394830225, "loss": 0.0564, "step": 3330 }, { "epoch": 0.01, "learning_rate": 0.00029870133573193077, "loss": 0.0643, "step": 3340 }, { "epoch": 0.01, "learning_rate": 0.0002986974475155593, "loss": 0.0694, "step": 3350 }, { "epoch": 0.01, "learning_rate": 0.00029869355929918785, "loss": 0.0565, "step": 3360 }, { "epoch": 0.01, "learning_rate": 0.0002986896710828164, "loss": 0.0655, "step": 3370 }, { "epoch": 0.01, "learning_rate": 0.00029868578286644493, "loss": 0.0634, "step": 3380 }, { "epoch": 0.01, "learning_rate": 0.00029868189465007345, "loss": 0.0642, "step": 3390 }, { "epoch": 0.01, "learning_rate": 0.000298678006433702, "loss": 0.0587, "step": 3400 }, { "epoch": 0.01, "learning_rate": 0.00029867411821733053, "loss": 0.0557, "step": 3410 }, { "epoch": 0.01, "learning_rate": 0.00029867023000095905, "loss": 0.0587, "step": 3420 }, { "epoch": 0.01, "learning_rate": 0.0002986663417845876, "loss": 0.0583, "step": 3430 }, { "epoch": 0.01, "learning_rate": 0.00029866245356821613, "loss": 0.0552, "step": 3440 }, { "epoch": 0.01, "learning_rate": 0.0002986585653518447, "loss": 0.063, "step": 3450 }, { "epoch": 0.01, "learning_rate": 0.0002986546771354732, "loss": 0.0531, "step": 3460 }, { "epoch": 0.01, "learning_rate": 0.0002986507889191017, "loss": 0.0575, "step": 3470 }, { "epoch": 0.01, "learning_rate": 0.00029864690070273024, "loss": 0.0635, "step": 3480 }, { "epoch": 0.01, "learning_rate": 0.0002986430124863588, "loss": 0.0619, "step": 3490 }, { "epoch": 0.01, "learning_rate": 0.0002986391242699873, "loss": 0.0759, "step": 3500 }, { "epoch": 0.01, "learning_rate": 0.0002986352360536159, "loss": 0.0633, "step": 3510 }, { "epoch": 0.01, "learning_rate": 0.0002986313478372444, "loss": 0.0698, "step": 3520 }, { "epoch": 0.01, "learning_rate": 0.000298627459620873, "loss": 0.0604, "step": 3530 }, { "epoch": 0.01, "learning_rate": 0.0002986235714045015, "loss": 0.0583, "step": 3540 }, { "epoch": 0.01, "learning_rate": 0.00029861968318813, "loss": 0.0602, "step": 3550 }, { "epoch": 0.01, "learning_rate": 0.0002986157949717586, "loss": 0.0535, "step": 3560 }, { "epoch": 0.01, "learning_rate": 0.0002986119067553871, "loss": 0.0602, "step": 3570 }, { "epoch": 0.01, "learning_rate": 0.00029860801853901566, "loss": 0.0705, "step": 3580 }, { "epoch": 0.01, "learning_rate": 0.00029860413032264417, "loss": 0.063, "step": 3590 }, { "epoch": 0.01, "learning_rate": 0.0002986002421062727, "loss": 0.0599, "step": 3600 }, { "epoch": 0.01, "learning_rate": 0.00029859635388990126, "loss": 0.0827, "step": 3610 }, { "epoch": 0.01, "learning_rate": 0.00029859246567352977, "loss": 0.0624, "step": 3620 }, { "epoch": 0.01, "learning_rate": 0.0002985885774571583, "loss": 0.0782, "step": 3630 }, { "epoch": 0.01, "learning_rate": 0.00029858468924078685, "loss": 0.0619, "step": 3640 }, { "epoch": 0.01, "learning_rate": 0.0002985808010244154, "loss": 0.0616, "step": 3650 }, { "epoch": 0.01, "learning_rate": 0.00029857691280804394, "loss": 0.0596, "step": 3660 }, { "epoch": 0.01, "learning_rate": 0.00029857302459167245, "loss": 0.0691, "step": 3670 }, { "epoch": 0.01, "learning_rate": 0.00029856913637530097, "loss": 0.0569, "step": 3680 }, { "epoch": 0.01, "learning_rate": 0.00029856524815892953, "loss": 0.0574, "step": 3690 }, { "epoch": 0.01, "learning_rate": 0.00029856135994255805, "loss": 0.0601, "step": 3700 }, { "epoch": 0.01, "learning_rate": 0.0002985574717261866, "loss": 0.0571, "step": 3710 }, { "epoch": 0.01, "learning_rate": 0.00029855358350981513, "loss": 0.0541, "step": 3720 }, { "epoch": 0.01, "learning_rate": 0.00029854969529344365, "loss": 0.0568, "step": 3730 }, { "epoch": 0.01, "learning_rate": 0.0002985458070770722, "loss": 0.0597, "step": 3740 }, { "epoch": 0.01, "learning_rate": 0.00029854191886070073, "loss": 0.0655, "step": 3750 }, { "epoch": 0.01, "learning_rate": 0.00029853803064432924, "loss": 0.0588, "step": 3760 }, { "epoch": 0.01, "learning_rate": 0.0002985341424279578, "loss": 0.0641, "step": 3770 }, { "epoch": 0.01, "learning_rate": 0.00029853025421158633, "loss": 0.068, "step": 3780 }, { "epoch": 0.01, "learning_rate": 0.0002985263659952149, "loss": 0.0597, "step": 3790 }, { "epoch": 0.01, "learning_rate": 0.0002985224777788434, "loss": 0.0619, "step": 3800 }, { "epoch": 0.01, "learning_rate": 0.0002985185895624719, "loss": 0.0554, "step": 3810 }, { "epoch": 0.01, "learning_rate": 0.0002985147013461005, "loss": 0.052, "step": 3820 }, { "epoch": 0.01, "learning_rate": 0.000298510813129729, "loss": 0.0584, "step": 3830 }, { "epoch": 0.01, "learning_rate": 0.0002985069249133575, "loss": 0.056, "step": 3840 }, { "epoch": 0.01, "learning_rate": 0.0002985030366969861, "loss": 0.0499, "step": 3850 }, { "epoch": 0.01, "learning_rate": 0.00029849914848061466, "loss": 0.0667, "step": 3860 }, { "epoch": 0.01, "learning_rate": 0.0002984952602642432, "loss": 0.053, "step": 3870 }, { "epoch": 0.01, "learning_rate": 0.0002984913720478717, "loss": 0.0802, "step": 3880 }, { "epoch": 0.01, "learning_rate": 0.0002984874838315002, "loss": 0.0703, "step": 3890 }, { "epoch": 0.01, "learning_rate": 0.0002984835956151288, "loss": 0.0608, "step": 3900 }, { "epoch": 0.01, "learning_rate": 0.0002984797073987573, "loss": 0.0551, "step": 3910 }, { "epoch": 0.01, "learning_rate": 0.00029847581918238586, "loss": 0.0563, "step": 3920 }, { "epoch": 0.01, "learning_rate": 0.00029847193096601437, "loss": 0.0546, "step": 3930 }, { "epoch": 0.01, "learning_rate": 0.00029846804274964294, "loss": 0.0533, "step": 3940 }, { "epoch": 0.01, "learning_rate": 0.00029846415453327145, "loss": 0.0598, "step": 3950 }, { "epoch": 0.01, "learning_rate": 0.00029846026631689997, "loss": 0.0662, "step": 3960 }, { "epoch": 0.01, "learning_rate": 0.0002984563781005285, "loss": 0.0501, "step": 3970 }, { "epoch": 0.01, "learning_rate": 0.00029845248988415705, "loss": 0.0574, "step": 3980 }, { "epoch": 0.01, "learning_rate": 0.00029844860166778557, "loss": 0.058, "step": 3990 }, { "epoch": 0.01, "learning_rate": 0.00029844471345141414, "loss": 0.0488, "step": 4000 }, { "epoch": 0.01, "eval_cer": 0.8818566463859275, "eval_loss": 0.04614216089248657, "eval_runtime": 108.2516, "eval_samples_per_second": 18.475, "eval_steps_per_second": 4.619, "step": 4000 }, { "epoch": 0.01, "learning_rate": 0.00029844082523504265, "loss": 0.0674, "step": 4010 }, { "epoch": 0.01, "learning_rate": 0.00029843693701867116, "loss": 0.0578, "step": 4020 }, { "epoch": 0.01, "learning_rate": 0.00029843304880229973, "loss": 0.0618, "step": 4030 }, { "epoch": 0.01, "learning_rate": 0.00029842916058592825, "loss": 0.0501, "step": 4040 }, { "epoch": 0.01, "learning_rate": 0.0002984252723695568, "loss": 0.0549, "step": 4050 }, { "epoch": 0.01, "learning_rate": 0.00029842138415318533, "loss": 0.0528, "step": 4060 }, { "epoch": 0.01, "learning_rate": 0.0002984174959368139, "loss": 0.0546, "step": 4070 }, { "epoch": 0.01, "learning_rate": 0.0002984136077204424, "loss": 0.062, "step": 4080 }, { "epoch": 0.01, "learning_rate": 0.00029840971950407093, "loss": 0.0536, "step": 4090 }, { "epoch": 0.01, "learning_rate": 0.00029840583128769944, "loss": 0.0546, "step": 4100 }, { "epoch": 0.01, "learning_rate": 0.000298401943071328, "loss": 0.0492, "step": 4110 }, { "epoch": 0.01, "learning_rate": 0.0002983980548549565, "loss": 0.0491, "step": 4120 }, { "epoch": 0.01, "learning_rate": 0.0002983941666385851, "loss": 0.0528, "step": 4130 }, { "epoch": 0.01, "learning_rate": 0.0002983902784222136, "loss": 0.059, "step": 4140 }, { "epoch": 0.01, "learning_rate": 0.0002983863902058422, "loss": 0.0551, "step": 4150 }, { "epoch": 0.01, "learning_rate": 0.0002983825019894707, "loss": 0.0738, "step": 4160 }, { "epoch": 0.01, "learning_rate": 0.0002983786137730992, "loss": 0.0697, "step": 4170 }, { "epoch": 0.01, "learning_rate": 0.0002983747255567277, "loss": 0.0554, "step": 4180 }, { "epoch": 0.01, "learning_rate": 0.0002983708373403563, "loss": 0.0623, "step": 4190 }, { "epoch": 0.01, "learning_rate": 0.00029836694912398486, "loss": 0.0579, "step": 4200 }, { "epoch": 0.01, "learning_rate": 0.0002983630609076134, "loss": 0.0583, "step": 4210 }, { "epoch": 0.01, "learning_rate": 0.0002983591726912419, "loss": 0.058, "step": 4220 }, { "epoch": 0.01, "learning_rate": 0.0002983552844748704, "loss": 0.0461, "step": 4230 }, { "epoch": 0.01, "learning_rate": 0.00029835139625849897, "loss": 0.0552, "step": 4240 }, { "epoch": 0.01, "learning_rate": 0.0002983475080421275, "loss": 0.0575, "step": 4250 }, { "epoch": 0.01, "learning_rate": 0.00029834361982575606, "loss": 0.0514, "step": 4260 }, { "epoch": 0.01, "learning_rate": 0.00029833973160938457, "loss": 0.0558, "step": 4270 }, { "epoch": 0.01, "learning_rate": 0.00029833584339301314, "loss": 0.0576, "step": 4280 }, { "epoch": 0.01, "learning_rate": 0.00029833195517664165, "loss": 0.0573, "step": 4290 }, { "epoch": 0.01, "learning_rate": 0.00029832806696027017, "loss": 0.0564, "step": 4300 }, { "epoch": 0.01, "learning_rate": 0.0002983241787438987, "loss": 0.0581, "step": 4310 }, { "epoch": 0.01, "learning_rate": 0.00029832029052752725, "loss": 0.0578, "step": 4320 }, { "epoch": 0.01, "learning_rate": 0.00029831640231115577, "loss": 0.0556, "step": 4330 }, { "epoch": 0.01, "learning_rate": 0.00029831251409478433, "loss": 0.0532, "step": 4340 }, { "epoch": 0.01, "learning_rate": 0.00029830862587841285, "loss": 0.0515, "step": 4350 }, { "epoch": 0.01, "learning_rate": 0.0002983047376620414, "loss": 0.0657, "step": 4360 }, { "epoch": 0.01, "learning_rate": 0.00029830084944566993, "loss": 0.0505, "step": 4370 }, { "epoch": 0.01, "learning_rate": 0.00029829696122929845, "loss": 0.0577, "step": 4380 }, { "epoch": 0.01, "learning_rate": 0.00029829307301292696, "loss": 0.0532, "step": 4390 }, { "epoch": 0.01, "learning_rate": 0.00029828918479655553, "loss": 0.0619, "step": 4400 }, { "epoch": 0.01, "learning_rate": 0.0002982852965801841, "loss": 0.0569, "step": 4410 }, { "epoch": 0.01, "learning_rate": 0.0002982814083638126, "loss": 0.0599, "step": 4420 }, { "epoch": 0.01, "learning_rate": 0.00029827752014744113, "loss": 0.0542, "step": 4430 }, { "epoch": 0.01, "learning_rate": 0.0002982736319310697, "loss": 0.0615, "step": 4440 }, { "epoch": 0.01, "learning_rate": 0.0002982697437146982, "loss": 0.057, "step": 4450 }, { "epoch": 0.01, "learning_rate": 0.0002982658554983267, "loss": 0.0589, "step": 4460 }, { "epoch": 0.01, "learning_rate": 0.0002982619672819553, "loss": 0.0551, "step": 4470 }, { "epoch": 0.01, "learning_rate": 0.0002982580790655838, "loss": 0.061, "step": 4480 }, { "epoch": 0.01, "learning_rate": 0.0002982541908492124, "loss": 0.052, "step": 4490 }, { "epoch": 0.01, "learning_rate": 0.0002982503026328409, "loss": 0.0536, "step": 4500 }, { "epoch": 0.01, "learning_rate": 0.0002982464144164694, "loss": 0.0537, "step": 4510 }, { "epoch": 0.01, "learning_rate": 0.0002982425262000979, "loss": 0.0709, "step": 4520 }, { "epoch": 0.01, "learning_rate": 0.0002982386379837265, "loss": 0.0524, "step": 4530 }, { "epoch": 0.01, "learning_rate": 0.000298234749767355, "loss": 0.0562, "step": 4540 }, { "epoch": 0.01, "learning_rate": 0.00029823086155098357, "loss": 0.061, "step": 4550 }, { "epoch": 0.01, "learning_rate": 0.0002982269733346121, "loss": 0.0584, "step": 4560 }, { "epoch": 0.01, "learning_rate": 0.00029822308511824066, "loss": 0.0648, "step": 4570 }, { "epoch": 0.01, "learning_rate": 0.00029821919690186917, "loss": 0.0624, "step": 4580 }, { "epoch": 0.01, "learning_rate": 0.0002982153086854977, "loss": 0.0833, "step": 4590 }, { "epoch": 0.01, "learning_rate": 0.00029821142046912625, "loss": 0.0506, "step": 4600 }, { "epoch": 0.01, "learning_rate": 0.00029820753225275477, "loss": 0.0602, "step": 4610 }, { "epoch": 0.01, "learning_rate": 0.00029820364403638334, "loss": 0.0497, "step": 4620 }, { "epoch": 0.01, "learning_rate": 0.00029819975582001185, "loss": 0.0742, "step": 4630 }, { "epoch": 0.01, "learning_rate": 0.00029819586760364037, "loss": 0.0569, "step": 4640 }, { "epoch": 0.01, "learning_rate": 0.00029819197938726894, "loss": 0.0489, "step": 4650 }, { "epoch": 0.01, "learning_rate": 0.00029818809117089745, "loss": 0.0821, "step": 4660 }, { "epoch": 0.01, "learning_rate": 0.00029818420295452596, "loss": 0.0609, "step": 4670 }, { "epoch": 0.01, "learning_rate": 0.00029818031473815453, "loss": 0.0532, "step": 4680 }, { "epoch": 0.01, "learning_rate": 0.00029817642652178305, "loss": 0.0577, "step": 4690 }, { "epoch": 0.01, "learning_rate": 0.0002981725383054116, "loss": 0.0579, "step": 4700 }, { "epoch": 0.01, "learning_rate": 0.00029816865008904013, "loss": 0.0674, "step": 4710 }, { "epoch": 0.01, "learning_rate": 0.00029816476187266865, "loss": 0.0576, "step": 4720 }, { "epoch": 0.01, "learning_rate": 0.00029816087365629716, "loss": 0.0607, "step": 4730 }, { "epoch": 0.01, "learning_rate": 0.00029815698543992573, "loss": 0.0517, "step": 4740 }, { "epoch": 0.01, "learning_rate": 0.0002981530972235543, "loss": 0.0606, "step": 4750 }, { "epoch": 0.01, "learning_rate": 0.0002981492090071828, "loss": 0.0658, "step": 4760 }, { "epoch": 0.01, "learning_rate": 0.0002981453207908113, "loss": 0.0594, "step": 4770 }, { "epoch": 0.01, "learning_rate": 0.0002981414325744399, "loss": 0.0844, "step": 4780 }, { "epoch": 0.01, "learning_rate": 0.0002981375443580684, "loss": 0.0531, "step": 4790 }, { "epoch": 0.01, "learning_rate": 0.0002981336561416969, "loss": 0.0609, "step": 4800 }, { "epoch": 0.01, "learning_rate": 0.0002981297679253255, "loss": 0.0573, "step": 4810 }, { "epoch": 0.01, "learning_rate": 0.000298125879708954, "loss": 0.0534, "step": 4820 }, { "epoch": 0.01, "learning_rate": 0.0002981219914925826, "loss": 0.0508, "step": 4830 }, { "epoch": 0.01, "learning_rate": 0.0002981181032762111, "loss": 0.0756, "step": 4840 }, { "epoch": 0.01, "learning_rate": 0.0002981142150598396, "loss": 0.0727, "step": 4850 }, { "epoch": 0.01, "learning_rate": 0.0002981103268434682, "loss": 0.0594, "step": 4860 }, { "epoch": 0.01, "learning_rate": 0.0002981064386270967, "loss": 0.0571, "step": 4870 }, { "epoch": 0.01, "learning_rate": 0.0002981025504107252, "loss": 0.0594, "step": 4880 }, { "epoch": 0.01, "learning_rate": 0.00029809866219435377, "loss": 0.0587, "step": 4890 }, { "epoch": 0.01, "learning_rate": 0.00029809477397798234, "loss": 0.0628, "step": 4900 }, { "epoch": 0.01, "learning_rate": 0.00029809088576161085, "loss": 0.0529, "step": 4910 }, { "epoch": 0.01, "learning_rate": 0.00029808699754523937, "loss": 0.0587, "step": 4920 }, { "epoch": 0.01, "learning_rate": 0.0002980831093288679, "loss": 0.0587, "step": 4930 }, { "epoch": 0.01, "learning_rate": 0.00029807922111249645, "loss": 0.0533, "step": 4940 }, { "epoch": 0.01, "learning_rate": 0.00029807533289612497, "loss": 0.061, "step": 4950 }, { "epoch": 0.01, "learning_rate": 0.00029807144467975354, "loss": 0.057, "step": 4960 }, { "epoch": 0.01, "learning_rate": 0.00029806755646338205, "loss": 0.0561, "step": 4970 }, { "epoch": 0.01, "learning_rate": 0.00029806366824701057, "loss": 0.0564, "step": 4980 }, { "epoch": 0.01, "learning_rate": 0.00029805978003063913, "loss": 0.0618, "step": 4990 }, { "epoch": 0.01, "learning_rate": 0.00029805589181426765, "loss": 0.0533, "step": 5000 }, { "epoch": 0.01, "eval_cer": 0.8818384511057832, "eval_loss": 0.04352134093642235, "eval_runtime": 107.4217, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.655, "step": 5000 }, { "epoch": 0.01, "learning_rate": 0.00029805200359789616, "loss": 0.0524, "step": 5010 }, { "epoch": 0.01, "learning_rate": 0.00029804811538152473, "loss": 0.0565, "step": 5020 }, { "epoch": 0.01, "learning_rate": 0.00029804422716515325, "loss": 0.0635, "step": 5030 }, { "epoch": 0.01, "learning_rate": 0.0002980403389487818, "loss": 0.0633, "step": 5040 }, { "epoch": 0.01, "learning_rate": 0.00029803645073241033, "loss": 0.0577, "step": 5050 }, { "epoch": 0.01, "learning_rate": 0.00029803256251603884, "loss": 0.051, "step": 5060 }, { "epoch": 0.01, "learning_rate": 0.0002980286742996674, "loss": 0.064, "step": 5070 }, { "epoch": 0.01, "learning_rate": 0.00029802478608329593, "loss": 0.0575, "step": 5080 }, { "epoch": 0.01, "learning_rate": 0.00029802089786692444, "loss": 0.0524, "step": 5090 }, { "epoch": 0.01, "learning_rate": 0.000298017009650553, "loss": 0.0593, "step": 5100 }, { "epoch": 0.01, "learning_rate": 0.0002980131214341816, "loss": 0.0563, "step": 5110 }, { "epoch": 0.01, "learning_rate": 0.0002980092332178101, "loss": 0.062, "step": 5120 }, { "epoch": 0.01, "learning_rate": 0.0002980053450014386, "loss": 0.0695, "step": 5130 }, { "epoch": 0.01, "learning_rate": 0.0002980014567850671, "loss": 0.0664, "step": 5140 }, { "epoch": 0.01, "learning_rate": 0.0002979975685686957, "loss": 0.0559, "step": 5150 }, { "epoch": 0.01, "learning_rate": 0.0002979936803523242, "loss": 0.0502, "step": 5160 }, { "epoch": 0.01, "learning_rate": 0.0002979897921359528, "loss": 0.0537, "step": 5170 }, { "epoch": 0.01, "learning_rate": 0.0002979859039195813, "loss": 0.0484, "step": 5180 }, { "epoch": 0.01, "learning_rate": 0.00029798201570320986, "loss": 0.0484, "step": 5190 }, { "epoch": 0.01, "learning_rate": 0.00029797812748683837, "loss": 0.0562, "step": 5200 }, { "epoch": 0.01, "learning_rate": 0.0002979742392704669, "loss": 0.0541, "step": 5210 }, { "epoch": 0.01, "learning_rate": 0.0002979703510540954, "loss": 0.0673, "step": 5220 }, { "epoch": 0.01, "learning_rate": 0.00029796646283772397, "loss": 0.0536, "step": 5230 }, { "epoch": 0.01, "learning_rate": 0.00029796257462135254, "loss": 0.0556, "step": 5240 }, { "epoch": 0.01, "learning_rate": 0.00029795868640498105, "loss": 0.0469, "step": 5250 }, { "epoch": 0.01, "learning_rate": 0.00029795479818860957, "loss": 0.0601, "step": 5260 }, { "epoch": 0.01, "learning_rate": 0.0002979509099722381, "loss": 0.0537, "step": 5270 }, { "epoch": 0.01, "learning_rate": 0.00029794702175586665, "loss": 0.0569, "step": 5280 }, { "epoch": 0.01, "learning_rate": 0.00029794313353949517, "loss": 0.0462, "step": 5290 }, { "epoch": 0.01, "learning_rate": 0.00029793924532312373, "loss": 0.0461, "step": 5300 }, { "epoch": 0.01, "learning_rate": 0.00029793535710675225, "loss": 0.0489, "step": 5310 }, { "epoch": 0.01, "learning_rate": 0.0002979314688903808, "loss": 0.0535, "step": 5320 }, { "epoch": 0.01, "learning_rate": 0.00029792758067400933, "loss": 0.0546, "step": 5330 }, { "epoch": 0.01, "learning_rate": 0.00029792369245763785, "loss": 0.058, "step": 5340 }, { "epoch": 0.01, "learning_rate": 0.00029791980424126636, "loss": 0.0555, "step": 5350 }, { "epoch": 0.01, "learning_rate": 0.00029791591602489493, "loss": 0.0479, "step": 5360 }, { "epoch": 0.01, "learning_rate": 0.00029791202780852345, "loss": 0.0584, "step": 5370 }, { "epoch": 0.01, "learning_rate": 0.000297908139592152, "loss": 0.0514, "step": 5380 }, { "epoch": 0.01, "learning_rate": 0.00029790425137578053, "loss": 0.0491, "step": 5390 }, { "epoch": 0.01, "learning_rate": 0.0002979003631594091, "loss": 0.0511, "step": 5400 }, { "epoch": 0.01, "learning_rate": 0.0002978964749430376, "loss": 0.0489, "step": 5410 }, { "epoch": 0.01, "learning_rate": 0.0002978925867266661, "loss": 0.0532, "step": 5420 }, { "epoch": 0.01, "learning_rate": 0.00029788869851029464, "loss": 0.0484, "step": 5430 }, { "epoch": 0.01, "learning_rate": 0.0002978848102939232, "loss": 0.0599, "step": 5440 }, { "epoch": 0.01, "learning_rate": 0.0002978809220775518, "loss": 0.0483, "step": 5450 }, { "epoch": 0.01, "learning_rate": 0.0002978770338611803, "loss": 0.0587, "step": 5460 }, { "epoch": 0.01, "learning_rate": 0.0002978731456448088, "loss": 0.0512, "step": 5470 }, { "epoch": 0.01, "learning_rate": 0.0002978692574284373, "loss": 0.0508, "step": 5480 }, { "epoch": 0.01, "learning_rate": 0.0002978653692120659, "loss": 0.0508, "step": 5490 }, { "epoch": 0.01, "learning_rate": 0.0002978614809956944, "loss": 0.0495, "step": 5500 }, { "epoch": 0.01, "learning_rate": 0.000297857592779323, "loss": 0.0501, "step": 5510 }, { "epoch": 0.01, "learning_rate": 0.0002978537045629515, "loss": 0.057, "step": 5520 }, { "epoch": 0.01, "learning_rate": 0.00029784981634658006, "loss": 0.0646, "step": 5530 }, { "epoch": 0.01, "learning_rate": 0.00029784592813020857, "loss": 0.0549, "step": 5540 }, { "epoch": 0.01, "learning_rate": 0.0002978420399138371, "loss": 0.0562, "step": 5550 }, { "epoch": 0.01, "learning_rate": 0.0002978381516974656, "loss": 0.0589, "step": 5560 }, { "epoch": 0.01, "learning_rate": 0.00029783426348109417, "loss": 0.0552, "step": 5570 }, { "epoch": 0.01, "learning_rate": 0.0002978303752647227, "loss": 0.0616, "step": 5580 }, { "epoch": 0.01, "learning_rate": 0.00029782648704835125, "loss": 0.0601, "step": 5590 }, { "epoch": 0.01, "learning_rate": 0.00029782259883197977, "loss": 0.0528, "step": 5600 }, { "epoch": 0.01, "learning_rate": 0.00029781871061560834, "loss": 0.0515, "step": 5610 }, { "epoch": 0.01, "learning_rate": 0.00029781482239923685, "loss": 0.0585, "step": 5620 }, { "epoch": 0.01, "learning_rate": 0.00029781093418286537, "loss": 0.0572, "step": 5630 }, { "epoch": 0.01, "learning_rate": 0.00029780704596649393, "loss": 0.0533, "step": 5640 }, { "epoch": 0.01, "learning_rate": 0.00029780315775012245, "loss": 0.06, "step": 5650 }, { "epoch": 0.01, "learning_rate": 0.000297799269533751, "loss": 0.0529, "step": 5660 }, { "epoch": 0.01, "learning_rate": 0.00029779538131737953, "loss": 0.0557, "step": 5670 }, { "epoch": 0.01, "learning_rate": 0.00029779149310100805, "loss": 0.0457, "step": 5680 }, { "epoch": 0.01, "learning_rate": 0.0002977876048846366, "loss": 0.0462, "step": 5690 }, { "epoch": 0.01, "learning_rate": 0.00029778371666826513, "loss": 0.052, "step": 5700 }, { "epoch": 0.01, "learning_rate": 0.00029777982845189364, "loss": 0.0478, "step": 5710 }, { "epoch": 0.01, "learning_rate": 0.0002977759402355222, "loss": 0.0501, "step": 5720 }, { "epoch": 0.01, "learning_rate": 0.00029777205201915073, "loss": 0.0539, "step": 5730 }, { "epoch": 0.01, "learning_rate": 0.0002977681638027793, "loss": 0.0455, "step": 5740 }, { "epoch": 0.01, "learning_rate": 0.0002977642755864078, "loss": 0.0542, "step": 5750 }, { "epoch": 0.01, "learning_rate": 0.0002977603873700363, "loss": 0.0425, "step": 5760 }, { "epoch": 0.01, "learning_rate": 0.00029775649915366484, "loss": 0.0524, "step": 5770 }, { "epoch": 0.01, "learning_rate": 0.0002977526109372934, "loss": 0.0516, "step": 5780 }, { "epoch": 0.02, "learning_rate": 0.000297748722720922, "loss": 0.0505, "step": 5790 }, { "epoch": 0.02, "learning_rate": 0.0002977448345045505, "loss": 0.0497, "step": 5800 }, { "epoch": 0.02, "learning_rate": 0.000297740946288179, "loss": 0.0536, "step": 5810 }, { "epoch": 0.02, "learning_rate": 0.0002977370580718076, "loss": 0.0507, "step": 5820 }, { "epoch": 0.02, "learning_rate": 0.0002977331698554361, "loss": 0.0486, "step": 5830 }, { "epoch": 0.02, "learning_rate": 0.0002977292816390646, "loss": 0.0567, "step": 5840 }, { "epoch": 0.02, "learning_rate": 0.00029772539342269317, "loss": 0.0507, "step": 5850 }, { "epoch": 0.02, "learning_rate": 0.0002977215052063217, "loss": 0.0582, "step": 5860 }, { "epoch": 0.02, "learning_rate": 0.00029771761698995026, "loss": 0.0482, "step": 5870 }, { "epoch": 0.02, "learning_rate": 0.00029771372877357877, "loss": 0.0467, "step": 5880 }, { "epoch": 0.02, "learning_rate": 0.0002977098405572073, "loss": 0.0607, "step": 5890 }, { "epoch": 0.02, "learning_rate": 0.00029770595234083585, "loss": 0.051, "step": 5900 }, { "epoch": 0.02, "learning_rate": 0.00029770206412446437, "loss": 0.0532, "step": 5910 }, { "epoch": 0.02, "learning_rate": 0.0002976981759080929, "loss": 0.0531, "step": 5920 }, { "epoch": 0.02, "learning_rate": 0.00029769428769172145, "loss": 0.0524, "step": 5930 }, { "epoch": 0.02, "learning_rate": 0.00029769039947535, "loss": 0.0608, "step": 5940 }, { "epoch": 0.02, "learning_rate": 0.00029768651125897853, "loss": 0.0459, "step": 5950 }, { "epoch": 0.02, "learning_rate": 0.00029768262304260705, "loss": 0.0515, "step": 5960 }, { "epoch": 0.02, "learning_rate": 0.00029767873482623556, "loss": 0.0522, "step": 5970 }, { "epoch": 0.02, "learning_rate": 0.0002976748466098641, "loss": 0.0501, "step": 5980 }, { "epoch": 0.02, "learning_rate": 0.00029767095839349265, "loss": 0.0513, "step": 5990 }, { "epoch": 0.02, "learning_rate": 0.0002976670701771212, "loss": 0.0551, "step": 6000 }, { "epoch": 0.02, "eval_cer": 0.8817866645392185, "eval_loss": 0.03934020921587944, "eval_runtime": 107.5774, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 6000 }, { "epoch": 0.02, "learning_rate": 0.00029766318196074973, "loss": 0.048, "step": 6010 }, { "epoch": 0.02, "learning_rate": 0.00029765929374437824, "loss": 0.0518, "step": 6020 }, { "epoch": 0.02, "learning_rate": 0.0002976554055280068, "loss": 0.0474, "step": 6030 }, { "epoch": 0.02, "learning_rate": 0.00029765151731163533, "loss": 0.0529, "step": 6040 }, { "epoch": 0.02, "learning_rate": 0.00029764762909526384, "loss": 0.0457, "step": 6050 }, { "epoch": 0.02, "learning_rate": 0.0002976437408788924, "loss": 0.0507, "step": 6060 }, { "epoch": 0.02, "learning_rate": 0.0002976398526625209, "loss": 0.0534, "step": 6070 }, { "epoch": 0.02, "learning_rate": 0.0002976359644461495, "loss": 0.045, "step": 6080 }, { "epoch": 0.02, "learning_rate": 0.000297632076229778, "loss": 0.0526, "step": 6090 }, { "epoch": 0.02, "learning_rate": 0.0002976281880134065, "loss": 0.0477, "step": 6100 }, { "epoch": 0.02, "learning_rate": 0.0002976242997970351, "loss": 0.0453, "step": 6110 }, { "epoch": 0.02, "learning_rate": 0.0002976204115806636, "loss": 0.0464, "step": 6120 }, { "epoch": 0.02, "learning_rate": 0.0002976165233642921, "loss": 0.0503, "step": 6130 }, { "epoch": 0.02, "learning_rate": 0.0002976126351479207, "loss": 0.0492, "step": 6140 }, { "epoch": 0.02, "learning_rate": 0.00029760874693154926, "loss": 0.0502, "step": 6150 }, { "epoch": 0.02, "learning_rate": 0.0002976048587151778, "loss": 0.0499, "step": 6160 }, { "epoch": 0.02, "learning_rate": 0.0002976009704988063, "loss": 0.0488, "step": 6170 }, { "epoch": 0.02, "learning_rate": 0.0002975970822824348, "loss": 0.054, "step": 6180 }, { "epoch": 0.02, "learning_rate": 0.00029759319406606337, "loss": 0.049, "step": 6190 }, { "epoch": 0.02, "learning_rate": 0.0002975893058496919, "loss": 0.0618, "step": 6200 }, { "epoch": 0.02, "learning_rate": 0.00029758541763332045, "loss": 0.0551, "step": 6210 }, { "epoch": 0.02, "learning_rate": 0.00029758152941694897, "loss": 0.0483, "step": 6220 }, { "epoch": 0.02, "learning_rate": 0.0002975776412005775, "loss": 0.0539, "step": 6230 }, { "epoch": 0.02, "learning_rate": 0.00029757375298420605, "loss": 0.0552, "step": 6240 }, { "epoch": 0.02, "learning_rate": 0.00029756986476783457, "loss": 0.0541, "step": 6250 }, { "epoch": 0.02, "learning_rate": 0.0002975659765514631, "loss": 0.0586, "step": 6260 }, { "epoch": 0.02, "learning_rate": 0.00029756208833509165, "loss": 0.0479, "step": 6270 }, { "epoch": 0.02, "learning_rate": 0.00029755820011872016, "loss": 0.0533, "step": 6280 }, { "epoch": 0.02, "learning_rate": 0.00029755431190234873, "loss": 0.0465, "step": 6290 }, { "epoch": 0.02, "learning_rate": 0.00029755042368597725, "loss": 0.0617, "step": 6300 }, { "epoch": 0.02, "learning_rate": 0.00029754653546960576, "loss": 0.0568, "step": 6310 }, { "epoch": 0.02, "learning_rate": 0.00029754264725323433, "loss": 0.0489, "step": 6320 }, { "epoch": 0.02, "learning_rate": 0.00029753875903686285, "loss": 0.0491, "step": 6330 }, { "epoch": 0.02, "learning_rate": 0.0002975348708204914, "loss": 0.0505, "step": 6340 }, { "epoch": 0.02, "learning_rate": 0.00029753098260411993, "loss": 0.0514, "step": 6350 }, { "epoch": 0.02, "learning_rate": 0.0002975270943877485, "loss": 0.0591, "step": 6360 }, { "epoch": 0.02, "learning_rate": 0.000297523206171377, "loss": 0.0578, "step": 6370 }, { "epoch": 0.02, "learning_rate": 0.0002975193179550055, "loss": 0.0488, "step": 6380 }, { "epoch": 0.02, "learning_rate": 0.00029751542973863404, "loss": 0.0521, "step": 6390 }, { "epoch": 0.02, "learning_rate": 0.0002975115415222626, "loss": 0.0472, "step": 6400 }, { "epoch": 0.02, "learning_rate": 0.0002975076533058911, "loss": 0.0489, "step": 6410 }, { "epoch": 0.02, "learning_rate": 0.0002975037650895197, "loss": 0.0457, "step": 6420 }, { "epoch": 0.02, "learning_rate": 0.0002974998768731482, "loss": 0.0528, "step": 6430 }, { "epoch": 0.02, "learning_rate": 0.0002974959886567768, "loss": 0.0464, "step": 6440 }, { "epoch": 0.02, "learning_rate": 0.0002974921004404053, "loss": 0.0517, "step": 6450 }, { "epoch": 0.02, "learning_rate": 0.0002974882122240338, "loss": 0.0525, "step": 6460 }, { "epoch": 0.02, "learning_rate": 0.0002974843240076623, "loss": 0.0567, "step": 6470 }, { "epoch": 0.02, "learning_rate": 0.0002974804357912909, "loss": 0.0525, "step": 6480 }, { "epoch": 0.02, "learning_rate": 0.00029747654757491946, "loss": 0.0526, "step": 6490 }, { "epoch": 0.02, "learning_rate": 0.00029747265935854797, "loss": 0.0477, "step": 6500 }, { "epoch": 0.02, "learning_rate": 0.0002974687711421765, "loss": 0.0448, "step": 6510 }, { "epoch": 0.02, "learning_rate": 0.000297464882925805, "loss": 0.0526, "step": 6520 }, { "epoch": 0.02, "learning_rate": 0.00029746099470943357, "loss": 0.0513, "step": 6530 }, { "epoch": 0.02, "learning_rate": 0.0002974571064930621, "loss": 0.0535, "step": 6540 }, { "epoch": 0.02, "learning_rate": 0.00029745321827669065, "loss": 0.0449, "step": 6550 }, { "epoch": 0.02, "learning_rate": 0.00029744933006031917, "loss": 0.0575, "step": 6560 }, { "epoch": 0.02, "learning_rate": 0.00029744544184394774, "loss": 0.0505, "step": 6570 }, { "epoch": 0.02, "learning_rate": 0.00029744155362757625, "loss": 0.0517, "step": 6580 }, { "epoch": 0.02, "learning_rate": 0.00029743766541120477, "loss": 0.0496, "step": 6590 }, { "epoch": 0.02, "learning_rate": 0.0002974337771948333, "loss": 0.0481, "step": 6600 }, { "epoch": 0.02, "learning_rate": 0.00029742988897846185, "loss": 0.0545, "step": 6610 }, { "epoch": 0.02, "learning_rate": 0.00029742600076209036, "loss": 0.0474, "step": 6620 }, { "epoch": 0.02, "learning_rate": 0.00029742211254571893, "loss": 0.0515, "step": 6630 }, { "epoch": 0.02, "learning_rate": 0.00029741822432934745, "loss": 0.058, "step": 6640 }, { "epoch": 0.02, "learning_rate": 0.000297414336112976, "loss": 0.0532, "step": 6650 }, { "epoch": 0.02, "learning_rate": 0.00029741044789660453, "loss": 0.0517, "step": 6660 }, { "epoch": 0.02, "learning_rate": 0.00029740655968023304, "loss": 0.0553, "step": 6670 }, { "epoch": 0.02, "learning_rate": 0.00029740267146386156, "loss": 0.0438, "step": 6680 }, { "epoch": 0.02, "learning_rate": 0.00029739878324749013, "loss": 0.0509, "step": 6690 }, { "epoch": 0.02, "learning_rate": 0.0002973948950311187, "loss": 0.0506, "step": 6700 }, { "epoch": 0.02, "learning_rate": 0.0002973910068147472, "loss": 0.0608, "step": 6710 }, { "epoch": 0.02, "learning_rate": 0.0002973871185983757, "loss": 0.0479, "step": 6720 }, { "epoch": 0.02, "learning_rate": 0.00029738323038200424, "loss": 0.0522, "step": 6730 }, { "epoch": 0.02, "learning_rate": 0.0002973793421656328, "loss": 0.0501, "step": 6740 }, { "epoch": 0.02, "learning_rate": 0.0002973754539492613, "loss": 0.064, "step": 6750 }, { "epoch": 0.02, "learning_rate": 0.0002973715657328899, "loss": 0.0531, "step": 6760 }, { "epoch": 0.02, "learning_rate": 0.0002973676775165184, "loss": 0.0522, "step": 6770 }, { "epoch": 0.02, "learning_rate": 0.000297363789300147, "loss": 0.0621, "step": 6780 }, { "epoch": 0.02, "learning_rate": 0.0002973599010837755, "loss": 0.0464, "step": 6790 }, { "epoch": 0.02, "learning_rate": 0.000297356012867404, "loss": 0.0558, "step": 6800 }, { "epoch": 0.02, "learning_rate": 0.0002973521246510325, "loss": 0.0464, "step": 6810 }, { "epoch": 0.02, "learning_rate": 0.0002973482364346611, "loss": 0.0525, "step": 6820 }, { "epoch": 0.02, "learning_rate": 0.00029734434821828966, "loss": 0.0488, "step": 6830 }, { "epoch": 0.02, "learning_rate": 0.00029734046000191817, "loss": 0.0482, "step": 6840 }, { "epoch": 0.02, "learning_rate": 0.0002973365717855467, "loss": 0.0524, "step": 6850 }, { "epoch": 0.02, "learning_rate": 0.00029733268356917525, "loss": 0.0438, "step": 6860 }, { "epoch": 0.02, "learning_rate": 0.00029732879535280377, "loss": 0.0497, "step": 6870 }, { "epoch": 0.02, "learning_rate": 0.0002973249071364323, "loss": 0.0531, "step": 6880 }, { "epoch": 0.02, "learning_rate": 0.00029732101892006085, "loss": 0.0478, "step": 6890 }, { "epoch": 0.02, "learning_rate": 0.00029731713070368937, "loss": 0.047, "step": 6900 }, { "epoch": 0.02, "learning_rate": 0.00029731324248731794, "loss": 0.0419, "step": 6910 }, { "epoch": 0.02, "learning_rate": 0.00029730935427094645, "loss": 0.0493, "step": 6920 }, { "epoch": 0.02, "learning_rate": 0.00029730546605457496, "loss": 0.0551, "step": 6930 }, { "epoch": 0.02, "learning_rate": 0.00029730157783820353, "loss": 0.0529, "step": 6940 }, { "epoch": 0.02, "learning_rate": 0.00029729768962183205, "loss": 0.0515, "step": 6950 }, { "epoch": 0.02, "learning_rate": 0.00029729380140546056, "loss": 0.0476, "step": 6960 }, { "epoch": 0.02, "learning_rate": 0.00029728991318908913, "loss": 0.053, "step": 6970 }, { "epoch": 0.02, "learning_rate": 0.00029728602497271765, "loss": 0.0479, "step": 6980 }, { "epoch": 0.02, "learning_rate": 0.0002972821367563462, "loss": 0.0552, "step": 6990 }, { "epoch": 0.02, "learning_rate": 0.00029727824853997473, "loss": 0.0485, "step": 7000 }, { "epoch": 0.02, "eval_cer": 0.8817964619977577, "eval_loss": 0.03943474590778351, "eval_runtime": 107.6801, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 7000 }, { "epoch": 0.02, "learning_rate": 0.00029727436032360324, "loss": 0.0459, "step": 7010 }, { "epoch": 0.02, "learning_rate": 0.00029727047210723176, "loss": 0.0515, "step": 7020 }, { "epoch": 0.02, "learning_rate": 0.0002972665838908603, "loss": 0.0483, "step": 7030 }, { "epoch": 0.02, "learning_rate": 0.0002972626956744889, "loss": 0.0517, "step": 7040 }, { "epoch": 0.02, "learning_rate": 0.0002972588074581174, "loss": 0.0473, "step": 7050 }, { "epoch": 0.02, "learning_rate": 0.0002972549192417459, "loss": 0.0432, "step": 7060 }, { "epoch": 0.02, "learning_rate": 0.0002972510310253745, "loss": 0.0509, "step": 7070 }, { "epoch": 0.02, "learning_rate": 0.000297247142809003, "loss": 0.0476, "step": 7080 }, { "epoch": 0.02, "learning_rate": 0.0002972432545926315, "loss": 0.0602, "step": 7090 }, { "epoch": 0.02, "learning_rate": 0.0002972393663762601, "loss": 0.0582, "step": 7100 }, { "epoch": 0.02, "learning_rate": 0.0002972354781598886, "loss": 0.0507, "step": 7110 }, { "epoch": 0.02, "learning_rate": 0.0002972315899435172, "loss": 0.048, "step": 7120 }, { "epoch": 0.02, "learning_rate": 0.0002972277017271457, "loss": 0.0506, "step": 7130 }, { "epoch": 0.02, "learning_rate": 0.0002972238135107742, "loss": 0.0479, "step": 7140 }, { "epoch": 0.02, "learning_rate": 0.00029721992529440277, "loss": 0.0522, "step": 7150 }, { "epoch": 0.02, "learning_rate": 0.0002972160370780313, "loss": 0.0499, "step": 7160 }, { "epoch": 0.02, "learning_rate": 0.0002972121488616598, "loss": 0.0548, "step": 7170 }, { "epoch": 0.02, "learning_rate": 0.00029720826064528837, "loss": 0.0573, "step": 7180 }, { "epoch": 0.02, "learning_rate": 0.00029720437242891694, "loss": 0.0517, "step": 7190 }, { "epoch": 0.02, "learning_rate": 0.00029720048421254545, "loss": 0.0446, "step": 7200 }, { "epoch": 0.02, "learning_rate": 0.00029719659599617397, "loss": 0.0455, "step": 7210 }, { "epoch": 0.02, "learning_rate": 0.0002971927077798025, "loss": 0.0519, "step": 7220 }, { "epoch": 0.02, "learning_rate": 0.00029718881956343105, "loss": 0.0572, "step": 7230 }, { "epoch": 0.02, "learning_rate": 0.00029718493134705957, "loss": 0.057, "step": 7240 }, { "epoch": 0.02, "learning_rate": 0.00029718104313068813, "loss": 0.0536, "step": 7250 }, { "epoch": 0.02, "learning_rate": 0.00029717715491431665, "loss": 0.0533, "step": 7260 }, { "epoch": 0.02, "learning_rate": 0.00029717326669794516, "loss": 0.0466, "step": 7270 }, { "epoch": 0.02, "learning_rate": 0.00029716937848157373, "loss": 0.0638, "step": 7280 }, { "epoch": 0.02, "learning_rate": 0.00029716549026520225, "loss": 0.0516, "step": 7290 }, { "epoch": 0.02, "learning_rate": 0.00029716160204883076, "loss": 0.0661, "step": 7300 }, { "epoch": 0.02, "learning_rate": 0.00029715771383245933, "loss": 0.0678, "step": 7310 }, { "epoch": 0.02, "learning_rate": 0.00029715382561608784, "loss": 0.055, "step": 7320 }, { "epoch": 0.02, "learning_rate": 0.0002971499373997164, "loss": 0.0438, "step": 7330 }, { "epoch": 0.02, "learning_rate": 0.00029714604918334493, "loss": 0.0444, "step": 7340 }, { "epoch": 0.02, "learning_rate": 0.00029714216096697344, "loss": 0.0494, "step": 7350 }, { "epoch": 0.02, "learning_rate": 0.000297138272750602, "loss": 0.0529, "step": 7360 }, { "epoch": 0.02, "learning_rate": 0.0002971343845342305, "loss": 0.0513, "step": 7370 }, { "epoch": 0.02, "learning_rate": 0.0002971304963178591, "loss": 0.0498, "step": 7380 }, { "epoch": 0.02, "learning_rate": 0.0002971266081014876, "loss": 0.0457, "step": 7390 }, { "epoch": 0.02, "learning_rate": 0.0002971227198851162, "loss": 0.0534, "step": 7400 }, { "epoch": 0.02, "learning_rate": 0.0002971188316687447, "loss": 0.0453, "step": 7410 }, { "epoch": 0.02, "learning_rate": 0.0002971149434523732, "loss": 0.0476, "step": 7420 }, { "epoch": 0.02, "learning_rate": 0.0002971110552360017, "loss": 0.0494, "step": 7430 }, { "epoch": 0.02, "learning_rate": 0.0002971071670196303, "loss": 0.0476, "step": 7440 }, { "epoch": 0.02, "learning_rate": 0.0002971032788032588, "loss": 0.0459, "step": 7450 }, { "epoch": 0.02, "learning_rate": 0.0002970993905868874, "loss": 0.0488, "step": 7460 }, { "epoch": 0.02, "learning_rate": 0.0002970955023705159, "loss": 0.0501, "step": 7470 }, { "epoch": 0.02, "learning_rate": 0.0002970916141541444, "loss": 0.0526, "step": 7480 }, { "epoch": 0.02, "learning_rate": 0.00029708772593777297, "loss": 0.0468, "step": 7490 }, { "epoch": 0.02, "learning_rate": 0.0002970838377214015, "loss": 0.0505, "step": 7500 }, { "epoch": 0.02, "learning_rate": 0.00029707994950503, "loss": 0.0486, "step": 7510 }, { "epoch": 0.02, "learning_rate": 0.00029707606128865857, "loss": 0.0435, "step": 7520 }, { "epoch": 0.02, "learning_rate": 0.00029707217307228714, "loss": 0.0515, "step": 7530 }, { "epoch": 0.02, "learning_rate": 0.00029706828485591565, "loss": 0.0514, "step": 7540 }, { "epoch": 0.02, "learning_rate": 0.00029706439663954417, "loss": 0.0541, "step": 7550 }, { "epoch": 0.02, "learning_rate": 0.0002970605084231727, "loss": 0.0557, "step": 7560 }, { "epoch": 0.02, "learning_rate": 0.00029705662020680125, "loss": 0.0506, "step": 7570 }, { "epoch": 0.02, "learning_rate": 0.00029705273199042976, "loss": 0.0463, "step": 7580 }, { "epoch": 0.02, "learning_rate": 0.00029704884377405833, "loss": 0.0448, "step": 7590 }, { "epoch": 0.02, "learning_rate": 0.00029704495555768685, "loss": 0.0422, "step": 7600 }, { "epoch": 0.02, "learning_rate": 0.0002970410673413154, "loss": 0.0496, "step": 7610 }, { "epoch": 0.02, "learning_rate": 0.00029703717912494393, "loss": 0.0584, "step": 7620 }, { "epoch": 0.02, "learning_rate": 0.00029703329090857245, "loss": 0.0454, "step": 7630 }, { "epoch": 0.02, "learning_rate": 0.00029702940269220096, "loss": 0.0481, "step": 7640 }, { "epoch": 0.02, "learning_rate": 0.00029702551447582953, "loss": 0.0491, "step": 7650 }, { "epoch": 0.02, "learning_rate": 0.00029702162625945804, "loss": 0.0431, "step": 7660 }, { "epoch": 0.02, "learning_rate": 0.0002970177380430866, "loss": 0.0459, "step": 7670 }, { "epoch": 0.02, "learning_rate": 0.0002970138498267151, "loss": 0.0475, "step": 7680 }, { "epoch": 0.02, "learning_rate": 0.0002970099616103437, "loss": 0.0542, "step": 7690 }, { "epoch": 0.02, "learning_rate": 0.0002970060733939722, "loss": 0.049, "step": 7700 }, { "epoch": 0.02, "learning_rate": 0.0002970021851776007, "loss": 0.0586, "step": 7710 }, { "epoch": 0.02, "learning_rate": 0.00029699829696122924, "loss": 0.0454, "step": 7720 }, { "epoch": 0.02, "learning_rate": 0.0002969944087448578, "loss": 0.0528, "step": 7730 }, { "epoch": 0.02, "learning_rate": 0.0002969905205284864, "loss": 0.0555, "step": 7740 }, { "epoch": 0.02, "learning_rate": 0.0002969866323121149, "loss": 0.0495, "step": 7750 }, { "epoch": 0.02, "learning_rate": 0.0002969827440957434, "loss": 0.0483, "step": 7760 }, { "epoch": 0.02, "learning_rate": 0.0002969788558793719, "loss": 0.0564, "step": 7770 }, { "epoch": 0.02, "learning_rate": 0.0002969749676630005, "loss": 0.063, "step": 7780 }, { "epoch": 0.02, "learning_rate": 0.000296971079446629, "loss": 0.0394, "step": 7790 }, { "epoch": 0.02, "learning_rate": 0.00029696719123025757, "loss": 0.052, "step": 7800 }, { "epoch": 0.02, "learning_rate": 0.0002969633030138861, "loss": 0.0551, "step": 7810 }, { "epoch": 0.02, "learning_rate": 0.00029695941479751466, "loss": 0.0548, "step": 7820 }, { "epoch": 0.02, "learning_rate": 0.00029695552658114317, "loss": 0.0699, "step": 7830 }, { "epoch": 0.02, "learning_rate": 0.0002969516383647717, "loss": 0.0532, "step": 7840 }, { "epoch": 0.02, "learning_rate": 0.0002969477501484002, "loss": 0.0589, "step": 7850 }, { "epoch": 0.02, "learning_rate": 0.00029694386193202877, "loss": 0.0516, "step": 7860 }, { "epoch": 0.02, "learning_rate": 0.0002969399737156573, "loss": 0.0523, "step": 7870 }, { "epoch": 0.02, "learning_rate": 0.00029693608549928585, "loss": 0.0847, "step": 7880 }, { "epoch": 0.02, "learning_rate": 0.00029693219728291437, "loss": 0.0531, "step": 7890 }, { "epoch": 0.02, "learning_rate": 0.00029692830906654293, "loss": 0.0509, "step": 7900 }, { "epoch": 0.02, "learning_rate": 0.00029692442085017145, "loss": 0.0537, "step": 7910 }, { "epoch": 0.02, "learning_rate": 0.00029692053263379996, "loss": 0.0503, "step": 7920 }, { "epoch": 0.02, "learning_rate": 0.00029691664441742853, "loss": 0.0544, "step": 7930 }, { "epoch": 0.02, "learning_rate": 0.00029691275620105705, "loss": 0.0538, "step": 7940 }, { "epoch": 0.02, "learning_rate": 0.0002969088679846856, "loss": 0.0554, "step": 7950 }, { "epoch": 0.02, "learning_rate": 0.00029690497976831413, "loss": 0.0524, "step": 7960 }, { "epoch": 0.02, "learning_rate": 0.00029690109155194264, "loss": 0.0577, "step": 7970 }, { "epoch": 0.02, "learning_rate": 0.00029689720333557116, "loss": 0.0501, "step": 7980 }, { "epoch": 0.02, "learning_rate": 0.00029689331511919973, "loss": 0.0482, "step": 7990 }, { "epoch": 0.02, "learning_rate": 0.00029688942690282824, "loss": 0.0516, "step": 8000 }, { "epoch": 0.02, "eval_cer": 0.8818510478381908, "eval_loss": 0.038032468408346176, "eval_runtime": 107.8792, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 8000 }, { "epoch": 0.02, "learning_rate": 0.0002968855386864568, "loss": 0.0487, "step": 8010 }, { "epoch": 0.02, "learning_rate": 0.0002968816504700853, "loss": 0.0506, "step": 8020 }, { "epoch": 0.02, "learning_rate": 0.0002968777622537139, "loss": 0.0475, "step": 8030 }, { "epoch": 0.02, "learning_rate": 0.0002968738740373424, "loss": 0.0567, "step": 8040 }, { "epoch": 0.02, "learning_rate": 0.0002968699858209709, "loss": 0.0503, "step": 8050 }, { "epoch": 0.02, "learning_rate": 0.00029686609760459944, "loss": 0.0664, "step": 8060 }, { "epoch": 0.02, "learning_rate": 0.000296862209388228, "loss": 0.0512, "step": 8070 }, { "epoch": 0.02, "learning_rate": 0.0002968583211718566, "loss": 0.0509, "step": 8080 }, { "epoch": 0.02, "learning_rate": 0.0002968544329554851, "loss": 0.0533, "step": 8090 }, { "epoch": 0.02, "learning_rate": 0.0002968505447391136, "loss": 0.0498, "step": 8100 }, { "epoch": 0.02, "learning_rate": 0.0002968466565227422, "loss": 0.0567, "step": 8110 }, { "epoch": 0.02, "learning_rate": 0.0002968427683063707, "loss": 0.0604, "step": 8120 }, { "epoch": 0.02, "learning_rate": 0.0002968388800899992, "loss": 0.0575, "step": 8130 }, { "epoch": 0.02, "learning_rate": 0.00029683499187362777, "loss": 0.0522, "step": 8140 }, { "epoch": 0.02, "learning_rate": 0.0002968311036572563, "loss": 0.0544, "step": 8150 }, { "epoch": 0.02, "learning_rate": 0.00029682721544088485, "loss": 0.0475, "step": 8160 }, { "epoch": 0.02, "learning_rate": 0.00029682332722451337, "loss": 0.0504, "step": 8170 }, { "epoch": 0.02, "learning_rate": 0.0002968194390081419, "loss": 0.0551, "step": 8180 }, { "epoch": 0.02, "learning_rate": 0.0002968155507917704, "loss": 0.0451, "step": 8190 }, { "epoch": 0.02, "learning_rate": 0.00029681166257539897, "loss": 0.0529, "step": 8200 }, { "epoch": 0.02, "learning_rate": 0.0002968077743590275, "loss": 0.0546, "step": 8210 }, { "epoch": 0.02, "learning_rate": 0.00029680388614265605, "loss": 0.0438, "step": 8220 }, { "epoch": 0.02, "learning_rate": 0.00029679999792628456, "loss": 0.047, "step": 8230 }, { "epoch": 0.02, "learning_rate": 0.00029679610970991313, "loss": 0.0709, "step": 8240 }, { "epoch": 0.02, "learning_rate": 0.00029679222149354165, "loss": 0.0536, "step": 8250 }, { "epoch": 0.02, "learning_rate": 0.00029678833327717016, "loss": 0.0497, "step": 8260 }, { "epoch": 0.02, "learning_rate": 0.0002967844450607987, "loss": 0.0468, "step": 8270 }, { "epoch": 0.02, "learning_rate": 0.00029678055684442725, "loss": 0.0445, "step": 8280 }, { "epoch": 0.02, "learning_rate": 0.0002967766686280558, "loss": 0.042, "step": 8290 }, { "epoch": 0.02, "learning_rate": 0.00029677278041168433, "loss": 0.0506, "step": 8300 }, { "epoch": 0.02, "learning_rate": 0.00029676889219531284, "loss": 0.0503, "step": 8310 }, { "epoch": 0.02, "learning_rate": 0.0002967650039789414, "loss": 0.0518, "step": 8320 }, { "epoch": 0.02, "learning_rate": 0.0002967611157625699, "loss": 0.0551, "step": 8330 }, { "epoch": 0.02, "learning_rate": 0.00029675722754619844, "loss": 0.0548, "step": 8340 }, { "epoch": 0.02, "learning_rate": 0.000296753339329827, "loss": 0.0528, "step": 8350 }, { "epoch": 0.02, "learning_rate": 0.0002967494511134555, "loss": 0.0499, "step": 8360 }, { "epoch": 0.02, "learning_rate": 0.0002967455628970841, "loss": 0.0523, "step": 8370 }, { "epoch": 0.02, "learning_rate": 0.0002967416746807126, "loss": 0.0498, "step": 8380 }, { "epoch": 0.02, "learning_rate": 0.0002967377864643411, "loss": 0.0476, "step": 8390 }, { "epoch": 0.02, "learning_rate": 0.0002967338982479697, "loss": 0.0445, "step": 8400 }, { "epoch": 0.02, "learning_rate": 0.0002967300100315982, "loss": 0.0526, "step": 8410 }, { "epoch": 0.02, "learning_rate": 0.0002967261218152267, "loss": 0.0556, "step": 8420 }, { "epoch": 0.02, "learning_rate": 0.0002967222335988553, "loss": 0.0443, "step": 8430 }, { "epoch": 0.02, "learning_rate": 0.0002967183453824838, "loss": 0.0537, "step": 8440 }, { "epoch": 0.02, "learning_rate": 0.00029671445716611237, "loss": 0.0509, "step": 8450 }, { "epoch": 0.02, "learning_rate": 0.0002967105689497409, "loss": 0.0518, "step": 8460 }, { "epoch": 0.02, "learning_rate": 0.0002967066807333694, "loss": 0.0426, "step": 8470 }, { "epoch": 0.02, "learning_rate": 0.00029670279251699797, "loss": 0.0493, "step": 8480 }, { "epoch": 0.02, "learning_rate": 0.0002966989043006265, "loss": 0.0565, "step": 8490 }, { "epoch": 0.02, "learning_rate": 0.00029669501608425505, "loss": 0.0531, "step": 8500 }, { "epoch": 0.02, "learning_rate": 0.00029669112786788357, "loss": 0.0528, "step": 8510 }, { "epoch": 0.02, "learning_rate": 0.0002966872396515121, "loss": 0.0464, "step": 8520 }, { "epoch": 0.02, "learning_rate": 0.00029668335143514065, "loss": 0.0517, "step": 8530 }, { "epoch": 0.02, "learning_rate": 0.00029667946321876917, "loss": 0.0459, "step": 8540 }, { "epoch": 0.02, "learning_rate": 0.0002966755750023977, "loss": 0.0415, "step": 8550 }, { "epoch": 0.02, "learning_rate": 0.00029667168678602625, "loss": 0.0446, "step": 8560 }, { "epoch": 0.02, "learning_rate": 0.0002966677985696548, "loss": 0.0402, "step": 8570 }, { "epoch": 0.02, "learning_rate": 0.00029666391035328333, "loss": 0.0673, "step": 8580 }, { "epoch": 0.02, "learning_rate": 0.00029666002213691185, "loss": 0.0413, "step": 8590 }, { "epoch": 0.02, "learning_rate": 0.00029665613392054036, "loss": 0.0442, "step": 8600 }, { "epoch": 0.02, "learning_rate": 0.00029665224570416893, "loss": 0.0502, "step": 8610 }, { "epoch": 0.02, "learning_rate": 0.00029664835748779744, "loss": 0.0484, "step": 8620 }, { "epoch": 0.02, "learning_rate": 0.000296644469271426, "loss": 0.0518, "step": 8630 }, { "epoch": 0.02, "learning_rate": 0.00029664058105505453, "loss": 0.0545, "step": 8640 }, { "epoch": 0.02, "learning_rate": 0.0002966366928386831, "loss": 0.0462, "step": 8650 }, { "epoch": 0.02, "learning_rate": 0.0002966328046223116, "loss": 0.0551, "step": 8660 }, { "epoch": 0.02, "learning_rate": 0.0002966289164059401, "loss": 0.0452, "step": 8670 }, { "epoch": 0.02, "learning_rate": 0.00029662502818956864, "loss": 0.0477, "step": 8680 }, { "epoch": 0.02, "learning_rate": 0.0002966211399731972, "loss": 0.0475, "step": 8690 }, { "epoch": 0.02, "learning_rate": 0.0002966172517568257, "loss": 0.047, "step": 8700 }, { "epoch": 0.02, "learning_rate": 0.0002966133635404543, "loss": 0.046, "step": 8710 }, { "epoch": 0.02, "learning_rate": 0.0002966094753240828, "loss": 0.0473, "step": 8720 }, { "epoch": 0.02, "learning_rate": 0.0002966055871077113, "loss": 0.0446, "step": 8730 }, { "epoch": 0.02, "learning_rate": 0.0002966016988913399, "loss": 0.0524, "step": 8740 }, { "epoch": 0.02, "learning_rate": 0.0002965978106749684, "loss": 0.0517, "step": 8750 }, { "epoch": 0.02, "learning_rate": 0.0002965939224585969, "loss": 0.049, "step": 8760 }, { "epoch": 0.02, "learning_rate": 0.0002965900342422255, "loss": 0.0457, "step": 8770 }, { "epoch": 0.02, "learning_rate": 0.00029658614602585406, "loss": 0.0469, "step": 8780 }, { "epoch": 0.02, "learning_rate": 0.00029658225780948257, "loss": 0.0419, "step": 8790 }, { "epoch": 0.02, "learning_rate": 0.0002965783695931111, "loss": 0.064, "step": 8800 }, { "epoch": 0.02, "learning_rate": 0.0002965744813767396, "loss": 0.0499, "step": 8810 }, { "epoch": 0.02, "learning_rate": 0.00029657059316036817, "loss": 0.0464, "step": 8820 }, { "epoch": 0.02, "learning_rate": 0.0002965667049439967, "loss": 0.0468, "step": 8830 }, { "epoch": 0.02, "learning_rate": 0.00029656281672762525, "loss": 0.0513, "step": 8840 }, { "epoch": 0.02, "learning_rate": 0.00029655892851125377, "loss": 0.0491, "step": 8850 }, { "epoch": 0.02, "learning_rate": 0.00029655504029488234, "loss": 0.0457, "step": 8860 }, { "epoch": 0.02, "learning_rate": 0.00029655115207851085, "loss": 0.0529, "step": 8870 }, { "epoch": 0.02, "learning_rate": 0.00029654726386213936, "loss": 0.0471, "step": 8880 }, { "epoch": 0.02, "learning_rate": 0.0002965433756457679, "loss": 0.0504, "step": 8890 }, { "epoch": 0.02, "learning_rate": 0.00029653948742939645, "loss": 0.0428, "step": 8900 }, { "epoch": 0.02, "learning_rate": 0.00029653559921302496, "loss": 0.0444, "step": 8910 }, { "epoch": 0.02, "learning_rate": 0.00029653171099665353, "loss": 0.0504, "step": 8920 }, { "epoch": 0.02, "learning_rate": 0.00029652782278028205, "loss": 0.0523, "step": 8930 }, { "epoch": 0.02, "learning_rate": 0.00029652393456391056, "loss": 0.0561, "step": 8940 }, { "epoch": 0.02, "learning_rate": 0.00029652004634753913, "loss": 0.0561, "step": 8950 }, { "epoch": 0.02, "learning_rate": 0.00029651615813116764, "loss": 0.0484, "step": 8960 }, { "epoch": 0.02, "learning_rate": 0.0002965122699147962, "loss": 0.0507, "step": 8970 }, { "epoch": 0.02, "learning_rate": 0.0002965083816984247, "loss": 0.0458, "step": 8980 }, { "epoch": 0.02, "learning_rate": 0.0002965044934820533, "loss": 0.0392, "step": 8990 }, { "epoch": 0.02, "learning_rate": 0.0002965006052656818, "loss": 0.0534, "step": 9000 }, { "epoch": 0.02, "eval_cer": 0.881751673615864, "eval_loss": 0.0344533696770668, "eval_runtime": 107.61, "eval_samples_per_second": 18.586, "eval_steps_per_second": 4.646, "step": 9000 }, { "epoch": 0.02, "learning_rate": 0.0002964967170493103, "loss": 0.0483, "step": 9010 }, { "epoch": 0.02, "learning_rate": 0.00029649282883293884, "loss": 0.048, "step": 9020 }, { "epoch": 0.02, "learning_rate": 0.0002964889406165674, "loss": 0.0403, "step": 9030 }, { "epoch": 0.02, "learning_rate": 0.0002964850524001959, "loss": 0.0477, "step": 9040 }, { "epoch": 0.02, "learning_rate": 0.0002964811641838245, "loss": 0.043, "step": 9050 }, { "epoch": 0.02, "learning_rate": 0.000296477275967453, "loss": 0.039, "step": 9060 }, { "epoch": 0.02, "learning_rate": 0.0002964733877510816, "loss": 0.0478, "step": 9070 }, { "epoch": 0.02, "learning_rate": 0.0002964694995347101, "loss": 0.0464, "step": 9080 }, { "epoch": 0.02, "learning_rate": 0.0002964656113183386, "loss": 0.0468, "step": 9090 }, { "epoch": 0.02, "learning_rate": 0.0002964617231019671, "loss": 0.0419, "step": 9100 }, { "epoch": 0.02, "learning_rate": 0.0002964578348855957, "loss": 0.0466, "step": 9110 }, { "epoch": 0.02, "learning_rate": 0.00029645394666922426, "loss": 0.046, "step": 9120 }, { "epoch": 0.02, "learning_rate": 0.00029645005845285277, "loss": 0.0473, "step": 9130 }, { "epoch": 0.02, "learning_rate": 0.0002964461702364813, "loss": 0.0506, "step": 9140 }, { "epoch": 0.02, "learning_rate": 0.00029644228202010985, "loss": 0.0387, "step": 9150 }, { "epoch": 0.02, "learning_rate": 0.00029643839380373837, "loss": 0.0425, "step": 9160 }, { "epoch": 0.02, "learning_rate": 0.0002964345055873669, "loss": 0.0444, "step": 9170 }, { "epoch": 0.02, "learning_rate": 0.00029643061737099545, "loss": 0.0444, "step": 9180 }, { "epoch": 0.02, "learning_rate": 0.00029642672915462397, "loss": 0.0434, "step": 9190 }, { "epoch": 0.02, "learning_rate": 0.00029642284093825253, "loss": 0.0576, "step": 9200 }, { "epoch": 0.02, "learning_rate": 0.00029641895272188105, "loss": 0.0476, "step": 9210 }, { "epoch": 0.02, "learning_rate": 0.00029641506450550956, "loss": 0.0518, "step": 9220 }, { "epoch": 0.02, "learning_rate": 0.0002964111762891381, "loss": 0.0487, "step": 9230 }, { "epoch": 0.02, "learning_rate": 0.00029640728807276665, "loss": 0.0588, "step": 9240 }, { "epoch": 0.02, "learning_rate": 0.00029640339985639516, "loss": 0.0524, "step": 9250 }, { "epoch": 0.02, "learning_rate": 0.00029639951164002373, "loss": 0.0535, "step": 9260 }, { "epoch": 0.02, "learning_rate": 0.00029639562342365224, "loss": 0.05, "step": 9270 }, { "epoch": 0.02, "learning_rate": 0.0002963917352072808, "loss": 0.0423, "step": 9280 }, { "epoch": 0.02, "learning_rate": 0.00029638784699090933, "loss": 0.0382, "step": 9290 }, { "epoch": 0.02, "learning_rate": 0.00029638395877453784, "loss": 0.0467, "step": 9300 }, { "epoch": 0.02, "learning_rate": 0.00029638007055816636, "loss": 0.0402, "step": 9310 }, { "epoch": 0.02, "learning_rate": 0.0002963761823417949, "loss": 0.0425, "step": 9320 }, { "epoch": 0.02, "learning_rate": 0.0002963722941254235, "loss": 0.0439, "step": 9330 }, { "epoch": 0.02, "learning_rate": 0.000296368405909052, "loss": 0.0444, "step": 9340 }, { "epoch": 0.02, "learning_rate": 0.0002963645176926805, "loss": 0.046, "step": 9350 }, { "epoch": 0.02, "learning_rate": 0.0002963606294763091, "loss": 0.0374, "step": 9360 }, { "epoch": 0.02, "learning_rate": 0.0002963567412599376, "loss": 0.0395, "step": 9370 }, { "epoch": 0.02, "learning_rate": 0.0002963528530435661, "loss": 0.0458, "step": 9380 }, { "epoch": 0.02, "learning_rate": 0.0002963489648271947, "loss": 0.0361, "step": 9390 }, { "epoch": 0.02, "learning_rate": 0.0002963450766108232, "loss": 0.0402, "step": 9400 }, { "epoch": 0.02, "learning_rate": 0.0002963411883944518, "loss": 0.044, "step": 9410 }, { "epoch": 0.02, "learning_rate": 0.0002963373001780803, "loss": 0.0361, "step": 9420 }, { "epoch": 0.02, "learning_rate": 0.0002963334119617088, "loss": 0.0427, "step": 9430 }, { "epoch": 0.02, "learning_rate": 0.0002963295237453373, "loss": 0.048, "step": 9440 }, { "epoch": 0.02, "learning_rate": 0.0002963256355289659, "loss": 0.0448, "step": 9450 }, { "epoch": 0.02, "learning_rate": 0.0002963217473125944, "loss": 0.0466, "step": 9460 }, { "epoch": 0.02, "learning_rate": 0.00029631785909622297, "loss": 0.0373, "step": 9470 }, { "epoch": 0.02, "learning_rate": 0.0002963139708798515, "loss": 0.0478, "step": 9480 }, { "epoch": 0.02, "learning_rate": 0.00029631008266348005, "loss": 0.0394, "step": 9490 }, { "epoch": 0.02, "learning_rate": 0.00029630619444710857, "loss": 0.0433, "step": 9500 }, { "epoch": 0.02, "learning_rate": 0.0002963023062307371, "loss": 0.0424, "step": 9510 }, { "epoch": 0.02, "learning_rate": 0.00029629841801436565, "loss": 0.0388, "step": 9520 }, { "epoch": 0.02, "learning_rate": 0.00029629452979799416, "loss": 0.0337, "step": 9530 }, { "epoch": 0.02, "learning_rate": 0.00029629064158162273, "loss": 0.0448, "step": 9540 }, { "epoch": 0.02, "learning_rate": 0.00029628675336525125, "loss": 0.0458, "step": 9550 }, { "epoch": 0.02, "learning_rate": 0.00029628286514887976, "loss": 0.0496, "step": 9560 }, { "epoch": 0.02, "learning_rate": 0.00029627897693250833, "loss": 0.0531, "step": 9570 }, { "epoch": 0.02, "learning_rate": 0.00029627508871613685, "loss": 0.0426, "step": 9580 }, { "epoch": 0.02, "learning_rate": 0.00029627120049976536, "loss": 0.0413, "step": 9590 }, { "epoch": 0.02, "learning_rate": 0.00029626731228339393, "loss": 0.0413, "step": 9600 }, { "epoch": 0.02, "learning_rate": 0.00029626342406702244, "loss": 0.0465, "step": 9610 }, { "epoch": 0.02, "learning_rate": 0.000296259535850651, "loss": 0.0445, "step": 9620 }, { "epoch": 0.02, "learning_rate": 0.0002962556476342795, "loss": 0.049, "step": 9630 }, { "epoch": 0.02, "learning_rate": 0.00029625175941790804, "loss": 0.0439, "step": 9640 }, { "epoch": 0.03, "learning_rate": 0.0002962478712015366, "loss": 0.0474, "step": 9650 }, { "epoch": 0.03, "learning_rate": 0.0002962439829851651, "loss": 0.0584, "step": 9660 }, { "epoch": 0.03, "learning_rate": 0.0002962400947687937, "loss": 0.0565, "step": 9670 }, { "epoch": 0.03, "learning_rate": 0.0002962362065524222, "loss": 0.0364, "step": 9680 }, { "epoch": 0.03, "learning_rate": 0.0002962323183360507, "loss": 0.045, "step": 9690 }, { "epoch": 0.03, "learning_rate": 0.0002962284301196793, "loss": 0.0438, "step": 9700 }, { "epoch": 0.03, "learning_rate": 0.0002962245419033078, "loss": 0.0434, "step": 9710 }, { "epoch": 0.03, "learning_rate": 0.0002962206536869363, "loss": 0.0518, "step": 9720 }, { "epoch": 0.03, "learning_rate": 0.0002962167654705649, "loss": 0.055, "step": 9730 }, { "epoch": 0.03, "learning_rate": 0.0002962128772541934, "loss": 0.0492, "step": 9740 }, { "epoch": 0.03, "learning_rate": 0.00029620898903782197, "loss": 0.0436, "step": 9750 }, { "epoch": 0.03, "learning_rate": 0.0002962051008214505, "loss": 0.0577, "step": 9760 }, { "epoch": 0.03, "learning_rate": 0.000296201212605079, "loss": 0.0458, "step": 9770 }, { "epoch": 0.03, "learning_rate": 0.00029619732438870757, "loss": 0.1094, "step": 9780 }, { "epoch": 0.03, "learning_rate": 0.0002961934361723361, "loss": 0.0492, "step": 9790 }, { "epoch": 0.03, "learning_rate": 0.0002961895479559646, "loss": 0.0467, "step": 9800 }, { "epoch": 0.03, "learning_rate": 0.00029618565973959317, "loss": 0.0528, "step": 9810 }, { "epoch": 0.03, "learning_rate": 0.00029618177152322174, "loss": 0.0452, "step": 9820 }, { "epoch": 0.03, "learning_rate": 0.00029617788330685025, "loss": 0.0534, "step": 9830 }, { "epoch": 0.03, "learning_rate": 0.00029617399509047877, "loss": 0.0445, "step": 9840 }, { "epoch": 0.03, "learning_rate": 0.0002961701068741073, "loss": 0.0444, "step": 9850 }, { "epoch": 0.03, "learning_rate": 0.00029616621865773585, "loss": 0.0468, "step": 9860 }, { "epoch": 0.03, "learning_rate": 0.00029616233044136436, "loss": 0.0556, "step": 9870 }, { "epoch": 0.03, "learning_rate": 0.00029615844222499293, "loss": 0.0481, "step": 9880 }, { "epoch": 0.03, "learning_rate": 0.00029615455400862145, "loss": 0.0404, "step": 9890 }, { "epoch": 0.03, "learning_rate": 0.00029615066579225, "loss": 0.0458, "step": 9900 }, { "epoch": 0.03, "learning_rate": 0.00029614677757587853, "loss": 0.0492, "step": 9910 }, { "epoch": 0.03, "learning_rate": 0.00029614288935950704, "loss": 0.0374, "step": 9920 }, { "epoch": 0.03, "learning_rate": 0.00029613900114313556, "loss": 0.044, "step": 9930 }, { "epoch": 0.03, "learning_rate": 0.00029613511292676413, "loss": 0.0472, "step": 9940 }, { "epoch": 0.03, "learning_rate": 0.00029613122471039264, "loss": 0.0439, "step": 9950 }, { "epoch": 0.03, "learning_rate": 0.0002961273364940212, "loss": 0.0491, "step": 9960 }, { "epoch": 0.03, "learning_rate": 0.0002961234482776497, "loss": 0.0458, "step": 9970 }, { "epoch": 0.03, "learning_rate": 0.00029611956006127824, "loss": 0.0467, "step": 9980 }, { "epoch": 0.03, "learning_rate": 0.0002961156718449068, "loss": 0.0472, "step": 9990 }, { "epoch": 0.03, "learning_rate": 0.0002961117836285353, "loss": 0.0457, "step": 10000 }, { "epoch": 0.03, "eval_cer": 0.8818412503796516, "eval_loss": 0.03403039649128914, "eval_runtime": 107.5829, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.648, "step": 10000 }, { "epoch": 0.03, "learning_rate": 0.00029610789541216384, "loss": 0.0435, "step": 10010 }, { "epoch": 0.03, "learning_rate": 0.0002961040071957924, "loss": 0.0492, "step": 10020 }, { "epoch": 0.03, "learning_rate": 0.000296100118979421, "loss": 0.0422, "step": 10030 }, { "epoch": 0.03, "learning_rate": 0.0002960962307630495, "loss": 0.0445, "step": 10040 }, { "epoch": 0.03, "learning_rate": 0.000296092342546678, "loss": 0.0527, "step": 10050 }, { "epoch": 0.03, "learning_rate": 0.0002960884543303065, "loss": 0.0493, "step": 10060 }, { "epoch": 0.03, "learning_rate": 0.0002960845661139351, "loss": 0.0456, "step": 10070 }, { "epoch": 0.03, "learning_rate": 0.0002960806778975636, "loss": 0.0446, "step": 10080 }, { "epoch": 0.03, "learning_rate": 0.00029607678968119217, "loss": 0.0457, "step": 10090 }, { "epoch": 0.03, "learning_rate": 0.0002960729014648207, "loss": 0.0473, "step": 10100 }, { "epoch": 0.03, "learning_rate": 0.00029606901324844925, "loss": 0.0488, "step": 10110 }, { "epoch": 0.03, "learning_rate": 0.00029606512503207777, "loss": 0.0425, "step": 10120 }, { "epoch": 0.03, "learning_rate": 0.0002960612368157063, "loss": 0.0434, "step": 10130 }, { "epoch": 0.03, "learning_rate": 0.0002960573485993348, "loss": 0.0509, "step": 10140 }, { "epoch": 0.03, "learning_rate": 0.00029605346038296337, "loss": 0.0386, "step": 10150 }, { "epoch": 0.03, "learning_rate": 0.00029604957216659194, "loss": 0.0485, "step": 10160 }, { "epoch": 0.03, "learning_rate": 0.00029604568395022045, "loss": 0.0456, "step": 10170 }, { "epoch": 0.03, "learning_rate": 0.00029604179573384896, "loss": 0.0443, "step": 10180 }, { "epoch": 0.03, "learning_rate": 0.0002960379075174775, "loss": 0.044, "step": 10190 }, { "epoch": 0.03, "learning_rate": 0.00029603401930110605, "loss": 0.0485, "step": 10200 }, { "epoch": 0.03, "learning_rate": 0.00029603013108473456, "loss": 0.0542, "step": 10210 }, { "epoch": 0.03, "learning_rate": 0.00029602624286836313, "loss": 0.05, "step": 10220 }, { "epoch": 0.03, "learning_rate": 0.00029602235465199165, "loss": 0.0417, "step": 10230 }, { "epoch": 0.03, "learning_rate": 0.0002960184664356202, "loss": 0.0518, "step": 10240 }, { "epoch": 0.03, "learning_rate": 0.00029601457821924873, "loss": 0.0441, "step": 10250 }, { "epoch": 0.03, "learning_rate": 0.00029601069000287724, "loss": 0.0403, "step": 10260 }, { "epoch": 0.03, "learning_rate": 0.00029600680178650576, "loss": 0.0421, "step": 10270 }, { "epoch": 0.03, "learning_rate": 0.0002960029135701343, "loss": 0.0424, "step": 10280 }, { "epoch": 0.03, "learning_rate": 0.00029599902535376284, "loss": 0.0642, "step": 10290 }, { "epoch": 0.03, "learning_rate": 0.0002959951371373914, "loss": 0.0554, "step": 10300 }, { "epoch": 0.03, "learning_rate": 0.0002959912489210199, "loss": 0.0489, "step": 10310 }, { "epoch": 0.03, "learning_rate": 0.0002959873607046485, "loss": 0.0455, "step": 10320 }, { "epoch": 0.03, "learning_rate": 0.000295983472488277, "loss": 0.0445, "step": 10330 }, { "epoch": 0.03, "learning_rate": 0.0002959795842719055, "loss": 0.0461, "step": 10340 }, { "epoch": 0.03, "learning_rate": 0.00029597569605553404, "loss": 0.046, "step": 10350 }, { "epoch": 0.03, "learning_rate": 0.0002959718078391626, "loss": 0.0435, "step": 10360 }, { "epoch": 0.03, "learning_rate": 0.0002959679196227912, "loss": 0.0499, "step": 10370 }, { "epoch": 0.03, "learning_rate": 0.0002959640314064197, "loss": 0.0392, "step": 10380 }, { "epoch": 0.03, "learning_rate": 0.0002959601431900482, "loss": 0.0497, "step": 10390 }, { "epoch": 0.03, "learning_rate": 0.00029595625497367677, "loss": 0.0461, "step": 10400 }, { "epoch": 0.03, "learning_rate": 0.0002959523667573053, "loss": 0.0398, "step": 10410 }, { "epoch": 0.03, "learning_rate": 0.0002959484785409338, "loss": 0.0432, "step": 10420 }, { "epoch": 0.03, "learning_rate": 0.00029594459032456237, "loss": 0.045, "step": 10430 }, { "epoch": 0.03, "learning_rate": 0.0002959407021081909, "loss": 0.0415, "step": 10440 }, { "epoch": 0.03, "learning_rate": 0.00029593681389181945, "loss": 0.044, "step": 10450 }, { "epoch": 0.03, "learning_rate": 0.00029593292567544797, "loss": 0.0503, "step": 10460 }, { "epoch": 0.03, "learning_rate": 0.0002959290374590765, "loss": 0.0544, "step": 10470 }, { "epoch": 0.03, "learning_rate": 0.000295925149242705, "loss": 0.0492, "step": 10480 }, { "epoch": 0.03, "learning_rate": 0.00029592126102633357, "loss": 0.0691, "step": 10490 }, { "epoch": 0.03, "learning_rate": 0.0002959173728099621, "loss": 0.0529, "step": 10500 }, { "epoch": 0.03, "learning_rate": 0.00029591348459359065, "loss": 0.0467, "step": 10510 }, { "epoch": 0.03, "learning_rate": 0.00029590959637721916, "loss": 0.0417, "step": 10520 }, { "epoch": 0.03, "learning_rate": 0.00029590570816084773, "loss": 0.0425, "step": 10530 }, { "epoch": 0.03, "learning_rate": 0.00029590181994447625, "loss": 0.0381, "step": 10540 }, { "epoch": 0.03, "learning_rate": 0.00029589793172810476, "loss": 0.0384, "step": 10550 }, { "epoch": 0.03, "learning_rate": 0.00029589404351173333, "loss": 0.044, "step": 10560 }, { "epoch": 0.03, "learning_rate": 0.00029589015529536184, "loss": 0.0468, "step": 10570 }, { "epoch": 0.03, "learning_rate": 0.0002958862670789904, "loss": 0.0444, "step": 10580 }, { "epoch": 0.03, "learning_rate": 0.00029588237886261893, "loss": 0.0466, "step": 10590 }, { "epoch": 0.03, "learning_rate": 0.00029587849064624744, "loss": 0.0451, "step": 10600 }, { "epoch": 0.03, "learning_rate": 0.000295874602429876, "loss": 0.0418, "step": 10610 }, { "epoch": 0.03, "learning_rate": 0.0002958707142135045, "loss": 0.0418, "step": 10620 }, { "epoch": 0.03, "learning_rate": 0.00029586682599713304, "loss": 0.0424, "step": 10630 }, { "epoch": 0.03, "learning_rate": 0.0002958629377807616, "loss": 0.0436, "step": 10640 }, { "epoch": 0.03, "learning_rate": 0.0002958590495643901, "loss": 0.0419, "step": 10650 }, { "epoch": 0.03, "learning_rate": 0.0002958551613480187, "loss": 0.0452, "step": 10660 }, { "epoch": 0.03, "learning_rate": 0.0002958512731316472, "loss": 0.0489, "step": 10670 }, { "epoch": 0.03, "learning_rate": 0.0002958473849152757, "loss": 0.0448, "step": 10680 }, { "epoch": 0.03, "learning_rate": 0.00029584349669890424, "loss": 0.0521, "step": 10690 }, { "epoch": 0.03, "learning_rate": 0.0002958396084825328, "loss": 0.0412, "step": 10700 }, { "epoch": 0.03, "learning_rate": 0.00029583572026616137, "loss": 0.0454, "step": 10710 }, { "epoch": 0.03, "learning_rate": 0.0002958318320497899, "loss": 0.0402, "step": 10720 }, { "epoch": 0.03, "learning_rate": 0.0002958279438334184, "loss": 0.0442, "step": 10730 }, { "epoch": 0.03, "learning_rate": 0.00029582405561704697, "loss": 0.0503, "step": 10740 }, { "epoch": 0.03, "learning_rate": 0.0002958201674006755, "loss": 0.0504, "step": 10750 }, { "epoch": 0.03, "learning_rate": 0.000295816279184304, "loss": 0.0433, "step": 10760 }, { "epoch": 0.03, "learning_rate": 0.00029581239096793257, "loss": 0.0408, "step": 10770 }, { "epoch": 0.03, "learning_rate": 0.0002958085027515611, "loss": 0.0396, "step": 10780 }, { "epoch": 0.03, "learning_rate": 0.00029580461453518965, "loss": 0.0405, "step": 10790 }, { "epoch": 0.03, "learning_rate": 0.00029580072631881817, "loss": 0.0524, "step": 10800 }, { "epoch": 0.03, "learning_rate": 0.0002957968381024467, "loss": 0.0415, "step": 10810 }, { "epoch": 0.03, "learning_rate": 0.00029579294988607525, "loss": 0.0455, "step": 10820 }, { "epoch": 0.03, "learning_rate": 0.00029578906166970376, "loss": 0.0509, "step": 10830 }, { "epoch": 0.03, "learning_rate": 0.0002957851734533323, "loss": 0.0473, "step": 10840 }, { "epoch": 0.03, "learning_rate": 0.00029578128523696085, "loss": 0.0423, "step": 10850 }, { "epoch": 0.03, "learning_rate": 0.0002957773970205894, "loss": 0.0435, "step": 10860 }, { "epoch": 0.03, "learning_rate": 0.00029577350880421793, "loss": 0.0502, "step": 10870 }, { "epoch": 0.03, "learning_rate": 0.00029576962058784645, "loss": 0.0432, "step": 10880 }, { "epoch": 0.03, "learning_rate": 0.00029576573237147496, "loss": 0.0449, "step": 10890 }, { "epoch": 0.03, "learning_rate": 0.00029576184415510353, "loss": 0.0394, "step": 10900 }, { "epoch": 0.03, "learning_rate": 0.00029575795593873204, "loss": 0.048, "step": 10910 }, { "epoch": 0.03, "learning_rate": 0.0002957540677223606, "loss": 0.0475, "step": 10920 }, { "epoch": 0.03, "learning_rate": 0.0002957501795059891, "loss": 0.0491, "step": 10930 }, { "epoch": 0.03, "learning_rate": 0.00029574629128961764, "loss": 0.0499, "step": 10940 }, { "epoch": 0.03, "learning_rate": 0.0002957424030732462, "loss": 0.0462, "step": 10950 }, { "epoch": 0.03, "learning_rate": 0.0002957385148568747, "loss": 0.0449, "step": 10960 }, { "epoch": 0.03, "learning_rate": 0.00029573462664050324, "loss": 0.0464, "step": 10970 }, { "epoch": 0.03, "learning_rate": 0.0002957307384241318, "loss": 0.046, "step": 10980 }, { "epoch": 0.03, "learning_rate": 0.0002957268502077603, "loss": 0.0445, "step": 10990 }, { "epoch": 0.03, "learning_rate": 0.0002957229619913889, "loss": 0.0443, "step": 11000 }, { "epoch": 0.03, "eval_cer": 0.8817390768834564, "eval_loss": 0.03759730979800224, "eval_runtime": 108.4369, "eval_samples_per_second": 18.444, "eval_steps_per_second": 4.611, "step": 11000 }, { "epoch": 0.03, "learning_rate": 0.0002957190737750174, "loss": 0.0462, "step": 11010 }, { "epoch": 0.03, "learning_rate": 0.0002957151855586459, "loss": 0.0469, "step": 11020 }, { "epoch": 0.03, "learning_rate": 0.0002957112973422745, "loss": 0.0517, "step": 11030 }, { "epoch": 0.03, "learning_rate": 0.000295707409125903, "loss": 0.0469, "step": 11040 }, { "epoch": 0.03, "learning_rate": 0.0002957035209095315, "loss": 0.0513, "step": 11050 }, { "epoch": 0.03, "learning_rate": 0.0002956996326931601, "loss": 0.0538, "step": 11060 }, { "epoch": 0.03, "learning_rate": 0.00029569574447678865, "loss": 0.0448, "step": 11070 }, { "epoch": 0.03, "learning_rate": 0.00029569185626041717, "loss": 0.0473, "step": 11080 }, { "epoch": 0.03, "learning_rate": 0.0002956879680440457, "loss": 0.0456, "step": 11090 }, { "epoch": 0.03, "learning_rate": 0.0002956840798276742, "loss": 0.0501, "step": 11100 }, { "epoch": 0.03, "learning_rate": 0.00029568019161130277, "loss": 0.0632, "step": 11110 }, { "epoch": 0.03, "learning_rate": 0.0002956763033949313, "loss": 0.0435, "step": 11120 }, { "epoch": 0.03, "learning_rate": 0.00029567241517855985, "loss": 0.0449, "step": 11130 }, { "epoch": 0.03, "learning_rate": 0.00029566852696218837, "loss": 0.0415, "step": 11140 }, { "epoch": 0.03, "learning_rate": 0.00029566463874581693, "loss": 0.0527, "step": 11150 }, { "epoch": 0.03, "learning_rate": 0.00029566075052944545, "loss": 0.0509, "step": 11160 }, { "epoch": 0.03, "learning_rate": 0.00029565686231307396, "loss": 0.0489, "step": 11170 }, { "epoch": 0.03, "learning_rate": 0.0002956529740967025, "loss": 0.0446, "step": 11180 }, { "epoch": 0.03, "learning_rate": 0.00029564908588033105, "loss": 0.0554, "step": 11190 }, { "epoch": 0.03, "learning_rate": 0.00029564519766395956, "loss": 0.0504, "step": 11200 }, { "epoch": 0.03, "learning_rate": 0.00029564130944758813, "loss": 0.0527, "step": 11210 }, { "epoch": 0.03, "learning_rate": 0.00029563742123121664, "loss": 0.0553, "step": 11220 }, { "epoch": 0.03, "learning_rate": 0.00029563353301484516, "loss": 0.0456, "step": 11230 }, { "epoch": 0.03, "learning_rate": 0.00029562964479847373, "loss": 0.051, "step": 11240 }, { "epoch": 0.03, "learning_rate": 0.00029562575658210224, "loss": 0.0476, "step": 11250 }, { "epoch": 0.03, "learning_rate": 0.0002956218683657308, "loss": 0.0429, "step": 11260 }, { "epoch": 0.03, "learning_rate": 0.0002956179801493593, "loss": 0.044, "step": 11270 }, { "epoch": 0.03, "learning_rate": 0.0002956140919329879, "loss": 0.0444, "step": 11280 }, { "epoch": 0.03, "learning_rate": 0.0002956102037166164, "loss": 0.039, "step": 11290 }, { "epoch": 0.03, "learning_rate": 0.0002956063155002449, "loss": 0.0483, "step": 11300 }, { "epoch": 0.03, "learning_rate": 0.00029560242728387344, "loss": 0.0433, "step": 11310 }, { "epoch": 0.03, "learning_rate": 0.000295598539067502, "loss": 0.044, "step": 11320 }, { "epoch": 0.03, "learning_rate": 0.0002955946508511305, "loss": 0.0446, "step": 11330 }, { "epoch": 0.03, "learning_rate": 0.0002955907626347591, "loss": 0.0466, "step": 11340 }, { "epoch": 0.03, "learning_rate": 0.0002955868744183876, "loss": 0.0429, "step": 11350 }, { "epoch": 0.03, "learning_rate": 0.00029558298620201617, "loss": 0.0442, "step": 11360 }, { "epoch": 0.03, "learning_rate": 0.0002955790979856447, "loss": 0.0403, "step": 11370 }, { "epoch": 0.03, "learning_rate": 0.0002955752097692732, "loss": 0.0422, "step": 11380 }, { "epoch": 0.03, "learning_rate": 0.0002955713215529017, "loss": 0.0347, "step": 11390 }, { "epoch": 0.03, "learning_rate": 0.0002955674333365303, "loss": 0.042, "step": 11400 }, { "epoch": 0.03, "learning_rate": 0.00029556354512015885, "loss": 0.0464, "step": 11410 }, { "epoch": 0.03, "learning_rate": 0.00029555965690378737, "loss": 0.0463, "step": 11420 }, { "epoch": 0.03, "learning_rate": 0.0002955557686874159, "loss": 0.0424, "step": 11430 }, { "epoch": 0.03, "learning_rate": 0.0002955518804710444, "loss": 0.0439, "step": 11440 }, { "epoch": 0.03, "learning_rate": 0.00029554799225467297, "loss": 0.051, "step": 11450 }, { "epoch": 0.03, "learning_rate": 0.0002955441040383015, "loss": 0.0438, "step": 11460 }, { "epoch": 0.03, "learning_rate": 0.00029554021582193005, "loss": 0.0456, "step": 11470 }, { "epoch": 0.03, "learning_rate": 0.00029553632760555856, "loss": 0.0438, "step": 11480 }, { "epoch": 0.03, "learning_rate": 0.00029553243938918713, "loss": 0.0413, "step": 11490 }, { "epoch": 0.03, "learning_rate": 0.00029552855117281565, "loss": 0.0466, "step": 11500 }, { "epoch": 0.03, "learning_rate": 0.00029552466295644416, "loss": 0.0451, "step": 11510 }, { "epoch": 0.03, "learning_rate": 0.0002955207747400727, "loss": 0.0427, "step": 11520 }, { "epoch": 0.03, "learning_rate": 0.00029551688652370125, "loss": 0.0446, "step": 11530 }, { "epoch": 0.03, "learning_rate": 0.00029551299830732976, "loss": 0.0362, "step": 11540 }, { "epoch": 0.03, "learning_rate": 0.00029550911009095833, "loss": 0.0376, "step": 11550 }, { "epoch": 0.03, "learning_rate": 0.00029550522187458684, "loss": 0.0351, "step": 11560 }, { "epoch": 0.03, "learning_rate": 0.0002955013336582154, "loss": 0.0348, "step": 11570 }, { "epoch": 0.03, "learning_rate": 0.0002954974454418439, "loss": 0.0353, "step": 11580 }, { "epoch": 0.03, "learning_rate": 0.00029549355722547244, "loss": 0.0361, "step": 11590 }, { "epoch": 0.03, "learning_rate": 0.00029548966900910096, "loss": 0.0448, "step": 11600 }, { "epoch": 0.03, "learning_rate": 0.0002954857807927295, "loss": 0.0392, "step": 11610 }, { "epoch": 0.03, "learning_rate": 0.0002954818925763581, "loss": 0.0391, "step": 11620 }, { "epoch": 0.03, "learning_rate": 0.0002954780043599866, "loss": 0.0462, "step": 11630 }, { "epoch": 0.03, "learning_rate": 0.0002954741161436151, "loss": 0.0445, "step": 11640 }, { "epoch": 0.03, "learning_rate": 0.0002954702279272437, "loss": 0.0468, "step": 11650 }, { "epoch": 0.03, "learning_rate": 0.0002954663397108722, "loss": 0.046, "step": 11660 }, { "epoch": 0.03, "learning_rate": 0.0002954624514945007, "loss": 0.0475, "step": 11670 }, { "epoch": 0.03, "learning_rate": 0.0002954585632781293, "loss": 0.0418, "step": 11680 }, { "epoch": 0.03, "learning_rate": 0.0002954546750617578, "loss": 0.0418, "step": 11690 }, { "epoch": 0.03, "learning_rate": 0.00029545078684538637, "loss": 0.0466, "step": 11700 }, { "epoch": 0.03, "learning_rate": 0.0002954468986290149, "loss": 0.0441, "step": 11710 }, { "epoch": 0.03, "learning_rate": 0.0002954430104126434, "loss": 0.0455, "step": 11720 }, { "epoch": 0.03, "learning_rate": 0.0002954391221962719, "loss": 0.0395, "step": 11730 }, { "epoch": 0.03, "learning_rate": 0.0002954352339799005, "loss": 0.0817, "step": 11740 }, { "epoch": 0.03, "learning_rate": 0.00029543134576352905, "loss": 0.0446, "step": 11750 }, { "epoch": 0.03, "learning_rate": 0.00029542745754715757, "loss": 0.0474, "step": 11760 }, { "epoch": 0.03, "learning_rate": 0.0002954235693307861, "loss": 0.0458, "step": 11770 }, { "epoch": 0.03, "learning_rate": 0.00029541968111441465, "loss": 0.0439, "step": 11780 }, { "epoch": 0.03, "learning_rate": 0.00029541579289804316, "loss": 0.0462, "step": 11790 }, { "epoch": 0.03, "learning_rate": 0.0002954119046816717, "loss": 0.0359, "step": 11800 }, { "epoch": 0.03, "learning_rate": 0.00029540801646530025, "loss": 0.0424, "step": 11810 }, { "epoch": 0.03, "learning_rate": 0.00029540412824892876, "loss": 0.0409, "step": 11820 }, { "epoch": 0.03, "learning_rate": 0.00029540024003255733, "loss": 0.051, "step": 11830 }, { "epoch": 0.03, "learning_rate": 0.00029539635181618585, "loss": 0.0454, "step": 11840 }, { "epoch": 0.03, "learning_rate": 0.00029539246359981436, "loss": 0.0431, "step": 11850 }, { "epoch": 0.03, "learning_rate": 0.00029538857538344293, "loss": 0.0403, "step": 11860 }, { "epoch": 0.03, "learning_rate": 0.00029538468716707144, "loss": 0.0391, "step": 11870 }, { "epoch": 0.03, "learning_rate": 0.00029538079895069996, "loss": 0.0435, "step": 11880 }, { "epoch": 0.03, "learning_rate": 0.00029537691073432853, "loss": 0.0423, "step": 11890 }, { "epoch": 0.03, "learning_rate": 0.0002953730225179571, "loss": 0.0342, "step": 11900 }, { "epoch": 0.03, "learning_rate": 0.0002953691343015856, "loss": 0.0467, "step": 11910 }, { "epoch": 0.03, "learning_rate": 0.0002953652460852141, "loss": 0.0425, "step": 11920 }, { "epoch": 0.03, "learning_rate": 0.00029536135786884264, "loss": 0.0409, "step": 11930 }, { "epoch": 0.03, "learning_rate": 0.00029535746965247115, "loss": 0.037, "step": 11940 }, { "epoch": 0.03, "learning_rate": 0.0002953535814360997, "loss": 0.0475, "step": 11950 }, { "epoch": 0.03, "learning_rate": 0.0002953496932197283, "loss": 0.0373, "step": 11960 }, { "epoch": 0.03, "learning_rate": 0.0002953458050033568, "loss": 0.0442, "step": 11970 }, { "epoch": 0.03, "learning_rate": 0.0002953419167869853, "loss": 0.0467, "step": 11980 }, { "epoch": 0.03, "learning_rate": 0.0002953380285706139, "loss": 0.0423, "step": 11990 }, { "epoch": 0.03, "learning_rate": 0.0002953341403542424, "loss": 0.0465, "step": 12000 }, { "epoch": 0.03, "eval_cer": 0.8818370514688489, "eval_loss": 0.03303086385130882, "eval_runtime": 107.7286, "eval_samples_per_second": 18.565, "eval_steps_per_second": 4.641, "step": 12000 }, { "epoch": 0.03, "learning_rate": 0.0002953302521378709, "loss": 0.0466, "step": 12010 }, { "epoch": 0.03, "learning_rate": 0.0002953263639214995, "loss": 0.0404, "step": 12020 }, { "epoch": 0.03, "learning_rate": 0.000295322475705128, "loss": 0.0449, "step": 12030 }, { "epoch": 0.03, "learning_rate": 0.00029531858748875657, "loss": 0.0454, "step": 12040 }, { "epoch": 0.03, "learning_rate": 0.0002953146992723851, "loss": 0.0506, "step": 12050 }, { "epoch": 0.03, "learning_rate": 0.0002953108110560136, "loss": 0.0417, "step": 12060 }, { "epoch": 0.03, "learning_rate": 0.00029530692283964217, "loss": 0.0382, "step": 12070 }, { "epoch": 0.03, "learning_rate": 0.0002953030346232707, "loss": 0.0414, "step": 12080 }, { "epoch": 0.03, "learning_rate": 0.0002952991464068992, "loss": 0.0429, "step": 12090 }, { "epoch": 0.03, "learning_rate": 0.00029529525819052777, "loss": 0.039, "step": 12100 }, { "epoch": 0.03, "learning_rate": 0.00029529136997415633, "loss": 0.0418, "step": 12110 }, { "epoch": 0.03, "learning_rate": 0.00029528748175778485, "loss": 0.0458, "step": 12120 }, { "epoch": 0.03, "learning_rate": 0.00029528359354141336, "loss": 0.0449, "step": 12130 }, { "epoch": 0.03, "learning_rate": 0.0002952797053250419, "loss": 0.0387, "step": 12140 }, { "epoch": 0.03, "learning_rate": 0.00029527581710867045, "loss": 0.0439, "step": 12150 }, { "epoch": 0.03, "learning_rate": 0.00029527192889229896, "loss": 0.0375, "step": 12160 }, { "epoch": 0.03, "learning_rate": 0.00029526804067592753, "loss": 0.0394, "step": 12170 }, { "epoch": 0.03, "learning_rate": 0.00029526415245955604, "loss": 0.0427, "step": 12180 }, { "epoch": 0.03, "learning_rate": 0.00029526026424318456, "loss": 0.0395, "step": 12190 }, { "epoch": 0.03, "learning_rate": 0.00029525637602681313, "loss": 0.0553, "step": 12200 }, { "epoch": 0.03, "learning_rate": 0.00029525248781044164, "loss": 0.0489, "step": 12210 }, { "epoch": 0.03, "learning_rate": 0.00029524859959407016, "loss": 0.0444, "step": 12220 }, { "epoch": 0.03, "learning_rate": 0.0002952447113776987, "loss": 0.0469, "step": 12230 }, { "epoch": 0.03, "learning_rate": 0.00029524082316132724, "loss": 0.0504, "step": 12240 }, { "epoch": 0.03, "learning_rate": 0.0002952369349449558, "loss": 0.0476, "step": 12250 }, { "epoch": 0.03, "learning_rate": 0.0002952330467285843, "loss": 0.0459, "step": 12260 }, { "epoch": 0.03, "learning_rate": 0.00029522915851221284, "loss": 0.0454, "step": 12270 }, { "epoch": 0.03, "learning_rate": 0.0002952252702958414, "loss": 0.05, "step": 12280 }, { "epoch": 0.03, "learning_rate": 0.0002952213820794699, "loss": 0.0419, "step": 12290 }, { "epoch": 0.03, "learning_rate": 0.0002952174938630985, "loss": 0.0439, "step": 12300 }, { "epoch": 0.03, "learning_rate": 0.000295213605646727, "loss": 0.0415, "step": 12310 }, { "epoch": 0.03, "learning_rate": 0.0002952097174303556, "loss": 0.0414, "step": 12320 }, { "epoch": 0.03, "learning_rate": 0.0002952058292139841, "loss": 0.0408, "step": 12330 }, { "epoch": 0.03, "learning_rate": 0.0002952019409976126, "loss": 0.0384, "step": 12340 }, { "epoch": 0.03, "learning_rate": 0.0002951980527812411, "loss": 0.0408, "step": 12350 }, { "epoch": 0.03, "learning_rate": 0.0002951941645648697, "loss": 0.0429, "step": 12360 }, { "epoch": 0.03, "learning_rate": 0.0002951902763484982, "loss": 0.0458, "step": 12370 }, { "epoch": 0.03, "learning_rate": 0.00029518638813212677, "loss": 0.0452, "step": 12380 }, { "epoch": 0.03, "learning_rate": 0.0002951824999157553, "loss": 0.0491, "step": 12390 }, { "epoch": 0.03, "learning_rate": 0.00029517861169938385, "loss": 0.0449, "step": 12400 }, { "epoch": 0.03, "learning_rate": 0.00029517472348301237, "loss": 0.0523, "step": 12410 }, { "epoch": 0.03, "learning_rate": 0.0002951708352666409, "loss": 0.0483, "step": 12420 }, { "epoch": 0.03, "learning_rate": 0.0002951669470502694, "loss": 0.0446, "step": 12430 }, { "epoch": 0.03, "learning_rate": 0.00029516305883389796, "loss": 0.0367, "step": 12440 }, { "epoch": 0.03, "learning_rate": 0.00029515917061752653, "loss": 0.0387, "step": 12450 }, { "epoch": 0.03, "learning_rate": 0.00029515528240115505, "loss": 0.0399, "step": 12460 }, { "epoch": 0.03, "learning_rate": 0.00029515139418478356, "loss": 0.0317, "step": 12470 }, { "epoch": 0.03, "learning_rate": 0.0002951475059684121, "loss": 0.0417, "step": 12480 }, { "epoch": 0.03, "learning_rate": 0.00029514361775204065, "loss": 0.0403, "step": 12490 }, { "epoch": 0.03, "learning_rate": 0.00029513972953566916, "loss": 0.0449, "step": 12500 }, { "epoch": 0.03, "learning_rate": 0.00029513584131929773, "loss": 0.0367, "step": 12510 }, { "epoch": 0.03, "learning_rate": 0.00029513195310292624, "loss": 0.041, "step": 12520 }, { "epoch": 0.03, "learning_rate": 0.0002951280648865548, "loss": 0.0453, "step": 12530 }, { "epoch": 0.03, "learning_rate": 0.0002951241766701833, "loss": 0.0404, "step": 12540 }, { "epoch": 0.03, "learning_rate": 0.00029512028845381184, "loss": 0.043, "step": 12550 }, { "epoch": 0.03, "learning_rate": 0.00029511640023744036, "loss": 0.0469, "step": 12560 }, { "epoch": 0.03, "learning_rate": 0.0002951125120210689, "loss": 0.0389, "step": 12570 }, { "epoch": 0.03, "learning_rate": 0.00029510862380469744, "loss": 0.0423, "step": 12580 }, { "epoch": 0.03, "learning_rate": 0.000295104735588326, "loss": 0.0414, "step": 12590 }, { "epoch": 0.03, "learning_rate": 0.0002951008473719545, "loss": 0.0354, "step": 12600 }, { "epoch": 0.03, "learning_rate": 0.0002950969591555831, "loss": 0.0559, "step": 12610 }, { "epoch": 0.03, "learning_rate": 0.0002950930709392116, "loss": 0.0433, "step": 12620 }, { "epoch": 0.03, "learning_rate": 0.0002950891827228401, "loss": 0.0452, "step": 12630 }, { "epoch": 0.03, "learning_rate": 0.00029508529450646863, "loss": 0.041, "step": 12640 }, { "epoch": 0.03, "learning_rate": 0.0002950814062900972, "loss": 0.0385, "step": 12650 }, { "epoch": 0.03, "learning_rate": 0.00029507751807372577, "loss": 0.0467, "step": 12660 }, { "epoch": 0.03, "learning_rate": 0.0002950736298573543, "loss": 0.0454, "step": 12670 }, { "epoch": 0.03, "learning_rate": 0.0002950697416409828, "loss": 0.0451, "step": 12680 }, { "epoch": 0.03, "learning_rate": 0.0002950658534246113, "loss": 0.0438, "step": 12690 }, { "epoch": 0.03, "learning_rate": 0.0002950619652082399, "loss": 0.04, "step": 12700 }, { "epoch": 0.03, "learning_rate": 0.0002950580769918684, "loss": 0.0424, "step": 12710 }, { "epoch": 0.03, "learning_rate": 0.00029505418877549697, "loss": 0.0344, "step": 12720 }, { "epoch": 0.03, "learning_rate": 0.0002950503005591255, "loss": 0.0397, "step": 12730 }, { "epoch": 0.03, "learning_rate": 0.00029504641234275405, "loss": 0.0547, "step": 12740 }, { "epoch": 0.03, "learning_rate": 0.00029504252412638257, "loss": 0.0465, "step": 12750 }, { "epoch": 0.03, "learning_rate": 0.0002950386359100111, "loss": 0.0445, "step": 12760 }, { "epoch": 0.03, "learning_rate": 0.0002950347476936396, "loss": 0.0349, "step": 12770 }, { "epoch": 0.03, "learning_rate": 0.00029503085947726816, "loss": 0.0463, "step": 12780 }, { "epoch": 0.03, "learning_rate": 0.0002950269712608967, "loss": 0.0474, "step": 12790 }, { "epoch": 0.03, "learning_rate": 0.00029502308304452525, "loss": 0.0468, "step": 12800 }, { "epoch": 0.03, "learning_rate": 0.00029501919482815376, "loss": 0.0438, "step": 12810 }, { "epoch": 0.03, "learning_rate": 0.00029501530661178233, "loss": 0.0379, "step": 12820 }, { "epoch": 0.03, "learning_rate": 0.00029501141839541084, "loss": 0.0392, "step": 12830 }, { "epoch": 0.03, "learning_rate": 0.00029500753017903936, "loss": 0.0373, "step": 12840 }, { "epoch": 0.03, "learning_rate": 0.00029500364196266793, "loss": 0.0379, "step": 12850 }, { "epoch": 0.03, "learning_rate": 0.00029499975374629644, "loss": 0.0399, "step": 12860 }, { "epoch": 0.03, "learning_rate": 0.000294995865529925, "loss": 0.0697, "step": 12870 }, { "epoch": 0.03, "learning_rate": 0.0002949919773135535, "loss": 0.044, "step": 12880 }, { "epoch": 0.03, "learning_rate": 0.00029498808909718204, "loss": 0.0547, "step": 12890 }, { "epoch": 0.03, "learning_rate": 0.0002949842008808106, "loss": 0.0418, "step": 12900 }, { "epoch": 0.03, "learning_rate": 0.0002949803126644391, "loss": 0.0382, "step": 12910 }, { "epoch": 0.03, "learning_rate": 0.00029497642444806764, "loss": 0.0419, "step": 12920 }, { "epoch": 0.03, "learning_rate": 0.0002949725362316962, "loss": 0.0372, "step": 12930 }, { "epoch": 0.03, "learning_rate": 0.0002949686480153247, "loss": 0.0394, "step": 12940 }, { "epoch": 0.03, "learning_rate": 0.0002949647597989533, "loss": 0.0428, "step": 12950 }, { "epoch": 0.03, "learning_rate": 0.0002949608715825818, "loss": 0.0479, "step": 12960 }, { "epoch": 0.03, "learning_rate": 0.0002949569833662103, "loss": 0.0435, "step": 12970 }, { "epoch": 0.03, "learning_rate": 0.00029495309514983883, "loss": 0.0362, "step": 12980 }, { "epoch": 0.03, "learning_rate": 0.0002949492069334674, "loss": 0.0365, "step": 12990 }, { "epoch": 0.03, "learning_rate": 0.00029494531871709597, "loss": 0.0465, "step": 13000 }, { "epoch": 0.03, "eval_cer": 0.8818286536472439, "eval_loss": 0.03343910351395607, "eval_runtime": 107.7406, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 13000 }, { "epoch": 0.03, "learning_rate": 0.0002949414305007245, "loss": 0.041, "step": 13010 }, { "epoch": 0.03, "learning_rate": 0.000294937542284353, "loss": 0.0397, "step": 13020 }, { "epoch": 0.03, "learning_rate": 0.00029493365406798157, "loss": 0.0431, "step": 13030 }, { "epoch": 0.03, "learning_rate": 0.0002949297658516101, "loss": 0.0354, "step": 13040 }, { "epoch": 0.03, "learning_rate": 0.0002949258776352386, "loss": 0.0428, "step": 13050 }, { "epoch": 0.03, "learning_rate": 0.00029492198941886717, "loss": 0.0375, "step": 13060 }, { "epoch": 0.03, "learning_rate": 0.0002949181012024957, "loss": 0.0462, "step": 13070 }, { "epoch": 0.03, "learning_rate": 0.00029491421298612425, "loss": 0.0419, "step": 13080 }, { "epoch": 0.03, "learning_rate": 0.00029491032476975276, "loss": 0.045, "step": 13090 }, { "epoch": 0.03, "learning_rate": 0.0002949064365533813, "loss": 0.0463, "step": 13100 }, { "epoch": 0.03, "learning_rate": 0.00029490254833700985, "loss": 0.0383, "step": 13110 }, { "epoch": 0.03, "learning_rate": 0.00029489866012063836, "loss": 0.0374, "step": 13120 }, { "epoch": 0.03, "learning_rate": 0.0002948947719042669, "loss": 0.0405, "step": 13130 }, { "epoch": 0.03, "learning_rate": 0.00029489088368789545, "loss": 0.0439, "step": 13140 }, { "epoch": 0.03, "learning_rate": 0.00029488699547152396, "loss": 0.0428, "step": 13150 }, { "epoch": 0.03, "learning_rate": 0.00029488310725515253, "loss": 0.0398, "step": 13160 }, { "epoch": 0.03, "learning_rate": 0.00029487921903878104, "loss": 0.0404, "step": 13170 }, { "epoch": 0.03, "learning_rate": 0.00029487533082240956, "loss": 0.0507, "step": 13180 }, { "epoch": 0.03, "learning_rate": 0.00029487144260603807, "loss": 0.0511, "step": 13190 }, { "epoch": 0.03, "learning_rate": 0.00029486755438966664, "loss": 0.0424, "step": 13200 }, { "epoch": 0.03, "learning_rate": 0.0002948636661732952, "loss": 0.0466, "step": 13210 }, { "epoch": 0.03, "learning_rate": 0.0002948597779569237, "loss": 0.0463, "step": 13220 }, { "epoch": 0.03, "learning_rate": 0.00029485588974055224, "loss": 0.0382, "step": 13230 }, { "epoch": 0.03, "learning_rate": 0.0002948520015241808, "loss": 0.0396, "step": 13240 }, { "epoch": 0.03, "learning_rate": 0.0002948481133078093, "loss": 0.0512, "step": 13250 }, { "epoch": 0.03, "learning_rate": 0.00029484422509143784, "loss": 0.0542, "step": 13260 }, { "epoch": 0.03, "learning_rate": 0.0002948403368750664, "loss": 0.0456, "step": 13270 }, { "epoch": 0.03, "learning_rate": 0.0002948364486586949, "loss": 0.0424, "step": 13280 }, { "epoch": 0.03, "learning_rate": 0.0002948325604423235, "loss": 0.0411, "step": 13290 }, { "epoch": 0.03, "learning_rate": 0.000294828672225952, "loss": 0.0407, "step": 13300 }, { "epoch": 0.03, "learning_rate": 0.0002948247840095805, "loss": 0.042, "step": 13310 }, { "epoch": 0.03, "learning_rate": 0.0002948208957932091, "loss": 0.0369, "step": 13320 }, { "epoch": 0.03, "learning_rate": 0.0002948170075768376, "loss": 0.0436, "step": 13330 }, { "epoch": 0.03, "learning_rate": 0.00029481311936046617, "loss": 0.0388, "step": 13340 }, { "epoch": 0.03, "learning_rate": 0.0002948092311440947, "loss": 0.0383, "step": 13350 }, { "epoch": 0.03, "learning_rate": 0.00029480534292772325, "loss": 0.0464, "step": 13360 }, { "epoch": 0.03, "learning_rate": 0.00029480145471135177, "loss": 0.0378, "step": 13370 }, { "epoch": 0.03, "learning_rate": 0.0002947975664949803, "loss": 0.0458, "step": 13380 }, { "epoch": 0.03, "learning_rate": 0.0002947936782786088, "loss": 0.0372, "step": 13390 }, { "epoch": 0.03, "learning_rate": 0.00029478979006223737, "loss": 0.0482, "step": 13400 }, { "epoch": 0.03, "learning_rate": 0.0002947859018458659, "loss": 0.0541, "step": 13410 }, { "epoch": 0.03, "learning_rate": 0.00029478201362949445, "loss": 0.0455, "step": 13420 }, { "epoch": 0.03, "learning_rate": 0.00029477812541312296, "loss": 0.0451, "step": 13430 }, { "epoch": 0.03, "learning_rate": 0.0002947742371967515, "loss": 0.0438, "step": 13440 }, { "epoch": 0.03, "learning_rate": 0.00029477034898038005, "loss": 0.043, "step": 13450 }, { "epoch": 0.03, "learning_rate": 0.00029476646076400856, "loss": 0.0399, "step": 13460 }, { "epoch": 0.03, "learning_rate": 0.0002947625725476371, "loss": 0.0447, "step": 13470 }, { "epoch": 0.03, "learning_rate": 0.00029475868433126564, "loss": 0.0419, "step": 13480 }, { "epoch": 0.03, "learning_rate": 0.0002947547961148942, "loss": 0.0441, "step": 13490 }, { "epoch": 0.03, "learning_rate": 0.00029475090789852273, "loss": 0.0536, "step": 13500 }, { "epoch": 0.04, "learning_rate": 0.00029474701968215124, "loss": 0.0491, "step": 13510 }, { "epoch": 0.04, "learning_rate": 0.00029474313146577976, "loss": 0.0452, "step": 13520 }, { "epoch": 0.04, "learning_rate": 0.0002947392432494083, "loss": 0.0517, "step": 13530 }, { "epoch": 0.04, "learning_rate": 0.00029473535503303684, "loss": 0.0495, "step": 13540 }, { "epoch": 0.04, "learning_rate": 0.0002947314668166654, "loss": 0.046, "step": 13550 }, { "epoch": 0.04, "learning_rate": 0.0002947275786002939, "loss": 0.0433, "step": 13560 }, { "epoch": 0.04, "learning_rate": 0.0002947236903839225, "loss": 0.0379, "step": 13570 }, { "epoch": 0.04, "learning_rate": 0.000294719802167551, "loss": 0.0471, "step": 13580 }, { "epoch": 0.04, "learning_rate": 0.0002947159139511795, "loss": 0.0474, "step": 13590 }, { "epoch": 0.04, "learning_rate": 0.00029471202573480804, "loss": 0.0483, "step": 13600 }, { "epoch": 0.04, "learning_rate": 0.0002947081375184366, "loss": 0.0387, "step": 13610 }, { "epoch": 0.04, "learning_rate": 0.0002947042493020651, "loss": 0.0467, "step": 13620 }, { "epoch": 0.04, "learning_rate": 0.0002947003610856937, "loss": 0.0396, "step": 13630 }, { "epoch": 0.04, "learning_rate": 0.0002946964728693222, "loss": 0.0433, "step": 13640 }, { "epoch": 0.04, "learning_rate": 0.0002946925846529507, "loss": 0.0434, "step": 13650 }, { "epoch": 0.04, "learning_rate": 0.0002946886964365793, "loss": 0.0452, "step": 13660 }, { "epoch": 0.04, "learning_rate": 0.0002946848082202078, "loss": 0.0363, "step": 13670 }, { "epoch": 0.04, "learning_rate": 0.0002946809200038363, "loss": 0.0527, "step": 13680 }, { "epoch": 0.04, "learning_rate": 0.0002946770317874649, "loss": 0.0581, "step": 13690 }, { "epoch": 0.04, "learning_rate": 0.00029467314357109345, "loss": 0.0486, "step": 13700 }, { "epoch": 0.04, "learning_rate": 0.00029466925535472197, "loss": 0.0425, "step": 13710 }, { "epoch": 0.04, "learning_rate": 0.0002946653671383505, "loss": 0.0411, "step": 13720 }, { "epoch": 0.04, "learning_rate": 0.000294661478921979, "loss": 0.0418, "step": 13730 }, { "epoch": 0.04, "learning_rate": 0.00029465759070560756, "loss": 0.037, "step": 13740 }, { "epoch": 0.04, "learning_rate": 0.0002946537024892361, "loss": 0.0554, "step": 13750 }, { "epoch": 0.04, "learning_rate": 0.00029464981427286465, "loss": 0.0383, "step": 13760 }, { "epoch": 0.04, "learning_rate": 0.00029464592605649316, "loss": 0.0416, "step": 13770 }, { "epoch": 0.04, "learning_rate": 0.00029464203784012173, "loss": 0.0443, "step": 13780 }, { "epoch": 0.04, "learning_rate": 0.00029463814962375025, "loss": 0.0395, "step": 13790 }, { "epoch": 0.04, "learning_rate": 0.00029463426140737876, "loss": 0.0361, "step": 13800 }, { "epoch": 0.04, "learning_rate": 0.0002946303731910073, "loss": 0.0396, "step": 13810 }, { "epoch": 0.04, "learning_rate": 0.00029462648497463584, "loss": 0.0374, "step": 13820 }, { "epoch": 0.04, "learning_rate": 0.00029462259675826436, "loss": 0.0421, "step": 13830 }, { "epoch": 0.04, "learning_rate": 0.0002946187085418929, "loss": 0.0422, "step": 13840 }, { "epoch": 0.04, "learning_rate": 0.00029461482032552144, "loss": 0.0475, "step": 13850 }, { "epoch": 0.04, "learning_rate": 0.00029461093210915, "loss": 0.0392, "step": 13860 }, { "epoch": 0.04, "learning_rate": 0.0002946070438927785, "loss": 0.0419, "step": 13870 }, { "epoch": 0.04, "learning_rate": 0.00029460315567640704, "loss": 0.0433, "step": 13880 }, { "epoch": 0.04, "learning_rate": 0.0002945992674600356, "loss": 0.0396, "step": 13890 }, { "epoch": 0.04, "learning_rate": 0.0002945953792436641, "loss": 0.0427, "step": 13900 }, { "epoch": 0.04, "learning_rate": 0.0002945914910272927, "loss": 0.0418, "step": 13910 }, { "epoch": 0.04, "learning_rate": 0.0002945876028109212, "loss": 0.0386, "step": 13920 }, { "epoch": 0.04, "learning_rate": 0.0002945837145945497, "loss": 0.0391, "step": 13930 }, { "epoch": 0.04, "learning_rate": 0.00029457982637817823, "loss": 0.0392, "step": 13940 }, { "epoch": 0.04, "learning_rate": 0.0002945759381618068, "loss": 0.0451, "step": 13950 }, { "epoch": 0.04, "learning_rate": 0.0002945720499454353, "loss": 0.0427, "step": 13960 }, { "epoch": 0.04, "learning_rate": 0.0002945681617290639, "loss": 0.0389, "step": 13970 }, { "epoch": 0.04, "learning_rate": 0.0002945642735126924, "loss": 0.0625, "step": 13980 }, { "epoch": 0.04, "learning_rate": 0.00029456038529632097, "loss": 0.0465, "step": 13990 }, { "epoch": 0.04, "learning_rate": 0.0002945564970799495, "loss": 0.0418, "step": 14000 }, { "epoch": 0.04, "eval_cer": 0.8818748416660718, "eval_loss": 0.031777381896972656, "eval_runtime": 107.6404, "eval_samples_per_second": 18.58, "eval_steps_per_second": 4.645, "step": 14000 }, { "epoch": 0.04, "learning_rate": 0.000294552608863578, "loss": 0.0604, "step": 14010 }, { "epoch": 0.04, "learning_rate": 0.0002945487206472065, "loss": 0.0609, "step": 14020 }, { "epoch": 0.04, "learning_rate": 0.0002945448324308351, "loss": 0.051, "step": 14030 }, { "epoch": 0.04, "learning_rate": 0.00029454094421446365, "loss": 0.0499, "step": 14040 }, { "epoch": 0.04, "learning_rate": 0.00029453705599809217, "loss": 0.0426, "step": 14050 }, { "epoch": 0.04, "learning_rate": 0.0002945331677817207, "loss": 0.0394, "step": 14060 }, { "epoch": 0.04, "learning_rate": 0.00029452927956534925, "loss": 0.0356, "step": 14070 }, { "epoch": 0.04, "learning_rate": 0.00029452539134897776, "loss": 0.0419, "step": 14080 }, { "epoch": 0.04, "learning_rate": 0.0002945215031326063, "loss": 0.0481, "step": 14090 }, { "epoch": 0.04, "learning_rate": 0.00029451761491623485, "loss": 0.0422, "step": 14100 }, { "epoch": 0.04, "learning_rate": 0.00029451372669986336, "loss": 0.0484, "step": 14110 }, { "epoch": 0.04, "learning_rate": 0.00029450983848349193, "loss": 0.048, "step": 14120 }, { "epoch": 0.04, "learning_rate": 0.00029450595026712044, "loss": 0.048, "step": 14130 }, { "epoch": 0.04, "learning_rate": 0.00029450206205074896, "loss": 0.0434, "step": 14140 }, { "epoch": 0.04, "learning_rate": 0.0002944981738343775, "loss": 0.048, "step": 14150 }, { "epoch": 0.04, "learning_rate": 0.00029449428561800604, "loss": 0.0381, "step": 14160 }, { "epoch": 0.04, "learning_rate": 0.00029449039740163456, "loss": 0.049, "step": 14170 }, { "epoch": 0.04, "learning_rate": 0.0002944865091852631, "loss": 0.0402, "step": 14180 }, { "epoch": 0.04, "learning_rate": 0.00029448262096889164, "loss": 0.0459, "step": 14190 }, { "epoch": 0.04, "learning_rate": 0.0002944787327525202, "loss": 0.0411, "step": 14200 }, { "epoch": 0.04, "learning_rate": 0.0002944748445361487, "loss": 0.0427, "step": 14210 }, { "epoch": 0.04, "learning_rate": 0.00029447095631977724, "loss": 0.0468, "step": 14220 }, { "epoch": 0.04, "learning_rate": 0.00029446706810340575, "loss": 0.0364, "step": 14230 }, { "epoch": 0.04, "learning_rate": 0.0002944631798870343, "loss": 0.0475, "step": 14240 }, { "epoch": 0.04, "learning_rate": 0.0002944592916706629, "loss": 0.0434, "step": 14250 }, { "epoch": 0.04, "learning_rate": 0.0002944554034542914, "loss": 0.0376, "step": 14260 }, { "epoch": 0.04, "learning_rate": 0.0002944515152379199, "loss": 0.0427, "step": 14270 }, { "epoch": 0.04, "learning_rate": 0.0002944476270215485, "loss": 0.0383, "step": 14280 }, { "epoch": 0.04, "learning_rate": 0.000294443738805177, "loss": 0.0546, "step": 14290 }, { "epoch": 0.04, "learning_rate": 0.0002944398505888055, "loss": 0.0434, "step": 14300 }, { "epoch": 0.04, "learning_rate": 0.0002944359623724341, "loss": 0.042, "step": 14310 }, { "epoch": 0.04, "learning_rate": 0.0002944320741560626, "loss": 0.0387, "step": 14320 }, { "epoch": 0.04, "learning_rate": 0.00029442818593969117, "loss": 0.0431, "step": 14330 }, { "epoch": 0.04, "learning_rate": 0.0002944242977233197, "loss": 0.0669, "step": 14340 }, { "epoch": 0.04, "learning_rate": 0.0002944204095069482, "loss": 0.0388, "step": 14350 }, { "epoch": 0.04, "learning_rate": 0.00029441652129057677, "loss": 0.0402, "step": 14360 }, { "epoch": 0.04, "learning_rate": 0.0002944126330742053, "loss": 0.0415, "step": 14370 }, { "epoch": 0.04, "learning_rate": 0.0002944087448578338, "loss": 0.038, "step": 14380 }, { "epoch": 0.04, "learning_rate": 0.00029440485664146236, "loss": 0.0456, "step": 14390 }, { "epoch": 0.04, "learning_rate": 0.0002944009684250909, "loss": 0.0446, "step": 14400 }, { "epoch": 0.04, "learning_rate": 0.00029439708020871945, "loss": 0.0364, "step": 14410 }, { "epoch": 0.04, "learning_rate": 0.00029439319199234796, "loss": 0.0492, "step": 14420 }, { "epoch": 0.04, "learning_rate": 0.0002943893037759765, "loss": 0.0389, "step": 14430 }, { "epoch": 0.04, "learning_rate": 0.00029438541555960505, "loss": 0.0368, "step": 14440 }, { "epoch": 0.04, "learning_rate": 0.00029438152734323356, "loss": 0.0439, "step": 14450 }, { "epoch": 0.04, "learning_rate": 0.00029437763912686213, "loss": 0.0417, "step": 14460 }, { "epoch": 0.04, "learning_rate": 0.00029437375091049064, "loss": 0.0384, "step": 14470 }, { "epoch": 0.04, "learning_rate": 0.00029436986269411916, "loss": 0.0442, "step": 14480 }, { "epoch": 0.04, "learning_rate": 0.0002943659744777477, "loss": 0.0466, "step": 14490 }, { "epoch": 0.04, "learning_rate": 0.00029436208626137624, "loss": 0.0407, "step": 14500 }, { "epoch": 0.04, "learning_rate": 0.00029435819804500476, "loss": 0.0419, "step": 14510 }, { "epoch": 0.04, "learning_rate": 0.0002943543098286333, "loss": 0.0443, "step": 14520 }, { "epoch": 0.04, "learning_rate": 0.0002943504216122619, "loss": 0.0698, "step": 14530 }, { "epoch": 0.04, "learning_rate": 0.0002943465333958904, "loss": 0.043, "step": 14540 }, { "epoch": 0.04, "learning_rate": 0.0002943426451795189, "loss": 0.0491, "step": 14550 }, { "epoch": 0.04, "learning_rate": 0.00029433875696314744, "loss": 0.0379, "step": 14560 }, { "epoch": 0.04, "learning_rate": 0.000294334868746776, "loss": 0.0411, "step": 14570 }, { "epoch": 0.04, "learning_rate": 0.0002943309805304045, "loss": 0.0388, "step": 14580 }, { "epoch": 0.04, "learning_rate": 0.0002943270923140331, "loss": 0.0518, "step": 14590 }, { "epoch": 0.04, "learning_rate": 0.0002943232040976616, "loss": 0.0646, "step": 14600 }, { "epoch": 0.04, "learning_rate": 0.00029431931588129017, "loss": 0.0381, "step": 14610 }, { "epoch": 0.04, "learning_rate": 0.0002943154276649187, "loss": 0.039, "step": 14620 }, { "epoch": 0.04, "learning_rate": 0.0002943115394485472, "loss": 0.038, "step": 14630 }, { "epoch": 0.04, "learning_rate": 0.0002943076512321757, "loss": 0.0462, "step": 14640 }, { "epoch": 0.04, "learning_rate": 0.0002943037630158043, "loss": 0.042, "step": 14650 }, { "epoch": 0.04, "learning_rate": 0.0002942998747994328, "loss": 0.0402, "step": 14660 }, { "epoch": 0.04, "learning_rate": 0.00029429598658306137, "loss": 0.0367, "step": 14670 }, { "epoch": 0.04, "learning_rate": 0.0002942920983666899, "loss": 0.0437, "step": 14680 }, { "epoch": 0.04, "learning_rate": 0.0002942882101503184, "loss": 0.0369, "step": 14690 }, { "epoch": 0.04, "learning_rate": 0.00029428432193394697, "loss": 0.0406, "step": 14700 }, { "epoch": 0.04, "learning_rate": 0.0002942804337175755, "loss": 0.0371, "step": 14710 }, { "epoch": 0.04, "learning_rate": 0.000294276545501204, "loss": 0.0411, "step": 14720 }, { "epoch": 0.04, "learning_rate": 0.00029427265728483256, "loss": 0.0397, "step": 14730 }, { "epoch": 0.04, "learning_rate": 0.00029426876906846113, "loss": 0.043, "step": 14740 }, { "epoch": 0.04, "learning_rate": 0.00029426488085208965, "loss": 0.0391, "step": 14750 }, { "epoch": 0.04, "learning_rate": 0.00029426099263571816, "loss": 0.0369, "step": 14760 }, { "epoch": 0.04, "learning_rate": 0.0002942571044193467, "loss": 0.0438, "step": 14770 }, { "epoch": 0.04, "learning_rate": 0.00029425321620297524, "loss": 0.05, "step": 14780 }, { "epoch": 0.04, "learning_rate": 0.00029424932798660376, "loss": 0.0418, "step": 14790 }, { "epoch": 0.04, "learning_rate": 0.00029424543977023233, "loss": 0.0398, "step": 14800 }, { "epoch": 0.04, "learning_rate": 0.00029424155155386084, "loss": 0.0422, "step": 14810 }, { "epoch": 0.04, "learning_rate": 0.0002942376633374894, "loss": 0.039, "step": 14820 }, { "epoch": 0.04, "learning_rate": 0.0002942337751211179, "loss": 0.0404, "step": 14830 }, { "epoch": 0.04, "learning_rate": 0.00029422988690474644, "loss": 0.0349, "step": 14840 }, { "epoch": 0.04, "learning_rate": 0.00029422599868837495, "loss": 0.0414, "step": 14850 }, { "epoch": 0.04, "learning_rate": 0.0002942221104720035, "loss": 0.0419, "step": 14860 }, { "epoch": 0.04, "learning_rate": 0.00029421822225563204, "loss": 0.0429, "step": 14870 }, { "epoch": 0.04, "learning_rate": 0.0002942143340392606, "loss": 0.0405, "step": 14880 }, { "epoch": 0.04, "learning_rate": 0.0002942104458228891, "loss": 0.0481, "step": 14890 }, { "epoch": 0.04, "learning_rate": 0.00029420655760651764, "loss": 0.0373, "step": 14900 }, { "epoch": 0.04, "learning_rate": 0.0002942026693901462, "loss": 0.0443, "step": 14910 }, { "epoch": 0.04, "learning_rate": 0.0002941987811737747, "loss": 0.0433, "step": 14920 }, { "epoch": 0.04, "learning_rate": 0.0002941948929574033, "loss": 0.0481, "step": 14930 }, { "epoch": 0.04, "learning_rate": 0.0002941910047410318, "loss": 0.0463, "step": 14940 }, { "epoch": 0.04, "learning_rate": 0.00029418711652466037, "loss": 0.0501, "step": 14950 }, { "epoch": 0.04, "learning_rate": 0.0002941832283082889, "loss": 0.0442, "step": 14960 }, { "epoch": 0.04, "learning_rate": 0.0002941793400919174, "loss": 0.0422, "step": 14970 }, { "epoch": 0.04, "learning_rate": 0.0002941754518755459, "loss": 0.0515, "step": 14980 }, { "epoch": 0.04, "learning_rate": 0.0002941715636591745, "loss": 0.0412, "step": 14990 }, { "epoch": 0.04, "learning_rate": 0.000294167675442803, "loss": 0.0378, "step": 15000 }, { "epoch": 0.04, "eval_cer": 0.8818076590932312, "eval_loss": 0.03137202188372612, "eval_runtime": 107.683, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 15000 }, { "epoch": 0.04, "learning_rate": 0.00029416378722643157, "loss": 0.0459, "step": 15010 }, { "epoch": 0.04, "learning_rate": 0.0002941598990100601, "loss": 0.0344, "step": 15020 }, { "epoch": 0.04, "learning_rate": 0.00029415601079368865, "loss": 0.0418, "step": 15030 }, { "epoch": 0.04, "learning_rate": 0.00029415212257731716, "loss": 0.0395, "step": 15040 }, { "epoch": 0.04, "learning_rate": 0.0002941482343609457, "loss": 0.0395, "step": 15050 }, { "epoch": 0.04, "learning_rate": 0.0002941443461445742, "loss": 0.0445, "step": 15060 }, { "epoch": 0.04, "learning_rate": 0.00029414045792820276, "loss": 0.0463, "step": 15070 }, { "epoch": 0.04, "learning_rate": 0.00029413656971183133, "loss": 0.0415, "step": 15080 }, { "epoch": 0.04, "learning_rate": 0.00029413268149545985, "loss": 0.044, "step": 15090 }, { "epoch": 0.04, "learning_rate": 0.00029412879327908836, "loss": 0.0357, "step": 15100 }, { "epoch": 0.04, "learning_rate": 0.00029412490506271693, "loss": 0.0415, "step": 15110 }, { "epoch": 0.04, "learning_rate": 0.00029412101684634544, "loss": 0.0421, "step": 15120 }, { "epoch": 0.04, "learning_rate": 0.00029411712862997396, "loss": 0.0426, "step": 15130 }, { "epoch": 0.04, "learning_rate": 0.0002941132404136025, "loss": 0.0444, "step": 15140 }, { "epoch": 0.04, "learning_rate": 0.00029410935219723104, "loss": 0.0384, "step": 15150 }, { "epoch": 0.04, "learning_rate": 0.0002941054639808596, "loss": 0.0538, "step": 15160 }, { "epoch": 0.04, "learning_rate": 0.0002941015757644881, "loss": 0.0441, "step": 15170 }, { "epoch": 0.04, "learning_rate": 0.00029409768754811664, "loss": 0.0439, "step": 15180 }, { "epoch": 0.04, "learning_rate": 0.00029409379933174515, "loss": 0.0468, "step": 15190 }, { "epoch": 0.04, "learning_rate": 0.0002940899111153737, "loss": 0.0479, "step": 15200 }, { "epoch": 0.04, "learning_rate": 0.00029408602289900224, "loss": 0.0427, "step": 15210 }, { "epoch": 0.04, "learning_rate": 0.0002940821346826308, "loss": 0.0373, "step": 15220 }, { "epoch": 0.04, "learning_rate": 0.0002940782464662593, "loss": 0.0442, "step": 15230 }, { "epoch": 0.04, "learning_rate": 0.0002940743582498879, "loss": 0.0475, "step": 15240 }, { "epoch": 0.04, "learning_rate": 0.0002940704700335164, "loss": 0.0501, "step": 15250 }, { "epoch": 0.04, "learning_rate": 0.0002940665818171449, "loss": 0.0431, "step": 15260 }, { "epoch": 0.04, "learning_rate": 0.00029406269360077343, "loss": 0.0407, "step": 15270 }, { "epoch": 0.04, "learning_rate": 0.000294058805384402, "loss": 0.0506, "step": 15280 }, { "epoch": 0.04, "learning_rate": 0.00029405491716803057, "loss": 0.0416, "step": 15290 }, { "epoch": 0.04, "learning_rate": 0.0002940510289516591, "loss": 0.0431, "step": 15300 }, { "epoch": 0.04, "learning_rate": 0.0002940471407352876, "loss": 0.0457, "step": 15310 }, { "epoch": 0.04, "learning_rate": 0.00029404325251891617, "loss": 0.0432, "step": 15320 }, { "epoch": 0.04, "learning_rate": 0.0002940393643025447, "loss": 0.0412, "step": 15330 }, { "epoch": 0.04, "learning_rate": 0.0002940354760861732, "loss": 0.0355, "step": 15340 }, { "epoch": 0.04, "learning_rate": 0.00029403158786980177, "loss": 0.0439, "step": 15350 }, { "epoch": 0.04, "learning_rate": 0.0002940276996534303, "loss": 0.0419, "step": 15360 }, { "epoch": 0.04, "learning_rate": 0.00029402381143705885, "loss": 0.0392, "step": 15370 }, { "epoch": 0.04, "learning_rate": 0.00029401992322068736, "loss": 0.0348, "step": 15380 }, { "epoch": 0.04, "learning_rate": 0.0002940160350043159, "loss": 0.0445, "step": 15390 }, { "epoch": 0.04, "learning_rate": 0.0002940121467879444, "loss": 0.0373, "step": 15400 }, { "epoch": 0.04, "learning_rate": 0.00029400825857157296, "loss": 0.0367, "step": 15410 }, { "epoch": 0.04, "learning_rate": 0.0002940043703552015, "loss": 0.0375, "step": 15420 }, { "epoch": 0.04, "learning_rate": 0.00029400048213883004, "loss": 0.0389, "step": 15430 }, { "epoch": 0.04, "learning_rate": 0.00029399659392245856, "loss": 0.036, "step": 15440 }, { "epoch": 0.04, "learning_rate": 0.00029399270570608713, "loss": 0.0451, "step": 15450 }, { "epoch": 0.04, "learning_rate": 0.00029398881748971564, "loss": 0.0406, "step": 15460 }, { "epoch": 0.04, "learning_rate": 0.00029398492927334416, "loss": 0.055, "step": 15470 }, { "epoch": 0.04, "learning_rate": 0.0002939810410569727, "loss": 0.0409, "step": 15480 }, { "epoch": 0.04, "learning_rate": 0.00029397715284060124, "loss": 0.0401, "step": 15490 }, { "epoch": 0.04, "learning_rate": 0.0002939732646242298, "loss": 0.0379, "step": 15500 }, { "epoch": 0.04, "learning_rate": 0.0002939693764078583, "loss": 0.0387, "step": 15510 }, { "epoch": 0.04, "learning_rate": 0.00029396548819148684, "loss": 0.0393, "step": 15520 }, { "epoch": 0.04, "learning_rate": 0.0002939615999751154, "loss": 0.0347, "step": 15530 }, { "epoch": 0.04, "learning_rate": 0.0002939577117587439, "loss": 0.0438, "step": 15540 }, { "epoch": 0.04, "learning_rate": 0.00029395382354237244, "loss": 0.0399, "step": 15550 }, { "epoch": 0.04, "learning_rate": 0.000293949935326001, "loss": 0.0379, "step": 15560 }, { "epoch": 0.04, "learning_rate": 0.0002939460471096295, "loss": 0.0491, "step": 15570 }, { "epoch": 0.04, "learning_rate": 0.0002939421588932581, "loss": 0.0469, "step": 15580 }, { "epoch": 0.04, "learning_rate": 0.0002939382706768866, "loss": 0.0389, "step": 15590 }, { "epoch": 0.04, "learning_rate": 0.0002939343824605151, "loss": 0.0356, "step": 15600 }, { "epoch": 0.04, "learning_rate": 0.0002939304942441437, "loss": 0.0429, "step": 15610 }, { "epoch": 0.04, "learning_rate": 0.0002939266060277722, "loss": 0.0406, "step": 15620 }, { "epoch": 0.04, "learning_rate": 0.00029392271781140077, "loss": 0.0413, "step": 15630 }, { "epoch": 0.04, "learning_rate": 0.0002939188295950293, "loss": 0.0406, "step": 15640 }, { "epoch": 0.04, "learning_rate": 0.0002939149413786578, "loss": 0.0394, "step": 15650 }, { "epoch": 0.04, "learning_rate": 0.00029391105316228637, "loss": 0.0466, "step": 15660 }, { "epoch": 0.04, "learning_rate": 0.0002939071649459149, "loss": 0.0357, "step": 15670 }, { "epoch": 0.04, "learning_rate": 0.0002939032767295434, "loss": 0.0417, "step": 15680 }, { "epoch": 0.04, "learning_rate": 0.00029389938851317196, "loss": 0.0405, "step": 15690 }, { "epoch": 0.04, "learning_rate": 0.0002938955002968005, "loss": 0.0324, "step": 15700 }, { "epoch": 0.04, "learning_rate": 0.00029389161208042905, "loss": 0.0376, "step": 15710 }, { "epoch": 0.04, "learning_rate": 0.00029388772386405756, "loss": 0.0348, "step": 15720 }, { "epoch": 0.04, "learning_rate": 0.0002938838356476861, "loss": 0.0417, "step": 15730 }, { "epoch": 0.04, "learning_rate": 0.00029387994743131465, "loss": 0.042, "step": 15740 }, { "epoch": 0.04, "learning_rate": 0.00029387605921494316, "loss": 0.037, "step": 15750 }, { "epoch": 0.04, "learning_rate": 0.0002938721709985717, "loss": 0.0845, "step": 15760 }, { "epoch": 0.04, "learning_rate": 0.00029386828278220024, "loss": 0.0469, "step": 15770 }, { "epoch": 0.04, "learning_rate": 0.0002938643945658288, "loss": 0.048, "step": 15780 }, { "epoch": 0.04, "learning_rate": 0.0002938605063494573, "loss": 0.0423, "step": 15790 }, { "epoch": 0.04, "learning_rate": 0.00029385661813308584, "loss": 0.0448, "step": 15800 }, { "epoch": 0.04, "learning_rate": 0.00029385272991671436, "loss": 0.0631, "step": 15810 }, { "epoch": 0.04, "learning_rate": 0.0002938488417003429, "loss": 0.0448, "step": 15820 }, { "epoch": 0.04, "learning_rate": 0.00029384495348397144, "loss": 0.039, "step": 15830 }, { "epoch": 0.04, "learning_rate": 0.0002938410652676, "loss": 0.0412, "step": 15840 }, { "epoch": 0.04, "learning_rate": 0.0002938371770512285, "loss": 0.0431, "step": 15850 }, { "epoch": 0.04, "learning_rate": 0.0002938332888348571, "loss": 0.0392, "step": 15860 }, { "epoch": 0.04, "learning_rate": 0.0002938294006184856, "loss": 0.0384, "step": 15870 }, { "epoch": 0.04, "learning_rate": 0.0002938255124021141, "loss": 0.0443, "step": 15880 }, { "epoch": 0.04, "learning_rate": 0.00029382162418574263, "loss": 0.0388, "step": 15890 }, { "epoch": 0.04, "learning_rate": 0.0002938177359693712, "loss": 0.0378, "step": 15900 }, { "epoch": 0.04, "learning_rate": 0.0002938138477529997, "loss": 0.039, "step": 15910 }, { "epoch": 0.04, "learning_rate": 0.0002938099595366283, "loss": 0.0373, "step": 15920 }, { "epoch": 0.04, "learning_rate": 0.0002938060713202568, "loss": 0.0344, "step": 15930 }, { "epoch": 0.04, "learning_rate": 0.0002938021831038853, "loss": 0.04, "step": 15940 }, { "epoch": 0.04, "learning_rate": 0.0002937982948875139, "loss": 0.0326, "step": 15950 }, { "epoch": 0.04, "learning_rate": 0.0002937944066711424, "loss": 0.0343, "step": 15960 }, { "epoch": 0.04, "learning_rate": 0.0002937905184547709, "loss": 0.043, "step": 15970 }, { "epoch": 0.04, "learning_rate": 0.0002937866302383995, "loss": 0.0414, "step": 15980 }, { "epoch": 0.04, "learning_rate": 0.00029378274202202805, "loss": 0.0403, "step": 15990 }, { "epoch": 0.04, "learning_rate": 0.00029377885380565657, "loss": 0.0366, "step": 16000 }, { "epoch": 0.04, "eval_cer": 0.88186084529673, "eval_loss": 0.03012273460626602, "eval_runtime": 107.9461, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 16000 }, { "epoch": 0.04, "learning_rate": 0.0002937749655892851, "loss": 0.0375, "step": 16010 }, { "epoch": 0.04, "learning_rate": 0.0002937710773729136, "loss": 0.0422, "step": 16020 }, { "epoch": 0.04, "learning_rate": 0.00029376718915654216, "loss": 0.0427, "step": 16030 }, { "epoch": 0.04, "learning_rate": 0.0002937633009401707, "loss": 0.0419, "step": 16040 }, { "epoch": 0.04, "learning_rate": 0.00029375941272379925, "loss": 0.0427, "step": 16050 }, { "epoch": 0.04, "learning_rate": 0.00029375552450742776, "loss": 0.0404, "step": 16060 }, { "epoch": 0.04, "learning_rate": 0.00029375163629105633, "loss": 0.0365, "step": 16070 }, { "epoch": 0.04, "learning_rate": 0.00029374774807468484, "loss": 0.0372, "step": 16080 }, { "epoch": 0.04, "learning_rate": 0.00029374385985831336, "loss": 0.0384, "step": 16090 }, { "epoch": 0.04, "learning_rate": 0.0002937399716419419, "loss": 0.0423, "step": 16100 }, { "epoch": 0.04, "learning_rate": 0.00029373608342557044, "loss": 0.0354, "step": 16110 }, { "epoch": 0.04, "learning_rate": 0.000293732195209199, "loss": 0.0394, "step": 16120 }, { "epoch": 0.04, "learning_rate": 0.0002937283069928275, "loss": 0.0427, "step": 16130 }, { "epoch": 0.04, "learning_rate": 0.00029372441877645604, "loss": 0.0432, "step": 16140 }, { "epoch": 0.04, "learning_rate": 0.00029372053056008455, "loss": 0.0402, "step": 16150 }, { "epoch": 0.04, "learning_rate": 0.0002937166423437131, "loss": 0.0474, "step": 16160 }, { "epoch": 0.04, "learning_rate": 0.00029371275412734164, "loss": 0.0369, "step": 16170 }, { "epoch": 0.04, "learning_rate": 0.0002937088659109702, "loss": 0.0425, "step": 16180 }, { "epoch": 0.04, "learning_rate": 0.0002937049776945987, "loss": 0.0391, "step": 16190 }, { "epoch": 0.04, "learning_rate": 0.0002937010894782273, "loss": 0.0389, "step": 16200 }, { "epoch": 0.04, "learning_rate": 0.0002936972012618558, "loss": 0.0424, "step": 16210 }, { "epoch": 0.04, "learning_rate": 0.0002936933130454843, "loss": 0.0423, "step": 16220 }, { "epoch": 0.04, "learning_rate": 0.00029368942482911283, "loss": 0.0427, "step": 16230 }, { "epoch": 0.04, "learning_rate": 0.0002936855366127414, "loss": 0.0383, "step": 16240 }, { "epoch": 0.04, "learning_rate": 0.0002936816483963699, "loss": 0.0419, "step": 16250 }, { "epoch": 0.04, "learning_rate": 0.0002936777601799985, "loss": 0.0345, "step": 16260 }, { "epoch": 0.04, "learning_rate": 0.000293673871963627, "loss": 0.037, "step": 16270 }, { "epoch": 0.04, "learning_rate": 0.00029366998374725557, "loss": 0.0443, "step": 16280 }, { "epoch": 0.04, "learning_rate": 0.0002936660955308841, "loss": 0.0373, "step": 16290 }, { "epoch": 0.04, "learning_rate": 0.0002936622073145126, "loss": 0.036, "step": 16300 }, { "epoch": 0.04, "learning_rate": 0.0002936583190981411, "loss": 0.0403, "step": 16310 }, { "epoch": 0.04, "learning_rate": 0.0002936544308817697, "loss": 0.0389, "step": 16320 }, { "epoch": 0.04, "learning_rate": 0.00029365054266539825, "loss": 0.0413, "step": 16330 }, { "epoch": 0.04, "learning_rate": 0.00029364665444902676, "loss": 0.0449, "step": 16340 }, { "epoch": 0.04, "learning_rate": 0.0002936427662326553, "loss": 0.041, "step": 16350 }, { "epoch": 0.04, "learning_rate": 0.00029363887801628385, "loss": 0.0353, "step": 16360 }, { "epoch": 0.04, "learning_rate": 0.00029363498979991236, "loss": 0.0339, "step": 16370 }, { "epoch": 0.04, "learning_rate": 0.0002936311015835409, "loss": 0.0417, "step": 16380 }, { "epoch": 0.04, "learning_rate": 0.00029362721336716945, "loss": 0.0395, "step": 16390 }, { "epoch": 0.04, "learning_rate": 0.00029362332515079796, "loss": 0.0394, "step": 16400 }, { "epoch": 0.04, "learning_rate": 0.00029361943693442653, "loss": 0.0387, "step": 16410 }, { "epoch": 0.04, "learning_rate": 0.00029361554871805504, "loss": 0.0351, "step": 16420 }, { "epoch": 0.04, "learning_rate": 0.00029361166050168356, "loss": 0.0321, "step": 16430 }, { "epoch": 0.04, "learning_rate": 0.00029360777228531207, "loss": 0.0375, "step": 16440 }, { "epoch": 0.04, "learning_rate": 0.00029360388406894064, "loss": 0.0426, "step": 16450 }, { "epoch": 0.04, "learning_rate": 0.00029359999585256916, "loss": 0.039, "step": 16460 }, { "epoch": 0.04, "learning_rate": 0.0002935961076361977, "loss": 0.0398, "step": 16470 }, { "epoch": 0.04, "learning_rate": 0.00029359221941982624, "loss": 0.043, "step": 16480 }, { "epoch": 0.04, "learning_rate": 0.0002935883312034548, "loss": 0.0445, "step": 16490 }, { "epoch": 0.04, "learning_rate": 0.0002935844429870833, "loss": 0.0398, "step": 16500 }, { "epoch": 0.04, "learning_rate": 0.00029358055477071184, "loss": 0.038, "step": 16510 }, { "epoch": 0.04, "learning_rate": 0.0002935766665543404, "loss": 0.0439, "step": 16520 }, { "epoch": 0.04, "learning_rate": 0.0002935727783379689, "loss": 0.0376, "step": 16530 }, { "epoch": 0.04, "learning_rate": 0.0002935688901215975, "loss": 0.03, "step": 16540 }, { "epoch": 0.04, "learning_rate": 0.000293565001905226, "loss": 0.0415, "step": 16550 }, { "epoch": 0.04, "learning_rate": 0.0002935611136888545, "loss": 0.0394, "step": 16560 }, { "epoch": 0.04, "learning_rate": 0.0002935572254724831, "loss": 0.0356, "step": 16570 }, { "epoch": 0.04, "learning_rate": 0.0002935533372561116, "loss": 0.0372, "step": 16580 }, { "epoch": 0.04, "learning_rate": 0.0002935494490397401, "loss": 0.0391, "step": 16590 }, { "epoch": 0.04, "learning_rate": 0.0002935455608233687, "loss": 0.0421, "step": 16600 }, { "epoch": 0.04, "learning_rate": 0.0002935416726069972, "loss": 0.0335, "step": 16610 }, { "epoch": 0.04, "learning_rate": 0.00029353778439062577, "loss": 0.039, "step": 16620 }, { "epoch": 0.04, "learning_rate": 0.0002935338961742543, "loss": 0.0397, "step": 16630 }, { "epoch": 0.04, "learning_rate": 0.0002935300079578828, "loss": 0.0398, "step": 16640 }, { "epoch": 0.04, "learning_rate": 0.0002935261197415113, "loss": 0.0357, "step": 16650 }, { "epoch": 0.04, "learning_rate": 0.0002935222315251399, "loss": 0.0375, "step": 16660 }, { "epoch": 0.04, "learning_rate": 0.00029351834330876845, "loss": 0.0341, "step": 16670 }, { "epoch": 0.04, "learning_rate": 0.00029351445509239696, "loss": 0.0374, "step": 16680 }, { "epoch": 0.04, "learning_rate": 0.0002935105668760255, "loss": 0.0364, "step": 16690 }, { "epoch": 0.04, "learning_rate": 0.00029350667865965405, "loss": 0.0414, "step": 16700 }, { "epoch": 0.04, "learning_rate": 0.00029350279044328256, "loss": 0.0346, "step": 16710 }, { "epoch": 0.04, "learning_rate": 0.0002934989022269111, "loss": 0.038, "step": 16720 }, { "epoch": 0.04, "learning_rate": 0.00029349501401053964, "loss": 0.0385, "step": 16730 }, { "epoch": 0.04, "learning_rate": 0.00029349112579416816, "loss": 0.0394, "step": 16740 }, { "epoch": 0.04, "learning_rate": 0.00029348723757779673, "loss": 0.042, "step": 16750 }, { "epoch": 0.04, "learning_rate": 0.00029348334936142524, "loss": 0.0362, "step": 16760 }, { "epoch": 0.04, "learning_rate": 0.00029347946114505376, "loss": 0.0386, "step": 16770 }, { "epoch": 0.04, "learning_rate": 0.0002934755729286823, "loss": 0.0346, "step": 16780 }, { "epoch": 0.04, "learning_rate": 0.00029347168471231084, "loss": 0.0407, "step": 16790 }, { "epoch": 0.04, "learning_rate": 0.00029346779649593935, "loss": 0.042, "step": 16800 }, { "epoch": 0.04, "learning_rate": 0.0002934639082795679, "loss": 0.0405, "step": 16810 }, { "epoch": 0.04, "learning_rate": 0.0002934600200631965, "loss": 0.037, "step": 16820 }, { "epoch": 0.04, "learning_rate": 0.000293456131846825, "loss": 0.0323, "step": 16830 }, { "epoch": 0.04, "learning_rate": 0.0002934522436304535, "loss": 0.0396, "step": 16840 }, { "epoch": 0.04, "learning_rate": 0.00029344835541408204, "loss": 0.043, "step": 16850 }, { "epoch": 0.04, "learning_rate": 0.0002934444671977106, "loss": 0.0394, "step": 16860 }, { "epoch": 0.04, "learning_rate": 0.0002934405789813391, "loss": 0.0429, "step": 16870 }, { "epoch": 0.04, "learning_rate": 0.0002934366907649677, "loss": 0.0388, "step": 16880 }, { "epoch": 0.04, "learning_rate": 0.0002934328025485962, "loss": 0.0435, "step": 16890 }, { "epoch": 0.04, "learning_rate": 0.0002934289143322247, "loss": 0.0428, "step": 16900 }, { "epoch": 0.04, "learning_rate": 0.0002934250261158533, "loss": 0.0457, "step": 16910 }, { "epoch": 0.04, "learning_rate": 0.0002934211378994818, "loss": 0.0409, "step": 16920 }, { "epoch": 0.04, "learning_rate": 0.0002934172496831103, "loss": 0.0415, "step": 16930 }, { "epoch": 0.04, "learning_rate": 0.0002934133614667389, "loss": 0.0393, "step": 16940 }, { "epoch": 0.04, "learning_rate": 0.0002934094732503674, "loss": 0.0429, "step": 16950 }, { "epoch": 0.04, "learning_rate": 0.00029340558503399597, "loss": 0.0338, "step": 16960 }, { "epoch": 0.04, "learning_rate": 0.0002934016968176245, "loss": 0.048, "step": 16970 }, { "epoch": 0.04, "learning_rate": 0.000293397808601253, "loss": 0.0363, "step": 16980 }, { "epoch": 0.04, "learning_rate": 0.00029339392038488156, "loss": 0.0343, "step": 16990 }, { "epoch": 0.04, "learning_rate": 0.0002933900321685101, "loss": 0.0352, "step": 17000 }, { "epoch": 0.04, "eval_cer": 0.8818314529211123, "eval_loss": 0.028564387932419777, "eval_runtime": 107.5392, "eval_samples_per_second": 18.598, "eval_steps_per_second": 4.649, "step": 17000 }, { "epoch": 0.04, "learning_rate": 0.0002933861439521386, "loss": 0.0351, "step": 17010 }, { "epoch": 0.04, "learning_rate": 0.00029338225573576716, "loss": 0.045, "step": 17020 }, { "epoch": 0.04, "learning_rate": 0.00029337836751939573, "loss": 0.0414, "step": 17030 }, { "epoch": 0.04, "learning_rate": 0.00029337447930302425, "loss": 0.0377, "step": 17040 }, { "epoch": 0.04, "learning_rate": 0.00029337059108665276, "loss": 0.0351, "step": 17050 }, { "epoch": 0.04, "learning_rate": 0.0002933667028702813, "loss": 0.0405, "step": 17060 }, { "epoch": 0.04, "learning_rate": 0.00029336281465390984, "loss": 0.0365, "step": 17070 }, { "epoch": 0.04, "learning_rate": 0.00029335892643753836, "loss": 0.0401, "step": 17080 }, { "epoch": 0.04, "learning_rate": 0.0002933550382211669, "loss": 0.0421, "step": 17090 }, { "epoch": 0.04, "learning_rate": 0.00029335115000479544, "loss": 0.0378, "step": 17100 }, { "epoch": 0.04, "learning_rate": 0.000293347261788424, "loss": 0.0412, "step": 17110 }, { "epoch": 0.04, "learning_rate": 0.0002933433735720525, "loss": 0.0424, "step": 17120 }, { "epoch": 0.04, "learning_rate": 0.00029333948535568104, "loss": 0.0388, "step": 17130 }, { "epoch": 0.04, "learning_rate": 0.00029333559713930955, "loss": 0.0443, "step": 17140 }, { "epoch": 0.04, "learning_rate": 0.0002933317089229381, "loss": 0.0342, "step": 17150 }, { "epoch": 0.04, "learning_rate": 0.00029332782070656664, "loss": 0.0447, "step": 17160 }, { "epoch": 0.04, "learning_rate": 0.0002933239324901952, "loss": 0.0342, "step": 17170 }, { "epoch": 0.04, "learning_rate": 0.0002933200442738237, "loss": 0.0426, "step": 17180 }, { "epoch": 0.04, "learning_rate": 0.00029331615605745223, "loss": 0.0443, "step": 17190 }, { "epoch": 0.04, "learning_rate": 0.0002933122678410808, "loss": 0.0332, "step": 17200 }, { "epoch": 0.04, "learning_rate": 0.0002933083796247093, "loss": 0.0393, "step": 17210 }, { "epoch": 0.04, "learning_rate": 0.0002933044914083379, "loss": 0.0423, "step": 17220 }, { "epoch": 0.04, "learning_rate": 0.0002933006031919664, "loss": 0.0331, "step": 17230 }, { "epoch": 0.04, "learning_rate": 0.00029329671497559497, "loss": 0.0416, "step": 17240 }, { "epoch": 0.04, "learning_rate": 0.0002932928267592235, "loss": 0.0355, "step": 17250 }, { "epoch": 0.04, "learning_rate": 0.000293288938542852, "loss": 0.0351, "step": 17260 }, { "epoch": 0.04, "learning_rate": 0.0002932850503264805, "loss": 0.045, "step": 17270 }, { "epoch": 0.04, "learning_rate": 0.0002932811621101091, "loss": 0.0364, "step": 17280 }, { "epoch": 0.04, "learning_rate": 0.0002932772738937376, "loss": 0.0329, "step": 17290 }, { "epoch": 0.04, "learning_rate": 0.00029327338567736617, "loss": 0.0359, "step": 17300 }, { "epoch": 0.04, "learning_rate": 0.0002932694974609947, "loss": 0.0427, "step": 17310 }, { "epoch": 0.04, "learning_rate": 0.00029326560924462325, "loss": 0.0444, "step": 17320 }, { "epoch": 0.04, "learning_rate": 0.00029326172102825176, "loss": 0.0363, "step": 17330 }, { "epoch": 0.04, "learning_rate": 0.0002932578328118803, "loss": 0.0453, "step": 17340 }, { "epoch": 0.04, "learning_rate": 0.0002932539445955088, "loss": 0.0377, "step": 17350 }, { "epoch": 0.04, "learning_rate": 0.00029325005637913736, "loss": 0.0508, "step": 17360 }, { "epoch": 0.05, "learning_rate": 0.00029324616816276593, "loss": 0.0391, "step": 17370 }, { "epoch": 0.05, "learning_rate": 0.00029324227994639444, "loss": 0.043, "step": 17380 }, { "epoch": 0.05, "learning_rate": 0.00029323839173002296, "loss": 0.0637, "step": 17390 }, { "epoch": 0.05, "learning_rate": 0.0002932345035136515, "loss": 0.1008, "step": 17400 }, { "epoch": 0.05, "learning_rate": 0.00029323061529728004, "loss": 0.0745, "step": 17410 }, { "epoch": 0.05, "learning_rate": 0.00029322672708090856, "loss": 0.054, "step": 17420 }, { "epoch": 0.05, "learning_rate": 0.0002932228388645371, "loss": 0.0342, "step": 17430 }, { "epoch": 0.05, "learning_rate": 0.00029321895064816564, "loss": 0.038, "step": 17440 }, { "epoch": 0.05, "learning_rate": 0.0002932150624317942, "loss": 0.0426, "step": 17450 }, { "epoch": 0.05, "learning_rate": 0.0002932111742154227, "loss": 0.0394, "step": 17460 }, { "epoch": 0.05, "learning_rate": 0.00029320728599905124, "loss": 0.0476, "step": 17470 }, { "epoch": 0.05, "learning_rate": 0.00029320339778267975, "loss": 0.0438, "step": 17480 }, { "epoch": 0.05, "learning_rate": 0.0002931995095663083, "loss": 0.04, "step": 17490 }, { "epoch": 0.05, "learning_rate": 0.00029319562134993684, "loss": 0.046, "step": 17500 }, { "epoch": 0.05, "learning_rate": 0.0002931917331335654, "loss": 0.045, "step": 17510 }, { "epoch": 0.05, "learning_rate": 0.0002931878449171939, "loss": 0.0622, "step": 17520 }, { "epoch": 0.05, "learning_rate": 0.0002931839567008225, "loss": 0.0487, "step": 17530 }, { "epoch": 0.05, "learning_rate": 0.000293180068484451, "loss": 0.0501, "step": 17540 }, { "epoch": 0.05, "learning_rate": 0.0002931761802680795, "loss": 0.0463, "step": 17550 }, { "epoch": 0.05, "learning_rate": 0.00029317229205170803, "loss": 0.0434, "step": 17560 }, { "epoch": 0.05, "learning_rate": 0.0002931684038353366, "loss": 0.0388, "step": 17570 }, { "epoch": 0.05, "learning_rate": 0.00029316451561896517, "loss": 0.0394, "step": 17580 }, { "epoch": 0.05, "learning_rate": 0.0002931606274025937, "loss": 0.047, "step": 17590 }, { "epoch": 0.05, "learning_rate": 0.0002931567391862222, "loss": 0.0409, "step": 17600 }, { "epoch": 0.05, "learning_rate": 0.00029315285096985077, "loss": 0.0423, "step": 17610 }, { "epoch": 0.05, "learning_rate": 0.0002931489627534793, "loss": 0.0436, "step": 17620 }, { "epoch": 0.05, "learning_rate": 0.0002931450745371078, "loss": 0.0505, "step": 17630 }, { "epoch": 0.05, "learning_rate": 0.00029314118632073636, "loss": 0.0406, "step": 17640 }, { "epoch": 0.05, "learning_rate": 0.0002931372981043649, "loss": 0.0467, "step": 17650 }, { "epoch": 0.05, "learning_rate": 0.00029313340988799345, "loss": 0.0471, "step": 17660 }, { "epoch": 0.05, "learning_rate": 0.00029312952167162196, "loss": 0.0431, "step": 17670 }, { "epoch": 0.05, "learning_rate": 0.0002931256334552505, "loss": 0.0411, "step": 17680 }, { "epoch": 0.05, "learning_rate": 0.000293121745238879, "loss": 0.0391, "step": 17690 }, { "epoch": 0.05, "learning_rate": 0.00029311785702250756, "loss": 0.0407, "step": 17700 }, { "epoch": 0.05, "learning_rate": 0.00029311396880613613, "loss": 0.0371, "step": 17710 }, { "epoch": 0.05, "learning_rate": 0.00029311008058976464, "loss": 0.0345, "step": 17720 }, { "epoch": 0.05, "learning_rate": 0.00029310619237339316, "loss": 0.0467, "step": 17730 }, { "epoch": 0.05, "learning_rate": 0.0002931023041570217, "loss": 0.0382, "step": 17740 }, { "epoch": 0.05, "learning_rate": 0.00029309841594065024, "loss": 0.04, "step": 17750 }, { "epoch": 0.05, "learning_rate": 0.00029309452772427876, "loss": 0.0461, "step": 17760 }, { "epoch": 0.05, "learning_rate": 0.0002930906395079073, "loss": 0.0412, "step": 17770 }, { "epoch": 0.05, "learning_rate": 0.00029308675129153584, "loss": 0.0387, "step": 17780 }, { "epoch": 0.05, "learning_rate": 0.0002930828630751644, "loss": 0.0421, "step": 17790 }, { "epoch": 0.05, "learning_rate": 0.0002930789748587929, "loss": 0.0376, "step": 17800 }, { "epoch": 0.05, "learning_rate": 0.00029307508664242144, "loss": 0.0397, "step": 17810 }, { "epoch": 0.05, "learning_rate": 0.00029307119842605, "loss": 0.0395, "step": 17820 }, { "epoch": 0.05, "learning_rate": 0.0002930673102096785, "loss": 0.0456, "step": 17830 }, { "epoch": 0.05, "learning_rate": 0.00029306342199330703, "loss": 0.0295, "step": 17840 }, { "epoch": 0.05, "learning_rate": 0.0002930595337769356, "loss": 0.0348, "step": 17850 }, { "epoch": 0.05, "learning_rate": 0.00029305564556056417, "loss": 0.0363, "step": 17860 }, { "epoch": 0.05, "learning_rate": 0.0002930517573441927, "loss": 0.0358, "step": 17870 }, { "epoch": 0.05, "learning_rate": 0.0002930478691278212, "loss": 0.0374, "step": 17880 }, { "epoch": 0.05, "learning_rate": 0.0002930439809114497, "loss": 0.0346, "step": 17890 }, { "epoch": 0.05, "learning_rate": 0.00029304009269507823, "loss": 0.0352, "step": 17900 }, { "epoch": 0.05, "learning_rate": 0.0002930362044787068, "loss": 0.0429, "step": 17910 }, { "epoch": 0.05, "learning_rate": 0.00029303231626233537, "loss": 0.0409, "step": 17920 }, { "epoch": 0.05, "learning_rate": 0.0002930284280459639, "loss": 0.0371, "step": 17930 }, { "epoch": 0.05, "learning_rate": 0.0002930245398295924, "loss": 0.036, "step": 17940 }, { "epoch": 0.05, "learning_rate": 0.00029302065161322096, "loss": 0.0396, "step": 17950 }, { "epoch": 0.05, "learning_rate": 0.0002930167633968495, "loss": 0.0401, "step": 17960 }, { "epoch": 0.05, "learning_rate": 0.000293012875180478, "loss": 0.0313, "step": 17970 }, { "epoch": 0.05, "learning_rate": 0.00029300898696410656, "loss": 0.0472, "step": 17980 }, { "epoch": 0.05, "learning_rate": 0.0002930050987477351, "loss": 0.0331, "step": 17990 }, { "epoch": 0.05, "learning_rate": 0.00029300121053136365, "loss": 0.0385, "step": 18000 }, { "epoch": 0.05, "eval_cer": 0.8818174565517705, "eval_loss": 0.02818988636136055, "eval_runtime": 107.7914, "eval_samples_per_second": 18.554, "eval_steps_per_second": 4.639, "step": 18000 }, { "epoch": 0.05, "learning_rate": 0.00029299732231499216, "loss": 0.0375, "step": 18010 }, { "epoch": 0.05, "learning_rate": 0.0002929934340986207, "loss": 0.0344, "step": 18020 }, { "epoch": 0.05, "learning_rate": 0.00029298954588224924, "loss": 0.0401, "step": 18030 }, { "epoch": 0.05, "learning_rate": 0.00029298565766587776, "loss": 0.0356, "step": 18040 }, { "epoch": 0.05, "learning_rate": 0.00029298176944950627, "loss": 0.04, "step": 18050 }, { "epoch": 0.05, "learning_rate": 0.00029297788123313484, "loss": 0.0391, "step": 18060 }, { "epoch": 0.05, "learning_rate": 0.0002929739930167634, "loss": 0.0347, "step": 18070 }, { "epoch": 0.05, "learning_rate": 0.0002929701048003919, "loss": 0.0388, "step": 18080 }, { "epoch": 0.05, "learning_rate": 0.00029296621658402044, "loss": 0.0354, "step": 18090 }, { "epoch": 0.05, "learning_rate": 0.00029296232836764895, "loss": 0.0368, "step": 18100 }, { "epoch": 0.05, "learning_rate": 0.0002929584401512775, "loss": 0.0324, "step": 18110 }, { "epoch": 0.05, "learning_rate": 0.00029295455193490604, "loss": 0.0333, "step": 18120 }, { "epoch": 0.05, "learning_rate": 0.0002929506637185346, "loss": 0.0403, "step": 18130 }, { "epoch": 0.05, "learning_rate": 0.0002929467755021631, "loss": 0.0367, "step": 18140 }, { "epoch": 0.05, "learning_rate": 0.00029294288728579164, "loss": 0.0446, "step": 18150 }, { "epoch": 0.05, "learning_rate": 0.0002929389990694202, "loss": 0.0285, "step": 18160 }, { "epoch": 0.05, "learning_rate": 0.0002929351108530487, "loss": 0.0341, "step": 18170 }, { "epoch": 0.05, "learning_rate": 0.00029293122263667723, "loss": 0.0437, "step": 18180 }, { "epoch": 0.05, "learning_rate": 0.0002929273344203058, "loss": 0.0379, "step": 18190 }, { "epoch": 0.05, "learning_rate": 0.0002929234462039343, "loss": 0.0394, "step": 18200 }, { "epoch": 0.05, "learning_rate": 0.0002929195579875629, "loss": 0.0371, "step": 18210 }, { "epoch": 0.05, "learning_rate": 0.0002929156697711914, "loss": 0.0337, "step": 18220 }, { "epoch": 0.05, "learning_rate": 0.0002929117815548199, "loss": 0.0402, "step": 18230 }, { "epoch": 0.05, "learning_rate": 0.0002929078933384485, "loss": 0.0381, "step": 18240 }, { "epoch": 0.05, "learning_rate": 0.000292904005122077, "loss": 0.0343, "step": 18250 }, { "epoch": 0.05, "learning_rate": 0.00029290011690570557, "loss": 0.0386, "step": 18260 }, { "epoch": 0.05, "learning_rate": 0.0002928962286893341, "loss": 0.0356, "step": 18270 }, { "epoch": 0.05, "learning_rate": 0.00029289234047296265, "loss": 0.0362, "step": 18280 }, { "epoch": 0.05, "learning_rate": 0.00029288845225659116, "loss": 0.0328, "step": 18290 }, { "epoch": 0.05, "learning_rate": 0.0002928845640402197, "loss": 0.0363, "step": 18300 }, { "epoch": 0.05, "learning_rate": 0.0002928806758238482, "loss": 0.0394, "step": 18310 }, { "epoch": 0.05, "learning_rate": 0.00029287678760747676, "loss": 0.0322, "step": 18320 }, { "epoch": 0.05, "learning_rate": 0.0002928728993911053, "loss": 0.0389, "step": 18330 }, { "epoch": 0.05, "learning_rate": 0.00029286901117473384, "loss": 0.0394, "step": 18340 }, { "epoch": 0.05, "learning_rate": 0.00029286512295836236, "loss": 0.0323, "step": 18350 }, { "epoch": 0.05, "learning_rate": 0.0002928612347419909, "loss": 0.0445, "step": 18360 }, { "epoch": 0.05, "learning_rate": 0.00029285734652561944, "loss": 0.0385, "step": 18370 }, { "epoch": 0.05, "learning_rate": 0.00029285345830924796, "loss": 0.0338, "step": 18380 }, { "epoch": 0.05, "learning_rate": 0.00029284957009287647, "loss": 0.0383, "step": 18390 }, { "epoch": 0.05, "learning_rate": 0.00029284568187650504, "loss": 0.0389, "step": 18400 }, { "epoch": 0.05, "learning_rate": 0.0002928417936601336, "loss": 0.0431, "step": 18410 }, { "epoch": 0.05, "learning_rate": 0.0002928379054437621, "loss": 0.0422, "step": 18420 }, { "epoch": 0.05, "learning_rate": 0.00029283401722739064, "loss": 0.0336, "step": 18430 }, { "epoch": 0.05, "learning_rate": 0.00029283012901101915, "loss": 0.0368, "step": 18440 }, { "epoch": 0.05, "learning_rate": 0.0002928262407946477, "loss": 0.0344, "step": 18450 }, { "epoch": 0.05, "learning_rate": 0.00029282235257827624, "loss": 0.0366, "step": 18460 }, { "epoch": 0.05, "learning_rate": 0.0002928184643619048, "loss": 0.0362, "step": 18470 }, { "epoch": 0.05, "learning_rate": 0.0002928145761455333, "loss": 0.0355, "step": 18480 }, { "epoch": 0.05, "learning_rate": 0.0002928106879291619, "loss": 0.038, "step": 18490 }, { "epoch": 0.05, "learning_rate": 0.0002928067997127904, "loss": 0.0385, "step": 18500 }, { "epoch": 0.05, "learning_rate": 0.0002928029114964189, "loss": 0.0376, "step": 18510 }, { "epoch": 0.05, "learning_rate": 0.00029279902328004743, "loss": 0.0368, "step": 18520 }, { "epoch": 0.05, "learning_rate": 0.000292795135063676, "loss": 0.0386, "step": 18530 }, { "epoch": 0.05, "learning_rate": 0.0002927912468473045, "loss": 0.0385, "step": 18540 }, { "epoch": 0.05, "learning_rate": 0.0002927873586309331, "loss": 0.0315, "step": 18550 }, { "epoch": 0.05, "learning_rate": 0.0002927834704145616, "loss": 0.0384, "step": 18560 }, { "epoch": 0.05, "learning_rate": 0.00029277958219819017, "loss": 0.0458, "step": 18570 }, { "epoch": 0.05, "learning_rate": 0.0002927756939818187, "loss": 0.0447, "step": 18580 }, { "epoch": 0.05, "learning_rate": 0.0002927718057654472, "loss": 0.0349, "step": 18590 }, { "epoch": 0.05, "learning_rate": 0.0002927679175490757, "loss": 0.0387, "step": 18600 }, { "epoch": 0.05, "learning_rate": 0.0002927640293327043, "loss": 0.0364, "step": 18610 }, { "epoch": 0.05, "learning_rate": 0.00029276014111633285, "loss": 0.044, "step": 18620 }, { "epoch": 0.05, "learning_rate": 0.00029275625289996136, "loss": 0.046, "step": 18630 }, { "epoch": 0.05, "learning_rate": 0.0002927523646835899, "loss": 0.0397, "step": 18640 }, { "epoch": 0.05, "learning_rate": 0.0002927484764672184, "loss": 0.0341, "step": 18650 }, { "epoch": 0.05, "learning_rate": 0.00029274458825084696, "loss": 0.0383, "step": 18660 }, { "epoch": 0.05, "learning_rate": 0.0002927407000344755, "loss": 0.0353, "step": 18670 }, { "epoch": 0.05, "learning_rate": 0.00029273681181810404, "loss": 0.0344, "step": 18680 }, { "epoch": 0.05, "learning_rate": 0.00029273292360173256, "loss": 0.0338, "step": 18690 }, { "epoch": 0.05, "learning_rate": 0.0002927290353853611, "loss": 0.0347, "step": 18700 }, { "epoch": 0.05, "learning_rate": 0.00029272514716898964, "loss": 0.0395, "step": 18710 }, { "epoch": 0.05, "learning_rate": 0.00029272125895261816, "loss": 0.0338, "step": 18720 }, { "epoch": 0.05, "learning_rate": 0.00029271737073624667, "loss": 0.0386, "step": 18730 }, { "epoch": 0.05, "learning_rate": 0.00029271348251987524, "loss": 0.0397, "step": 18740 }, { "epoch": 0.05, "learning_rate": 0.00029270959430350375, "loss": 0.0413, "step": 18750 }, { "epoch": 0.05, "learning_rate": 0.0002927057060871323, "loss": 0.0482, "step": 18760 }, { "epoch": 0.05, "learning_rate": 0.00029270181787076084, "loss": 0.0363, "step": 18770 }, { "epoch": 0.05, "learning_rate": 0.0002926979296543894, "loss": 0.0381, "step": 18780 }, { "epoch": 0.05, "learning_rate": 0.0002926940414380179, "loss": 0.0376, "step": 18790 }, { "epoch": 0.05, "learning_rate": 0.00029269015322164643, "loss": 0.0393, "step": 18800 }, { "epoch": 0.05, "learning_rate": 0.000292686265005275, "loss": 0.0324, "step": 18810 }, { "epoch": 0.05, "learning_rate": 0.0002926823767889035, "loss": 0.0359, "step": 18820 }, { "epoch": 0.05, "learning_rate": 0.0002926784885725321, "loss": 0.046, "step": 18830 }, { "epoch": 0.05, "learning_rate": 0.0002926746003561606, "loss": 0.031, "step": 18840 }, { "epoch": 0.05, "learning_rate": 0.0002926707121397891, "loss": 0.0393, "step": 18850 }, { "epoch": 0.05, "learning_rate": 0.00029266682392341763, "loss": 0.038, "step": 18860 }, { "epoch": 0.05, "learning_rate": 0.0002926629357070462, "loss": 0.0311, "step": 18870 }, { "epoch": 0.05, "learning_rate": 0.0002926590474906747, "loss": 0.0413, "step": 18880 }, { "epoch": 0.05, "learning_rate": 0.0002926551592743033, "loss": 0.0423, "step": 18890 }, { "epoch": 0.05, "learning_rate": 0.0002926512710579318, "loss": 0.0406, "step": 18900 }, { "epoch": 0.05, "learning_rate": 0.00029264738284156037, "loss": 0.0479, "step": 18910 }, { "epoch": 0.05, "learning_rate": 0.0002926434946251889, "loss": 0.0387, "step": 18920 }, { "epoch": 0.05, "learning_rate": 0.0002926396064088174, "loss": 0.0344, "step": 18930 }, { "epoch": 0.05, "learning_rate": 0.0002926357181924459, "loss": 0.04, "step": 18940 }, { "epoch": 0.05, "learning_rate": 0.0002926318299760745, "loss": 0.0335, "step": 18950 }, { "epoch": 0.05, "learning_rate": 0.00029262794175970305, "loss": 0.0378, "step": 18960 }, { "epoch": 0.05, "learning_rate": 0.00029262405354333156, "loss": 0.0347, "step": 18970 }, { "epoch": 0.05, "learning_rate": 0.0002926201653269601, "loss": 0.0339, "step": 18980 }, { "epoch": 0.05, "learning_rate": 0.00029261627711058864, "loss": 0.0417, "step": 18990 }, { "epoch": 0.05, "learning_rate": 0.00029261238889421716, "loss": 0.0385, "step": 19000 }, { "epoch": 0.05, "eval_cer": 0.8817614710744033, "eval_loss": 0.029142551124095917, "eval_runtime": 107.6868, "eval_samples_per_second": 18.572, "eval_steps_per_second": 4.643, "step": 19000 }, { "epoch": 0.05, "learning_rate": 0.0002926085006778457, "loss": 0.036, "step": 19010 }, { "epoch": 0.05, "learning_rate": 0.00029260461246147424, "loss": 0.0359, "step": 19020 }, { "epoch": 0.05, "learning_rate": 0.00029260072424510276, "loss": 0.0389, "step": 19030 }, { "epoch": 0.05, "learning_rate": 0.0002925968360287313, "loss": 0.0376, "step": 19040 }, { "epoch": 0.05, "learning_rate": 0.00029259294781235984, "loss": 0.0375, "step": 19050 }, { "epoch": 0.05, "learning_rate": 0.00029258905959598835, "loss": 0.0498, "step": 19060 }, { "epoch": 0.05, "learning_rate": 0.0002925851713796169, "loss": 0.0429, "step": 19070 }, { "epoch": 0.05, "learning_rate": 0.00029258128316324544, "loss": 0.0424, "step": 19080 }, { "epoch": 0.05, "learning_rate": 0.00029257739494687395, "loss": 0.037, "step": 19090 }, { "epoch": 0.05, "learning_rate": 0.0002925735067305025, "loss": 0.0332, "step": 19100 }, { "epoch": 0.05, "learning_rate": 0.00029256961851413104, "loss": 0.0364, "step": 19110 }, { "epoch": 0.05, "learning_rate": 0.0002925657302977596, "loss": 0.0383, "step": 19120 }, { "epoch": 0.05, "learning_rate": 0.0002925618420813881, "loss": 0.0387, "step": 19130 }, { "epoch": 0.05, "learning_rate": 0.00029255795386501663, "loss": 0.0358, "step": 19140 }, { "epoch": 0.05, "learning_rate": 0.00029255406564864515, "loss": 0.0325, "step": 19150 }, { "epoch": 0.05, "learning_rate": 0.0002925501774322737, "loss": 0.0372, "step": 19160 }, { "epoch": 0.05, "learning_rate": 0.0002925462892159023, "loss": 0.0343, "step": 19170 }, { "epoch": 0.05, "learning_rate": 0.0002925424009995308, "loss": 0.0406, "step": 19180 }, { "epoch": 0.05, "learning_rate": 0.0002925385127831593, "loss": 0.0339, "step": 19190 }, { "epoch": 0.05, "learning_rate": 0.0002925346245667879, "loss": 0.0362, "step": 19200 }, { "epoch": 0.05, "learning_rate": 0.0002925307363504164, "loss": 0.0328, "step": 19210 }, { "epoch": 0.05, "learning_rate": 0.0002925268481340449, "loss": 0.0357, "step": 19220 }, { "epoch": 0.05, "learning_rate": 0.0002925229599176735, "loss": 0.039, "step": 19230 }, { "epoch": 0.05, "learning_rate": 0.000292519071701302, "loss": 0.034, "step": 19240 }, { "epoch": 0.05, "learning_rate": 0.00029251518348493056, "loss": 0.038, "step": 19250 }, { "epoch": 0.05, "learning_rate": 0.0002925112952685591, "loss": 0.0394, "step": 19260 }, { "epoch": 0.05, "learning_rate": 0.0002925074070521876, "loss": 0.0395, "step": 19270 }, { "epoch": 0.05, "learning_rate": 0.00029250351883581616, "loss": 0.0424, "step": 19280 }, { "epoch": 0.05, "learning_rate": 0.0002924996306194447, "loss": 0.0424, "step": 19290 }, { "epoch": 0.05, "learning_rate": 0.00029249574240307325, "loss": 0.0358, "step": 19300 }, { "epoch": 0.05, "learning_rate": 0.00029249185418670176, "loss": 0.0376, "step": 19310 }, { "epoch": 0.05, "learning_rate": 0.00029248796597033033, "loss": 0.04, "step": 19320 }, { "epoch": 0.05, "learning_rate": 0.00029248407775395884, "loss": 0.0369, "step": 19330 }, { "epoch": 0.05, "learning_rate": 0.00029248018953758736, "loss": 0.0406, "step": 19340 }, { "epoch": 0.05, "learning_rate": 0.00029247630132121587, "loss": 0.0377, "step": 19350 }, { "epoch": 0.05, "learning_rate": 0.00029247241310484444, "loss": 0.0438, "step": 19360 }, { "epoch": 0.05, "learning_rate": 0.00029246852488847296, "loss": 0.0387, "step": 19370 }, { "epoch": 0.05, "learning_rate": 0.0002924646366721015, "loss": 0.0425, "step": 19380 }, { "epoch": 0.05, "learning_rate": 0.00029246074845573004, "loss": 0.0359, "step": 19390 }, { "epoch": 0.05, "learning_rate": 0.00029245686023935855, "loss": 0.041, "step": 19400 }, { "epoch": 0.05, "learning_rate": 0.0002924529720229871, "loss": 0.0454, "step": 19410 }, { "epoch": 0.05, "learning_rate": 0.00029244908380661564, "loss": 0.0362, "step": 19420 }, { "epoch": 0.05, "learning_rate": 0.00029244519559024415, "loss": 0.0341, "step": 19430 }, { "epoch": 0.05, "learning_rate": 0.0002924413073738727, "loss": 0.0332, "step": 19440 }, { "epoch": 0.05, "learning_rate": 0.0002924374191575013, "loss": 0.0405, "step": 19450 }, { "epoch": 0.05, "learning_rate": 0.0002924335309411298, "loss": 0.0355, "step": 19460 }, { "epoch": 0.05, "learning_rate": 0.0002924296427247583, "loss": 0.0296, "step": 19470 }, { "epoch": 0.05, "learning_rate": 0.00029242575450838683, "loss": 0.0384, "step": 19480 }, { "epoch": 0.05, "learning_rate": 0.0002924218662920154, "loss": 0.0378, "step": 19490 }, { "epoch": 0.05, "learning_rate": 0.0002924179780756439, "loss": 0.0392, "step": 19500 }, { "epoch": 0.05, "learning_rate": 0.0002924140898592725, "loss": 0.0311, "step": 19510 }, { "epoch": 0.05, "learning_rate": 0.000292410201642901, "loss": 0.0342, "step": 19520 }, { "epoch": 0.05, "learning_rate": 0.00029240631342652957, "loss": 0.0401, "step": 19530 }, { "epoch": 0.05, "learning_rate": 0.0002924024252101581, "loss": 0.0394, "step": 19540 }, { "epoch": 0.05, "learning_rate": 0.0002923985369937866, "loss": 0.0366, "step": 19550 }, { "epoch": 0.05, "learning_rate": 0.0002923946487774151, "loss": 0.0411, "step": 19560 }, { "epoch": 0.05, "learning_rate": 0.0002923907605610437, "loss": 0.0353, "step": 19570 }, { "epoch": 0.05, "learning_rate": 0.0002923868723446722, "loss": 0.0408, "step": 19580 }, { "epoch": 0.05, "learning_rate": 0.00029238298412830076, "loss": 0.0447, "step": 19590 }, { "epoch": 0.05, "learning_rate": 0.0002923790959119293, "loss": 0.0373, "step": 19600 }, { "epoch": 0.05, "learning_rate": 0.0002923752076955578, "loss": 0.032, "step": 19610 }, { "epoch": 0.05, "learning_rate": 0.00029237131947918636, "loss": 0.0355, "step": 19620 }, { "epoch": 0.05, "learning_rate": 0.0002923674312628149, "loss": 0.0375, "step": 19630 }, { "epoch": 0.05, "learning_rate": 0.0002923635430464434, "loss": 0.0339, "step": 19640 }, { "epoch": 0.05, "learning_rate": 0.00029235965483007196, "loss": 0.0431, "step": 19650 }, { "epoch": 0.05, "learning_rate": 0.00029235576661370053, "loss": 0.0312, "step": 19660 }, { "epoch": 0.05, "learning_rate": 0.00029235187839732904, "loss": 0.0346, "step": 19670 }, { "epoch": 0.05, "learning_rate": 0.00029234799018095756, "loss": 0.0363, "step": 19680 }, { "epoch": 0.05, "learning_rate": 0.00029234410196458607, "loss": 0.0366, "step": 19690 }, { "epoch": 0.05, "learning_rate": 0.00029234021374821464, "loss": 0.0367, "step": 19700 }, { "epoch": 0.05, "learning_rate": 0.00029233632553184315, "loss": 0.0355, "step": 19710 }, { "epoch": 0.05, "learning_rate": 0.0002923324373154717, "loss": 0.0321, "step": 19720 }, { "epoch": 0.05, "learning_rate": 0.00029232854909910024, "loss": 0.0383, "step": 19730 }, { "epoch": 0.05, "learning_rate": 0.0002923246608827288, "loss": 0.0398, "step": 19740 }, { "epoch": 0.05, "learning_rate": 0.0002923207726663573, "loss": 0.0384, "step": 19750 }, { "epoch": 0.05, "learning_rate": 0.00029231688444998584, "loss": 0.0381, "step": 19760 }, { "epoch": 0.05, "learning_rate": 0.00029231299623361435, "loss": 0.0394, "step": 19770 }, { "epoch": 0.05, "learning_rate": 0.0002923091080172429, "loss": 0.0432, "step": 19780 }, { "epoch": 0.05, "learning_rate": 0.00029230521980087143, "loss": 0.0381, "step": 19790 }, { "epoch": 0.05, "learning_rate": 0.0002923013315845, "loss": 0.038, "step": 19800 }, { "epoch": 0.05, "learning_rate": 0.0002922974433681285, "loss": 0.0418, "step": 19810 }, { "epoch": 0.05, "learning_rate": 0.0002922935551517571, "loss": 0.032, "step": 19820 }, { "epoch": 0.05, "learning_rate": 0.0002922896669353856, "loss": 0.041, "step": 19830 }, { "epoch": 0.05, "learning_rate": 0.0002922857787190141, "loss": 0.0354, "step": 19840 }, { "epoch": 0.05, "learning_rate": 0.0002922818905026427, "loss": 0.0404, "step": 19850 }, { "epoch": 0.05, "learning_rate": 0.0002922780022862712, "loss": 0.0393, "step": 19860 }, { "epoch": 0.05, "learning_rate": 0.00029227411406989977, "loss": 0.0415, "step": 19870 }, { "epoch": 0.05, "learning_rate": 0.0002922702258535283, "loss": 0.0352, "step": 19880 }, { "epoch": 0.05, "learning_rate": 0.0002922663376371568, "loss": 0.0356, "step": 19890 }, { "epoch": 0.05, "learning_rate": 0.0002922624494207853, "loss": 0.0384, "step": 19900 }, { "epoch": 0.05, "learning_rate": 0.0002922585612044139, "loss": 0.0385, "step": 19910 }, { "epoch": 0.05, "learning_rate": 0.0002922546729880424, "loss": 0.0382, "step": 19920 }, { "epoch": 0.05, "learning_rate": 0.00029225078477167096, "loss": 0.0401, "step": 19930 }, { "epoch": 0.05, "learning_rate": 0.0002922468965552995, "loss": 0.0401, "step": 19940 }, { "epoch": 0.05, "learning_rate": 0.00029224300833892805, "loss": 0.0317, "step": 19950 }, { "epoch": 0.05, "learning_rate": 0.00029223912012255656, "loss": 0.0323, "step": 19960 }, { "epoch": 0.05, "learning_rate": 0.0002922352319061851, "loss": 0.0318, "step": 19970 }, { "epoch": 0.05, "learning_rate": 0.0002922313436898136, "loss": 0.0376, "step": 19980 }, { "epoch": 0.05, "learning_rate": 0.00029222745547344216, "loss": 0.0419, "step": 19990 }, { "epoch": 0.05, "learning_rate": 0.0002922235672570707, "loss": 0.0358, "step": 20000 }, { "epoch": 0.05, "eval_cer": 0.8818160569148363, "eval_loss": 0.02738848887383938, "eval_runtime": 107.5768, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 20000 }, { "epoch": 0.05, "learning_rate": 0.00029221967904069924, "loss": 0.036, "step": 20010 }, { "epoch": 0.05, "learning_rate": 0.00029221579082432776, "loss": 0.0371, "step": 20020 }, { "epoch": 0.05, "learning_rate": 0.0002922119026079563, "loss": 0.0364, "step": 20030 }, { "epoch": 0.05, "learning_rate": 0.00029220801439158484, "loss": 0.0379, "step": 20040 }, { "epoch": 0.05, "learning_rate": 0.00029220412617521335, "loss": 0.0432, "step": 20050 }, { "epoch": 0.05, "learning_rate": 0.0002922002379588419, "loss": 0.0375, "step": 20060 }, { "epoch": 0.05, "learning_rate": 0.00029219634974247044, "loss": 0.0394, "step": 20070 }, { "epoch": 0.05, "learning_rate": 0.000292192461526099, "loss": 0.0357, "step": 20080 }, { "epoch": 0.05, "learning_rate": 0.0002921885733097275, "loss": 0.035, "step": 20090 }, { "epoch": 0.05, "learning_rate": 0.00029218468509335603, "loss": 0.0332, "step": 20100 }, { "epoch": 0.05, "learning_rate": 0.00029218079687698455, "loss": 0.0375, "step": 20110 }, { "epoch": 0.05, "learning_rate": 0.0002921769086606131, "loss": 0.0356, "step": 20120 }, { "epoch": 0.05, "learning_rate": 0.00029217302044424163, "loss": 0.0443, "step": 20130 }, { "epoch": 0.05, "learning_rate": 0.0002921691322278702, "loss": 0.0335, "step": 20140 }, { "epoch": 0.05, "learning_rate": 0.0002921652440114987, "loss": 0.0362, "step": 20150 }, { "epoch": 0.05, "learning_rate": 0.0002921613557951273, "loss": 0.0331, "step": 20160 }, { "epoch": 0.05, "learning_rate": 0.0002921574675787558, "loss": 0.0386, "step": 20170 }, { "epoch": 0.05, "learning_rate": 0.0002921535793623843, "loss": 0.0313, "step": 20180 }, { "epoch": 0.05, "learning_rate": 0.00029214969114601283, "loss": 0.0334, "step": 20190 }, { "epoch": 0.05, "learning_rate": 0.0002921458029296414, "loss": 0.0349, "step": 20200 }, { "epoch": 0.05, "learning_rate": 0.00029214191471326997, "loss": 0.0351, "step": 20210 }, { "epoch": 0.05, "learning_rate": 0.0002921380264968985, "loss": 0.0357, "step": 20220 }, { "epoch": 0.05, "learning_rate": 0.000292134138280527, "loss": 0.038, "step": 20230 }, { "epoch": 0.05, "learning_rate": 0.00029213025006415556, "loss": 0.0314, "step": 20240 }, { "epoch": 0.05, "learning_rate": 0.0002921263618477841, "loss": 0.0363, "step": 20250 }, { "epoch": 0.05, "learning_rate": 0.0002921224736314126, "loss": 0.0361, "step": 20260 }, { "epoch": 0.05, "learning_rate": 0.00029211858541504116, "loss": 0.0419, "step": 20270 }, { "epoch": 0.05, "learning_rate": 0.0002921146971986697, "loss": 0.0312, "step": 20280 }, { "epoch": 0.05, "learning_rate": 0.00029211080898229824, "loss": 0.0302, "step": 20290 }, { "epoch": 0.05, "learning_rate": 0.00029210692076592676, "loss": 0.0352, "step": 20300 }, { "epoch": 0.05, "learning_rate": 0.0002921030325495553, "loss": 0.0471, "step": 20310 }, { "epoch": 0.05, "learning_rate": 0.00029209914433318384, "loss": 0.037, "step": 20320 }, { "epoch": 0.05, "learning_rate": 0.00029209525611681236, "loss": 0.0398, "step": 20330 }, { "epoch": 0.05, "learning_rate": 0.00029209136790044087, "loss": 0.0348, "step": 20340 }, { "epoch": 0.05, "learning_rate": 0.00029208747968406944, "loss": 0.037, "step": 20350 }, { "epoch": 0.05, "learning_rate": 0.00029208359146769795, "loss": 0.0348, "step": 20360 }, { "epoch": 0.05, "learning_rate": 0.0002920797032513265, "loss": 0.0292, "step": 20370 }, { "epoch": 0.05, "learning_rate": 0.00029207581503495504, "loss": 0.0399, "step": 20380 }, { "epoch": 0.05, "learning_rate": 0.00029207192681858355, "loss": 0.0363, "step": 20390 }, { "epoch": 0.05, "learning_rate": 0.0002920680386022121, "loss": 0.0336, "step": 20400 }, { "epoch": 0.05, "learning_rate": 0.00029206415038584064, "loss": 0.0371, "step": 20410 }, { "epoch": 0.05, "learning_rate": 0.0002920602621694692, "loss": 0.0343, "step": 20420 }, { "epoch": 0.05, "learning_rate": 0.0002920563739530977, "loss": 0.0317, "step": 20430 }, { "epoch": 0.05, "learning_rate": 0.00029205248573672623, "loss": 0.0344, "step": 20440 }, { "epoch": 0.05, "learning_rate": 0.0002920485975203548, "loss": 0.0355, "step": 20450 }, { "epoch": 0.05, "learning_rate": 0.0002920447093039833, "loss": 0.0441, "step": 20460 }, { "epoch": 0.05, "learning_rate": 0.00029204082108761183, "loss": 0.0342, "step": 20470 }, { "epoch": 0.05, "learning_rate": 0.0002920369328712404, "loss": 0.0392, "step": 20480 }, { "epoch": 0.05, "learning_rate": 0.00029203304465486897, "loss": 0.0422, "step": 20490 }, { "epoch": 0.05, "learning_rate": 0.0002920291564384975, "loss": 0.0379, "step": 20500 }, { "epoch": 0.05, "learning_rate": 0.000292025268222126, "loss": 0.0329, "step": 20510 }, { "epoch": 0.05, "learning_rate": 0.0002920213800057545, "loss": 0.0378, "step": 20520 }, { "epoch": 0.05, "learning_rate": 0.0002920174917893831, "loss": 0.0337, "step": 20530 }, { "epoch": 0.05, "learning_rate": 0.0002920136035730116, "loss": 0.0358, "step": 20540 }, { "epoch": 0.05, "learning_rate": 0.00029200971535664016, "loss": 0.0352, "step": 20550 }, { "epoch": 0.05, "learning_rate": 0.0002920058271402687, "loss": 0.0337, "step": 20560 }, { "epoch": 0.05, "learning_rate": 0.00029200193892389725, "loss": 0.0341, "step": 20570 }, { "epoch": 0.05, "learning_rate": 0.00029199805070752576, "loss": 0.0373, "step": 20580 }, { "epoch": 0.05, "learning_rate": 0.0002919941624911543, "loss": 0.0362, "step": 20590 }, { "epoch": 0.05, "learning_rate": 0.0002919902742747828, "loss": 0.0505, "step": 20600 }, { "epoch": 0.05, "learning_rate": 0.00029198638605841136, "loss": 0.0406, "step": 20610 }, { "epoch": 0.05, "learning_rate": 0.0002919824978420399, "loss": 0.0346, "step": 20620 }, { "epoch": 0.05, "learning_rate": 0.00029197860962566844, "loss": 0.0426, "step": 20630 }, { "epoch": 0.05, "learning_rate": 0.00029197472140929696, "loss": 0.0356, "step": 20640 }, { "epoch": 0.05, "learning_rate": 0.00029197083319292547, "loss": 0.039, "step": 20650 }, { "epoch": 0.05, "learning_rate": 0.00029196694497655404, "loss": 0.0404, "step": 20660 }, { "epoch": 0.05, "learning_rate": 0.00029196305676018256, "loss": 0.0374, "step": 20670 }, { "epoch": 0.05, "learning_rate": 0.00029195916854381107, "loss": 0.0349, "step": 20680 }, { "epoch": 0.05, "learning_rate": 0.00029195528032743964, "loss": 0.0457, "step": 20690 }, { "epoch": 0.05, "learning_rate": 0.0002919513921110682, "loss": 0.0317, "step": 20700 }, { "epoch": 0.05, "learning_rate": 0.0002919475038946967, "loss": 0.0341, "step": 20710 }, { "epoch": 0.05, "learning_rate": 0.00029194361567832524, "loss": 0.0348, "step": 20720 }, { "epoch": 0.05, "learning_rate": 0.00029193972746195375, "loss": 0.0367, "step": 20730 }, { "epoch": 0.05, "learning_rate": 0.0002919358392455823, "loss": 0.0376, "step": 20740 }, { "epoch": 0.05, "learning_rate": 0.00029193195102921083, "loss": 0.0309, "step": 20750 }, { "epoch": 0.05, "learning_rate": 0.0002919280628128394, "loss": 0.0364, "step": 20760 }, { "epoch": 0.05, "learning_rate": 0.0002919241745964679, "loss": 0.0367, "step": 20770 }, { "epoch": 0.05, "learning_rate": 0.0002919202863800965, "loss": 0.0385, "step": 20780 }, { "epoch": 0.05, "learning_rate": 0.000291916398163725, "loss": 0.0486, "step": 20790 }, { "epoch": 0.05, "learning_rate": 0.0002919125099473535, "loss": 0.0373, "step": 20800 }, { "epoch": 0.05, "learning_rate": 0.00029190862173098203, "loss": 0.0353, "step": 20810 }, { "epoch": 0.05, "learning_rate": 0.0002919047335146106, "loss": 0.0388, "step": 20820 }, { "epoch": 0.05, "learning_rate": 0.0002919008452982391, "loss": 0.0368, "step": 20830 }, { "epoch": 0.05, "learning_rate": 0.0002918969570818677, "loss": 0.0323, "step": 20840 }, { "epoch": 0.05, "learning_rate": 0.0002918930688654962, "loss": 0.0404, "step": 20850 }, { "epoch": 0.05, "learning_rate": 0.0002918891806491247, "loss": 0.0334, "step": 20860 }, { "epoch": 0.05, "learning_rate": 0.0002918852924327533, "loss": 0.0344, "step": 20870 }, { "epoch": 0.05, "learning_rate": 0.0002918814042163818, "loss": 0.0366, "step": 20880 }, { "epoch": 0.05, "learning_rate": 0.00029187751600001036, "loss": 0.0553, "step": 20890 }, { "epoch": 0.05, "learning_rate": 0.0002918736277836389, "loss": 0.0316, "step": 20900 }, { "epoch": 0.05, "learning_rate": 0.00029186973956726745, "loss": 0.0348, "step": 20910 }, { "epoch": 0.05, "learning_rate": 0.00029186585135089596, "loss": 0.0324, "step": 20920 }, { "epoch": 0.05, "learning_rate": 0.0002918619631345245, "loss": 0.0363, "step": 20930 }, { "epoch": 0.05, "learning_rate": 0.000291858074918153, "loss": 0.0365, "step": 20940 }, { "epoch": 0.05, "learning_rate": 0.00029185418670178156, "loss": 0.0352, "step": 20950 }, { "epoch": 0.05, "learning_rate": 0.0002918502984854101, "loss": 0.0304, "step": 20960 }, { "epoch": 0.05, "learning_rate": 0.00029184641026903864, "loss": 0.0368, "step": 20970 }, { "epoch": 0.05, "learning_rate": 0.00029184252205266716, "loss": 0.0444, "step": 20980 }, { "epoch": 0.05, "learning_rate": 0.0002918386338362957, "loss": 0.0391, "step": 20990 }, { "epoch": 0.05, "learning_rate": 0.00029183474561992424, "loss": 0.0391, "step": 21000 }, { "epoch": 0.05, "eval_cer": 0.8818048598193629, "eval_loss": 0.026714030653238297, "eval_runtime": 107.7623, "eval_samples_per_second": 18.559, "eval_steps_per_second": 4.64, "step": 21000 }, { "epoch": 0.05, "learning_rate": 0.00029183085740355275, "loss": 0.0367, "step": 21010 }, { "epoch": 0.05, "learning_rate": 0.00029182696918718127, "loss": 0.0383, "step": 21020 }, { "epoch": 0.05, "learning_rate": 0.00029182308097080984, "loss": 0.0365, "step": 21030 }, { "epoch": 0.05, "learning_rate": 0.0002918191927544384, "loss": 0.0391, "step": 21040 }, { "epoch": 0.05, "learning_rate": 0.0002918153045380669, "loss": 0.0364, "step": 21050 }, { "epoch": 0.05, "learning_rate": 0.00029181141632169544, "loss": 0.0309, "step": 21060 }, { "epoch": 0.05, "learning_rate": 0.000291807528105324, "loss": 0.0314, "step": 21070 }, { "epoch": 0.05, "learning_rate": 0.0002918036398889525, "loss": 0.032, "step": 21080 }, { "epoch": 0.05, "learning_rate": 0.00029179975167258103, "loss": 0.0389, "step": 21090 }, { "epoch": 0.05, "learning_rate": 0.0002917958634562096, "loss": 0.0424, "step": 21100 }, { "epoch": 0.05, "learning_rate": 0.0002917919752398381, "loss": 0.0404, "step": 21110 }, { "epoch": 0.05, "learning_rate": 0.0002917880870234667, "loss": 0.0486, "step": 21120 }, { "epoch": 0.05, "learning_rate": 0.0002917841988070952, "loss": 0.0334, "step": 21130 }, { "epoch": 0.05, "learning_rate": 0.0002917803105907237, "loss": 0.0399, "step": 21140 }, { "epoch": 0.05, "learning_rate": 0.00029177642237435223, "loss": 0.0322, "step": 21150 }, { "epoch": 0.05, "learning_rate": 0.0002917725341579808, "loss": 0.0335, "step": 21160 }, { "epoch": 0.05, "learning_rate": 0.0002917686459416093, "loss": 0.0325, "step": 21170 }, { "epoch": 0.05, "learning_rate": 0.0002917647577252379, "loss": 0.0328, "step": 21180 }, { "epoch": 0.05, "learning_rate": 0.0002917608695088664, "loss": 0.0362, "step": 21190 }, { "epoch": 0.05, "learning_rate": 0.00029175698129249496, "loss": 0.0343, "step": 21200 }, { "epoch": 0.05, "learning_rate": 0.0002917530930761235, "loss": 0.0327, "step": 21210 }, { "epoch": 0.06, "learning_rate": 0.000291749204859752, "loss": 0.0313, "step": 21220 }, { "epoch": 0.06, "learning_rate": 0.0002917453166433805, "loss": 0.0376, "step": 21230 }, { "epoch": 0.06, "learning_rate": 0.0002917414284270091, "loss": 0.0405, "step": 21240 }, { "epoch": 0.06, "learning_rate": 0.00029173754021063765, "loss": 0.0379, "step": 21250 }, { "epoch": 0.06, "learning_rate": 0.00029173365199426616, "loss": 0.0343, "step": 21260 }, { "epoch": 0.06, "learning_rate": 0.0002917297637778947, "loss": 0.0393, "step": 21270 }, { "epoch": 0.06, "learning_rate": 0.00029172587556152324, "loss": 0.0396, "step": 21280 }, { "epoch": 0.06, "learning_rate": 0.00029172198734515176, "loss": 0.0369, "step": 21290 }, { "epoch": 0.06, "learning_rate": 0.00029171809912878027, "loss": 0.035, "step": 21300 }, { "epoch": 0.06, "learning_rate": 0.00029171421091240884, "loss": 0.0367, "step": 21310 }, { "epoch": 0.06, "learning_rate": 0.00029171032269603736, "loss": 0.0353, "step": 21320 }, { "epoch": 0.06, "learning_rate": 0.0002917064344796659, "loss": 0.0388, "step": 21330 }, { "epoch": 0.06, "learning_rate": 0.00029170254626329444, "loss": 0.0387, "step": 21340 }, { "epoch": 0.06, "learning_rate": 0.00029169865804692295, "loss": 0.0492, "step": 21350 }, { "epoch": 0.06, "learning_rate": 0.00029169476983055147, "loss": 0.0423, "step": 21360 }, { "epoch": 0.06, "learning_rate": 0.00029169088161418004, "loss": 0.0462, "step": 21370 }, { "epoch": 0.06, "learning_rate": 0.00029168699339780855, "loss": 0.0476, "step": 21380 }, { "epoch": 0.06, "learning_rate": 0.0002916831051814371, "loss": 0.0407, "step": 21390 }, { "epoch": 0.06, "learning_rate": 0.00029167921696506563, "loss": 0.037, "step": 21400 }, { "epoch": 0.06, "learning_rate": 0.0002916753287486942, "loss": 0.0374, "step": 21410 }, { "epoch": 0.06, "learning_rate": 0.0002916714405323227, "loss": 0.0391, "step": 21420 }, { "epoch": 0.06, "learning_rate": 0.00029166755231595123, "loss": 0.0697, "step": 21430 }, { "epoch": 0.06, "learning_rate": 0.0002916636640995798, "loss": 0.0597, "step": 21440 }, { "epoch": 0.06, "learning_rate": 0.0002916597758832083, "loss": 0.0395, "step": 21450 }, { "epoch": 0.06, "learning_rate": 0.0002916558876668369, "loss": 0.0405, "step": 21460 }, { "epoch": 0.06, "learning_rate": 0.0002916519994504654, "loss": 0.0361, "step": 21470 }, { "epoch": 0.06, "learning_rate": 0.0002916481112340939, "loss": 0.0364, "step": 21480 }, { "epoch": 0.06, "learning_rate": 0.0002916442230177225, "loss": 0.0363, "step": 21490 }, { "epoch": 0.06, "learning_rate": 0.000291640334801351, "loss": 0.0324, "step": 21500 }, { "epoch": 0.06, "learning_rate": 0.0002916364465849795, "loss": 0.0314, "step": 21510 }, { "epoch": 0.06, "learning_rate": 0.0002916325583686081, "loss": 0.0352, "step": 21520 }, { "epoch": 0.06, "learning_rate": 0.0002916286701522366, "loss": 0.0442, "step": 21530 }, { "epoch": 0.06, "learning_rate": 0.00029162478193586516, "loss": 0.0365, "step": 21540 }, { "epoch": 0.06, "learning_rate": 0.0002916208937194937, "loss": 0.0354, "step": 21550 }, { "epoch": 0.06, "learning_rate": 0.0002916170055031222, "loss": 0.0343, "step": 21560 }, { "epoch": 0.06, "learning_rate": 0.00029161311728675076, "loss": 0.038, "step": 21570 }, { "epoch": 0.06, "learning_rate": 0.0002916092290703793, "loss": 0.0332, "step": 21580 }, { "epoch": 0.06, "learning_rate": 0.00029160534085400784, "loss": 0.0351, "step": 21590 }, { "epoch": 0.06, "learning_rate": 0.00029160145263763636, "loss": 0.0393, "step": 21600 }, { "epoch": 0.06, "learning_rate": 0.0002915975644212649, "loss": 0.031, "step": 21610 }, { "epoch": 0.06, "learning_rate": 0.00029159367620489344, "loss": 0.0403, "step": 21620 }, { "epoch": 0.06, "learning_rate": 0.00029158978798852196, "loss": 0.0412, "step": 21630 }, { "epoch": 0.06, "learning_rate": 0.00029158589977215047, "loss": 0.0374, "step": 21640 }, { "epoch": 0.06, "learning_rate": 0.00029158201155577904, "loss": 0.0392, "step": 21650 }, { "epoch": 0.06, "learning_rate": 0.00029157812333940755, "loss": 0.0391, "step": 21660 }, { "epoch": 0.06, "learning_rate": 0.0002915742351230361, "loss": 0.0342, "step": 21670 }, { "epoch": 0.06, "learning_rate": 0.00029157034690666464, "loss": 0.0519, "step": 21680 }, { "epoch": 0.06, "learning_rate": 0.00029156645869029315, "loss": 0.0392, "step": 21690 }, { "epoch": 0.06, "learning_rate": 0.0002915625704739217, "loss": 0.0368, "step": 21700 }, { "epoch": 0.06, "learning_rate": 0.00029155868225755024, "loss": 0.0525, "step": 21710 }, { "epoch": 0.06, "learning_rate": 0.00029155479404117875, "loss": 0.0381, "step": 21720 }, { "epoch": 0.06, "learning_rate": 0.0002915509058248073, "loss": 0.0399, "step": 21730 }, { "epoch": 0.06, "learning_rate": 0.0002915470176084359, "loss": 0.0349, "step": 21740 }, { "epoch": 0.06, "learning_rate": 0.0002915431293920644, "loss": 0.0368, "step": 21750 }, { "epoch": 0.06, "learning_rate": 0.0002915392411756929, "loss": 0.0398, "step": 21760 }, { "epoch": 0.06, "learning_rate": 0.00029153535295932143, "loss": 0.0389, "step": 21770 }, { "epoch": 0.06, "learning_rate": 0.00029153146474295, "loss": 0.051, "step": 21780 }, { "epoch": 0.06, "learning_rate": 0.0002915275765265785, "loss": 0.0418, "step": 21790 }, { "epoch": 0.06, "learning_rate": 0.0002915236883102071, "loss": 0.0367, "step": 21800 }, { "epoch": 0.06, "learning_rate": 0.0002915198000938356, "loss": 0.0485, "step": 21810 }, { "epoch": 0.06, "learning_rate": 0.00029151591187746417, "loss": 0.037, "step": 21820 }, { "epoch": 0.06, "learning_rate": 0.0002915120236610927, "loss": 0.0344, "step": 21830 }, { "epoch": 0.06, "learning_rate": 0.0002915081354447212, "loss": 0.0413, "step": 21840 }, { "epoch": 0.06, "learning_rate": 0.0002915042472283497, "loss": 0.0398, "step": 21850 }, { "epoch": 0.06, "learning_rate": 0.0002915003590119783, "loss": 0.039, "step": 21860 }, { "epoch": 0.06, "learning_rate": 0.0002914964707956068, "loss": 0.0343, "step": 21870 }, { "epoch": 0.06, "learning_rate": 0.00029149258257923536, "loss": 0.034, "step": 21880 }, { "epoch": 0.06, "learning_rate": 0.0002914886943628639, "loss": 0.0396, "step": 21890 }, { "epoch": 0.06, "learning_rate": 0.0002914848061464924, "loss": 0.0346, "step": 21900 }, { "epoch": 0.06, "learning_rate": 0.00029148091793012096, "loss": 0.0352, "step": 21910 }, { "epoch": 0.06, "learning_rate": 0.0002914770297137495, "loss": 0.046, "step": 21920 }, { "epoch": 0.06, "learning_rate": 0.000291473141497378, "loss": 0.0363, "step": 21930 }, { "epoch": 0.06, "learning_rate": 0.00029146925328100656, "loss": 0.0429, "step": 21940 }, { "epoch": 0.06, "learning_rate": 0.0002914653650646351, "loss": 0.0336, "step": 21950 }, { "epoch": 0.06, "learning_rate": 0.00029146147684826364, "loss": 0.0381, "step": 21960 }, { "epoch": 0.06, "learning_rate": 0.00029145758863189216, "loss": 0.0368, "step": 21970 }, { "epoch": 0.06, "learning_rate": 0.00029145370041552067, "loss": 0.0387, "step": 21980 }, { "epoch": 0.06, "learning_rate": 0.00029144981219914924, "loss": 0.0389, "step": 21990 }, { "epoch": 0.06, "learning_rate": 0.00029144592398277775, "loss": 0.0383, "step": 22000 }, { "epoch": 0.06, "eval_cer": 0.8817894638130869, "eval_loss": 0.02770763821899891, "eval_runtime": 107.5949, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 22000 }, { "epoch": 0.06, "learning_rate": 0.0002914420357664063, "loss": 0.0393, "step": 22010 }, { "epoch": 0.06, "learning_rate": 0.00029143814755003484, "loss": 0.0345, "step": 22020 }, { "epoch": 0.06, "learning_rate": 0.0002914342593336634, "loss": 0.0346, "step": 22030 }, { "epoch": 0.06, "learning_rate": 0.0002914303711172919, "loss": 0.0375, "step": 22040 }, { "epoch": 0.06, "learning_rate": 0.00029142648290092043, "loss": 0.0361, "step": 22050 }, { "epoch": 0.06, "learning_rate": 0.00029142259468454895, "loss": 0.0372, "step": 22060 }, { "epoch": 0.06, "learning_rate": 0.0002914187064681775, "loss": 0.0408, "step": 22070 }, { "epoch": 0.06, "learning_rate": 0.0002914148182518061, "loss": 0.039, "step": 22080 }, { "epoch": 0.06, "learning_rate": 0.0002914109300354346, "loss": 0.0367, "step": 22090 }, { "epoch": 0.06, "learning_rate": 0.0002914070418190631, "loss": 0.0401, "step": 22100 }, { "epoch": 0.06, "learning_rate": 0.00029140315360269163, "loss": 0.0365, "step": 22110 }, { "epoch": 0.06, "learning_rate": 0.0002913992653863202, "loss": 0.0398, "step": 22120 }, { "epoch": 0.06, "learning_rate": 0.0002913953771699487, "loss": 0.0327, "step": 22130 }, { "epoch": 0.06, "learning_rate": 0.0002913914889535773, "loss": 0.0374, "step": 22140 }, { "epoch": 0.06, "learning_rate": 0.0002913876007372058, "loss": 0.0284, "step": 22150 }, { "epoch": 0.06, "learning_rate": 0.00029138371252083437, "loss": 0.0356, "step": 22160 }, { "epoch": 0.06, "learning_rate": 0.0002913798243044629, "loss": 0.0363, "step": 22170 }, { "epoch": 0.06, "learning_rate": 0.0002913759360880914, "loss": 0.0389, "step": 22180 }, { "epoch": 0.06, "learning_rate": 0.0002913720478717199, "loss": 0.0423, "step": 22190 }, { "epoch": 0.06, "learning_rate": 0.0002913681596553485, "loss": 0.0353, "step": 22200 }, { "epoch": 0.06, "learning_rate": 0.000291364271438977, "loss": 0.0359, "step": 22210 }, { "epoch": 0.06, "learning_rate": 0.00029136038322260556, "loss": 0.0439, "step": 22220 }, { "epoch": 0.06, "learning_rate": 0.0002913564950062341, "loss": 0.032, "step": 22230 }, { "epoch": 0.06, "learning_rate": 0.00029135260678986264, "loss": 0.0354, "step": 22240 }, { "epoch": 0.06, "learning_rate": 0.00029134871857349116, "loss": 0.0371, "step": 22250 }, { "epoch": 0.06, "learning_rate": 0.0002913448303571197, "loss": 0.0398, "step": 22260 }, { "epoch": 0.06, "learning_rate": 0.0002913409421407482, "loss": 0.0393, "step": 22270 }, { "epoch": 0.06, "learning_rate": 0.00029133705392437676, "loss": 0.032, "step": 22280 }, { "epoch": 0.06, "learning_rate": 0.0002913331657080053, "loss": 0.0398, "step": 22290 }, { "epoch": 0.06, "learning_rate": 0.00029132927749163384, "loss": 0.0361, "step": 22300 }, { "epoch": 0.06, "learning_rate": 0.00029132538927526235, "loss": 0.0414, "step": 22310 }, { "epoch": 0.06, "learning_rate": 0.0002913215010588909, "loss": 0.0333, "step": 22320 }, { "epoch": 0.06, "learning_rate": 0.00029131761284251944, "loss": 0.0355, "step": 22330 }, { "epoch": 0.06, "learning_rate": 0.00029131372462614795, "loss": 0.0386, "step": 22340 }, { "epoch": 0.06, "learning_rate": 0.0002913098364097765, "loss": 0.0365, "step": 22350 }, { "epoch": 0.06, "learning_rate": 0.00029130594819340504, "loss": 0.0343, "step": 22360 }, { "epoch": 0.06, "learning_rate": 0.0002913020599770336, "loss": 0.0365, "step": 22370 }, { "epoch": 0.06, "learning_rate": 0.0002912981717606621, "loss": 0.0327, "step": 22380 }, { "epoch": 0.06, "learning_rate": 0.00029129428354429063, "loss": 0.035, "step": 22390 }, { "epoch": 0.06, "learning_rate": 0.00029129039532791915, "loss": 0.0387, "step": 22400 }, { "epoch": 0.06, "learning_rate": 0.0002912865071115477, "loss": 0.0317, "step": 22410 }, { "epoch": 0.06, "learning_rate": 0.00029128261889517623, "loss": 0.0345, "step": 22420 }, { "epoch": 0.06, "learning_rate": 0.0002912787306788048, "loss": 0.0323, "step": 22430 }, { "epoch": 0.06, "learning_rate": 0.0002912748424624333, "loss": 0.033, "step": 22440 }, { "epoch": 0.06, "learning_rate": 0.0002912709542460619, "loss": 0.0362, "step": 22450 }, { "epoch": 0.06, "learning_rate": 0.0002912670660296904, "loss": 0.0278, "step": 22460 }, { "epoch": 0.06, "learning_rate": 0.0002912631778133189, "loss": 0.0346, "step": 22470 }, { "epoch": 0.06, "learning_rate": 0.0002912592895969475, "loss": 0.0378, "step": 22480 }, { "epoch": 0.06, "learning_rate": 0.000291255401380576, "loss": 0.0334, "step": 22490 }, { "epoch": 0.06, "learning_rate": 0.00029125151316420456, "loss": 0.029, "step": 22500 }, { "epoch": 0.06, "learning_rate": 0.0002912476249478331, "loss": 0.0321, "step": 22510 }, { "epoch": 0.06, "learning_rate": 0.0002912437367314616, "loss": 0.0355, "step": 22520 }, { "epoch": 0.06, "learning_rate": 0.00029123984851509016, "loss": 0.0375, "step": 22530 }, { "epoch": 0.06, "learning_rate": 0.0002912359602987187, "loss": 0.0295, "step": 22540 }, { "epoch": 0.06, "learning_rate": 0.0002912320720823472, "loss": 0.032, "step": 22550 }, { "epoch": 0.06, "learning_rate": 0.00029122818386597576, "loss": 0.0368, "step": 22560 }, { "epoch": 0.06, "learning_rate": 0.0002912242956496043, "loss": 0.0315, "step": 22570 }, { "epoch": 0.06, "learning_rate": 0.00029122040743323284, "loss": 0.034, "step": 22580 }, { "epoch": 0.06, "learning_rate": 0.00029121651921686136, "loss": 0.0398, "step": 22590 }, { "epoch": 0.06, "learning_rate": 0.00029121263100048987, "loss": 0.0338, "step": 22600 }, { "epoch": 0.06, "learning_rate": 0.0002912087427841184, "loss": 0.0363, "step": 22610 }, { "epoch": 0.06, "learning_rate": 0.00029120485456774696, "loss": 0.0246, "step": 22620 }, { "epoch": 0.06, "learning_rate": 0.0002912009663513755, "loss": 0.0397, "step": 22630 }, { "epoch": 0.06, "learning_rate": 0.00029119707813500404, "loss": 0.0357, "step": 22640 }, { "epoch": 0.06, "learning_rate": 0.00029119318991863255, "loss": 0.0426, "step": 22650 }, { "epoch": 0.06, "learning_rate": 0.0002911893017022611, "loss": 0.0436, "step": 22660 }, { "epoch": 0.06, "learning_rate": 0.00029118541348588964, "loss": 0.0381, "step": 22670 }, { "epoch": 0.06, "learning_rate": 0.00029118152526951815, "loss": 0.0376, "step": 22680 }, { "epoch": 0.06, "learning_rate": 0.0002911776370531467, "loss": 0.0375, "step": 22690 }, { "epoch": 0.06, "learning_rate": 0.00029117374883677523, "loss": 0.0345, "step": 22700 }, { "epoch": 0.06, "learning_rate": 0.0002911698606204038, "loss": 0.033, "step": 22710 }, { "epoch": 0.06, "learning_rate": 0.0002911659724040323, "loss": 0.0296, "step": 22720 }, { "epoch": 0.06, "learning_rate": 0.00029116208418766083, "loss": 0.0367, "step": 22730 }, { "epoch": 0.06, "learning_rate": 0.0002911581959712894, "loss": 0.0406, "step": 22740 }, { "epoch": 0.06, "learning_rate": 0.0002911543077549179, "loss": 0.0351, "step": 22750 }, { "epoch": 0.06, "learning_rate": 0.00029115041953854643, "loss": 0.0339, "step": 22760 }, { "epoch": 0.06, "learning_rate": 0.000291146531322175, "loss": 0.0373, "step": 22770 }, { "epoch": 0.06, "learning_rate": 0.00029114264310580357, "loss": 0.0302, "step": 22780 }, { "epoch": 0.06, "learning_rate": 0.0002911387548894321, "loss": 0.0363, "step": 22790 }, { "epoch": 0.06, "learning_rate": 0.0002911348666730606, "loss": 0.0351, "step": 22800 }, { "epoch": 0.06, "learning_rate": 0.0002911309784566891, "loss": 0.0439, "step": 22810 }, { "epoch": 0.06, "learning_rate": 0.0002911270902403177, "loss": 0.0315, "step": 22820 }, { "epoch": 0.06, "learning_rate": 0.0002911232020239462, "loss": 0.0379, "step": 22830 }, { "epoch": 0.06, "learning_rate": 0.00029111931380757476, "loss": 0.0329, "step": 22840 }, { "epoch": 0.06, "learning_rate": 0.0002911154255912033, "loss": 0.0483, "step": 22850 }, { "epoch": 0.06, "learning_rate": 0.0002911115373748318, "loss": 0.0308, "step": 22860 }, { "epoch": 0.06, "learning_rate": 0.00029110764915846036, "loss": 0.029, "step": 22870 }, { "epoch": 0.06, "learning_rate": 0.0002911037609420889, "loss": 0.034, "step": 22880 }, { "epoch": 0.06, "learning_rate": 0.0002910998727257174, "loss": 0.0383, "step": 22890 }, { "epoch": 0.06, "learning_rate": 0.00029109598450934596, "loss": 0.0357, "step": 22900 }, { "epoch": 0.06, "learning_rate": 0.0002910920962929745, "loss": 0.0347, "step": 22910 }, { "epoch": 0.06, "learning_rate": 0.00029108820807660304, "loss": 0.0346, "step": 22920 }, { "epoch": 0.06, "learning_rate": 0.00029108431986023156, "loss": 0.0369, "step": 22930 }, { "epoch": 0.06, "learning_rate": 0.00029108043164386007, "loss": 0.0324, "step": 22940 }, { "epoch": 0.06, "learning_rate": 0.00029107654342748864, "loss": 0.0383, "step": 22950 }, { "epoch": 0.06, "learning_rate": 0.00029107265521111715, "loss": 0.0357, "step": 22960 }, { "epoch": 0.06, "learning_rate": 0.00029106876699474567, "loss": 0.0325, "step": 22970 }, { "epoch": 0.06, "learning_rate": 0.00029106487877837424, "loss": 0.0357, "step": 22980 }, { "epoch": 0.06, "learning_rate": 0.0002910609905620028, "loss": 0.0404, "step": 22990 }, { "epoch": 0.06, "learning_rate": 0.0002910571023456313, "loss": 0.0407, "step": 23000 }, { "epoch": 0.06, "eval_cer": 0.881821655462573, "eval_loss": 0.026583530008792877, "eval_runtime": 107.715, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 23000 }, { "epoch": 0.06, "learning_rate": 0.00029105321412925984, "loss": 0.0304, "step": 23010 }, { "epoch": 0.06, "learning_rate": 0.00029104932591288835, "loss": 0.0353, "step": 23020 }, { "epoch": 0.06, "learning_rate": 0.0002910454376965169, "loss": 0.0423, "step": 23030 }, { "epoch": 0.06, "learning_rate": 0.00029104154948014543, "loss": 0.033, "step": 23040 }, { "epoch": 0.06, "learning_rate": 0.000291037661263774, "loss": 0.0331, "step": 23050 }, { "epoch": 0.06, "learning_rate": 0.0002910337730474025, "loss": 0.033, "step": 23060 }, { "epoch": 0.06, "learning_rate": 0.0002910298848310311, "loss": 0.0311, "step": 23070 }, { "epoch": 0.06, "learning_rate": 0.0002910259966146596, "loss": 0.0355, "step": 23080 }, { "epoch": 0.06, "learning_rate": 0.0002910221083982881, "loss": 0.0333, "step": 23090 }, { "epoch": 0.06, "learning_rate": 0.00029101822018191663, "loss": 0.0322, "step": 23100 }, { "epoch": 0.06, "learning_rate": 0.0002910143319655452, "loss": 0.0355, "step": 23110 }, { "epoch": 0.06, "learning_rate": 0.0002910104437491737, "loss": 0.0412, "step": 23120 }, { "epoch": 0.06, "learning_rate": 0.0002910065555328023, "loss": 0.0379, "step": 23130 }, { "epoch": 0.06, "learning_rate": 0.0002910026673164308, "loss": 0.0381, "step": 23140 }, { "epoch": 0.06, "learning_rate": 0.0002909987791000593, "loss": 0.0463, "step": 23150 }, { "epoch": 0.06, "learning_rate": 0.0002909948908836879, "loss": 0.0425, "step": 23160 }, { "epoch": 0.06, "learning_rate": 0.0002909910026673164, "loss": 0.0429, "step": 23170 }, { "epoch": 0.06, "learning_rate": 0.00029098711445094496, "loss": 0.0347, "step": 23180 }, { "epoch": 0.06, "learning_rate": 0.0002909832262345735, "loss": 0.0327, "step": 23190 }, { "epoch": 0.06, "learning_rate": 0.00029097933801820205, "loss": 0.0371, "step": 23200 }, { "epoch": 0.06, "learning_rate": 0.00029097544980183056, "loss": 0.0342, "step": 23210 }, { "epoch": 0.06, "learning_rate": 0.0002909715615854591, "loss": 0.0349, "step": 23220 }, { "epoch": 0.06, "learning_rate": 0.0002909676733690876, "loss": 0.0408, "step": 23230 }, { "epoch": 0.06, "learning_rate": 0.00029096378515271616, "loss": 0.0324, "step": 23240 }, { "epoch": 0.06, "learning_rate": 0.00029095989693634467, "loss": 0.0363, "step": 23250 }, { "epoch": 0.06, "learning_rate": 0.00029095600871997324, "loss": 0.0351, "step": 23260 }, { "epoch": 0.06, "learning_rate": 0.00029095212050360176, "loss": 0.0372, "step": 23270 }, { "epoch": 0.06, "learning_rate": 0.0002909482322872303, "loss": 0.0325, "step": 23280 }, { "epoch": 0.06, "learning_rate": 0.00029094434407085884, "loss": 0.0359, "step": 23290 }, { "epoch": 0.06, "learning_rate": 0.00029094045585448735, "loss": 0.0383, "step": 23300 }, { "epoch": 0.06, "learning_rate": 0.00029093656763811587, "loss": 0.0431, "step": 23310 }, { "epoch": 0.06, "learning_rate": 0.00029093267942174444, "loss": 0.0349, "step": 23320 }, { "epoch": 0.06, "learning_rate": 0.000290928791205373, "loss": 0.0317, "step": 23330 }, { "epoch": 0.06, "learning_rate": 0.0002909249029890015, "loss": 0.0365, "step": 23340 }, { "epoch": 0.06, "learning_rate": 0.00029092101477263003, "loss": 0.0377, "step": 23350 }, { "epoch": 0.06, "learning_rate": 0.00029091712655625855, "loss": 0.0302, "step": 23360 }, { "epoch": 0.06, "learning_rate": 0.0002909132383398871, "loss": 0.0395, "step": 23370 }, { "epoch": 0.06, "learning_rate": 0.00029090935012351563, "loss": 0.0347, "step": 23380 }, { "epoch": 0.06, "learning_rate": 0.0002909054619071442, "loss": 0.0308, "step": 23390 }, { "epoch": 0.06, "learning_rate": 0.0002909015736907727, "loss": 0.0377, "step": 23400 }, { "epoch": 0.06, "learning_rate": 0.0002908976854744013, "loss": 0.0349, "step": 23410 }, { "epoch": 0.06, "learning_rate": 0.0002908937972580298, "loss": 0.0347, "step": 23420 }, { "epoch": 0.06, "learning_rate": 0.0002908899090416583, "loss": 0.0363, "step": 23430 }, { "epoch": 0.06, "learning_rate": 0.00029088602082528683, "loss": 0.0345, "step": 23440 }, { "epoch": 0.06, "learning_rate": 0.0002908821326089154, "loss": 0.034, "step": 23450 }, { "epoch": 0.06, "learning_rate": 0.0002908782443925439, "loss": 0.0281, "step": 23460 }, { "epoch": 0.06, "learning_rate": 0.0002908743561761725, "loss": 0.0398, "step": 23470 }, { "epoch": 0.06, "learning_rate": 0.000290870467959801, "loss": 0.0387, "step": 23480 }, { "epoch": 0.06, "learning_rate": 0.00029086657974342956, "loss": 0.037, "step": 23490 }, { "epoch": 0.06, "learning_rate": 0.0002908626915270581, "loss": 0.0396, "step": 23500 }, { "epoch": 0.06, "learning_rate": 0.0002908588033106866, "loss": 0.0428, "step": 23510 }, { "epoch": 0.06, "learning_rate": 0.0002908549150943151, "loss": 0.0331, "step": 23520 }, { "epoch": 0.06, "learning_rate": 0.0002908510268779437, "loss": 0.0489, "step": 23530 }, { "epoch": 0.06, "learning_rate": 0.00029084713866157224, "loss": 0.0399, "step": 23540 }, { "epoch": 0.06, "learning_rate": 0.00029084325044520076, "loss": 0.0437, "step": 23550 }, { "epoch": 0.06, "learning_rate": 0.0002908393622288293, "loss": 0.0319, "step": 23560 }, { "epoch": 0.06, "learning_rate": 0.00029083547401245784, "loss": 0.0296, "step": 23570 }, { "epoch": 0.06, "learning_rate": 0.00029083158579608636, "loss": 0.0296, "step": 23580 }, { "epoch": 0.06, "learning_rate": 0.00029082769757971487, "loss": 0.0374, "step": 23590 }, { "epoch": 0.06, "learning_rate": 0.00029082380936334344, "loss": 0.035, "step": 23600 }, { "epoch": 0.06, "learning_rate": 0.00029081992114697195, "loss": 0.032, "step": 23610 }, { "epoch": 0.06, "learning_rate": 0.0002908160329306005, "loss": 0.0313, "step": 23620 }, { "epoch": 0.06, "learning_rate": 0.00029081214471422904, "loss": 0.0316, "step": 23630 }, { "epoch": 0.06, "learning_rate": 0.00029080825649785755, "loss": 0.0382, "step": 23640 }, { "epoch": 0.06, "learning_rate": 0.00029080436828148607, "loss": 0.0368, "step": 23650 }, { "epoch": 0.06, "learning_rate": 0.00029080048006511464, "loss": 0.0321, "step": 23660 }, { "epoch": 0.06, "learning_rate": 0.00029079659184874315, "loss": 0.0324, "step": 23670 }, { "epoch": 0.06, "learning_rate": 0.0002907927036323717, "loss": 0.037, "step": 23680 }, { "epoch": 0.06, "learning_rate": 0.00029078881541600023, "loss": 0.0368, "step": 23690 }, { "epoch": 0.06, "learning_rate": 0.0002907849271996288, "loss": 0.0371, "step": 23700 }, { "epoch": 0.06, "learning_rate": 0.0002907810389832573, "loss": 0.0313, "step": 23710 }, { "epoch": 0.06, "learning_rate": 0.00029077715076688583, "loss": 0.0296, "step": 23720 }, { "epoch": 0.06, "learning_rate": 0.0002907732625505144, "loss": 0.0345, "step": 23730 }, { "epoch": 0.06, "learning_rate": 0.0002907693743341429, "loss": 0.0359, "step": 23740 }, { "epoch": 0.06, "learning_rate": 0.0002907654861177715, "loss": 0.0309, "step": 23750 }, { "epoch": 0.06, "learning_rate": 0.0002907615979014, "loss": 0.0358, "step": 23760 }, { "epoch": 0.06, "learning_rate": 0.0002907577096850285, "loss": 0.0363, "step": 23770 }, { "epoch": 0.06, "learning_rate": 0.0002907538214686571, "loss": 0.0312, "step": 23780 }, { "epoch": 0.06, "learning_rate": 0.0002907499332522856, "loss": 0.0277, "step": 23790 }, { "epoch": 0.06, "learning_rate": 0.0002907460450359141, "loss": 0.0371, "step": 23800 }, { "epoch": 0.06, "learning_rate": 0.0002907421568195427, "loss": 0.0309, "step": 23810 }, { "epoch": 0.06, "learning_rate": 0.0002907382686031712, "loss": 0.0385, "step": 23820 }, { "epoch": 0.06, "learning_rate": 0.00029073438038679976, "loss": 0.0413, "step": 23830 }, { "epoch": 0.06, "learning_rate": 0.0002907304921704283, "loss": 0.0332, "step": 23840 }, { "epoch": 0.06, "learning_rate": 0.0002907266039540568, "loss": 0.0336, "step": 23850 }, { "epoch": 0.06, "learning_rate": 0.0002907227157376853, "loss": 0.0318, "step": 23860 }, { "epoch": 0.06, "learning_rate": 0.0002907188275213139, "loss": 0.0324, "step": 23870 }, { "epoch": 0.06, "learning_rate": 0.00029071493930494244, "loss": 0.0369, "step": 23880 }, { "epoch": 0.06, "learning_rate": 0.00029071105108857096, "loss": 0.0363, "step": 23890 }, { "epoch": 0.06, "learning_rate": 0.00029070716287219947, "loss": 0.0382, "step": 23900 }, { "epoch": 0.06, "learning_rate": 0.00029070327465582804, "loss": 0.0334, "step": 23910 }, { "epoch": 0.06, "learning_rate": 0.00029069938643945656, "loss": 0.0373, "step": 23920 }, { "epoch": 0.06, "learning_rate": 0.00029069549822308507, "loss": 0.0374, "step": 23930 }, { "epoch": 0.06, "learning_rate": 0.00029069161000671364, "loss": 0.0345, "step": 23940 }, { "epoch": 0.06, "learning_rate": 0.00029068772179034215, "loss": 0.0337, "step": 23950 }, { "epoch": 0.06, "learning_rate": 0.0002906838335739707, "loss": 0.0361, "step": 23960 }, { "epoch": 0.06, "learning_rate": 0.00029067994535759924, "loss": 0.0373, "step": 23970 }, { "epoch": 0.06, "learning_rate": 0.00029067605714122775, "loss": 0.032, "step": 23980 }, { "epoch": 0.06, "learning_rate": 0.0002906721689248563, "loss": 0.0345, "step": 23990 }, { "epoch": 0.06, "learning_rate": 0.00029066828070848483, "loss": 0.0354, "step": 24000 }, { "epoch": 0.06, "eval_cer": 0.8818426500165857, "eval_loss": 0.02564888820052147, "eval_runtime": 107.6719, "eval_samples_per_second": 18.575, "eval_steps_per_second": 4.644, "step": 24000 }, { "epoch": 0.06, "learning_rate": 0.00029066439249211335, "loss": 0.0351, "step": 24010 }, { "epoch": 0.06, "learning_rate": 0.0002906605042757419, "loss": 0.0405, "step": 24020 }, { "epoch": 0.06, "learning_rate": 0.0002906566160593705, "loss": 0.0434, "step": 24030 }, { "epoch": 0.06, "learning_rate": 0.000290652727842999, "loss": 0.041, "step": 24040 }, { "epoch": 0.06, "learning_rate": 0.0002906488396266275, "loss": 0.0341, "step": 24050 }, { "epoch": 0.06, "learning_rate": 0.00029064495141025603, "loss": 0.0342, "step": 24060 }, { "epoch": 0.06, "learning_rate": 0.0002906410631938846, "loss": 0.0389, "step": 24070 }, { "epoch": 0.06, "learning_rate": 0.0002906371749775131, "loss": 0.0329, "step": 24080 }, { "epoch": 0.06, "learning_rate": 0.0002906332867611417, "loss": 0.034, "step": 24090 }, { "epoch": 0.06, "learning_rate": 0.0002906293985447702, "loss": 0.0433, "step": 24100 }, { "epoch": 0.06, "learning_rate": 0.0002906255103283987, "loss": 0.0386, "step": 24110 }, { "epoch": 0.06, "learning_rate": 0.0002906216221120273, "loss": 0.0353, "step": 24120 }, { "epoch": 0.06, "learning_rate": 0.0002906177338956558, "loss": 0.0318, "step": 24130 }, { "epoch": 0.06, "learning_rate": 0.0002906138456792843, "loss": 0.0364, "step": 24140 }, { "epoch": 0.06, "learning_rate": 0.0002906099574629129, "loss": 0.0332, "step": 24150 }, { "epoch": 0.06, "learning_rate": 0.0002906060692465414, "loss": 0.0358, "step": 24160 }, { "epoch": 0.06, "learning_rate": 0.00029060218103016996, "loss": 0.0386, "step": 24170 }, { "epoch": 0.06, "learning_rate": 0.0002905982928137985, "loss": 0.0343, "step": 24180 }, { "epoch": 0.06, "learning_rate": 0.000290594404597427, "loss": 0.0343, "step": 24190 }, { "epoch": 0.06, "learning_rate": 0.00029059051638105556, "loss": 0.0414, "step": 24200 }, { "epoch": 0.06, "learning_rate": 0.00029058662816468407, "loss": 0.0352, "step": 24210 }, { "epoch": 0.06, "learning_rate": 0.00029058273994831264, "loss": 0.0368, "step": 24220 }, { "epoch": 0.06, "learning_rate": 0.00029057885173194116, "loss": 0.0334, "step": 24230 }, { "epoch": 0.06, "learning_rate": 0.0002905749635155697, "loss": 0.0373, "step": 24240 }, { "epoch": 0.06, "learning_rate": 0.00029057107529919824, "loss": 0.0297, "step": 24250 }, { "epoch": 0.06, "learning_rate": 0.00029056718708282675, "loss": 0.039, "step": 24260 }, { "epoch": 0.06, "learning_rate": 0.00029056329886645527, "loss": 0.0354, "step": 24270 }, { "epoch": 0.06, "learning_rate": 0.00029055941065008384, "loss": 0.0384, "step": 24280 }, { "epoch": 0.06, "learning_rate": 0.00029055552243371235, "loss": 0.0384, "step": 24290 }, { "epoch": 0.06, "learning_rate": 0.0002905516342173409, "loss": 0.0395, "step": 24300 }, { "epoch": 0.06, "learning_rate": 0.00029054774600096943, "loss": 0.0397, "step": 24310 }, { "epoch": 0.06, "learning_rate": 0.00029054385778459795, "loss": 0.0343, "step": 24320 }, { "epoch": 0.06, "learning_rate": 0.0002905399695682265, "loss": 0.0393, "step": 24330 }, { "epoch": 0.06, "learning_rate": 0.00029053608135185503, "loss": 0.039, "step": 24340 }, { "epoch": 0.06, "learning_rate": 0.00029053219313548355, "loss": 0.0343, "step": 24350 }, { "epoch": 0.06, "learning_rate": 0.0002905283049191121, "loss": 0.0327, "step": 24360 }, { "epoch": 0.06, "learning_rate": 0.0002905244167027407, "loss": 0.0349, "step": 24370 }, { "epoch": 0.06, "learning_rate": 0.0002905205284863692, "loss": 0.034, "step": 24380 }, { "epoch": 0.06, "learning_rate": 0.0002905166402699977, "loss": 0.0361, "step": 24390 }, { "epoch": 0.06, "learning_rate": 0.00029051275205362623, "loss": 0.0444, "step": 24400 }, { "epoch": 0.06, "learning_rate": 0.0002905088638372548, "loss": 0.036, "step": 24410 }, { "epoch": 0.06, "learning_rate": 0.0002905049756208833, "loss": 0.0334, "step": 24420 }, { "epoch": 0.06, "learning_rate": 0.0002905010874045119, "loss": 0.0348, "step": 24430 }, { "epoch": 0.06, "learning_rate": 0.0002904971991881404, "loss": 0.0389, "step": 24440 }, { "epoch": 0.06, "learning_rate": 0.00029049331097176896, "loss": 0.0367, "step": 24450 }, { "epoch": 0.06, "learning_rate": 0.0002904894227553975, "loss": 0.0363, "step": 24460 }, { "epoch": 0.06, "learning_rate": 0.000290485534539026, "loss": 0.0428, "step": 24470 }, { "epoch": 0.06, "learning_rate": 0.0002904816463226545, "loss": 0.0314, "step": 24480 }, { "epoch": 0.06, "learning_rate": 0.0002904777581062831, "loss": 0.0357, "step": 24490 }, { "epoch": 0.06, "learning_rate": 0.0002904738698899116, "loss": 0.0733, "step": 24500 }, { "epoch": 0.06, "learning_rate": 0.00029046998167354016, "loss": 0.0377, "step": 24510 }, { "epoch": 0.06, "learning_rate": 0.0002904660934571687, "loss": 0.0396, "step": 24520 }, { "epoch": 0.06, "learning_rate": 0.00029046220524079724, "loss": 0.0404, "step": 24530 }, { "epoch": 0.06, "learning_rate": 0.00029045831702442576, "loss": 0.0347, "step": 24540 }, { "epoch": 0.06, "learning_rate": 0.00029045442880805427, "loss": 0.0387, "step": 24550 }, { "epoch": 0.06, "learning_rate": 0.0002904505405916828, "loss": 0.0359, "step": 24560 }, { "epoch": 0.06, "learning_rate": 0.00029044665237531135, "loss": 0.0341, "step": 24570 }, { "epoch": 0.06, "learning_rate": 0.0002904427641589399, "loss": 0.035, "step": 24580 }, { "epoch": 0.06, "learning_rate": 0.00029043887594256844, "loss": 0.0327, "step": 24590 }, { "epoch": 0.06, "learning_rate": 0.00029043498772619695, "loss": 0.0543, "step": 24600 }, { "epoch": 0.06, "learning_rate": 0.00029043109950982547, "loss": 0.0431, "step": 24610 }, { "epoch": 0.06, "learning_rate": 0.00029042721129345404, "loss": 0.0408, "step": 24620 }, { "epoch": 0.06, "learning_rate": 0.00029042332307708255, "loss": 0.0399, "step": 24630 }, { "epoch": 0.06, "learning_rate": 0.0002904194348607111, "loss": 0.0351, "step": 24640 }, { "epoch": 0.06, "learning_rate": 0.00029041554664433963, "loss": 0.0339, "step": 24650 }, { "epoch": 0.06, "learning_rate": 0.0002904116584279682, "loss": 0.0366, "step": 24660 }, { "epoch": 0.06, "learning_rate": 0.0002904077702115967, "loss": 0.037, "step": 24670 }, { "epoch": 0.06, "learning_rate": 0.00029040388199522523, "loss": 0.0321, "step": 24680 }, { "epoch": 0.06, "learning_rate": 0.00029039999377885375, "loss": 0.0378, "step": 24690 }, { "epoch": 0.06, "learning_rate": 0.0002903961055624823, "loss": 0.0398, "step": 24700 }, { "epoch": 0.06, "learning_rate": 0.00029039221734611083, "loss": 0.0322, "step": 24710 }, { "epoch": 0.06, "learning_rate": 0.0002903883291297394, "loss": 0.0359, "step": 24720 }, { "epoch": 0.06, "learning_rate": 0.0002903844409133679, "loss": 0.043, "step": 24730 }, { "epoch": 0.06, "learning_rate": 0.0002903805526969965, "loss": 0.0356, "step": 24740 }, { "epoch": 0.06, "learning_rate": 0.000290376664480625, "loss": 0.0279, "step": 24750 }, { "epoch": 0.06, "learning_rate": 0.0002903727762642535, "loss": 0.0325, "step": 24760 }, { "epoch": 0.06, "learning_rate": 0.0002903688880478821, "loss": 0.0365, "step": 24770 }, { "epoch": 0.06, "learning_rate": 0.0002903649998315106, "loss": 0.027, "step": 24780 }, { "epoch": 0.06, "learning_rate": 0.00029036111161513916, "loss": 0.031, "step": 24790 }, { "epoch": 0.06, "learning_rate": 0.0002903572233987677, "loss": 0.0348, "step": 24800 }, { "epoch": 0.06, "learning_rate": 0.0002903533351823962, "loss": 0.0312, "step": 24810 }, { "epoch": 0.06, "learning_rate": 0.0002903494469660247, "loss": 0.038, "step": 24820 }, { "epoch": 0.06, "learning_rate": 0.0002903455587496533, "loss": 0.0326, "step": 24830 }, { "epoch": 0.06, "learning_rate": 0.0002903416705332818, "loss": 0.0385, "step": 24840 }, { "epoch": 0.06, "learning_rate": 0.00029033778231691036, "loss": 0.0322, "step": 24850 }, { "epoch": 0.06, "learning_rate": 0.00029033389410053887, "loss": 0.0375, "step": 24860 }, { "epoch": 0.06, "learning_rate": 0.00029033000588416744, "loss": 0.0401, "step": 24870 }, { "epoch": 0.06, "learning_rate": 0.00029032611766779596, "loss": 0.0332, "step": 24880 }, { "epoch": 0.06, "learning_rate": 0.00029032222945142447, "loss": 0.0376, "step": 24890 }, { "epoch": 0.06, "learning_rate": 0.000290318341235053, "loss": 0.0359, "step": 24900 }, { "epoch": 0.06, "learning_rate": 0.00029031445301868155, "loss": 0.0294, "step": 24910 }, { "epoch": 0.06, "learning_rate": 0.0002903105648023101, "loss": 0.0352, "step": 24920 }, { "epoch": 0.06, "learning_rate": 0.00029030667658593864, "loss": 0.0338, "step": 24930 }, { "epoch": 0.06, "learning_rate": 0.00029030278836956715, "loss": 0.0333, "step": 24940 }, { "epoch": 0.06, "learning_rate": 0.0002902989001531957, "loss": 0.0507, "step": 24950 }, { "epoch": 0.06, "learning_rate": 0.00029029501193682423, "loss": 0.0395, "step": 24960 }, { "epoch": 0.06, "learning_rate": 0.00029029112372045275, "loss": 0.0346, "step": 24970 }, { "epoch": 0.06, "learning_rate": 0.0002902872355040813, "loss": 0.0448, "step": 24980 }, { "epoch": 0.06, "learning_rate": 0.00029028334728770983, "loss": 0.0373, "step": 24990 }, { "epoch": 0.06, "learning_rate": 0.0002902794590713384, "loss": 0.0422, "step": 25000 }, { "epoch": 0.06, "eval_cer": 0.8817572721636008, "eval_loss": 0.02701452560722828, "eval_runtime": 107.7133, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 25000 }, { "epoch": 0.06, "learning_rate": 0.0002902755708549669, "loss": 0.0373, "step": 25010 }, { "epoch": 0.06, "learning_rate": 0.00029027168263859543, "loss": 0.0321, "step": 25020 }, { "epoch": 0.06, "learning_rate": 0.000290267794422224, "loss": 0.0294, "step": 25030 }, { "epoch": 0.06, "learning_rate": 0.0002902639062058525, "loss": 0.0417, "step": 25040 }, { "epoch": 0.06, "learning_rate": 0.00029026001798948103, "loss": 0.0475, "step": 25050 }, { "epoch": 0.06, "learning_rate": 0.0002902561297731096, "loss": 0.0352, "step": 25060 }, { "epoch": 0.06, "learning_rate": 0.0002902522415567381, "loss": 0.0366, "step": 25070 }, { "epoch": 0.07, "learning_rate": 0.0002902483533403667, "loss": 0.0311, "step": 25080 }, { "epoch": 0.07, "learning_rate": 0.0002902444651239952, "loss": 0.0345, "step": 25090 }, { "epoch": 0.07, "learning_rate": 0.0002902405769076237, "loss": 0.0367, "step": 25100 }, { "epoch": 0.07, "learning_rate": 0.0002902366886912522, "loss": 0.0324, "step": 25110 }, { "epoch": 0.07, "learning_rate": 0.0002902328004748808, "loss": 0.0297, "step": 25120 }, { "epoch": 0.07, "learning_rate": 0.00029022891225850936, "loss": 0.0319, "step": 25130 }, { "epoch": 0.07, "learning_rate": 0.0002902250240421379, "loss": 0.0395, "step": 25140 }, { "epoch": 0.07, "learning_rate": 0.0002902211358257664, "loss": 0.0356, "step": 25150 }, { "epoch": 0.07, "learning_rate": 0.00029021724760939496, "loss": 0.0357, "step": 25160 }, { "epoch": 0.07, "learning_rate": 0.0002902133593930235, "loss": 0.0358, "step": 25170 }, { "epoch": 0.07, "learning_rate": 0.000290209471176652, "loss": 0.0391, "step": 25180 }, { "epoch": 0.07, "learning_rate": 0.00029020558296028056, "loss": 0.0336, "step": 25190 }, { "epoch": 0.07, "learning_rate": 0.00029020169474390907, "loss": 0.0365, "step": 25200 }, { "epoch": 0.07, "learning_rate": 0.00029019780652753764, "loss": 0.0317, "step": 25210 }, { "epoch": 0.07, "learning_rate": 0.00029019391831116615, "loss": 0.032, "step": 25220 }, { "epoch": 0.07, "learning_rate": 0.00029019003009479467, "loss": 0.0358, "step": 25230 }, { "epoch": 0.07, "learning_rate": 0.00029018614187842324, "loss": 0.0365, "step": 25240 }, { "epoch": 0.07, "learning_rate": 0.00029018225366205175, "loss": 0.0332, "step": 25250 }, { "epoch": 0.07, "learning_rate": 0.00029017836544568027, "loss": 0.0307, "step": 25260 }, { "epoch": 0.07, "learning_rate": 0.00029017447722930884, "loss": 0.0353, "step": 25270 }, { "epoch": 0.07, "learning_rate": 0.0002901705890129374, "loss": 0.0405, "step": 25280 }, { "epoch": 0.07, "learning_rate": 0.0002901667007965659, "loss": 0.0326, "step": 25290 }, { "epoch": 0.07, "learning_rate": 0.00029016281258019443, "loss": 0.0387, "step": 25300 }, { "epoch": 0.07, "learning_rate": 0.00029015892436382295, "loss": 0.0313, "step": 25310 }, { "epoch": 0.07, "learning_rate": 0.0002901550361474515, "loss": 0.0332, "step": 25320 }, { "epoch": 0.07, "learning_rate": 0.00029015114793108003, "loss": 0.0324, "step": 25330 }, { "epoch": 0.07, "learning_rate": 0.0002901472597147086, "loss": 0.0318, "step": 25340 }, { "epoch": 0.07, "learning_rate": 0.0002901433714983371, "loss": 0.0352, "step": 25350 }, { "epoch": 0.07, "learning_rate": 0.00029013948328196563, "loss": 0.0319, "step": 25360 }, { "epoch": 0.07, "learning_rate": 0.0002901355950655942, "loss": 0.0372, "step": 25370 }, { "epoch": 0.07, "learning_rate": 0.0002901317068492227, "loss": 0.0371, "step": 25380 }, { "epoch": 0.07, "learning_rate": 0.00029012781863285123, "loss": 0.034, "step": 25390 }, { "epoch": 0.07, "learning_rate": 0.0002901239304164798, "loss": 0.0368, "step": 25400 }, { "epoch": 0.07, "learning_rate": 0.00029012004220010836, "loss": 0.0325, "step": 25410 }, { "epoch": 0.07, "learning_rate": 0.0002901161539837369, "loss": 0.0379, "step": 25420 }, { "epoch": 0.07, "learning_rate": 0.0002901122657673654, "loss": 0.0327, "step": 25430 }, { "epoch": 0.07, "learning_rate": 0.0002901083775509939, "loss": 0.0344, "step": 25440 }, { "epoch": 0.07, "learning_rate": 0.0002901044893346225, "loss": 0.0385, "step": 25450 }, { "epoch": 0.07, "learning_rate": 0.000290100601118251, "loss": 0.034, "step": 25460 }, { "epoch": 0.07, "learning_rate": 0.00029009671290187956, "loss": 0.0345, "step": 25470 }, { "epoch": 0.07, "learning_rate": 0.0002900928246855081, "loss": 0.0333, "step": 25480 }, { "epoch": 0.07, "learning_rate": 0.00029008893646913664, "loss": 0.0377, "step": 25490 }, { "epoch": 0.07, "learning_rate": 0.00029008504825276516, "loss": 0.0362, "step": 25500 }, { "epoch": 0.07, "learning_rate": 0.00029008116003639367, "loss": 0.0311, "step": 25510 }, { "epoch": 0.07, "learning_rate": 0.0002900772718200222, "loss": 0.0361, "step": 25520 }, { "epoch": 0.07, "learning_rate": 0.00029007338360365076, "loss": 0.0378, "step": 25530 }, { "epoch": 0.07, "learning_rate": 0.00029006949538727927, "loss": 0.036, "step": 25540 }, { "epoch": 0.07, "learning_rate": 0.00029006560717090784, "loss": 0.0353, "step": 25550 }, { "epoch": 0.07, "learning_rate": 0.00029006171895453635, "loss": 0.0397, "step": 25560 }, { "epoch": 0.07, "learning_rate": 0.00029005783073816487, "loss": 0.0317, "step": 25570 }, { "epoch": 0.07, "learning_rate": 0.00029005394252179344, "loss": 0.0372, "step": 25580 }, { "epoch": 0.07, "learning_rate": 0.00029005005430542195, "loss": 0.0342, "step": 25590 }, { "epoch": 0.07, "learning_rate": 0.00029004616608905047, "loss": 0.043, "step": 25600 }, { "epoch": 0.07, "learning_rate": 0.00029004227787267903, "loss": 0.0406, "step": 25610 }, { "epoch": 0.07, "learning_rate": 0.0002900383896563076, "loss": 0.0318, "step": 25620 }, { "epoch": 0.07, "learning_rate": 0.0002900345014399361, "loss": 0.0329, "step": 25630 }, { "epoch": 0.07, "learning_rate": 0.00029003061322356463, "loss": 0.0394, "step": 25640 }, { "epoch": 0.07, "learning_rate": 0.00029002672500719315, "loss": 0.0391, "step": 25650 }, { "epoch": 0.07, "learning_rate": 0.0002900228367908217, "loss": 0.0311, "step": 25660 }, { "epoch": 0.07, "learning_rate": 0.00029001894857445023, "loss": 0.0319, "step": 25670 }, { "epoch": 0.07, "learning_rate": 0.0002900150603580788, "loss": 0.0367, "step": 25680 }, { "epoch": 0.07, "learning_rate": 0.0002900111721417073, "loss": 0.0434, "step": 25690 }, { "epoch": 0.07, "learning_rate": 0.0002900072839253359, "loss": 0.0338, "step": 25700 }, { "epoch": 0.07, "learning_rate": 0.0002900033957089644, "loss": 0.0317, "step": 25710 }, { "epoch": 0.07, "learning_rate": 0.0002899995074925929, "loss": 0.035, "step": 25720 }, { "epoch": 0.07, "learning_rate": 0.0002899956192762214, "loss": 0.0325, "step": 25730 }, { "epoch": 0.07, "learning_rate": 0.00028999173105985, "loss": 0.0321, "step": 25740 }, { "epoch": 0.07, "learning_rate": 0.0002899878428434785, "loss": 0.033, "step": 25750 }, { "epoch": 0.07, "learning_rate": 0.0002899839546271071, "loss": 0.0314, "step": 25760 }, { "epoch": 0.07, "learning_rate": 0.0002899800664107356, "loss": 0.0327, "step": 25770 }, { "epoch": 0.07, "learning_rate": 0.00028997617819436416, "loss": 0.0327, "step": 25780 }, { "epoch": 0.07, "learning_rate": 0.0002899722899779927, "loss": 0.0316, "step": 25790 }, { "epoch": 0.07, "learning_rate": 0.0002899684017616212, "loss": 0.0346, "step": 25800 }, { "epoch": 0.07, "learning_rate": 0.00028996451354524976, "loss": 0.0316, "step": 25810 }, { "epoch": 0.07, "learning_rate": 0.0002899606253288783, "loss": 0.0307, "step": 25820 }, { "epoch": 0.07, "learning_rate": 0.00028995673711250684, "loss": 0.0454, "step": 25830 }, { "epoch": 0.07, "learning_rate": 0.00028995284889613536, "loss": 0.0352, "step": 25840 }, { "epoch": 0.07, "learning_rate": 0.00028994896067976387, "loss": 0.0362, "step": 25850 }, { "epoch": 0.07, "learning_rate": 0.0002899450724633924, "loss": 0.0352, "step": 25860 }, { "epoch": 0.07, "learning_rate": 0.00028994118424702095, "loss": 0.0371, "step": 25870 }, { "epoch": 0.07, "learning_rate": 0.00028993729603064947, "loss": 0.0364, "step": 25880 }, { "epoch": 0.07, "learning_rate": 0.00028993340781427804, "loss": 0.0386, "step": 25890 }, { "epoch": 0.07, "learning_rate": 0.00028992951959790655, "loss": 0.0342, "step": 25900 }, { "epoch": 0.07, "learning_rate": 0.0002899256313815351, "loss": 0.0301, "step": 25910 }, { "epoch": 0.07, "learning_rate": 0.00028992174316516364, "loss": 0.0284, "step": 25920 }, { "epoch": 0.07, "learning_rate": 0.00028991785494879215, "loss": 0.0371, "step": 25930 }, { "epoch": 0.07, "learning_rate": 0.00028991396673242066, "loss": 0.0315, "step": 25940 }, { "epoch": 0.07, "learning_rate": 0.00028991007851604923, "loss": 0.0365, "step": 25950 }, { "epoch": 0.07, "learning_rate": 0.0002899061902996778, "loss": 0.0318, "step": 25960 }, { "epoch": 0.07, "learning_rate": 0.0002899023020833063, "loss": 0.0324, "step": 25970 }, { "epoch": 0.07, "learning_rate": 0.00028989841386693483, "loss": 0.0333, "step": 25980 }, { "epoch": 0.07, "learning_rate": 0.0002898945256505634, "loss": 0.0352, "step": 25990 }, { "epoch": 0.07, "learning_rate": 0.0002898906374341919, "loss": 0.0374, "step": 26000 }, { "epoch": 0.07, "eval_cer": 0.881813257640968, "eval_loss": 0.026022659614682198, "eval_runtime": 107.6573, "eval_samples_per_second": 18.577, "eval_steps_per_second": 4.644, "step": 26000 }, { "epoch": 0.07, "learning_rate": 0.00028988674921782043, "loss": 0.035, "step": 26010 }, { "epoch": 0.07, "learning_rate": 0.000289882861001449, "loss": 0.0385, "step": 26020 }, { "epoch": 0.07, "learning_rate": 0.0002898789727850775, "loss": 0.0352, "step": 26030 }, { "epoch": 0.07, "learning_rate": 0.0002898750845687061, "loss": 0.0372, "step": 26040 }, { "epoch": 0.07, "learning_rate": 0.0002898711963523346, "loss": 0.035, "step": 26050 }, { "epoch": 0.07, "learning_rate": 0.0002898673081359631, "loss": 0.0335, "step": 26060 }, { "epoch": 0.07, "learning_rate": 0.0002898634199195916, "loss": 0.039, "step": 26070 }, { "epoch": 0.07, "learning_rate": 0.0002898595317032202, "loss": 0.0349, "step": 26080 }, { "epoch": 0.07, "learning_rate": 0.0002898556434868487, "loss": 0.0357, "step": 26090 }, { "epoch": 0.07, "learning_rate": 0.0002898517552704773, "loss": 0.0339, "step": 26100 }, { "epoch": 0.07, "learning_rate": 0.0002898478670541058, "loss": 0.0368, "step": 26110 }, { "epoch": 0.07, "learning_rate": 0.00028984397883773436, "loss": 0.0325, "step": 26120 }, { "epoch": 0.07, "learning_rate": 0.0002898400906213629, "loss": 0.0362, "step": 26130 }, { "epoch": 0.07, "learning_rate": 0.0002898362024049914, "loss": 0.0374, "step": 26140 }, { "epoch": 0.07, "learning_rate": 0.0002898323141886199, "loss": 0.0433, "step": 26150 }, { "epoch": 0.07, "learning_rate": 0.00028982842597224847, "loss": 0.0362, "step": 26160 }, { "epoch": 0.07, "learning_rate": 0.00028982453775587704, "loss": 0.0322, "step": 26170 }, { "epoch": 0.07, "learning_rate": 0.00028982064953950556, "loss": 0.038, "step": 26180 }, { "epoch": 0.07, "learning_rate": 0.00028981676132313407, "loss": 0.0332, "step": 26190 }, { "epoch": 0.07, "learning_rate": 0.00028981287310676264, "loss": 0.0311, "step": 26200 }, { "epoch": 0.07, "learning_rate": 0.00028980898489039115, "loss": 0.0396, "step": 26210 }, { "epoch": 0.07, "learning_rate": 0.00028980509667401967, "loss": 0.0351, "step": 26220 }, { "epoch": 0.07, "learning_rate": 0.00028980120845764824, "loss": 0.0349, "step": 26230 }, { "epoch": 0.07, "learning_rate": 0.00028979732024127675, "loss": 0.0309, "step": 26240 }, { "epoch": 0.07, "learning_rate": 0.0002897934320249053, "loss": 0.0354, "step": 26250 }, { "epoch": 0.07, "learning_rate": 0.00028978954380853383, "loss": 0.0324, "step": 26260 }, { "epoch": 0.07, "learning_rate": 0.00028978565559216235, "loss": 0.0281, "step": 26270 }, { "epoch": 0.07, "learning_rate": 0.0002897817673757909, "loss": 0.0306, "step": 26280 }, { "epoch": 0.07, "learning_rate": 0.00028977787915941943, "loss": 0.0299, "step": 26290 }, { "epoch": 0.07, "learning_rate": 0.00028977399094304795, "loss": 0.0325, "step": 26300 }, { "epoch": 0.07, "learning_rate": 0.0002897701027266765, "loss": 0.0416, "step": 26310 }, { "epoch": 0.07, "learning_rate": 0.00028976621451030503, "loss": 0.0288, "step": 26320 }, { "epoch": 0.07, "learning_rate": 0.0002897623262939336, "loss": 0.0392, "step": 26330 }, { "epoch": 0.07, "learning_rate": 0.0002897584380775621, "loss": 0.0374, "step": 26340 }, { "epoch": 0.07, "learning_rate": 0.00028975454986119063, "loss": 0.0349, "step": 26350 }, { "epoch": 0.07, "learning_rate": 0.0002897506616448192, "loss": 0.0373, "step": 26360 }, { "epoch": 0.07, "learning_rate": 0.0002897467734284477, "loss": 0.0336, "step": 26370 }, { "epoch": 0.07, "learning_rate": 0.0002897428852120763, "loss": 0.0351, "step": 26380 }, { "epoch": 0.07, "learning_rate": 0.0002897389969957048, "loss": 0.0354, "step": 26390 }, { "epoch": 0.07, "learning_rate": 0.0002897351087793333, "loss": 0.036, "step": 26400 }, { "epoch": 0.07, "learning_rate": 0.0002897312205629619, "loss": 0.0383, "step": 26410 }, { "epoch": 0.07, "learning_rate": 0.0002897273323465904, "loss": 0.0336, "step": 26420 }, { "epoch": 0.07, "learning_rate": 0.0002897234441302189, "loss": 0.0367, "step": 26430 }, { "epoch": 0.07, "learning_rate": 0.0002897195559138475, "loss": 0.0347, "step": 26440 }, { "epoch": 0.07, "learning_rate": 0.000289715667697476, "loss": 0.0349, "step": 26450 }, { "epoch": 0.07, "learning_rate": 0.00028971177948110456, "loss": 0.0411, "step": 26460 }, { "epoch": 0.07, "learning_rate": 0.0002897078912647331, "loss": 0.0333, "step": 26470 }, { "epoch": 0.07, "learning_rate": 0.0002897040030483616, "loss": 0.0306, "step": 26480 }, { "epoch": 0.07, "learning_rate": 0.00028970011483199016, "loss": 0.0342, "step": 26490 }, { "epoch": 0.07, "learning_rate": 0.00028969622661561867, "loss": 0.0316, "step": 26500 }, { "epoch": 0.07, "learning_rate": 0.00028969233839924724, "loss": 0.0351, "step": 26510 }, { "epoch": 0.07, "learning_rate": 0.00028968845018287575, "loss": 0.0394, "step": 26520 }, { "epoch": 0.07, "learning_rate": 0.0002896845619665043, "loss": 0.0353, "step": 26530 }, { "epoch": 0.07, "learning_rate": 0.00028968067375013284, "loss": 0.0306, "step": 26540 }, { "epoch": 0.07, "learning_rate": 0.00028967678553376135, "loss": 0.0342, "step": 26550 }, { "epoch": 0.07, "learning_rate": 0.00028967289731738987, "loss": 0.0328, "step": 26560 }, { "epoch": 0.07, "learning_rate": 0.00028966900910101844, "loss": 0.0311, "step": 26570 }, { "epoch": 0.07, "learning_rate": 0.00028966512088464695, "loss": 0.0351, "step": 26580 }, { "epoch": 0.07, "learning_rate": 0.0002896612326682755, "loss": 0.0317, "step": 26590 }, { "epoch": 0.07, "learning_rate": 0.00028965734445190403, "loss": 0.0341, "step": 26600 }, { "epoch": 0.07, "learning_rate": 0.00028965345623553255, "loss": 0.0319, "step": 26610 }, { "epoch": 0.07, "learning_rate": 0.0002896495680191611, "loss": 0.0304, "step": 26620 }, { "epoch": 0.07, "learning_rate": 0.00028964567980278963, "loss": 0.0272, "step": 26630 }, { "epoch": 0.07, "learning_rate": 0.00028964179158641815, "loss": 0.0341, "step": 26640 }, { "epoch": 0.07, "learning_rate": 0.0002896379033700467, "loss": 0.03, "step": 26650 }, { "epoch": 0.07, "learning_rate": 0.0002896340151536753, "loss": 0.0326, "step": 26660 }, { "epoch": 0.07, "learning_rate": 0.0002896301269373038, "loss": 0.0306, "step": 26670 }, { "epoch": 0.07, "learning_rate": 0.0002896262387209323, "loss": 0.0325, "step": 26680 }, { "epoch": 0.07, "learning_rate": 0.0002896223505045608, "loss": 0.0294, "step": 26690 }, { "epoch": 0.07, "learning_rate": 0.0002896184622881894, "loss": 0.0329, "step": 26700 }, { "epoch": 0.07, "learning_rate": 0.0002896145740718179, "loss": 0.0288, "step": 26710 }, { "epoch": 0.07, "learning_rate": 0.0002896106858554465, "loss": 0.0319, "step": 26720 }, { "epoch": 0.07, "learning_rate": 0.000289606797639075, "loss": 0.04, "step": 26730 }, { "epoch": 0.07, "learning_rate": 0.00028960290942270356, "loss": 0.0396, "step": 26740 }, { "epoch": 0.07, "learning_rate": 0.0002895990212063321, "loss": 0.0302, "step": 26750 }, { "epoch": 0.07, "learning_rate": 0.0002895951329899606, "loss": 0.0364, "step": 26760 }, { "epoch": 0.07, "learning_rate": 0.0002895912447735891, "loss": 0.0368, "step": 26770 }, { "epoch": 0.07, "learning_rate": 0.0002895873565572177, "loss": 0.0342, "step": 26780 }, { "epoch": 0.07, "learning_rate": 0.0002895834683408462, "loss": 0.0284, "step": 26790 }, { "epoch": 0.07, "learning_rate": 0.00028957958012447476, "loss": 0.0342, "step": 26800 }, { "epoch": 0.07, "learning_rate": 0.00028957569190810327, "loss": 0.0314, "step": 26810 }, { "epoch": 0.07, "learning_rate": 0.0002895718036917318, "loss": 0.0313, "step": 26820 }, { "epoch": 0.07, "learning_rate": 0.00028956791547536036, "loss": 0.0385, "step": 26830 }, { "epoch": 0.07, "learning_rate": 0.00028956402725898887, "loss": 0.0329, "step": 26840 }, { "epoch": 0.07, "learning_rate": 0.0002895601390426174, "loss": 0.0337, "step": 26850 }, { "epoch": 0.07, "learning_rate": 0.00028955625082624595, "loss": 0.0347, "step": 26860 }, { "epoch": 0.07, "learning_rate": 0.0002895523626098745, "loss": 0.0368, "step": 26870 }, { "epoch": 0.07, "learning_rate": 0.00028954847439350304, "loss": 0.0302, "step": 26880 }, { "epoch": 0.07, "learning_rate": 0.00028954458617713155, "loss": 0.0334, "step": 26890 }, { "epoch": 0.07, "learning_rate": 0.00028954069796076007, "loss": 0.037, "step": 26900 }, { "epoch": 0.07, "learning_rate": 0.00028953680974438863, "loss": 0.0365, "step": 26910 }, { "epoch": 0.07, "learning_rate": 0.00028953292152801715, "loss": 0.0287, "step": 26920 }, { "epoch": 0.07, "learning_rate": 0.0002895290333116457, "loss": 0.0257, "step": 26930 }, { "epoch": 0.07, "learning_rate": 0.00028952514509527423, "loss": 0.0266, "step": 26940 }, { "epoch": 0.07, "learning_rate": 0.0002895212568789028, "loss": 0.0342, "step": 26950 }, { "epoch": 0.07, "learning_rate": 0.0002895173686625313, "loss": 0.0419, "step": 26960 }, { "epoch": 0.07, "learning_rate": 0.00028951348044615983, "loss": 0.0388, "step": 26970 }, { "epoch": 0.07, "learning_rate": 0.00028950959222978834, "loss": 0.0325, "step": 26980 }, { "epoch": 0.07, "learning_rate": 0.0002895057040134169, "loss": 0.0393, "step": 26990 }, { "epoch": 0.07, "learning_rate": 0.0002895018157970455, "loss": 0.037, "step": 27000 }, { "epoch": 0.07, "eval_cer": 0.8818118580040337, "eval_loss": 0.02456413209438324, "eval_runtime": 107.6789, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 27000 }, { "epoch": 0.07, "learning_rate": 0.000289497927580674, "loss": 0.0335, "step": 27010 }, { "epoch": 0.07, "learning_rate": 0.0002894940393643025, "loss": 0.0275, "step": 27020 }, { "epoch": 0.07, "learning_rate": 0.0002894901511479311, "loss": 0.0362, "step": 27030 }, { "epoch": 0.07, "learning_rate": 0.0002894862629315596, "loss": 0.0328, "step": 27040 }, { "epoch": 0.07, "learning_rate": 0.0002894823747151881, "loss": 0.0327, "step": 27050 }, { "epoch": 0.07, "learning_rate": 0.0002894784864988167, "loss": 0.0287, "step": 27060 }, { "epoch": 0.07, "learning_rate": 0.0002894745982824452, "loss": 0.0298, "step": 27070 }, { "epoch": 0.07, "learning_rate": 0.00028947071006607376, "loss": 0.0335, "step": 27080 }, { "epoch": 0.07, "learning_rate": 0.0002894668218497023, "loss": 0.032, "step": 27090 }, { "epoch": 0.07, "learning_rate": 0.0002894629336333308, "loss": 0.0295, "step": 27100 }, { "epoch": 0.07, "learning_rate": 0.0002894590454169593, "loss": 0.0311, "step": 27110 }, { "epoch": 0.07, "learning_rate": 0.0002894551572005879, "loss": 0.0332, "step": 27120 }, { "epoch": 0.07, "learning_rate": 0.0002894512689842164, "loss": 0.0339, "step": 27130 }, { "epoch": 0.07, "learning_rate": 0.00028944738076784496, "loss": 0.0314, "step": 27140 }, { "epoch": 0.07, "learning_rate": 0.00028944349255147347, "loss": 0.0325, "step": 27150 }, { "epoch": 0.07, "learning_rate": 0.00028943960433510204, "loss": 0.0342, "step": 27160 }, { "epoch": 0.07, "learning_rate": 0.00028943571611873055, "loss": 0.0355, "step": 27170 }, { "epoch": 0.07, "learning_rate": 0.00028943182790235907, "loss": 0.0386, "step": 27180 }, { "epoch": 0.07, "learning_rate": 0.0002894279396859876, "loss": 0.0285, "step": 27190 }, { "epoch": 0.07, "learning_rate": 0.00028942405146961615, "loss": 0.0305, "step": 27200 }, { "epoch": 0.07, "learning_rate": 0.0002894201632532447, "loss": 0.0341, "step": 27210 }, { "epoch": 0.07, "learning_rate": 0.00028941627503687324, "loss": 0.0358, "step": 27220 }, { "epoch": 0.07, "learning_rate": 0.00028941238682050175, "loss": 0.0342, "step": 27230 }, { "epoch": 0.07, "learning_rate": 0.0002894084986041303, "loss": 0.0336, "step": 27240 }, { "epoch": 0.07, "learning_rate": 0.00028940461038775883, "loss": 0.0313, "step": 27250 }, { "epoch": 0.07, "learning_rate": 0.00028940072217138735, "loss": 0.0362, "step": 27260 }, { "epoch": 0.07, "learning_rate": 0.0002893968339550159, "loss": 0.035, "step": 27270 }, { "epoch": 0.07, "learning_rate": 0.00028939294573864443, "loss": 0.0319, "step": 27280 }, { "epoch": 0.07, "learning_rate": 0.000289389057522273, "loss": 0.0364, "step": 27290 }, { "epoch": 0.07, "learning_rate": 0.0002893851693059015, "loss": 0.0341, "step": 27300 }, { "epoch": 0.07, "learning_rate": 0.00028938128108953003, "loss": 0.0383, "step": 27310 }, { "epoch": 0.07, "learning_rate": 0.00028937739287315854, "loss": 0.0351, "step": 27320 }, { "epoch": 0.07, "learning_rate": 0.0002893735046567871, "loss": 0.0324, "step": 27330 }, { "epoch": 0.07, "learning_rate": 0.0002893696164404156, "loss": 0.0386, "step": 27340 }, { "epoch": 0.07, "learning_rate": 0.0002893657282240442, "loss": 0.0321, "step": 27350 }, { "epoch": 0.07, "learning_rate": 0.0002893618400076727, "loss": 0.035, "step": 27360 }, { "epoch": 0.07, "learning_rate": 0.0002893579517913013, "loss": 0.0381, "step": 27370 }, { "epoch": 0.07, "learning_rate": 0.0002893540635749298, "loss": 0.035, "step": 27380 }, { "epoch": 0.07, "learning_rate": 0.0002893501753585583, "loss": 0.0346, "step": 27390 }, { "epoch": 0.07, "learning_rate": 0.0002893462871421869, "loss": 0.0354, "step": 27400 }, { "epoch": 0.07, "learning_rate": 0.0002893423989258154, "loss": 0.0323, "step": 27410 }, { "epoch": 0.07, "learning_rate": 0.00028933851070944396, "loss": 0.0372, "step": 27420 }, { "epoch": 0.07, "learning_rate": 0.0002893346224930725, "loss": 0.0361, "step": 27430 }, { "epoch": 0.07, "learning_rate": 0.000289330734276701, "loss": 0.053, "step": 27440 }, { "epoch": 0.07, "learning_rate": 0.00028932684606032956, "loss": 0.032, "step": 27450 }, { "epoch": 0.07, "learning_rate": 0.00028932295784395807, "loss": 0.0357, "step": 27460 }, { "epoch": 0.07, "learning_rate": 0.0002893190696275866, "loss": 0.0399, "step": 27470 }, { "epoch": 0.07, "learning_rate": 0.00028931518141121516, "loss": 0.0398, "step": 27480 }, { "epoch": 0.07, "learning_rate": 0.00028931129319484367, "loss": 0.0398, "step": 27490 }, { "epoch": 0.07, "learning_rate": 0.00028930740497847224, "loss": 0.0303, "step": 27500 }, { "epoch": 0.07, "learning_rate": 0.00028930351676210075, "loss": 0.0415, "step": 27510 }, { "epoch": 0.07, "learning_rate": 0.00028929962854572927, "loss": 0.0326, "step": 27520 }, { "epoch": 0.07, "learning_rate": 0.00028929574032935784, "loss": 0.0299, "step": 27530 }, { "epoch": 0.07, "learning_rate": 0.00028929185211298635, "loss": 0.0301, "step": 27540 }, { "epoch": 0.07, "learning_rate": 0.0002892879638966149, "loss": 0.0317, "step": 27550 }, { "epoch": 0.07, "learning_rate": 0.00028928407568024343, "loss": 0.0326, "step": 27560 }, { "epoch": 0.07, "learning_rate": 0.00028928018746387195, "loss": 0.0353, "step": 27570 }, { "epoch": 0.07, "learning_rate": 0.0002892762992475005, "loss": 0.0322, "step": 27580 }, { "epoch": 0.07, "learning_rate": 0.00028927241103112903, "loss": 0.0308, "step": 27590 }, { "epoch": 0.07, "learning_rate": 0.00028926852281475755, "loss": 0.035, "step": 27600 }, { "epoch": 0.07, "learning_rate": 0.0002892646345983861, "loss": 0.0303, "step": 27610 }, { "epoch": 0.07, "learning_rate": 0.00028926074638201463, "loss": 0.0347, "step": 27620 }, { "epoch": 0.07, "learning_rate": 0.0002892568581656432, "loss": 0.0482, "step": 27630 }, { "epoch": 0.07, "learning_rate": 0.0002892529699492717, "loss": 0.0316, "step": 27640 }, { "epoch": 0.07, "learning_rate": 0.00028924908173290023, "loss": 0.0404, "step": 27650 }, { "epoch": 0.07, "learning_rate": 0.0002892451935165288, "loss": 0.0306, "step": 27660 }, { "epoch": 0.07, "learning_rate": 0.0002892413053001573, "loss": 0.0321, "step": 27670 }, { "epoch": 0.07, "learning_rate": 0.0002892374170837858, "loss": 0.032, "step": 27680 }, { "epoch": 0.07, "learning_rate": 0.0002892335288674144, "loss": 0.029, "step": 27690 }, { "epoch": 0.07, "learning_rate": 0.00028922964065104296, "loss": 0.0425, "step": 27700 }, { "epoch": 0.07, "learning_rate": 0.0002892257524346715, "loss": 0.0343, "step": 27710 }, { "epoch": 0.07, "learning_rate": 0.0002892218642183, "loss": 0.0358, "step": 27720 }, { "epoch": 0.07, "learning_rate": 0.0002892179760019285, "loss": 0.0361, "step": 27730 }, { "epoch": 0.07, "learning_rate": 0.0002892140877855571, "loss": 0.0378, "step": 27740 }, { "epoch": 0.07, "learning_rate": 0.0002892101995691856, "loss": 0.0409, "step": 27750 }, { "epoch": 0.07, "learning_rate": 0.00028920631135281416, "loss": 0.0355, "step": 27760 }, { "epoch": 0.07, "learning_rate": 0.0002892024231364427, "loss": 0.0429, "step": 27770 }, { "epoch": 0.07, "learning_rate": 0.00028919853492007124, "loss": 0.039, "step": 27780 }, { "epoch": 0.07, "learning_rate": 0.00028919464670369976, "loss": 0.0479, "step": 27790 }, { "epoch": 0.07, "learning_rate": 0.00028919075848732827, "loss": 0.0405, "step": 27800 }, { "epoch": 0.07, "learning_rate": 0.0002891868702709568, "loss": 0.0421, "step": 27810 }, { "epoch": 0.07, "learning_rate": 0.00028918298205458535, "loss": 0.037, "step": 27820 }, { "epoch": 0.07, "learning_rate": 0.00028917909383821387, "loss": 0.0369, "step": 27830 }, { "epoch": 0.07, "learning_rate": 0.00028917520562184244, "loss": 0.0393, "step": 27840 }, { "epoch": 0.07, "learning_rate": 0.00028917131740547095, "loss": 0.0407, "step": 27850 }, { "epoch": 0.07, "learning_rate": 0.00028916742918909947, "loss": 0.0313, "step": 27860 }, { "epoch": 0.07, "learning_rate": 0.00028916354097272804, "loss": 0.0363, "step": 27870 }, { "epoch": 0.07, "learning_rate": 0.00028915965275635655, "loss": 0.0338, "step": 27880 }, { "epoch": 0.07, "learning_rate": 0.00028915576453998506, "loss": 0.038, "step": 27890 }, { "epoch": 0.07, "learning_rate": 0.00028915187632361363, "loss": 0.0322, "step": 27900 }, { "epoch": 0.07, "learning_rate": 0.0002891479881072422, "loss": 0.0338, "step": 27910 }, { "epoch": 0.07, "learning_rate": 0.0002891440998908707, "loss": 0.032, "step": 27920 }, { "epoch": 0.07, "learning_rate": 0.00028914021167449923, "loss": 0.0371, "step": 27930 }, { "epoch": 0.07, "learning_rate": 0.00028913632345812775, "loss": 0.0339, "step": 27940 }, { "epoch": 0.07, "learning_rate": 0.0002891324352417563, "loss": 0.0333, "step": 27950 }, { "epoch": 0.07, "learning_rate": 0.00028912854702538483, "loss": 0.0331, "step": 27960 }, { "epoch": 0.07, "learning_rate": 0.0002891246588090134, "loss": 0.0361, "step": 27970 }, { "epoch": 0.07, "learning_rate": 0.0002891207705926419, "loss": 0.0316, "step": 27980 }, { "epoch": 0.07, "learning_rate": 0.0002891168823762705, "loss": 0.0386, "step": 27990 }, { "epoch": 0.07, "learning_rate": 0.000289112994159899, "loss": 0.0344, "step": 28000 }, { "epoch": 0.07, "eval_cer": 0.8817950623608236, "eval_loss": 0.024856723845005035, "eval_runtime": 107.5236, "eval_samples_per_second": 18.601, "eval_steps_per_second": 4.65, "step": 28000 }, { "epoch": 0.07, "learning_rate": 0.0002891091059435275, "loss": 0.0365, "step": 28010 }, { "epoch": 0.07, "learning_rate": 0.000289105217727156, "loss": 0.0353, "step": 28020 }, { "epoch": 0.07, "learning_rate": 0.0002891013295107846, "loss": 0.0339, "step": 28030 }, { "epoch": 0.07, "learning_rate": 0.0002890974412944131, "loss": 0.0346, "step": 28040 }, { "epoch": 0.07, "learning_rate": 0.0002890935530780417, "loss": 0.0321, "step": 28050 }, { "epoch": 0.07, "learning_rate": 0.0002890896648616702, "loss": 0.0319, "step": 28060 }, { "epoch": 0.07, "learning_rate": 0.0002890857766452987, "loss": 0.0321, "step": 28070 }, { "epoch": 0.07, "learning_rate": 0.0002890818884289273, "loss": 0.0357, "step": 28080 }, { "epoch": 0.07, "learning_rate": 0.0002890780002125558, "loss": 0.0356, "step": 28090 }, { "epoch": 0.07, "learning_rate": 0.00028907411199618436, "loss": 0.0343, "step": 28100 }, { "epoch": 0.07, "learning_rate": 0.00028907022377981287, "loss": 0.0389, "step": 28110 }, { "epoch": 0.07, "learning_rate": 0.00028906633556344144, "loss": 0.0303, "step": 28120 }, { "epoch": 0.07, "learning_rate": 0.00028906244734706996, "loss": 0.0359, "step": 28130 }, { "epoch": 0.07, "learning_rate": 0.00028905855913069847, "loss": 0.0319, "step": 28140 }, { "epoch": 0.07, "learning_rate": 0.000289054670914327, "loss": 0.0268, "step": 28150 }, { "epoch": 0.07, "learning_rate": 0.00028905078269795555, "loss": 0.0301, "step": 28160 }, { "epoch": 0.07, "learning_rate": 0.00028904689448158407, "loss": 0.0348, "step": 28170 }, { "epoch": 0.07, "learning_rate": 0.00028904300626521264, "loss": 0.0315, "step": 28180 }, { "epoch": 0.07, "learning_rate": 0.00028903911804884115, "loss": 0.0329, "step": 28190 }, { "epoch": 0.07, "learning_rate": 0.0002890352298324697, "loss": 0.0283, "step": 28200 }, { "epoch": 0.07, "learning_rate": 0.00028903134161609823, "loss": 0.0328, "step": 28210 }, { "epoch": 0.07, "learning_rate": 0.00028902745339972675, "loss": 0.0257, "step": 28220 }, { "epoch": 0.07, "learning_rate": 0.00028902356518335526, "loss": 0.0321, "step": 28230 }, { "epoch": 0.07, "learning_rate": 0.00028901967696698383, "loss": 0.0426, "step": 28240 }, { "epoch": 0.07, "learning_rate": 0.0002890157887506124, "loss": 0.0314, "step": 28250 }, { "epoch": 0.07, "learning_rate": 0.0002890119005342409, "loss": 0.0341, "step": 28260 }, { "epoch": 0.07, "learning_rate": 0.00028900801231786943, "loss": 0.0303, "step": 28270 }, { "epoch": 0.07, "learning_rate": 0.000289004124101498, "loss": 0.0337, "step": 28280 }, { "epoch": 0.07, "learning_rate": 0.0002890002358851265, "loss": 0.0356, "step": 28290 }, { "epoch": 0.07, "learning_rate": 0.00028899634766875503, "loss": 0.0282, "step": 28300 }, { "epoch": 0.07, "learning_rate": 0.0002889924594523836, "loss": 0.0354, "step": 28310 }, { "epoch": 0.07, "learning_rate": 0.0002889885712360121, "loss": 0.0336, "step": 28320 }, { "epoch": 0.07, "learning_rate": 0.0002889846830196407, "loss": 0.0272, "step": 28330 }, { "epoch": 0.07, "learning_rate": 0.0002889807948032692, "loss": 0.039, "step": 28340 }, { "epoch": 0.07, "learning_rate": 0.0002889769065868977, "loss": 0.0331, "step": 28350 }, { "epoch": 0.07, "learning_rate": 0.0002889730183705262, "loss": 0.0309, "step": 28360 }, { "epoch": 0.07, "learning_rate": 0.0002889691301541548, "loss": 0.0328, "step": 28370 }, { "epoch": 0.07, "learning_rate": 0.0002889652419377833, "loss": 0.0331, "step": 28380 }, { "epoch": 0.07, "learning_rate": 0.0002889613537214119, "loss": 0.0305, "step": 28390 }, { "epoch": 0.07, "learning_rate": 0.0002889574655050404, "loss": 0.0328, "step": 28400 }, { "epoch": 0.07, "learning_rate": 0.00028895357728866896, "loss": 0.0326, "step": 28410 }, { "epoch": 0.07, "learning_rate": 0.0002889496890722975, "loss": 0.0326, "step": 28420 }, { "epoch": 0.07, "learning_rate": 0.000288945800855926, "loss": 0.0333, "step": 28430 }, { "epoch": 0.07, "learning_rate": 0.0002889419126395545, "loss": 0.0292, "step": 28440 }, { "epoch": 0.07, "learning_rate": 0.00028893802442318307, "loss": 0.0374, "step": 28450 }, { "epoch": 0.07, "learning_rate": 0.00028893413620681164, "loss": 0.0346, "step": 28460 }, { "epoch": 0.07, "learning_rate": 0.00028893024799044015, "loss": 0.0338, "step": 28470 }, { "epoch": 0.07, "learning_rate": 0.00028892635977406867, "loss": 0.032, "step": 28480 }, { "epoch": 0.07, "learning_rate": 0.00028892247155769724, "loss": 0.0345, "step": 28490 }, { "epoch": 0.07, "learning_rate": 0.00028891858334132575, "loss": 0.0358, "step": 28500 }, { "epoch": 0.07, "learning_rate": 0.00028891469512495427, "loss": 0.0346, "step": 28510 }, { "epoch": 0.07, "learning_rate": 0.00028891080690858284, "loss": 0.0403, "step": 28520 }, { "epoch": 0.07, "learning_rate": 0.00028890691869221135, "loss": 0.0347, "step": 28530 }, { "epoch": 0.07, "learning_rate": 0.0002889030304758399, "loss": 0.0312, "step": 28540 }, { "epoch": 0.07, "learning_rate": 0.00028889914225946843, "loss": 0.0315, "step": 28550 }, { "epoch": 0.07, "learning_rate": 0.00028889525404309695, "loss": 0.0325, "step": 28560 }, { "epoch": 0.07, "learning_rate": 0.00028889136582672546, "loss": 0.0344, "step": 28570 }, { "epoch": 0.07, "learning_rate": 0.00028888747761035403, "loss": 0.0315, "step": 28580 }, { "epoch": 0.07, "learning_rate": 0.0002888835893939826, "loss": 0.0466, "step": 28590 }, { "epoch": 0.07, "learning_rate": 0.0002888797011776111, "loss": 0.0387, "step": 28600 }, { "epoch": 0.07, "learning_rate": 0.00028887581296123963, "loss": 0.03, "step": 28610 }, { "epoch": 0.07, "learning_rate": 0.0002888719247448682, "loss": 0.0335, "step": 28620 }, { "epoch": 0.07, "learning_rate": 0.0002888680365284967, "loss": 0.0349, "step": 28630 }, { "epoch": 0.07, "learning_rate": 0.0002888641483121252, "loss": 0.0327, "step": 28640 }, { "epoch": 0.07, "learning_rate": 0.0002888602600957538, "loss": 0.0487, "step": 28650 }, { "epoch": 0.07, "learning_rate": 0.0002888563718793823, "loss": 0.0422, "step": 28660 }, { "epoch": 0.07, "learning_rate": 0.0002888524836630109, "loss": 0.0338, "step": 28670 }, { "epoch": 0.07, "learning_rate": 0.0002888485954466394, "loss": 0.0331, "step": 28680 }, { "epoch": 0.07, "learning_rate": 0.0002888447072302679, "loss": 0.0352, "step": 28690 }, { "epoch": 0.07, "learning_rate": 0.0002888408190138965, "loss": 0.0318, "step": 28700 }, { "epoch": 0.07, "learning_rate": 0.000288836930797525, "loss": 0.0325, "step": 28710 }, { "epoch": 0.07, "learning_rate": 0.0002888330425811535, "loss": 0.0363, "step": 28720 }, { "epoch": 0.07, "learning_rate": 0.0002888291543647821, "loss": 0.0294, "step": 28730 }, { "epoch": 0.07, "learning_rate": 0.00028882526614841064, "loss": 0.0366, "step": 28740 }, { "epoch": 0.07, "learning_rate": 0.00028882137793203916, "loss": 0.0347, "step": 28750 }, { "epoch": 0.07, "learning_rate": 0.00028881748971566767, "loss": 0.0305, "step": 28760 }, { "epoch": 0.07, "learning_rate": 0.0002888136014992962, "loss": 0.0282, "step": 28770 }, { "epoch": 0.07, "learning_rate": 0.00028880971328292476, "loss": 0.0287, "step": 28780 }, { "epoch": 0.07, "learning_rate": 0.00028880582506655327, "loss": 0.029, "step": 28790 }, { "epoch": 0.07, "learning_rate": 0.00028880193685018184, "loss": 0.0328, "step": 28800 }, { "epoch": 0.07, "learning_rate": 0.00028879804863381035, "loss": 0.0293, "step": 28810 }, { "epoch": 0.07, "learning_rate": 0.00028879416041743887, "loss": 0.0347, "step": 28820 }, { "epoch": 0.07, "learning_rate": 0.00028879027220106744, "loss": 0.0318, "step": 28830 }, { "epoch": 0.07, "learning_rate": 0.00028878638398469595, "loss": 0.0332, "step": 28840 }, { "epoch": 0.07, "learning_rate": 0.00028878249576832447, "loss": 0.0395, "step": 28850 }, { "epoch": 0.07, "learning_rate": 0.00028877860755195303, "loss": 0.0373, "step": 28860 }, { "epoch": 0.07, "learning_rate": 0.00028877471933558155, "loss": 0.0273, "step": 28870 }, { "epoch": 0.07, "learning_rate": 0.0002887708311192101, "loss": 0.0367, "step": 28880 }, { "epoch": 0.07, "learning_rate": 0.00028876694290283863, "loss": 0.0304, "step": 28890 }, { "epoch": 0.07, "learning_rate": 0.00028876305468646715, "loss": 0.0342, "step": 28900 }, { "epoch": 0.07, "learning_rate": 0.0002887591664700957, "loss": 0.0293, "step": 28910 }, { "epoch": 0.07, "learning_rate": 0.00028875527825372423, "loss": 0.0299, "step": 28920 }, { "epoch": 0.07, "learning_rate": 0.00028875139003735274, "loss": 0.0288, "step": 28930 }, { "epoch": 0.08, "learning_rate": 0.0002887475018209813, "loss": 0.0382, "step": 28940 }, { "epoch": 0.08, "learning_rate": 0.0002887436136046099, "loss": 0.0306, "step": 28950 }, { "epoch": 0.08, "learning_rate": 0.0002887397253882384, "loss": 0.038, "step": 28960 }, { "epoch": 0.08, "learning_rate": 0.0002887358371718669, "loss": 0.0357, "step": 28970 }, { "epoch": 0.08, "learning_rate": 0.0002887319489554954, "loss": 0.0379, "step": 28980 }, { "epoch": 0.08, "learning_rate": 0.000288728060739124, "loss": 0.0357, "step": 28990 }, { "epoch": 0.08, "learning_rate": 0.0002887241725227525, "loss": 0.0386, "step": 29000 }, { "epoch": 0.08, "eval_cer": 0.8817614710744033, "eval_loss": 0.025074917823076248, "eval_runtime": 107.6332, "eval_samples_per_second": 18.582, "eval_steps_per_second": 4.645, "step": 29000 }, { "epoch": 0.08, "learning_rate": 0.0002887202843063811, "loss": 0.0372, "step": 29010 }, { "epoch": 0.08, "learning_rate": 0.0002887163960900096, "loss": 0.0475, "step": 29020 }, { "epoch": 0.08, "learning_rate": 0.0002887125078736381, "loss": 0.0303, "step": 29030 }, { "epoch": 0.08, "learning_rate": 0.0002887086196572667, "loss": 0.0469, "step": 29040 }, { "epoch": 0.08, "learning_rate": 0.0002887047314408952, "loss": 0.0362, "step": 29050 }, { "epoch": 0.08, "learning_rate": 0.0002887008432245237, "loss": 0.0339, "step": 29060 }, { "epoch": 0.08, "learning_rate": 0.0002886969550081523, "loss": 0.0362, "step": 29070 }, { "epoch": 0.08, "learning_rate": 0.0002886930667917808, "loss": 0.0383, "step": 29080 }, { "epoch": 0.08, "learning_rate": 0.00028868917857540936, "loss": 0.0317, "step": 29090 }, { "epoch": 0.08, "learning_rate": 0.00028868529035903787, "loss": 0.037, "step": 29100 }, { "epoch": 0.08, "learning_rate": 0.0002886814021426664, "loss": 0.0378, "step": 29110 }, { "epoch": 0.08, "learning_rate": 0.00028867751392629495, "loss": 0.032, "step": 29120 }, { "epoch": 0.08, "learning_rate": 0.00028867362570992347, "loss": 0.035, "step": 29130 }, { "epoch": 0.08, "learning_rate": 0.00028866973749355204, "loss": 0.0373, "step": 29140 }, { "epoch": 0.08, "learning_rate": 0.00028866584927718055, "loss": 0.0312, "step": 29150 }, { "epoch": 0.08, "learning_rate": 0.0002886619610608091, "loss": 0.0383, "step": 29160 }, { "epoch": 0.08, "learning_rate": 0.00028865807284443764, "loss": 0.0414, "step": 29170 }, { "epoch": 0.08, "learning_rate": 0.00028865418462806615, "loss": 0.0331, "step": 29180 }, { "epoch": 0.08, "learning_rate": 0.00028865029641169466, "loss": 0.0357, "step": 29190 }, { "epoch": 0.08, "learning_rate": 0.00028864640819532323, "loss": 0.0307, "step": 29200 }, { "epoch": 0.08, "learning_rate": 0.00028864251997895175, "loss": 0.0375, "step": 29210 }, { "epoch": 0.08, "learning_rate": 0.0002886386317625803, "loss": 0.0391, "step": 29220 }, { "epoch": 0.08, "learning_rate": 0.00028863474354620883, "loss": 0.0402, "step": 29230 }, { "epoch": 0.08, "learning_rate": 0.0002886308553298374, "loss": 0.0324, "step": 29240 }, { "epoch": 0.08, "learning_rate": 0.0002886269671134659, "loss": 0.034, "step": 29250 }, { "epoch": 0.08, "learning_rate": 0.00028862307889709443, "loss": 0.0355, "step": 29260 }, { "epoch": 0.08, "learning_rate": 0.00028861919068072294, "loss": 0.0317, "step": 29270 }, { "epoch": 0.08, "learning_rate": 0.0002886153024643515, "loss": 0.0336, "step": 29280 }, { "epoch": 0.08, "learning_rate": 0.0002886114142479801, "loss": 0.0366, "step": 29290 }, { "epoch": 0.08, "learning_rate": 0.0002886075260316086, "loss": 0.0272, "step": 29300 }, { "epoch": 0.08, "learning_rate": 0.0002886036378152371, "loss": 0.0328, "step": 29310 }, { "epoch": 0.08, "learning_rate": 0.0002885997495988656, "loss": 0.0319, "step": 29320 }, { "epoch": 0.08, "learning_rate": 0.0002885958613824942, "loss": 0.0321, "step": 29330 }, { "epoch": 0.08, "learning_rate": 0.0002885919731661227, "loss": 0.0425, "step": 29340 }, { "epoch": 0.08, "learning_rate": 0.0002885880849497513, "loss": 0.0501, "step": 29350 }, { "epoch": 0.08, "learning_rate": 0.0002885841967333798, "loss": 0.0415, "step": 29360 }, { "epoch": 0.08, "learning_rate": 0.00028858030851700836, "loss": 0.0321, "step": 29370 }, { "epoch": 0.08, "learning_rate": 0.0002885764203006369, "loss": 0.0336, "step": 29380 }, { "epoch": 0.08, "learning_rate": 0.0002885725320842654, "loss": 0.0342, "step": 29390 }, { "epoch": 0.08, "learning_rate": 0.0002885686438678939, "loss": 0.0331, "step": 29400 }, { "epoch": 0.08, "learning_rate": 0.00028856475565152247, "loss": 0.0329, "step": 29410 }, { "epoch": 0.08, "learning_rate": 0.000288560867435151, "loss": 0.0275, "step": 29420 }, { "epoch": 0.08, "learning_rate": 0.00028855697921877956, "loss": 0.031, "step": 29430 }, { "epoch": 0.08, "learning_rate": 0.00028855309100240807, "loss": 0.0302, "step": 29440 }, { "epoch": 0.08, "learning_rate": 0.00028854920278603664, "loss": 0.0327, "step": 29450 }, { "epoch": 0.08, "learning_rate": 0.00028854531456966515, "loss": 0.0299, "step": 29460 }, { "epoch": 0.08, "learning_rate": 0.00028854142635329367, "loss": 0.0373, "step": 29470 }, { "epoch": 0.08, "learning_rate": 0.0002885375381369222, "loss": 0.0286, "step": 29480 }, { "epoch": 0.08, "learning_rate": 0.00028853364992055075, "loss": 0.0327, "step": 29490 }, { "epoch": 0.08, "learning_rate": 0.0002885297617041793, "loss": 0.0321, "step": 29500 }, { "epoch": 0.08, "learning_rate": 0.00028852587348780783, "loss": 0.0366, "step": 29510 }, { "epoch": 0.08, "learning_rate": 0.00028852198527143635, "loss": 0.0285, "step": 29520 }, { "epoch": 0.08, "learning_rate": 0.00028851809705506486, "loss": 0.0406, "step": 29530 }, { "epoch": 0.08, "learning_rate": 0.00028851420883869343, "loss": 0.0319, "step": 29540 }, { "epoch": 0.08, "learning_rate": 0.00028851032062232195, "loss": 0.0315, "step": 29550 }, { "epoch": 0.08, "learning_rate": 0.0002885064324059505, "loss": 0.025, "step": 29560 }, { "epoch": 0.08, "learning_rate": 0.00028850254418957903, "loss": 0.0294, "step": 29570 }, { "epoch": 0.08, "learning_rate": 0.0002884986559732076, "loss": 0.0326, "step": 29580 }, { "epoch": 0.08, "learning_rate": 0.0002884947677568361, "loss": 0.0372, "step": 29590 }, { "epoch": 0.08, "learning_rate": 0.00028849087954046463, "loss": 0.0328, "step": 29600 }, { "epoch": 0.08, "learning_rate": 0.00028848699132409314, "loss": 0.0367, "step": 29610 }, { "epoch": 0.08, "learning_rate": 0.0002884831031077217, "loss": 0.0265, "step": 29620 }, { "epoch": 0.08, "learning_rate": 0.0002884792148913502, "loss": 0.0367, "step": 29630 }, { "epoch": 0.08, "learning_rate": 0.0002884753266749788, "loss": 0.0323, "step": 29640 }, { "epoch": 0.08, "learning_rate": 0.0002884714384586073, "loss": 0.0297, "step": 29650 }, { "epoch": 0.08, "learning_rate": 0.0002884675502422359, "loss": 0.0381, "step": 29660 }, { "epoch": 0.08, "learning_rate": 0.0002884636620258644, "loss": 0.0275, "step": 29670 }, { "epoch": 0.08, "learning_rate": 0.0002884597738094929, "loss": 0.0308, "step": 29680 }, { "epoch": 0.08, "learning_rate": 0.0002884558855931215, "loss": 0.035, "step": 29690 }, { "epoch": 0.08, "learning_rate": 0.00028845199737675, "loss": 0.0338, "step": 29700 }, { "epoch": 0.08, "learning_rate": 0.00028844810916037856, "loss": 0.0297, "step": 29710 }, { "epoch": 0.08, "learning_rate": 0.0002884442209440071, "loss": 0.0256, "step": 29720 }, { "epoch": 0.08, "learning_rate": 0.0002884403327276356, "loss": 0.0324, "step": 29730 }, { "epoch": 0.08, "learning_rate": 0.00028843644451126416, "loss": 0.0384, "step": 29740 }, { "epoch": 0.08, "learning_rate": 0.00028843255629489267, "loss": 0.0324, "step": 29750 }, { "epoch": 0.08, "learning_rate": 0.0002884286680785212, "loss": 0.0379, "step": 29760 }, { "epoch": 0.08, "learning_rate": 0.00028842477986214975, "loss": 0.0283, "step": 29770 }, { "epoch": 0.08, "learning_rate": 0.00028842089164577827, "loss": 0.0356, "step": 29780 }, { "epoch": 0.08, "learning_rate": 0.00028841700342940684, "loss": 0.0307, "step": 29790 }, { "epoch": 0.08, "learning_rate": 0.00028841311521303535, "loss": 0.0298, "step": 29800 }, { "epoch": 0.08, "learning_rate": 0.00028840922699666387, "loss": 0.0293, "step": 29810 }, { "epoch": 0.08, "learning_rate": 0.0002884053387802924, "loss": 0.0339, "step": 29820 }, { "epoch": 0.08, "learning_rate": 0.00028840145056392095, "loss": 0.0323, "step": 29830 }, { "epoch": 0.08, "learning_rate": 0.0002883975623475495, "loss": 0.0314, "step": 29840 }, { "epoch": 0.08, "learning_rate": 0.00028839367413117803, "loss": 0.0357, "step": 29850 }, { "epoch": 0.08, "learning_rate": 0.00028838978591480655, "loss": 0.0256, "step": 29860 }, { "epoch": 0.08, "learning_rate": 0.0002883858976984351, "loss": 0.0299, "step": 29870 }, { "epoch": 0.08, "learning_rate": 0.00028838200948206363, "loss": 0.0372, "step": 29880 }, { "epoch": 0.08, "learning_rate": 0.00028837812126569215, "loss": 0.0332, "step": 29890 }, { "epoch": 0.08, "learning_rate": 0.0002883742330493207, "loss": 0.0286, "step": 29900 }, { "epoch": 0.08, "learning_rate": 0.00028837034483294923, "loss": 0.0302, "step": 29910 }, { "epoch": 0.08, "learning_rate": 0.0002883664566165778, "loss": 0.0327, "step": 29920 }, { "epoch": 0.08, "learning_rate": 0.0002883625684002063, "loss": 0.0326, "step": 29930 }, { "epoch": 0.08, "learning_rate": 0.0002883586801838348, "loss": 0.0315, "step": 29940 }, { "epoch": 0.08, "learning_rate": 0.0002883547919674634, "loss": 0.0438, "step": 29950 }, { "epoch": 0.08, "learning_rate": 0.0002883509037510919, "loss": 0.0303, "step": 29960 }, { "epoch": 0.08, "learning_rate": 0.0002883470155347204, "loss": 0.0308, "step": 29970 }, { "epoch": 0.08, "learning_rate": 0.000288343127318349, "loss": 0.0305, "step": 29980 }, { "epoch": 0.08, "learning_rate": 0.00028833923910197756, "loss": 0.0316, "step": 29990 }, { "epoch": 0.08, "learning_rate": 0.0002883353508856061, "loss": 0.0343, "step": 30000 }, { "epoch": 0.08, "eval_cer": 0.8817922630869552, "eval_loss": 0.025351664051413536, "eval_runtime": 107.6228, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 30000 }, { "epoch": 0.08, "learning_rate": 0.0002883314626692346, "loss": 0.0313, "step": 30010 }, { "epoch": 0.08, "learning_rate": 0.0002883275744528631, "loss": 0.0321, "step": 30020 }, { "epoch": 0.08, "learning_rate": 0.0002883236862364916, "loss": 0.0361, "step": 30030 }, { "epoch": 0.08, "learning_rate": 0.0002883197980201202, "loss": 0.0415, "step": 30040 }, { "epoch": 0.08, "learning_rate": 0.00028831590980374876, "loss": 0.0308, "step": 30050 }, { "epoch": 0.08, "learning_rate": 0.00028831202158737727, "loss": 0.0352, "step": 30060 }, { "epoch": 0.08, "learning_rate": 0.0002883081333710058, "loss": 0.0298, "step": 30070 }, { "epoch": 0.08, "learning_rate": 0.00028830424515463436, "loss": 0.0322, "step": 30080 }, { "epoch": 0.08, "learning_rate": 0.00028830035693826287, "loss": 0.0335, "step": 30090 }, { "epoch": 0.08, "learning_rate": 0.0002882964687218914, "loss": 0.0322, "step": 30100 }, { "epoch": 0.08, "learning_rate": 0.00028829258050551995, "loss": 0.0349, "step": 30110 }, { "epoch": 0.08, "learning_rate": 0.00028828869228914847, "loss": 0.0306, "step": 30120 }, { "epoch": 0.08, "learning_rate": 0.00028828480407277704, "loss": 0.0318, "step": 30130 }, { "epoch": 0.08, "learning_rate": 0.00028828091585640555, "loss": 0.033, "step": 30140 }, { "epoch": 0.08, "learning_rate": 0.00028827702764003407, "loss": 0.031, "step": 30150 }, { "epoch": 0.08, "learning_rate": 0.00028827313942366263, "loss": 0.0318, "step": 30160 }, { "epoch": 0.08, "learning_rate": 0.00028826925120729115, "loss": 0.031, "step": 30170 }, { "epoch": 0.08, "learning_rate": 0.0002882653629909197, "loss": 0.0347, "step": 30180 }, { "epoch": 0.08, "learning_rate": 0.00028826147477454823, "loss": 0.0335, "step": 30190 }, { "epoch": 0.08, "learning_rate": 0.0002882575865581768, "loss": 0.033, "step": 30200 }, { "epoch": 0.08, "learning_rate": 0.0002882536983418053, "loss": 0.0303, "step": 30210 }, { "epoch": 0.08, "learning_rate": 0.00028824981012543383, "loss": 0.031, "step": 30220 }, { "epoch": 0.08, "learning_rate": 0.00028824592190906234, "loss": 0.0387, "step": 30230 }, { "epoch": 0.08, "learning_rate": 0.0002882420336926909, "loss": 0.0299, "step": 30240 }, { "epoch": 0.08, "learning_rate": 0.00028823814547631943, "loss": 0.034, "step": 30250 }, { "epoch": 0.08, "learning_rate": 0.000288234257259948, "loss": 0.0368, "step": 30260 }, { "epoch": 0.08, "learning_rate": 0.0002882303690435765, "loss": 0.0399, "step": 30270 }, { "epoch": 0.08, "learning_rate": 0.000288226480827205, "loss": 0.0332, "step": 30280 }, { "epoch": 0.08, "learning_rate": 0.0002882225926108336, "loss": 0.0335, "step": 30290 }, { "epoch": 0.08, "learning_rate": 0.0002882187043944621, "loss": 0.0334, "step": 30300 }, { "epoch": 0.08, "learning_rate": 0.0002882148161780906, "loss": 0.0371, "step": 30310 }, { "epoch": 0.08, "learning_rate": 0.0002882109279617192, "loss": 0.0328, "step": 30320 }, { "epoch": 0.08, "learning_rate": 0.00028820703974534776, "loss": 0.0317, "step": 30330 }, { "epoch": 0.08, "learning_rate": 0.0002882031515289763, "loss": 0.039, "step": 30340 }, { "epoch": 0.08, "learning_rate": 0.0002881992633126048, "loss": 0.0291, "step": 30350 }, { "epoch": 0.08, "learning_rate": 0.0002881953750962333, "loss": 0.0364, "step": 30360 }, { "epoch": 0.08, "learning_rate": 0.00028819148687986187, "loss": 0.0346, "step": 30370 }, { "epoch": 0.08, "learning_rate": 0.0002881875986634904, "loss": 0.0317, "step": 30380 }, { "epoch": 0.08, "learning_rate": 0.00028818371044711896, "loss": 0.0364, "step": 30390 }, { "epoch": 0.08, "learning_rate": 0.00028817982223074747, "loss": 0.0364, "step": 30400 }, { "epoch": 0.08, "learning_rate": 0.00028817593401437604, "loss": 0.0307, "step": 30410 }, { "epoch": 0.08, "learning_rate": 0.00028817204579800455, "loss": 0.0359, "step": 30420 }, { "epoch": 0.08, "learning_rate": 0.00028816815758163307, "loss": 0.0347, "step": 30430 }, { "epoch": 0.08, "learning_rate": 0.0002881642693652616, "loss": 0.0341, "step": 30440 }, { "epoch": 0.08, "learning_rate": 0.00028816038114889015, "loss": 0.0381, "step": 30450 }, { "epoch": 0.08, "learning_rate": 0.00028815649293251867, "loss": 0.0294, "step": 30460 }, { "epoch": 0.08, "learning_rate": 0.00028815260471614723, "loss": 0.0411, "step": 30470 }, { "epoch": 0.08, "learning_rate": 0.00028814871649977575, "loss": 0.033, "step": 30480 }, { "epoch": 0.08, "learning_rate": 0.0002881448282834043, "loss": 0.0317, "step": 30490 }, { "epoch": 0.08, "learning_rate": 0.00028814094006703283, "loss": 0.028, "step": 30500 }, { "epoch": 0.08, "learning_rate": 0.00028813705185066135, "loss": 0.0338, "step": 30510 }, { "epoch": 0.08, "learning_rate": 0.00028813316363428986, "loss": 0.0351, "step": 30520 }, { "epoch": 0.08, "learning_rate": 0.00028812927541791843, "loss": 0.028, "step": 30530 }, { "epoch": 0.08, "learning_rate": 0.000288125387201547, "loss": 0.0345, "step": 30540 }, { "epoch": 0.08, "learning_rate": 0.0002881214989851755, "loss": 0.0317, "step": 30550 }, { "epoch": 0.08, "learning_rate": 0.00028811761076880403, "loss": 0.0353, "step": 30560 }, { "epoch": 0.08, "learning_rate": 0.00028811372255243254, "loss": 0.031, "step": 30570 }, { "epoch": 0.08, "learning_rate": 0.0002881098343360611, "loss": 0.0313, "step": 30580 }, { "epoch": 0.08, "learning_rate": 0.0002881059461196896, "loss": 0.0326, "step": 30590 }, { "epoch": 0.08, "learning_rate": 0.0002881020579033182, "loss": 0.0322, "step": 30600 }, { "epoch": 0.08, "learning_rate": 0.0002880981696869467, "loss": 0.0293, "step": 30610 }, { "epoch": 0.08, "learning_rate": 0.0002880942814705753, "loss": 0.0309, "step": 30620 }, { "epoch": 0.08, "learning_rate": 0.0002880903932542038, "loss": 0.0354, "step": 30630 }, { "epoch": 0.08, "learning_rate": 0.0002880865050378323, "loss": 0.0312, "step": 30640 }, { "epoch": 0.08, "learning_rate": 0.0002880826168214608, "loss": 0.0271, "step": 30650 }, { "epoch": 0.08, "learning_rate": 0.0002880787286050894, "loss": 0.0303, "step": 30660 }, { "epoch": 0.08, "learning_rate": 0.0002880748403887179, "loss": 0.036, "step": 30670 }, { "epoch": 0.08, "learning_rate": 0.0002880709521723465, "loss": 0.0343, "step": 30680 }, { "epoch": 0.08, "learning_rate": 0.000288067063955975, "loss": 0.0343, "step": 30690 }, { "epoch": 0.08, "learning_rate": 0.00028806317573960356, "loss": 0.0337, "step": 30700 }, { "epoch": 0.08, "learning_rate": 0.00028805928752323207, "loss": 0.0365, "step": 30710 }, { "epoch": 0.08, "learning_rate": 0.0002880553993068606, "loss": 0.0289, "step": 30720 }, { "epoch": 0.08, "learning_rate": 0.00028805151109048915, "loss": 0.0342, "step": 30730 }, { "epoch": 0.08, "learning_rate": 0.00028804762287411767, "loss": 0.0331, "step": 30740 }, { "epoch": 0.08, "learning_rate": 0.00028804373465774624, "loss": 0.0298, "step": 30750 }, { "epoch": 0.08, "learning_rate": 0.00028803984644137475, "loss": 0.0297, "step": 30760 }, { "epoch": 0.08, "learning_rate": 0.00028803595822500327, "loss": 0.032, "step": 30770 }, { "epoch": 0.08, "learning_rate": 0.0002880320700086318, "loss": 0.032, "step": 30780 }, { "epoch": 0.08, "learning_rate": 0.00028802818179226035, "loss": 0.0379, "step": 30790 }, { "epoch": 0.08, "learning_rate": 0.00028802429357588887, "loss": 0.0366, "step": 30800 }, { "epoch": 0.08, "learning_rate": 0.00028802040535951743, "loss": 0.0324, "step": 30810 }, { "epoch": 0.08, "learning_rate": 0.00028801651714314595, "loss": 0.0296, "step": 30820 }, { "epoch": 0.08, "learning_rate": 0.0002880126289267745, "loss": 0.0352, "step": 30830 }, { "epoch": 0.08, "learning_rate": 0.00028800874071040303, "loss": 0.0351, "step": 30840 }, { "epoch": 0.08, "learning_rate": 0.00028800485249403155, "loss": 0.0305, "step": 30850 }, { "epoch": 0.08, "learning_rate": 0.00028800096427766006, "loss": 0.0295, "step": 30860 }, { "epoch": 0.08, "learning_rate": 0.00028799707606128863, "loss": 0.0255, "step": 30870 }, { "epoch": 0.08, "learning_rate": 0.0002879931878449172, "loss": 0.0359, "step": 30880 }, { "epoch": 0.08, "learning_rate": 0.0002879892996285457, "loss": 0.0283, "step": 30890 }, { "epoch": 0.08, "learning_rate": 0.00028798541141217423, "loss": 0.0315, "step": 30900 }, { "epoch": 0.08, "learning_rate": 0.0002879815231958028, "loss": 0.0365, "step": 30910 }, { "epoch": 0.08, "learning_rate": 0.0002879776349794313, "loss": 0.0342, "step": 30920 }, { "epoch": 0.08, "learning_rate": 0.0002879737467630598, "loss": 0.0349, "step": 30930 }, { "epoch": 0.08, "learning_rate": 0.0002879698585466884, "loss": 0.037, "step": 30940 }, { "epoch": 0.08, "learning_rate": 0.0002879659703303169, "loss": 0.0346, "step": 30950 }, { "epoch": 0.08, "learning_rate": 0.0002879620821139455, "loss": 0.0316, "step": 30960 }, { "epoch": 0.08, "learning_rate": 0.000287958193897574, "loss": 0.0305, "step": 30970 }, { "epoch": 0.08, "learning_rate": 0.0002879543056812025, "loss": 0.0367, "step": 30980 }, { "epoch": 0.08, "learning_rate": 0.0002879504174648311, "loss": 0.0339, "step": 30990 }, { "epoch": 0.08, "learning_rate": 0.0002879465292484596, "loss": 0.03, "step": 31000 }, { "epoch": 0.08, "eval_cer": 0.8817726681698768, "eval_loss": 0.023973068222403526, "eval_runtime": 107.5545, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 31000 }, { "epoch": 0.08, "learning_rate": 0.0002879426410320881, "loss": 0.0354, "step": 31010 }, { "epoch": 0.08, "learning_rate": 0.00028793875281571667, "loss": 0.0306, "step": 31020 }, { "epoch": 0.08, "learning_rate": 0.0002879348645993452, "loss": 0.0324, "step": 31030 }, { "epoch": 0.08, "learning_rate": 0.00028793097638297376, "loss": 0.0316, "step": 31040 }, { "epoch": 0.08, "learning_rate": 0.00028792708816660227, "loss": 0.0367, "step": 31050 }, { "epoch": 0.08, "learning_rate": 0.0002879231999502308, "loss": 0.0393, "step": 31060 }, { "epoch": 0.08, "learning_rate": 0.0002879193117338593, "loss": 0.0355, "step": 31070 }, { "epoch": 0.08, "learning_rate": 0.00028791542351748787, "loss": 0.0279, "step": 31080 }, { "epoch": 0.08, "learning_rate": 0.00028791153530111644, "loss": 0.0308, "step": 31090 }, { "epoch": 0.08, "learning_rate": 0.00028790764708474495, "loss": 0.0329, "step": 31100 }, { "epoch": 0.08, "learning_rate": 0.00028790375886837347, "loss": 0.032, "step": 31110 }, { "epoch": 0.08, "learning_rate": 0.00028789987065200203, "loss": 0.0361, "step": 31120 }, { "epoch": 0.08, "learning_rate": 0.00028789598243563055, "loss": 0.0338, "step": 31130 }, { "epoch": 0.08, "learning_rate": 0.00028789209421925906, "loss": 0.0334, "step": 31140 }, { "epoch": 0.08, "learning_rate": 0.00028788820600288763, "loss": 0.0287, "step": 31150 }, { "epoch": 0.08, "learning_rate": 0.00028788431778651615, "loss": 0.0313, "step": 31160 }, { "epoch": 0.08, "learning_rate": 0.0002878804295701447, "loss": 0.0306, "step": 31170 }, { "epoch": 0.08, "learning_rate": 0.00028787654135377323, "loss": 0.0385, "step": 31180 }, { "epoch": 0.08, "learning_rate": 0.00028787265313740174, "loss": 0.0339, "step": 31190 }, { "epoch": 0.08, "learning_rate": 0.0002878687649210303, "loss": 0.0334, "step": 31200 }, { "epoch": 0.08, "learning_rate": 0.00028786487670465883, "loss": 0.0439, "step": 31210 }, { "epoch": 0.08, "learning_rate": 0.00028786098848828734, "loss": 0.0324, "step": 31220 }, { "epoch": 0.08, "learning_rate": 0.0002878571002719159, "loss": 0.0353, "step": 31230 }, { "epoch": 0.08, "learning_rate": 0.0002878532120555445, "loss": 0.0402, "step": 31240 }, { "epoch": 0.08, "learning_rate": 0.000287849323839173, "loss": 0.0371, "step": 31250 }, { "epoch": 0.08, "learning_rate": 0.0002878454356228015, "loss": 0.0288, "step": 31260 }, { "epoch": 0.08, "learning_rate": 0.00028784154740643, "loss": 0.0303, "step": 31270 }, { "epoch": 0.08, "learning_rate": 0.0002878376591900586, "loss": 0.0383, "step": 31280 }, { "epoch": 0.08, "learning_rate": 0.0002878337709736871, "loss": 0.0335, "step": 31290 }, { "epoch": 0.08, "learning_rate": 0.0002878298827573157, "loss": 0.0322, "step": 31300 }, { "epoch": 0.08, "learning_rate": 0.0002878259945409442, "loss": 0.0329, "step": 31310 }, { "epoch": 0.08, "learning_rate": 0.0002878221063245727, "loss": 0.0316, "step": 31320 }, { "epoch": 0.08, "learning_rate": 0.0002878182181082013, "loss": 0.0339, "step": 31330 }, { "epoch": 0.08, "learning_rate": 0.0002878143298918298, "loss": 0.0365, "step": 31340 }, { "epoch": 0.08, "learning_rate": 0.0002878104416754583, "loss": 0.0339, "step": 31350 }, { "epoch": 0.08, "learning_rate": 0.00028780655345908687, "loss": 0.0332, "step": 31360 }, { "epoch": 0.08, "learning_rate": 0.00028780266524271544, "loss": 0.035, "step": 31370 }, { "epoch": 0.08, "learning_rate": 0.00028779877702634395, "loss": 0.0298, "step": 31380 }, { "epoch": 0.08, "learning_rate": 0.00028779488880997247, "loss": 0.0298, "step": 31390 }, { "epoch": 0.08, "learning_rate": 0.000287791000593601, "loss": 0.0271, "step": 31400 }, { "epoch": 0.08, "learning_rate": 0.00028778711237722955, "loss": 0.0337, "step": 31410 }, { "epoch": 0.08, "learning_rate": 0.00028778322416085807, "loss": 0.0319, "step": 31420 }, { "epoch": 0.08, "learning_rate": 0.00028777933594448664, "loss": 0.0292, "step": 31430 }, { "epoch": 0.08, "learning_rate": 0.00028777544772811515, "loss": 0.0343, "step": 31440 }, { "epoch": 0.08, "learning_rate": 0.0002877715595117437, "loss": 0.026, "step": 31450 }, { "epoch": 0.08, "learning_rate": 0.00028776767129537223, "loss": 0.0295, "step": 31460 }, { "epoch": 0.08, "learning_rate": 0.00028776378307900075, "loss": 0.0339, "step": 31470 }, { "epoch": 0.08, "learning_rate": 0.00028775989486262926, "loss": 0.0352, "step": 31480 }, { "epoch": 0.08, "learning_rate": 0.00028775600664625783, "loss": 0.0302, "step": 31490 }, { "epoch": 0.08, "learning_rate": 0.00028775211842988635, "loss": 0.0315, "step": 31500 }, { "epoch": 0.08, "learning_rate": 0.0002877482302135149, "loss": 0.0315, "step": 31510 }, { "epoch": 0.08, "learning_rate": 0.00028774434199714343, "loss": 0.0312, "step": 31520 }, { "epoch": 0.08, "learning_rate": 0.00028774045378077194, "loss": 0.0338, "step": 31530 }, { "epoch": 0.08, "learning_rate": 0.0002877365655644005, "loss": 0.0351, "step": 31540 }, { "epoch": 0.08, "learning_rate": 0.000287732677348029, "loss": 0.029, "step": 31550 }, { "epoch": 0.08, "learning_rate": 0.00028772878913165754, "loss": 0.0308, "step": 31560 }, { "epoch": 0.08, "learning_rate": 0.0002877249009152861, "loss": 0.0329, "step": 31570 }, { "epoch": 0.08, "learning_rate": 0.0002877210126989147, "loss": 0.0364, "step": 31580 }, { "epoch": 0.08, "learning_rate": 0.0002877171244825432, "loss": 0.0328, "step": 31590 }, { "epoch": 0.08, "learning_rate": 0.0002877132362661717, "loss": 0.032, "step": 31600 }, { "epoch": 0.08, "learning_rate": 0.0002877093480498002, "loss": 0.0311, "step": 31610 }, { "epoch": 0.08, "learning_rate": 0.0002877054598334288, "loss": 0.0403, "step": 31620 }, { "epoch": 0.08, "learning_rate": 0.0002877015716170573, "loss": 0.0307, "step": 31630 }, { "epoch": 0.08, "learning_rate": 0.0002876976834006859, "loss": 0.029, "step": 31640 }, { "epoch": 0.08, "learning_rate": 0.0002876937951843144, "loss": 0.0379, "step": 31650 }, { "epoch": 0.08, "learning_rate": 0.00028768990696794296, "loss": 0.0394, "step": 31660 }, { "epoch": 0.08, "learning_rate": 0.00028768601875157147, "loss": 0.0378, "step": 31670 }, { "epoch": 0.08, "learning_rate": 0.0002876821305352, "loss": 0.0393, "step": 31680 }, { "epoch": 0.08, "learning_rate": 0.0002876782423188285, "loss": 0.0278, "step": 31690 }, { "epoch": 0.08, "learning_rate": 0.00028767435410245707, "loss": 0.0379, "step": 31700 }, { "epoch": 0.08, "learning_rate": 0.0002876704658860856, "loss": 0.0393, "step": 31710 }, { "epoch": 0.08, "learning_rate": 0.00028766657766971415, "loss": 0.0372, "step": 31720 }, { "epoch": 0.08, "learning_rate": 0.00028766268945334267, "loss": 0.0287, "step": 31730 }, { "epoch": 0.08, "learning_rate": 0.00028765880123697124, "loss": 0.0295, "step": 31740 }, { "epoch": 0.08, "learning_rate": 0.00028765491302059975, "loss": 0.0311, "step": 31750 }, { "epoch": 0.08, "learning_rate": 0.00028765102480422827, "loss": 0.0326, "step": 31760 }, { "epoch": 0.08, "learning_rate": 0.00028764713658785683, "loss": 0.0271, "step": 31770 }, { "epoch": 0.08, "learning_rate": 0.00028764324837148535, "loss": 0.0331, "step": 31780 }, { "epoch": 0.08, "learning_rate": 0.0002876393601551139, "loss": 0.0262, "step": 31790 }, { "epoch": 0.08, "learning_rate": 0.00028763547193874243, "loss": 0.0293, "step": 31800 }, { "epoch": 0.08, "learning_rate": 0.00028763158372237095, "loss": 0.0293, "step": 31810 }, { "epoch": 0.08, "learning_rate": 0.00028762769550599946, "loss": 0.035, "step": 31820 }, { "epoch": 0.08, "learning_rate": 0.00028762380728962803, "loss": 0.0363, "step": 31830 }, { "epoch": 0.08, "learning_rate": 0.00028761991907325654, "loss": 0.0354, "step": 31840 }, { "epoch": 0.08, "learning_rate": 0.0002876160308568851, "loss": 0.0243, "step": 31850 }, { "epoch": 0.08, "learning_rate": 0.00028761214264051363, "loss": 0.0381, "step": 31860 }, { "epoch": 0.08, "learning_rate": 0.0002876082544241422, "loss": 0.0334, "step": 31870 }, { "epoch": 0.08, "learning_rate": 0.0002876043662077707, "loss": 0.0345, "step": 31880 }, { "epoch": 0.08, "learning_rate": 0.0002876004779913992, "loss": 0.0329, "step": 31890 }, { "epoch": 0.08, "learning_rate": 0.00028759658977502774, "loss": 0.0262, "step": 31900 }, { "epoch": 0.08, "learning_rate": 0.0002875927015586563, "loss": 0.0255, "step": 31910 }, { "epoch": 0.08, "learning_rate": 0.0002875888133422849, "loss": 0.0292, "step": 31920 }, { "epoch": 0.08, "learning_rate": 0.0002875849251259134, "loss": 0.0303, "step": 31930 }, { "epoch": 0.08, "learning_rate": 0.0002875810369095419, "loss": 0.0283, "step": 31940 }, { "epoch": 0.08, "learning_rate": 0.0002875771486931705, "loss": 0.0312, "step": 31950 }, { "epoch": 0.08, "learning_rate": 0.000287573260476799, "loss": 0.0283, "step": 31960 }, { "epoch": 0.08, "learning_rate": 0.0002875693722604275, "loss": 0.0326, "step": 31970 }, { "epoch": 0.08, "learning_rate": 0.0002875654840440561, "loss": 0.0305, "step": 31980 }, { "epoch": 0.08, "learning_rate": 0.0002875615958276846, "loss": 0.0384, "step": 31990 }, { "epoch": 0.08, "learning_rate": 0.00028755770761131316, "loss": 0.0307, "step": 32000 }, { "epoch": 0.08, "eval_cer": 0.8818356518319148, "eval_loss": 0.023202601820230484, "eval_runtime": 107.5432, "eval_samples_per_second": 18.597, "eval_steps_per_second": 4.649, "step": 32000 }, { "epoch": 0.08, "learning_rate": 0.00028755381939494167, "loss": 0.033, "step": 32010 }, { "epoch": 0.08, "learning_rate": 0.0002875499311785702, "loss": 0.0317, "step": 32020 }, { "epoch": 0.08, "learning_rate": 0.0002875460429621987, "loss": 0.0327, "step": 32030 }, { "epoch": 0.08, "learning_rate": 0.00028754215474582727, "loss": 0.0276, "step": 32040 }, { "epoch": 0.08, "learning_rate": 0.0002875382665294558, "loss": 0.0281, "step": 32050 }, { "epoch": 0.08, "learning_rate": 0.00028753437831308435, "loss": 0.031, "step": 32060 }, { "epoch": 0.08, "learning_rate": 0.00028753049009671287, "loss": 0.0366, "step": 32070 }, { "epoch": 0.08, "learning_rate": 0.00028752660188034144, "loss": 0.0353, "step": 32080 }, { "epoch": 0.08, "learning_rate": 0.00028752271366396995, "loss": 0.0351, "step": 32090 }, { "epoch": 0.08, "learning_rate": 0.00028751882544759846, "loss": 0.0293, "step": 32100 }, { "epoch": 0.08, "learning_rate": 0.000287514937231227, "loss": 0.0291, "step": 32110 }, { "epoch": 0.08, "learning_rate": 0.00028751104901485555, "loss": 0.0267, "step": 32120 }, { "epoch": 0.08, "learning_rate": 0.0002875071607984841, "loss": 0.0338, "step": 32130 }, { "epoch": 0.08, "learning_rate": 0.00028750327258211263, "loss": 0.034, "step": 32140 }, { "epoch": 0.08, "learning_rate": 0.00028749938436574115, "loss": 0.0325, "step": 32150 }, { "epoch": 0.08, "learning_rate": 0.0002874954961493697, "loss": 0.0282, "step": 32160 }, { "epoch": 0.08, "learning_rate": 0.00028749160793299823, "loss": 0.031, "step": 32170 }, { "epoch": 0.08, "learning_rate": 0.00028748771971662674, "loss": 0.0295, "step": 32180 }, { "epoch": 0.08, "learning_rate": 0.0002874838315002553, "loss": 0.0346, "step": 32190 }, { "epoch": 0.08, "learning_rate": 0.0002874799432838838, "loss": 0.0336, "step": 32200 }, { "epoch": 0.08, "learning_rate": 0.0002874760550675124, "loss": 0.0409, "step": 32210 }, { "epoch": 0.08, "learning_rate": 0.0002874721668511409, "loss": 0.0342, "step": 32220 }, { "epoch": 0.08, "learning_rate": 0.0002874682786347694, "loss": 0.0307, "step": 32230 }, { "epoch": 0.08, "learning_rate": 0.000287464390418398, "loss": 0.0332, "step": 32240 }, { "epoch": 0.08, "learning_rate": 0.0002874605022020265, "loss": 0.0323, "step": 32250 }, { "epoch": 0.08, "learning_rate": 0.000287456613985655, "loss": 0.045, "step": 32260 }, { "epoch": 0.08, "learning_rate": 0.0002874527257692836, "loss": 0.0573, "step": 32270 }, { "epoch": 0.08, "learning_rate": 0.0002874488375529121, "loss": 0.032, "step": 32280 }, { "epoch": 0.08, "learning_rate": 0.0002874449493365407, "loss": 0.0495, "step": 32290 }, { "epoch": 0.08, "learning_rate": 0.0002874410611201692, "loss": 0.0366, "step": 32300 }, { "epoch": 0.08, "learning_rate": 0.0002874371729037977, "loss": 0.0432, "step": 32310 }, { "epoch": 0.08, "learning_rate": 0.00028743328468742627, "loss": 0.0371, "step": 32320 }, { "epoch": 0.08, "learning_rate": 0.0002874293964710548, "loss": 0.0369, "step": 32330 }, { "epoch": 0.08, "learning_rate": 0.00028742550825468336, "loss": 0.0288, "step": 32340 }, { "epoch": 0.08, "learning_rate": 0.00028742162003831187, "loss": 0.0353, "step": 32350 }, { "epoch": 0.08, "learning_rate": 0.0002874177318219404, "loss": 0.0327, "step": 32360 }, { "epoch": 0.08, "learning_rate": 0.00028741384360556895, "loss": 0.0323, "step": 32370 }, { "epoch": 0.08, "learning_rate": 0.00028740995538919747, "loss": 0.0359, "step": 32380 }, { "epoch": 0.08, "learning_rate": 0.000287406067172826, "loss": 0.0355, "step": 32390 }, { "epoch": 0.08, "learning_rate": 0.00028740217895645455, "loss": 0.0327, "step": 32400 }, { "epoch": 0.08, "learning_rate": 0.00028739829074008307, "loss": 0.0384, "step": 32410 }, { "epoch": 0.08, "learning_rate": 0.00028739440252371163, "loss": 0.0356, "step": 32420 }, { "epoch": 0.08, "learning_rate": 0.00028739051430734015, "loss": 0.036, "step": 32430 }, { "epoch": 0.08, "learning_rate": 0.00028738662609096866, "loss": 0.0294, "step": 32440 }, { "epoch": 0.08, "learning_rate": 0.00028738273787459723, "loss": 0.033, "step": 32450 }, { "epoch": 0.08, "learning_rate": 0.00028737884965822575, "loss": 0.0361, "step": 32460 }, { "epoch": 0.08, "learning_rate": 0.0002873749614418543, "loss": 0.0327, "step": 32470 }, { "epoch": 0.08, "learning_rate": 0.00028737107322548283, "loss": 0.0336, "step": 32480 }, { "epoch": 0.08, "learning_rate": 0.0002873671850091114, "loss": 0.0345, "step": 32490 }, { "epoch": 0.08, "learning_rate": 0.0002873632967927399, "loss": 0.0411, "step": 32500 }, { "epoch": 0.08, "learning_rate": 0.00028735940857636843, "loss": 0.0387, "step": 32510 }, { "epoch": 0.08, "learning_rate": 0.00028735552035999694, "loss": 0.0329, "step": 32520 }, { "epoch": 0.08, "learning_rate": 0.0002873516321436255, "loss": 0.0352, "step": 32530 }, { "epoch": 0.08, "learning_rate": 0.000287347743927254, "loss": 0.03, "step": 32540 }, { "epoch": 0.08, "learning_rate": 0.0002873438557108826, "loss": 0.0287, "step": 32550 }, { "epoch": 0.08, "learning_rate": 0.0002873399674945111, "loss": 0.0328, "step": 32560 }, { "epoch": 0.08, "learning_rate": 0.0002873360792781396, "loss": 0.0363, "step": 32570 }, { "epoch": 0.08, "learning_rate": 0.0002873321910617682, "loss": 0.0316, "step": 32580 }, { "epoch": 0.08, "learning_rate": 0.0002873283028453967, "loss": 0.0301, "step": 32590 }, { "epoch": 0.08, "learning_rate": 0.0002873244146290252, "loss": 0.0346, "step": 32600 }, { "epoch": 0.08, "learning_rate": 0.0002873205264126538, "loss": 0.035, "step": 32610 }, { "epoch": 0.08, "learning_rate": 0.00028731663819628236, "loss": 0.0339, "step": 32620 }, { "epoch": 0.08, "learning_rate": 0.0002873127499799109, "loss": 0.0302, "step": 32630 }, { "epoch": 0.08, "learning_rate": 0.0002873088617635394, "loss": 0.0285, "step": 32640 }, { "epoch": 0.08, "learning_rate": 0.0002873049735471679, "loss": 0.0342, "step": 32650 }, { "epoch": 0.08, "learning_rate": 0.00028730108533079647, "loss": 0.0297, "step": 32660 }, { "epoch": 0.08, "learning_rate": 0.000287297197114425, "loss": 0.0369, "step": 32670 }, { "epoch": 0.08, "learning_rate": 0.00028729330889805355, "loss": 0.0314, "step": 32680 }, { "epoch": 0.08, "learning_rate": 0.00028728942068168207, "loss": 0.0362, "step": 32690 }, { "epoch": 0.08, "learning_rate": 0.00028728553246531064, "loss": 0.0354, "step": 32700 }, { "epoch": 0.08, "learning_rate": 0.00028728164424893915, "loss": 0.0336, "step": 32710 }, { "epoch": 0.08, "learning_rate": 0.00028727775603256767, "loss": 0.0311, "step": 32720 }, { "epoch": 0.08, "learning_rate": 0.0002872738678161962, "loss": 0.0296, "step": 32730 }, { "epoch": 0.08, "learning_rate": 0.00028726997959982475, "loss": 0.0322, "step": 32740 }, { "epoch": 0.08, "learning_rate": 0.00028726609138345326, "loss": 0.0319, "step": 32750 }, { "epoch": 0.08, "learning_rate": 0.00028726220316708183, "loss": 0.0274, "step": 32760 }, { "epoch": 0.08, "learning_rate": 0.00028725831495071035, "loss": 0.0307, "step": 32770 }, { "epoch": 0.08, "learning_rate": 0.00028725442673433886, "loss": 0.0315, "step": 32780 }, { "epoch": 0.08, "learning_rate": 0.00028725053851796743, "loss": 0.0315, "step": 32790 }, { "epoch": 0.09, "learning_rate": 0.00028724665030159595, "loss": 0.039, "step": 32800 }, { "epoch": 0.09, "learning_rate": 0.00028724276208522446, "loss": 0.0286, "step": 32810 }, { "epoch": 0.09, "learning_rate": 0.00028723887386885303, "loss": 0.0323, "step": 32820 }, { "epoch": 0.09, "learning_rate": 0.0002872349856524816, "loss": 0.0329, "step": 32830 }, { "epoch": 0.09, "learning_rate": 0.0002872310974361101, "loss": 0.0308, "step": 32840 }, { "epoch": 0.09, "learning_rate": 0.0002872272092197386, "loss": 0.0288, "step": 32850 }, { "epoch": 0.09, "learning_rate": 0.00028722332100336714, "loss": 0.036, "step": 32860 }, { "epoch": 0.09, "learning_rate": 0.0002872194327869957, "loss": 0.0312, "step": 32870 }, { "epoch": 0.09, "learning_rate": 0.0002872155445706242, "loss": 0.0365, "step": 32880 }, { "epoch": 0.09, "learning_rate": 0.0002872116563542528, "loss": 0.0306, "step": 32890 }, { "epoch": 0.09, "learning_rate": 0.0002872077681378813, "loss": 0.0303, "step": 32900 }, { "epoch": 0.09, "learning_rate": 0.0002872038799215099, "loss": 0.0298, "step": 32910 }, { "epoch": 0.09, "learning_rate": 0.0002871999917051384, "loss": 0.0312, "step": 32920 }, { "epoch": 0.09, "learning_rate": 0.0002871961034887669, "loss": 0.0349, "step": 32930 }, { "epoch": 0.09, "learning_rate": 0.0002871922152723954, "loss": 0.0328, "step": 32940 }, { "epoch": 0.09, "learning_rate": 0.000287188327056024, "loss": 0.0277, "step": 32950 }, { "epoch": 0.09, "learning_rate": 0.00028718443883965256, "loss": 0.0347, "step": 32960 }, { "epoch": 0.09, "learning_rate": 0.00028718055062328107, "loss": 0.0461, "step": 32970 }, { "epoch": 0.09, "learning_rate": 0.0002871766624069096, "loss": 0.0306, "step": 32980 }, { "epoch": 0.09, "learning_rate": 0.00028717277419053816, "loss": 0.0336, "step": 32990 }, { "epoch": 0.09, "learning_rate": 0.00028716888597416667, "loss": 0.0394, "step": 33000 }, { "epoch": 0.09, "eval_cer": 0.8818328525580464, "eval_loss": 0.023882215842604637, "eval_runtime": 107.6564, "eval_samples_per_second": 18.578, "eval_steps_per_second": 4.644, "step": 33000 }, { "epoch": 0.09, "learning_rate": 0.0002871649977577952, "loss": 0.0326, "step": 33010 }, { "epoch": 0.09, "learning_rate": 0.00028716110954142375, "loss": 0.029, "step": 33020 }, { "epoch": 0.09, "learning_rate": 0.00028715722132505227, "loss": 0.033, "step": 33030 }, { "epoch": 0.09, "learning_rate": 0.00028715333310868084, "loss": 0.0307, "step": 33040 }, { "epoch": 0.09, "learning_rate": 0.00028714944489230935, "loss": 0.0291, "step": 33050 }, { "epoch": 0.09, "learning_rate": 0.00028714555667593787, "loss": 0.0328, "step": 33060 }, { "epoch": 0.09, "learning_rate": 0.0002871416684595664, "loss": 0.0315, "step": 33070 }, { "epoch": 0.09, "learning_rate": 0.00028713778024319495, "loss": 0.0304, "step": 33080 }, { "epoch": 0.09, "learning_rate": 0.00028713389202682346, "loss": 0.0315, "step": 33090 }, { "epoch": 0.09, "learning_rate": 0.00028713000381045203, "loss": 0.0404, "step": 33100 }, { "epoch": 0.09, "learning_rate": 0.00028712611559408055, "loss": 0.0391, "step": 33110 }, { "epoch": 0.09, "learning_rate": 0.0002871222273777091, "loss": 0.0296, "step": 33120 }, { "epoch": 0.09, "learning_rate": 0.00028711833916133763, "loss": 0.0303, "step": 33130 }, { "epoch": 0.09, "learning_rate": 0.00028711445094496614, "loss": 0.0335, "step": 33140 }, { "epoch": 0.09, "learning_rate": 0.00028711056272859466, "loss": 0.0321, "step": 33150 }, { "epoch": 0.09, "learning_rate": 0.00028710667451222323, "loss": 0.0279, "step": 33160 }, { "epoch": 0.09, "learning_rate": 0.0002871027862958518, "loss": 0.0261, "step": 33170 }, { "epoch": 0.09, "learning_rate": 0.0002870988980794803, "loss": 0.0291, "step": 33180 }, { "epoch": 0.09, "learning_rate": 0.0002870950098631088, "loss": 0.0313, "step": 33190 }, { "epoch": 0.09, "learning_rate": 0.0002870911216467374, "loss": 0.0384, "step": 33200 }, { "epoch": 0.09, "learning_rate": 0.0002870872334303659, "loss": 0.0365, "step": 33210 }, { "epoch": 0.09, "learning_rate": 0.0002870833452139944, "loss": 0.0316, "step": 33220 }, { "epoch": 0.09, "learning_rate": 0.000287079456997623, "loss": 0.0352, "step": 33230 }, { "epoch": 0.09, "learning_rate": 0.0002870755687812515, "loss": 0.0312, "step": 33240 }, { "epoch": 0.09, "learning_rate": 0.0002870716805648801, "loss": 0.0288, "step": 33250 }, { "epoch": 0.09, "learning_rate": 0.0002870677923485086, "loss": 0.0325, "step": 33260 }, { "epoch": 0.09, "learning_rate": 0.0002870639041321371, "loss": 0.033, "step": 33270 }, { "epoch": 0.09, "learning_rate": 0.0002870600159157656, "loss": 0.0323, "step": 33280 }, { "epoch": 0.09, "learning_rate": 0.0002870561276993942, "loss": 0.0279, "step": 33290 }, { "epoch": 0.09, "learning_rate": 0.0002870522394830227, "loss": 0.0306, "step": 33300 }, { "epoch": 0.09, "learning_rate": 0.00028704835126665127, "loss": 0.0351, "step": 33310 }, { "epoch": 0.09, "learning_rate": 0.0002870444630502798, "loss": 0.0497, "step": 33320 }, { "epoch": 0.09, "learning_rate": 0.00028704057483390835, "loss": 0.0317, "step": 33330 }, { "epoch": 0.09, "learning_rate": 0.00028703668661753687, "loss": 0.0278, "step": 33340 }, { "epoch": 0.09, "learning_rate": 0.0002870327984011654, "loss": 0.0333, "step": 33350 }, { "epoch": 0.09, "learning_rate": 0.00028702891018479395, "loss": 0.0301, "step": 33360 }, { "epoch": 0.09, "learning_rate": 0.00028702502196842247, "loss": 0.0316, "step": 33370 }, { "epoch": 0.09, "learning_rate": 0.00028702113375205104, "loss": 0.0333, "step": 33380 }, { "epoch": 0.09, "learning_rate": 0.00028701724553567955, "loss": 0.0299, "step": 33390 }, { "epoch": 0.09, "learning_rate": 0.00028701335731930806, "loss": 0.0354, "step": 33400 }, { "epoch": 0.09, "learning_rate": 0.00028700946910293663, "loss": 0.0288, "step": 33410 }, { "epoch": 0.09, "learning_rate": 0.00028700558088656515, "loss": 0.0303, "step": 33420 }, { "epoch": 0.09, "learning_rate": 0.00028700169267019366, "loss": 0.0297, "step": 33430 }, { "epoch": 0.09, "learning_rate": 0.00028699780445382223, "loss": 0.0298, "step": 33440 }, { "epoch": 0.09, "learning_rate": 0.00028699391623745075, "loss": 0.0323, "step": 33450 }, { "epoch": 0.09, "learning_rate": 0.0002869900280210793, "loss": 0.0319, "step": 33460 }, { "epoch": 0.09, "learning_rate": 0.00028698613980470783, "loss": 0.036, "step": 33470 }, { "epoch": 0.09, "learning_rate": 0.00028698225158833634, "loss": 0.0271, "step": 33480 }, { "epoch": 0.09, "learning_rate": 0.0002869783633719649, "loss": 0.0328, "step": 33490 }, { "epoch": 0.09, "learning_rate": 0.0002869744751555934, "loss": 0.0286, "step": 33500 }, { "epoch": 0.09, "learning_rate": 0.000286970586939222, "loss": 0.0378, "step": 33510 }, { "epoch": 0.09, "learning_rate": 0.0002869666987228505, "loss": 0.0305, "step": 33520 }, { "epoch": 0.09, "learning_rate": 0.000286962810506479, "loss": 0.0308, "step": 33530 }, { "epoch": 0.09, "learning_rate": 0.0002869589222901076, "loss": 0.0266, "step": 33540 }, { "epoch": 0.09, "learning_rate": 0.0002869550340737361, "loss": 0.0338, "step": 33550 }, { "epoch": 0.09, "learning_rate": 0.0002869511458573646, "loss": 0.0331, "step": 33560 }, { "epoch": 0.09, "learning_rate": 0.0002869472576409932, "loss": 0.0367, "step": 33570 }, { "epoch": 0.09, "learning_rate": 0.0002869433694246217, "loss": 0.0282, "step": 33580 }, { "epoch": 0.09, "learning_rate": 0.0002869394812082503, "loss": 0.033, "step": 33590 }, { "epoch": 0.09, "learning_rate": 0.0002869355929918788, "loss": 0.0286, "step": 33600 }, { "epoch": 0.09, "learning_rate": 0.0002869317047755073, "loss": 0.0301, "step": 33610 }, { "epoch": 0.09, "learning_rate": 0.00028692781655913587, "loss": 0.0323, "step": 33620 }, { "epoch": 0.09, "learning_rate": 0.0002869239283427644, "loss": 0.0329, "step": 33630 }, { "epoch": 0.09, "learning_rate": 0.0002869200401263929, "loss": 0.0284, "step": 33640 }, { "epoch": 0.09, "learning_rate": 0.00028691615191002147, "loss": 0.0356, "step": 33650 }, { "epoch": 0.09, "learning_rate": 0.00028691226369365004, "loss": 0.0388, "step": 33660 }, { "epoch": 0.09, "learning_rate": 0.00028690837547727855, "loss": 0.069, "step": 33670 }, { "epoch": 0.09, "learning_rate": 0.00028690448726090707, "loss": 0.0371, "step": 33680 }, { "epoch": 0.09, "learning_rate": 0.0002869005990445356, "loss": 0.0328, "step": 33690 }, { "epoch": 0.09, "learning_rate": 0.00028689671082816415, "loss": 0.037, "step": 33700 }, { "epoch": 0.09, "learning_rate": 0.00028689282261179267, "loss": 0.0314, "step": 33710 }, { "epoch": 0.09, "learning_rate": 0.00028688893439542123, "loss": 0.1216, "step": 33720 }, { "epoch": 0.09, "learning_rate": 0.00028688504617904975, "loss": 0.0316, "step": 33730 }, { "epoch": 0.09, "learning_rate": 0.0002868811579626783, "loss": 0.0441, "step": 33740 }, { "epoch": 0.09, "learning_rate": 0.00028687726974630683, "loss": 0.0281, "step": 33750 }, { "epoch": 0.09, "learning_rate": 0.00028687338152993535, "loss": 0.0325, "step": 33760 }, { "epoch": 0.09, "learning_rate": 0.00028686949331356386, "loss": 0.0315, "step": 33770 }, { "epoch": 0.09, "learning_rate": 0.00028686560509719243, "loss": 0.036, "step": 33780 }, { "epoch": 0.09, "learning_rate": 0.00028686171688082094, "loss": 0.028, "step": 33790 }, { "epoch": 0.09, "learning_rate": 0.0002868578286644495, "loss": 0.0285, "step": 33800 }, { "epoch": 0.09, "learning_rate": 0.00028685394044807803, "loss": 0.033, "step": 33810 }, { "epoch": 0.09, "learning_rate": 0.00028685005223170654, "loss": 0.0301, "step": 33820 }, { "epoch": 0.09, "learning_rate": 0.0002868461640153351, "loss": 0.0344, "step": 33830 }, { "epoch": 0.09, "learning_rate": 0.0002868422757989636, "loss": 0.0335, "step": 33840 }, { "epoch": 0.09, "learning_rate": 0.00028683838758259214, "loss": 0.0314, "step": 33850 }, { "epoch": 0.09, "learning_rate": 0.0002868344993662207, "loss": 0.0339, "step": 33860 }, { "epoch": 0.09, "learning_rate": 0.0002868306111498493, "loss": 0.0257, "step": 33870 }, { "epoch": 0.09, "learning_rate": 0.0002868267229334778, "loss": 0.0361, "step": 33880 }, { "epoch": 0.09, "learning_rate": 0.0002868228347171063, "loss": 0.0263, "step": 33890 }, { "epoch": 0.09, "learning_rate": 0.0002868189465007348, "loss": 0.0232, "step": 33900 }, { "epoch": 0.09, "learning_rate": 0.0002868150582843634, "loss": 0.0308, "step": 33910 }, { "epoch": 0.09, "learning_rate": 0.0002868111700679919, "loss": 0.0342, "step": 33920 }, { "epoch": 0.09, "learning_rate": 0.0002868072818516205, "loss": 0.0294, "step": 33930 }, { "epoch": 0.09, "learning_rate": 0.000286803393635249, "loss": 0.0492, "step": 33940 }, { "epoch": 0.09, "learning_rate": 0.00028679950541887756, "loss": 0.0311, "step": 33950 }, { "epoch": 0.09, "learning_rate": 0.00028679561720250607, "loss": 0.0352, "step": 33960 }, { "epoch": 0.09, "learning_rate": 0.0002867917289861346, "loss": 0.0396, "step": 33970 }, { "epoch": 0.09, "learning_rate": 0.0002867878407697631, "loss": 0.0353, "step": 33980 }, { "epoch": 0.09, "learning_rate": 0.00028678395255339167, "loss": 0.0274, "step": 33990 }, { "epoch": 0.09, "learning_rate": 0.0002867800643370202, "loss": 0.0357, "step": 34000 }, { "epoch": 0.09, "eval_cer": 0.8817866645392185, "eval_loss": 0.023611877113580704, "eval_runtime": 107.9395, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 34000 }, { "epoch": 0.09, "learning_rate": 0.00028677617612064875, "loss": 0.0383, "step": 34010 }, { "epoch": 0.09, "learning_rate": 0.00028677228790427727, "loss": 0.0348, "step": 34020 }, { "epoch": 0.09, "learning_rate": 0.0002867683996879058, "loss": 0.0358, "step": 34030 }, { "epoch": 0.09, "learning_rate": 0.00028676451147153435, "loss": 0.0304, "step": 34040 }, { "epoch": 0.09, "learning_rate": 0.00028676062325516286, "loss": 0.031, "step": 34050 }, { "epoch": 0.09, "learning_rate": 0.00028675673503879143, "loss": 0.034, "step": 34060 }, { "epoch": 0.09, "learning_rate": 0.00028675284682241995, "loss": 0.0355, "step": 34070 }, { "epoch": 0.09, "learning_rate": 0.0002867489586060485, "loss": 0.038, "step": 34080 }, { "epoch": 0.09, "learning_rate": 0.00028674507038967703, "loss": 0.0641, "step": 34090 }, { "epoch": 0.09, "learning_rate": 0.00028674118217330555, "loss": 0.0373, "step": 34100 }, { "epoch": 0.09, "learning_rate": 0.00028673729395693406, "loss": 0.0295, "step": 34110 }, { "epoch": 0.09, "learning_rate": 0.00028673340574056263, "loss": 0.0351, "step": 34120 }, { "epoch": 0.09, "learning_rate": 0.00028672951752419114, "loss": 0.0314, "step": 34130 }, { "epoch": 0.09, "learning_rate": 0.0002867256293078197, "loss": 0.0331, "step": 34140 }, { "epoch": 0.09, "learning_rate": 0.0002867217410914482, "loss": 0.038, "step": 34150 }, { "epoch": 0.09, "learning_rate": 0.0002867178528750768, "loss": 0.0367, "step": 34160 }, { "epoch": 0.09, "learning_rate": 0.0002867139646587053, "loss": 0.0297, "step": 34170 }, { "epoch": 0.09, "learning_rate": 0.0002867100764423338, "loss": 0.0313, "step": 34180 }, { "epoch": 0.09, "learning_rate": 0.00028670618822596234, "loss": 0.0955, "step": 34190 }, { "epoch": 0.09, "learning_rate": 0.0002867023000095909, "loss": 0.0364, "step": 34200 }, { "epoch": 0.09, "learning_rate": 0.0002866984117932195, "loss": 0.025, "step": 34210 }, { "epoch": 0.09, "learning_rate": 0.000286694523576848, "loss": 0.0329, "step": 34220 }, { "epoch": 0.09, "learning_rate": 0.0002866906353604765, "loss": 0.0296, "step": 34230 }, { "epoch": 0.09, "learning_rate": 0.000286686747144105, "loss": 0.0349, "step": 34240 }, { "epoch": 0.09, "learning_rate": 0.0002866828589277336, "loss": 0.0629, "step": 34250 }, { "epoch": 0.09, "learning_rate": 0.0002866789707113621, "loss": 0.033, "step": 34260 }, { "epoch": 0.09, "learning_rate": 0.00028667508249499067, "loss": 0.0349, "step": 34270 }, { "epoch": 0.09, "learning_rate": 0.0002866711942786192, "loss": 0.0357, "step": 34280 }, { "epoch": 0.09, "learning_rate": 0.00028666730606224776, "loss": 0.0318, "step": 34290 }, { "epoch": 0.09, "learning_rate": 0.00028666341784587627, "loss": 0.0318, "step": 34300 }, { "epoch": 0.09, "learning_rate": 0.0002866595296295048, "loss": 0.0316, "step": 34310 }, { "epoch": 0.09, "learning_rate": 0.0002866556414131333, "loss": 0.0368, "step": 34320 }, { "epoch": 0.09, "learning_rate": 0.00028665175319676187, "loss": 0.0302, "step": 34330 }, { "epoch": 0.09, "learning_rate": 0.0002866478649803904, "loss": 0.0298, "step": 34340 }, { "epoch": 0.09, "learning_rate": 0.00028664397676401895, "loss": 0.0325, "step": 34350 }, { "epoch": 0.09, "learning_rate": 0.00028664008854764747, "loss": 0.0331, "step": 34360 }, { "epoch": 0.09, "learning_rate": 0.00028663620033127603, "loss": 0.0473, "step": 34370 }, { "epoch": 0.09, "learning_rate": 0.00028663231211490455, "loss": 0.0404, "step": 34380 }, { "epoch": 0.09, "learning_rate": 0.00028662842389853306, "loss": 0.0357, "step": 34390 }, { "epoch": 0.09, "learning_rate": 0.0002866245356821616, "loss": 0.0317, "step": 34400 }, { "epoch": 0.09, "learning_rate": 0.00028662064746579015, "loss": 0.0334, "step": 34410 }, { "epoch": 0.09, "learning_rate": 0.0002866167592494187, "loss": 0.0366, "step": 34420 }, { "epoch": 0.09, "learning_rate": 0.00028661287103304723, "loss": 0.0337, "step": 34430 }, { "epoch": 0.09, "learning_rate": 0.00028660898281667574, "loss": 0.0334, "step": 34440 }, { "epoch": 0.09, "learning_rate": 0.0002866050946003043, "loss": 0.0324, "step": 34450 }, { "epoch": 0.09, "learning_rate": 0.00028660120638393283, "loss": 0.0362, "step": 34460 }, { "epoch": 0.09, "learning_rate": 0.00028659731816756134, "loss": 0.0342, "step": 34470 }, { "epoch": 0.09, "learning_rate": 0.0002865934299511899, "loss": 0.0281, "step": 34480 }, { "epoch": 0.09, "learning_rate": 0.0002865895417348184, "loss": 0.0316, "step": 34490 }, { "epoch": 0.09, "learning_rate": 0.000286585653518447, "loss": 0.0301, "step": 34500 }, { "epoch": 0.09, "learning_rate": 0.0002865817653020755, "loss": 0.0347, "step": 34510 }, { "epoch": 0.09, "learning_rate": 0.000286577877085704, "loss": 0.0344, "step": 34520 }, { "epoch": 0.09, "learning_rate": 0.00028657398886933254, "loss": 0.0392, "step": 34530 }, { "epoch": 0.09, "learning_rate": 0.0002865701006529611, "loss": 0.0526, "step": 34540 }, { "epoch": 0.09, "learning_rate": 0.0002865662124365897, "loss": 0.0416, "step": 34550 }, { "epoch": 0.09, "learning_rate": 0.0002865623242202182, "loss": 0.0348, "step": 34560 }, { "epoch": 0.09, "learning_rate": 0.0002865584360038467, "loss": 0.0352, "step": 34570 }, { "epoch": 0.09, "learning_rate": 0.0002865545477874753, "loss": 0.0297, "step": 34580 }, { "epoch": 0.09, "learning_rate": 0.0002865506595711038, "loss": 0.0363, "step": 34590 }, { "epoch": 0.09, "learning_rate": 0.0002865467713547323, "loss": 0.0632, "step": 34600 }, { "epoch": 0.09, "learning_rate": 0.00028654288313836087, "loss": 0.0357, "step": 34610 }, { "epoch": 0.09, "learning_rate": 0.0002865389949219894, "loss": 0.0312, "step": 34620 }, { "epoch": 0.09, "learning_rate": 0.00028653510670561795, "loss": 0.0295, "step": 34630 }, { "epoch": 0.09, "learning_rate": 0.00028653121848924647, "loss": 0.0305, "step": 34640 }, { "epoch": 0.09, "learning_rate": 0.000286527330272875, "loss": 0.0392, "step": 34650 }, { "epoch": 0.09, "learning_rate": 0.00028652344205650355, "loss": 0.0279, "step": 34660 }, { "epoch": 0.09, "learning_rate": 0.00028651955384013207, "loss": 0.037, "step": 34670 }, { "epoch": 0.09, "learning_rate": 0.0002865156656237606, "loss": 0.0366, "step": 34680 }, { "epoch": 0.09, "learning_rate": 0.00028651177740738915, "loss": 0.031, "step": 34690 }, { "epoch": 0.09, "learning_rate": 0.0002865078891910177, "loss": 0.032, "step": 34700 }, { "epoch": 0.09, "learning_rate": 0.00028650400097464623, "loss": 0.0319, "step": 34710 }, { "epoch": 0.09, "learning_rate": 0.00028650011275827475, "loss": 0.0321, "step": 34720 }, { "epoch": 0.09, "learning_rate": 0.00028649622454190326, "loss": 0.0305, "step": 34730 }, { "epoch": 0.09, "learning_rate": 0.0002864923363255318, "loss": 0.0333, "step": 34740 }, { "epoch": 0.09, "learning_rate": 0.00028648844810916035, "loss": 0.0372, "step": 34750 }, { "epoch": 0.09, "learning_rate": 0.0002864845598927889, "loss": 0.0374, "step": 34760 }, { "epoch": 0.09, "learning_rate": 0.00028648067167641743, "loss": 0.0301, "step": 34770 }, { "epoch": 0.09, "learning_rate": 0.00028647678346004594, "loss": 0.0296, "step": 34780 }, { "epoch": 0.09, "learning_rate": 0.0002864728952436745, "loss": 0.0301, "step": 34790 }, { "epoch": 0.09, "learning_rate": 0.000286469007027303, "loss": 0.0389, "step": 34800 }, { "epoch": 0.09, "learning_rate": 0.00028646511881093154, "loss": 0.034, "step": 34810 }, { "epoch": 0.09, "learning_rate": 0.0002864612305945601, "loss": 0.0327, "step": 34820 }, { "epoch": 0.09, "learning_rate": 0.0002864573423781886, "loss": 0.034, "step": 34830 }, { "epoch": 0.09, "learning_rate": 0.0002864534541618172, "loss": 0.0349, "step": 34840 }, { "epoch": 0.09, "learning_rate": 0.0002864495659454457, "loss": 0.0327, "step": 34850 }, { "epoch": 0.09, "learning_rate": 0.0002864456777290742, "loss": 0.0286, "step": 34860 }, { "epoch": 0.09, "learning_rate": 0.0002864417895127028, "loss": 0.0297, "step": 34870 }, { "epoch": 0.09, "learning_rate": 0.0002864379012963313, "loss": 0.0224, "step": 34880 }, { "epoch": 0.09, "learning_rate": 0.0002864340130799598, "loss": 0.0296, "step": 34890 }, { "epoch": 0.09, "learning_rate": 0.0002864301248635884, "loss": 0.0295, "step": 34900 }, { "epoch": 0.09, "learning_rate": 0.00028642623664721696, "loss": 0.0271, "step": 34910 }, { "epoch": 0.09, "learning_rate": 0.00028642234843084547, "loss": 0.0348, "step": 34920 }, { "epoch": 0.09, "learning_rate": 0.000286418460214474, "loss": 0.0335, "step": 34930 }, { "epoch": 0.09, "learning_rate": 0.0002864145719981025, "loss": 0.0311, "step": 34940 }, { "epoch": 0.09, "learning_rate": 0.00028641068378173107, "loss": 0.031, "step": 34950 }, { "epoch": 0.09, "learning_rate": 0.0002864067955653596, "loss": 0.0303, "step": 34960 }, { "epoch": 0.09, "learning_rate": 0.00028640290734898815, "loss": 0.0375, "step": 34970 }, { "epoch": 0.09, "learning_rate": 0.00028639901913261667, "loss": 0.0322, "step": 34980 }, { "epoch": 0.09, "learning_rate": 0.0002863951309162452, "loss": 0.0291, "step": 34990 }, { "epoch": 0.09, "learning_rate": 0.00028639124269987375, "loss": 0.0372, "step": 35000 }, { "epoch": 0.09, "eval_cer": 0.8818622449336642, "eval_loss": 0.023330524563789368, "eval_runtime": 107.4947, "eval_samples_per_second": 18.606, "eval_steps_per_second": 4.651, "step": 35000 }, { "epoch": 0.09, "learning_rate": 0.00028638735448350227, "loss": 0.0309, "step": 35010 }, { "epoch": 0.09, "learning_rate": 0.0002863834662671308, "loss": 0.0395, "step": 35020 }, { "epoch": 0.09, "learning_rate": 0.00028637957805075935, "loss": 0.0353, "step": 35030 }, { "epoch": 0.09, "learning_rate": 0.00028637568983438786, "loss": 0.0329, "step": 35040 }, { "epoch": 0.09, "learning_rate": 0.00028637180161801643, "loss": 0.035, "step": 35050 }, { "epoch": 0.09, "learning_rate": 0.00028636791340164495, "loss": 0.0342, "step": 35060 }, { "epoch": 0.09, "learning_rate": 0.00028636402518527346, "loss": 0.0281, "step": 35070 }, { "epoch": 0.09, "learning_rate": 0.00028636013696890203, "loss": 0.0355, "step": 35080 }, { "epoch": 0.09, "learning_rate": 0.00028635624875253054, "loss": 0.0348, "step": 35090 }, { "epoch": 0.09, "learning_rate": 0.0002863523605361591, "loss": 0.0323, "step": 35100 }, { "epoch": 0.09, "learning_rate": 0.00028634847231978763, "loss": 0.0315, "step": 35110 }, { "epoch": 0.09, "learning_rate": 0.0002863445841034162, "loss": 0.0297, "step": 35120 }, { "epoch": 0.09, "learning_rate": 0.0002863406958870447, "loss": 0.0361, "step": 35130 }, { "epoch": 0.09, "learning_rate": 0.0002863368076706732, "loss": 0.0356, "step": 35140 }, { "epoch": 0.09, "learning_rate": 0.00028633291945430174, "loss": 0.0347, "step": 35150 }, { "epoch": 0.09, "learning_rate": 0.0002863290312379303, "loss": 0.028, "step": 35160 }, { "epoch": 0.09, "learning_rate": 0.0002863251430215588, "loss": 0.0314, "step": 35170 }, { "epoch": 0.09, "learning_rate": 0.0002863212548051874, "loss": 0.0365, "step": 35180 }, { "epoch": 0.09, "learning_rate": 0.0002863173665888159, "loss": 0.0377, "step": 35190 }, { "epoch": 0.09, "learning_rate": 0.0002863134783724445, "loss": 0.0276, "step": 35200 }, { "epoch": 0.09, "learning_rate": 0.000286309590156073, "loss": 0.0345, "step": 35210 }, { "epoch": 0.09, "learning_rate": 0.0002863057019397015, "loss": 0.0278, "step": 35220 }, { "epoch": 0.09, "learning_rate": 0.00028630181372333, "loss": 0.0336, "step": 35230 }, { "epoch": 0.09, "learning_rate": 0.0002862979255069586, "loss": 0.0361, "step": 35240 }, { "epoch": 0.09, "learning_rate": 0.00028629403729058716, "loss": 0.0316, "step": 35250 }, { "epoch": 0.09, "learning_rate": 0.00028629014907421567, "loss": 0.041, "step": 35260 }, { "epoch": 0.09, "learning_rate": 0.0002862862608578442, "loss": 0.0273, "step": 35270 }, { "epoch": 0.09, "learning_rate": 0.0002862823726414727, "loss": 0.0333, "step": 35280 }, { "epoch": 0.09, "learning_rate": 0.00028627848442510127, "loss": 0.0311, "step": 35290 }, { "epoch": 0.09, "learning_rate": 0.0002862745962087298, "loss": 0.0359, "step": 35300 }, { "epoch": 0.09, "learning_rate": 0.00028627070799235835, "loss": 0.0289, "step": 35310 }, { "epoch": 0.09, "learning_rate": 0.00028626681977598687, "loss": 0.0288, "step": 35320 }, { "epoch": 0.09, "learning_rate": 0.00028626293155961544, "loss": 0.0372, "step": 35330 }, { "epoch": 0.09, "learning_rate": 0.00028625904334324395, "loss": 0.0263, "step": 35340 }, { "epoch": 0.09, "learning_rate": 0.00028625515512687246, "loss": 0.0221, "step": 35350 }, { "epoch": 0.09, "learning_rate": 0.000286251266910501, "loss": 0.0304, "step": 35360 }, { "epoch": 0.09, "learning_rate": 0.00028624737869412955, "loss": 0.0283, "step": 35370 }, { "epoch": 0.09, "learning_rate": 0.00028624349047775806, "loss": 0.0278, "step": 35380 }, { "epoch": 0.09, "learning_rate": 0.00028623960226138663, "loss": 0.0317, "step": 35390 }, { "epoch": 0.09, "learning_rate": 0.00028623571404501515, "loss": 0.0385, "step": 35400 }, { "epoch": 0.09, "learning_rate": 0.0002862318258286437, "loss": 0.0314, "step": 35410 }, { "epoch": 0.09, "learning_rate": 0.00028622793761227223, "loss": 0.033, "step": 35420 }, { "epoch": 0.09, "learning_rate": 0.00028622404939590074, "loss": 0.0306, "step": 35430 }, { "epoch": 0.09, "learning_rate": 0.00028622016117952926, "loss": 0.0333, "step": 35440 }, { "epoch": 0.09, "learning_rate": 0.0002862162729631578, "loss": 0.0344, "step": 35450 }, { "epoch": 0.09, "learning_rate": 0.0002862123847467864, "loss": 0.0276, "step": 35460 }, { "epoch": 0.09, "learning_rate": 0.0002862084965304149, "loss": 0.0299, "step": 35470 }, { "epoch": 0.09, "learning_rate": 0.0002862046083140434, "loss": 0.0278, "step": 35480 }, { "epoch": 0.09, "learning_rate": 0.00028620072009767194, "loss": 0.0278, "step": 35490 }, { "epoch": 0.09, "learning_rate": 0.0002861968318813005, "loss": 0.0301, "step": 35500 }, { "epoch": 0.09, "learning_rate": 0.000286192943664929, "loss": 0.035, "step": 35510 }, { "epoch": 0.09, "learning_rate": 0.0002861890554485576, "loss": 0.032, "step": 35520 }, { "epoch": 0.09, "learning_rate": 0.0002861851672321861, "loss": 0.0361, "step": 35530 }, { "epoch": 0.09, "learning_rate": 0.0002861812790158147, "loss": 0.0395, "step": 35540 }, { "epoch": 0.09, "learning_rate": 0.0002861773907994432, "loss": 0.0301, "step": 35550 }, { "epoch": 0.09, "learning_rate": 0.0002861735025830717, "loss": 0.0344, "step": 35560 }, { "epoch": 0.09, "learning_rate": 0.0002861696143667002, "loss": 0.029, "step": 35570 }, { "epoch": 0.09, "learning_rate": 0.0002861657261503288, "loss": 0.0337, "step": 35580 }, { "epoch": 0.09, "learning_rate": 0.0002861618379339573, "loss": 0.0277, "step": 35590 }, { "epoch": 0.09, "learning_rate": 0.00028615794971758587, "loss": 0.0283, "step": 35600 }, { "epoch": 0.09, "learning_rate": 0.0002861540615012144, "loss": 0.0341, "step": 35610 }, { "epoch": 0.09, "learning_rate": 0.00028615017328484295, "loss": 0.0324, "step": 35620 }, { "epoch": 0.09, "learning_rate": 0.00028614628506847147, "loss": 0.0267, "step": 35630 }, { "epoch": 0.09, "learning_rate": 0.0002861423968521, "loss": 0.0308, "step": 35640 }, { "epoch": 0.09, "learning_rate": 0.00028613850863572855, "loss": 0.0315, "step": 35650 }, { "epoch": 0.09, "learning_rate": 0.00028613462041935707, "loss": 0.028, "step": 35660 }, { "epoch": 0.09, "learning_rate": 0.00028613073220298563, "loss": 0.0361, "step": 35670 }, { "epoch": 0.09, "learning_rate": 0.00028612684398661415, "loss": 0.0362, "step": 35680 }, { "epoch": 0.09, "learning_rate": 0.00028612295577024266, "loss": 0.0338, "step": 35690 }, { "epoch": 0.09, "learning_rate": 0.00028611906755387123, "loss": 0.0311, "step": 35700 }, { "epoch": 0.09, "learning_rate": 0.00028611517933749975, "loss": 0.0286, "step": 35710 }, { "epoch": 0.09, "learning_rate": 0.00028611129112112826, "loss": 0.0324, "step": 35720 }, { "epoch": 0.09, "learning_rate": 0.00028610740290475683, "loss": 0.0299, "step": 35730 }, { "epoch": 0.09, "learning_rate": 0.00028610351468838534, "loss": 0.0268, "step": 35740 }, { "epoch": 0.09, "learning_rate": 0.0002860996264720139, "loss": 0.0258, "step": 35750 }, { "epoch": 0.09, "learning_rate": 0.00028609573825564243, "loss": 0.0281, "step": 35760 }, { "epoch": 0.09, "learning_rate": 0.00028609185003927094, "loss": 0.028, "step": 35770 }, { "epoch": 0.09, "learning_rate": 0.00028608796182289946, "loss": 0.0323, "step": 35780 }, { "epoch": 0.09, "learning_rate": 0.000286084073606528, "loss": 0.0346, "step": 35790 }, { "epoch": 0.09, "learning_rate": 0.0002860801853901566, "loss": 0.0326, "step": 35800 }, { "epoch": 0.09, "learning_rate": 0.0002860762971737851, "loss": 0.0301, "step": 35810 }, { "epoch": 0.09, "learning_rate": 0.0002860724089574136, "loss": 0.0346, "step": 35820 }, { "epoch": 0.09, "learning_rate": 0.0002860685207410422, "loss": 0.0287, "step": 35830 }, { "epoch": 0.09, "learning_rate": 0.0002860646325246707, "loss": 0.0321, "step": 35840 }, { "epoch": 0.09, "learning_rate": 0.0002860607443082992, "loss": 0.0401, "step": 35850 }, { "epoch": 0.09, "learning_rate": 0.0002860568560919278, "loss": 0.0338, "step": 35860 }, { "epoch": 0.09, "learning_rate": 0.0002860529678755563, "loss": 0.0291, "step": 35870 }, { "epoch": 0.09, "learning_rate": 0.00028604907965918487, "loss": 0.0344, "step": 35880 }, { "epoch": 0.09, "learning_rate": 0.0002860451914428134, "loss": 0.0319, "step": 35890 }, { "epoch": 0.09, "learning_rate": 0.0002860413032264419, "loss": 0.0288, "step": 35900 }, { "epoch": 0.09, "learning_rate": 0.00028603741501007047, "loss": 0.029, "step": 35910 }, { "epoch": 0.09, "learning_rate": 0.000286033526793699, "loss": 0.0317, "step": 35920 }, { "epoch": 0.09, "learning_rate": 0.0002860296385773275, "loss": 0.0317, "step": 35930 }, { "epoch": 0.09, "learning_rate": 0.00028602575036095607, "loss": 0.0344, "step": 35940 }, { "epoch": 0.09, "learning_rate": 0.00028602186214458464, "loss": 0.0313, "step": 35950 }, { "epoch": 0.09, "learning_rate": 0.00028601797392821315, "loss": 0.0289, "step": 35960 }, { "epoch": 0.09, "learning_rate": 0.00028601408571184167, "loss": 0.0288, "step": 35970 }, { "epoch": 0.09, "learning_rate": 0.0002860101974954702, "loss": 0.0304, "step": 35980 }, { "epoch": 0.09, "learning_rate": 0.0002860063092790987, "loss": 0.0291, "step": 35990 }, { "epoch": 0.09, "learning_rate": 0.00028600242106272726, "loss": 0.0372, "step": 36000 }, { "epoch": 0.09, "eval_cer": 0.8818356518319148, "eval_loss": 0.022460658103227615, "eval_runtime": 107.7073, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 36000 }, { "epoch": 0.09, "learning_rate": 0.00028599853284635583, "loss": 0.034, "step": 36010 }, { "epoch": 0.09, "learning_rate": 0.00028599464462998435, "loss": 0.032, "step": 36020 }, { "epoch": 0.09, "learning_rate": 0.00028599075641361286, "loss": 0.0327, "step": 36030 }, { "epoch": 0.09, "learning_rate": 0.00028598686819724143, "loss": 0.0305, "step": 36040 }, { "epoch": 0.09, "learning_rate": 0.00028598297998086995, "loss": 0.0342, "step": 36050 }, { "epoch": 0.09, "learning_rate": 0.00028597909176449846, "loss": 0.0327, "step": 36060 }, { "epoch": 0.09, "learning_rate": 0.00028597520354812703, "loss": 0.0262, "step": 36070 }, { "epoch": 0.09, "learning_rate": 0.00028597131533175554, "loss": 0.0342, "step": 36080 }, { "epoch": 0.09, "learning_rate": 0.0002859674271153841, "loss": 0.028, "step": 36090 }, { "epoch": 0.09, "learning_rate": 0.0002859635388990126, "loss": 0.0308, "step": 36100 }, { "epoch": 0.09, "learning_rate": 0.00028595965068264114, "loss": 0.0296, "step": 36110 }, { "epoch": 0.09, "learning_rate": 0.0002859557624662697, "loss": 0.0303, "step": 36120 }, { "epoch": 0.09, "learning_rate": 0.0002859518742498982, "loss": 0.0283, "step": 36130 }, { "epoch": 0.09, "learning_rate": 0.0002859479860335268, "loss": 0.0245, "step": 36140 }, { "epoch": 0.09, "learning_rate": 0.0002859440978171553, "loss": 0.0319, "step": 36150 }, { "epoch": 0.09, "learning_rate": 0.0002859402096007839, "loss": 0.0341, "step": 36160 }, { "epoch": 0.09, "learning_rate": 0.0002859363213844124, "loss": 0.0275, "step": 36170 }, { "epoch": 0.09, "learning_rate": 0.0002859324331680409, "loss": 0.0256, "step": 36180 }, { "epoch": 0.09, "learning_rate": 0.0002859285449516694, "loss": 0.0579, "step": 36190 }, { "epoch": 0.09, "learning_rate": 0.000285924656735298, "loss": 0.0266, "step": 36200 }, { "epoch": 0.09, "learning_rate": 0.0002859207685189265, "loss": 0.0296, "step": 36210 }, { "epoch": 0.09, "learning_rate": 0.00028591688030255507, "loss": 0.0374, "step": 36220 }, { "epoch": 0.09, "learning_rate": 0.0002859129920861836, "loss": 0.0298, "step": 36230 }, { "epoch": 0.09, "learning_rate": 0.0002859091038698121, "loss": 0.0305, "step": 36240 }, { "epoch": 0.09, "learning_rate": 0.00028590521565344067, "loss": 0.0346, "step": 36250 }, { "epoch": 0.09, "learning_rate": 0.0002859013274370692, "loss": 0.028, "step": 36260 }, { "epoch": 0.09, "learning_rate": 0.0002858974392206977, "loss": 0.031, "step": 36270 }, { "epoch": 0.09, "learning_rate": 0.00028589355100432627, "loss": 0.025, "step": 36280 }, { "epoch": 0.09, "learning_rate": 0.00028588966278795484, "loss": 0.0344, "step": 36290 }, { "epoch": 0.09, "learning_rate": 0.00028588577457158335, "loss": 0.0286, "step": 36300 }, { "epoch": 0.09, "learning_rate": 0.00028588188635521187, "loss": 0.0284, "step": 36310 }, { "epoch": 0.09, "learning_rate": 0.0002858779981388404, "loss": 0.0237, "step": 36320 }, { "epoch": 0.09, "learning_rate": 0.00028587410992246895, "loss": 0.0293, "step": 36330 }, { "epoch": 0.09, "learning_rate": 0.00028587022170609746, "loss": 0.0281, "step": 36340 }, { "epoch": 0.09, "learning_rate": 0.00028586633348972603, "loss": 0.0276, "step": 36350 }, { "epoch": 0.09, "learning_rate": 0.00028586244527335455, "loss": 0.0321, "step": 36360 }, { "epoch": 0.09, "learning_rate": 0.0002858585570569831, "loss": 0.0316, "step": 36370 }, { "epoch": 0.09, "learning_rate": 0.00028585466884061163, "loss": 0.0259, "step": 36380 }, { "epoch": 0.09, "learning_rate": 0.00028585078062424014, "loss": 0.0289, "step": 36390 }, { "epoch": 0.09, "learning_rate": 0.00028584689240786866, "loss": 0.0255, "step": 36400 }, { "epoch": 0.09, "learning_rate": 0.00028584300419149723, "loss": 0.0272, "step": 36410 }, { "epoch": 0.09, "learning_rate": 0.00028583911597512574, "loss": 0.0289, "step": 36420 }, { "epoch": 0.09, "learning_rate": 0.0002858352277587543, "loss": 0.0277, "step": 36430 }, { "epoch": 0.09, "learning_rate": 0.0002858313395423828, "loss": 0.0284, "step": 36440 }, { "epoch": 0.09, "learning_rate": 0.0002858274513260114, "loss": 0.0298, "step": 36450 }, { "epoch": 0.09, "learning_rate": 0.0002858235631096399, "loss": 0.026, "step": 36460 }, { "epoch": 0.09, "learning_rate": 0.0002858196748932684, "loss": 0.0295, "step": 36470 }, { "epoch": 0.09, "learning_rate": 0.00028581578667689694, "loss": 0.0297, "step": 36480 }, { "epoch": 0.09, "learning_rate": 0.0002858118984605255, "loss": 0.0267, "step": 36490 }, { "epoch": 0.09, "learning_rate": 0.0002858080102441541, "loss": 0.0366, "step": 36500 }, { "epoch": 0.09, "learning_rate": 0.0002858041220277826, "loss": 0.0315, "step": 36510 }, { "epoch": 0.09, "learning_rate": 0.0002858002338114111, "loss": 0.0275, "step": 36520 }, { "epoch": 0.09, "learning_rate": 0.0002857963455950396, "loss": 0.0272, "step": 36530 }, { "epoch": 0.09, "learning_rate": 0.0002857924573786682, "loss": 0.032, "step": 36540 }, { "epoch": 0.09, "learning_rate": 0.0002857885691622967, "loss": 0.0262, "step": 36550 }, { "epoch": 0.09, "learning_rate": 0.00028578468094592527, "loss": 0.0332, "step": 36560 }, { "epoch": 0.09, "learning_rate": 0.0002857807927295538, "loss": 0.0296, "step": 36570 }, { "epoch": 0.09, "learning_rate": 0.00028577690451318235, "loss": 0.0298, "step": 36580 }, { "epoch": 0.09, "learning_rate": 0.00028577301629681087, "loss": 0.0333, "step": 36590 }, { "epoch": 0.09, "learning_rate": 0.0002857691280804394, "loss": 0.0276, "step": 36600 }, { "epoch": 0.09, "learning_rate": 0.0002857652398640679, "loss": 0.034, "step": 36610 }, { "epoch": 0.09, "learning_rate": 0.00028576135164769647, "loss": 0.0351, "step": 36620 }, { "epoch": 0.09, "learning_rate": 0.000285757463431325, "loss": 0.032, "step": 36630 }, { "epoch": 0.09, "learning_rate": 0.00028575357521495355, "loss": 0.0305, "step": 36640 }, { "epoch": 0.1, "learning_rate": 0.00028574968699858206, "loss": 0.0288, "step": 36650 }, { "epoch": 0.1, "learning_rate": 0.00028574579878221063, "loss": 0.0332, "step": 36660 }, { "epoch": 0.1, "learning_rate": 0.00028574191056583915, "loss": 0.0299, "step": 36670 }, { "epoch": 0.1, "learning_rate": 0.00028573802234946766, "loss": 0.0318, "step": 36680 }, { "epoch": 0.1, "learning_rate": 0.00028573413413309623, "loss": 0.0247, "step": 36690 }, { "epoch": 0.1, "learning_rate": 0.00028573024591672475, "loss": 0.0333, "step": 36700 }, { "epoch": 0.1, "learning_rate": 0.0002857263577003533, "loss": 0.0323, "step": 36710 }, { "epoch": 0.1, "learning_rate": 0.00028572246948398183, "loss": 0.0277, "step": 36720 }, { "epoch": 0.1, "learning_rate": 0.00028571858126761034, "loss": 0.03, "step": 36730 }, { "epoch": 0.1, "learning_rate": 0.00028571469305123886, "loss": 0.0312, "step": 36740 }, { "epoch": 0.1, "learning_rate": 0.0002857108048348674, "loss": 0.0307, "step": 36750 }, { "epoch": 0.1, "learning_rate": 0.00028570691661849594, "loss": 0.0284, "step": 36760 }, { "epoch": 0.1, "learning_rate": 0.0002857030284021245, "loss": 0.029, "step": 36770 }, { "epoch": 0.1, "learning_rate": 0.000285699140185753, "loss": 0.0252, "step": 36780 }, { "epoch": 0.1, "learning_rate": 0.0002856952519693816, "loss": 0.0301, "step": 36790 }, { "epoch": 0.1, "learning_rate": 0.0002856913637530101, "loss": 0.0351, "step": 36800 }, { "epoch": 0.1, "learning_rate": 0.0002856874755366386, "loss": 0.033, "step": 36810 }, { "epoch": 0.1, "learning_rate": 0.00028568358732026714, "loss": 0.0307, "step": 36820 }, { "epoch": 0.1, "learning_rate": 0.0002856796991038957, "loss": 0.0361, "step": 36830 }, { "epoch": 0.1, "learning_rate": 0.0002856758108875243, "loss": 0.0343, "step": 36840 }, { "epoch": 0.1, "learning_rate": 0.0002856719226711528, "loss": 0.0289, "step": 36850 }, { "epoch": 0.1, "learning_rate": 0.0002856680344547813, "loss": 0.0337, "step": 36860 }, { "epoch": 0.1, "learning_rate": 0.00028566414623840987, "loss": 0.0312, "step": 36870 }, { "epoch": 0.1, "learning_rate": 0.0002856602580220384, "loss": 0.0296, "step": 36880 }, { "epoch": 0.1, "learning_rate": 0.0002856563698056669, "loss": 0.0514, "step": 36890 }, { "epoch": 0.1, "learning_rate": 0.00028565248158929547, "loss": 0.0326, "step": 36900 }, { "epoch": 0.1, "learning_rate": 0.000285648593372924, "loss": 0.033, "step": 36910 }, { "epoch": 0.1, "learning_rate": 0.00028564470515655255, "loss": 0.0338, "step": 36920 }, { "epoch": 0.1, "learning_rate": 0.00028564081694018107, "loss": 0.0336, "step": 36930 }, { "epoch": 0.1, "learning_rate": 0.0002856369287238096, "loss": 0.031, "step": 36940 }, { "epoch": 0.1, "learning_rate": 0.00028563304050743815, "loss": 0.0262, "step": 36950 }, { "epoch": 0.1, "learning_rate": 0.00028562915229106666, "loss": 0.032, "step": 36960 }, { "epoch": 0.1, "learning_rate": 0.0002856252640746952, "loss": 0.0305, "step": 36970 }, { "epoch": 0.1, "learning_rate": 0.00028562137585832375, "loss": 0.0383, "step": 36980 }, { "epoch": 0.1, "learning_rate": 0.00028561748764195226, "loss": 0.0298, "step": 36990 }, { "epoch": 0.1, "learning_rate": 0.00028561359942558083, "loss": 0.03, "step": 37000 }, { "epoch": 0.1, "eval_cer": 0.8817502739789299, "eval_loss": 0.02250346727669239, "eval_runtime": 107.7374, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 37000 }, { "epoch": 0.1, "learning_rate": 0.00028560971120920935, "loss": 0.0322, "step": 37010 }, { "epoch": 0.1, "learning_rate": 0.00028560582299283786, "loss": 0.0336, "step": 37020 }, { "epoch": 0.1, "learning_rate": 0.0002856019347764664, "loss": 0.0268, "step": 37030 }, { "epoch": 0.1, "learning_rate": 0.00028559804656009494, "loss": 0.0301, "step": 37040 }, { "epoch": 0.1, "learning_rate": 0.0002855941583437235, "loss": 0.0341, "step": 37050 }, { "epoch": 0.1, "learning_rate": 0.00028559027012735203, "loss": 0.0292, "step": 37060 }, { "epoch": 0.1, "learning_rate": 0.00028558638191098054, "loss": 0.0333, "step": 37070 }, { "epoch": 0.1, "learning_rate": 0.0002855824936946091, "loss": 0.0304, "step": 37080 }, { "epoch": 0.1, "learning_rate": 0.0002855786054782376, "loss": 0.0321, "step": 37090 }, { "epoch": 0.1, "learning_rate": 0.00028557471726186614, "loss": 0.0288, "step": 37100 }, { "epoch": 0.1, "learning_rate": 0.0002855708290454947, "loss": 0.0275, "step": 37110 }, { "epoch": 0.1, "learning_rate": 0.0002855669408291232, "loss": 0.0328, "step": 37120 }, { "epoch": 0.1, "learning_rate": 0.0002855630526127518, "loss": 0.0338, "step": 37130 }, { "epoch": 0.1, "learning_rate": 0.0002855591643963803, "loss": 0.0276, "step": 37140 }, { "epoch": 0.1, "learning_rate": 0.0002855552761800088, "loss": 0.032, "step": 37150 }, { "epoch": 0.1, "learning_rate": 0.0002855513879636374, "loss": 0.0378, "step": 37160 }, { "epoch": 0.1, "learning_rate": 0.0002855474997472659, "loss": 0.0328, "step": 37170 }, { "epoch": 0.1, "learning_rate": 0.0002855436115308944, "loss": 0.032, "step": 37180 }, { "epoch": 0.1, "learning_rate": 0.000285539723314523, "loss": 0.032, "step": 37190 }, { "epoch": 0.1, "learning_rate": 0.00028553583509815156, "loss": 0.0383, "step": 37200 }, { "epoch": 0.1, "learning_rate": 0.00028553194688178007, "loss": 0.0316, "step": 37210 }, { "epoch": 0.1, "learning_rate": 0.0002855280586654086, "loss": 0.035, "step": 37220 }, { "epoch": 0.1, "learning_rate": 0.0002855241704490371, "loss": 0.0316, "step": 37230 }, { "epoch": 0.1, "learning_rate": 0.00028552028223266567, "loss": 0.027, "step": 37240 }, { "epoch": 0.1, "learning_rate": 0.0002855163940162942, "loss": 0.0265, "step": 37250 }, { "epoch": 0.1, "learning_rate": 0.00028551250579992275, "loss": 0.0335, "step": 37260 }, { "epoch": 0.1, "learning_rate": 0.00028550861758355127, "loss": 0.0256, "step": 37270 }, { "epoch": 0.1, "learning_rate": 0.0002855047293671798, "loss": 0.0276, "step": 37280 }, { "epoch": 0.1, "learning_rate": 0.00028550084115080835, "loss": 0.0314, "step": 37290 }, { "epoch": 0.1, "learning_rate": 0.00028549695293443686, "loss": 0.0337, "step": 37300 }, { "epoch": 0.1, "learning_rate": 0.0002854930647180654, "loss": 0.0308, "step": 37310 }, { "epoch": 0.1, "learning_rate": 0.00028548917650169395, "loss": 0.0299, "step": 37320 }, { "epoch": 0.1, "learning_rate": 0.0002854852882853225, "loss": 0.0302, "step": 37330 }, { "epoch": 0.1, "learning_rate": 0.00028548140006895103, "loss": 0.0315, "step": 37340 }, { "epoch": 0.1, "learning_rate": 0.00028547751185257954, "loss": 0.0273, "step": 37350 }, { "epoch": 0.1, "learning_rate": 0.00028547362363620806, "loss": 0.0298, "step": 37360 }, { "epoch": 0.1, "learning_rate": 0.00028546973541983663, "loss": 0.0329, "step": 37370 }, { "epoch": 0.1, "learning_rate": 0.00028546584720346514, "loss": 0.0343, "step": 37380 }, { "epoch": 0.1, "learning_rate": 0.0002854619589870937, "loss": 0.0472, "step": 37390 }, { "epoch": 0.1, "learning_rate": 0.0002854580707707222, "loss": 0.0341, "step": 37400 }, { "epoch": 0.1, "learning_rate": 0.0002854541825543508, "loss": 0.0344, "step": 37410 }, { "epoch": 0.1, "learning_rate": 0.0002854502943379793, "loss": 0.031, "step": 37420 }, { "epoch": 0.1, "learning_rate": 0.0002854464061216078, "loss": 0.0344, "step": 37430 }, { "epoch": 0.1, "learning_rate": 0.00028544251790523634, "loss": 0.0331, "step": 37440 }, { "epoch": 0.1, "learning_rate": 0.0002854386296888649, "loss": 0.0265, "step": 37450 }, { "epoch": 0.1, "learning_rate": 0.0002854347414724934, "loss": 0.0249, "step": 37460 }, { "epoch": 0.1, "learning_rate": 0.000285430853256122, "loss": 0.0341, "step": 37470 }, { "epoch": 0.1, "learning_rate": 0.0002854269650397505, "loss": 0.0334, "step": 37480 }, { "epoch": 0.1, "learning_rate": 0.000285423076823379, "loss": 0.0287, "step": 37490 }, { "epoch": 0.1, "learning_rate": 0.0002854191886070076, "loss": 0.0327, "step": 37500 }, { "epoch": 0.1, "learning_rate": 0.0002854153003906361, "loss": 0.0408, "step": 37510 }, { "epoch": 0.1, "learning_rate": 0.0002854114121742646, "loss": 0.0322, "step": 37520 }, { "epoch": 0.1, "learning_rate": 0.0002854075239578932, "loss": 0.0328, "step": 37530 }, { "epoch": 0.1, "learning_rate": 0.00028540363574152175, "loss": 0.0287, "step": 37540 }, { "epoch": 0.1, "learning_rate": 0.00028539974752515027, "loss": 0.034, "step": 37550 }, { "epoch": 0.1, "learning_rate": 0.0002853958593087788, "loss": 0.0364, "step": 37560 }, { "epoch": 0.1, "learning_rate": 0.0002853919710924073, "loss": 0.0293, "step": 37570 }, { "epoch": 0.1, "learning_rate": 0.00028538808287603587, "loss": 0.0333, "step": 37580 }, { "epoch": 0.1, "learning_rate": 0.0002853841946596644, "loss": 0.0338, "step": 37590 }, { "epoch": 0.1, "learning_rate": 0.00028538030644329295, "loss": 0.0333, "step": 37600 }, { "epoch": 0.1, "learning_rate": 0.00028537641822692146, "loss": 0.0276, "step": 37610 }, { "epoch": 0.1, "learning_rate": 0.00028537253001055003, "loss": 0.0341, "step": 37620 }, { "epoch": 0.1, "learning_rate": 0.00028536864179417855, "loss": 0.0269, "step": 37630 }, { "epoch": 0.1, "learning_rate": 0.00028536475357780706, "loss": 0.0295, "step": 37640 }, { "epoch": 0.1, "learning_rate": 0.0002853608653614356, "loss": 0.0314, "step": 37650 }, { "epoch": 0.1, "learning_rate": 0.00028535697714506415, "loss": 0.0314, "step": 37660 }, { "epoch": 0.1, "learning_rate": 0.00028535308892869266, "loss": 0.0303, "step": 37670 }, { "epoch": 0.1, "learning_rate": 0.00028534920071232123, "loss": 0.0468, "step": 37680 }, { "epoch": 0.1, "learning_rate": 0.00028534531249594974, "loss": 0.0265, "step": 37690 }, { "epoch": 0.1, "learning_rate": 0.0002853414242795783, "loss": 0.0257, "step": 37700 }, { "epoch": 0.1, "learning_rate": 0.0002853375360632068, "loss": 0.0313, "step": 37710 }, { "epoch": 0.1, "learning_rate": 0.00028533364784683534, "loss": 0.0317, "step": 37720 }, { "epoch": 0.1, "learning_rate": 0.0002853297596304639, "loss": 0.0322, "step": 37730 }, { "epoch": 0.1, "learning_rate": 0.0002853258714140924, "loss": 0.0383, "step": 37740 }, { "epoch": 0.1, "learning_rate": 0.000285321983197721, "loss": 0.0301, "step": 37750 }, { "epoch": 0.1, "learning_rate": 0.0002853180949813495, "loss": 0.0298, "step": 37760 }, { "epoch": 0.1, "learning_rate": 0.000285314206764978, "loss": 0.032, "step": 37770 }, { "epoch": 0.1, "learning_rate": 0.00028531031854860654, "loss": 0.0334, "step": 37780 }, { "epoch": 0.1, "learning_rate": 0.0002853064303322351, "loss": 0.0304, "step": 37790 }, { "epoch": 0.1, "learning_rate": 0.0002853025421158636, "loss": 0.0345, "step": 37800 }, { "epoch": 0.1, "learning_rate": 0.0002852986538994922, "loss": 0.0326, "step": 37810 }, { "epoch": 0.1, "learning_rate": 0.0002852947656831207, "loss": 0.0311, "step": 37820 }, { "epoch": 0.1, "learning_rate": 0.00028529087746674927, "loss": 0.0332, "step": 37830 }, { "epoch": 0.1, "learning_rate": 0.0002852869892503778, "loss": 0.0292, "step": 37840 }, { "epoch": 0.1, "learning_rate": 0.0002852831010340063, "loss": 0.0429, "step": 37850 }, { "epoch": 0.1, "learning_rate": 0.0002852792128176348, "loss": 0.033, "step": 37860 }, { "epoch": 0.1, "learning_rate": 0.0002852753246012634, "loss": 0.0322, "step": 37870 }, { "epoch": 0.1, "learning_rate": 0.00028527143638489195, "loss": 0.0347, "step": 37880 }, { "epoch": 0.1, "learning_rate": 0.00028526754816852047, "loss": 0.0276, "step": 37890 }, { "epoch": 0.1, "learning_rate": 0.000285263659952149, "loss": 0.0364, "step": 37900 }, { "epoch": 0.1, "learning_rate": 0.00028525977173577755, "loss": 0.0331, "step": 37910 }, { "epoch": 0.1, "learning_rate": 0.00028525588351940607, "loss": 0.0336, "step": 37920 }, { "epoch": 0.1, "learning_rate": 0.0002852519953030346, "loss": 0.0293, "step": 37930 }, { "epoch": 0.1, "learning_rate": 0.00028524810708666315, "loss": 0.028, "step": 37940 }, { "epoch": 0.1, "learning_rate": 0.00028524421887029166, "loss": 0.035, "step": 37950 }, { "epoch": 0.1, "learning_rate": 0.00028524033065392023, "loss": 0.0305, "step": 37960 }, { "epoch": 0.1, "learning_rate": 0.00028523644243754875, "loss": 0.0321, "step": 37970 }, { "epoch": 0.1, "learning_rate": 0.00028523255422117726, "loss": 0.0342, "step": 37980 }, { "epoch": 0.1, "learning_rate": 0.0002852286660048058, "loss": 0.0324, "step": 37990 }, { "epoch": 0.1, "learning_rate": 0.00028522477778843434, "loss": 0.0355, "step": 38000 }, { "epoch": 0.1, "eval_cer": 0.8817740678068109, "eval_loss": 0.021771151572465897, "eval_runtime": 107.8634, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 38000 }, { "epoch": 0.1, "learning_rate": 0.00028522088957206286, "loss": 0.0256, "step": 38010 }, { "epoch": 0.1, "learning_rate": 0.00028521700135569143, "loss": 0.0292, "step": 38020 }, { "epoch": 0.1, "learning_rate": 0.00028521311313931994, "loss": 0.0239, "step": 38030 }, { "epoch": 0.1, "learning_rate": 0.0002852092249229485, "loss": 0.0332, "step": 38040 }, { "epoch": 0.1, "learning_rate": 0.000285205336706577, "loss": 0.0325, "step": 38050 }, { "epoch": 0.1, "learning_rate": 0.00028520144849020554, "loss": 0.0322, "step": 38060 }, { "epoch": 0.1, "learning_rate": 0.00028519756027383405, "loss": 0.0298, "step": 38070 }, { "epoch": 0.1, "learning_rate": 0.0002851936720574626, "loss": 0.031, "step": 38080 }, { "epoch": 0.1, "learning_rate": 0.0002851897838410912, "loss": 0.0345, "step": 38090 }, { "epoch": 0.1, "learning_rate": 0.0002851858956247197, "loss": 0.0301, "step": 38100 }, { "epoch": 0.1, "learning_rate": 0.0002851820074083482, "loss": 0.0325, "step": 38110 }, { "epoch": 0.1, "learning_rate": 0.0002851781191919768, "loss": 0.0318, "step": 38120 }, { "epoch": 0.1, "learning_rate": 0.0002851742309756053, "loss": 0.0281, "step": 38130 }, { "epoch": 0.1, "learning_rate": 0.0002851703427592338, "loss": 0.0284, "step": 38140 }, { "epoch": 0.1, "learning_rate": 0.0002851664545428624, "loss": 0.0275, "step": 38150 }, { "epoch": 0.1, "learning_rate": 0.0002851625663264909, "loss": 0.0334, "step": 38160 }, { "epoch": 0.1, "learning_rate": 0.00028515867811011947, "loss": 0.0368, "step": 38170 }, { "epoch": 0.1, "learning_rate": 0.000285154789893748, "loss": 0.0311, "step": 38180 }, { "epoch": 0.1, "learning_rate": 0.0002851509016773765, "loss": 0.0318, "step": 38190 }, { "epoch": 0.1, "learning_rate": 0.00028514701346100507, "loss": 0.0351, "step": 38200 }, { "epoch": 0.1, "learning_rate": 0.0002851431252446336, "loss": 0.0384, "step": 38210 }, { "epoch": 0.1, "learning_rate": 0.0002851392370282621, "loss": 0.0378, "step": 38220 }, { "epoch": 0.1, "learning_rate": 0.00028513534881189067, "loss": 0.0335, "step": 38230 }, { "epoch": 0.1, "learning_rate": 0.0002851314605955192, "loss": 0.0279, "step": 38240 }, { "epoch": 0.1, "learning_rate": 0.00028512757237914775, "loss": 0.0381, "step": 38250 }, { "epoch": 0.1, "learning_rate": 0.00028512368416277626, "loss": 0.0287, "step": 38260 }, { "epoch": 0.1, "learning_rate": 0.0002851197959464048, "loss": 0.0275, "step": 38270 }, { "epoch": 0.1, "learning_rate": 0.00028511590773003335, "loss": 0.0266, "step": 38280 }, { "epoch": 0.1, "learning_rate": 0.00028511201951366186, "loss": 0.0359, "step": 38290 }, { "epoch": 0.1, "learning_rate": 0.00028510813129729043, "loss": 0.0344, "step": 38300 }, { "epoch": 0.1, "learning_rate": 0.00028510424308091895, "loss": 0.0307, "step": 38310 }, { "epoch": 0.1, "learning_rate": 0.00028510035486454746, "loss": 0.0303, "step": 38320 }, { "epoch": 0.1, "learning_rate": 0.00028509646664817603, "loss": 0.0276, "step": 38330 }, { "epoch": 0.1, "learning_rate": 0.00028509257843180454, "loss": 0.0309, "step": 38340 }, { "epoch": 0.1, "learning_rate": 0.00028508869021543306, "loss": 0.0281, "step": 38350 }, { "epoch": 0.1, "learning_rate": 0.0002850848019990616, "loss": 0.0303, "step": 38360 }, { "epoch": 0.1, "learning_rate": 0.00028508091378269014, "loss": 0.0337, "step": 38370 }, { "epoch": 0.1, "learning_rate": 0.0002850770255663187, "loss": 0.0322, "step": 38380 }, { "epoch": 0.1, "learning_rate": 0.0002850731373499472, "loss": 0.0342, "step": 38390 }, { "epoch": 0.1, "learning_rate": 0.00028506924913357574, "loss": 0.0296, "step": 38400 }, { "epoch": 0.1, "learning_rate": 0.0002850653609172043, "loss": 0.0332, "step": 38410 }, { "epoch": 0.1, "learning_rate": 0.0002850614727008328, "loss": 0.0285, "step": 38420 }, { "epoch": 0.1, "learning_rate": 0.0002850575844844614, "loss": 0.0282, "step": 38430 }, { "epoch": 0.1, "learning_rate": 0.0002850536962680899, "loss": 0.0321, "step": 38440 }, { "epoch": 0.1, "learning_rate": 0.0002850498080517185, "loss": 0.0287, "step": 38450 }, { "epoch": 0.1, "learning_rate": 0.000285045919835347, "loss": 0.033, "step": 38460 }, { "epoch": 0.1, "learning_rate": 0.0002850420316189755, "loss": 0.0252, "step": 38470 }, { "epoch": 0.1, "learning_rate": 0.000285038143402604, "loss": 0.0287, "step": 38480 }, { "epoch": 0.1, "learning_rate": 0.0002850342551862326, "loss": 0.0332, "step": 38490 }, { "epoch": 0.1, "learning_rate": 0.0002850303669698611, "loss": 0.0268, "step": 38500 }, { "epoch": 0.1, "learning_rate": 0.00028502647875348967, "loss": 0.0328, "step": 38510 }, { "epoch": 0.1, "learning_rate": 0.0002850225905371182, "loss": 0.0238, "step": 38520 }, { "epoch": 0.1, "learning_rate": 0.0002850187023207467, "loss": 0.0267, "step": 38530 }, { "epoch": 0.1, "learning_rate": 0.00028501481410437527, "loss": 0.0326, "step": 38540 }, { "epoch": 0.1, "learning_rate": 0.0002850109258880038, "loss": 0.0312, "step": 38550 }, { "epoch": 0.1, "learning_rate": 0.0002850070376716323, "loss": 0.0255, "step": 38560 }, { "epoch": 0.1, "learning_rate": 0.00028500314945526087, "loss": 0.0318, "step": 38570 }, { "epoch": 0.1, "learning_rate": 0.00028499926123888943, "loss": 0.0277, "step": 38580 }, { "epoch": 0.1, "learning_rate": 0.00028499537302251795, "loss": 0.03, "step": 38590 }, { "epoch": 0.1, "learning_rate": 0.00028499148480614646, "loss": 0.0332, "step": 38600 }, { "epoch": 0.1, "learning_rate": 0.000284987596589775, "loss": 0.0313, "step": 38610 }, { "epoch": 0.1, "learning_rate": 0.00028498370837340355, "loss": 0.03, "step": 38620 }, { "epoch": 0.1, "learning_rate": 0.00028497982015703206, "loss": 0.0259, "step": 38630 }, { "epoch": 0.1, "learning_rate": 0.00028497593194066063, "loss": 0.0337, "step": 38640 }, { "epoch": 0.1, "learning_rate": 0.00028497204372428914, "loss": 0.0317, "step": 38650 }, { "epoch": 0.1, "learning_rate": 0.0002849681555079177, "loss": 0.0346, "step": 38660 }, { "epoch": 0.1, "learning_rate": 0.00028496426729154623, "loss": 0.0352, "step": 38670 }, { "epoch": 0.1, "learning_rate": 0.00028496037907517474, "loss": 0.0281, "step": 38680 }, { "epoch": 0.1, "learning_rate": 0.00028495649085880326, "loss": 0.0263, "step": 38690 }, { "epoch": 0.1, "learning_rate": 0.0002849526026424318, "loss": 0.0351, "step": 38700 }, { "epoch": 0.1, "learning_rate": 0.00028494871442606034, "loss": 0.0329, "step": 38710 }, { "epoch": 0.1, "learning_rate": 0.0002849448262096889, "loss": 0.0275, "step": 38720 }, { "epoch": 0.1, "learning_rate": 0.0002849409379933174, "loss": 0.034, "step": 38730 }, { "epoch": 0.1, "learning_rate": 0.00028493704977694594, "loss": 0.0297, "step": 38740 }, { "epoch": 0.1, "learning_rate": 0.0002849331615605745, "loss": 0.0285, "step": 38750 }, { "epoch": 0.1, "learning_rate": 0.000284929273344203, "loss": 0.0289, "step": 38760 }, { "epoch": 0.1, "learning_rate": 0.00028492538512783154, "loss": 0.0331, "step": 38770 }, { "epoch": 0.1, "learning_rate": 0.0002849214969114601, "loss": 0.0282, "step": 38780 }, { "epoch": 0.1, "learning_rate": 0.0002849176086950887, "loss": 0.0304, "step": 38790 }, { "epoch": 0.1, "learning_rate": 0.0002849137204787172, "loss": 0.0279, "step": 38800 }, { "epoch": 0.1, "learning_rate": 0.0002849098322623457, "loss": 0.0342, "step": 38810 }, { "epoch": 0.1, "learning_rate": 0.0002849059440459742, "loss": 0.0346, "step": 38820 }, { "epoch": 0.1, "learning_rate": 0.0002849020558296028, "loss": 0.0327, "step": 38830 }, { "epoch": 0.1, "learning_rate": 0.0002848981676132313, "loss": 0.0335, "step": 38840 }, { "epoch": 0.1, "learning_rate": 0.00028489427939685987, "loss": 0.0272, "step": 38850 }, { "epoch": 0.1, "learning_rate": 0.0002848903911804884, "loss": 0.027, "step": 38860 }, { "epoch": 0.1, "learning_rate": 0.00028488650296411695, "loss": 0.0305, "step": 38870 }, { "epoch": 0.1, "learning_rate": 0.00028488261474774547, "loss": 0.0309, "step": 38880 }, { "epoch": 0.1, "learning_rate": 0.000284878726531374, "loss": 0.0306, "step": 38890 }, { "epoch": 0.1, "learning_rate": 0.0002848748383150025, "loss": 0.0338, "step": 38900 }, { "epoch": 0.1, "learning_rate": 0.00028487095009863106, "loss": 0.0293, "step": 38910 }, { "epoch": 0.1, "learning_rate": 0.0002848670618822596, "loss": 0.0275, "step": 38920 }, { "epoch": 0.1, "learning_rate": 0.00028486317366588815, "loss": 0.0313, "step": 38930 }, { "epoch": 0.1, "learning_rate": 0.00028485928544951666, "loss": 0.0314, "step": 38940 }, { "epoch": 0.1, "learning_rate": 0.00028485539723314523, "loss": 0.0304, "step": 38950 }, { "epoch": 0.1, "learning_rate": 0.00028485150901677375, "loss": 0.0325, "step": 38960 }, { "epoch": 0.1, "learning_rate": 0.00028484762080040226, "loss": 0.0333, "step": 38970 }, { "epoch": 0.1, "learning_rate": 0.00028484373258403083, "loss": 0.0292, "step": 38980 }, { "epoch": 0.1, "learning_rate": 0.00028483984436765934, "loss": 0.0328, "step": 38990 }, { "epoch": 0.1, "learning_rate": 0.0002848359561512879, "loss": 0.0246, "step": 39000 }, { "epoch": 0.1, "eval_cer": 0.8818440496535199, "eval_loss": 0.02235816977918148, "eval_runtime": 107.7775, "eval_samples_per_second": 18.557, "eval_steps_per_second": 4.639, "step": 39000 }, { "epoch": 0.1, "learning_rate": 0.0002848320679349164, "loss": 0.0275, "step": 39010 }, { "epoch": 0.1, "learning_rate": 0.00028482817971854494, "loss": 0.0276, "step": 39020 }, { "epoch": 0.1, "learning_rate": 0.00028482429150217346, "loss": 0.036, "step": 39030 }, { "epoch": 0.1, "learning_rate": 0.000284820403285802, "loss": 0.0324, "step": 39040 }, { "epoch": 0.1, "learning_rate": 0.00028481651506943054, "loss": 0.0348, "step": 39050 }, { "epoch": 0.1, "learning_rate": 0.0002848126268530591, "loss": 0.0296, "step": 39060 }, { "epoch": 0.1, "learning_rate": 0.0002848087386366876, "loss": 0.0348, "step": 39070 }, { "epoch": 0.1, "learning_rate": 0.0002848048504203162, "loss": 0.0315, "step": 39080 }, { "epoch": 0.1, "learning_rate": 0.0002848009622039447, "loss": 0.0303, "step": 39090 }, { "epoch": 0.1, "learning_rate": 0.0002847970739875732, "loss": 0.0276, "step": 39100 }, { "epoch": 0.1, "learning_rate": 0.00028479318577120173, "loss": 0.0277, "step": 39110 }, { "epoch": 0.1, "learning_rate": 0.0002847892975548303, "loss": 0.0327, "step": 39120 }, { "epoch": 0.1, "learning_rate": 0.00028478540933845887, "loss": 0.0329, "step": 39130 }, { "epoch": 0.1, "learning_rate": 0.0002847815211220874, "loss": 0.0293, "step": 39140 }, { "epoch": 0.1, "learning_rate": 0.0002847776329057159, "loss": 0.0371, "step": 39150 }, { "epoch": 0.1, "learning_rate": 0.00028477374468934447, "loss": 0.0287, "step": 39160 }, { "epoch": 0.1, "learning_rate": 0.000284769856472973, "loss": 0.0404, "step": 39170 }, { "epoch": 0.1, "learning_rate": 0.0002847659682566015, "loss": 0.0294, "step": 39180 }, { "epoch": 0.1, "learning_rate": 0.00028476208004023007, "loss": 0.0288, "step": 39190 }, { "epoch": 0.1, "learning_rate": 0.0002847581918238586, "loss": 0.0261, "step": 39200 }, { "epoch": 0.1, "learning_rate": 0.00028475430360748715, "loss": 0.0405, "step": 39210 }, { "epoch": 0.1, "learning_rate": 0.00028475041539111567, "loss": 0.0286, "step": 39220 }, { "epoch": 0.1, "learning_rate": 0.0002847465271747442, "loss": 0.03, "step": 39230 }, { "epoch": 0.1, "learning_rate": 0.0002847426389583727, "loss": 0.0284, "step": 39240 }, { "epoch": 0.1, "learning_rate": 0.00028473875074200126, "loss": 0.0267, "step": 39250 }, { "epoch": 0.1, "learning_rate": 0.0002847348625256298, "loss": 0.0326, "step": 39260 }, { "epoch": 0.1, "learning_rate": 0.00028473097430925835, "loss": 0.0301, "step": 39270 }, { "epoch": 0.1, "learning_rate": 0.00028472708609288686, "loss": 0.0312, "step": 39280 }, { "epoch": 0.1, "learning_rate": 0.00028472319787651543, "loss": 0.0335, "step": 39290 }, { "epoch": 0.1, "learning_rate": 0.00028471930966014394, "loss": 0.0272, "step": 39300 }, { "epoch": 0.1, "learning_rate": 0.00028471542144377246, "loss": 0.0278, "step": 39310 }, { "epoch": 0.1, "learning_rate": 0.00028471153322740103, "loss": 0.0315, "step": 39320 }, { "epoch": 0.1, "learning_rate": 0.00028470764501102954, "loss": 0.0341, "step": 39330 }, { "epoch": 0.1, "learning_rate": 0.0002847037567946581, "loss": 0.0305, "step": 39340 }, { "epoch": 0.1, "learning_rate": 0.0002846998685782866, "loss": 0.0275, "step": 39350 }, { "epoch": 0.1, "learning_rate": 0.00028469598036191514, "loss": 0.03, "step": 39360 }, { "epoch": 0.1, "learning_rate": 0.0002846920921455437, "loss": 0.0229, "step": 39370 }, { "epoch": 0.1, "learning_rate": 0.0002846882039291722, "loss": 0.0297, "step": 39380 }, { "epoch": 0.1, "learning_rate": 0.00028468431571280074, "loss": 0.0358, "step": 39390 }, { "epoch": 0.1, "learning_rate": 0.0002846804274964293, "loss": 0.031, "step": 39400 }, { "epoch": 0.1, "learning_rate": 0.0002846765392800578, "loss": 0.0367, "step": 39410 }, { "epoch": 0.1, "learning_rate": 0.0002846726510636864, "loss": 0.0347, "step": 39420 }, { "epoch": 0.1, "learning_rate": 0.0002846687628473149, "loss": 0.0286, "step": 39430 }, { "epoch": 0.1, "learning_rate": 0.0002846648746309434, "loss": 0.0445, "step": 39440 }, { "epoch": 0.1, "learning_rate": 0.00028466098641457193, "loss": 0.0323, "step": 39450 }, { "epoch": 0.1, "learning_rate": 0.0002846570981982005, "loss": 0.0269, "step": 39460 }, { "epoch": 0.1, "learning_rate": 0.00028465320998182907, "loss": 0.0386, "step": 39470 }, { "epoch": 0.1, "learning_rate": 0.0002846493217654576, "loss": 0.033, "step": 39480 }, { "epoch": 0.1, "learning_rate": 0.0002846454335490861, "loss": 0.0264, "step": 39490 }, { "epoch": 0.1, "learning_rate": 0.00028464154533271467, "loss": 0.0302, "step": 39500 }, { "epoch": 0.1, "learning_rate": 0.0002846376571163432, "loss": 0.0324, "step": 39510 }, { "epoch": 0.1, "learning_rate": 0.0002846337688999717, "loss": 0.0285, "step": 39520 }, { "epoch": 0.1, "learning_rate": 0.00028462988068360027, "loss": 0.0301, "step": 39530 }, { "epoch": 0.1, "learning_rate": 0.0002846259924672288, "loss": 0.029, "step": 39540 }, { "epoch": 0.1, "learning_rate": 0.00028462210425085735, "loss": 0.0306, "step": 39550 }, { "epoch": 0.1, "learning_rate": 0.00028461821603448586, "loss": 0.0271, "step": 39560 }, { "epoch": 0.1, "learning_rate": 0.0002846143278181144, "loss": 0.0278, "step": 39570 }, { "epoch": 0.1, "learning_rate": 0.00028461043960174295, "loss": 0.0255, "step": 39580 }, { "epoch": 0.1, "learning_rate": 0.00028460655138537146, "loss": 0.0313, "step": 39590 }, { "epoch": 0.1, "learning_rate": 0.000284602663169, "loss": 0.0303, "step": 39600 }, { "epoch": 0.1, "learning_rate": 0.00028459877495262855, "loss": 0.0315, "step": 39610 }, { "epoch": 0.1, "learning_rate": 0.0002845948867362571, "loss": 0.0272, "step": 39620 }, { "epoch": 0.1, "learning_rate": 0.00028459099851988563, "loss": 0.0344, "step": 39630 }, { "epoch": 0.1, "learning_rate": 0.00028458711030351414, "loss": 0.0323, "step": 39640 }, { "epoch": 0.1, "learning_rate": 0.00028458322208714266, "loss": 0.0306, "step": 39650 }, { "epoch": 0.1, "learning_rate": 0.0002845793338707712, "loss": 0.0327, "step": 39660 }, { "epoch": 0.1, "learning_rate": 0.00028457544565439974, "loss": 0.0354, "step": 39670 }, { "epoch": 0.1, "learning_rate": 0.0002845715574380283, "loss": 0.034, "step": 39680 }, { "epoch": 0.1, "learning_rate": 0.0002845676692216568, "loss": 0.0307, "step": 39690 }, { "epoch": 0.1, "learning_rate": 0.00028456378100528534, "loss": 0.027, "step": 39700 }, { "epoch": 0.1, "learning_rate": 0.0002845598927889139, "loss": 0.0289, "step": 39710 }, { "epoch": 0.1, "learning_rate": 0.0002845560045725424, "loss": 0.0325, "step": 39720 }, { "epoch": 0.1, "learning_rate": 0.00028455211635617094, "loss": 0.0302, "step": 39730 }, { "epoch": 0.1, "learning_rate": 0.0002845482281397995, "loss": 0.0358, "step": 39740 }, { "epoch": 0.1, "learning_rate": 0.000284544339923428, "loss": 0.0296, "step": 39750 }, { "epoch": 0.1, "learning_rate": 0.0002845404517070566, "loss": 0.0301, "step": 39760 }, { "epoch": 0.1, "learning_rate": 0.0002845365634906851, "loss": 0.0334, "step": 39770 }, { "epoch": 0.1, "learning_rate": 0.0002845326752743136, "loss": 0.0274, "step": 39780 }, { "epoch": 0.1, "learning_rate": 0.0002845287870579422, "loss": 0.0336, "step": 39790 }, { "epoch": 0.1, "learning_rate": 0.0002845248988415707, "loss": 0.0319, "step": 39800 }, { "epoch": 0.1, "learning_rate": 0.0002845210106251992, "loss": 0.0263, "step": 39810 }, { "epoch": 0.1, "learning_rate": 0.0002845171224088278, "loss": 0.0309, "step": 39820 }, { "epoch": 0.1, "learning_rate": 0.00028451323419245635, "loss": 0.0287, "step": 39830 }, { "epoch": 0.1, "learning_rate": 0.00028450934597608487, "loss": 0.0281, "step": 39840 }, { "epoch": 0.1, "learning_rate": 0.0002845054577597134, "loss": 0.0271, "step": 39850 }, { "epoch": 0.1, "learning_rate": 0.0002845015695433419, "loss": 0.0331, "step": 39860 }, { "epoch": 0.1, "learning_rate": 0.00028449768132697047, "loss": 0.0324, "step": 39870 }, { "epoch": 0.1, "learning_rate": 0.000284493793110599, "loss": 0.0356, "step": 39880 }, { "epoch": 0.1, "learning_rate": 0.00028448990489422755, "loss": 0.0268, "step": 39890 }, { "epoch": 0.1, "learning_rate": 0.00028448601667785606, "loss": 0.0351, "step": 39900 }, { "epoch": 0.1, "learning_rate": 0.00028448212846148463, "loss": 0.0314, "step": 39910 }, { "epoch": 0.1, "learning_rate": 0.00028447824024511315, "loss": 0.0313, "step": 39920 }, { "epoch": 0.1, "learning_rate": 0.00028447435202874166, "loss": 0.0259, "step": 39930 }, { "epoch": 0.1, "learning_rate": 0.0002844704638123702, "loss": 0.0296, "step": 39940 }, { "epoch": 0.1, "learning_rate": 0.00028446657559599874, "loss": 0.0262, "step": 39950 }, { "epoch": 0.1, "learning_rate": 0.00028446268737962726, "loss": 0.0349, "step": 39960 }, { "epoch": 0.1, "learning_rate": 0.00028445879916325583, "loss": 0.0335, "step": 39970 }, { "epoch": 0.1, "learning_rate": 0.00028445491094688434, "loss": 0.0311, "step": 39980 }, { "epoch": 0.1, "learning_rate": 0.00028445102273051286, "loss": 0.027, "step": 39990 }, { "epoch": 0.1, "learning_rate": 0.0002844471345141414, "loss": 0.026, "step": 40000 }, { "epoch": 0.1, "eval_cer": 0.8818636445705984, "eval_loss": 0.021385852247476578, "eval_runtime": 107.7355, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 40000 }, { "epoch": 0.1, "learning_rate": 0.00028444324629776994, "loss": 0.0295, "step": 40010 }, { "epoch": 0.1, "learning_rate": 0.0002844393580813985, "loss": 0.0276, "step": 40020 }, { "epoch": 0.1, "learning_rate": 0.000284435469865027, "loss": 0.0319, "step": 40030 }, { "epoch": 0.1, "learning_rate": 0.0002844315816486556, "loss": 0.0306, "step": 40040 }, { "epoch": 0.1, "learning_rate": 0.0002844276934322841, "loss": 0.028, "step": 40050 }, { "epoch": 0.1, "learning_rate": 0.0002844238052159126, "loss": 0.0282, "step": 40060 }, { "epoch": 0.1, "learning_rate": 0.00028441991699954114, "loss": 0.0311, "step": 40070 }, { "epoch": 0.1, "learning_rate": 0.0002844160287831697, "loss": 0.0329, "step": 40080 }, { "epoch": 0.1, "learning_rate": 0.0002844121405667982, "loss": 0.0337, "step": 40090 }, { "epoch": 0.1, "learning_rate": 0.0002844082523504268, "loss": 0.0276, "step": 40100 }, { "epoch": 0.1, "learning_rate": 0.0002844043641340553, "loss": 0.0268, "step": 40110 }, { "epoch": 0.1, "learning_rate": 0.00028440047591768387, "loss": 0.0316, "step": 40120 }, { "epoch": 0.1, "learning_rate": 0.0002843965877013124, "loss": 0.0298, "step": 40130 }, { "epoch": 0.1, "learning_rate": 0.0002843926994849409, "loss": 0.0266, "step": 40140 }, { "epoch": 0.1, "learning_rate": 0.0002843888112685694, "loss": 0.0247, "step": 40150 }, { "epoch": 0.1, "learning_rate": 0.000284384923052198, "loss": 0.0309, "step": 40160 }, { "epoch": 0.1, "learning_rate": 0.00028438103483582655, "loss": 0.0235, "step": 40170 }, { "epoch": 0.1, "learning_rate": 0.00028437714661945507, "loss": 0.0284, "step": 40180 }, { "epoch": 0.1, "learning_rate": 0.0002843732584030836, "loss": 0.0255, "step": 40190 }, { "epoch": 0.1, "learning_rate": 0.0002843693701867121, "loss": 0.0324, "step": 40200 }, { "epoch": 0.1, "learning_rate": 0.00028436548197034066, "loss": 0.0328, "step": 40210 }, { "epoch": 0.1, "learning_rate": 0.0002843615937539692, "loss": 0.0286, "step": 40220 }, { "epoch": 0.1, "learning_rate": 0.00028435770553759775, "loss": 0.0269, "step": 40230 }, { "epoch": 0.1, "learning_rate": 0.00028435381732122626, "loss": 0.0279, "step": 40240 }, { "epoch": 0.1, "learning_rate": 0.00028434992910485483, "loss": 0.0304, "step": 40250 }, { "epoch": 0.1, "learning_rate": 0.00028434604088848335, "loss": 0.0279, "step": 40260 }, { "epoch": 0.1, "learning_rate": 0.00028434215267211186, "loss": 0.0428, "step": 40270 }, { "epoch": 0.1, "learning_rate": 0.0002843382644557404, "loss": 0.028, "step": 40280 }, { "epoch": 0.1, "learning_rate": 0.00028433437623936894, "loss": 0.0275, "step": 40290 }, { "epoch": 0.1, "learning_rate": 0.00028433048802299746, "loss": 0.0412, "step": 40300 }, { "epoch": 0.1, "learning_rate": 0.000284326599806626, "loss": 0.0324, "step": 40310 }, { "epoch": 0.1, "learning_rate": 0.00028432271159025454, "loss": 0.0407, "step": 40320 }, { "epoch": 0.1, "learning_rate": 0.0002843188233738831, "loss": 0.0344, "step": 40330 }, { "epoch": 0.1, "learning_rate": 0.0002843149351575116, "loss": 0.0359, "step": 40340 }, { "epoch": 0.1, "learning_rate": 0.00028431104694114014, "loss": 0.0333, "step": 40350 }, { "epoch": 0.1, "learning_rate": 0.00028430715872476865, "loss": 0.0334, "step": 40360 }, { "epoch": 0.1, "learning_rate": 0.0002843032705083972, "loss": 0.0357, "step": 40370 }, { "epoch": 0.1, "learning_rate": 0.0002842993822920258, "loss": 0.0295, "step": 40380 }, { "epoch": 0.1, "learning_rate": 0.0002842954940756543, "loss": 0.0316, "step": 40390 }, { "epoch": 0.1, "learning_rate": 0.0002842916058592828, "loss": 0.0302, "step": 40400 }, { "epoch": 0.1, "learning_rate": 0.0002842877176429114, "loss": 0.0393, "step": 40410 }, { "epoch": 0.1, "learning_rate": 0.0002842838294265399, "loss": 0.0333, "step": 40420 }, { "epoch": 0.1, "learning_rate": 0.0002842799412101684, "loss": 0.0307, "step": 40430 }, { "epoch": 0.1, "learning_rate": 0.000284276052993797, "loss": 0.0377, "step": 40440 }, { "epoch": 0.1, "learning_rate": 0.0002842721647774255, "loss": 0.0407, "step": 40450 }, { "epoch": 0.1, "learning_rate": 0.00028426827656105407, "loss": 0.029, "step": 40460 }, { "epoch": 0.1, "learning_rate": 0.0002842643883446826, "loss": 0.0357, "step": 40470 }, { "epoch": 0.1, "learning_rate": 0.0002842605001283111, "loss": 0.0327, "step": 40480 }, { "epoch": 0.1, "learning_rate": 0.0002842566119119396, "loss": 0.0365, "step": 40490 }, { "epoch": 0.1, "learning_rate": 0.0002842527236955682, "loss": 0.0325, "step": 40500 }, { "epoch": 0.11, "learning_rate": 0.0002842488354791967, "loss": 0.0313, "step": 40510 }, { "epoch": 0.11, "learning_rate": 0.00028424494726282527, "loss": 0.0333, "step": 40520 }, { "epoch": 0.11, "learning_rate": 0.0002842410590464538, "loss": 0.049, "step": 40530 }, { "epoch": 0.11, "learning_rate": 0.00028423717083008235, "loss": 0.0323, "step": 40540 }, { "epoch": 0.11, "learning_rate": 0.00028423328261371086, "loss": 0.0306, "step": 40550 }, { "epoch": 0.11, "learning_rate": 0.0002842293943973394, "loss": 0.0267, "step": 40560 }, { "epoch": 0.11, "learning_rate": 0.00028422550618096795, "loss": 0.0278, "step": 40570 }, { "epoch": 0.11, "learning_rate": 0.00028422161796459646, "loss": 0.0314, "step": 40580 }, { "epoch": 0.11, "learning_rate": 0.00028421772974822503, "loss": 0.0352, "step": 40590 }, { "epoch": 0.11, "learning_rate": 0.00028421384153185354, "loss": 0.029, "step": 40600 }, { "epoch": 0.11, "learning_rate": 0.00028420995331548206, "loss": 0.027, "step": 40610 }, { "epoch": 0.11, "learning_rate": 0.00028420606509911063, "loss": 0.0341, "step": 40620 }, { "epoch": 0.11, "learning_rate": 0.00028420217688273914, "loss": 0.0319, "step": 40630 }, { "epoch": 0.11, "learning_rate": 0.00028419828866636766, "loss": 0.0291, "step": 40640 }, { "epoch": 0.11, "learning_rate": 0.0002841944004499962, "loss": 0.0287, "step": 40650 }, { "epoch": 0.11, "learning_rate": 0.0002841905122336248, "loss": 0.0222, "step": 40660 }, { "epoch": 0.11, "learning_rate": 0.0002841866240172533, "loss": 0.0276, "step": 40670 }, { "epoch": 0.11, "learning_rate": 0.0002841827358008818, "loss": 0.0278, "step": 40680 }, { "epoch": 0.11, "learning_rate": 0.00028417884758451034, "loss": 0.0241, "step": 40690 }, { "epoch": 0.11, "learning_rate": 0.00028417495936813885, "loss": 0.0363, "step": 40700 }, { "epoch": 0.11, "learning_rate": 0.0002841710711517674, "loss": 0.0301, "step": 40710 }, { "epoch": 0.11, "learning_rate": 0.000284167182935396, "loss": 0.0317, "step": 40720 }, { "epoch": 0.11, "learning_rate": 0.0002841632947190245, "loss": 0.029, "step": 40730 }, { "epoch": 0.11, "learning_rate": 0.000284159406502653, "loss": 0.0256, "step": 40740 }, { "epoch": 0.11, "learning_rate": 0.0002841555182862816, "loss": 0.0302, "step": 40750 }, { "epoch": 0.11, "learning_rate": 0.0002841516300699101, "loss": 0.0325, "step": 40760 }, { "epoch": 0.11, "learning_rate": 0.0002841477418535386, "loss": 0.0277, "step": 40770 }, { "epoch": 0.11, "learning_rate": 0.0002841438536371672, "loss": 0.0359, "step": 40780 }, { "epoch": 0.11, "learning_rate": 0.0002841399654207957, "loss": 0.0309, "step": 40790 }, { "epoch": 0.11, "learning_rate": 0.00028413607720442427, "loss": 0.0382, "step": 40800 }, { "epoch": 0.11, "learning_rate": 0.0002841321889880528, "loss": 0.0288, "step": 40810 }, { "epoch": 0.11, "learning_rate": 0.0002841283007716813, "loss": 0.0356, "step": 40820 }, { "epoch": 0.11, "learning_rate": 0.00028412441255530987, "loss": 0.0288, "step": 40830 }, { "epoch": 0.11, "learning_rate": 0.0002841205243389384, "loss": 0.0284, "step": 40840 }, { "epoch": 0.11, "learning_rate": 0.0002841166361225669, "loss": 0.0347, "step": 40850 }, { "epoch": 0.11, "learning_rate": 0.00028411274790619546, "loss": 0.0309, "step": 40860 }, { "epoch": 0.11, "learning_rate": 0.00028410885968982403, "loss": 0.031, "step": 40870 }, { "epoch": 0.11, "learning_rate": 0.00028410497147345255, "loss": 0.0314, "step": 40880 }, { "epoch": 0.11, "learning_rate": 0.00028410108325708106, "loss": 0.0338, "step": 40890 }, { "epoch": 0.11, "learning_rate": 0.0002840971950407096, "loss": 0.0299, "step": 40900 }, { "epoch": 0.11, "learning_rate": 0.00028409330682433815, "loss": 0.0261, "step": 40910 }, { "epoch": 0.11, "learning_rate": 0.00028408941860796666, "loss": 0.0303, "step": 40920 }, { "epoch": 0.11, "learning_rate": 0.00028408553039159523, "loss": 0.0382, "step": 40930 }, { "epoch": 0.11, "learning_rate": 0.00028408164217522374, "loss": 0.0284, "step": 40940 }, { "epoch": 0.11, "learning_rate": 0.00028407775395885226, "loss": 0.0329, "step": 40950 }, { "epoch": 0.11, "learning_rate": 0.0002840738657424808, "loss": 0.0319, "step": 40960 }, { "epoch": 0.11, "learning_rate": 0.00028406997752610934, "loss": 0.0302, "step": 40970 }, { "epoch": 0.11, "learning_rate": 0.00028406608930973786, "loss": 0.0452, "step": 40980 }, { "epoch": 0.11, "learning_rate": 0.0002840622010933664, "loss": 0.0274, "step": 40990 }, { "epoch": 0.11, "learning_rate": 0.00028405831287699494, "loss": 0.0318, "step": 41000 }, { "epoch": 0.11, "eval_cer": 0.8817656699852059, "eval_loss": 0.021903902292251587, "eval_runtime": 107.5953, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 41000 }, { "epoch": 0.11, "learning_rate": 0.0002840544246606235, "loss": 0.0273, "step": 41010 }, { "epoch": 0.11, "learning_rate": 0.000284050536444252, "loss": 0.0282, "step": 41020 }, { "epoch": 0.11, "learning_rate": 0.00028404664822788054, "loss": 0.0419, "step": 41030 }, { "epoch": 0.11, "learning_rate": 0.0002840427600115091, "loss": 0.0402, "step": 41040 }, { "epoch": 0.11, "learning_rate": 0.0002840388717951376, "loss": 0.0249, "step": 41050 }, { "epoch": 0.11, "learning_rate": 0.0002840349835787662, "loss": 0.0277, "step": 41060 }, { "epoch": 0.11, "learning_rate": 0.0002840310953623947, "loss": 0.0476, "step": 41070 }, { "epoch": 0.11, "learning_rate": 0.00028402720714602327, "loss": 0.0341, "step": 41080 }, { "epoch": 0.11, "learning_rate": 0.0002840233189296518, "loss": 0.029, "step": 41090 }, { "epoch": 0.11, "learning_rate": 0.0002840194307132803, "loss": 0.0277, "step": 41100 }, { "epoch": 0.11, "learning_rate": 0.0002840155424969088, "loss": 0.0313, "step": 41110 }, { "epoch": 0.11, "learning_rate": 0.0002840116542805374, "loss": 0.0384, "step": 41120 }, { "epoch": 0.11, "learning_rate": 0.0002840077660641659, "loss": 0.0338, "step": 41130 }, { "epoch": 0.11, "learning_rate": 0.00028400387784779447, "loss": 0.0266, "step": 41140 }, { "epoch": 0.11, "learning_rate": 0.000283999989631423, "loss": 0.0282, "step": 41150 }, { "epoch": 0.11, "learning_rate": 0.00028399610141505155, "loss": 0.0289, "step": 41160 }, { "epoch": 0.11, "learning_rate": 0.00028399221319868007, "loss": 0.0283, "step": 41170 }, { "epoch": 0.11, "learning_rate": 0.0002839883249823086, "loss": 0.0336, "step": 41180 }, { "epoch": 0.11, "learning_rate": 0.0002839844367659371, "loss": 0.0297, "step": 41190 }, { "epoch": 0.11, "learning_rate": 0.00028398054854956566, "loss": 0.0293, "step": 41200 }, { "epoch": 0.11, "learning_rate": 0.00028397666033319423, "loss": 0.0285, "step": 41210 }, { "epoch": 0.11, "learning_rate": 0.00028397277211682275, "loss": 0.0361, "step": 41220 }, { "epoch": 0.11, "learning_rate": 0.00028396888390045126, "loss": 0.0385, "step": 41230 }, { "epoch": 0.11, "learning_rate": 0.0002839649956840798, "loss": 0.0343, "step": 41240 }, { "epoch": 0.11, "learning_rate": 0.00028396110746770834, "loss": 0.0273, "step": 41250 }, { "epoch": 0.11, "learning_rate": 0.00028395721925133686, "loss": 0.0335, "step": 41260 }, { "epoch": 0.11, "learning_rate": 0.00028395333103496543, "loss": 0.0348, "step": 41270 }, { "epoch": 0.11, "learning_rate": 0.00028394944281859394, "loss": 0.0277, "step": 41280 }, { "epoch": 0.11, "learning_rate": 0.0002839455546022225, "loss": 0.0299, "step": 41290 }, { "epoch": 0.11, "learning_rate": 0.000283941666385851, "loss": 0.0232, "step": 41300 }, { "epoch": 0.11, "learning_rate": 0.00028393777816947954, "loss": 0.0273, "step": 41310 }, { "epoch": 0.11, "learning_rate": 0.00028393388995310805, "loss": 0.0396, "step": 41320 }, { "epoch": 0.11, "learning_rate": 0.0002839300017367366, "loss": 0.034, "step": 41330 }, { "epoch": 0.11, "learning_rate": 0.00028392611352036514, "loss": 0.0325, "step": 41340 }, { "epoch": 0.11, "learning_rate": 0.0002839222253039937, "loss": 0.0282, "step": 41350 }, { "epoch": 0.11, "learning_rate": 0.0002839183370876222, "loss": 0.0296, "step": 41360 }, { "epoch": 0.11, "learning_rate": 0.0002839144488712508, "loss": 0.0303, "step": 41370 }, { "epoch": 0.11, "learning_rate": 0.0002839105606548793, "loss": 0.0312, "step": 41380 }, { "epoch": 0.11, "learning_rate": 0.0002839066724385078, "loss": 0.0268, "step": 41390 }, { "epoch": 0.11, "learning_rate": 0.00028390278422213633, "loss": 0.0451, "step": 41400 }, { "epoch": 0.11, "learning_rate": 0.0002838988960057649, "loss": 0.0574, "step": 41410 }, { "epoch": 0.11, "learning_rate": 0.00028389500778939347, "loss": 0.0366, "step": 41420 }, { "epoch": 0.11, "learning_rate": 0.000283891119573022, "loss": 0.0339, "step": 41430 }, { "epoch": 0.11, "learning_rate": 0.0002838872313566505, "loss": 0.034, "step": 41440 }, { "epoch": 0.11, "learning_rate": 0.000283883343140279, "loss": 0.0261, "step": 41450 }, { "epoch": 0.11, "learning_rate": 0.0002838794549239076, "loss": 0.0342, "step": 41460 }, { "epoch": 0.11, "learning_rate": 0.0002838755667075361, "loss": 0.0331, "step": 41470 }, { "epoch": 0.11, "learning_rate": 0.00028387167849116467, "loss": 0.0402, "step": 41480 }, { "epoch": 0.11, "learning_rate": 0.0002838677902747932, "loss": 0.0346, "step": 41490 }, { "epoch": 0.11, "learning_rate": 0.00028386390205842175, "loss": 0.0287, "step": 41500 }, { "epoch": 0.11, "learning_rate": 0.00028386001384205026, "loss": 0.0288, "step": 41510 }, { "epoch": 0.11, "learning_rate": 0.0002838561256256788, "loss": 0.0298, "step": 41520 }, { "epoch": 0.11, "learning_rate": 0.0002838522374093073, "loss": 0.028, "step": 41530 }, { "epoch": 0.11, "learning_rate": 0.00028384834919293586, "loss": 0.0305, "step": 41540 }, { "epoch": 0.11, "learning_rate": 0.0002838444609765644, "loss": 0.0319, "step": 41550 }, { "epoch": 0.11, "learning_rate": 0.00028384057276019295, "loss": 0.0295, "step": 41560 }, { "epoch": 0.11, "learning_rate": 0.00028383668454382146, "loss": 0.0277, "step": 41570 }, { "epoch": 0.11, "learning_rate": 0.00028383279632745003, "loss": 0.0274, "step": 41580 }, { "epoch": 0.11, "learning_rate": 0.00028382890811107854, "loss": 0.032, "step": 41590 }, { "epoch": 0.11, "learning_rate": 0.00028382501989470706, "loss": 0.0369, "step": 41600 }, { "epoch": 0.11, "learning_rate": 0.0002838211316783356, "loss": 0.0296, "step": 41610 }, { "epoch": 0.11, "learning_rate": 0.00028381724346196414, "loss": 0.0256, "step": 41620 }, { "epoch": 0.11, "learning_rate": 0.0002838133552455927, "loss": 0.0282, "step": 41630 }, { "epoch": 0.11, "learning_rate": 0.0002838094670292212, "loss": 0.0269, "step": 41640 }, { "epoch": 0.11, "learning_rate": 0.00028380557881284974, "loss": 0.029, "step": 41650 }, { "epoch": 0.11, "learning_rate": 0.0002838016905964783, "loss": 0.0286, "step": 41660 }, { "epoch": 0.11, "learning_rate": 0.0002837978023801068, "loss": 0.0286, "step": 41670 }, { "epoch": 0.11, "learning_rate": 0.00028379391416373534, "loss": 0.0315, "step": 41680 }, { "epoch": 0.11, "learning_rate": 0.0002837900259473639, "loss": 0.0336, "step": 41690 }, { "epoch": 0.11, "learning_rate": 0.0002837861377309924, "loss": 0.0297, "step": 41700 }, { "epoch": 0.11, "learning_rate": 0.000283782249514621, "loss": 0.0372, "step": 41710 }, { "epoch": 0.11, "learning_rate": 0.0002837783612982495, "loss": 0.0326, "step": 41720 }, { "epoch": 0.11, "learning_rate": 0.000283774473081878, "loss": 0.0365, "step": 41730 }, { "epoch": 0.11, "learning_rate": 0.00028377058486550653, "loss": 0.0522, "step": 41740 }, { "epoch": 0.11, "learning_rate": 0.0002837666966491351, "loss": 0.0514, "step": 41750 }, { "epoch": 0.11, "learning_rate": 0.00028376280843276367, "loss": 0.0338, "step": 41760 }, { "epoch": 0.11, "learning_rate": 0.0002837589202163922, "loss": 0.0357, "step": 41770 }, { "epoch": 0.11, "learning_rate": 0.0002837550320000207, "loss": 0.0431, "step": 41780 }, { "epoch": 0.11, "learning_rate": 0.00028375114378364927, "loss": 0.0317, "step": 41790 }, { "epoch": 0.11, "learning_rate": 0.0002837472555672778, "loss": 0.0376, "step": 41800 }, { "epoch": 0.11, "learning_rate": 0.0002837433673509063, "loss": 0.0296, "step": 41810 }, { "epoch": 0.11, "learning_rate": 0.00028373947913453487, "loss": 0.0338, "step": 41820 }, { "epoch": 0.11, "learning_rate": 0.0002837355909181634, "loss": 0.0276, "step": 41830 }, { "epoch": 0.11, "learning_rate": 0.00028373170270179195, "loss": 0.0262, "step": 41840 }, { "epoch": 0.11, "learning_rate": 0.00028372781448542046, "loss": 0.0261, "step": 41850 }, { "epoch": 0.11, "learning_rate": 0.000283723926269049, "loss": 0.0226, "step": 41860 }, { "epoch": 0.11, "learning_rate": 0.00028372003805267755, "loss": 0.0252, "step": 41870 }, { "epoch": 0.11, "learning_rate": 0.00028371614983630606, "loss": 0.0305, "step": 41880 }, { "epoch": 0.11, "learning_rate": 0.0002837122616199346, "loss": 0.0301, "step": 41890 }, { "epoch": 0.11, "learning_rate": 0.00028370837340356314, "loss": 0.0268, "step": 41900 }, { "epoch": 0.11, "learning_rate": 0.0002837044851871917, "loss": 0.0303, "step": 41910 }, { "epoch": 0.11, "learning_rate": 0.00028370059697082023, "loss": 0.0286, "step": 41920 }, { "epoch": 0.11, "learning_rate": 0.00028369670875444874, "loss": 0.0286, "step": 41930 }, { "epoch": 0.11, "learning_rate": 0.00028369282053807726, "loss": 0.0263, "step": 41940 }, { "epoch": 0.11, "learning_rate": 0.00028368893232170577, "loss": 0.0313, "step": 41950 }, { "epoch": 0.11, "learning_rate": 0.00028368504410533434, "loss": 0.0275, "step": 41960 }, { "epoch": 0.11, "learning_rate": 0.0002836811558889629, "loss": 0.0372, "step": 41970 }, { "epoch": 0.11, "learning_rate": 0.0002836772676725914, "loss": 0.0287, "step": 41980 }, { "epoch": 0.11, "learning_rate": 0.00028367337945621994, "loss": 0.0279, "step": 41990 }, { "epoch": 0.11, "learning_rate": 0.0002836694912398485, "loss": 0.0328, "step": 42000 }, { "epoch": 0.11, "eval_cer": 0.8818510478381908, "eval_loss": 0.021058108657598495, "eval_runtime": 107.6507, "eval_samples_per_second": 18.579, "eval_steps_per_second": 4.645, "step": 42000 }, { "epoch": 0.11, "learning_rate": 0.000283665603023477, "loss": 0.0316, "step": 42010 }, { "epoch": 0.11, "learning_rate": 0.00028366171480710554, "loss": 0.0273, "step": 42020 }, { "epoch": 0.11, "learning_rate": 0.0002836578265907341, "loss": 0.028, "step": 42030 }, { "epoch": 0.11, "learning_rate": 0.0002836539383743626, "loss": 0.0314, "step": 42040 }, { "epoch": 0.11, "learning_rate": 0.0002836500501579912, "loss": 0.0286, "step": 42050 }, { "epoch": 0.11, "learning_rate": 0.0002836461619416197, "loss": 0.029, "step": 42060 }, { "epoch": 0.11, "learning_rate": 0.0002836422737252482, "loss": 0.0283, "step": 42070 }, { "epoch": 0.11, "learning_rate": 0.0002836383855088768, "loss": 0.0291, "step": 42080 }, { "epoch": 0.11, "learning_rate": 0.0002836344972925053, "loss": 0.0267, "step": 42090 }, { "epoch": 0.11, "learning_rate": 0.0002836306090761338, "loss": 0.0297, "step": 42100 }, { "epoch": 0.11, "learning_rate": 0.0002836267208597624, "loss": 0.0268, "step": 42110 }, { "epoch": 0.11, "learning_rate": 0.00028362283264339095, "loss": 0.0276, "step": 42120 }, { "epoch": 0.11, "learning_rate": 0.00028361894442701947, "loss": 0.0341, "step": 42130 }, { "epoch": 0.11, "learning_rate": 0.000283615056210648, "loss": 0.0344, "step": 42140 }, { "epoch": 0.11, "learning_rate": 0.0002836111679942765, "loss": 0.0328, "step": 42150 }, { "epoch": 0.11, "learning_rate": 0.00028360727977790506, "loss": 0.0322, "step": 42160 }, { "epoch": 0.11, "learning_rate": 0.0002836033915615336, "loss": 0.0313, "step": 42170 }, { "epoch": 0.11, "learning_rate": 0.00028359950334516215, "loss": 0.0338, "step": 42180 }, { "epoch": 0.11, "learning_rate": 0.00028359561512879066, "loss": 0.0277, "step": 42190 }, { "epoch": 0.11, "learning_rate": 0.0002835917269124192, "loss": 0.0323, "step": 42200 }, { "epoch": 0.11, "learning_rate": 0.00028358783869604775, "loss": 0.0229, "step": 42210 }, { "epoch": 0.11, "learning_rate": 0.00028358395047967626, "loss": 0.0256, "step": 42220 }, { "epoch": 0.11, "learning_rate": 0.0002835800622633048, "loss": 0.0296, "step": 42230 }, { "epoch": 0.11, "learning_rate": 0.00028357617404693334, "loss": 0.0357, "step": 42240 }, { "epoch": 0.11, "learning_rate": 0.0002835722858305619, "loss": 0.0308, "step": 42250 }, { "epoch": 0.11, "learning_rate": 0.0002835683976141904, "loss": 0.0284, "step": 42260 }, { "epoch": 0.11, "learning_rate": 0.00028356450939781894, "loss": 0.033, "step": 42270 }, { "epoch": 0.11, "learning_rate": 0.00028356062118144746, "loss": 0.0296, "step": 42280 }, { "epoch": 0.11, "learning_rate": 0.000283556732965076, "loss": 0.0311, "step": 42290 }, { "epoch": 0.11, "learning_rate": 0.00028355284474870454, "loss": 0.0243, "step": 42300 }, { "epoch": 0.11, "learning_rate": 0.0002835489565323331, "loss": 0.0288, "step": 42310 }, { "epoch": 0.11, "learning_rate": 0.0002835450683159616, "loss": 0.0271, "step": 42320 }, { "epoch": 0.11, "learning_rate": 0.0002835411800995902, "loss": 0.0281, "step": 42330 }, { "epoch": 0.11, "learning_rate": 0.0002835372918832187, "loss": 0.0293, "step": 42340 }, { "epoch": 0.11, "learning_rate": 0.0002835334036668472, "loss": 0.0308, "step": 42350 }, { "epoch": 0.11, "learning_rate": 0.00028352951545047573, "loss": 0.0275, "step": 42360 }, { "epoch": 0.11, "learning_rate": 0.0002835256272341043, "loss": 0.0265, "step": 42370 }, { "epoch": 0.11, "learning_rate": 0.0002835217390177328, "loss": 0.0283, "step": 42380 }, { "epoch": 0.11, "learning_rate": 0.0002835178508013614, "loss": 0.0291, "step": 42390 }, { "epoch": 0.11, "learning_rate": 0.0002835139625849899, "loss": 0.0306, "step": 42400 }, { "epoch": 0.11, "learning_rate": 0.00028351007436861847, "loss": 0.0271, "step": 42410 }, { "epoch": 0.11, "learning_rate": 0.000283506186152247, "loss": 0.034, "step": 42420 }, { "epoch": 0.11, "learning_rate": 0.0002835022979358755, "loss": 0.0371, "step": 42430 }, { "epoch": 0.11, "learning_rate": 0.000283498409719504, "loss": 0.0263, "step": 42440 }, { "epoch": 0.11, "learning_rate": 0.0002834945215031326, "loss": 0.0301, "step": 42450 }, { "epoch": 0.11, "learning_rate": 0.00028349063328676115, "loss": 0.0298, "step": 42460 }, { "epoch": 0.11, "learning_rate": 0.00028348674507038967, "loss": 0.024, "step": 42470 }, { "epoch": 0.11, "learning_rate": 0.0002834828568540182, "loss": 0.0288, "step": 42480 }, { "epoch": 0.11, "learning_rate": 0.0002834789686376467, "loss": 0.0472, "step": 42490 }, { "epoch": 0.11, "learning_rate": 0.00028347508042127526, "loss": 0.0345, "step": 42500 }, { "epoch": 0.11, "learning_rate": 0.0002834711922049038, "loss": 0.0334, "step": 42510 }, { "epoch": 0.11, "learning_rate": 0.00028346730398853235, "loss": 0.0276, "step": 42520 }, { "epoch": 0.11, "learning_rate": 0.00028346341577216086, "loss": 0.0272, "step": 42530 }, { "epoch": 0.11, "learning_rate": 0.00028345952755578943, "loss": 0.0251, "step": 42540 }, { "epoch": 0.11, "learning_rate": 0.00028345563933941794, "loss": 0.0258, "step": 42550 }, { "epoch": 0.11, "learning_rate": 0.00028345175112304646, "loss": 0.0294, "step": 42560 }, { "epoch": 0.11, "learning_rate": 0.000283447862906675, "loss": 0.0338, "step": 42570 }, { "epoch": 0.11, "learning_rate": 0.00028344397469030354, "loss": 0.0319, "step": 42580 }, { "epoch": 0.11, "learning_rate": 0.00028344008647393206, "loss": 0.0287, "step": 42590 }, { "epoch": 0.11, "learning_rate": 0.0002834361982575606, "loss": 0.0253, "step": 42600 }, { "epoch": 0.11, "learning_rate": 0.00028343231004118914, "loss": 0.031, "step": 42610 }, { "epoch": 0.11, "learning_rate": 0.0002834284218248177, "loss": 0.0294, "step": 42620 }, { "epoch": 0.11, "learning_rate": 0.0002834245336084462, "loss": 0.0276, "step": 42630 }, { "epoch": 0.11, "learning_rate": 0.00028342064539207474, "loss": 0.0299, "step": 42640 }, { "epoch": 0.11, "learning_rate": 0.0002834167571757033, "loss": 0.031, "step": 42650 }, { "epoch": 0.11, "learning_rate": 0.0002834128689593318, "loss": 0.026, "step": 42660 }, { "epoch": 0.11, "learning_rate": 0.0002834089807429604, "loss": 0.0259, "step": 42670 }, { "epoch": 0.11, "learning_rate": 0.0002834050925265889, "loss": 0.0279, "step": 42680 }, { "epoch": 0.11, "learning_rate": 0.0002834012043102174, "loss": 0.0292, "step": 42690 }, { "epoch": 0.11, "learning_rate": 0.00028339731609384593, "loss": 0.0269, "step": 42700 }, { "epoch": 0.11, "learning_rate": 0.0002833934278774745, "loss": 0.0286, "step": 42710 }, { "epoch": 0.11, "learning_rate": 0.000283389539661103, "loss": 0.0314, "step": 42720 }, { "epoch": 0.11, "learning_rate": 0.0002833856514447316, "loss": 0.0348, "step": 42730 }, { "epoch": 0.11, "learning_rate": 0.0002833817632283601, "loss": 0.0255, "step": 42740 }, { "epoch": 0.11, "learning_rate": 0.00028337787501198867, "loss": 0.0318, "step": 42750 }, { "epoch": 0.11, "learning_rate": 0.0002833739867956172, "loss": 0.0276, "step": 42760 }, { "epoch": 0.11, "learning_rate": 0.0002833700985792457, "loss": 0.0303, "step": 42770 }, { "epoch": 0.11, "learning_rate": 0.0002833662103628742, "loss": 0.0301, "step": 42780 }, { "epoch": 0.11, "learning_rate": 0.0002833623221465028, "loss": 0.0336, "step": 42790 }, { "epoch": 0.11, "learning_rate": 0.00028335843393013135, "loss": 0.0304, "step": 42800 }, { "epoch": 0.11, "learning_rate": 0.00028335454571375986, "loss": 0.0244, "step": 42810 }, { "epoch": 0.11, "learning_rate": 0.0002833506574973884, "loss": 0.0318, "step": 42820 }, { "epoch": 0.11, "learning_rate": 0.00028334676928101695, "loss": 0.026, "step": 42830 }, { "epoch": 0.11, "learning_rate": 0.00028334288106464546, "loss": 0.0327, "step": 42840 }, { "epoch": 0.11, "learning_rate": 0.000283338992848274, "loss": 0.0325, "step": 42850 }, { "epoch": 0.11, "learning_rate": 0.00028333510463190254, "loss": 0.028, "step": 42860 }, { "epoch": 0.11, "learning_rate": 0.00028333121641553106, "loss": 0.0374, "step": 42870 }, { "epoch": 0.11, "learning_rate": 0.00028332732819915963, "loss": 0.0341, "step": 42880 }, { "epoch": 0.11, "learning_rate": 0.00028332343998278814, "loss": 0.0304, "step": 42890 }, { "epoch": 0.11, "learning_rate": 0.00028331955176641666, "loss": 0.0458, "step": 42900 }, { "epoch": 0.11, "learning_rate": 0.0002833156635500452, "loss": 0.0376, "step": 42910 }, { "epoch": 0.11, "learning_rate": 0.00028331177533367374, "loss": 0.0365, "step": 42920 }, { "epoch": 0.11, "learning_rate": 0.00028330788711730226, "loss": 0.0309, "step": 42930 }, { "epoch": 0.11, "learning_rate": 0.0002833039989009308, "loss": 0.0263, "step": 42940 }, { "epoch": 0.11, "learning_rate": 0.00028330011068455934, "loss": 0.0353, "step": 42950 }, { "epoch": 0.11, "learning_rate": 0.0002832962224681879, "loss": 0.0337, "step": 42960 }, { "epoch": 0.11, "learning_rate": 0.0002832923342518164, "loss": 0.0267, "step": 42970 }, { "epoch": 0.11, "learning_rate": 0.00028328844603544494, "loss": 0.0302, "step": 42980 }, { "epoch": 0.11, "learning_rate": 0.00028328455781907345, "loss": 0.0297, "step": 42990 }, { "epoch": 0.11, "learning_rate": 0.000283280669602702, "loss": 0.0374, "step": 43000 }, { "epoch": 0.11, "eval_cer": 0.8818090587301654, "eval_loss": 0.02232929691672325, "eval_runtime": 107.3768, "eval_samples_per_second": 18.626, "eval_steps_per_second": 4.657, "step": 43000 }, { "epoch": 0.11, "learning_rate": 0.0002832767813863306, "loss": 0.0275, "step": 43010 }, { "epoch": 0.11, "learning_rate": 0.0002832728931699591, "loss": 0.0277, "step": 43020 }, { "epoch": 0.11, "learning_rate": 0.0002832690049535876, "loss": 0.0287, "step": 43030 }, { "epoch": 0.11, "learning_rate": 0.0002832651167372162, "loss": 0.0317, "step": 43040 }, { "epoch": 0.11, "learning_rate": 0.0002832612285208447, "loss": 0.0281, "step": 43050 }, { "epoch": 0.11, "learning_rate": 0.0002832573403044732, "loss": 0.0234, "step": 43060 }, { "epoch": 0.11, "learning_rate": 0.0002832534520881018, "loss": 0.0339, "step": 43070 }, { "epoch": 0.11, "learning_rate": 0.0002832495638717303, "loss": 0.0329, "step": 43080 }, { "epoch": 0.11, "learning_rate": 0.00028324567565535887, "loss": 0.0299, "step": 43090 }, { "epoch": 0.11, "learning_rate": 0.0002832417874389874, "loss": 0.0307, "step": 43100 }, { "epoch": 0.11, "learning_rate": 0.0002832378992226159, "loss": 0.0258, "step": 43110 }, { "epoch": 0.11, "learning_rate": 0.00028323401100624446, "loss": 0.0375, "step": 43120 }, { "epoch": 0.11, "learning_rate": 0.000283230122789873, "loss": 0.0275, "step": 43130 }, { "epoch": 0.11, "learning_rate": 0.0002832262345735015, "loss": 0.0349, "step": 43140 }, { "epoch": 0.11, "learning_rate": 0.00028322234635713006, "loss": 0.042, "step": 43150 }, { "epoch": 0.11, "learning_rate": 0.00028321845814075863, "loss": 0.0289, "step": 43160 }, { "epoch": 0.11, "learning_rate": 0.00028321456992438715, "loss": 0.0303, "step": 43170 }, { "epoch": 0.11, "learning_rate": 0.00028321068170801566, "loss": 0.0291, "step": 43180 }, { "epoch": 0.11, "learning_rate": 0.0002832067934916442, "loss": 0.0276, "step": 43190 }, { "epoch": 0.11, "learning_rate": 0.00028320290527527274, "loss": 0.0328, "step": 43200 }, { "epoch": 0.11, "learning_rate": 0.00028319901705890126, "loss": 0.029, "step": 43210 }, { "epoch": 0.11, "learning_rate": 0.00028319512884252983, "loss": 0.0264, "step": 43220 }, { "epoch": 0.11, "learning_rate": 0.00028319124062615834, "loss": 0.0308, "step": 43230 }, { "epoch": 0.11, "learning_rate": 0.00028318735240978686, "loss": 0.03, "step": 43240 }, { "epoch": 0.11, "learning_rate": 0.0002831834641934154, "loss": 0.0335, "step": 43250 }, { "epoch": 0.11, "learning_rate": 0.00028317957597704394, "loss": 0.0259, "step": 43260 }, { "epoch": 0.11, "learning_rate": 0.00028317568776067245, "loss": 0.0306, "step": 43270 }, { "epoch": 0.11, "learning_rate": 0.000283171799544301, "loss": 0.0323, "step": 43280 }, { "epoch": 0.11, "learning_rate": 0.00028316791132792954, "loss": 0.0304, "step": 43290 }, { "epoch": 0.11, "learning_rate": 0.0002831640231115581, "loss": 0.0278, "step": 43300 }, { "epoch": 0.11, "learning_rate": 0.0002831601348951866, "loss": 0.0264, "step": 43310 }, { "epoch": 0.11, "learning_rate": 0.00028315624667881514, "loss": 0.0258, "step": 43320 }, { "epoch": 0.11, "learning_rate": 0.0002831523584624437, "loss": 0.0279, "step": 43330 }, { "epoch": 0.11, "learning_rate": 0.0002831484702460722, "loss": 0.0271, "step": 43340 }, { "epoch": 0.11, "learning_rate": 0.0002831445820297008, "loss": 0.0225, "step": 43350 }, { "epoch": 0.11, "learning_rate": 0.0002831406938133293, "loss": 0.0287, "step": 43360 }, { "epoch": 0.11, "learning_rate": 0.00028313680559695787, "loss": 0.0308, "step": 43370 }, { "epoch": 0.11, "learning_rate": 0.0002831329173805864, "loss": 0.0239, "step": 43380 }, { "epoch": 0.11, "learning_rate": 0.0002831290291642149, "loss": 0.0283, "step": 43390 }, { "epoch": 0.11, "learning_rate": 0.0002831251409478434, "loss": 0.025, "step": 43400 }, { "epoch": 0.11, "learning_rate": 0.000283121252731472, "loss": 0.025, "step": 43410 }, { "epoch": 0.11, "learning_rate": 0.0002831173645151005, "loss": 0.0256, "step": 43420 }, { "epoch": 0.11, "learning_rate": 0.00028311347629872907, "loss": 0.0251, "step": 43430 }, { "epoch": 0.11, "learning_rate": 0.0002831095880823576, "loss": 0.0298, "step": 43440 }, { "epoch": 0.11, "learning_rate": 0.0002831056998659861, "loss": 0.0307, "step": 43450 }, { "epoch": 0.11, "learning_rate": 0.00028310181164961466, "loss": 0.0296, "step": 43460 }, { "epoch": 0.11, "learning_rate": 0.0002830979234332432, "loss": 0.0355, "step": 43470 }, { "epoch": 0.11, "learning_rate": 0.0002830940352168717, "loss": 0.0314, "step": 43480 }, { "epoch": 0.11, "learning_rate": 0.00028309014700050026, "loss": 0.0292, "step": 43490 }, { "epoch": 0.11, "learning_rate": 0.00028308625878412883, "loss": 0.0326, "step": 43500 }, { "epoch": 0.11, "learning_rate": 0.00028308237056775734, "loss": 0.024, "step": 43510 }, { "epoch": 0.11, "learning_rate": 0.00028307848235138586, "loss": 0.0304, "step": 43520 }, { "epoch": 0.11, "learning_rate": 0.0002830745941350144, "loss": 0.0283, "step": 43530 }, { "epoch": 0.11, "learning_rate": 0.00028307070591864294, "loss": 0.0279, "step": 43540 }, { "epoch": 0.11, "learning_rate": 0.00028306681770227146, "loss": 0.0288, "step": 43550 }, { "epoch": 0.11, "learning_rate": 0.0002830629294859, "loss": 0.0277, "step": 43560 }, { "epoch": 0.11, "learning_rate": 0.00028305904126952854, "loss": 0.0321, "step": 43570 }, { "epoch": 0.11, "learning_rate": 0.0002830551530531571, "loss": 0.034, "step": 43580 }, { "epoch": 0.11, "learning_rate": 0.0002830512648367856, "loss": 0.035, "step": 43590 }, { "epoch": 0.11, "learning_rate": 0.00028304737662041414, "loss": 0.0304, "step": 43600 }, { "epoch": 0.11, "learning_rate": 0.00028304348840404265, "loss": 0.0259, "step": 43610 }, { "epoch": 0.11, "learning_rate": 0.0002830396001876712, "loss": 0.0285, "step": 43620 }, { "epoch": 0.11, "learning_rate": 0.00028303571197129974, "loss": 0.03, "step": 43630 }, { "epoch": 0.11, "learning_rate": 0.0002830318237549283, "loss": 0.0308, "step": 43640 }, { "epoch": 0.11, "learning_rate": 0.0002830279355385568, "loss": 0.0274, "step": 43650 }, { "epoch": 0.11, "learning_rate": 0.0002830240473221854, "loss": 0.0285, "step": 43660 }, { "epoch": 0.11, "learning_rate": 0.0002830201591058139, "loss": 0.0318, "step": 43670 }, { "epoch": 0.11, "learning_rate": 0.0002830162708894424, "loss": 0.0249, "step": 43680 }, { "epoch": 0.11, "learning_rate": 0.00028301238267307093, "loss": 0.0261, "step": 43690 }, { "epoch": 0.11, "learning_rate": 0.0002830084944566995, "loss": 0.0241, "step": 43700 }, { "epoch": 0.11, "learning_rate": 0.00028300460624032807, "loss": 0.0317, "step": 43710 }, { "epoch": 0.11, "learning_rate": 0.0002830007180239566, "loss": 0.035, "step": 43720 }, { "epoch": 0.11, "learning_rate": 0.0002829968298075851, "loss": 0.0293, "step": 43730 }, { "epoch": 0.11, "learning_rate": 0.0002829929415912136, "loss": 0.0277, "step": 43740 }, { "epoch": 0.11, "learning_rate": 0.0002829890533748422, "loss": 0.0304, "step": 43750 }, { "epoch": 0.11, "learning_rate": 0.0002829851651584707, "loss": 0.0278, "step": 43760 }, { "epoch": 0.11, "learning_rate": 0.00028298127694209926, "loss": 0.0293, "step": 43770 }, { "epoch": 0.11, "learning_rate": 0.0002829773887257278, "loss": 0.0331, "step": 43780 }, { "epoch": 0.11, "learning_rate": 0.00028297350050935635, "loss": 0.0267, "step": 43790 }, { "epoch": 0.11, "learning_rate": 0.00028296961229298486, "loss": 0.0265, "step": 43800 }, { "epoch": 0.11, "learning_rate": 0.0002829657240766134, "loss": 0.0371, "step": 43810 }, { "epoch": 0.11, "learning_rate": 0.0002829618358602419, "loss": 0.0293, "step": 43820 }, { "epoch": 0.11, "learning_rate": 0.00028295794764387046, "loss": 0.0276, "step": 43830 }, { "epoch": 0.11, "learning_rate": 0.00028295405942749903, "loss": 0.0315, "step": 43840 }, { "epoch": 0.11, "learning_rate": 0.00028295017121112754, "loss": 0.0266, "step": 43850 }, { "epoch": 0.11, "learning_rate": 0.00028294628299475606, "loss": 0.0315, "step": 43860 }, { "epoch": 0.11, "learning_rate": 0.0002829423947783846, "loss": 0.0337, "step": 43870 }, { "epoch": 0.11, "learning_rate": 0.00028293850656201314, "loss": 0.0277, "step": 43880 }, { "epoch": 0.11, "learning_rate": 0.00028293461834564166, "loss": 0.0306, "step": 43890 }, { "epoch": 0.11, "learning_rate": 0.0002829307301292702, "loss": 0.0292, "step": 43900 }, { "epoch": 0.11, "learning_rate": 0.00028292684191289874, "loss": 0.038, "step": 43910 }, { "epoch": 0.11, "learning_rate": 0.0002829229536965273, "loss": 0.0258, "step": 43920 }, { "epoch": 0.11, "learning_rate": 0.0002829190654801558, "loss": 0.0453, "step": 43930 }, { "epoch": 0.11, "learning_rate": 0.00028291517726378434, "loss": 0.0287, "step": 43940 }, { "epoch": 0.11, "learning_rate": 0.00028291128904741285, "loss": 0.0278, "step": 43950 }, { "epoch": 0.11, "learning_rate": 0.0002829074008310414, "loss": 0.0318, "step": 43960 }, { "epoch": 0.11, "learning_rate": 0.00028290351261466993, "loss": 0.0292, "step": 43970 }, { "epoch": 0.11, "learning_rate": 0.0002828996243982985, "loss": 0.0281, "step": 43980 }, { "epoch": 0.11, "learning_rate": 0.000282895736181927, "loss": 0.0261, "step": 43990 }, { "epoch": 0.11, "learning_rate": 0.0002828918479655556, "loss": 0.03, "step": 44000 }, { "epoch": 0.11, "eval_cer": 0.8818090587301654, "eval_loss": 0.021903708577156067, "eval_runtime": 107.4337, "eval_samples_per_second": 18.616, "eval_steps_per_second": 4.654, "step": 44000 }, { "epoch": 0.11, "learning_rate": 0.0002828879597491841, "loss": 0.0297, "step": 44010 }, { "epoch": 0.11, "learning_rate": 0.0002828840715328126, "loss": 0.0263, "step": 44020 }, { "epoch": 0.11, "learning_rate": 0.00028288018331644113, "loss": 0.0313, "step": 44030 }, { "epoch": 0.11, "learning_rate": 0.0002828762951000697, "loss": 0.0305, "step": 44040 }, { "epoch": 0.11, "learning_rate": 0.00028287240688369827, "loss": 0.0283, "step": 44050 }, { "epoch": 0.11, "learning_rate": 0.0002828685186673268, "loss": 0.028, "step": 44060 }, { "epoch": 0.11, "learning_rate": 0.0002828646304509553, "loss": 0.0352, "step": 44070 }, { "epoch": 0.11, "learning_rate": 0.00028286074223458387, "loss": 0.0306, "step": 44080 }, { "epoch": 0.11, "learning_rate": 0.0002828568540182124, "loss": 0.0267, "step": 44090 }, { "epoch": 0.11, "learning_rate": 0.0002828529658018409, "loss": 0.0222, "step": 44100 }, { "epoch": 0.11, "learning_rate": 0.00028284907758546946, "loss": 0.0327, "step": 44110 }, { "epoch": 0.11, "learning_rate": 0.000282845189369098, "loss": 0.0406, "step": 44120 }, { "epoch": 0.11, "learning_rate": 0.00028284130115272655, "loss": 0.0248, "step": 44130 }, { "epoch": 0.11, "learning_rate": 0.00028283741293635506, "loss": 0.03, "step": 44140 }, { "epoch": 0.11, "learning_rate": 0.0002828335247199836, "loss": 0.0296, "step": 44150 }, { "epoch": 0.11, "learning_rate": 0.00028282963650361214, "loss": 0.0326, "step": 44160 }, { "epoch": 0.11, "learning_rate": 0.00028282574828724066, "loss": 0.0277, "step": 44170 }, { "epoch": 0.11, "learning_rate": 0.0002828218600708692, "loss": 0.0342, "step": 44180 }, { "epoch": 0.11, "learning_rate": 0.00028281797185449774, "loss": 0.0285, "step": 44190 }, { "epoch": 0.11, "learning_rate": 0.00028281408363812626, "loss": 0.0311, "step": 44200 }, { "epoch": 0.11, "learning_rate": 0.0002828101954217548, "loss": 0.0301, "step": 44210 }, { "epoch": 0.11, "learning_rate": 0.00028280630720538334, "loss": 0.0303, "step": 44220 }, { "epoch": 0.11, "learning_rate": 0.00028280241898901185, "loss": 0.0254, "step": 44230 }, { "epoch": 0.11, "learning_rate": 0.0002827985307726404, "loss": 0.0236, "step": 44240 }, { "epoch": 0.11, "learning_rate": 0.00028279464255626894, "loss": 0.0321, "step": 44250 }, { "epoch": 0.11, "learning_rate": 0.0002827907543398975, "loss": 0.0271, "step": 44260 }, { "epoch": 0.11, "learning_rate": 0.000282786866123526, "loss": 0.0267, "step": 44270 }, { "epoch": 0.11, "learning_rate": 0.00028278297790715454, "loss": 0.027, "step": 44280 }, { "epoch": 0.11, "learning_rate": 0.0002827790896907831, "loss": 0.0272, "step": 44290 }, { "epoch": 0.11, "learning_rate": 0.0002827752014744116, "loss": 0.0353, "step": 44300 }, { "epoch": 0.11, "learning_rate": 0.00028277131325804013, "loss": 0.0283, "step": 44310 }, { "epoch": 0.11, "learning_rate": 0.0002827674250416687, "loss": 0.0268, "step": 44320 }, { "epoch": 0.11, "learning_rate": 0.0002827635368252972, "loss": 0.0412, "step": 44330 }, { "epoch": 0.11, "learning_rate": 0.0002827596486089258, "loss": 0.0309, "step": 44340 }, { "epoch": 0.11, "learning_rate": 0.0002827557603925543, "loss": 0.036, "step": 44350 }, { "epoch": 0.11, "learning_rate": 0.0002827518721761828, "loss": 0.03, "step": 44360 }, { "epoch": 0.12, "learning_rate": 0.0002827479839598114, "loss": 0.0266, "step": 44370 }, { "epoch": 0.12, "learning_rate": 0.0002827440957434399, "loss": 0.0283, "step": 44380 }, { "epoch": 0.12, "learning_rate": 0.00028274020752706847, "loss": 0.0257, "step": 44390 }, { "epoch": 0.12, "learning_rate": 0.000282736319310697, "loss": 0.0322, "step": 44400 }, { "epoch": 0.12, "learning_rate": 0.00028273243109432555, "loss": 0.0314, "step": 44410 }, { "epoch": 0.12, "learning_rate": 0.00028272854287795406, "loss": 0.0296, "step": 44420 }, { "epoch": 0.12, "learning_rate": 0.0002827246546615826, "loss": 0.034, "step": 44430 }, { "epoch": 0.12, "learning_rate": 0.0002827207664452111, "loss": 0.0361, "step": 44440 }, { "epoch": 0.12, "learning_rate": 0.00028271687822883966, "loss": 0.0273, "step": 44450 }, { "epoch": 0.12, "learning_rate": 0.0002827129900124682, "loss": 0.0284, "step": 44460 }, { "epoch": 0.12, "learning_rate": 0.00028270910179609675, "loss": 0.0249, "step": 44470 }, { "epoch": 0.12, "learning_rate": 0.00028270521357972526, "loss": 0.0281, "step": 44480 }, { "epoch": 0.12, "learning_rate": 0.0002827013253633538, "loss": 0.0287, "step": 44490 }, { "epoch": 0.12, "learning_rate": 0.00028269743714698234, "loss": 0.0246, "step": 44500 }, { "epoch": 0.12, "learning_rate": 0.00028269354893061086, "loss": 0.0291, "step": 44510 }, { "epoch": 0.12, "learning_rate": 0.00028268966071423937, "loss": 0.0314, "step": 44520 }, { "epoch": 0.12, "learning_rate": 0.00028268577249786794, "loss": 0.0271, "step": 44530 }, { "epoch": 0.12, "learning_rate": 0.0002826818842814965, "loss": 0.0297, "step": 44540 }, { "epoch": 0.12, "learning_rate": 0.000282677996065125, "loss": 0.0317, "step": 44550 }, { "epoch": 0.12, "learning_rate": 0.00028267410784875354, "loss": 0.0274, "step": 44560 }, { "epoch": 0.12, "learning_rate": 0.00028267021963238205, "loss": 0.031, "step": 44570 }, { "epoch": 0.12, "learning_rate": 0.0002826663314160106, "loss": 0.022, "step": 44580 }, { "epoch": 0.12, "learning_rate": 0.00028266244319963914, "loss": 0.0351, "step": 44590 }, { "epoch": 0.12, "learning_rate": 0.0002826585549832677, "loss": 0.031, "step": 44600 }, { "epoch": 0.12, "learning_rate": 0.0002826546667668962, "loss": 0.0264, "step": 44610 }, { "epoch": 0.12, "learning_rate": 0.0002826507785505248, "loss": 0.0335, "step": 44620 }, { "epoch": 0.12, "learning_rate": 0.0002826468903341533, "loss": 0.0289, "step": 44630 }, { "epoch": 0.12, "learning_rate": 0.0002826430021177818, "loss": 0.0288, "step": 44640 }, { "epoch": 0.12, "learning_rate": 0.00028263911390141033, "loss": 0.0301, "step": 44650 }, { "epoch": 0.12, "learning_rate": 0.0002826352256850389, "loss": 0.0327, "step": 44660 }, { "epoch": 0.12, "learning_rate": 0.0002826313374686674, "loss": 0.0264, "step": 44670 }, { "epoch": 0.12, "learning_rate": 0.000282627449252296, "loss": 0.0274, "step": 44680 }, { "epoch": 0.12, "learning_rate": 0.0002826235610359245, "loss": 0.0264, "step": 44690 }, { "epoch": 0.12, "learning_rate": 0.000282619672819553, "loss": 0.031, "step": 44700 }, { "epoch": 0.12, "learning_rate": 0.0002826157846031816, "loss": 0.0238, "step": 44710 }, { "epoch": 0.12, "learning_rate": 0.0002826118963868101, "loss": 0.0283, "step": 44720 }, { "epoch": 0.12, "learning_rate": 0.0002826080081704386, "loss": 0.0308, "step": 44730 }, { "epoch": 0.12, "learning_rate": 0.0002826041199540672, "loss": 0.0235, "step": 44740 }, { "epoch": 0.12, "learning_rate": 0.00028260023173769575, "loss": 0.0365, "step": 44750 }, { "epoch": 0.12, "learning_rate": 0.00028259634352132426, "loss": 0.0329, "step": 44760 }, { "epoch": 0.12, "learning_rate": 0.0002825924553049528, "loss": 0.0331, "step": 44770 }, { "epoch": 0.12, "learning_rate": 0.0002825885670885813, "loss": 0.0272, "step": 44780 }, { "epoch": 0.12, "learning_rate": 0.00028258467887220986, "loss": 0.0353, "step": 44790 }, { "epoch": 0.12, "learning_rate": 0.0002825807906558384, "loss": 0.0306, "step": 44800 }, { "epoch": 0.12, "learning_rate": 0.00028257690243946694, "loss": 0.0278, "step": 44810 }, { "epoch": 0.12, "learning_rate": 0.00028257301422309546, "loss": 0.0354, "step": 44820 }, { "epoch": 0.12, "learning_rate": 0.00028256912600672403, "loss": 0.0241, "step": 44830 }, { "epoch": 0.12, "learning_rate": 0.00028256523779035254, "loss": 0.0307, "step": 44840 }, { "epoch": 0.12, "learning_rate": 0.00028256134957398106, "loss": 0.0252, "step": 44850 }, { "epoch": 0.12, "learning_rate": 0.00028255746135760957, "loss": 0.0263, "step": 44860 }, { "epoch": 0.12, "learning_rate": 0.00028255357314123814, "loss": 0.0267, "step": 44870 }, { "epoch": 0.12, "learning_rate": 0.00028254968492486665, "loss": 0.0255, "step": 44880 }, { "epoch": 0.12, "learning_rate": 0.0002825457967084952, "loss": 0.0259, "step": 44890 }, { "epoch": 0.12, "learning_rate": 0.00028254190849212374, "loss": 0.0291, "step": 44900 }, { "epoch": 0.12, "learning_rate": 0.00028253802027575225, "loss": 0.0322, "step": 44910 }, { "epoch": 0.12, "learning_rate": 0.0002825341320593808, "loss": 0.0335, "step": 44920 }, { "epoch": 0.12, "learning_rate": 0.00028253024384300934, "loss": 0.0328, "step": 44930 }, { "epoch": 0.12, "learning_rate": 0.0002825263556266379, "loss": 0.0301, "step": 44940 }, { "epoch": 0.12, "learning_rate": 0.0002825224674102664, "loss": 0.0332, "step": 44950 }, { "epoch": 0.12, "learning_rate": 0.000282518579193895, "loss": 0.0337, "step": 44960 }, { "epoch": 0.12, "learning_rate": 0.0002825146909775235, "loss": 0.0315, "step": 44970 }, { "epoch": 0.12, "learning_rate": 0.000282510802761152, "loss": 0.0344, "step": 44980 }, { "epoch": 0.12, "learning_rate": 0.00028250691454478053, "loss": 0.0285, "step": 44990 }, { "epoch": 0.12, "learning_rate": 0.0002825030263284091, "loss": 0.0283, "step": 45000 }, { "epoch": 0.12, "eval_cer": 0.8818104583670996, "eval_loss": 0.022675270214676857, "eval_runtime": 107.7182, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 45000 }, { "epoch": 0.12, "learning_rate": 0.0002824991381120376, "loss": 0.0301, "step": 45010 }, { "epoch": 0.12, "learning_rate": 0.0002824952498956662, "loss": 0.0281, "step": 45020 }, { "epoch": 0.12, "learning_rate": 0.0002824913616792947, "loss": 0.0262, "step": 45030 }, { "epoch": 0.12, "learning_rate": 0.00028248747346292327, "loss": 0.0351, "step": 45040 }, { "epoch": 0.12, "learning_rate": 0.0002824835852465518, "loss": 0.0307, "step": 45050 }, { "epoch": 0.12, "learning_rate": 0.0002824796970301803, "loss": 0.0333, "step": 45060 }, { "epoch": 0.12, "learning_rate": 0.0002824758088138088, "loss": 0.0274, "step": 45070 }, { "epoch": 0.12, "learning_rate": 0.0002824719205974374, "loss": 0.0271, "step": 45080 }, { "epoch": 0.12, "learning_rate": 0.00028246803238106595, "loss": 0.0355, "step": 45090 }, { "epoch": 0.12, "learning_rate": 0.00028246414416469446, "loss": 0.0275, "step": 45100 }, { "epoch": 0.12, "learning_rate": 0.000282460255948323, "loss": 0.0341, "step": 45110 }, { "epoch": 0.12, "learning_rate": 0.00028245636773195155, "loss": 0.0319, "step": 45120 }, { "epoch": 0.12, "learning_rate": 0.00028245247951558006, "loss": 0.0303, "step": 45130 }, { "epoch": 0.12, "learning_rate": 0.0002824485912992086, "loss": 0.0306, "step": 45140 }, { "epoch": 0.12, "learning_rate": 0.00028244470308283714, "loss": 0.0303, "step": 45150 }, { "epoch": 0.12, "learning_rate": 0.00028244081486646566, "loss": 0.0303, "step": 45160 }, { "epoch": 0.12, "learning_rate": 0.0002824369266500942, "loss": 0.0304, "step": 45170 }, { "epoch": 0.12, "learning_rate": 0.00028243303843372274, "loss": 0.0306, "step": 45180 }, { "epoch": 0.12, "learning_rate": 0.00028242915021735126, "loss": 0.0296, "step": 45190 }, { "epoch": 0.12, "learning_rate": 0.00028242526200097977, "loss": 0.0291, "step": 45200 }, { "epoch": 0.12, "learning_rate": 0.00028242137378460834, "loss": 0.0305, "step": 45210 }, { "epoch": 0.12, "learning_rate": 0.00028241748556823685, "loss": 0.0361, "step": 45220 }, { "epoch": 0.12, "learning_rate": 0.0002824135973518654, "loss": 0.032, "step": 45230 }, { "epoch": 0.12, "learning_rate": 0.00028240970913549394, "loss": 0.0316, "step": 45240 }, { "epoch": 0.12, "learning_rate": 0.0002824058209191225, "loss": 0.0272, "step": 45250 }, { "epoch": 0.12, "learning_rate": 0.000282401932702751, "loss": 0.0317, "step": 45260 }, { "epoch": 0.12, "learning_rate": 0.00028239804448637953, "loss": 0.0307, "step": 45270 }, { "epoch": 0.12, "learning_rate": 0.00028239415627000805, "loss": 0.0262, "step": 45280 }, { "epoch": 0.12, "learning_rate": 0.0002823902680536366, "loss": 0.0356, "step": 45290 }, { "epoch": 0.12, "learning_rate": 0.0002823863798372652, "loss": 0.0297, "step": 45300 }, { "epoch": 0.12, "learning_rate": 0.0002823824916208937, "loss": 0.0297, "step": 45310 }, { "epoch": 0.12, "learning_rate": 0.0002823786034045222, "loss": 0.032, "step": 45320 }, { "epoch": 0.12, "learning_rate": 0.0002823747151881508, "loss": 0.0413, "step": 45330 }, { "epoch": 0.12, "learning_rate": 0.0002823708269717793, "loss": 0.0324, "step": 45340 }, { "epoch": 0.12, "learning_rate": 0.0002823669387554078, "loss": 0.0331, "step": 45350 }, { "epoch": 0.12, "learning_rate": 0.0002823630505390364, "loss": 0.0358, "step": 45360 }, { "epoch": 0.12, "learning_rate": 0.0002823591623226649, "loss": 0.027, "step": 45370 }, { "epoch": 0.12, "learning_rate": 0.00028235527410629347, "loss": 0.027, "step": 45380 }, { "epoch": 0.12, "learning_rate": 0.000282351385889922, "loss": 0.032, "step": 45390 }, { "epoch": 0.12, "learning_rate": 0.0002823474976735505, "loss": 0.0284, "step": 45400 }, { "epoch": 0.12, "learning_rate": 0.000282343609457179, "loss": 0.032, "step": 45410 }, { "epoch": 0.12, "learning_rate": 0.0002823397212408076, "loss": 0.0277, "step": 45420 }, { "epoch": 0.12, "learning_rate": 0.00028233583302443615, "loss": 0.0298, "step": 45430 }, { "epoch": 0.12, "learning_rate": 0.00028233194480806466, "loss": 0.0326, "step": 45440 }, { "epoch": 0.12, "learning_rate": 0.0002823280565916932, "loss": 0.0313, "step": 45450 }, { "epoch": 0.12, "learning_rate": 0.00028232416837532174, "loss": 0.0301, "step": 45460 }, { "epoch": 0.12, "learning_rate": 0.00028232028015895026, "loss": 0.034, "step": 45470 }, { "epoch": 0.12, "learning_rate": 0.0002823163919425788, "loss": 0.027, "step": 45480 }, { "epoch": 0.12, "learning_rate": 0.00028231250372620734, "loss": 0.0292, "step": 45490 }, { "epoch": 0.12, "learning_rate": 0.00028230861550983586, "loss": 0.0306, "step": 45500 }, { "epoch": 0.12, "learning_rate": 0.0002823047272934644, "loss": 0.0268, "step": 45510 }, { "epoch": 0.12, "learning_rate": 0.00028230083907709294, "loss": 0.0359, "step": 45520 }, { "epoch": 0.12, "learning_rate": 0.00028229695086072145, "loss": 0.0326, "step": 45530 }, { "epoch": 0.12, "learning_rate": 0.00028229306264435, "loss": 0.0294, "step": 45540 }, { "epoch": 0.12, "learning_rate": 0.00028228917442797854, "loss": 0.0288, "step": 45550 }, { "epoch": 0.12, "learning_rate": 0.00028228528621160705, "loss": 0.03, "step": 45560 }, { "epoch": 0.12, "learning_rate": 0.0002822813979952356, "loss": 0.0289, "step": 45570 }, { "epoch": 0.12, "learning_rate": 0.0002822775097788642, "loss": 0.0303, "step": 45580 }, { "epoch": 0.12, "learning_rate": 0.0002822736215624927, "loss": 0.0327, "step": 45590 }, { "epoch": 0.12, "learning_rate": 0.0002822697333461212, "loss": 0.0327, "step": 45600 }, { "epoch": 0.12, "learning_rate": 0.00028226584512974973, "loss": 0.0294, "step": 45610 }, { "epoch": 0.12, "learning_rate": 0.0002822619569133783, "loss": 0.0287, "step": 45620 }, { "epoch": 0.12, "learning_rate": 0.0002822580686970068, "loss": 0.0318, "step": 45630 }, { "epoch": 0.12, "learning_rate": 0.0002822541804806354, "loss": 0.032, "step": 45640 }, { "epoch": 0.12, "learning_rate": 0.0002822502922642639, "loss": 0.0259, "step": 45650 }, { "epoch": 0.12, "learning_rate": 0.0002822464040478924, "loss": 0.0351, "step": 45660 }, { "epoch": 0.12, "learning_rate": 0.000282242515831521, "loss": 0.0298, "step": 45670 }, { "epoch": 0.12, "learning_rate": 0.0002822386276151495, "loss": 0.0294, "step": 45680 }, { "epoch": 0.12, "learning_rate": 0.000282234739398778, "loss": 0.0252, "step": 45690 }, { "epoch": 0.12, "learning_rate": 0.0002822308511824066, "loss": 0.03, "step": 45700 }, { "epoch": 0.12, "learning_rate": 0.0002822269629660351, "loss": 0.0287, "step": 45710 }, { "epoch": 0.12, "learning_rate": 0.00028222307474966366, "loss": 0.0287, "step": 45720 }, { "epoch": 0.12, "learning_rate": 0.0002822191865332922, "loss": 0.0261, "step": 45730 }, { "epoch": 0.12, "learning_rate": 0.0002822152983169207, "loss": 0.0248, "step": 45740 }, { "epoch": 0.12, "learning_rate": 0.00028221141010054926, "loss": 0.0268, "step": 45750 }, { "epoch": 0.12, "learning_rate": 0.0002822075218841778, "loss": 0.0305, "step": 45760 }, { "epoch": 0.12, "learning_rate": 0.0002822036336678063, "loss": 0.0302, "step": 45770 }, { "epoch": 0.12, "learning_rate": 0.00028219974545143486, "loss": 0.0481, "step": 45780 }, { "epoch": 0.12, "learning_rate": 0.00028219585723506343, "loss": 0.0333, "step": 45790 }, { "epoch": 0.12, "learning_rate": 0.00028219196901869194, "loss": 0.0333, "step": 45800 }, { "epoch": 0.12, "learning_rate": 0.00028218808080232046, "loss": 0.0279, "step": 45810 }, { "epoch": 0.12, "learning_rate": 0.00028218419258594897, "loss": 0.0329, "step": 45820 }, { "epoch": 0.12, "learning_rate": 0.00028218030436957754, "loss": 0.0272, "step": 45830 }, { "epoch": 0.12, "learning_rate": 0.00028217641615320606, "loss": 0.0295, "step": 45840 }, { "epoch": 0.12, "learning_rate": 0.0002821725279368346, "loss": 0.0339, "step": 45850 }, { "epoch": 0.12, "learning_rate": 0.00028216863972046314, "loss": 0.0275, "step": 45860 }, { "epoch": 0.12, "learning_rate": 0.0002821647515040917, "loss": 0.0287, "step": 45870 }, { "epoch": 0.12, "learning_rate": 0.0002821608632877202, "loss": 0.0248, "step": 45880 }, { "epoch": 0.12, "learning_rate": 0.00028215697507134874, "loss": 0.0258, "step": 45890 }, { "epoch": 0.12, "learning_rate": 0.00028215308685497725, "loss": 0.0278, "step": 45900 }, { "epoch": 0.12, "learning_rate": 0.0002821491986386058, "loss": 0.0287, "step": 45910 }, { "epoch": 0.12, "learning_rate": 0.00028214531042223433, "loss": 0.0326, "step": 45920 }, { "epoch": 0.12, "learning_rate": 0.0002821414222058629, "loss": 0.0274, "step": 45930 }, { "epoch": 0.12, "learning_rate": 0.0002821375339894914, "loss": 0.0359, "step": 45940 }, { "epoch": 0.12, "learning_rate": 0.00028213364577311993, "loss": 0.0237, "step": 45950 }, { "epoch": 0.12, "learning_rate": 0.0002821297575567485, "loss": 0.0273, "step": 45960 }, { "epoch": 0.12, "learning_rate": 0.000282125869340377, "loss": 0.0334, "step": 45970 }, { "epoch": 0.12, "learning_rate": 0.0002821219811240056, "loss": 0.0267, "step": 45980 }, { "epoch": 0.12, "learning_rate": 0.0002821180929076341, "loss": 0.0267, "step": 45990 }, { "epoch": 0.12, "learning_rate": 0.00028211420469126267, "loss": 0.0273, "step": 46000 }, { "epoch": 0.12, "eval_cer": 0.8817810659914818, "eval_loss": 0.020111197605729103, "eval_runtime": 107.811, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 46000 }, { "epoch": 0.12, "learning_rate": 0.0002821103164748912, "loss": 0.0337, "step": 46010 }, { "epoch": 0.12, "learning_rate": 0.0002821064282585197, "loss": 0.0304, "step": 46020 }, { "epoch": 0.12, "learning_rate": 0.0002821025400421482, "loss": 0.0265, "step": 46030 }, { "epoch": 0.12, "learning_rate": 0.0002820986518257768, "loss": 0.0301, "step": 46040 }, { "epoch": 0.12, "learning_rate": 0.0002820947636094053, "loss": 0.0251, "step": 46050 }, { "epoch": 0.12, "learning_rate": 0.00028209087539303386, "loss": 0.0269, "step": 46060 }, { "epoch": 0.12, "learning_rate": 0.0002820869871766624, "loss": 0.0322, "step": 46070 }, { "epoch": 0.12, "learning_rate": 0.00028208309896029095, "loss": 0.0335, "step": 46080 }, { "epoch": 0.12, "learning_rate": 0.00028207921074391946, "loss": 0.0328, "step": 46090 }, { "epoch": 0.12, "learning_rate": 0.000282075322527548, "loss": 0.028, "step": 46100 }, { "epoch": 0.12, "learning_rate": 0.0002820714343111765, "loss": 0.0333, "step": 46110 }, { "epoch": 0.12, "learning_rate": 0.00028206754609480506, "loss": 0.0302, "step": 46120 }, { "epoch": 0.12, "learning_rate": 0.00028206365787843363, "loss": 0.0294, "step": 46130 }, { "epoch": 0.12, "learning_rate": 0.00028205976966206214, "loss": 0.0319, "step": 46140 }, { "epoch": 0.12, "learning_rate": 0.00028205588144569066, "loss": 0.0258, "step": 46150 }, { "epoch": 0.12, "learning_rate": 0.00028205199322931917, "loss": 0.0267, "step": 46160 }, { "epoch": 0.12, "learning_rate": 0.00028204810501294774, "loss": 0.0381, "step": 46170 }, { "epoch": 0.12, "learning_rate": 0.00028204421679657625, "loss": 0.0276, "step": 46180 }, { "epoch": 0.12, "learning_rate": 0.0002820403285802048, "loss": 0.0291, "step": 46190 }, { "epoch": 0.12, "learning_rate": 0.00028203644036383334, "loss": 0.0263, "step": 46200 }, { "epoch": 0.12, "learning_rate": 0.0002820325521474619, "loss": 0.0387, "step": 46210 }, { "epoch": 0.12, "learning_rate": 0.0002820286639310904, "loss": 0.0258, "step": 46220 }, { "epoch": 0.12, "learning_rate": 0.00028202477571471894, "loss": 0.0281, "step": 46230 }, { "epoch": 0.12, "learning_rate": 0.00028202088749834745, "loss": 0.0356, "step": 46240 }, { "epoch": 0.12, "learning_rate": 0.000282016999281976, "loss": 0.0301, "step": 46250 }, { "epoch": 0.12, "learning_rate": 0.00028201311106560453, "loss": 0.0267, "step": 46260 }, { "epoch": 0.12, "learning_rate": 0.0002820092228492331, "loss": 0.0322, "step": 46270 }, { "epoch": 0.12, "learning_rate": 0.0002820053346328616, "loss": 0.0226, "step": 46280 }, { "epoch": 0.12, "learning_rate": 0.0002820014464164902, "loss": 0.0276, "step": 46290 }, { "epoch": 0.12, "learning_rate": 0.0002819975582001187, "loss": 0.0239, "step": 46300 }, { "epoch": 0.12, "learning_rate": 0.0002819936699837472, "loss": 0.0373, "step": 46310 }, { "epoch": 0.12, "learning_rate": 0.00028198978176737573, "loss": 0.0328, "step": 46320 }, { "epoch": 0.12, "learning_rate": 0.0002819858935510043, "loss": 0.029, "step": 46330 }, { "epoch": 0.12, "learning_rate": 0.00028198200533463287, "loss": 0.0305, "step": 46340 }, { "epoch": 0.12, "learning_rate": 0.0002819781171182614, "loss": 0.0274, "step": 46350 }, { "epoch": 0.12, "learning_rate": 0.0002819742289018899, "loss": 0.0275, "step": 46360 }, { "epoch": 0.12, "learning_rate": 0.00028197034068551846, "loss": 0.0285, "step": 46370 }, { "epoch": 0.12, "learning_rate": 0.000281966452469147, "loss": 0.0266, "step": 46380 }, { "epoch": 0.12, "learning_rate": 0.0002819625642527755, "loss": 0.0407, "step": 46390 }, { "epoch": 0.12, "learning_rate": 0.00028195867603640406, "loss": 0.0296, "step": 46400 }, { "epoch": 0.12, "learning_rate": 0.0002819547878200326, "loss": 0.0303, "step": 46410 }, { "epoch": 0.12, "learning_rate": 0.00028195089960366115, "loss": 0.0289, "step": 46420 }, { "epoch": 0.12, "learning_rate": 0.00028194701138728966, "loss": 0.0238, "step": 46430 }, { "epoch": 0.12, "learning_rate": 0.0002819431231709182, "loss": 0.0265, "step": 46440 }, { "epoch": 0.12, "learning_rate": 0.0002819392349545467, "loss": 0.0262, "step": 46450 }, { "epoch": 0.12, "learning_rate": 0.00028193534673817526, "loss": 0.0257, "step": 46460 }, { "epoch": 0.12, "learning_rate": 0.00028193145852180377, "loss": 0.0289, "step": 46470 }, { "epoch": 0.12, "learning_rate": 0.00028192757030543234, "loss": 0.0309, "step": 46480 }, { "epoch": 0.12, "learning_rate": 0.00028192368208906086, "loss": 0.0263, "step": 46490 }, { "epoch": 0.12, "learning_rate": 0.0002819197938726894, "loss": 0.0262, "step": 46500 }, { "epoch": 0.12, "learning_rate": 0.00028191590565631794, "loss": 0.0211, "step": 46510 }, { "epoch": 0.12, "learning_rate": 0.00028191201743994645, "loss": 0.0271, "step": 46520 }, { "epoch": 0.12, "learning_rate": 0.000281908129223575, "loss": 0.0327, "step": 46530 }, { "epoch": 0.12, "learning_rate": 0.00028190424100720354, "loss": 0.029, "step": 46540 }, { "epoch": 0.12, "learning_rate": 0.0002819003527908321, "loss": 0.0336, "step": 46550 }, { "epoch": 0.12, "learning_rate": 0.0002818964645744606, "loss": 0.0295, "step": 46560 }, { "epoch": 0.12, "learning_rate": 0.00028189257635808913, "loss": 0.0346, "step": 46570 }, { "epoch": 0.12, "learning_rate": 0.0002818886881417177, "loss": 0.0261, "step": 46580 }, { "epoch": 0.12, "learning_rate": 0.0002818847999253462, "loss": 0.0323, "step": 46590 }, { "epoch": 0.12, "learning_rate": 0.00028188091170897473, "loss": 0.0311, "step": 46600 }, { "epoch": 0.12, "learning_rate": 0.0002818770234926033, "loss": 0.03, "step": 46610 }, { "epoch": 0.12, "learning_rate": 0.00028187313527623187, "loss": 0.0279, "step": 46620 }, { "epoch": 0.12, "learning_rate": 0.0002818692470598604, "loss": 0.0281, "step": 46630 }, { "epoch": 0.12, "learning_rate": 0.0002818653588434889, "loss": 0.0268, "step": 46640 }, { "epoch": 0.12, "learning_rate": 0.0002818614706271174, "loss": 0.0356, "step": 46650 }, { "epoch": 0.12, "learning_rate": 0.00028185758241074593, "loss": 0.0254, "step": 46660 }, { "epoch": 0.12, "learning_rate": 0.0002818536941943745, "loss": 0.0273, "step": 46670 }, { "epoch": 0.12, "learning_rate": 0.00028184980597800307, "loss": 0.0293, "step": 46680 }, { "epoch": 0.12, "learning_rate": 0.0002818459177616316, "loss": 0.031, "step": 46690 }, { "epoch": 0.12, "learning_rate": 0.0002818420295452601, "loss": 0.0308, "step": 46700 }, { "epoch": 0.12, "learning_rate": 0.00028183814132888866, "loss": 0.0258, "step": 46710 }, { "epoch": 0.12, "learning_rate": 0.0002818342531125172, "loss": 0.0277, "step": 46720 }, { "epoch": 0.12, "learning_rate": 0.0002818303648961457, "loss": 0.0291, "step": 46730 }, { "epoch": 0.12, "learning_rate": 0.00028182647667977426, "loss": 0.0226, "step": 46740 }, { "epoch": 0.12, "learning_rate": 0.0002818225884634028, "loss": 0.0295, "step": 46750 }, { "epoch": 0.12, "learning_rate": 0.00028181870024703134, "loss": 0.0288, "step": 46760 }, { "epoch": 0.12, "learning_rate": 0.00028181481203065986, "loss": 0.0289, "step": 46770 }, { "epoch": 0.12, "learning_rate": 0.0002818109238142884, "loss": 0.0343, "step": 46780 }, { "epoch": 0.12, "learning_rate": 0.00028180703559791694, "loss": 0.0333, "step": 46790 }, { "epoch": 0.12, "learning_rate": 0.00028180314738154546, "loss": 0.0305, "step": 46800 }, { "epoch": 0.12, "learning_rate": 0.00028179925916517397, "loss": 0.0304, "step": 46810 }, { "epoch": 0.12, "learning_rate": 0.00028179537094880254, "loss": 0.029, "step": 46820 }, { "epoch": 0.12, "learning_rate": 0.0002817914827324311, "loss": 0.0281, "step": 46830 }, { "epoch": 0.12, "learning_rate": 0.0002817875945160596, "loss": 0.0312, "step": 46840 }, { "epoch": 0.12, "learning_rate": 0.00028178370629968814, "loss": 0.0259, "step": 46850 }, { "epoch": 0.12, "learning_rate": 0.00028177981808331665, "loss": 0.0311, "step": 46860 }, { "epoch": 0.12, "learning_rate": 0.0002817759298669452, "loss": 0.0267, "step": 46870 }, { "epoch": 0.12, "learning_rate": 0.00028177204165057374, "loss": 0.0283, "step": 46880 }, { "epoch": 0.12, "learning_rate": 0.0002817681534342023, "loss": 0.0283, "step": 46890 }, { "epoch": 0.12, "learning_rate": 0.0002817642652178308, "loss": 0.0253, "step": 46900 }, { "epoch": 0.12, "learning_rate": 0.00028176037700145933, "loss": 0.028, "step": 46910 }, { "epoch": 0.12, "learning_rate": 0.0002817564887850879, "loss": 0.0301, "step": 46920 }, { "epoch": 0.12, "learning_rate": 0.0002817526005687164, "loss": 0.0294, "step": 46930 }, { "epoch": 0.12, "learning_rate": 0.00028174871235234493, "loss": 0.028, "step": 46940 }, { "epoch": 0.12, "learning_rate": 0.0002817448241359735, "loss": 0.0311, "step": 46950 }, { "epoch": 0.12, "learning_rate": 0.000281740935919602, "loss": 0.0291, "step": 46960 }, { "epoch": 0.12, "learning_rate": 0.0002817370477032306, "loss": 0.024, "step": 46970 }, { "epoch": 0.12, "learning_rate": 0.0002817331594868591, "loss": 0.025, "step": 46980 }, { "epoch": 0.12, "learning_rate": 0.0002817292712704876, "loss": 0.0316, "step": 46990 }, { "epoch": 0.12, "learning_rate": 0.0002817253830541162, "loss": 0.0307, "step": 47000 }, { "epoch": 0.12, "eval_cer": 0.8818650442075325, "eval_loss": 0.02089322730898857, "eval_runtime": 107.6372, "eval_samples_per_second": 18.581, "eval_steps_per_second": 4.645, "step": 47000 }, { "epoch": 0.12, "learning_rate": 0.0002817214948377447, "loss": 0.0258, "step": 47010 }, { "epoch": 0.12, "learning_rate": 0.00028171760662137326, "loss": 0.0238, "step": 47020 }, { "epoch": 0.12, "learning_rate": 0.0002817137184050018, "loss": 0.0305, "step": 47030 }, { "epoch": 0.12, "learning_rate": 0.00028170983018863035, "loss": 0.0248, "step": 47040 }, { "epoch": 0.12, "learning_rate": 0.00028170594197225886, "loss": 0.034, "step": 47050 }, { "epoch": 0.12, "learning_rate": 0.0002817020537558874, "loss": 0.024, "step": 47060 }, { "epoch": 0.12, "learning_rate": 0.0002816981655395159, "loss": 0.031, "step": 47070 }, { "epoch": 0.12, "learning_rate": 0.00028169427732314446, "loss": 0.0247, "step": 47080 }, { "epoch": 0.12, "learning_rate": 0.000281690389106773, "loss": 0.0263, "step": 47090 }, { "epoch": 0.12, "learning_rate": 0.00028168650089040154, "loss": 0.0316, "step": 47100 }, { "epoch": 0.12, "learning_rate": 0.00028168261267403006, "loss": 0.0308, "step": 47110 }, { "epoch": 0.12, "learning_rate": 0.0002816787244576586, "loss": 0.0297, "step": 47120 }, { "epoch": 0.12, "learning_rate": 0.00028167483624128714, "loss": 0.028, "step": 47130 }, { "epoch": 0.12, "learning_rate": 0.00028167094802491566, "loss": 0.0303, "step": 47140 }, { "epoch": 0.12, "learning_rate": 0.00028166705980854417, "loss": 0.0303, "step": 47150 }, { "epoch": 0.12, "learning_rate": 0.00028166317159217274, "loss": 0.0348, "step": 47160 }, { "epoch": 0.12, "learning_rate": 0.0002816592833758013, "loss": 0.0326, "step": 47170 }, { "epoch": 0.12, "learning_rate": 0.0002816553951594298, "loss": 0.0305, "step": 47180 }, { "epoch": 0.12, "learning_rate": 0.00028165150694305834, "loss": 0.0253, "step": 47190 }, { "epoch": 0.12, "learning_rate": 0.00028164761872668685, "loss": 0.0233, "step": 47200 }, { "epoch": 0.12, "learning_rate": 0.0002816437305103154, "loss": 0.0277, "step": 47210 }, { "epoch": 0.12, "learning_rate": 0.00028163984229394393, "loss": 0.0305, "step": 47220 }, { "epoch": 0.12, "learning_rate": 0.0002816359540775725, "loss": 0.0285, "step": 47230 }, { "epoch": 0.12, "learning_rate": 0.000281632065861201, "loss": 0.0248, "step": 47240 }, { "epoch": 0.12, "learning_rate": 0.0002816281776448296, "loss": 0.0286, "step": 47250 }, { "epoch": 0.12, "learning_rate": 0.0002816242894284581, "loss": 0.0276, "step": 47260 }, { "epoch": 0.12, "learning_rate": 0.0002816204012120866, "loss": 0.0283, "step": 47270 }, { "epoch": 0.12, "learning_rate": 0.00028161651299571513, "loss": 0.0307, "step": 47280 }, { "epoch": 0.12, "learning_rate": 0.0002816126247793437, "loss": 0.0289, "step": 47290 }, { "epoch": 0.12, "learning_rate": 0.0002816087365629722, "loss": 0.0319, "step": 47300 }, { "epoch": 0.12, "learning_rate": 0.0002816048483466008, "loss": 0.0227, "step": 47310 }, { "epoch": 0.12, "learning_rate": 0.0002816009601302293, "loss": 0.026, "step": 47320 }, { "epoch": 0.12, "learning_rate": 0.00028159707191385787, "loss": 0.0254, "step": 47330 }, { "epoch": 0.12, "learning_rate": 0.0002815931836974864, "loss": 0.0296, "step": 47340 }, { "epoch": 0.12, "learning_rate": 0.0002815892954811149, "loss": 0.0248, "step": 47350 }, { "epoch": 0.12, "learning_rate": 0.0002815854072647434, "loss": 0.0279, "step": 47360 }, { "epoch": 0.12, "learning_rate": 0.000281581519048372, "loss": 0.0297, "step": 47370 }, { "epoch": 0.12, "learning_rate": 0.00028157763083200055, "loss": 0.0295, "step": 47380 }, { "epoch": 0.12, "learning_rate": 0.00028157374261562906, "loss": 0.0248, "step": 47390 }, { "epoch": 0.12, "learning_rate": 0.0002815698543992576, "loss": 0.0293, "step": 47400 }, { "epoch": 0.12, "learning_rate": 0.0002815659661828861, "loss": 0.0307, "step": 47410 }, { "epoch": 0.12, "learning_rate": 0.00028156207796651466, "loss": 0.0279, "step": 47420 }, { "epoch": 0.12, "learning_rate": 0.0002815581897501432, "loss": 0.0323, "step": 47430 }, { "epoch": 0.12, "learning_rate": 0.00028155430153377174, "loss": 0.0361, "step": 47440 }, { "epoch": 0.12, "learning_rate": 0.00028155041331740026, "loss": 0.0246, "step": 47450 }, { "epoch": 0.12, "learning_rate": 0.0002815465251010288, "loss": 0.0361, "step": 47460 }, { "epoch": 0.12, "learning_rate": 0.00028154263688465734, "loss": 0.0318, "step": 47470 }, { "epoch": 0.12, "learning_rate": 0.00028153874866828585, "loss": 0.0314, "step": 47480 }, { "epoch": 0.12, "learning_rate": 0.00028153486045191437, "loss": 0.0273, "step": 47490 }, { "epoch": 0.12, "learning_rate": 0.00028153097223554294, "loss": 0.029, "step": 47500 }, { "epoch": 0.12, "learning_rate": 0.00028152708401917145, "loss": 0.0278, "step": 47510 }, { "epoch": 0.12, "learning_rate": 0.0002815231958028, "loss": 0.0287, "step": 47520 }, { "epoch": 0.12, "learning_rate": 0.00028151930758642854, "loss": 0.0312, "step": 47530 }, { "epoch": 0.12, "learning_rate": 0.0002815154193700571, "loss": 0.0244, "step": 47540 }, { "epoch": 0.12, "learning_rate": 0.0002815115311536856, "loss": 0.0266, "step": 47550 }, { "epoch": 0.12, "learning_rate": 0.00028150764293731413, "loss": 0.0312, "step": 47560 }, { "epoch": 0.12, "learning_rate": 0.0002815037547209427, "loss": 0.0281, "step": 47570 }, { "epoch": 0.12, "learning_rate": 0.0002814998665045712, "loss": 0.0292, "step": 47580 }, { "epoch": 0.12, "learning_rate": 0.0002814959782881998, "loss": 0.0256, "step": 47590 }, { "epoch": 0.12, "learning_rate": 0.0002814920900718283, "loss": 0.0293, "step": 47600 }, { "epoch": 0.12, "learning_rate": 0.0002814882018554568, "loss": 0.0283, "step": 47610 }, { "epoch": 0.12, "learning_rate": 0.0002814843136390854, "loss": 0.03, "step": 47620 }, { "epoch": 0.12, "learning_rate": 0.0002814804254227139, "loss": 0.0246, "step": 47630 }, { "epoch": 0.12, "learning_rate": 0.0002814765372063424, "loss": 0.024, "step": 47640 }, { "epoch": 0.12, "learning_rate": 0.000281472648989971, "loss": 0.0301, "step": 47650 }, { "epoch": 0.12, "learning_rate": 0.0002814687607735995, "loss": 0.0262, "step": 47660 }, { "epoch": 0.12, "learning_rate": 0.00028146487255722806, "loss": 0.0239, "step": 47670 }, { "epoch": 0.12, "learning_rate": 0.0002814609843408566, "loss": 0.0255, "step": 47680 }, { "epoch": 0.12, "learning_rate": 0.0002814570961244851, "loss": 0.0311, "step": 47690 }, { "epoch": 0.12, "learning_rate": 0.0002814532079081136, "loss": 0.0281, "step": 47700 }, { "epoch": 0.12, "learning_rate": 0.0002814493196917422, "loss": 0.0296, "step": 47710 }, { "epoch": 0.12, "learning_rate": 0.00028144543147537075, "loss": 0.025, "step": 47720 }, { "epoch": 0.12, "learning_rate": 0.00028144154325899926, "loss": 0.0343, "step": 47730 }, { "epoch": 0.12, "learning_rate": 0.0002814376550426278, "loss": 0.0263, "step": 47740 }, { "epoch": 0.12, "learning_rate": 0.00028143376682625634, "loss": 0.0259, "step": 47750 }, { "epoch": 0.12, "learning_rate": 0.00028142987860988486, "loss": 0.0297, "step": 47760 }, { "epoch": 0.12, "learning_rate": 0.00028142599039351337, "loss": 0.0241, "step": 47770 }, { "epoch": 0.12, "learning_rate": 0.00028142210217714194, "loss": 0.0332, "step": 47780 }, { "epoch": 0.12, "learning_rate": 0.00028141821396077046, "loss": 0.0379, "step": 47790 }, { "epoch": 0.12, "learning_rate": 0.000281414325744399, "loss": 0.0292, "step": 47800 }, { "epoch": 0.12, "learning_rate": 0.00028141043752802754, "loss": 0.0324, "step": 47810 }, { "epoch": 0.12, "learning_rate": 0.00028140654931165605, "loss": 0.035, "step": 47820 }, { "epoch": 0.12, "learning_rate": 0.0002814026610952846, "loss": 0.0326, "step": 47830 }, { "epoch": 0.12, "learning_rate": 0.00028139877287891314, "loss": 0.0324, "step": 47840 }, { "epoch": 0.12, "learning_rate": 0.00028139488466254165, "loss": 0.0317, "step": 47850 }, { "epoch": 0.12, "learning_rate": 0.0002813909964461702, "loss": 0.03, "step": 47860 }, { "epoch": 0.12, "learning_rate": 0.0002813871082297988, "loss": 0.0272, "step": 47870 }, { "epoch": 0.12, "learning_rate": 0.0002813832200134273, "loss": 0.025, "step": 47880 }, { "epoch": 0.12, "learning_rate": 0.0002813793317970558, "loss": 0.027, "step": 47890 }, { "epoch": 0.12, "learning_rate": 0.00028137544358068433, "loss": 0.026, "step": 47900 }, { "epoch": 0.12, "learning_rate": 0.00028137155536431285, "loss": 0.0281, "step": 47910 }, { "epoch": 0.12, "learning_rate": 0.0002813676671479414, "loss": 0.0295, "step": 47920 }, { "epoch": 0.12, "learning_rate": 0.00028136377893157, "loss": 0.0275, "step": 47930 }, { "epoch": 0.12, "learning_rate": 0.0002813598907151985, "loss": 0.028, "step": 47940 }, { "epoch": 0.12, "learning_rate": 0.000281356002498827, "loss": 0.0316, "step": 47950 }, { "epoch": 0.12, "learning_rate": 0.0002813521142824556, "loss": 0.0295, "step": 47960 }, { "epoch": 0.12, "learning_rate": 0.0002813482260660841, "loss": 0.0303, "step": 47970 }, { "epoch": 0.12, "learning_rate": 0.0002813443378497126, "loss": 0.0277, "step": 47980 }, { "epoch": 0.12, "learning_rate": 0.0002813404496333412, "loss": 0.035, "step": 47990 }, { "epoch": 0.12, "learning_rate": 0.0002813365614169697, "loss": 0.0302, "step": 48000 }, { "epoch": 0.12, "eval_cer": 0.8818804402138085, "eval_loss": 0.022080879658460617, "eval_runtime": 107.5098, "eval_samples_per_second": 18.603, "eval_steps_per_second": 4.651, "step": 48000 }, { "epoch": 0.12, "learning_rate": 0.00028133267320059826, "loss": 0.0361, "step": 48010 }, { "epoch": 0.12, "learning_rate": 0.0002813287849842268, "loss": 0.0382, "step": 48020 }, { "epoch": 0.12, "learning_rate": 0.0002813248967678553, "loss": 0.035, "step": 48030 }, { "epoch": 0.12, "learning_rate": 0.00028132100855148386, "loss": 0.0309, "step": 48040 }, { "epoch": 0.12, "learning_rate": 0.0002813171203351124, "loss": 0.0334, "step": 48050 }, { "epoch": 0.12, "learning_rate": 0.0002813132321187409, "loss": 0.0357, "step": 48060 }, { "epoch": 0.12, "learning_rate": 0.00028130934390236946, "loss": 0.0288, "step": 48070 }, { "epoch": 0.12, "learning_rate": 0.00028130545568599803, "loss": 0.0278, "step": 48080 }, { "epoch": 0.12, "learning_rate": 0.00028130156746962654, "loss": 0.0275, "step": 48090 }, { "epoch": 0.12, "learning_rate": 0.00028129767925325506, "loss": 0.0322, "step": 48100 }, { "epoch": 0.12, "learning_rate": 0.00028129379103688357, "loss": 0.0331, "step": 48110 }, { "epoch": 0.12, "learning_rate": 0.00028128990282051214, "loss": 0.0265, "step": 48120 }, { "epoch": 0.12, "learning_rate": 0.00028128601460414065, "loss": 0.0345, "step": 48130 }, { "epoch": 0.12, "learning_rate": 0.0002812821263877692, "loss": 0.0296, "step": 48140 }, { "epoch": 0.12, "learning_rate": 0.00028127823817139774, "loss": 0.0284, "step": 48150 }, { "epoch": 0.12, "learning_rate": 0.00028127434995502625, "loss": 0.0307, "step": 48160 }, { "epoch": 0.12, "learning_rate": 0.0002812704617386548, "loss": 0.0248, "step": 48170 }, { "epoch": 0.12, "learning_rate": 0.00028126657352228334, "loss": 0.027, "step": 48180 }, { "epoch": 0.12, "learning_rate": 0.00028126268530591185, "loss": 0.0269, "step": 48190 }, { "epoch": 0.12, "learning_rate": 0.0002812587970895404, "loss": 0.0261, "step": 48200 }, { "epoch": 0.12, "learning_rate": 0.000281254908873169, "loss": 0.0284, "step": 48210 }, { "epoch": 0.12, "learning_rate": 0.0002812510206567975, "loss": 0.0282, "step": 48220 }, { "epoch": 0.13, "learning_rate": 0.000281247132440426, "loss": 0.0316, "step": 48230 }, { "epoch": 0.13, "learning_rate": 0.00028124324422405453, "loss": 0.0289, "step": 48240 }, { "epoch": 0.13, "learning_rate": 0.0002812393560076831, "loss": 0.0227, "step": 48250 }, { "epoch": 0.13, "learning_rate": 0.0002812354677913116, "loss": 0.0289, "step": 48260 }, { "epoch": 0.13, "learning_rate": 0.0002812315795749402, "loss": 0.0284, "step": 48270 }, { "epoch": 0.13, "learning_rate": 0.0002812276913585687, "loss": 0.0277, "step": 48280 }, { "epoch": 0.13, "learning_rate": 0.00028122380314219727, "loss": 0.0284, "step": 48290 }, { "epoch": 0.13, "learning_rate": 0.0002812199149258258, "loss": 0.0313, "step": 48300 }, { "epoch": 0.13, "learning_rate": 0.0002812160267094543, "loss": 0.0291, "step": 48310 }, { "epoch": 0.13, "learning_rate": 0.0002812121384930828, "loss": 0.0306, "step": 48320 }, { "epoch": 0.13, "learning_rate": 0.0002812082502767114, "loss": 0.0282, "step": 48330 }, { "epoch": 0.13, "learning_rate": 0.0002812043620603399, "loss": 0.0255, "step": 48340 }, { "epoch": 0.13, "learning_rate": 0.00028120047384396846, "loss": 0.0291, "step": 48350 }, { "epoch": 0.13, "learning_rate": 0.000281196585627597, "loss": 0.0329, "step": 48360 }, { "epoch": 0.13, "learning_rate": 0.00028119269741122555, "loss": 0.0359, "step": 48370 }, { "epoch": 0.13, "learning_rate": 0.00028118880919485406, "loss": 0.0247, "step": 48380 }, { "epoch": 0.13, "learning_rate": 0.0002811849209784826, "loss": 0.0338, "step": 48390 }, { "epoch": 0.13, "learning_rate": 0.0002811810327621111, "loss": 0.0289, "step": 48400 }, { "epoch": 0.13, "learning_rate": 0.00028117714454573966, "loss": 0.0311, "step": 48410 }, { "epoch": 0.13, "learning_rate": 0.0002811732563293682, "loss": 0.0247, "step": 48420 }, { "epoch": 0.13, "learning_rate": 0.00028116936811299674, "loss": 0.0291, "step": 48430 }, { "epoch": 0.13, "learning_rate": 0.00028116547989662526, "loss": 0.0283, "step": 48440 }, { "epoch": 0.13, "learning_rate": 0.00028116159168025377, "loss": 0.0268, "step": 48450 }, { "epoch": 0.13, "learning_rate": 0.00028115770346388234, "loss": 0.0244, "step": 48460 }, { "epoch": 0.13, "learning_rate": 0.00028115381524751085, "loss": 0.0248, "step": 48470 }, { "epoch": 0.13, "learning_rate": 0.0002811499270311394, "loss": 0.0289, "step": 48480 }, { "epoch": 0.13, "learning_rate": 0.00028114603881476794, "loss": 0.0285, "step": 48490 }, { "epoch": 0.13, "learning_rate": 0.0002811421505983965, "loss": 0.0285, "step": 48500 }, { "epoch": 0.13, "learning_rate": 0.000281138262382025, "loss": 0.0267, "step": 48510 }, { "epoch": 0.13, "learning_rate": 0.00028113437416565353, "loss": 0.0342, "step": 48520 }, { "epoch": 0.13, "learning_rate": 0.00028113048594928205, "loss": 0.0265, "step": 48530 }, { "epoch": 0.13, "learning_rate": 0.0002811265977329106, "loss": 0.029, "step": 48540 }, { "epoch": 0.13, "learning_rate": 0.00028112270951653913, "loss": 0.0251, "step": 48550 }, { "epoch": 0.13, "learning_rate": 0.0002811188213001677, "loss": 0.0317, "step": 48560 }, { "epoch": 0.13, "learning_rate": 0.0002811149330837962, "loss": 0.031, "step": 48570 }, { "epoch": 0.13, "learning_rate": 0.0002811110448674248, "loss": 0.0264, "step": 48580 }, { "epoch": 0.13, "learning_rate": 0.0002811071566510533, "loss": 0.0299, "step": 48590 }, { "epoch": 0.13, "learning_rate": 0.0002811032684346818, "loss": 0.0243, "step": 48600 }, { "epoch": 0.13, "learning_rate": 0.0002810993802183104, "loss": 0.031, "step": 48610 }, { "epoch": 0.13, "learning_rate": 0.0002810954920019389, "loss": 0.0336, "step": 48620 }, { "epoch": 0.13, "learning_rate": 0.00028109160378556747, "loss": 0.0308, "step": 48630 }, { "epoch": 0.13, "learning_rate": 0.000281087715569196, "loss": 0.03, "step": 48640 }, { "epoch": 0.13, "learning_rate": 0.0002810838273528245, "loss": 0.0256, "step": 48650 }, { "epoch": 0.13, "learning_rate": 0.000281079939136453, "loss": 0.0254, "step": 48660 }, { "epoch": 0.13, "learning_rate": 0.0002810760509200816, "loss": 0.0291, "step": 48670 }, { "epoch": 0.13, "learning_rate": 0.0002810721627037101, "loss": 0.0263, "step": 48680 }, { "epoch": 0.13, "learning_rate": 0.00028106827448733866, "loss": 0.0332, "step": 48690 }, { "epoch": 0.13, "learning_rate": 0.0002810643862709672, "loss": 0.0293, "step": 48700 }, { "epoch": 0.13, "learning_rate": 0.00028106049805459574, "loss": 0.0271, "step": 48710 }, { "epoch": 0.13, "learning_rate": 0.00028105660983822426, "loss": 0.0298, "step": 48720 }, { "epoch": 0.13, "learning_rate": 0.0002810527216218528, "loss": 0.0304, "step": 48730 }, { "epoch": 0.13, "learning_rate": 0.0002810488334054813, "loss": 0.0308, "step": 48740 }, { "epoch": 0.13, "learning_rate": 0.00028104494518910986, "loss": 0.031, "step": 48750 }, { "epoch": 0.13, "learning_rate": 0.0002810410569727384, "loss": 0.0335, "step": 48760 }, { "epoch": 0.13, "learning_rate": 0.00028103716875636694, "loss": 0.0317, "step": 48770 }, { "epoch": 0.13, "learning_rate": 0.00028103328053999545, "loss": 0.0321, "step": 48780 }, { "epoch": 0.13, "learning_rate": 0.000281029392323624, "loss": 0.0397, "step": 48790 }, { "epoch": 0.13, "learning_rate": 0.00028102550410725254, "loss": 0.0366, "step": 48800 }, { "epoch": 0.13, "learning_rate": 0.00028102161589088105, "loss": 0.0299, "step": 48810 }, { "epoch": 0.13, "learning_rate": 0.0002810177276745096, "loss": 0.0304, "step": 48820 }, { "epoch": 0.13, "learning_rate": 0.00028101383945813814, "loss": 0.0324, "step": 48830 }, { "epoch": 0.13, "learning_rate": 0.0002810099512417667, "loss": 0.0282, "step": 48840 }, { "epoch": 0.13, "learning_rate": 0.0002810060630253952, "loss": 0.035, "step": 48850 }, { "epoch": 0.13, "learning_rate": 0.00028100217480902373, "loss": 0.0211, "step": 48860 }, { "epoch": 0.13, "learning_rate": 0.0002809982865926523, "loss": 0.0299, "step": 48870 }, { "epoch": 0.13, "learning_rate": 0.0002809943983762808, "loss": 0.025, "step": 48880 }, { "epoch": 0.13, "learning_rate": 0.00028099051015990933, "loss": 0.0299, "step": 48890 }, { "epoch": 0.13, "learning_rate": 0.0002809866219435379, "loss": 0.025, "step": 48900 }, { "epoch": 0.13, "learning_rate": 0.0002809827337271664, "loss": 0.0307, "step": 48910 }, { "epoch": 0.13, "learning_rate": 0.000280978845510795, "loss": 0.0284, "step": 48920 }, { "epoch": 0.13, "learning_rate": 0.0002809749572944235, "loss": 0.0309, "step": 48930 }, { "epoch": 0.13, "learning_rate": 0.000280971069078052, "loss": 0.0274, "step": 48940 }, { "epoch": 0.13, "learning_rate": 0.0002809671808616805, "loss": 0.0312, "step": 48950 }, { "epoch": 0.13, "learning_rate": 0.0002809632926453091, "loss": 0.0292, "step": 48960 }, { "epoch": 0.13, "learning_rate": 0.00028095940442893766, "loss": 0.0294, "step": 48970 }, { "epoch": 0.13, "learning_rate": 0.0002809555162125662, "loss": 0.0323, "step": 48980 }, { "epoch": 0.13, "learning_rate": 0.0002809516279961947, "loss": 0.0294, "step": 48990 }, { "epoch": 0.13, "learning_rate": 0.00028094773977982326, "loss": 0.0309, "step": 49000 }, { "epoch": 0.13, "eval_cer": 0.881806259456297, "eval_loss": 0.021124470978975296, "eval_runtime": 107.4686, "eval_samples_per_second": 18.61, "eval_steps_per_second": 4.653, "step": 49000 }, { "epoch": 0.13, "learning_rate": 0.0002809438515634518, "loss": 0.0327, "step": 49010 }, { "epoch": 0.13, "learning_rate": 0.0002809399633470803, "loss": 0.025, "step": 49020 }, { "epoch": 0.13, "learning_rate": 0.00028093607513070886, "loss": 0.0292, "step": 49030 }, { "epoch": 0.13, "learning_rate": 0.0002809321869143374, "loss": 0.0272, "step": 49040 }, { "epoch": 0.13, "learning_rate": 0.00028092829869796594, "loss": 0.0309, "step": 49050 }, { "epoch": 0.13, "learning_rate": 0.00028092441048159446, "loss": 0.0352, "step": 49060 }, { "epoch": 0.13, "learning_rate": 0.00028092052226522297, "loss": 0.0299, "step": 49070 }, { "epoch": 0.13, "learning_rate": 0.00028091663404885154, "loss": 0.0306, "step": 49080 }, { "epoch": 0.13, "learning_rate": 0.00028091274583248006, "loss": 0.0239, "step": 49090 }, { "epoch": 0.13, "learning_rate": 0.00028090885761610857, "loss": 0.0272, "step": 49100 }, { "epoch": 0.13, "learning_rate": 0.00028090496939973714, "loss": 0.0276, "step": 49110 }, { "epoch": 0.13, "learning_rate": 0.0002809010811833657, "loss": 0.0355, "step": 49120 }, { "epoch": 0.13, "learning_rate": 0.0002808971929669942, "loss": 0.0292, "step": 49130 }, { "epoch": 0.13, "learning_rate": 0.00028089330475062274, "loss": 0.0361, "step": 49140 }, { "epoch": 0.13, "learning_rate": 0.00028088941653425125, "loss": 0.0298, "step": 49150 }, { "epoch": 0.13, "learning_rate": 0.0002808855283178798, "loss": 0.0257, "step": 49160 }, { "epoch": 0.13, "learning_rate": 0.00028088164010150833, "loss": 0.0259, "step": 49170 }, { "epoch": 0.13, "learning_rate": 0.0002808777518851369, "loss": 0.0255, "step": 49180 }, { "epoch": 0.13, "learning_rate": 0.0002808738636687654, "loss": 0.0277, "step": 49190 }, { "epoch": 0.13, "learning_rate": 0.00028086997545239393, "loss": 0.0282, "step": 49200 }, { "epoch": 0.13, "learning_rate": 0.0002808660872360225, "loss": 0.0269, "step": 49210 }, { "epoch": 0.13, "learning_rate": 0.000280862199019651, "loss": 0.0293, "step": 49220 }, { "epoch": 0.13, "learning_rate": 0.00028085831080327953, "loss": 0.0295, "step": 49230 }, { "epoch": 0.13, "learning_rate": 0.0002808544225869081, "loss": 0.0243, "step": 49240 }, { "epoch": 0.13, "learning_rate": 0.0002808505343705366, "loss": 0.0281, "step": 49250 }, { "epoch": 0.13, "learning_rate": 0.0002808466461541652, "loss": 0.0358, "step": 49260 }, { "epoch": 0.13, "learning_rate": 0.0002808427579377937, "loss": 0.0275, "step": 49270 }, { "epoch": 0.13, "learning_rate": 0.0002808388697214222, "loss": 0.0269, "step": 49280 }, { "epoch": 0.13, "learning_rate": 0.0002808349815050508, "loss": 0.0233, "step": 49290 }, { "epoch": 0.13, "learning_rate": 0.0002808310932886793, "loss": 0.0294, "step": 49300 }, { "epoch": 0.13, "learning_rate": 0.00028082720507230786, "loss": 0.0313, "step": 49310 }, { "epoch": 0.13, "learning_rate": 0.0002808233168559364, "loss": 0.0321, "step": 49320 }, { "epoch": 0.13, "learning_rate": 0.00028081942863956495, "loss": 0.0236, "step": 49330 }, { "epoch": 0.13, "learning_rate": 0.00028081554042319346, "loss": 0.0271, "step": 49340 }, { "epoch": 0.13, "learning_rate": 0.000280811652206822, "loss": 0.0241, "step": 49350 }, { "epoch": 0.13, "learning_rate": 0.0002808077639904505, "loss": 0.0263, "step": 49360 }, { "epoch": 0.13, "learning_rate": 0.00028080387577407906, "loss": 0.028, "step": 49370 }, { "epoch": 0.13, "learning_rate": 0.00028079998755770757, "loss": 0.0303, "step": 49380 }, { "epoch": 0.13, "learning_rate": 0.00028079609934133614, "loss": 0.0297, "step": 49390 }, { "epoch": 0.13, "learning_rate": 0.00028079221112496466, "loss": 0.0262, "step": 49400 }, { "epoch": 0.13, "learning_rate": 0.00028078832290859317, "loss": 0.0301, "step": 49410 }, { "epoch": 0.13, "learning_rate": 0.00028078443469222174, "loss": 0.0276, "step": 49420 }, { "epoch": 0.13, "learning_rate": 0.00028078054647585025, "loss": 0.0287, "step": 49430 }, { "epoch": 0.13, "learning_rate": 0.00028077665825947877, "loss": 0.0292, "step": 49440 }, { "epoch": 0.13, "learning_rate": 0.00028077277004310734, "loss": 0.0295, "step": 49450 }, { "epoch": 0.13, "learning_rate": 0.0002807688818267359, "loss": 0.028, "step": 49460 }, { "epoch": 0.13, "learning_rate": 0.0002807649936103644, "loss": 0.0276, "step": 49470 }, { "epoch": 0.13, "learning_rate": 0.00028076110539399294, "loss": 0.0265, "step": 49480 }, { "epoch": 0.13, "learning_rate": 0.00028075721717762145, "loss": 0.0309, "step": 49490 }, { "epoch": 0.13, "learning_rate": 0.00028075332896125, "loss": 0.0311, "step": 49500 }, { "epoch": 0.13, "learning_rate": 0.00028074944074487853, "loss": 0.0545, "step": 49510 }, { "epoch": 0.13, "learning_rate": 0.0002807455525285071, "loss": 0.0313, "step": 49520 }, { "epoch": 0.13, "learning_rate": 0.0002807416643121356, "loss": 0.0258, "step": 49530 }, { "epoch": 0.13, "learning_rate": 0.0002807377760957642, "loss": 0.0303, "step": 49540 }, { "epoch": 0.13, "learning_rate": 0.0002807338878793927, "loss": 0.0289, "step": 49550 }, { "epoch": 0.13, "learning_rate": 0.0002807299996630212, "loss": 0.0299, "step": 49560 }, { "epoch": 0.13, "learning_rate": 0.00028072611144664973, "loss": 0.0301, "step": 49570 }, { "epoch": 0.13, "learning_rate": 0.0002807222232302783, "loss": 0.0313, "step": 49580 }, { "epoch": 0.13, "learning_rate": 0.0002807183350139068, "loss": 0.024, "step": 49590 }, { "epoch": 0.13, "learning_rate": 0.0002807144467975354, "loss": 0.0261, "step": 49600 }, { "epoch": 0.13, "learning_rate": 0.0002807105585811639, "loss": 0.0333, "step": 49610 }, { "epoch": 0.13, "learning_rate": 0.00028070667036479246, "loss": 0.0305, "step": 49620 }, { "epoch": 0.13, "learning_rate": 0.000280702782148421, "loss": 0.0272, "step": 49630 }, { "epoch": 0.13, "learning_rate": 0.0002806988939320495, "loss": 0.0264, "step": 49640 }, { "epoch": 0.13, "learning_rate": 0.000280695005715678, "loss": 0.031, "step": 49650 }, { "epoch": 0.13, "learning_rate": 0.0002806911174993066, "loss": 0.0265, "step": 49660 }, { "epoch": 0.13, "learning_rate": 0.00028068722928293514, "loss": 0.0313, "step": 49670 }, { "epoch": 0.13, "learning_rate": 0.00028068334106656366, "loss": 0.0324, "step": 49680 }, { "epoch": 0.13, "learning_rate": 0.0002806794528501922, "loss": 0.0316, "step": 49690 }, { "epoch": 0.13, "learning_rate": 0.0002806755646338207, "loss": 0.027, "step": 49700 }, { "epoch": 0.13, "learning_rate": 0.00028067167641744926, "loss": 0.0375, "step": 49710 }, { "epoch": 0.13, "learning_rate": 0.00028066778820107777, "loss": 0.0281, "step": 49720 }, { "epoch": 0.13, "learning_rate": 0.00028066389998470634, "loss": 0.0231, "step": 49730 }, { "epoch": 0.13, "learning_rate": 0.00028066001176833485, "loss": 0.0346, "step": 49740 }, { "epoch": 0.13, "learning_rate": 0.0002806561235519634, "loss": 0.0316, "step": 49750 }, { "epoch": 0.13, "learning_rate": 0.00028065223533559194, "loss": 0.0265, "step": 49760 }, { "epoch": 0.13, "learning_rate": 0.00028064834711922045, "loss": 0.0267, "step": 49770 }, { "epoch": 0.13, "learning_rate": 0.00028064445890284897, "loss": 0.03, "step": 49780 }, { "epoch": 0.13, "learning_rate": 0.00028064057068647754, "loss": 0.0275, "step": 49790 }, { "epoch": 0.13, "learning_rate": 0.0002806366824701061, "loss": 0.0276, "step": 49800 }, { "epoch": 0.13, "learning_rate": 0.0002806327942537346, "loss": 0.0302, "step": 49810 }, { "epoch": 0.13, "learning_rate": 0.00028062890603736313, "loss": 0.041, "step": 49820 }, { "epoch": 0.13, "learning_rate": 0.0002806250178209917, "loss": 0.029, "step": 49830 }, { "epoch": 0.13, "learning_rate": 0.0002806211296046202, "loss": 0.0273, "step": 49840 }, { "epoch": 0.13, "learning_rate": 0.00028061724138824873, "loss": 0.0328, "step": 49850 }, { "epoch": 0.13, "learning_rate": 0.0002806133531718773, "loss": 0.0269, "step": 49860 }, { "epoch": 0.13, "learning_rate": 0.0002806094649555058, "loss": 0.0333, "step": 49870 }, { "epoch": 0.13, "learning_rate": 0.0002806055767391344, "loss": 0.0357, "step": 49880 }, { "epoch": 0.13, "learning_rate": 0.0002806016885227629, "loss": 0.0299, "step": 49890 }, { "epoch": 0.13, "learning_rate": 0.0002805978003063914, "loss": 0.0313, "step": 49900 }, { "epoch": 0.13, "learning_rate": 0.00028059391209001993, "loss": 0.0323, "step": 49910 }, { "epoch": 0.13, "learning_rate": 0.0002805900238736485, "loss": 0.0291, "step": 49920 }, { "epoch": 0.13, "learning_rate": 0.000280586135657277, "loss": 0.0295, "step": 49930 }, { "epoch": 0.13, "learning_rate": 0.0002805822474409056, "loss": 0.0317, "step": 49940 }, { "epoch": 0.13, "learning_rate": 0.0002805783592245341, "loss": 0.0314, "step": 49950 }, { "epoch": 0.13, "learning_rate": 0.00028057447100816266, "loss": 0.0293, "step": 49960 }, { "epoch": 0.13, "learning_rate": 0.0002805705827917912, "loss": 0.027, "step": 49970 }, { "epoch": 0.13, "learning_rate": 0.0002805666945754197, "loss": 0.0279, "step": 49980 }, { "epoch": 0.13, "learning_rate": 0.0002805628063590482, "loss": 0.0253, "step": 49990 }, { "epoch": 0.13, "learning_rate": 0.0002805589181426768, "loss": 0.0373, "step": 50000 }, { "epoch": 0.13, "eval_cer": 0.881797861634692, "eval_loss": 0.021269751712679863, "eval_runtime": 107.6876, "eval_samples_per_second": 18.572, "eval_steps_per_second": 4.643, "step": 50000 }, { "epoch": 0.13, "learning_rate": 0.00028055502992630534, "loss": 0.028, "step": 50010 }, { "epoch": 0.13, "learning_rate": 0.00028055114170993386, "loss": 0.0291, "step": 50020 }, { "epoch": 0.13, "learning_rate": 0.00028054725349356237, "loss": 0.0269, "step": 50030 }, { "epoch": 0.13, "learning_rate": 0.00028054336527719094, "loss": 0.0263, "step": 50040 }, { "epoch": 0.13, "learning_rate": 0.00028053947706081946, "loss": 0.034, "step": 50050 }, { "epoch": 0.13, "learning_rate": 0.00028053558884444797, "loss": 0.0332, "step": 50060 }, { "epoch": 0.13, "learning_rate": 0.00028053170062807654, "loss": 0.0274, "step": 50070 }, { "epoch": 0.13, "learning_rate": 0.00028052781241170505, "loss": 0.0248, "step": 50080 }, { "epoch": 0.13, "learning_rate": 0.0002805239241953336, "loss": 0.0263, "step": 50090 }, { "epoch": 0.13, "learning_rate": 0.00028052003597896214, "loss": 0.0294, "step": 50100 }, { "epoch": 0.13, "learning_rate": 0.00028051614776259065, "loss": 0.0294, "step": 50110 }, { "epoch": 0.13, "learning_rate": 0.00028051225954621917, "loss": 0.0273, "step": 50120 }, { "epoch": 0.13, "learning_rate": 0.00028050837132984773, "loss": 0.0308, "step": 50130 }, { "epoch": 0.13, "learning_rate": 0.00028050448311347625, "loss": 0.0288, "step": 50140 }, { "epoch": 0.13, "learning_rate": 0.0002805005948971048, "loss": 0.0287, "step": 50150 }, { "epoch": 0.13, "learning_rate": 0.00028049670668073333, "loss": 0.0277, "step": 50160 }, { "epoch": 0.13, "learning_rate": 0.0002804928184643619, "loss": 0.0346, "step": 50170 }, { "epoch": 0.13, "learning_rate": 0.0002804889302479904, "loss": 0.029, "step": 50180 }, { "epoch": 0.13, "learning_rate": 0.00028048504203161893, "loss": 0.028, "step": 50190 }, { "epoch": 0.13, "learning_rate": 0.0002804811538152475, "loss": 0.0286, "step": 50200 }, { "epoch": 0.13, "learning_rate": 0.000280477265598876, "loss": 0.0264, "step": 50210 }, { "epoch": 0.13, "learning_rate": 0.0002804733773825046, "loss": 0.0299, "step": 50220 }, { "epoch": 0.13, "learning_rate": 0.0002804694891661331, "loss": 0.0304, "step": 50230 }, { "epoch": 0.13, "learning_rate": 0.0002804656009497616, "loss": 0.0308, "step": 50240 }, { "epoch": 0.13, "learning_rate": 0.0002804617127333902, "loss": 0.028, "step": 50250 }, { "epoch": 0.13, "learning_rate": 0.0002804578245170187, "loss": 0.0283, "step": 50260 }, { "epoch": 0.13, "learning_rate": 0.0002804539363006472, "loss": 0.0331, "step": 50270 }, { "epoch": 0.13, "learning_rate": 0.0002804500480842758, "loss": 0.0288, "step": 50280 }, { "epoch": 0.13, "learning_rate": 0.0002804461598679043, "loss": 0.0278, "step": 50290 }, { "epoch": 0.13, "learning_rate": 0.00028044227165153286, "loss": 0.0298, "step": 50300 }, { "epoch": 0.13, "learning_rate": 0.0002804383834351614, "loss": 0.0261, "step": 50310 }, { "epoch": 0.13, "learning_rate": 0.0002804344952187899, "loss": 0.0255, "step": 50320 }, { "epoch": 0.13, "learning_rate": 0.00028043060700241846, "loss": 0.0331, "step": 50330 }, { "epoch": 0.13, "learning_rate": 0.000280426718786047, "loss": 0.031, "step": 50340 }, { "epoch": 0.13, "learning_rate": 0.00028042283056967554, "loss": 0.0292, "step": 50350 }, { "epoch": 0.13, "learning_rate": 0.00028041894235330406, "loss": 0.0299, "step": 50360 }, { "epoch": 0.13, "learning_rate": 0.00028041505413693257, "loss": 0.0222, "step": 50370 }, { "epoch": 0.13, "learning_rate": 0.00028041116592056114, "loss": 0.0233, "step": 50380 }, { "epoch": 0.13, "learning_rate": 0.00028040727770418965, "loss": 0.0307, "step": 50390 }, { "epoch": 0.13, "learning_rate": 0.00028040338948781817, "loss": 0.0248, "step": 50400 }, { "epoch": 0.13, "learning_rate": 0.00028039950127144674, "loss": 0.0288, "step": 50410 }, { "epoch": 0.13, "learning_rate": 0.00028039561305507525, "loss": 0.0296, "step": 50420 }, { "epoch": 0.13, "learning_rate": 0.0002803917248387038, "loss": 0.0241, "step": 50430 }, { "epoch": 0.13, "learning_rate": 0.00028038783662233234, "loss": 0.0219, "step": 50440 }, { "epoch": 0.13, "learning_rate": 0.00028038394840596085, "loss": 0.026, "step": 50450 }, { "epoch": 0.13, "learning_rate": 0.0002803800601895894, "loss": 0.0288, "step": 50460 }, { "epoch": 0.13, "learning_rate": 0.00028037617197321793, "loss": 0.0256, "step": 50470 }, { "epoch": 0.13, "learning_rate": 0.00028037228375684645, "loss": 0.0286, "step": 50480 }, { "epoch": 0.13, "learning_rate": 0.000280368395540475, "loss": 0.0282, "step": 50490 }, { "epoch": 0.13, "learning_rate": 0.0002803645073241036, "loss": 0.0251, "step": 50500 }, { "epoch": 0.13, "learning_rate": 0.0002803606191077321, "loss": 0.0281, "step": 50510 }, { "epoch": 0.13, "learning_rate": 0.0002803567308913606, "loss": 0.028, "step": 50520 }, { "epoch": 0.13, "learning_rate": 0.00028035284267498913, "loss": 0.0279, "step": 50530 }, { "epoch": 0.13, "learning_rate": 0.0002803489544586177, "loss": 0.0272, "step": 50540 }, { "epoch": 0.13, "learning_rate": 0.0002803450662422462, "loss": 0.029, "step": 50550 }, { "epoch": 0.13, "learning_rate": 0.0002803411780258748, "loss": 0.028, "step": 50560 }, { "epoch": 0.13, "learning_rate": 0.0002803372898095033, "loss": 0.0258, "step": 50570 }, { "epoch": 0.13, "learning_rate": 0.00028033340159313186, "loss": 0.0269, "step": 50580 }, { "epoch": 0.13, "learning_rate": 0.0002803295133767604, "loss": 0.0291, "step": 50590 }, { "epoch": 0.13, "learning_rate": 0.0002803256251603889, "loss": 0.0243, "step": 50600 }, { "epoch": 0.13, "learning_rate": 0.0002803217369440174, "loss": 0.0269, "step": 50610 }, { "epoch": 0.13, "learning_rate": 0.000280317848727646, "loss": 0.0329, "step": 50620 }, { "epoch": 0.13, "learning_rate": 0.0002803139605112745, "loss": 0.0312, "step": 50630 }, { "epoch": 0.13, "learning_rate": 0.00028031007229490306, "loss": 0.0294, "step": 50640 }, { "epoch": 0.13, "learning_rate": 0.0002803061840785316, "loss": 0.0263, "step": 50650 }, { "epoch": 0.13, "learning_rate": 0.0002803022958621601, "loss": 0.0208, "step": 50660 }, { "epoch": 0.13, "learning_rate": 0.00028029840764578866, "loss": 0.0259, "step": 50670 }, { "epoch": 0.13, "learning_rate": 0.00028029451942941717, "loss": 0.0322, "step": 50680 }, { "epoch": 0.13, "learning_rate": 0.0002802906312130457, "loss": 0.0251, "step": 50690 }, { "epoch": 0.13, "learning_rate": 0.00028028674299667426, "loss": 0.0364, "step": 50700 }, { "epoch": 0.13, "learning_rate": 0.0002802828547803028, "loss": 0.0249, "step": 50710 }, { "epoch": 0.13, "learning_rate": 0.00028027896656393134, "loss": 0.0241, "step": 50720 }, { "epoch": 0.13, "learning_rate": 0.00028027507834755985, "loss": 0.0314, "step": 50730 }, { "epoch": 0.13, "learning_rate": 0.00028027119013118837, "loss": 0.0283, "step": 50740 }, { "epoch": 0.13, "learning_rate": 0.00028026730191481694, "loss": 0.027, "step": 50750 }, { "epoch": 0.13, "learning_rate": 0.00028026341369844545, "loss": 0.0269, "step": 50760 }, { "epoch": 0.13, "learning_rate": 0.000280259525482074, "loss": 0.0276, "step": 50770 }, { "epoch": 0.13, "learning_rate": 0.00028025563726570253, "loss": 0.028, "step": 50780 }, { "epoch": 0.13, "learning_rate": 0.0002802517490493311, "loss": 0.0344, "step": 50790 }, { "epoch": 0.13, "learning_rate": 0.0002802478608329596, "loss": 0.0257, "step": 50800 }, { "epoch": 0.13, "learning_rate": 0.00028024397261658813, "loss": 0.0267, "step": 50810 }, { "epoch": 0.13, "learning_rate": 0.00028024008440021665, "loss": 0.0282, "step": 50820 }, { "epoch": 0.13, "learning_rate": 0.0002802361961838452, "loss": 0.0238, "step": 50830 }, { "epoch": 0.13, "learning_rate": 0.00028023230796747373, "loss": 0.0294, "step": 50840 }, { "epoch": 0.13, "learning_rate": 0.0002802284197511023, "loss": 0.0288, "step": 50850 }, { "epoch": 0.13, "learning_rate": 0.0002802245315347308, "loss": 0.0303, "step": 50860 }, { "epoch": 0.13, "learning_rate": 0.00028022064331835933, "loss": 0.0335, "step": 50870 }, { "epoch": 0.13, "learning_rate": 0.0002802167551019879, "loss": 0.0314, "step": 50880 }, { "epoch": 0.13, "learning_rate": 0.0002802128668856164, "loss": 0.0256, "step": 50890 }, { "epoch": 0.13, "learning_rate": 0.000280208978669245, "loss": 0.0281, "step": 50900 }, { "epoch": 0.13, "learning_rate": 0.0002802050904528735, "loss": 0.0309, "step": 50910 }, { "epoch": 0.13, "learning_rate": 0.00028020120223650206, "loss": 0.0277, "step": 50920 }, { "epoch": 0.13, "learning_rate": 0.0002801973140201306, "loss": 0.0313, "step": 50930 }, { "epoch": 0.13, "learning_rate": 0.0002801934258037591, "loss": 0.0286, "step": 50940 }, { "epoch": 0.13, "learning_rate": 0.0002801895375873876, "loss": 0.0263, "step": 50950 }, { "epoch": 0.13, "learning_rate": 0.0002801856493710162, "loss": 0.0297, "step": 50960 }, { "epoch": 0.13, "learning_rate": 0.0002801817611546447, "loss": 0.0256, "step": 50970 }, { "epoch": 0.13, "learning_rate": 0.00028017787293827326, "loss": 0.0248, "step": 50980 }, { "epoch": 0.13, "learning_rate": 0.0002801739847219018, "loss": 0.0314, "step": 50990 }, { "epoch": 0.13, "learning_rate": 0.00028017009650553034, "loss": 0.0292, "step": 51000 }, { "epoch": 0.13, "eval_cer": 0.8818202558256388, "eval_loss": 0.020461125299334526, "eval_runtime": 107.4733, "eval_samples_per_second": 18.609, "eval_steps_per_second": 4.652, "step": 51000 }, { "epoch": 0.13, "learning_rate": 0.00028016620828915886, "loss": 0.028, "step": 51010 }, { "epoch": 0.13, "learning_rate": 0.00028016232007278737, "loss": 0.0323, "step": 51020 }, { "epoch": 0.13, "learning_rate": 0.0002801584318564159, "loss": 0.0288, "step": 51030 }, { "epoch": 0.13, "learning_rate": 0.00028015454364004445, "loss": 0.0278, "step": 51040 }, { "epoch": 0.13, "learning_rate": 0.000280150655423673, "loss": 0.0249, "step": 51050 }, { "epoch": 0.13, "learning_rate": 0.00028014676720730154, "loss": 0.0273, "step": 51060 }, { "epoch": 0.13, "learning_rate": 0.00028014287899093005, "loss": 0.0278, "step": 51070 }, { "epoch": 0.13, "learning_rate": 0.0002801389907745586, "loss": 0.0275, "step": 51080 }, { "epoch": 0.13, "learning_rate": 0.00028013510255818714, "loss": 0.0269, "step": 51090 }, { "epoch": 0.13, "learning_rate": 0.00028013121434181565, "loss": 0.0232, "step": 51100 }, { "epoch": 0.13, "learning_rate": 0.0002801273261254442, "loss": 0.0294, "step": 51110 }, { "epoch": 0.13, "learning_rate": 0.00028012343790907273, "loss": 0.0274, "step": 51120 }, { "epoch": 0.13, "learning_rate": 0.0002801195496927013, "loss": 0.0305, "step": 51130 }, { "epoch": 0.13, "learning_rate": 0.0002801156614763298, "loss": 0.0256, "step": 51140 }, { "epoch": 0.13, "learning_rate": 0.00028011177325995833, "loss": 0.0367, "step": 51150 }, { "epoch": 0.13, "learning_rate": 0.00028010788504358685, "loss": 0.027, "step": 51160 }, { "epoch": 0.13, "learning_rate": 0.0002801039968272154, "loss": 0.0288, "step": 51170 }, { "epoch": 0.13, "learning_rate": 0.00028010010861084393, "loss": 0.0298, "step": 51180 }, { "epoch": 0.13, "learning_rate": 0.0002800962203944725, "loss": 0.0238, "step": 51190 }, { "epoch": 0.13, "learning_rate": 0.000280092332178101, "loss": 0.0255, "step": 51200 }, { "epoch": 0.13, "learning_rate": 0.0002800884439617296, "loss": 0.0274, "step": 51210 }, { "epoch": 0.13, "learning_rate": 0.0002800845557453581, "loss": 0.0322, "step": 51220 }, { "epoch": 0.13, "learning_rate": 0.0002800806675289866, "loss": 0.0251, "step": 51230 }, { "epoch": 0.13, "learning_rate": 0.0002800767793126151, "loss": 0.0273, "step": 51240 }, { "epoch": 0.13, "learning_rate": 0.0002800728910962437, "loss": 0.0275, "step": 51250 }, { "epoch": 0.13, "learning_rate": 0.00028006900287987226, "loss": 0.0223, "step": 51260 }, { "epoch": 0.13, "learning_rate": 0.0002800651146635008, "loss": 0.0266, "step": 51270 }, { "epoch": 0.13, "learning_rate": 0.0002800612264471293, "loss": 0.0312, "step": 51280 }, { "epoch": 0.13, "learning_rate": 0.00028005733823075786, "loss": 0.028, "step": 51290 }, { "epoch": 0.13, "learning_rate": 0.0002800534500143864, "loss": 0.0317, "step": 51300 }, { "epoch": 0.13, "learning_rate": 0.0002800495617980149, "loss": 0.0269, "step": 51310 }, { "epoch": 0.13, "learning_rate": 0.00028004567358164346, "loss": 0.0353, "step": 51320 }, { "epoch": 0.13, "learning_rate": 0.00028004178536527197, "loss": 0.0361, "step": 51330 }, { "epoch": 0.13, "learning_rate": 0.00028003789714890054, "loss": 0.0274, "step": 51340 }, { "epoch": 0.13, "learning_rate": 0.00028003400893252906, "loss": 0.0253, "step": 51350 }, { "epoch": 0.13, "learning_rate": 0.00028003012071615757, "loss": 0.0251, "step": 51360 }, { "epoch": 0.13, "learning_rate": 0.0002800262324997861, "loss": 0.0277, "step": 51370 }, { "epoch": 0.13, "learning_rate": 0.00028002234428341465, "loss": 0.0279, "step": 51380 }, { "epoch": 0.13, "learning_rate": 0.0002800184560670432, "loss": 0.0306, "step": 51390 }, { "epoch": 0.13, "learning_rate": 0.00028001456785067174, "loss": 0.0273, "step": 51400 }, { "epoch": 0.13, "learning_rate": 0.00028001067963430025, "loss": 0.0254, "step": 51410 }, { "epoch": 0.13, "learning_rate": 0.0002800067914179288, "loss": 0.0327, "step": 51420 }, { "epoch": 0.13, "learning_rate": 0.00028000290320155733, "loss": 0.0243, "step": 51430 }, { "epoch": 0.13, "learning_rate": 0.00027999901498518585, "loss": 0.0327, "step": 51440 }, { "epoch": 0.13, "learning_rate": 0.0002799951267688144, "loss": 0.0299, "step": 51450 }, { "epoch": 0.13, "learning_rate": 0.00027999123855244293, "loss": 0.0243, "step": 51460 }, { "epoch": 0.13, "learning_rate": 0.0002799873503360715, "loss": 0.0336, "step": 51470 }, { "epoch": 0.13, "learning_rate": 0.0002799834621197, "loss": 0.0253, "step": 51480 }, { "epoch": 0.13, "learning_rate": 0.00027997957390332853, "loss": 0.0293, "step": 51490 }, { "epoch": 0.13, "learning_rate": 0.0002799756856869571, "loss": 0.0309, "step": 51500 }, { "epoch": 0.13, "learning_rate": 0.0002799717974705856, "loss": 0.0287, "step": 51510 }, { "epoch": 0.13, "learning_rate": 0.00027996790925421413, "loss": 0.0306, "step": 51520 }, { "epoch": 0.13, "learning_rate": 0.0002799640210378427, "loss": 0.0288, "step": 51530 }, { "epoch": 0.13, "learning_rate": 0.00027996013282147127, "loss": 0.0249, "step": 51540 }, { "epoch": 0.13, "learning_rate": 0.0002799562446050998, "loss": 0.0277, "step": 51550 }, { "epoch": 0.13, "learning_rate": 0.0002799523563887283, "loss": 0.0294, "step": 51560 }, { "epoch": 0.13, "learning_rate": 0.0002799484681723568, "loss": 0.0297, "step": 51570 }, { "epoch": 0.13, "learning_rate": 0.0002799445799559854, "loss": 0.029, "step": 51580 }, { "epoch": 0.13, "learning_rate": 0.0002799406917396139, "loss": 0.0294, "step": 51590 }, { "epoch": 0.13, "learning_rate": 0.00027993680352324246, "loss": 0.0252, "step": 51600 }, { "epoch": 0.13, "learning_rate": 0.000279932915306871, "loss": 0.0259, "step": 51610 }, { "epoch": 0.13, "learning_rate": 0.0002799290270904995, "loss": 0.0261, "step": 51620 }, { "epoch": 0.13, "learning_rate": 0.00027992513887412806, "loss": 0.0277, "step": 51630 }, { "epoch": 0.13, "learning_rate": 0.0002799212506577566, "loss": 0.0225, "step": 51640 }, { "epoch": 0.13, "learning_rate": 0.0002799173624413851, "loss": 0.031, "step": 51650 }, { "epoch": 0.13, "learning_rate": 0.00027991347422501366, "loss": 0.0316, "step": 51660 }, { "epoch": 0.13, "learning_rate": 0.00027990958600864217, "loss": 0.026, "step": 51670 }, { "epoch": 0.13, "learning_rate": 0.00027990569779227074, "loss": 0.031, "step": 51680 }, { "epoch": 0.13, "learning_rate": 0.00027990180957589925, "loss": 0.0294, "step": 51690 }, { "epoch": 0.13, "learning_rate": 0.00027989792135952777, "loss": 0.0216, "step": 51700 }, { "epoch": 0.13, "learning_rate": 0.00027989403314315634, "loss": 0.0308, "step": 51710 }, { "epoch": 0.13, "learning_rate": 0.00027989014492678485, "loss": 0.0441, "step": 51720 }, { "epoch": 0.13, "learning_rate": 0.00027988625671041337, "loss": 0.0328, "step": 51730 }, { "epoch": 0.13, "learning_rate": 0.00027988236849404194, "loss": 0.0343, "step": 51740 }, { "epoch": 0.13, "learning_rate": 0.0002798784802776705, "loss": 0.0302, "step": 51750 }, { "epoch": 0.13, "learning_rate": 0.000279874592061299, "loss": 0.0296, "step": 51760 }, { "epoch": 0.13, "learning_rate": 0.00027987070384492753, "loss": 0.0279, "step": 51770 }, { "epoch": 0.13, "learning_rate": 0.00027986681562855605, "loss": 0.0276, "step": 51780 }, { "epoch": 0.13, "learning_rate": 0.0002798629274121846, "loss": 0.0312, "step": 51790 }, { "epoch": 0.13, "learning_rate": 0.00027985903919581313, "loss": 0.0278, "step": 51800 }, { "epoch": 0.13, "learning_rate": 0.0002798551509794417, "loss": 0.0274, "step": 51810 }, { "epoch": 0.13, "learning_rate": 0.0002798512627630702, "loss": 0.026, "step": 51820 }, { "epoch": 0.13, "learning_rate": 0.0002798473745466988, "loss": 0.0344, "step": 51830 }, { "epoch": 0.13, "learning_rate": 0.0002798434863303273, "loss": 0.0263, "step": 51840 }, { "epoch": 0.13, "learning_rate": 0.0002798395981139558, "loss": 0.0309, "step": 51850 }, { "epoch": 0.13, "learning_rate": 0.0002798357098975843, "loss": 0.0266, "step": 51860 }, { "epoch": 0.13, "learning_rate": 0.0002798318216812129, "loss": 0.0297, "step": 51870 }, { "epoch": 0.13, "learning_rate": 0.0002798279334648414, "loss": 0.0284, "step": 51880 }, { "epoch": 0.13, "learning_rate": 0.00027982404524847, "loss": 0.0326, "step": 51890 }, { "epoch": 0.13, "learning_rate": 0.0002798201570320985, "loss": 0.0276, "step": 51900 }, { "epoch": 0.13, "learning_rate": 0.000279816268815727, "loss": 0.0303, "step": 51910 }, { "epoch": 0.13, "learning_rate": 0.0002798123805993556, "loss": 0.0332, "step": 51920 }, { "epoch": 0.13, "learning_rate": 0.0002798084923829841, "loss": 0.0305, "step": 51930 }, { "epoch": 0.13, "learning_rate": 0.00027980460416661266, "loss": 0.0308, "step": 51940 }, { "epoch": 0.13, "learning_rate": 0.0002798007159502412, "loss": 0.0275, "step": 51950 }, { "epoch": 0.13, "learning_rate": 0.00027979682773386974, "loss": 0.0318, "step": 51960 }, { "epoch": 0.13, "learning_rate": 0.00027979293951749826, "loss": 0.0323, "step": 51970 }, { "epoch": 0.13, "learning_rate": 0.00027978905130112677, "loss": 0.0259, "step": 51980 }, { "epoch": 0.13, "learning_rate": 0.0002797851630847553, "loss": 0.0316, "step": 51990 }, { "epoch": 0.13, "learning_rate": 0.00027978127486838386, "loss": 0.0273, "step": 52000 }, { "epoch": 0.13, "eval_cer": 0.8817740678068109, "eval_loss": 0.019722141325473785, "eval_runtime": 107.1814, "eval_samples_per_second": 18.66, "eval_steps_per_second": 4.665, "step": 52000 }, { "epoch": 0.13, "learning_rate": 0.00027977738665201237, "loss": 0.0406, "step": 52010 }, { "epoch": 0.13, "learning_rate": 0.00027977349843564094, "loss": 0.0343, "step": 52020 }, { "epoch": 0.13, "learning_rate": 0.00027976961021926945, "loss": 0.0278, "step": 52030 }, { "epoch": 0.13, "learning_rate": 0.000279765722002898, "loss": 0.0293, "step": 52040 }, { "epoch": 0.13, "learning_rate": 0.00027976183378652654, "loss": 0.0307, "step": 52050 }, { "epoch": 0.13, "learning_rate": 0.00027975794557015505, "loss": 0.0325, "step": 52060 }, { "epoch": 0.13, "learning_rate": 0.00027975405735378357, "loss": 0.0264, "step": 52070 }, { "epoch": 0.13, "learning_rate": 0.00027975016913741213, "loss": 0.0306, "step": 52080 }, { "epoch": 0.14, "learning_rate": 0.0002797462809210407, "loss": 0.0297, "step": 52090 }, { "epoch": 0.14, "learning_rate": 0.0002797423927046692, "loss": 0.0268, "step": 52100 }, { "epoch": 0.14, "learning_rate": 0.00027973850448829773, "loss": 0.0286, "step": 52110 }, { "epoch": 0.14, "learning_rate": 0.00027973461627192625, "loss": 0.0286, "step": 52120 }, { "epoch": 0.14, "learning_rate": 0.0002797307280555548, "loss": 0.023, "step": 52130 }, { "epoch": 0.14, "learning_rate": 0.00027972683983918333, "loss": 0.0258, "step": 52140 }, { "epoch": 0.14, "learning_rate": 0.0002797229516228119, "loss": 0.0292, "step": 52150 }, { "epoch": 0.14, "learning_rate": 0.0002797190634064404, "loss": 0.0272, "step": 52160 }, { "epoch": 0.14, "learning_rate": 0.000279715175190069, "loss": 0.0306, "step": 52170 }, { "epoch": 0.14, "learning_rate": 0.0002797112869736975, "loss": 0.027, "step": 52180 }, { "epoch": 0.14, "learning_rate": 0.000279707398757326, "loss": 0.0263, "step": 52190 }, { "epoch": 0.14, "learning_rate": 0.0002797035105409545, "loss": 0.0296, "step": 52200 }, { "epoch": 0.14, "learning_rate": 0.0002796996223245831, "loss": 0.0246, "step": 52210 }, { "epoch": 0.14, "learning_rate": 0.0002796957341082116, "loss": 0.0272, "step": 52220 }, { "epoch": 0.14, "learning_rate": 0.0002796918458918402, "loss": 0.0306, "step": 52230 }, { "epoch": 0.14, "learning_rate": 0.0002796879576754687, "loss": 0.0287, "step": 52240 }, { "epoch": 0.14, "learning_rate": 0.00027968406945909726, "loss": 0.0206, "step": 52250 }, { "epoch": 0.14, "learning_rate": 0.0002796801812427258, "loss": 0.0282, "step": 52260 }, { "epoch": 0.14, "learning_rate": 0.0002796762930263543, "loss": 0.0304, "step": 52270 }, { "epoch": 0.14, "learning_rate": 0.0002796724048099828, "loss": 0.0236, "step": 52280 }, { "epoch": 0.14, "learning_rate": 0.0002796685165936114, "loss": 0.0356, "step": 52290 }, { "epoch": 0.14, "learning_rate": 0.00027966462837723994, "loss": 0.0268, "step": 52300 }, { "epoch": 0.14, "learning_rate": 0.00027966074016086846, "loss": 0.0241, "step": 52310 }, { "epoch": 0.14, "learning_rate": 0.00027965685194449697, "loss": 0.0315, "step": 52320 }, { "epoch": 0.14, "learning_rate": 0.00027965296372812554, "loss": 0.0294, "step": 52330 }, { "epoch": 0.14, "learning_rate": 0.00027964907551175405, "loss": 0.0247, "step": 52340 }, { "epoch": 0.14, "learning_rate": 0.00027964518729538257, "loss": 0.0254, "step": 52350 }, { "epoch": 0.14, "learning_rate": 0.00027964129907901114, "loss": 0.0323, "step": 52360 }, { "epoch": 0.14, "learning_rate": 0.00027963741086263965, "loss": 0.0249, "step": 52370 }, { "epoch": 0.14, "learning_rate": 0.0002796335226462682, "loss": 0.0249, "step": 52380 }, { "epoch": 0.14, "learning_rate": 0.00027962963442989674, "loss": 0.0357, "step": 52390 }, { "epoch": 0.14, "learning_rate": 0.00027962574621352525, "loss": 0.027, "step": 52400 }, { "epoch": 0.14, "learning_rate": 0.00027962185799715376, "loss": 0.0332, "step": 52410 }, { "epoch": 0.14, "learning_rate": 0.00027961796978078233, "loss": 0.0262, "step": 52420 }, { "epoch": 0.14, "learning_rate": 0.00027961408156441085, "loss": 0.0225, "step": 52430 }, { "epoch": 0.14, "learning_rate": 0.0002796101933480394, "loss": 0.0284, "step": 52440 }, { "epoch": 0.14, "learning_rate": 0.00027960630513166793, "loss": 0.0239, "step": 52450 }, { "epoch": 0.14, "learning_rate": 0.0002796024169152965, "loss": 0.0265, "step": 52460 }, { "epoch": 0.14, "learning_rate": 0.000279598528698925, "loss": 0.0358, "step": 52470 }, { "epoch": 0.14, "learning_rate": 0.00027959464048255353, "loss": 0.0269, "step": 52480 }, { "epoch": 0.14, "learning_rate": 0.0002795907522661821, "loss": 0.0314, "step": 52490 }, { "epoch": 0.14, "learning_rate": 0.0002795868640498106, "loss": 0.0262, "step": 52500 }, { "epoch": 0.14, "learning_rate": 0.0002795829758334392, "loss": 0.0306, "step": 52510 }, { "epoch": 0.14, "learning_rate": 0.0002795790876170677, "loss": 0.0272, "step": 52520 }, { "epoch": 0.14, "learning_rate": 0.0002795751994006962, "loss": 0.0287, "step": 52530 }, { "epoch": 0.14, "learning_rate": 0.0002795713111843248, "loss": 0.0269, "step": 52540 }, { "epoch": 0.14, "learning_rate": 0.0002795674229679533, "loss": 0.0289, "step": 52550 }, { "epoch": 0.14, "learning_rate": 0.0002795635347515818, "loss": 0.026, "step": 52560 }, { "epoch": 0.14, "learning_rate": 0.0002795596465352104, "loss": 0.0259, "step": 52570 }, { "epoch": 0.14, "learning_rate": 0.00027955575831883895, "loss": 0.0306, "step": 52580 }, { "epoch": 0.14, "learning_rate": 0.00027955187010246746, "loss": 0.0282, "step": 52590 }, { "epoch": 0.14, "learning_rate": 0.000279547981886096, "loss": 0.0276, "step": 52600 }, { "epoch": 0.14, "learning_rate": 0.0002795440936697245, "loss": 0.0306, "step": 52610 }, { "epoch": 0.14, "learning_rate": 0.000279540205453353, "loss": 0.0253, "step": 52620 }, { "epoch": 0.14, "learning_rate": 0.00027953631723698157, "loss": 0.0317, "step": 52630 }, { "epoch": 0.14, "learning_rate": 0.00027953242902061014, "loss": 0.0285, "step": 52640 }, { "epoch": 0.14, "learning_rate": 0.00027952854080423866, "loss": 0.0237, "step": 52650 }, { "epoch": 0.14, "learning_rate": 0.00027952465258786717, "loss": 0.0256, "step": 52660 }, { "epoch": 0.14, "learning_rate": 0.00027952076437149574, "loss": 0.0275, "step": 52670 }, { "epoch": 0.14, "learning_rate": 0.00027951687615512425, "loss": 0.0261, "step": 52680 }, { "epoch": 0.14, "learning_rate": 0.00027951298793875277, "loss": 0.0256, "step": 52690 }, { "epoch": 0.14, "learning_rate": 0.00027950909972238134, "loss": 0.0246, "step": 52700 }, { "epoch": 0.14, "learning_rate": 0.00027950521150600985, "loss": 0.0341, "step": 52710 }, { "epoch": 0.14, "learning_rate": 0.0002795013232896384, "loss": 0.0258, "step": 52720 }, { "epoch": 0.14, "learning_rate": 0.00027949743507326693, "loss": 0.0322, "step": 52730 }, { "epoch": 0.14, "learning_rate": 0.00027949354685689545, "loss": 0.0261, "step": 52740 }, { "epoch": 0.14, "learning_rate": 0.000279489658640524, "loss": 0.0232, "step": 52750 }, { "epoch": 0.14, "learning_rate": 0.00027948577042415253, "loss": 0.0271, "step": 52760 }, { "epoch": 0.14, "learning_rate": 0.00027948188220778105, "loss": 0.0307, "step": 52770 }, { "epoch": 0.14, "learning_rate": 0.0002794779939914096, "loss": 0.0267, "step": 52780 }, { "epoch": 0.14, "learning_rate": 0.0002794741057750382, "loss": 0.021, "step": 52790 }, { "epoch": 0.14, "learning_rate": 0.0002794702175586667, "loss": 0.0284, "step": 52800 }, { "epoch": 0.14, "learning_rate": 0.0002794663293422952, "loss": 0.0262, "step": 52810 }, { "epoch": 0.14, "learning_rate": 0.00027946244112592373, "loss": 0.0275, "step": 52820 }, { "epoch": 0.14, "learning_rate": 0.0002794585529095523, "loss": 0.0279, "step": 52830 }, { "epoch": 0.14, "learning_rate": 0.0002794546646931808, "loss": 0.0372, "step": 52840 }, { "epoch": 0.14, "learning_rate": 0.0002794507764768094, "loss": 0.0284, "step": 52850 }, { "epoch": 0.14, "learning_rate": 0.0002794468882604379, "loss": 0.024, "step": 52860 }, { "epoch": 0.14, "learning_rate": 0.0002794430000440664, "loss": 0.03, "step": 52870 }, { "epoch": 0.14, "learning_rate": 0.000279439111827695, "loss": 0.0271, "step": 52880 }, { "epoch": 0.14, "learning_rate": 0.0002794352236113235, "loss": 0.0279, "step": 52890 }, { "epoch": 0.14, "learning_rate": 0.000279431335394952, "loss": 0.0286, "step": 52900 }, { "epoch": 0.14, "learning_rate": 0.0002794274471785806, "loss": 0.0233, "step": 52910 }, { "epoch": 0.14, "learning_rate": 0.0002794235589622091, "loss": 0.0276, "step": 52920 }, { "epoch": 0.14, "learning_rate": 0.00027941967074583766, "loss": 0.0199, "step": 52930 }, { "epoch": 0.14, "learning_rate": 0.0002794157825294662, "loss": 0.0299, "step": 52940 }, { "epoch": 0.14, "learning_rate": 0.0002794118943130947, "loss": 0.0275, "step": 52950 }, { "epoch": 0.14, "learning_rate": 0.00027940800609672326, "loss": 0.0238, "step": 52960 }, { "epoch": 0.14, "learning_rate": 0.00027940411788035177, "loss": 0.04, "step": 52970 }, { "epoch": 0.14, "learning_rate": 0.00027940022966398034, "loss": 0.0266, "step": 52980 }, { "epoch": 0.14, "learning_rate": 0.00027939634144760885, "loss": 0.0243, "step": 52990 }, { "epoch": 0.14, "learning_rate": 0.0002793924532312374, "loss": 0.0283, "step": 53000 }, { "epoch": 0.14, "eval_cer": 0.8818118580040337, "eval_loss": 0.020349837839603424, "eval_runtime": 107.4292, "eval_samples_per_second": 18.617, "eval_steps_per_second": 4.654, "step": 53000 }, { "epoch": 0.14, "learning_rate": 0.00027938856501486594, "loss": 0.0208, "step": 53010 }, { "epoch": 0.14, "learning_rate": 0.00027938467679849445, "loss": 0.0279, "step": 53020 }, { "epoch": 0.14, "learning_rate": 0.00027938078858212297, "loss": 0.026, "step": 53030 }, { "epoch": 0.14, "learning_rate": 0.00027937690036575154, "loss": 0.0276, "step": 53040 }, { "epoch": 0.14, "learning_rate": 0.00027937301214938005, "loss": 0.0284, "step": 53050 }, { "epoch": 0.14, "learning_rate": 0.0002793691239330086, "loss": 0.0289, "step": 53060 }, { "epoch": 0.14, "learning_rate": 0.00027936523571663713, "loss": 0.0238, "step": 53070 }, { "epoch": 0.14, "learning_rate": 0.0002793613475002657, "loss": 0.0247, "step": 53080 }, { "epoch": 0.14, "learning_rate": 0.0002793574592838942, "loss": 0.023, "step": 53090 }, { "epoch": 0.14, "learning_rate": 0.00027935357106752273, "loss": 0.0326, "step": 53100 }, { "epoch": 0.14, "learning_rate": 0.00027934968285115125, "loss": 0.0278, "step": 53110 }, { "epoch": 0.14, "learning_rate": 0.0002793457946347798, "loss": 0.0372, "step": 53120 }, { "epoch": 0.14, "learning_rate": 0.0002793419064184084, "loss": 0.0275, "step": 53130 }, { "epoch": 0.14, "learning_rate": 0.0002793380182020369, "loss": 0.0295, "step": 53140 }, { "epoch": 0.14, "learning_rate": 0.0002793341299856654, "loss": 0.0253, "step": 53150 }, { "epoch": 0.14, "learning_rate": 0.0002793302417692939, "loss": 0.0303, "step": 53160 }, { "epoch": 0.14, "learning_rate": 0.0002793263535529225, "loss": 0.0257, "step": 53170 }, { "epoch": 0.14, "learning_rate": 0.000279322465336551, "loss": 0.028, "step": 53180 }, { "epoch": 0.14, "learning_rate": 0.0002793185771201796, "loss": 0.0219, "step": 53190 }, { "epoch": 0.14, "learning_rate": 0.0002793146889038081, "loss": 0.0224, "step": 53200 }, { "epoch": 0.14, "learning_rate": 0.00027931080068743666, "loss": 0.0261, "step": 53210 }, { "epoch": 0.14, "learning_rate": 0.0002793069124710652, "loss": 0.0321, "step": 53220 }, { "epoch": 0.14, "learning_rate": 0.0002793030242546937, "loss": 0.0288, "step": 53230 }, { "epoch": 0.14, "learning_rate": 0.0002792991360383222, "loss": 0.0248, "step": 53240 }, { "epoch": 0.14, "learning_rate": 0.0002792952478219508, "loss": 0.0248, "step": 53250 }, { "epoch": 0.14, "learning_rate": 0.0002792913596055793, "loss": 0.0246, "step": 53260 }, { "epoch": 0.14, "learning_rate": 0.00027928747138920786, "loss": 0.0273, "step": 53270 }, { "epoch": 0.14, "learning_rate": 0.00027928358317283637, "loss": 0.025, "step": 53280 }, { "epoch": 0.14, "learning_rate": 0.00027927969495646494, "loss": 0.0269, "step": 53290 }, { "epoch": 0.14, "learning_rate": 0.00027927580674009346, "loss": 0.0237, "step": 53300 }, { "epoch": 0.14, "learning_rate": 0.00027927191852372197, "loss": 0.0304, "step": 53310 }, { "epoch": 0.14, "learning_rate": 0.0002792680303073505, "loss": 0.0289, "step": 53320 }, { "epoch": 0.14, "learning_rate": 0.00027926414209097905, "loss": 0.0296, "step": 53330 }, { "epoch": 0.14, "learning_rate": 0.0002792602538746076, "loss": 0.028, "step": 53340 }, { "epoch": 0.14, "learning_rate": 0.00027925636565823614, "loss": 0.0249, "step": 53350 }, { "epoch": 0.14, "learning_rate": 0.00027925247744186465, "loss": 0.0297, "step": 53360 }, { "epoch": 0.14, "learning_rate": 0.00027924858922549317, "loss": 0.0312, "step": 53370 }, { "epoch": 0.14, "learning_rate": 0.00027924470100912173, "loss": 0.0266, "step": 53380 }, { "epoch": 0.14, "learning_rate": 0.00027924081279275025, "loss": 0.0266, "step": 53390 }, { "epoch": 0.14, "learning_rate": 0.0002792369245763788, "loss": 0.0334, "step": 53400 }, { "epoch": 0.14, "learning_rate": 0.00027923303636000733, "loss": 0.027, "step": 53410 }, { "epoch": 0.14, "learning_rate": 0.0002792291481436359, "loss": 0.0301, "step": 53420 }, { "epoch": 0.14, "learning_rate": 0.0002792252599272644, "loss": 0.0268, "step": 53430 }, { "epoch": 0.14, "learning_rate": 0.00027922137171089293, "loss": 0.0275, "step": 53440 }, { "epoch": 0.14, "learning_rate": 0.00027921748349452144, "loss": 0.0273, "step": 53450 }, { "epoch": 0.14, "learning_rate": 0.00027921359527815, "loss": 0.0315, "step": 53460 }, { "epoch": 0.14, "learning_rate": 0.00027920970706177853, "loss": 0.0252, "step": 53470 }, { "epoch": 0.14, "learning_rate": 0.0002792058188454071, "loss": 0.0251, "step": 53480 }, { "epoch": 0.14, "learning_rate": 0.0002792019306290356, "loss": 0.0304, "step": 53490 }, { "epoch": 0.14, "learning_rate": 0.0002791980424126642, "loss": 0.0264, "step": 53500 }, { "epoch": 0.14, "learning_rate": 0.0002791941541962927, "loss": 0.03, "step": 53510 }, { "epoch": 0.14, "learning_rate": 0.0002791902659799212, "loss": 0.0276, "step": 53520 }, { "epoch": 0.14, "learning_rate": 0.0002791863777635498, "loss": 0.0242, "step": 53530 }, { "epoch": 0.14, "learning_rate": 0.0002791824895471783, "loss": 0.0283, "step": 53540 }, { "epoch": 0.14, "learning_rate": 0.00027917860133080686, "loss": 0.0299, "step": 53550 }, { "epoch": 0.14, "learning_rate": 0.0002791747131144354, "loss": 0.0294, "step": 53560 }, { "epoch": 0.14, "learning_rate": 0.0002791708248980639, "loss": 0.0317, "step": 53570 }, { "epoch": 0.14, "learning_rate": 0.00027916693668169246, "loss": 0.0282, "step": 53580 }, { "epoch": 0.14, "learning_rate": 0.000279163048465321, "loss": 0.0258, "step": 53590 }, { "epoch": 0.14, "learning_rate": 0.0002791591602489495, "loss": 0.0248, "step": 53600 }, { "epoch": 0.14, "learning_rate": 0.00027915527203257806, "loss": 0.0225, "step": 53610 }, { "epoch": 0.14, "learning_rate": 0.00027915138381620657, "loss": 0.0363, "step": 53620 }, { "epoch": 0.14, "learning_rate": 0.00027914749559983514, "loss": 0.0251, "step": 53630 }, { "epoch": 0.14, "learning_rate": 0.00027914360738346365, "loss": 0.0259, "step": 53640 }, { "epoch": 0.14, "learning_rate": 0.00027913971916709217, "loss": 0.0321, "step": 53650 }, { "epoch": 0.14, "learning_rate": 0.0002791358309507207, "loss": 0.023, "step": 53660 }, { "epoch": 0.14, "learning_rate": 0.00027913194273434925, "loss": 0.0282, "step": 53670 }, { "epoch": 0.14, "learning_rate": 0.0002791280545179778, "loss": 0.0234, "step": 53680 }, { "epoch": 0.14, "learning_rate": 0.00027912416630160634, "loss": 0.0338, "step": 53690 }, { "epoch": 0.14, "learning_rate": 0.00027912027808523485, "loss": 0.0284, "step": 53700 }, { "epoch": 0.14, "learning_rate": 0.0002791163898688634, "loss": 0.0284, "step": 53710 }, { "epoch": 0.14, "learning_rate": 0.00027911250165249193, "loss": 0.0309, "step": 53720 }, { "epoch": 0.14, "learning_rate": 0.00027910861343612045, "loss": 0.0338, "step": 53730 }, { "epoch": 0.14, "learning_rate": 0.000279104725219749, "loss": 0.0288, "step": 53740 }, { "epoch": 0.14, "learning_rate": 0.00027910083700337753, "loss": 0.0241, "step": 53750 }, { "epoch": 0.14, "learning_rate": 0.0002790969487870061, "loss": 0.0306, "step": 53760 }, { "epoch": 0.14, "learning_rate": 0.0002790930605706346, "loss": 0.0242, "step": 53770 }, { "epoch": 0.14, "learning_rate": 0.00027908917235426313, "loss": 0.0248, "step": 53780 }, { "epoch": 0.14, "learning_rate": 0.0002790852841378917, "loss": 0.0295, "step": 53790 }, { "epoch": 0.14, "learning_rate": 0.0002790813959215202, "loss": 0.0266, "step": 53800 }, { "epoch": 0.14, "learning_rate": 0.0002790775077051487, "loss": 0.0224, "step": 53810 }, { "epoch": 0.14, "learning_rate": 0.0002790736194887773, "loss": 0.029, "step": 53820 }, { "epoch": 0.14, "learning_rate": 0.00027906973127240586, "loss": 0.0346, "step": 53830 }, { "epoch": 0.14, "learning_rate": 0.0002790658430560344, "loss": 0.0281, "step": 53840 }, { "epoch": 0.14, "learning_rate": 0.0002790619548396629, "loss": 0.0242, "step": 53850 }, { "epoch": 0.14, "learning_rate": 0.0002790580666232914, "loss": 0.032, "step": 53860 }, { "epoch": 0.14, "learning_rate": 0.0002790541784069199, "loss": 0.0319, "step": 53870 }, { "epoch": 0.14, "learning_rate": 0.0002790502901905485, "loss": 0.0296, "step": 53880 }, { "epoch": 0.14, "learning_rate": 0.00027904640197417706, "loss": 0.0288, "step": 53890 }, { "epoch": 0.14, "learning_rate": 0.0002790425137578056, "loss": 0.0279, "step": 53900 }, { "epoch": 0.14, "learning_rate": 0.0002790386255414341, "loss": 0.0271, "step": 53910 }, { "epoch": 0.14, "learning_rate": 0.00027903473732506266, "loss": 0.025, "step": 53920 }, { "epoch": 0.14, "learning_rate": 0.00027903084910869117, "loss": 0.0272, "step": 53930 }, { "epoch": 0.14, "learning_rate": 0.0002790269608923197, "loss": 0.0277, "step": 53940 }, { "epoch": 0.14, "learning_rate": 0.00027902307267594826, "loss": 0.0297, "step": 53950 }, { "epoch": 0.14, "learning_rate": 0.00027901918445957677, "loss": 0.0205, "step": 53960 }, { "epoch": 0.14, "learning_rate": 0.00027901529624320534, "loss": 0.0264, "step": 53970 }, { "epoch": 0.14, "learning_rate": 0.00027901140802683385, "loss": 0.031, "step": 53980 }, { "epoch": 0.14, "learning_rate": 0.00027900751981046237, "loss": 0.0285, "step": 53990 }, { "epoch": 0.14, "learning_rate": 0.00027900363159409094, "loss": 0.0264, "step": 54000 }, { "epoch": 0.14, "eval_cer": 0.8818370514688489, "eval_loss": 0.02024264447391033, "eval_runtime": 108.1973, "eval_samples_per_second": 18.485, "eval_steps_per_second": 4.621, "step": 54000 }, { "epoch": 0.14, "learning_rate": 0.00027899974337771945, "loss": 0.0249, "step": 54010 }, { "epoch": 0.14, "learning_rate": 0.00027899585516134797, "loss": 0.03, "step": 54020 }, { "epoch": 0.14, "learning_rate": 0.00027899196694497653, "loss": 0.0298, "step": 54030 }, { "epoch": 0.14, "learning_rate": 0.0002789880787286051, "loss": 0.0303, "step": 54040 }, { "epoch": 0.14, "learning_rate": 0.0002789841905122336, "loss": 0.0265, "step": 54050 }, { "epoch": 0.14, "learning_rate": 0.00027898030229586213, "loss": 0.028, "step": 54060 }, { "epoch": 0.14, "learning_rate": 0.00027897641407949065, "loss": 0.0231, "step": 54070 }, { "epoch": 0.14, "learning_rate": 0.0002789725258631192, "loss": 0.0276, "step": 54080 }, { "epoch": 0.14, "learning_rate": 0.00027896863764674773, "loss": 0.0264, "step": 54090 }, { "epoch": 0.14, "learning_rate": 0.0002789647494303763, "loss": 0.0235, "step": 54100 }, { "epoch": 0.14, "learning_rate": 0.0002789608612140048, "loss": 0.0299, "step": 54110 }, { "epoch": 0.14, "learning_rate": 0.00027895697299763333, "loss": 0.0258, "step": 54120 }, { "epoch": 0.14, "learning_rate": 0.0002789530847812619, "loss": 0.028, "step": 54130 }, { "epoch": 0.14, "learning_rate": 0.0002789491965648904, "loss": 0.0259, "step": 54140 }, { "epoch": 0.14, "learning_rate": 0.0002789453083485189, "loss": 0.0242, "step": 54150 }, { "epoch": 0.14, "learning_rate": 0.0002789414201321475, "loss": 0.0272, "step": 54160 }, { "epoch": 0.14, "learning_rate": 0.000278937531915776, "loss": 0.0273, "step": 54170 }, { "epoch": 0.14, "learning_rate": 0.0002789336436994046, "loss": 0.0258, "step": 54180 }, { "epoch": 0.14, "learning_rate": 0.0002789297554830331, "loss": 0.0296, "step": 54190 }, { "epoch": 0.14, "learning_rate": 0.0002789258672666616, "loss": 0.0272, "step": 54200 }, { "epoch": 0.14, "learning_rate": 0.0002789219790502902, "loss": 0.0248, "step": 54210 }, { "epoch": 0.14, "learning_rate": 0.0002789180908339187, "loss": 0.0284, "step": 54220 }, { "epoch": 0.14, "learning_rate": 0.00027891420261754726, "loss": 0.0257, "step": 54230 }, { "epoch": 0.14, "learning_rate": 0.0002789103144011758, "loss": 0.0261, "step": 54240 }, { "epoch": 0.14, "learning_rate": 0.00027890642618480434, "loss": 0.0293, "step": 54250 }, { "epoch": 0.14, "learning_rate": 0.00027890253796843286, "loss": 0.0233, "step": 54260 }, { "epoch": 0.14, "learning_rate": 0.00027889864975206137, "loss": 0.0297, "step": 54270 }, { "epoch": 0.14, "learning_rate": 0.0002788947615356899, "loss": 0.0333, "step": 54280 }, { "epoch": 0.14, "learning_rate": 0.00027889087331931845, "loss": 0.0267, "step": 54290 }, { "epoch": 0.14, "learning_rate": 0.00027888698510294697, "loss": 0.0313, "step": 54300 }, { "epoch": 0.14, "learning_rate": 0.00027888309688657554, "loss": 0.0264, "step": 54310 }, { "epoch": 0.14, "learning_rate": 0.00027887920867020405, "loss": 0.028, "step": 54320 }, { "epoch": 0.14, "learning_rate": 0.0002788753204538326, "loss": 0.0311, "step": 54330 }, { "epoch": 0.14, "learning_rate": 0.00027887143223746114, "loss": 0.0268, "step": 54340 }, { "epoch": 0.14, "learning_rate": 0.00027886754402108965, "loss": 0.0298, "step": 54350 }, { "epoch": 0.14, "learning_rate": 0.00027886365580471816, "loss": 0.0248, "step": 54360 }, { "epoch": 0.14, "learning_rate": 0.00027885976758834673, "loss": 0.0289, "step": 54370 }, { "epoch": 0.14, "learning_rate": 0.0002788558793719753, "loss": 0.0236, "step": 54380 }, { "epoch": 0.14, "learning_rate": 0.0002788519911556038, "loss": 0.0311, "step": 54390 }, { "epoch": 0.14, "learning_rate": 0.00027884810293923233, "loss": 0.0295, "step": 54400 }, { "epoch": 0.14, "learning_rate": 0.00027884421472286085, "loss": 0.0223, "step": 54410 }, { "epoch": 0.14, "learning_rate": 0.0002788403265064894, "loss": 0.0294, "step": 54420 }, { "epoch": 0.14, "learning_rate": 0.00027883643829011793, "loss": 0.0312, "step": 54430 }, { "epoch": 0.14, "learning_rate": 0.0002788325500737465, "loss": 0.0252, "step": 54440 }, { "epoch": 0.14, "learning_rate": 0.000278828661857375, "loss": 0.0241, "step": 54450 }, { "epoch": 0.14, "learning_rate": 0.0002788247736410036, "loss": 0.0263, "step": 54460 }, { "epoch": 0.14, "learning_rate": 0.0002788208854246321, "loss": 0.0316, "step": 54470 }, { "epoch": 0.14, "learning_rate": 0.0002788169972082606, "loss": 0.0284, "step": 54480 }, { "epoch": 0.14, "learning_rate": 0.0002788131089918891, "loss": 0.0258, "step": 54490 }, { "epoch": 0.14, "learning_rate": 0.0002788092207755177, "loss": 0.0238, "step": 54500 }, { "epoch": 0.14, "learning_rate": 0.0002788053325591462, "loss": 0.0301, "step": 54510 }, { "epoch": 0.14, "learning_rate": 0.0002788014443427748, "loss": 0.029, "step": 54520 }, { "epoch": 0.14, "learning_rate": 0.0002787975561264033, "loss": 0.0262, "step": 54530 }, { "epoch": 0.14, "learning_rate": 0.00027879366791003186, "loss": 0.0293, "step": 54540 }, { "epoch": 0.14, "learning_rate": 0.0002787897796936604, "loss": 0.0256, "step": 54550 }, { "epoch": 0.14, "learning_rate": 0.0002787858914772889, "loss": 0.0244, "step": 54560 }, { "epoch": 0.14, "learning_rate": 0.00027878200326091746, "loss": 0.0242, "step": 54570 }, { "epoch": 0.14, "learning_rate": 0.00027877811504454597, "loss": 0.0308, "step": 54580 }, { "epoch": 0.14, "learning_rate": 0.00027877422682817454, "loss": 0.0271, "step": 54590 }, { "epoch": 0.14, "learning_rate": 0.00027877033861180306, "loss": 0.028, "step": 54600 }, { "epoch": 0.14, "learning_rate": 0.00027876645039543157, "loss": 0.0256, "step": 54610 }, { "epoch": 0.14, "learning_rate": 0.0002787625621790601, "loss": 0.0297, "step": 54620 }, { "epoch": 0.14, "learning_rate": 0.00027875867396268865, "loss": 0.0266, "step": 54630 }, { "epoch": 0.14, "learning_rate": 0.00027875478574631717, "loss": 0.0247, "step": 54640 }, { "epoch": 0.14, "learning_rate": 0.00027875089752994574, "loss": 0.0288, "step": 54650 }, { "epoch": 0.14, "learning_rate": 0.00027874700931357425, "loss": 0.0288, "step": 54660 }, { "epoch": 0.14, "learning_rate": 0.0002787431210972028, "loss": 0.0273, "step": 54670 }, { "epoch": 0.14, "learning_rate": 0.00027873923288083133, "loss": 0.0334, "step": 54680 }, { "epoch": 0.14, "learning_rate": 0.00027873534466445985, "loss": 0.0261, "step": 54690 }, { "epoch": 0.14, "learning_rate": 0.00027873145644808836, "loss": 0.0263, "step": 54700 }, { "epoch": 0.14, "learning_rate": 0.00027872756823171693, "loss": 0.0279, "step": 54710 }, { "epoch": 0.14, "learning_rate": 0.0002787236800153455, "loss": 0.0281, "step": 54720 }, { "epoch": 0.14, "learning_rate": 0.000278719791798974, "loss": 0.0227, "step": 54730 }, { "epoch": 0.14, "learning_rate": 0.00027871590358260253, "loss": 0.025, "step": 54740 }, { "epoch": 0.14, "learning_rate": 0.0002787120153662311, "loss": 0.0274, "step": 54750 }, { "epoch": 0.14, "learning_rate": 0.0002787081271498596, "loss": 0.0281, "step": 54760 }, { "epoch": 0.14, "learning_rate": 0.00027870423893348813, "loss": 0.0291, "step": 54770 }, { "epoch": 0.14, "learning_rate": 0.0002787003507171167, "loss": 0.0305, "step": 54780 }, { "epoch": 0.14, "learning_rate": 0.0002786964625007452, "loss": 0.0258, "step": 54790 }, { "epoch": 0.14, "learning_rate": 0.0002786925742843738, "loss": 0.0268, "step": 54800 }, { "epoch": 0.14, "learning_rate": 0.0002786886860680023, "loss": 0.0278, "step": 54810 }, { "epoch": 0.14, "learning_rate": 0.0002786847978516308, "loss": 0.0316, "step": 54820 }, { "epoch": 0.14, "learning_rate": 0.0002786809096352594, "loss": 0.0279, "step": 54830 }, { "epoch": 0.14, "learning_rate": 0.0002786770214188879, "loss": 0.0246, "step": 54840 }, { "epoch": 0.14, "learning_rate": 0.0002786731332025164, "loss": 0.0288, "step": 54850 }, { "epoch": 0.14, "learning_rate": 0.000278669244986145, "loss": 0.0266, "step": 54860 }, { "epoch": 0.14, "learning_rate": 0.0002786653567697735, "loss": 0.0304, "step": 54870 }, { "epoch": 0.14, "learning_rate": 0.00027866146855340206, "loss": 0.0289, "step": 54880 }, { "epoch": 0.14, "learning_rate": 0.0002786575803370306, "loss": 0.0261, "step": 54890 }, { "epoch": 0.14, "learning_rate": 0.0002786536921206591, "loss": 0.0237, "step": 54900 }, { "epoch": 0.14, "learning_rate": 0.0002786498039042876, "loss": 0.0234, "step": 54910 }, { "epoch": 0.14, "learning_rate": 0.00027864591568791617, "loss": 0.0295, "step": 54920 }, { "epoch": 0.14, "learning_rate": 0.00027864202747154474, "loss": 0.0272, "step": 54930 }, { "epoch": 0.14, "learning_rate": 0.00027863813925517325, "loss": 0.0233, "step": 54940 }, { "epoch": 0.14, "learning_rate": 0.00027863425103880177, "loss": 0.0316, "step": 54950 }, { "epoch": 0.14, "learning_rate": 0.00027863036282243034, "loss": 0.0307, "step": 54960 }, { "epoch": 0.14, "learning_rate": 0.00027862647460605885, "loss": 0.0311, "step": 54970 }, { "epoch": 0.14, "learning_rate": 0.00027862258638968737, "loss": 0.0273, "step": 54980 }, { "epoch": 0.14, "learning_rate": 0.00027861869817331594, "loss": 0.0253, "step": 54990 }, { "epoch": 0.14, "learning_rate": 0.00027861480995694445, "loss": 0.0254, "step": 55000 }, { "epoch": 0.14, "eval_cer": 0.881821655462573, "eval_loss": 0.02109946869313717, "eval_runtime": 108.1363, "eval_samples_per_second": 18.495, "eval_steps_per_second": 4.624, "step": 55000 }, { "epoch": 0.14, "learning_rate": 0.000278610921740573, "loss": 0.0242, "step": 55010 }, { "epoch": 0.14, "learning_rate": 0.00027860703352420153, "loss": 0.0291, "step": 55020 }, { "epoch": 0.14, "learning_rate": 0.00027860314530783005, "loss": 0.0259, "step": 55030 }, { "epoch": 0.14, "learning_rate": 0.0002785992570914586, "loss": 0.0267, "step": 55040 }, { "epoch": 0.14, "learning_rate": 0.00027859536887508713, "loss": 0.0314, "step": 55050 }, { "epoch": 0.14, "learning_rate": 0.00027859148065871565, "loss": 0.0352, "step": 55060 }, { "epoch": 0.14, "learning_rate": 0.0002785875924423442, "loss": 0.0326, "step": 55070 }, { "epoch": 0.14, "learning_rate": 0.00027858370422597273, "loss": 0.0299, "step": 55080 }, { "epoch": 0.14, "learning_rate": 0.0002785798160096013, "loss": 0.031, "step": 55090 }, { "epoch": 0.14, "learning_rate": 0.0002785759277932298, "loss": 0.0238, "step": 55100 }, { "epoch": 0.14, "learning_rate": 0.0002785720395768583, "loss": 0.0287, "step": 55110 }, { "epoch": 0.14, "learning_rate": 0.0002785681513604869, "loss": 0.0305, "step": 55120 }, { "epoch": 0.14, "learning_rate": 0.0002785642631441154, "loss": 0.0259, "step": 55130 }, { "epoch": 0.14, "learning_rate": 0.000278560374927744, "loss": 0.0293, "step": 55140 }, { "epoch": 0.14, "learning_rate": 0.0002785564867113725, "loss": 0.0296, "step": 55150 }, { "epoch": 0.14, "learning_rate": 0.000278552598495001, "loss": 0.028, "step": 55160 }, { "epoch": 0.14, "learning_rate": 0.0002785487102786296, "loss": 0.0301, "step": 55170 }, { "epoch": 0.14, "learning_rate": 0.0002785448220622581, "loss": 0.0271, "step": 55180 }, { "epoch": 0.14, "learning_rate": 0.0002785409338458866, "loss": 0.0272, "step": 55190 }, { "epoch": 0.14, "learning_rate": 0.0002785370456295152, "loss": 0.0272, "step": 55200 }, { "epoch": 0.14, "learning_rate": 0.0002785331574131437, "loss": 0.0304, "step": 55210 }, { "epoch": 0.14, "learning_rate": 0.00027852926919677226, "loss": 0.028, "step": 55220 }, { "epoch": 0.14, "learning_rate": 0.00027852538098040077, "loss": 0.0258, "step": 55230 }, { "epoch": 0.14, "learning_rate": 0.0002785214927640293, "loss": 0.0265, "step": 55240 }, { "epoch": 0.14, "learning_rate": 0.00027851760454765786, "loss": 0.0239, "step": 55250 }, { "epoch": 0.14, "learning_rate": 0.00027851371633128637, "loss": 0.0218, "step": 55260 }, { "epoch": 0.14, "learning_rate": 0.00027850982811491494, "loss": 0.0293, "step": 55270 }, { "epoch": 0.14, "learning_rate": 0.00027850593989854345, "loss": 0.0278, "step": 55280 }, { "epoch": 0.14, "learning_rate": 0.000278502051682172, "loss": 0.0247, "step": 55290 }, { "epoch": 0.14, "learning_rate": 0.00027849816346580054, "loss": 0.03, "step": 55300 }, { "epoch": 0.14, "learning_rate": 0.00027849427524942905, "loss": 0.0294, "step": 55310 }, { "epoch": 0.14, "learning_rate": 0.00027849038703305757, "loss": 0.0237, "step": 55320 }, { "epoch": 0.14, "learning_rate": 0.00027848649881668613, "loss": 0.0271, "step": 55330 }, { "epoch": 0.14, "learning_rate": 0.00027848261060031465, "loss": 0.0272, "step": 55340 }, { "epoch": 0.14, "learning_rate": 0.0002784787223839432, "loss": 0.027, "step": 55350 }, { "epoch": 0.14, "learning_rate": 0.00027847483416757173, "loss": 0.0265, "step": 55360 }, { "epoch": 0.14, "learning_rate": 0.00027847094595120025, "loss": 0.0304, "step": 55370 }, { "epoch": 0.14, "learning_rate": 0.0002784670577348288, "loss": 0.0313, "step": 55380 }, { "epoch": 0.14, "learning_rate": 0.00027846316951845733, "loss": 0.0259, "step": 55390 }, { "epoch": 0.14, "learning_rate": 0.00027845928130208584, "loss": 0.0366, "step": 55400 }, { "epoch": 0.14, "learning_rate": 0.0002784553930857144, "loss": 0.0232, "step": 55410 }, { "epoch": 0.14, "learning_rate": 0.000278451504869343, "loss": 0.0275, "step": 55420 }, { "epoch": 0.14, "learning_rate": 0.0002784476166529715, "loss": 0.0275, "step": 55430 }, { "epoch": 0.14, "learning_rate": 0.0002784437284366, "loss": 0.0243, "step": 55440 }, { "epoch": 0.14, "learning_rate": 0.0002784398402202285, "loss": 0.0304, "step": 55450 }, { "epoch": 0.14, "learning_rate": 0.0002784359520038571, "loss": 0.0289, "step": 55460 }, { "epoch": 0.14, "learning_rate": 0.0002784320637874856, "loss": 0.027, "step": 55470 }, { "epoch": 0.14, "learning_rate": 0.0002784281755711142, "loss": 0.026, "step": 55480 }, { "epoch": 0.14, "learning_rate": 0.0002784242873547427, "loss": 0.0303, "step": 55490 }, { "epoch": 0.14, "learning_rate": 0.00027842039913837126, "loss": 0.0218, "step": 55500 }, { "epoch": 0.14, "learning_rate": 0.0002784165109219998, "loss": 0.0262, "step": 55510 }, { "epoch": 0.14, "learning_rate": 0.0002784126227056283, "loss": 0.0268, "step": 55520 }, { "epoch": 0.14, "learning_rate": 0.0002784087344892568, "loss": 0.0276, "step": 55530 }, { "epoch": 0.14, "learning_rate": 0.00027840484627288537, "loss": 0.0285, "step": 55540 }, { "epoch": 0.14, "learning_rate": 0.0002784009580565139, "loss": 0.0295, "step": 55550 }, { "epoch": 0.14, "learning_rate": 0.00027839706984014246, "loss": 0.0271, "step": 55560 }, { "epoch": 0.14, "learning_rate": 0.00027839318162377097, "loss": 0.0258, "step": 55570 }, { "epoch": 0.14, "learning_rate": 0.0002783892934073995, "loss": 0.0302, "step": 55580 }, { "epoch": 0.14, "learning_rate": 0.00027838540519102805, "loss": 0.024, "step": 55590 }, { "epoch": 0.14, "learning_rate": 0.00027838151697465657, "loss": 0.0267, "step": 55600 }, { "epoch": 0.14, "learning_rate": 0.0002783776287582851, "loss": 0.022, "step": 55610 }, { "epoch": 0.14, "learning_rate": 0.00027837374054191365, "loss": 0.0253, "step": 55620 }, { "epoch": 0.14, "learning_rate": 0.0002783698523255422, "loss": 0.0271, "step": 55630 }, { "epoch": 0.14, "learning_rate": 0.00027836596410917073, "loss": 0.0259, "step": 55640 }, { "epoch": 0.14, "learning_rate": 0.00027836207589279925, "loss": 0.0312, "step": 55650 }, { "epoch": 0.14, "learning_rate": 0.00027835818767642776, "loss": 0.0251, "step": 55660 }, { "epoch": 0.14, "learning_rate": 0.00027835429946005633, "loss": 0.0289, "step": 55670 }, { "epoch": 0.14, "learning_rate": 0.00027835041124368485, "loss": 0.033, "step": 55680 }, { "epoch": 0.14, "learning_rate": 0.0002783465230273134, "loss": 0.0286, "step": 55690 }, { "epoch": 0.14, "learning_rate": 0.00027834263481094193, "loss": 0.0254, "step": 55700 }, { "epoch": 0.14, "learning_rate": 0.0002783387465945705, "loss": 0.0237, "step": 55710 }, { "epoch": 0.14, "learning_rate": 0.000278334858378199, "loss": 0.0239, "step": 55720 }, { "epoch": 0.14, "learning_rate": 0.00027833097016182753, "loss": 0.0207, "step": 55730 }, { "epoch": 0.14, "learning_rate": 0.00027832708194545604, "loss": 0.0277, "step": 55740 }, { "epoch": 0.14, "learning_rate": 0.0002783231937290846, "loss": 0.0256, "step": 55750 }, { "epoch": 0.14, "learning_rate": 0.0002783193055127131, "loss": 0.0277, "step": 55760 }, { "epoch": 0.14, "learning_rate": 0.0002783154172963417, "loss": 0.0232, "step": 55770 }, { "epoch": 0.14, "learning_rate": 0.0002783115290799702, "loss": 0.0303, "step": 55780 }, { "epoch": 0.14, "learning_rate": 0.0002783076408635988, "loss": 0.0273, "step": 55790 }, { "epoch": 0.14, "learning_rate": 0.0002783037526472273, "loss": 0.029, "step": 55800 }, { "epoch": 0.14, "learning_rate": 0.0002782998644308558, "loss": 0.0389, "step": 55810 }, { "epoch": 0.14, "learning_rate": 0.0002782959762144844, "loss": 0.025, "step": 55820 }, { "epoch": 0.14, "learning_rate": 0.0002782920879981129, "loss": 0.0285, "step": 55830 }, { "epoch": 0.14, "learning_rate": 0.00027828819978174146, "loss": 0.0303, "step": 55840 }, { "epoch": 0.14, "learning_rate": 0.00027828431156537, "loss": 0.0269, "step": 55850 }, { "epoch": 0.14, "learning_rate": 0.0002782804233489985, "loss": 0.036, "step": 55860 }, { "epoch": 0.14, "learning_rate": 0.000278276535132627, "loss": 0.0322, "step": 55870 }, { "epoch": 0.14, "learning_rate": 0.00027827264691625557, "loss": 0.0303, "step": 55880 }, { "epoch": 0.14, "learning_rate": 0.0002782687586998841, "loss": 0.0244, "step": 55890 }, { "epoch": 0.14, "learning_rate": 0.00027826487048351265, "loss": 0.0295, "step": 55900 }, { "epoch": 0.14, "learning_rate": 0.00027826098226714117, "loss": 0.0312, "step": 55910 }, { "epoch": 0.14, "learning_rate": 0.00027825709405076974, "loss": 0.0245, "step": 55920 }, { "epoch": 0.14, "learning_rate": 0.00027825320583439825, "loss": 0.0291, "step": 55930 }, { "epoch": 0.15, "learning_rate": 0.00027824931761802677, "loss": 0.0426, "step": 55940 }, { "epoch": 0.15, "learning_rate": 0.0002782454294016553, "loss": 0.0298, "step": 55950 }, { "epoch": 0.15, "learning_rate": 0.00027824154118528385, "loss": 0.0274, "step": 55960 }, { "epoch": 0.15, "learning_rate": 0.0002782376529689124, "loss": 0.0271, "step": 55970 }, { "epoch": 0.15, "learning_rate": 0.00027823376475254093, "loss": 0.0384, "step": 55980 }, { "epoch": 0.15, "learning_rate": 0.00027822987653616945, "loss": 0.0299, "step": 55990 }, { "epoch": 0.15, "learning_rate": 0.000278225988319798, "loss": 0.0241, "step": 56000 }, { "epoch": 0.15, "eval_cer": 0.8818426500165857, "eval_loss": 0.020007161423563957, "eval_runtime": 108.0119, "eval_samples_per_second": 18.516, "eval_steps_per_second": 4.629, "step": 56000 }, { "epoch": 0.15, "learning_rate": 0.00027822210010342653, "loss": 0.0327, "step": 56010 }, { "epoch": 0.15, "learning_rate": 0.00027821821188705505, "loss": 0.0303, "step": 56020 }, { "epoch": 0.15, "learning_rate": 0.0002782143236706836, "loss": 0.0272, "step": 56030 }, { "epoch": 0.15, "learning_rate": 0.00027821043545431213, "loss": 0.0292, "step": 56040 }, { "epoch": 0.15, "learning_rate": 0.0002782065472379407, "loss": 0.0261, "step": 56050 }, { "epoch": 0.15, "learning_rate": 0.0002782026590215692, "loss": 0.0303, "step": 56060 }, { "epoch": 0.15, "learning_rate": 0.00027819877080519773, "loss": 0.0298, "step": 56070 }, { "epoch": 0.15, "learning_rate": 0.00027819488258882624, "loss": 0.0248, "step": 56080 }, { "epoch": 0.15, "learning_rate": 0.0002781909943724548, "loss": 0.0269, "step": 56090 }, { "epoch": 0.15, "learning_rate": 0.0002781871061560833, "loss": 0.0291, "step": 56100 }, { "epoch": 0.15, "learning_rate": 0.0002781832179397119, "loss": 0.0246, "step": 56110 }, { "epoch": 0.15, "learning_rate": 0.0002781793297233404, "loss": 0.0282, "step": 56120 }, { "epoch": 0.15, "learning_rate": 0.000278175441506969, "loss": 0.0294, "step": 56130 }, { "epoch": 0.15, "learning_rate": 0.0002781715532905975, "loss": 0.029, "step": 56140 }, { "epoch": 0.15, "learning_rate": 0.000278167665074226, "loss": 0.0283, "step": 56150 }, { "epoch": 0.15, "learning_rate": 0.0002781637768578546, "loss": 0.036, "step": 56160 }, { "epoch": 0.15, "learning_rate": 0.0002781598886414831, "loss": 0.0245, "step": 56170 }, { "epoch": 0.15, "learning_rate": 0.00027815600042511166, "loss": 0.0371, "step": 56180 }, { "epoch": 0.15, "learning_rate": 0.00027815211220874017, "loss": 0.0281, "step": 56190 }, { "epoch": 0.15, "learning_rate": 0.0002781482239923687, "loss": 0.0245, "step": 56200 }, { "epoch": 0.15, "learning_rate": 0.00027814433577599726, "loss": 0.0276, "step": 56210 }, { "epoch": 0.15, "learning_rate": 0.00027814044755962577, "loss": 0.0325, "step": 56220 }, { "epoch": 0.15, "learning_rate": 0.0002781365593432543, "loss": 0.0291, "step": 56230 }, { "epoch": 0.15, "learning_rate": 0.00027813267112688285, "loss": 0.0312, "step": 56240 }, { "epoch": 0.15, "learning_rate": 0.00027812878291051137, "loss": 0.0254, "step": 56250 }, { "epoch": 0.15, "learning_rate": 0.00027812489469413994, "loss": 0.0322, "step": 56260 }, { "epoch": 0.15, "learning_rate": 0.00027812100647776845, "loss": 0.0256, "step": 56270 }, { "epoch": 0.15, "learning_rate": 0.00027811711826139697, "loss": 0.0283, "step": 56280 }, { "epoch": 0.15, "learning_rate": 0.00027811323004502553, "loss": 0.0231, "step": 56290 }, { "epoch": 0.15, "learning_rate": 0.00027810934182865405, "loss": 0.0205, "step": 56300 }, { "epoch": 0.15, "learning_rate": 0.0002781054536122826, "loss": 0.0273, "step": 56310 }, { "epoch": 0.15, "learning_rate": 0.00027810156539591113, "loss": 0.0252, "step": 56320 }, { "epoch": 0.15, "learning_rate": 0.00027809767717953965, "loss": 0.0249, "step": 56330 }, { "epoch": 0.15, "learning_rate": 0.0002780937889631682, "loss": 0.0308, "step": 56340 }, { "epoch": 0.15, "learning_rate": 0.00027808990074679673, "loss": 0.0273, "step": 56350 }, { "epoch": 0.15, "learning_rate": 0.00027808601253042525, "loss": 0.0259, "step": 56360 }, { "epoch": 0.15, "learning_rate": 0.0002780821243140538, "loss": 0.0275, "step": 56370 }, { "epoch": 0.15, "learning_rate": 0.00027807823609768233, "loss": 0.0267, "step": 56380 }, { "epoch": 0.15, "learning_rate": 0.0002780743478813109, "loss": 0.0259, "step": 56390 }, { "epoch": 0.15, "learning_rate": 0.0002780704596649394, "loss": 0.0284, "step": 56400 }, { "epoch": 0.15, "learning_rate": 0.0002780665714485679, "loss": 0.0261, "step": 56410 }, { "epoch": 0.15, "learning_rate": 0.0002780626832321965, "loss": 0.0305, "step": 56420 }, { "epoch": 0.15, "learning_rate": 0.000278058795015825, "loss": 0.0438, "step": 56430 }, { "epoch": 0.15, "learning_rate": 0.0002780549067994535, "loss": 0.0279, "step": 56440 }, { "epoch": 0.15, "learning_rate": 0.0002780510185830821, "loss": 0.0401, "step": 56450 }, { "epoch": 0.15, "learning_rate": 0.00027804713036671066, "loss": 0.0323, "step": 56460 }, { "epoch": 0.15, "learning_rate": 0.0002780432421503392, "loss": 0.0336, "step": 56470 }, { "epoch": 0.15, "learning_rate": 0.0002780393539339677, "loss": 0.0274, "step": 56480 }, { "epoch": 0.15, "learning_rate": 0.0002780354657175962, "loss": 0.0306, "step": 56490 }, { "epoch": 0.15, "learning_rate": 0.0002780315775012248, "loss": 0.0284, "step": 56500 }, { "epoch": 0.15, "learning_rate": 0.0002780276892848533, "loss": 0.0277, "step": 56510 }, { "epoch": 0.15, "learning_rate": 0.00027802380106848186, "loss": 0.0322, "step": 56520 }, { "epoch": 0.15, "learning_rate": 0.00027801991285211037, "loss": 0.0315, "step": 56530 }, { "epoch": 0.15, "learning_rate": 0.00027801602463573894, "loss": 0.0295, "step": 56540 }, { "epoch": 0.15, "learning_rate": 0.00027801213641936745, "loss": 0.026, "step": 56550 }, { "epoch": 0.15, "learning_rate": 0.00027800824820299597, "loss": 0.0237, "step": 56560 }, { "epoch": 0.15, "learning_rate": 0.0002780043599866245, "loss": 0.0287, "step": 56570 }, { "epoch": 0.15, "learning_rate": 0.00027800047177025305, "loss": 0.0281, "step": 56580 }, { "epoch": 0.15, "learning_rate": 0.00027799658355388157, "loss": 0.024, "step": 56590 }, { "epoch": 0.15, "learning_rate": 0.00027799269533751014, "loss": 0.0312, "step": 56600 }, { "epoch": 0.15, "learning_rate": 0.00027798880712113865, "loss": 0.0261, "step": 56610 }, { "epoch": 0.15, "learning_rate": 0.00027798491890476716, "loss": 0.0261, "step": 56620 }, { "epoch": 0.15, "learning_rate": 0.00027798103068839573, "loss": 0.0282, "step": 56630 }, { "epoch": 0.15, "learning_rate": 0.00027797714247202425, "loss": 0.03, "step": 56640 }, { "epoch": 0.15, "learning_rate": 0.00027797325425565276, "loss": 0.0283, "step": 56650 }, { "epoch": 0.15, "learning_rate": 0.00027796936603928133, "loss": 0.0225, "step": 56660 }, { "epoch": 0.15, "learning_rate": 0.0002779654778229099, "loss": 0.0279, "step": 56670 }, { "epoch": 0.15, "learning_rate": 0.0002779615896065384, "loss": 0.0243, "step": 56680 }, { "epoch": 0.15, "learning_rate": 0.00027795770139016693, "loss": 0.0286, "step": 56690 }, { "epoch": 0.15, "learning_rate": 0.00027795381317379544, "loss": 0.0258, "step": 56700 }, { "epoch": 0.15, "learning_rate": 0.000277949924957424, "loss": 0.0305, "step": 56710 }, { "epoch": 0.15, "learning_rate": 0.00027794603674105253, "loss": 0.0384, "step": 56720 }, { "epoch": 0.15, "learning_rate": 0.0002779421485246811, "loss": 0.0287, "step": 56730 }, { "epoch": 0.15, "learning_rate": 0.0002779382603083096, "loss": 0.0336, "step": 56740 }, { "epoch": 0.15, "learning_rate": 0.0002779343720919382, "loss": 0.0268, "step": 56750 }, { "epoch": 0.15, "learning_rate": 0.0002779304838755667, "loss": 0.0294, "step": 56760 }, { "epoch": 0.15, "learning_rate": 0.0002779265956591952, "loss": 0.0268, "step": 56770 }, { "epoch": 0.15, "learning_rate": 0.0002779227074428237, "loss": 0.0287, "step": 56780 }, { "epoch": 0.15, "learning_rate": 0.0002779188192264523, "loss": 0.0226, "step": 56790 }, { "epoch": 0.15, "learning_rate": 0.0002779149310100808, "loss": 0.0305, "step": 56800 }, { "epoch": 0.15, "learning_rate": 0.0002779110427937094, "loss": 0.0281, "step": 56810 }, { "epoch": 0.15, "learning_rate": 0.0002779071545773379, "loss": 0.0256, "step": 56820 }, { "epoch": 0.15, "learning_rate": 0.0002779032663609664, "loss": 0.0229, "step": 56830 }, { "epoch": 0.15, "learning_rate": 0.00027789937814459497, "loss": 0.0258, "step": 56840 }, { "epoch": 0.15, "learning_rate": 0.0002778954899282235, "loss": 0.0283, "step": 56850 }, { "epoch": 0.15, "learning_rate": 0.00027789160171185206, "loss": 0.0366, "step": 56860 }, { "epoch": 0.15, "learning_rate": 0.00027788771349548057, "loss": 0.0334, "step": 56870 }, { "epoch": 0.15, "learning_rate": 0.00027788382527910914, "loss": 0.0329, "step": 56880 }, { "epoch": 0.15, "learning_rate": 0.00027787993706273765, "loss": 0.0277, "step": 56890 }, { "epoch": 0.15, "learning_rate": 0.00027787604884636617, "loss": 0.0304, "step": 56900 }, { "epoch": 0.15, "learning_rate": 0.0002778721606299947, "loss": 0.0268, "step": 56910 }, { "epoch": 0.15, "learning_rate": 0.00027786827241362325, "loss": 0.0311, "step": 56920 }, { "epoch": 0.15, "learning_rate": 0.00027786438419725177, "loss": 0.0267, "step": 56930 }, { "epoch": 0.15, "learning_rate": 0.00027786049598088033, "loss": 0.0317, "step": 56940 }, { "epoch": 0.15, "learning_rate": 0.00027785660776450885, "loss": 0.0263, "step": 56950 }, { "epoch": 0.15, "learning_rate": 0.0002778527195481374, "loss": 0.0246, "step": 56960 }, { "epoch": 0.15, "learning_rate": 0.00027784883133176593, "loss": 0.029, "step": 56970 }, { "epoch": 0.15, "learning_rate": 0.00027784494311539445, "loss": 0.0297, "step": 56980 }, { "epoch": 0.15, "learning_rate": 0.00027784105489902296, "loss": 0.0256, "step": 56990 }, { "epoch": 0.15, "learning_rate": 0.00027783716668265153, "loss": 0.0255, "step": 57000 }, { "epoch": 0.15, "eval_cer": 0.8818160569148363, "eval_loss": 0.019956447184085846, "eval_runtime": 108.1102, "eval_samples_per_second": 18.5, "eval_steps_per_second": 4.625, "step": 57000 }, { "epoch": 0.15, "learning_rate": 0.0002778332784662801, "loss": 0.0228, "step": 57010 }, { "epoch": 0.15, "learning_rate": 0.0002778293902499086, "loss": 0.0259, "step": 57020 }, { "epoch": 0.15, "learning_rate": 0.00027782550203353713, "loss": 0.0268, "step": 57030 }, { "epoch": 0.15, "learning_rate": 0.0002778216138171657, "loss": 0.0231, "step": 57040 }, { "epoch": 0.15, "learning_rate": 0.0002778177256007942, "loss": 0.0226, "step": 57050 }, { "epoch": 0.15, "learning_rate": 0.0002778138373844227, "loss": 0.0271, "step": 57060 }, { "epoch": 0.15, "learning_rate": 0.0002778099491680513, "loss": 0.025, "step": 57070 }, { "epoch": 0.15, "learning_rate": 0.0002778060609516798, "loss": 0.0199, "step": 57080 }, { "epoch": 0.15, "learning_rate": 0.0002778021727353084, "loss": 0.0268, "step": 57090 }, { "epoch": 0.15, "learning_rate": 0.0002777982845189369, "loss": 0.0276, "step": 57100 }, { "epoch": 0.15, "learning_rate": 0.0002777943963025654, "loss": 0.0268, "step": 57110 }, { "epoch": 0.15, "learning_rate": 0.0002777905080861939, "loss": 0.0247, "step": 57120 }, { "epoch": 0.15, "learning_rate": 0.0002777866198698225, "loss": 0.0251, "step": 57130 }, { "epoch": 0.15, "learning_rate": 0.000277782731653451, "loss": 0.0292, "step": 57140 }, { "epoch": 0.15, "learning_rate": 0.0002777788434370796, "loss": 0.0312, "step": 57150 }, { "epoch": 0.15, "learning_rate": 0.0002777749552207081, "loss": 0.0261, "step": 57160 }, { "epoch": 0.15, "learning_rate": 0.00027777106700433666, "loss": 0.0274, "step": 57170 }, { "epoch": 0.15, "learning_rate": 0.00027776717878796517, "loss": 0.0243, "step": 57180 }, { "epoch": 0.15, "learning_rate": 0.0002777632905715937, "loss": 0.0315, "step": 57190 }, { "epoch": 0.15, "learning_rate": 0.0002777594023552222, "loss": 0.0331, "step": 57200 }, { "epoch": 0.15, "learning_rate": 0.00027775551413885077, "loss": 0.028, "step": 57210 }, { "epoch": 0.15, "learning_rate": 0.00027775162592247934, "loss": 0.0277, "step": 57220 }, { "epoch": 0.15, "learning_rate": 0.00027774773770610785, "loss": 0.0275, "step": 57230 }, { "epoch": 0.15, "learning_rate": 0.00027774384948973637, "loss": 0.0303, "step": 57240 }, { "epoch": 0.15, "learning_rate": 0.00027773996127336494, "loss": 0.0311, "step": 57250 }, { "epoch": 0.15, "learning_rate": 0.00027773607305699345, "loss": 0.0248, "step": 57260 }, { "epoch": 0.15, "learning_rate": 0.00027773218484062196, "loss": 0.0287, "step": 57270 }, { "epoch": 0.15, "learning_rate": 0.00027772829662425053, "loss": 0.0336, "step": 57280 }, { "epoch": 0.15, "learning_rate": 0.00027772440840787905, "loss": 0.0283, "step": 57290 }, { "epoch": 0.15, "learning_rate": 0.0002777205201915076, "loss": 0.0257, "step": 57300 }, { "epoch": 0.15, "learning_rate": 0.00027771663197513613, "loss": 0.0238, "step": 57310 }, { "epoch": 0.15, "learning_rate": 0.00027771274375876465, "loss": 0.028, "step": 57320 }, { "epoch": 0.15, "learning_rate": 0.00027770885554239316, "loss": 0.0286, "step": 57330 }, { "epoch": 0.15, "learning_rate": 0.00027770496732602173, "loss": 0.0318, "step": 57340 }, { "epoch": 0.15, "learning_rate": 0.00027770107910965024, "loss": 0.0303, "step": 57350 }, { "epoch": 0.15, "learning_rate": 0.0002776971908932788, "loss": 0.0283, "step": 57360 }, { "epoch": 0.15, "learning_rate": 0.0002776933026769073, "loss": 0.0254, "step": 57370 }, { "epoch": 0.15, "learning_rate": 0.0002776894144605359, "loss": 0.0278, "step": 57380 }, { "epoch": 0.15, "learning_rate": 0.0002776855262441644, "loss": 0.0253, "step": 57390 }, { "epoch": 0.15, "learning_rate": 0.0002776816380277929, "loss": 0.03, "step": 57400 }, { "epoch": 0.15, "learning_rate": 0.0002776777498114215, "loss": 0.0273, "step": 57410 }, { "epoch": 0.15, "learning_rate": 0.00027767386159505, "loss": 0.0253, "step": 57420 }, { "epoch": 0.15, "learning_rate": 0.0002776699733786786, "loss": 0.0267, "step": 57430 }, { "epoch": 0.15, "learning_rate": 0.0002776660851623071, "loss": 0.0416, "step": 57440 }, { "epoch": 0.15, "learning_rate": 0.0002776621969459356, "loss": 0.0365, "step": 57450 }, { "epoch": 0.15, "learning_rate": 0.0002776583087295642, "loss": 0.0286, "step": 57460 }, { "epoch": 0.15, "learning_rate": 0.0002776544205131927, "loss": 0.0269, "step": 57470 }, { "epoch": 0.15, "learning_rate": 0.0002776505322968212, "loss": 0.0345, "step": 57480 }, { "epoch": 0.15, "learning_rate": 0.00027764664408044977, "loss": 0.0265, "step": 57490 }, { "epoch": 0.15, "learning_rate": 0.00027764275586407834, "loss": 0.0281, "step": 57500 }, { "epoch": 0.15, "learning_rate": 0.00027763886764770686, "loss": 0.0258, "step": 57510 }, { "epoch": 0.15, "learning_rate": 0.00027763497943133537, "loss": 0.0558, "step": 57520 }, { "epoch": 0.15, "learning_rate": 0.0002776310912149639, "loss": 0.0267, "step": 57530 }, { "epoch": 0.15, "learning_rate": 0.00027762720299859245, "loss": 0.0245, "step": 57540 }, { "epoch": 0.15, "learning_rate": 0.00027762331478222097, "loss": 0.0244, "step": 57550 }, { "epoch": 0.15, "learning_rate": 0.00027761942656584954, "loss": 0.0315, "step": 57560 }, { "epoch": 0.15, "learning_rate": 0.00027761553834947805, "loss": 0.0246, "step": 57570 }, { "epoch": 0.15, "learning_rate": 0.00027761165013310657, "loss": 0.0295, "step": 57580 }, { "epoch": 0.15, "learning_rate": 0.00027760776191673513, "loss": 0.0295, "step": 57590 }, { "epoch": 0.15, "learning_rate": 0.00027760387370036365, "loss": 0.0249, "step": 57600 }, { "epoch": 0.15, "learning_rate": 0.00027759998548399216, "loss": 0.0266, "step": 57610 }, { "epoch": 0.15, "learning_rate": 0.00027759609726762073, "loss": 0.0261, "step": 57620 }, { "epoch": 0.15, "learning_rate": 0.00027759220905124925, "loss": 0.0277, "step": 57630 }, { "epoch": 0.15, "learning_rate": 0.0002775883208348778, "loss": 0.0275, "step": 57640 }, { "epoch": 0.15, "learning_rate": 0.00027758443261850633, "loss": 0.0242, "step": 57650 }, { "epoch": 0.15, "learning_rate": 0.00027758054440213484, "loss": 0.0286, "step": 57660 }, { "epoch": 0.15, "learning_rate": 0.0002775766561857634, "loss": 0.0274, "step": 57670 }, { "epoch": 0.15, "learning_rate": 0.00027757276796939193, "loss": 0.0266, "step": 57680 }, { "epoch": 0.15, "learning_rate": 0.00027756887975302044, "loss": 0.0261, "step": 57690 }, { "epoch": 0.15, "learning_rate": 0.000277564991536649, "loss": 0.0243, "step": 57700 }, { "epoch": 0.15, "learning_rate": 0.0002775611033202776, "loss": 0.0273, "step": 57710 }, { "epoch": 0.15, "learning_rate": 0.0002775572151039061, "loss": 0.0258, "step": 57720 }, { "epoch": 0.15, "learning_rate": 0.0002775533268875346, "loss": 0.0257, "step": 57730 }, { "epoch": 0.15, "learning_rate": 0.0002775494386711631, "loss": 0.0265, "step": 57740 }, { "epoch": 0.15, "learning_rate": 0.0002775455504547917, "loss": 0.0281, "step": 57750 }, { "epoch": 0.15, "learning_rate": 0.0002775416622384202, "loss": 0.0263, "step": 57760 }, { "epoch": 0.15, "learning_rate": 0.0002775377740220488, "loss": 0.0285, "step": 57770 }, { "epoch": 0.15, "learning_rate": 0.0002775338858056773, "loss": 0.0228, "step": 57780 }, { "epoch": 0.15, "learning_rate": 0.00027752999758930586, "loss": 0.0251, "step": 57790 }, { "epoch": 0.15, "learning_rate": 0.0002775261093729344, "loss": 0.0255, "step": 57800 }, { "epoch": 0.15, "learning_rate": 0.0002775222211565629, "loss": 0.0277, "step": 57810 }, { "epoch": 0.15, "learning_rate": 0.0002775183329401914, "loss": 0.0368, "step": 57820 }, { "epoch": 0.15, "learning_rate": 0.00027751444472381997, "loss": 0.0335, "step": 57830 }, { "epoch": 0.15, "learning_rate": 0.0002775105565074485, "loss": 0.0301, "step": 57840 }, { "epoch": 0.15, "learning_rate": 0.00027750666829107705, "loss": 0.0249, "step": 57850 }, { "epoch": 0.15, "learning_rate": 0.00027750278007470557, "loss": 0.0249, "step": 57860 }, { "epoch": 0.15, "learning_rate": 0.0002774988918583341, "loss": 0.0253, "step": 57870 }, { "epoch": 0.15, "learning_rate": 0.00027749500364196265, "loss": 0.0253, "step": 57880 }, { "epoch": 0.15, "learning_rate": 0.00027749111542559117, "loss": 0.0274, "step": 57890 }, { "epoch": 0.15, "learning_rate": 0.00027748722720921974, "loss": 0.0368, "step": 57900 }, { "epoch": 0.15, "learning_rate": 0.00027748333899284825, "loss": 0.0268, "step": 57910 }, { "epoch": 0.15, "learning_rate": 0.0002774794507764768, "loss": 0.0258, "step": 57920 }, { "epoch": 0.15, "learning_rate": 0.00027747556256010533, "loss": 0.0239, "step": 57930 }, { "epoch": 0.15, "learning_rate": 0.00027747167434373385, "loss": 0.0275, "step": 57940 }, { "epoch": 0.15, "learning_rate": 0.00027746778612736236, "loss": 0.0253, "step": 57950 }, { "epoch": 0.15, "learning_rate": 0.00027746389791099093, "loss": 0.026, "step": 57960 }, { "epoch": 0.15, "learning_rate": 0.00027746000969461945, "loss": 0.0269, "step": 57970 }, { "epoch": 0.15, "learning_rate": 0.000277456121478248, "loss": 0.0267, "step": 57980 }, { "epoch": 0.15, "learning_rate": 0.00027745223326187653, "loss": 0.0265, "step": 57990 }, { "epoch": 0.15, "learning_rate": 0.0002774483450455051, "loss": 0.0277, "step": 58000 }, { "epoch": 0.15, "eval_cer": 0.881845449290454, "eval_loss": 0.01981378346681595, "eval_runtime": 107.9556, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.632, "step": 58000 }, { "epoch": 0.15, "learning_rate": 0.0002774444568291336, "loss": 0.0355, "step": 58010 }, { "epoch": 0.15, "learning_rate": 0.0002774405686127621, "loss": 0.028, "step": 58020 }, { "epoch": 0.15, "learning_rate": 0.00027743668039639064, "loss": 0.0293, "step": 58030 }, { "epoch": 0.15, "learning_rate": 0.0002774327921800192, "loss": 0.0288, "step": 58040 }, { "epoch": 0.15, "learning_rate": 0.0002774289039636478, "loss": 0.0322, "step": 58050 }, { "epoch": 0.15, "learning_rate": 0.0002774250157472763, "loss": 0.023, "step": 58060 }, { "epoch": 0.15, "learning_rate": 0.0002774211275309048, "loss": 0.0285, "step": 58070 }, { "epoch": 0.15, "learning_rate": 0.0002774172393145333, "loss": 0.031, "step": 58080 }, { "epoch": 0.15, "learning_rate": 0.0002774133510981619, "loss": 0.0254, "step": 58090 }, { "epoch": 0.15, "learning_rate": 0.0002774094628817904, "loss": 0.0268, "step": 58100 }, { "epoch": 0.15, "learning_rate": 0.000277405574665419, "loss": 0.0285, "step": 58110 }, { "epoch": 0.15, "learning_rate": 0.0002774016864490475, "loss": 0.0243, "step": 58120 }, { "epoch": 0.15, "learning_rate": 0.00027739779823267606, "loss": 0.025, "step": 58130 }, { "epoch": 0.15, "learning_rate": 0.00027739391001630457, "loss": 0.024, "step": 58140 }, { "epoch": 0.15, "learning_rate": 0.0002773900217999331, "loss": 0.0292, "step": 58150 }, { "epoch": 0.15, "learning_rate": 0.0002773861335835616, "loss": 0.0305, "step": 58160 }, { "epoch": 0.15, "learning_rate": 0.00027738224536719017, "loss": 0.0285, "step": 58170 }, { "epoch": 0.15, "learning_rate": 0.0002773783571508187, "loss": 0.0235, "step": 58180 }, { "epoch": 0.15, "learning_rate": 0.00027737446893444725, "loss": 0.0289, "step": 58190 }, { "epoch": 0.15, "learning_rate": 0.00027737058071807577, "loss": 0.0297, "step": 58200 }, { "epoch": 0.15, "learning_rate": 0.00027736669250170434, "loss": 0.0265, "step": 58210 }, { "epoch": 0.15, "learning_rate": 0.00027736280428533285, "loss": 0.0344, "step": 58220 }, { "epoch": 0.15, "learning_rate": 0.00027735891606896137, "loss": 0.0283, "step": 58230 }, { "epoch": 0.15, "learning_rate": 0.0002773550278525899, "loss": 0.0264, "step": 58240 }, { "epoch": 0.15, "learning_rate": 0.00027735113963621845, "loss": 0.0321, "step": 58250 }, { "epoch": 0.15, "learning_rate": 0.000277347251419847, "loss": 0.0273, "step": 58260 }, { "epoch": 0.15, "learning_rate": 0.00027734336320347553, "loss": 0.0232, "step": 58270 }, { "epoch": 0.15, "learning_rate": 0.00027733947498710405, "loss": 0.0315, "step": 58280 }, { "epoch": 0.15, "learning_rate": 0.0002773355867707326, "loss": 0.0298, "step": 58290 }, { "epoch": 0.15, "learning_rate": 0.00027733169855436113, "loss": 0.0253, "step": 58300 }, { "epoch": 0.15, "learning_rate": 0.00027732781033798964, "loss": 0.0244, "step": 58310 }, { "epoch": 0.15, "learning_rate": 0.0002773239221216182, "loss": 0.022, "step": 58320 }, { "epoch": 0.15, "learning_rate": 0.00027732003390524673, "loss": 0.0304, "step": 58330 }, { "epoch": 0.15, "learning_rate": 0.0002773161456888753, "loss": 0.025, "step": 58340 }, { "epoch": 0.15, "learning_rate": 0.0002773122574725038, "loss": 0.0272, "step": 58350 }, { "epoch": 0.15, "learning_rate": 0.0002773083692561323, "loss": 0.0251, "step": 58360 }, { "epoch": 0.15, "learning_rate": 0.00027730448103976084, "loss": 0.0292, "step": 58370 }, { "epoch": 0.15, "learning_rate": 0.0002773005928233894, "loss": 0.0281, "step": 58380 }, { "epoch": 0.15, "learning_rate": 0.0002772967046070179, "loss": 0.0314, "step": 58390 }, { "epoch": 0.15, "learning_rate": 0.0002772928163906465, "loss": 0.0265, "step": 58400 }, { "epoch": 0.15, "learning_rate": 0.000277288928174275, "loss": 0.0289, "step": 58410 }, { "epoch": 0.15, "learning_rate": 0.0002772850399579036, "loss": 0.0273, "step": 58420 }, { "epoch": 0.15, "learning_rate": 0.0002772811517415321, "loss": 0.0215, "step": 58430 }, { "epoch": 0.15, "learning_rate": 0.0002772772635251606, "loss": 0.0237, "step": 58440 }, { "epoch": 0.15, "learning_rate": 0.0002772733753087892, "loss": 0.0271, "step": 58450 }, { "epoch": 0.15, "learning_rate": 0.0002772694870924177, "loss": 0.0295, "step": 58460 }, { "epoch": 0.15, "learning_rate": 0.00027726559887604626, "loss": 0.0223, "step": 58470 }, { "epoch": 0.15, "learning_rate": 0.00027726171065967477, "loss": 0.0261, "step": 58480 }, { "epoch": 0.15, "learning_rate": 0.0002772578224433033, "loss": 0.0266, "step": 58490 }, { "epoch": 0.15, "learning_rate": 0.00027725393422693185, "loss": 0.0265, "step": 58500 }, { "epoch": 0.15, "learning_rate": 0.00027725004601056037, "loss": 0.0318, "step": 58510 }, { "epoch": 0.15, "learning_rate": 0.0002772461577941889, "loss": 0.0267, "step": 58520 }, { "epoch": 0.15, "learning_rate": 0.00027724226957781745, "loss": 0.027, "step": 58530 }, { "epoch": 0.15, "learning_rate": 0.00027723838136144597, "loss": 0.0265, "step": 58540 }, { "epoch": 0.15, "learning_rate": 0.00027723449314507454, "loss": 0.0267, "step": 58550 }, { "epoch": 0.15, "learning_rate": 0.00027723060492870305, "loss": 0.0196, "step": 58560 }, { "epoch": 0.15, "learning_rate": 0.00027722671671233156, "loss": 0.0299, "step": 58570 }, { "epoch": 0.15, "learning_rate": 0.0002772228284959601, "loss": 0.0221, "step": 58580 }, { "epoch": 0.15, "learning_rate": 0.00027721894027958865, "loss": 0.0315, "step": 58590 }, { "epoch": 0.15, "learning_rate": 0.0002772150520632172, "loss": 0.0251, "step": 58600 }, { "epoch": 0.15, "learning_rate": 0.00027721116384684573, "loss": 0.0281, "step": 58610 }, { "epoch": 0.15, "learning_rate": 0.00027720727563047425, "loss": 0.0292, "step": 58620 }, { "epoch": 0.15, "learning_rate": 0.0002772033874141028, "loss": 0.0258, "step": 58630 }, { "epoch": 0.15, "learning_rate": 0.00027719949919773133, "loss": 0.0275, "step": 58640 }, { "epoch": 0.15, "learning_rate": 0.00027719561098135984, "loss": 0.0281, "step": 58650 }, { "epoch": 0.15, "learning_rate": 0.0002771917227649884, "loss": 0.0288, "step": 58660 }, { "epoch": 0.15, "learning_rate": 0.0002771878345486169, "loss": 0.0264, "step": 58670 }, { "epoch": 0.15, "learning_rate": 0.0002771839463322455, "loss": 0.0291, "step": 58680 }, { "epoch": 0.15, "learning_rate": 0.000277180058115874, "loss": 0.0261, "step": 58690 }, { "epoch": 0.15, "learning_rate": 0.0002771761698995025, "loss": 0.0267, "step": 58700 }, { "epoch": 0.15, "learning_rate": 0.0002771722816831311, "loss": 0.0273, "step": 58710 }, { "epoch": 0.15, "learning_rate": 0.0002771683934667596, "loss": 0.0261, "step": 58720 }, { "epoch": 0.15, "learning_rate": 0.0002771645052503881, "loss": 0.0251, "step": 58730 }, { "epoch": 0.15, "learning_rate": 0.0002771606170340167, "loss": 0.0278, "step": 58740 }, { "epoch": 0.15, "learning_rate": 0.00027715672881764526, "loss": 0.0247, "step": 58750 }, { "epoch": 0.15, "learning_rate": 0.0002771528406012738, "loss": 0.0295, "step": 58760 }, { "epoch": 0.15, "learning_rate": 0.0002771489523849023, "loss": 0.0252, "step": 58770 }, { "epoch": 0.15, "learning_rate": 0.0002771450641685308, "loss": 0.0308, "step": 58780 }, { "epoch": 0.15, "learning_rate": 0.00027714117595215937, "loss": 0.0279, "step": 58790 }, { "epoch": 0.15, "learning_rate": 0.0002771372877357879, "loss": 0.0316, "step": 58800 }, { "epoch": 0.15, "learning_rate": 0.00027713339951941646, "loss": 0.0331, "step": 58810 }, { "epoch": 0.15, "learning_rate": 0.00027712951130304497, "loss": 0.0241, "step": 58820 }, { "epoch": 0.15, "learning_rate": 0.0002771256230866735, "loss": 0.0315, "step": 58830 }, { "epoch": 0.15, "learning_rate": 0.00027712173487030205, "loss": 0.0278, "step": 58840 }, { "epoch": 0.15, "learning_rate": 0.00027711784665393057, "loss": 0.0322, "step": 58850 }, { "epoch": 0.15, "learning_rate": 0.0002771139584375591, "loss": 0.0269, "step": 58860 }, { "epoch": 0.15, "learning_rate": 0.00027711007022118765, "loss": 0.0257, "step": 58870 }, { "epoch": 0.15, "learning_rate": 0.00027710618200481617, "loss": 0.0303, "step": 58880 }, { "epoch": 0.15, "learning_rate": 0.00027710229378844473, "loss": 0.0245, "step": 58890 }, { "epoch": 0.15, "learning_rate": 0.00027709840557207325, "loss": 0.0301, "step": 58900 }, { "epoch": 0.15, "learning_rate": 0.00027709451735570176, "loss": 0.0221, "step": 58910 }, { "epoch": 0.15, "learning_rate": 0.00027709062913933033, "loss": 0.0262, "step": 58920 }, { "epoch": 0.15, "learning_rate": 0.00027708674092295885, "loss": 0.0275, "step": 58930 }, { "epoch": 0.15, "learning_rate": 0.00027708285270658736, "loss": 0.0291, "step": 58940 }, { "epoch": 0.15, "learning_rate": 0.00027707896449021593, "loss": 0.031, "step": 58950 }, { "epoch": 0.15, "learning_rate": 0.0002770750762738445, "loss": 0.0265, "step": 58960 }, { "epoch": 0.15, "learning_rate": 0.000277071188057473, "loss": 0.0246, "step": 58970 }, { "epoch": 0.15, "learning_rate": 0.00027706729984110153, "loss": 0.0278, "step": 58980 }, { "epoch": 0.15, "learning_rate": 0.00027706341162473004, "loss": 0.031, "step": 58990 }, { "epoch": 0.15, "learning_rate": 0.0002770595234083586, "loss": 0.0268, "step": 59000 }, { "epoch": 0.15, "eval_cer": 0.8817992612716261, "eval_loss": 0.0200749970972538, "eval_runtime": 108.3189, "eval_samples_per_second": 18.464, "eval_steps_per_second": 4.616, "step": 59000 }, { "epoch": 0.15, "learning_rate": 0.0002770556351919871, "loss": 0.0253, "step": 59010 }, { "epoch": 0.15, "learning_rate": 0.0002770517469756157, "loss": 0.0222, "step": 59020 }, { "epoch": 0.15, "learning_rate": 0.0002770478587592442, "loss": 0.0317, "step": 59030 }, { "epoch": 0.15, "learning_rate": 0.0002770439705428728, "loss": 0.0278, "step": 59040 }, { "epoch": 0.15, "learning_rate": 0.0002770400823265013, "loss": 0.027, "step": 59050 }, { "epoch": 0.15, "learning_rate": 0.0002770361941101298, "loss": 0.0349, "step": 59060 }, { "epoch": 0.15, "learning_rate": 0.0002770323058937583, "loss": 0.0242, "step": 59070 }, { "epoch": 0.15, "learning_rate": 0.0002770284176773869, "loss": 0.0218, "step": 59080 }, { "epoch": 0.15, "learning_rate": 0.00027702452946101546, "loss": 0.0219, "step": 59090 }, { "epoch": 0.15, "learning_rate": 0.000277020641244644, "loss": 0.0258, "step": 59100 }, { "epoch": 0.15, "learning_rate": 0.0002770167530282725, "loss": 0.03, "step": 59110 }, { "epoch": 0.15, "learning_rate": 0.000277012864811901, "loss": 0.0311, "step": 59120 }, { "epoch": 0.15, "learning_rate": 0.00027700897659552957, "loss": 0.0279, "step": 59130 }, { "epoch": 0.15, "learning_rate": 0.0002770050883791581, "loss": 0.0255, "step": 59140 }, { "epoch": 0.15, "learning_rate": 0.00027700120016278665, "loss": 0.0285, "step": 59150 }, { "epoch": 0.15, "learning_rate": 0.00027699731194641517, "loss": 0.0235, "step": 59160 }, { "epoch": 0.15, "learning_rate": 0.00027699342373004374, "loss": 0.0264, "step": 59170 }, { "epoch": 0.15, "learning_rate": 0.00027698953551367225, "loss": 0.035, "step": 59180 }, { "epoch": 0.15, "learning_rate": 0.00027698564729730077, "loss": 0.0274, "step": 59190 }, { "epoch": 0.15, "learning_rate": 0.0002769817590809293, "loss": 0.0267, "step": 59200 }, { "epoch": 0.15, "learning_rate": 0.00027697787086455785, "loss": 0.0358, "step": 59210 }, { "epoch": 0.15, "learning_rate": 0.00027697398264818636, "loss": 0.0288, "step": 59220 }, { "epoch": 0.15, "learning_rate": 0.00027697009443181493, "loss": 0.0429, "step": 59230 }, { "epoch": 0.15, "learning_rate": 0.00027696620621544345, "loss": 0.026, "step": 59240 }, { "epoch": 0.15, "learning_rate": 0.000276962317999072, "loss": 0.0264, "step": 59250 }, { "epoch": 0.15, "learning_rate": 0.00027695842978270053, "loss": 0.0238, "step": 59260 }, { "epoch": 0.15, "learning_rate": 0.00027695454156632905, "loss": 0.0304, "step": 59270 }, { "epoch": 0.15, "learning_rate": 0.00027695065334995756, "loss": 0.0257, "step": 59280 }, { "epoch": 0.15, "learning_rate": 0.00027694676513358613, "loss": 0.0252, "step": 59290 }, { "epoch": 0.15, "learning_rate": 0.0002769428769172147, "loss": 0.0239, "step": 59300 }, { "epoch": 0.15, "learning_rate": 0.0002769389887008432, "loss": 0.0357, "step": 59310 }, { "epoch": 0.15, "learning_rate": 0.0002769351004844717, "loss": 0.0269, "step": 59320 }, { "epoch": 0.15, "learning_rate": 0.00027693121226810024, "loss": 0.028, "step": 59330 }, { "epoch": 0.15, "learning_rate": 0.0002769273240517288, "loss": 0.0247, "step": 59340 }, { "epoch": 0.15, "learning_rate": 0.0002769234358353573, "loss": 0.0244, "step": 59350 }, { "epoch": 0.15, "learning_rate": 0.0002769195476189859, "loss": 0.0275, "step": 59360 }, { "epoch": 0.15, "learning_rate": 0.0002769156594026144, "loss": 0.027, "step": 59370 }, { "epoch": 0.15, "learning_rate": 0.000276911771186243, "loss": 0.0288, "step": 59380 }, { "epoch": 0.15, "learning_rate": 0.0002769078829698715, "loss": 0.0224, "step": 59390 }, { "epoch": 0.15, "learning_rate": 0.0002769039947535, "loss": 0.0296, "step": 59400 }, { "epoch": 0.15, "learning_rate": 0.0002769001065371285, "loss": 0.0206, "step": 59410 }, { "epoch": 0.15, "learning_rate": 0.0002768962183207571, "loss": 0.0241, "step": 59420 }, { "epoch": 0.15, "learning_rate": 0.0002768923301043856, "loss": 0.0233, "step": 59430 }, { "epoch": 0.15, "learning_rate": 0.00027688844188801417, "loss": 0.0301, "step": 59440 }, { "epoch": 0.15, "learning_rate": 0.0002768845536716427, "loss": 0.0383, "step": 59450 }, { "epoch": 0.15, "learning_rate": 0.00027688066545527126, "loss": 0.0316, "step": 59460 }, { "epoch": 0.15, "learning_rate": 0.00027687677723889977, "loss": 0.0251, "step": 59470 }, { "epoch": 0.15, "learning_rate": 0.0002768728890225283, "loss": 0.0253, "step": 59480 }, { "epoch": 0.15, "learning_rate": 0.00027686900080615685, "loss": 0.0246, "step": 59490 }, { "epoch": 0.15, "learning_rate": 0.00027686511258978537, "loss": 0.0247, "step": 59500 }, { "epoch": 0.15, "learning_rate": 0.00027686122437341394, "loss": 0.0303, "step": 59510 }, { "epoch": 0.15, "learning_rate": 0.00027685733615704245, "loss": 0.0277, "step": 59520 }, { "epoch": 0.15, "learning_rate": 0.00027685344794067097, "loss": 0.032, "step": 59530 }, { "epoch": 0.15, "learning_rate": 0.00027684955972429953, "loss": 0.0234, "step": 59540 }, { "epoch": 0.15, "learning_rate": 0.00027684567150792805, "loss": 0.026, "step": 59550 }, { "epoch": 0.15, "learning_rate": 0.00027684178329155656, "loss": 0.0293, "step": 59560 }, { "epoch": 0.15, "learning_rate": 0.00027683789507518513, "loss": 0.0252, "step": 59570 }, { "epoch": 0.15, "learning_rate": 0.00027683400685881365, "loss": 0.0272, "step": 59580 }, { "epoch": 0.15, "learning_rate": 0.0002768301186424422, "loss": 0.0248, "step": 59590 }, { "epoch": 0.15, "learning_rate": 0.00027682623042607073, "loss": 0.0325, "step": 59600 }, { "epoch": 0.15, "learning_rate": 0.00027682234220969924, "loss": 0.0271, "step": 59610 }, { "epoch": 0.15, "learning_rate": 0.00027681845399332776, "loss": 0.0263, "step": 59620 }, { "epoch": 0.15, "learning_rate": 0.00027681456577695633, "loss": 0.0285, "step": 59630 }, { "epoch": 0.15, "learning_rate": 0.0002768106775605849, "loss": 0.0295, "step": 59640 }, { "epoch": 0.15, "learning_rate": 0.0002768067893442134, "loss": 0.0252, "step": 59650 }, { "epoch": 0.15, "learning_rate": 0.0002768029011278419, "loss": 0.0303, "step": 59660 }, { "epoch": 0.15, "learning_rate": 0.0002767990129114705, "loss": 0.0281, "step": 59670 }, { "epoch": 0.15, "learning_rate": 0.000276795124695099, "loss": 0.0277, "step": 59680 }, { "epoch": 0.15, "learning_rate": 0.0002767912364787275, "loss": 0.0271, "step": 59690 }, { "epoch": 0.15, "learning_rate": 0.0002767873482623561, "loss": 0.0294, "step": 59700 }, { "epoch": 0.15, "learning_rate": 0.0002767834600459846, "loss": 0.0227, "step": 59710 }, { "epoch": 0.15, "learning_rate": 0.0002767795718296132, "loss": 0.0233, "step": 59720 }, { "epoch": 0.15, "learning_rate": 0.0002767756836132417, "loss": 0.0245, "step": 59730 }, { "epoch": 0.15, "learning_rate": 0.0002767717953968702, "loss": 0.0296, "step": 59740 }, { "epoch": 0.15, "learning_rate": 0.0002767679071804988, "loss": 0.0276, "step": 59750 }, { "epoch": 0.15, "learning_rate": 0.0002767640189641273, "loss": 0.0249, "step": 59760 }, { "epoch": 0.15, "learning_rate": 0.0002767601307477558, "loss": 0.0292, "step": 59770 }, { "epoch": 0.15, "learning_rate": 0.00027675624253138437, "loss": 0.0272, "step": 59780 }, { "epoch": 0.15, "learning_rate": 0.00027675235431501294, "loss": 0.0258, "step": 59790 }, { "epoch": 0.16, "learning_rate": 0.00027674846609864145, "loss": 0.0257, "step": 59800 }, { "epoch": 0.16, "learning_rate": 0.00027674457788226997, "loss": 0.0243, "step": 59810 }, { "epoch": 0.16, "learning_rate": 0.0002767406896658985, "loss": 0.026, "step": 59820 }, { "epoch": 0.16, "learning_rate": 0.000276736801449527, "loss": 0.0263, "step": 59830 }, { "epoch": 0.16, "learning_rate": 0.00027673291323315557, "loss": 0.0296, "step": 59840 }, { "epoch": 0.16, "learning_rate": 0.00027672902501678414, "loss": 0.0266, "step": 59850 }, { "epoch": 0.16, "learning_rate": 0.00027672513680041265, "loss": 0.0276, "step": 59860 }, { "epoch": 0.16, "learning_rate": 0.00027672124858404116, "loss": 0.0268, "step": 59870 }, { "epoch": 0.16, "learning_rate": 0.00027671736036766973, "loss": 0.0285, "step": 59880 }, { "epoch": 0.16, "learning_rate": 0.00027671347215129825, "loss": 0.026, "step": 59890 }, { "epoch": 0.16, "learning_rate": 0.00027670958393492676, "loss": 0.0262, "step": 59900 }, { "epoch": 0.16, "learning_rate": 0.00027670569571855533, "loss": 0.0349, "step": 59910 }, { "epoch": 0.16, "learning_rate": 0.00027670180750218385, "loss": 0.0277, "step": 59920 }, { "epoch": 0.16, "learning_rate": 0.0002766979192858124, "loss": 0.0278, "step": 59930 }, { "epoch": 0.16, "learning_rate": 0.00027669403106944093, "loss": 0.0327, "step": 59940 }, { "epoch": 0.16, "learning_rate": 0.00027669014285306944, "loss": 0.0287, "step": 59950 }, { "epoch": 0.16, "learning_rate": 0.000276686254636698, "loss": 0.0251, "step": 59960 }, { "epoch": 0.16, "learning_rate": 0.0002766823664203265, "loss": 0.0294, "step": 59970 }, { "epoch": 0.16, "learning_rate": 0.00027667847820395504, "loss": 0.0298, "step": 59980 }, { "epoch": 0.16, "learning_rate": 0.0002766745899875836, "loss": 0.0255, "step": 59990 }, { "epoch": 0.16, "learning_rate": 0.0002766707017712122, "loss": 0.0276, "step": 60000 }, { "epoch": 0.16, "eval_cer": 0.8818426500165857, "eval_loss": 0.01959504745900631, "eval_runtime": 108.0446, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 60000 }, { "epoch": 0.16, "learning_rate": 0.0002766668135548407, "loss": 0.0247, "step": 60010 }, { "epoch": 0.16, "learning_rate": 0.0002766629253384692, "loss": 0.0283, "step": 60020 }, { "epoch": 0.16, "learning_rate": 0.0002766590371220977, "loss": 0.0262, "step": 60030 }, { "epoch": 0.16, "learning_rate": 0.0002766551489057263, "loss": 0.0234, "step": 60040 }, { "epoch": 0.16, "learning_rate": 0.0002766512606893548, "loss": 0.0299, "step": 60050 }, { "epoch": 0.16, "learning_rate": 0.0002766473724729834, "loss": 0.0319, "step": 60060 }, { "epoch": 0.16, "learning_rate": 0.0002766434842566119, "loss": 0.0294, "step": 60070 }, { "epoch": 0.16, "learning_rate": 0.0002766395960402404, "loss": 0.027, "step": 60080 }, { "epoch": 0.16, "learning_rate": 0.00027663570782386897, "loss": 0.0289, "step": 60090 }, { "epoch": 0.16, "learning_rate": 0.0002766318196074975, "loss": 0.0263, "step": 60100 }, { "epoch": 0.16, "learning_rate": 0.000276627931391126, "loss": 0.0258, "step": 60110 }, { "epoch": 0.16, "learning_rate": 0.00027662404317475457, "loss": 0.0313, "step": 60120 }, { "epoch": 0.16, "learning_rate": 0.0002766201549583831, "loss": 0.0317, "step": 60130 }, { "epoch": 0.16, "learning_rate": 0.00027661626674201165, "loss": 0.0316, "step": 60140 }, { "epoch": 0.16, "learning_rate": 0.00027661237852564017, "loss": 0.0224, "step": 60150 }, { "epoch": 0.16, "learning_rate": 0.0002766084903092687, "loss": 0.025, "step": 60160 }, { "epoch": 0.16, "learning_rate": 0.00027660460209289725, "loss": 0.0259, "step": 60170 }, { "epoch": 0.16, "learning_rate": 0.00027660071387652577, "loss": 0.0275, "step": 60180 }, { "epoch": 0.16, "learning_rate": 0.00027659682566015433, "loss": 0.0258, "step": 60190 }, { "epoch": 0.16, "learning_rate": 0.00027659293744378285, "loss": 0.0209, "step": 60200 }, { "epoch": 0.16, "learning_rate": 0.0002765890492274114, "loss": 0.0296, "step": 60210 }, { "epoch": 0.16, "learning_rate": 0.00027658516101103993, "loss": 0.0258, "step": 60220 }, { "epoch": 0.16, "learning_rate": 0.00027658127279466845, "loss": 0.0322, "step": 60230 }, { "epoch": 0.16, "learning_rate": 0.00027657738457829696, "loss": 0.0231, "step": 60240 }, { "epoch": 0.16, "learning_rate": 0.00027657349636192553, "loss": 0.0259, "step": 60250 }, { "epoch": 0.16, "learning_rate": 0.00027656960814555404, "loss": 0.0231, "step": 60260 }, { "epoch": 0.16, "learning_rate": 0.0002765657199291826, "loss": 0.0237, "step": 60270 }, { "epoch": 0.16, "learning_rate": 0.00027656183171281113, "loss": 0.0218, "step": 60280 }, { "epoch": 0.16, "learning_rate": 0.00027655794349643964, "loss": 0.0258, "step": 60290 }, { "epoch": 0.16, "learning_rate": 0.0002765540552800682, "loss": 0.0267, "step": 60300 }, { "epoch": 0.16, "learning_rate": 0.0002765501670636967, "loss": 0.0226, "step": 60310 }, { "epoch": 0.16, "learning_rate": 0.00027654627884732524, "loss": 0.0233, "step": 60320 }, { "epoch": 0.16, "learning_rate": 0.0002765423906309538, "loss": 0.0207, "step": 60330 }, { "epoch": 0.16, "learning_rate": 0.0002765385024145824, "loss": 0.0277, "step": 60340 }, { "epoch": 0.16, "learning_rate": 0.0002765346141982109, "loss": 0.0268, "step": 60350 }, { "epoch": 0.16, "learning_rate": 0.0002765307259818394, "loss": 0.0253, "step": 60360 }, { "epoch": 0.16, "learning_rate": 0.0002765268377654679, "loss": 0.0211, "step": 60370 }, { "epoch": 0.16, "learning_rate": 0.0002765229495490965, "loss": 0.0266, "step": 60380 }, { "epoch": 0.16, "learning_rate": 0.000276519061332725, "loss": 0.0229, "step": 60390 }, { "epoch": 0.16, "learning_rate": 0.0002765151731163536, "loss": 0.0271, "step": 60400 }, { "epoch": 0.16, "learning_rate": 0.0002765112848999821, "loss": 0.0263, "step": 60410 }, { "epoch": 0.16, "learning_rate": 0.00027650739668361066, "loss": 0.0251, "step": 60420 }, { "epoch": 0.16, "learning_rate": 0.00027650350846723917, "loss": 0.0364, "step": 60430 }, { "epoch": 0.16, "learning_rate": 0.0002764996202508677, "loss": 0.0299, "step": 60440 }, { "epoch": 0.16, "learning_rate": 0.0002764957320344962, "loss": 0.0271, "step": 60450 }, { "epoch": 0.16, "learning_rate": 0.00027649184381812477, "loss": 0.0295, "step": 60460 }, { "epoch": 0.16, "learning_rate": 0.0002764879556017533, "loss": 0.0292, "step": 60470 }, { "epoch": 0.16, "learning_rate": 0.00027648406738538185, "loss": 0.0293, "step": 60480 }, { "epoch": 0.16, "learning_rate": 0.00027648017916901037, "loss": 0.0244, "step": 60490 }, { "epoch": 0.16, "learning_rate": 0.00027647629095263894, "loss": 0.0296, "step": 60500 }, { "epoch": 0.16, "learning_rate": 0.00027647240273626745, "loss": 0.0283, "step": 60510 }, { "epoch": 0.16, "learning_rate": 0.00027646851451989596, "loss": 0.0242, "step": 60520 }, { "epoch": 0.16, "learning_rate": 0.0002764646263035245, "loss": 0.0274, "step": 60530 }, { "epoch": 0.16, "learning_rate": 0.00027646073808715305, "loss": 0.0298, "step": 60540 }, { "epoch": 0.16, "learning_rate": 0.0002764568498707816, "loss": 0.0303, "step": 60550 }, { "epoch": 0.16, "learning_rate": 0.00027645296165441013, "loss": 0.0305, "step": 60560 }, { "epoch": 0.16, "learning_rate": 0.00027644907343803865, "loss": 0.0231, "step": 60570 }, { "epoch": 0.16, "learning_rate": 0.00027644518522166716, "loss": 0.0301, "step": 60580 }, { "epoch": 0.16, "learning_rate": 0.00027644129700529573, "loss": 0.029, "step": 60590 }, { "epoch": 0.16, "learning_rate": 0.00027643740878892424, "loss": 0.0223, "step": 60600 }, { "epoch": 0.16, "learning_rate": 0.0002764335205725528, "loss": 0.0274, "step": 60610 }, { "epoch": 0.16, "learning_rate": 0.0002764296323561813, "loss": 0.0257, "step": 60620 }, { "epoch": 0.16, "learning_rate": 0.0002764257441398099, "loss": 0.0287, "step": 60630 }, { "epoch": 0.16, "learning_rate": 0.0002764218559234384, "loss": 0.0335, "step": 60640 }, { "epoch": 0.16, "learning_rate": 0.0002764179677070669, "loss": 0.025, "step": 60650 }, { "epoch": 0.16, "learning_rate": 0.00027641407949069544, "loss": 0.0271, "step": 60660 }, { "epoch": 0.16, "learning_rate": 0.000276410191274324, "loss": 0.0265, "step": 60670 }, { "epoch": 0.16, "learning_rate": 0.0002764063030579526, "loss": 0.0291, "step": 60680 }, { "epoch": 0.16, "learning_rate": 0.0002764024148415811, "loss": 0.0241, "step": 60690 }, { "epoch": 0.16, "learning_rate": 0.0002763985266252096, "loss": 0.0251, "step": 60700 }, { "epoch": 0.16, "learning_rate": 0.0002763946384088382, "loss": 0.0203, "step": 60710 }, { "epoch": 0.16, "learning_rate": 0.0002763907501924667, "loss": 0.0278, "step": 60720 }, { "epoch": 0.16, "learning_rate": 0.0002763868619760952, "loss": 0.0324, "step": 60730 }, { "epoch": 0.16, "learning_rate": 0.00027638297375972377, "loss": 0.0273, "step": 60740 }, { "epoch": 0.16, "learning_rate": 0.0002763790855433523, "loss": 0.0352, "step": 60750 }, { "epoch": 0.16, "learning_rate": 0.00027637519732698086, "loss": 0.0265, "step": 60760 }, { "epoch": 0.16, "learning_rate": 0.00027637130911060937, "loss": 0.0235, "step": 60770 }, { "epoch": 0.16, "learning_rate": 0.0002763674208942379, "loss": 0.0247, "step": 60780 }, { "epoch": 0.16, "learning_rate": 0.0002763635326778664, "loss": 0.0265, "step": 60790 }, { "epoch": 0.16, "learning_rate": 0.00027635964446149497, "loss": 0.0272, "step": 60800 }, { "epoch": 0.16, "learning_rate": 0.0002763557562451235, "loss": 0.0235, "step": 60810 }, { "epoch": 0.16, "learning_rate": 0.00027635186802875205, "loss": 0.0265, "step": 60820 }, { "epoch": 0.16, "learning_rate": 0.00027634797981238057, "loss": 0.0268, "step": 60830 }, { "epoch": 0.16, "learning_rate": 0.00027634409159600913, "loss": 0.0237, "step": 60840 }, { "epoch": 0.16, "learning_rate": 0.00027634020337963765, "loss": 0.0257, "step": 60850 }, { "epoch": 0.16, "learning_rate": 0.00027633631516326616, "loss": 0.0231, "step": 60860 }, { "epoch": 0.16, "learning_rate": 0.0002763324269468947, "loss": 0.0306, "step": 60870 }, { "epoch": 0.16, "learning_rate": 0.00027632853873052325, "loss": 0.0213, "step": 60880 }, { "epoch": 0.16, "learning_rate": 0.0002763246505141518, "loss": 0.0235, "step": 60890 }, { "epoch": 0.16, "learning_rate": 0.00027632076229778033, "loss": 0.021, "step": 60900 }, { "epoch": 0.16, "learning_rate": 0.00027631687408140884, "loss": 0.0308, "step": 60910 }, { "epoch": 0.16, "learning_rate": 0.0002763129858650374, "loss": 0.0208, "step": 60920 }, { "epoch": 0.16, "learning_rate": 0.00027630909764866593, "loss": 0.0252, "step": 60930 }, { "epoch": 0.16, "learning_rate": 0.00027630520943229444, "loss": 0.0225, "step": 60940 }, { "epoch": 0.16, "learning_rate": 0.000276301321215923, "loss": 0.0268, "step": 60950 }, { "epoch": 0.16, "learning_rate": 0.0002762974329995515, "loss": 0.0253, "step": 60960 }, { "epoch": 0.16, "learning_rate": 0.0002762935447831801, "loss": 0.0256, "step": 60970 }, { "epoch": 0.16, "learning_rate": 0.0002762896565668086, "loss": 0.0266, "step": 60980 }, { "epoch": 0.16, "learning_rate": 0.0002762857683504371, "loss": 0.0265, "step": 60990 }, { "epoch": 0.16, "learning_rate": 0.0002762818801340657, "loss": 0.0256, "step": 61000 }, { "epoch": 0.16, "eval_cer": 0.8818818398507428, "eval_loss": 0.01873914897441864, "eval_runtime": 107.4676, "eval_samples_per_second": 18.61, "eval_steps_per_second": 4.653, "step": 61000 }, { "epoch": 0.16, "learning_rate": 0.0002762779919176942, "loss": 0.0292, "step": 61010 }, { "epoch": 0.16, "learning_rate": 0.0002762741037013227, "loss": 0.0257, "step": 61020 }, { "epoch": 0.16, "learning_rate": 0.0002762702154849513, "loss": 0.0312, "step": 61030 }, { "epoch": 0.16, "learning_rate": 0.0002762663272685798, "loss": 0.0251, "step": 61040 }, { "epoch": 0.16, "learning_rate": 0.00027626243905220837, "loss": 0.0263, "step": 61050 }, { "epoch": 0.16, "learning_rate": 0.0002762585508358369, "loss": 0.023, "step": 61060 }, { "epoch": 0.16, "learning_rate": 0.0002762546626194654, "loss": 0.0265, "step": 61070 }, { "epoch": 0.16, "learning_rate": 0.00027625077440309397, "loss": 0.0332, "step": 61080 }, { "epoch": 0.16, "learning_rate": 0.0002762468861867225, "loss": 0.0207, "step": 61090 }, { "epoch": 0.16, "learning_rate": 0.00027624299797035105, "loss": 0.0291, "step": 61100 }, { "epoch": 0.16, "learning_rate": 0.00027623910975397957, "loss": 0.0322, "step": 61110 }, { "epoch": 0.16, "learning_rate": 0.0002762352215376081, "loss": 0.0253, "step": 61120 }, { "epoch": 0.16, "learning_rate": 0.00027623133332123665, "loss": 0.0258, "step": 61130 }, { "epoch": 0.16, "learning_rate": 0.00027622744510486517, "loss": 0.0297, "step": 61140 }, { "epoch": 0.16, "learning_rate": 0.0002762235568884937, "loss": 0.0251, "step": 61150 }, { "epoch": 0.16, "learning_rate": 0.00027621966867212225, "loss": 0.0242, "step": 61160 }, { "epoch": 0.16, "learning_rate": 0.00027621578045575076, "loss": 0.0253, "step": 61170 }, { "epoch": 0.16, "learning_rate": 0.00027621189223937933, "loss": 0.0224, "step": 61180 }, { "epoch": 0.16, "learning_rate": 0.00027620800402300785, "loss": 0.0306, "step": 61190 }, { "epoch": 0.16, "learning_rate": 0.00027620411580663636, "loss": 0.031, "step": 61200 }, { "epoch": 0.16, "learning_rate": 0.00027620022759026493, "loss": 0.0303, "step": 61210 }, { "epoch": 0.16, "learning_rate": 0.00027619633937389345, "loss": 0.0243, "step": 61220 }, { "epoch": 0.16, "learning_rate": 0.000276192451157522, "loss": 0.0259, "step": 61230 }, { "epoch": 0.16, "learning_rate": 0.00027618856294115053, "loss": 0.0276, "step": 61240 }, { "epoch": 0.16, "learning_rate": 0.0002761846747247791, "loss": 0.0316, "step": 61250 }, { "epoch": 0.16, "learning_rate": 0.0002761807865084076, "loss": 0.029, "step": 61260 }, { "epoch": 0.16, "learning_rate": 0.0002761768982920361, "loss": 0.0299, "step": 61270 }, { "epoch": 0.16, "learning_rate": 0.00027617301007566464, "loss": 0.0275, "step": 61280 }, { "epoch": 0.16, "learning_rate": 0.0002761691218592932, "loss": 0.0279, "step": 61290 }, { "epoch": 0.16, "learning_rate": 0.0002761652336429217, "loss": 0.0204, "step": 61300 }, { "epoch": 0.16, "learning_rate": 0.0002761613454265503, "loss": 0.034, "step": 61310 }, { "epoch": 0.16, "learning_rate": 0.0002761574572101788, "loss": 0.0285, "step": 61320 }, { "epoch": 0.16, "learning_rate": 0.0002761535689938073, "loss": 0.0228, "step": 61330 }, { "epoch": 0.16, "learning_rate": 0.0002761496807774359, "loss": 0.0285, "step": 61340 }, { "epoch": 0.16, "learning_rate": 0.0002761457925610644, "loss": 0.0247, "step": 61350 }, { "epoch": 0.16, "learning_rate": 0.0002761419043446929, "loss": 0.0285, "step": 61360 }, { "epoch": 0.16, "learning_rate": 0.0002761380161283215, "loss": 0.0313, "step": 61370 }, { "epoch": 0.16, "learning_rate": 0.00027613412791195006, "loss": 0.0329, "step": 61380 }, { "epoch": 0.16, "learning_rate": 0.00027613023969557857, "loss": 0.0258, "step": 61390 }, { "epoch": 0.16, "learning_rate": 0.0002761263514792071, "loss": 0.0229, "step": 61400 }, { "epoch": 0.16, "learning_rate": 0.0002761224632628356, "loss": 0.0275, "step": 61410 }, { "epoch": 0.16, "learning_rate": 0.00027611857504646417, "loss": 0.0273, "step": 61420 }, { "epoch": 0.16, "learning_rate": 0.0002761146868300927, "loss": 0.0265, "step": 61430 }, { "epoch": 0.16, "learning_rate": 0.00027611079861372125, "loss": 0.0336, "step": 61440 }, { "epoch": 0.16, "learning_rate": 0.00027610691039734977, "loss": 0.0306, "step": 61450 }, { "epoch": 0.16, "learning_rate": 0.00027610302218097834, "loss": 0.0322, "step": 61460 }, { "epoch": 0.16, "learning_rate": 0.00027609913396460685, "loss": 0.0274, "step": 61470 }, { "epoch": 0.16, "learning_rate": 0.00027609524574823537, "loss": 0.027, "step": 61480 }, { "epoch": 0.16, "learning_rate": 0.0002760913575318639, "loss": 0.0229, "step": 61490 }, { "epoch": 0.16, "learning_rate": 0.00027608746931549245, "loss": 0.0282, "step": 61500 }, { "epoch": 0.16, "learning_rate": 0.00027608358109912096, "loss": 0.0301, "step": 61510 }, { "epoch": 0.16, "learning_rate": 0.00027607969288274953, "loss": 0.0297, "step": 61520 }, { "epoch": 0.16, "learning_rate": 0.00027607580466637805, "loss": 0.0321, "step": 61530 }, { "epoch": 0.16, "learning_rate": 0.00027607191645000656, "loss": 0.0362, "step": 61540 }, { "epoch": 0.16, "learning_rate": 0.00027606802823363513, "loss": 0.029, "step": 61550 }, { "epoch": 0.16, "learning_rate": 0.00027606414001726364, "loss": 0.0211, "step": 61560 }, { "epoch": 0.16, "learning_rate": 0.00027606025180089216, "loss": 0.0226, "step": 61570 }, { "epoch": 0.16, "learning_rate": 0.00027605636358452073, "loss": 0.0274, "step": 61580 }, { "epoch": 0.16, "learning_rate": 0.0002760524753681493, "loss": 0.0259, "step": 61590 }, { "epoch": 0.16, "learning_rate": 0.0002760485871517778, "loss": 0.0238, "step": 61600 }, { "epoch": 0.16, "learning_rate": 0.0002760446989354063, "loss": 0.0272, "step": 61610 }, { "epoch": 0.16, "learning_rate": 0.00027604081071903484, "loss": 0.0208, "step": 61620 }, { "epoch": 0.16, "learning_rate": 0.0002760369225026634, "loss": 0.0267, "step": 61630 }, { "epoch": 0.16, "learning_rate": 0.0002760330342862919, "loss": 0.0266, "step": 61640 }, { "epoch": 0.16, "learning_rate": 0.0002760291460699205, "loss": 0.0246, "step": 61650 }, { "epoch": 0.16, "learning_rate": 0.000276025257853549, "loss": 0.0324, "step": 61660 }, { "epoch": 0.16, "learning_rate": 0.0002760213696371776, "loss": 0.0311, "step": 61670 }, { "epoch": 0.16, "learning_rate": 0.0002760174814208061, "loss": 0.0251, "step": 61680 }, { "epoch": 0.16, "learning_rate": 0.0002760135932044346, "loss": 0.0263, "step": 61690 }, { "epoch": 0.16, "learning_rate": 0.0002760097049880631, "loss": 0.0284, "step": 61700 }, { "epoch": 0.16, "learning_rate": 0.0002760058167716917, "loss": 0.0242, "step": 61710 }, { "epoch": 0.16, "learning_rate": 0.0002760019285553202, "loss": 0.0273, "step": 61720 }, { "epoch": 0.16, "learning_rate": 0.00027599804033894877, "loss": 0.0321, "step": 61730 }, { "epoch": 0.16, "learning_rate": 0.0002759941521225773, "loss": 0.0251, "step": 61740 }, { "epoch": 0.16, "learning_rate": 0.00027599026390620585, "loss": 0.0264, "step": 61750 }, { "epoch": 0.16, "learning_rate": 0.00027598637568983437, "loss": 0.0254, "step": 61760 }, { "epoch": 0.16, "learning_rate": 0.0002759824874734629, "loss": 0.0242, "step": 61770 }, { "epoch": 0.16, "learning_rate": 0.00027597859925709145, "loss": 0.0265, "step": 61780 }, { "epoch": 0.16, "learning_rate": 0.00027597471104071997, "loss": 0.0285, "step": 61790 }, { "epoch": 0.16, "learning_rate": 0.00027597082282434853, "loss": 0.0272, "step": 61800 }, { "epoch": 0.16, "learning_rate": 0.00027596693460797705, "loss": 0.0256, "step": 61810 }, { "epoch": 0.16, "learning_rate": 0.00027596304639160556, "loss": 0.0233, "step": 61820 }, { "epoch": 0.16, "learning_rate": 0.0002759591581752341, "loss": 0.0261, "step": 61830 }, { "epoch": 0.16, "learning_rate": 0.00027595526995886265, "loss": 0.0269, "step": 61840 }, { "epoch": 0.16, "learning_rate": 0.00027595138174249116, "loss": 0.029, "step": 61850 }, { "epoch": 0.16, "learning_rate": 0.00027594749352611973, "loss": 0.0199, "step": 61860 }, { "epoch": 0.16, "learning_rate": 0.00027594360530974825, "loss": 0.0327, "step": 61870 }, { "epoch": 0.16, "learning_rate": 0.0002759397170933768, "loss": 0.0215, "step": 61880 }, { "epoch": 0.16, "learning_rate": 0.00027593582887700533, "loss": 0.0264, "step": 61890 }, { "epoch": 0.16, "learning_rate": 0.00027593194066063384, "loss": 0.0233, "step": 61900 }, { "epoch": 0.16, "learning_rate": 0.00027592805244426236, "loss": 0.031, "step": 61910 }, { "epoch": 0.16, "learning_rate": 0.0002759241642278909, "loss": 0.0286, "step": 61920 }, { "epoch": 0.16, "learning_rate": 0.0002759202760115195, "loss": 0.0252, "step": 61930 }, { "epoch": 0.16, "learning_rate": 0.000275916387795148, "loss": 0.0302, "step": 61940 }, { "epoch": 0.16, "learning_rate": 0.0002759124995787765, "loss": 0.0252, "step": 61950 }, { "epoch": 0.16, "learning_rate": 0.0002759086113624051, "loss": 0.0249, "step": 61960 }, { "epoch": 0.16, "learning_rate": 0.0002759047231460336, "loss": 0.0222, "step": 61970 }, { "epoch": 0.16, "learning_rate": 0.0002759008349296621, "loss": 0.0317, "step": 61980 }, { "epoch": 0.16, "learning_rate": 0.0002758969467132907, "loss": 0.0284, "step": 61990 }, { "epoch": 0.16, "learning_rate": 0.0002758930584969192, "loss": 0.0285, "step": 62000 }, { "epoch": 0.16, "eval_cer": 0.8818426500165857, "eval_loss": 0.019648298621177673, "eval_runtime": 107.6017, "eval_samples_per_second": 18.587, "eval_steps_per_second": 4.647, "step": 62000 }, { "epoch": 0.16, "learning_rate": 0.0002758891702805478, "loss": 0.0248, "step": 62010 }, { "epoch": 0.16, "learning_rate": 0.0002758852820641763, "loss": 0.0273, "step": 62020 }, { "epoch": 0.16, "learning_rate": 0.0002758813938478048, "loss": 0.024, "step": 62030 }, { "epoch": 0.16, "learning_rate": 0.0002758775056314333, "loss": 0.0296, "step": 62040 }, { "epoch": 0.16, "learning_rate": 0.0002758736174150619, "loss": 0.0298, "step": 62050 }, { "epoch": 0.16, "learning_rate": 0.0002758697291986904, "loss": 0.0245, "step": 62060 }, { "epoch": 0.16, "learning_rate": 0.00027586584098231897, "loss": 0.0359, "step": 62070 }, { "epoch": 0.16, "learning_rate": 0.0002758619527659475, "loss": 0.0327, "step": 62080 }, { "epoch": 0.16, "learning_rate": 0.00027585806454957605, "loss": 0.0267, "step": 62090 }, { "epoch": 0.16, "learning_rate": 0.00027585417633320457, "loss": 0.0293, "step": 62100 }, { "epoch": 0.16, "learning_rate": 0.0002758502881168331, "loss": 0.0269, "step": 62110 }, { "epoch": 0.16, "learning_rate": 0.0002758463999004616, "loss": 0.0266, "step": 62120 }, { "epoch": 0.16, "learning_rate": 0.00027584251168409017, "loss": 0.028, "step": 62130 }, { "epoch": 0.16, "learning_rate": 0.00027583862346771873, "loss": 0.0241, "step": 62140 }, { "epoch": 0.16, "learning_rate": 0.00027583473525134725, "loss": 0.0287, "step": 62150 }, { "epoch": 0.16, "learning_rate": 0.00027583084703497576, "loss": 0.0248, "step": 62160 }, { "epoch": 0.16, "learning_rate": 0.00027582695881860433, "loss": 0.0303, "step": 62170 }, { "epoch": 0.16, "learning_rate": 0.00027582307060223285, "loss": 0.0273, "step": 62180 }, { "epoch": 0.16, "learning_rate": 0.00027581918238586136, "loss": 0.0284, "step": 62190 }, { "epoch": 0.16, "learning_rate": 0.00027581529416948993, "loss": 0.0233, "step": 62200 }, { "epoch": 0.16, "learning_rate": 0.00027581140595311844, "loss": 0.028, "step": 62210 }, { "epoch": 0.16, "learning_rate": 0.000275807517736747, "loss": 0.023, "step": 62220 }, { "epoch": 0.16, "learning_rate": 0.00027580362952037553, "loss": 0.0239, "step": 62230 }, { "epoch": 0.16, "learning_rate": 0.00027579974130400404, "loss": 0.027, "step": 62240 }, { "epoch": 0.16, "learning_rate": 0.0002757958530876326, "loss": 0.022, "step": 62250 }, { "epoch": 0.16, "learning_rate": 0.0002757919648712611, "loss": 0.0208, "step": 62260 }, { "epoch": 0.16, "learning_rate": 0.0002757880766548897, "loss": 0.0277, "step": 62270 }, { "epoch": 0.16, "learning_rate": 0.0002757841884385182, "loss": 0.0259, "step": 62280 }, { "epoch": 0.16, "learning_rate": 0.0002757803002221467, "loss": 0.0204, "step": 62290 }, { "epoch": 0.16, "learning_rate": 0.0002757764120057753, "loss": 0.0294, "step": 62300 }, { "epoch": 0.16, "learning_rate": 0.0002757725237894038, "loss": 0.0282, "step": 62310 }, { "epoch": 0.16, "learning_rate": 0.0002757686355730323, "loss": 0.0234, "step": 62320 }, { "epoch": 0.16, "learning_rate": 0.0002757647473566609, "loss": 0.0227, "step": 62330 }, { "epoch": 0.16, "learning_rate": 0.0002757608591402894, "loss": 0.0266, "step": 62340 }, { "epoch": 0.16, "learning_rate": 0.00027575697092391797, "loss": 0.0288, "step": 62350 }, { "epoch": 0.16, "learning_rate": 0.0002757530827075465, "loss": 0.0238, "step": 62360 }, { "epoch": 0.16, "learning_rate": 0.000275749194491175, "loss": 0.0267, "step": 62370 }, { "epoch": 0.16, "learning_rate": 0.00027574530627480357, "loss": 0.0227, "step": 62380 }, { "epoch": 0.16, "learning_rate": 0.0002757414180584321, "loss": 0.0236, "step": 62390 }, { "epoch": 0.16, "learning_rate": 0.0002757375298420606, "loss": 0.0182, "step": 62400 }, { "epoch": 0.16, "learning_rate": 0.00027573364162568917, "loss": 0.0221, "step": 62410 }, { "epoch": 0.16, "learning_rate": 0.00027572975340931774, "loss": 0.0257, "step": 62420 }, { "epoch": 0.16, "learning_rate": 0.00027572586519294625, "loss": 0.0237, "step": 62430 }, { "epoch": 0.16, "learning_rate": 0.00027572197697657477, "loss": 0.0242, "step": 62440 }, { "epoch": 0.16, "learning_rate": 0.0002757180887602033, "loss": 0.0282, "step": 62450 }, { "epoch": 0.16, "learning_rate": 0.00027571420054383185, "loss": 0.0231, "step": 62460 }, { "epoch": 0.16, "learning_rate": 0.00027571031232746036, "loss": 0.0287, "step": 62470 }, { "epoch": 0.16, "learning_rate": 0.00027570642411108893, "loss": 0.0286, "step": 62480 }, { "epoch": 0.16, "learning_rate": 0.00027570253589471745, "loss": 0.026, "step": 62490 }, { "epoch": 0.16, "learning_rate": 0.000275698647678346, "loss": 0.0264, "step": 62500 }, { "epoch": 0.16, "learning_rate": 0.00027569475946197453, "loss": 0.0237, "step": 62510 }, { "epoch": 0.16, "learning_rate": 0.00027569087124560304, "loss": 0.0246, "step": 62520 }, { "epoch": 0.16, "learning_rate": 0.00027568698302923156, "loss": 0.0248, "step": 62530 }, { "epoch": 0.16, "learning_rate": 0.00027568309481286013, "loss": 0.0283, "step": 62540 }, { "epoch": 0.16, "learning_rate": 0.00027567920659648864, "loss": 0.0263, "step": 62550 }, { "epoch": 0.16, "learning_rate": 0.0002756753183801172, "loss": 0.0284, "step": 62560 }, { "epoch": 0.16, "learning_rate": 0.0002756714301637457, "loss": 0.0251, "step": 62570 }, { "epoch": 0.16, "learning_rate": 0.00027566754194737424, "loss": 0.0244, "step": 62580 }, { "epoch": 0.16, "learning_rate": 0.0002756636537310028, "loss": 0.0269, "step": 62590 }, { "epoch": 0.16, "learning_rate": 0.0002756597655146313, "loss": 0.0209, "step": 62600 }, { "epoch": 0.16, "learning_rate": 0.00027565587729825984, "loss": 0.0225, "step": 62610 }, { "epoch": 0.16, "learning_rate": 0.0002756519890818884, "loss": 0.0275, "step": 62620 }, { "epoch": 0.16, "learning_rate": 0.000275648100865517, "loss": 0.027, "step": 62630 }, { "epoch": 0.16, "learning_rate": 0.0002756442126491455, "loss": 0.0224, "step": 62640 }, { "epoch": 0.16, "learning_rate": 0.000275640324432774, "loss": 0.0238, "step": 62650 }, { "epoch": 0.16, "learning_rate": 0.0002756364362164025, "loss": 0.0244, "step": 62660 }, { "epoch": 0.16, "learning_rate": 0.0002756325480000311, "loss": 0.0273, "step": 62670 }, { "epoch": 0.16, "learning_rate": 0.0002756286597836596, "loss": 0.0261, "step": 62680 }, { "epoch": 0.16, "learning_rate": 0.00027562477156728817, "loss": 0.0263, "step": 62690 }, { "epoch": 0.16, "learning_rate": 0.0002756208833509167, "loss": 0.0275, "step": 62700 }, { "epoch": 0.16, "learning_rate": 0.00027561699513454525, "loss": 0.0275, "step": 62710 }, { "epoch": 0.16, "learning_rate": 0.00027561310691817377, "loss": 0.0265, "step": 62720 }, { "epoch": 0.16, "learning_rate": 0.0002756092187018023, "loss": 0.0225, "step": 62730 }, { "epoch": 0.16, "learning_rate": 0.0002756053304854308, "loss": 0.0264, "step": 62740 }, { "epoch": 0.16, "learning_rate": 0.00027560144226905937, "loss": 0.0224, "step": 62750 }, { "epoch": 0.16, "learning_rate": 0.0002755975540526879, "loss": 0.0265, "step": 62760 }, { "epoch": 0.16, "learning_rate": 0.00027559366583631645, "loss": 0.026, "step": 62770 }, { "epoch": 0.16, "learning_rate": 0.00027558977761994496, "loss": 0.0277, "step": 62780 }, { "epoch": 0.16, "learning_rate": 0.0002755858894035735, "loss": 0.0247, "step": 62790 }, { "epoch": 0.16, "learning_rate": 0.00027558200118720205, "loss": 0.0303, "step": 62800 }, { "epoch": 0.16, "learning_rate": 0.00027557811297083056, "loss": 0.021, "step": 62810 }, { "epoch": 0.16, "learning_rate": 0.00027557422475445913, "loss": 0.021, "step": 62820 }, { "epoch": 0.16, "learning_rate": 0.00027557033653808765, "loss": 0.0234, "step": 62830 }, { "epoch": 0.16, "learning_rate": 0.0002755664483217162, "loss": 0.0216, "step": 62840 }, { "epoch": 0.16, "learning_rate": 0.00027556256010534473, "loss": 0.0305, "step": 62850 }, { "epoch": 0.16, "learning_rate": 0.00027555867188897324, "loss": 0.0251, "step": 62860 }, { "epoch": 0.16, "learning_rate": 0.00027555478367260176, "loss": 0.0249, "step": 62870 }, { "epoch": 0.16, "learning_rate": 0.0002755508954562303, "loss": 0.026, "step": 62880 }, { "epoch": 0.16, "learning_rate": 0.00027554700723985884, "loss": 0.0329, "step": 62890 }, { "epoch": 0.16, "learning_rate": 0.0002755431190234874, "loss": 0.0272, "step": 62900 }, { "epoch": 0.16, "learning_rate": 0.0002755392308071159, "loss": 0.0276, "step": 62910 }, { "epoch": 0.16, "learning_rate": 0.0002755353425907445, "loss": 0.0329, "step": 62920 }, { "epoch": 0.16, "learning_rate": 0.000275531454374373, "loss": 0.0223, "step": 62930 }, { "epoch": 0.16, "learning_rate": 0.0002755275661580015, "loss": 0.0293, "step": 62940 }, { "epoch": 0.16, "learning_rate": 0.00027552367794163004, "loss": 0.0323, "step": 62950 }, { "epoch": 0.16, "learning_rate": 0.0002755197897252586, "loss": 0.0246, "step": 62960 }, { "epoch": 0.16, "learning_rate": 0.0002755159015088872, "loss": 0.0205, "step": 62970 }, { "epoch": 0.16, "learning_rate": 0.0002755120132925157, "loss": 0.0242, "step": 62980 }, { "epoch": 0.16, "learning_rate": 0.0002755081250761442, "loss": 0.028, "step": 62990 }, { "epoch": 0.16, "learning_rate": 0.00027550423685977277, "loss": 0.0253, "step": 63000 }, { "epoch": 0.16, "eval_cer": 0.8818356518319148, "eval_loss": 0.018866481259465218, "eval_runtime": 107.714, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 63000 }, { "epoch": 0.16, "learning_rate": 0.0002755003486434013, "loss": 0.0263, "step": 63010 }, { "epoch": 0.16, "learning_rate": 0.0002754964604270298, "loss": 0.0276, "step": 63020 }, { "epoch": 0.16, "learning_rate": 0.00027549257221065837, "loss": 0.0318, "step": 63030 }, { "epoch": 0.16, "learning_rate": 0.0002754886839942869, "loss": 0.0266, "step": 63040 }, { "epoch": 0.16, "learning_rate": 0.00027548479577791545, "loss": 0.0235, "step": 63050 }, { "epoch": 0.16, "learning_rate": 0.00027548090756154397, "loss": 0.026, "step": 63060 }, { "epoch": 0.16, "learning_rate": 0.0002754770193451725, "loss": 0.0332, "step": 63070 }, { "epoch": 0.16, "learning_rate": 0.000275473131128801, "loss": 0.0296, "step": 63080 }, { "epoch": 0.16, "learning_rate": 0.00027546924291242957, "loss": 0.0264, "step": 63090 }, { "epoch": 0.16, "learning_rate": 0.0002754653546960581, "loss": 0.0284, "step": 63100 }, { "epoch": 0.16, "learning_rate": 0.00027546146647968665, "loss": 0.033, "step": 63110 }, { "epoch": 0.16, "learning_rate": 0.00027545757826331516, "loss": 0.0239, "step": 63120 }, { "epoch": 0.16, "learning_rate": 0.00027545369004694373, "loss": 0.0235, "step": 63130 }, { "epoch": 0.16, "learning_rate": 0.00027544980183057225, "loss": 0.0327, "step": 63140 }, { "epoch": 0.16, "learning_rate": 0.00027544591361420076, "loss": 0.0312, "step": 63150 }, { "epoch": 0.16, "learning_rate": 0.0002754420253978293, "loss": 0.0286, "step": 63160 }, { "epoch": 0.16, "learning_rate": 0.00027543813718145784, "loss": 0.0312, "step": 63170 }, { "epoch": 0.16, "learning_rate": 0.0002754342489650864, "loss": 0.0279, "step": 63180 }, { "epoch": 0.16, "learning_rate": 0.00027543036074871493, "loss": 0.0279, "step": 63190 }, { "epoch": 0.16, "learning_rate": 0.00027542647253234344, "loss": 0.0277, "step": 63200 }, { "epoch": 0.16, "learning_rate": 0.000275422584315972, "loss": 0.0268, "step": 63210 }, { "epoch": 0.16, "learning_rate": 0.0002754186960996005, "loss": 0.0261, "step": 63220 }, { "epoch": 0.16, "learning_rate": 0.00027541480788322904, "loss": 0.0263, "step": 63230 }, { "epoch": 0.16, "learning_rate": 0.0002754109196668576, "loss": 0.0303, "step": 63240 }, { "epoch": 0.16, "learning_rate": 0.0002754070314504861, "loss": 0.0272, "step": 63250 }, { "epoch": 0.16, "learning_rate": 0.0002754031432341147, "loss": 0.0268, "step": 63260 }, { "epoch": 0.16, "learning_rate": 0.0002753992550177432, "loss": 0.0267, "step": 63270 }, { "epoch": 0.16, "learning_rate": 0.0002753953668013717, "loss": 0.0275, "step": 63280 }, { "epoch": 0.16, "learning_rate": 0.00027539147858500024, "loss": 0.0348, "step": 63290 }, { "epoch": 0.16, "learning_rate": 0.0002753875903686288, "loss": 0.0329, "step": 63300 }, { "epoch": 0.16, "learning_rate": 0.0002753837021522573, "loss": 0.0228, "step": 63310 }, { "epoch": 0.16, "learning_rate": 0.0002753798139358859, "loss": 0.0277, "step": 63320 }, { "epoch": 0.16, "learning_rate": 0.0002753759257195144, "loss": 0.028, "step": 63330 }, { "epoch": 0.16, "learning_rate": 0.00027537203750314297, "loss": 0.026, "step": 63340 }, { "epoch": 0.16, "learning_rate": 0.0002753681492867715, "loss": 0.02, "step": 63350 }, { "epoch": 0.16, "learning_rate": 0.0002753642610704, "loss": 0.0251, "step": 63360 }, { "epoch": 0.16, "learning_rate": 0.00027536037285402857, "loss": 0.0275, "step": 63370 }, { "epoch": 0.16, "learning_rate": 0.0002753564846376571, "loss": 0.0266, "step": 63380 }, { "epoch": 0.16, "learning_rate": 0.00027535259642128565, "loss": 0.023, "step": 63390 }, { "epoch": 0.16, "learning_rate": 0.00027534870820491417, "loss": 0.0268, "step": 63400 }, { "epoch": 0.16, "learning_rate": 0.0002753448199885427, "loss": 0.0251, "step": 63410 }, { "epoch": 0.16, "learning_rate": 0.00027534093177217125, "loss": 0.027, "step": 63420 }, { "epoch": 0.16, "learning_rate": 0.00027533704355579976, "loss": 0.0268, "step": 63430 }, { "epoch": 0.16, "learning_rate": 0.0002753331553394283, "loss": 0.0329, "step": 63440 }, { "epoch": 0.16, "learning_rate": 0.00027532926712305685, "loss": 0.0252, "step": 63450 }, { "epoch": 0.16, "learning_rate": 0.0002753253789066854, "loss": 0.0243, "step": 63460 }, { "epoch": 0.16, "learning_rate": 0.00027532149069031393, "loss": 0.0221, "step": 63470 }, { "epoch": 0.16, "learning_rate": 0.00027531760247394245, "loss": 0.0275, "step": 63480 }, { "epoch": 0.16, "learning_rate": 0.00027531371425757096, "loss": 0.0262, "step": 63490 }, { "epoch": 0.16, "learning_rate": 0.00027530982604119953, "loss": 0.0242, "step": 63500 }, { "epoch": 0.16, "learning_rate": 0.00027530593782482804, "loss": 0.0245, "step": 63510 }, { "epoch": 0.16, "learning_rate": 0.0002753020496084566, "loss": 0.0283, "step": 63520 }, { "epoch": 0.16, "learning_rate": 0.0002752981613920851, "loss": 0.0261, "step": 63530 }, { "epoch": 0.16, "learning_rate": 0.00027529427317571364, "loss": 0.0288, "step": 63540 }, { "epoch": 0.16, "learning_rate": 0.0002752903849593422, "loss": 0.0249, "step": 63550 }, { "epoch": 0.16, "learning_rate": 0.0002752864967429707, "loss": 0.0302, "step": 63560 }, { "epoch": 0.16, "learning_rate": 0.00027528260852659924, "loss": 0.0242, "step": 63570 }, { "epoch": 0.16, "learning_rate": 0.0002752787203102278, "loss": 0.0252, "step": 63580 }, { "epoch": 0.16, "learning_rate": 0.0002752748320938563, "loss": 0.0258, "step": 63590 }, { "epoch": 0.16, "learning_rate": 0.0002752709438774849, "loss": 0.0233, "step": 63600 }, { "epoch": 0.16, "learning_rate": 0.0002752670556611134, "loss": 0.0321, "step": 63610 }, { "epoch": 0.16, "learning_rate": 0.0002752631674447419, "loss": 0.0242, "step": 63620 }, { "epoch": 0.16, "learning_rate": 0.0002752592792283705, "loss": 0.0584, "step": 63630 }, { "epoch": 0.16, "learning_rate": 0.000275255391011999, "loss": 0.0265, "step": 63640 }, { "epoch": 0.16, "learning_rate": 0.0002752515027956275, "loss": 0.0271, "step": 63650 }, { "epoch": 0.17, "learning_rate": 0.0002752476145792561, "loss": 0.0306, "step": 63660 }, { "epoch": 0.17, "learning_rate": 0.00027524372636288466, "loss": 0.0429, "step": 63670 }, { "epoch": 0.17, "learning_rate": 0.00027523983814651317, "loss": 0.0229, "step": 63680 }, { "epoch": 0.17, "learning_rate": 0.0002752359499301417, "loss": 0.0288, "step": 63690 }, { "epoch": 0.17, "learning_rate": 0.0002752320617137702, "loss": 0.0421, "step": 63700 }, { "epoch": 0.17, "learning_rate": 0.00027522817349739877, "loss": 0.0224, "step": 63710 }, { "epoch": 0.17, "learning_rate": 0.0002752242852810273, "loss": 0.024, "step": 63720 }, { "epoch": 0.17, "learning_rate": 0.00027522039706465585, "loss": 0.0271, "step": 63730 }, { "epoch": 0.17, "learning_rate": 0.00027521650884828437, "loss": 0.0318, "step": 63740 }, { "epoch": 0.17, "learning_rate": 0.00027521262063191293, "loss": 0.0251, "step": 63750 }, { "epoch": 0.17, "learning_rate": 0.00027520873241554145, "loss": 0.0245, "step": 63760 }, { "epoch": 0.17, "learning_rate": 0.00027520484419916996, "loss": 0.0247, "step": 63770 }, { "epoch": 0.17, "learning_rate": 0.0002752009559827985, "loss": 0.0263, "step": 63780 }, { "epoch": 0.17, "learning_rate": 0.00027519706776642705, "loss": 0.0275, "step": 63790 }, { "epoch": 0.17, "learning_rate": 0.00027519317955005556, "loss": 0.032, "step": 63800 }, { "epoch": 0.17, "learning_rate": 0.00027518929133368413, "loss": 0.0243, "step": 63810 }, { "epoch": 0.17, "learning_rate": 0.00027518540311731264, "loss": 0.031, "step": 63820 }, { "epoch": 0.17, "learning_rate": 0.00027518151490094116, "loss": 0.0237, "step": 63830 }, { "epoch": 0.17, "learning_rate": 0.00027517762668456973, "loss": 0.0221, "step": 63840 }, { "epoch": 0.17, "learning_rate": 0.00027517373846819824, "loss": 0.0221, "step": 63850 }, { "epoch": 0.17, "learning_rate": 0.0002751698502518268, "loss": 0.0277, "step": 63860 }, { "epoch": 0.17, "learning_rate": 0.0002751659620354553, "loss": 0.0251, "step": 63870 }, { "epoch": 0.17, "learning_rate": 0.0002751620738190839, "loss": 0.0268, "step": 63880 }, { "epoch": 0.17, "learning_rate": 0.0002751581856027124, "loss": 0.0249, "step": 63890 }, { "epoch": 0.17, "learning_rate": 0.0002751542973863409, "loss": 0.0273, "step": 63900 }, { "epoch": 0.17, "learning_rate": 0.00027515040916996944, "loss": 0.027, "step": 63910 }, { "epoch": 0.17, "learning_rate": 0.000275146520953598, "loss": 0.0246, "step": 63920 }, { "epoch": 0.17, "learning_rate": 0.0002751426327372265, "loss": 0.0269, "step": 63930 }, { "epoch": 0.17, "learning_rate": 0.0002751387445208551, "loss": 0.022, "step": 63940 }, { "epoch": 0.17, "learning_rate": 0.0002751348563044836, "loss": 0.0288, "step": 63950 }, { "epoch": 0.17, "learning_rate": 0.0002751309680881122, "loss": 0.0265, "step": 63960 }, { "epoch": 0.17, "learning_rate": 0.0002751270798717407, "loss": 0.0233, "step": 63970 }, { "epoch": 0.17, "learning_rate": 0.0002751231916553692, "loss": 0.0273, "step": 63980 }, { "epoch": 0.17, "learning_rate": 0.0002751193034389977, "loss": 0.0279, "step": 63990 }, { "epoch": 0.17, "learning_rate": 0.0002751154152226263, "loss": 0.0284, "step": 64000 }, { "epoch": 0.17, "eval_cer": 0.8818384511057832, "eval_loss": 0.018597625195980072, "eval_runtime": 108.1781, "eval_samples_per_second": 18.488, "eval_steps_per_second": 4.622, "step": 64000 }, { "epoch": 0.17, "learning_rate": 0.00027511152700625485, "loss": 0.0261, "step": 64010 }, { "epoch": 0.17, "learning_rate": 0.00027510763878988337, "loss": 0.0258, "step": 64020 }, { "epoch": 0.17, "learning_rate": 0.0002751037505735119, "loss": 0.0294, "step": 64030 }, { "epoch": 0.17, "learning_rate": 0.0002750998623571404, "loss": 0.0255, "step": 64040 }, { "epoch": 0.17, "learning_rate": 0.00027509597414076897, "loss": 0.031, "step": 64050 }, { "epoch": 0.17, "learning_rate": 0.0002750920859243975, "loss": 0.0274, "step": 64060 }, { "epoch": 0.17, "learning_rate": 0.00027508819770802605, "loss": 0.0303, "step": 64070 }, { "epoch": 0.17, "learning_rate": 0.00027508430949165456, "loss": 0.0212, "step": 64080 }, { "epoch": 0.17, "learning_rate": 0.00027508042127528313, "loss": 0.0259, "step": 64090 }, { "epoch": 0.17, "learning_rate": 0.00027507653305891165, "loss": 0.0248, "step": 64100 }, { "epoch": 0.17, "learning_rate": 0.00027507264484254016, "loss": 0.0264, "step": 64110 }, { "epoch": 0.17, "learning_rate": 0.0002750687566261687, "loss": 0.025, "step": 64120 }, { "epoch": 0.17, "learning_rate": 0.00027506486840979725, "loss": 0.0237, "step": 64130 }, { "epoch": 0.17, "learning_rate": 0.00027506098019342576, "loss": 0.0234, "step": 64140 }, { "epoch": 0.17, "learning_rate": 0.00027505709197705433, "loss": 0.0264, "step": 64150 }, { "epoch": 0.17, "learning_rate": 0.00027505320376068284, "loss": 0.0264, "step": 64160 }, { "epoch": 0.17, "learning_rate": 0.0002750493155443114, "loss": 0.0233, "step": 64170 }, { "epoch": 0.17, "learning_rate": 0.0002750454273279399, "loss": 0.0258, "step": 64180 }, { "epoch": 0.17, "learning_rate": 0.00027504153911156844, "loss": 0.0301, "step": 64190 }, { "epoch": 0.17, "learning_rate": 0.00027503765089519696, "loss": 0.0313, "step": 64200 }, { "epoch": 0.17, "learning_rate": 0.0002750337626788255, "loss": 0.0259, "step": 64210 }, { "epoch": 0.17, "learning_rate": 0.0002750298744624541, "loss": 0.0273, "step": 64220 }, { "epoch": 0.17, "learning_rate": 0.0002750259862460826, "loss": 0.0283, "step": 64230 }, { "epoch": 0.17, "learning_rate": 0.0002750220980297111, "loss": 0.0263, "step": 64240 }, { "epoch": 0.17, "learning_rate": 0.0002750182098133397, "loss": 0.0256, "step": 64250 }, { "epoch": 0.17, "learning_rate": 0.0002750143215969682, "loss": 0.0214, "step": 64260 }, { "epoch": 0.17, "learning_rate": 0.0002750104333805967, "loss": 0.0282, "step": 64270 }, { "epoch": 0.17, "learning_rate": 0.0002750065451642253, "loss": 0.0258, "step": 64280 }, { "epoch": 0.17, "learning_rate": 0.0002750026569478538, "loss": 0.0301, "step": 64290 }, { "epoch": 0.17, "learning_rate": 0.00027499876873148237, "loss": 0.0254, "step": 64300 }, { "epoch": 0.17, "learning_rate": 0.0002749948805151109, "loss": 0.0218, "step": 64310 }, { "epoch": 0.17, "learning_rate": 0.0002749909922987394, "loss": 0.0278, "step": 64320 }, { "epoch": 0.17, "learning_rate": 0.0002749871040823679, "loss": 0.0279, "step": 64330 }, { "epoch": 0.17, "learning_rate": 0.0002749832158659965, "loss": 0.0325, "step": 64340 }, { "epoch": 0.17, "learning_rate": 0.000274979327649625, "loss": 0.0253, "step": 64350 }, { "epoch": 0.17, "learning_rate": 0.00027497543943325357, "loss": 0.024, "step": 64360 }, { "epoch": 0.17, "learning_rate": 0.0002749715512168821, "loss": 0.0245, "step": 64370 }, { "epoch": 0.17, "learning_rate": 0.00027496766300051065, "loss": 0.0221, "step": 64380 }, { "epoch": 0.17, "learning_rate": 0.00027496377478413917, "loss": 0.0277, "step": 64390 }, { "epoch": 0.17, "learning_rate": 0.0002749598865677677, "loss": 0.0284, "step": 64400 }, { "epoch": 0.17, "learning_rate": 0.00027495599835139625, "loss": 0.0265, "step": 64410 }, { "epoch": 0.17, "learning_rate": 0.00027495211013502476, "loss": 0.0267, "step": 64420 }, { "epoch": 0.17, "learning_rate": 0.00027494822191865333, "loss": 0.0267, "step": 64430 }, { "epoch": 0.17, "learning_rate": 0.00027494433370228185, "loss": 0.0266, "step": 64440 }, { "epoch": 0.17, "learning_rate": 0.00027494044548591036, "loss": 0.0265, "step": 64450 }, { "epoch": 0.17, "learning_rate": 0.00027493655726953893, "loss": 0.027, "step": 64460 }, { "epoch": 0.17, "learning_rate": 0.00027493266905316744, "loss": 0.0246, "step": 64470 }, { "epoch": 0.17, "learning_rate": 0.00027492878083679596, "loss": 0.0293, "step": 64480 }, { "epoch": 0.17, "learning_rate": 0.00027492489262042453, "loss": 0.026, "step": 64490 }, { "epoch": 0.17, "learning_rate": 0.00027492100440405304, "loss": 0.0191, "step": 64500 }, { "epoch": 0.17, "learning_rate": 0.0002749171161876816, "loss": 0.0247, "step": 64510 }, { "epoch": 0.17, "learning_rate": 0.0002749132279713101, "loss": 0.0205, "step": 64520 }, { "epoch": 0.17, "learning_rate": 0.00027490933975493864, "loss": 0.0273, "step": 64530 }, { "epoch": 0.17, "learning_rate": 0.00027490545153856715, "loss": 0.0248, "step": 64540 }, { "epoch": 0.17, "learning_rate": 0.0002749015633221957, "loss": 0.0281, "step": 64550 }, { "epoch": 0.17, "learning_rate": 0.0002748976751058243, "loss": 0.0248, "step": 64560 }, { "epoch": 0.17, "learning_rate": 0.0002748937868894528, "loss": 0.0246, "step": 64570 }, { "epoch": 0.17, "learning_rate": 0.0002748898986730813, "loss": 0.0262, "step": 64580 }, { "epoch": 0.17, "learning_rate": 0.0002748860104567099, "loss": 0.0312, "step": 64590 }, { "epoch": 0.17, "learning_rate": 0.0002748821222403384, "loss": 0.0202, "step": 64600 }, { "epoch": 0.17, "learning_rate": 0.0002748782340239669, "loss": 0.0259, "step": 64610 }, { "epoch": 0.17, "learning_rate": 0.0002748743458075955, "loss": 0.0266, "step": 64620 }, { "epoch": 0.17, "learning_rate": 0.000274870457591224, "loss": 0.027, "step": 64630 }, { "epoch": 0.17, "learning_rate": 0.00027486656937485257, "loss": 0.0333, "step": 64640 }, { "epoch": 0.17, "learning_rate": 0.0002748626811584811, "loss": 0.022, "step": 64650 }, { "epoch": 0.17, "learning_rate": 0.0002748587929421096, "loss": 0.0242, "step": 64660 }, { "epoch": 0.17, "learning_rate": 0.00027485490472573817, "loss": 0.0283, "step": 64670 }, { "epoch": 0.17, "learning_rate": 0.0002748510165093667, "loss": 0.0289, "step": 64680 }, { "epoch": 0.17, "learning_rate": 0.0002748471282929952, "loss": 0.0288, "step": 64690 }, { "epoch": 0.17, "learning_rate": 0.00027484324007662377, "loss": 0.0247, "step": 64700 }, { "epoch": 0.17, "learning_rate": 0.00027483935186025234, "loss": 0.0241, "step": 64710 }, { "epoch": 0.17, "learning_rate": 0.00027483546364388085, "loss": 0.0298, "step": 64720 }, { "epoch": 0.17, "learning_rate": 0.00027483157542750936, "loss": 0.03, "step": 64730 }, { "epoch": 0.17, "learning_rate": 0.0002748276872111379, "loss": 0.0253, "step": 64740 }, { "epoch": 0.17, "learning_rate": 0.00027482379899476645, "loss": 0.0283, "step": 64750 }, { "epoch": 0.17, "learning_rate": 0.00027481991077839496, "loss": 0.0256, "step": 64760 }, { "epoch": 0.17, "learning_rate": 0.00027481602256202353, "loss": 0.0206, "step": 64770 }, { "epoch": 0.17, "learning_rate": 0.00027481213434565205, "loss": 0.0265, "step": 64780 }, { "epoch": 0.17, "learning_rate": 0.00027480824612928056, "loss": 0.0283, "step": 64790 }, { "epoch": 0.17, "learning_rate": 0.00027480435791290913, "loss": 0.0224, "step": 64800 }, { "epoch": 0.17, "learning_rate": 0.00027480046969653764, "loss": 0.0224, "step": 64810 }, { "epoch": 0.17, "learning_rate": 0.00027479658148016616, "loss": 0.0237, "step": 64820 }, { "epoch": 0.17, "learning_rate": 0.0002747926932637947, "loss": 0.025, "step": 64830 }, { "epoch": 0.17, "learning_rate": 0.00027478880504742324, "loss": 0.0228, "step": 64840 }, { "epoch": 0.17, "learning_rate": 0.0002747849168310518, "loss": 0.0251, "step": 64850 }, { "epoch": 0.17, "learning_rate": 0.0002747810286146803, "loss": 0.0255, "step": 64860 }, { "epoch": 0.17, "learning_rate": 0.00027477714039830884, "loss": 0.0273, "step": 64870 }, { "epoch": 0.17, "learning_rate": 0.0002747732521819374, "loss": 0.0296, "step": 64880 }, { "epoch": 0.17, "learning_rate": 0.0002747693639655659, "loss": 0.0263, "step": 64890 }, { "epoch": 0.17, "learning_rate": 0.00027476547574919444, "loss": 0.0279, "step": 64900 }, { "epoch": 0.17, "learning_rate": 0.000274761587532823, "loss": 0.0305, "step": 64910 }, { "epoch": 0.17, "learning_rate": 0.0002747576993164516, "loss": 0.0248, "step": 64920 }, { "epoch": 0.17, "learning_rate": 0.0002747538111000801, "loss": 0.0212, "step": 64930 }, { "epoch": 0.17, "learning_rate": 0.0002747499228837086, "loss": 0.0241, "step": 64940 }, { "epoch": 0.17, "learning_rate": 0.0002747460346673371, "loss": 0.0242, "step": 64950 }, { "epoch": 0.17, "learning_rate": 0.0002747421464509657, "loss": 0.0305, "step": 64960 }, { "epoch": 0.17, "learning_rate": 0.0002747382582345942, "loss": 0.0241, "step": 64970 }, { "epoch": 0.17, "learning_rate": 0.00027473437001822277, "loss": 0.0277, "step": 64980 }, { "epoch": 0.17, "learning_rate": 0.0002747304818018513, "loss": 0.0225, "step": 64990 }, { "epoch": 0.17, "learning_rate": 0.00027472659358547985, "loss": 0.0214, "step": 65000 }, { "epoch": 0.17, "eval_cer": 0.8818076590932312, "eval_loss": 0.01859799586236477, "eval_runtime": 108.2159, "eval_samples_per_second": 18.482, "eval_steps_per_second": 4.62, "step": 65000 }, { "epoch": 0.17, "learning_rate": 0.00027472270536910837, "loss": 0.025, "step": 65010 }, { "epoch": 0.17, "learning_rate": 0.0002747188171527369, "loss": 0.0277, "step": 65020 }, { "epoch": 0.17, "learning_rate": 0.0002747149289363654, "loss": 0.0265, "step": 65030 }, { "epoch": 0.17, "learning_rate": 0.00027471104071999397, "loss": 0.0267, "step": 65040 }, { "epoch": 0.17, "learning_rate": 0.00027470715250362253, "loss": 0.0231, "step": 65050 }, { "epoch": 0.17, "learning_rate": 0.00027470326428725105, "loss": 0.0262, "step": 65060 }, { "epoch": 0.17, "learning_rate": 0.00027469937607087956, "loss": 0.0302, "step": 65070 }, { "epoch": 0.17, "learning_rate": 0.0002746954878545081, "loss": 0.0231, "step": 65080 }, { "epoch": 0.17, "learning_rate": 0.00027469159963813665, "loss": 0.028, "step": 65090 }, { "epoch": 0.17, "learning_rate": 0.00027468771142176516, "loss": 0.0265, "step": 65100 }, { "epoch": 0.17, "learning_rate": 0.00027468382320539373, "loss": 0.0236, "step": 65110 }, { "epoch": 0.17, "learning_rate": 0.00027467993498902224, "loss": 0.0311, "step": 65120 }, { "epoch": 0.17, "learning_rate": 0.0002746760467726508, "loss": 0.0234, "step": 65130 }, { "epoch": 0.17, "learning_rate": 0.00027467215855627933, "loss": 0.0255, "step": 65140 }, { "epoch": 0.17, "learning_rate": 0.00027466827033990784, "loss": 0.0277, "step": 65150 }, { "epoch": 0.17, "learning_rate": 0.00027466438212353636, "loss": 0.0282, "step": 65160 }, { "epoch": 0.17, "learning_rate": 0.0002746604939071649, "loss": 0.0267, "step": 65170 }, { "epoch": 0.17, "learning_rate": 0.00027465660569079344, "loss": 0.027, "step": 65180 }, { "epoch": 0.17, "learning_rate": 0.000274652717474422, "loss": 0.0255, "step": 65190 }, { "epoch": 0.17, "learning_rate": 0.0002746488292580505, "loss": 0.0267, "step": 65200 }, { "epoch": 0.17, "learning_rate": 0.0002746449410416791, "loss": 0.0258, "step": 65210 }, { "epoch": 0.17, "learning_rate": 0.0002746410528253076, "loss": 0.0233, "step": 65220 }, { "epoch": 0.17, "learning_rate": 0.0002746371646089361, "loss": 0.0289, "step": 65230 }, { "epoch": 0.17, "learning_rate": 0.00027463327639256464, "loss": 0.0288, "step": 65240 }, { "epoch": 0.17, "learning_rate": 0.0002746293881761932, "loss": 0.0235, "step": 65250 }, { "epoch": 0.17, "learning_rate": 0.0002746254999598218, "loss": 0.0218, "step": 65260 }, { "epoch": 0.17, "learning_rate": 0.0002746216117434503, "loss": 0.0259, "step": 65270 }, { "epoch": 0.17, "learning_rate": 0.0002746177235270788, "loss": 0.0287, "step": 65280 }, { "epoch": 0.17, "learning_rate": 0.0002746138353107073, "loss": 0.0262, "step": 65290 }, { "epoch": 0.17, "learning_rate": 0.0002746099470943359, "loss": 0.0246, "step": 65300 }, { "epoch": 0.17, "learning_rate": 0.0002746060588779644, "loss": 0.0204, "step": 65310 }, { "epoch": 0.17, "learning_rate": 0.00027460217066159297, "loss": 0.0184, "step": 65320 }, { "epoch": 0.17, "learning_rate": 0.0002745982824452215, "loss": 0.0363, "step": 65330 }, { "epoch": 0.17, "learning_rate": 0.00027459439422885005, "loss": 0.0258, "step": 65340 }, { "epoch": 0.17, "learning_rate": 0.00027459050601247857, "loss": 0.0224, "step": 65350 }, { "epoch": 0.17, "learning_rate": 0.0002745866177961071, "loss": 0.0294, "step": 65360 }, { "epoch": 0.17, "learning_rate": 0.0002745827295797356, "loss": 0.0231, "step": 65370 }, { "epoch": 0.17, "learning_rate": 0.00027457884136336416, "loss": 0.0283, "step": 65380 }, { "epoch": 0.17, "learning_rate": 0.0002745749531469927, "loss": 0.0257, "step": 65390 }, { "epoch": 0.17, "learning_rate": 0.00027457106493062125, "loss": 0.0227, "step": 65400 }, { "epoch": 0.17, "learning_rate": 0.00027456717671424976, "loss": 0.0276, "step": 65410 }, { "epoch": 0.17, "learning_rate": 0.00027456328849787833, "loss": 0.0265, "step": 65420 }, { "epoch": 0.17, "learning_rate": 0.00027455940028150685, "loss": 0.0295, "step": 65430 }, { "epoch": 0.17, "learning_rate": 0.00027455551206513536, "loss": 0.0237, "step": 65440 }, { "epoch": 0.17, "learning_rate": 0.00027455162384876393, "loss": 0.0249, "step": 65450 }, { "epoch": 0.17, "learning_rate": 0.00027454773563239244, "loss": 0.0223, "step": 65460 }, { "epoch": 0.17, "learning_rate": 0.000274543847416021, "loss": 0.0236, "step": 65470 }, { "epoch": 0.17, "learning_rate": 0.0002745399591996495, "loss": 0.0227, "step": 65480 }, { "epoch": 0.17, "learning_rate": 0.00027453607098327804, "loss": 0.0263, "step": 65490 }, { "epoch": 0.17, "learning_rate": 0.0002745321827669066, "loss": 0.0275, "step": 65500 }, { "epoch": 0.17, "learning_rate": 0.0002745282945505351, "loss": 0.0243, "step": 65510 }, { "epoch": 0.17, "learning_rate": 0.00027452440633416364, "loss": 0.0242, "step": 65520 }, { "epoch": 0.17, "learning_rate": 0.0002745205181177922, "loss": 0.0266, "step": 65530 }, { "epoch": 0.17, "learning_rate": 0.0002745166299014207, "loss": 0.0181, "step": 65540 }, { "epoch": 0.17, "learning_rate": 0.0002745127416850493, "loss": 0.023, "step": 65550 }, { "epoch": 0.17, "learning_rate": 0.0002745088534686778, "loss": 0.0269, "step": 65560 }, { "epoch": 0.17, "learning_rate": 0.0002745049652523063, "loss": 0.0315, "step": 65570 }, { "epoch": 0.17, "learning_rate": 0.00027450107703593483, "loss": 0.0225, "step": 65580 }, { "epoch": 0.17, "learning_rate": 0.0002744971888195634, "loss": 0.0246, "step": 65590 }, { "epoch": 0.17, "learning_rate": 0.00027449330060319197, "loss": 0.0248, "step": 65600 }, { "epoch": 0.17, "learning_rate": 0.0002744894123868205, "loss": 0.0247, "step": 65610 }, { "epoch": 0.17, "learning_rate": 0.000274485524170449, "loss": 0.0263, "step": 65620 }, { "epoch": 0.17, "learning_rate": 0.00027448163595407757, "loss": 0.0229, "step": 65630 }, { "epoch": 0.17, "learning_rate": 0.0002744777477377061, "loss": 0.0253, "step": 65640 }, { "epoch": 0.17, "learning_rate": 0.0002744738595213346, "loss": 0.0288, "step": 65650 }, { "epoch": 0.17, "learning_rate": 0.00027446997130496317, "loss": 0.0243, "step": 65660 }, { "epoch": 0.17, "learning_rate": 0.0002744660830885917, "loss": 0.0315, "step": 65670 }, { "epoch": 0.17, "learning_rate": 0.00027446219487222025, "loss": 0.0247, "step": 65680 }, { "epoch": 0.17, "learning_rate": 0.00027445830665584877, "loss": 0.0216, "step": 65690 }, { "epoch": 0.17, "learning_rate": 0.0002744544184394773, "loss": 0.0254, "step": 65700 }, { "epoch": 0.17, "learning_rate": 0.00027445053022310585, "loss": 0.0276, "step": 65710 }, { "epoch": 0.17, "learning_rate": 0.00027444664200673436, "loss": 0.0233, "step": 65720 }, { "epoch": 0.17, "learning_rate": 0.0002744427537903629, "loss": 0.0396, "step": 65730 }, { "epoch": 0.17, "learning_rate": 0.00027443886557399145, "loss": 0.0263, "step": 65740 }, { "epoch": 0.17, "learning_rate": 0.00027443497735761996, "loss": 0.0271, "step": 65750 }, { "epoch": 0.17, "learning_rate": 0.00027443108914124853, "loss": 0.0301, "step": 65760 }, { "epoch": 0.17, "learning_rate": 0.00027442720092487704, "loss": 0.0237, "step": 65770 }, { "epoch": 0.17, "learning_rate": 0.00027442331270850556, "loss": 0.0264, "step": 65780 }, { "epoch": 0.17, "learning_rate": 0.0002744194244921341, "loss": 0.0264, "step": 65790 }, { "epoch": 0.17, "learning_rate": 0.00027441553627576264, "loss": 0.0298, "step": 65800 }, { "epoch": 0.17, "learning_rate": 0.0002744116480593912, "loss": 0.0225, "step": 65810 }, { "epoch": 0.17, "learning_rate": 0.0002744077598430197, "loss": 0.026, "step": 65820 }, { "epoch": 0.17, "learning_rate": 0.00027440387162664824, "loss": 0.0318, "step": 65830 }, { "epoch": 0.17, "learning_rate": 0.0002743999834102768, "loss": 0.0239, "step": 65840 }, { "epoch": 0.17, "learning_rate": 0.0002743960951939053, "loss": 0.0249, "step": 65850 }, { "epoch": 0.17, "learning_rate": 0.00027439220697753384, "loss": 0.0241, "step": 65860 }, { "epoch": 0.17, "learning_rate": 0.0002743883187611624, "loss": 0.0218, "step": 65870 }, { "epoch": 0.17, "learning_rate": 0.0002743844305447909, "loss": 0.0328, "step": 65880 }, { "epoch": 0.17, "learning_rate": 0.0002743805423284195, "loss": 0.0286, "step": 65890 }, { "epoch": 0.17, "learning_rate": 0.000274376654112048, "loss": 0.0223, "step": 65900 }, { "epoch": 0.17, "learning_rate": 0.0002743727658956765, "loss": 0.0273, "step": 65910 }, { "epoch": 0.17, "learning_rate": 0.0002743688776793051, "loss": 0.0296, "step": 65920 }, { "epoch": 0.17, "learning_rate": 0.0002743649894629336, "loss": 0.0274, "step": 65930 }, { "epoch": 0.17, "learning_rate": 0.0002743611012465621, "loss": 0.0317, "step": 65940 }, { "epoch": 0.17, "learning_rate": 0.0002743572130301907, "loss": 0.0261, "step": 65950 }, { "epoch": 0.17, "learning_rate": 0.00027435332481381925, "loss": 0.025, "step": 65960 }, { "epoch": 0.17, "learning_rate": 0.00027434943659744777, "loss": 0.025, "step": 65970 }, { "epoch": 0.17, "learning_rate": 0.0002743455483810763, "loss": 0.0216, "step": 65980 }, { "epoch": 0.17, "learning_rate": 0.0002743416601647048, "loss": 0.0246, "step": 65990 }, { "epoch": 0.17, "learning_rate": 0.00027433777194833337, "loss": 0.0272, "step": 66000 }, { "epoch": 0.17, "eval_cer": 0.8818118580040337, "eval_loss": 0.018492352217435837, "eval_runtime": 108.0625, "eval_samples_per_second": 18.508, "eval_steps_per_second": 4.627, "step": 66000 }, { "epoch": 0.17, "learning_rate": 0.0002743338837319619, "loss": 0.0291, "step": 66010 }, { "epoch": 0.17, "learning_rate": 0.00027432999551559045, "loss": 0.0265, "step": 66020 }, { "epoch": 0.17, "learning_rate": 0.00027432610729921896, "loss": 0.0258, "step": 66030 }, { "epoch": 0.17, "learning_rate": 0.0002743222190828475, "loss": 0.0287, "step": 66040 }, { "epoch": 0.17, "learning_rate": 0.00027431833086647605, "loss": 0.0267, "step": 66050 }, { "epoch": 0.17, "learning_rate": 0.00027431444265010456, "loss": 0.0273, "step": 66060 }, { "epoch": 0.17, "learning_rate": 0.0002743105544337331, "loss": 0.0247, "step": 66070 }, { "epoch": 0.17, "learning_rate": 0.00027430666621736165, "loss": 0.025, "step": 66080 }, { "epoch": 0.17, "learning_rate": 0.00027430277800099016, "loss": 0.032, "step": 66090 }, { "epoch": 0.17, "learning_rate": 0.00027429888978461873, "loss": 0.0281, "step": 66100 }, { "epoch": 0.17, "learning_rate": 0.00027429500156824724, "loss": 0.0244, "step": 66110 }, { "epoch": 0.17, "learning_rate": 0.00027429111335187576, "loss": 0.0295, "step": 66120 }, { "epoch": 0.17, "learning_rate": 0.0002742872251355043, "loss": 0.0241, "step": 66130 }, { "epoch": 0.17, "learning_rate": 0.00027428333691913284, "loss": 0.0253, "step": 66140 }, { "epoch": 0.17, "learning_rate": 0.0002742794487027614, "loss": 0.0279, "step": 66150 }, { "epoch": 0.17, "learning_rate": 0.0002742755604863899, "loss": 0.025, "step": 66160 }, { "epoch": 0.17, "learning_rate": 0.0002742716722700185, "loss": 0.0307, "step": 66170 }, { "epoch": 0.17, "learning_rate": 0.000274267784053647, "loss": 0.0261, "step": 66180 }, { "epoch": 0.17, "learning_rate": 0.0002742638958372755, "loss": 0.0228, "step": 66190 }, { "epoch": 0.17, "learning_rate": 0.00027426000762090404, "loss": 0.0253, "step": 66200 }, { "epoch": 0.17, "learning_rate": 0.0002742561194045326, "loss": 0.0254, "step": 66210 }, { "epoch": 0.17, "learning_rate": 0.0002742522311881611, "loss": 0.0245, "step": 66220 }, { "epoch": 0.17, "learning_rate": 0.0002742483429717897, "loss": 0.0238, "step": 66230 }, { "epoch": 0.17, "learning_rate": 0.0002742444547554182, "loss": 0.0209, "step": 66240 }, { "epoch": 0.17, "learning_rate": 0.0002742405665390467, "loss": 0.027, "step": 66250 }, { "epoch": 0.17, "learning_rate": 0.0002742366783226753, "loss": 0.0257, "step": 66260 }, { "epoch": 0.17, "learning_rate": 0.0002742327901063038, "loss": 0.0275, "step": 66270 }, { "epoch": 0.17, "learning_rate": 0.0002742289018899323, "loss": 0.0254, "step": 66280 }, { "epoch": 0.17, "learning_rate": 0.0002742250136735609, "loss": 0.0282, "step": 66290 }, { "epoch": 0.17, "learning_rate": 0.00027422112545718945, "loss": 0.0222, "step": 66300 }, { "epoch": 0.17, "learning_rate": 0.00027421723724081797, "loss": 0.026, "step": 66310 }, { "epoch": 0.17, "learning_rate": 0.0002742133490244465, "loss": 0.029, "step": 66320 }, { "epoch": 0.17, "learning_rate": 0.000274209460808075, "loss": 0.0267, "step": 66330 }, { "epoch": 0.17, "learning_rate": 0.00027420557259170357, "loss": 0.0304, "step": 66340 }, { "epoch": 0.17, "learning_rate": 0.0002742016843753321, "loss": 0.0245, "step": 66350 }, { "epoch": 0.17, "learning_rate": 0.00027419779615896065, "loss": 0.0246, "step": 66360 }, { "epoch": 0.17, "learning_rate": 0.00027419390794258916, "loss": 0.0285, "step": 66370 }, { "epoch": 0.17, "learning_rate": 0.00027419001972621773, "loss": 0.0258, "step": 66380 }, { "epoch": 0.17, "learning_rate": 0.00027418613150984625, "loss": 0.0251, "step": 66390 }, { "epoch": 0.17, "learning_rate": 0.00027418224329347476, "loss": 0.0299, "step": 66400 }, { "epoch": 0.17, "learning_rate": 0.0002741783550771033, "loss": 0.0239, "step": 66410 }, { "epoch": 0.17, "learning_rate": 0.00027417446686073184, "loss": 0.0284, "step": 66420 }, { "epoch": 0.17, "learning_rate": 0.00027417057864436036, "loss": 0.0256, "step": 66430 }, { "epoch": 0.17, "learning_rate": 0.00027416669042798893, "loss": 0.0265, "step": 66440 }, { "epoch": 0.17, "learning_rate": 0.00027416280221161744, "loss": 0.031, "step": 66450 }, { "epoch": 0.17, "learning_rate": 0.000274158913995246, "loss": 0.0381, "step": 66460 }, { "epoch": 0.17, "learning_rate": 0.0002741550257788745, "loss": 0.0308, "step": 66470 }, { "epoch": 0.17, "learning_rate": 0.00027415113756250304, "loss": 0.0336, "step": 66480 }, { "epoch": 0.17, "learning_rate": 0.00027414724934613155, "loss": 0.0305, "step": 66490 }, { "epoch": 0.17, "learning_rate": 0.0002741433611297601, "loss": 0.0261, "step": 66500 }, { "epoch": 0.17, "learning_rate": 0.0002741394729133887, "loss": 0.0229, "step": 66510 }, { "epoch": 0.17, "learning_rate": 0.0002741355846970172, "loss": 0.033, "step": 66520 }, { "epoch": 0.17, "learning_rate": 0.0002741316964806457, "loss": 0.0273, "step": 66530 }, { "epoch": 0.17, "learning_rate": 0.00027412780826427424, "loss": 0.0289, "step": 66540 }, { "epoch": 0.17, "learning_rate": 0.0002741239200479028, "loss": 0.0232, "step": 66550 }, { "epoch": 0.17, "learning_rate": 0.0002741200318315313, "loss": 0.0274, "step": 66560 }, { "epoch": 0.17, "learning_rate": 0.0002741161436151599, "loss": 0.0227, "step": 66570 }, { "epoch": 0.17, "learning_rate": 0.0002741122553987884, "loss": 0.0303, "step": 66580 }, { "epoch": 0.17, "learning_rate": 0.00027410836718241697, "loss": 0.0241, "step": 66590 }, { "epoch": 0.17, "learning_rate": 0.0002741044789660455, "loss": 0.0288, "step": 66600 }, { "epoch": 0.17, "learning_rate": 0.000274100590749674, "loss": 0.0293, "step": 66610 }, { "epoch": 0.17, "learning_rate": 0.0002740967025333025, "loss": 0.0273, "step": 66620 }, { "epoch": 0.17, "learning_rate": 0.0002740928143169311, "loss": 0.022, "step": 66630 }, { "epoch": 0.17, "learning_rate": 0.00027408892610055965, "loss": 0.03, "step": 66640 }, { "epoch": 0.17, "learning_rate": 0.00027408503788418817, "loss": 0.0228, "step": 66650 }, { "epoch": 0.17, "learning_rate": 0.0002740811496678167, "loss": 0.0278, "step": 66660 }, { "epoch": 0.17, "learning_rate": 0.00027407726145144525, "loss": 0.0326, "step": 66670 }, { "epoch": 0.17, "learning_rate": 0.00027407337323507376, "loss": 0.0262, "step": 66680 }, { "epoch": 0.17, "learning_rate": 0.0002740694850187023, "loss": 0.0205, "step": 66690 }, { "epoch": 0.17, "learning_rate": 0.00027406559680233085, "loss": 0.0227, "step": 66700 }, { "epoch": 0.17, "learning_rate": 0.00027406170858595936, "loss": 0.0257, "step": 66710 }, { "epoch": 0.17, "learning_rate": 0.00027405782036958793, "loss": 0.0218, "step": 66720 }, { "epoch": 0.17, "learning_rate": 0.00027405393215321645, "loss": 0.0243, "step": 66730 }, { "epoch": 0.17, "learning_rate": 0.00027405004393684496, "loss": 0.024, "step": 66740 }, { "epoch": 0.17, "learning_rate": 0.0002740461557204735, "loss": 0.0274, "step": 66750 }, { "epoch": 0.17, "learning_rate": 0.00027404226750410204, "loss": 0.022, "step": 66760 }, { "epoch": 0.17, "learning_rate": 0.00027403837928773056, "loss": 0.0271, "step": 66770 }, { "epoch": 0.17, "learning_rate": 0.0002740344910713591, "loss": 0.0261, "step": 66780 }, { "epoch": 0.17, "learning_rate": 0.00027403060285498764, "loss": 0.0293, "step": 66790 }, { "epoch": 0.17, "learning_rate": 0.0002740267146386162, "loss": 0.0312, "step": 66800 }, { "epoch": 0.17, "learning_rate": 0.0002740228264222447, "loss": 0.0282, "step": 66810 }, { "epoch": 0.17, "learning_rate": 0.00027401893820587324, "loss": 0.0271, "step": 66820 }, { "epoch": 0.17, "learning_rate": 0.00027401504998950175, "loss": 0.0308, "step": 66830 }, { "epoch": 0.17, "learning_rate": 0.0002740111617731303, "loss": 0.0227, "step": 66840 }, { "epoch": 0.17, "learning_rate": 0.0002740072735567589, "loss": 0.0252, "step": 66850 }, { "epoch": 0.17, "learning_rate": 0.0002740033853403874, "loss": 0.0303, "step": 66860 }, { "epoch": 0.17, "learning_rate": 0.0002739994971240159, "loss": 0.027, "step": 66870 }, { "epoch": 0.17, "learning_rate": 0.0002739956089076445, "loss": 0.0312, "step": 66880 }, { "epoch": 0.17, "learning_rate": 0.000273991720691273, "loss": 0.0241, "step": 66890 }, { "epoch": 0.17, "learning_rate": 0.0002739878324749015, "loss": 0.0225, "step": 66900 }, { "epoch": 0.17, "learning_rate": 0.0002739839442585301, "loss": 0.0244, "step": 66910 }, { "epoch": 0.17, "learning_rate": 0.0002739800560421586, "loss": 0.0294, "step": 66920 }, { "epoch": 0.17, "learning_rate": 0.00027397616782578717, "loss": 0.0251, "step": 66930 }, { "epoch": 0.17, "learning_rate": 0.0002739722796094157, "loss": 0.0347, "step": 66940 }, { "epoch": 0.17, "learning_rate": 0.0002739683913930442, "loss": 0.0246, "step": 66950 }, { "epoch": 0.17, "learning_rate": 0.00027396450317667277, "loss": 0.0295, "step": 66960 }, { "epoch": 0.17, "learning_rate": 0.0002739606149603013, "loss": 0.0274, "step": 66970 }, { "epoch": 0.17, "learning_rate": 0.0002739567267439298, "loss": 0.0297, "step": 66980 }, { "epoch": 0.17, "learning_rate": 0.00027395283852755837, "loss": 0.0259, "step": 66990 }, { "epoch": 0.17, "learning_rate": 0.0002739489503111869, "loss": 0.0232, "step": 67000 }, { "epoch": 0.17, "eval_cer": 0.8818006609085604, "eval_loss": 0.018520452082157135, "eval_runtime": 107.7331, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 67000 }, { "epoch": 0.17, "learning_rate": 0.00027394506209481545, "loss": 0.0253, "step": 67010 }, { "epoch": 0.17, "learning_rate": 0.00027394117387844396, "loss": 0.0284, "step": 67020 }, { "epoch": 0.17, "learning_rate": 0.0002739372856620725, "loss": 0.0239, "step": 67030 }, { "epoch": 0.17, "learning_rate": 0.00027393339744570105, "loss": 0.0325, "step": 67040 }, { "epoch": 0.17, "learning_rate": 0.00027392950922932956, "loss": 0.0328, "step": 67050 }, { "epoch": 0.17, "learning_rate": 0.00027392562101295813, "loss": 0.0247, "step": 67060 }, { "epoch": 0.17, "learning_rate": 0.00027392173279658664, "loss": 0.0337, "step": 67070 }, { "epoch": 0.17, "learning_rate": 0.00027391784458021516, "loss": 0.027, "step": 67080 }, { "epoch": 0.17, "learning_rate": 0.00027391395636384373, "loss": 0.0277, "step": 67090 }, { "epoch": 0.17, "learning_rate": 0.00027391006814747224, "loss": 0.0272, "step": 67100 }, { "epoch": 0.17, "learning_rate": 0.00027390617993110076, "loss": 0.0258, "step": 67110 }, { "epoch": 0.17, "learning_rate": 0.0002739022917147293, "loss": 0.0243, "step": 67120 }, { "epoch": 0.17, "learning_rate": 0.00027389840349835784, "loss": 0.0256, "step": 67130 }, { "epoch": 0.17, "learning_rate": 0.0002738945152819864, "loss": 0.0268, "step": 67140 }, { "epoch": 0.17, "learning_rate": 0.0002738906270656149, "loss": 0.025, "step": 67150 }, { "epoch": 0.17, "learning_rate": 0.00027388673884924344, "loss": 0.0288, "step": 67160 }, { "epoch": 0.17, "learning_rate": 0.000273882850632872, "loss": 0.0276, "step": 67170 }, { "epoch": 0.17, "learning_rate": 0.0002738789624165005, "loss": 0.0277, "step": 67180 }, { "epoch": 0.17, "learning_rate": 0.0002738750742001291, "loss": 0.0253, "step": 67190 }, { "epoch": 0.17, "learning_rate": 0.0002738711859837576, "loss": 0.0278, "step": 67200 }, { "epoch": 0.17, "learning_rate": 0.00027386729776738617, "loss": 0.0261, "step": 67210 }, { "epoch": 0.17, "learning_rate": 0.0002738634095510147, "loss": 0.0272, "step": 67220 }, { "epoch": 0.17, "learning_rate": 0.0002738595213346432, "loss": 0.0268, "step": 67230 }, { "epoch": 0.17, "learning_rate": 0.0002738556331182717, "loss": 0.03, "step": 67240 }, { "epoch": 0.17, "learning_rate": 0.0002738517449019003, "loss": 0.0273, "step": 67250 }, { "epoch": 0.17, "learning_rate": 0.0002738478566855288, "loss": 0.0264, "step": 67260 }, { "epoch": 0.17, "learning_rate": 0.00027384396846915737, "loss": 0.0257, "step": 67270 }, { "epoch": 0.17, "learning_rate": 0.0002738400802527859, "loss": 0.0239, "step": 67280 }, { "epoch": 0.17, "learning_rate": 0.0002738361920364144, "loss": 0.0264, "step": 67290 }, { "epoch": 0.17, "learning_rate": 0.00027383230382004297, "loss": 0.0259, "step": 67300 }, { "epoch": 0.17, "learning_rate": 0.0002738284156036715, "loss": 0.0277, "step": 67310 }, { "epoch": 0.17, "learning_rate": 0.0002738245273873, "loss": 0.0231, "step": 67320 }, { "epoch": 0.17, "learning_rate": 0.00027382063917092856, "loss": 0.0211, "step": 67330 }, { "epoch": 0.17, "learning_rate": 0.00027381675095455713, "loss": 0.0212, "step": 67340 }, { "epoch": 0.17, "learning_rate": 0.00027381286273818565, "loss": 0.0278, "step": 67350 }, { "epoch": 0.17, "learning_rate": 0.00027380897452181416, "loss": 0.021, "step": 67360 }, { "epoch": 0.17, "learning_rate": 0.0002738050863054427, "loss": 0.0265, "step": 67370 }, { "epoch": 0.17, "learning_rate": 0.00027380119808907125, "loss": 0.0272, "step": 67380 }, { "epoch": 0.17, "learning_rate": 0.00027379730987269976, "loss": 0.0248, "step": 67390 }, { "epoch": 0.17, "learning_rate": 0.00027379342165632833, "loss": 0.0305, "step": 67400 }, { "epoch": 0.17, "learning_rate": 0.00027378953343995684, "loss": 0.028, "step": 67410 }, { "epoch": 0.17, "learning_rate": 0.0002737856452235854, "loss": 0.0269, "step": 67420 }, { "epoch": 0.17, "learning_rate": 0.0002737817570072139, "loss": 0.0284, "step": 67430 }, { "epoch": 0.17, "learning_rate": 0.00027377786879084244, "loss": 0.0239, "step": 67440 }, { "epoch": 0.17, "learning_rate": 0.00027377398057447096, "loss": 0.0236, "step": 67450 }, { "epoch": 0.17, "learning_rate": 0.0002737700923580995, "loss": 0.022, "step": 67460 }, { "epoch": 0.17, "learning_rate": 0.00027376620414172804, "loss": 0.0296, "step": 67470 }, { "epoch": 0.17, "learning_rate": 0.0002737623159253566, "loss": 0.0234, "step": 67480 }, { "epoch": 0.17, "learning_rate": 0.0002737584277089851, "loss": 0.029, "step": 67490 }, { "epoch": 0.17, "learning_rate": 0.00027375453949261364, "loss": 0.0277, "step": 67500 }, { "epoch": 0.17, "learning_rate": 0.0002737506512762422, "loss": 0.0246, "step": 67510 }, { "epoch": 0.18, "learning_rate": 0.0002737467630598707, "loss": 0.0275, "step": 67520 }, { "epoch": 0.18, "learning_rate": 0.00027374287484349923, "loss": 0.0246, "step": 67530 }, { "epoch": 0.18, "learning_rate": 0.0002737389866271278, "loss": 0.03, "step": 67540 }, { "epoch": 0.18, "learning_rate": 0.00027373509841075637, "loss": 0.0228, "step": 67550 }, { "epoch": 0.18, "learning_rate": 0.0002737312101943849, "loss": 0.0251, "step": 67560 }, { "epoch": 0.18, "learning_rate": 0.0002737273219780134, "loss": 0.0265, "step": 67570 }, { "epoch": 0.18, "learning_rate": 0.0002737234337616419, "loss": 0.026, "step": 67580 }, { "epoch": 0.18, "learning_rate": 0.0002737195455452705, "loss": 0.0213, "step": 67590 }, { "epoch": 0.18, "learning_rate": 0.000273715657328899, "loss": 0.0212, "step": 67600 }, { "epoch": 0.18, "learning_rate": 0.00027371176911252757, "loss": 0.0247, "step": 67610 }, { "epoch": 0.18, "learning_rate": 0.0002737078808961561, "loss": 0.0256, "step": 67620 }, { "epoch": 0.18, "learning_rate": 0.00027370399267978465, "loss": 0.0247, "step": 67630 }, { "epoch": 0.18, "learning_rate": 0.00027370010446341317, "loss": 0.0259, "step": 67640 }, { "epoch": 0.18, "learning_rate": 0.0002736962162470417, "loss": 0.0303, "step": 67650 }, { "epoch": 0.18, "learning_rate": 0.0002736923280306702, "loss": 0.0227, "step": 67660 }, { "epoch": 0.18, "learning_rate": 0.00027368843981429876, "loss": 0.0273, "step": 67670 }, { "epoch": 0.18, "learning_rate": 0.0002736845515979273, "loss": 0.0304, "step": 67680 }, { "epoch": 0.18, "learning_rate": 0.00027368066338155585, "loss": 0.0272, "step": 67690 }, { "epoch": 0.18, "learning_rate": 0.00027367677516518436, "loss": 0.0238, "step": 67700 }, { "epoch": 0.18, "learning_rate": 0.00027367288694881293, "loss": 0.0231, "step": 67710 }, { "epoch": 0.18, "learning_rate": 0.00027366899873244144, "loss": 0.0278, "step": 67720 }, { "epoch": 0.18, "learning_rate": 0.00027366511051606996, "loss": 0.029, "step": 67730 }, { "epoch": 0.18, "learning_rate": 0.00027366122229969853, "loss": 0.0254, "step": 67740 }, { "epoch": 0.18, "learning_rate": 0.00027365733408332704, "loss": 0.0247, "step": 67750 }, { "epoch": 0.18, "learning_rate": 0.0002736534458669556, "loss": 0.0227, "step": 67760 }, { "epoch": 0.18, "learning_rate": 0.0002736495576505841, "loss": 0.0299, "step": 67770 }, { "epoch": 0.18, "learning_rate": 0.00027364566943421264, "loss": 0.0267, "step": 67780 }, { "epoch": 0.18, "learning_rate": 0.00027364178121784115, "loss": 0.0257, "step": 67790 }, { "epoch": 0.18, "learning_rate": 0.0002736378930014697, "loss": 0.025, "step": 67800 }, { "epoch": 0.18, "learning_rate": 0.00027363400478509824, "loss": 0.0256, "step": 67810 }, { "epoch": 0.18, "learning_rate": 0.0002736301165687268, "loss": 0.0219, "step": 67820 }, { "epoch": 0.18, "learning_rate": 0.0002736262283523553, "loss": 0.0261, "step": 67830 }, { "epoch": 0.18, "learning_rate": 0.0002736223401359839, "loss": 0.0294, "step": 67840 }, { "epoch": 0.18, "learning_rate": 0.0002736184519196124, "loss": 0.0253, "step": 67850 }, { "epoch": 0.18, "learning_rate": 0.0002736145637032409, "loss": 0.03, "step": 67860 }, { "epoch": 0.18, "learning_rate": 0.00027361067548686943, "loss": 0.0211, "step": 67870 }, { "epoch": 0.18, "learning_rate": 0.000273606787270498, "loss": 0.0237, "step": 67880 }, { "epoch": 0.18, "learning_rate": 0.00027360289905412657, "loss": 0.0248, "step": 67890 }, { "epoch": 0.18, "learning_rate": 0.0002735990108377551, "loss": 0.0281, "step": 67900 }, { "epoch": 0.18, "learning_rate": 0.0002735951226213836, "loss": 0.0272, "step": 67910 }, { "epoch": 0.18, "learning_rate": 0.00027359123440501217, "loss": 0.0248, "step": 67920 }, { "epoch": 0.18, "learning_rate": 0.0002735873461886407, "loss": 0.0271, "step": 67930 }, { "epoch": 0.18, "learning_rate": 0.0002735834579722692, "loss": 0.0277, "step": 67940 }, { "epoch": 0.18, "learning_rate": 0.00027357956975589777, "loss": 0.022, "step": 67950 }, { "epoch": 0.18, "learning_rate": 0.0002735756815395263, "loss": 0.0331, "step": 67960 }, { "epoch": 0.18, "learning_rate": 0.00027357179332315485, "loss": 0.0221, "step": 67970 }, { "epoch": 0.18, "learning_rate": 0.00027356790510678336, "loss": 0.0254, "step": 67980 }, { "epoch": 0.18, "learning_rate": 0.0002735640168904119, "loss": 0.029, "step": 67990 }, { "epoch": 0.18, "learning_rate": 0.0002735601286740404, "loss": 0.024, "step": 68000 }, { "epoch": 0.18, "eval_cer": 0.8818412503796516, "eval_loss": 0.018042191863059998, "eval_runtime": 107.7307, "eval_samples_per_second": 18.565, "eval_steps_per_second": 4.641, "step": 68000 }, { "epoch": 0.18, "learning_rate": 0.00027355624045766896, "loss": 0.0292, "step": 68010 }, { "epoch": 0.18, "learning_rate": 0.0002735523522412975, "loss": 0.0249, "step": 68020 }, { "epoch": 0.18, "learning_rate": 0.00027354846402492605, "loss": 0.0307, "step": 68030 }, { "epoch": 0.18, "learning_rate": 0.00027354457580855456, "loss": 0.0248, "step": 68040 }, { "epoch": 0.18, "learning_rate": 0.00027354068759218313, "loss": 0.0259, "step": 68050 }, { "epoch": 0.18, "learning_rate": 0.00027353679937581164, "loss": 0.0192, "step": 68060 }, { "epoch": 0.18, "learning_rate": 0.00027353291115944016, "loss": 0.0284, "step": 68070 }, { "epoch": 0.18, "learning_rate": 0.00027352902294306867, "loss": 0.0231, "step": 68080 }, { "epoch": 0.18, "learning_rate": 0.00027352513472669724, "loss": 0.0287, "step": 68090 }, { "epoch": 0.18, "learning_rate": 0.0002735212465103258, "loss": 0.0274, "step": 68100 }, { "epoch": 0.18, "learning_rate": 0.0002735173582939543, "loss": 0.0262, "step": 68110 }, { "epoch": 0.18, "learning_rate": 0.00027351347007758284, "loss": 0.0282, "step": 68120 }, { "epoch": 0.18, "learning_rate": 0.0002735095818612114, "loss": 0.0245, "step": 68130 }, { "epoch": 0.18, "learning_rate": 0.0002735056936448399, "loss": 0.0254, "step": 68140 }, { "epoch": 0.18, "learning_rate": 0.00027350180542846844, "loss": 0.0272, "step": 68150 }, { "epoch": 0.18, "learning_rate": 0.000273497917212097, "loss": 0.0253, "step": 68160 }, { "epoch": 0.18, "learning_rate": 0.0002734940289957255, "loss": 0.0253, "step": 68170 }, { "epoch": 0.18, "learning_rate": 0.0002734901407793541, "loss": 0.0338, "step": 68180 }, { "epoch": 0.18, "learning_rate": 0.0002734862525629826, "loss": 0.0253, "step": 68190 }, { "epoch": 0.18, "learning_rate": 0.0002734823643466111, "loss": 0.0255, "step": 68200 }, { "epoch": 0.18, "learning_rate": 0.0002734784761302397, "loss": 0.0275, "step": 68210 }, { "epoch": 0.18, "learning_rate": 0.0002734745879138682, "loss": 0.0244, "step": 68220 }, { "epoch": 0.18, "learning_rate": 0.00027347069969749677, "loss": 0.0256, "step": 68230 }, { "epoch": 0.18, "learning_rate": 0.0002734668114811253, "loss": 0.0275, "step": 68240 }, { "epoch": 0.18, "learning_rate": 0.0002734629232647538, "loss": 0.0271, "step": 68250 }, { "epoch": 0.18, "learning_rate": 0.00027345903504838237, "loss": 0.0233, "step": 68260 }, { "epoch": 0.18, "learning_rate": 0.0002734551468320109, "loss": 0.0226, "step": 68270 }, { "epoch": 0.18, "learning_rate": 0.0002734512586156394, "loss": 0.0227, "step": 68280 }, { "epoch": 0.18, "learning_rate": 0.00027344737039926796, "loss": 0.025, "step": 68290 }, { "epoch": 0.18, "learning_rate": 0.0002734434821828965, "loss": 0.0235, "step": 68300 }, { "epoch": 0.18, "learning_rate": 0.00027343959396652505, "loss": 0.0275, "step": 68310 }, { "epoch": 0.18, "learning_rate": 0.00027343570575015356, "loss": 0.0264, "step": 68320 }, { "epoch": 0.18, "learning_rate": 0.0002734318175337821, "loss": 0.0203, "step": 68330 }, { "epoch": 0.18, "learning_rate": 0.00027342792931741065, "loss": 0.0284, "step": 68340 }, { "epoch": 0.18, "learning_rate": 0.00027342404110103916, "loss": 0.0246, "step": 68350 }, { "epoch": 0.18, "learning_rate": 0.0002734201528846677, "loss": 0.0221, "step": 68360 }, { "epoch": 0.18, "learning_rate": 0.00027341626466829624, "loss": 0.0284, "step": 68370 }, { "epoch": 0.18, "learning_rate": 0.0002734123764519248, "loss": 0.0295, "step": 68380 }, { "epoch": 0.18, "learning_rate": 0.00027340848823555333, "loss": 0.0304, "step": 68390 }, { "epoch": 0.18, "learning_rate": 0.00027340460001918184, "loss": 0.0323, "step": 68400 }, { "epoch": 0.18, "learning_rate": 0.00027340071180281036, "loss": 0.0307, "step": 68410 }, { "epoch": 0.18, "learning_rate": 0.0002733968235864389, "loss": 0.0283, "step": 68420 }, { "epoch": 0.18, "learning_rate": 0.00027339293537006744, "loss": 0.024, "step": 68430 }, { "epoch": 0.18, "learning_rate": 0.000273389047153696, "loss": 0.0223, "step": 68440 }, { "epoch": 0.18, "learning_rate": 0.0002733851589373245, "loss": 0.0249, "step": 68450 }, { "epoch": 0.18, "learning_rate": 0.0002733812707209531, "loss": 0.0258, "step": 68460 }, { "epoch": 0.18, "learning_rate": 0.0002733773825045816, "loss": 0.0233, "step": 68470 }, { "epoch": 0.18, "learning_rate": 0.0002733734942882101, "loss": 0.0307, "step": 68480 }, { "epoch": 0.18, "learning_rate": 0.00027336960607183864, "loss": 0.03, "step": 68490 }, { "epoch": 0.18, "learning_rate": 0.0002733657178554672, "loss": 0.0241, "step": 68500 }, { "epoch": 0.18, "learning_rate": 0.0002733618296390957, "loss": 0.022, "step": 68510 }, { "epoch": 0.18, "learning_rate": 0.0002733579414227243, "loss": 0.0266, "step": 68520 }, { "epoch": 0.18, "learning_rate": 0.0002733540532063528, "loss": 0.0242, "step": 68530 }, { "epoch": 0.18, "learning_rate": 0.0002733501649899813, "loss": 0.0295, "step": 68540 }, { "epoch": 0.18, "learning_rate": 0.0002733462767736099, "loss": 0.0272, "step": 68550 }, { "epoch": 0.18, "learning_rate": 0.0002733423885572384, "loss": 0.0257, "step": 68560 }, { "epoch": 0.18, "learning_rate": 0.0002733385003408669, "loss": 0.0253, "step": 68570 }, { "epoch": 0.18, "learning_rate": 0.0002733346121244955, "loss": 0.0235, "step": 68580 }, { "epoch": 0.18, "learning_rate": 0.00027333072390812405, "loss": 0.0259, "step": 68590 }, { "epoch": 0.18, "learning_rate": 0.00027332683569175257, "loss": 0.0221, "step": 68600 }, { "epoch": 0.18, "learning_rate": 0.0002733229474753811, "loss": 0.0235, "step": 68610 }, { "epoch": 0.18, "learning_rate": 0.0002733190592590096, "loss": 0.0274, "step": 68620 }, { "epoch": 0.18, "learning_rate": 0.00027331517104263816, "loss": 0.0256, "step": 68630 }, { "epoch": 0.18, "learning_rate": 0.0002733112828262667, "loss": 0.0251, "step": 68640 }, { "epoch": 0.18, "learning_rate": 0.00027330739460989525, "loss": 0.0255, "step": 68650 }, { "epoch": 0.18, "learning_rate": 0.00027330350639352376, "loss": 0.027, "step": 68660 }, { "epoch": 0.18, "learning_rate": 0.00027329961817715233, "loss": 0.025, "step": 68670 }, { "epoch": 0.18, "learning_rate": 0.00027329572996078084, "loss": 0.0265, "step": 68680 }, { "epoch": 0.18, "learning_rate": 0.00027329184174440936, "loss": 0.0246, "step": 68690 }, { "epoch": 0.18, "learning_rate": 0.0002732879535280379, "loss": 0.024, "step": 68700 }, { "epoch": 0.18, "learning_rate": 0.00027328406531166644, "loss": 0.0287, "step": 68710 }, { "epoch": 0.18, "learning_rate": 0.00027328017709529496, "loss": 0.0282, "step": 68720 }, { "epoch": 0.18, "learning_rate": 0.0002732762888789235, "loss": 0.0261, "step": 68730 }, { "epoch": 0.18, "learning_rate": 0.00027327240066255204, "loss": 0.0263, "step": 68740 }, { "epoch": 0.18, "learning_rate": 0.00027326851244618056, "loss": 0.024, "step": 68750 }, { "epoch": 0.18, "learning_rate": 0.0002732646242298091, "loss": 0.0249, "step": 68760 }, { "epoch": 0.18, "learning_rate": 0.00027326073601343764, "loss": 0.0278, "step": 68770 }, { "epoch": 0.18, "learning_rate": 0.0002732568477970662, "loss": 0.0229, "step": 68780 }, { "epoch": 0.18, "learning_rate": 0.0002732529595806947, "loss": 0.0269, "step": 68790 }, { "epoch": 0.18, "learning_rate": 0.0002732490713643233, "loss": 0.0317, "step": 68800 }, { "epoch": 0.18, "learning_rate": 0.0002732451831479518, "loss": 0.0278, "step": 68810 }, { "epoch": 0.18, "learning_rate": 0.0002732412949315803, "loss": 0.028, "step": 68820 }, { "epoch": 0.18, "learning_rate": 0.00027323740671520883, "loss": 0.0262, "step": 68830 }, { "epoch": 0.18, "learning_rate": 0.0002732335184988374, "loss": 0.0289, "step": 68840 }, { "epoch": 0.18, "learning_rate": 0.0002732296302824659, "loss": 0.0257, "step": 68850 }, { "epoch": 0.18, "learning_rate": 0.0002732257420660945, "loss": 0.0245, "step": 68860 }, { "epoch": 0.18, "learning_rate": 0.000273221853849723, "loss": 0.0272, "step": 68870 }, { "epoch": 0.18, "learning_rate": 0.00027321796563335157, "loss": 0.0257, "step": 68880 }, { "epoch": 0.18, "learning_rate": 0.0002732140774169801, "loss": 0.028, "step": 68890 }, { "epoch": 0.18, "learning_rate": 0.0002732101892006086, "loss": 0.0228, "step": 68900 }, { "epoch": 0.18, "learning_rate": 0.0002732063009842371, "loss": 0.0276, "step": 68910 }, { "epoch": 0.18, "learning_rate": 0.0002732024127678657, "loss": 0.0257, "step": 68920 }, { "epoch": 0.18, "learning_rate": 0.00027319852455149425, "loss": 0.0274, "step": 68930 }, { "epoch": 0.18, "learning_rate": 0.00027319463633512276, "loss": 0.0231, "step": 68940 }, { "epoch": 0.18, "learning_rate": 0.0002731907481187513, "loss": 0.0222, "step": 68950 }, { "epoch": 0.18, "learning_rate": 0.00027318685990237985, "loss": 0.0253, "step": 68960 }, { "epoch": 0.18, "learning_rate": 0.00027318297168600836, "loss": 0.0268, "step": 68970 }, { "epoch": 0.18, "learning_rate": 0.0002731790834696369, "loss": 0.0241, "step": 68980 }, { "epoch": 0.18, "learning_rate": 0.00027317519525326545, "loss": 0.0266, "step": 68990 }, { "epoch": 0.18, "learning_rate": 0.00027317130703689396, "loss": 0.0215, "step": 69000 }, { "epoch": 0.18, "eval_cer": 0.8818076590932312, "eval_loss": 0.018843624740839005, "eval_runtime": 108.0702, "eval_samples_per_second": 18.506, "eval_steps_per_second": 4.627, "step": 69000 }, { "epoch": 0.18, "learning_rate": 0.00027316741882052253, "loss": 0.0239, "step": 69010 }, { "epoch": 0.18, "learning_rate": 0.00027316353060415104, "loss": 0.0228, "step": 69020 }, { "epoch": 0.18, "learning_rate": 0.00027315964238777956, "loss": 0.0217, "step": 69030 }, { "epoch": 0.18, "learning_rate": 0.00027315575417140807, "loss": 0.0292, "step": 69040 }, { "epoch": 0.18, "learning_rate": 0.00027315186595503664, "loss": 0.0241, "step": 69050 }, { "epoch": 0.18, "learning_rate": 0.00027314797773866516, "loss": 0.0256, "step": 69060 }, { "epoch": 0.18, "learning_rate": 0.0002731440895222937, "loss": 0.0302, "step": 69070 }, { "epoch": 0.18, "learning_rate": 0.00027314020130592224, "loss": 0.0222, "step": 69080 }, { "epoch": 0.18, "learning_rate": 0.0002731363130895508, "loss": 0.0275, "step": 69090 }, { "epoch": 0.18, "learning_rate": 0.0002731324248731793, "loss": 0.0257, "step": 69100 }, { "epoch": 0.18, "learning_rate": 0.00027312853665680784, "loss": 0.0312, "step": 69110 }, { "epoch": 0.18, "learning_rate": 0.00027312464844043635, "loss": 0.033, "step": 69120 }, { "epoch": 0.18, "learning_rate": 0.0002731207602240649, "loss": 0.0272, "step": 69130 }, { "epoch": 0.18, "learning_rate": 0.0002731168720076935, "loss": 0.0382, "step": 69140 }, { "epoch": 0.18, "learning_rate": 0.000273112983791322, "loss": 0.0329, "step": 69150 }, { "epoch": 0.18, "learning_rate": 0.0002731090955749505, "loss": 0.0305, "step": 69160 }, { "epoch": 0.18, "learning_rate": 0.0002731052073585791, "loss": 0.0268, "step": 69170 }, { "epoch": 0.18, "learning_rate": 0.0002731013191422076, "loss": 0.0268, "step": 69180 }, { "epoch": 0.18, "learning_rate": 0.0002730974309258361, "loss": 0.0238, "step": 69190 }, { "epoch": 0.18, "learning_rate": 0.0002730935427094647, "loss": 0.0283, "step": 69200 }, { "epoch": 0.18, "learning_rate": 0.0002730896544930932, "loss": 0.0247, "step": 69210 }, { "epoch": 0.18, "learning_rate": 0.00027308576627672177, "loss": 0.0231, "step": 69220 }, { "epoch": 0.18, "learning_rate": 0.0002730818780603503, "loss": 0.0276, "step": 69230 }, { "epoch": 0.18, "learning_rate": 0.0002730779898439788, "loss": 0.0193, "step": 69240 }, { "epoch": 0.18, "learning_rate": 0.0002730741016276073, "loss": 0.0286, "step": 69250 }, { "epoch": 0.18, "learning_rate": 0.0002730702134112359, "loss": 0.0225, "step": 69260 }, { "epoch": 0.18, "learning_rate": 0.0002730663251948644, "loss": 0.024, "step": 69270 }, { "epoch": 0.18, "learning_rate": 0.00027306243697849296, "loss": 0.0238, "step": 69280 }, { "epoch": 0.18, "learning_rate": 0.0002730585487621215, "loss": 0.0257, "step": 69290 }, { "epoch": 0.18, "learning_rate": 0.00027305466054575005, "loss": 0.0229, "step": 69300 }, { "epoch": 0.18, "learning_rate": 0.00027305077232937856, "loss": 0.0236, "step": 69310 }, { "epoch": 0.18, "learning_rate": 0.0002730468841130071, "loss": 0.0285, "step": 69320 }, { "epoch": 0.18, "learning_rate": 0.00027304299589663564, "loss": 0.0273, "step": 69330 }, { "epoch": 0.18, "learning_rate": 0.00027303910768026416, "loss": 0.02, "step": 69340 }, { "epoch": 0.18, "learning_rate": 0.00027303521946389273, "loss": 0.0206, "step": 69350 }, { "epoch": 0.18, "learning_rate": 0.00027303133124752124, "loss": 0.028, "step": 69360 }, { "epoch": 0.18, "learning_rate": 0.00027302744303114976, "loss": 0.0276, "step": 69370 }, { "epoch": 0.18, "learning_rate": 0.0002730235548147783, "loss": 0.0259, "step": 69380 }, { "epoch": 0.18, "learning_rate": 0.00027301966659840684, "loss": 0.0245, "step": 69390 }, { "epoch": 0.18, "learning_rate": 0.00027301577838203535, "loss": 0.0289, "step": 69400 }, { "epoch": 0.18, "learning_rate": 0.0002730118901656639, "loss": 0.0215, "step": 69410 }, { "epoch": 0.18, "learning_rate": 0.00027300800194929244, "loss": 0.0276, "step": 69420 }, { "epoch": 0.18, "learning_rate": 0.000273004113732921, "loss": 0.023, "step": 69430 }, { "epoch": 0.18, "learning_rate": 0.0002730002255165495, "loss": 0.0266, "step": 69440 }, { "epoch": 0.18, "learning_rate": 0.00027299633730017804, "loss": 0.0277, "step": 69450 }, { "epoch": 0.18, "learning_rate": 0.0002729924490838066, "loss": 0.0264, "step": 69460 }, { "epoch": 0.18, "learning_rate": 0.0002729885608674351, "loss": 0.0231, "step": 69470 }, { "epoch": 0.18, "learning_rate": 0.0002729846726510637, "loss": 0.0239, "step": 69480 }, { "epoch": 0.18, "learning_rate": 0.0002729807844346922, "loss": 0.0263, "step": 69490 }, { "epoch": 0.18, "learning_rate": 0.0002729768962183207, "loss": 0.0314, "step": 69500 }, { "epoch": 0.18, "learning_rate": 0.0002729730080019493, "loss": 0.025, "step": 69510 }, { "epoch": 0.18, "learning_rate": 0.0002729691197855778, "loss": 0.0225, "step": 69520 }, { "epoch": 0.18, "learning_rate": 0.0002729652315692063, "loss": 0.0219, "step": 69530 }, { "epoch": 0.18, "learning_rate": 0.0002729613433528349, "loss": 0.0223, "step": 69540 }, { "epoch": 0.18, "learning_rate": 0.0002729574551364634, "loss": 0.0226, "step": 69550 }, { "epoch": 0.18, "learning_rate": 0.00027295356692009197, "loss": 0.0248, "step": 69560 }, { "epoch": 0.18, "learning_rate": 0.0002729496787037205, "loss": 0.0244, "step": 69570 }, { "epoch": 0.18, "learning_rate": 0.000272945790487349, "loss": 0.0253, "step": 69580 }, { "epoch": 0.18, "learning_rate": 0.00027294190227097756, "loss": 0.0246, "step": 69590 }, { "epoch": 0.18, "learning_rate": 0.0002729380140546061, "loss": 0.028, "step": 69600 }, { "epoch": 0.18, "learning_rate": 0.0002729341258382346, "loss": 0.0262, "step": 69610 }, { "epoch": 0.18, "learning_rate": 0.00027293023762186316, "loss": 0.0274, "step": 69620 }, { "epoch": 0.18, "learning_rate": 0.00027292634940549173, "loss": 0.0261, "step": 69630 }, { "epoch": 0.18, "learning_rate": 0.00027292246118912025, "loss": 0.0303, "step": 69640 }, { "epoch": 0.18, "learning_rate": 0.00027291857297274876, "loss": 0.0253, "step": 69650 }, { "epoch": 0.18, "learning_rate": 0.0002729146847563773, "loss": 0.028, "step": 69660 }, { "epoch": 0.18, "learning_rate": 0.00027291079654000584, "loss": 0.025, "step": 69670 }, { "epoch": 0.18, "learning_rate": 0.00027290690832363436, "loss": 0.0302, "step": 69680 }, { "epoch": 0.18, "learning_rate": 0.0002729030201072629, "loss": 0.0208, "step": 69690 }, { "epoch": 0.18, "learning_rate": 0.00027289913189089144, "loss": 0.0267, "step": 69700 }, { "epoch": 0.18, "learning_rate": 0.00027289524367452, "loss": 0.0238, "step": 69710 }, { "epoch": 0.18, "learning_rate": 0.0002728913554581485, "loss": 0.0236, "step": 69720 }, { "epoch": 0.18, "learning_rate": 0.00027288746724177704, "loss": 0.0322, "step": 69730 }, { "epoch": 0.18, "learning_rate": 0.00027288357902540555, "loss": 0.0254, "step": 69740 }, { "epoch": 0.18, "learning_rate": 0.0002728796908090341, "loss": 0.0264, "step": 69750 }, { "epoch": 0.18, "learning_rate": 0.00027287580259266264, "loss": 0.02, "step": 69760 }, { "epoch": 0.18, "learning_rate": 0.0002728719143762912, "loss": 0.0294, "step": 69770 }, { "epoch": 0.18, "learning_rate": 0.0002728680261599197, "loss": 0.0253, "step": 69780 }, { "epoch": 0.18, "learning_rate": 0.00027286413794354823, "loss": 0.0257, "step": 69790 }, { "epoch": 0.18, "learning_rate": 0.0002728602497271768, "loss": 0.0253, "step": 69800 }, { "epoch": 0.18, "learning_rate": 0.0002728563615108053, "loss": 0.0279, "step": 69810 }, { "epoch": 0.18, "learning_rate": 0.0002728524732944339, "loss": 0.0262, "step": 69820 }, { "epoch": 0.18, "learning_rate": 0.0002728485850780624, "loss": 0.0284, "step": 69830 }, { "epoch": 0.18, "learning_rate": 0.00027284469686169097, "loss": 0.0247, "step": 69840 }, { "epoch": 0.18, "learning_rate": 0.0002728408086453195, "loss": 0.0251, "step": 69850 }, { "epoch": 0.18, "learning_rate": 0.000272836920428948, "loss": 0.026, "step": 69860 }, { "epoch": 0.18, "learning_rate": 0.0002728330322125765, "loss": 0.0267, "step": 69870 }, { "epoch": 0.18, "learning_rate": 0.0002728291439962051, "loss": 0.0333, "step": 69880 }, { "epoch": 0.18, "learning_rate": 0.0002728252557798336, "loss": 0.023, "step": 69890 }, { "epoch": 0.18, "learning_rate": 0.00027282136756346217, "loss": 0.0273, "step": 69900 }, { "epoch": 0.18, "learning_rate": 0.0002728174793470907, "loss": 0.0298, "step": 69910 }, { "epoch": 0.18, "learning_rate": 0.00027281359113071925, "loss": 0.0236, "step": 69920 }, { "epoch": 0.18, "learning_rate": 0.00027280970291434776, "loss": 0.0246, "step": 69930 }, { "epoch": 0.18, "learning_rate": 0.0002728058146979763, "loss": 0.0234, "step": 69940 }, { "epoch": 0.18, "learning_rate": 0.0002728019264816048, "loss": 0.0255, "step": 69950 }, { "epoch": 0.18, "learning_rate": 0.00027279803826523336, "loss": 0.0211, "step": 69960 }, { "epoch": 0.18, "learning_rate": 0.00027279415004886193, "loss": 0.0312, "step": 69970 }, { "epoch": 0.18, "learning_rate": 0.00027279026183249044, "loss": 0.0303, "step": 69980 }, { "epoch": 0.18, "learning_rate": 0.00027278637361611896, "loss": 0.0208, "step": 69990 }, { "epoch": 0.18, "learning_rate": 0.0002727824853997475, "loss": 0.0227, "step": 70000 }, { "epoch": 0.18, "eval_cer": 0.8817880641761527, "eval_loss": 0.018043356016278267, "eval_runtime": 107.6403, "eval_samples_per_second": 18.58, "eval_steps_per_second": 4.645, "step": 70000 }, { "epoch": 0.18, "learning_rate": 0.00027277859718337604, "loss": 0.0231, "step": 70010 }, { "epoch": 0.18, "learning_rate": 0.00027277470896700456, "loss": 0.0225, "step": 70020 }, { "epoch": 0.18, "learning_rate": 0.0002727708207506331, "loss": 0.0296, "step": 70030 }, { "epoch": 0.18, "learning_rate": 0.00027276693253426164, "loss": 0.0258, "step": 70040 }, { "epoch": 0.18, "learning_rate": 0.0002727630443178902, "loss": 0.0214, "step": 70050 }, { "epoch": 0.18, "learning_rate": 0.0002727591561015187, "loss": 0.0262, "step": 70060 }, { "epoch": 0.18, "learning_rate": 0.00027275526788514724, "loss": 0.0263, "step": 70070 }, { "epoch": 0.18, "learning_rate": 0.00027275137966877575, "loss": 0.0296, "step": 70080 }, { "epoch": 0.18, "learning_rate": 0.0002727474914524043, "loss": 0.0283, "step": 70090 }, { "epoch": 0.18, "learning_rate": 0.00027274360323603284, "loss": 0.0255, "step": 70100 }, { "epoch": 0.18, "learning_rate": 0.0002727397150196614, "loss": 0.024, "step": 70110 }, { "epoch": 0.18, "learning_rate": 0.0002727358268032899, "loss": 0.0333, "step": 70120 }, { "epoch": 0.18, "learning_rate": 0.0002727319385869185, "loss": 0.0253, "step": 70130 }, { "epoch": 0.18, "learning_rate": 0.000272728050370547, "loss": 0.022, "step": 70140 }, { "epoch": 0.18, "learning_rate": 0.0002727241621541755, "loss": 0.0259, "step": 70150 }, { "epoch": 0.18, "learning_rate": 0.00027272027393780403, "loss": 0.027, "step": 70160 }, { "epoch": 0.18, "learning_rate": 0.0002727163857214326, "loss": 0.0287, "step": 70170 }, { "epoch": 0.18, "learning_rate": 0.00027271249750506117, "loss": 0.0286, "step": 70180 }, { "epoch": 0.18, "learning_rate": 0.0002727086092886897, "loss": 0.023, "step": 70190 }, { "epoch": 0.18, "learning_rate": 0.0002727047210723182, "loss": 0.0229, "step": 70200 }, { "epoch": 0.18, "learning_rate": 0.00027270083285594677, "loss": 0.0233, "step": 70210 }, { "epoch": 0.18, "learning_rate": 0.0002726969446395753, "loss": 0.029, "step": 70220 }, { "epoch": 0.18, "learning_rate": 0.0002726930564232038, "loss": 0.026, "step": 70230 }, { "epoch": 0.18, "learning_rate": 0.00027268916820683236, "loss": 0.0238, "step": 70240 }, { "epoch": 0.18, "learning_rate": 0.0002726852799904609, "loss": 0.0225, "step": 70250 }, { "epoch": 0.18, "learning_rate": 0.00027268139177408945, "loss": 0.0245, "step": 70260 }, { "epoch": 0.18, "learning_rate": 0.00027267750355771796, "loss": 0.0263, "step": 70270 }, { "epoch": 0.18, "learning_rate": 0.0002726736153413465, "loss": 0.024, "step": 70280 }, { "epoch": 0.18, "learning_rate": 0.000272669727124975, "loss": 0.0256, "step": 70290 }, { "epoch": 0.18, "learning_rate": 0.00027266583890860356, "loss": 0.025, "step": 70300 }, { "epoch": 0.18, "learning_rate": 0.0002726619506922321, "loss": 0.0233, "step": 70310 }, { "epoch": 0.18, "learning_rate": 0.00027265806247586064, "loss": 0.021, "step": 70320 }, { "epoch": 0.18, "learning_rate": 0.00027265417425948916, "loss": 0.0252, "step": 70330 }, { "epoch": 0.18, "learning_rate": 0.0002726502860431177, "loss": 0.0227, "step": 70340 }, { "epoch": 0.18, "learning_rate": 0.00027264639782674624, "loss": 0.0283, "step": 70350 }, { "epoch": 0.18, "learning_rate": 0.00027264250961037476, "loss": 0.0275, "step": 70360 }, { "epoch": 0.18, "learning_rate": 0.0002726386213940033, "loss": 0.0248, "step": 70370 }, { "epoch": 0.18, "learning_rate": 0.00027263473317763184, "loss": 0.0253, "step": 70380 }, { "epoch": 0.18, "learning_rate": 0.0002726308449612604, "loss": 0.0222, "step": 70390 }, { "epoch": 0.18, "learning_rate": 0.0002726269567448889, "loss": 0.0266, "step": 70400 }, { "epoch": 0.18, "learning_rate": 0.00027262306852851744, "loss": 0.0232, "step": 70410 }, { "epoch": 0.18, "learning_rate": 0.000272619180312146, "loss": 0.0293, "step": 70420 }, { "epoch": 0.18, "learning_rate": 0.0002726152920957745, "loss": 0.0266, "step": 70430 }, { "epoch": 0.18, "learning_rate": 0.00027261140387940303, "loss": 0.0235, "step": 70440 }, { "epoch": 0.18, "learning_rate": 0.0002726075156630316, "loss": 0.0231, "step": 70450 }, { "epoch": 0.18, "learning_rate": 0.0002726036274466601, "loss": 0.0241, "step": 70460 }, { "epoch": 0.18, "learning_rate": 0.0002725997392302887, "loss": 0.0235, "step": 70470 }, { "epoch": 0.18, "learning_rate": 0.0002725958510139172, "loss": 0.0288, "step": 70480 }, { "epoch": 0.18, "learning_rate": 0.0002725919627975457, "loss": 0.0276, "step": 70490 }, { "epoch": 0.18, "learning_rate": 0.00027258807458117423, "loss": 0.0282, "step": 70500 }, { "epoch": 0.18, "learning_rate": 0.0002725841863648028, "loss": 0.0244, "step": 70510 }, { "epoch": 0.18, "learning_rate": 0.00027258029814843137, "loss": 0.0259, "step": 70520 }, { "epoch": 0.18, "learning_rate": 0.0002725764099320599, "loss": 0.0247, "step": 70530 }, { "epoch": 0.18, "learning_rate": 0.0002725725217156884, "loss": 0.0283, "step": 70540 }, { "epoch": 0.18, "learning_rate": 0.00027256863349931697, "loss": 0.029, "step": 70550 }, { "epoch": 0.18, "learning_rate": 0.0002725647452829455, "loss": 0.0201, "step": 70560 }, { "epoch": 0.18, "learning_rate": 0.000272560857066574, "loss": 0.0241, "step": 70570 }, { "epoch": 0.18, "learning_rate": 0.00027255696885020256, "loss": 0.0225, "step": 70580 }, { "epoch": 0.18, "learning_rate": 0.0002725530806338311, "loss": 0.0304, "step": 70590 }, { "epoch": 0.18, "learning_rate": 0.00027254919241745965, "loss": 0.024, "step": 70600 }, { "epoch": 0.18, "learning_rate": 0.00027254530420108816, "loss": 0.025, "step": 70610 }, { "epoch": 0.18, "learning_rate": 0.0002725414159847167, "loss": 0.03, "step": 70620 }, { "epoch": 0.18, "learning_rate": 0.00027253752776834524, "loss": 0.0248, "step": 70630 }, { "epoch": 0.18, "learning_rate": 0.00027253363955197376, "loss": 0.025, "step": 70640 }, { "epoch": 0.18, "learning_rate": 0.0002725297513356023, "loss": 0.0302, "step": 70650 }, { "epoch": 0.18, "learning_rate": 0.00027252586311923084, "loss": 0.024, "step": 70660 }, { "epoch": 0.18, "learning_rate": 0.0002725219749028594, "loss": 0.0189, "step": 70670 }, { "epoch": 0.18, "learning_rate": 0.0002725180866864879, "loss": 0.0284, "step": 70680 }, { "epoch": 0.18, "learning_rate": 0.00027251419847011644, "loss": 0.0274, "step": 70690 }, { "epoch": 0.18, "learning_rate": 0.00027251031025374495, "loss": 0.0262, "step": 70700 }, { "epoch": 0.18, "learning_rate": 0.0002725064220373735, "loss": 0.0214, "step": 70710 }, { "epoch": 0.18, "learning_rate": 0.00027250253382100204, "loss": 0.0293, "step": 70720 }, { "epoch": 0.18, "learning_rate": 0.0002724986456046306, "loss": 0.0256, "step": 70730 }, { "epoch": 0.18, "learning_rate": 0.0002724947573882591, "loss": 0.0253, "step": 70740 }, { "epoch": 0.18, "learning_rate": 0.00027249086917188764, "loss": 0.0279, "step": 70750 }, { "epoch": 0.18, "learning_rate": 0.0002724869809555162, "loss": 0.0271, "step": 70760 }, { "epoch": 0.18, "learning_rate": 0.0002724830927391447, "loss": 0.025, "step": 70770 }, { "epoch": 0.18, "learning_rate": 0.00027247920452277323, "loss": 0.0229, "step": 70780 }, { "epoch": 0.18, "learning_rate": 0.0002724753163064018, "loss": 0.0223, "step": 70790 }, { "epoch": 0.18, "learning_rate": 0.0002724714280900303, "loss": 0.0248, "step": 70800 }, { "epoch": 0.18, "learning_rate": 0.0002724675398736589, "loss": 0.0301, "step": 70810 }, { "epoch": 0.18, "learning_rate": 0.0002724636516572874, "loss": 0.0287, "step": 70820 }, { "epoch": 0.18, "learning_rate": 0.0002724597634409159, "loss": 0.021, "step": 70830 }, { "epoch": 0.18, "learning_rate": 0.0002724558752245445, "loss": 0.0273, "step": 70840 }, { "epoch": 0.18, "learning_rate": 0.000272451987008173, "loss": 0.0256, "step": 70850 }, { "epoch": 0.18, "learning_rate": 0.0002724480987918015, "loss": 0.0272, "step": 70860 }, { "epoch": 0.18, "learning_rate": 0.0002724442105754301, "loss": 0.0217, "step": 70870 }, { "epoch": 0.18, "learning_rate": 0.00027244032235905865, "loss": 0.0211, "step": 70880 }, { "epoch": 0.18, "learning_rate": 0.00027243643414268716, "loss": 0.027, "step": 70890 }, { "epoch": 0.18, "learning_rate": 0.0002724325459263157, "loss": 0.0255, "step": 70900 }, { "epoch": 0.18, "learning_rate": 0.0002724286577099442, "loss": 0.0289, "step": 70910 }, { "epoch": 0.18, "learning_rate": 0.00027242476949357276, "loss": 0.0258, "step": 70920 }, { "epoch": 0.18, "learning_rate": 0.0002724208812772013, "loss": 0.0269, "step": 70930 }, { "epoch": 0.18, "learning_rate": 0.00027241699306082985, "loss": 0.0267, "step": 70940 }, { "epoch": 0.18, "learning_rate": 0.00027241310484445836, "loss": 0.0251, "step": 70950 }, { "epoch": 0.18, "learning_rate": 0.0002724092166280869, "loss": 0.0276, "step": 70960 }, { "epoch": 0.18, "learning_rate": 0.00027240532841171544, "loss": 0.024, "step": 70970 }, { "epoch": 0.18, "learning_rate": 0.00027240144019534396, "loss": 0.0263, "step": 70980 }, { "epoch": 0.18, "learning_rate": 0.00027239755197897247, "loss": 0.0249, "step": 70990 }, { "epoch": 0.18, "learning_rate": 0.00027239366376260104, "loss": 0.0223, "step": 71000 }, { "epoch": 0.18, "eval_cer": 0.8818048598193629, "eval_loss": 0.018395202234387398, "eval_runtime": 107.9247, "eval_samples_per_second": 18.531, "eval_steps_per_second": 4.633, "step": 71000 }, { "epoch": 0.18, "learning_rate": 0.00027238977554622956, "loss": 0.0266, "step": 71010 }, { "epoch": 0.18, "learning_rate": 0.0002723858873298581, "loss": 0.0295, "step": 71020 }, { "epoch": 0.18, "learning_rate": 0.00027238199911348664, "loss": 0.0319, "step": 71030 }, { "epoch": 0.18, "learning_rate": 0.00027237811089711515, "loss": 0.0221, "step": 71040 }, { "epoch": 0.18, "learning_rate": 0.0002723742226807437, "loss": 0.0247, "step": 71050 }, { "epoch": 0.18, "learning_rate": 0.00027237033446437224, "loss": 0.0252, "step": 71060 }, { "epoch": 0.18, "learning_rate": 0.0002723664462480008, "loss": 0.0236, "step": 71070 }, { "epoch": 0.18, "learning_rate": 0.0002723625580316293, "loss": 0.0266, "step": 71080 }, { "epoch": 0.18, "learning_rate": 0.0002723586698152579, "loss": 0.0239, "step": 71090 }, { "epoch": 0.18, "learning_rate": 0.0002723547815988864, "loss": 0.0283, "step": 71100 }, { "epoch": 0.18, "learning_rate": 0.0002723508933825149, "loss": 0.0235, "step": 71110 }, { "epoch": 0.18, "learning_rate": 0.00027234700516614343, "loss": 0.0249, "step": 71120 }, { "epoch": 0.18, "learning_rate": 0.000272343116949772, "loss": 0.0268, "step": 71130 }, { "epoch": 0.18, "learning_rate": 0.0002723392287334005, "loss": 0.027, "step": 71140 }, { "epoch": 0.18, "learning_rate": 0.0002723353405170291, "loss": 0.025, "step": 71150 }, { "epoch": 0.18, "learning_rate": 0.0002723314523006576, "loss": 0.0329, "step": 71160 }, { "epoch": 0.18, "learning_rate": 0.00027232756408428617, "loss": 0.0262, "step": 71170 }, { "epoch": 0.18, "learning_rate": 0.0002723236758679147, "loss": 0.0227, "step": 71180 }, { "epoch": 0.18, "learning_rate": 0.0002723197876515432, "loss": 0.0232, "step": 71190 }, { "epoch": 0.18, "learning_rate": 0.0002723158994351717, "loss": 0.0228, "step": 71200 }, { "epoch": 0.18, "learning_rate": 0.0002723120112188003, "loss": 0.0254, "step": 71210 }, { "epoch": 0.18, "learning_rate": 0.00027230812300242885, "loss": 0.0231, "step": 71220 }, { "epoch": 0.18, "learning_rate": 0.00027230423478605736, "loss": 0.0236, "step": 71230 }, { "epoch": 0.18, "learning_rate": 0.0002723003465696859, "loss": 0.0235, "step": 71240 }, { "epoch": 0.18, "learning_rate": 0.0002722964583533144, "loss": 0.0299, "step": 71250 }, { "epoch": 0.18, "learning_rate": 0.00027229257013694296, "loss": 0.0242, "step": 71260 }, { "epoch": 0.18, "learning_rate": 0.0002722886819205715, "loss": 0.0258, "step": 71270 }, { "epoch": 0.18, "learning_rate": 0.00027228479370420004, "loss": 0.0276, "step": 71280 }, { "epoch": 0.18, "learning_rate": 0.00027228090548782856, "loss": 0.0312, "step": 71290 }, { "epoch": 0.18, "learning_rate": 0.00027227701727145713, "loss": 0.0292, "step": 71300 }, { "epoch": 0.18, "learning_rate": 0.00027227312905508564, "loss": 0.0282, "step": 71310 }, { "epoch": 0.18, "learning_rate": 0.00027226924083871416, "loss": 0.0364, "step": 71320 }, { "epoch": 0.18, "learning_rate": 0.00027226535262234267, "loss": 0.029, "step": 71330 }, { "epoch": 0.18, "learning_rate": 0.00027226146440597124, "loss": 0.035, "step": 71340 }, { "epoch": 0.18, "learning_rate": 0.00027225757618959975, "loss": 0.0239, "step": 71350 }, { "epoch": 0.18, "learning_rate": 0.0002722536879732283, "loss": 0.0236, "step": 71360 }, { "epoch": 0.19, "learning_rate": 0.00027224979975685684, "loss": 0.0246, "step": 71370 }, { "epoch": 0.19, "learning_rate": 0.0002722459115404854, "loss": 0.0244, "step": 71380 }, { "epoch": 0.19, "learning_rate": 0.0002722420233241139, "loss": 0.0295, "step": 71390 }, { "epoch": 0.19, "learning_rate": 0.00027223813510774244, "loss": 0.0222, "step": 71400 }, { "epoch": 0.19, "learning_rate": 0.000272234246891371, "loss": 0.0234, "step": 71410 }, { "epoch": 0.19, "learning_rate": 0.0002722303586749995, "loss": 0.0245, "step": 71420 }, { "epoch": 0.19, "learning_rate": 0.0002722264704586281, "loss": 0.0281, "step": 71430 }, { "epoch": 0.19, "learning_rate": 0.0002722225822422566, "loss": 0.0317, "step": 71440 }, { "epoch": 0.19, "learning_rate": 0.0002722186940258851, "loss": 0.03, "step": 71450 }, { "epoch": 0.19, "learning_rate": 0.00027221480580951363, "loss": 0.0288, "step": 71460 }, { "epoch": 0.19, "learning_rate": 0.0002722109175931422, "loss": 0.0248, "step": 71470 }, { "epoch": 0.19, "learning_rate": 0.0002722070293767707, "loss": 0.0243, "step": 71480 }, { "epoch": 0.19, "learning_rate": 0.0002722031411603993, "loss": 0.0296, "step": 71490 }, { "epoch": 0.19, "learning_rate": 0.0002721992529440278, "loss": 0.0226, "step": 71500 }, { "epoch": 0.19, "learning_rate": 0.00027219536472765637, "loss": 0.0257, "step": 71510 }, { "epoch": 0.19, "learning_rate": 0.0002721914765112849, "loss": 0.0286, "step": 71520 }, { "epoch": 0.19, "learning_rate": 0.0002721875882949134, "loss": 0.026, "step": 71530 }, { "epoch": 0.19, "learning_rate": 0.0002721837000785419, "loss": 0.0317, "step": 71540 }, { "epoch": 0.19, "learning_rate": 0.0002721798118621705, "loss": 0.0327, "step": 71550 }, { "epoch": 0.19, "learning_rate": 0.00027217592364579905, "loss": 0.023, "step": 71560 }, { "epoch": 0.19, "learning_rate": 0.00027217203542942756, "loss": 0.024, "step": 71570 }, { "epoch": 0.19, "learning_rate": 0.0002721681472130561, "loss": 0.028, "step": 71580 }, { "epoch": 0.19, "learning_rate": 0.00027216425899668465, "loss": 0.0226, "step": 71590 }, { "epoch": 0.19, "learning_rate": 0.00027216037078031316, "loss": 0.0252, "step": 71600 }, { "epoch": 0.19, "learning_rate": 0.0002721564825639417, "loss": 0.0245, "step": 71610 }, { "epoch": 0.19, "learning_rate": 0.00027215259434757024, "loss": 0.0229, "step": 71620 }, { "epoch": 0.19, "learning_rate": 0.00027214870613119876, "loss": 0.0209, "step": 71630 }, { "epoch": 0.19, "learning_rate": 0.0002721448179148273, "loss": 0.0253, "step": 71640 }, { "epoch": 0.19, "learning_rate": 0.00027214092969845584, "loss": 0.0194, "step": 71650 }, { "epoch": 0.19, "learning_rate": 0.00027213704148208436, "loss": 0.0219, "step": 71660 }, { "epoch": 0.19, "learning_rate": 0.0002721331532657129, "loss": 0.028, "step": 71670 }, { "epoch": 0.19, "learning_rate": 0.00027212926504934144, "loss": 0.0312, "step": 71680 }, { "epoch": 0.19, "learning_rate": 0.00027212537683296995, "loss": 0.0244, "step": 71690 }, { "epoch": 0.19, "learning_rate": 0.0002721214886165985, "loss": 0.0225, "step": 71700 }, { "epoch": 0.19, "learning_rate": 0.00027211760040022704, "loss": 0.0233, "step": 71710 }, { "epoch": 0.19, "learning_rate": 0.0002721137121838556, "loss": 0.0271, "step": 71720 }, { "epoch": 0.19, "learning_rate": 0.0002721098239674841, "loss": 0.0228, "step": 71730 }, { "epoch": 0.19, "learning_rate": 0.00027210593575111263, "loss": 0.0287, "step": 71740 }, { "epoch": 0.19, "learning_rate": 0.00027210204753474115, "loss": 0.0256, "step": 71750 }, { "epoch": 0.19, "learning_rate": 0.0002720981593183697, "loss": 0.0236, "step": 71760 }, { "epoch": 0.19, "learning_rate": 0.0002720942711019983, "loss": 0.031, "step": 71770 }, { "epoch": 0.19, "learning_rate": 0.0002720903828856268, "loss": 0.0268, "step": 71780 }, { "epoch": 0.19, "learning_rate": 0.0002720864946692553, "loss": 0.0238, "step": 71790 }, { "epoch": 0.19, "learning_rate": 0.0002720826064528839, "loss": 0.0247, "step": 71800 }, { "epoch": 0.19, "learning_rate": 0.0002720787182365124, "loss": 0.028, "step": 71810 }, { "epoch": 0.19, "learning_rate": 0.0002720748300201409, "loss": 0.0289, "step": 71820 }, { "epoch": 0.19, "learning_rate": 0.0002720709418037695, "loss": 0.0246, "step": 71830 }, { "epoch": 0.19, "learning_rate": 0.000272067053587398, "loss": 0.0284, "step": 71840 }, { "epoch": 0.19, "learning_rate": 0.00027206316537102657, "loss": 0.0241, "step": 71850 }, { "epoch": 0.19, "learning_rate": 0.0002720592771546551, "loss": 0.0271, "step": 71860 }, { "epoch": 0.19, "learning_rate": 0.0002720553889382836, "loss": 0.0204, "step": 71870 }, { "epoch": 0.19, "learning_rate": 0.00027205150072191216, "loss": 0.0252, "step": 71880 }, { "epoch": 0.19, "learning_rate": 0.0002720476125055407, "loss": 0.0263, "step": 71890 }, { "epoch": 0.19, "learning_rate": 0.0002720437242891692, "loss": 0.0269, "step": 71900 }, { "epoch": 0.19, "learning_rate": 0.00027203983607279776, "loss": 0.0371, "step": 71910 }, { "epoch": 0.19, "learning_rate": 0.00027203594785642633, "loss": 0.022, "step": 71920 }, { "epoch": 0.19, "learning_rate": 0.00027203205964005484, "loss": 0.0208, "step": 71930 }, { "epoch": 0.19, "learning_rate": 0.00027202817142368336, "loss": 0.0248, "step": 71940 }, { "epoch": 0.19, "learning_rate": 0.0002720242832073119, "loss": 0.0213, "step": 71950 }, { "epoch": 0.19, "learning_rate": 0.00027202039499094044, "loss": 0.0282, "step": 71960 }, { "epoch": 0.19, "learning_rate": 0.00027201650677456896, "loss": 0.025, "step": 71970 }, { "epoch": 0.19, "learning_rate": 0.0002720126185581975, "loss": 0.0241, "step": 71980 }, { "epoch": 0.19, "learning_rate": 0.00027200873034182604, "loss": 0.0236, "step": 71990 }, { "epoch": 0.19, "learning_rate": 0.00027200484212545455, "loss": 0.0262, "step": 72000 }, { "epoch": 0.19, "eval_cer": 0.8818034601824287, "eval_loss": 0.017536072060465813, "eval_runtime": 107.8637, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 72000 }, { "epoch": 0.19, "learning_rate": 0.0002720009539090831, "loss": 0.0243, "step": 72010 }, { "epoch": 0.19, "learning_rate": 0.00027199706569271164, "loss": 0.0249, "step": 72020 }, { "epoch": 0.19, "learning_rate": 0.00027199317747634015, "loss": 0.0276, "step": 72030 }, { "epoch": 0.19, "learning_rate": 0.0002719892892599687, "loss": 0.0289, "step": 72040 }, { "epoch": 0.19, "learning_rate": 0.00027198540104359724, "loss": 0.0276, "step": 72050 }, { "epoch": 0.19, "learning_rate": 0.0002719815128272258, "loss": 0.0213, "step": 72060 }, { "epoch": 0.19, "learning_rate": 0.0002719776246108543, "loss": 0.0212, "step": 72070 }, { "epoch": 0.19, "learning_rate": 0.00027197373639448283, "loss": 0.0258, "step": 72080 }, { "epoch": 0.19, "learning_rate": 0.0002719698481781114, "loss": 0.02, "step": 72090 }, { "epoch": 0.19, "learning_rate": 0.0002719659599617399, "loss": 0.0279, "step": 72100 }, { "epoch": 0.19, "learning_rate": 0.0002719620717453685, "loss": 0.0279, "step": 72110 }, { "epoch": 0.19, "learning_rate": 0.000271958183528997, "loss": 0.0213, "step": 72120 }, { "epoch": 0.19, "learning_rate": 0.00027195429531262557, "loss": 0.0213, "step": 72130 }, { "epoch": 0.19, "learning_rate": 0.0002719504070962541, "loss": 0.0195, "step": 72140 }, { "epoch": 0.19, "learning_rate": 0.0002719465188798826, "loss": 0.0314, "step": 72150 }, { "epoch": 0.19, "learning_rate": 0.0002719426306635111, "loss": 0.0227, "step": 72160 }, { "epoch": 0.19, "learning_rate": 0.0002719387424471397, "loss": 0.0253, "step": 72170 }, { "epoch": 0.19, "learning_rate": 0.0002719348542307682, "loss": 0.0216, "step": 72180 }, { "epoch": 0.19, "learning_rate": 0.00027193096601439676, "loss": 0.0229, "step": 72190 }, { "epoch": 0.19, "learning_rate": 0.0002719270777980253, "loss": 0.0207, "step": 72200 }, { "epoch": 0.19, "learning_rate": 0.0002719231895816538, "loss": 0.0263, "step": 72210 }, { "epoch": 0.19, "learning_rate": 0.00027191930136528236, "loss": 0.0246, "step": 72220 }, { "epoch": 0.19, "learning_rate": 0.0002719154131489109, "loss": 0.0273, "step": 72230 }, { "epoch": 0.19, "learning_rate": 0.0002719115249325394, "loss": 0.0212, "step": 72240 }, { "epoch": 0.19, "learning_rate": 0.00027190763671616796, "loss": 0.0273, "step": 72250 }, { "epoch": 0.19, "learning_rate": 0.00027190374849979653, "loss": 0.0264, "step": 72260 }, { "epoch": 0.19, "learning_rate": 0.00027189986028342504, "loss": 0.0251, "step": 72270 }, { "epoch": 0.19, "learning_rate": 0.00027189597206705356, "loss": 0.0223, "step": 72280 }, { "epoch": 0.19, "learning_rate": 0.00027189208385068207, "loss": 0.0229, "step": 72290 }, { "epoch": 0.19, "learning_rate": 0.00027188819563431064, "loss": 0.0206, "step": 72300 }, { "epoch": 0.19, "learning_rate": 0.00027188430741793916, "loss": 0.0302, "step": 72310 }, { "epoch": 0.19, "learning_rate": 0.0002718804192015677, "loss": 0.0233, "step": 72320 }, { "epoch": 0.19, "learning_rate": 0.00027187653098519624, "loss": 0.031, "step": 72330 }, { "epoch": 0.19, "learning_rate": 0.0002718726427688248, "loss": 0.0289, "step": 72340 }, { "epoch": 0.19, "learning_rate": 0.0002718687545524533, "loss": 0.022, "step": 72350 }, { "epoch": 0.19, "learning_rate": 0.00027186486633608184, "loss": 0.0194, "step": 72360 }, { "epoch": 0.19, "learning_rate": 0.00027186097811971035, "loss": 0.0236, "step": 72370 }, { "epoch": 0.19, "learning_rate": 0.0002718570899033389, "loss": 0.0274, "step": 72380 }, { "epoch": 0.19, "learning_rate": 0.00027185320168696743, "loss": 0.0198, "step": 72390 }, { "epoch": 0.19, "learning_rate": 0.000271849313470596, "loss": 0.0251, "step": 72400 }, { "epoch": 0.19, "learning_rate": 0.0002718454252542245, "loss": 0.0277, "step": 72410 }, { "epoch": 0.19, "learning_rate": 0.0002718415370378531, "loss": 0.025, "step": 72420 }, { "epoch": 0.19, "learning_rate": 0.0002718376488214816, "loss": 0.0239, "step": 72430 }, { "epoch": 0.19, "learning_rate": 0.0002718337606051101, "loss": 0.0236, "step": 72440 }, { "epoch": 0.19, "learning_rate": 0.00027182987238873863, "loss": 0.0201, "step": 72450 }, { "epoch": 0.19, "learning_rate": 0.0002718259841723672, "loss": 0.0253, "step": 72460 }, { "epoch": 0.19, "learning_rate": 0.00027182209595599577, "loss": 0.0237, "step": 72470 }, { "epoch": 0.19, "learning_rate": 0.0002718182077396243, "loss": 0.0224, "step": 72480 }, { "epoch": 0.19, "learning_rate": 0.0002718143195232528, "loss": 0.0219, "step": 72490 }, { "epoch": 0.19, "learning_rate": 0.0002718104313068813, "loss": 0.026, "step": 72500 }, { "epoch": 0.19, "learning_rate": 0.0002718065430905099, "loss": 0.0227, "step": 72510 }, { "epoch": 0.19, "learning_rate": 0.0002718026548741384, "loss": 0.0285, "step": 72520 }, { "epoch": 0.19, "learning_rate": 0.00027179876665776696, "loss": 0.0261, "step": 72530 }, { "epoch": 0.19, "learning_rate": 0.0002717948784413955, "loss": 0.0258, "step": 72540 }, { "epoch": 0.19, "learning_rate": 0.00027179099022502405, "loss": 0.0329, "step": 72550 }, { "epoch": 0.19, "learning_rate": 0.00027178710200865256, "loss": 0.0234, "step": 72560 }, { "epoch": 0.19, "learning_rate": 0.0002717832137922811, "loss": 0.0279, "step": 72570 }, { "epoch": 0.19, "learning_rate": 0.0002717793255759096, "loss": 0.0297, "step": 72580 }, { "epoch": 0.19, "learning_rate": 0.00027177543735953816, "loss": 0.0264, "step": 72590 }, { "epoch": 0.19, "learning_rate": 0.0002717715491431667, "loss": 0.0297, "step": 72600 }, { "epoch": 0.19, "learning_rate": 0.00027176766092679524, "loss": 0.0237, "step": 72610 }, { "epoch": 0.19, "learning_rate": 0.00027176377271042376, "loss": 0.0294, "step": 72620 }, { "epoch": 0.19, "learning_rate": 0.0002717598844940523, "loss": 0.0236, "step": 72630 }, { "epoch": 0.19, "learning_rate": 0.00027175599627768084, "loss": 0.03, "step": 72640 }, { "epoch": 0.19, "learning_rate": 0.00027175210806130935, "loss": 0.0274, "step": 72650 }, { "epoch": 0.19, "learning_rate": 0.0002717482198449379, "loss": 0.0272, "step": 72660 }, { "epoch": 0.19, "learning_rate": 0.00027174433162856644, "loss": 0.0296, "step": 72670 }, { "epoch": 0.19, "learning_rate": 0.000271740443412195, "loss": 0.0211, "step": 72680 }, { "epoch": 0.19, "learning_rate": 0.0002717365551958235, "loss": 0.0235, "step": 72690 }, { "epoch": 0.19, "learning_rate": 0.00027173266697945204, "loss": 0.0234, "step": 72700 }, { "epoch": 0.19, "learning_rate": 0.00027172877876308055, "loss": 0.0282, "step": 72710 }, { "epoch": 0.19, "learning_rate": 0.0002717248905467091, "loss": 0.0283, "step": 72720 }, { "epoch": 0.19, "learning_rate": 0.00027172100233033763, "loss": 0.0239, "step": 72730 }, { "epoch": 0.19, "learning_rate": 0.0002717171141139662, "loss": 0.0273, "step": 72740 }, { "epoch": 0.19, "learning_rate": 0.0002717132258975947, "loss": 0.0243, "step": 72750 }, { "epoch": 0.19, "learning_rate": 0.0002717093376812233, "loss": 0.0236, "step": 72760 }, { "epoch": 0.19, "learning_rate": 0.0002717054494648518, "loss": 0.0244, "step": 72770 }, { "epoch": 0.19, "learning_rate": 0.0002717015612484803, "loss": 0.0239, "step": 72780 }, { "epoch": 0.19, "learning_rate": 0.00027169767303210883, "loss": 0.032, "step": 72790 }, { "epoch": 0.19, "learning_rate": 0.0002716937848157374, "loss": 0.0278, "step": 72800 }, { "epoch": 0.19, "learning_rate": 0.00027168989659936597, "loss": 0.022, "step": 72810 }, { "epoch": 0.19, "learning_rate": 0.0002716860083829945, "loss": 0.0232, "step": 72820 }, { "epoch": 0.19, "learning_rate": 0.000271682120166623, "loss": 0.0312, "step": 72830 }, { "epoch": 0.19, "learning_rate": 0.00027167823195025156, "loss": 0.0208, "step": 72840 }, { "epoch": 0.19, "learning_rate": 0.0002716743437338801, "loss": 0.0289, "step": 72850 }, { "epoch": 0.19, "learning_rate": 0.0002716704555175086, "loss": 0.0228, "step": 72860 }, { "epoch": 0.19, "learning_rate": 0.00027166656730113716, "loss": 0.0246, "step": 72870 }, { "epoch": 0.19, "learning_rate": 0.0002716626790847657, "loss": 0.023, "step": 72880 }, { "epoch": 0.19, "learning_rate": 0.00027165879086839425, "loss": 0.028, "step": 72890 }, { "epoch": 0.19, "learning_rate": 0.00027165490265202276, "loss": 0.02, "step": 72900 }, { "epoch": 0.19, "learning_rate": 0.0002716510144356513, "loss": 0.0226, "step": 72910 }, { "epoch": 0.19, "learning_rate": 0.00027164712621927984, "loss": 0.0234, "step": 72920 }, { "epoch": 0.19, "learning_rate": 0.00027164323800290836, "loss": 0.0267, "step": 72930 }, { "epoch": 0.19, "learning_rate": 0.00027163934978653687, "loss": 0.0315, "step": 72940 }, { "epoch": 0.19, "learning_rate": 0.00027163546157016544, "loss": 0.0257, "step": 72950 }, { "epoch": 0.19, "learning_rate": 0.00027163157335379396, "loss": 0.0262, "step": 72960 }, { "epoch": 0.19, "learning_rate": 0.0002716276851374225, "loss": 0.0246, "step": 72970 }, { "epoch": 0.19, "learning_rate": 0.00027162379692105104, "loss": 0.0295, "step": 72980 }, { "epoch": 0.19, "learning_rate": 0.00027161990870467955, "loss": 0.0236, "step": 72990 }, { "epoch": 0.19, "learning_rate": 0.0002716160204883081, "loss": 0.0234, "step": 73000 }, { "epoch": 0.19, "eval_cer": 0.88176706962214, "eval_loss": 0.018438469618558884, "eval_runtime": 107.9064, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 73000 }, { "epoch": 0.19, "learning_rate": 0.00027161213227193664, "loss": 0.0253, "step": 73010 }, { "epoch": 0.19, "learning_rate": 0.0002716082440555652, "loss": 0.0262, "step": 73020 }, { "epoch": 0.19, "learning_rate": 0.0002716043558391937, "loss": 0.059, "step": 73030 }, { "epoch": 0.19, "learning_rate": 0.00027160046762282223, "loss": 0.0958, "step": 73040 }, { "epoch": 0.19, "learning_rate": 0.0002715965794064508, "loss": 0.0285, "step": 73050 }, { "epoch": 0.19, "learning_rate": 0.0002715926911900793, "loss": 0.0338, "step": 73060 }, { "epoch": 0.19, "learning_rate": 0.00027158880297370783, "loss": 0.0242, "step": 73070 }, { "epoch": 0.19, "learning_rate": 0.0002715849147573364, "loss": 0.0243, "step": 73080 }, { "epoch": 0.19, "learning_rate": 0.0002715810265409649, "loss": 0.0243, "step": 73090 }, { "epoch": 0.19, "learning_rate": 0.0002715771383245935, "loss": 0.0256, "step": 73100 }, { "epoch": 0.19, "learning_rate": 0.000271573250108222, "loss": 0.0281, "step": 73110 }, { "epoch": 0.19, "learning_rate": 0.0002715693618918505, "loss": 0.0276, "step": 73120 }, { "epoch": 0.19, "learning_rate": 0.0002715654736754791, "loss": 0.027, "step": 73130 }, { "epoch": 0.19, "learning_rate": 0.0002715615854591076, "loss": 0.0202, "step": 73140 }, { "epoch": 0.19, "learning_rate": 0.00027155769724273617, "loss": 0.0324, "step": 73150 }, { "epoch": 0.19, "learning_rate": 0.0002715538090263647, "loss": 0.0307, "step": 73160 }, { "epoch": 0.19, "learning_rate": 0.00027154992080999325, "loss": 0.0325, "step": 73170 }, { "epoch": 0.19, "learning_rate": 0.00027154603259362176, "loss": 0.0237, "step": 73180 }, { "epoch": 0.19, "learning_rate": 0.0002715421443772503, "loss": 0.0225, "step": 73190 }, { "epoch": 0.19, "learning_rate": 0.0002715382561608788, "loss": 0.0251, "step": 73200 }, { "epoch": 0.19, "learning_rate": 0.00027153436794450736, "loss": 0.0284, "step": 73210 }, { "epoch": 0.19, "learning_rate": 0.0002715304797281359, "loss": 0.0257, "step": 73220 }, { "epoch": 0.19, "learning_rate": 0.00027152659151176444, "loss": 0.0231, "step": 73230 }, { "epoch": 0.19, "learning_rate": 0.00027152270329539296, "loss": 0.0222, "step": 73240 }, { "epoch": 0.19, "learning_rate": 0.0002715188150790215, "loss": 0.0268, "step": 73250 }, { "epoch": 0.19, "learning_rate": 0.00027151492686265004, "loss": 0.0214, "step": 73260 }, { "epoch": 0.19, "learning_rate": 0.00027151103864627856, "loss": 0.0233, "step": 73270 }, { "epoch": 0.19, "learning_rate": 0.00027150715042990707, "loss": 0.0486, "step": 73280 }, { "epoch": 0.19, "learning_rate": 0.00027150326221353564, "loss": 0.0237, "step": 73290 }, { "epoch": 0.19, "learning_rate": 0.0002714993739971642, "loss": 0.019, "step": 73300 }, { "epoch": 0.19, "learning_rate": 0.0002714954857807927, "loss": 0.0259, "step": 73310 }, { "epoch": 0.19, "learning_rate": 0.00027149159756442124, "loss": 0.0289, "step": 73320 }, { "epoch": 0.19, "learning_rate": 0.00027148770934804975, "loss": 0.0238, "step": 73330 }, { "epoch": 0.19, "learning_rate": 0.0002714838211316783, "loss": 0.0284, "step": 73340 }, { "epoch": 0.19, "learning_rate": 0.00027147993291530684, "loss": 0.0258, "step": 73350 }, { "epoch": 0.19, "learning_rate": 0.0002714760446989354, "loss": 0.0265, "step": 73360 }, { "epoch": 0.19, "learning_rate": 0.0002714721564825639, "loss": 0.0241, "step": 73370 }, { "epoch": 0.19, "learning_rate": 0.0002714682682661925, "loss": 0.0312, "step": 73380 }, { "epoch": 0.19, "learning_rate": 0.000271464380049821, "loss": 0.0221, "step": 73390 }, { "epoch": 0.19, "learning_rate": 0.0002714604918334495, "loss": 0.0209, "step": 73400 }, { "epoch": 0.19, "learning_rate": 0.00027145660361707803, "loss": 0.026, "step": 73410 }, { "epoch": 0.19, "learning_rate": 0.0002714527154007066, "loss": 0.0232, "step": 73420 }, { "epoch": 0.19, "learning_rate": 0.0002714488271843351, "loss": 0.0195, "step": 73430 }, { "epoch": 0.19, "learning_rate": 0.0002714449389679637, "loss": 0.0285, "step": 73440 }, { "epoch": 0.19, "learning_rate": 0.0002714410507515922, "loss": 0.0213, "step": 73450 }, { "epoch": 0.19, "learning_rate": 0.0002714371625352207, "loss": 0.027, "step": 73460 }, { "epoch": 0.19, "learning_rate": 0.0002714332743188493, "loss": 0.0263, "step": 73470 }, { "epoch": 0.19, "learning_rate": 0.0002714293861024778, "loss": 0.0242, "step": 73480 }, { "epoch": 0.19, "learning_rate": 0.0002714254978861063, "loss": 0.0189, "step": 73490 }, { "epoch": 0.19, "learning_rate": 0.0002714216096697349, "loss": 0.026, "step": 73500 }, { "epoch": 0.19, "learning_rate": 0.00027141772145336345, "loss": 0.028, "step": 73510 }, { "epoch": 0.19, "learning_rate": 0.00027141383323699196, "loss": 0.0284, "step": 73520 }, { "epoch": 0.19, "learning_rate": 0.0002714099450206205, "loss": 0.0267, "step": 73530 }, { "epoch": 0.19, "learning_rate": 0.000271406056804249, "loss": 0.0253, "step": 73540 }, { "epoch": 0.19, "learning_rate": 0.00027140216858787756, "loss": 0.0196, "step": 73550 }, { "epoch": 0.19, "learning_rate": 0.0002713982803715061, "loss": 0.0249, "step": 73560 }, { "epoch": 0.19, "learning_rate": 0.00027139439215513464, "loss": 0.0271, "step": 73570 }, { "epoch": 0.19, "learning_rate": 0.00027139050393876316, "loss": 0.0269, "step": 73580 }, { "epoch": 0.19, "learning_rate": 0.0002713866157223917, "loss": 0.0262, "step": 73590 }, { "epoch": 0.19, "learning_rate": 0.00027138272750602024, "loss": 0.0298, "step": 73600 }, { "epoch": 0.19, "learning_rate": 0.00027137883928964876, "loss": 0.0231, "step": 73610 }, { "epoch": 0.19, "learning_rate": 0.00027137495107327727, "loss": 0.0229, "step": 73620 }, { "epoch": 0.19, "learning_rate": 0.00027137106285690584, "loss": 0.0335, "step": 73630 }, { "epoch": 0.19, "learning_rate": 0.00027136717464053435, "loss": 0.0243, "step": 73640 }, { "epoch": 0.19, "learning_rate": 0.0002713632864241629, "loss": 0.026, "step": 73650 }, { "epoch": 0.19, "learning_rate": 0.00027135939820779144, "loss": 0.0323, "step": 73660 }, { "epoch": 0.19, "learning_rate": 0.00027135550999142, "loss": 0.023, "step": 73670 }, { "epoch": 0.19, "learning_rate": 0.0002713516217750485, "loss": 0.0251, "step": 73680 }, { "epoch": 0.19, "learning_rate": 0.00027134773355867703, "loss": 0.0235, "step": 73690 }, { "epoch": 0.19, "learning_rate": 0.0002713438453423056, "loss": 0.0256, "step": 73700 }, { "epoch": 0.19, "learning_rate": 0.0002713399571259341, "loss": 0.0254, "step": 73710 }, { "epoch": 0.19, "learning_rate": 0.0002713360689095627, "loss": 0.0187, "step": 73720 }, { "epoch": 0.19, "learning_rate": 0.0002713321806931912, "loss": 0.0275, "step": 73730 }, { "epoch": 0.19, "learning_rate": 0.0002713282924768197, "loss": 0.0239, "step": 73740 }, { "epoch": 0.19, "learning_rate": 0.00027132440426044823, "loss": 0.0231, "step": 73750 }, { "epoch": 0.19, "learning_rate": 0.0002713205160440768, "loss": 0.0223, "step": 73760 }, { "epoch": 0.19, "learning_rate": 0.0002713166278277053, "loss": 0.0248, "step": 73770 }, { "epoch": 0.19, "learning_rate": 0.0002713127396113339, "loss": 0.0278, "step": 73780 }, { "epoch": 0.19, "learning_rate": 0.0002713088513949624, "loss": 0.026, "step": 73790 }, { "epoch": 0.19, "learning_rate": 0.00027130496317859097, "loss": 0.0189, "step": 73800 }, { "epoch": 0.19, "learning_rate": 0.0002713010749622195, "loss": 0.0219, "step": 73810 }, { "epoch": 0.19, "learning_rate": 0.000271297186745848, "loss": 0.026, "step": 73820 }, { "epoch": 0.19, "learning_rate": 0.0002712932985294765, "loss": 0.0217, "step": 73830 }, { "epoch": 0.19, "learning_rate": 0.0002712894103131051, "loss": 0.0218, "step": 73840 }, { "epoch": 0.19, "learning_rate": 0.00027128552209673365, "loss": 0.0312, "step": 73850 }, { "epoch": 0.19, "learning_rate": 0.00027128163388036216, "loss": 0.0279, "step": 73860 }, { "epoch": 0.19, "learning_rate": 0.0002712777456639907, "loss": 0.0234, "step": 73870 }, { "epoch": 0.19, "learning_rate": 0.00027127385744761924, "loss": 0.0232, "step": 73880 }, { "epoch": 0.19, "learning_rate": 0.00027126996923124776, "loss": 0.0226, "step": 73890 }, { "epoch": 0.19, "learning_rate": 0.0002712660810148763, "loss": 0.0224, "step": 73900 }, { "epoch": 0.19, "learning_rate": 0.00027126219279850484, "loss": 0.0251, "step": 73910 }, { "epoch": 0.19, "learning_rate": 0.00027125830458213336, "loss": 0.0315, "step": 73920 }, { "epoch": 0.19, "learning_rate": 0.0002712544163657619, "loss": 0.0274, "step": 73930 }, { "epoch": 0.19, "learning_rate": 0.00027125052814939044, "loss": 0.026, "step": 73940 }, { "epoch": 0.19, "learning_rate": 0.00027124663993301895, "loss": 0.0312, "step": 73950 }, { "epoch": 0.19, "learning_rate": 0.00027124275171664747, "loss": 0.0209, "step": 73960 }, { "epoch": 0.19, "learning_rate": 0.00027123886350027604, "loss": 0.0228, "step": 73970 }, { "epoch": 0.19, "learning_rate": 0.00027123497528390455, "loss": 0.023, "step": 73980 }, { "epoch": 0.19, "learning_rate": 0.0002712310870675331, "loss": 0.024, "step": 73990 }, { "epoch": 0.19, "learning_rate": 0.00027122719885116164, "loss": 0.0253, "step": 74000 }, { "epoch": 0.19, "eval_cer": 0.8818370514688489, "eval_loss": 0.018291616812348366, "eval_runtime": 108.0408, "eval_samples_per_second": 18.512, "eval_steps_per_second": 4.628, "step": 74000 }, { "epoch": 0.19, "learning_rate": 0.0002712233106347902, "loss": 0.0218, "step": 74010 }, { "epoch": 0.19, "learning_rate": 0.0002712194224184187, "loss": 0.03, "step": 74020 }, { "epoch": 0.19, "learning_rate": 0.00027121553420204723, "loss": 0.025, "step": 74030 }, { "epoch": 0.19, "learning_rate": 0.00027121164598567575, "loss": 0.0264, "step": 74040 }, { "epoch": 0.19, "learning_rate": 0.0002712077577693043, "loss": 0.0199, "step": 74050 }, { "epoch": 0.19, "learning_rate": 0.0002712038695529329, "loss": 0.029, "step": 74060 }, { "epoch": 0.19, "learning_rate": 0.0002711999813365614, "loss": 0.0227, "step": 74070 }, { "epoch": 0.19, "learning_rate": 0.0002711960931201899, "loss": 0.0317, "step": 74080 }, { "epoch": 0.19, "learning_rate": 0.0002711922049038185, "loss": 0.0344, "step": 74090 }, { "epoch": 0.19, "learning_rate": 0.000271188316687447, "loss": 0.0263, "step": 74100 }, { "epoch": 0.19, "learning_rate": 0.0002711844284710755, "loss": 0.0234, "step": 74110 }, { "epoch": 0.19, "learning_rate": 0.0002711805402547041, "loss": 0.0211, "step": 74120 }, { "epoch": 0.19, "learning_rate": 0.0002711766520383326, "loss": 0.0246, "step": 74130 }, { "epoch": 0.19, "learning_rate": 0.00027117276382196116, "loss": 0.0197, "step": 74140 }, { "epoch": 0.19, "learning_rate": 0.0002711688756055897, "loss": 0.0255, "step": 74150 }, { "epoch": 0.19, "learning_rate": 0.0002711649873892182, "loss": 0.0242, "step": 74160 }, { "epoch": 0.19, "learning_rate": 0.00027116109917284676, "loss": 0.0246, "step": 74170 }, { "epoch": 0.19, "learning_rate": 0.0002711572109564753, "loss": 0.0192, "step": 74180 }, { "epoch": 0.19, "learning_rate": 0.0002711533227401038, "loss": 0.0227, "step": 74190 }, { "epoch": 0.19, "learning_rate": 0.00027114943452373236, "loss": 0.0238, "step": 74200 }, { "epoch": 0.19, "learning_rate": 0.0002711455463073609, "loss": 0.0252, "step": 74210 }, { "epoch": 0.19, "learning_rate": 0.00027114165809098944, "loss": 0.024, "step": 74220 }, { "epoch": 0.19, "learning_rate": 0.00027113776987461796, "loss": 0.0205, "step": 74230 }, { "epoch": 0.19, "learning_rate": 0.00027113388165824647, "loss": 0.0236, "step": 74240 }, { "epoch": 0.19, "learning_rate": 0.00027112999344187504, "loss": 0.0231, "step": 74250 }, { "epoch": 0.19, "learning_rate": 0.00027112610522550356, "loss": 0.0226, "step": 74260 }, { "epoch": 0.19, "learning_rate": 0.0002711222170091321, "loss": 0.0251, "step": 74270 }, { "epoch": 0.19, "learning_rate": 0.00027111832879276064, "loss": 0.024, "step": 74280 }, { "epoch": 0.19, "learning_rate": 0.00027111444057638915, "loss": 0.0223, "step": 74290 }, { "epoch": 0.19, "learning_rate": 0.0002711105523600177, "loss": 0.0217, "step": 74300 }, { "epoch": 0.19, "learning_rate": 0.00027110666414364624, "loss": 0.0252, "step": 74310 }, { "epoch": 0.19, "learning_rate": 0.00027110277592727475, "loss": 0.0228, "step": 74320 }, { "epoch": 0.19, "learning_rate": 0.0002710988877109033, "loss": 0.0239, "step": 74330 }, { "epoch": 0.19, "learning_rate": 0.0002710949994945319, "loss": 0.0257, "step": 74340 }, { "epoch": 0.19, "learning_rate": 0.0002710911112781604, "loss": 0.0287, "step": 74350 }, { "epoch": 0.19, "learning_rate": 0.0002710872230617889, "loss": 0.0217, "step": 74360 }, { "epoch": 0.19, "learning_rate": 0.00027108333484541743, "loss": 0.0289, "step": 74370 }, { "epoch": 0.19, "learning_rate": 0.000271079446629046, "loss": 0.0211, "step": 74380 }, { "epoch": 0.19, "learning_rate": 0.0002710755584126745, "loss": 0.0262, "step": 74390 }, { "epoch": 0.19, "learning_rate": 0.0002710716701963031, "loss": 0.0212, "step": 74400 }, { "epoch": 0.19, "learning_rate": 0.0002710677819799316, "loss": 0.0295, "step": 74410 }, { "epoch": 0.19, "learning_rate": 0.00027106389376356017, "loss": 0.0229, "step": 74420 }, { "epoch": 0.19, "learning_rate": 0.0002710600055471887, "loss": 0.0237, "step": 74430 }, { "epoch": 0.19, "learning_rate": 0.0002710561173308172, "loss": 0.022, "step": 74440 }, { "epoch": 0.19, "learning_rate": 0.0002710522291144457, "loss": 0.0258, "step": 74450 }, { "epoch": 0.19, "learning_rate": 0.0002710483408980743, "loss": 0.0225, "step": 74460 }, { "epoch": 0.19, "learning_rate": 0.0002710444526817028, "loss": 0.0241, "step": 74470 }, { "epoch": 0.19, "learning_rate": 0.00027104056446533136, "loss": 0.0224, "step": 74480 }, { "epoch": 0.19, "learning_rate": 0.0002710366762489599, "loss": 0.0221, "step": 74490 }, { "epoch": 0.19, "learning_rate": 0.0002710327880325884, "loss": 0.0256, "step": 74500 }, { "epoch": 0.19, "learning_rate": 0.00027102889981621696, "loss": 0.0215, "step": 74510 }, { "epoch": 0.19, "learning_rate": 0.0002710250115998455, "loss": 0.0243, "step": 74520 }, { "epoch": 0.19, "learning_rate": 0.000271021123383474, "loss": 0.0276, "step": 74530 }, { "epoch": 0.19, "learning_rate": 0.00027101723516710256, "loss": 0.0257, "step": 74540 }, { "epoch": 0.19, "learning_rate": 0.0002710133469507311, "loss": 0.0221, "step": 74550 }, { "epoch": 0.19, "learning_rate": 0.00027100945873435964, "loss": 0.0205, "step": 74560 }, { "epoch": 0.19, "learning_rate": 0.00027100557051798816, "loss": 0.0243, "step": 74570 }, { "epoch": 0.19, "learning_rate": 0.00027100168230161667, "loss": 0.0241, "step": 74580 }, { "epoch": 0.19, "learning_rate": 0.00027099779408524524, "loss": 0.0225, "step": 74590 }, { "epoch": 0.19, "learning_rate": 0.00027099390586887375, "loss": 0.0258, "step": 74600 }, { "epoch": 0.19, "learning_rate": 0.0002709900176525023, "loss": 0.0232, "step": 74610 }, { "epoch": 0.19, "learning_rate": 0.00027098612943613084, "loss": 0.0261, "step": 74620 }, { "epoch": 0.19, "learning_rate": 0.0002709822412197594, "loss": 0.0293, "step": 74630 }, { "epoch": 0.19, "learning_rate": 0.0002709783530033879, "loss": 0.0216, "step": 74640 }, { "epoch": 0.19, "learning_rate": 0.00027097446478701644, "loss": 0.0237, "step": 74650 }, { "epoch": 0.19, "learning_rate": 0.00027097057657064495, "loss": 0.0264, "step": 74660 }, { "epoch": 0.19, "learning_rate": 0.0002709666883542735, "loss": 0.0215, "step": 74670 }, { "epoch": 0.19, "learning_rate": 0.00027096280013790203, "loss": 0.026, "step": 74680 }, { "epoch": 0.19, "learning_rate": 0.0002709589119215306, "loss": 0.0278, "step": 74690 }, { "epoch": 0.19, "learning_rate": 0.0002709550237051591, "loss": 0.0263, "step": 74700 }, { "epoch": 0.19, "learning_rate": 0.00027095113548878763, "loss": 0.0221, "step": 74710 }, { "epoch": 0.19, "learning_rate": 0.0002709472472724162, "loss": 0.0199, "step": 74720 }, { "epoch": 0.19, "learning_rate": 0.0002709433590560447, "loss": 0.0344, "step": 74730 }, { "epoch": 0.19, "learning_rate": 0.0002709394708396733, "loss": 0.0208, "step": 74740 }, { "epoch": 0.19, "learning_rate": 0.0002709355826233018, "loss": 0.0255, "step": 74750 }, { "epoch": 0.19, "learning_rate": 0.00027093169440693037, "loss": 0.0226, "step": 74760 }, { "epoch": 0.19, "learning_rate": 0.0002709278061905589, "loss": 0.0227, "step": 74770 }, { "epoch": 0.19, "learning_rate": 0.0002709239179741874, "loss": 0.03, "step": 74780 }, { "epoch": 0.19, "learning_rate": 0.0002709200297578159, "loss": 0.0244, "step": 74790 }, { "epoch": 0.19, "learning_rate": 0.0002709161415414445, "loss": 0.024, "step": 74800 }, { "epoch": 0.19, "learning_rate": 0.000270912253325073, "loss": 0.0225, "step": 74810 }, { "epoch": 0.19, "learning_rate": 0.00027090836510870156, "loss": 0.0248, "step": 74820 }, { "epoch": 0.19, "learning_rate": 0.0002709044768923301, "loss": 0.027, "step": 74830 }, { "epoch": 0.19, "learning_rate": 0.00027090058867595864, "loss": 0.0234, "step": 74840 }, { "epoch": 0.19, "learning_rate": 0.00027089670045958716, "loss": 0.0226, "step": 74850 }, { "epoch": 0.19, "learning_rate": 0.0002708928122432157, "loss": 0.0232, "step": 74860 }, { "epoch": 0.19, "learning_rate": 0.0002708889240268442, "loss": 0.0217, "step": 74870 }, { "epoch": 0.19, "learning_rate": 0.00027088503581047276, "loss": 0.0247, "step": 74880 }, { "epoch": 0.19, "learning_rate": 0.0002708811475941013, "loss": 0.025, "step": 74890 }, { "epoch": 0.19, "learning_rate": 0.00027087725937772984, "loss": 0.0283, "step": 74900 }, { "epoch": 0.19, "learning_rate": 0.00027087337116135836, "loss": 0.0281, "step": 74910 }, { "epoch": 0.19, "learning_rate": 0.0002708694829449869, "loss": 0.0219, "step": 74920 }, { "epoch": 0.19, "learning_rate": 0.00027086559472861544, "loss": 0.0246, "step": 74930 }, { "epoch": 0.19, "learning_rate": 0.00027086170651224395, "loss": 0.0287, "step": 74940 }, { "epoch": 0.19, "learning_rate": 0.0002708578182958725, "loss": 0.0302, "step": 74950 }, { "epoch": 0.19, "learning_rate": 0.00027085393007950104, "loss": 0.0209, "step": 74960 }, { "epoch": 0.19, "learning_rate": 0.0002708500418631296, "loss": 0.0235, "step": 74970 }, { "epoch": 0.19, "learning_rate": 0.0002708461536467581, "loss": 0.0288, "step": 74980 }, { "epoch": 0.19, "learning_rate": 0.00027084226543038663, "loss": 0.0222, "step": 74990 }, { "epoch": 0.19, "learning_rate": 0.00027083837721401515, "loss": 0.0261, "step": 75000 }, { "epoch": 0.19, "eval_cer": 0.8817908634500211, "eval_loss": 0.017617717385292053, "eval_runtime": 107.5409, "eval_samples_per_second": 18.598, "eval_steps_per_second": 4.649, "step": 75000 }, { "epoch": 0.19, "learning_rate": 0.0002708344889976437, "loss": 0.0273, "step": 75010 }, { "epoch": 0.19, "learning_rate": 0.00027083060078127223, "loss": 0.0304, "step": 75020 }, { "epoch": 0.19, "learning_rate": 0.0002708267125649008, "loss": 0.0268, "step": 75030 }, { "epoch": 0.19, "learning_rate": 0.0002708228243485293, "loss": 0.0246, "step": 75040 }, { "epoch": 0.19, "learning_rate": 0.0002708189361321579, "loss": 0.0229, "step": 75050 }, { "epoch": 0.19, "learning_rate": 0.0002708150479157864, "loss": 0.0187, "step": 75060 }, { "epoch": 0.19, "learning_rate": 0.0002708111596994149, "loss": 0.021, "step": 75070 }, { "epoch": 0.19, "learning_rate": 0.00027080727148304343, "loss": 0.0253, "step": 75080 }, { "epoch": 0.19, "learning_rate": 0.000270803383266672, "loss": 0.0316, "step": 75090 }, { "epoch": 0.19, "learning_rate": 0.00027079949505030056, "loss": 0.0222, "step": 75100 }, { "epoch": 0.19, "learning_rate": 0.0002707956068339291, "loss": 0.0262, "step": 75110 }, { "epoch": 0.19, "learning_rate": 0.0002707917186175576, "loss": 0.0212, "step": 75120 }, { "epoch": 0.19, "learning_rate": 0.00027078783040118616, "loss": 0.0282, "step": 75130 }, { "epoch": 0.19, "learning_rate": 0.0002707839421848147, "loss": 0.0218, "step": 75140 }, { "epoch": 0.19, "learning_rate": 0.0002707800539684432, "loss": 0.0212, "step": 75150 }, { "epoch": 0.19, "learning_rate": 0.00027077616575207176, "loss": 0.0256, "step": 75160 }, { "epoch": 0.19, "learning_rate": 0.0002707722775357003, "loss": 0.0209, "step": 75170 }, { "epoch": 0.19, "learning_rate": 0.00027076838931932884, "loss": 0.0254, "step": 75180 }, { "epoch": 0.19, "learning_rate": 0.00027076450110295736, "loss": 0.0281, "step": 75190 }, { "epoch": 0.19, "learning_rate": 0.00027076061288658587, "loss": 0.027, "step": 75200 }, { "epoch": 0.19, "learning_rate": 0.0002707567246702144, "loss": 0.0245, "step": 75210 }, { "epoch": 0.19, "learning_rate": 0.00027075283645384296, "loss": 0.0248, "step": 75220 }, { "epoch": 0.2, "learning_rate": 0.00027074894823747147, "loss": 0.0269, "step": 75230 }, { "epoch": 0.2, "learning_rate": 0.00027074506002110004, "loss": 0.0242, "step": 75240 }, { "epoch": 0.2, "learning_rate": 0.00027074117180472855, "loss": 0.0269, "step": 75250 }, { "epoch": 0.2, "learning_rate": 0.0002707372835883571, "loss": 0.026, "step": 75260 }, { "epoch": 0.2, "learning_rate": 0.00027073339537198564, "loss": 0.0225, "step": 75270 }, { "epoch": 0.2, "learning_rate": 0.00027072950715561415, "loss": 0.0253, "step": 75280 }, { "epoch": 0.2, "learning_rate": 0.0002707256189392427, "loss": 0.0256, "step": 75290 }, { "epoch": 0.2, "learning_rate": 0.00027072173072287123, "loss": 0.0255, "step": 75300 }, { "epoch": 0.2, "learning_rate": 0.0002707178425064998, "loss": 0.0228, "step": 75310 }, { "epoch": 0.2, "learning_rate": 0.0002707139542901283, "loss": 0.026, "step": 75320 }, { "epoch": 0.2, "learning_rate": 0.00027071006607375683, "loss": 0.0263, "step": 75330 }, { "epoch": 0.2, "learning_rate": 0.0002707061778573854, "loss": 0.0239, "step": 75340 }, { "epoch": 0.2, "learning_rate": 0.0002707022896410139, "loss": 0.0314, "step": 75350 }, { "epoch": 0.2, "learning_rate": 0.00027069840142464243, "loss": 0.0213, "step": 75360 }, { "epoch": 0.2, "learning_rate": 0.000270694513208271, "loss": 0.0265, "step": 75370 }, { "epoch": 0.2, "learning_rate": 0.0002706906249918995, "loss": 0.025, "step": 75380 }, { "epoch": 0.2, "learning_rate": 0.0002706867367755281, "loss": 0.0244, "step": 75390 }, { "epoch": 0.2, "learning_rate": 0.0002706828485591566, "loss": 0.0243, "step": 75400 }, { "epoch": 0.2, "learning_rate": 0.0002706789603427851, "loss": 0.0262, "step": 75410 }, { "epoch": 0.2, "learning_rate": 0.0002706750721264137, "loss": 0.0208, "step": 75420 }, { "epoch": 0.2, "learning_rate": 0.0002706711839100422, "loss": 0.0218, "step": 75430 }, { "epoch": 0.2, "learning_rate": 0.00027066729569367076, "loss": 0.0266, "step": 75440 }, { "epoch": 0.2, "learning_rate": 0.0002706634074772993, "loss": 0.0226, "step": 75450 }, { "epoch": 0.2, "learning_rate": 0.0002706595192609278, "loss": 0.0269, "step": 75460 }, { "epoch": 0.2, "learning_rate": 0.00027065563104455636, "loss": 0.0266, "step": 75470 }, { "epoch": 0.2, "learning_rate": 0.0002706517428281849, "loss": 0.0259, "step": 75480 }, { "epoch": 0.2, "learning_rate": 0.0002706478546118134, "loss": 0.0221, "step": 75490 }, { "epoch": 0.2, "learning_rate": 0.00027064396639544196, "loss": 0.0263, "step": 75500 }, { "epoch": 0.2, "learning_rate": 0.0002706400781790705, "loss": 0.0281, "step": 75510 }, { "epoch": 0.2, "learning_rate": 0.00027063618996269904, "loss": 0.0217, "step": 75520 }, { "epoch": 0.2, "learning_rate": 0.00027063230174632756, "loss": 0.0242, "step": 75530 }, { "epoch": 0.2, "learning_rate": 0.00027062841352995607, "loss": 0.026, "step": 75540 }, { "epoch": 0.2, "learning_rate": 0.00027062452531358464, "loss": 0.0252, "step": 75550 }, { "epoch": 0.2, "learning_rate": 0.00027062063709721315, "loss": 0.0263, "step": 75560 }, { "epoch": 0.2, "learning_rate": 0.00027061674888084167, "loss": 0.021, "step": 75570 }, { "epoch": 0.2, "learning_rate": 0.00027061286066447024, "loss": 0.0246, "step": 75580 }, { "epoch": 0.2, "learning_rate": 0.0002706089724480988, "loss": 0.0261, "step": 75590 }, { "epoch": 0.2, "learning_rate": 0.0002706050842317273, "loss": 0.0371, "step": 75600 }, { "epoch": 0.2, "learning_rate": 0.00027060119601535584, "loss": 0.0294, "step": 75610 }, { "epoch": 0.2, "learning_rate": 0.00027059730779898435, "loss": 0.0215, "step": 75620 }, { "epoch": 0.2, "learning_rate": 0.0002705934195826129, "loss": 0.0237, "step": 75630 }, { "epoch": 0.2, "learning_rate": 0.00027058953136624143, "loss": 0.0228, "step": 75640 }, { "epoch": 0.2, "learning_rate": 0.00027058564314987, "loss": 0.0233, "step": 75650 }, { "epoch": 0.2, "learning_rate": 0.0002705817549334985, "loss": 0.0231, "step": 75660 }, { "epoch": 0.2, "learning_rate": 0.0002705778667171271, "loss": 0.0231, "step": 75670 }, { "epoch": 0.2, "learning_rate": 0.0002705739785007556, "loss": 0.0245, "step": 75680 }, { "epoch": 0.2, "learning_rate": 0.0002705700902843841, "loss": 0.0199, "step": 75690 }, { "epoch": 0.2, "learning_rate": 0.00027056620206801263, "loss": 0.0215, "step": 75700 }, { "epoch": 0.2, "learning_rate": 0.0002705623138516412, "loss": 0.0222, "step": 75710 }, { "epoch": 0.2, "learning_rate": 0.0002705584256352697, "loss": 0.0256, "step": 75720 }, { "epoch": 0.2, "learning_rate": 0.0002705545374188983, "loss": 0.024, "step": 75730 }, { "epoch": 0.2, "learning_rate": 0.0002705506492025268, "loss": 0.0255, "step": 75740 }, { "epoch": 0.2, "learning_rate": 0.0002705467609861553, "loss": 0.0294, "step": 75750 }, { "epoch": 0.2, "learning_rate": 0.0002705428727697839, "loss": 0.0229, "step": 75760 }, { "epoch": 0.2, "learning_rate": 0.0002705389845534124, "loss": 0.0271, "step": 75770 }, { "epoch": 0.2, "learning_rate": 0.0002705350963370409, "loss": 0.0217, "step": 75780 }, { "epoch": 0.2, "learning_rate": 0.0002705312081206695, "loss": 0.0213, "step": 75790 }, { "epoch": 0.2, "learning_rate": 0.00027052731990429805, "loss": 0.0218, "step": 75800 }, { "epoch": 0.2, "learning_rate": 0.00027052343168792656, "loss": 0.0227, "step": 75810 }, { "epoch": 0.2, "learning_rate": 0.0002705195434715551, "loss": 0.0246, "step": 75820 }, { "epoch": 0.2, "learning_rate": 0.0002705156552551836, "loss": 0.0255, "step": 75830 }, { "epoch": 0.2, "learning_rate": 0.00027051176703881216, "loss": 0.0242, "step": 75840 }, { "epoch": 0.2, "learning_rate": 0.00027050787882244067, "loss": 0.0202, "step": 75850 }, { "epoch": 0.2, "learning_rate": 0.00027050399060606924, "loss": 0.0232, "step": 75860 }, { "epoch": 0.2, "learning_rate": 0.00027050010238969776, "loss": 0.0248, "step": 75870 }, { "epoch": 0.2, "learning_rate": 0.0002704962141733263, "loss": 0.0217, "step": 75880 }, { "epoch": 0.2, "learning_rate": 0.00027049232595695484, "loss": 0.0251, "step": 75890 }, { "epoch": 0.2, "learning_rate": 0.00027048843774058335, "loss": 0.0356, "step": 75900 }, { "epoch": 0.2, "learning_rate": 0.00027048454952421187, "loss": 0.0193, "step": 75910 }, { "epoch": 0.2, "learning_rate": 0.00027048066130784044, "loss": 0.0293, "step": 75920 }, { "epoch": 0.2, "learning_rate": 0.000270476773091469, "loss": 0.0324, "step": 75930 }, { "epoch": 0.2, "learning_rate": 0.0002704728848750975, "loss": 0.0213, "step": 75940 }, { "epoch": 0.2, "learning_rate": 0.00027046899665872603, "loss": 0.0238, "step": 75950 }, { "epoch": 0.2, "learning_rate": 0.00027046510844235455, "loss": 0.025, "step": 75960 }, { "epoch": 0.2, "learning_rate": 0.0002704612202259831, "loss": 0.0213, "step": 75970 }, { "epoch": 0.2, "learning_rate": 0.00027045733200961163, "loss": 0.0241, "step": 75980 }, { "epoch": 0.2, "learning_rate": 0.0002704534437932402, "loss": 0.0274, "step": 75990 }, { "epoch": 0.2, "learning_rate": 0.0002704495555768687, "loss": 0.0284, "step": 76000 }, { "epoch": 0.2, "eval_cer": 0.8817768670806793, "eval_loss": 0.01834818534553051, "eval_runtime": 107.643, "eval_samples_per_second": 18.58, "eval_steps_per_second": 4.645, "step": 76000 }, { "epoch": 0.2, "learning_rate": 0.0002704456673604973, "loss": 0.0234, "step": 76010 }, { "epoch": 0.2, "learning_rate": 0.0002704417791441258, "loss": 0.0233, "step": 76020 }, { "epoch": 0.2, "learning_rate": 0.0002704378909277543, "loss": 0.0239, "step": 76030 }, { "epoch": 0.2, "learning_rate": 0.00027043400271138283, "loss": 0.0215, "step": 76040 }, { "epoch": 0.2, "learning_rate": 0.0002704301144950114, "loss": 0.022, "step": 76050 }, { "epoch": 0.2, "learning_rate": 0.0002704262262786399, "loss": 0.0293, "step": 76060 }, { "epoch": 0.2, "learning_rate": 0.0002704223380622685, "loss": 0.0302, "step": 76070 }, { "epoch": 0.2, "learning_rate": 0.000270418449845897, "loss": 0.0194, "step": 76080 }, { "epoch": 0.2, "learning_rate": 0.00027041456162952556, "loss": 0.0285, "step": 76090 }, { "epoch": 0.2, "learning_rate": 0.0002704106734131541, "loss": 0.0267, "step": 76100 }, { "epoch": 0.2, "learning_rate": 0.0002704067851967826, "loss": 0.0225, "step": 76110 }, { "epoch": 0.2, "learning_rate": 0.0002704028969804111, "loss": 0.0238, "step": 76120 }, { "epoch": 0.2, "learning_rate": 0.0002703990087640397, "loss": 0.0276, "step": 76130 }, { "epoch": 0.2, "learning_rate": 0.00027039512054766824, "loss": 0.0308, "step": 76140 }, { "epoch": 0.2, "learning_rate": 0.00027039123233129676, "loss": 0.0212, "step": 76150 }, { "epoch": 0.2, "learning_rate": 0.0002703873441149253, "loss": 0.0248, "step": 76160 }, { "epoch": 0.2, "learning_rate": 0.0002703834558985538, "loss": 0.0292, "step": 76170 }, { "epoch": 0.2, "learning_rate": 0.00027037956768218236, "loss": 0.023, "step": 76180 }, { "epoch": 0.2, "learning_rate": 0.00027037567946581087, "loss": 0.0233, "step": 76190 }, { "epoch": 0.2, "learning_rate": 0.00027037179124943944, "loss": 0.0208, "step": 76200 }, { "epoch": 0.2, "learning_rate": 0.00027036790303306795, "loss": 0.0249, "step": 76210 }, { "epoch": 0.2, "learning_rate": 0.0002703640148166965, "loss": 0.0288, "step": 76220 }, { "epoch": 0.2, "learning_rate": 0.00027036012660032504, "loss": 0.0227, "step": 76230 }, { "epoch": 0.2, "learning_rate": 0.00027035623838395355, "loss": 0.0211, "step": 76240 }, { "epoch": 0.2, "learning_rate": 0.00027035235016758207, "loss": 0.0218, "step": 76250 }, { "epoch": 0.2, "learning_rate": 0.00027034846195121064, "loss": 0.0211, "step": 76260 }, { "epoch": 0.2, "learning_rate": 0.00027034457373483915, "loss": 0.0323, "step": 76270 }, { "epoch": 0.2, "learning_rate": 0.0002703406855184677, "loss": 0.0256, "step": 76280 }, { "epoch": 0.2, "learning_rate": 0.00027033679730209623, "loss": 0.0237, "step": 76290 }, { "epoch": 0.2, "learning_rate": 0.0002703329090857248, "loss": 0.0209, "step": 76300 }, { "epoch": 0.2, "learning_rate": 0.0002703290208693533, "loss": 0.0264, "step": 76310 }, { "epoch": 0.2, "learning_rate": 0.00027032513265298183, "loss": 0.0264, "step": 76320 }, { "epoch": 0.2, "learning_rate": 0.0002703212444366104, "loss": 0.0307, "step": 76330 }, { "epoch": 0.2, "learning_rate": 0.0002703173562202389, "loss": 0.0252, "step": 76340 }, { "epoch": 0.2, "learning_rate": 0.0002703134680038675, "loss": 0.0228, "step": 76350 }, { "epoch": 0.2, "learning_rate": 0.000270309579787496, "loss": 0.0238, "step": 76360 }, { "epoch": 0.2, "learning_rate": 0.0002703056915711245, "loss": 0.0247, "step": 76370 }, { "epoch": 0.2, "learning_rate": 0.0002703018033547531, "loss": 0.0238, "step": 76380 }, { "epoch": 0.2, "learning_rate": 0.0002702979151383816, "loss": 0.0234, "step": 76390 }, { "epoch": 0.2, "learning_rate": 0.0002702940269220101, "loss": 0.0269, "step": 76400 }, { "epoch": 0.2, "learning_rate": 0.0002702901387056387, "loss": 0.0253, "step": 76410 }, { "epoch": 0.2, "learning_rate": 0.0002702862504892672, "loss": 0.0252, "step": 76420 }, { "epoch": 0.2, "learning_rate": 0.00027028236227289576, "loss": 0.0273, "step": 76430 }, { "epoch": 0.2, "learning_rate": 0.0002702784740565243, "loss": 0.0265, "step": 76440 }, { "epoch": 0.2, "learning_rate": 0.0002702745858401528, "loss": 0.0297, "step": 76450 }, { "epoch": 0.2, "learning_rate": 0.0002702706976237813, "loss": 0.031, "step": 76460 }, { "epoch": 0.2, "learning_rate": 0.0002702668094074099, "loss": 0.0296, "step": 76470 }, { "epoch": 0.2, "learning_rate": 0.00027026292119103844, "loss": 0.0238, "step": 76480 }, { "epoch": 0.2, "learning_rate": 0.00027025903297466696, "loss": 0.0253, "step": 76490 }, { "epoch": 0.2, "learning_rate": 0.00027025514475829547, "loss": 0.0237, "step": 76500 }, { "epoch": 0.2, "learning_rate": 0.00027025125654192404, "loss": 0.0183, "step": 76510 }, { "epoch": 0.2, "learning_rate": 0.00027024736832555256, "loss": 0.0271, "step": 76520 }, { "epoch": 0.2, "learning_rate": 0.00027024348010918107, "loss": 0.0244, "step": 76530 }, { "epoch": 0.2, "learning_rate": 0.00027023959189280964, "loss": 0.0218, "step": 76540 }, { "epoch": 0.2, "learning_rate": 0.00027023570367643815, "loss": 0.0185, "step": 76550 }, { "epoch": 0.2, "learning_rate": 0.0002702318154600667, "loss": 0.0285, "step": 76560 }, { "epoch": 0.2, "learning_rate": 0.00027022792724369524, "loss": 0.0186, "step": 76570 }, { "epoch": 0.2, "learning_rate": 0.00027022403902732375, "loss": 0.0271, "step": 76580 }, { "epoch": 0.2, "learning_rate": 0.0002702201508109523, "loss": 0.0243, "step": 76590 }, { "epoch": 0.2, "learning_rate": 0.00027021626259458083, "loss": 0.0316, "step": 76600 }, { "epoch": 0.2, "learning_rate": 0.00027021237437820935, "loss": 0.0297, "step": 76610 }, { "epoch": 0.2, "learning_rate": 0.0002702084861618379, "loss": 0.0279, "step": 76620 }, { "epoch": 0.2, "learning_rate": 0.0002702045979454665, "loss": 0.0243, "step": 76630 }, { "epoch": 0.2, "learning_rate": 0.000270200709729095, "loss": 0.0257, "step": 76640 }, { "epoch": 0.2, "learning_rate": 0.0002701968215127235, "loss": 0.0271, "step": 76650 }, { "epoch": 0.2, "learning_rate": 0.00027019293329635203, "loss": 0.0259, "step": 76660 }, { "epoch": 0.2, "learning_rate": 0.00027018904507998054, "loss": 0.0311, "step": 76670 }, { "epoch": 0.2, "learning_rate": 0.0002701851568636091, "loss": 0.034, "step": 76680 }, { "epoch": 0.2, "learning_rate": 0.0002701812686472377, "loss": 0.0346, "step": 76690 }, { "epoch": 0.2, "learning_rate": 0.0002701773804308662, "loss": 0.0285, "step": 76700 }, { "epoch": 0.2, "learning_rate": 0.0002701734922144947, "loss": 0.0245, "step": 76710 }, { "epoch": 0.2, "learning_rate": 0.0002701696039981233, "loss": 0.0274, "step": 76720 }, { "epoch": 0.2, "learning_rate": 0.0002701657157817518, "loss": 0.0248, "step": 76730 }, { "epoch": 0.2, "learning_rate": 0.0002701618275653803, "loss": 0.0272, "step": 76740 }, { "epoch": 0.2, "learning_rate": 0.0002701579393490089, "loss": 0.0239, "step": 76750 }, { "epoch": 0.2, "learning_rate": 0.0002701540511326374, "loss": 0.0291, "step": 76760 }, { "epoch": 0.2, "learning_rate": 0.00027015016291626596, "loss": 0.0234, "step": 76770 }, { "epoch": 0.2, "learning_rate": 0.0002701462746998945, "loss": 0.0256, "step": 76780 }, { "epoch": 0.2, "learning_rate": 0.000270142386483523, "loss": 0.0239, "step": 76790 }, { "epoch": 0.2, "learning_rate": 0.00027013849826715156, "loss": 0.0302, "step": 76800 }, { "epoch": 0.2, "learning_rate": 0.0002701346100507801, "loss": 0.0246, "step": 76810 }, { "epoch": 0.2, "learning_rate": 0.0002701307218344086, "loss": 0.0244, "step": 76820 }, { "epoch": 0.2, "learning_rate": 0.00027012683361803716, "loss": 0.0242, "step": 76830 }, { "epoch": 0.2, "learning_rate": 0.0002701229454016657, "loss": 0.0282, "step": 76840 }, { "epoch": 0.2, "learning_rate": 0.00027011905718529424, "loss": 0.023, "step": 76850 }, { "epoch": 0.2, "learning_rate": 0.00027011516896892275, "loss": 0.0275, "step": 76860 }, { "epoch": 0.2, "learning_rate": 0.00027011128075255127, "loss": 0.0283, "step": 76870 }, { "epoch": 0.2, "learning_rate": 0.00027010739253617984, "loss": 0.0184, "step": 76880 }, { "epoch": 0.2, "learning_rate": 0.00027010350431980835, "loss": 0.0268, "step": 76890 }, { "epoch": 0.2, "learning_rate": 0.0002700996161034369, "loss": 0.0282, "step": 76900 }, { "epoch": 0.2, "learning_rate": 0.00027009572788706544, "loss": 0.0222, "step": 76910 }, { "epoch": 0.2, "learning_rate": 0.00027009183967069395, "loss": 0.0248, "step": 76920 }, { "epoch": 0.2, "learning_rate": 0.0002700879514543225, "loss": 0.0254, "step": 76930 }, { "epoch": 0.2, "learning_rate": 0.00027008406323795103, "loss": 0.0246, "step": 76940 }, { "epoch": 0.2, "learning_rate": 0.00027008017502157955, "loss": 0.024, "step": 76950 }, { "epoch": 0.2, "learning_rate": 0.0002700762868052081, "loss": 0.0265, "step": 76960 }, { "epoch": 0.2, "learning_rate": 0.00027007239858883663, "loss": 0.0252, "step": 76970 }, { "epoch": 0.2, "learning_rate": 0.0002700685103724652, "loss": 0.0282, "step": 76980 }, { "epoch": 0.2, "learning_rate": 0.0002700646221560937, "loss": 0.0246, "step": 76990 }, { "epoch": 0.2, "learning_rate": 0.00027006073393972223, "loss": 0.028, "step": 77000 }, { "epoch": 0.2, "eval_cer": 0.8818398507427173, "eval_loss": 0.01785467006266117, "eval_runtime": 107.5617, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.648, "step": 77000 }, { "epoch": 0.2, "learning_rate": 0.0002700568457233508, "loss": 0.025, "step": 77010 }, { "epoch": 0.2, "learning_rate": 0.0002700529575069793, "loss": 0.0253, "step": 77020 }, { "epoch": 0.2, "learning_rate": 0.0002700490692906079, "loss": 0.0227, "step": 77030 }, { "epoch": 0.2, "learning_rate": 0.0002700451810742364, "loss": 0.0252, "step": 77040 }, { "epoch": 0.2, "learning_rate": 0.00027004129285786496, "loss": 0.0235, "step": 77050 }, { "epoch": 0.2, "learning_rate": 0.0002700374046414935, "loss": 0.0248, "step": 77060 }, { "epoch": 0.2, "learning_rate": 0.000270033516425122, "loss": 0.0287, "step": 77070 }, { "epoch": 0.2, "learning_rate": 0.0002700296282087505, "loss": 0.0279, "step": 77080 }, { "epoch": 0.2, "learning_rate": 0.0002700257399923791, "loss": 0.0249, "step": 77090 }, { "epoch": 0.2, "learning_rate": 0.0002700218517760076, "loss": 0.0236, "step": 77100 }, { "epoch": 0.2, "learning_rate": 0.00027001796355963616, "loss": 0.0214, "step": 77110 }, { "epoch": 0.2, "learning_rate": 0.0002700140753432647, "loss": 0.0204, "step": 77120 }, { "epoch": 0.2, "learning_rate": 0.00027001018712689324, "loss": 0.0287, "step": 77130 }, { "epoch": 0.2, "learning_rate": 0.00027000629891052176, "loss": 0.0271, "step": 77140 }, { "epoch": 0.2, "learning_rate": 0.00027000241069415027, "loss": 0.0312, "step": 77150 }, { "epoch": 0.2, "learning_rate": 0.0002699985224777788, "loss": 0.0255, "step": 77160 }, { "epoch": 0.2, "learning_rate": 0.00026999463426140736, "loss": 0.025, "step": 77170 }, { "epoch": 0.2, "learning_rate": 0.0002699907460450359, "loss": 0.0225, "step": 77180 }, { "epoch": 0.2, "learning_rate": 0.00026998685782866444, "loss": 0.0278, "step": 77190 }, { "epoch": 0.2, "learning_rate": 0.00026998296961229295, "loss": 0.0221, "step": 77200 }, { "epoch": 0.2, "learning_rate": 0.00026997908139592147, "loss": 0.0267, "step": 77210 }, { "epoch": 0.2, "learning_rate": 0.00026997519317955004, "loss": 0.0254, "step": 77220 }, { "epoch": 0.2, "learning_rate": 0.00026997130496317855, "loss": 0.0251, "step": 77230 }, { "epoch": 0.2, "learning_rate": 0.0002699674167468071, "loss": 0.0195, "step": 77240 }, { "epoch": 0.2, "learning_rate": 0.00026996352853043563, "loss": 0.0225, "step": 77250 }, { "epoch": 0.2, "learning_rate": 0.0002699596403140642, "loss": 0.032, "step": 77260 }, { "epoch": 0.2, "learning_rate": 0.0002699557520976927, "loss": 0.0241, "step": 77270 }, { "epoch": 0.2, "learning_rate": 0.00026995186388132123, "loss": 0.0248, "step": 77280 }, { "epoch": 0.2, "learning_rate": 0.00026994797566494975, "loss": 0.0246, "step": 77290 }, { "epoch": 0.2, "learning_rate": 0.0002699440874485783, "loss": 0.0283, "step": 77300 }, { "epoch": 0.2, "learning_rate": 0.00026994019923220683, "loss": 0.024, "step": 77310 }, { "epoch": 0.2, "learning_rate": 0.0002699363110158354, "loss": 0.0241, "step": 77320 }, { "epoch": 0.2, "learning_rate": 0.0002699324227994639, "loss": 0.023, "step": 77330 }, { "epoch": 0.2, "learning_rate": 0.0002699285345830925, "loss": 0.025, "step": 77340 }, { "epoch": 0.2, "learning_rate": 0.000269924646366721, "loss": 0.0244, "step": 77350 }, { "epoch": 0.2, "learning_rate": 0.0002699207581503495, "loss": 0.0269, "step": 77360 }, { "epoch": 0.2, "learning_rate": 0.000269916869933978, "loss": 0.0267, "step": 77370 }, { "epoch": 0.2, "learning_rate": 0.0002699129817176066, "loss": 0.0249, "step": 77380 }, { "epoch": 0.2, "learning_rate": 0.00026990909350123516, "loss": 0.0237, "step": 77390 }, { "epoch": 0.2, "learning_rate": 0.0002699052052848637, "loss": 0.0225, "step": 77400 }, { "epoch": 0.2, "learning_rate": 0.0002699013170684922, "loss": 0.0258, "step": 77410 }, { "epoch": 0.2, "learning_rate": 0.0002698974288521207, "loss": 0.0317, "step": 77420 }, { "epoch": 0.2, "learning_rate": 0.0002698935406357493, "loss": 0.0248, "step": 77430 }, { "epoch": 0.2, "learning_rate": 0.0002698896524193778, "loss": 0.0236, "step": 77440 }, { "epoch": 0.2, "learning_rate": 0.00026988576420300636, "loss": 0.0233, "step": 77450 }, { "epoch": 0.2, "learning_rate": 0.0002698818759866349, "loss": 0.0254, "step": 77460 }, { "epoch": 0.2, "learning_rate": 0.00026987798777026344, "loss": 0.0346, "step": 77470 }, { "epoch": 0.2, "learning_rate": 0.00026987409955389196, "loss": 0.0269, "step": 77480 }, { "epoch": 0.2, "learning_rate": 0.00026987021133752047, "loss": 0.0207, "step": 77490 }, { "epoch": 0.2, "learning_rate": 0.000269866323121149, "loss": 0.0267, "step": 77500 }, { "epoch": 0.2, "learning_rate": 0.00026986243490477755, "loss": 0.0226, "step": 77510 }, { "epoch": 0.2, "learning_rate": 0.0002698585466884061, "loss": 0.0266, "step": 77520 }, { "epoch": 0.2, "learning_rate": 0.00026985465847203464, "loss": 0.0226, "step": 77530 }, { "epoch": 0.2, "learning_rate": 0.00026985077025566315, "loss": 0.0217, "step": 77540 }, { "epoch": 0.2, "learning_rate": 0.0002698468820392917, "loss": 0.0256, "step": 77550 }, { "epoch": 0.2, "learning_rate": 0.00026984299382292024, "loss": 0.0305, "step": 77560 }, { "epoch": 0.2, "learning_rate": 0.00026983910560654875, "loss": 0.0263, "step": 77570 }, { "epoch": 0.2, "learning_rate": 0.0002698352173901773, "loss": 0.0222, "step": 77580 }, { "epoch": 0.2, "learning_rate": 0.00026983132917380583, "loss": 0.0276, "step": 77590 }, { "epoch": 0.2, "learning_rate": 0.0002698274409574344, "loss": 0.0266, "step": 77600 }, { "epoch": 0.2, "learning_rate": 0.0002698235527410629, "loss": 0.0298, "step": 77610 }, { "epoch": 0.2, "learning_rate": 0.00026981966452469143, "loss": 0.0228, "step": 77620 }, { "epoch": 0.2, "learning_rate": 0.00026981577630832, "loss": 0.0256, "step": 77630 }, { "epoch": 0.2, "learning_rate": 0.0002698118880919485, "loss": 0.0304, "step": 77640 }, { "epoch": 0.2, "learning_rate": 0.00026980799987557703, "loss": 0.0246, "step": 77650 }, { "epoch": 0.2, "learning_rate": 0.0002698041116592056, "loss": 0.0246, "step": 77660 }, { "epoch": 0.2, "learning_rate": 0.0002698002234428341, "loss": 0.0281, "step": 77670 }, { "epoch": 0.2, "learning_rate": 0.0002697963352264627, "loss": 0.0175, "step": 77680 }, { "epoch": 0.2, "learning_rate": 0.0002697924470100912, "loss": 0.0241, "step": 77690 }, { "epoch": 0.2, "learning_rate": 0.0002697885587937197, "loss": 0.0256, "step": 77700 }, { "epoch": 0.2, "learning_rate": 0.0002697846705773482, "loss": 0.0268, "step": 77710 }, { "epoch": 0.2, "learning_rate": 0.0002697807823609768, "loss": 0.029, "step": 77720 }, { "epoch": 0.2, "learning_rate": 0.00026977689414460536, "loss": 0.021, "step": 77730 }, { "epoch": 0.2, "learning_rate": 0.0002697730059282339, "loss": 0.0181, "step": 77740 }, { "epoch": 0.2, "learning_rate": 0.0002697691177118624, "loss": 0.0237, "step": 77750 }, { "epoch": 0.2, "learning_rate": 0.00026976522949549096, "loss": 0.0266, "step": 77760 }, { "epoch": 0.2, "learning_rate": 0.0002697613412791195, "loss": 0.0244, "step": 77770 }, { "epoch": 0.2, "learning_rate": 0.000269757453062748, "loss": 0.0185, "step": 77780 }, { "epoch": 0.2, "learning_rate": 0.00026975356484637656, "loss": 0.0228, "step": 77790 }, { "epoch": 0.2, "learning_rate": 0.00026974967663000507, "loss": 0.0242, "step": 77800 }, { "epoch": 0.2, "learning_rate": 0.00026974578841363364, "loss": 0.0216, "step": 77810 }, { "epoch": 0.2, "learning_rate": 0.00026974190019726216, "loss": 0.0216, "step": 77820 }, { "epoch": 0.2, "learning_rate": 0.00026973801198089067, "loss": 0.0239, "step": 77830 }, { "epoch": 0.2, "learning_rate": 0.00026973412376451924, "loss": 0.0254, "step": 77840 }, { "epoch": 0.2, "learning_rate": 0.00026973023554814775, "loss": 0.0238, "step": 77850 }, { "epoch": 0.2, "learning_rate": 0.00026972634733177627, "loss": 0.0256, "step": 77860 }, { "epoch": 0.2, "learning_rate": 0.00026972245911540484, "loss": 0.0232, "step": 77870 }, { "epoch": 0.2, "learning_rate": 0.0002697185708990334, "loss": 0.0287, "step": 77880 }, { "epoch": 0.2, "learning_rate": 0.0002697146826826619, "loss": 0.0219, "step": 77890 }, { "epoch": 0.2, "learning_rate": 0.00026971079446629043, "loss": 0.0214, "step": 77900 }, { "epoch": 0.2, "learning_rate": 0.00026970690624991895, "loss": 0.0218, "step": 77910 }, { "epoch": 0.2, "learning_rate": 0.0002697030180335475, "loss": 0.0287, "step": 77920 }, { "epoch": 0.2, "learning_rate": 0.00026969912981717603, "loss": 0.0268, "step": 77930 }, { "epoch": 0.2, "learning_rate": 0.0002696952416008046, "loss": 0.025, "step": 77940 }, { "epoch": 0.2, "learning_rate": 0.0002696913533844331, "loss": 0.0256, "step": 77950 }, { "epoch": 0.2, "learning_rate": 0.00026968746516806163, "loss": 0.0193, "step": 77960 }, { "epoch": 0.2, "learning_rate": 0.0002696835769516902, "loss": 0.0234, "step": 77970 }, { "epoch": 0.2, "learning_rate": 0.0002696796887353187, "loss": 0.0241, "step": 77980 }, { "epoch": 0.2, "learning_rate": 0.00026967580051894723, "loss": 0.0197, "step": 77990 }, { "epoch": 0.2, "learning_rate": 0.0002696719123025758, "loss": 0.0258, "step": 78000 }, { "epoch": 0.2, "eval_cer": 0.8817250805141147, "eval_loss": 0.01774117723107338, "eval_runtime": 107.8059, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 78000 }, { "epoch": 0.2, "learning_rate": 0.0002696680240862043, "loss": 0.0261, "step": 78010 }, { "epoch": 0.2, "learning_rate": 0.0002696641358698329, "loss": 0.0231, "step": 78020 }, { "epoch": 0.2, "learning_rate": 0.0002696602476534614, "loss": 0.0281, "step": 78030 }, { "epoch": 0.2, "learning_rate": 0.0002696563594370899, "loss": 0.0205, "step": 78040 }, { "epoch": 0.2, "learning_rate": 0.0002696524712207185, "loss": 0.0233, "step": 78050 }, { "epoch": 0.2, "learning_rate": 0.000269648583004347, "loss": 0.0248, "step": 78060 }, { "epoch": 0.2, "learning_rate": 0.00026964469478797556, "loss": 0.0262, "step": 78070 }, { "epoch": 0.2, "learning_rate": 0.0002696408065716041, "loss": 0.0312, "step": 78080 }, { "epoch": 0.2, "learning_rate": 0.00026963691835523264, "loss": 0.0224, "step": 78090 }, { "epoch": 0.2, "learning_rate": 0.00026963303013886116, "loss": 0.0233, "step": 78100 }, { "epoch": 0.2, "learning_rate": 0.0002696291419224897, "loss": 0.0242, "step": 78110 }, { "epoch": 0.2, "learning_rate": 0.0002696252537061182, "loss": 0.0223, "step": 78120 }, { "epoch": 0.2, "learning_rate": 0.00026962136548974676, "loss": 0.027, "step": 78130 }, { "epoch": 0.2, "learning_rate": 0.00026961747727337527, "loss": 0.024, "step": 78140 }, { "epoch": 0.2, "learning_rate": 0.00026961358905700384, "loss": 0.0219, "step": 78150 }, { "epoch": 0.2, "learning_rate": 0.00026960970084063235, "loss": 0.0213, "step": 78160 }, { "epoch": 0.2, "learning_rate": 0.00026960581262426087, "loss": 0.0249, "step": 78170 }, { "epoch": 0.2, "learning_rate": 0.00026960192440788944, "loss": 0.0232, "step": 78180 }, { "epoch": 0.2, "learning_rate": 0.00026959803619151795, "loss": 0.0221, "step": 78190 }, { "epoch": 0.2, "learning_rate": 0.00026959414797514647, "loss": 0.0252, "step": 78200 }, { "epoch": 0.2, "learning_rate": 0.00026959025975877504, "loss": 0.0314, "step": 78210 }, { "epoch": 0.2, "learning_rate": 0.0002695863715424036, "loss": 0.0235, "step": 78220 }, { "epoch": 0.2, "learning_rate": 0.0002695824833260321, "loss": 0.0234, "step": 78230 }, { "epoch": 0.2, "learning_rate": 0.00026957859510966063, "loss": 0.0224, "step": 78240 }, { "epoch": 0.2, "learning_rate": 0.00026957470689328915, "loss": 0.0231, "step": 78250 }, { "epoch": 0.2, "learning_rate": 0.0002695708186769177, "loss": 0.0229, "step": 78260 }, { "epoch": 0.2, "learning_rate": 0.00026956693046054623, "loss": 0.0235, "step": 78270 }, { "epoch": 0.2, "learning_rate": 0.0002695630422441748, "loss": 0.0225, "step": 78280 }, { "epoch": 0.2, "learning_rate": 0.0002695591540278033, "loss": 0.0276, "step": 78290 }, { "epoch": 0.2, "learning_rate": 0.0002695552658114319, "loss": 0.0275, "step": 78300 }, { "epoch": 0.2, "learning_rate": 0.0002695513775950604, "loss": 0.0263, "step": 78310 }, { "epoch": 0.2, "learning_rate": 0.0002695474893786889, "loss": 0.0213, "step": 78320 }, { "epoch": 0.2, "learning_rate": 0.0002695436011623174, "loss": 0.0244, "step": 78330 }, { "epoch": 0.2, "learning_rate": 0.000269539712945946, "loss": 0.0234, "step": 78340 }, { "epoch": 0.2, "learning_rate": 0.0002695358247295745, "loss": 0.0252, "step": 78350 }, { "epoch": 0.2, "learning_rate": 0.0002695319365132031, "loss": 0.0204, "step": 78360 }, { "epoch": 0.2, "learning_rate": 0.0002695280482968316, "loss": 0.0205, "step": 78370 }, { "epoch": 0.2, "learning_rate": 0.00026952416008046016, "loss": 0.0267, "step": 78380 }, { "epoch": 0.2, "learning_rate": 0.0002695202718640887, "loss": 0.0332, "step": 78390 }, { "epoch": 0.2, "learning_rate": 0.0002695163836477172, "loss": 0.0212, "step": 78400 }, { "epoch": 0.2, "learning_rate": 0.0002695124954313457, "loss": 0.0268, "step": 78410 }, { "epoch": 0.2, "learning_rate": 0.0002695086072149743, "loss": 0.028, "step": 78420 }, { "epoch": 0.2, "learning_rate": 0.00026950471899860284, "loss": 0.0267, "step": 78430 }, { "epoch": 0.2, "learning_rate": 0.00026950083078223136, "loss": 0.024, "step": 78440 }, { "epoch": 0.2, "learning_rate": 0.00026949694256585987, "loss": 0.0244, "step": 78450 }, { "epoch": 0.2, "learning_rate": 0.0002694930543494884, "loss": 0.0251, "step": 78460 }, { "epoch": 0.2, "learning_rate": 0.00026948916613311696, "loss": 0.0189, "step": 78470 }, { "epoch": 0.2, "learning_rate": 0.00026948527791674547, "loss": 0.0274, "step": 78480 }, { "epoch": 0.2, "learning_rate": 0.00026948138970037404, "loss": 0.0277, "step": 78490 }, { "epoch": 0.2, "learning_rate": 0.00026947750148400255, "loss": 0.0319, "step": 78500 }, { "epoch": 0.2, "learning_rate": 0.0002694736132676311, "loss": 0.0239, "step": 78510 }, { "epoch": 0.2, "learning_rate": 0.00026946972505125964, "loss": 0.0296, "step": 78520 }, { "epoch": 0.2, "learning_rate": 0.00026946583683488815, "loss": 0.0329, "step": 78530 }, { "epoch": 0.2, "learning_rate": 0.00026946194861851667, "loss": 0.0314, "step": 78540 }, { "epoch": 0.2, "learning_rate": 0.00026945806040214523, "loss": 0.0246, "step": 78550 }, { "epoch": 0.2, "learning_rate": 0.00026945417218577375, "loss": 0.0223, "step": 78560 }, { "epoch": 0.2, "learning_rate": 0.0002694502839694023, "loss": 0.0225, "step": 78570 }, { "epoch": 0.2, "learning_rate": 0.00026944639575303083, "loss": 0.0274, "step": 78580 }, { "epoch": 0.2, "learning_rate": 0.0002694425075366594, "loss": 0.0273, "step": 78590 }, { "epoch": 0.2, "learning_rate": 0.0002694386193202879, "loss": 0.0247, "step": 78600 }, { "epoch": 0.2, "learning_rate": 0.00026943473110391643, "loss": 0.0216, "step": 78610 }, { "epoch": 0.2, "learning_rate": 0.000269430842887545, "loss": 0.0239, "step": 78620 }, { "epoch": 0.2, "learning_rate": 0.0002694269546711735, "loss": 0.0266, "step": 78630 }, { "epoch": 0.2, "learning_rate": 0.0002694230664548021, "loss": 0.0243, "step": 78640 }, { "epoch": 0.2, "learning_rate": 0.0002694191782384306, "loss": 0.0271, "step": 78650 }, { "epoch": 0.2, "learning_rate": 0.0002694152900220591, "loss": 0.0225, "step": 78660 }, { "epoch": 0.2, "learning_rate": 0.0002694114018056876, "loss": 0.0286, "step": 78670 }, { "epoch": 0.2, "learning_rate": 0.0002694075135893162, "loss": 0.0242, "step": 78680 }, { "epoch": 0.2, "learning_rate": 0.0002694036253729447, "loss": 0.033, "step": 78690 }, { "epoch": 0.2, "learning_rate": 0.0002693997371565733, "loss": 0.0265, "step": 78700 }, { "epoch": 0.2, "learning_rate": 0.0002693958489402018, "loss": 0.025, "step": 78710 }, { "epoch": 0.2, "learning_rate": 0.00026939196072383036, "loss": 0.021, "step": 78720 }, { "epoch": 0.2, "learning_rate": 0.0002693880725074589, "loss": 0.0214, "step": 78730 }, { "epoch": 0.2, "learning_rate": 0.0002693841842910874, "loss": 0.0197, "step": 78740 }, { "epoch": 0.2, "learning_rate": 0.0002693802960747159, "loss": 0.0263, "step": 78750 }, { "epoch": 0.2, "learning_rate": 0.0002693764078583445, "loss": 0.0234, "step": 78760 }, { "epoch": 0.2, "learning_rate": 0.00026937251964197304, "loss": 0.025, "step": 78770 }, { "epoch": 0.2, "learning_rate": 0.00026936863142560156, "loss": 0.0254, "step": 78780 }, { "epoch": 0.2, "learning_rate": 0.00026936474320923007, "loss": 0.0284, "step": 78790 }, { "epoch": 0.2, "learning_rate": 0.00026936085499285864, "loss": 0.0228, "step": 78800 }, { "epoch": 0.2, "learning_rate": 0.00026935696677648715, "loss": 0.0291, "step": 78810 }, { "epoch": 0.2, "learning_rate": 0.00026935307856011567, "loss": 0.0255, "step": 78820 }, { "epoch": 0.2, "learning_rate": 0.00026934919034374424, "loss": 0.0222, "step": 78830 }, { "epoch": 0.2, "learning_rate": 0.00026934530212737275, "loss": 0.0222, "step": 78840 }, { "epoch": 0.2, "learning_rate": 0.0002693414139110013, "loss": 0.0233, "step": 78850 }, { "epoch": 0.2, "learning_rate": 0.00026933752569462984, "loss": 0.0219, "step": 78860 }, { "epoch": 0.2, "learning_rate": 0.00026933363747825835, "loss": 0.0258, "step": 78870 }, { "epoch": 0.2, "learning_rate": 0.0002693297492618869, "loss": 0.0276, "step": 78880 }, { "epoch": 0.2, "learning_rate": 0.00026932586104551543, "loss": 0.0231, "step": 78890 }, { "epoch": 0.2, "learning_rate": 0.00026932197282914395, "loss": 0.0262, "step": 78900 }, { "epoch": 0.2, "learning_rate": 0.0002693180846127725, "loss": 0.0211, "step": 78910 }, { "epoch": 0.2, "learning_rate": 0.00026931419639640103, "loss": 0.0238, "step": 78920 }, { "epoch": 0.2, "learning_rate": 0.0002693103081800296, "loss": 0.0312, "step": 78930 }, { "epoch": 0.2, "learning_rate": 0.0002693064199636581, "loss": 0.0219, "step": 78940 }, { "epoch": 0.2, "learning_rate": 0.00026930253174728663, "loss": 0.0204, "step": 78950 }, { "epoch": 0.2, "learning_rate": 0.00026929864353091514, "loss": 0.0251, "step": 78960 }, { "epoch": 0.2, "learning_rate": 0.0002692947553145437, "loss": 0.0263, "step": 78970 }, { "epoch": 0.2, "learning_rate": 0.0002692908670981723, "loss": 0.0219, "step": 78980 }, { "epoch": 0.2, "learning_rate": 0.0002692869788818008, "loss": 0.0273, "step": 78990 }, { "epoch": 0.2, "learning_rate": 0.0002692830906654293, "loss": 0.0241, "step": 79000 }, { "epoch": 0.2, "eval_cer": 0.8817754674437451, "eval_loss": 0.017790012061595917, "eval_runtime": 107.9618, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 79000 }, { "epoch": 0.2, "learning_rate": 0.0002692792024490579, "loss": 0.0259, "step": 79010 }, { "epoch": 0.2, "learning_rate": 0.0002692753142326864, "loss": 0.0266, "step": 79020 }, { "epoch": 0.2, "learning_rate": 0.0002692714260163149, "loss": 0.027, "step": 79030 }, { "epoch": 0.2, "learning_rate": 0.0002692675377999435, "loss": 0.0262, "step": 79040 }, { "epoch": 0.2, "learning_rate": 0.000269263649583572, "loss": 0.0243, "step": 79050 }, { "epoch": 0.2, "learning_rate": 0.00026925976136720056, "loss": 0.0239, "step": 79060 }, { "epoch": 0.2, "learning_rate": 0.0002692558731508291, "loss": 0.0233, "step": 79070 }, { "epoch": 0.2, "learning_rate": 0.0002692519849344576, "loss": 0.0212, "step": 79080 }, { "epoch": 0.21, "learning_rate": 0.00026924809671808616, "loss": 0.0258, "step": 79090 }, { "epoch": 0.21, "learning_rate": 0.00026924420850171467, "loss": 0.0214, "step": 79100 }, { "epoch": 0.21, "learning_rate": 0.00026924032028534324, "loss": 0.025, "step": 79110 }, { "epoch": 0.21, "learning_rate": 0.00026923643206897176, "loss": 0.0282, "step": 79120 }, { "epoch": 0.21, "learning_rate": 0.0002692325438526003, "loss": 0.0258, "step": 79130 }, { "epoch": 0.21, "learning_rate": 0.00026922865563622884, "loss": 0.0238, "step": 79140 }, { "epoch": 0.21, "learning_rate": 0.00026922476741985735, "loss": 0.0249, "step": 79150 }, { "epoch": 0.21, "learning_rate": 0.00026922087920348587, "loss": 0.0255, "step": 79160 }, { "epoch": 0.21, "learning_rate": 0.00026921699098711444, "loss": 0.0265, "step": 79170 }, { "epoch": 0.21, "learning_rate": 0.00026921310277074295, "loss": 0.0283, "step": 79180 }, { "epoch": 0.21, "learning_rate": 0.0002692092145543715, "loss": 0.0265, "step": 79190 }, { "epoch": 0.21, "learning_rate": 0.00026920532633800003, "loss": 0.0229, "step": 79200 }, { "epoch": 0.21, "learning_rate": 0.00026920143812162855, "loss": 0.0229, "step": 79210 }, { "epoch": 0.21, "learning_rate": 0.0002691975499052571, "loss": 0.0223, "step": 79220 }, { "epoch": 0.21, "learning_rate": 0.00026919366168888563, "loss": 0.0247, "step": 79230 }, { "epoch": 0.21, "learning_rate": 0.00026918977347251415, "loss": 0.0247, "step": 79240 }, { "epoch": 0.21, "learning_rate": 0.0002691858852561427, "loss": 0.031, "step": 79250 }, { "epoch": 0.21, "learning_rate": 0.0002691819970397713, "loss": 0.0256, "step": 79260 }, { "epoch": 0.21, "learning_rate": 0.0002691781088233998, "loss": 0.02, "step": 79270 }, { "epoch": 0.21, "learning_rate": 0.0002691742206070283, "loss": 0.0285, "step": 79280 }, { "epoch": 0.21, "learning_rate": 0.00026917033239065683, "loss": 0.0251, "step": 79290 }, { "epoch": 0.21, "learning_rate": 0.0002691664441742854, "loss": 0.0223, "step": 79300 }, { "epoch": 0.21, "learning_rate": 0.0002691625559579139, "loss": 0.0252, "step": 79310 }, { "epoch": 0.21, "learning_rate": 0.0002691586677415425, "loss": 0.0218, "step": 79320 }, { "epoch": 0.21, "learning_rate": 0.000269154779525171, "loss": 0.0254, "step": 79330 }, { "epoch": 0.21, "learning_rate": 0.00026915089130879956, "loss": 0.0257, "step": 79340 }, { "epoch": 0.21, "learning_rate": 0.0002691470030924281, "loss": 0.0242, "step": 79350 }, { "epoch": 0.21, "learning_rate": 0.0002691431148760566, "loss": 0.0252, "step": 79360 }, { "epoch": 0.21, "learning_rate": 0.0002691392266596851, "loss": 0.0261, "step": 79370 }, { "epoch": 0.21, "learning_rate": 0.0002691353384433137, "loss": 0.027, "step": 79380 }, { "epoch": 0.21, "learning_rate": 0.0002691314502269422, "loss": 0.0243, "step": 79390 }, { "epoch": 0.21, "learning_rate": 0.00026912756201057076, "loss": 0.0222, "step": 79400 }, { "epoch": 0.21, "learning_rate": 0.0002691236737941993, "loss": 0.024, "step": 79410 }, { "epoch": 0.21, "learning_rate": 0.0002691197855778278, "loss": 0.0287, "step": 79420 }, { "epoch": 0.21, "learning_rate": 0.00026911589736145636, "loss": 0.0185, "step": 79430 }, { "epoch": 0.21, "learning_rate": 0.00026911200914508487, "loss": 0.0211, "step": 79440 }, { "epoch": 0.21, "learning_rate": 0.0002691081209287134, "loss": 0.0209, "step": 79450 }, { "epoch": 0.21, "learning_rate": 0.00026910423271234195, "loss": 0.0275, "step": 79460 }, { "epoch": 0.21, "learning_rate": 0.0002691003444959705, "loss": 0.0258, "step": 79470 }, { "epoch": 0.21, "learning_rate": 0.00026909645627959904, "loss": 0.0275, "step": 79480 }, { "epoch": 0.21, "learning_rate": 0.00026909256806322755, "loss": 0.0215, "step": 79490 }, { "epoch": 0.21, "learning_rate": 0.00026908867984685607, "loss": 0.0251, "step": 79500 }, { "epoch": 0.21, "learning_rate": 0.00026908479163048464, "loss": 0.025, "step": 79510 }, { "epoch": 0.21, "learning_rate": 0.00026908090341411315, "loss": 0.0206, "step": 79520 }, { "epoch": 0.21, "learning_rate": 0.0002690770151977417, "loss": 0.0224, "step": 79530 }, { "epoch": 0.21, "learning_rate": 0.00026907312698137023, "loss": 0.0213, "step": 79540 }, { "epoch": 0.21, "learning_rate": 0.0002690692387649988, "loss": 0.021, "step": 79550 }, { "epoch": 0.21, "learning_rate": 0.0002690653505486273, "loss": 0.0197, "step": 79560 }, { "epoch": 0.21, "learning_rate": 0.00026906146233225583, "loss": 0.0188, "step": 79570 }, { "epoch": 0.21, "learning_rate": 0.00026905757411588435, "loss": 0.0249, "step": 79580 }, { "epoch": 0.21, "learning_rate": 0.0002690536858995129, "loss": 0.0222, "step": 79590 }, { "epoch": 0.21, "learning_rate": 0.00026904979768314143, "loss": 0.0225, "step": 79600 }, { "epoch": 0.21, "learning_rate": 0.00026904590946677, "loss": 0.0253, "step": 79610 }, { "epoch": 0.21, "learning_rate": 0.0002690420212503985, "loss": 0.0293, "step": 79620 }, { "epoch": 0.21, "learning_rate": 0.0002690381330340271, "loss": 0.0268, "step": 79630 }, { "epoch": 0.21, "learning_rate": 0.0002690342448176556, "loss": 0.0221, "step": 79640 }, { "epoch": 0.21, "learning_rate": 0.0002690303566012841, "loss": 0.0226, "step": 79650 }, { "epoch": 0.21, "learning_rate": 0.0002690264683849127, "loss": 0.027, "step": 79660 }, { "epoch": 0.21, "learning_rate": 0.0002690225801685412, "loss": 0.026, "step": 79670 }, { "epoch": 0.21, "learning_rate": 0.00026901869195216976, "loss": 0.0233, "step": 79680 }, { "epoch": 0.21, "learning_rate": 0.0002690148037357983, "loss": 0.0224, "step": 79690 }, { "epoch": 0.21, "learning_rate": 0.0002690109155194268, "loss": 0.0222, "step": 79700 }, { "epoch": 0.21, "learning_rate": 0.0002690070273030553, "loss": 0.0287, "step": 79710 }, { "epoch": 0.21, "learning_rate": 0.0002690031390866839, "loss": 0.0246, "step": 79720 }, { "epoch": 0.21, "learning_rate": 0.0002689992508703124, "loss": 0.0276, "step": 79730 }, { "epoch": 0.21, "learning_rate": 0.00026899536265394096, "loss": 0.0239, "step": 79740 }, { "epoch": 0.21, "learning_rate": 0.00026899147443756947, "loss": 0.0272, "step": 79750 }, { "epoch": 0.21, "learning_rate": 0.00026898758622119804, "loss": 0.023, "step": 79760 }, { "epoch": 0.21, "learning_rate": 0.00026898369800482656, "loss": 0.0254, "step": 79770 }, { "epoch": 0.21, "learning_rate": 0.00026897980978845507, "loss": 0.0278, "step": 79780 }, { "epoch": 0.21, "learning_rate": 0.0002689759215720836, "loss": 0.0205, "step": 79790 }, { "epoch": 0.21, "learning_rate": 0.00026897203335571215, "loss": 0.0228, "step": 79800 }, { "epoch": 0.21, "learning_rate": 0.0002689681451393407, "loss": 0.026, "step": 79810 }, { "epoch": 0.21, "learning_rate": 0.00026896425692296924, "loss": 0.0258, "step": 79820 }, { "epoch": 0.21, "learning_rate": 0.00026896036870659775, "loss": 0.0226, "step": 79830 }, { "epoch": 0.21, "learning_rate": 0.0002689564804902263, "loss": 0.0205, "step": 79840 }, { "epoch": 0.21, "learning_rate": 0.00026895259227385483, "loss": 0.0295, "step": 79850 }, { "epoch": 0.21, "learning_rate": 0.00026894870405748335, "loss": 0.025, "step": 79860 }, { "epoch": 0.21, "learning_rate": 0.0002689448158411119, "loss": 0.0289, "step": 79870 }, { "epoch": 0.21, "learning_rate": 0.00026894092762474043, "loss": 0.0245, "step": 79880 }, { "epoch": 0.21, "learning_rate": 0.000268937039408369, "loss": 0.0288, "step": 79890 }, { "epoch": 0.21, "learning_rate": 0.0002689331511919975, "loss": 0.0215, "step": 79900 }, { "epoch": 0.21, "learning_rate": 0.00026892926297562603, "loss": 0.0312, "step": 79910 }, { "epoch": 0.21, "learning_rate": 0.00026892537475925454, "loss": 0.0261, "step": 79920 }, { "epoch": 0.21, "learning_rate": 0.0002689214865428831, "loss": 0.0219, "step": 79930 }, { "epoch": 0.21, "learning_rate": 0.00026891759832651163, "loss": 0.0242, "step": 79940 }, { "epoch": 0.21, "learning_rate": 0.0002689137101101402, "loss": 0.0259, "step": 79950 }, { "epoch": 0.21, "learning_rate": 0.0002689098218937687, "loss": 0.0296, "step": 79960 }, { "epoch": 0.21, "learning_rate": 0.0002689059336773973, "loss": 0.0249, "step": 79970 }, { "epoch": 0.21, "learning_rate": 0.0002689020454610258, "loss": 0.0232, "step": 79980 }, { "epoch": 0.21, "learning_rate": 0.0002688981572446543, "loss": 0.0199, "step": 79990 }, { "epoch": 0.21, "learning_rate": 0.0002688942690282828, "loss": 0.0253, "step": 80000 }, { "epoch": 0.21, "eval_cer": 0.8818090587301654, "eval_loss": 0.01771540753543377, "eval_runtime": 108.1716, "eval_samples_per_second": 18.489, "eval_steps_per_second": 4.622, "step": 80000 }, { "epoch": 0.21, "learning_rate": 0.0002688903808119114, "loss": 0.0206, "step": 80010 }, { "epoch": 0.21, "learning_rate": 0.00026888649259553996, "loss": 0.0233, "step": 80020 }, { "epoch": 0.21, "learning_rate": 0.0002688826043791685, "loss": 0.0202, "step": 80030 }, { "epoch": 0.21, "learning_rate": 0.000268878716162797, "loss": 0.0244, "step": 80040 }, { "epoch": 0.21, "learning_rate": 0.00026887482794642556, "loss": 0.0195, "step": 80050 }, { "epoch": 0.21, "learning_rate": 0.0002688709397300541, "loss": 0.0162, "step": 80060 }, { "epoch": 0.21, "learning_rate": 0.0002688670515136826, "loss": 0.0295, "step": 80070 }, { "epoch": 0.21, "learning_rate": 0.00026886316329731116, "loss": 0.0213, "step": 80080 }, { "epoch": 0.21, "learning_rate": 0.00026885927508093967, "loss": 0.021, "step": 80090 }, { "epoch": 0.21, "learning_rate": 0.00026885538686456824, "loss": 0.0259, "step": 80100 }, { "epoch": 0.21, "learning_rate": 0.00026885149864819675, "loss": 0.0232, "step": 80110 }, { "epoch": 0.21, "learning_rate": 0.00026884761043182527, "loss": 0.0244, "step": 80120 }, { "epoch": 0.21, "learning_rate": 0.00026884372221545384, "loss": 0.0244, "step": 80130 }, { "epoch": 0.21, "learning_rate": 0.00026883983399908235, "loss": 0.0239, "step": 80140 }, { "epoch": 0.21, "learning_rate": 0.00026883594578271087, "loss": 0.0205, "step": 80150 }, { "epoch": 0.21, "learning_rate": 0.00026883205756633944, "loss": 0.0288, "step": 80160 }, { "epoch": 0.21, "learning_rate": 0.00026882816934996795, "loss": 0.0231, "step": 80170 }, { "epoch": 0.21, "learning_rate": 0.0002688242811335965, "loss": 0.0256, "step": 80180 }, { "epoch": 0.21, "learning_rate": 0.00026882039291722503, "loss": 0.028, "step": 80190 }, { "epoch": 0.21, "learning_rate": 0.00026881650470085355, "loss": 0.0248, "step": 80200 }, { "epoch": 0.21, "learning_rate": 0.0002688126164844821, "loss": 0.0229, "step": 80210 }, { "epoch": 0.21, "learning_rate": 0.00026880872826811063, "loss": 0.0225, "step": 80220 }, { "epoch": 0.21, "learning_rate": 0.0002688048400517392, "loss": 0.0298, "step": 80230 }, { "epoch": 0.21, "learning_rate": 0.0002688009518353677, "loss": 0.0234, "step": 80240 }, { "epoch": 0.21, "learning_rate": 0.00026879706361899623, "loss": 0.0267, "step": 80250 }, { "epoch": 0.21, "learning_rate": 0.0002687931754026248, "loss": 0.022, "step": 80260 }, { "epoch": 0.21, "learning_rate": 0.0002687892871862533, "loss": 0.0261, "step": 80270 }, { "epoch": 0.21, "learning_rate": 0.0002687853989698818, "loss": 0.0239, "step": 80280 }, { "epoch": 0.21, "learning_rate": 0.0002687815107535104, "loss": 0.0229, "step": 80290 }, { "epoch": 0.21, "learning_rate": 0.00026877762253713896, "loss": 0.0238, "step": 80300 }, { "epoch": 0.21, "learning_rate": 0.0002687737343207675, "loss": 0.0266, "step": 80310 }, { "epoch": 0.21, "learning_rate": 0.000268769846104396, "loss": 0.0316, "step": 80320 }, { "epoch": 0.21, "learning_rate": 0.0002687659578880245, "loss": 0.0255, "step": 80330 }, { "epoch": 0.21, "learning_rate": 0.0002687620696716531, "loss": 0.0261, "step": 80340 }, { "epoch": 0.21, "learning_rate": 0.0002687581814552816, "loss": 0.0289, "step": 80350 }, { "epoch": 0.21, "learning_rate": 0.00026875429323891016, "loss": 0.0235, "step": 80360 }, { "epoch": 0.21, "learning_rate": 0.0002687504050225387, "loss": 0.0204, "step": 80370 }, { "epoch": 0.21, "learning_rate": 0.00026874651680616724, "loss": 0.021, "step": 80380 }, { "epoch": 0.21, "learning_rate": 0.00026874262858979576, "loss": 0.0264, "step": 80390 }, { "epoch": 0.21, "learning_rate": 0.00026873874037342427, "loss": 0.0289, "step": 80400 }, { "epoch": 0.21, "learning_rate": 0.0002687348521570528, "loss": 0.0291, "step": 80410 }, { "epoch": 0.21, "learning_rate": 0.00026873096394068136, "loss": 0.0233, "step": 80420 }, { "epoch": 0.21, "learning_rate": 0.00026872707572430987, "loss": 0.0228, "step": 80430 }, { "epoch": 0.21, "learning_rate": 0.00026872318750793844, "loss": 0.0233, "step": 80440 }, { "epoch": 0.21, "learning_rate": 0.00026871929929156695, "loss": 0.0229, "step": 80450 }, { "epoch": 0.21, "learning_rate": 0.00026871541107519547, "loss": 0.0239, "step": 80460 }, { "epoch": 0.21, "learning_rate": 0.00026871152285882404, "loss": 0.0268, "step": 80470 }, { "epoch": 0.21, "learning_rate": 0.00026870763464245255, "loss": 0.0241, "step": 80480 }, { "epoch": 0.21, "learning_rate": 0.00026870374642608107, "loss": 0.0224, "step": 80490 }, { "epoch": 0.21, "learning_rate": 0.00026869985820970963, "loss": 0.0305, "step": 80500 }, { "epoch": 0.21, "learning_rate": 0.0002686959699933382, "loss": 0.0272, "step": 80510 }, { "epoch": 0.21, "learning_rate": 0.0002686920817769667, "loss": 0.0247, "step": 80520 }, { "epoch": 0.21, "learning_rate": 0.00026868819356059523, "loss": 0.0258, "step": 80530 }, { "epoch": 0.21, "learning_rate": 0.00026868430534422375, "loss": 0.0274, "step": 80540 }, { "epoch": 0.21, "learning_rate": 0.0002686804171278523, "loss": 0.0269, "step": 80550 }, { "epoch": 0.21, "learning_rate": 0.00026867652891148083, "loss": 0.0221, "step": 80560 }, { "epoch": 0.21, "learning_rate": 0.0002686726406951094, "loss": 0.0266, "step": 80570 }, { "epoch": 0.21, "learning_rate": 0.0002686687524787379, "loss": 0.0226, "step": 80580 }, { "epoch": 0.21, "learning_rate": 0.0002686648642623665, "loss": 0.0207, "step": 80590 }, { "epoch": 0.21, "learning_rate": 0.000268660976045995, "loss": 0.0244, "step": 80600 }, { "epoch": 0.21, "learning_rate": 0.0002686570878296235, "loss": 0.0246, "step": 80610 }, { "epoch": 0.21, "learning_rate": 0.000268653199613252, "loss": 0.0276, "step": 80620 }, { "epoch": 0.21, "learning_rate": 0.0002686493113968806, "loss": 0.0243, "step": 80630 }, { "epoch": 0.21, "learning_rate": 0.0002686454231805091, "loss": 0.0217, "step": 80640 }, { "epoch": 0.21, "learning_rate": 0.0002686415349641377, "loss": 0.0237, "step": 80650 }, { "epoch": 0.21, "learning_rate": 0.0002686376467477662, "loss": 0.0202, "step": 80660 }, { "epoch": 0.21, "learning_rate": 0.0002686337585313947, "loss": 0.0207, "step": 80670 }, { "epoch": 0.21, "learning_rate": 0.0002686298703150233, "loss": 0.021, "step": 80680 }, { "epoch": 0.21, "learning_rate": 0.0002686259820986518, "loss": 0.0253, "step": 80690 }, { "epoch": 0.21, "learning_rate": 0.00026862209388228036, "loss": 0.0223, "step": 80700 }, { "epoch": 0.21, "learning_rate": 0.00026861820566590887, "loss": 0.0203, "step": 80710 }, { "epoch": 0.21, "learning_rate": 0.00026861431744953744, "loss": 0.0216, "step": 80720 }, { "epoch": 0.21, "learning_rate": 0.00026861042923316596, "loss": 0.0259, "step": 80730 }, { "epoch": 0.21, "learning_rate": 0.00026860654101679447, "loss": 0.025, "step": 80740 }, { "epoch": 0.21, "learning_rate": 0.000268602652800423, "loss": 0.0214, "step": 80750 }, { "epoch": 0.21, "learning_rate": 0.00026859876458405155, "loss": 0.0232, "step": 80760 }, { "epoch": 0.21, "learning_rate": 0.00026859487636768007, "loss": 0.0255, "step": 80770 }, { "epoch": 0.21, "learning_rate": 0.00026859098815130864, "loss": 0.0276, "step": 80780 }, { "epoch": 0.21, "learning_rate": 0.00026858709993493715, "loss": 0.026, "step": 80790 }, { "epoch": 0.21, "learning_rate": 0.0002685832117185657, "loss": 0.0273, "step": 80800 }, { "epoch": 0.21, "learning_rate": 0.00026857932350219424, "loss": 0.0227, "step": 80810 }, { "epoch": 0.21, "learning_rate": 0.00026857543528582275, "loss": 0.0215, "step": 80820 }, { "epoch": 0.21, "learning_rate": 0.00026857154706945126, "loss": 0.025, "step": 80830 }, { "epoch": 0.21, "learning_rate": 0.00026856765885307983, "loss": 0.0265, "step": 80840 }, { "epoch": 0.21, "learning_rate": 0.0002685637706367084, "loss": 0.0239, "step": 80850 }, { "epoch": 0.21, "learning_rate": 0.0002685598824203369, "loss": 0.0307, "step": 80860 }, { "epoch": 0.21, "learning_rate": 0.00026855599420396543, "loss": 0.0375, "step": 80870 }, { "epoch": 0.21, "learning_rate": 0.000268552105987594, "loss": 0.0256, "step": 80880 }, { "epoch": 0.21, "learning_rate": 0.0002685482177712225, "loss": 0.0243, "step": 80890 }, { "epoch": 0.21, "learning_rate": 0.00026854432955485103, "loss": 0.0195, "step": 80900 }, { "epoch": 0.21, "learning_rate": 0.0002685404413384796, "loss": 0.0251, "step": 80910 }, { "epoch": 0.21, "learning_rate": 0.0002685365531221081, "loss": 0.0241, "step": 80920 }, { "epoch": 0.21, "learning_rate": 0.0002685326649057367, "loss": 0.0263, "step": 80930 }, { "epoch": 0.21, "learning_rate": 0.0002685287766893652, "loss": 0.0248, "step": 80940 }, { "epoch": 0.21, "learning_rate": 0.0002685248884729937, "loss": 0.0218, "step": 80950 }, { "epoch": 0.21, "learning_rate": 0.0002685210002566222, "loss": 0.0239, "step": 80960 }, { "epoch": 0.21, "learning_rate": 0.0002685171120402508, "loss": 0.0267, "step": 80970 }, { "epoch": 0.21, "learning_rate": 0.0002685132238238793, "loss": 0.0225, "step": 80980 }, { "epoch": 0.21, "learning_rate": 0.0002685093356075079, "loss": 0.0234, "step": 80990 }, { "epoch": 0.21, "learning_rate": 0.0002685054473911364, "loss": 0.0252, "step": 81000 }, { "epoch": 0.21, "eval_cer": 0.8817964619977577, "eval_loss": 0.017585597932338715, "eval_runtime": 107.7913, "eval_samples_per_second": 18.554, "eval_steps_per_second": 4.639, "step": 81000 }, { "epoch": 0.21, "learning_rate": 0.00026850155917476496, "loss": 0.0256, "step": 81010 }, { "epoch": 0.21, "learning_rate": 0.0002684976709583935, "loss": 0.021, "step": 81020 }, { "epoch": 0.21, "learning_rate": 0.000268493782742022, "loss": 0.0247, "step": 81030 }, { "epoch": 0.21, "learning_rate": 0.0002684898945256505, "loss": 0.0239, "step": 81040 }, { "epoch": 0.21, "learning_rate": 0.00026848600630927907, "loss": 0.0215, "step": 81050 }, { "epoch": 0.21, "learning_rate": 0.00026848211809290764, "loss": 0.0254, "step": 81060 }, { "epoch": 0.21, "learning_rate": 0.00026847822987653615, "loss": 0.0208, "step": 81070 }, { "epoch": 0.21, "learning_rate": 0.00026847434166016467, "loss": 0.0251, "step": 81080 }, { "epoch": 0.21, "learning_rate": 0.00026847045344379324, "loss": 0.0246, "step": 81090 }, { "epoch": 0.21, "learning_rate": 0.00026846656522742175, "loss": 0.0216, "step": 81100 }, { "epoch": 0.21, "learning_rate": 0.00026846267701105027, "loss": 0.0236, "step": 81110 }, { "epoch": 0.21, "learning_rate": 0.00026845878879467884, "loss": 0.0222, "step": 81120 }, { "epoch": 0.21, "learning_rate": 0.00026845490057830735, "loss": 0.0254, "step": 81130 }, { "epoch": 0.21, "learning_rate": 0.0002684510123619359, "loss": 0.0267, "step": 81140 }, { "epoch": 0.21, "learning_rate": 0.00026844712414556443, "loss": 0.0208, "step": 81150 }, { "epoch": 0.21, "learning_rate": 0.00026844323592919295, "loss": 0.0276, "step": 81160 }, { "epoch": 0.21, "learning_rate": 0.00026843934771282146, "loss": 0.0233, "step": 81170 }, { "epoch": 0.21, "learning_rate": 0.00026843545949645003, "loss": 0.0253, "step": 81180 }, { "epoch": 0.21, "learning_rate": 0.00026843157128007855, "loss": 0.0213, "step": 81190 }, { "epoch": 0.21, "learning_rate": 0.0002684276830637071, "loss": 0.0192, "step": 81200 }, { "epoch": 0.21, "learning_rate": 0.00026842379484733563, "loss": 0.0233, "step": 81210 }, { "epoch": 0.21, "learning_rate": 0.0002684199066309642, "loss": 0.0222, "step": 81220 }, { "epoch": 0.21, "learning_rate": 0.0002684160184145927, "loss": 0.0248, "step": 81230 }, { "epoch": 0.21, "learning_rate": 0.00026841213019822123, "loss": 0.024, "step": 81240 }, { "epoch": 0.21, "learning_rate": 0.0002684082419818498, "loss": 0.0213, "step": 81250 }, { "epoch": 0.21, "learning_rate": 0.0002684043537654783, "loss": 0.0247, "step": 81260 }, { "epoch": 0.21, "learning_rate": 0.0002684004655491069, "loss": 0.0267, "step": 81270 }, { "epoch": 0.21, "learning_rate": 0.0002683965773327354, "loss": 0.027, "step": 81280 }, { "epoch": 0.21, "learning_rate": 0.0002683926891163639, "loss": 0.0223, "step": 81290 }, { "epoch": 0.21, "learning_rate": 0.0002683888008999925, "loss": 0.0214, "step": 81300 }, { "epoch": 0.21, "learning_rate": 0.000268384912683621, "loss": 0.0241, "step": 81310 }, { "epoch": 0.21, "learning_rate": 0.0002683810244672495, "loss": 0.0242, "step": 81320 }, { "epoch": 0.21, "learning_rate": 0.0002683771362508781, "loss": 0.024, "step": 81330 }, { "epoch": 0.21, "learning_rate": 0.0002683732480345066, "loss": 0.0239, "step": 81340 }, { "epoch": 0.21, "learning_rate": 0.00026836935981813516, "loss": 0.0229, "step": 81350 }, { "epoch": 0.21, "learning_rate": 0.00026836547160176367, "loss": 0.0264, "step": 81360 }, { "epoch": 0.21, "learning_rate": 0.0002683615833853922, "loss": 0.0273, "step": 81370 }, { "epoch": 0.21, "learning_rate": 0.0002683576951690207, "loss": 0.0276, "step": 81380 }, { "epoch": 0.21, "learning_rate": 0.00026835380695264927, "loss": 0.0302, "step": 81390 }, { "epoch": 0.21, "learning_rate": 0.00026834991873627784, "loss": 0.0264, "step": 81400 }, { "epoch": 0.21, "learning_rate": 0.00026834603051990635, "loss": 0.0287, "step": 81410 }, { "epoch": 0.21, "learning_rate": 0.00026834214230353487, "loss": 0.0202, "step": 81420 }, { "epoch": 0.21, "learning_rate": 0.00026833825408716344, "loss": 0.022, "step": 81430 }, { "epoch": 0.21, "learning_rate": 0.00026833436587079195, "loss": 0.0267, "step": 81440 }, { "epoch": 0.21, "learning_rate": 0.00026833047765442047, "loss": 0.0245, "step": 81450 }, { "epoch": 0.21, "learning_rate": 0.00026832658943804903, "loss": 0.0255, "step": 81460 }, { "epoch": 0.21, "learning_rate": 0.00026832270122167755, "loss": 0.0183, "step": 81470 }, { "epoch": 0.21, "learning_rate": 0.0002683188130053061, "loss": 0.0253, "step": 81480 }, { "epoch": 0.21, "learning_rate": 0.00026831492478893463, "loss": 0.0228, "step": 81490 }, { "epoch": 0.21, "learning_rate": 0.00026831103657256315, "loss": 0.0243, "step": 81500 }, { "epoch": 0.21, "learning_rate": 0.0002683071483561917, "loss": 0.0286, "step": 81510 }, { "epoch": 0.21, "learning_rate": 0.00026830326013982023, "loss": 0.023, "step": 81520 }, { "epoch": 0.21, "learning_rate": 0.00026829937192344875, "loss": 0.0234, "step": 81530 }, { "epoch": 0.21, "learning_rate": 0.0002682954837070773, "loss": 0.0261, "step": 81540 }, { "epoch": 0.21, "learning_rate": 0.0002682915954907059, "loss": 0.0257, "step": 81550 }, { "epoch": 0.21, "learning_rate": 0.0002682877072743344, "loss": 0.0252, "step": 81560 }, { "epoch": 0.21, "learning_rate": 0.0002682838190579629, "loss": 0.0249, "step": 81570 }, { "epoch": 0.21, "learning_rate": 0.0002682799308415914, "loss": 0.0251, "step": 81580 }, { "epoch": 0.21, "learning_rate": 0.00026827604262522, "loss": 0.0195, "step": 81590 }, { "epoch": 0.21, "learning_rate": 0.0002682721544088485, "loss": 0.0234, "step": 81600 }, { "epoch": 0.21, "learning_rate": 0.0002682682661924771, "loss": 0.0253, "step": 81610 }, { "epoch": 0.21, "learning_rate": 0.0002682643779761056, "loss": 0.0239, "step": 81620 }, { "epoch": 0.21, "learning_rate": 0.0002682604897597341, "loss": 0.0254, "step": 81630 }, { "epoch": 0.21, "learning_rate": 0.0002682566015433627, "loss": 0.0237, "step": 81640 }, { "epoch": 0.21, "learning_rate": 0.0002682527133269912, "loss": 0.0226, "step": 81650 }, { "epoch": 0.21, "learning_rate": 0.0002682488251106197, "loss": 0.0201, "step": 81660 }, { "epoch": 0.21, "learning_rate": 0.0002682449368942483, "loss": 0.0238, "step": 81670 }, { "epoch": 0.21, "learning_rate": 0.0002682410486778768, "loss": 0.0276, "step": 81680 }, { "epoch": 0.21, "learning_rate": 0.00026823716046150536, "loss": 0.0334, "step": 81690 }, { "epoch": 0.21, "learning_rate": 0.00026823327224513387, "loss": 0.0405, "step": 81700 }, { "epoch": 0.21, "learning_rate": 0.0002682293840287624, "loss": 0.053, "step": 81710 }, { "epoch": 0.21, "learning_rate": 0.00026822549581239095, "loss": 0.0338, "step": 81720 }, { "epoch": 0.21, "learning_rate": 0.00026822160759601947, "loss": 0.0381, "step": 81730 }, { "epoch": 0.21, "learning_rate": 0.000268217719379648, "loss": 0.0248, "step": 81740 }, { "epoch": 0.21, "learning_rate": 0.00026821383116327655, "loss": 0.0251, "step": 81750 }, { "epoch": 0.21, "learning_rate": 0.0002682099429469051, "loss": 0.0318, "step": 81760 }, { "epoch": 0.21, "learning_rate": 0.00026820605473053364, "loss": 0.0243, "step": 81770 }, { "epoch": 0.21, "learning_rate": 0.00026820216651416215, "loss": 0.0267, "step": 81780 }, { "epoch": 0.21, "learning_rate": 0.00026819827829779066, "loss": 0.0327, "step": 81790 }, { "epoch": 0.21, "learning_rate": 0.00026819439008141923, "loss": 0.0303, "step": 81800 }, { "epoch": 0.21, "learning_rate": 0.00026819050186504775, "loss": 0.0281, "step": 81810 }, { "epoch": 0.21, "learning_rate": 0.0002681866136486763, "loss": 0.0204, "step": 81820 }, { "epoch": 0.21, "learning_rate": 0.00026818272543230483, "loss": 0.0226, "step": 81830 }, { "epoch": 0.21, "learning_rate": 0.0002681788372159334, "loss": 0.0277, "step": 81840 }, { "epoch": 0.21, "learning_rate": 0.0002681749489995619, "loss": 0.0238, "step": 81850 }, { "epoch": 0.21, "learning_rate": 0.00026817106078319043, "loss": 0.0246, "step": 81860 }, { "epoch": 0.21, "learning_rate": 0.00026816717256681894, "loss": 0.0247, "step": 81870 }, { "epoch": 0.21, "learning_rate": 0.0002681632843504475, "loss": 0.0205, "step": 81880 }, { "epoch": 0.21, "learning_rate": 0.0002681593961340761, "loss": 0.0256, "step": 81890 }, { "epoch": 0.21, "learning_rate": 0.0002681555079177046, "loss": 0.0251, "step": 81900 }, { "epoch": 0.21, "learning_rate": 0.0002681516197013331, "loss": 0.0245, "step": 81910 }, { "epoch": 0.21, "learning_rate": 0.0002681477314849616, "loss": 0.0272, "step": 81920 }, { "epoch": 0.21, "learning_rate": 0.0002681438432685902, "loss": 0.0229, "step": 81930 }, { "epoch": 0.21, "learning_rate": 0.0002681399550522187, "loss": 0.0256, "step": 81940 }, { "epoch": 0.21, "learning_rate": 0.0002681360668358473, "loss": 0.022, "step": 81950 }, { "epoch": 0.21, "learning_rate": 0.0002681321786194758, "loss": 0.0225, "step": 81960 }, { "epoch": 0.21, "learning_rate": 0.00026812829040310436, "loss": 0.0209, "step": 81970 }, { "epoch": 0.21, "learning_rate": 0.0002681244021867329, "loss": 0.0273, "step": 81980 }, { "epoch": 0.21, "learning_rate": 0.0002681205139703614, "loss": 0.0267, "step": 81990 }, { "epoch": 0.21, "learning_rate": 0.0002681166257539899, "loss": 0.0225, "step": 82000 }, { "epoch": 0.21, "eval_cer": 0.8817264801510488, "eval_loss": 0.017370792105793953, "eval_runtime": 108.1353, "eval_samples_per_second": 18.495, "eval_steps_per_second": 4.624, "step": 82000 }, { "epoch": 0.21, "learning_rate": 0.00026811273753761847, "loss": 0.0232, "step": 82010 }, { "epoch": 0.21, "learning_rate": 0.000268108849321247, "loss": 0.0268, "step": 82020 }, { "epoch": 0.21, "learning_rate": 0.00026810496110487556, "loss": 0.0222, "step": 82030 }, { "epoch": 0.21, "learning_rate": 0.00026810107288850407, "loss": 0.0364, "step": 82040 }, { "epoch": 0.21, "learning_rate": 0.00026809718467213264, "loss": 0.0216, "step": 82050 }, { "epoch": 0.21, "learning_rate": 0.00026809329645576115, "loss": 0.0272, "step": 82060 }, { "epoch": 0.21, "learning_rate": 0.00026808940823938967, "loss": 0.0251, "step": 82070 }, { "epoch": 0.21, "learning_rate": 0.0002680855200230182, "loss": 0.0244, "step": 82080 }, { "epoch": 0.21, "learning_rate": 0.00026808163180664675, "loss": 0.0249, "step": 82090 }, { "epoch": 0.21, "learning_rate": 0.0002680777435902753, "loss": 0.024, "step": 82100 }, { "epoch": 0.21, "learning_rate": 0.00026807385537390383, "loss": 0.0209, "step": 82110 }, { "epoch": 0.21, "learning_rate": 0.00026806996715753235, "loss": 0.0302, "step": 82120 }, { "epoch": 0.21, "learning_rate": 0.00026806607894116086, "loss": 0.028, "step": 82130 }, { "epoch": 0.21, "learning_rate": 0.00026806219072478943, "loss": 0.0233, "step": 82140 }, { "epoch": 0.21, "learning_rate": 0.00026805830250841795, "loss": 0.0238, "step": 82150 }, { "epoch": 0.21, "learning_rate": 0.0002680544142920465, "loss": 0.0252, "step": 82160 }, { "epoch": 0.21, "learning_rate": 0.00026805052607567503, "loss": 0.0247, "step": 82170 }, { "epoch": 0.21, "learning_rate": 0.0002680466378593036, "loss": 0.0246, "step": 82180 }, { "epoch": 0.21, "learning_rate": 0.0002680427496429321, "loss": 0.0252, "step": 82190 }, { "epoch": 0.21, "learning_rate": 0.00026803886142656063, "loss": 0.0223, "step": 82200 }, { "epoch": 0.21, "learning_rate": 0.00026803497321018914, "loss": 0.0213, "step": 82210 }, { "epoch": 0.21, "learning_rate": 0.0002680310849938177, "loss": 0.0224, "step": 82220 }, { "epoch": 0.21, "learning_rate": 0.0002680271967774462, "loss": 0.0222, "step": 82230 }, { "epoch": 0.21, "learning_rate": 0.0002680233085610748, "loss": 0.0258, "step": 82240 }, { "epoch": 0.21, "learning_rate": 0.0002680194203447033, "loss": 0.0231, "step": 82250 }, { "epoch": 0.21, "learning_rate": 0.0002680155321283319, "loss": 0.0266, "step": 82260 }, { "epoch": 0.21, "learning_rate": 0.0002680116439119604, "loss": 0.0216, "step": 82270 }, { "epoch": 0.21, "learning_rate": 0.0002680077556955889, "loss": 0.024, "step": 82280 }, { "epoch": 0.21, "learning_rate": 0.0002680038674792175, "loss": 0.0274, "step": 82290 }, { "epoch": 0.21, "learning_rate": 0.000267999979262846, "loss": 0.0234, "step": 82300 }, { "epoch": 0.21, "learning_rate": 0.00026799609104647456, "loss": 0.0218, "step": 82310 }, { "epoch": 0.21, "learning_rate": 0.0002679922028301031, "loss": 0.0206, "step": 82320 }, { "epoch": 0.21, "learning_rate": 0.0002679883146137316, "loss": 0.0179, "step": 82330 }, { "epoch": 0.21, "learning_rate": 0.00026798442639736016, "loss": 0.0233, "step": 82340 }, { "epoch": 0.21, "learning_rate": 0.00026798053818098867, "loss": 0.0247, "step": 82350 }, { "epoch": 0.21, "learning_rate": 0.0002679766499646172, "loss": 0.0311, "step": 82360 }, { "epoch": 0.21, "learning_rate": 0.00026797276174824575, "loss": 0.0234, "step": 82370 }, { "epoch": 0.21, "learning_rate": 0.00026796887353187427, "loss": 0.0249, "step": 82380 }, { "epoch": 0.21, "learning_rate": 0.00026796498531550284, "loss": 0.0234, "step": 82390 }, { "epoch": 0.21, "learning_rate": 0.00026796109709913135, "loss": 0.026, "step": 82400 }, { "epoch": 0.21, "learning_rate": 0.00026795720888275987, "loss": 0.0307, "step": 82410 }, { "epoch": 0.21, "learning_rate": 0.0002679533206663884, "loss": 0.029, "step": 82420 }, { "epoch": 0.21, "learning_rate": 0.00026794943245001695, "loss": 0.0259, "step": 82430 }, { "epoch": 0.21, "learning_rate": 0.0002679455442336455, "loss": 0.0244, "step": 82440 }, { "epoch": 0.21, "learning_rate": 0.00026794165601727403, "loss": 0.0216, "step": 82450 }, { "epoch": 0.21, "learning_rate": 0.00026793776780090255, "loss": 0.0268, "step": 82460 }, { "epoch": 0.21, "learning_rate": 0.0002679338795845311, "loss": 0.0214, "step": 82470 }, { "epoch": 0.21, "learning_rate": 0.00026792999136815963, "loss": 0.021, "step": 82480 }, { "epoch": 0.21, "learning_rate": 0.00026792610315178815, "loss": 0.0217, "step": 82490 }, { "epoch": 0.21, "learning_rate": 0.0002679222149354167, "loss": 0.0223, "step": 82500 }, { "epoch": 0.21, "learning_rate": 0.00026791832671904523, "loss": 0.0261, "step": 82510 }, { "epoch": 0.21, "learning_rate": 0.0002679144385026738, "loss": 0.023, "step": 82520 }, { "epoch": 0.21, "learning_rate": 0.0002679105502863023, "loss": 0.0281, "step": 82530 }, { "epoch": 0.21, "learning_rate": 0.0002679066620699308, "loss": 0.0275, "step": 82540 }, { "epoch": 0.21, "learning_rate": 0.0002679027738535594, "loss": 0.0303, "step": 82550 }, { "epoch": 0.21, "learning_rate": 0.0002678988856371879, "loss": 0.0251, "step": 82560 }, { "epoch": 0.21, "learning_rate": 0.0002678949974208164, "loss": 0.0245, "step": 82570 }, { "epoch": 0.21, "learning_rate": 0.000267891109204445, "loss": 0.0239, "step": 82580 }, { "epoch": 0.21, "learning_rate": 0.00026788722098807356, "loss": 0.0248, "step": 82590 }, { "epoch": 0.21, "learning_rate": 0.0002678833327717021, "loss": 0.0245, "step": 82600 }, { "epoch": 0.21, "learning_rate": 0.0002678794445553306, "loss": 0.025, "step": 82610 }, { "epoch": 0.21, "learning_rate": 0.0002678755563389591, "loss": 0.025, "step": 82620 }, { "epoch": 0.21, "learning_rate": 0.0002678716681225876, "loss": 0.0234, "step": 82630 }, { "epoch": 0.21, "learning_rate": 0.0002678677799062162, "loss": 0.0258, "step": 82640 }, { "epoch": 0.21, "learning_rate": 0.00026786389168984476, "loss": 0.0279, "step": 82650 }, { "epoch": 0.21, "learning_rate": 0.00026786000347347327, "loss": 0.0216, "step": 82660 }, { "epoch": 0.21, "learning_rate": 0.0002678561152571018, "loss": 0.0217, "step": 82670 }, { "epoch": 0.21, "learning_rate": 0.00026785222704073036, "loss": 0.0248, "step": 82680 }, { "epoch": 0.21, "learning_rate": 0.00026784833882435887, "loss": 0.0234, "step": 82690 }, { "epoch": 0.21, "learning_rate": 0.0002678444506079874, "loss": 0.0258, "step": 82700 }, { "epoch": 0.21, "learning_rate": 0.00026784056239161595, "loss": 0.0237, "step": 82710 }, { "epoch": 0.21, "learning_rate": 0.00026783667417524447, "loss": 0.0189, "step": 82720 }, { "epoch": 0.21, "learning_rate": 0.00026783278595887304, "loss": 0.024, "step": 82730 }, { "epoch": 0.21, "learning_rate": 0.00026782889774250155, "loss": 0.0214, "step": 82740 }, { "epoch": 0.21, "learning_rate": 0.00026782500952613007, "loss": 0.0244, "step": 82750 }, { "epoch": 0.21, "learning_rate": 0.00026782112130975863, "loss": 0.0249, "step": 82760 }, { "epoch": 0.21, "learning_rate": 0.00026781723309338715, "loss": 0.0243, "step": 82770 }, { "epoch": 0.21, "learning_rate": 0.00026781334487701566, "loss": 0.022, "step": 82780 }, { "epoch": 0.21, "learning_rate": 0.00026780945666064423, "loss": 0.0192, "step": 82790 }, { "epoch": 0.21, "learning_rate": 0.0002678055684442728, "loss": 0.0182, "step": 82800 }, { "epoch": 0.21, "learning_rate": 0.0002678016802279013, "loss": 0.0244, "step": 82810 }, { "epoch": 0.21, "learning_rate": 0.00026779779201152983, "loss": 0.0276, "step": 82820 }, { "epoch": 0.21, "learning_rate": 0.00026779390379515834, "loss": 0.0227, "step": 82830 }, { "epoch": 0.21, "learning_rate": 0.0002677900155787869, "loss": 0.0231, "step": 82840 }, { "epoch": 0.21, "learning_rate": 0.00026778612736241543, "loss": 0.023, "step": 82850 }, { "epoch": 0.21, "learning_rate": 0.000267782239146044, "loss": 0.0219, "step": 82860 }, { "epoch": 0.21, "learning_rate": 0.0002677783509296725, "loss": 0.0242, "step": 82870 }, { "epoch": 0.21, "learning_rate": 0.000267774462713301, "loss": 0.0256, "step": 82880 }, { "epoch": 0.21, "learning_rate": 0.0002677705744969296, "loss": 0.0262, "step": 82890 }, { "epoch": 0.21, "learning_rate": 0.0002677666862805581, "loss": 0.0232, "step": 82900 }, { "epoch": 0.21, "learning_rate": 0.0002677627980641866, "loss": 0.0279, "step": 82910 }, { "epoch": 0.21, "learning_rate": 0.0002677589098478152, "loss": 0.0253, "step": 82920 }, { "epoch": 0.21, "learning_rate": 0.0002677550216314437, "loss": 0.0207, "step": 82930 }, { "epoch": 0.21, "learning_rate": 0.0002677511334150723, "loss": 0.0234, "step": 82940 }, { "epoch": 0.22, "learning_rate": 0.0002677472451987008, "loss": 0.0211, "step": 82950 }, { "epoch": 0.22, "learning_rate": 0.0002677433569823293, "loss": 0.0269, "step": 82960 }, { "epoch": 0.22, "learning_rate": 0.0002677394687659579, "loss": 0.0197, "step": 82970 }, { "epoch": 0.22, "learning_rate": 0.0002677355805495864, "loss": 0.0216, "step": 82980 }, { "epoch": 0.22, "learning_rate": 0.00026773169233321496, "loss": 0.0202, "step": 82990 }, { "epoch": 0.22, "learning_rate": 0.00026772780411684347, "loss": 0.0236, "step": 83000 }, { "epoch": 0.22, "eval_cer": 0.881797861634692, "eval_loss": 0.017287341877818108, "eval_runtime": 108.0739, "eval_samples_per_second": 18.506, "eval_steps_per_second": 4.626, "step": 83000 }, { "epoch": 0.22, "learning_rate": 0.00026772391590047204, "loss": 0.0273, "step": 83010 }, { "epoch": 0.22, "learning_rate": 0.00026772002768410055, "loss": 0.0227, "step": 83020 }, { "epoch": 0.22, "learning_rate": 0.00026771613946772907, "loss": 0.0252, "step": 83030 }, { "epoch": 0.22, "learning_rate": 0.0002677122512513576, "loss": 0.0159, "step": 83040 }, { "epoch": 0.22, "learning_rate": 0.00026770836303498615, "loss": 0.0257, "step": 83050 }, { "epoch": 0.22, "learning_rate": 0.00026770447481861467, "loss": 0.0197, "step": 83060 }, { "epoch": 0.22, "learning_rate": 0.00026770058660224324, "loss": 0.0199, "step": 83070 }, { "epoch": 0.22, "learning_rate": 0.00026769669838587175, "loss": 0.0243, "step": 83080 }, { "epoch": 0.22, "learning_rate": 0.0002676928101695003, "loss": 0.0239, "step": 83090 }, { "epoch": 0.22, "learning_rate": 0.00026768892195312883, "loss": 0.0248, "step": 83100 }, { "epoch": 0.22, "learning_rate": 0.00026768503373675735, "loss": 0.0243, "step": 83110 }, { "epoch": 0.22, "learning_rate": 0.00026768114552038586, "loss": 0.0253, "step": 83120 }, { "epoch": 0.22, "learning_rate": 0.00026767725730401443, "loss": 0.0228, "step": 83130 }, { "epoch": 0.22, "learning_rate": 0.000267673369087643, "loss": 0.023, "step": 83140 }, { "epoch": 0.22, "learning_rate": 0.0002676694808712715, "loss": 0.0217, "step": 83150 }, { "epoch": 0.22, "learning_rate": 0.00026766559265490003, "loss": 0.025, "step": 83160 }, { "epoch": 0.22, "learning_rate": 0.00026766170443852854, "loss": 0.024, "step": 83170 }, { "epoch": 0.22, "learning_rate": 0.0002676578162221571, "loss": 0.0237, "step": 83180 }, { "epoch": 0.22, "learning_rate": 0.0002676539280057856, "loss": 0.0236, "step": 83190 }, { "epoch": 0.22, "learning_rate": 0.0002676500397894142, "loss": 0.0214, "step": 83200 }, { "epoch": 0.22, "learning_rate": 0.0002676461515730427, "loss": 0.0226, "step": 83210 }, { "epoch": 0.22, "learning_rate": 0.0002676422633566713, "loss": 0.0259, "step": 83220 }, { "epoch": 0.22, "learning_rate": 0.0002676383751402998, "loss": 0.0232, "step": 83230 }, { "epoch": 0.22, "learning_rate": 0.0002676344869239283, "loss": 0.0196, "step": 83240 }, { "epoch": 0.22, "learning_rate": 0.0002676305987075568, "loss": 0.0255, "step": 83250 }, { "epoch": 0.22, "learning_rate": 0.0002676267104911854, "loss": 0.0233, "step": 83260 }, { "epoch": 0.22, "learning_rate": 0.0002676228222748139, "loss": 0.0232, "step": 83270 }, { "epoch": 0.22, "learning_rate": 0.0002676189340584425, "loss": 0.0239, "step": 83280 }, { "epoch": 0.22, "learning_rate": 0.000267615045842071, "loss": 0.0239, "step": 83290 }, { "epoch": 0.22, "learning_rate": 0.00026761115762569956, "loss": 0.0247, "step": 83300 }, { "epoch": 0.22, "learning_rate": 0.00026760726940932807, "loss": 0.0216, "step": 83310 }, { "epoch": 0.22, "learning_rate": 0.0002676033811929566, "loss": 0.032, "step": 83320 }, { "epoch": 0.22, "learning_rate": 0.0002675994929765851, "loss": 0.0268, "step": 83330 }, { "epoch": 0.22, "learning_rate": 0.00026759560476021367, "loss": 0.0257, "step": 83340 }, { "epoch": 0.22, "learning_rate": 0.00026759171654384224, "loss": 0.027, "step": 83350 }, { "epoch": 0.22, "learning_rate": 0.00026758782832747075, "loss": 0.019, "step": 83360 }, { "epoch": 0.22, "learning_rate": 0.00026758394011109927, "loss": 0.0247, "step": 83370 }, { "epoch": 0.22, "learning_rate": 0.0002675800518947278, "loss": 0.0209, "step": 83380 }, { "epoch": 0.22, "learning_rate": 0.00026757616367835635, "loss": 0.0182, "step": 83390 }, { "epoch": 0.22, "learning_rate": 0.00026757227546198487, "loss": 0.0215, "step": 83400 }, { "epoch": 0.22, "learning_rate": 0.00026756838724561343, "loss": 0.0241, "step": 83410 }, { "epoch": 0.22, "learning_rate": 0.00026756449902924195, "loss": 0.02, "step": 83420 }, { "epoch": 0.22, "learning_rate": 0.0002675606108128705, "loss": 0.0284, "step": 83430 }, { "epoch": 0.22, "learning_rate": 0.00026755672259649903, "loss": 0.021, "step": 83440 }, { "epoch": 0.22, "learning_rate": 0.00026755283438012755, "loss": 0.021, "step": 83450 }, { "epoch": 0.22, "learning_rate": 0.00026754894616375606, "loss": 0.0297, "step": 83460 }, { "epoch": 0.22, "learning_rate": 0.00026754505794738463, "loss": 0.0278, "step": 83470 }, { "epoch": 0.22, "learning_rate": 0.0002675411697310132, "loss": 0.0225, "step": 83480 }, { "epoch": 0.22, "learning_rate": 0.0002675372815146417, "loss": 0.0237, "step": 83490 }, { "epoch": 0.22, "learning_rate": 0.00026753339329827023, "loss": 0.0244, "step": 83500 }, { "epoch": 0.22, "learning_rate": 0.0002675295050818988, "loss": 0.0223, "step": 83510 }, { "epoch": 0.22, "learning_rate": 0.0002675256168655273, "loss": 0.0288, "step": 83520 }, { "epoch": 0.22, "learning_rate": 0.0002675217286491558, "loss": 0.0206, "step": 83530 }, { "epoch": 0.22, "learning_rate": 0.0002675178404327844, "loss": 0.0254, "step": 83540 }, { "epoch": 0.22, "learning_rate": 0.0002675139522164129, "loss": 0.0242, "step": 83550 }, { "epoch": 0.22, "learning_rate": 0.0002675100640000415, "loss": 0.0279, "step": 83560 }, { "epoch": 0.22, "learning_rate": 0.00026750617578367, "loss": 0.023, "step": 83570 }, { "epoch": 0.22, "learning_rate": 0.0002675022875672985, "loss": 0.0221, "step": 83580 }, { "epoch": 0.22, "learning_rate": 0.0002674983993509271, "loss": 0.0229, "step": 83590 }, { "epoch": 0.22, "learning_rate": 0.0002674945111345556, "loss": 0.0234, "step": 83600 }, { "epoch": 0.22, "learning_rate": 0.0002674906229181841, "loss": 0.021, "step": 83610 }, { "epoch": 0.22, "learning_rate": 0.0002674867347018127, "loss": 0.0223, "step": 83620 }, { "epoch": 0.22, "learning_rate": 0.0002674828464854412, "loss": 0.0217, "step": 83630 }, { "epoch": 0.22, "learning_rate": 0.00026747895826906976, "loss": 0.0206, "step": 83640 }, { "epoch": 0.22, "learning_rate": 0.00026747507005269827, "loss": 0.0212, "step": 83650 }, { "epoch": 0.22, "learning_rate": 0.0002674711818363268, "loss": 0.0233, "step": 83660 }, { "epoch": 0.22, "learning_rate": 0.0002674672936199553, "loss": 0.0218, "step": 83670 }, { "epoch": 0.22, "learning_rate": 0.00026746340540358387, "loss": 0.017, "step": 83680 }, { "epoch": 0.22, "learning_rate": 0.00026745951718721244, "loss": 0.0264, "step": 83690 }, { "epoch": 0.22, "learning_rate": 0.00026745562897084095, "loss": 0.0213, "step": 83700 }, { "epoch": 0.22, "learning_rate": 0.00026745174075446947, "loss": 0.0224, "step": 83710 }, { "epoch": 0.22, "learning_rate": 0.00026744785253809804, "loss": 0.022, "step": 83720 }, { "epoch": 0.22, "learning_rate": 0.00026744396432172655, "loss": 0.0255, "step": 83730 }, { "epoch": 0.22, "learning_rate": 0.00026744007610535506, "loss": 0.0242, "step": 83740 }, { "epoch": 0.22, "learning_rate": 0.00026743618788898363, "loss": 0.024, "step": 83750 }, { "epoch": 0.22, "learning_rate": 0.00026743229967261215, "loss": 0.0228, "step": 83760 }, { "epoch": 0.22, "learning_rate": 0.0002674284114562407, "loss": 0.0167, "step": 83770 }, { "epoch": 0.22, "learning_rate": 0.00026742452323986923, "loss": 0.0229, "step": 83780 }, { "epoch": 0.22, "learning_rate": 0.00026742063502349775, "loss": 0.0249, "step": 83790 }, { "epoch": 0.22, "learning_rate": 0.0002674167468071263, "loss": 0.0289, "step": 83800 }, { "epoch": 0.22, "learning_rate": 0.00026741285859075483, "loss": 0.0249, "step": 83810 }, { "epoch": 0.22, "learning_rate": 0.00026740897037438334, "loss": 0.0228, "step": 83820 }, { "epoch": 0.22, "learning_rate": 0.0002674050821580119, "loss": 0.0296, "step": 83830 }, { "epoch": 0.22, "learning_rate": 0.0002674011939416405, "loss": 0.0269, "step": 83840 }, { "epoch": 0.22, "learning_rate": 0.000267397305725269, "loss": 0.0248, "step": 83850 }, { "epoch": 0.22, "learning_rate": 0.0002673934175088975, "loss": 0.0205, "step": 83860 }, { "epoch": 0.22, "learning_rate": 0.000267389529292526, "loss": 0.023, "step": 83870 }, { "epoch": 0.22, "learning_rate": 0.0002673856410761546, "loss": 0.0248, "step": 83880 }, { "epoch": 0.22, "learning_rate": 0.0002673817528597831, "loss": 0.0212, "step": 83890 }, { "epoch": 0.22, "learning_rate": 0.0002673778646434117, "loss": 0.0241, "step": 83900 }, { "epoch": 0.22, "learning_rate": 0.0002673739764270402, "loss": 0.0207, "step": 83910 }, { "epoch": 0.22, "learning_rate": 0.0002673700882106687, "loss": 0.0293, "step": 83920 }, { "epoch": 0.22, "learning_rate": 0.0002673661999942973, "loss": 0.0247, "step": 83930 }, { "epoch": 0.22, "learning_rate": 0.0002673623117779258, "loss": 0.0251, "step": 83940 }, { "epoch": 0.22, "learning_rate": 0.0002673584235615543, "loss": 0.0196, "step": 83950 }, { "epoch": 0.22, "learning_rate": 0.00026735453534518287, "loss": 0.0231, "step": 83960 }, { "epoch": 0.22, "learning_rate": 0.0002673506471288114, "loss": 0.0242, "step": 83970 }, { "epoch": 0.22, "learning_rate": 0.00026734675891243996, "loss": 0.0296, "step": 83980 }, { "epoch": 0.22, "learning_rate": 0.00026734287069606847, "loss": 0.0224, "step": 83990 }, { "epoch": 0.22, "learning_rate": 0.000267338982479697, "loss": 0.0256, "step": 84000 }, { "epoch": 0.22, "eval_cer": 0.8817796663545476, "eval_loss": 0.017041249200701714, "eval_runtime": 108.2013, "eval_samples_per_second": 18.484, "eval_steps_per_second": 4.621, "step": 84000 }, { "epoch": 0.22, "learning_rate": 0.00026733509426332555, "loss": 0.0181, "step": 84010 }, { "epoch": 0.22, "learning_rate": 0.00026733120604695407, "loss": 0.0207, "step": 84020 }, { "epoch": 0.22, "learning_rate": 0.00026732731783058264, "loss": 0.0231, "step": 84030 }, { "epoch": 0.22, "learning_rate": 0.00026732342961421115, "loss": 0.0226, "step": 84040 }, { "epoch": 0.22, "learning_rate": 0.0002673195413978397, "loss": 0.0216, "step": 84050 }, { "epoch": 0.22, "learning_rate": 0.00026731565318146823, "loss": 0.0223, "step": 84060 }, { "epoch": 0.22, "learning_rate": 0.00026731176496509675, "loss": 0.0222, "step": 84070 }, { "epoch": 0.22, "learning_rate": 0.00026730787674872526, "loss": 0.0187, "step": 84080 }, { "epoch": 0.22, "learning_rate": 0.00026730398853235383, "loss": 0.0238, "step": 84090 }, { "epoch": 0.22, "learning_rate": 0.00026730010031598235, "loss": 0.0211, "step": 84100 }, { "epoch": 0.22, "learning_rate": 0.0002672962120996109, "loss": 0.0271, "step": 84110 }, { "epoch": 0.22, "learning_rate": 0.00026729232388323943, "loss": 0.0261, "step": 84120 }, { "epoch": 0.22, "learning_rate": 0.00026728843566686794, "loss": 0.0178, "step": 84130 }, { "epoch": 0.22, "learning_rate": 0.0002672845474504965, "loss": 0.0259, "step": 84140 }, { "epoch": 0.22, "learning_rate": 0.00026728065923412503, "loss": 0.0198, "step": 84150 }, { "epoch": 0.22, "learning_rate": 0.00026727677101775354, "loss": 0.0205, "step": 84160 }, { "epoch": 0.22, "learning_rate": 0.0002672728828013821, "loss": 0.0233, "step": 84170 }, { "epoch": 0.22, "learning_rate": 0.0002672689945850107, "loss": 0.0219, "step": 84180 }, { "epoch": 0.22, "learning_rate": 0.0002672651063686392, "loss": 0.0272, "step": 84190 }, { "epoch": 0.22, "learning_rate": 0.0002672612181522677, "loss": 0.0217, "step": 84200 }, { "epoch": 0.22, "learning_rate": 0.0002672573299358962, "loss": 0.0192, "step": 84210 }, { "epoch": 0.22, "learning_rate": 0.0002672534417195248, "loss": 0.0277, "step": 84220 }, { "epoch": 0.22, "learning_rate": 0.0002672495535031533, "loss": 0.0225, "step": 84230 }, { "epoch": 0.22, "learning_rate": 0.0002672456652867819, "loss": 0.0214, "step": 84240 }, { "epoch": 0.22, "learning_rate": 0.0002672417770704104, "loss": 0.0306, "step": 84250 }, { "epoch": 0.22, "learning_rate": 0.00026723788885403896, "loss": 0.0198, "step": 84260 }, { "epoch": 0.22, "learning_rate": 0.0002672340006376675, "loss": 0.0214, "step": 84270 }, { "epoch": 0.22, "learning_rate": 0.000267230112421296, "loss": 0.0236, "step": 84280 }, { "epoch": 0.22, "learning_rate": 0.0002672262242049245, "loss": 0.023, "step": 84290 }, { "epoch": 0.22, "learning_rate": 0.00026722233598855307, "loss": 0.021, "step": 84300 }, { "epoch": 0.22, "learning_rate": 0.0002672184477721816, "loss": 0.0321, "step": 84310 }, { "epoch": 0.22, "learning_rate": 0.00026721455955581015, "loss": 0.0218, "step": 84320 }, { "epoch": 0.22, "learning_rate": 0.00026721067133943867, "loss": 0.0262, "step": 84330 }, { "epoch": 0.22, "learning_rate": 0.00026720678312306724, "loss": 0.0248, "step": 84340 }, { "epoch": 0.22, "learning_rate": 0.00026720289490669575, "loss": 0.0222, "step": 84350 }, { "epoch": 0.22, "learning_rate": 0.00026719900669032427, "loss": 0.0263, "step": 84360 }, { "epoch": 0.22, "learning_rate": 0.0002671951184739528, "loss": 0.0282, "step": 84370 }, { "epoch": 0.22, "learning_rate": 0.00026719123025758135, "loss": 0.0238, "step": 84380 }, { "epoch": 0.22, "learning_rate": 0.0002671873420412099, "loss": 0.0216, "step": 84390 }, { "epoch": 0.22, "learning_rate": 0.00026718345382483843, "loss": 0.0263, "step": 84400 }, { "epoch": 0.22, "learning_rate": 0.00026717956560846695, "loss": 0.0235, "step": 84410 }, { "epoch": 0.22, "learning_rate": 0.00026717567739209546, "loss": 0.0241, "step": 84420 }, { "epoch": 0.22, "learning_rate": 0.00026717178917572403, "loss": 0.0208, "step": 84430 }, { "epoch": 0.22, "learning_rate": 0.00026716790095935255, "loss": 0.0195, "step": 84440 }, { "epoch": 0.22, "learning_rate": 0.0002671640127429811, "loss": 0.0238, "step": 84450 }, { "epoch": 0.22, "learning_rate": 0.00026716012452660963, "loss": 0.0274, "step": 84460 }, { "epoch": 0.22, "learning_rate": 0.0002671562363102382, "loss": 0.0219, "step": 84470 }, { "epoch": 0.22, "learning_rate": 0.0002671523480938667, "loss": 0.0259, "step": 84480 }, { "epoch": 0.22, "learning_rate": 0.0002671484598774952, "loss": 0.0235, "step": 84490 }, { "epoch": 0.22, "learning_rate": 0.00026714457166112374, "loss": 0.0226, "step": 84500 }, { "epoch": 0.22, "learning_rate": 0.0002671406834447523, "loss": 0.02, "step": 84510 }, { "epoch": 0.22, "learning_rate": 0.0002671367952283808, "loss": 0.0261, "step": 84520 }, { "epoch": 0.22, "learning_rate": 0.0002671329070120094, "loss": 0.0226, "step": 84530 }, { "epoch": 0.22, "learning_rate": 0.0002671290187956379, "loss": 0.0231, "step": 84540 }, { "epoch": 0.22, "learning_rate": 0.0002671251305792665, "loss": 0.0191, "step": 84550 }, { "epoch": 0.22, "learning_rate": 0.000267121242362895, "loss": 0.0236, "step": 84560 }, { "epoch": 0.22, "learning_rate": 0.0002671173541465235, "loss": 0.024, "step": 84570 }, { "epoch": 0.22, "learning_rate": 0.0002671134659301521, "loss": 0.0221, "step": 84580 }, { "epoch": 0.22, "learning_rate": 0.0002671095777137806, "loss": 0.0253, "step": 84590 }, { "epoch": 0.22, "learning_rate": 0.00026710568949740916, "loss": 0.0212, "step": 84600 }, { "epoch": 0.22, "learning_rate": 0.00026710180128103767, "loss": 0.0243, "step": 84610 }, { "epoch": 0.22, "learning_rate": 0.0002670979130646662, "loss": 0.0235, "step": 84620 }, { "epoch": 0.22, "learning_rate": 0.0002670940248482947, "loss": 0.0226, "step": 84630 }, { "epoch": 0.22, "learning_rate": 0.00026709013663192327, "loss": 0.0206, "step": 84640 }, { "epoch": 0.22, "learning_rate": 0.0002670862484155518, "loss": 0.0299, "step": 84650 }, { "epoch": 0.22, "learning_rate": 0.00026708236019918035, "loss": 0.0224, "step": 84660 }, { "epoch": 0.22, "learning_rate": 0.00026707847198280887, "loss": 0.0321, "step": 84670 }, { "epoch": 0.22, "learning_rate": 0.00026707458376643744, "loss": 0.0238, "step": 84680 }, { "epoch": 0.22, "learning_rate": 0.00026707069555006595, "loss": 0.025, "step": 84690 }, { "epoch": 0.22, "learning_rate": 0.00026706680733369447, "loss": 0.0226, "step": 84700 }, { "epoch": 0.22, "learning_rate": 0.000267062919117323, "loss": 0.0234, "step": 84710 }, { "epoch": 0.22, "learning_rate": 0.00026705903090095155, "loss": 0.0303, "step": 84720 }, { "epoch": 0.22, "learning_rate": 0.0002670551426845801, "loss": 0.0172, "step": 84730 }, { "epoch": 0.22, "learning_rate": 0.00026705125446820863, "loss": 0.0247, "step": 84740 }, { "epoch": 0.22, "learning_rate": 0.00026704736625183715, "loss": 0.0246, "step": 84750 }, { "epoch": 0.22, "learning_rate": 0.0002670434780354657, "loss": 0.0255, "step": 84760 }, { "epoch": 0.22, "learning_rate": 0.00026703958981909423, "loss": 0.023, "step": 84770 }, { "epoch": 0.22, "learning_rate": 0.00026703570160272274, "loss": 0.0277, "step": 84780 }, { "epoch": 0.22, "learning_rate": 0.0002670318133863513, "loss": 0.0267, "step": 84790 }, { "epoch": 0.22, "learning_rate": 0.00026702792516997983, "loss": 0.0235, "step": 84800 }, { "epoch": 0.22, "learning_rate": 0.0002670240369536084, "loss": 0.0277, "step": 84810 }, { "epoch": 0.22, "learning_rate": 0.0002670201487372369, "loss": 0.0231, "step": 84820 }, { "epoch": 0.22, "learning_rate": 0.0002670162605208654, "loss": 0.0226, "step": 84830 }, { "epoch": 0.22, "learning_rate": 0.000267012372304494, "loss": 0.0237, "step": 84840 }, { "epoch": 0.22, "learning_rate": 0.0002670084840881225, "loss": 0.0245, "step": 84850 }, { "epoch": 0.22, "learning_rate": 0.000267004595871751, "loss": 0.0229, "step": 84860 }, { "epoch": 0.22, "learning_rate": 0.0002670007076553796, "loss": 0.0195, "step": 84870 }, { "epoch": 0.22, "learning_rate": 0.0002669968194390081, "loss": 0.0256, "step": 84880 }, { "epoch": 0.22, "learning_rate": 0.0002669929312226367, "loss": 0.0237, "step": 84890 }, { "epoch": 0.22, "learning_rate": 0.0002669890430062652, "loss": 0.0219, "step": 84900 }, { "epoch": 0.22, "learning_rate": 0.0002669851547898937, "loss": 0.0272, "step": 84910 }, { "epoch": 0.22, "learning_rate": 0.0002669812665735222, "loss": 0.0224, "step": 84920 }, { "epoch": 0.22, "learning_rate": 0.0002669773783571508, "loss": 0.0248, "step": 84930 }, { "epoch": 0.22, "learning_rate": 0.00026697349014077936, "loss": 0.018, "step": 84940 }, { "epoch": 0.22, "learning_rate": 0.00026696960192440787, "loss": 0.031, "step": 84950 }, { "epoch": 0.22, "learning_rate": 0.0002669657137080364, "loss": 0.0223, "step": 84960 }, { "epoch": 0.22, "learning_rate": 0.00026696182549166495, "loss": 0.0245, "step": 84970 }, { "epoch": 0.22, "learning_rate": 0.00026695793727529347, "loss": 0.0246, "step": 84980 }, { "epoch": 0.22, "learning_rate": 0.000266954049058922, "loss": 0.0211, "step": 84990 }, { "epoch": 0.22, "learning_rate": 0.00026695016084255055, "loss": 0.0232, "step": 85000 }, { "epoch": 0.22, "eval_cer": 0.8817908634500211, "eval_loss": 0.017778005450963974, "eval_runtime": 108.2093, "eval_samples_per_second": 18.483, "eval_steps_per_second": 4.621, "step": 85000 }, { "epoch": 0.22, "learning_rate": 0.00026694627262617907, "loss": 0.0212, "step": 85010 }, { "epoch": 0.22, "learning_rate": 0.00026694238440980764, "loss": 0.0298, "step": 85020 }, { "epoch": 0.22, "learning_rate": 0.00026693849619343615, "loss": 0.0245, "step": 85030 }, { "epoch": 0.22, "learning_rate": 0.00026693460797706466, "loss": 0.0234, "step": 85040 }, { "epoch": 0.22, "learning_rate": 0.00026693071976069323, "loss": 0.0232, "step": 85050 }, { "epoch": 0.22, "learning_rate": 0.00026692683154432175, "loss": 0.0186, "step": 85060 }, { "epoch": 0.22, "learning_rate": 0.0002669229433279503, "loss": 0.0321, "step": 85070 }, { "epoch": 0.22, "learning_rate": 0.00026691905511157883, "loss": 0.0247, "step": 85080 }, { "epoch": 0.22, "learning_rate": 0.0002669151668952074, "loss": 0.0245, "step": 85090 }, { "epoch": 0.22, "learning_rate": 0.0002669112786788359, "loss": 0.0263, "step": 85100 }, { "epoch": 0.22, "learning_rate": 0.00026690739046246443, "loss": 0.0235, "step": 85110 }, { "epoch": 0.22, "learning_rate": 0.00026690350224609294, "loss": 0.0194, "step": 85120 }, { "epoch": 0.22, "learning_rate": 0.0002668996140297215, "loss": 0.023, "step": 85130 }, { "epoch": 0.22, "learning_rate": 0.00026689572581335, "loss": 0.0212, "step": 85140 }, { "epoch": 0.22, "learning_rate": 0.0002668918375969786, "loss": 0.0245, "step": 85150 }, { "epoch": 0.22, "learning_rate": 0.0002668879493806071, "loss": 0.0223, "step": 85160 }, { "epoch": 0.22, "learning_rate": 0.0002668840611642356, "loss": 0.0277, "step": 85170 }, { "epoch": 0.22, "learning_rate": 0.0002668801729478642, "loss": 0.0267, "step": 85180 }, { "epoch": 0.22, "learning_rate": 0.0002668762847314927, "loss": 0.0233, "step": 85190 }, { "epoch": 0.22, "learning_rate": 0.0002668723965151212, "loss": 0.0211, "step": 85200 }, { "epoch": 0.22, "learning_rate": 0.0002668685082987498, "loss": 0.0263, "step": 85210 }, { "epoch": 0.22, "learning_rate": 0.00026686462008237836, "loss": 0.025, "step": 85220 }, { "epoch": 0.22, "learning_rate": 0.0002668607318660069, "loss": 0.0248, "step": 85230 }, { "epoch": 0.22, "learning_rate": 0.0002668568436496354, "loss": 0.0232, "step": 85240 }, { "epoch": 0.22, "learning_rate": 0.0002668529554332639, "loss": 0.0227, "step": 85250 }, { "epoch": 0.22, "learning_rate": 0.00026684906721689247, "loss": 0.0302, "step": 85260 }, { "epoch": 0.22, "learning_rate": 0.000266845179000521, "loss": 0.0242, "step": 85270 }, { "epoch": 0.22, "learning_rate": 0.00026684129078414956, "loss": 0.029, "step": 85280 }, { "epoch": 0.22, "learning_rate": 0.00026683740256777807, "loss": 0.0237, "step": 85290 }, { "epoch": 0.22, "learning_rate": 0.00026683351435140664, "loss": 0.0255, "step": 85300 }, { "epoch": 0.22, "learning_rate": 0.00026682962613503515, "loss": 0.0204, "step": 85310 }, { "epoch": 0.22, "learning_rate": 0.00026682573791866367, "loss": 0.0251, "step": 85320 }, { "epoch": 0.22, "learning_rate": 0.0002668218497022922, "loss": 0.0263, "step": 85330 }, { "epoch": 0.22, "learning_rate": 0.00026681796148592075, "loss": 0.0208, "step": 85340 }, { "epoch": 0.22, "learning_rate": 0.00026681407326954927, "loss": 0.0253, "step": 85350 }, { "epoch": 0.22, "learning_rate": 0.00026681018505317783, "loss": 0.0274, "step": 85360 }, { "epoch": 0.22, "learning_rate": 0.00026680629683680635, "loss": 0.0217, "step": 85370 }, { "epoch": 0.22, "learning_rate": 0.00026680240862043486, "loss": 0.0241, "step": 85380 }, { "epoch": 0.22, "learning_rate": 0.00026679852040406343, "loss": 0.028, "step": 85390 }, { "epoch": 0.22, "learning_rate": 0.00026679463218769195, "loss": 0.0222, "step": 85400 }, { "epoch": 0.22, "learning_rate": 0.00026679074397132046, "loss": 0.0296, "step": 85410 }, { "epoch": 0.22, "learning_rate": 0.00026678685575494903, "loss": 0.0244, "step": 85420 }, { "epoch": 0.22, "learning_rate": 0.0002667829675385776, "loss": 0.0251, "step": 85430 }, { "epoch": 0.22, "learning_rate": 0.0002667790793222061, "loss": 0.028, "step": 85440 }, { "epoch": 0.22, "learning_rate": 0.00026677519110583463, "loss": 0.0236, "step": 85450 }, { "epoch": 0.22, "learning_rate": 0.00026677130288946314, "loss": 0.0242, "step": 85460 }, { "epoch": 0.22, "learning_rate": 0.0002667674146730917, "loss": 0.0287, "step": 85470 }, { "epoch": 0.22, "learning_rate": 0.0002667635264567202, "loss": 0.0222, "step": 85480 }, { "epoch": 0.22, "learning_rate": 0.0002667596382403488, "loss": 0.0236, "step": 85490 }, { "epoch": 0.22, "learning_rate": 0.0002667557500239773, "loss": 0.024, "step": 85500 }, { "epoch": 0.22, "learning_rate": 0.0002667518618076059, "loss": 0.0204, "step": 85510 }, { "epoch": 0.22, "learning_rate": 0.0002667479735912344, "loss": 0.0264, "step": 85520 }, { "epoch": 0.22, "learning_rate": 0.0002667440853748629, "loss": 0.0227, "step": 85530 }, { "epoch": 0.22, "learning_rate": 0.0002667401971584914, "loss": 0.021, "step": 85540 }, { "epoch": 0.22, "learning_rate": 0.00026673630894212, "loss": 0.0225, "step": 85550 }, { "epoch": 0.22, "learning_rate": 0.0002667324207257485, "loss": 0.0245, "step": 85560 }, { "epoch": 0.22, "learning_rate": 0.0002667285325093771, "loss": 0.0172, "step": 85570 }, { "epoch": 0.22, "learning_rate": 0.0002667246442930056, "loss": 0.0195, "step": 85580 }, { "epoch": 0.22, "learning_rate": 0.00026672075607663416, "loss": 0.0277, "step": 85590 }, { "epoch": 0.22, "learning_rate": 0.00026671686786026267, "loss": 0.0222, "step": 85600 }, { "epoch": 0.22, "learning_rate": 0.0002667129796438912, "loss": 0.0225, "step": 85610 }, { "epoch": 0.22, "learning_rate": 0.00026670909142751975, "loss": 0.0213, "step": 85620 }, { "epoch": 0.22, "learning_rate": 0.00026670520321114827, "loss": 0.0245, "step": 85630 }, { "epoch": 0.22, "learning_rate": 0.00026670131499477684, "loss": 0.0247, "step": 85640 }, { "epoch": 0.22, "learning_rate": 0.00026669742677840535, "loss": 0.0261, "step": 85650 }, { "epoch": 0.22, "learning_rate": 0.00026669353856203387, "loss": 0.0244, "step": 85660 }, { "epoch": 0.22, "learning_rate": 0.0002666896503456624, "loss": 0.0318, "step": 85670 }, { "epoch": 0.22, "learning_rate": 0.00026668576212929095, "loss": 0.0236, "step": 85680 }, { "epoch": 0.22, "learning_rate": 0.00026668187391291946, "loss": 0.0216, "step": 85690 }, { "epoch": 0.22, "learning_rate": 0.00026667798569654803, "loss": 0.0239, "step": 85700 }, { "epoch": 0.22, "learning_rate": 0.00026667409748017655, "loss": 0.0245, "step": 85710 }, { "epoch": 0.22, "learning_rate": 0.0002666702092638051, "loss": 0.026, "step": 85720 }, { "epoch": 0.22, "learning_rate": 0.00026666632104743363, "loss": 0.0292, "step": 85730 }, { "epoch": 0.22, "learning_rate": 0.00026666243283106215, "loss": 0.0255, "step": 85740 }, { "epoch": 0.22, "learning_rate": 0.00026665854461469066, "loss": 0.023, "step": 85750 }, { "epoch": 0.22, "learning_rate": 0.00026665465639831923, "loss": 0.0191, "step": 85760 }, { "epoch": 0.22, "learning_rate": 0.0002666507681819478, "loss": 0.025, "step": 85770 }, { "epoch": 0.22, "learning_rate": 0.0002666468799655763, "loss": 0.0227, "step": 85780 }, { "epoch": 0.22, "learning_rate": 0.0002666429917492048, "loss": 0.0275, "step": 85790 }, { "epoch": 0.22, "learning_rate": 0.0002666391035328334, "loss": 0.0272, "step": 85800 }, { "epoch": 0.22, "learning_rate": 0.0002666352153164619, "loss": 0.0245, "step": 85810 }, { "epoch": 0.22, "learning_rate": 0.0002666313271000904, "loss": 0.0241, "step": 85820 }, { "epoch": 0.22, "learning_rate": 0.000266627438883719, "loss": 0.0236, "step": 85830 }, { "epoch": 0.22, "learning_rate": 0.0002666235506673475, "loss": 0.0206, "step": 85840 }, { "epoch": 0.22, "learning_rate": 0.0002666196624509761, "loss": 0.0258, "step": 85850 }, { "epoch": 0.22, "learning_rate": 0.0002666157742346046, "loss": 0.0255, "step": 85860 }, { "epoch": 0.22, "learning_rate": 0.0002666118860182331, "loss": 0.0197, "step": 85870 }, { "epoch": 0.22, "learning_rate": 0.0002666079978018616, "loss": 0.0233, "step": 85880 }, { "epoch": 0.22, "learning_rate": 0.0002666041095854902, "loss": 0.0262, "step": 85890 }, { "epoch": 0.22, "learning_rate": 0.0002666002213691187, "loss": 0.0266, "step": 85900 }, { "epoch": 0.22, "learning_rate": 0.00026659633315274727, "loss": 0.0248, "step": 85910 }, { "epoch": 0.22, "learning_rate": 0.0002665924449363758, "loss": 0.0244, "step": 85920 }, { "epoch": 0.22, "learning_rate": 0.00026658855672000436, "loss": 0.0233, "step": 85930 }, { "epoch": 0.22, "learning_rate": 0.00026658466850363287, "loss": 0.0227, "step": 85940 }, { "epoch": 0.22, "learning_rate": 0.0002665807802872614, "loss": 0.0238, "step": 85950 }, { "epoch": 0.22, "learning_rate": 0.0002665768920708899, "loss": 0.0257, "step": 85960 }, { "epoch": 0.22, "learning_rate": 0.00026657300385451847, "loss": 0.0241, "step": 85970 }, { "epoch": 0.22, "learning_rate": 0.00026656911563814704, "loss": 0.021, "step": 85980 }, { "epoch": 0.22, "learning_rate": 0.00026656522742177555, "loss": 0.0232, "step": 85990 }, { "epoch": 0.22, "learning_rate": 0.00026656133920540407, "loss": 0.0236, "step": 86000 }, { "epoch": 0.22, "eval_cer": 0.8817950623608236, "eval_loss": 0.017185769975185394, "eval_runtime": 107.5803, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 86000 }, { "epoch": 0.22, "learning_rate": 0.00026655745098903263, "loss": 0.0215, "step": 86010 }, { "epoch": 0.22, "learning_rate": 0.00026655356277266115, "loss": 0.032, "step": 86020 }, { "epoch": 0.22, "learning_rate": 0.00026654967455628966, "loss": 0.0219, "step": 86030 }, { "epoch": 0.22, "learning_rate": 0.00026654578633991823, "loss": 0.0273, "step": 86040 }, { "epoch": 0.22, "learning_rate": 0.00026654189812354675, "loss": 0.0252, "step": 86050 }, { "epoch": 0.22, "learning_rate": 0.0002665380099071753, "loss": 0.0206, "step": 86060 }, { "epoch": 0.22, "learning_rate": 0.00026653412169080383, "loss": 0.0244, "step": 86070 }, { "epoch": 0.22, "learning_rate": 0.00026653023347443234, "loss": 0.0289, "step": 86080 }, { "epoch": 0.22, "learning_rate": 0.0002665263452580609, "loss": 0.0235, "step": 86090 }, { "epoch": 0.22, "learning_rate": 0.00026652245704168943, "loss": 0.0226, "step": 86100 }, { "epoch": 0.22, "learning_rate": 0.00026651856882531794, "loss": 0.0278, "step": 86110 }, { "epoch": 0.22, "learning_rate": 0.0002665146806089465, "loss": 0.0233, "step": 86120 }, { "epoch": 0.22, "learning_rate": 0.000266510792392575, "loss": 0.0228, "step": 86130 }, { "epoch": 0.22, "learning_rate": 0.0002665069041762036, "loss": 0.0224, "step": 86140 }, { "epoch": 0.22, "learning_rate": 0.0002665030159598321, "loss": 0.0263, "step": 86150 }, { "epoch": 0.22, "learning_rate": 0.0002664991277434606, "loss": 0.0269, "step": 86160 }, { "epoch": 0.22, "learning_rate": 0.0002664952395270892, "loss": 0.0238, "step": 86170 }, { "epoch": 0.22, "learning_rate": 0.0002664913513107177, "loss": 0.026, "step": 86180 }, { "epoch": 0.22, "learning_rate": 0.0002664874630943463, "loss": 0.0211, "step": 86190 }, { "epoch": 0.22, "learning_rate": 0.0002664835748779748, "loss": 0.0215, "step": 86200 }, { "epoch": 0.22, "learning_rate": 0.0002664796866616033, "loss": 0.0246, "step": 86210 }, { "epoch": 0.22, "learning_rate": 0.0002664757984452319, "loss": 0.0254, "step": 86220 }, { "epoch": 0.22, "learning_rate": 0.0002664719102288604, "loss": 0.0253, "step": 86230 }, { "epoch": 0.22, "learning_rate": 0.0002664680220124889, "loss": 0.0195, "step": 86240 }, { "epoch": 0.22, "learning_rate": 0.00026646413379611747, "loss": 0.0259, "step": 86250 }, { "epoch": 0.22, "learning_rate": 0.000266460245579746, "loss": 0.024, "step": 86260 }, { "epoch": 0.22, "learning_rate": 0.00026645635736337455, "loss": 0.0219, "step": 86270 }, { "epoch": 0.22, "learning_rate": 0.00026645246914700307, "loss": 0.0189, "step": 86280 }, { "epoch": 0.22, "learning_rate": 0.0002664485809306316, "loss": 0.0269, "step": 86290 }, { "epoch": 0.22, "learning_rate": 0.00026644469271426015, "loss": 0.0334, "step": 86300 }, { "epoch": 0.22, "learning_rate": 0.00026644080449788867, "loss": 0.0241, "step": 86310 }, { "epoch": 0.22, "learning_rate": 0.00026643691628151724, "loss": 0.0214, "step": 86320 }, { "epoch": 0.22, "learning_rate": 0.00026643302806514575, "loss": 0.0231, "step": 86330 }, { "epoch": 0.22, "learning_rate": 0.0002664291398487743, "loss": 0.0268, "step": 86340 }, { "epoch": 0.22, "learning_rate": 0.00026642525163240283, "loss": 0.0226, "step": 86350 }, { "epoch": 0.22, "learning_rate": 0.00026642136341603135, "loss": 0.0248, "step": 86360 }, { "epoch": 0.22, "learning_rate": 0.00026641747519965986, "loss": 0.0222, "step": 86370 }, { "epoch": 0.22, "learning_rate": 0.00026641358698328843, "loss": 0.0253, "step": 86380 }, { "epoch": 0.22, "learning_rate": 0.00026640969876691695, "loss": 0.0222, "step": 86390 }, { "epoch": 0.22, "learning_rate": 0.0002664058105505455, "loss": 0.0197, "step": 86400 }, { "epoch": 0.22, "learning_rate": 0.00026640192233417403, "loss": 0.0207, "step": 86410 }, { "epoch": 0.22, "learning_rate": 0.00026639803411780254, "loss": 0.0242, "step": 86420 }, { "epoch": 0.22, "learning_rate": 0.0002663941459014311, "loss": 0.0238, "step": 86430 }, { "epoch": 0.22, "learning_rate": 0.0002663902576850596, "loss": 0.0212, "step": 86440 }, { "epoch": 0.22, "learning_rate": 0.00026638636946868814, "loss": 0.0186, "step": 86450 }, { "epoch": 0.22, "learning_rate": 0.0002663824812523167, "loss": 0.0233, "step": 86460 }, { "epoch": 0.22, "learning_rate": 0.0002663785930359453, "loss": 0.026, "step": 86470 }, { "epoch": 0.22, "learning_rate": 0.0002663747048195738, "loss": 0.0218, "step": 86480 }, { "epoch": 0.22, "learning_rate": 0.0002663708166032023, "loss": 0.0253, "step": 86490 }, { "epoch": 0.22, "learning_rate": 0.0002663669283868308, "loss": 0.0236, "step": 86500 }, { "epoch": 0.22, "learning_rate": 0.0002663630401704594, "loss": 0.0227, "step": 86510 }, { "epoch": 0.22, "learning_rate": 0.0002663591519540879, "loss": 0.0213, "step": 86520 }, { "epoch": 0.22, "learning_rate": 0.0002663552637377165, "loss": 0.0287, "step": 86530 }, { "epoch": 0.22, "learning_rate": 0.000266351375521345, "loss": 0.025, "step": 86540 }, { "epoch": 0.22, "learning_rate": 0.00026634748730497356, "loss": 0.0259, "step": 86550 }, { "epoch": 0.22, "learning_rate": 0.00026634359908860207, "loss": 0.0219, "step": 86560 }, { "epoch": 0.22, "learning_rate": 0.0002663397108722306, "loss": 0.0208, "step": 86570 }, { "epoch": 0.22, "learning_rate": 0.0002663358226558591, "loss": 0.0216, "step": 86580 }, { "epoch": 0.22, "learning_rate": 0.00026633193443948767, "loss": 0.0231, "step": 86590 }, { "epoch": 0.22, "learning_rate": 0.0002663280462231162, "loss": 0.0241, "step": 86600 }, { "epoch": 0.22, "learning_rate": 0.00026632415800674475, "loss": 0.0268, "step": 86610 }, { "epoch": 0.22, "learning_rate": 0.00026632026979037327, "loss": 0.0232, "step": 86620 }, { "epoch": 0.22, "learning_rate": 0.0002663163815740018, "loss": 0.0248, "step": 86630 }, { "epoch": 0.22, "learning_rate": 0.00026631249335763035, "loss": 0.026, "step": 86640 }, { "epoch": 0.22, "learning_rate": 0.00026630860514125887, "loss": 0.0222, "step": 86650 }, { "epoch": 0.22, "learning_rate": 0.00026630471692488743, "loss": 0.0265, "step": 86660 }, { "epoch": 0.22, "learning_rate": 0.00026630082870851595, "loss": 0.0216, "step": 86670 }, { "epoch": 0.22, "learning_rate": 0.0002662969404921445, "loss": 0.0262, "step": 86680 }, { "epoch": 0.22, "learning_rate": 0.00026629305227577303, "loss": 0.0245, "step": 86690 }, { "epoch": 0.22, "learning_rate": 0.00026628916405940155, "loss": 0.0211, "step": 86700 }, { "epoch": 0.22, "learning_rate": 0.00026628527584303006, "loss": 0.0246, "step": 86710 }, { "epoch": 0.22, "learning_rate": 0.00026628138762665863, "loss": 0.026, "step": 86720 }, { "epoch": 0.22, "learning_rate": 0.00026627749941028714, "loss": 0.02, "step": 86730 }, { "epoch": 0.22, "learning_rate": 0.0002662736111939157, "loss": 0.0186, "step": 86740 }, { "epoch": 0.22, "learning_rate": 0.00026626972297754423, "loss": 0.0265, "step": 86750 }, { "epoch": 0.22, "learning_rate": 0.0002662658347611728, "loss": 0.0197, "step": 86760 }, { "epoch": 0.22, "learning_rate": 0.0002662619465448013, "loss": 0.0199, "step": 86770 }, { "epoch": 0.22, "learning_rate": 0.0002662580583284298, "loss": 0.0193, "step": 86780 }, { "epoch": 0.22, "learning_rate": 0.00026625417011205834, "loss": 0.0254, "step": 86790 }, { "epoch": 0.22, "learning_rate": 0.0002662502818956869, "loss": 0.0278, "step": 86800 }, { "epoch": 0.23, "learning_rate": 0.0002662463936793155, "loss": 0.0232, "step": 86810 }, { "epoch": 0.23, "learning_rate": 0.000266242505462944, "loss": 0.0222, "step": 86820 }, { "epoch": 0.23, "learning_rate": 0.0002662386172465725, "loss": 0.0206, "step": 86830 }, { "epoch": 0.23, "learning_rate": 0.000266234729030201, "loss": 0.0219, "step": 86840 }, { "epoch": 0.23, "learning_rate": 0.0002662308408138296, "loss": 0.0205, "step": 86850 }, { "epoch": 0.23, "learning_rate": 0.0002662269525974581, "loss": 0.0208, "step": 86860 }, { "epoch": 0.23, "learning_rate": 0.00026622306438108667, "loss": 0.0203, "step": 86870 }, { "epoch": 0.23, "learning_rate": 0.0002662191761647152, "loss": 0.0225, "step": 86880 }, { "epoch": 0.23, "learning_rate": 0.00026621528794834376, "loss": 0.0265, "step": 86890 }, { "epoch": 0.23, "learning_rate": 0.00026621139973197227, "loss": 0.0268, "step": 86900 }, { "epoch": 0.23, "learning_rate": 0.0002662075115156008, "loss": 0.0244, "step": 86910 }, { "epoch": 0.23, "learning_rate": 0.0002662036232992293, "loss": 0.0228, "step": 86920 }, { "epoch": 0.23, "learning_rate": 0.00026619973508285787, "loss": 0.0203, "step": 86930 }, { "epoch": 0.23, "learning_rate": 0.0002661958468664864, "loss": 0.0226, "step": 86940 }, { "epoch": 0.23, "learning_rate": 0.00026619195865011495, "loss": 0.0195, "step": 86950 }, { "epoch": 0.23, "learning_rate": 0.00026618807043374347, "loss": 0.0263, "step": 86960 }, { "epoch": 0.23, "learning_rate": 0.00026618418221737203, "loss": 0.0193, "step": 86970 }, { "epoch": 0.23, "learning_rate": 0.00026618029400100055, "loss": 0.0186, "step": 86980 }, { "epoch": 0.23, "learning_rate": 0.00026617640578462906, "loss": 0.0222, "step": 86990 }, { "epoch": 0.23, "learning_rate": 0.0002661725175682576, "loss": 0.0225, "step": 87000 }, { "epoch": 0.23, "eval_cer": 0.8817950623608236, "eval_loss": 0.017446931451559067, "eval_runtime": 107.4054, "eval_samples_per_second": 18.621, "eval_steps_per_second": 4.655, "step": 87000 }, { "epoch": 0.23, "learning_rate": 0.00026616862935188615, "loss": 0.0236, "step": 87010 }, { "epoch": 0.23, "learning_rate": 0.0002661647411355147, "loss": 0.024, "step": 87020 }, { "epoch": 0.23, "learning_rate": 0.00026616085291914323, "loss": 0.0211, "step": 87030 }, { "epoch": 0.23, "learning_rate": 0.00026615696470277175, "loss": 0.0237, "step": 87040 }, { "epoch": 0.23, "learning_rate": 0.0002661530764864003, "loss": 0.0267, "step": 87050 }, { "epoch": 0.23, "learning_rate": 0.00026614918827002883, "loss": 0.0251, "step": 87060 }, { "epoch": 0.23, "learning_rate": 0.00026614530005365734, "loss": 0.0212, "step": 87070 }, { "epoch": 0.23, "learning_rate": 0.0002661414118372859, "loss": 0.0268, "step": 87080 }, { "epoch": 0.23, "learning_rate": 0.0002661375236209144, "loss": 0.026, "step": 87090 }, { "epoch": 0.23, "learning_rate": 0.000266133635404543, "loss": 0.0206, "step": 87100 }, { "epoch": 0.23, "learning_rate": 0.0002661297471881715, "loss": 0.0271, "step": 87110 }, { "epoch": 0.23, "learning_rate": 0.0002661258589718, "loss": 0.0241, "step": 87120 }, { "epoch": 0.23, "learning_rate": 0.00026612197075542854, "loss": 0.0321, "step": 87130 }, { "epoch": 0.23, "learning_rate": 0.0002661180825390571, "loss": 0.0255, "step": 87140 }, { "epoch": 0.23, "learning_rate": 0.0002661141943226856, "loss": 0.024, "step": 87150 }, { "epoch": 0.23, "learning_rate": 0.0002661103061063142, "loss": 0.0217, "step": 87160 }, { "epoch": 0.23, "learning_rate": 0.0002661064178899427, "loss": 0.025, "step": 87170 }, { "epoch": 0.23, "learning_rate": 0.0002661025296735713, "loss": 0.0264, "step": 87180 }, { "epoch": 0.23, "learning_rate": 0.0002660986414571998, "loss": 0.0302, "step": 87190 }, { "epoch": 0.23, "learning_rate": 0.0002660947532408283, "loss": 0.0263, "step": 87200 }, { "epoch": 0.23, "learning_rate": 0.00026609086502445687, "loss": 0.0264, "step": 87210 }, { "epoch": 0.23, "learning_rate": 0.0002660869768080854, "loss": 0.0297, "step": 87220 }, { "epoch": 0.23, "learning_rate": 0.00026608308859171395, "loss": 0.0233, "step": 87230 }, { "epoch": 0.23, "learning_rate": 0.00026607920037534247, "loss": 0.0222, "step": 87240 }, { "epoch": 0.23, "learning_rate": 0.000266075312158971, "loss": 0.0302, "step": 87250 }, { "epoch": 0.23, "learning_rate": 0.00026607142394259955, "loss": 0.0211, "step": 87260 }, { "epoch": 0.23, "learning_rate": 0.00026606753572622807, "loss": 0.0216, "step": 87270 }, { "epoch": 0.23, "learning_rate": 0.0002660636475098566, "loss": 0.0228, "step": 87280 }, { "epoch": 0.23, "learning_rate": 0.00026605975929348515, "loss": 0.0228, "step": 87290 }, { "epoch": 0.23, "learning_rate": 0.00026605587107711367, "loss": 0.0226, "step": 87300 }, { "epoch": 0.23, "learning_rate": 0.00026605198286074223, "loss": 0.0197, "step": 87310 }, { "epoch": 0.23, "learning_rate": 0.00026604809464437075, "loss": 0.0256, "step": 87320 }, { "epoch": 0.23, "learning_rate": 0.00026604420642799926, "loss": 0.0252, "step": 87330 }, { "epoch": 0.23, "learning_rate": 0.0002660403182116278, "loss": 0.0274, "step": 87340 }, { "epoch": 0.23, "learning_rate": 0.00026603642999525635, "loss": 0.0263, "step": 87350 }, { "epoch": 0.23, "learning_rate": 0.0002660325417788849, "loss": 0.0255, "step": 87360 }, { "epoch": 0.23, "learning_rate": 0.00026602865356251343, "loss": 0.0268, "step": 87370 }, { "epoch": 0.23, "learning_rate": 0.00026602476534614194, "loss": 0.0247, "step": 87380 }, { "epoch": 0.23, "learning_rate": 0.0002660208771297705, "loss": 0.0262, "step": 87390 }, { "epoch": 0.23, "learning_rate": 0.00026601698891339903, "loss": 0.0247, "step": 87400 }, { "epoch": 0.23, "learning_rate": 0.00026601310069702754, "loss": 0.0249, "step": 87410 }, { "epoch": 0.23, "learning_rate": 0.0002660092124806561, "loss": 0.0328, "step": 87420 }, { "epoch": 0.23, "learning_rate": 0.0002660053242642846, "loss": 0.0305, "step": 87430 }, { "epoch": 0.23, "learning_rate": 0.0002660014360479132, "loss": 0.0216, "step": 87440 }, { "epoch": 0.23, "learning_rate": 0.0002659975478315417, "loss": 0.02, "step": 87450 }, { "epoch": 0.23, "learning_rate": 0.0002659936596151702, "loss": 0.0247, "step": 87460 }, { "epoch": 0.23, "learning_rate": 0.0002659897713987988, "loss": 0.031, "step": 87470 }, { "epoch": 0.23, "learning_rate": 0.0002659858831824273, "loss": 0.0235, "step": 87480 }, { "epoch": 0.23, "learning_rate": 0.0002659819949660558, "loss": 0.0243, "step": 87490 }, { "epoch": 0.23, "learning_rate": 0.0002659781067496844, "loss": 0.0237, "step": 87500 }, { "epoch": 0.23, "learning_rate": 0.00026597421853331296, "loss": 0.0248, "step": 87510 }, { "epoch": 0.23, "learning_rate": 0.00026597033031694147, "loss": 0.0258, "step": 87520 }, { "epoch": 0.23, "learning_rate": 0.00026596644210057, "loss": 0.0231, "step": 87530 }, { "epoch": 0.23, "learning_rate": 0.0002659625538841985, "loss": 0.0214, "step": 87540 }, { "epoch": 0.23, "learning_rate": 0.00026595866566782707, "loss": 0.0255, "step": 87550 }, { "epoch": 0.23, "learning_rate": 0.0002659547774514556, "loss": 0.0251, "step": 87560 }, { "epoch": 0.23, "learning_rate": 0.00026595088923508415, "loss": 0.0335, "step": 87570 }, { "epoch": 0.23, "learning_rate": 0.00026594700101871267, "loss": 0.0243, "step": 87580 }, { "epoch": 0.23, "learning_rate": 0.0002659431128023412, "loss": 0.019, "step": 87590 }, { "epoch": 0.23, "learning_rate": 0.00026593922458596975, "loss": 0.0243, "step": 87600 }, { "epoch": 0.23, "learning_rate": 0.00026593533636959827, "loss": 0.0281, "step": 87610 }, { "epoch": 0.23, "learning_rate": 0.0002659314481532268, "loss": 0.0213, "step": 87620 }, { "epoch": 0.23, "learning_rate": 0.00026592755993685535, "loss": 0.0245, "step": 87630 }, { "epoch": 0.23, "learning_rate": 0.00026592367172048386, "loss": 0.0185, "step": 87640 }, { "epoch": 0.23, "learning_rate": 0.00026591978350411243, "loss": 0.0232, "step": 87650 }, { "epoch": 0.23, "learning_rate": 0.00026591589528774095, "loss": 0.0183, "step": 87660 }, { "epoch": 0.23, "learning_rate": 0.00026591200707136946, "loss": 0.0258, "step": 87670 }, { "epoch": 0.23, "learning_rate": 0.00026590811885499803, "loss": 0.0211, "step": 87680 }, { "epoch": 0.23, "learning_rate": 0.00026590423063862654, "loss": 0.025, "step": 87690 }, { "epoch": 0.23, "learning_rate": 0.00026590034242225506, "loss": 0.0242, "step": 87700 }, { "epoch": 0.23, "learning_rate": 0.00026589645420588363, "loss": 0.0207, "step": 87710 }, { "epoch": 0.23, "learning_rate": 0.0002658925659895122, "loss": 0.0225, "step": 87720 }, { "epoch": 0.23, "learning_rate": 0.0002658886777731407, "loss": 0.0244, "step": 87730 }, { "epoch": 0.23, "learning_rate": 0.0002658847895567692, "loss": 0.0228, "step": 87740 }, { "epoch": 0.23, "learning_rate": 0.00026588090134039774, "loss": 0.0259, "step": 87750 }, { "epoch": 0.23, "learning_rate": 0.0002658770131240263, "loss": 0.0217, "step": 87760 }, { "epoch": 0.23, "learning_rate": 0.0002658731249076548, "loss": 0.02, "step": 87770 }, { "epoch": 0.23, "learning_rate": 0.0002658692366912834, "loss": 0.0208, "step": 87780 }, { "epoch": 0.23, "learning_rate": 0.0002658653484749119, "loss": 0.0268, "step": 87790 }, { "epoch": 0.23, "learning_rate": 0.0002658614602585405, "loss": 0.0224, "step": 87800 }, { "epoch": 0.23, "learning_rate": 0.000265857572042169, "loss": 0.0203, "step": 87810 }, { "epoch": 0.23, "learning_rate": 0.0002658536838257975, "loss": 0.0258, "step": 87820 }, { "epoch": 0.23, "learning_rate": 0.000265849795609426, "loss": 0.0247, "step": 87830 }, { "epoch": 0.23, "learning_rate": 0.0002658459073930546, "loss": 0.026, "step": 87840 }, { "epoch": 0.23, "learning_rate": 0.0002658420191766831, "loss": 0.0189, "step": 87850 }, { "epoch": 0.23, "learning_rate": 0.00026583813096031167, "loss": 0.026, "step": 87860 }, { "epoch": 0.23, "learning_rate": 0.0002658342427439402, "loss": 0.0228, "step": 87870 }, { "epoch": 0.23, "learning_rate": 0.0002658303545275687, "loss": 0.025, "step": 87880 }, { "epoch": 0.23, "learning_rate": 0.00026582646631119727, "loss": 0.0237, "step": 87890 }, { "epoch": 0.23, "learning_rate": 0.0002658225780948258, "loss": 0.0246, "step": 87900 }, { "epoch": 0.23, "learning_rate": 0.00026581868987845435, "loss": 0.0247, "step": 87910 }, { "epoch": 0.23, "learning_rate": 0.00026581480166208287, "loss": 0.0216, "step": 87920 }, { "epoch": 0.23, "learning_rate": 0.00026581091344571144, "loss": 0.0244, "step": 87930 }, { "epoch": 0.23, "learning_rate": 0.00026580702522933995, "loss": 0.0251, "step": 87940 }, { "epoch": 0.23, "learning_rate": 0.00026580313701296846, "loss": 0.038, "step": 87950 }, { "epoch": 0.23, "learning_rate": 0.000265799248796597, "loss": 0.0268, "step": 87960 }, { "epoch": 0.23, "learning_rate": 0.00026579536058022555, "loss": 0.0212, "step": 87970 }, { "epoch": 0.23, "learning_rate": 0.00026579147236385406, "loss": 0.0237, "step": 87980 }, { "epoch": 0.23, "learning_rate": 0.00026578758414748263, "loss": 0.025, "step": 87990 }, { "epoch": 0.23, "learning_rate": 0.00026578369593111115, "loss": 0.0223, "step": 88000 }, { "epoch": 0.23, "eval_cer": 0.8818174565517705, "eval_loss": 0.016908327117562294, "eval_runtime": 107.5726, "eval_samples_per_second": 18.592, "eval_steps_per_second": 4.648, "step": 88000 }, { "epoch": 0.23, "learning_rate": 0.0002657798077147397, "loss": 0.0258, "step": 88010 }, { "epoch": 0.23, "learning_rate": 0.00026577591949836823, "loss": 0.0243, "step": 88020 }, { "epoch": 0.23, "learning_rate": 0.00026577203128199674, "loss": 0.0249, "step": 88030 }, { "epoch": 0.23, "learning_rate": 0.00026576814306562526, "loss": 0.0247, "step": 88040 }, { "epoch": 0.23, "learning_rate": 0.0002657642548492538, "loss": 0.0197, "step": 88050 }, { "epoch": 0.23, "learning_rate": 0.0002657603666328824, "loss": 0.0195, "step": 88060 }, { "epoch": 0.23, "learning_rate": 0.0002657564784165109, "loss": 0.0263, "step": 88070 }, { "epoch": 0.23, "learning_rate": 0.0002657525902001394, "loss": 0.0211, "step": 88080 }, { "epoch": 0.23, "learning_rate": 0.00026574870198376794, "loss": 0.0204, "step": 88090 }, { "epoch": 0.23, "learning_rate": 0.0002657448137673965, "loss": 0.0286, "step": 88100 }, { "epoch": 0.23, "learning_rate": 0.000265740925551025, "loss": 0.0279, "step": 88110 }, { "epoch": 0.23, "learning_rate": 0.0002657370373346536, "loss": 0.0252, "step": 88120 }, { "epoch": 0.23, "learning_rate": 0.0002657331491182821, "loss": 0.0224, "step": 88130 }, { "epoch": 0.23, "learning_rate": 0.0002657292609019107, "loss": 0.0267, "step": 88140 }, { "epoch": 0.23, "learning_rate": 0.0002657253726855392, "loss": 0.0192, "step": 88150 }, { "epoch": 0.23, "learning_rate": 0.0002657214844691677, "loss": 0.0229, "step": 88160 }, { "epoch": 0.23, "learning_rate": 0.0002657175962527962, "loss": 0.0232, "step": 88170 }, { "epoch": 0.23, "learning_rate": 0.0002657137080364248, "loss": 0.0207, "step": 88180 }, { "epoch": 0.23, "learning_rate": 0.0002657098198200533, "loss": 0.024, "step": 88190 }, { "epoch": 0.23, "learning_rate": 0.00026570593160368187, "loss": 0.0221, "step": 88200 }, { "epoch": 0.23, "learning_rate": 0.0002657020433873104, "loss": 0.02, "step": 88210 }, { "epoch": 0.23, "learning_rate": 0.00026569815517093895, "loss": 0.0225, "step": 88220 }, { "epoch": 0.23, "learning_rate": 0.00026569426695456747, "loss": 0.0172, "step": 88230 }, { "epoch": 0.23, "learning_rate": 0.000265690378738196, "loss": 0.0252, "step": 88240 }, { "epoch": 0.23, "learning_rate": 0.00026568649052182455, "loss": 0.0227, "step": 88250 }, { "epoch": 0.23, "learning_rate": 0.00026568260230545307, "loss": 0.017, "step": 88260 }, { "epoch": 0.23, "learning_rate": 0.00026567871408908163, "loss": 0.0235, "step": 88270 }, { "epoch": 0.23, "learning_rate": 0.00026567482587271015, "loss": 0.0203, "step": 88280 }, { "epoch": 0.23, "learning_rate": 0.00026567093765633866, "loss": 0.026, "step": 88290 }, { "epoch": 0.23, "learning_rate": 0.00026566704943996723, "loss": 0.0215, "step": 88300 }, { "epoch": 0.23, "learning_rate": 0.00026566316122359575, "loss": 0.025, "step": 88310 }, { "epoch": 0.23, "learning_rate": 0.00026565927300722426, "loss": 0.0221, "step": 88320 }, { "epoch": 0.23, "learning_rate": 0.00026565538479085283, "loss": 0.02, "step": 88330 }, { "epoch": 0.23, "learning_rate": 0.00026565149657448134, "loss": 0.0222, "step": 88340 }, { "epoch": 0.23, "learning_rate": 0.0002656476083581099, "loss": 0.0228, "step": 88350 }, { "epoch": 0.23, "learning_rate": 0.00026564372014173843, "loss": 0.0211, "step": 88360 }, { "epoch": 0.23, "learning_rate": 0.00026563983192536694, "loss": 0.0244, "step": 88370 }, { "epoch": 0.23, "learning_rate": 0.00026563594370899546, "loss": 0.0256, "step": 88380 }, { "epoch": 0.23, "learning_rate": 0.000265632055492624, "loss": 0.0229, "step": 88390 }, { "epoch": 0.23, "learning_rate": 0.0002656281672762526, "loss": 0.025, "step": 88400 }, { "epoch": 0.23, "learning_rate": 0.0002656242790598811, "loss": 0.0193, "step": 88410 }, { "epoch": 0.23, "learning_rate": 0.0002656203908435096, "loss": 0.0205, "step": 88420 }, { "epoch": 0.23, "learning_rate": 0.0002656165026271382, "loss": 0.0235, "step": 88430 }, { "epoch": 0.23, "learning_rate": 0.0002656126144107667, "loss": 0.0248, "step": 88440 }, { "epoch": 0.23, "learning_rate": 0.0002656087261943952, "loss": 0.0188, "step": 88450 }, { "epoch": 0.23, "learning_rate": 0.0002656048379780238, "loss": 0.0269, "step": 88460 }, { "epoch": 0.23, "learning_rate": 0.0002656009497616523, "loss": 0.023, "step": 88470 }, { "epoch": 0.23, "learning_rate": 0.0002655970615452809, "loss": 0.0264, "step": 88480 }, { "epoch": 0.23, "learning_rate": 0.0002655931733289094, "loss": 0.0214, "step": 88490 }, { "epoch": 0.23, "learning_rate": 0.0002655892851125379, "loss": 0.0237, "step": 88500 }, { "epoch": 0.23, "learning_rate": 0.00026558539689616647, "loss": 0.0211, "step": 88510 }, { "epoch": 0.23, "learning_rate": 0.000265581508679795, "loss": 0.0235, "step": 88520 }, { "epoch": 0.23, "learning_rate": 0.0002655776204634235, "loss": 0.0257, "step": 88530 }, { "epoch": 0.23, "learning_rate": 0.00026557373224705207, "loss": 0.0251, "step": 88540 }, { "epoch": 0.23, "learning_rate": 0.00026556984403068064, "loss": 0.0271, "step": 88550 }, { "epoch": 0.23, "learning_rate": 0.00026556595581430915, "loss": 0.0292, "step": 88560 }, { "epoch": 0.23, "learning_rate": 0.00026556206759793767, "loss": 0.0197, "step": 88570 }, { "epoch": 0.23, "learning_rate": 0.0002655581793815662, "loss": 0.0228, "step": 88580 }, { "epoch": 0.23, "learning_rate": 0.0002655542911651947, "loss": 0.023, "step": 88590 }, { "epoch": 0.23, "learning_rate": 0.00026555040294882326, "loss": 0.0259, "step": 88600 }, { "epoch": 0.23, "learning_rate": 0.00026554651473245183, "loss": 0.0251, "step": 88610 }, { "epoch": 0.23, "learning_rate": 0.00026554262651608035, "loss": 0.0218, "step": 88620 }, { "epoch": 0.23, "learning_rate": 0.00026553873829970886, "loss": 0.0241, "step": 88630 }, { "epoch": 0.23, "learning_rate": 0.00026553485008333743, "loss": 0.0239, "step": 88640 }, { "epoch": 0.23, "learning_rate": 0.00026553096186696595, "loss": 0.0217, "step": 88650 }, { "epoch": 0.23, "learning_rate": 0.00026552707365059446, "loss": 0.0206, "step": 88660 }, { "epoch": 0.23, "learning_rate": 0.00026552318543422303, "loss": 0.0261, "step": 88670 }, { "epoch": 0.23, "learning_rate": 0.00026551929721785154, "loss": 0.0253, "step": 88680 }, { "epoch": 0.23, "learning_rate": 0.0002655154090014801, "loss": 0.0197, "step": 88690 }, { "epoch": 0.23, "learning_rate": 0.0002655115207851086, "loss": 0.0256, "step": 88700 }, { "epoch": 0.23, "learning_rate": 0.00026550763256873714, "loss": 0.0227, "step": 88710 }, { "epoch": 0.23, "learning_rate": 0.0002655037443523657, "loss": 0.021, "step": 88720 }, { "epoch": 0.23, "learning_rate": 0.0002654998561359942, "loss": 0.0266, "step": 88730 }, { "epoch": 0.23, "learning_rate": 0.00026549596791962274, "loss": 0.0228, "step": 88740 }, { "epoch": 0.23, "learning_rate": 0.0002654920797032513, "loss": 0.0268, "step": 88750 }, { "epoch": 0.23, "learning_rate": 0.0002654881914868799, "loss": 0.0274, "step": 88760 }, { "epoch": 0.23, "learning_rate": 0.0002654843032705084, "loss": 0.0243, "step": 88770 }, { "epoch": 0.23, "learning_rate": 0.0002654804150541369, "loss": 0.0223, "step": 88780 }, { "epoch": 0.23, "learning_rate": 0.0002654765268377654, "loss": 0.0212, "step": 88790 }, { "epoch": 0.23, "learning_rate": 0.000265472638621394, "loss": 0.0233, "step": 88800 }, { "epoch": 0.23, "learning_rate": 0.0002654687504050225, "loss": 0.0243, "step": 88810 }, { "epoch": 0.23, "learning_rate": 0.00026546486218865107, "loss": 0.0226, "step": 88820 }, { "epoch": 0.23, "learning_rate": 0.0002654609739722796, "loss": 0.0213, "step": 88830 }, { "epoch": 0.23, "learning_rate": 0.0002654570857559081, "loss": 0.0223, "step": 88840 }, { "epoch": 0.23, "learning_rate": 0.00026545319753953667, "loss": 0.024, "step": 88850 }, { "epoch": 0.23, "learning_rate": 0.0002654493093231652, "loss": 0.0198, "step": 88860 }, { "epoch": 0.23, "learning_rate": 0.0002654454211067937, "loss": 0.0244, "step": 88870 }, { "epoch": 0.23, "learning_rate": 0.00026544153289042227, "loss": 0.0219, "step": 88880 }, { "epoch": 0.23, "learning_rate": 0.0002654376446740508, "loss": 0.0232, "step": 88890 }, { "epoch": 0.23, "learning_rate": 0.00026543375645767935, "loss": 0.0213, "step": 88900 }, { "epoch": 0.23, "learning_rate": 0.00026542986824130787, "loss": 0.025, "step": 88910 }, { "epoch": 0.23, "learning_rate": 0.0002654259800249364, "loss": 0.0254, "step": 88920 }, { "epoch": 0.23, "learning_rate": 0.00026542209180856495, "loss": 0.0191, "step": 88930 }, { "epoch": 0.23, "learning_rate": 0.00026541820359219346, "loss": 0.0238, "step": 88940 }, { "epoch": 0.23, "learning_rate": 0.00026541431537582203, "loss": 0.0318, "step": 88950 }, { "epoch": 0.23, "learning_rate": 0.00026541042715945055, "loss": 0.03, "step": 88960 }, { "epoch": 0.23, "learning_rate": 0.0002654065389430791, "loss": 0.0256, "step": 88970 }, { "epoch": 0.23, "learning_rate": 0.00026540265072670763, "loss": 0.0204, "step": 88980 }, { "epoch": 0.23, "learning_rate": 0.00026539876251033614, "loss": 0.0232, "step": 88990 }, { "epoch": 0.23, "learning_rate": 0.00026539487429396466, "loss": 0.0214, "step": 89000 }, { "epoch": 0.23, "eval_cer": 0.8818370514688489, "eval_loss": 0.017352329567074776, "eval_runtime": 107.8338, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 89000 }, { "epoch": 0.23, "learning_rate": 0.00026539098607759323, "loss": 0.0279, "step": 89010 }, { "epoch": 0.23, "learning_rate": 0.00026538709786122174, "loss": 0.0255, "step": 89020 }, { "epoch": 0.23, "learning_rate": 0.0002653832096448503, "loss": 0.0242, "step": 89030 }, { "epoch": 0.23, "learning_rate": 0.0002653793214284788, "loss": 0.0247, "step": 89040 }, { "epoch": 0.23, "learning_rate": 0.0002653754332121074, "loss": 0.0216, "step": 89050 }, { "epoch": 0.23, "learning_rate": 0.0002653715449957359, "loss": 0.0241, "step": 89060 }, { "epoch": 0.23, "learning_rate": 0.0002653676567793644, "loss": 0.0189, "step": 89070 }, { "epoch": 0.23, "learning_rate": 0.00026536376856299294, "loss": 0.028, "step": 89080 }, { "epoch": 0.23, "learning_rate": 0.0002653598803466215, "loss": 0.0288, "step": 89090 }, { "epoch": 0.23, "learning_rate": 0.0002653559921302501, "loss": 0.0241, "step": 89100 }, { "epoch": 0.23, "learning_rate": 0.0002653521039138786, "loss": 0.0254, "step": 89110 }, { "epoch": 0.23, "learning_rate": 0.0002653482156975071, "loss": 0.0269, "step": 89120 }, { "epoch": 0.23, "learning_rate": 0.0002653443274811356, "loss": 0.034, "step": 89130 }, { "epoch": 0.23, "learning_rate": 0.0002653404392647642, "loss": 0.0245, "step": 89140 }, { "epoch": 0.23, "learning_rate": 0.0002653365510483927, "loss": 0.031, "step": 89150 }, { "epoch": 0.23, "learning_rate": 0.00026533266283202127, "loss": 0.0258, "step": 89160 }, { "epoch": 0.23, "learning_rate": 0.0002653287746156498, "loss": 0.027, "step": 89170 }, { "epoch": 0.23, "learning_rate": 0.00026532488639927835, "loss": 0.0232, "step": 89180 }, { "epoch": 0.23, "learning_rate": 0.00026532099818290687, "loss": 0.0256, "step": 89190 }, { "epoch": 0.23, "learning_rate": 0.0002653171099665354, "loss": 0.0192, "step": 89200 }, { "epoch": 0.23, "learning_rate": 0.0002653132217501639, "loss": 0.0295, "step": 89210 }, { "epoch": 0.23, "learning_rate": 0.00026530933353379247, "loss": 0.0272, "step": 89220 }, { "epoch": 0.23, "learning_rate": 0.000265305445317421, "loss": 0.0266, "step": 89230 }, { "epoch": 0.23, "learning_rate": 0.00026530155710104955, "loss": 0.0196, "step": 89240 }, { "epoch": 0.23, "learning_rate": 0.00026529766888467806, "loss": 0.0235, "step": 89250 }, { "epoch": 0.23, "learning_rate": 0.00026529378066830663, "loss": 0.0195, "step": 89260 }, { "epoch": 0.23, "learning_rate": 0.00026528989245193515, "loss": 0.0224, "step": 89270 }, { "epoch": 0.23, "learning_rate": 0.00026528600423556366, "loss": 0.0279, "step": 89280 }, { "epoch": 0.23, "learning_rate": 0.0002652821160191922, "loss": 0.0232, "step": 89290 }, { "epoch": 0.23, "learning_rate": 0.00026527822780282075, "loss": 0.0271, "step": 89300 }, { "epoch": 0.23, "learning_rate": 0.0002652743395864493, "loss": 0.0241, "step": 89310 }, { "epoch": 0.23, "learning_rate": 0.00026527045137007783, "loss": 0.0247, "step": 89320 }, { "epoch": 0.23, "learning_rate": 0.00026526656315370634, "loss": 0.0229, "step": 89330 }, { "epoch": 0.23, "learning_rate": 0.00026526267493733486, "loss": 0.0221, "step": 89340 }, { "epoch": 0.23, "learning_rate": 0.0002652587867209634, "loss": 0.024, "step": 89350 }, { "epoch": 0.23, "learning_rate": 0.00026525489850459194, "loss": 0.0245, "step": 89360 }, { "epoch": 0.23, "learning_rate": 0.0002652510102882205, "loss": 0.0196, "step": 89370 }, { "epoch": 0.23, "learning_rate": 0.000265247122071849, "loss": 0.0232, "step": 89380 }, { "epoch": 0.23, "learning_rate": 0.0002652432338554776, "loss": 0.0187, "step": 89390 }, { "epoch": 0.23, "learning_rate": 0.0002652393456391061, "loss": 0.0218, "step": 89400 }, { "epoch": 0.23, "learning_rate": 0.0002652354574227346, "loss": 0.0266, "step": 89410 }, { "epoch": 0.23, "learning_rate": 0.00026523156920636314, "loss": 0.0218, "step": 89420 }, { "epoch": 0.23, "learning_rate": 0.0002652276809899917, "loss": 0.0229, "step": 89430 }, { "epoch": 0.23, "learning_rate": 0.0002652237927736202, "loss": 0.0211, "step": 89440 }, { "epoch": 0.23, "learning_rate": 0.0002652199045572488, "loss": 0.0227, "step": 89450 }, { "epoch": 0.23, "learning_rate": 0.0002652160163408773, "loss": 0.026, "step": 89460 }, { "epoch": 0.23, "learning_rate": 0.00026521212812450587, "loss": 0.0218, "step": 89470 }, { "epoch": 0.23, "learning_rate": 0.0002652082399081344, "loss": 0.0222, "step": 89480 }, { "epoch": 0.23, "learning_rate": 0.0002652043516917629, "loss": 0.0207, "step": 89490 }, { "epoch": 0.23, "learning_rate": 0.00026520046347539147, "loss": 0.0222, "step": 89500 }, { "epoch": 0.23, "learning_rate": 0.00026519657525902, "loss": 0.0214, "step": 89510 }, { "epoch": 0.23, "learning_rate": 0.00026519268704264855, "loss": 0.0189, "step": 89520 }, { "epoch": 0.23, "learning_rate": 0.00026518879882627707, "loss": 0.0243, "step": 89530 }, { "epoch": 0.23, "learning_rate": 0.0002651849106099056, "loss": 0.0208, "step": 89540 }, { "epoch": 0.23, "learning_rate": 0.00026518102239353415, "loss": 0.0213, "step": 89550 }, { "epoch": 0.23, "learning_rate": 0.00026517713417716267, "loss": 0.0214, "step": 89560 }, { "epoch": 0.23, "learning_rate": 0.0002651732459607912, "loss": 0.0227, "step": 89570 }, { "epoch": 0.23, "learning_rate": 0.00026516935774441975, "loss": 0.0286, "step": 89580 }, { "epoch": 0.23, "learning_rate": 0.00026516546952804826, "loss": 0.0222, "step": 89590 }, { "epoch": 0.23, "learning_rate": 0.00026516158131167683, "loss": 0.028, "step": 89600 }, { "epoch": 0.23, "learning_rate": 0.00026515769309530535, "loss": 0.0208, "step": 89610 }, { "epoch": 0.23, "learning_rate": 0.00026515380487893386, "loss": 0.0227, "step": 89620 }, { "epoch": 0.23, "learning_rate": 0.0002651499166625624, "loss": 0.02, "step": 89630 }, { "epoch": 0.23, "learning_rate": 0.00026514602844619094, "loss": 0.024, "step": 89640 }, { "epoch": 0.23, "learning_rate": 0.0002651421402298195, "loss": 0.0233, "step": 89650 }, { "epoch": 0.23, "learning_rate": 0.00026513825201344803, "loss": 0.0219, "step": 89660 }, { "epoch": 0.23, "learning_rate": 0.00026513436379707654, "loss": 0.0228, "step": 89670 }, { "epoch": 0.23, "learning_rate": 0.0002651304755807051, "loss": 0.0218, "step": 89680 }, { "epoch": 0.23, "learning_rate": 0.0002651265873643336, "loss": 0.0248, "step": 89690 }, { "epoch": 0.23, "learning_rate": 0.00026512269914796214, "loss": 0.0289, "step": 89700 }, { "epoch": 0.23, "learning_rate": 0.0002651188109315907, "loss": 0.023, "step": 89710 }, { "epoch": 0.23, "learning_rate": 0.0002651149227152192, "loss": 0.0194, "step": 89720 }, { "epoch": 0.23, "learning_rate": 0.0002651110344988478, "loss": 0.0206, "step": 89730 }, { "epoch": 0.23, "learning_rate": 0.0002651071462824763, "loss": 0.0258, "step": 89740 }, { "epoch": 0.23, "learning_rate": 0.0002651032580661048, "loss": 0.0208, "step": 89750 }, { "epoch": 0.23, "learning_rate": 0.0002650993698497334, "loss": 0.0228, "step": 89760 }, { "epoch": 0.23, "learning_rate": 0.0002650954816333619, "loss": 0.0232, "step": 89770 }, { "epoch": 0.23, "learning_rate": 0.0002650915934169904, "loss": 0.0242, "step": 89780 }, { "epoch": 0.23, "learning_rate": 0.000265087705200619, "loss": 0.0218, "step": 89790 }, { "epoch": 0.23, "learning_rate": 0.00026508381698424756, "loss": 0.0228, "step": 89800 }, { "epoch": 0.23, "learning_rate": 0.00026507992876787607, "loss": 0.0245, "step": 89810 }, { "epoch": 0.23, "learning_rate": 0.0002650760405515046, "loss": 0.024, "step": 89820 }, { "epoch": 0.23, "learning_rate": 0.0002650721523351331, "loss": 0.0252, "step": 89830 }, { "epoch": 0.23, "learning_rate": 0.0002650682641187616, "loss": 0.0286, "step": 89840 }, { "epoch": 0.23, "learning_rate": 0.0002650643759023902, "loss": 0.0223, "step": 89850 }, { "epoch": 0.23, "learning_rate": 0.00026506048768601875, "loss": 0.0191, "step": 89860 }, { "epoch": 0.23, "learning_rate": 0.00026505659946964727, "loss": 0.0219, "step": 89870 }, { "epoch": 0.23, "learning_rate": 0.0002650527112532758, "loss": 0.0276, "step": 89880 }, { "epoch": 0.23, "learning_rate": 0.00026504882303690435, "loss": 0.0242, "step": 89890 }, { "epoch": 0.23, "learning_rate": 0.00026504493482053286, "loss": 0.0239, "step": 89900 }, { "epoch": 0.23, "learning_rate": 0.0002650410466041614, "loss": 0.0223, "step": 89910 }, { "epoch": 0.23, "learning_rate": 0.00026503715838778995, "loss": 0.0198, "step": 89920 }, { "epoch": 0.23, "learning_rate": 0.00026503327017141846, "loss": 0.0223, "step": 89930 }, { "epoch": 0.23, "learning_rate": 0.00026502938195504703, "loss": 0.028, "step": 89940 }, { "epoch": 0.23, "learning_rate": 0.00026502549373867555, "loss": 0.0261, "step": 89950 }, { "epoch": 0.23, "learning_rate": 0.00026502160552230406, "loss": 0.0237, "step": 89960 }, { "epoch": 0.23, "learning_rate": 0.00026501771730593263, "loss": 0.025, "step": 89970 }, { "epoch": 0.23, "learning_rate": 0.00026501382908956114, "loss": 0.0226, "step": 89980 }, { "epoch": 0.23, "learning_rate": 0.0002650099408731897, "loss": 0.0293, "step": 89990 }, { "epoch": 0.23, "learning_rate": 0.0002650060526568182, "loss": 0.0216, "step": 90000 }, { "epoch": 0.23, "eval_cer": 0.8817908634500211, "eval_loss": 0.016553279012441635, "eval_runtime": 107.9226, "eval_samples_per_second": 18.532, "eval_steps_per_second": 4.633, "step": 90000 }, { "epoch": 0.23, "learning_rate": 0.0002650021644404468, "loss": 0.0248, "step": 90010 }, { "epoch": 0.23, "learning_rate": 0.0002649982762240753, "loss": 0.0222, "step": 90020 }, { "epoch": 0.23, "learning_rate": 0.0002649943880077038, "loss": 0.0301, "step": 90030 }, { "epoch": 0.23, "learning_rate": 0.00026499049979133234, "loss": 0.0276, "step": 90040 }, { "epoch": 0.23, "learning_rate": 0.0002649866115749609, "loss": 0.0208, "step": 90050 }, { "epoch": 0.23, "learning_rate": 0.0002649827233585894, "loss": 0.0272, "step": 90060 }, { "epoch": 0.23, "learning_rate": 0.000264978835142218, "loss": 0.025, "step": 90070 }, { "epoch": 0.23, "learning_rate": 0.0002649749469258465, "loss": 0.0236, "step": 90080 }, { "epoch": 0.23, "learning_rate": 0.000264971058709475, "loss": 0.02, "step": 90090 }, { "epoch": 0.23, "learning_rate": 0.0002649671704931036, "loss": 0.0234, "step": 90100 }, { "epoch": 0.23, "learning_rate": 0.0002649632822767321, "loss": 0.0252, "step": 90110 }, { "epoch": 0.23, "learning_rate": 0.0002649593940603606, "loss": 0.0217, "step": 90120 }, { "epoch": 0.23, "learning_rate": 0.0002649555058439892, "loss": 0.0208, "step": 90130 }, { "epoch": 0.23, "learning_rate": 0.00026495161762761776, "loss": 0.0267, "step": 90140 }, { "epoch": 0.23, "learning_rate": 0.00026494772941124627, "loss": 0.0237, "step": 90150 }, { "epoch": 0.23, "learning_rate": 0.0002649438411948748, "loss": 0.0224, "step": 90160 }, { "epoch": 0.23, "learning_rate": 0.0002649399529785033, "loss": 0.0245, "step": 90170 }, { "epoch": 0.23, "learning_rate": 0.00026493606476213187, "loss": 0.0193, "step": 90180 }, { "epoch": 0.23, "learning_rate": 0.0002649321765457604, "loss": 0.0224, "step": 90190 }, { "epoch": 0.23, "learning_rate": 0.00026492828832938895, "loss": 0.0214, "step": 90200 }, { "epoch": 0.23, "learning_rate": 0.00026492440011301747, "loss": 0.0257, "step": 90210 }, { "epoch": 0.23, "learning_rate": 0.00026492051189664603, "loss": 0.0214, "step": 90220 }, { "epoch": 0.23, "learning_rate": 0.00026491662368027455, "loss": 0.0227, "step": 90230 }, { "epoch": 0.23, "learning_rate": 0.00026491273546390306, "loss": 0.0307, "step": 90240 }, { "epoch": 0.23, "learning_rate": 0.0002649088472475316, "loss": 0.0233, "step": 90250 }, { "epoch": 0.23, "learning_rate": 0.00026490495903116015, "loss": 0.0292, "step": 90260 }, { "epoch": 0.23, "learning_rate": 0.00026490107081478866, "loss": 0.0223, "step": 90270 }, { "epoch": 0.23, "learning_rate": 0.00026489718259841723, "loss": 0.0219, "step": 90280 }, { "epoch": 0.23, "learning_rate": 0.00026489329438204574, "loss": 0.0218, "step": 90290 }, { "epoch": 0.23, "learning_rate": 0.0002648894061656743, "loss": 0.0248, "step": 90300 }, { "epoch": 0.23, "learning_rate": 0.00026488551794930283, "loss": 0.0229, "step": 90310 }, { "epoch": 0.23, "learning_rate": 0.00026488162973293134, "loss": 0.0276, "step": 90320 }, { "epoch": 0.23, "learning_rate": 0.00026487774151655986, "loss": 0.0322, "step": 90330 }, { "epoch": 0.23, "learning_rate": 0.0002648738533001884, "loss": 0.025, "step": 90340 }, { "epoch": 0.23, "learning_rate": 0.000264869965083817, "loss": 0.0259, "step": 90350 }, { "epoch": 0.23, "learning_rate": 0.0002648660768674455, "loss": 0.0236, "step": 90360 }, { "epoch": 0.23, "learning_rate": 0.000264862188651074, "loss": 0.0214, "step": 90370 }, { "epoch": 0.23, "learning_rate": 0.00026485830043470254, "loss": 0.0258, "step": 90380 }, { "epoch": 0.23, "learning_rate": 0.0002648544122183311, "loss": 0.0252, "step": 90390 }, { "epoch": 0.23, "learning_rate": 0.0002648505240019596, "loss": 0.0248, "step": 90400 }, { "epoch": 0.23, "learning_rate": 0.0002648466357855882, "loss": 0.0182, "step": 90410 }, { "epoch": 0.23, "learning_rate": 0.0002648427475692167, "loss": 0.0244, "step": 90420 }, { "epoch": 0.23, "learning_rate": 0.0002648388593528453, "loss": 0.0302, "step": 90430 }, { "epoch": 0.23, "learning_rate": 0.0002648349711364738, "loss": 0.0194, "step": 90440 }, { "epoch": 0.23, "learning_rate": 0.0002648310829201023, "loss": 0.0249, "step": 90450 }, { "epoch": 0.23, "learning_rate": 0.0002648271947037308, "loss": 0.0208, "step": 90460 }, { "epoch": 0.23, "learning_rate": 0.0002648233064873594, "loss": 0.0227, "step": 90470 }, { "epoch": 0.23, "learning_rate": 0.0002648194182709879, "loss": 0.0315, "step": 90480 }, { "epoch": 0.23, "learning_rate": 0.00026481553005461647, "loss": 0.0255, "step": 90490 }, { "epoch": 0.23, "learning_rate": 0.000264811641838245, "loss": 0.0182, "step": 90500 }, { "epoch": 0.23, "learning_rate": 0.00026480775362187355, "loss": 0.024, "step": 90510 }, { "epoch": 0.23, "learning_rate": 0.00026480386540550207, "loss": 0.0215, "step": 90520 }, { "epoch": 0.23, "learning_rate": 0.0002647999771891306, "loss": 0.0251, "step": 90530 }, { "epoch": 0.23, "learning_rate": 0.00026479608897275915, "loss": 0.0241, "step": 90540 }, { "epoch": 0.23, "learning_rate": 0.00026479220075638766, "loss": 0.0233, "step": 90550 }, { "epoch": 0.23, "learning_rate": 0.00026478831254001623, "loss": 0.023, "step": 90560 }, { "epoch": 0.23, "learning_rate": 0.00026478442432364475, "loss": 0.0267, "step": 90570 }, { "epoch": 0.23, "learning_rate": 0.00026478053610727326, "loss": 0.0205, "step": 90580 }, { "epoch": 0.23, "learning_rate": 0.0002647766478909018, "loss": 0.0202, "step": 90590 }, { "epoch": 0.23, "learning_rate": 0.00026477275967453035, "loss": 0.0228, "step": 90600 }, { "epoch": 0.23, "learning_rate": 0.00026476887145815886, "loss": 0.0229, "step": 90610 }, { "epoch": 0.23, "learning_rate": 0.00026476498324178743, "loss": 0.0302, "step": 90620 }, { "epoch": 0.23, "learning_rate": 0.00026476109502541594, "loss": 0.0241, "step": 90630 }, { "epoch": 0.23, "learning_rate": 0.0002647572068090445, "loss": 0.0227, "step": 90640 }, { "epoch": 0.23, "learning_rate": 0.000264753318592673, "loss": 0.024, "step": 90650 }, { "epoch": 0.24, "learning_rate": 0.00026474943037630154, "loss": 0.0269, "step": 90660 }, { "epoch": 0.24, "learning_rate": 0.00026474554215993006, "loss": 0.0262, "step": 90670 }, { "epoch": 0.24, "learning_rate": 0.0002647416539435586, "loss": 0.0245, "step": 90680 }, { "epoch": 0.24, "learning_rate": 0.0002647377657271872, "loss": 0.0231, "step": 90690 }, { "epoch": 0.24, "learning_rate": 0.0002647338775108157, "loss": 0.0242, "step": 90700 }, { "epoch": 0.24, "learning_rate": 0.0002647299892944442, "loss": 0.0248, "step": 90710 }, { "epoch": 0.24, "learning_rate": 0.0002647261010780728, "loss": 0.0253, "step": 90720 }, { "epoch": 0.24, "learning_rate": 0.0002647222128617013, "loss": 0.0251, "step": 90730 }, { "epoch": 0.24, "learning_rate": 0.0002647183246453298, "loss": 0.0212, "step": 90740 }, { "epoch": 0.24, "learning_rate": 0.0002647144364289584, "loss": 0.0184, "step": 90750 }, { "epoch": 0.24, "learning_rate": 0.0002647105482125869, "loss": 0.0244, "step": 90760 }, { "epoch": 0.24, "learning_rate": 0.00026470665999621547, "loss": 0.0194, "step": 90770 }, { "epoch": 0.24, "learning_rate": 0.000264702771779844, "loss": 0.0215, "step": 90780 }, { "epoch": 0.24, "learning_rate": 0.0002646988835634725, "loss": 0.021, "step": 90790 }, { "epoch": 0.24, "learning_rate": 0.00026469499534710107, "loss": 0.0274, "step": 90800 }, { "epoch": 0.24, "learning_rate": 0.0002646911071307296, "loss": 0.0228, "step": 90810 }, { "epoch": 0.24, "learning_rate": 0.0002646872189143581, "loss": 0.0266, "step": 90820 }, { "epoch": 0.24, "learning_rate": 0.00026468333069798667, "loss": 0.0224, "step": 90830 }, { "epoch": 0.24, "learning_rate": 0.0002646794424816152, "loss": 0.0233, "step": 90840 }, { "epoch": 0.24, "learning_rate": 0.00026467555426524375, "loss": 0.0257, "step": 90850 }, { "epoch": 0.24, "learning_rate": 0.00026467166604887227, "loss": 0.0223, "step": 90860 }, { "epoch": 0.24, "learning_rate": 0.0002646677778325008, "loss": 0.0226, "step": 90870 }, { "epoch": 0.24, "learning_rate": 0.0002646638896161293, "loss": 0.0302, "step": 90880 }, { "epoch": 0.24, "learning_rate": 0.00026466000139975786, "loss": 0.0241, "step": 90890 }, { "epoch": 0.24, "learning_rate": 0.00026465611318338643, "loss": 0.0209, "step": 90900 }, { "epoch": 0.24, "learning_rate": 0.00026465222496701495, "loss": 0.0247, "step": 90910 }, { "epoch": 0.24, "learning_rate": 0.00026464833675064346, "loss": 0.0226, "step": 90920 }, { "epoch": 0.24, "learning_rate": 0.00026464444853427203, "loss": 0.0227, "step": 90930 }, { "epoch": 0.24, "learning_rate": 0.00026464056031790054, "loss": 0.0215, "step": 90940 }, { "epoch": 0.24, "learning_rate": 0.00026463667210152906, "loss": 0.0187, "step": 90950 }, { "epoch": 0.24, "learning_rate": 0.00026463278388515763, "loss": 0.0236, "step": 90960 }, { "epoch": 0.24, "learning_rate": 0.00026462889566878614, "loss": 0.0259, "step": 90970 }, { "epoch": 0.24, "learning_rate": 0.0002646250074524147, "loss": 0.0225, "step": 90980 }, { "epoch": 0.24, "learning_rate": 0.0002646211192360432, "loss": 0.0193, "step": 90990 }, { "epoch": 0.24, "learning_rate": 0.00026461723101967174, "loss": 0.0276, "step": 91000 }, { "epoch": 0.24, "eval_cer": 0.8817712685329425, "eval_loss": 0.01665649563074112, "eval_runtime": 107.8663, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 91000 }, { "epoch": 0.24, "learning_rate": 0.0002646133428033003, "loss": 0.0229, "step": 91010 }, { "epoch": 0.24, "learning_rate": 0.0002646094545869288, "loss": 0.0249, "step": 91020 }, { "epoch": 0.24, "learning_rate": 0.00026460556637055734, "loss": 0.0241, "step": 91030 }, { "epoch": 0.24, "learning_rate": 0.0002646016781541859, "loss": 0.024, "step": 91040 }, { "epoch": 0.24, "learning_rate": 0.0002645977899378145, "loss": 0.0218, "step": 91050 }, { "epoch": 0.24, "learning_rate": 0.000264593901721443, "loss": 0.0206, "step": 91060 }, { "epoch": 0.24, "learning_rate": 0.0002645900135050715, "loss": 0.0247, "step": 91070 }, { "epoch": 0.24, "learning_rate": 0.0002645861252887, "loss": 0.027, "step": 91080 }, { "epoch": 0.24, "learning_rate": 0.0002645822370723286, "loss": 0.0251, "step": 91090 }, { "epoch": 0.24, "learning_rate": 0.0002645783488559571, "loss": 0.0222, "step": 91100 }, { "epoch": 0.24, "learning_rate": 0.00026457446063958567, "loss": 0.0186, "step": 91110 }, { "epoch": 0.24, "learning_rate": 0.0002645705724232142, "loss": 0.0212, "step": 91120 }, { "epoch": 0.24, "learning_rate": 0.0002645666842068427, "loss": 0.0225, "step": 91130 }, { "epoch": 0.24, "learning_rate": 0.00026456279599047127, "loss": 0.0313, "step": 91140 }, { "epoch": 0.24, "learning_rate": 0.0002645589077740998, "loss": 0.0237, "step": 91150 }, { "epoch": 0.24, "learning_rate": 0.0002645550195577283, "loss": 0.0196, "step": 91160 }, { "epoch": 0.24, "learning_rate": 0.00026455113134135687, "loss": 0.0213, "step": 91170 }, { "epoch": 0.24, "learning_rate": 0.00026454724312498544, "loss": 0.0243, "step": 91180 }, { "epoch": 0.24, "learning_rate": 0.00026454335490861395, "loss": 0.0213, "step": 91190 }, { "epoch": 0.24, "learning_rate": 0.00026453946669224246, "loss": 0.0206, "step": 91200 }, { "epoch": 0.24, "learning_rate": 0.000264535578475871, "loss": 0.0234, "step": 91210 }, { "epoch": 0.24, "learning_rate": 0.00026453169025949955, "loss": 0.0234, "step": 91220 }, { "epoch": 0.24, "learning_rate": 0.00026452780204312806, "loss": 0.0281, "step": 91230 }, { "epoch": 0.24, "learning_rate": 0.00026452391382675663, "loss": 0.0243, "step": 91240 }, { "epoch": 0.24, "learning_rate": 0.00026452002561038515, "loss": 0.0278, "step": 91250 }, { "epoch": 0.24, "learning_rate": 0.0002645161373940137, "loss": 0.0222, "step": 91260 }, { "epoch": 0.24, "learning_rate": 0.00026451224917764223, "loss": 0.0227, "step": 91270 }, { "epoch": 0.24, "learning_rate": 0.00026450836096127074, "loss": 0.0222, "step": 91280 }, { "epoch": 0.24, "learning_rate": 0.00026450447274489926, "loss": 0.0293, "step": 91290 }, { "epoch": 0.24, "learning_rate": 0.0002645005845285278, "loss": 0.023, "step": 91300 }, { "epoch": 0.24, "learning_rate": 0.00026449669631215634, "loss": 0.0244, "step": 91310 }, { "epoch": 0.24, "learning_rate": 0.0002644928080957849, "loss": 0.0232, "step": 91320 }, { "epoch": 0.24, "learning_rate": 0.0002644889198794134, "loss": 0.0254, "step": 91330 }, { "epoch": 0.24, "learning_rate": 0.00026448503166304194, "loss": 0.0213, "step": 91340 }, { "epoch": 0.24, "learning_rate": 0.0002644811434466705, "loss": 0.0227, "step": 91350 }, { "epoch": 0.24, "learning_rate": 0.000264477255230299, "loss": 0.0255, "step": 91360 }, { "epoch": 0.24, "learning_rate": 0.00026447336701392754, "loss": 0.0234, "step": 91370 }, { "epoch": 0.24, "learning_rate": 0.0002644694787975561, "loss": 0.0234, "step": 91380 }, { "epoch": 0.24, "learning_rate": 0.0002644655905811847, "loss": 0.0242, "step": 91390 }, { "epoch": 0.24, "learning_rate": 0.0002644617023648132, "loss": 0.0236, "step": 91400 }, { "epoch": 0.24, "learning_rate": 0.0002644578141484417, "loss": 0.0179, "step": 91410 }, { "epoch": 0.24, "learning_rate": 0.0002644539259320702, "loss": 0.0289, "step": 91420 }, { "epoch": 0.24, "learning_rate": 0.0002644500377156988, "loss": 0.0207, "step": 91430 }, { "epoch": 0.24, "learning_rate": 0.0002644461494993273, "loss": 0.0259, "step": 91440 }, { "epoch": 0.24, "learning_rate": 0.00026444226128295587, "loss": 0.0192, "step": 91450 }, { "epoch": 0.24, "learning_rate": 0.0002644383730665844, "loss": 0.0186, "step": 91460 }, { "epoch": 0.24, "learning_rate": 0.00026443448485021295, "loss": 0.0195, "step": 91470 }, { "epoch": 0.24, "learning_rate": 0.00026443059663384147, "loss": 0.0201, "step": 91480 }, { "epoch": 0.24, "learning_rate": 0.00026442670841747, "loss": 0.0207, "step": 91490 }, { "epoch": 0.24, "learning_rate": 0.0002644228202010985, "loss": 0.0218, "step": 91500 }, { "epoch": 0.24, "learning_rate": 0.00026441893198472707, "loss": 0.0231, "step": 91510 }, { "epoch": 0.24, "learning_rate": 0.0002644150437683556, "loss": 0.0226, "step": 91520 }, { "epoch": 0.24, "learning_rate": 0.00026441115555198415, "loss": 0.022, "step": 91530 }, { "epoch": 0.24, "learning_rate": 0.00026440726733561266, "loss": 0.0249, "step": 91540 }, { "epoch": 0.24, "learning_rate": 0.00026440337911924123, "loss": 0.0238, "step": 91550 }, { "epoch": 0.24, "learning_rate": 0.00026439949090286975, "loss": 0.0216, "step": 91560 }, { "epoch": 0.24, "learning_rate": 0.00026439560268649826, "loss": 0.0273, "step": 91570 }, { "epoch": 0.24, "learning_rate": 0.00026439171447012683, "loss": 0.0245, "step": 91580 }, { "epoch": 0.24, "learning_rate": 0.00026438782625375534, "loss": 0.02, "step": 91590 }, { "epoch": 0.24, "learning_rate": 0.0002643839380373839, "loss": 0.0192, "step": 91600 }, { "epoch": 0.24, "learning_rate": 0.00026438004982101243, "loss": 0.0261, "step": 91610 }, { "epoch": 0.24, "learning_rate": 0.00026437616160464094, "loss": 0.0234, "step": 91620 }, { "epoch": 0.24, "learning_rate": 0.00026437227338826946, "loss": 0.0193, "step": 91630 }, { "epoch": 0.24, "learning_rate": 0.000264368385171898, "loss": 0.0206, "step": 91640 }, { "epoch": 0.24, "learning_rate": 0.00026436449695552654, "loss": 0.0219, "step": 91650 }, { "epoch": 0.24, "learning_rate": 0.0002643606087391551, "loss": 0.0233, "step": 91660 }, { "epoch": 0.24, "learning_rate": 0.0002643567205227836, "loss": 0.0254, "step": 91670 }, { "epoch": 0.24, "learning_rate": 0.0002643528323064122, "loss": 0.0265, "step": 91680 }, { "epoch": 0.24, "learning_rate": 0.0002643489440900407, "loss": 0.0223, "step": 91690 }, { "epoch": 0.24, "learning_rate": 0.0002643450558736692, "loss": 0.0236, "step": 91700 }, { "epoch": 0.24, "learning_rate": 0.00026434116765729774, "loss": 0.0263, "step": 91710 }, { "epoch": 0.24, "learning_rate": 0.0002643372794409263, "loss": 0.0239, "step": 91720 }, { "epoch": 0.24, "learning_rate": 0.0002643333912245549, "loss": 0.0206, "step": 91730 }, { "epoch": 0.24, "learning_rate": 0.0002643295030081834, "loss": 0.0224, "step": 91740 }, { "epoch": 0.24, "learning_rate": 0.0002643256147918119, "loss": 0.0244, "step": 91750 }, { "epoch": 0.24, "learning_rate": 0.00026432172657544047, "loss": 0.0227, "step": 91760 }, { "epoch": 0.24, "learning_rate": 0.000264317838359069, "loss": 0.0255, "step": 91770 }, { "epoch": 0.24, "learning_rate": 0.0002643139501426975, "loss": 0.0223, "step": 91780 }, { "epoch": 0.24, "learning_rate": 0.00026431006192632607, "loss": 0.0219, "step": 91790 }, { "epoch": 0.24, "learning_rate": 0.0002643061737099546, "loss": 0.0253, "step": 91800 }, { "epoch": 0.24, "learning_rate": 0.00026430228549358315, "loss": 0.0257, "step": 91810 }, { "epoch": 0.24, "learning_rate": 0.00026429839727721167, "loss": 0.0213, "step": 91820 }, { "epoch": 0.24, "learning_rate": 0.0002642945090608402, "loss": 0.0212, "step": 91830 }, { "epoch": 0.24, "learning_rate": 0.0002642906208444687, "loss": 0.022, "step": 91840 }, { "epoch": 0.24, "learning_rate": 0.00026428673262809726, "loss": 0.0252, "step": 91850 }, { "epoch": 0.24, "learning_rate": 0.0002642828444117258, "loss": 0.0264, "step": 91860 }, { "epoch": 0.24, "learning_rate": 0.00026427895619535435, "loss": 0.0204, "step": 91870 }, { "epoch": 0.24, "learning_rate": 0.00026427506797898286, "loss": 0.0252, "step": 91880 }, { "epoch": 0.24, "learning_rate": 0.00026427117976261143, "loss": 0.0242, "step": 91890 }, { "epoch": 0.24, "learning_rate": 0.00026426729154623995, "loss": 0.0243, "step": 91900 }, { "epoch": 0.24, "learning_rate": 0.00026426340332986846, "loss": 0.0231, "step": 91910 }, { "epoch": 0.24, "learning_rate": 0.000264259515113497, "loss": 0.0237, "step": 91920 }, { "epoch": 0.24, "learning_rate": 0.00026425562689712554, "loss": 0.0241, "step": 91930 }, { "epoch": 0.24, "learning_rate": 0.0002642517386807541, "loss": 0.0211, "step": 91940 }, { "epoch": 0.24, "learning_rate": 0.0002642478504643826, "loss": 0.0227, "step": 91950 }, { "epoch": 0.24, "learning_rate": 0.00026424396224801114, "loss": 0.0242, "step": 91960 }, { "epoch": 0.24, "learning_rate": 0.0002642400740316397, "loss": 0.0209, "step": 91970 }, { "epoch": 0.24, "learning_rate": 0.0002642361858152682, "loss": 0.025, "step": 91980 }, { "epoch": 0.24, "learning_rate": 0.00026423229759889674, "loss": 0.0241, "step": 91990 }, { "epoch": 0.24, "learning_rate": 0.0002642284093825253, "loss": 0.021, "step": 92000 }, { "epoch": 0.24, "eval_cer": 0.881813257640968, "eval_loss": 0.01661667600274086, "eval_runtime": 108.0448, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 92000 }, { "epoch": 0.24, "learning_rate": 0.0002642245211661538, "loss": 0.023, "step": 92010 }, { "epoch": 0.24, "learning_rate": 0.0002642206329497824, "loss": 0.0262, "step": 92020 }, { "epoch": 0.24, "learning_rate": 0.0002642167447334109, "loss": 0.0172, "step": 92030 }, { "epoch": 0.24, "learning_rate": 0.0002642128565170394, "loss": 0.0251, "step": 92040 }, { "epoch": 0.24, "learning_rate": 0.00026420896830066793, "loss": 0.0206, "step": 92050 }, { "epoch": 0.24, "learning_rate": 0.0002642050800842965, "loss": 0.0226, "step": 92060 }, { "epoch": 0.24, "learning_rate": 0.000264201191867925, "loss": 0.0262, "step": 92070 }, { "epoch": 0.24, "learning_rate": 0.0002641973036515536, "loss": 0.0224, "step": 92080 }, { "epoch": 0.24, "learning_rate": 0.0002641934154351821, "loss": 0.0252, "step": 92090 }, { "epoch": 0.24, "learning_rate": 0.00026418952721881067, "loss": 0.0276, "step": 92100 }, { "epoch": 0.24, "learning_rate": 0.0002641856390024392, "loss": 0.0239, "step": 92110 }, { "epoch": 0.24, "learning_rate": 0.0002641817507860677, "loss": 0.0231, "step": 92120 }, { "epoch": 0.24, "learning_rate": 0.00026417786256969627, "loss": 0.029, "step": 92130 }, { "epoch": 0.24, "learning_rate": 0.0002641739743533248, "loss": 0.0256, "step": 92140 }, { "epoch": 0.24, "learning_rate": 0.00026417008613695335, "loss": 0.0206, "step": 92150 }, { "epoch": 0.24, "learning_rate": 0.00026416619792058187, "loss": 0.0234, "step": 92160 }, { "epoch": 0.24, "learning_rate": 0.0002641623097042104, "loss": 0.0239, "step": 92170 }, { "epoch": 0.24, "learning_rate": 0.00026415842148783895, "loss": 0.0247, "step": 92180 }, { "epoch": 0.24, "learning_rate": 0.00026415453327146746, "loss": 0.028, "step": 92190 }, { "epoch": 0.24, "learning_rate": 0.000264150645055096, "loss": 0.023, "step": 92200 }, { "epoch": 0.24, "learning_rate": 0.00026414675683872455, "loss": 0.027, "step": 92210 }, { "epoch": 0.24, "learning_rate": 0.00026414286862235306, "loss": 0.0219, "step": 92220 }, { "epoch": 0.24, "learning_rate": 0.00026413898040598163, "loss": 0.0177, "step": 92230 }, { "epoch": 0.24, "learning_rate": 0.00026413509218961014, "loss": 0.0214, "step": 92240 }, { "epoch": 0.24, "learning_rate": 0.00026413120397323866, "loss": 0.0281, "step": 92250 }, { "epoch": 0.24, "learning_rate": 0.00026412731575686723, "loss": 0.025, "step": 92260 }, { "epoch": 0.24, "learning_rate": 0.00026412342754049574, "loss": 0.0286, "step": 92270 }, { "epoch": 0.24, "learning_rate": 0.0002641195393241243, "loss": 0.0233, "step": 92280 }, { "epoch": 0.24, "learning_rate": 0.0002641156511077528, "loss": 0.0201, "step": 92290 }, { "epoch": 0.24, "learning_rate": 0.00026411176289138134, "loss": 0.0218, "step": 92300 }, { "epoch": 0.24, "learning_rate": 0.0002641078746750099, "loss": 0.0286, "step": 92310 }, { "epoch": 0.24, "learning_rate": 0.0002641039864586384, "loss": 0.0216, "step": 92320 }, { "epoch": 0.24, "learning_rate": 0.00026410009824226694, "loss": 0.0227, "step": 92330 }, { "epoch": 0.24, "learning_rate": 0.0002640962100258955, "loss": 0.0204, "step": 92340 }, { "epoch": 0.24, "learning_rate": 0.000264092321809524, "loss": 0.0247, "step": 92350 }, { "epoch": 0.24, "learning_rate": 0.0002640884335931526, "loss": 0.0253, "step": 92360 }, { "epoch": 0.24, "learning_rate": 0.0002640845453767811, "loss": 0.0197, "step": 92370 }, { "epoch": 0.24, "learning_rate": 0.0002640806571604096, "loss": 0.0221, "step": 92380 }, { "epoch": 0.24, "learning_rate": 0.0002640767689440382, "loss": 0.0203, "step": 92390 }, { "epoch": 0.24, "learning_rate": 0.0002640728807276667, "loss": 0.0251, "step": 92400 }, { "epoch": 0.24, "learning_rate": 0.0002640689925112952, "loss": 0.0241, "step": 92410 }, { "epoch": 0.24, "learning_rate": 0.0002640651042949238, "loss": 0.0233, "step": 92420 }, { "epoch": 0.24, "learning_rate": 0.00026406121607855235, "loss": 0.0187, "step": 92430 }, { "epoch": 0.24, "learning_rate": 0.00026405732786218087, "loss": 0.0242, "step": 92440 }, { "epoch": 0.24, "learning_rate": 0.0002640534396458094, "loss": 0.0235, "step": 92450 }, { "epoch": 0.24, "learning_rate": 0.0002640495514294379, "loss": 0.0201, "step": 92460 }, { "epoch": 0.24, "learning_rate": 0.00026404566321306647, "loss": 0.0241, "step": 92470 }, { "epoch": 0.24, "learning_rate": 0.000264041774996695, "loss": 0.0288, "step": 92480 }, { "epoch": 0.24, "learning_rate": 0.00026403788678032355, "loss": 0.0239, "step": 92490 }, { "epoch": 0.24, "learning_rate": 0.00026403399856395206, "loss": 0.0253, "step": 92500 }, { "epoch": 0.24, "learning_rate": 0.00026403011034758063, "loss": 0.0206, "step": 92510 }, { "epoch": 0.24, "learning_rate": 0.00026402622213120915, "loss": 0.0185, "step": 92520 }, { "epoch": 0.24, "learning_rate": 0.00026402233391483766, "loss": 0.0201, "step": 92530 }, { "epoch": 0.24, "learning_rate": 0.0002640184456984662, "loss": 0.0264, "step": 92540 }, { "epoch": 0.24, "learning_rate": 0.00026401455748209475, "loss": 0.0254, "step": 92550 }, { "epoch": 0.24, "learning_rate": 0.00026401066926572326, "loss": 0.0217, "step": 92560 }, { "epoch": 0.24, "learning_rate": 0.00026400678104935183, "loss": 0.0203, "step": 92570 }, { "epoch": 0.24, "learning_rate": 0.00026400289283298034, "loss": 0.029, "step": 92580 }, { "epoch": 0.24, "learning_rate": 0.00026399900461660886, "loss": 0.024, "step": 92590 }, { "epoch": 0.24, "learning_rate": 0.0002639951164002374, "loss": 0.0231, "step": 92600 }, { "epoch": 0.24, "learning_rate": 0.00026399122818386594, "loss": 0.0295, "step": 92610 }, { "epoch": 0.24, "learning_rate": 0.00026398733996749446, "loss": 0.0231, "step": 92620 }, { "epoch": 0.24, "learning_rate": 0.000263983451751123, "loss": 0.0224, "step": 92630 }, { "epoch": 0.24, "learning_rate": 0.0002639795635347516, "loss": 0.0256, "step": 92640 }, { "epoch": 0.24, "learning_rate": 0.0002639756753183801, "loss": 0.0254, "step": 92650 }, { "epoch": 0.24, "learning_rate": 0.0002639717871020086, "loss": 0.0232, "step": 92660 }, { "epoch": 0.24, "learning_rate": 0.00026396789888563714, "loss": 0.0192, "step": 92670 }, { "epoch": 0.24, "learning_rate": 0.0002639640106692657, "loss": 0.0297, "step": 92680 }, { "epoch": 0.24, "learning_rate": 0.0002639601224528942, "loss": 0.0254, "step": 92690 }, { "epoch": 0.24, "learning_rate": 0.0002639562342365228, "loss": 0.0223, "step": 92700 }, { "epoch": 0.24, "learning_rate": 0.0002639523460201513, "loss": 0.0215, "step": 92710 }, { "epoch": 0.24, "learning_rate": 0.00026394845780377987, "loss": 0.0241, "step": 92720 }, { "epoch": 0.24, "learning_rate": 0.0002639445695874084, "loss": 0.0244, "step": 92730 }, { "epoch": 0.24, "learning_rate": 0.0002639406813710369, "loss": 0.021, "step": 92740 }, { "epoch": 0.24, "learning_rate": 0.0002639367931546654, "loss": 0.0221, "step": 92750 }, { "epoch": 0.24, "learning_rate": 0.000263932904938294, "loss": 0.0234, "step": 92760 }, { "epoch": 0.24, "learning_rate": 0.00026392901672192255, "loss": 0.0228, "step": 92770 }, { "epoch": 0.24, "learning_rate": 0.00026392512850555107, "loss": 0.0207, "step": 92780 }, { "epoch": 0.24, "learning_rate": 0.0002639212402891796, "loss": 0.0211, "step": 92790 }, { "epoch": 0.24, "learning_rate": 0.0002639173520728081, "loss": 0.0221, "step": 92800 }, { "epoch": 0.24, "learning_rate": 0.00026391346385643667, "loss": 0.02, "step": 92810 }, { "epoch": 0.24, "learning_rate": 0.0002639095756400652, "loss": 0.0174, "step": 92820 }, { "epoch": 0.24, "learning_rate": 0.00026390568742369375, "loss": 0.0253, "step": 92830 }, { "epoch": 0.24, "learning_rate": 0.00026390179920732226, "loss": 0.026, "step": 92840 }, { "epoch": 0.24, "learning_rate": 0.00026389791099095083, "loss": 0.024, "step": 92850 }, { "epoch": 0.24, "learning_rate": 0.00026389402277457935, "loss": 0.0203, "step": 92860 }, { "epoch": 0.24, "learning_rate": 0.00026389013455820786, "loss": 0.0233, "step": 92870 }, { "epoch": 0.24, "learning_rate": 0.0002638862463418364, "loss": 0.0219, "step": 92880 }, { "epoch": 0.24, "learning_rate": 0.00026388235812546494, "loss": 0.0217, "step": 92890 }, { "epoch": 0.24, "learning_rate": 0.00026387846990909346, "loss": 0.0199, "step": 92900 }, { "epoch": 0.24, "learning_rate": 0.00026387458169272203, "loss": 0.0192, "step": 92910 }, { "epoch": 0.24, "learning_rate": 0.00026387069347635054, "loss": 0.0264, "step": 92920 }, { "epoch": 0.24, "learning_rate": 0.0002638668052599791, "loss": 0.0237, "step": 92930 }, { "epoch": 0.24, "learning_rate": 0.0002638629170436076, "loss": 0.0223, "step": 92940 }, { "epoch": 0.24, "learning_rate": 0.00026385902882723614, "loss": 0.0233, "step": 92950 }, { "epoch": 0.24, "learning_rate": 0.00026385514061086465, "loss": 0.017, "step": 92960 }, { "epoch": 0.24, "learning_rate": 0.0002638512523944932, "loss": 0.02, "step": 92970 }, { "epoch": 0.24, "learning_rate": 0.0002638473641781218, "loss": 0.0249, "step": 92980 }, { "epoch": 0.24, "learning_rate": 0.0002638434759617503, "loss": 0.0195, "step": 92990 }, { "epoch": 0.24, "learning_rate": 0.0002638395877453788, "loss": 0.0226, "step": 93000 }, { "epoch": 0.24, "eval_cer": 0.881806259456297, "eval_loss": 0.016998477280139923, "eval_runtime": 108.1066, "eval_samples_per_second": 18.5, "eval_steps_per_second": 4.625, "step": 93000 }, { "epoch": 0.24, "learning_rate": 0.0002638356995290074, "loss": 0.0262, "step": 93010 }, { "epoch": 0.24, "learning_rate": 0.0002638318113126359, "loss": 0.0273, "step": 93020 }, { "epoch": 0.24, "learning_rate": 0.0002638279230962644, "loss": 0.0274, "step": 93030 }, { "epoch": 0.24, "learning_rate": 0.000263824034879893, "loss": 0.0271, "step": 93040 }, { "epoch": 0.24, "learning_rate": 0.0002638201466635215, "loss": 0.022, "step": 93050 }, { "epoch": 0.24, "learning_rate": 0.00026381625844715007, "loss": 0.021, "step": 93060 }, { "epoch": 0.24, "learning_rate": 0.0002638123702307786, "loss": 0.0232, "step": 93070 }, { "epoch": 0.24, "learning_rate": 0.0002638084820144071, "loss": 0.0202, "step": 93080 }, { "epoch": 0.24, "learning_rate": 0.0002638045937980356, "loss": 0.021, "step": 93090 }, { "epoch": 0.24, "learning_rate": 0.0002638007055816642, "loss": 0.0228, "step": 93100 }, { "epoch": 0.24, "learning_rate": 0.0002637968173652927, "loss": 0.0204, "step": 93110 }, { "epoch": 0.24, "learning_rate": 0.00026379292914892127, "loss": 0.0215, "step": 93120 }, { "epoch": 0.24, "learning_rate": 0.0002637890409325498, "loss": 0.0249, "step": 93130 }, { "epoch": 0.24, "learning_rate": 0.00026378515271617835, "loss": 0.0228, "step": 93140 }, { "epoch": 0.24, "learning_rate": 0.00026378126449980686, "loss": 0.0274, "step": 93150 }, { "epoch": 0.24, "learning_rate": 0.0002637773762834354, "loss": 0.0242, "step": 93160 }, { "epoch": 0.24, "learning_rate": 0.00026377348806706395, "loss": 0.0232, "step": 93170 }, { "epoch": 0.24, "learning_rate": 0.00026376959985069246, "loss": 0.0272, "step": 93180 }, { "epoch": 0.24, "learning_rate": 0.00026376571163432103, "loss": 0.0205, "step": 93190 }, { "epoch": 0.24, "learning_rate": 0.00026376182341794955, "loss": 0.0225, "step": 93200 }, { "epoch": 0.24, "learning_rate": 0.00026375793520157806, "loss": 0.022, "step": 93210 }, { "epoch": 0.24, "learning_rate": 0.00026375404698520663, "loss": 0.0236, "step": 93220 }, { "epoch": 0.24, "learning_rate": 0.00026375015876883514, "loss": 0.0207, "step": 93230 }, { "epoch": 0.24, "learning_rate": 0.00026374627055246366, "loss": 0.0234, "step": 93240 }, { "epoch": 0.24, "learning_rate": 0.0002637423823360922, "loss": 0.0234, "step": 93250 }, { "epoch": 0.24, "learning_rate": 0.00026373849411972074, "loss": 0.0224, "step": 93260 }, { "epoch": 0.24, "learning_rate": 0.0002637346059033493, "loss": 0.0238, "step": 93270 }, { "epoch": 0.24, "learning_rate": 0.0002637307176869778, "loss": 0.022, "step": 93280 }, { "epoch": 0.24, "learning_rate": 0.00026372682947060634, "loss": 0.0223, "step": 93290 }, { "epoch": 0.24, "learning_rate": 0.00026372294125423485, "loss": 0.026, "step": 93300 }, { "epoch": 0.24, "learning_rate": 0.0002637190530378634, "loss": 0.0222, "step": 93310 }, { "epoch": 0.24, "learning_rate": 0.000263715164821492, "loss": 0.0229, "step": 93320 }, { "epoch": 0.24, "learning_rate": 0.0002637112766051205, "loss": 0.02, "step": 93330 }, { "epoch": 0.24, "learning_rate": 0.000263707388388749, "loss": 0.0199, "step": 93340 }, { "epoch": 0.24, "learning_rate": 0.0002637035001723776, "loss": 0.0264, "step": 93350 }, { "epoch": 0.24, "learning_rate": 0.0002636996119560061, "loss": 0.0211, "step": 93360 }, { "epoch": 0.24, "learning_rate": 0.0002636957237396346, "loss": 0.0294, "step": 93370 }, { "epoch": 0.24, "learning_rate": 0.0002636918355232632, "loss": 0.0266, "step": 93380 }, { "epoch": 0.24, "learning_rate": 0.0002636879473068917, "loss": 0.0297, "step": 93390 }, { "epoch": 0.24, "learning_rate": 0.00026368405909052027, "loss": 0.026, "step": 93400 }, { "epoch": 0.24, "learning_rate": 0.0002636801708741488, "loss": 0.0232, "step": 93410 }, { "epoch": 0.24, "learning_rate": 0.0002636762826577773, "loss": 0.022, "step": 93420 }, { "epoch": 0.24, "learning_rate": 0.00026367239444140587, "loss": 0.0227, "step": 93430 }, { "epoch": 0.24, "learning_rate": 0.0002636685062250344, "loss": 0.0208, "step": 93440 }, { "epoch": 0.24, "learning_rate": 0.0002636646180086629, "loss": 0.0214, "step": 93450 }, { "epoch": 0.24, "learning_rate": 0.00026366072979229147, "loss": 0.0206, "step": 93460 }, { "epoch": 0.24, "learning_rate": 0.00026365684157592003, "loss": 0.025, "step": 93470 }, { "epoch": 0.24, "learning_rate": 0.00026365295335954855, "loss": 0.0234, "step": 93480 }, { "epoch": 0.24, "learning_rate": 0.00026364906514317706, "loss": 0.0239, "step": 93490 }, { "epoch": 0.24, "learning_rate": 0.0002636451769268056, "loss": 0.0226, "step": 93500 }, { "epoch": 0.24, "learning_rate": 0.00026364128871043415, "loss": 0.0287, "step": 93510 }, { "epoch": 0.24, "learning_rate": 0.00026363740049406266, "loss": 0.022, "step": 93520 }, { "epoch": 0.24, "learning_rate": 0.00026363351227769123, "loss": 0.0216, "step": 93530 }, { "epoch": 0.24, "learning_rate": 0.00026362962406131974, "loss": 0.0222, "step": 93540 }, { "epoch": 0.24, "learning_rate": 0.00026362573584494826, "loss": 0.0232, "step": 93550 }, { "epoch": 0.24, "learning_rate": 0.00026362184762857683, "loss": 0.0203, "step": 93560 }, { "epoch": 0.24, "learning_rate": 0.00026361795941220534, "loss": 0.0207, "step": 93570 }, { "epoch": 0.24, "learning_rate": 0.00026361407119583386, "loss": 0.0263, "step": 93580 }, { "epoch": 0.24, "learning_rate": 0.0002636101829794624, "loss": 0.028, "step": 93590 }, { "epoch": 0.24, "learning_rate": 0.00026360629476309094, "loss": 0.0223, "step": 93600 }, { "epoch": 0.24, "learning_rate": 0.0002636024065467195, "loss": 0.0196, "step": 93610 }, { "epoch": 0.24, "learning_rate": 0.000263598518330348, "loss": 0.0227, "step": 93620 }, { "epoch": 0.24, "learning_rate": 0.00026359463011397654, "loss": 0.0236, "step": 93630 }, { "epoch": 0.24, "learning_rate": 0.0002635907418976051, "loss": 0.0192, "step": 93640 }, { "epoch": 0.24, "learning_rate": 0.0002635868536812336, "loss": 0.0231, "step": 93650 }, { "epoch": 0.24, "learning_rate": 0.00026358296546486214, "loss": 0.0226, "step": 93660 }, { "epoch": 0.24, "learning_rate": 0.0002635790772484907, "loss": 0.0187, "step": 93670 }, { "epoch": 0.24, "learning_rate": 0.00026357518903211927, "loss": 0.0239, "step": 93680 }, { "epoch": 0.24, "learning_rate": 0.0002635713008157478, "loss": 0.0206, "step": 93690 }, { "epoch": 0.24, "learning_rate": 0.0002635674125993763, "loss": 0.0194, "step": 93700 }, { "epoch": 0.24, "learning_rate": 0.0002635635243830048, "loss": 0.0309, "step": 93710 }, { "epoch": 0.24, "learning_rate": 0.0002635596361666334, "loss": 0.0199, "step": 93720 }, { "epoch": 0.24, "learning_rate": 0.0002635557479502619, "loss": 0.0194, "step": 93730 }, { "epoch": 0.24, "learning_rate": 0.00026355185973389047, "loss": 0.0204, "step": 93740 }, { "epoch": 0.24, "learning_rate": 0.000263547971517519, "loss": 0.023, "step": 93750 }, { "epoch": 0.24, "learning_rate": 0.00026354408330114755, "loss": 0.0246, "step": 93760 }, { "epoch": 0.24, "learning_rate": 0.00026354019508477607, "loss": 0.0218, "step": 93770 }, { "epoch": 0.24, "learning_rate": 0.0002635363068684046, "loss": 0.0221, "step": 93780 }, { "epoch": 0.24, "learning_rate": 0.0002635324186520331, "loss": 0.0243, "step": 93790 }, { "epoch": 0.24, "learning_rate": 0.00026352853043566166, "loss": 0.0224, "step": 93800 }, { "epoch": 0.24, "learning_rate": 0.0002635246422192902, "loss": 0.0304, "step": 93810 }, { "epoch": 0.24, "learning_rate": 0.00026352075400291875, "loss": 0.0194, "step": 93820 }, { "epoch": 0.24, "learning_rate": 0.00026351686578654726, "loss": 0.0253, "step": 93830 }, { "epoch": 0.24, "learning_rate": 0.0002635129775701758, "loss": 0.0189, "step": 93840 }, { "epoch": 0.24, "learning_rate": 0.00026350908935380434, "loss": 0.0235, "step": 93850 }, { "epoch": 0.24, "learning_rate": 0.00026350520113743286, "loss": 0.0208, "step": 93860 }, { "epoch": 0.24, "learning_rate": 0.00026350131292106143, "loss": 0.0219, "step": 93870 }, { "epoch": 0.24, "learning_rate": 0.00026349742470468994, "loss": 0.0197, "step": 93880 }, { "epoch": 0.24, "learning_rate": 0.0002634935364883185, "loss": 0.0204, "step": 93890 }, { "epoch": 0.24, "learning_rate": 0.000263489648271947, "loss": 0.0216, "step": 93900 }, { "epoch": 0.24, "learning_rate": 0.00026348576005557554, "loss": 0.0215, "step": 93910 }, { "epoch": 0.24, "learning_rate": 0.00026348187183920406, "loss": 0.0267, "step": 93920 }, { "epoch": 0.24, "learning_rate": 0.0002634779836228326, "loss": 0.0273, "step": 93930 }, { "epoch": 0.24, "learning_rate": 0.00026347409540646114, "loss": 0.0219, "step": 93940 }, { "epoch": 0.24, "learning_rate": 0.0002634702071900897, "loss": 0.0194, "step": 93950 }, { "epoch": 0.24, "learning_rate": 0.0002634663189737182, "loss": 0.0244, "step": 93960 }, { "epoch": 0.24, "learning_rate": 0.0002634624307573468, "loss": 0.0198, "step": 93970 }, { "epoch": 0.24, "learning_rate": 0.0002634585425409753, "loss": 0.0219, "step": 93980 }, { "epoch": 0.24, "learning_rate": 0.0002634546543246038, "loss": 0.0236, "step": 93990 }, { "epoch": 0.24, "learning_rate": 0.00026345076610823233, "loss": 0.023, "step": 94000 }, { "epoch": 0.24, "eval_cer": 0.8818440496535199, "eval_loss": 0.016325943171977997, "eval_runtime": 108.0327, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 94000 }, { "epoch": 0.24, "learning_rate": 0.0002634468778918609, "loss": 0.0215, "step": 94010 }, { "epoch": 0.24, "learning_rate": 0.00026344298967548947, "loss": 0.0205, "step": 94020 }, { "epoch": 0.24, "learning_rate": 0.000263439101459118, "loss": 0.0206, "step": 94030 }, { "epoch": 0.24, "learning_rate": 0.0002634352132427465, "loss": 0.0208, "step": 94040 }, { "epoch": 0.24, "learning_rate": 0.000263431325026375, "loss": 0.0246, "step": 94050 }, { "epoch": 0.24, "learning_rate": 0.0002634274368100036, "loss": 0.021, "step": 94060 }, { "epoch": 0.24, "learning_rate": 0.0002634235485936321, "loss": 0.0289, "step": 94070 }, { "epoch": 0.24, "learning_rate": 0.00026341966037726067, "loss": 0.0201, "step": 94080 }, { "epoch": 0.24, "learning_rate": 0.0002634157721608892, "loss": 0.0218, "step": 94090 }, { "epoch": 0.24, "learning_rate": 0.00026341188394451775, "loss": 0.0234, "step": 94100 }, { "epoch": 0.24, "learning_rate": 0.00026340799572814626, "loss": 0.0196, "step": 94110 }, { "epoch": 0.24, "learning_rate": 0.0002634041075117748, "loss": 0.0222, "step": 94120 }, { "epoch": 0.24, "learning_rate": 0.0002634002192954033, "loss": 0.0242, "step": 94130 }, { "epoch": 0.24, "learning_rate": 0.00026339633107903186, "loss": 0.024, "step": 94140 }, { "epoch": 0.24, "learning_rate": 0.0002633924428626604, "loss": 0.0206, "step": 94150 }, { "epoch": 0.24, "learning_rate": 0.00026338855464628895, "loss": 0.0227, "step": 94160 }, { "epoch": 0.24, "learning_rate": 0.00026338466642991746, "loss": 0.0258, "step": 94170 }, { "epoch": 0.24, "learning_rate": 0.00026338077821354603, "loss": 0.0218, "step": 94180 }, { "epoch": 0.24, "learning_rate": 0.00026337688999717454, "loss": 0.0222, "step": 94190 }, { "epoch": 0.24, "learning_rate": 0.00026337300178080306, "loss": 0.0222, "step": 94200 }, { "epoch": 0.24, "learning_rate": 0.00026336911356443157, "loss": 0.0246, "step": 94210 }, { "epoch": 0.24, "learning_rate": 0.00026336522534806014, "loss": 0.0252, "step": 94220 }, { "epoch": 0.24, "learning_rate": 0.0002633613371316887, "loss": 0.0266, "step": 94230 }, { "epoch": 0.24, "learning_rate": 0.0002633574489153172, "loss": 0.0234, "step": 94240 }, { "epoch": 0.24, "learning_rate": 0.00026335356069894574, "loss": 0.0229, "step": 94250 }, { "epoch": 0.24, "learning_rate": 0.0002633496724825743, "loss": 0.0185, "step": 94260 }, { "epoch": 0.24, "learning_rate": 0.0002633457842662028, "loss": 0.0255, "step": 94270 }, { "epoch": 0.24, "learning_rate": 0.00026334189604983134, "loss": 0.0269, "step": 94280 }, { "epoch": 0.24, "learning_rate": 0.0002633380078334599, "loss": 0.0192, "step": 94290 }, { "epoch": 0.24, "learning_rate": 0.0002633341196170884, "loss": 0.0236, "step": 94300 }, { "epoch": 0.24, "learning_rate": 0.000263330231400717, "loss": 0.0185, "step": 94310 }, { "epoch": 0.24, "learning_rate": 0.0002633263431843455, "loss": 0.0194, "step": 94320 }, { "epoch": 0.24, "learning_rate": 0.000263322454967974, "loss": 0.0258, "step": 94330 }, { "epoch": 0.24, "learning_rate": 0.00026331856675160253, "loss": 0.0274, "step": 94340 }, { "epoch": 0.24, "learning_rate": 0.0002633146785352311, "loss": 0.0206, "step": 94350 }, { "epoch": 0.24, "learning_rate": 0.00026331079031885967, "loss": 0.0191, "step": 94360 }, { "epoch": 0.24, "learning_rate": 0.0002633069021024882, "loss": 0.0232, "step": 94370 }, { "epoch": 0.24, "learning_rate": 0.0002633030138861167, "loss": 0.02, "step": 94380 }, { "epoch": 0.24, "learning_rate": 0.00026329912566974527, "loss": 0.0191, "step": 94390 }, { "epoch": 0.24, "learning_rate": 0.0002632952374533738, "loss": 0.0211, "step": 94400 }, { "epoch": 0.24, "learning_rate": 0.0002632913492370023, "loss": 0.0249, "step": 94410 }, { "epoch": 0.24, "learning_rate": 0.00026328746102063087, "loss": 0.0226, "step": 94420 }, { "epoch": 0.24, "learning_rate": 0.0002632835728042594, "loss": 0.0212, "step": 94430 }, { "epoch": 0.24, "learning_rate": 0.00026327968458788795, "loss": 0.0227, "step": 94440 }, { "epoch": 0.24, "learning_rate": 0.00026327579637151646, "loss": 0.0257, "step": 94450 }, { "epoch": 0.24, "learning_rate": 0.000263271908155145, "loss": 0.0225, "step": 94460 }, { "epoch": 0.24, "learning_rate": 0.00026326801993877355, "loss": 0.0234, "step": 94470 }, { "epoch": 0.24, "learning_rate": 0.00026326413172240206, "loss": 0.0265, "step": 94480 }, { "epoch": 0.24, "learning_rate": 0.0002632602435060306, "loss": 0.0265, "step": 94490 }, { "epoch": 0.24, "learning_rate": 0.00026325635528965914, "loss": 0.0278, "step": 94500 }, { "epoch": 0.24, "learning_rate": 0.0002632524670732877, "loss": 0.0201, "step": 94510 }, { "epoch": 0.25, "learning_rate": 0.00026324857885691623, "loss": 0.0162, "step": 94520 }, { "epoch": 0.25, "learning_rate": 0.00026324469064054474, "loss": 0.0243, "step": 94530 }, { "epoch": 0.25, "learning_rate": 0.00026324080242417326, "loss": 0.0195, "step": 94540 }, { "epoch": 0.25, "learning_rate": 0.00026323691420780177, "loss": 0.0202, "step": 94550 }, { "epoch": 0.25, "learning_rate": 0.00026323302599143034, "loss": 0.0293, "step": 94560 }, { "epoch": 0.25, "learning_rate": 0.0002632291377750589, "loss": 0.0206, "step": 94570 }, { "epoch": 0.25, "learning_rate": 0.0002632252495586874, "loss": 0.023, "step": 94580 }, { "epoch": 0.25, "learning_rate": 0.00026322136134231594, "loss": 0.022, "step": 94590 }, { "epoch": 0.25, "learning_rate": 0.0002632174731259445, "loss": 0.0211, "step": 94600 }, { "epoch": 0.25, "learning_rate": 0.000263213584909573, "loss": 0.024, "step": 94610 }, { "epoch": 0.25, "learning_rate": 0.00026320969669320154, "loss": 0.0224, "step": 94620 }, { "epoch": 0.25, "learning_rate": 0.0002632058084768301, "loss": 0.0222, "step": 94630 }, { "epoch": 0.25, "learning_rate": 0.0002632019202604586, "loss": 0.0227, "step": 94640 }, { "epoch": 0.25, "learning_rate": 0.0002631980320440872, "loss": 0.0218, "step": 94650 }, { "epoch": 0.25, "learning_rate": 0.0002631941438277157, "loss": 0.0234, "step": 94660 }, { "epoch": 0.25, "learning_rate": 0.0002631902556113442, "loss": 0.0164, "step": 94670 }, { "epoch": 0.25, "learning_rate": 0.0002631863673949728, "loss": 0.0212, "step": 94680 }, { "epoch": 0.25, "learning_rate": 0.0002631824791786013, "loss": 0.0219, "step": 94690 }, { "epoch": 0.25, "learning_rate": 0.0002631785909622298, "loss": 0.0235, "step": 94700 }, { "epoch": 0.25, "learning_rate": 0.0002631747027458584, "loss": 0.0225, "step": 94710 }, { "epoch": 0.25, "learning_rate": 0.00026317081452948695, "loss": 0.0271, "step": 94720 }, { "epoch": 0.25, "learning_rate": 0.00026316692631311547, "loss": 0.0222, "step": 94730 }, { "epoch": 0.25, "learning_rate": 0.000263163038096744, "loss": 0.0277, "step": 94740 }, { "epoch": 0.25, "learning_rate": 0.0002631591498803725, "loss": 0.018, "step": 94750 }, { "epoch": 0.25, "learning_rate": 0.00026315526166400106, "loss": 0.0245, "step": 94760 }, { "epoch": 0.25, "learning_rate": 0.0002631513734476296, "loss": 0.0267, "step": 94770 }, { "epoch": 0.25, "learning_rate": 0.00026314748523125815, "loss": 0.0243, "step": 94780 }, { "epoch": 0.25, "learning_rate": 0.00026314359701488666, "loss": 0.0243, "step": 94790 }, { "epoch": 0.25, "learning_rate": 0.0002631397087985152, "loss": 0.0244, "step": 94800 }, { "epoch": 0.25, "learning_rate": 0.00026313582058214375, "loss": 0.0194, "step": 94810 }, { "epoch": 0.25, "learning_rate": 0.00026313193236577226, "loss": 0.023, "step": 94820 }, { "epoch": 0.25, "learning_rate": 0.0002631280441494008, "loss": 0.0247, "step": 94830 }, { "epoch": 0.25, "learning_rate": 0.00026312415593302934, "loss": 0.0257, "step": 94840 }, { "epoch": 0.25, "learning_rate": 0.00026312026771665786, "loss": 0.021, "step": 94850 }, { "epoch": 0.25, "learning_rate": 0.0002631163795002864, "loss": 0.0169, "step": 94860 }, { "epoch": 0.25, "learning_rate": 0.00026311249128391494, "loss": 0.0242, "step": 94870 }, { "epoch": 0.25, "learning_rate": 0.00026310860306754346, "loss": 0.0234, "step": 94880 }, { "epoch": 0.25, "learning_rate": 0.000263104714851172, "loss": 0.0205, "step": 94890 }, { "epoch": 0.25, "learning_rate": 0.00026310082663480054, "loss": 0.0228, "step": 94900 }, { "epoch": 0.25, "learning_rate": 0.0002630969384184291, "loss": 0.0248, "step": 94910 }, { "epoch": 0.25, "learning_rate": 0.0002630930502020576, "loss": 0.0303, "step": 94920 }, { "epoch": 0.25, "learning_rate": 0.0002630891619856862, "loss": 0.0204, "step": 94930 }, { "epoch": 0.25, "learning_rate": 0.0002630852737693147, "loss": 0.019, "step": 94940 }, { "epoch": 0.25, "learning_rate": 0.0002630813855529432, "loss": 0.0221, "step": 94950 }, { "epoch": 0.25, "learning_rate": 0.00026307749733657173, "loss": 0.0193, "step": 94960 }, { "epoch": 0.25, "learning_rate": 0.0002630736091202003, "loss": 0.0259, "step": 94970 }, { "epoch": 0.25, "learning_rate": 0.0002630697209038288, "loss": 0.0214, "step": 94980 }, { "epoch": 0.25, "learning_rate": 0.0002630658326874574, "loss": 0.0231, "step": 94990 }, { "epoch": 0.25, "learning_rate": 0.0002630619444710859, "loss": 0.0236, "step": 95000 }, { "epoch": 0.25, "eval_cer": 0.8818146572779021, "eval_loss": 0.01712987571954727, "eval_runtime": 108.1006, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 95000 }, { "epoch": 0.25, "learning_rate": 0.00026305805625471447, "loss": 0.0222, "step": 95010 }, { "epoch": 0.25, "learning_rate": 0.000263054168038343, "loss": 0.0312, "step": 95020 }, { "epoch": 0.25, "learning_rate": 0.0002630502798219715, "loss": 0.0223, "step": 95030 }, { "epoch": 0.25, "learning_rate": 0.0002630463916056, "loss": 0.0236, "step": 95040 }, { "epoch": 0.25, "learning_rate": 0.0002630425033892286, "loss": 0.0203, "step": 95050 }, { "epoch": 0.25, "learning_rate": 0.00026303861517285715, "loss": 0.0268, "step": 95060 }, { "epoch": 0.25, "learning_rate": 0.00026303472695648567, "loss": 0.0258, "step": 95070 }, { "epoch": 0.25, "learning_rate": 0.0002630308387401142, "loss": 0.0242, "step": 95080 }, { "epoch": 0.25, "learning_rate": 0.0002630269505237427, "loss": 0.0207, "step": 95090 }, { "epoch": 0.25, "learning_rate": 0.00026302306230737126, "loss": 0.0302, "step": 95100 }, { "epoch": 0.25, "learning_rate": 0.0002630191740909998, "loss": 0.0394, "step": 95110 }, { "epoch": 0.25, "learning_rate": 0.00026301528587462835, "loss": 0.0264, "step": 95120 }, { "epoch": 0.25, "learning_rate": 0.00026301139765825686, "loss": 0.0219, "step": 95130 }, { "epoch": 0.25, "learning_rate": 0.00026300750944188543, "loss": 0.0278, "step": 95140 }, { "epoch": 0.25, "learning_rate": 0.00026300362122551394, "loss": 0.0278, "step": 95150 }, { "epoch": 0.25, "learning_rate": 0.00026299973300914246, "loss": 0.0267, "step": 95160 }, { "epoch": 0.25, "learning_rate": 0.000262995844792771, "loss": 0.0246, "step": 95170 }, { "epoch": 0.25, "learning_rate": 0.00026299195657639954, "loss": 0.0247, "step": 95180 }, { "epoch": 0.25, "learning_rate": 0.00026298806836002806, "loss": 0.024, "step": 95190 }, { "epoch": 0.25, "learning_rate": 0.0002629841801436566, "loss": 0.0246, "step": 95200 }, { "epoch": 0.25, "learning_rate": 0.00026298029192728514, "loss": 0.0258, "step": 95210 }, { "epoch": 0.25, "learning_rate": 0.0002629764037109137, "loss": 0.0233, "step": 95220 }, { "epoch": 0.25, "learning_rate": 0.0002629725154945422, "loss": 0.0232, "step": 95230 }, { "epoch": 0.25, "learning_rate": 0.00026296862727817074, "loss": 0.0231, "step": 95240 }, { "epoch": 0.25, "learning_rate": 0.00026296473906179925, "loss": 0.0219, "step": 95250 }, { "epoch": 0.25, "learning_rate": 0.0002629608508454278, "loss": 0.0233, "step": 95260 }, { "epoch": 0.25, "learning_rate": 0.0002629569626290564, "loss": 0.0215, "step": 95270 }, { "epoch": 0.25, "learning_rate": 0.0002629530744126849, "loss": 0.024, "step": 95280 }, { "epoch": 0.25, "learning_rate": 0.0002629491861963134, "loss": 0.0246, "step": 95290 }, { "epoch": 0.25, "learning_rate": 0.00026294529797994193, "loss": 0.0181, "step": 95300 }, { "epoch": 0.25, "learning_rate": 0.0002629414097635705, "loss": 0.0273, "step": 95310 }, { "epoch": 0.25, "learning_rate": 0.000262937521547199, "loss": 0.03, "step": 95320 }, { "epoch": 0.25, "learning_rate": 0.0002629336333308276, "loss": 0.0268, "step": 95330 }, { "epoch": 0.25, "learning_rate": 0.0002629297451144561, "loss": 0.0232, "step": 95340 }, { "epoch": 0.25, "learning_rate": 0.00026292585689808467, "loss": 0.02, "step": 95350 }, { "epoch": 0.25, "learning_rate": 0.0002629219686817132, "loss": 0.0213, "step": 95360 }, { "epoch": 0.25, "learning_rate": 0.0002629180804653417, "loss": 0.0252, "step": 95370 }, { "epoch": 0.25, "learning_rate": 0.0002629141922489702, "loss": 0.0187, "step": 95380 }, { "epoch": 0.25, "learning_rate": 0.0002629103040325988, "loss": 0.0474, "step": 95390 }, { "epoch": 0.25, "learning_rate": 0.0002629064158162273, "loss": 0.0239, "step": 95400 }, { "epoch": 0.25, "learning_rate": 0.00026290252759985586, "loss": 0.0216, "step": 95410 }, { "epoch": 0.25, "learning_rate": 0.0002628986393834844, "loss": 0.0224, "step": 95420 }, { "epoch": 0.25, "learning_rate": 0.00026289475116711295, "loss": 0.0261, "step": 95430 }, { "epoch": 0.25, "learning_rate": 0.00026289086295074146, "loss": 0.0242, "step": 95440 }, { "epoch": 0.25, "learning_rate": 0.00026288697473437, "loss": 0.0195, "step": 95450 }, { "epoch": 0.25, "learning_rate": 0.00026288308651799855, "loss": 0.0212, "step": 95460 }, { "epoch": 0.25, "learning_rate": 0.00026287919830162706, "loss": 0.0232, "step": 95470 }, { "epoch": 0.25, "learning_rate": 0.00026287531008525563, "loss": 0.023, "step": 95480 }, { "epoch": 0.25, "learning_rate": 0.00026287142186888414, "loss": 0.021, "step": 95490 }, { "epoch": 0.25, "learning_rate": 0.00026286753365251266, "loss": 0.024, "step": 95500 }, { "epoch": 0.25, "learning_rate": 0.0002628636454361412, "loss": 0.0206, "step": 95510 }, { "epoch": 0.25, "learning_rate": 0.00026285975721976974, "loss": 0.0242, "step": 95520 }, { "epoch": 0.25, "learning_rate": 0.00026285586900339826, "loss": 0.0225, "step": 95530 }, { "epoch": 0.25, "learning_rate": 0.0002628519807870268, "loss": 0.0296, "step": 95540 }, { "epoch": 0.25, "learning_rate": 0.00026284809257065534, "loss": 0.0278, "step": 95550 }, { "epoch": 0.25, "learning_rate": 0.0002628442043542839, "loss": 0.0302, "step": 95560 }, { "epoch": 0.25, "learning_rate": 0.0002628403161379124, "loss": 0.0253, "step": 95570 }, { "epoch": 0.25, "learning_rate": 0.00026283642792154094, "loss": 0.0206, "step": 95580 }, { "epoch": 0.25, "learning_rate": 0.00026283253970516945, "loss": 0.0221, "step": 95590 }, { "epoch": 0.25, "learning_rate": 0.000262828651488798, "loss": 0.0269, "step": 95600 }, { "epoch": 0.25, "learning_rate": 0.0002628247632724266, "loss": 0.0239, "step": 95610 }, { "epoch": 0.25, "learning_rate": 0.0002628208750560551, "loss": 0.0263, "step": 95620 }, { "epoch": 0.25, "learning_rate": 0.0002628169868396836, "loss": 0.0246, "step": 95630 }, { "epoch": 0.25, "learning_rate": 0.0002628130986233122, "loss": 0.0213, "step": 95640 }, { "epoch": 0.25, "learning_rate": 0.0002628092104069407, "loss": 0.0205, "step": 95650 }, { "epoch": 0.25, "learning_rate": 0.0002628053221905692, "loss": 0.0243, "step": 95660 }, { "epoch": 0.25, "learning_rate": 0.0002628014339741978, "loss": 0.0259, "step": 95670 }, { "epoch": 0.25, "learning_rate": 0.0002627975457578263, "loss": 0.0225, "step": 95680 }, { "epoch": 0.25, "learning_rate": 0.00026279365754145487, "loss": 0.0225, "step": 95690 }, { "epoch": 0.25, "learning_rate": 0.0002627897693250834, "loss": 0.0246, "step": 95700 }, { "epoch": 0.25, "learning_rate": 0.0002627858811087119, "loss": 0.0295, "step": 95710 }, { "epoch": 0.25, "learning_rate": 0.00026278199289234047, "loss": 0.0247, "step": 95720 }, { "epoch": 0.25, "learning_rate": 0.000262778104675969, "loss": 0.0198, "step": 95730 }, { "epoch": 0.25, "learning_rate": 0.0002627742164595975, "loss": 0.0252, "step": 95740 }, { "epoch": 0.25, "learning_rate": 0.00026277032824322606, "loss": 0.0224, "step": 95750 }, { "epoch": 0.25, "learning_rate": 0.00026276644002685463, "loss": 0.0235, "step": 95760 }, { "epoch": 0.25, "learning_rate": 0.00026276255181048315, "loss": 0.02, "step": 95770 }, { "epoch": 0.25, "learning_rate": 0.00026275866359411166, "loss": 0.0227, "step": 95780 }, { "epoch": 0.25, "learning_rate": 0.0002627547753777402, "loss": 0.0249, "step": 95790 }, { "epoch": 0.25, "learning_rate": 0.0002627508871613687, "loss": 0.018, "step": 95800 }, { "epoch": 0.25, "learning_rate": 0.00026274699894499726, "loss": 0.0222, "step": 95810 }, { "epoch": 0.25, "learning_rate": 0.00026274311072862583, "loss": 0.0268, "step": 95820 }, { "epoch": 0.25, "learning_rate": 0.00026273922251225434, "loss": 0.0263, "step": 95830 }, { "epoch": 0.25, "learning_rate": 0.00026273533429588286, "loss": 0.0219, "step": 95840 }, { "epoch": 0.25, "learning_rate": 0.0002627314460795114, "loss": 0.0213, "step": 95850 }, { "epoch": 0.25, "learning_rate": 0.00026272755786313994, "loss": 0.0186, "step": 95860 }, { "epoch": 0.25, "learning_rate": 0.00026272366964676845, "loss": 0.0234, "step": 95870 }, { "epoch": 0.25, "learning_rate": 0.000262719781430397, "loss": 0.0201, "step": 95880 }, { "epoch": 0.25, "learning_rate": 0.00026271589321402554, "loss": 0.0196, "step": 95890 }, { "epoch": 0.25, "learning_rate": 0.0002627120049976541, "loss": 0.0332, "step": 95900 }, { "epoch": 0.25, "learning_rate": 0.0002627081167812826, "loss": 0.0205, "step": 95910 }, { "epoch": 0.25, "learning_rate": 0.00026270422856491114, "loss": 0.0223, "step": 95920 }, { "epoch": 0.25, "learning_rate": 0.0002627003403485397, "loss": 0.0253, "step": 95930 }, { "epoch": 0.25, "learning_rate": 0.0002626964521321682, "loss": 0.0275, "step": 95940 }, { "epoch": 0.25, "learning_rate": 0.0002626925639157968, "loss": 0.0231, "step": 95950 }, { "epoch": 0.25, "learning_rate": 0.0002626886756994253, "loss": 0.0235, "step": 95960 }, { "epoch": 0.25, "learning_rate": 0.00026268478748305387, "loss": 0.0194, "step": 95970 }, { "epoch": 0.25, "learning_rate": 0.0002626808992666824, "loss": 0.0291, "step": 95980 }, { "epoch": 0.25, "learning_rate": 0.0002626770110503109, "loss": 0.0247, "step": 95990 }, { "epoch": 0.25, "learning_rate": 0.0002626731228339394, "loss": 0.0224, "step": 96000 }, { "epoch": 0.25, "eval_cer": 0.881751673615864, "eval_loss": 0.017516400665044785, "eval_runtime": 107.996, "eval_samples_per_second": 18.519, "eval_steps_per_second": 4.63, "step": 96000 }, { "epoch": 0.25, "learning_rate": 0.000262669234617568, "loss": 0.03, "step": 96010 }, { "epoch": 0.25, "learning_rate": 0.0002626653464011965, "loss": 0.0249, "step": 96020 }, { "epoch": 0.25, "learning_rate": 0.00026266145818482507, "loss": 0.0214, "step": 96030 }, { "epoch": 0.25, "learning_rate": 0.0002626575699684536, "loss": 0.0229, "step": 96040 }, { "epoch": 0.25, "learning_rate": 0.0002626536817520821, "loss": 0.0199, "step": 96050 }, { "epoch": 0.25, "learning_rate": 0.00026264979353571066, "loss": 0.0229, "step": 96060 }, { "epoch": 0.25, "learning_rate": 0.0002626459053193392, "loss": 0.0228, "step": 96070 }, { "epoch": 0.25, "learning_rate": 0.0002626420171029677, "loss": 0.0202, "step": 96080 }, { "epoch": 0.25, "learning_rate": 0.00026263812888659626, "loss": 0.0246, "step": 96090 }, { "epoch": 0.25, "learning_rate": 0.00026263424067022483, "loss": 0.0272, "step": 96100 }, { "epoch": 0.25, "learning_rate": 0.00026263035245385335, "loss": 0.0252, "step": 96110 }, { "epoch": 0.25, "learning_rate": 0.00026262646423748186, "loss": 0.0245, "step": 96120 }, { "epoch": 0.25, "learning_rate": 0.0002626225760211104, "loss": 0.0236, "step": 96130 }, { "epoch": 0.25, "learning_rate": 0.00026261868780473894, "loss": 0.0206, "step": 96140 }, { "epoch": 0.25, "learning_rate": 0.00026261479958836746, "loss": 0.0211, "step": 96150 }, { "epoch": 0.25, "learning_rate": 0.000262610911371996, "loss": 0.019, "step": 96160 }, { "epoch": 0.25, "learning_rate": 0.00026260702315562454, "loss": 0.0243, "step": 96170 }, { "epoch": 0.25, "learning_rate": 0.0002626031349392531, "loss": 0.0239, "step": 96180 }, { "epoch": 0.25, "learning_rate": 0.0002625992467228816, "loss": 0.0226, "step": 96190 }, { "epoch": 0.25, "learning_rate": 0.00026259535850651014, "loss": 0.0216, "step": 96200 }, { "epoch": 0.25, "learning_rate": 0.00026259147029013865, "loss": 0.0244, "step": 96210 }, { "epoch": 0.25, "learning_rate": 0.0002625875820737672, "loss": 0.0203, "step": 96220 }, { "epoch": 0.25, "learning_rate": 0.00026258369385739574, "loss": 0.0193, "step": 96230 }, { "epoch": 0.25, "learning_rate": 0.0002625798056410243, "loss": 0.0216, "step": 96240 }, { "epoch": 0.25, "learning_rate": 0.0002625759174246528, "loss": 0.0192, "step": 96250 }, { "epoch": 0.25, "learning_rate": 0.0002625720292082814, "loss": 0.0254, "step": 96260 }, { "epoch": 0.25, "learning_rate": 0.0002625681409919099, "loss": 0.0176, "step": 96270 }, { "epoch": 0.25, "learning_rate": 0.0002625642527755384, "loss": 0.0225, "step": 96280 }, { "epoch": 0.25, "learning_rate": 0.00026256036455916693, "loss": 0.0221, "step": 96290 }, { "epoch": 0.25, "learning_rate": 0.0002625564763427955, "loss": 0.0228, "step": 96300 }, { "epoch": 0.25, "learning_rate": 0.00026255258812642407, "loss": 0.0239, "step": 96310 }, { "epoch": 0.25, "learning_rate": 0.0002625486999100526, "loss": 0.0254, "step": 96320 }, { "epoch": 0.25, "learning_rate": 0.0002625448116936811, "loss": 0.0238, "step": 96330 }, { "epoch": 0.25, "learning_rate": 0.0002625409234773096, "loss": 0.0202, "step": 96340 }, { "epoch": 0.25, "learning_rate": 0.0002625370352609382, "loss": 0.0183, "step": 96350 }, { "epoch": 0.25, "learning_rate": 0.0002625331470445667, "loss": 0.0207, "step": 96360 }, { "epoch": 0.25, "learning_rate": 0.00026252925882819527, "loss": 0.0237, "step": 96370 }, { "epoch": 0.25, "learning_rate": 0.0002625253706118238, "loss": 0.0236, "step": 96380 }, { "epoch": 0.25, "learning_rate": 0.00026252148239545235, "loss": 0.0191, "step": 96390 }, { "epoch": 0.25, "learning_rate": 0.00026251759417908086, "loss": 0.0277, "step": 96400 }, { "epoch": 0.25, "learning_rate": 0.0002625137059627094, "loss": 0.019, "step": 96410 }, { "epoch": 0.25, "learning_rate": 0.0002625098177463379, "loss": 0.0202, "step": 96420 }, { "epoch": 0.25, "learning_rate": 0.00026250592952996646, "loss": 0.0288, "step": 96430 }, { "epoch": 0.25, "learning_rate": 0.000262502041313595, "loss": 0.0273, "step": 96440 }, { "epoch": 0.25, "learning_rate": 0.00026249815309722354, "loss": 0.0206, "step": 96450 }, { "epoch": 0.25, "learning_rate": 0.00026249426488085206, "loss": 0.0216, "step": 96460 }, { "epoch": 0.25, "learning_rate": 0.00026249037666448063, "loss": 0.0235, "step": 96470 }, { "epoch": 0.25, "learning_rate": 0.00026248648844810914, "loss": 0.0196, "step": 96480 }, { "epoch": 0.25, "learning_rate": 0.00026248260023173766, "loss": 0.0204, "step": 96490 }, { "epoch": 0.25, "learning_rate": 0.0002624787120153662, "loss": 0.0219, "step": 96500 }, { "epoch": 0.25, "learning_rate": 0.00026247482379899474, "loss": 0.0186, "step": 96510 }, { "epoch": 0.25, "learning_rate": 0.0002624709355826233, "loss": 0.0247, "step": 96520 }, { "epoch": 0.25, "learning_rate": 0.0002624670473662518, "loss": 0.0307, "step": 96530 }, { "epoch": 0.25, "learning_rate": 0.00026246315914988034, "loss": 0.0238, "step": 96540 }, { "epoch": 0.25, "learning_rate": 0.00026245927093350885, "loss": 0.0259, "step": 96550 }, { "epoch": 0.25, "learning_rate": 0.0002624553827171374, "loss": 0.0231, "step": 96560 }, { "epoch": 0.25, "learning_rate": 0.00026245149450076594, "loss": 0.0279, "step": 96570 }, { "epoch": 0.25, "learning_rate": 0.0002624476062843945, "loss": 0.0199, "step": 96580 }, { "epoch": 0.25, "learning_rate": 0.000262443718068023, "loss": 0.0186, "step": 96590 }, { "epoch": 0.25, "learning_rate": 0.0002624398298516516, "loss": 0.0189, "step": 96600 }, { "epoch": 0.25, "learning_rate": 0.0002624359416352801, "loss": 0.022, "step": 96610 }, { "epoch": 0.25, "learning_rate": 0.0002624320534189086, "loss": 0.0252, "step": 96620 }, { "epoch": 0.25, "learning_rate": 0.00026242816520253713, "loss": 0.0194, "step": 96630 }, { "epoch": 0.25, "learning_rate": 0.0002624242769861657, "loss": 0.0182, "step": 96640 }, { "epoch": 0.25, "learning_rate": 0.00026242038876979427, "loss": 0.0244, "step": 96650 }, { "epoch": 0.25, "learning_rate": 0.0002624165005534228, "loss": 0.0255, "step": 96660 }, { "epoch": 0.25, "learning_rate": 0.0002624126123370513, "loss": 0.0238, "step": 96670 }, { "epoch": 0.25, "learning_rate": 0.00026240872412067987, "loss": 0.0243, "step": 96680 }, { "epoch": 0.25, "learning_rate": 0.0002624048359043084, "loss": 0.0197, "step": 96690 }, { "epoch": 0.25, "learning_rate": 0.0002624009476879369, "loss": 0.0253, "step": 96700 }, { "epoch": 0.25, "learning_rate": 0.00026239705947156546, "loss": 0.0206, "step": 96710 }, { "epoch": 0.25, "learning_rate": 0.000262393171255194, "loss": 0.0228, "step": 96720 }, { "epoch": 0.25, "learning_rate": 0.00026238928303882255, "loss": 0.0206, "step": 96730 }, { "epoch": 0.25, "learning_rate": 0.00026238539482245106, "loss": 0.0258, "step": 96740 }, { "epoch": 0.25, "learning_rate": 0.0002623815066060796, "loss": 0.0245, "step": 96750 }, { "epoch": 0.25, "learning_rate": 0.00026237761838970815, "loss": 0.0176, "step": 96760 }, { "epoch": 0.25, "learning_rate": 0.00026237373017333666, "loss": 0.0235, "step": 96770 }, { "epoch": 0.25, "learning_rate": 0.0002623698419569652, "loss": 0.0234, "step": 96780 }, { "epoch": 0.25, "learning_rate": 0.00026236595374059374, "loss": 0.0259, "step": 96790 }, { "epoch": 0.25, "learning_rate": 0.00026236206552422226, "loss": 0.0218, "step": 96800 }, { "epoch": 0.25, "learning_rate": 0.0002623581773078508, "loss": 0.0227, "step": 96810 }, { "epoch": 0.25, "learning_rate": 0.00026235428909147934, "loss": 0.0229, "step": 96820 }, { "epoch": 0.25, "learning_rate": 0.00026235040087510786, "loss": 0.025, "step": 96830 }, { "epoch": 0.25, "learning_rate": 0.00026234651265873637, "loss": 0.0188, "step": 96840 }, { "epoch": 0.25, "learning_rate": 0.00026234262444236494, "loss": 0.0253, "step": 96850 }, { "epoch": 0.25, "learning_rate": 0.0002623387362259935, "loss": 0.0241, "step": 96860 }, { "epoch": 0.25, "learning_rate": 0.000262334848009622, "loss": 0.0215, "step": 96870 }, { "epoch": 0.25, "learning_rate": 0.00026233095979325054, "loss": 0.021, "step": 96880 }, { "epoch": 0.25, "learning_rate": 0.0002623270715768791, "loss": 0.0251, "step": 96890 }, { "epoch": 0.25, "learning_rate": 0.0002623231833605076, "loss": 0.0225, "step": 96900 }, { "epoch": 0.25, "learning_rate": 0.00026231929514413613, "loss": 0.0237, "step": 96910 }, { "epoch": 0.25, "learning_rate": 0.0002623154069277647, "loss": 0.0289, "step": 96920 }, { "epoch": 0.25, "learning_rate": 0.0002623115187113932, "loss": 0.0258, "step": 96930 }, { "epoch": 0.25, "learning_rate": 0.0002623076304950218, "loss": 0.0183, "step": 96940 }, { "epoch": 0.25, "learning_rate": 0.0002623037422786503, "loss": 0.0241, "step": 96950 }, { "epoch": 0.25, "learning_rate": 0.0002622998540622788, "loss": 0.0189, "step": 96960 }, { "epoch": 0.25, "learning_rate": 0.0002622959658459074, "loss": 0.0213, "step": 96970 }, { "epoch": 0.25, "learning_rate": 0.0002622920776295359, "loss": 0.0244, "step": 96980 }, { "epoch": 0.25, "learning_rate": 0.0002622881894131644, "loss": 0.024, "step": 96990 }, { "epoch": 0.25, "learning_rate": 0.000262284301196793, "loss": 0.0202, "step": 97000 }, { "epoch": 0.25, "eval_cer": 0.8818160569148363, "eval_loss": 0.016042526811361313, "eval_runtime": 107.9667, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 97000 }, { "epoch": 0.25, "learning_rate": 0.0002622804129804215, "loss": 0.0227, "step": 97010 }, { "epoch": 0.25, "learning_rate": 0.00026227652476405007, "loss": 0.0175, "step": 97020 }, { "epoch": 0.25, "learning_rate": 0.0002622726365476786, "loss": 0.0196, "step": 97030 }, { "epoch": 0.25, "learning_rate": 0.0002622687483313071, "loss": 0.0252, "step": 97040 }, { "epoch": 0.25, "learning_rate": 0.00026226486011493566, "loss": 0.021, "step": 97050 }, { "epoch": 0.25, "learning_rate": 0.0002622609718985642, "loss": 0.0247, "step": 97060 }, { "epoch": 0.25, "learning_rate": 0.00026225708368219275, "loss": 0.0296, "step": 97070 }, { "epoch": 0.25, "learning_rate": 0.00026225319546582126, "loss": 0.0238, "step": 97080 }, { "epoch": 0.25, "learning_rate": 0.0002622493072494498, "loss": 0.0204, "step": 97090 }, { "epoch": 0.25, "learning_rate": 0.00026224541903307834, "loss": 0.0246, "step": 97100 }, { "epoch": 0.25, "learning_rate": 0.00026224153081670686, "loss": 0.0229, "step": 97110 }, { "epoch": 0.25, "learning_rate": 0.0002622376426003354, "loss": 0.0236, "step": 97120 }, { "epoch": 0.25, "learning_rate": 0.00026223375438396394, "loss": 0.021, "step": 97130 }, { "epoch": 0.25, "learning_rate": 0.0002622298661675925, "loss": 0.0214, "step": 97140 }, { "epoch": 0.25, "learning_rate": 0.000262225977951221, "loss": 0.0232, "step": 97150 }, { "epoch": 0.25, "learning_rate": 0.00026222208973484954, "loss": 0.0223, "step": 97160 }, { "epoch": 0.25, "learning_rate": 0.00026221820151847805, "loss": 0.0248, "step": 97170 }, { "epoch": 0.25, "learning_rate": 0.0002622143133021066, "loss": 0.0238, "step": 97180 }, { "epoch": 0.25, "learning_rate": 0.00026221042508573514, "loss": 0.0227, "step": 97190 }, { "epoch": 0.25, "learning_rate": 0.0002622065368693637, "loss": 0.022, "step": 97200 }, { "epoch": 0.25, "learning_rate": 0.0002622026486529922, "loss": 0.0239, "step": 97210 }, { "epoch": 0.25, "learning_rate": 0.0002621987604366208, "loss": 0.02, "step": 97220 }, { "epoch": 0.25, "learning_rate": 0.0002621948722202493, "loss": 0.023, "step": 97230 }, { "epoch": 0.25, "learning_rate": 0.0002621909840038778, "loss": 0.0185, "step": 97240 }, { "epoch": 0.25, "learning_rate": 0.00026218709578750633, "loss": 0.0222, "step": 97250 }, { "epoch": 0.25, "learning_rate": 0.0002621832075711349, "loss": 0.022, "step": 97260 }, { "epoch": 0.25, "learning_rate": 0.0002621793193547634, "loss": 0.0252, "step": 97270 }, { "epoch": 0.25, "learning_rate": 0.000262175431138392, "loss": 0.027, "step": 97280 }, { "epoch": 0.25, "learning_rate": 0.0002621715429220205, "loss": 0.0224, "step": 97290 }, { "epoch": 0.25, "learning_rate": 0.000262167654705649, "loss": 0.0209, "step": 97300 }, { "epoch": 0.25, "learning_rate": 0.0002621637664892776, "loss": 0.0219, "step": 97310 }, { "epoch": 0.25, "learning_rate": 0.0002621598782729061, "loss": 0.0227, "step": 97320 }, { "epoch": 0.25, "learning_rate": 0.0002621559900565346, "loss": 0.0263, "step": 97330 }, { "epoch": 0.25, "learning_rate": 0.0002621521018401632, "loss": 0.0215, "step": 97340 }, { "epoch": 0.25, "learning_rate": 0.00026214821362379175, "loss": 0.0214, "step": 97350 }, { "epoch": 0.25, "learning_rate": 0.00026214432540742026, "loss": 0.0172, "step": 97360 }, { "epoch": 0.25, "learning_rate": 0.0002621404371910488, "loss": 0.0268, "step": 97370 }, { "epoch": 0.25, "learning_rate": 0.0002621365489746773, "loss": 0.0224, "step": 97380 }, { "epoch": 0.25, "learning_rate": 0.00026213266075830586, "loss": 0.0195, "step": 97390 }, { "epoch": 0.25, "learning_rate": 0.0002621287725419344, "loss": 0.0219, "step": 97400 }, { "epoch": 0.25, "learning_rate": 0.00026212488432556295, "loss": 0.02, "step": 97410 }, { "epoch": 0.25, "learning_rate": 0.00026212099610919146, "loss": 0.0233, "step": 97420 }, { "epoch": 0.25, "learning_rate": 0.00026211710789282003, "loss": 0.0182, "step": 97430 }, { "epoch": 0.25, "learning_rate": 0.00026211321967644854, "loss": 0.0235, "step": 97440 }, { "epoch": 0.25, "learning_rate": 0.00026210933146007706, "loss": 0.0277, "step": 97450 }, { "epoch": 0.25, "learning_rate": 0.00026210544324370557, "loss": 0.0193, "step": 97460 }, { "epoch": 0.25, "learning_rate": 0.00026210155502733414, "loss": 0.0187, "step": 97470 }, { "epoch": 0.25, "learning_rate": 0.00026209766681096266, "loss": 0.0199, "step": 97480 }, { "epoch": 0.25, "learning_rate": 0.0002620937785945912, "loss": 0.0221, "step": 97490 }, { "epoch": 0.25, "learning_rate": 0.00026208989037821974, "loss": 0.023, "step": 97500 }, { "epoch": 0.25, "learning_rate": 0.00026208600216184825, "loss": 0.0252, "step": 97510 }, { "epoch": 0.25, "learning_rate": 0.0002620821139454768, "loss": 0.0199, "step": 97520 }, { "epoch": 0.25, "learning_rate": 0.00026207822572910534, "loss": 0.0201, "step": 97530 }, { "epoch": 0.25, "learning_rate": 0.0002620743375127339, "loss": 0.0221, "step": 97540 }, { "epoch": 0.25, "learning_rate": 0.0002620704492963624, "loss": 0.0242, "step": 97550 }, { "epoch": 0.25, "learning_rate": 0.000262066561079991, "loss": 0.0248, "step": 97560 }, { "epoch": 0.25, "learning_rate": 0.0002620626728636195, "loss": 0.0214, "step": 97570 }, { "epoch": 0.25, "learning_rate": 0.000262058784647248, "loss": 0.0246, "step": 97580 }, { "epoch": 0.25, "learning_rate": 0.00026205489643087653, "loss": 0.0233, "step": 97590 }, { "epoch": 0.25, "learning_rate": 0.0002620510082145051, "loss": 0.02, "step": 97600 }, { "epoch": 0.25, "learning_rate": 0.0002620471199981336, "loss": 0.021, "step": 97610 }, { "epoch": 0.25, "learning_rate": 0.0002620432317817622, "loss": 0.0219, "step": 97620 }, { "epoch": 0.25, "learning_rate": 0.0002620393435653907, "loss": 0.0237, "step": 97630 }, { "epoch": 0.25, "learning_rate": 0.00026203545534901927, "loss": 0.0237, "step": 97640 }, { "epoch": 0.25, "learning_rate": 0.0002620315671326478, "loss": 0.0202, "step": 97650 }, { "epoch": 0.25, "learning_rate": 0.0002620276789162763, "loss": 0.0219, "step": 97660 }, { "epoch": 0.25, "learning_rate": 0.0002620237906999048, "loss": 0.0214, "step": 97670 }, { "epoch": 0.25, "learning_rate": 0.0002620199024835334, "loss": 0.0295, "step": 97680 }, { "epoch": 0.25, "learning_rate": 0.00026201601426716195, "loss": 0.0185, "step": 97690 }, { "epoch": 0.25, "learning_rate": 0.00026201212605079046, "loss": 0.0212, "step": 97700 }, { "epoch": 0.25, "learning_rate": 0.000262008237834419, "loss": 0.0268, "step": 97710 }, { "epoch": 0.25, "learning_rate": 0.00026200434961804755, "loss": 0.0236, "step": 97720 }, { "epoch": 0.25, "learning_rate": 0.00026200046140167606, "loss": 0.0239, "step": 97730 }, { "epoch": 0.25, "learning_rate": 0.0002619965731853046, "loss": 0.0194, "step": 97740 }, { "epoch": 0.25, "learning_rate": 0.00026199268496893314, "loss": 0.0236, "step": 97750 }, { "epoch": 0.25, "learning_rate": 0.00026198879675256166, "loss": 0.02, "step": 97760 }, { "epoch": 0.25, "learning_rate": 0.00026198490853619023, "loss": 0.0215, "step": 97770 }, { "epoch": 0.25, "learning_rate": 0.00026198102031981874, "loss": 0.0231, "step": 97780 }, { "epoch": 0.25, "learning_rate": 0.00026197713210344726, "loss": 0.0298, "step": 97790 }, { "epoch": 0.25, "learning_rate": 0.00026197324388707577, "loss": 0.0227, "step": 97800 }, { "epoch": 0.25, "learning_rate": 0.00026196935567070434, "loss": 0.0215, "step": 97810 }, { "epoch": 0.25, "learning_rate": 0.00026196546745433285, "loss": 0.0186, "step": 97820 }, { "epoch": 0.25, "learning_rate": 0.0002619615792379614, "loss": 0.0246, "step": 97830 }, { "epoch": 0.25, "learning_rate": 0.00026195769102158994, "loss": 0.0229, "step": 97840 }, { "epoch": 0.25, "learning_rate": 0.0002619538028052185, "loss": 0.0218, "step": 97850 }, { "epoch": 0.25, "learning_rate": 0.000261949914588847, "loss": 0.018, "step": 97860 }, { "epoch": 0.25, "learning_rate": 0.00026194602637247554, "loss": 0.0201, "step": 97870 }, { "epoch": 0.25, "learning_rate": 0.00026194213815610405, "loss": 0.0216, "step": 97880 }, { "epoch": 0.25, "learning_rate": 0.0002619382499397326, "loss": 0.0217, "step": 97890 }, { "epoch": 0.25, "learning_rate": 0.0002619343617233612, "loss": 0.0193, "step": 97900 }, { "epoch": 0.25, "learning_rate": 0.0002619304735069897, "loss": 0.0183, "step": 97910 }, { "epoch": 0.25, "learning_rate": 0.0002619265852906182, "loss": 0.0198, "step": 97920 }, { "epoch": 0.25, "learning_rate": 0.0002619226970742468, "loss": 0.0229, "step": 97930 }, { "epoch": 0.25, "learning_rate": 0.0002619188088578753, "loss": 0.0204, "step": 97940 }, { "epoch": 0.25, "learning_rate": 0.0002619149206415038, "loss": 0.0208, "step": 97950 }, { "epoch": 0.25, "learning_rate": 0.0002619110324251324, "loss": 0.0247, "step": 97960 }, { "epoch": 0.25, "learning_rate": 0.0002619071442087609, "loss": 0.0209, "step": 97970 }, { "epoch": 0.25, "learning_rate": 0.00026190325599238947, "loss": 0.0225, "step": 97980 }, { "epoch": 0.25, "learning_rate": 0.000261899367776018, "loss": 0.0227, "step": 97990 }, { "epoch": 0.25, "learning_rate": 0.0002618954795596465, "loss": 0.0202, "step": 98000 }, { "epoch": 0.25, "eval_cer": 0.8818538471120592, "eval_loss": 0.016256479546427727, "eval_runtime": 107.9645, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 98000 }, { "epoch": 0.25, "learning_rate": 0.000261891591343275, "loss": 0.0266, "step": 98010 }, { "epoch": 0.25, "learning_rate": 0.0002618877031269036, "loss": 0.0213, "step": 98020 }, { "epoch": 0.25, "learning_rate": 0.0002618838149105321, "loss": 0.0209, "step": 98030 }, { "epoch": 0.25, "learning_rate": 0.00026187992669416066, "loss": 0.0241, "step": 98040 }, { "epoch": 0.25, "learning_rate": 0.0002618760384777892, "loss": 0.0208, "step": 98050 }, { "epoch": 0.25, "learning_rate": 0.00026187215026141775, "loss": 0.0212, "step": 98060 }, { "epoch": 0.25, "learning_rate": 0.00026186826204504626, "loss": 0.0241, "step": 98070 }, { "epoch": 0.25, "learning_rate": 0.0002618643738286748, "loss": 0.0228, "step": 98080 }, { "epoch": 0.25, "learning_rate": 0.00026186048561230334, "loss": 0.0236, "step": 98090 }, { "epoch": 0.25, "learning_rate": 0.00026185659739593186, "loss": 0.0243, "step": 98100 }, { "epoch": 0.25, "learning_rate": 0.0002618527091795604, "loss": 0.0225, "step": 98110 }, { "epoch": 0.25, "learning_rate": 0.00026184882096318894, "loss": 0.0208, "step": 98120 }, { "epoch": 0.25, "learning_rate": 0.00026184493274681746, "loss": 0.0218, "step": 98130 }, { "epoch": 0.25, "learning_rate": 0.000261841044530446, "loss": 0.0229, "step": 98140 }, { "epoch": 0.25, "learning_rate": 0.00026183715631407454, "loss": 0.0221, "step": 98150 }, { "epoch": 0.25, "learning_rate": 0.00026183326809770305, "loss": 0.0188, "step": 98160 }, { "epoch": 0.25, "learning_rate": 0.0002618293798813316, "loss": 0.0269, "step": 98170 }, { "epoch": 0.25, "learning_rate": 0.00026182549166496014, "loss": 0.021, "step": 98180 }, { "epoch": 0.25, "learning_rate": 0.0002618216034485887, "loss": 0.0239, "step": 98190 }, { "epoch": 0.25, "learning_rate": 0.0002618177152322172, "loss": 0.025, "step": 98200 }, { "epoch": 0.25, "learning_rate": 0.00026181382701584573, "loss": 0.0194, "step": 98210 }, { "epoch": 0.25, "learning_rate": 0.0002618099387994743, "loss": 0.0218, "step": 98220 }, { "epoch": 0.25, "learning_rate": 0.0002618060505831028, "loss": 0.0222, "step": 98230 }, { "epoch": 0.25, "learning_rate": 0.0002618021623667314, "loss": 0.0166, "step": 98240 }, { "epoch": 0.25, "learning_rate": 0.0002617982741503599, "loss": 0.0207, "step": 98250 }, { "epoch": 0.25, "learning_rate": 0.0002617943859339884, "loss": 0.0205, "step": 98260 }, { "epoch": 0.25, "learning_rate": 0.000261790497717617, "loss": 0.0233, "step": 98270 }, { "epoch": 0.25, "learning_rate": 0.0002617866095012455, "loss": 0.0188, "step": 98280 }, { "epoch": 0.25, "learning_rate": 0.000261782721284874, "loss": 0.0242, "step": 98290 }, { "epoch": 0.25, "learning_rate": 0.0002617788330685026, "loss": 0.0202, "step": 98300 }, { "epoch": 0.25, "learning_rate": 0.0002617749448521311, "loss": 0.0292, "step": 98310 }, { "epoch": 0.25, "learning_rate": 0.00026177105663575967, "loss": 0.0216, "step": 98320 }, { "epoch": 0.25, "learning_rate": 0.0002617671684193882, "loss": 0.0205, "step": 98330 }, { "epoch": 0.25, "learning_rate": 0.0002617632802030167, "loss": 0.024, "step": 98340 }, { "epoch": 0.25, "learning_rate": 0.00026175939198664526, "loss": 0.0222, "step": 98350 }, { "epoch": 0.25, "learning_rate": 0.0002617555037702738, "loss": 0.03, "step": 98360 }, { "epoch": 0.25, "learning_rate": 0.0002617516155539023, "loss": 0.0225, "step": 98370 }, { "epoch": 0.26, "learning_rate": 0.00026174772733753086, "loss": 0.028, "step": 98380 }, { "epoch": 0.26, "learning_rate": 0.00026174383912115943, "loss": 0.0211, "step": 98390 }, { "epoch": 0.26, "learning_rate": 0.00026173995090478794, "loss": 0.027, "step": 98400 }, { "epoch": 0.26, "learning_rate": 0.00026173606268841646, "loss": 0.022, "step": 98410 }, { "epoch": 0.26, "learning_rate": 0.000261732174472045, "loss": 0.0218, "step": 98420 }, { "epoch": 0.26, "learning_rate": 0.00026172828625567354, "loss": 0.0186, "step": 98430 }, { "epoch": 0.26, "learning_rate": 0.00026172439803930206, "loss": 0.0247, "step": 98440 }, { "epoch": 0.26, "learning_rate": 0.0002617205098229306, "loss": 0.0229, "step": 98450 }, { "epoch": 0.26, "learning_rate": 0.00026171662160655914, "loss": 0.0177, "step": 98460 }, { "epoch": 0.26, "learning_rate": 0.0002617127333901877, "loss": 0.0238, "step": 98470 }, { "epoch": 0.26, "learning_rate": 0.0002617088451738162, "loss": 0.0207, "step": 98480 }, { "epoch": 0.26, "learning_rate": 0.00026170495695744474, "loss": 0.0229, "step": 98490 }, { "epoch": 0.26, "learning_rate": 0.00026170106874107325, "loss": 0.0228, "step": 98500 }, { "epoch": 0.26, "learning_rate": 0.0002616971805247018, "loss": 0.0234, "step": 98510 }, { "epoch": 0.26, "learning_rate": 0.00026169329230833034, "loss": 0.0276, "step": 98520 }, { "epoch": 0.26, "learning_rate": 0.0002616894040919589, "loss": 0.0217, "step": 98530 }, { "epoch": 0.26, "learning_rate": 0.0002616855158755874, "loss": 0.0235, "step": 98540 }, { "epoch": 0.26, "learning_rate": 0.00026168162765921593, "loss": 0.0204, "step": 98550 }, { "epoch": 0.26, "learning_rate": 0.0002616777394428445, "loss": 0.0252, "step": 98560 }, { "epoch": 0.26, "learning_rate": 0.000261673851226473, "loss": 0.0271, "step": 98570 }, { "epoch": 0.26, "learning_rate": 0.00026166996301010153, "loss": 0.0296, "step": 98580 }, { "epoch": 0.26, "learning_rate": 0.0002616660747937301, "loss": 0.0246, "step": 98590 }, { "epoch": 0.26, "learning_rate": 0.00026166218657735867, "loss": 0.0202, "step": 98600 }, { "epoch": 0.26, "learning_rate": 0.0002616582983609872, "loss": 0.0229, "step": 98610 }, { "epoch": 0.26, "learning_rate": 0.0002616544101446157, "loss": 0.0245, "step": 98620 }, { "epoch": 0.26, "learning_rate": 0.0002616505219282442, "loss": 0.021, "step": 98630 }, { "epoch": 0.26, "learning_rate": 0.0002616466337118728, "loss": 0.0212, "step": 98640 }, { "epoch": 0.26, "learning_rate": 0.0002616427454955013, "loss": 0.0243, "step": 98650 }, { "epoch": 0.26, "learning_rate": 0.00026163885727912986, "loss": 0.0236, "step": 98660 }, { "epoch": 0.26, "learning_rate": 0.0002616349690627584, "loss": 0.0226, "step": 98670 }, { "epoch": 0.26, "learning_rate": 0.00026163108084638695, "loss": 0.0222, "step": 98680 }, { "epoch": 0.26, "learning_rate": 0.00026162719263001546, "loss": 0.0247, "step": 98690 }, { "epoch": 0.26, "learning_rate": 0.000261623304413644, "loss": 0.0238, "step": 98700 }, { "epoch": 0.26, "learning_rate": 0.0002616194161972725, "loss": 0.0241, "step": 98710 }, { "epoch": 0.26, "learning_rate": 0.00026161552798090106, "loss": 0.0229, "step": 98720 }, { "epoch": 0.26, "learning_rate": 0.00026161163976452963, "loss": 0.0178, "step": 98730 }, { "epoch": 0.26, "learning_rate": 0.00026160775154815814, "loss": 0.0238, "step": 98740 }, { "epoch": 0.26, "learning_rate": 0.00026160386333178666, "loss": 0.019, "step": 98750 }, { "epoch": 0.26, "learning_rate": 0.00026159997511541517, "loss": 0.022, "step": 98760 }, { "epoch": 0.26, "learning_rate": 0.00026159608689904374, "loss": 0.0239, "step": 98770 }, { "epoch": 0.26, "learning_rate": 0.00026159219868267226, "loss": 0.0189, "step": 98780 }, { "epoch": 0.26, "learning_rate": 0.0002615883104663008, "loss": 0.0236, "step": 98790 }, { "epoch": 0.26, "learning_rate": 0.00026158442224992934, "loss": 0.0194, "step": 98800 }, { "epoch": 0.26, "learning_rate": 0.0002615805340335579, "loss": 0.0263, "step": 98810 }, { "epoch": 0.26, "learning_rate": 0.0002615766458171864, "loss": 0.0217, "step": 98820 }, { "epoch": 0.26, "learning_rate": 0.00026157275760081494, "loss": 0.0203, "step": 98830 }, { "epoch": 0.26, "learning_rate": 0.00026156886938444345, "loss": 0.0248, "step": 98840 }, { "epoch": 0.26, "learning_rate": 0.000261564981168072, "loss": 0.0175, "step": 98850 }, { "epoch": 0.26, "learning_rate": 0.00026156109295170053, "loss": 0.0217, "step": 98860 }, { "epoch": 0.26, "learning_rate": 0.0002615572047353291, "loss": 0.0209, "step": 98870 }, { "epoch": 0.26, "learning_rate": 0.0002615533165189576, "loss": 0.0261, "step": 98880 }, { "epoch": 0.26, "learning_rate": 0.0002615494283025862, "loss": 0.0221, "step": 98890 }, { "epoch": 0.26, "learning_rate": 0.0002615455400862147, "loss": 0.0204, "step": 98900 }, { "epoch": 0.26, "learning_rate": 0.0002615416518698432, "loss": 0.0233, "step": 98910 }, { "epoch": 0.26, "learning_rate": 0.00026153776365347173, "loss": 0.0231, "step": 98920 }, { "epoch": 0.26, "learning_rate": 0.0002615338754371003, "loss": 0.0212, "step": 98930 }, { "epoch": 0.26, "learning_rate": 0.00026152998722072887, "loss": 0.019, "step": 98940 }, { "epoch": 0.26, "learning_rate": 0.0002615260990043574, "loss": 0.0218, "step": 98950 }, { "epoch": 0.26, "learning_rate": 0.0002615222107879859, "loss": 0.0286, "step": 98960 }, { "epoch": 0.26, "learning_rate": 0.00026151832257161447, "loss": 0.0237, "step": 98970 }, { "epoch": 0.26, "learning_rate": 0.000261514434355243, "loss": 0.0218, "step": 98980 }, { "epoch": 0.26, "learning_rate": 0.0002615105461388715, "loss": 0.0207, "step": 98990 }, { "epoch": 0.26, "learning_rate": 0.00026150665792250006, "loss": 0.0205, "step": 99000 }, { "epoch": 0.26, "eval_cer": 0.8817950623608236, "eval_loss": 0.015839723870158195, "eval_runtime": 108.0387, "eval_samples_per_second": 18.512, "eval_steps_per_second": 4.628, "step": 99000 }, { "epoch": 0.26, "learning_rate": 0.0002615027697061286, "loss": 0.0234, "step": 99010 }, { "epoch": 0.26, "learning_rate": 0.00026149888148975715, "loss": 0.0225, "step": 99020 }, { "epoch": 0.26, "learning_rate": 0.00026149499327338566, "loss": 0.0271, "step": 99030 }, { "epoch": 0.26, "learning_rate": 0.0002614911050570142, "loss": 0.0229, "step": 99040 }, { "epoch": 0.26, "learning_rate": 0.0002614872168406427, "loss": 0.0305, "step": 99050 }, { "epoch": 0.26, "learning_rate": 0.00026148332862427126, "loss": 0.0265, "step": 99060 }, { "epoch": 0.26, "learning_rate": 0.0002614794404078998, "loss": 0.0224, "step": 99070 }, { "epoch": 0.26, "learning_rate": 0.00026147555219152834, "loss": 0.0176, "step": 99080 }, { "epoch": 0.26, "learning_rate": 0.00026147166397515686, "loss": 0.0172, "step": 99090 }, { "epoch": 0.26, "learning_rate": 0.0002614677757587854, "loss": 0.0232, "step": 99100 }, { "epoch": 0.26, "learning_rate": 0.00026146388754241394, "loss": 0.0228, "step": 99110 }, { "epoch": 0.26, "learning_rate": 0.00026145999932604245, "loss": 0.0266, "step": 99120 }, { "epoch": 0.26, "learning_rate": 0.000261456111109671, "loss": 0.0196, "step": 99130 }, { "epoch": 0.26, "learning_rate": 0.00026145222289329954, "loss": 0.0225, "step": 99140 }, { "epoch": 0.26, "learning_rate": 0.0002614483346769281, "loss": 0.0243, "step": 99150 }, { "epoch": 0.26, "learning_rate": 0.0002614444464605566, "loss": 0.0239, "step": 99160 }, { "epoch": 0.26, "learning_rate": 0.00026144055824418514, "loss": 0.0237, "step": 99170 }, { "epoch": 0.26, "learning_rate": 0.0002614366700278137, "loss": 0.0182, "step": 99180 }, { "epoch": 0.26, "learning_rate": 0.0002614327818114422, "loss": 0.0192, "step": 99190 }, { "epoch": 0.26, "learning_rate": 0.00026142889359507073, "loss": 0.0272, "step": 99200 }, { "epoch": 0.26, "learning_rate": 0.0002614250053786993, "loss": 0.0214, "step": 99210 }, { "epoch": 0.26, "learning_rate": 0.0002614211171623278, "loss": 0.0237, "step": 99220 }, { "epoch": 0.26, "learning_rate": 0.0002614172289459564, "loss": 0.0208, "step": 99230 }, { "epoch": 0.26, "learning_rate": 0.0002614133407295849, "loss": 0.0245, "step": 99240 }, { "epoch": 0.26, "learning_rate": 0.0002614094525132134, "loss": 0.0259, "step": 99250 }, { "epoch": 0.26, "learning_rate": 0.00026140556429684193, "loss": 0.0242, "step": 99260 }, { "epoch": 0.26, "learning_rate": 0.0002614016760804705, "loss": 0.0194, "step": 99270 }, { "epoch": 0.26, "learning_rate": 0.00026139778786409907, "loss": 0.0268, "step": 99280 }, { "epoch": 0.26, "learning_rate": 0.0002613938996477276, "loss": 0.0219, "step": 99290 }, { "epoch": 0.26, "learning_rate": 0.0002613900114313561, "loss": 0.0215, "step": 99300 }, { "epoch": 0.26, "learning_rate": 0.00026138612321498466, "loss": 0.0217, "step": 99310 }, { "epoch": 0.26, "learning_rate": 0.0002613822349986132, "loss": 0.0239, "step": 99320 }, { "epoch": 0.26, "learning_rate": 0.0002613783467822417, "loss": 0.0217, "step": 99330 }, { "epoch": 0.26, "learning_rate": 0.00026137445856587026, "loss": 0.0265, "step": 99340 }, { "epoch": 0.26, "learning_rate": 0.0002613705703494988, "loss": 0.0266, "step": 99350 }, { "epoch": 0.26, "learning_rate": 0.00026136668213312734, "loss": 0.0191, "step": 99360 }, { "epoch": 0.26, "learning_rate": 0.00026136279391675586, "loss": 0.0228, "step": 99370 }, { "epoch": 0.26, "learning_rate": 0.0002613589057003844, "loss": 0.0236, "step": 99380 }, { "epoch": 0.26, "learning_rate": 0.00026135501748401294, "loss": 0.0258, "step": 99390 }, { "epoch": 0.26, "learning_rate": 0.00026135112926764146, "loss": 0.0284, "step": 99400 }, { "epoch": 0.26, "learning_rate": 0.00026134724105126997, "loss": 0.0198, "step": 99410 }, { "epoch": 0.26, "learning_rate": 0.00026134335283489854, "loss": 0.0243, "step": 99420 }, { "epoch": 0.26, "learning_rate": 0.0002613394646185271, "loss": 0.024, "step": 99430 }, { "epoch": 0.26, "learning_rate": 0.0002613355764021556, "loss": 0.0189, "step": 99440 }, { "epoch": 0.26, "learning_rate": 0.00026133168818578414, "loss": 0.0216, "step": 99450 }, { "epoch": 0.26, "learning_rate": 0.00026132779996941265, "loss": 0.0211, "step": 99460 }, { "epoch": 0.26, "learning_rate": 0.0002613239117530412, "loss": 0.0249, "step": 99470 }, { "epoch": 0.26, "learning_rate": 0.00026132002353666974, "loss": 0.0242, "step": 99480 }, { "epoch": 0.26, "learning_rate": 0.0002613161353202983, "loss": 0.0225, "step": 99490 }, { "epoch": 0.26, "learning_rate": 0.0002613122471039268, "loss": 0.0191, "step": 99500 }, { "epoch": 0.26, "learning_rate": 0.00026130835888755533, "loss": 0.0225, "step": 99510 }, { "epoch": 0.26, "learning_rate": 0.0002613044706711839, "loss": 0.0226, "step": 99520 }, { "epoch": 0.26, "learning_rate": 0.0002613005824548124, "loss": 0.0258, "step": 99530 }, { "epoch": 0.26, "learning_rate": 0.00026129669423844093, "loss": 0.0223, "step": 99540 }, { "epoch": 0.26, "learning_rate": 0.0002612928060220695, "loss": 0.0273, "step": 99550 }, { "epoch": 0.26, "learning_rate": 0.000261288917805698, "loss": 0.0221, "step": 99560 }, { "epoch": 0.26, "learning_rate": 0.0002612850295893266, "loss": 0.0271, "step": 99570 }, { "epoch": 0.26, "learning_rate": 0.0002612811413729551, "loss": 0.021, "step": 99580 }, { "epoch": 0.26, "learning_rate": 0.0002612772531565836, "loss": 0.0252, "step": 99590 }, { "epoch": 0.26, "learning_rate": 0.0002612733649402122, "loss": 0.0385, "step": 99600 }, { "epoch": 0.26, "learning_rate": 0.0002612694767238407, "loss": 0.0196, "step": 99610 }, { "epoch": 0.26, "learning_rate": 0.0002612655885074692, "loss": 0.0225, "step": 99620 }, { "epoch": 0.26, "learning_rate": 0.0002612617002910978, "loss": 0.0233, "step": 99630 }, { "epoch": 0.26, "learning_rate": 0.00026125781207472635, "loss": 0.0218, "step": 99640 }, { "epoch": 0.26, "learning_rate": 0.00026125392385835486, "loss": 0.0198, "step": 99650 }, { "epoch": 0.26, "learning_rate": 0.0002612500356419834, "loss": 0.0203, "step": 99660 }, { "epoch": 0.26, "learning_rate": 0.0002612461474256119, "loss": 0.0211, "step": 99670 }, { "epoch": 0.26, "learning_rate": 0.00026124225920924046, "loss": 0.0228, "step": 99680 }, { "epoch": 0.26, "learning_rate": 0.000261238370992869, "loss": 0.0217, "step": 99690 }, { "epoch": 0.26, "learning_rate": 0.00026123448277649754, "loss": 0.0228, "step": 99700 }, { "epoch": 0.26, "learning_rate": 0.00026123059456012606, "loss": 0.0227, "step": 99710 }, { "epoch": 0.26, "learning_rate": 0.00026122670634375463, "loss": 0.0241, "step": 99720 }, { "epoch": 0.26, "learning_rate": 0.00026122281812738314, "loss": 0.0253, "step": 99730 }, { "epoch": 0.26, "learning_rate": 0.00026121892991101166, "loss": 0.02, "step": 99740 }, { "epoch": 0.26, "learning_rate": 0.00026121504169464017, "loss": 0.0224, "step": 99750 }, { "epoch": 0.26, "learning_rate": 0.00026121115347826874, "loss": 0.0276, "step": 99760 }, { "epoch": 0.26, "learning_rate": 0.00026120726526189725, "loss": 0.0225, "step": 99770 }, { "epoch": 0.26, "learning_rate": 0.0002612033770455258, "loss": 0.0234, "step": 99780 }, { "epoch": 0.26, "learning_rate": 0.00026119948882915434, "loss": 0.0194, "step": 99790 }, { "epoch": 0.26, "learning_rate": 0.00026119560061278285, "loss": 0.021, "step": 99800 }, { "epoch": 0.26, "learning_rate": 0.0002611917123964114, "loss": 0.0239, "step": 99810 }, { "epoch": 0.26, "learning_rate": 0.00026118782418003994, "loss": 0.0196, "step": 99820 }, { "epoch": 0.26, "learning_rate": 0.0002611839359636685, "loss": 0.0227, "step": 99830 }, { "epoch": 0.26, "learning_rate": 0.000261180047747297, "loss": 0.0228, "step": 99840 }, { "epoch": 0.26, "learning_rate": 0.0002611761595309256, "loss": 0.0228, "step": 99850 }, { "epoch": 0.26, "learning_rate": 0.0002611722713145541, "loss": 0.0219, "step": 99860 }, { "epoch": 0.26, "learning_rate": 0.0002611683830981826, "loss": 0.0187, "step": 99870 }, { "epoch": 0.26, "learning_rate": 0.00026116449488181113, "loss": 0.0194, "step": 99880 }, { "epoch": 0.26, "learning_rate": 0.0002611606066654397, "loss": 0.0174, "step": 99890 }, { "epoch": 0.26, "learning_rate": 0.0002611567184490682, "loss": 0.0234, "step": 99900 }, { "epoch": 0.26, "learning_rate": 0.0002611528302326968, "loss": 0.0185, "step": 99910 }, { "epoch": 0.26, "learning_rate": 0.0002611489420163253, "loss": 0.0366, "step": 99920 }, { "epoch": 0.26, "learning_rate": 0.00026114505379995387, "loss": 0.0209, "step": 99930 }, { "epoch": 0.26, "learning_rate": 0.0002611411655835824, "loss": 0.0215, "step": 99940 }, { "epoch": 0.26, "learning_rate": 0.0002611372773672109, "loss": 0.0184, "step": 99950 }, { "epoch": 0.26, "learning_rate": 0.0002611333891508394, "loss": 0.0215, "step": 99960 }, { "epoch": 0.26, "learning_rate": 0.000261129500934468, "loss": 0.0276, "step": 99970 }, { "epoch": 0.26, "learning_rate": 0.00026112561271809655, "loss": 0.0232, "step": 99980 }, { "epoch": 0.26, "learning_rate": 0.00026112172450172506, "loss": 0.0189, "step": 99990 }, { "epoch": 0.26, "learning_rate": 0.0002611178362853536, "loss": 0.0244, "step": 100000 }, { "epoch": 0.26, "eval_cer": 0.8818048598193629, "eval_loss": 0.01607738994061947, "eval_runtime": 108.1372, "eval_samples_per_second": 18.495, "eval_steps_per_second": 4.624, "step": 100000 }, { "epoch": 0.26, "learning_rate": 0.0002611139480689821, "loss": 0.0241, "step": 100010 }, { "epoch": 0.26, "learning_rate": 0.00026111005985261066, "loss": 0.0211, "step": 100020 }, { "epoch": 0.26, "learning_rate": 0.0002611061716362392, "loss": 0.046, "step": 100030 }, { "epoch": 0.26, "learning_rate": 0.00026110228341986774, "loss": 0.0293, "step": 100040 }, { "epoch": 0.26, "learning_rate": 0.00026109839520349626, "loss": 0.0233, "step": 100050 }, { "epoch": 0.26, "learning_rate": 0.0002610945069871248, "loss": 0.0241, "step": 100060 }, { "epoch": 0.26, "learning_rate": 0.00026109061877075334, "loss": 0.0217, "step": 100070 }, { "epoch": 0.26, "learning_rate": 0.00026108673055438186, "loss": 0.0227, "step": 100080 }, { "epoch": 0.26, "learning_rate": 0.00026108284233801037, "loss": 0.0247, "step": 100090 }, { "epoch": 0.26, "learning_rate": 0.00026107895412163894, "loss": 0.023, "step": 100100 }, { "epoch": 0.26, "learning_rate": 0.00026107506590526745, "loss": 0.0218, "step": 100110 }, { "epoch": 0.26, "learning_rate": 0.000261071177688896, "loss": 0.0217, "step": 100120 }, { "epoch": 0.26, "learning_rate": 0.00026106728947252454, "loss": 0.0204, "step": 100130 }, { "epoch": 0.26, "learning_rate": 0.0002610634012561531, "loss": 0.0181, "step": 100140 }, { "epoch": 0.26, "learning_rate": 0.0002610595130397816, "loss": 0.021, "step": 100150 }, { "epoch": 0.26, "learning_rate": 0.00026105562482341013, "loss": 0.0241, "step": 100160 }, { "epoch": 0.26, "learning_rate": 0.00026105173660703865, "loss": 0.0221, "step": 100170 }, { "epoch": 0.26, "learning_rate": 0.0002610478483906672, "loss": 0.0231, "step": 100180 }, { "epoch": 0.26, "learning_rate": 0.0002610439601742958, "loss": 0.0257, "step": 100190 }, { "epoch": 0.26, "learning_rate": 0.0002610400719579243, "loss": 0.024, "step": 100200 }, { "epoch": 0.26, "learning_rate": 0.0002610361837415528, "loss": 0.0207, "step": 100210 }, { "epoch": 0.26, "learning_rate": 0.0002610322955251814, "loss": 0.0226, "step": 100220 }, { "epoch": 0.26, "learning_rate": 0.0002610284073088099, "loss": 0.029, "step": 100230 }, { "epoch": 0.26, "learning_rate": 0.0002610245190924384, "loss": 0.0264, "step": 100240 }, { "epoch": 0.26, "learning_rate": 0.000261020630876067, "loss": 0.0246, "step": 100250 }, { "epoch": 0.26, "learning_rate": 0.0002610167426596955, "loss": 0.0245, "step": 100260 }, { "epoch": 0.26, "learning_rate": 0.00026101285444332406, "loss": 0.0193, "step": 100270 }, { "epoch": 0.26, "learning_rate": 0.0002610089662269526, "loss": 0.0197, "step": 100280 }, { "epoch": 0.26, "learning_rate": 0.0002610050780105811, "loss": 0.0241, "step": 100290 }, { "epoch": 0.26, "learning_rate": 0.0002610011897942096, "loss": 0.0238, "step": 100300 }, { "epoch": 0.26, "learning_rate": 0.0002609973015778382, "loss": 0.0232, "step": 100310 }, { "epoch": 0.26, "learning_rate": 0.00026099341336146675, "loss": 0.0185, "step": 100320 }, { "epoch": 0.26, "learning_rate": 0.00026098952514509526, "loss": 0.0279, "step": 100330 }, { "epoch": 0.26, "learning_rate": 0.0002609856369287238, "loss": 0.0223, "step": 100340 }, { "epoch": 0.26, "learning_rate": 0.00026098174871235234, "loss": 0.0223, "step": 100350 }, { "epoch": 0.26, "learning_rate": 0.00026097786049598086, "loss": 0.0231, "step": 100360 }, { "epoch": 0.26, "learning_rate": 0.00026097397227960937, "loss": 0.0207, "step": 100370 }, { "epoch": 0.26, "learning_rate": 0.00026097008406323794, "loss": 0.0213, "step": 100380 }, { "epoch": 0.26, "learning_rate": 0.00026096619584686646, "loss": 0.0245, "step": 100390 }, { "epoch": 0.26, "learning_rate": 0.000260962307630495, "loss": 0.0227, "step": 100400 }, { "epoch": 0.26, "learning_rate": 0.00026095841941412354, "loss": 0.0236, "step": 100410 }, { "epoch": 0.26, "learning_rate": 0.00026095453119775205, "loss": 0.0216, "step": 100420 }, { "epoch": 0.26, "learning_rate": 0.0002609506429813806, "loss": 0.0227, "step": 100430 }, { "epoch": 0.26, "learning_rate": 0.00026094675476500914, "loss": 0.027, "step": 100440 }, { "epoch": 0.26, "learning_rate": 0.00026094286654863765, "loss": 0.0248, "step": 100450 }, { "epoch": 0.26, "learning_rate": 0.0002609389783322662, "loss": 0.0228, "step": 100460 }, { "epoch": 0.26, "learning_rate": 0.0002609350901158948, "loss": 0.0181, "step": 100470 }, { "epoch": 0.26, "learning_rate": 0.0002609312018995233, "loss": 0.0184, "step": 100480 }, { "epoch": 0.26, "learning_rate": 0.0002609273136831518, "loss": 0.0245, "step": 100490 }, { "epoch": 0.26, "learning_rate": 0.00026092342546678033, "loss": 0.0253, "step": 100500 }, { "epoch": 0.26, "learning_rate": 0.00026091953725040885, "loss": 0.0218, "step": 100510 }, { "epoch": 0.26, "learning_rate": 0.0002609156490340374, "loss": 0.0249, "step": 100520 }, { "epoch": 0.26, "learning_rate": 0.000260911760817666, "loss": 0.0237, "step": 100530 }, { "epoch": 0.26, "learning_rate": 0.0002609078726012945, "loss": 0.0275, "step": 100540 }, { "epoch": 0.26, "learning_rate": 0.000260903984384923, "loss": 0.0228, "step": 100550 }, { "epoch": 0.26, "learning_rate": 0.0002609000961685516, "loss": 0.0279, "step": 100560 }, { "epoch": 0.26, "learning_rate": 0.0002608962079521801, "loss": 0.0254, "step": 100570 }, { "epoch": 0.26, "learning_rate": 0.0002608923197358086, "loss": 0.0253, "step": 100580 }, { "epoch": 0.26, "learning_rate": 0.0002608884315194372, "loss": 0.0215, "step": 100590 }, { "epoch": 0.26, "learning_rate": 0.0002608845433030657, "loss": 0.024, "step": 100600 }, { "epoch": 0.26, "learning_rate": 0.00026088065508669426, "loss": 0.0226, "step": 100610 }, { "epoch": 0.26, "learning_rate": 0.0002608767668703228, "loss": 0.0256, "step": 100620 }, { "epoch": 0.26, "learning_rate": 0.0002608728786539513, "loss": 0.0261, "step": 100630 }, { "epoch": 0.26, "learning_rate": 0.00026086899043757986, "loss": 0.0236, "step": 100640 }, { "epoch": 0.26, "learning_rate": 0.0002608651022212084, "loss": 0.0191, "step": 100650 }, { "epoch": 0.26, "learning_rate": 0.0002608612140048369, "loss": 0.0231, "step": 100660 }, { "epoch": 0.26, "learning_rate": 0.00026085732578846546, "loss": 0.0195, "step": 100670 }, { "epoch": 0.26, "learning_rate": 0.00026085343757209403, "loss": 0.0232, "step": 100680 }, { "epoch": 0.26, "learning_rate": 0.00026084954935572254, "loss": 0.0223, "step": 100690 }, { "epoch": 0.26, "learning_rate": 0.00026084566113935106, "loss": 0.0222, "step": 100700 }, { "epoch": 0.26, "learning_rate": 0.00026084177292297957, "loss": 0.0238, "step": 100710 }, { "epoch": 0.26, "learning_rate": 0.00026083788470660814, "loss": 0.0177, "step": 100720 }, { "epoch": 0.26, "learning_rate": 0.00026083399649023665, "loss": 0.0284, "step": 100730 }, { "epoch": 0.26, "learning_rate": 0.0002608301082738652, "loss": 0.0255, "step": 100740 }, { "epoch": 0.26, "learning_rate": 0.00026082622005749374, "loss": 0.0242, "step": 100750 }, { "epoch": 0.26, "learning_rate": 0.00026082233184112225, "loss": 0.0192, "step": 100760 }, { "epoch": 0.26, "learning_rate": 0.0002608184436247508, "loss": 0.0256, "step": 100770 }, { "epoch": 0.26, "learning_rate": 0.00026081455540837934, "loss": 0.0208, "step": 100780 }, { "epoch": 0.26, "learning_rate": 0.00026081066719200785, "loss": 0.0274, "step": 100790 }, { "epoch": 0.26, "learning_rate": 0.0002608067789756364, "loss": 0.0235, "step": 100800 }, { "epoch": 0.26, "learning_rate": 0.00026080289075926493, "loss": 0.0306, "step": 100810 }, { "epoch": 0.26, "learning_rate": 0.0002607990025428935, "loss": 0.0194, "step": 100820 }, { "epoch": 0.26, "learning_rate": 0.000260795114326522, "loss": 0.0222, "step": 100830 }, { "epoch": 0.26, "learning_rate": 0.00026079122611015053, "loss": 0.0261, "step": 100840 }, { "epoch": 0.26, "learning_rate": 0.0002607873378937791, "loss": 0.029, "step": 100850 }, { "epoch": 0.26, "learning_rate": 0.0002607834496774076, "loss": 0.0205, "step": 100860 }, { "epoch": 0.26, "learning_rate": 0.0002607795614610362, "loss": 0.0206, "step": 100870 }, { "epoch": 0.26, "learning_rate": 0.0002607756732446647, "loss": 0.0235, "step": 100880 }, { "epoch": 0.26, "learning_rate": 0.00026077178502829327, "loss": 0.02, "step": 100890 }, { "epoch": 0.26, "learning_rate": 0.0002607678968119218, "loss": 0.0231, "step": 100900 }, { "epoch": 0.26, "learning_rate": 0.0002607640085955503, "loss": 0.0265, "step": 100910 }, { "epoch": 0.26, "learning_rate": 0.0002607601203791788, "loss": 0.0222, "step": 100920 }, { "epoch": 0.26, "learning_rate": 0.0002607562321628074, "loss": 0.0176, "step": 100930 }, { "epoch": 0.26, "learning_rate": 0.0002607523439464359, "loss": 0.0242, "step": 100940 }, { "epoch": 0.26, "learning_rate": 0.00026074845573006446, "loss": 0.0206, "step": 100950 }, { "epoch": 0.26, "learning_rate": 0.000260744567513693, "loss": 0.0225, "step": 100960 }, { "epoch": 0.26, "learning_rate": 0.00026074067929732155, "loss": 0.0296, "step": 100970 }, { "epoch": 0.26, "learning_rate": 0.00026073679108095006, "loss": 0.0254, "step": 100980 }, { "epoch": 0.26, "learning_rate": 0.0002607329028645786, "loss": 0.0212, "step": 100990 }, { "epoch": 0.26, "learning_rate": 0.0002607290146482071, "loss": 0.0226, "step": 101000 }, { "epoch": 0.26, "eval_cer": 0.8817740678068109, "eval_loss": 0.01563679240643978, "eval_runtime": 108.1764, "eval_samples_per_second": 18.488, "eval_steps_per_second": 4.622, "step": 101000 }, { "epoch": 0.26, "learning_rate": 0.00026072512643183566, "loss": 0.0201, "step": 101010 }, { "epoch": 0.26, "learning_rate": 0.0002607212382154642, "loss": 0.0201, "step": 101020 }, { "epoch": 0.26, "learning_rate": 0.00026071734999909274, "loss": 0.0254, "step": 101030 }, { "epoch": 0.26, "learning_rate": 0.00026071346178272126, "loss": 0.0207, "step": 101040 }, { "epoch": 0.26, "learning_rate": 0.00026070957356634977, "loss": 0.0215, "step": 101050 }, { "epoch": 0.26, "learning_rate": 0.00026070568534997834, "loss": 0.0232, "step": 101060 }, { "epoch": 0.26, "learning_rate": 0.00026070179713360685, "loss": 0.0203, "step": 101070 }, { "epoch": 0.26, "learning_rate": 0.0002606979089172354, "loss": 0.0196, "step": 101080 }, { "epoch": 0.26, "learning_rate": 0.00026069402070086394, "loss": 0.0232, "step": 101090 }, { "epoch": 0.26, "learning_rate": 0.0002606901324844925, "loss": 0.0243, "step": 101100 }, { "epoch": 0.26, "learning_rate": 0.000260686244268121, "loss": 0.0192, "step": 101110 }, { "epoch": 0.26, "learning_rate": 0.00026068235605174953, "loss": 0.0193, "step": 101120 }, { "epoch": 0.26, "learning_rate": 0.00026067846783537805, "loss": 0.0203, "step": 101130 }, { "epoch": 0.26, "learning_rate": 0.0002606745796190066, "loss": 0.0181, "step": 101140 }, { "epoch": 0.26, "learning_rate": 0.00026067069140263513, "loss": 0.0202, "step": 101150 }, { "epoch": 0.26, "learning_rate": 0.0002606668031862637, "loss": 0.024, "step": 101160 }, { "epoch": 0.26, "learning_rate": 0.0002606629149698922, "loss": 0.0217, "step": 101170 }, { "epoch": 0.26, "learning_rate": 0.0002606590267535208, "loss": 0.0239, "step": 101180 }, { "epoch": 0.26, "learning_rate": 0.0002606551385371493, "loss": 0.0188, "step": 101190 }, { "epoch": 0.26, "learning_rate": 0.0002606512503207778, "loss": 0.0195, "step": 101200 }, { "epoch": 0.26, "learning_rate": 0.00026064736210440633, "loss": 0.0211, "step": 101210 }, { "epoch": 0.26, "learning_rate": 0.0002606434738880349, "loss": 0.0213, "step": 101220 }, { "epoch": 0.26, "learning_rate": 0.00026063958567166347, "loss": 0.0299, "step": 101230 }, { "epoch": 0.26, "learning_rate": 0.000260635697455292, "loss": 0.0198, "step": 101240 }, { "epoch": 0.26, "learning_rate": 0.0002606318092389205, "loss": 0.0223, "step": 101250 }, { "epoch": 0.26, "learning_rate": 0.000260627921022549, "loss": 0.0198, "step": 101260 }, { "epoch": 0.26, "learning_rate": 0.0002606240328061776, "loss": 0.0201, "step": 101270 }, { "epoch": 0.26, "learning_rate": 0.0002606201445898061, "loss": 0.0251, "step": 101280 }, { "epoch": 0.26, "learning_rate": 0.00026061625637343466, "loss": 0.0141, "step": 101290 }, { "epoch": 0.26, "learning_rate": 0.0002606123681570632, "loss": 0.0219, "step": 101300 }, { "epoch": 0.26, "learning_rate": 0.00026060847994069174, "loss": 0.0223, "step": 101310 }, { "epoch": 0.26, "learning_rate": 0.00026060459172432026, "loss": 0.0216, "step": 101320 }, { "epoch": 0.26, "learning_rate": 0.0002606007035079488, "loss": 0.0209, "step": 101330 }, { "epoch": 0.26, "learning_rate": 0.0002605968152915773, "loss": 0.0244, "step": 101340 }, { "epoch": 0.26, "learning_rate": 0.00026059292707520586, "loss": 0.0212, "step": 101350 }, { "epoch": 0.26, "learning_rate": 0.00026058903885883437, "loss": 0.0246, "step": 101360 }, { "epoch": 0.26, "learning_rate": 0.00026058515064246294, "loss": 0.02, "step": 101370 }, { "epoch": 0.26, "learning_rate": 0.00026058126242609145, "loss": 0.0214, "step": 101380 }, { "epoch": 0.26, "learning_rate": 0.00026057737420972, "loss": 0.0216, "step": 101390 }, { "epoch": 0.26, "learning_rate": 0.00026057348599334854, "loss": 0.0249, "step": 101400 }, { "epoch": 0.26, "learning_rate": 0.00026056959777697705, "loss": 0.0288, "step": 101410 }, { "epoch": 0.26, "learning_rate": 0.0002605657095606056, "loss": 0.029, "step": 101420 }, { "epoch": 0.26, "learning_rate": 0.00026056182134423414, "loss": 0.021, "step": 101430 }, { "epoch": 0.26, "learning_rate": 0.0002605579331278627, "loss": 0.0176, "step": 101440 }, { "epoch": 0.26, "learning_rate": 0.0002605540449114912, "loss": 0.0212, "step": 101450 }, { "epoch": 0.26, "learning_rate": 0.00026055015669511973, "loss": 0.019, "step": 101460 }, { "epoch": 0.26, "learning_rate": 0.0002605462684787483, "loss": 0.0265, "step": 101470 }, { "epoch": 0.26, "learning_rate": 0.0002605423802623768, "loss": 0.0243, "step": 101480 }, { "epoch": 0.26, "learning_rate": 0.00026053849204600533, "loss": 0.0266, "step": 101490 }, { "epoch": 0.26, "learning_rate": 0.0002605346038296339, "loss": 0.0262, "step": 101500 }, { "epoch": 0.26, "learning_rate": 0.0002605307156132624, "loss": 0.0278, "step": 101510 }, { "epoch": 0.26, "learning_rate": 0.000260526827396891, "loss": 0.0215, "step": 101520 }, { "epoch": 0.26, "learning_rate": 0.0002605229391805195, "loss": 0.024, "step": 101530 }, { "epoch": 0.26, "learning_rate": 0.000260519050964148, "loss": 0.0204, "step": 101540 }, { "epoch": 0.26, "learning_rate": 0.0002605151627477765, "loss": 0.0228, "step": 101550 }, { "epoch": 0.26, "learning_rate": 0.0002605112745314051, "loss": 0.0247, "step": 101560 }, { "epoch": 0.26, "learning_rate": 0.00026050738631503366, "loss": 0.0179, "step": 101570 }, { "epoch": 0.26, "learning_rate": 0.0002605034980986622, "loss": 0.0184, "step": 101580 }, { "epoch": 0.26, "learning_rate": 0.0002604996098822907, "loss": 0.0192, "step": 101590 }, { "epoch": 0.26, "learning_rate": 0.00026049572166591926, "loss": 0.0194, "step": 101600 }, { "epoch": 0.26, "learning_rate": 0.0002604918334495478, "loss": 0.0202, "step": 101610 }, { "epoch": 0.26, "learning_rate": 0.0002604879452331763, "loss": 0.0197, "step": 101620 }, { "epoch": 0.26, "learning_rate": 0.00026048405701680486, "loss": 0.0195, "step": 101630 }, { "epoch": 0.26, "learning_rate": 0.0002604801688004334, "loss": 0.0209, "step": 101640 }, { "epoch": 0.26, "learning_rate": 0.00026047628058406194, "loss": 0.0172, "step": 101650 }, { "epoch": 0.26, "learning_rate": 0.00026047239236769046, "loss": 0.0262, "step": 101660 }, { "epoch": 0.26, "learning_rate": 0.00026046850415131897, "loss": 0.0229, "step": 101670 }, { "epoch": 0.26, "learning_rate": 0.00026046461593494754, "loss": 0.0266, "step": 101680 }, { "epoch": 0.26, "learning_rate": 0.00026046072771857606, "loss": 0.0252, "step": 101690 }, { "epoch": 0.26, "learning_rate": 0.00026045683950220457, "loss": 0.0202, "step": 101700 }, { "epoch": 0.26, "learning_rate": 0.00026045295128583314, "loss": 0.0222, "step": 101710 }, { "epoch": 0.26, "learning_rate": 0.0002604490630694617, "loss": 0.0185, "step": 101720 }, { "epoch": 0.26, "learning_rate": 0.0002604451748530902, "loss": 0.0232, "step": 101730 }, { "epoch": 0.26, "learning_rate": 0.00026044128663671874, "loss": 0.0213, "step": 101740 }, { "epoch": 0.26, "learning_rate": 0.00026043739842034725, "loss": 0.023, "step": 101750 }, { "epoch": 0.26, "learning_rate": 0.00026043351020397577, "loss": 0.0213, "step": 101760 }, { "epoch": 0.26, "learning_rate": 0.00026042962198760433, "loss": 0.0235, "step": 101770 }, { "epoch": 0.26, "learning_rate": 0.0002604257337712329, "loss": 0.0256, "step": 101780 }, { "epoch": 0.26, "learning_rate": 0.0002604218455548614, "loss": 0.0209, "step": 101790 }, { "epoch": 0.26, "learning_rate": 0.00026041795733848993, "loss": 0.0241, "step": 101800 }, { "epoch": 0.26, "learning_rate": 0.0002604140691221185, "loss": 0.0203, "step": 101810 }, { "epoch": 0.26, "learning_rate": 0.000260410180905747, "loss": 0.026, "step": 101820 }, { "epoch": 0.26, "learning_rate": 0.00026040629268937553, "loss": 0.0194, "step": 101830 }, { "epoch": 0.26, "learning_rate": 0.0002604024044730041, "loss": 0.0298, "step": 101840 }, { "epoch": 0.26, "learning_rate": 0.0002603985162566326, "loss": 0.0223, "step": 101850 }, { "epoch": 0.26, "learning_rate": 0.0002603946280402612, "loss": 0.0252, "step": 101860 }, { "epoch": 0.26, "learning_rate": 0.0002603907398238897, "loss": 0.0211, "step": 101870 }, { "epoch": 0.26, "learning_rate": 0.0002603868516075182, "loss": 0.0221, "step": 101880 }, { "epoch": 0.26, "learning_rate": 0.0002603829633911468, "loss": 0.0239, "step": 101890 }, { "epoch": 0.26, "learning_rate": 0.0002603790751747753, "loss": 0.0209, "step": 101900 }, { "epoch": 0.26, "learning_rate": 0.00026037518695840386, "loss": 0.0233, "step": 101910 }, { "epoch": 0.26, "learning_rate": 0.0002603712987420324, "loss": 0.0232, "step": 101920 }, { "epoch": 0.26, "learning_rate": 0.00026036741052566095, "loss": 0.019, "step": 101930 }, { "epoch": 0.26, "learning_rate": 0.00026036352230928946, "loss": 0.0206, "step": 101940 }, { "epoch": 0.26, "learning_rate": 0.000260359634092918, "loss": 0.0181, "step": 101950 }, { "epoch": 0.26, "learning_rate": 0.0002603557458765465, "loss": 0.0232, "step": 101960 }, { "epoch": 0.26, "learning_rate": 0.00026035185766017506, "loss": 0.0202, "step": 101970 }, { "epoch": 0.26, "learning_rate": 0.0002603479694438036, "loss": 0.0261, "step": 101980 }, { "epoch": 0.26, "learning_rate": 0.00026034408122743214, "loss": 0.0205, "step": 101990 }, { "epoch": 0.26, "learning_rate": 0.00026034019301106066, "loss": 0.0178, "step": 102000 }, { "epoch": 0.26, "eval_cer": 0.8817614710744033, "eval_loss": 0.016096029430627823, "eval_runtime": 108.1492, "eval_samples_per_second": 18.493, "eval_steps_per_second": 4.623, "step": 102000 }, { "epoch": 0.26, "learning_rate": 0.00026033630479468917, "loss": 0.0204, "step": 102010 }, { "epoch": 0.26, "learning_rate": 0.00026033241657831774, "loss": 0.0265, "step": 102020 }, { "epoch": 0.26, "learning_rate": 0.00026032852836194625, "loss": 0.0247, "step": 102030 }, { "epoch": 0.26, "learning_rate": 0.00026032464014557477, "loss": 0.0232, "step": 102040 }, { "epoch": 0.26, "learning_rate": 0.00026032075192920334, "loss": 0.0182, "step": 102050 }, { "epoch": 0.26, "learning_rate": 0.0002603168637128319, "loss": 0.0215, "step": 102060 }, { "epoch": 0.26, "learning_rate": 0.0002603129754964604, "loss": 0.0235, "step": 102070 }, { "epoch": 0.26, "learning_rate": 0.00026030908728008894, "loss": 0.0246, "step": 102080 }, { "epoch": 0.26, "learning_rate": 0.00026030519906371745, "loss": 0.0203, "step": 102090 }, { "epoch": 0.26, "learning_rate": 0.000260301310847346, "loss": 0.0218, "step": 102100 }, { "epoch": 0.26, "learning_rate": 0.00026029742263097453, "loss": 0.0203, "step": 102110 }, { "epoch": 0.26, "learning_rate": 0.0002602935344146031, "loss": 0.0229, "step": 102120 }, { "epoch": 0.26, "learning_rate": 0.0002602896461982316, "loss": 0.0193, "step": 102130 }, { "epoch": 0.26, "learning_rate": 0.0002602857579818602, "loss": 0.0247, "step": 102140 }, { "epoch": 0.26, "learning_rate": 0.0002602818697654887, "loss": 0.0252, "step": 102150 }, { "epoch": 0.26, "learning_rate": 0.0002602779815491172, "loss": 0.018, "step": 102160 }, { "epoch": 0.26, "learning_rate": 0.00026027409333274573, "loss": 0.0245, "step": 102170 }, { "epoch": 0.26, "learning_rate": 0.0002602702051163743, "loss": 0.0187, "step": 102180 }, { "epoch": 0.26, "learning_rate": 0.0002602663169000028, "loss": 0.0228, "step": 102190 }, { "epoch": 0.26, "learning_rate": 0.0002602624286836314, "loss": 0.0218, "step": 102200 }, { "epoch": 0.26, "learning_rate": 0.0002602585404672599, "loss": 0.023, "step": 102210 }, { "epoch": 0.26, "learning_rate": 0.0002602546522508884, "loss": 0.023, "step": 102220 }, { "epoch": 0.26, "learning_rate": 0.000260250764034517, "loss": 0.0262, "step": 102230 }, { "epoch": 0.27, "learning_rate": 0.0002602468758181455, "loss": 0.0173, "step": 102240 }, { "epoch": 0.27, "learning_rate": 0.000260242987601774, "loss": 0.0263, "step": 102250 }, { "epoch": 0.27, "learning_rate": 0.0002602390993854026, "loss": 0.0231, "step": 102260 }, { "epoch": 0.27, "learning_rate": 0.00026023521116903115, "loss": 0.0287, "step": 102270 }, { "epoch": 0.27, "learning_rate": 0.00026023132295265966, "loss": 0.0219, "step": 102280 }, { "epoch": 0.27, "learning_rate": 0.0002602274347362882, "loss": 0.0237, "step": 102290 }, { "epoch": 0.27, "learning_rate": 0.0002602235465199167, "loss": 0.0212, "step": 102300 }, { "epoch": 0.27, "learning_rate": 0.00026021965830354526, "loss": 0.0219, "step": 102310 }, { "epoch": 0.27, "learning_rate": 0.00026021577008717377, "loss": 0.0232, "step": 102320 }, { "epoch": 0.27, "learning_rate": 0.00026021188187080234, "loss": 0.0262, "step": 102330 }, { "epoch": 0.27, "learning_rate": 0.00026020799365443086, "loss": 0.0234, "step": 102340 }, { "epoch": 0.27, "learning_rate": 0.0002602041054380594, "loss": 0.0228, "step": 102350 }, { "epoch": 0.27, "learning_rate": 0.00026020021722168794, "loss": 0.0192, "step": 102360 }, { "epoch": 0.27, "learning_rate": 0.00026019632900531645, "loss": 0.0245, "step": 102370 }, { "epoch": 0.27, "learning_rate": 0.00026019244078894497, "loss": 0.0228, "step": 102380 }, { "epoch": 0.27, "learning_rate": 0.00026018855257257354, "loss": 0.0248, "step": 102390 }, { "epoch": 0.27, "learning_rate": 0.00026018466435620205, "loss": 0.0218, "step": 102400 }, { "epoch": 0.27, "learning_rate": 0.0002601807761398306, "loss": 0.0213, "step": 102410 }, { "epoch": 0.27, "learning_rate": 0.00026017688792345913, "loss": 0.0205, "step": 102420 }, { "epoch": 0.27, "learning_rate": 0.0002601729997070877, "loss": 0.0196, "step": 102430 }, { "epoch": 0.27, "learning_rate": 0.0002601691114907162, "loss": 0.021, "step": 102440 }, { "epoch": 0.27, "learning_rate": 0.00026016522327434473, "loss": 0.0212, "step": 102450 }, { "epoch": 0.27, "learning_rate": 0.0002601613350579733, "loss": 0.024, "step": 102460 }, { "epoch": 0.27, "learning_rate": 0.0002601574468416018, "loss": 0.0204, "step": 102470 }, { "epoch": 0.27, "learning_rate": 0.0002601535586252304, "loss": 0.0252, "step": 102480 }, { "epoch": 0.27, "learning_rate": 0.0002601496704088589, "loss": 0.0236, "step": 102490 }, { "epoch": 0.27, "learning_rate": 0.0002601457821924874, "loss": 0.0225, "step": 102500 }, { "epoch": 0.27, "learning_rate": 0.00026014189397611593, "loss": 0.0265, "step": 102510 }, { "epoch": 0.27, "learning_rate": 0.0002601380057597445, "loss": 0.0227, "step": 102520 }, { "epoch": 0.27, "learning_rate": 0.000260134117543373, "loss": 0.0204, "step": 102530 }, { "epoch": 0.27, "learning_rate": 0.0002601302293270016, "loss": 0.0248, "step": 102540 }, { "epoch": 0.27, "learning_rate": 0.0002601263411106301, "loss": 0.0226, "step": 102550 }, { "epoch": 0.27, "learning_rate": 0.00026012245289425866, "loss": 0.0213, "step": 102560 }, { "epoch": 0.27, "learning_rate": 0.0002601185646778872, "loss": 0.0233, "step": 102570 }, { "epoch": 0.27, "learning_rate": 0.0002601146764615157, "loss": 0.0225, "step": 102580 }, { "epoch": 0.27, "learning_rate": 0.0002601107882451442, "loss": 0.0209, "step": 102590 }, { "epoch": 0.27, "learning_rate": 0.0002601069000287728, "loss": 0.0224, "step": 102600 }, { "epoch": 0.27, "learning_rate": 0.00026010301181240134, "loss": 0.0187, "step": 102610 }, { "epoch": 0.27, "learning_rate": 0.00026009912359602986, "loss": 0.0184, "step": 102620 }, { "epoch": 0.27, "learning_rate": 0.0002600952353796584, "loss": 0.0252, "step": 102630 }, { "epoch": 0.27, "learning_rate": 0.00026009134716328694, "loss": 0.0234, "step": 102640 }, { "epoch": 0.27, "learning_rate": 0.00026008745894691546, "loss": 0.0215, "step": 102650 }, { "epoch": 0.27, "learning_rate": 0.00026008357073054397, "loss": 0.0236, "step": 102660 }, { "epoch": 0.27, "learning_rate": 0.00026007968251417254, "loss": 0.0207, "step": 102670 }, { "epoch": 0.27, "learning_rate": 0.00026007579429780105, "loss": 0.0205, "step": 102680 }, { "epoch": 0.27, "learning_rate": 0.0002600719060814296, "loss": 0.0192, "step": 102690 }, { "epoch": 0.27, "learning_rate": 0.00026006801786505814, "loss": 0.0207, "step": 102700 }, { "epoch": 0.27, "learning_rate": 0.00026006412964868665, "loss": 0.038, "step": 102710 }, { "epoch": 0.27, "learning_rate": 0.00026006024143231517, "loss": 0.0287, "step": 102720 }, { "epoch": 0.27, "learning_rate": 0.00026005635321594374, "loss": 0.0215, "step": 102730 }, { "epoch": 0.27, "learning_rate": 0.00026005246499957225, "loss": 0.0255, "step": 102740 }, { "epoch": 0.27, "learning_rate": 0.0002600485767832008, "loss": 0.0299, "step": 102750 }, { "epoch": 0.27, "learning_rate": 0.00026004468856682933, "loss": 0.0219, "step": 102760 }, { "epoch": 0.27, "learning_rate": 0.0002600408003504579, "loss": 0.0325, "step": 102770 }, { "epoch": 0.27, "learning_rate": 0.0002600369121340864, "loss": 0.0274, "step": 102780 }, { "epoch": 0.27, "learning_rate": 0.00026003302391771493, "loss": 0.0242, "step": 102790 }, { "epoch": 0.27, "learning_rate": 0.00026002913570134345, "loss": 0.0253, "step": 102800 }, { "epoch": 0.27, "learning_rate": 0.000260025247484972, "loss": 0.0203, "step": 102810 }, { "epoch": 0.27, "learning_rate": 0.0002600213592686006, "loss": 0.023, "step": 102820 }, { "epoch": 0.27, "learning_rate": 0.0002600174710522291, "loss": 0.0176, "step": 102830 }, { "epoch": 0.27, "learning_rate": 0.0002600135828358576, "loss": 0.0224, "step": 102840 }, { "epoch": 0.27, "learning_rate": 0.0002600096946194862, "loss": 0.0232, "step": 102850 }, { "epoch": 0.27, "learning_rate": 0.0002600058064031147, "loss": 0.0216, "step": 102860 }, { "epoch": 0.27, "learning_rate": 0.0002600019181867432, "loss": 0.0218, "step": 102870 }, { "epoch": 0.27, "learning_rate": 0.0002599980299703718, "loss": 0.0226, "step": 102880 }, { "epoch": 0.27, "learning_rate": 0.0002599941417540003, "loss": 0.0242, "step": 102890 }, { "epoch": 0.27, "learning_rate": 0.00025999025353762886, "loss": 0.023, "step": 102900 }, { "epoch": 0.27, "learning_rate": 0.0002599863653212574, "loss": 0.0215, "step": 102910 }, { "epoch": 0.27, "learning_rate": 0.0002599824771048859, "loss": 0.0189, "step": 102920 }, { "epoch": 0.27, "learning_rate": 0.00025997858888851446, "loss": 0.0189, "step": 102930 }, { "epoch": 0.27, "learning_rate": 0.000259974700672143, "loss": 0.0222, "step": 102940 }, { "epoch": 0.27, "learning_rate": 0.0002599708124557715, "loss": 0.026, "step": 102950 }, { "epoch": 0.27, "learning_rate": 0.00025996692423940006, "loss": 0.0221, "step": 102960 }, { "epoch": 0.27, "learning_rate": 0.00025996303602302857, "loss": 0.0236, "step": 102970 }, { "epoch": 0.27, "learning_rate": 0.00025995914780665714, "loss": 0.0222, "step": 102980 }, { "epoch": 0.27, "learning_rate": 0.00025995525959028566, "loss": 0.0254, "step": 102990 }, { "epoch": 0.27, "learning_rate": 0.00025995137137391417, "loss": 0.0274, "step": 103000 }, { "epoch": 0.27, "eval_cer": 0.8817922630869552, "eval_loss": 0.01607452891767025, "eval_runtime": 108.0632, "eval_samples_per_second": 18.508, "eval_steps_per_second": 4.627, "step": 103000 }, { "epoch": 0.27, "learning_rate": 0.00025994748315754274, "loss": 0.0228, "step": 103010 }, { "epoch": 0.27, "learning_rate": 0.00025994359494117125, "loss": 0.0228, "step": 103020 }, { "epoch": 0.27, "learning_rate": 0.0002599397067247998, "loss": 0.0239, "step": 103030 }, { "epoch": 0.27, "learning_rate": 0.00025993581850842834, "loss": 0.0223, "step": 103040 }, { "epoch": 0.27, "learning_rate": 0.00025993193029205685, "loss": 0.0216, "step": 103050 }, { "epoch": 0.27, "learning_rate": 0.0002599280420756854, "loss": 0.0254, "step": 103060 }, { "epoch": 0.27, "learning_rate": 0.00025992415385931393, "loss": 0.0222, "step": 103070 }, { "epoch": 0.27, "learning_rate": 0.00025992026564294245, "loss": 0.0226, "step": 103080 }, { "epoch": 0.27, "learning_rate": 0.000259916377426571, "loss": 0.0283, "step": 103090 }, { "epoch": 0.27, "learning_rate": 0.00025991248921019953, "loss": 0.0223, "step": 103100 }, { "epoch": 0.27, "learning_rate": 0.0002599086009938281, "loss": 0.0225, "step": 103110 }, { "epoch": 0.27, "learning_rate": 0.0002599047127774566, "loss": 0.0225, "step": 103120 }, { "epoch": 0.27, "learning_rate": 0.00025990082456108513, "loss": 0.0256, "step": 103130 }, { "epoch": 0.27, "learning_rate": 0.0002598969363447137, "loss": 0.0211, "step": 103140 }, { "epoch": 0.27, "learning_rate": 0.0002598930481283422, "loss": 0.0195, "step": 103150 }, { "epoch": 0.27, "learning_rate": 0.0002598891599119708, "loss": 0.024, "step": 103160 }, { "epoch": 0.27, "learning_rate": 0.0002598852716955993, "loss": 0.0273, "step": 103170 }, { "epoch": 0.27, "learning_rate": 0.00025988138347922787, "loss": 0.0194, "step": 103180 }, { "epoch": 0.27, "learning_rate": 0.0002598774952628564, "loss": 0.025, "step": 103190 }, { "epoch": 0.27, "learning_rate": 0.0002598736070464849, "loss": 0.0207, "step": 103200 }, { "epoch": 0.27, "learning_rate": 0.0002598697188301134, "loss": 0.0245, "step": 103210 }, { "epoch": 0.27, "learning_rate": 0.000259865830613742, "loss": 0.0213, "step": 103220 }, { "epoch": 0.27, "learning_rate": 0.0002598619423973705, "loss": 0.0222, "step": 103230 }, { "epoch": 0.27, "learning_rate": 0.00025985805418099906, "loss": 0.0201, "step": 103240 }, { "epoch": 0.27, "learning_rate": 0.0002598541659646276, "loss": 0.0252, "step": 103250 }, { "epoch": 0.27, "learning_rate": 0.0002598502777482561, "loss": 0.0311, "step": 103260 }, { "epoch": 0.27, "learning_rate": 0.00025984638953188466, "loss": 0.0249, "step": 103270 }, { "epoch": 0.27, "learning_rate": 0.0002598425013155132, "loss": 0.0222, "step": 103280 }, { "epoch": 0.27, "learning_rate": 0.0002598386130991417, "loss": 0.0226, "step": 103290 }, { "epoch": 0.27, "learning_rate": 0.00025983472488277026, "loss": 0.0213, "step": 103300 }, { "epoch": 0.27, "learning_rate": 0.0002598308366663988, "loss": 0.0233, "step": 103310 }, { "epoch": 0.27, "learning_rate": 0.00025982694845002734, "loss": 0.023, "step": 103320 }, { "epoch": 0.27, "learning_rate": 0.00025982306023365585, "loss": 0.0206, "step": 103330 }, { "epoch": 0.27, "learning_rate": 0.00025981917201728437, "loss": 0.0207, "step": 103340 }, { "epoch": 0.27, "learning_rate": 0.00025981528380091294, "loss": 0.0251, "step": 103350 }, { "epoch": 0.27, "learning_rate": 0.00025981139558454145, "loss": 0.0238, "step": 103360 }, { "epoch": 0.27, "learning_rate": 0.00025980750736817, "loss": 0.0199, "step": 103370 }, { "epoch": 0.27, "learning_rate": 0.00025980361915179854, "loss": 0.0233, "step": 103380 }, { "epoch": 0.27, "learning_rate": 0.0002597997309354271, "loss": 0.0244, "step": 103390 }, { "epoch": 0.27, "learning_rate": 0.0002597958427190556, "loss": 0.0286, "step": 103400 }, { "epoch": 0.27, "learning_rate": 0.00025979195450268413, "loss": 0.0271, "step": 103410 }, { "epoch": 0.27, "learning_rate": 0.00025978806628631265, "loss": 0.0238, "step": 103420 }, { "epoch": 0.27, "learning_rate": 0.0002597841780699412, "loss": 0.0216, "step": 103430 }, { "epoch": 0.27, "learning_rate": 0.00025978028985356973, "loss": 0.0199, "step": 103440 }, { "epoch": 0.27, "learning_rate": 0.0002597764016371983, "loss": 0.0258, "step": 103450 }, { "epoch": 0.27, "learning_rate": 0.0002597725134208268, "loss": 0.0259, "step": 103460 }, { "epoch": 0.27, "learning_rate": 0.00025976862520445533, "loss": 0.019, "step": 103470 }, { "epoch": 0.27, "learning_rate": 0.0002597647369880839, "loss": 0.0189, "step": 103480 }, { "epoch": 0.27, "learning_rate": 0.0002597608487717124, "loss": 0.025, "step": 103490 }, { "epoch": 0.27, "learning_rate": 0.000259756960555341, "loss": 0.0208, "step": 103500 }, { "epoch": 0.27, "learning_rate": 0.0002597530723389695, "loss": 0.0244, "step": 103510 }, { "epoch": 0.27, "learning_rate": 0.00025974918412259806, "loss": 0.0229, "step": 103520 }, { "epoch": 0.27, "learning_rate": 0.0002597452959062266, "loss": 0.0199, "step": 103530 }, { "epoch": 0.27, "learning_rate": 0.0002597414076898551, "loss": 0.0228, "step": 103540 }, { "epoch": 0.27, "learning_rate": 0.0002597375194734836, "loss": 0.0211, "step": 103550 }, { "epoch": 0.27, "learning_rate": 0.0002597336312571122, "loss": 0.0234, "step": 103560 }, { "epoch": 0.27, "learning_rate": 0.0002597297430407407, "loss": 0.025, "step": 103570 }, { "epoch": 0.27, "learning_rate": 0.00025972585482436926, "loss": 0.0225, "step": 103580 }, { "epoch": 0.27, "learning_rate": 0.0002597219666079978, "loss": 0.0224, "step": 103590 }, { "epoch": 0.27, "learning_rate": 0.00025971807839162634, "loss": 0.0223, "step": 103600 }, { "epoch": 0.27, "learning_rate": 0.00025971419017525486, "loss": 0.0231, "step": 103610 }, { "epoch": 0.27, "learning_rate": 0.00025971030195888337, "loss": 0.0224, "step": 103620 }, { "epoch": 0.27, "learning_rate": 0.0002597064137425119, "loss": 0.0183, "step": 103630 }, { "epoch": 0.27, "learning_rate": 0.00025970252552614046, "loss": 0.023, "step": 103640 }, { "epoch": 0.27, "learning_rate": 0.000259698637309769, "loss": 0.0193, "step": 103650 }, { "epoch": 0.27, "learning_rate": 0.00025969474909339754, "loss": 0.0231, "step": 103660 }, { "epoch": 0.27, "learning_rate": 0.00025969086087702605, "loss": 0.0204, "step": 103670 }, { "epoch": 0.27, "learning_rate": 0.0002596869726606546, "loss": 0.0194, "step": 103680 }, { "epoch": 0.27, "learning_rate": 0.00025968308444428314, "loss": 0.0245, "step": 103690 }, { "epoch": 0.27, "learning_rate": 0.00025967919622791165, "loss": 0.0229, "step": 103700 }, { "epoch": 0.27, "learning_rate": 0.0002596753080115402, "loss": 0.0213, "step": 103710 }, { "epoch": 0.27, "learning_rate": 0.00025967141979516873, "loss": 0.0242, "step": 103720 }, { "epoch": 0.27, "learning_rate": 0.0002596675315787973, "loss": 0.0221, "step": 103730 }, { "epoch": 0.27, "learning_rate": 0.0002596636433624258, "loss": 0.0292, "step": 103740 }, { "epoch": 0.27, "learning_rate": 0.00025965975514605433, "loss": 0.0289, "step": 103750 }, { "epoch": 0.27, "learning_rate": 0.00025965586692968285, "loss": 0.0242, "step": 103760 }, { "epoch": 0.27, "learning_rate": 0.0002596519787133114, "loss": 0.0205, "step": 103770 }, { "epoch": 0.27, "learning_rate": 0.00025964809049693993, "loss": 0.0193, "step": 103780 }, { "epoch": 0.27, "learning_rate": 0.0002596442022805685, "loss": 0.0229, "step": 103790 }, { "epoch": 0.27, "learning_rate": 0.000259640314064197, "loss": 0.0211, "step": 103800 }, { "epoch": 0.27, "learning_rate": 0.0002596364258478256, "loss": 0.0227, "step": 103810 }, { "epoch": 0.27, "learning_rate": 0.0002596325376314541, "loss": 0.0283, "step": 103820 }, { "epoch": 0.27, "learning_rate": 0.0002596286494150826, "loss": 0.02, "step": 103830 }, { "epoch": 0.27, "learning_rate": 0.0002596247611987111, "loss": 0.0248, "step": 103840 }, { "epoch": 0.27, "learning_rate": 0.0002596208729823397, "loss": 0.022, "step": 103850 }, { "epoch": 0.27, "learning_rate": 0.00025961698476596826, "loss": 0.026, "step": 103860 }, { "epoch": 0.27, "learning_rate": 0.0002596130965495968, "loss": 0.0227, "step": 103870 }, { "epoch": 0.27, "learning_rate": 0.0002596092083332253, "loss": 0.0201, "step": 103880 }, { "epoch": 0.27, "learning_rate": 0.00025960532011685386, "loss": 0.0211, "step": 103890 }, { "epoch": 0.27, "learning_rate": 0.0002596014319004824, "loss": 0.0245, "step": 103900 }, { "epoch": 0.27, "learning_rate": 0.0002595975436841109, "loss": 0.0263, "step": 103910 }, { "epoch": 0.27, "learning_rate": 0.00025959365546773946, "loss": 0.0287, "step": 103920 }, { "epoch": 0.27, "learning_rate": 0.000259589767251368, "loss": 0.0211, "step": 103930 }, { "epoch": 0.27, "learning_rate": 0.00025958587903499654, "loss": 0.0261, "step": 103940 }, { "epoch": 0.27, "learning_rate": 0.00025958199081862506, "loss": 0.022, "step": 103950 }, { "epoch": 0.27, "learning_rate": 0.00025957810260225357, "loss": 0.0207, "step": 103960 }, { "epoch": 0.27, "learning_rate": 0.0002595742143858821, "loss": 0.0229, "step": 103970 }, { "epoch": 0.27, "learning_rate": 0.00025957032616951065, "loss": 0.0238, "step": 103980 }, { "epoch": 0.27, "learning_rate": 0.00025956643795313917, "loss": 0.0224, "step": 103990 }, { "epoch": 0.27, "learning_rate": 0.00025956254973676774, "loss": 0.0207, "step": 104000 }, { "epoch": 0.27, "eval_cer": 0.8818706427552693, "eval_loss": 0.01605622097849846, "eval_runtime": 108.0768, "eval_samples_per_second": 18.505, "eval_steps_per_second": 4.626, "step": 104000 }, { "epoch": 0.27, "learning_rate": 0.00025955866152039625, "loss": 0.0184, "step": 104010 }, { "epoch": 0.27, "learning_rate": 0.0002595547733040248, "loss": 0.0211, "step": 104020 }, { "epoch": 0.27, "learning_rate": 0.00025955088508765334, "loss": 0.0221, "step": 104030 }, { "epoch": 0.27, "learning_rate": 0.00025954699687128185, "loss": 0.0233, "step": 104040 }, { "epoch": 0.27, "learning_rate": 0.0002595431086549104, "loss": 0.0246, "step": 104050 }, { "epoch": 0.27, "learning_rate": 0.00025953922043853893, "loss": 0.0202, "step": 104060 }, { "epoch": 0.27, "learning_rate": 0.0002595353322221675, "loss": 0.028, "step": 104070 }, { "epoch": 0.27, "learning_rate": 0.000259531444005796, "loss": 0.0202, "step": 104080 }, { "epoch": 0.27, "learning_rate": 0.00025952755578942453, "loss": 0.0262, "step": 104090 }, { "epoch": 0.27, "learning_rate": 0.0002595236675730531, "loss": 0.0242, "step": 104100 }, { "epoch": 0.27, "learning_rate": 0.0002595197793566816, "loss": 0.0228, "step": 104110 }, { "epoch": 0.27, "learning_rate": 0.00025951589114031013, "loss": 0.0226, "step": 104120 }, { "epoch": 0.27, "learning_rate": 0.0002595120029239387, "loss": 0.0183, "step": 104130 }, { "epoch": 0.27, "learning_rate": 0.0002595081147075672, "loss": 0.0297, "step": 104140 }, { "epoch": 0.27, "learning_rate": 0.0002595042264911958, "loss": 0.0289, "step": 104150 }, { "epoch": 0.27, "learning_rate": 0.0002595003382748243, "loss": 0.0192, "step": 104160 }, { "epoch": 0.27, "learning_rate": 0.0002594964500584528, "loss": 0.0206, "step": 104170 }, { "epoch": 0.27, "learning_rate": 0.0002594925618420814, "loss": 0.0242, "step": 104180 }, { "epoch": 0.27, "learning_rate": 0.0002594886736257099, "loss": 0.0188, "step": 104190 }, { "epoch": 0.27, "learning_rate": 0.00025948478540933846, "loss": 0.0211, "step": 104200 }, { "epoch": 0.27, "learning_rate": 0.000259480897192967, "loss": 0.0196, "step": 104210 }, { "epoch": 0.27, "learning_rate": 0.0002594770089765955, "loss": 0.0242, "step": 104220 }, { "epoch": 0.27, "learning_rate": 0.00025947312076022406, "loss": 0.0237, "step": 104230 }, { "epoch": 0.27, "learning_rate": 0.0002594692325438526, "loss": 0.0244, "step": 104240 }, { "epoch": 0.27, "learning_rate": 0.0002594653443274811, "loss": 0.0178, "step": 104250 }, { "epoch": 0.27, "learning_rate": 0.00025946145611110966, "loss": 0.0218, "step": 104260 }, { "epoch": 0.27, "learning_rate": 0.00025945756789473817, "loss": 0.0218, "step": 104270 }, { "epoch": 0.27, "learning_rate": 0.00025945367967836674, "loss": 0.0248, "step": 104280 }, { "epoch": 0.27, "learning_rate": 0.00025944979146199526, "loss": 0.0276, "step": 104290 }, { "epoch": 0.27, "learning_rate": 0.00025944590324562377, "loss": 0.021, "step": 104300 }, { "epoch": 0.27, "learning_rate": 0.00025944201502925234, "loss": 0.026, "step": 104310 }, { "epoch": 0.27, "learning_rate": 0.00025943812681288085, "loss": 0.0212, "step": 104320 }, { "epoch": 0.27, "learning_rate": 0.00025943423859650937, "loss": 0.022, "step": 104330 }, { "epoch": 0.27, "learning_rate": 0.00025943035038013794, "loss": 0.0201, "step": 104340 }, { "epoch": 0.27, "learning_rate": 0.0002594264621637665, "loss": 0.0268, "step": 104350 }, { "epoch": 0.27, "learning_rate": 0.000259422573947395, "loss": 0.0214, "step": 104360 }, { "epoch": 0.27, "learning_rate": 0.00025941868573102353, "loss": 0.0221, "step": 104370 }, { "epoch": 0.27, "learning_rate": 0.00025941479751465205, "loss": 0.0212, "step": 104380 }, { "epoch": 0.27, "learning_rate": 0.0002594109092982806, "loss": 0.0234, "step": 104390 }, { "epoch": 0.27, "learning_rate": 0.00025940702108190913, "loss": 0.0228, "step": 104400 }, { "epoch": 0.27, "learning_rate": 0.0002594031328655377, "loss": 0.021, "step": 104410 }, { "epoch": 0.27, "learning_rate": 0.0002593992446491662, "loss": 0.0208, "step": 104420 }, { "epoch": 0.27, "learning_rate": 0.0002593953564327948, "loss": 0.0237, "step": 104430 }, { "epoch": 0.27, "learning_rate": 0.0002593914682164233, "loss": 0.0283, "step": 104440 }, { "epoch": 0.27, "learning_rate": 0.0002593875800000518, "loss": 0.0163, "step": 104450 }, { "epoch": 0.27, "learning_rate": 0.00025938369178368033, "loss": 0.0202, "step": 104460 }, { "epoch": 0.27, "learning_rate": 0.0002593798035673089, "loss": 0.0197, "step": 104470 }, { "epoch": 0.27, "learning_rate": 0.0002593759153509374, "loss": 0.0176, "step": 104480 }, { "epoch": 0.27, "learning_rate": 0.000259372027134566, "loss": 0.0226, "step": 104490 }, { "epoch": 0.27, "learning_rate": 0.0002593681389181945, "loss": 0.019, "step": 104500 }, { "epoch": 0.27, "learning_rate": 0.000259364250701823, "loss": 0.0245, "step": 104510 }, { "epoch": 0.27, "learning_rate": 0.0002593603624854516, "loss": 0.0179, "step": 104520 }, { "epoch": 0.27, "learning_rate": 0.0002593564742690801, "loss": 0.0228, "step": 104530 }, { "epoch": 0.27, "learning_rate": 0.0002593525860527086, "loss": 0.0245, "step": 104540 }, { "epoch": 0.27, "learning_rate": 0.0002593486978363372, "loss": 0.0224, "step": 104550 }, { "epoch": 0.27, "learning_rate": 0.00025934480961996574, "loss": 0.018, "step": 104560 }, { "epoch": 0.27, "learning_rate": 0.00025934092140359426, "loss": 0.0235, "step": 104570 }, { "epoch": 0.27, "learning_rate": 0.0002593370331872228, "loss": 0.0226, "step": 104580 }, { "epoch": 0.27, "learning_rate": 0.0002593331449708513, "loss": 0.0219, "step": 104590 }, { "epoch": 0.27, "learning_rate": 0.00025932925675447986, "loss": 0.0183, "step": 104600 }, { "epoch": 0.27, "learning_rate": 0.00025932536853810837, "loss": 0.0246, "step": 104610 }, { "epoch": 0.27, "learning_rate": 0.00025932148032173694, "loss": 0.0213, "step": 104620 }, { "epoch": 0.27, "learning_rate": 0.00025931759210536545, "loss": 0.022, "step": 104630 }, { "epoch": 0.27, "learning_rate": 0.000259313703888994, "loss": 0.0248, "step": 104640 }, { "epoch": 0.27, "learning_rate": 0.00025930981567262254, "loss": 0.0233, "step": 104650 }, { "epoch": 0.27, "learning_rate": 0.00025930592745625105, "loss": 0.0218, "step": 104660 }, { "epoch": 0.27, "learning_rate": 0.00025930203923987957, "loss": 0.0231, "step": 104670 }, { "epoch": 0.27, "learning_rate": 0.00025929815102350814, "loss": 0.0208, "step": 104680 }, { "epoch": 0.27, "learning_rate": 0.00025929426280713665, "loss": 0.0179, "step": 104690 }, { "epoch": 0.27, "learning_rate": 0.0002592903745907652, "loss": 0.022, "step": 104700 }, { "epoch": 0.27, "learning_rate": 0.00025928648637439373, "loss": 0.0231, "step": 104710 }, { "epoch": 0.27, "learning_rate": 0.00025928259815802225, "loss": 0.0225, "step": 104720 }, { "epoch": 0.27, "learning_rate": 0.0002592787099416508, "loss": 0.0278, "step": 104730 }, { "epoch": 0.27, "learning_rate": 0.00025927482172527933, "loss": 0.0204, "step": 104740 }, { "epoch": 0.27, "learning_rate": 0.0002592709335089079, "loss": 0.0194, "step": 104750 }, { "epoch": 0.27, "learning_rate": 0.0002592670452925364, "loss": 0.0254, "step": 104760 }, { "epoch": 0.27, "learning_rate": 0.000259263157076165, "loss": 0.0322, "step": 104770 }, { "epoch": 0.27, "learning_rate": 0.0002592592688597935, "loss": 0.0241, "step": 104780 }, { "epoch": 0.27, "learning_rate": 0.000259255380643422, "loss": 0.02, "step": 104790 }, { "epoch": 0.27, "learning_rate": 0.0002592514924270505, "loss": 0.0224, "step": 104800 }, { "epoch": 0.27, "learning_rate": 0.0002592476042106791, "loss": 0.025, "step": 104810 }, { "epoch": 0.27, "learning_rate": 0.0002592437159943076, "loss": 0.025, "step": 104820 }, { "epoch": 0.27, "learning_rate": 0.0002592398277779362, "loss": 0.0223, "step": 104830 }, { "epoch": 0.27, "learning_rate": 0.0002592359395615647, "loss": 0.0234, "step": 104840 }, { "epoch": 0.27, "learning_rate": 0.00025923205134519326, "loss": 0.019, "step": 104850 }, { "epoch": 0.27, "learning_rate": 0.0002592281631288218, "loss": 0.0263, "step": 104860 }, { "epoch": 0.27, "learning_rate": 0.0002592242749124503, "loss": 0.0286, "step": 104870 }, { "epoch": 0.27, "learning_rate": 0.0002592203866960788, "loss": 0.0264, "step": 104880 }, { "epoch": 0.27, "learning_rate": 0.0002592164984797074, "loss": 0.0244, "step": 104890 }, { "epoch": 0.27, "learning_rate": 0.00025921261026333594, "loss": 0.0249, "step": 104900 }, { "epoch": 0.27, "learning_rate": 0.00025920872204696446, "loss": 0.0239, "step": 104910 }, { "epoch": 0.27, "learning_rate": 0.00025920483383059297, "loss": 0.0215, "step": 104920 }, { "epoch": 0.27, "learning_rate": 0.00025920094561422154, "loss": 0.0195, "step": 104930 }, { "epoch": 0.27, "learning_rate": 0.00025919705739785006, "loss": 0.0241, "step": 104940 }, { "epoch": 0.27, "learning_rate": 0.00025919316918147857, "loss": 0.0228, "step": 104950 }, { "epoch": 0.27, "learning_rate": 0.00025918928096510714, "loss": 0.0248, "step": 104960 }, { "epoch": 0.27, "learning_rate": 0.00025918539274873565, "loss": 0.0211, "step": 104970 }, { "epoch": 0.27, "learning_rate": 0.0002591815045323642, "loss": 0.0212, "step": 104980 }, { "epoch": 0.27, "learning_rate": 0.00025917761631599274, "loss": 0.0263, "step": 104990 }, { "epoch": 0.27, "learning_rate": 0.00025917372809962125, "loss": 0.029, "step": 105000 }, { "epoch": 0.27, "eval_cer": 0.8818118580040337, "eval_loss": 0.01607823558151722, "eval_runtime": 108.0567, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 105000 }, { "epoch": 0.27, "learning_rate": 0.00025916983988324977, "loss": 0.0226, "step": 105010 }, { "epoch": 0.27, "learning_rate": 0.00025916595166687833, "loss": 0.0231, "step": 105020 }, { "epoch": 0.27, "learning_rate": 0.00025916206345050685, "loss": 0.0302, "step": 105030 }, { "epoch": 0.27, "learning_rate": 0.0002591581752341354, "loss": 0.02, "step": 105040 }, { "epoch": 0.27, "learning_rate": 0.00025915428701776393, "loss": 0.0235, "step": 105050 }, { "epoch": 0.27, "learning_rate": 0.0002591503988013925, "loss": 0.0243, "step": 105060 }, { "epoch": 0.27, "learning_rate": 0.000259146510585021, "loss": 0.0219, "step": 105070 }, { "epoch": 0.27, "learning_rate": 0.00025914262236864953, "loss": 0.0244, "step": 105080 }, { "epoch": 0.27, "learning_rate": 0.00025913873415227804, "loss": 0.0231, "step": 105090 }, { "epoch": 0.27, "learning_rate": 0.0002591348459359066, "loss": 0.0244, "step": 105100 }, { "epoch": 0.27, "learning_rate": 0.0002591309577195352, "loss": 0.0199, "step": 105110 }, { "epoch": 0.27, "learning_rate": 0.0002591270695031637, "loss": 0.0269, "step": 105120 }, { "epoch": 0.27, "learning_rate": 0.0002591231812867922, "loss": 0.0225, "step": 105130 }, { "epoch": 0.27, "learning_rate": 0.0002591192930704208, "loss": 0.0226, "step": 105140 }, { "epoch": 0.27, "learning_rate": 0.0002591154048540493, "loss": 0.0216, "step": 105150 }, { "epoch": 0.27, "learning_rate": 0.0002591115166376778, "loss": 0.0258, "step": 105160 }, { "epoch": 0.27, "learning_rate": 0.0002591076284213064, "loss": 0.0206, "step": 105170 }, { "epoch": 0.27, "learning_rate": 0.0002591037402049349, "loss": 0.0167, "step": 105180 }, { "epoch": 0.27, "learning_rate": 0.00025909985198856346, "loss": 0.0209, "step": 105190 }, { "epoch": 0.27, "learning_rate": 0.000259095963772192, "loss": 0.0213, "step": 105200 }, { "epoch": 0.27, "learning_rate": 0.0002590920755558205, "loss": 0.0249, "step": 105210 }, { "epoch": 0.27, "learning_rate": 0.000259088187339449, "loss": 0.0194, "step": 105220 }, { "epoch": 0.27, "learning_rate": 0.0002590842991230776, "loss": 0.021, "step": 105230 }, { "epoch": 0.27, "learning_rate": 0.00025908041090670614, "loss": 0.0155, "step": 105240 }, { "epoch": 0.27, "learning_rate": 0.00025907652269033466, "loss": 0.0196, "step": 105250 }, { "epoch": 0.27, "learning_rate": 0.00025907263447396317, "loss": 0.0219, "step": 105260 }, { "epoch": 0.27, "learning_rate": 0.00025906874625759174, "loss": 0.0184, "step": 105270 }, { "epoch": 0.27, "learning_rate": 0.00025906485804122025, "loss": 0.0233, "step": 105280 }, { "epoch": 0.27, "learning_rate": 0.00025906096982484877, "loss": 0.027, "step": 105290 }, { "epoch": 0.27, "learning_rate": 0.00025905708160847734, "loss": 0.0251, "step": 105300 }, { "epoch": 0.27, "learning_rate": 0.00025905319339210585, "loss": 0.0178, "step": 105310 }, { "epoch": 0.27, "learning_rate": 0.0002590493051757344, "loss": 0.0208, "step": 105320 }, { "epoch": 0.27, "learning_rate": 0.00025904541695936294, "loss": 0.0249, "step": 105330 }, { "epoch": 0.27, "learning_rate": 0.00025904152874299145, "loss": 0.0219, "step": 105340 }, { "epoch": 0.27, "learning_rate": 0.00025903764052662, "loss": 0.0226, "step": 105350 }, { "epoch": 0.27, "learning_rate": 0.00025903375231024853, "loss": 0.0244, "step": 105360 }, { "epoch": 0.27, "learning_rate": 0.00025902986409387705, "loss": 0.0237, "step": 105370 }, { "epoch": 0.27, "learning_rate": 0.0002590259758775056, "loss": 0.0231, "step": 105380 }, { "epoch": 0.27, "learning_rate": 0.0002590220876611342, "loss": 0.0243, "step": 105390 }, { "epoch": 0.27, "learning_rate": 0.0002590181994447627, "loss": 0.0205, "step": 105400 }, { "epoch": 0.27, "learning_rate": 0.0002590143112283912, "loss": 0.023, "step": 105410 }, { "epoch": 0.27, "learning_rate": 0.00025901042301201973, "loss": 0.022, "step": 105420 }, { "epoch": 0.27, "learning_rate": 0.0002590065347956483, "loss": 0.0213, "step": 105430 }, { "epoch": 0.27, "learning_rate": 0.0002590026465792768, "loss": 0.0218, "step": 105440 }, { "epoch": 0.27, "learning_rate": 0.0002589987583629054, "loss": 0.0167, "step": 105450 }, { "epoch": 0.27, "learning_rate": 0.0002589948701465339, "loss": 0.0178, "step": 105460 }, { "epoch": 0.27, "learning_rate": 0.0002589909819301624, "loss": 0.0212, "step": 105470 }, { "epoch": 0.27, "learning_rate": 0.000258987093713791, "loss": 0.0242, "step": 105480 }, { "epoch": 0.27, "learning_rate": 0.0002589832054974195, "loss": 0.0238, "step": 105490 }, { "epoch": 0.27, "learning_rate": 0.000258979317281048, "loss": 0.0201, "step": 105500 }, { "epoch": 0.27, "learning_rate": 0.0002589754290646766, "loss": 0.0201, "step": 105510 }, { "epoch": 0.27, "learning_rate": 0.0002589715408483051, "loss": 0.0261, "step": 105520 }, { "epoch": 0.27, "learning_rate": 0.00025896765263193366, "loss": 0.0201, "step": 105530 }, { "epoch": 0.27, "learning_rate": 0.0002589637644155622, "loss": 0.02, "step": 105540 }, { "epoch": 0.27, "learning_rate": 0.0002589598761991907, "loss": 0.0218, "step": 105550 }, { "epoch": 0.27, "learning_rate": 0.00025895598798281926, "loss": 0.0228, "step": 105560 }, { "epoch": 0.27, "learning_rate": 0.00025895209976644777, "loss": 0.0232, "step": 105570 }, { "epoch": 0.27, "learning_rate": 0.0002589482115500763, "loss": 0.0205, "step": 105580 }, { "epoch": 0.27, "learning_rate": 0.00025894432333370486, "loss": 0.0214, "step": 105590 }, { "epoch": 0.27, "learning_rate": 0.0002589404351173334, "loss": 0.0217, "step": 105600 }, { "epoch": 0.27, "learning_rate": 0.00025893654690096194, "loss": 0.0203, "step": 105610 }, { "epoch": 0.27, "learning_rate": 0.00025893265868459045, "loss": 0.0192, "step": 105620 }, { "epoch": 0.27, "learning_rate": 0.00025892877046821897, "loss": 0.0302, "step": 105630 }, { "epoch": 0.27, "learning_rate": 0.00025892488225184754, "loss": 0.0219, "step": 105640 }, { "epoch": 0.27, "learning_rate": 0.00025892099403547605, "loss": 0.0284, "step": 105650 }, { "epoch": 0.27, "learning_rate": 0.0002589171058191046, "loss": 0.0227, "step": 105660 }, { "epoch": 0.27, "learning_rate": 0.00025891321760273313, "loss": 0.0287, "step": 105670 }, { "epoch": 0.27, "learning_rate": 0.0002589093293863617, "loss": 0.0239, "step": 105680 }, { "epoch": 0.27, "learning_rate": 0.0002589054411699902, "loss": 0.0215, "step": 105690 }, { "epoch": 0.27, "learning_rate": 0.00025890155295361873, "loss": 0.0226, "step": 105700 }, { "epoch": 0.27, "learning_rate": 0.00025889766473724725, "loss": 0.0244, "step": 105710 }, { "epoch": 0.27, "learning_rate": 0.0002588937765208758, "loss": 0.024, "step": 105720 }, { "epoch": 0.27, "learning_rate": 0.00025888988830450433, "loss": 0.0263, "step": 105730 }, { "epoch": 0.27, "learning_rate": 0.0002588860000881329, "loss": 0.0243, "step": 105740 }, { "epoch": 0.27, "learning_rate": 0.0002588821118717614, "loss": 0.0243, "step": 105750 }, { "epoch": 0.27, "learning_rate": 0.00025887822365538993, "loss": 0.0187, "step": 105760 }, { "epoch": 0.27, "learning_rate": 0.0002588743354390185, "loss": 0.0284, "step": 105770 }, { "epoch": 0.27, "learning_rate": 0.000258870447222647, "loss": 0.0211, "step": 105780 }, { "epoch": 0.27, "learning_rate": 0.0002588665590062756, "loss": 0.0202, "step": 105790 }, { "epoch": 0.27, "learning_rate": 0.0002588626707899041, "loss": 0.0195, "step": 105800 }, { "epoch": 0.27, "learning_rate": 0.00025885878257353266, "loss": 0.1621, "step": 105810 }, { "epoch": 0.27, "learning_rate": 0.0002588548943571612, "loss": 0.0283, "step": 105820 }, { "epoch": 0.27, "learning_rate": 0.0002588510061407897, "loss": 0.0251, "step": 105830 }, { "epoch": 0.27, "learning_rate": 0.0002588471179244182, "loss": 0.027, "step": 105840 }, { "epoch": 0.27, "learning_rate": 0.0002588432297080468, "loss": 0.0229, "step": 105850 }, { "epoch": 0.27, "learning_rate": 0.0002588393414916753, "loss": 0.0342, "step": 105860 }, { "epoch": 0.27, "learning_rate": 0.00025883545327530386, "loss": 0.0246, "step": 105870 }, { "epoch": 0.27, "learning_rate": 0.00025883156505893237, "loss": 0.0222, "step": 105880 }, { "epoch": 0.27, "learning_rate": 0.00025882767684256094, "loss": 0.023, "step": 105890 }, { "epoch": 0.27, "learning_rate": 0.00025882378862618946, "loss": 0.0236, "step": 105900 }, { "epoch": 0.27, "learning_rate": 0.00025881990040981797, "loss": 0.0262, "step": 105910 }, { "epoch": 0.27, "learning_rate": 0.0002588160121934465, "loss": 0.0186, "step": 105920 }, { "epoch": 0.27, "learning_rate": 0.00025881212397707505, "loss": 0.025, "step": 105930 }, { "epoch": 0.27, "learning_rate": 0.0002588082357607036, "loss": 0.0226, "step": 105940 }, { "epoch": 0.27, "learning_rate": 0.00025880434754433214, "loss": 0.0217, "step": 105950 }, { "epoch": 0.27, "learning_rate": 0.00025880045932796065, "loss": 0.02, "step": 105960 }, { "epoch": 0.27, "learning_rate": 0.00025879657111158917, "loss": 0.0279, "step": 105970 }, { "epoch": 0.27, "learning_rate": 0.00025879268289521774, "loss": 0.029, "step": 105980 }, { "epoch": 0.27, "learning_rate": 0.00025878879467884625, "loss": 0.0252, "step": 105990 }, { "epoch": 0.27, "learning_rate": 0.0002587849064624748, "loss": 0.0186, "step": 106000 }, { "epoch": 0.27, "eval_cer": 0.8818118580040337, "eval_loss": 0.016281619668006897, "eval_runtime": 107.9063, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 106000 }, { "epoch": 0.27, "learning_rate": 0.00025878101824610333, "loss": 0.0226, "step": 106010 }, { "epoch": 0.27, "learning_rate": 0.0002587771300297319, "loss": 0.0201, "step": 106020 }, { "epoch": 0.27, "learning_rate": 0.0002587732418133604, "loss": 0.0224, "step": 106030 }, { "epoch": 0.27, "learning_rate": 0.00025876935359698893, "loss": 0.0183, "step": 106040 }, { "epoch": 0.27, "learning_rate": 0.00025876546538061745, "loss": 0.0205, "step": 106050 }, { "epoch": 0.27, "learning_rate": 0.000258761577164246, "loss": 0.0176, "step": 106060 }, { "epoch": 0.27, "learning_rate": 0.00025875768894787453, "loss": 0.0208, "step": 106070 }, { "epoch": 0.27, "learning_rate": 0.0002587538007315031, "loss": 0.0234, "step": 106080 }, { "epoch": 0.28, "learning_rate": 0.0002587499125151316, "loss": 0.0255, "step": 106090 }, { "epoch": 0.28, "learning_rate": 0.0002587460242987602, "loss": 0.022, "step": 106100 }, { "epoch": 0.28, "learning_rate": 0.0002587421360823887, "loss": 0.0204, "step": 106110 }, { "epoch": 0.28, "learning_rate": 0.0002587382478660172, "loss": 0.0262, "step": 106120 }, { "epoch": 0.28, "learning_rate": 0.0002587343596496457, "loss": 0.0248, "step": 106130 }, { "epoch": 0.28, "learning_rate": 0.0002587304714332743, "loss": 0.0177, "step": 106140 }, { "epoch": 0.28, "learning_rate": 0.00025872658321690286, "loss": 0.022, "step": 106150 }, { "epoch": 0.28, "learning_rate": 0.0002587226950005314, "loss": 0.0208, "step": 106160 }, { "epoch": 0.28, "learning_rate": 0.0002587188067841599, "loss": 0.0206, "step": 106170 }, { "epoch": 0.28, "learning_rate": 0.00025871491856778846, "loss": 0.0228, "step": 106180 }, { "epoch": 0.28, "learning_rate": 0.000258711030351417, "loss": 0.0223, "step": 106190 }, { "epoch": 0.28, "learning_rate": 0.0002587071421350455, "loss": 0.0208, "step": 106200 }, { "epoch": 0.28, "learning_rate": 0.00025870325391867406, "loss": 0.0219, "step": 106210 }, { "epoch": 0.28, "learning_rate": 0.00025869936570230257, "loss": 0.0294, "step": 106220 }, { "epoch": 0.28, "learning_rate": 0.00025869547748593114, "loss": 0.0223, "step": 106230 }, { "epoch": 0.28, "learning_rate": 0.00025869158926955965, "loss": 0.0202, "step": 106240 }, { "epoch": 0.28, "learning_rate": 0.00025868770105318817, "loss": 0.0192, "step": 106250 }, { "epoch": 0.28, "learning_rate": 0.0002586838128368167, "loss": 0.0159, "step": 106260 }, { "epoch": 0.28, "learning_rate": 0.00025867992462044525, "loss": 0.0194, "step": 106270 }, { "epoch": 0.28, "learning_rate": 0.00025867603640407377, "loss": 0.0178, "step": 106280 }, { "epoch": 0.28, "learning_rate": 0.00025867214818770234, "loss": 0.0219, "step": 106290 }, { "epoch": 0.28, "learning_rate": 0.00025866825997133085, "loss": 0.0237, "step": 106300 }, { "epoch": 0.28, "learning_rate": 0.0002586643717549594, "loss": 0.0208, "step": 106310 }, { "epoch": 0.28, "learning_rate": 0.00025866048353858793, "loss": 0.024, "step": 106320 }, { "epoch": 0.28, "learning_rate": 0.00025865659532221645, "loss": 0.0222, "step": 106330 }, { "epoch": 0.28, "learning_rate": 0.000258652707105845, "loss": 0.0211, "step": 106340 }, { "epoch": 0.28, "learning_rate": 0.00025864881888947353, "loss": 0.0209, "step": 106350 }, { "epoch": 0.28, "learning_rate": 0.0002586449306731021, "loss": 0.0204, "step": 106360 }, { "epoch": 0.28, "learning_rate": 0.0002586410424567306, "loss": 0.0217, "step": 106370 }, { "epoch": 0.28, "learning_rate": 0.00025863715424035913, "loss": 0.0173, "step": 106380 }, { "epoch": 0.28, "learning_rate": 0.0002586332660239877, "loss": 0.0237, "step": 106390 }, { "epoch": 0.28, "learning_rate": 0.0002586293778076162, "loss": 0.0216, "step": 106400 }, { "epoch": 0.28, "learning_rate": 0.00025862548959124473, "loss": 0.0207, "step": 106410 }, { "epoch": 0.28, "learning_rate": 0.0002586216013748733, "loss": 0.0204, "step": 106420 }, { "epoch": 0.28, "learning_rate": 0.00025861771315850186, "loss": 0.0215, "step": 106430 }, { "epoch": 0.28, "learning_rate": 0.0002586138249421304, "loss": 0.0244, "step": 106440 }, { "epoch": 0.28, "learning_rate": 0.0002586099367257589, "loss": 0.0232, "step": 106450 }, { "epoch": 0.28, "learning_rate": 0.0002586060485093874, "loss": 0.0292, "step": 106460 }, { "epoch": 0.28, "learning_rate": 0.0002586021602930159, "loss": 0.0233, "step": 106470 }, { "epoch": 0.28, "learning_rate": 0.0002585982720766445, "loss": 0.0212, "step": 106480 }, { "epoch": 0.28, "learning_rate": 0.00025859438386027306, "loss": 0.022, "step": 106490 }, { "epoch": 0.28, "learning_rate": 0.0002585904956439016, "loss": 0.0221, "step": 106500 }, { "epoch": 0.28, "learning_rate": 0.0002585866074275301, "loss": 0.023, "step": 106510 }, { "epoch": 0.28, "learning_rate": 0.00025858271921115866, "loss": 0.0239, "step": 106520 }, { "epoch": 0.28, "learning_rate": 0.00025857883099478717, "loss": 0.0247, "step": 106530 }, { "epoch": 0.28, "learning_rate": 0.0002585749427784157, "loss": 0.0191, "step": 106540 }, { "epoch": 0.28, "learning_rate": 0.00025857105456204426, "loss": 0.0249, "step": 106550 }, { "epoch": 0.28, "learning_rate": 0.00025856716634567277, "loss": 0.0228, "step": 106560 }, { "epoch": 0.28, "learning_rate": 0.00025856327812930134, "loss": 0.022, "step": 106570 }, { "epoch": 0.28, "learning_rate": 0.00025855938991292985, "loss": 0.0259, "step": 106580 }, { "epoch": 0.28, "learning_rate": 0.00025855550169655837, "loss": 0.0219, "step": 106590 }, { "epoch": 0.28, "learning_rate": 0.00025855161348018694, "loss": 0.0226, "step": 106600 }, { "epoch": 0.28, "learning_rate": 0.00025854772526381545, "loss": 0.0292, "step": 106610 }, { "epoch": 0.28, "learning_rate": 0.00025854383704744397, "loss": 0.0251, "step": 106620 }, { "epoch": 0.28, "learning_rate": 0.00025853994883107253, "loss": 0.025, "step": 106630 }, { "epoch": 0.28, "learning_rate": 0.0002585360606147011, "loss": 0.0238, "step": 106640 }, { "epoch": 0.28, "learning_rate": 0.0002585321723983296, "loss": 0.0234, "step": 106650 }, { "epoch": 0.28, "learning_rate": 0.00025852828418195813, "loss": 0.0202, "step": 106660 }, { "epoch": 0.28, "learning_rate": 0.00025852439596558665, "loss": 0.0269, "step": 106670 }, { "epoch": 0.28, "learning_rate": 0.0002585205077492152, "loss": 0.023, "step": 106680 }, { "epoch": 0.28, "learning_rate": 0.00025851661953284373, "loss": 0.022, "step": 106690 }, { "epoch": 0.28, "learning_rate": 0.0002585127313164723, "loss": 0.0244, "step": 106700 }, { "epoch": 0.28, "learning_rate": 0.0002585088431001008, "loss": 0.0223, "step": 106710 }, { "epoch": 0.28, "learning_rate": 0.00025850495488372933, "loss": 0.0187, "step": 106720 }, { "epoch": 0.28, "learning_rate": 0.0002585010666673579, "loss": 0.0182, "step": 106730 }, { "epoch": 0.28, "learning_rate": 0.0002584971784509864, "loss": 0.0182, "step": 106740 }, { "epoch": 0.28, "learning_rate": 0.0002584932902346149, "loss": 0.0187, "step": 106750 }, { "epoch": 0.28, "learning_rate": 0.0002584894020182435, "loss": 0.0228, "step": 106760 }, { "epoch": 0.28, "learning_rate": 0.000258485513801872, "loss": 0.026, "step": 106770 }, { "epoch": 0.28, "learning_rate": 0.0002584816255855006, "loss": 0.0246, "step": 106780 }, { "epoch": 0.28, "learning_rate": 0.0002584777373691291, "loss": 0.021, "step": 106790 }, { "epoch": 0.28, "learning_rate": 0.0002584738491527576, "loss": 0.0238, "step": 106800 }, { "epoch": 0.28, "learning_rate": 0.0002584699609363862, "loss": 0.0225, "step": 106810 }, { "epoch": 0.28, "learning_rate": 0.0002584660727200147, "loss": 0.0187, "step": 106820 }, { "epoch": 0.28, "learning_rate": 0.00025846218450364326, "loss": 0.0206, "step": 106830 }, { "epoch": 0.28, "learning_rate": 0.0002584582962872718, "loss": 0.0227, "step": 106840 }, { "epoch": 0.28, "learning_rate": 0.00025845440807090034, "loss": 0.0179, "step": 106850 }, { "epoch": 0.28, "learning_rate": 0.00025845051985452886, "loss": 0.0262, "step": 106860 }, { "epoch": 0.28, "learning_rate": 0.00025844663163815737, "loss": 0.0178, "step": 106870 }, { "epoch": 0.28, "learning_rate": 0.0002584427434217859, "loss": 0.0258, "step": 106880 }, { "epoch": 0.28, "learning_rate": 0.00025843885520541445, "loss": 0.0245, "step": 106890 }, { "epoch": 0.28, "learning_rate": 0.00025843496698904297, "loss": 0.0285, "step": 106900 }, { "epoch": 0.28, "learning_rate": 0.00025843107877267154, "loss": 0.0283, "step": 106910 }, { "epoch": 0.28, "learning_rate": 0.00025842719055630005, "loss": 0.0239, "step": 106920 }, { "epoch": 0.28, "learning_rate": 0.0002584233023399286, "loss": 0.0235, "step": 106930 }, { "epoch": 0.28, "learning_rate": 0.00025841941412355714, "loss": 0.0221, "step": 106940 }, { "epoch": 0.28, "learning_rate": 0.00025841552590718565, "loss": 0.0223, "step": 106950 }, { "epoch": 0.28, "learning_rate": 0.00025841163769081417, "loss": 0.0192, "step": 106960 }, { "epoch": 0.28, "learning_rate": 0.00025840774947444273, "loss": 0.0261, "step": 106970 }, { "epoch": 0.28, "learning_rate": 0.0002584038612580713, "loss": 0.0217, "step": 106980 }, { "epoch": 0.28, "learning_rate": 0.0002583999730416998, "loss": 0.02, "step": 106990 }, { "epoch": 0.28, "learning_rate": 0.00025839608482532833, "loss": 0.0276, "step": 107000 }, { "epoch": 0.28, "eval_cer": 0.8818300532841781, "eval_loss": 0.01527465507388115, "eval_runtime": 108.0078, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 107000 }, { "epoch": 0.28, "learning_rate": 0.00025839219660895685, "loss": 0.0254, "step": 107010 }, { "epoch": 0.28, "learning_rate": 0.0002583883083925854, "loss": 0.0237, "step": 107020 }, { "epoch": 0.28, "learning_rate": 0.00025838442017621393, "loss": 0.022, "step": 107030 }, { "epoch": 0.28, "learning_rate": 0.0002583805319598425, "loss": 0.0197, "step": 107040 }, { "epoch": 0.28, "learning_rate": 0.000258376643743471, "loss": 0.0205, "step": 107050 }, { "epoch": 0.28, "learning_rate": 0.0002583727555270996, "loss": 0.0228, "step": 107060 }, { "epoch": 0.28, "learning_rate": 0.0002583688673107281, "loss": 0.0245, "step": 107070 }, { "epoch": 0.28, "learning_rate": 0.0002583649790943566, "loss": 0.0182, "step": 107080 }, { "epoch": 0.28, "learning_rate": 0.0002583610908779851, "loss": 0.0297, "step": 107090 }, { "epoch": 0.28, "learning_rate": 0.0002583572026616137, "loss": 0.0242, "step": 107100 }, { "epoch": 0.28, "learning_rate": 0.0002583533144452422, "loss": 0.0244, "step": 107110 }, { "epoch": 0.28, "learning_rate": 0.0002583494262288708, "loss": 0.0221, "step": 107120 }, { "epoch": 0.28, "learning_rate": 0.0002583455380124993, "loss": 0.0231, "step": 107130 }, { "epoch": 0.28, "learning_rate": 0.00025834164979612786, "loss": 0.0224, "step": 107140 }, { "epoch": 0.28, "learning_rate": 0.0002583377615797564, "loss": 0.0194, "step": 107150 }, { "epoch": 0.28, "learning_rate": 0.0002583338733633849, "loss": 0.0175, "step": 107160 }, { "epoch": 0.28, "learning_rate": 0.0002583299851470134, "loss": 0.0215, "step": 107170 }, { "epoch": 0.28, "learning_rate": 0.00025832609693064197, "loss": 0.0264, "step": 107180 }, { "epoch": 0.28, "learning_rate": 0.00025832220871427054, "loss": 0.0214, "step": 107190 }, { "epoch": 0.28, "learning_rate": 0.00025831832049789906, "loss": 0.022, "step": 107200 }, { "epoch": 0.28, "learning_rate": 0.00025831443228152757, "loss": 0.0236, "step": 107210 }, { "epoch": 0.28, "learning_rate": 0.0002583105440651561, "loss": 0.0234, "step": 107220 }, { "epoch": 0.28, "learning_rate": 0.00025830665584878465, "loss": 0.0257, "step": 107230 }, { "epoch": 0.28, "learning_rate": 0.00025830276763241317, "loss": 0.0184, "step": 107240 }, { "epoch": 0.28, "learning_rate": 0.00025829887941604174, "loss": 0.0213, "step": 107250 }, { "epoch": 0.28, "learning_rate": 0.00025829499119967025, "loss": 0.0219, "step": 107260 }, { "epoch": 0.28, "learning_rate": 0.0002582911029832988, "loss": 0.0222, "step": 107270 }, { "epoch": 0.28, "learning_rate": 0.00025828721476692733, "loss": 0.0227, "step": 107280 }, { "epoch": 0.28, "learning_rate": 0.00025828332655055585, "loss": 0.0175, "step": 107290 }, { "epoch": 0.28, "learning_rate": 0.00025827943833418436, "loss": 0.0207, "step": 107300 }, { "epoch": 0.28, "learning_rate": 0.00025827555011781293, "loss": 0.023, "step": 107310 }, { "epoch": 0.28, "learning_rate": 0.00025827166190144145, "loss": 0.0207, "step": 107320 }, { "epoch": 0.28, "learning_rate": 0.00025826777368507, "loss": 0.0236, "step": 107330 }, { "epoch": 0.28, "learning_rate": 0.00025826388546869853, "loss": 0.0219, "step": 107340 }, { "epoch": 0.28, "learning_rate": 0.0002582599972523271, "loss": 0.0228, "step": 107350 }, { "epoch": 0.28, "learning_rate": 0.0002582561090359556, "loss": 0.0209, "step": 107360 }, { "epoch": 0.28, "learning_rate": 0.00025825222081958413, "loss": 0.0197, "step": 107370 }, { "epoch": 0.28, "learning_rate": 0.0002582483326032127, "loss": 0.027, "step": 107380 }, { "epoch": 0.28, "learning_rate": 0.0002582444443868412, "loss": 0.0255, "step": 107390 }, { "epoch": 0.28, "learning_rate": 0.0002582405561704698, "loss": 0.0193, "step": 107400 }, { "epoch": 0.28, "learning_rate": 0.0002582366679540983, "loss": 0.0231, "step": 107410 }, { "epoch": 0.28, "learning_rate": 0.0002582327797377268, "loss": 0.02, "step": 107420 }, { "epoch": 0.28, "learning_rate": 0.0002582288915213554, "loss": 0.0211, "step": 107430 }, { "epoch": 0.28, "learning_rate": 0.0002582250033049839, "loss": 0.0234, "step": 107440 }, { "epoch": 0.28, "learning_rate": 0.0002582211150886124, "loss": 0.0261, "step": 107450 }, { "epoch": 0.28, "learning_rate": 0.000258217226872241, "loss": 0.0282, "step": 107460 }, { "epoch": 0.28, "learning_rate": 0.0002582133386558695, "loss": 0.0224, "step": 107470 }, { "epoch": 0.28, "learning_rate": 0.00025820945043949806, "loss": 0.0216, "step": 107480 }, { "epoch": 0.28, "learning_rate": 0.0002582055622231266, "loss": 0.0215, "step": 107490 }, { "epoch": 0.28, "learning_rate": 0.0002582016740067551, "loss": 0.0206, "step": 107500 }, { "epoch": 0.28, "learning_rate": 0.0002581977857903836, "loss": 0.018, "step": 107510 }, { "epoch": 0.28, "learning_rate": 0.00025819389757401217, "loss": 0.0195, "step": 107520 }, { "epoch": 0.28, "learning_rate": 0.00025819000935764074, "loss": 0.0236, "step": 107530 }, { "epoch": 0.28, "learning_rate": 0.00025818612114126925, "loss": 0.0307, "step": 107540 }, { "epoch": 0.28, "learning_rate": 0.00025818223292489777, "loss": 0.0197, "step": 107550 }, { "epoch": 0.28, "learning_rate": 0.00025817834470852634, "loss": 0.0247, "step": 107560 }, { "epoch": 0.28, "learning_rate": 0.00025817445649215485, "loss": 0.0217, "step": 107570 }, { "epoch": 0.28, "learning_rate": 0.00025817056827578337, "loss": 0.0279, "step": 107580 }, { "epoch": 0.28, "learning_rate": 0.00025816668005941194, "loss": 0.021, "step": 107590 }, { "epoch": 0.28, "learning_rate": 0.00025816279184304045, "loss": 0.0283, "step": 107600 }, { "epoch": 0.28, "learning_rate": 0.000258158903626669, "loss": 0.0193, "step": 107610 }, { "epoch": 0.28, "learning_rate": 0.00025815501541029753, "loss": 0.023, "step": 107620 }, { "epoch": 0.28, "learning_rate": 0.00025815112719392605, "loss": 0.0198, "step": 107630 }, { "epoch": 0.28, "learning_rate": 0.0002581472389775546, "loss": 0.0207, "step": 107640 }, { "epoch": 0.28, "learning_rate": 0.00025814335076118313, "loss": 0.0219, "step": 107650 }, { "epoch": 0.28, "learning_rate": 0.00025813946254481165, "loss": 0.0187, "step": 107660 }, { "epoch": 0.28, "learning_rate": 0.0002581355743284402, "loss": 0.0238, "step": 107670 }, { "epoch": 0.28, "learning_rate": 0.00025813168611206873, "loss": 0.0191, "step": 107680 }, { "epoch": 0.28, "learning_rate": 0.0002581277978956973, "loss": 0.0215, "step": 107690 }, { "epoch": 0.28, "learning_rate": 0.0002581239096793258, "loss": 0.0268, "step": 107700 }, { "epoch": 0.28, "learning_rate": 0.0002581200214629543, "loss": 0.0232, "step": 107710 }, { "epoch": 0.28, "learning_rate": 0.00025811613324658284, "loss": 0.0224, "step": 107720 }, { "epoch": 0.28, "learning_rate": 0.0002581122450302114, "loss": 0.0255, "step": 107730 }, { "epoch": 0.28, "learning_rate": 0.00025810835681384, "loss": 0.0223, "step": 107740 }, { "epoch": 0.28, "learning_rate": 0.0002581044685974685, "loss": 0.024, "step": 107750 }, { "epoch": 0.28, "learning_rate": 0.000258100580381097, "loss": 0.0188, "step": 107760 }, { "epoch": 0.28, "learning_rate": 0.0002580966921647256, "loss": 0.0217, "step": 107770 }, { "epoch": 0.28, "learning_rate": 0.0002580928039483541, "loss": 0.0216, "step": 107780 }, { "epoch": 0.28, "learning_rate": 0.0002580889157319826, "loss": 0.0179, "step": 107790 }, { "epoch": 0.28, "learning_rate": 0.0002580850275156112, "loss": 0.0261, "step": 107800 }, { "epoch": 0.28, "learning_rate": 0.0002580811392992397, "loss": 0.0266, "step": 107810 }, { "epoch": 0.28, "learning_rate": 0.00025807725108286826, "loss": 0.0195, "step": 107820 }, { "epoch": 0.28, "learning_rate": 0.00025807336286649677, "loss": 0.0209, "step": 107830 }, { "epoch": 0.28, "learning_rate": 0.0002580694746501253, "loss": 0.026, "step": 107840 }, { "epoch": 0.28, "learning_rate": 0.00025806558643375386, "loss": 0.0256, "step": 107850 }, { "epoch": 0.28, "learning_rate": 0.00025806169821738237, "loss": 0.0209, "step": 107860 }, { "epoch": 0.28, "learning_rate": 0.0002580578100010109, "loss": 0.0206, "step": 107870 }, { "epoch": 0.28, "learning_rate": 0.00025805392178463945, "loss": 0.0207, "step": 107880 }, { "epoch": 0.28, "learning_rate": 0.000258050033568268, "loss": 0.0201, "step": 107890 }, { "epoch": 0.28, "learning_rate": 0.00025804614535189654, "loss": 0.0208, "step": 107900 }, { "epoch": 0.28, "learning_rate": 0.00025804225713552505, "loss": 0.0212, "step": 107910 }, { "epoch": 0.28, "learning_rate": 0.00025803836891915357, "loss": 0.0233, "step": 107920 }, { "epoch": 0.28, "learning_rate": 0.00025803448070278213, "loss": 0.0252, "step": 107930 }, { "epoch": 0.28, "learning_rate": 0.00025803059248641065, "loss": 0.022, "step": 107940 }, { "epoch": 0.28, "learning_rate": 0.0002580267042700392, "loss": 0.0214, "step": 107950 }, { "epoch": 0.28, "learning_rate": 0.00025802281605366773, "loss": 0.0284, "step": 107960 }, { "epoch": 0.28, "learning_rate": 0.00025801892783729625, "loss": 0.0172, "step": 107970 }, { "epoch": 0.28, "learning_rate": 0.0002580150396209248, "loss": 0.0183, "step": 107980 }, { "epoch": 0.28, "learning_rate": 0.00025801115140455333, "loss": 0.0229, "step": 107990 }, { "epoch": 0.28, "learning_rate": 0.00025800726318818184, "loss": 0.0215, "step": 108000 }, { "epoch": 0.28, "eval_cer": 0.8817796663545476, "eval_loss": 0.015666382387280464, "eval_runtime": 108.1495, "eval_samples_per_second": 18.493, "eval_steps_per_second": 4.623, "step": 108000 }, { "epoch": 0.28, "learning_rate": 0.0002580033749718104, "loss": 0.023, "step": 108010 }, { "epoch": 0.28, "learning_rate": 0.000257999486755439, "loss": 0.0263, "step": 108020 }, { "epoch": 0.28, "learning_rate": 0.0002579955985390675, "loss": 0.0264, "step": 108030 }, { "epoch": 0.28, "learning_rate": 0.000257991710322696, "loss": 0.0242, "step": 108040 }, { "epoch": 0.28, "learning_rate": 0.0002579878221063245, "loss": 0.0232, "step": 108050 }, { "epoch": 0.28, "learning_rate": 0.0002579839338899531, "loss": 0.0198, "step": 108060 }, { "epoch": 0.28, "learning_rate": 0.0002579800456735816, "loss": 0.0242, "step": 108070 }, { "epoch": 0.28, "learning_rate": 0.0002579761574572102, "loss": 0.0188, "step": 108080 }, { "epoch": 0.28, "learning_rate": 0.0002579722692408387, "loss": 0.0236, "step": 108090 }, { "epoch": 0.28, "learning_rate": 0.00025796838102446726, "loss": 0.0189, "step": 108100 }, { "epoch": 0.28, "learning_rate": 0.0002579644928080958, "loss": 0.0216, "step": 108110 }, { "epoch": 0.28, "learning_rate": 0.0002579606045917243, "loss": 0.0237, "step": 108120 }, { "epoch": 0.28, "learning_rate": 0.0002579567163753528, "loss": 0.0222, "step": 108130 }, { "epoch": 0.28, "learning_rate": 0.0002579528281589814, "loss": 0.0203, "step": 108140 }, { "epoch": 0.28, "learning_rate": 0.0002579489399426099, "loss": 0.0217, "step": 108150 }, { "epoch": 0.28, "learning_rate": 0.00025794505172623846, "loss": 0.0234, "step": 108160 }, { "epoch": 0.28, "learning_rate": 0.00025794116350986697, "loss": 0.0203, "step": 108170 }, { "epoch": 0.28, "learning_rate": 0.0002579372752934955, "loss": 0.0218, "step": 108180 }, { "epoch": 0.28, "learning_rate": 0.00025793338707712405, "loss": 0.0195, "step": 108190 }, { "epoch": 0.28, "learning_rate": 0.00025792949886075257, "loss": 0.0189, "step": 108200 }, { "epoch": 0.28, "learning_rate": 0.0002579256106443811, "loss": 0.0199, "step": 108210 }, { "epoch": 0.28, "learning_rate": 0.00025792172242800965, "loss": 0.0198, "step": 108220 }, { "epoch": 0.28, "learning_rate": 0.0002579178342116382, "loss": 0.0193, "step": 108230 }, { "epoch": 0.28, "learning_rate": 0.00025791394599526674, "loss": 0.02, "step": 108240 }, { "epoch": 0.28, "learning_rate": 0.00025791005777889525, "loss": 0.0224, "step": 108250 }, { "epoch": 0.28, "learning_rate": 0.00025790616956252376, "loss": 0.0213, "step": 108260 }, { "epoch": 0.28, "learning_rate": 0.00025790228134615233, "loss": 0.0217, "step": 108270 }, { "epoch": 0.28, "learning_rate": 0.00025789839312978085, "loss": 0.0221, "step": 108280 }, { "epoch": 0.28, "learning_rate": 0.0002578945049134094, "loss": 0.0254, "step": 108290 }, { "epoch": 0.28, "learning_rate": 0.00025789061669703793, "loss": 0.0167, "step": 108300 }, { "epoch": 0.28, "learning_rate": 0.0002578867284806665, "loss": 0.0195, "step": 108310 }, { "epoch": 0.28, "learning_rate": 0.000257882840264295, "loss": 0.0226, "step": 108320 }, { "epoch": 0.28, "learning_rate": 0.00025787895204792353, "loss": 0.0268, "step": 108330 }, { "epoch": 0.28, "learning_rate": 0.00025787506383155204, "loss": 0.0205, "step": 108340 }, { "epoch": 0.28, "learning_rate": 0.0002578711756151806, "loss": 0.0256, "step": 108350 }, { "epoch": 0.28, "learning_rate": 0.0002578672873988091, "loss": 0.0284, "step": 108360 }, { "epoch": 0.28, "learning_rate": 0.0002578633991824377, "loss": 0.0218, "step": 108370 }, { "epoch": 0.28, "learning_rate": 0.0002578595109660662, "loss": 0.0226, "step": 108380 }, { "epoch": 0.28, "learning_rate": 0.0002578556227496948, "loss": 0.0244, "step": 108390 }, { "epoch": 0.28, "learning_rate": 0.0002578517345333233, "loss": 0.0202, "step": 108400 }, { "epoch": 0.28, "learning_rate": 0.0002578478463169518, "loss": 0.0227, "step": 108410 }, { "epoch": 0.28, "learning_rate": 0.0002578439581005804, "loss": 0.0245, "step": 108420 }, { "epoch": 0.28, "learning_rate": 0.0002578400698842089, "loss": 0.0199, "step": 108430 }, { "epoch": 0.28, "learning_rate": 0.00025783618166783746, "loss": 0.0197, "step": 108440 }, { "epoch": 0.28, "learning_rate": 0.000257832293451466, "loss": 0.0235, "step": 108450 }, { "epoch": 0.28, "learning_rate": 0.0002578284052350945, "loss": 0.0236, "step": 108460 }, { "epoch": 0.28, "learning_rate": 0.000257824517018723, "loss": 0.0243, "step": 108470 }, { "epoch": 0.28, "learning_rate": 0.00025782062880235157, "loss": 0.0202, "step": 108480 }, { "epoch": 0.28, "learning_rate": 0.0002578167405859801, "loss": 0.0254, "step": 108490 }, { "epoch": 0.28, "learning_rate": 0.00025781285236960866, "loss": 0.0234, "step": 108500 }, { "epoch": 0.28, "learning_rate": 0.00025780896415323717, "loss": 0.0199, "step": 108510 }, { "epoch": 0.28, "learning_rate": 0.00025780507593686574, "loss": 0.0249, "step": 108520 }, { "epoch": 0.28, "learning_rate": 0.00025780118772049425, "loss": 0.0236, "step": 108530 }, { "epoch": 0.28, "learning_rate": 0.00025779729950412277, "loss": 0.0274, "step": 108540 }, { "epoch": 0.28, "learning_rate": 0.0002577934112877513, "loss": 0.0202, "step": 108550 }, { "epoch": 0.28, "learning_rate": 0.00025778952307137985, "loss": 0.0241, "step": 108560 }, { "epoch": 0.28, "learning_rate": 0.0002577856348550084, "loss": 0.0239, "step": 108570 }, { "epoch": 0.28, "learning_rate": 0.00025778174663863693, "loss": 0.0218, "step": 108580 }, { "epoch": 0.28, "learning_rate": 0.00025777785842226545, "loss": 0.0177, "step": 108590 }, { "epoch": 0.28, "learning_rate": 0.000257773970205894, "loss": 0.022, "step": 108600 }, { "epoch": 0.28, "learning_rate": 0.00025777008198952253, "loss": 0.0217, "step": 108610 }, { "epoch": 0.28, "learning_rate": 0.00025776619377315105, "loss": 0.0259, "step": 108620 }, { "epoch": 0.28, "learning_rate": 0.0002577623055567796, "loss": 0.0246, "step": 108630 }, { "epoch": 0.28, "learning_rate": 0.00025775841734040813, "loss": 0.0237, "step": 108640 }, { "epoch": 0.28, "learning_rate": 0.0002577545291240367, "loss": 0.0241, "step": 108650 }, { "epoch": 0.28, "learning_rate": 0.0002577506409076652, "loss": 0.0229, "step": 108660 }, { "epoch": 0.28, "learning_rate": 0.00025774675269129373, "loss": 0.0248, "step": 108670 }, { "epoch": 0.28, "learning_rate": 0.00025774286447492224, "loss": 0.0264, "step": 108680 }, { "epoch": 0.28, "learning_rate": 0.0002577389762585508, "loss": 0.0248, "step": 108690 }, { "epoch": 0.28, "learning_rate": 0.0002577350880421793, "loss": 0.0237, "step": 108700 }, { "epoch": 0.28, "learning_rate": 0.0002577311998258079, "loss": 0.0256, "step": 108710 }, { "epoch": 0.28, "learning_rate": 0.0002577273116094364, "loss": 0.0216, "step": 108720 }, { "epoch": 0.28, "learning_rate": 0.000257723423393065, "loss": 0.0202, "step": 108730 }, { "epoch": 0.28, "learning_rate": 0.0002577195351766935, "loss": 0.0274, "step": 108740 }, { "epoch": 0.28, "learning_rate": 0.000257715646960322, "loss": 0.0233, "step": 108750 }, { "epoch": 0.28, "learning_rate": 0.0002577117587439505, "loss": 0.0202, "step": 108760 }, { "epoch": 0.28, "learning_rate": 0.0002577078705275791, "loss": 0.021, "step": 108770 }, { "epoch": 0.28, "learning_rate": 0.00025770398231120766, "loss": 0.0233, "step": 108780 }, { "epoch": 0.28, "learning_rate": 0.0002577000940948362, "loss": 0.0219, "step": 108790 }, { "epoch": 0.28, "learning_rate": 0.0002576962058784647, "loss": 0.019, "step": 108800 }, { "epoch": 0.28, "learning_rate": 0.00025769231766209326, "loss": 0.0215, "step": 108810 }, { "epoch": 0.28, "learning_rate": 0.00025768842944572177, "loss": 0.0254, "step": 108820 }, { "epoch": 0.28, "learning_rate": 0.0002576845412293503, "loss": 0.0184, "step": 108830 }, { "epoch": 0.28, "learning_rate": 0.00025768065301297885, "loss": 0.0195, "step": 108840 }, { "epoch": 0.28, "learning_rate": 0.00025767676479660737, "loss": 0.0212, "step": 108850 }, { "epoch": 0.28, "learning_rate": 0.00025767287658023594, "loss": 0.022, "step": 108860 }, { "epoch": 0.28, "learning_rate": 0.00025766898836386445, "loss": 0.0202, "step": 108870 }, { "epoch": 0.28, "learning_rate": 0.00025766510014749297, "loss": 0.0198, "step": 108880 }, { "epoch": 0.28, "learning_rate": 0.00025766121193112154, "loss": 0.0236, "step": 108890 }, { "epoch": 0.28, "learning_rate": 0.00025765732371475005, "loss": 0.0221, "step": 108900 }, { "epoch": 0.28, "learning_rate": 0.00025765343549837856, "loss": 0.0211, "step": 108910 }, { "epoch": 0.28, "learning_rate": 0.00025764954728200713, "loss": 0.0228, "step": 108920 }, { "epoch": 0.28, "learning_rate": 0.00025764565906563565, "loss": 0.0187, "step": 108930 }, { "epoch": 0.28, "learning_rate": 0.0002576417708492642, "loss": 0.0232, "step": 108940 }, { "epoch": 0.28, "learning_rate": 0.00025763788263289273, "loss": 0.0217, "step": 108950 }, { "epoch": 0.28, "learning_rate": 0.00025763399441652125, "loss": 0.018, "step": 108960 }, { "epoch": 0.28, "learning_rate": 0.0002576301062001498, "loss": 0.0197, "step": 108970 }, { "epoch": 0.28, "learning_rate": 0.00025762621798377833, "loss": 0.0196, "step": 108980 }, { "epoch": 0.28, "learning_rate": 0.0002576223297674069, "loss": 0.0274, "step": 108990 }, { "epoch": 0.28, "learning_rate": 0.0002576184415510354, "loss": 0.0261, "step": 109000 }, { "epoch": 0.28, "eval_cer": 0.8818188561887047, "eval_loss": 0.015223901718854904, "eval_runtime": 107.9791, "eval_samples_per_second": 18.522, "eval_steps_per_second": 4.631, "step": 109000 }, { "epoch": 0.28, "learning_rate": 0.0002576145533346639, "loss": 0.0208, "step": 109010 }, { "epoch": 0.28, "learning_rate": 0.0002576106651182925, "loss": 0.0222, "step": 109020 }, { "epoch": 0.28, "learning_rate": 0.000257606776901921, "loss": 0.0232, "step": 109030 }, { "epoch": 0.28, "learning_rate": 0.0002576028886855495, "loss": 0.0207, "step": 109040 }, { "epoch": 0.28, "learning_rate": 0.0002575990004691781, "loss": 0.0246, "step": 109050 }, { "epoch": 0.28, "learning_rate": 0.0002575951122528066, "loss": 0.0203, "step": 109060 }, { "epoch": 0.28, "learning_rate": 0.0002575912240364352, "loss": 0.0244, "step": 109070 }, { "epoch": 0.28, "learning_rate": 0.0002575873358200637, "loss": 0.0191, "step": 109080 }, { "epoch": 0.28, "learning_rate": 0.0002575834476036922, "loss": 0.0215, "step": 109090 }, { "epoch": 0.28, "learning_rate": 0.0002575795593873208, "loss": 0.0185, "step": 109100 }, { "epoch": 0.28, "learning_rate": 0.0002575756711709493, "loss": 0.0202, "step": 109110 }, { "epoch": 0.28, "learning_rate": 0.00025757178295457786, "loss": 0.0197, "step": 109120 }, { "epoch": 0.28, "learning_rate": 0.00025756789473820637, "loss": 0.0281, "step": 109130 }, { "epoch": 0.28, "learning_rate": 0.00025756400652183494, "loss": 0.0189, "step": 109140 }, { "epoch": 0.28, "learning_rate": 0.00025756011830546346, "loss": 0.0202, "step": 109150 }, { "epoch": 0.28, "learning_rate": 0.00025755623008909197, "loss": 0.0213, "step": 109160 }, { "epoch": 0.28, "learning_rate": 0.0002575523418727205, "loss": 0.021, "step": 109170 }, { "epoch": 0.28, "learning_rate": 0.00025754845365634905, "loss": 0.0239, "step": 109180 }, { "epoch": 0.28, "learning_rate": 0.00025754456543997757, "loss": 0.0215, "step": 109190 }, { "epoch": 0.28, "learning_rate": 0.00025754067722360614, "loss": 0.0238, "step": 109200 }, { "epoch": 0.28, "learning_rate": 0.00025753678900723465, "loss": 0.0175, "step": 109210 }, { "epoch": 0.28, "learning_rate": 0.00025753290079086317, "loss": 0.0167, "step": 109220 }, { "epoch": 0.28, "learning_rate": 0.00025752901257449173, "loss": 0.0215, "step": 109230 }, { "epoch": 0.28, "learning_rate": 0.00025752512435812025, "loss": 0.0168, "step": 109240 }, { "epoch": 0.28, "learning_rate": 0.00025752123614174876, "loss": 0.0192, "step": 109250 }, { "epoch": 0.28, "learning_rate": 0.00025751734792537733, "loss": 0.0218, "step": 109260 }, { "epoch": 0.28, "learning_rate": 0.0002575134597090059, "loss": 0.0212, "step": 109270 }, { "epoch": 0.28, "learning_rate": 0.0002575095714926344, "loss": 0.0231, "step": 109280 }, { "epoch": 0.28, "learning_rate": 0.00025750568327626293, "loss": 0.0226, "step": 109290 }, { "epoch": 0.28, "learning_rate": 0.00025750179505989144, "loss": 0.0241, "step": 109300 }, { "epoch": 0.28, "learning_rate": 0.00025749790684352, "loss": 0.0224, "step": 109310 }, { "epoch": 0.28, "learning_rate": 0.00025749401862714853, "loss": 0.0214, "step": 109320 }, { "epoch": 0.28, "learning_rate": 0.0002574901304107771, "loss": 0.0227, "step": 109330 }, { "epoch": 0.28, "learning_rate": 0.0002574862421944056, "loss": 0.0185, "step": 109340 }, { "epoch": 0.28, "learning_rate": 0.0002574823539780342, "loss": 0.0197, "step": 109350 }, { "epoch": 0.28, "learning_rate": 0.0002574784657616627, "loss": 0.0195, "step": 109360 }, { "epoch": 0.28, "learning_rate": 0.0002574745775452912, "loss": 0.0177, "step": 109370 }, { "epoch": 0.28, "learning_rate": 0.0002574706893289197, "loss": 0.0205, "step": 109380 }, { "epoch": 0.28, "learning_rate": 0.0002574668011125483, "loss": 0.0208, "step": 109390 }, { "epoch": 0.28, "learning_rate": 0.0002574629128961768, "loss": 0.0256, "step": 109400 }, { "epoch": 0.28, "learning_rate": 0.0002574590246798054, "loss": 0.0169, "step": 109410 }, { "epoch": 0.28, "learning_rate": 0.0002574551364634339, "loss": 0.0218, "step": 109420 }, { "epoch": 0.28, "learning_rate": 0.0002574512482470624, "loss": 0.0201, "step": 109430 }, { "epoch": 0.28, "learning_rate": 0.000257447360030691, "loss": 0.0205, "step": 109440 }, { "epoch": 0.28, "learning_rate": 0.0002574434718143195, "loss": 0.0203, "step": 109450 }, { "epoch": 0.28, "learning_rate": 0.000257439583597948, "loss": 0.0186, "step": 109460 }, { "epoch": 0.28, "learning_rate": 0.00025743569538157657, "loss": 0.0241, "step": 109470 }, { "epoch": 0.28, "learning_rate": 0.00025743180716520514, "loss": 0.0164, "step": 109480 }, { "epoch": 0.28, "learning_rate": 0.00025742791894883365, "loss": 0.019, "step": 109490 }, { "epoch": 0.28, "learning_rate": 0.00025742403073246217, "loss": 0.0174, "step": 109500 }, { "epoch": 0.28, "learning_rate": 0.0002574201425160907, "loss": 0.0209, "step": 109510 }, { "epoch": 0.28, "learning_rate": 0.00025741625429971925, "loss": 0.0232, "step": 109520 }, { "epoch": 0.28, "learning_rate": 0.00025741236608334777, "loss": 0.0191, "step": 109530 }, { "epoch": 0.28, "learning_rate": 0.00025740847786697634, "loss": 0.0218, "step": 109540 }, { "epoch": 0.28, "learning_rate": 0.00025740458965060485, "loss": 0.0238, "step": 109550 }, { "epoch": 0.28, "learning_rate": 0.0002574007014342334, "loss": 0.0251, "step": 109560 }, { "epoch": 0.28, "learning_rate": 0.00025739681321786193, "loss": 0.0235, "step": 109570 }, { "epoch": 0.28, "learning_rate": 0.00025739292500149045, "loss": 0.0253, "step": 109580 }, { "epoch": 0.28, "learning_rate": 0.00025738903678511896, "loss": 0.0196, "step": 109590 }, { "epoch": 0.28, "learning_rate": 0.00025738514856874753, "loss": 0.0223, "step": 109600 }, { "epoch": 0.28, "learning_rate": 0.0002573812603523761, "loss": 0.0206, "step": 109610 }, { "epoch": 0.28, "learning_rate": 0.0002573773721360046, "loss": 0.0238, "step": 109620 }, { "epoch": 0.28, "learning_rate": 0.00025737348391963313, "loss": 0.0256, "step": 109630 }, { "epoch": 0.28, "learning_rate": 0.0002573695957032617, "loss": 0.0183, "step": 109640 }, { "epoch": 0.28, "learning_rate": 0.0002573657074868902, "loss": 0.0223, "step": 109650 }, { "epoch": 0.28, "learning_rate": 0.0002573618192705187, "loss": 0.0202, "step": 109660 }, { "epoch": 0.28, "learning_rate": 0.0002573579310541473, "loss": 0.0204, "step": 109670 }, { "epoch": 0.28, "learning_rate": 0.0002573540428377758, "loss": 0.0226, "step": 109680 }, { "epoch": 0.28, "learning_rate": 0.0002573501546214044, "loss": 0.0218, "step": 109690 }, { "epoch": 0.28, "learning_rate": 0.0002573462664050329, "loss": 0.0223, "step": 109700 }, { "epoch": 0.28, "learning_rate": 0.0002573423781886614, "loss": 0.0228, "step": 109710 }, { "epoch": 0.28, "learning_rate": 0.0002573384899722899, "loss": 0.0213, "step": 109720 }, { "epoch": 0.28, "learning_rate": 0.0002573346017559185, "loss": 0.0266, "step": 109730 }, { "epoch": 0.28, "learning_rate": 0.000257330713539547, "loss": 0.0202, "step": 109740 }, { "epoch": 0.28, "learning_rate": 0.0002573268253231756, "loss": 0.0275, "step": 109750 }, { "epoch": 0.28, "learning_rate": 0.0002573229371068041, "loss": 0.025, "step": 109760 }, { "epoch": 0.28, "learning_rate": 0.00025731904889043266, "loss": 0.0211, "step": 109770 }, { "epoch": 0.28, "learning_rate": 0.00025731516067406117, "loss": 0.0222, "step": 109780 }, { "epoch": 0.28, "learning_rate": 0.0002573112724576897, "loss": 0.0186, "step": 109790 }, { "epoch": 0.28, "learning_rate": 0.0002573073842413182, "loss": 0.0222, "step": 109800 }, { "epoch": 0.28, "learning_rate": 0.00025730349602494677, "loss": 0.0212, "step": 109810 }, { "epoch": 0.28, "learning_rate": 0.00025729960780857534, "loss": 0.0257, "step": 109820 }, { "epoch": 0.28, "learning_rate": 0.00025729571959220385, "loss": 0.0221, "step": 109830 }, { "epoch": 0.28, "learning_rate": 0.00025729183137583237, "loss": 0.0223, "step": 109840 }, { "epoch": 0.28, "learning_rate": 0.00025728794315946094, "loss": 0.0256, "step": 109850 }, { "epoch": 0.28, "learning_rate": 0.00025728405494308945, "loss": 0.0196, "step": 109860 }, { "epoch": 0.28, "learning_rate": 0.00025728016672671797, "loss": 0.0204, "step": 109870 }, { "epoch": 0.28, "learning_rate": 0.00025727627851034653, "loss": 0.0242, "step": 109880 }, { "epoch": 0.28, "learning_rate": 0.00025727239029397505, "loss": 0.0205, "step": 109890 }, { "epoch": 0.28, "learning_rate": 0.0002572685020776036, "loss": 0.0211, "step": 109900 }, { "epoch": 0.28, "learning_rate": 0.00025726461386123213, "loss": 0.0192, "step": 109910 }, { "epoch": 0.28, "learning_rate": 0.00025726072564486065, "loss": 0.0177, "step": 109920 }, { "epoch": 0.28, "learning_rate": 0.00025725683742848916, "loss": 0.0231, "step": 109930 }, { "epoch": 0.28, "learning_rate": 0.00025725294921211773, "loss": 0.0218, "step": 109940 }, { "epoch": 0.29, "learning_rate": 0.00025724906099574624, "loss": 0.0221, "step": 109950 }, { "epoch": 0.29, "learning_rate": 0.0002572451727793748, "loss": 0.0207, "step": 109960 }, { "epoch": 0.29, "learning_rate": 0.00025724128456300333, "loss": 0.0224, "step": 109970 }, { "epoch": 0.29, "learning_rate": 0.0002572373963466319, "loss": 0.0183, "step": 109980 }, { "epoch": 0.29, "learning_rate": 0.0002572335081302604, "loss": 0.0168, "step": 109990 }, { "epoch": 0.29, "learning_rate": 0.0002572296199138889, "loss": 0.0189, "step": 110000 }, { "epoch": 0.29, "eval_cer": 0.8817908634500211, "eval_loss": 0.01513556856662035, "eval_runtime": 108.099, "eval_samples_per_second": 18.502, "eval_steps_per_second": 4.625, "step": 110000 }, { "epoch": 0.29, "learning_rate": 0.0002572257316975175, "loss": 0.0182, "step": 110010 }, { "epoch": 0.29, "learning_rate": 0.000257221843481146, "loss": 0.0203, "step": 110020 }, { "epoch": 0.29, "learning_rate": 0.0002572179552647746, "loss": 0.0241, "step": 110030 }, { "epoch": 0.29, "learning_rate": 0.0002572140670484031, "loss": 0.0205, "step": 110040 }, { "epoch": 0.29, "learning_rate": 0.0002572101788320316, "loss": 0.0173, "step": 110050 }, { "epoch": 0.29, "learning_rate": 0.0002572062906156602, "loss": 0.02, "step": 110060 }, { "epoch": 0.29, "learning_rate": 0.0002572024023992887, "loss": 0.0204, "step": 110070 }, { "epoch": 0.29, "learning_rate": 0.0002571985141829172, "loss": 0.0193, "step": 110080 }, { "epoch": 0.29, "learning_rate": 0.0002571946259665458, "loss": 0.0222, "step": 110090 }, { "epoch": 0.29, "learning_rate": 0.0002571907377501743, "loss": 0.0211, "step": 110100 }, { "epoch": 0.29, "learning_rate": 0.00025718684953380286, "loss": 0.022, "step": 110110 }, { "epoch": 0.29, "learning_rate": 0.00025718296131743137, "loss": 0.0216, "step": 110120 }, { "epoch": 0.29, "learning_rate": 0.0002571790731010599, "loss": 0.0221, "step": 110130 }, { "epoch": 0.29, "learning_rate": 0.00025717518488468845, "loss": 0.0183, "step": 110140 }, { "epoch": 0.29, "learning_rate": 0.00025717129666831697, "loss": 0.0219, "step": 110150 }, { "epoch": 0.29, "learning_rate": 0.00025716740845194554, "loss": 0.0193, "step": 110160 }, { "epoch": 0.29, "learning_rate": 0.00025716352023557405, "loss": 0.0228, "step": 110170 }, { "epoch": 0.29, "learning_rate": 0.00025715963201920257, "loss": 0.0214, "step": 110180 }, { "epoch": 0.29, "learning_rate": 0.00025715574380283114, "loss": 0.0222, "step": 110190 }, { "epoch": 0.29, "learning_rate": 0.00025715185558645965, "loss": 0.0171, "step": 110200 }, { "epoch": 0.29, "learning_rate": 0.00025714796737008816, "loss": 0.0174, "step": 110210 }, { "epoch": 0.29, "learning_rate": 0.00025714407915371673, "loss": 0.0217, "step": 110220 }, { "epoch": 0.29, "learning_rate": 0.00025714019093734525, "loss": 0.0259, "step": 110230 }, { "epoch": 0.29, "learning_rate": 0.0002571363027209738, "loss": 0.0193, "step": 110240 }, { "epoch": 0.29, "learning_rate": 0.00025713241450460233, "loss": 0.024, "step": 110250 }, { "epoch": 0.29, "learning_rate": 0.00025712852628823085, "loss": 0.0211, "step": 110260 }, { "epoch": 0.29, "learning_rate": 0.0002571246380718594, "loss": 0.022, "step": 110270 }, { "epoch": 0.29, "learning_rate": 0.00025712074985548793, "loss": 0.0226, "step": 110280 }, { "epoch": 0.29, "learning_rate": 0.00025711686163911644, "loss": 0.0248, "step": 110290 }, { "epoch": 0.29, "learning_rate": 0.000257112973422745, "loss": 0.0216, "step": 110300 }, { "epoch": 0.29, "learning_rate": 0.0002571090852063736, "loss": 0.0293, "step": 110310 }, { "epoch": 0.29, "learning_rate": 0.0002571051969900021, "loss": 0.0251, "step": 110320 }, { "epoch": 0.29, "learning_rate": 0.0002571013087736306, "loss": 0.0201, "step": 110330 }, { "epoch": 0.29, "learning_rate": 0.0002570974205572591, "loss": 0.0238, "step": 110340 }, { "epoch": 0.29, "learning_rate": 0.0002570935323408877, "loss": 0.0224, "step": 110350 }, { "epoch": 0.29, "learning_rate": 0.0002570896441245162, "loss": 0.0234, "step": 110360 }, { "epoch": 0.29, "learning_rate": 0.0002570857559081448, "loss": 0.0218, "step": 110370 }, { "epoch": 0.29, "learning_rate": 0.0002570818676917733, "loss": 0.0251, "step": 110380 }, { "epoch": 0.29, "learning_rate": 0.00025707797947540186, "loss": 0.0265, "step": 110390 }, { "epoch": 0.29, "learning_rate": 0.0002570740912590304, "loss": 0.025, "step": 110400 }, { "epoch": 0.29, "learning_rate": 0.0002570702030426589, "loss": 0.0197, "step": 110410 }, { "epoch": 0.29, "learning_rate": 0.0002570663148262874, "loss": 0.0283, "step": 110420 }, { "epoch": 0.29, "learning_rate": 0.00025706242660991597, "loss": 0.0254, "step": 110430 }, { "epoch": 0.29, "learning_rate": 0.0002570585383935445, "loss": 0.0272, "step": 110440 }, { "epoch": 0.29, "learning_rate": 0.00025705465017717306, "loss": 0.0203, "step": 110450 }, { "epoch": 0.29, "learning_rate": 0.00025705076196080157, "loss": 0.0258, "step": 110460 }, { "epoch": 0.29, "learning_rate": 0.0002570468737444301, "loss": 0.024, "step": 110470 }, { "epoch": 0.29, "learning_rate": 0.00025704298552805865, "loss": 0.0201, "step": 110480 }, { "epoch": 0.29, "learning_rate": 0.00025703909731168717, "loss": 0.0203, "step": 110490 }, { "epoch": 0.29, "learning_rate": 0.0002570352090953157, "loss": 0.0204, "step": 110500 }, { "epoch": 0.29, "learning_rate": 0.00025703132087894425, "loss": 0.0207, "step": 110510 }, { "epoch": 0.29, "learning_rate": 0.0002570274326625728, "loss": 0.0206, "step": 110520 }, { "epoch": 0.29, "learning_rate": 0.00025702354444620133, "loss": 0.0223, "step": 110530 }, { "epoch": 0.29, "learning_rate": 0.00025701965622982985, "loss": 0.0181, "step": 110540 }, { "epoch": 0.29, "learning_rate": 0.00025701576801345836, "loss": 0.0215, "step": 110550 }, { "epoch": 0.29, "learning_rate": 0.00025701187979708693, "loss": 0.0214, "step": 110560 }, { "epoch": 0.29, "learning_rate": 0.00025700799158071545, "loss": 0.0217, "step": 110570 }, { "epoch": 0.29, "learning_rate": 0.000257004103364344, "loss": 0.0212, "step": 110580 }, { "epoch": 0.29, "learning_rate": 0.00025700021514797253, "loss": 0.0182, "step": 110590 }, { "epoch": 0.29, "learning_rate": 0.0002569963269316011, "loss": 0.0223, "step": 110600 }, { "epoch": 0.29, "learning_rate": 0.0002569924387152296, "loss": 0.0213, "step": 110610 }, { "epoch": 0.29, "learning_rate": 0.00025698855049885813, "loss": 0.0233, "step": 110620 }, { "epoch": 0.29, "learning_rate": 0.00025698466228248664, "loss": 0.0208, "step": 110630 }, { "epoch": 0.29, "learning_rate": 0.0002569807740661152, "loss": 0.0198, "step": 110640 }, { "epoch": 0.29, "learning_rate": 0.0002569768858497437, "loss": 0.0181, "step": 110650 }, { "epoch": 0.29, "learning_rate": 0.0002569729976333723, "loss": 0.0178, "step": 110660 }, { "epoch": 0.29, "learning_rate": 0.0002569691094170008, "loss": 0.0212, "step": 110670 }, { "epoch": 0.29, "learning_rate": 0.0002569652212006293, "loss": 0.023, "step": 110680 }, { "epoch": 0.29, "learning_rate": 0.0002569613329842579, "loss": 0.0227, "step": 110690 }, { "epoch": 0.29, "learning_rate": 0.0002569574447678864, "loss": 0.0243, "step": 110700 }, { "epoch": 0.29, "learning_rate": 0.000256953556551515, "loss": 0.0203, "step": 110710 }, { "epoch": 0.29, "learning_rate": 0.0002569496683351435, "loss": 0.0212, "step": 110720 }, { "epoch": 0.29, "learning_rate": 0.00025694578011877206, "loss": 0.0208, "step": 110730 }, { "epoch": 0.29, "learning_rate": 0.0002569418919024006, "loss": 0.0243, "step": 110740 }, { "epoch": 0.29, "learning_rate": 0.0002569380036860291, "loss": 0.0183, "step": 110750 }, { "epoch": 0.29, "learning_rate": 0.0002569341154696576, "loss": 0.0196, "step": 110760 }, { "epoch": 0.29, "learning_rate": 0.00025693022725328617, "loss": 0.0196, "step": 110770 }, { "epoch": 0.29, "learning_rate": 0.0002569263390369147, "loss": 0.0209, "step": 110780 }, { "epoch": 0.29, "learning_rate": 0.00025692245082054325, "loss": 0.0202, "step": 110790 }, { "epoch": 0.29, "learning_rate": 0.00025691856260417177, "loss": 0.0227, "step": 110800 }, { "epoch": 0.29, "learning_rate": 0.00025691467438780034, "loss": 0.0204, "step": 110810 }, { "epoch": 0.29, "learning_rate": 0.00025691078617142885, "loss": 0.0221, "step": 110820 }, { "epoch": 0.29, "learning_rate": 0.00025690689795505737, "loss": 0.0219, "step": 110830 }, { "epoch": 0.29, "learning_rate": 0.0002569030097386859, "loss": 0.028, "step": 110840 }, { "epoch": 0.29, "learning_rate": 0.00025689912152231445, "loss": 0.0185, "step": 110850 }, { "epoch": 0.29, "learning_rate": 0.000256895233305943, "loss": 0.0245, "step": 110860 }, { "epoch": 0.29, "learning_rate": 0.00025689134508957153, "loss": 0.0203, "step": 110870 }, { "epoch": 0.29, "learning_rate": 0.00025688745687320005, "loss": 0.0255, "step": 110880 }, { "epoch": 0.29, "learning_rate": 0.0002568835686568286, "loss": 0.0221, "step": 110890 }, { "epoch": 0.29, "learning_rate": 0.00025687968044045713, "loss": 0.0208, "step": 110900 }, { "epoch": 0.29, "learning_rate": 0.00025687579222408565, "loss": 0.0195, "step": 110910 }, { "epoch": 0.29, "learning_rate": 0.0002568719040077142, "loss": 0.0185, "step": 110920 }, { "epoch": 0.29, "learning_rate": 0.00025686801579134273, "loss": 0.0215, "step": 110930 }, { "epoch": 0.29, "learning_rate": 0.0002568641275749713, "loss": 0.023, "step": 110940 }, { "epoch": 0.29, "learning_rate": 0.0002568602393585998, "loss": 0.0179, "step": 110950 }, { "epoch": 0.29, "learning_rate": 0.0002568563511422283, "loss": 0.0208, "step": 110960 }, { "epoch": 0.29, "learning_rate": 0.00025685246292585684, "loss": 0.0222, "step": 110970 }, { "epoch": 0.29, "learning_rate": 0.0002568485747094854, "loss": 0.0232, "step": 110980 }, { "epoch": 0.29, "learning_rate": 0.0002568446864931139, "loss": 0.0218, "step": 110990 }, { "epoch": 0.29, "learning_rate": 0.0002568407982767425, "loss": 0.0216, "step": 111000 }, { "epoch": 0.29, "eval_cer": 0.8817768670806793, "eval_loss": 0.015027694404125214, "eval_runtime": 107.3953, "eval_samples_per_second": 18.623, "eval_steps_per_second": 4.656, "step": 111000 }, { "epoch": 0.29, "learning_rate": 0.000256836910060371, "loss": 0.0184, "step": 111010 }, { "epoch": 0.29, "learning_rate": 0.0002568330218439996, "loss": 0.0263, "step": 111020 }, { "epoch": 0.29, "learning_rate": 0.0002568291336276281, "loss": 0.0229, "step": 111030 }, { "epoch": 0.29, "learning_rate": 0.0002568252454112566, "loss": 0.0244, "step": 111040 }, { "epoch": 0.29, "learning_rate": 0.0002568213571948851, "loss": 0.0261, "step": 111050 }, { "epoch": 0.29, "learning_rate": 0.0002568174689785137, "loss": 0.0261, "step": 111060 }, { "epoch": 0.29, "learning_rate": 0.00025681358076214226, "loss": 0.0212, "step": 111070 }, { "epoch": 0.29, "learning_rate": 0.00025680969254577077, "loss": 0.023, "step": 111080 }, { "epoch": 0.29, "learning_rate": 0.0002568058043293993, "loss": 0.0245, "step": 111090 }, { "epoch": 0.29, "learning_rate": 0.00025680191611302786, "loss": 0.0261, "step": 111100 }, { "epoch": 0.29, "learning_rate": 0.00025679802789665637, "loss": 0.0242, "step": 111110 }, { "epoch": 0.29, "learning_rate": 0.0002567941396802849, "loss": 0.0203, "step": 111120 }, { "epoch": 0.29, "learning_rate": 0.00025679025146391345, "loss": 0.0209, "step": 111130 }, { "epoch": 0.29, "learning_rate": 0.00025678636324754197, "loss": 0.0235, "step": 111140 }, { "epoch": 0.29, "learning_rate": 0.00025678247503117054, "loss": 0.0218, "step": 111150 }, { "epoch": 0.29, "learning_rate": 0.00025677858681479905, "loss": 0.0181, "step": 111160 }, { "epoch": 0.29, "learning_rate": 0.00025677469859842757, "loss": 0.0223, "step": 111170 }, { "epoch": 0.29, "learning_rate": 0.0002567708103820561, "loss": 0.0178, "step": 111180 }, { "epoch": 0.29, "learning_rate": 0.00025676692216568465, "loss": 0.0201, "step": 111190 }, { "epoch": 0.29, "learning_rate": 0.0002567630339493132, "loss": 0.0222, "step": 111200 }, { "epoch": 0.29, "learning_rate": 0.00025675914573294173, "loss": 0.0233, "step": 111210 }, { "epoch": 0.29, "learning_rate": 0.00025675525751657025, "loss": 0.02, "step": 111220 }, { "epoch": 0.29, "learning_rate": 0.0002567513693001988, "loss": 0.0214, "step": 111230 }, { "epoch": 0.29, "learning_rate": 0.00025674748108382733, "loss": 0.0224, "step": 111240 }, { "epoch": 0.29, "learning_rate": 0.00025674359286745584, "loss": 0.02, "step": 111250 }, { "epoch": 0.29, "learning_rate": 0.0002567397046510844, "loss": 0.0188, "step": 111260 }, { "epoch": 0.29, "learning_rate": 0.00025673581643471293, "loss": 0.0176, "step": 111270 }, { "epoch": 0.29, "learning_rate": 0.0002567319282183415, "loss": 0.0215, "step": 111280 }, { "epoch": 0.29, "learning_rate": 0.00025672804000197, "loss": 0.0214, "step": 111290 }, { "epoch": 0.29, "learning_rate": 0.0002567241517855985, "loss": 0.0276, "step": 111300 }, { "epoch": 0.29, "learning_rate": 0.0002567202635692271, "loss": 0.0264, "step": 111310 }, { "epoch": 0.29, "learning_rate": 0.0002567163753528556, "loss": 0.0247, "step": 111320 }, { "epoch": 0.29, "learning_rate": 0.0002567124871364841, "loss": 0.0254, "step": 111330 }, { "epoch": 0.29, "learning_rate": 0.0002567085989201127, "loss": 0.0247, "step": 111340 }, { "epoch": 0.29, "learning_rate": 0.00025670471070374126, "loss": 0.0222, "step": 111350 }, { "epoch": 0.29, "learning_rate": 0.0002567008224873698, "loss": 0.0237, "step": 111360 }, { "epoch": 0.29, "learning_rate": 0.0002566969342709983, "loss": 0.0229, "step": 111370 }, { "epoch": 0.29, "learning_rate": 0.0002566930460546268, "loss": 0.0257, "step": 111380 }, { "epoch": 0.29, "learning_rate": 0.0002566891578382554, "loss": 0.0203, "step": 111390 }, { "epoch": 0.29, "learning_rate": 0.0002566852696218839, "loss": 0.0259, "step": 111400 }, { "epoch": 0.29, "learning_rate": 0.00025668138140551246, "loss": 0.0197, "step": 111410 }, { "epoch": 0.29, "learning_rate": 0.00025667749318914097, "loss": 0.0206, "step": 111420 }, { "epoch": 0.29, "learning_rate": 0.0002566736049727695, "loss": 0.0165, "step": 111430 }, { "epoch": 0.29, "learning_rate": 0.00025666971675639805, "loss": 0.0222, "step": 111440 }, { "epoch": 0.29, "learning_rate": 0.00025666582854002657, "loss": 0.0198, "step": 111450 }, { "epoch": 0.29, "learning_rate": 0.0002566619403236551, "loss": 0.0193, "step": 111460 }, { "epoch": 0.29, "learning_rate": 0.00025665805210728365, "loss": 0.0248, "step": 111470 }, { "epoch": 0.29, "learning_rate": 0.00025665416389091217, "loss": 0.0193, "step": 111480 }, { "epoch": 0.29, "learning_rate": 0.00025665027567454074, "loss": 0.0249, "step": 111490 }, { "epoch": 0.29, "learning_rate": 0.00025664638745816925, "loss": 0.0228, "step": 111500 }, { "epoch": 0.29, "learning_rate": 0.00025664249924179776, "loss": 0.0266, "step": 111510 }, { "epoch": 0.29, "learning_rate": 0.00025663861102542633, "loss": 0.0218, "step": 111520 }, { "epoch": 0.29, "learning_rate": 0.00025663472280905485, "loss": 0.0217, "step": 111530 }, { "epoch": 0.29, "learning_rate": 0.00025663083459268336, "loss": 0.0193, "step": 111540 }, { "epoch": 0.29, "learning_rate": 0.00025662694637631193, "loss": 0.0245, "step": 111550 }, { "epoch": 0.29, "learning_rate": 0.0002566230581599405, "loss": 0.0206, "step": 111560 }, { "epoch": 0.29, "learning_rate": 0.000256619169943569, "loss": 0.0195, "step": 111570 }, { "epoch": 0.29, "learning_rate": 0.00025661528172719753, "loss": 0.0179, "step": 111580 }, { "epoch": 0.29, "learning_rate": 0.00025661139351082604, "loss": 0.019, "step": 111590 }, { "epoch": 0.29, "learning_rate": 0.0002566075052944546, "loss": 0.0215, "step": 111600 }, { "epoch": 0.29, "learning_rate": 0.0002566036170780831, "loss": 0.0229, "step": 111610 }, { "epoch": 0.29, "learning_rate": 0.0002565997288617117, "loss": 0.0212, "step": 111620 }, { "epoch": 0.29, "learning_rate": 0.0002565958406453402, "loss": 0.0206, "step": 111630 }, { "epoch": 0.29, "learning_rate": 0.0002565919524289688, "loss": 0.0237, "step": 111640 }, { "epoch": 0.29, "learning_rate": 0.0002565880642125973, "loss": 0.0206, "step": 111650 }, { "epoch": 0.29, "learning_rate": 0.0002565841759962258, "loss": 0.0248, "step": 111660 }, { "epoch": 0.29, "learning_rate": 0.0002565802877798543, "loss": 0.0244, "step": 111670 }, { "epoch": 0.29, "learning_rate": 0.0002565763995634829, "loss": 0.0221, "step": 111680 }, { "epoch": 0.29, "learning_rate": 0.0002565725113471114, "loss": 0.0193, "step": 111690 }, { "epoch": 0.29, "learning_rate": 0.00025656862313074, "loss": 0.0303, "step": 111700 }, { "epoch": 0.29, "learning_rate": 0.0002565647349143685, "loss": 0.0178, "step": 111710 }, { "epoch": 0.29, "learning_rate": 0.000256560846697997, "loss": 0.0268, "step": 111720 }, { "epoch": 0.29, "learning_rate": 0.00025655695848162557, "loss": 0.022, "step": 111730 }, { "epoch": 0.29, "learning_rate": 0.0002565530702652541, "loss": 0.0282, "step": 111740 }, { "epoch": 0.29, "learning_rate": 0.00025654918204888266, "loss": 0.0237, "step": 111750 }, { "epoch": 0.29, "learning_rate": 0.00025654529383251117, "loss": 0.0197, "step": 111760 }, { "epoch": 0.29, "learning_rate": 0.00025654140561613974, "loss": 0.0217, "step": 111770 }, { "epoch": 0.29, "learning_rate": 0.00025653751739976825, "loss": 0.0259, "step": 111780 }, { "epoch": 0.29, "learning_rate": 0.00025653362918339677, "loss": 0.0278, "step": 111790 }, { "epoch": 0.29, "learning_rate": 0.0002565297409670253, "loss": 0.02, "step": 111800 }, { "epoch": 0.29, "learning_rate": 0.00025652585275065385, "loss": 0.025, "step": 111810 }, { "epoch": 0.29, "learning_rate": 0.00025652196453428237, "loss": 0.0207, "step": 111820 }, { "epoch": 0.29, "learning_rate": 0.00025651807631791093, "loss": 0.0216, "step": 111830 }, { "epoch": 0.29, "learning_rate": 0.00025651418810153945, "loss": 0.0175, "step": 111840 }, { "epoch": 0.29, "learning_rate": 0.000256510299885168, "loss": 0.0194, "step": 111850 }, { "epoch": 0.29, "learning_rate": 0.00025650641166879653, "loss": 0.0175, "step": 111860 }, { "epoch": 0.29, "learning_rate": 0.00025650252345242505, "loss": 0.0198, "step": 111870 }, { "epoch": 0.29, "learning_rate": 0.00025649863523605356, "loss": 0.0211, "step": 111880 }, { "epoch": 0.29, "learning_rate": 0.00025649474701968213, "loss": 0.0205, "step": 111890 }, { "epoch": 0.29, "learning_rate": 0.0002564908588033107, "loss": 0.0208, "step": 111900 }, { "epoch": 0.29, "learning_rate": 0.0002564869705869392, "loss": 0.0216, "step": 111910 }, { "epoch": 0.29, "learning_rate": 0.00025648308237056773, "loss": 0.0177, "step": 111920 }, { "epoch": 0.29, "learning_rate": 0.00025647919415419624, "loss": 0.0228, "step": 111930 }, { "epoch": 0.29, "learning_rate": 0.0002564753059378248, "loss": 0.0206, "step": 111940 }, { "epoch": 0.29, "learning_rate": 0.0002564714177214533, "loss": 0.0187, "step": 111950 }, { "epoch": 0.29, "learning_rate": 0.0002564675295050819, "loss": 0.0284, "step": 111960 }, { "epoch": 0.29, "learning_rate": 0.0002564636412887104, "loss": 0.0221, "step": 111970 }, { "epoch": 0.29, "learning_rate": 0.000256459753072339, "loss": 0.0197, "step": 111980 }, { "epoch": 0.29, "learning_rate": 0.0002564558648559675, "loss": 0.0229, "step": 111990 }, { "epoch": 0.29, "learning_rate": 0.000256451976639596, "loss": 0.0198, "step": 112000 }, { "epoch": 0.29, "eval_cer": 0.8818104583670996, "eval_loss": 0.014513031579554081, "eval_runtime": 107.5973, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 112000 }, { "epoch": 0.29, "learning_rate": 0.0002564480884232245, "loss": 0.0193, "step": 112010 }, { "epoch": 0.29, "learning_rate": 0.0002564442002068531, "loss": 0.0259, "step": 112020 }, { "epoch": 0.29, "learning_rate": 0.0002564403119904816, "loss": 0.0191, "step": 112030 }, { "epoch": 0.29, "learning_rate": 0.00025643642377411017, "loss": 0.0239, "step": 112040 }, { "epoch": 0.29, "learning_rate": 0.0002564325355577387, "loss": 0.0213, "step": 112050 }, { "epoch": 0.29, "learning_rate": 0.00025642864734136726, "loss": 0.0212, "step": 112060 }, { "epoch": 0.29, "learning_rate": 0.00025642475912499577, "loss": 0.023, "step": 112070 }, { "epoch": 0.29, "learning_rate": 0.0002564208709086243, "loss": 0.018, "step": 112080 }, { "epoch": 0.29, "learning_rate": 0.0002564169826922528, "loss": 0.022, "step": 112090 }, { "epoch": 0.29, "learning_rate": 0.00025641309447588137, "loss": 0.0197, "step": 112100 }, { "epoch": 0.29, "learning_rate": 0.00025640920625950994, "loss": 0.0261, "step": 112110 }, { "epoch": 0.29, "learning_rate": 0.00025640531804313845, "loss": 0.019, "step": 112120 }, { "epoch": 0.29, "learning_rate": 0.00025640142982676697, "loss": 0.0225, "step": 112130 }, { "epoch": 0.29, "learning_rate": 0.00025639754161039553, "loss": 0.0282, "step": 112140 }, { "epoch": 0.29, "learning_rate": 0.00025639365339402405, "loss": 0.0186, "step": 112150 }, { "epoch": 0.29, "learning_rate": 0.00025638976517765256, "loss": 0.02, "step": 112160 }, { "epoch": 0.29, "learning_rate": 0.00025638587696128113, "loss": 0.0325, "step": 112170 }, { "epoch": 0.29, "learning_rate": 0.00025638198874490965, "loss": 0.0204, "step": 112180 }, { "epoch": 0.29, "learning_rate": 0.0002563781005285382, "loss": 0.0177, "step": 112190 }, { "epoch": 0.29, "learning_rate": 0.00025637421231216673, "loss": 0.0204, "step": 112200 }, { "epoch": 0.29, "learning_rate": 0.00025637032409579525, "loss": 0.0215, "step": 112210 }, { "epoch": 0.29, "learning_rate": 0.00025636643587942376, "loss": 0.0195, "step": 112220 }, { "epoch": 0.29, "learning_rate": 0.00025636254766305233, "loss": 0.0216, "step": 112230 }, { "epoch": 0.29, "learning_rate": 0.00025635865944668084, "loss": 0.023, "step": 112240 }, { "epoch": 0.29, "learning_rate": 0.0002563547712303094, "loss": 0.0198, "step": 112250 }, { "epoch": 0.29, "learning_rate": 0.0002563508830139379, "loss": 0.0223, "step": 112260 }, { "epoch": 0.29, "learning_rate": 0.0002563469947975665, "loss": 0.0184, "step": 112270 }, { "epoch": 0.29, "learning_rate": 0.000256343106581195, "loss": 0.0204, "step": 112280 }, { "epoch": 0.29, "learning_rate": 0.0002563392183648235, "loss": 0.0226, "step": 112290 }, { "epoch": 0.29, "learning_rate": 0.0002563353301484521, "loss": 0.0317, "step": 112300 }, { "epoch": 0.29, "learning_rate": 0.0002563314419320806, "loss": 0.0268, "step": 112310 }, { "epoch": 0.29, "learning_rate": 0.0002563275537157092, "loss": 0.0247, "step": 112320 }, { "epoch": 0.29, "learning_rate": 0.0002563236654993377, "loss": 0.0246, "step": 112330 }, { "epoch": 0.29, "learning_rate": 0.0002563197772829662, "loss": 0.0198, "step": 112340 }, { "epoch": 0.29, "learning_rate": 0.0002563158890665948, "loss": 0.0226, "step": 112350 }, { "epoch": 0.29, "learning_rate": 0.0002563120008502233, "loss": 0.0214, "step": 112360 }, { "epoch": 0.29, "learning_rate": 0.0002563081126338518, "loss": 0.0207, "step": 112370 }, { "epoch": 0.29, "learning_rate": 0.00025630422441748037, "loss": 0.023, "step": 112380 }, { "epoch": 0.29, "learning_rate": 0.00025630033620110894, "loss": 0.0205, "step": 112390 }, { "epoch": 0.29, "learning_rate": 0.00025629644798473745, "loss": 0.0296, "step": 112400 }, { "epoch": 0.29, "learning_rate": 0.00025629255976836597, "loss": 0.0195, "step": 112410 }, { "epoch": 0.29, "learning_rate": 0.0002562886715519945, "loss": 0.0336, "step": 112420 }, { "epoch": 0.29, "learning_rate": 0.000256284783335623, "loss": 0.0191, "step": 112430 }, { "epoch": 0.29, "learning_rate": 0.00025628089511925157, "loss": 0.0231, "step": 112440 }, { "epoch": 0.29, "learning_rate": 0.00025627700690288014, "loss": 0.0214, "step": 112450 }, { "epoch": 0.29, "learning_rate": 0.00025627311868650865, "loss": 0.0366, "step": 112460 }, { "epoch": 0.29, "learning_rate": 0.00025626923047013717, "loss": 0.0222, "step": 112470 }, { "epoch": 0.29, "learning_rate": 0.00025626534225376573, "loss": 0.0205, "step": 112480 }, { "epoch": 0.29, "learning_rate": 0.00025626145403739425, "loss": 0.021, "step": 112490 }, { "epoch": 0.29, "learning_rate": 0.00025625756582102276, "loss": 0.0244, "step": 112500 }, { "epoch": 0.29, "learning_rate": 0.00025625367760465133, "loss": 0.0211, "step": 112510 }, { "epoch": 0.29, "learning_rate": 0.00025624978938827985, "loss": 0.0202, "step": 112520 }, { "epoch": 0.29, "learning_rate": 0.0002562459011719084, "loss": 0.0184, "step": 112530 }, { "epoch": 0.29, "learning_rate": 0.00025624201295553693, "loss": 0.0196, "step": 112540 }, { "epoch": 0.29, "learning_rate": 0.00025623812473916544, "loss": 0.0208, "step": 112550 }, { "epoch": 0.29, "learning_rate": 0.000256234236522794, "loss": 0.0204, "step": 112560 }, { "epoch": 0.29, "learning_rate": 0.00025623034830642253, "loss": 0.0196, "step": 112570 }, { "epoch": 0.29, "learning_rate": 0.00025622646009005104, "loss": 0.0266, "step": 112580 }, { "epoch": 0.29, "learning_rate": 0.0002562225718736796, "loss": 0.0209, "step": 112590 }, { "epoch": 0.29, "learning_rate": 0.0002562186836573082, "loss": 0.0248, "step": 112600 }, { "epoch": 0.29, "learning_rate": 0.0002562147954409367, "loss": 0.0199, "step": 112610 }, { "epoch": 0.29, "learning_rate": 0.0002562109072245652, "loss": 0.0228, "step": 112620 }, { "epoch": 0.29, "learning_rate": 0.0002562070190081937, "loss": 0.0294, "step": 112630 }, { "epoch": 0.29, "learning_rate": 0.0002562031307918223, "loss": 0.0217, "step": 112640 }, { "epoch": 0.29, "learning_rate": 0.0002561992425754508, "loss": 0.0192, "step": 112650 }, { "epoch": 0.29, "learning_rate": 0.0002561953543590794, "loss": 0.0228, "step": 112660 }, { "epoch": 0.29, "learning_rate": 0.0002561914661427079, "loss": 0.0229, "step": 112670 }, { "epoch": 0.29, "learning_rate": 0.0002561875779263364, "loss": 0.0264, "step": 112680 }, { "epoch": 0.29, "learning_rate": 0.00025618368970996497, "loss": 0.0239, "step": 112690 }, { "epoch": 0.29, "learning_rate": 0.0002561798014935935, "loss": 0.0209, "step": 112700 }, { "epoch": 0.29, "learning_rate": 0.000256175913277222, "loss": 0.023, "step": 112710 }, { "epoch": 0.29, "learning_rate": 0.00025617202506085057, "loss": 0.0176, "step": 112720 }, { "epoch": 0.29, "learning_rate": 0.0002561681368444791, "loss": 0.0204, "step": 112730 }, { "epoch": 0.29, "learning_rate": 0.00025616424862810765, "loss": 0.0192, "step": 112740 }, { "epoch": 0.29, "learning_rate": 0.00025616036041173617, "loss": 0.0244, "step": 112750 }, { "epoch": 0.29, "learning_rate": 0.0002561564721953647, "loss": 0.0233, "step": 112760 }, { "epoch": 0.29, "learning_rate": 0.00025615258397899325, "loss": 0.0216, "step": 112770 }, { "epoch": 0.29, "learning_rate": 0.00025614869576262177, "loss": 0.0232, "step": 112780 }, { "epoch": 0.29, "learning_rate": 0.00025614480754625033, "loss": 0.0215, "step": 112790 }, { "epoch": 0.29, "learning_rate": 0.00025614091932987885, "loss": 0.0228, "step": 112800 }, { "epoch": 0.29, "learning_rate": 0.0002561370311135074, "loss": 0.0231, "step": 112810 }, { "epoch": 0.29, "learning_rate": 0.00025613314289713593, "loss": 0.0226, "step": 112820 }, { "epoch": 0.29, "learning_rate": 0.00025612925468076445, "loss": 0.0259, "step": 112830 }, { "epoch": 0.29, "learning_rate": 0.00025612536646439296, "loss": 0.0187, "step": 112840 }, { "epoch": 0.29, "learning_rate": 0.00025612147824802153, "loss": 0.0247, "step": 112850 }, { "epoch": 0.29, "learning_rate": 0.00025611759003165005, "loss": 0.018, "step": 112860 }, { "epoch": 0.29, "learning_rate": 0.0002561137018152786, "loss": 0.0238, "step": 112870 }, { "epoch": 0.29, "learning_rate": 0.00025610981359890713, "loss": 0.0218, "step": 112880 }, { "epoch": 0.29, "learning_rate": 0.00025610592538253564, "loss": 0.0219, "step": 112890 }, { "epoch": 0.29, "learning_rate": 0.0002561020371661642, "loss": 0.0236, "step": 112900 }, { "epoch": 0.29, "learning_rate": 0.0002560981489497927, "loss": 0.0201, "step": 112910 }, { "epoch": 0.29, "learning_rate": 0.00025609426073342124, "loss": 0.0227, "step": 112920 }, { "epoch": 0.29, "learning_rate": 0.0002560903725170498, "loss": 0.0221, "step": 112930 }, { "epoch": 0.29, "learning_rate": 0.0002560864843006784, "loss": 0.0248, "step": 112940 }, { "epoch": 0.29, "learning_rate": 0.0002560825960843069, "loss": 0.0201, "step": 112950 }, { "epoch": 0.29, "learning_rate": 0.0002560787078679354, "loss": 0.0302, "step": 112960 }, { "epoch": 0.29, "learning_rate": 0.0002560748196515639, "loss": 0.0223, "step": 112970 }, { "epoch": 0.29, "learning_rate": 0.0002560709314351925, "loss": 0.0267, "step": 112980 }, { "epoch": 0.29, "learning_rate": 0.000256067043218821, "loss": 0.0223, "step": 112990 }, { "epoch": 0.29, "learning_rate": 0.0002560631550024496, "loss": 0.0195, "step": 113000 }, { "epoch": 0.29, "eval_cer": 0.881782465628416, "eval_loss": 0.015686366707086563, "eval_runtime": 107.7549, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 113000 }, { "epoch": 0.29, "learning_rate": 0.0002560592667860781, "loss": 0.018, "step": 113010 }, { "epoch": 0.29, "learning_rate": 0.00025605537856970666, "loss": 0.0211, "step": 113020 }, { "epoch": 0.29, "learning_rate": 0.00025605149035333517, "loss": 0.0255, "step": 113030 }, { "epoch": 0.29, "learning_rate": 0.0002560476021369637, "loss": 0.0197, "step": 113040 }, { "epoch": 0.29, "learning_rate": 0.0002560437139205922, "loss": 0.0235, "step": 113050 }, { "epoch": 0.29, "learning_rate": 0.00025603982570422077, "loss": 0.0211, "step": 113060 }, { "epoch": 0.29, "learning_rate": 0.0002560359374878493, "loss": 0.0195, "step": 113070 }, { "epoch": 0.29, "learning_rate": 0.00025603204927147785, "loss": 0.0229, "step": 113080 }, { "epoch": 0.29, "learning_rate": 0.00025602816105510637, "loss": 0.0226, "step": 113090 }, { "epoch": 0.29, "learning_rate": 0.00025602427283873494, "loss": 0.0202, "step": 113100 }, { "epoch": 0.29, "learning_rate": 0.00025602038462236345, "loss": 0.0269, "step": 113110 }, { "epoch": 0.29, "learning_rate": 0.00025601649640599196, "loss": 0.025, "step": 113120 }, { "epoch": 0.29, "learning_rate": 0.0002560126081896205, "loss": 0.0194, "step": 113130 }, { "epoch": 0.29, "learning_rate": 0.00025600871997324905, "loss": 0.0276, "step": 113140 }, { "epoch": 0.29, "learning_rate": 0.0002560048317568776, "loss": 0.0211, "step": 113150 }, { "epoch": 0.29, "learning_rate": 0.00025600094354050613, "loss": 0.0219, "step": 113160 }, { "epoch": 0.29, "learning_rate": 0.00025599705532413465, "loss": 0.0227, "step": 113170 }, { "epoch": 0.29, "learning_rate": 0.00025599316710776316, "loss": 0.0203, "step": 113180 }, { "epoch": 0.29, "learning_rate": 0.00025598927889139173, "loss": 0.0216, "step": 113190 }, { "epoch": 0.29, "learning_rate": 0.00025598539067502024, "loss": 0.0183, "step": 113200 }, { "epoch": 0.29, "learning_rate": 0.0002559815024586488, "loss": 0.0243, "step": 113210 }, { "epoch": 0.29, "learning_rate": 0.00025597761424227733, "loss": 0.0169, "step": 113220 }, { "epoch": 0.29, "learning_rate": 0.0002559737260259059, "loss": 0.0185, "step": 113230 }, { "epoch": 0.29, "learning_rate": 0.0002559698378095344, "loss": 0.0218, "step": 113240 }, { "epoch": 0.29, "learning_rate": 0.0002559659495931629, "loss": 0.0206, "step": 113250 }, { "epoch": 0.29, "learning_rate": 0.00025596206137679144, "loss": 0.0198, "step": 113260 }, { "epoch": 0.29, "learning_rate": 0.00025595817316042, "loss": 0.0201, "step": 113270 }, { "epoch": 0.29, "learning_rate": 0.0002559542849440485, "loss": 0.0222, "step": 113280 }, { "epoch": 0.29, "learning_rate": 0.0002559503967276771, "loss": 0.02, "step": 113290 }, { "epoch": 0.29, "learning_rate": 0.0002559465085113056, "loss": 0.0238, "step": 113300 }, { "epoch": 0.29, "learning_rate": 0.0002559426202949342, "loss": 0.0193, "step": 113310 }, { "epoch": 0.29, "learning_rate": 0.0002559387320785627, "loss": 0.0174, "step": 113320 }, { "epoch": 0.29, "learning_rate": 0.0002559348438621912, "loss": 0.0216, "step": 113330 }, { "epoch": 0.29, "learning_rate": 0.00025593095564581977, "loss": 0.0217, "step": 113340 }, { "epoch": 0.29, "learning_rate": 0.0002559270674294483, "loss": 0.0231, "step": 113350 }, { "epoch": 0.29, "learning_rate": 0.00025592317921307686, "loss": 0.0232, "step": 113360 }, { "epoch": 0.29, "learning_rate": 0.00025591929099670537, "loss": 0.0269, "step": 113370 }, { "epoch": 0.29, "learning_rate": 0.0002559154027803339, "loss": 0.0205, "step": 113380 }, { "epoch": 0.29, "learning_rate": 0.0002559115145639624, "loss": 0.0204, "step": 113390 }, { "epoch": 0.29, "learning_rate": 0.00025590762634759097, "loss": 0.0214, "step": 113400 }, { "epoch": 0.29, "learning_rate": 0.0002559037381312195, "loss": 0.0195, "step": 113410 }, { "epoch": 0.29, "learning_rate": 0.00025589984991484805, "loss": 0.0221, "step": 113420 }, { "epoch": 0.29, "learning_rate": 0.00025589596169847657, "loss": 0.0228, "step": 113430 }, { "epoch": 0.29, "learning_rate": 0.00025589207348210513, "loss": 0.022, "step": 113440 }, { "epoch": 0.29, "learning_rate": 0.00025588818526573365, "loss": 0.0197, "step": 113450 }, { "epoch": 0.29, "learning_rate": 0.00025588429704936216, "loss": 0.0226, "step": 113460 }, { "epoch": 0.29, "learning_rate": 0.0002558804088329907, "loss": 0.0212, "step": 113470 }, { "epoch": 0.29, "learning_rate": 0.00025587652061661925, "loss": 0.0322, "step": 113480 }, { "epoch": 0.29, "learning_rate": 0.0002558726324002478, "loss": 0.0199, "step": 113490 }, { "epoch": 0.29, "learning_rate": 0.00025586874418387633, "loss": 0.0212, "step": 113500 }, { "epoch": 0.29, "learning_rate": 0.00025586485596750484, "loss": 0.0203, "step": 113510 }, { "epoch": 0.29, "learning_rate": 0.0002558609677511334, "loss": 0.0266, "step": 113520 }, { "epoch": 0.29, "learning_rate": 0.00025585707953476193, "loss": 0.0209, "step": 113530 }, { "epoch": 0.29, "learning_rate": 0.00025585319131839044, "loss": 0.0232, "step": 113540 }, { "epoch": 0.29, "learning_rate": 0.000255849303102019, "loss": 0.0195, "step": 113550 }, { "epoch": 0.29, "learning_rate": 0.0002558454148856475, "loss": 0.0258, "step": 113560 }, { "epoch": 0.29, "learning_rate": 0.0002558415266692761, "loss": 0.0208, "step": 113570 }, { "epoch": 0.29, "learning_rate": 0.0002558376384529046, "loss": 0.0214, "step": 113580 }, { "epoch": 0.29, "learning_rate": 0.0002558337502365331, "loss": 0.0206, "step": 113590 }, { "epoch": 0.29, "learning_rate": 0.0002558298620201617, "loss": 0.0238, "step": 113600 }, { "epoch": 0.29, "learning_rate": 0.0002558259738037902, "loss": 0.0208, "step": 113610 }, { "epoch": 0.29, "learning_rate": 0.0002558220855874187, "loss": 0.019, "step": 113620 }, { "epoch": 0.29, "learning_rate": 0.0002558181973710473, "loss": 0.0192, "step": 113630 }, { "epoch": 0.29, "learning_rate": 0.0002558143091546758, "loss": 0.0201, "step": 113640 }, { "epoch": 0.29, "learning_rate": 0.0002558104209383044, "loss": 0.0194, "step": 113650 }, { "epoch": 0.29, "learning_rate": 0.0002558065327219329, "loss": 0.0223, "step": 113660 }, { "epoch": 0.29, "learning_rate": 0.0002558026445055614, "loss": 0.0227, "step": 113670 }, { "epoch": 0.29, "learning_rate": 0.0002557987562891899, "loss": 0.0186, "step": 113680 }, { "epoch": 0.29, "learning_rate": 0.0002557948680728185, "loss": 0.0192, "step": 113690 }, { "epoch": 0.29, "learning_rate": 0.00025579097985644705, "loss": 0.0265, "step": 113700 }, { "epoch": 0.29, "learning_rate": 0.00025578709164007557, "loss": 0.02, "step": 113710 }, { "epoch": 0.29, "learning_rate": 0.0002557832034237041, "loss": 0.0197, "step": 113720 }, { "epoch": 0.29, "learning_rate": 0.00025577931520733265, "loss": 0.0253, "step": 113730 }, { "epoch": 0.29, "learning_rate": 0.00025577542699096117, "loss": 0.02, "step": 113740 }, { "epoch": 0.29, "learning_rate": 0.0002557715387745897, "loss": 0.0237, "step": 113750 }, { "epoch": 0.29, "learning_rate": 0.00025576765055821825, "loss": 0.0243, "step": 113760 }, { "epoch": 0.29, "learning_rate": 0.00025576376234184676, "loss": 0.022, "step": 113770 }, { "epoch": 0.29, "learning_rate": 0.00025575987412547533, "loss": 0.0217, "step": 113780 }, { "epoch": 0.29, "learning_rate": 0.00025575598590910385, "loss": 0.0213, "step": 113790 }, { "epoch": 0.29, "learning_rate": 0.00025575209769273236, "loss": 0.0167, "step": 113800 }, { "epoch": 0.3, "learning_rate": 0.00025574820947636093, "loss": 0.0228, "step": 113810 }, { "epoch": 0.3, "learning_rate": 0.00025574432125998945, "loss": 0.0182, "step": 113820 }, { "epoch": 0.3, "learning_rate": 0.00025574043304361796, "loss": 0.0174, "step": 113830 }, { "epoch": 0.3, "learning_rate": 0.00025573654482724653, "loss": 0.0182, "step": 113840 }, { "epoch": 0.3, "learning_rate": 0.0002557326566108751, "loss": 0.0195, "step": 113850 }, { "epoch": 0.3, "learning_rate": 0.0002557287683945036, "loss": 0.0219, "step": 113860 }, { "epoch": 0.3, "learning_rate": 0.0002557248801781321, "loss": 0.017, "step": 113870 }, { "epoch": 0.3, "learning_rate": 0.00025572099196176064, "loss": 0.0233, "step": 113880 }, { "epoch": 0.3, "learning_rate": 0.0002557171037453892, "loss": 0.0201, "step": 113890 }, { "epoch": 0.3, "learning_rate": 0.0002557132155290177, "loss": 0.0208, "step": 113900 }, { "epoch": 0.3, "learning_rate": 0.0002557093273126463, "loss": 0.0187, "step": 113910 }, { "epoch": 0.3, "learning_rate": 0.0002557054390962748, "loss": 0.0216, "step": 113920 }, { "epoch": 0.3, "learning_rate": 0.0002557015508799033, "loss": 0.0215, "step": 113930 }, { "epoch": 0.3, "learning_rate": 0.0002556976626635319, "loss": 0.0257, "step": 113940 }, { "epoch": 0.3, "learning_rate": 0.0002556937744471604, "loss": 0.0241, "step": 113950 }, { "epoch": 0.3, "learning_rate": 0.0002556898862307889, "loss": 0.0205, "step": 113960 }, { "epoch": 0.3, "learning_rate": 0.0002556859980144175, "loss": 0.0199, "step": 113970 }, { "epoch": 0.3, "learning_rate": 0.00025568210979804606, "loss": 0.0186, "step": 113980 }, { "epoch": 0.3, "learning_rate": 0.00025567822158167457, "loss": 0.0213, "step": 113990 }, { "epoch": 0.3, "learning_rate": 0.0002556743333653031, "loss": 0.025, "step": 114000 }, { "epoch": 0.3, "eval_cer": 0.881782465628416, "eval_loss": 0.015355234034359455, "eval_runtime": 107.8728, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 114000 }, { "epoch": 0.3, "learning_rate": 0.0002556704451489316, "loss": 0.0244, "step": 114010 }, { "epoch": 0.3, "learning_rate": 0.00025566655693256017, "loss": 0.0278, "step": 114020 }, { "epoch": 0.3, "learning_rate": 0.0002556626687161887, "loss": 0.0215, "step": 114030 }, { "epoch": 0.3, "learning_rate": 0.00025565878049981725, "loss": 0.0179, "step": 114040 }, { "epoch": 0.3, "learning_rate": 0.00025565489228344577, "loss": 0.0199, "step": 114050 }, { "epoch": 0.3, "learning_rate": 0.00025565100406707434, "loss": 0.025, "step": 114060 }, { "epoch": 0.3, "learning_rate": 0.00025564711585070285, "loss": 0.0258, "step": 114070 }, { "epoch": 0.3, "learning_rate": 0.00025564322763433137, "loss": 0.0193, "step": 114080 }, { "epoch": 0.3, "learning_rate": 0.0002556393394179599, "loss": 0.0183, "step": 114090 }, { "epoch": 0.3, "learning_rate": 0.00025563545120158845, "loss": 0.0202, "step": 114100 }, { "epoch": 0.3, "learning_rate": 0.00025563156298521696, "loss": 0.0207, "step": 114110 }, { "epoch": 0.3, "learning_rate": 0.00025562767476884553, "loss": 0.0218, "step": 114120 }, { "epoch": 0.3, "learning_rate": 0.00025562378655247405, "loss": 0.0231, "step": 114130 }, { "epoch": 0.3, "learning_rate": 0.00025561989833610256, "loss": 0.0192, "step": 114140 }, { "epoch": 0.3, "learning_rate": 0.00025561601011973113, "loss": 0.0231, "step": 114150 }, { "epoch": 0.3, "learning_rate": 0.00025561212190335964, "loss": 0.0217, "step": 114160 }, { "epoch": 0.3, "learning_rate": 0.00025560823368698816, "loss": 0.0277, "step": 114170 }, { "epoch": 0.3, "learning_rate": 0.00025560434547061673, "loss": 0.0228, "step": 114180 }, { "epoch": 0.3, "learning_rate": 0.0002556004572542453, "loss": 0.0203, "step": 114190 }, { "epoch": 0.3, "learning_rate": 0.0002555965690378738, "loss": 0.0259, "step": 114200 }, { "epoch": 0.3, "learning_rate": 0.0002555926808215023, "loss": 0.0199, "step": 114210 }, { "epoch": 0.3, "learning_rate": 0.00025558879260513084, "loss": 0.0235, "step": 114220 }, { "epoch": 0.3, "learning_rate": 0.0002555849043887594, "loss": 0.0211, "step": 114230 }, { "epoch": 0.3, "learning_rate": 0.0002555810161723879, "loss": 0.0206, "step": 114240 }, { "epoch": 0.3, "learning_rate": 0.0002555771279560165, "loss": 0.0187, "step": 114250 }, { "epoch": 0.3, "learning_rate": 0.000255573239739645, "loss": 0.0203, "step": 114260 }, { "epoch": 0.3, "learning_rate": 0.0002555693515232736, "loss": 0.0241, "step": 114270 }, { "epoch": 0.3, "learning_rate": 0.0002555654633069021, "loss": 0.0217, "step": 114280 }, { "epoch": 0.3, "learning_rate": 0.0002555615750905306, "loss": 0.026, "step": 114290 }, { "epoch": 0.3, "learning_rate": 0.0002555576868741591, "loss": 0.0187, "step": 114300 }, { "epoch": 0.3, "learning_rate": 0.0002555537986577877, "loss": 0.0185, "step": 114310 }, { "epoch": 0.3, "learning_rate": 0.0002555499104414162, "loss": 0.0251, "step": 114320 }, { "epoch": 0.3, "learning_rate": 0.00025554602222504477, "loss": 0.0204, "step": 114330 }, { "epoch": 0.3, "learning_rate": 0.0002555421340086733, "loss": 0.0209, "step": 114340 }, { "epoch": 0.3, "learning_rate": 0.00025553824579230185, "loss": 0.0231, "step": 114350 }, { "epoch": 0.3, "learning_rate": 0.00025553435757593037, "loss": 0.0213, "step": 114360 }, { "epoch": 0.3, "learning_rate": 0.0002555304693595589, "loss": 0.0175, "step": 114370 }, { "epoch": 0.3, "learning_rate": 0.00025552658114318745, "loss": 0.0267, "step": 114380 }, { "epoch": 0.3, "learning_rate": 0.00025552269292681597, "loss": 0.0205, "step": 114390 }, { "epoch": 0.3, "learning_rate": 0.00025551880471044454, "loss": 0.0195, "step": 114400 }, { "epoch": 0.3, "learning_rate": 0.00025551491649407305, "loss": 0.02, "step": 114410 }, { "epoch": 0.3, "learning_rate": 0.00025551102827770156, "loss": 0.0203, "step": 114420 }, { "epoch": 0.3, "learning_rate": 0.0002555071400613301, "loss": 0.0238, "step": 114430 }, { "epoch": 0.3, "learning_rate": 0.00025550325184495865, "loss": 0.0234, "step": 114440 }, { "epoch": 0.3, "learning_rate": 0.00025549936362858716, "loss": 0.0232, "step": 114450 }, { "epoch": 0.3, "learning_rate": 0.00025549547541221573, "loss": 0.0203, "step": 114460 }, { "epoch": 0.3, "learning_rate": 0.00025549158719584425, "loss": 0.0215, "step": 114470 }, { "epoch": 0.3, "learning_rate": 0.0002554876989794728, "loss": 0.0237, "step": 114480 }, { "epoch": 0.3, "learning_rate": 0.00025548381076310133, "loss": 0.0181, "step": 114490 }, { "epoch": 0.3, "learning_rate": 0.00025547992254672984, "loss": 0.0194, "step": 114500 }, { "epoch": 0.3, "learning_rate": 0.00025547603433035836, "loss": 0.0186, "step": 114510 }, { "epoch": 0.3, "learning_rate": 0.0002554721461139869, "loss": 0.021, "step": 114520 }, { "epoch": 0.3, "learning_rate": 0.0002554682578976155, "loss": 0.0206, "step": 114530 }, { "epoch": 0.3, "learning_rate": 0.000255464369681244, "loss": 0.0186, "step": 114540 }, { "epoch": 0.3, "learning_rate": 0.0002554604814648725, "loss": 0.0196, "step": 114550 }, { "epoch": 0.3, "learning_rate": 0.0002554565932485011, "loss": 0.0195, "step": 114560 }, { "epoch": 0.3, "learning_rate": 0.0002554527050321296, "loss": 0.0193, "step": 114570 }, { "epoch": 0.3, "learning_rate": 0.0002554488168157581, "loss": 0.0156, "step": 114580 }, { "epoch": 0.3, "learning_rate": 0.0002554449285993867, "loss": 0.0186, "step": 114590 }, { "epoch": 0.3, "learning_rate": 0.0002554410403830152, "loss": 0.0207, "step": 114600 }, { "epoch": 0.3, "learning_rate": 0.0002554371521666438, "loss": 0.0213, "step": 114610 }, { "epoch": 0.3, "learning_rate": 0.0002554332639502723, "loss": 0.022, "step": 114620 }, { "epoch": 0.3, "learning_rate": 0.0002554293757339008, "loss": 0.0173, "step": 114630 }, { "epoch": 0.3, "learning_rate": 0.0002554254875175293, "loss": 0.021, "step": 114640 }, { "epoch": 0.3, "learning_rate": 0.0002554215993011579, "loss": 0.0197, "step": 114650 }, { "epoch": 0.3, "learning_rate": 0.0002554177110847864, "loss": 0.0207, "step": 114660 }, { "epoch": 0.3, "learning_rate": 0.00025541382286841497, "loss": 0.0202, "step": 114670 }, { "epoch": 0.3, "learning_rate": 0.0002554099346520435, "loss": 0.0195, "step": 114680 }, { "epoch": 0.3, "learning_rate": 0.00025540604643567205, "loss": 0.0218, "step": 114690 }, { "epoch": 0.3, "learning_rate": 0.00025540215821930057, "loss": 0.04, "step": 114700 }, { "epoch": 0.3, "learning_rate": 0.0002553982700029291, "loss": 0.0181, "step": 114710 }, { "epoch": 0.3, "learning_rate": 0.0002553943817865576, "loss": 0.0224, "step": 114720 }, { "epoch": 0.3, "learning_rate": 0.00025539049357018617, "loss": 0.0232, "step": 114730 }, { "epoch": 0.3, "learning_rate": 0.00025538660535381473, "loss": 0.0207, "step": 114740 }, { "epoch": 0.3, "learning_rate": 0.00025538271713744325, "loss": 0.0202, "step": 114750 }, { "epoch": 0.3, "learning_rate": 0.00025537882892107176, "loss": 0.0271, "step": 114760 }, { "epoch": 0.3, "learning_rate": 0.00025537494070470033, "loss": 0.0231, "step": 114770 }, { "epoch": 0.3, "learning_rate": 0.00025537105248832885, "loss": 0.0199, "step": 114780 }, { "epoch": 0.3, "learning_rate": 0.00025536716427195736, "loss": 0.0193, "step": 114790 }, { "epoch": 0.3, "learning_rate": 0.00025536327605558593, "loss": 0.0194, "step": 114800 }, { "epoch": 0.3, "learning_rate": 0.00025535938783921444, "loss": 0.0207, "step": 114810 }, { "epoch": 0.3, "learning_rate": 0.000255355499622843, "loss": 0.0233, "step": 114820 }, { "epoch": 0.3, "learning_rate": 0.00025535161140647153, "loss": 0.0252, "step": 114830 }, { "epoch": 0.3, "learning_rate": 0.00025534772319010004, "loss": 0.0262, "step": 114840 }, { "epoch": 0.3, "learning_rate": 0.0002553438349737286, "loss": 0.0193, "step": 114850 }, { "epoch": 0.3, "learning_rate": 0.0002553399467573571, "loss": 0.0226, "step": 114860 }, { "epoch": 0.3, "learning_rate": 0.00025533605854098564, "loss": 0.0194, "step": 114870 }, { "epoch": 0.3, "learning_rate": 0.0002553321703246142, "loss": 0.0183, "step": 114880 }, { "epoch": 0.3, "learning_rate": 0.0002553282821082427, "loss": 0.0174, "step": 114890 }, { "epoch": 0.3, "learning_rate": 0.0002553243938918713, "loss": 0.0189, "step": 114900 }, { "epoch": 0.3, "learning_rate": 0.0002553205056754998, "loss": 0.0272, "step": 114910 }, { "epoch": 0.3, "learning_rate": 0.0002553166174591283, "loss": 0.02, "step": 114920 }, { "epoch": 0.3, "learning_rate": 0.0002553127292427569, "loss": 0.0211, "step": 114930 }, { "epoch": 0.3, "learning_rate": 0.0002553088410263854, "loss": 0.0223, "step": 114940 }, { "epoch": 0.3, "learning_rate": 0.000255304952810014, "loss": 0.0208, "step": 114950 }, { "epoch": 0.3, "learning_rate": 0.0002553010645936425, "loss": 0.0195, "step": 114960 }, { "epoch": 0.3, "learning_rate": 0.000255297176377271, "loss": 0.0182, "step": 114970 }, { "epoch": 0.3, "learning_rate": 0.00025529328816089957, "loss": 0.026, "step": 114980 }, { "epoch": 0.3, "learning_rate": 0.0002552893999445281, "loss": 0.0227, "step": 114990 }, { "epoch": 0.3, "learning_rate": 0.0002552855117281566, "loss": 0.0228, "step": 115000 }, { "epoch": 0.3, "eval_cer": 0.8817908634500211, "eval_loss": 0.015144613571465015, "eval_runtime": 107.6259, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 115000 }, { "epoch": 0.3, "learning_rate": 0.00025528162351178517, "loss": 0.022, "step": 115010 }, { "epoch": 0.3, "learning_rate": 0.0002552777352954137, "loss": 0.0163, "step": 115020 }, { "epoch": 0.3, "learning_rate": 0.00025527384707904225, "loss": 0.0192, "step": 115030 }, { "epoch": 0.3, "learning_rate": 0.00025526995886267077, "loss": 0.0187, "step": 115040 }, { "epoch": 0.3, "learning_rate": 0.0002552660706462993, "loss": 0.0206, "step": 115050 }, { "epoch": 0.3, "learning_rate": 0.00025526218242992785, "loss": 0.021, "step": 115060 }, { "epoch": 0.3, "learning_rate": 0.00025525829421355636, "loss": 0.0214, "step": 115070 }, { "epoch": 0.3, "learning_rate": 0.00025525440599718493, "loss": 0.0222, "step": 115080 }, { "epoch": 0.3, "learning_rate": 0.00025525051778081345, "loss": 0.0186, "step": 115090 }, { "epoch": 0.3, "learning_rate": 0.000255246629564442, "loss": 0.0262, "step": 115100 }, { "epoch": 0.3, "learning_rate": 0.00025524274134807053, "loss": 0.0235, "step": 115110 }, { "epoch": 0.3, "learning_rate": 0.00025523885313169905, "loss": 0.0195, "step": 115120 }, { "epoch": 0.3, "learning_rate": 0.00025523496491532756, "loss": 0.0191, "step": 115130 }, { "epoch": 0.3, "learning_rate": 0.00025523107669895613, "loss": 0.0203, "step": 115140 }, { "epoch": 0.3, "learning_rate": 0.00025522718848258464, "loss": 0.018, "step": 115150 }, { "epoch": 0.3, "learning_rate": 0.0002552233002662132, "loss": 0.0212, "step": 115160 }, { "epoch": 0.3, "learning_rate": 0.0002552194120498417, "loss": 0.0229, "step": 115170 }, { "epoch": 0.3, "learning_rate": 0.00025521552383347024, "loss": 0.019, "step": 115180 }, { "epoch": 0.3, "learning_rate": 0.0002552116356170988, "loss": 0.018, "step": 115190 }, { "epoch": 0.3, "learning_rate": 0.0002552077474007273, "loss": 0.0253, "step": 115200 }, { "epoch": 0.3, "learning_rate": 0.00025520385918435584, "loss": 0.0282, "step": 115210 }, { "epoch": 0.3, "learning_rate": 0.0002551999709679844, "loss": 0.019, "step": 115220 }, { "epoch": 0.3, "learning_rate": 0.000255196082751613, "loss": 0.0257, "step": 115230 }, { "epoch": 0.3, "learning_rate": 0.0002551921945352415, "loss": 0.0339, "step": 115240 }, { "epoch": 0.3, "learning_rate": 0.00025518830631887, "loss": 0.0211, "step": 115250 }, { "epoch": 0.3, "learning_rate": 0.0002551844181024985, "loss": 0.0225, "step": 115260 }, { "epoch": 0.3, "learning_rate": 0.0002551805298861271, "loss": 0.0246, "step": 115270 }, { "epoch": 0.3, "learning_rate": 0.0002551766416697556, "loss": 0.0216, "step": 115280 }, { "epoch": 0.3, "learning_rate": 0.00025517275345338417, "loss": 0.0232, "step": 115290 }, { "epoch": 0.3, "learning_rate": 0.0002551688652370127, "loss": 0.0202, "step": 115300 }, { "epoch": 0.3, "learning_rate": 0.00025516497702064126, "loss": 0.0195, "step": 115310 }, { "epoch": 0.3, "learning_rate": 0.00025516108880426977, "loss": 0.0257, "step": 115320 }, { "epoch": 0.3, "learning_rate": 0.0002551572005878983, "loss": 0.0199, "step": 115330 }, { "epoch": 0.3, "learning_rate": 0.0002551533123715268, "loss": 0.0216, "step": 115340 }, { "epoch": 0.3, "learning_rate": 0.00025514942415515537, "loss": 0.0211, "step": 115350 }, { "epoch": 0.3, "learning_rate": 0.0002551455359387839, "loss": 0.0184, "step": 115360 }, { "epoch": 0.3, "learning_rate": 0.00025514164772241245, "loss": 0.0212, "step": 115370 }, { "epoch": 0.3, "learning_rate": 0.00025513775950604097, "loss": 0.0153, "step": 115380 }, { "epoch": 0.3, "learning_rate": 0.0002551338712896695, "loss": 0.0221, "step": 115390 }, { "epoch": 0.3, "learning_rate": 0.00025512998307329805, "loss": 0.0267, "step": 115400 }, { "epoch": 0.3, "learning_rate": 0.00025512609485692656, "loss": 0.0244, "step": 115410 }, { "epoch": 0.3, "learning_rate": 0.0002551222066405551, "loss": 0.0245, "step": 115420 }, { "epoch": 0.3, "learning_rate": 0.00025511831842418365, "loss": 0.0227, "step": 115430 }, { "epoch": 0.3, "learning_rate": 0.0002551144302078122, "loss": 0.0183, "step": 115440 }, { "epoch": 0.3, "learning_rate": 0.00025511054199144073, "loss": 0.0203, "step": 115450 }, { "epoch": 0.3, "learning_rate": 0.00025510665377506924, "loss": 0.0214, "step": 115460 }, { "epoch": 0.3, "learning_rate": 0.00025510276555869776, "loss": 0.0212, "step": 115470 }, { "epoch": 0.3, "learning_rate": 0.00025509887734232633, "loss": 0.0207, "step": 115480 }, { "epoch": 0.3, "learning_rate": 0.00025509498912595484, "loss": 0.0247, "step": 115490 }, { "epoch": 0.3, "learning_rate": 0.0002550911009095834, "loss": 0.0275, "step": 115500 }, { "epoch": 0.3, "learning_rate": 0.0002550872126932119, "loss": 0.0182, "step": 115510 }, { "epoch": 0.3, "learning_rate": 0.0002550833244768405, "loss": 0.0294, "step": 115520 }, { "epoch": 0.3, "learning_rate": 0.000255079436260469, "loss": 0.0199, "step": 115530 }, { "epoch": 0.3, "learning_rate": 0.0002550755480440975, "loss": 0.0167, "step": 115540 }, { "epoch": 0.3, "learning_rate": 0.00025507165982772604, "loss": 0.022, "step": 115550 }, { "epoch": 0.3, "learning_rate": 0.0002550677716113546, "loss": 0.024, "step": 115560 }, { "epoch": 0.3, "learning_rate": 0.0002550638833949832, "loss": 0.0184, "step": 115570 }, { "epoch": 0.3, "learning_rate": 0.0002550599951786117, "loss": 0.0216, "step": 115580 }, { "epoch": 0.3, "learning_rate": 0.0002550561069622402, "loss": 0.0188, "step": 115590 }, { "epoch": 0.3, "learning_rate": 0.0002550522187458688, "loss": 0.0237, "step": 115600 }, { "epoch": 0.3, "learning_rate": 0.0002550483305294973, "loss": 0.025, "step": 115610 }, { "epoch": 0.3, "learning_rate": 0.0002550444423131258, "loss": 0.0268, "step": 115620 }, { "epoch": 0.3, "learning_rate": 0.00025504055409675437, "loss": 0.0286, "step": 115630 }, { "epoch": 0.3, "learning_rate": 0.0002550366658803829, "loss": 0.0239, "step": 115640 }, { "epoch": 0.3, "learning_rate": 0.00025503277766401145, "loss": 0.0213, "step": 115650 }, { "epoch": 0.3, "learning_rate": 0.00025502888944763997, "loss": 0.0227, "step": 115660 }, { "epoch": 0.3, "learning_rate": 0.0002550250012312685, "loss": 0.0234, "step": 115670 }, { "epoch": 0.3, "learning_rate": 0.000255021113014897, "loss": 0.0248, "step": 115680 }, { "epoch": 0.3, "learning_rate": 0.00025501722479852557, "loss": 0.0198, "step": 115690 }, { "epoch": 0.3, "learning_rate": 0.0002550133365821541, "loss": 0.0175, "step": 115700 }, { "epoch": 0.3, "learning_rate": 0.00025500944836578265, "loss": 0.0212, "step": 115710 }, { "epoch": 0.3, "learning_rate": 0.00025500556014941116, "loss": 0.0252, "step": 115720 }, { "epoch": 0.3, "learning_rate": 0.00025500167193303973, "loss": 0.0208, "step": 115730 }, { "epoch": 0.3, "learning_rate": 0.00025499778371666825, "loss": 0.0196, "step": 115740 }, { "epoch": 0.3, "learning_rate": 0.00025499389550029676, "loss": 0.0213, "step": 115750 }, { "epoch": 0.3, "learning_rate": 0.0002549900072839253, "loss": 0.0201, "step": 115760 }, { "epoch": 0.3, "learning_rate": 0.00025498611906755385, "loss": 0.0186, "step": 115770 }, { "epoch": 0.3, "learning_rate": 0.0002549822308511824, "loss": 0.023, "step": 115780 }, { "epoch": 0.3, "learning_rate": 0.00025497834263481093, "loss": 0.021, "step": 115790 }, { "epoch": 0.3, "learning_rate": 0.00025497445441843944, "loss": 0.0283, "step": 115800 }, { "epoch": 0.3, "learning_rate": 0.000254970566202068, "loss": 0.0212, "step": 115810 }, { "epoch": 0.3, "learning_rate": 0.0002549666779856965, "loss": 0.0266, "step": 115820 }, { "epoch": 0.3, "learning_rate": 0.00025496278976932504, "loss": 0.0206, "step": 115830 }, { "epoch": 0.3, "learning_rate": 0.0002549589015529536, "loss": 0.0193, "step": 115840 }, { "epoch": 0.3, "learning_rate": 0.0002549550133365821, "loss": 0.0229, "step": 115850 }, { "epoch": 0.3, "learning_rate": 0.0002549511251202107, "loss": 0.0203, "step": 115860 }, { "epoch": 0.3, "learning_rate": 0.0002549472369038392, "loss": 0.0216, "step": 115870 }, { "epoch": 0.3, "learning_rate": 0.0002549433486874677, "loss": 0.0194, "step": 115880 }, { "epoch": 0.3, "learning_rate": 0.00025493946047109624, "loss": 0.0246, "step": 115890 }, { "epoch": 0.3, "learning_rate": 0.0002549355722547248, "loss": 0.0267, "step": 115900 }, { "epoch": 0.3, "learning_rate": 0.0002549316840383533, "loss": 0.021, "step": 115910 }, { "epoch": 0.3, "learning_rate": 0.0002549277958219819, "loss": 0.0204, "step": 115920 }, { "epoch": 0.3, "learning_rate": 0.0002549239076056104, "loss": 0.0262, "step": 115930 }, { "epoch": 0.3, "learning_rate": 0.00025492001938923897, "loss": 0.0229, "step": 115940 }, { "epoch": 0.3, "learning_rate": 0.0002549161311728675, "loss": 0.0204, "step": 115950 }, { "epoch": 0.3, "learning_rate": 0.000254912242956496, "loss": 0.0202, "step": 115960 }, { "epoch": 0.3, "learning_rate": 0.00025490835474012457, "loss": 0.0223, "step": 115970 }, { "epoch": 0.3, "learning_rate": 0.0002549044665237531, "loss": 0.0209, "step": 115980 }, { "epoch": 0.3, "learning_rate": 0.00025490057830738165, "loss": 0.0197, "step": 115990 }, { "epoch": 0.3, "learning_rate": 0.00025489669009101017, "loss": 0.0192, "step": 116000 }, { "epoch": 0.3, "eval_cer": 0.8818174565517705, "eval_loss": 0.01587188057601452, "eval_runtime": 107.3455, "eval_samples_per_second": 18.631, "eval_steps_per_second": 4.658, "step": 116000 }, { "epoch": 0.3, "learning_rate": 0.0002548928018746387, "loss": 0.0173, "step": 116010 }, { "epoch": 0.3, "learning_rate": 0.00025488891365826725, "loss": 0.0195, "step": 116020 }, { "epoch": 0.3, "learning_rate": 0.00025488502544189577, "loss": 0.0254, "step": 116030 }, { "epoch": 0.3, "learning_rate": 0.0002548811372255243, "loss": 0.0293, "step": 116040 }, { "epoch": 0.3, "learning_rate": 0.00025487724900915285, "loss": 0.0287, "step": 116050 }, { "epoch": 0.3, "learning_rate": 0.00025487336079278136, "loss": 0.0235, "step": 116060 }, { "epoch": 0.3, "learning_rate": 0.00025486947257640993, "loss": 0.0197, "step": 116070 }, { "epoch": 0.3, "learning_rate": 0.00025486558436003845, "loss": 0.0195, "step": 116080 }, { "epoch": 0.3, "learning_rate": 0.00025486169614366696, "loss": 0.0204, "step": 116090 }, { "epoch": 0.3, "learning_rate": 0.00025485780792729553, "loss": 0.0207, "step": 116100 }, { "epoch": 0.3, "learning_rate": 0.00025485391971092404, "loss": 0.0156, "step": 116110 }, { "epoch": 0.3, "learning_rate": 0.0002548500314945526, "loss": 0.0231, "step": 116120 }, { "epoch": 0.3, "learning_rate": 0.00025484614327818113, "loss": 0.0221, "step": 116130 }, { "epoch": 0.3, "learning_rate": 0.00025484225506180964, "loss": 0.0162, "step": 116140 }, { "epoch": 0.3, "learning_rate": 0.0002548383668454382, "loss": 0.0211, "step": 116150 }, { "epoch": 0.3, "learning_rate": 0.0002548344786290667, "loss": 0.0206, "step": 116160 }, { "epoch": 0.3, "learning_rate": 0.00025483059041269524, "loss": 0.0179, "step": 116170 }, { "epoch": 0.3, "learning_rate": 0.0002548267021963238, "loss": 0.0178, "step": 116180 }, { "epoch": 0.3, "learning_rate": 0.0002548228139799523, "loss": 0.0238, "step": 116190 }, { "epoch": 0.3, "learning_rate": 0.0002548189257635809, "loss": 0.0222, "step": 116200 }, { "epoch": 0.3, "learning_rate": 0.0002548150375472094, "loss": 0.018, "step": 116210 }, { "epoch": 0.3, "learning_rate": 0.0002548111493308379, "loss": 0.0243, "step": 116220 }, { "epoch": 0.3, "learning_rate": 0.0002548072611144665, "loss": 0.0186, "step": 116230 }, { "epoch": 0.3, "learning_rate": 0.000254803372898095, "loss": 0.0178, "step": 116240 }, { "epoch": 0.3, "learning_rate": 0.0002547994846817235, "loss": 0.025, "step": 116250 }, { "epoch": 0.3, "learning_rate": 0.0002547955964653521, "loss": 0.0211, "step": 116260 }, { "epoch": 0.3, "learning_rate": 0.00025479170824898066, "loss": 0.0183, "step": 116270 }, { "epoch": 0.3, "learning_rate": 0.00025478782003260917, "loss": 0.0219, "step": 116280 }, { "epoch": 0.3, "learning_rate": 0.0002547839318162377, "loss": 0.0191, "step": 116290 }, { "epoch": 0.3, "learning_rate": 0.0002547800435998662, "loss": 0.0219, "step": 116300 }, { "epoch": 0.3, "learning_rate": 0.00025477615538349477, "loss": 0.024, "step": 116310 }, { "epoch": 0.3, "learning_rate": 0.0002547722671671233, "loss": 0.0217, "step": 116320 }, { "epoch": 0.3, "learning_rate": 0.00025476837895075185, "loss": 0.0228, "step": 116330 }, { "epoch": 0.3, "learning_rate": 0.00025476449073438037, "loss": 0.0164, "step": 116340 }, { "epoch": 0.3, "learning_rate": 0.00025476060251800894, "loss": 0.0224, "step": 116350 }, { "epoch": 0.3, "learning_rate": 0.00025475671430163745, "loss": 0.0201, "step": 116360 }, { "epoch": 0.3, "learning_rate": 0.00025475282608526596, "loss": 0.0243, "step": 116370 }, { "epoch": 0.3, "learning_rate": 0.0002547489378688945, "loss": 0.0305, "step": 116380 }, { "epoch": 0.3, "learning_rate": 0.00025474504965252305, "loss": 0.0223, "step": 116390 }, { "epoch": 0.3, "learning_rate": 0.00025474116143615156, "loss": 0.0229, "step": 116400 }, { "epoch": 0.3, "learning_rate": 0.00025473727321978013, "loss": 0.0213, "step": 116410 }, { "epoch": 0.3, "learning_rate": 0.00025473338500340865, "loss": 0.0213, "step": 116420 }, { "epoch": 0.3, "learning_rate": 0.00025472949678703716, "loss": 0.0185, "step": 116430 }, { "epoch": 0.3, "learning_rate": 0.00025472560857066573, "loss": 0.0238, "step": 116440 }, { "epoch": 0.3, "learning_rate": 0.00025472172035429424, "loss": 0.0227, "step": 116450 }, { "epoch": 0.3, "learning_rate": 0.00025471783213792276, "loss": 0.0221, "step": 116460 }, { "epoch": 0.3, "learning_rate": 0.0002547139439215513, "loss": 0.0186, "step": 116470 }, { "epoch": 0.3, "learning_rate": 0.0002547100557051799, "loss": 0.0214, "step": 116480 }, { "epoch": 0.3, "learning_rate": 0.0002547061674888084, "loss": 0.0214, "step": 116490 }, { "epoch": 0.3, "learning_rate": 0.0002547022792724369, "loss": 0.0194, "step": 116500 }, { "epoch": 0.3, "learning_rate": 0.00025469839105606544, "loss": 0.0203, "step": 116510 }, { "epoch": 0.3, "learning_rate": 0.000254694502839694, "loss": 0.0224, "step": 116520 }, { "epoch": 0.3, "learning_rate": 0.0002546906146233225, "loss": 0.0245, "step": 116530 }, { "epoch": 0.3, "learning_rate": 0.0002546867264069511, "loss": 0.0227, "step": 116540 }, { "epoch": 0.3, "learning_rate": 0.0002546828381905796, "loss": 0.0244, "step": 116550 }, { "epoch": 0.3, "learning_rate": 0.0002546789499742082, "loss": 0.0213, "step": 116560 }, { "epoch": 0.3, "learning_rate": 0.0002546750617578367, "loss": 0.0196, "step": 116570 }, { "epoch": 0.3, "learning_rate": 0.0002546711735414652, "loss": 0.0202, "step": 116580 }, { "epoch": 0.3, "learning_rate": 0.0002546672853250937, "loss": 0.02, "step": 116590 }, { "epoch": 0.3, "learning_rate": 0.0002546633971087223, "loss": 0.0189, "step": 116600 }, { "epoch": 0.3, "learning_rate": 0.0002546595088923508, "loss": 0.0183, "step": 116610 }, { "epoch": 0.3, "learning_rate": 0.00025465562067597937, "loss": 0.0207, "step": 116620 }, { "epoch": 0.3, "learning_rate": 0.0002546517324596079, "loss": 0.0189, "step": 116630 }, { "epoch": 0.3, "learning_rate": 0.0002546478442432364, "loss": 0.0219, "step": 116640 }, { "epoch": 0.3, "learning_rate": 0.00025464395602686497, "loss": 0.0228, "step": 116650 }, { "epoch": 0.3, "learning_rate": 0.0002546400678104935, "loss": 0.0261, "step": 116660 }, { "epoch": 0.3, "learning_rate": 0.00025463617959412205, "loss": 0.021, "step": 116670 }, { "epoch": 0.3, "learning_rate": 0.00025463229137775057, "loss": 0.0192, "step": 116680 }, { "epoch": 0.3, "learning_rate": 0.00025462840316137913, "loss": 0.0216, "step": 116690 }, { "epoch": 0.3, "learning_rate": 0.00025462451494500765, "loss": 0.0198, "step": 116700 }, { "epoch": 0.3, "learning_rate": 0.00025462062672863616, "loss": 0.0197, "step": 116710 }, { "epoch": 0.3, "learning_rate": 0.0002546167385122647, "loss": 0.0247, "step": 116720 }, { "epoch": 0.3, "learning_rate": 0.00025461285029589325, "loss": 0.022, "step": 116730 }, { "epoch": 0.3, "learning_rate": 0.00025460896207952176, "loss": 0.0283, "step": 116740 }, { "epoch": 0.3, "learning_rate": 0.00025460507386315033, "loss": 0.0268, "step": 116750 }, { "epoch": 0.3, "learning_rate": 0.00025460118564677884, "loss": 0.0178, "step": 116760 }, { "epoch": 0.3, "learning_rate": 0.0002545972974304074, "loss": 0.0195, "step": 116770 }, { "epoch": 0.3, "learning_rate": 0.00025459340921403593, "loss": 0.0205, "step": 116780 }, { "epoch": 0.3, "learning_rate": 0.00025458952099766444, "loss": 0.0243, "step": 116790 }, { "epoch": 0.3, "learning_rate": 0.00025458563278129296, "loss": 0.02, "step": 116800 }, { "epoch": 0.3, "learning_rate": 0.0002545817445649215, "loss": 0.0239, "step": 116810 }, { "epoch": 0.3, "learning_rate": 0.0002545778563485501, "loss": 0.0248, "step": 116820 }, { "epoch": 0.3, "learning_rate": 0.0002545739681321786, "loss": 0.023, "step": 116830 }, { "epoch": 0.3, "learning_rate": 0.0002545700799158071, "loss": 0.0212, "step": 116840 }, { "epoch": 0.3, "learning_rate": 0.0002545661916994357, "loss": 0.0209, "step": 116850 }, { "epoch": 0.3, "learning_rate": 0.0002545623034830642, "loss": 0.0228, "step": 116860 }, { "epoch": 0.3, "learning_rate": 0.0002545584152666927, "loss": 0.0211, "step": 116870 }, { "epoch": 0.3, "learning_rate": 0.0002545545270503213, "loss": 0.0278, "step": 116880 }, { "epoch": 0.3, "learning_rate": 0.0002545506388339498, "loss": 0.0188, "step": 116890 }, { "epoch": 0.3, "learning_rate": 0.0002545467506175784, "loss": 0.0211, "step": 116900 }, { "epoch": 0.3, "learning_rate": 0.0002545428624012069, "loss": 0.0238, "step": 116910 }, { "epoch": 0.3, "learning_rate": 0.0002545389741848354, "loss": 0.0189, "step": 116920 }, { "epoch": 0.3, "learning_rate": 0.0002545350859684639, "loss": 0.0178, "step": 116930 }, { "epoch": 0.3, "learning_rate": 0.0002545311977520925, "loss": 0.02, "step": 116940 }, { "epoch": 0.3, "learning_rate": 0.000254527309535721, "loss": 0.0202, "step": 116950 }, { "epoch": 0.3, "learning_rate": 0.00025452342131934957, "loss": 0.018, "step": 116960 }, { "epoch": 0.3, "learning_rate": 0.0002545195331029781, "loss": 0.0244, "step": 116970 }, { "epoch": 0.3, "learning_rate": 0.00025451564488660665, "loss": 0.0263, "step": 116980 }, { "epoch": 0.3, "learning_rate": 0.00025451175667023517, "loss": 0.0231, "step": 116990 }, { "epoch": 0.3, "learning_rate": 0.0002545078684538637, "loss": 0.0218, "step": 117000 }, { "epoch": 0.3, "eval_cer": 0.8818328525580464, "eval_loss": 0.015921663492918015, "eval_runtime": 107.4591, "eval_samples_per_second": 18.612, "eval_steps_per_second": 4.653, "step": 117000 }, { "epoch": 0.3, "learning_rate": 0.0002545039802374922, "loss": 0.028, "step": 117010 }, { "epoch": 0.3, "learning_rate": 0.00025450009202112076, "loss": 0.0212, "step": 117020 }, { "epoch": 0.3, "learning_rate": 0.00025449620380474933, "loss": 0.023, "step": 117030 }, { "epoch": 0.3, "learning_rate": 0.00025449231558837785, "loss": 0.0256, "step": 117040 }, { "epoch": 0.3, "learning_rate": 0.00025448842737200636, "loss": 0.0259, "step": 117050 }, { "epoch": 0.3, "learning_rate": 0.00025448453915563493, "loss": 0.0243, "step": 117060 }, { "epoch": 0.3, "learning_rate": 0.00025448065093926345, "loss": 0.0193, "step": 117070 }, { "epoch": 0.3, "learning_rate": 0.00025447676272289196, "loss": 0.0229, "step": 117080 }, { "epoch": 0.3, "learning_rate": 0.00025447287450652053, "loss": 0.0233, "step": 117090 }, { "epoch": 0.3, "learning_rate": 0.00025446898629014904, "loss": 0.0187, "step": 117100 }, { "epoch": 0.3, "learning_rate": 0.0002544650980737776, "loss": 0.0268, "step": 117110 }, { "epoch": 0.3, "learning_rate": 0.0002544612098574061, "loss": 0.0267, "step": 117120 }, { "epoch": 0.3, "learning_rate": 0.00025445732164103464, "loss": 0.0208, "step": 117130 }, { "epoch": 0.3, "learning_rate": 0.00025445343342466316, "loss": 0.0315, "step": 117140 }, { "epoch": 0.3, "learning_rate": 0.0002544495452082917, "loss": 0.0196, "step": 117150 }, { "epoch": 0.3, "learning_rate": 0.0002544456569919203, "loss": 0.0302, "step": 117160 }, { "epoch": 0.3, "learning_rate": 0.0002544417687755488, "loss": 0.021, "step": 117170 }, { "epoch": 0.3, "learning_rate": 0.0002544378805591773, "loss": 0.022, "step": 117180 }, { "epoch": 0.3, "learning_rate": 0.0002544339923428059, "loss": 0.0208, "step": 117190 }, { "epoch": 0.3, "learning_rate": 0.0002544301041264344, "loss": 0.0187, "step": 117200 }, { "epoch": 0.3, "learning_rate": 0.0002544262159100629, "loss": 0.0224, "step": 117210 }, { "epoch": 0.3, "learning_rate": 0.0002544223276936915, "loss": 0.0218, "step": 117220 }, { "epoch": 0.3, "learning_rate": 0.00025441843947732, "loss": 0.0214, "step": 117230 }, { "epoch": 0.3, "learning_rate": 0.00025441455126094857, "loss": 0.0171, "step": 117240 }, { "epoch": 0.3, "learning_rate": 0.0002544106630445771, "loss": 0.0236, "step": 117250 }, { "epoch": 0.3, "learning_rate": 0.0002544067748282056, "loss": 0.0218, "step": 117260 }, { "epoch": 0.3, "learning_rate": 0.00025440288661183417, "loss": 0.0273, "step": 117270 }, { "epoch": 0.3, "learning_rate": 0.0002543989983954627, "loss": 0.0197, "step": 117280 }, { "epoch": 0.3, "learning_rate": 0.0002543951101790912, "loss": 0.0227, "step": 117290 }, { "epoch": 0.3, "learning_rate": 0.00025439122196271977, "loss": 0.0224, "step": 117300 }, { "epoch": 0.3, "learning_rate": 0.00025438733374634834, "loss": 0.0215, "step": 117310 }, { "epoch": 0.3, "learning_rate": 0.00025438344552997685, "loss": 0.0262, "step": 117320 }, { "epoch": 0.3, "learning_rate": 0.00025437955731360537, "loss": 0.0221, "step": 117330 }, { "epoch": 0.3, "learning_rate": 0.0002543756690972339, "loss": 0.0211, "step": 117340 }, { "epoch": 0.3, "learning_rate": 0.00025437178088086245, "loss": 0.018, "step": 117350 }, { "epoch": 0.3, "learning_rate": 0.00025436789266449096, "loss": 0.0231, "step": 117360 }, { "epoch": 0.3, "learning_rate": 0.00025436400444811953, "loss": 0.0187, "step": 117370 }, { "epoch": 0.3, "learning_rate": 0.00025436011623174805, "loss": 0.019, "step": 117380 }, { "epoch": 0.3, "learning_rate": 0.00025435622801537656, "loss": 0.0188, "step": 117390 }, { "epoch": 0.3, "learning_rate": 0.00025435233979900513, "loss": 0.0216, "step": 117400 }, { "epoch": 0.3, "learning_rate": 0.00025434845158263364, "loss": 0.0248, "step": 117410 }, { "epoch": 0.3, "learning_rate": 0.00025434456336626216, "loss": 0.0224, "step": 117420 }, { "epoch": 0.3, "learning_rate": 0.00025434067514989073, "loss": 0.0303, "step": 117430 }, { "epoch": 0.3, "learning_rate": 0.00025433678693351924, "loss": 0.0186, "step": 117440 }, { "epoch": 0.3, "learning_rate": 0.0002543328987171478, "loss": 0.0206, "step": 117450 }, { "epoch": 0.3, "learning_rate": 0.0002543290105007763, "loss": 0.0188, "step": 117460 }, { "epoch": 0.3, "learning_rate": 0.00025432512228440484, "loss": 0.0189, "step": 117470 }, { "epoch": 0.3, "learning_rate": 0.0002543212340680334, "loss": 0.0211, "step": 117480 }, { "epoch": 0.3, "learning_rate": 0.0002543173458516619, "loss": 0.0202, "step": 117490 }, { "epoch": 0.3, "learning_rate": 0.00025431345763529044, "loss": 0.0207, "step": 117500 }, { "epoch": 0.3, "learning_rate": 0.000254309569418919, "loss": 0.018, "step": 117510 }, { "epoch": 0.3, "learning_rate": 0.0002543056812025476, "loss": 0.0247, "step": 117520 }, { "epoch": 0.3, "learning_rate": 0.0002543017929861761, "loss": 0.025, "step": 117530 }, { "epoch": 0.3, "learning_rate": 0.0002542979047698046, "loss": 0.0197, "step": 117540 }, { "epoch": 0.3, "learning_rate": 0.0002542940165534331, "loss": 0.0258, "step": 117550 }, { "epoch": 0.3, "learning_rate": 0.0002542901283370617, "loss": 0.0203, "step": 117560 }, { "epoch": 0.3, "learning_rate": 0.0002542862401206902, "loss": 0.0233, "step": 117570 }, { "epoch": 0.3, "learning_rate": 0.00025428235190431877, "loss": 0.0198, "step": 117580 }, { "epoch": 0.3, "learning_rate": 0.0002542784636879473, "loss": 0.0202, "step": 117590 }, { "epoch": 0.3, "learning_rate": 0.00025427457547157585, "loss": 0.0177, "step": 117600 }, { "epoch": 0.3, "learning_rate": 0.00025427068725520437, "loss": 0.0217, "step": 117610 }, { "epoch": 0.3, "learning_rate": 0.0002542667990388329, "loss": 0.0155, "step": 117620 }, { "epoch": 0.3, "learning_rate": 0.0002542629108224614, "loss": 0.021, "step": 117630 }, { "epoch": 0.3, "learning_rate": 0.00025425902260608997, "loss": 0.043, "step": 117640 }, { "epoch": 0.3, "learning_rate": 0.0002542551343897185, "loss": 0.0243, "step": 117650 }, { "epoch": 0.3, "learning_rate": 0.00025425124617334705, "loss": 0.0247, "step": 117660 }, { "epoch": 0.31, "learning_rate": 0.00025424735795697556, "loss": 0.0206, "step": 117670 }, { "epoch": 0.31, "learning_rate": 0.0002542434697406041, "loss": 0.0204, "step": 117680 }, { "epoch": 0.31, "learning_rate": 0.00025423958152423265, "loss": 0.0211, "step": 117690 }, { "epoch": 0.31, "learning_rate": 0.00025423569330786116, "loss": 0.0222, "step": 117700 }, { "epoch": 0.31, "learning_rate": 0.00025423180509148973, "loss": 0.0199, "step": 117710 }, { "epoch": 0.31, "learning_rate": 0.00025422791687511825, "loss": 0.0241, "step": 117720 }, { "epoch": 0.31, "learning_rate": 0.0002542240286587468, "loss": 0.0281, "step": 117730 }, { "epoch": 0.31, "learning_rate": 0.00025422014044237533, "loss": 0.0241, "step": 117740 }, { "epoch": 0.31, "learning_rate": 0.00025421625222600384, "loss": 0.0257, "step": 117750 }, { "epoch": 0.31, "learning_rate": 0.00025421236400963236, "loss": 0.0217, "step": 117760 }, { "epoch": 0.31, "learning_rate": 0.0002542084757932609, "loss": 0.0205, "step": 117770 }, { "epoch": 0.31, "learning_rate": 0.00025420458757688944, "loss": 0.0203, "step": 117780 }, { "epoch": 0.31, "learning_rate": 0.000254200699360518, "loss": 0.0186, "step": 117790 }, { "epoch": 0.31, "learning_rate": 0.0002541968111441465, "loss": 0.0244, "step": 117800 }, { "epoch": 0.31, "learning_rate": 0.0002541929229277751, "loss": 0.0226, "step": 117810 }, { "epoch": 0.31, "learning_rate": 0.0002541890347114036, "loss": 0.0232, "step": 117820 }, { "epoch": 0.31, "learning_rate": 0.0002541851464950321, "loss": 0.0186, "step": 117830 }, { "epoch": 0.31, "learning_rate": 0.00025418125827866064, "loss": 0.0266, "step": 117840 }, { "epoch": 0.31, "learning_rate": 0.0002541773700622892, "loss": 0.0207, "step": 117850 }, { "epoch": 0.31, "learning_rate": 0.0002541734818459178, "loss": 0.0221, "step": 117860 }, { "epoch": 0.31, "learning_rate": 0.0002541695936295463, "loss": 0.0163, "step": 117870 }, { "epoch": 0.31, "learning_rate": 0.0002541657054131748, "loss": 0.0258, "step": 117880 }, { "epoch": 0.31, "learning_rate": 0.0002541618171968033, "loss": 0.0186, "step": 117890 }, { "epoch": 0.31, "learning_rate": 0.0002541579289804319, "loss": 0.023, "step": 117900 }, { "epoch": 0.31, "learning_rate": 0.0002541540407640604, "loss": 0.0194, "step": 117910 }, { "epoch": 0.31, "learning_rate": 0.00025415015254768897, "loss": 0.0269, "step": 117920 }, { "epoch": 0.31, "learning_rate": 0.0002541462643313175, "loss": 0.0249, "step": 117930 }, { "epoch": 0.31, "learning_rate": 0.00025414237611494605, "loss": 0.0177, "step": 117940 }, { "epoch": 0.31, "learning_rate": 0.00025413848789857457, "loss": 0.0282, "step": 117950 }, { "epoch": 0.31, "learning_rate": 0.0002541345996822031, "loss": 0.0198, "step": 117960 }, { "epoch": 0.31, "learning_rate": 0.0002541307114658316, "loss": 0.0197, "step": 117970 }, { "epoch": 0.31, "learning_rate": 0.00025412682324946017, "loss": 0.0248, "step": 117980 }, { "epoch": 0.31, "learning_rate": 0.0002541229350330887, "loss": 0.0281, "step": 117990 }, { "epoch": 0.31, "learning_rate": 0.00025411904681671725, "loss": 0.0184, "step": 118000 }, { "epoch": 0.31, "eval_cer": 0.8817810659914818, "eval_loss": 0.014615286141633987, "eval_runtime": 107.2768, "eval_samples_per_second": 18.643, "eval_steps_per_second": 4.661, "step": 118000 }, { "epoch": 0.31, "learning_rate": 0.00025411515860034576, "loss": 0.0351, "step": 118010 }, { "epoch": 0.31, "learning_rate": 0.00025411127038397433, "loss": 0.0185, "step": 118020 }, { "epoch": 0.31, "learning_rate": 0.00025410738216760285, "loss": 0.0203, "step": 118030 }, { "epoch": 0.31, "learning_rate": 0.00025410349395123136, "loss": 0.0176, "step": 118040 }, { "epoch": 0.31, "learning_rate": 0.0002540996057348599, "loss": 0.021, "step": 118050 }, { "epoch": 0.31, "learning_rate": 0.00025409571751848844, "loss": 0.0182, "step": 118060 }, { "epoch": 0.31, "learning_rate": 0.000254091829302117, "loss": 0.0255, "step": 118070 }, { "epoch": 0.31, "learning_rate": 0.00025408794108574553, "loss": 0.0211, "step": 118080 }, { "epoch": 0.31, "learning_rate": 0.00025408405286937404, "loss": 0.0226, "step": 118090 }, { "epoch": 0.31, "learning_rate": 0.00025408016465300256, "loss": 0.018, "step": 118100 }, { "epoch": 0.31, "learning_rate": 0.0002540762764366311, "loss": 0.0234, "step": 118110 }, { "epoch": 0.31, "learning_rate": 0.00025407238822025964, "loss": 0.0198, "step": 118120 }, { "epoch": 0.31, "learning_rate": 0.0002540685000038882, "loss": 0.0257, "step": 118130 }, { "epoch": 0.31, "learning_rate": 0.0002540646117875167, "loss": 0.018, "step": 118140 }, { "epoch": 0.31, "learning_rate": 0.0002540607235711453, "loss": 0.0205, "step": 118150 }, { "epoch": 0.31, "learning_rate": 0.0002540568353547738, "loss": 0.0227, "step": 118160 }, { "epoch": 0.31, "learning_rate": 0.0002540529471384023, "loss": 0.0208, "step": 118170 }, { "epoch": 0.31, "learning_rate": 0.00025404905892203084, "loss": 0.0199, "step": 118180 }, { "epoch": 0.31, "learning_rate": 0.0002540451707056594, "loss": 0.0237, "step": 118190 }, { "epoch": 0.31, "learning_rate": 0.0002540412824892879, "loss": 0.023, "step": 118200 }, { "epoch": 0.31, "learning_rate": 0.0002540373942729165, "loss": 0.0218, "step": 118210 }, { "epoch": 0.31, "learning_rate": 0.000254033506056545, "loss": 0.0221, "step": 118220 }, { "epoch": 0.31, "learning_rate": 0.00025402961784017357, "loss": 0.0237, "step": 118230 }, { "epoch": 0.31, "learning_rate": 0.0002540257296238021, "loss": 0.0222, "step": 118240 }, { "epoch": 0.31, "learning_rate": 0.0002540218414074306, "loss": 0.0172, "step": 118250 }, { "epoch": 0.31, "learning_rate": 0.00025401795319105917, "loss": 0.0208, "step": 118260 }, { "epoch": 0.31, "learning_rate": 0.0002540140649746877, "loss": 0.0176, "step": 118270 }, { "epoch": 0.31, "learning_rate": 0.00025401017675831625, "loss": 0.0218, "step": 118280 }, { "epoch": 0.31, "learning_rate": 0.00025400628854194477, "loss": 0.0168, "step": 118290 }, { "epoch": 0.31, "learning_rate": 0.0002540024003255733, "loss": 0.0242, "step": 118300 }, { "epoch": 0.31, "learning_rate": 0.00025399851210920185, "loss": 0.0189, "step": 118310 }, { "epoch": 0.31, "learning_rate": 0.00025399462389283036, "loss": 0.0214, "step": 118320 }, { "epoch": 0.31, "learning_rate": 0.0002539907356764589, "loss": 0.0241, "step": 118330 }, { "epoch": 0.31, "learning_rate": 0.00025398684746008745, "loss": 0.0176, "step": 118340 }, { "epoch": 0.31, "learning_rate": 0.00025398295924371596, "loss": 0.0227, "step": 118350 }, { "epoch": 0.31, "learning_rate": 0.00025397907102734453, "loss": 0.0192, "step": 118360 }, { "epoch": 0.31, "learning_rate": 0.00025397518281097305, "loss": 0.02, "step": 118370 }, { "epoch": 0.31, "learning_rate": 0.00025397129459460156, "loss": 0.0205, "step": 118380 }, { "epoch": 0.31, "learning_rate": 0.0002539674063782301, "loss": 0.0226, "step": 118390 }, { "epoch": 0.31, "learning_rate": 0.00025396351816185864, "loss": 0.0194, "step": 118400 }, { "epoch": 0.31, "learning_rate": 0.0002539596299454872, "loss": 0.0232, "step": 118410 }, { "epoch": 0.31, "learning_rate": 0.0002539557417291157, "loss": 0.0188, "step": 118420 }, { "epoch": 0.31, "learning_rate": 0.00025395185351274424, "loss": 0.0221, "step": 118430 }, { "epoch": 0.31, "learning_rate": 0.0002539479652963728, "loss": 0.0273, "step": 118440 }, { "epoch": 0.31, "learning_rate": 0.0002539440770800013, "loss": 0.0191, "step": 118450 }, { "epoch": 0.31, "learning_rate": 0.00025394018886362984, "loss": 0.0211, "step": 118460 }, { "epoch": 0.31, "learning_rate": 0.0002539363006472584, "loss": 0.023, "step": 118470 }, { "epoch": 0.31, "learning_rate": 0.0002539324124308869, "loss": 0.0215, "step": 118480 }, { "epoch": 0.31, "learning_rate": 0.0002539285242145155, "loss": 0.0231, "step": 118490 }, { "epoch": 0.31, "learning_rate": 0.000253924635998144, "loss": 0.0247, "step": 118500 }, { "epoch": 0.31, "learning_rate": 0.0002539207477817725, "loss": 0.0252, "step": 118510 }, { "epoch": 0.31, "learning_rate": 0.0002539168595654011, "loss": 0.0252, "step": 118520 }, { "epoch": 0.31, "learning_rate": 0.0002539129713490296, "loss": 0.0214, "step": 118530 }, { "epoch": 0.31, "learning_rate": 0.0002539090831326581, "loss": 0.0218, "step": 118540 }, { "epoch": 0.31, "learning_rate": 0.0002539051949162867, "loss": 0.0194, "step": 118550 }, { "epoch": 0.31, "learning_rate": 0.00025390130669991525, "loss": 0.02, "step": 118560 }, { "epoch": 0.31, "learning_rate": 0.00025389741848354377, "loss": 0.024, "step": 118570 }, { "epoch": 0.31, "learning_rate": 0.0002538935302671723, "loss": 0.0187, "step": 118580 }, { "epoch": 0.31, "learning_rate": 0.0002538896420508008, "loss": 0.0226, "step": 118590 }, { "epoch": 0.31, "learning_rate": 0.0002538857538344293, "loss": 0.0191, "step": 118600 }, { "epoch": 0.31, "learning_rate": 0.0002538818656180579, "loss": 0.026, "step": 118610 }, { "epoch": 0.31, "learning_rate": 0.00025387797740168645, "loss": 0.0223, "step": 118620 }, { "epoch": 0.31, "learning_rate": 0.00025387408918531497, "loss": 0.0209, "step": 118630 }, { "epoch": 0.31, "learning_rate": 0.0002538702009689435, "loss": 0.0221, "step": 118640 }, { "epoch": 0.31, "learning_rate": 0.00025386631275257205, "loss": 0.0205, "step": 118650 }, { "epoch": 0.31, "learning_rate": 0.00025386242453620056, "loss": 0.0199, "step": 118660 }, { "epoch": 0.31, "learning_rate": 0.0002538585363198291, "loss": 0.0172, "step": 118670 }, { "epoch": 0.31, "learning_rate": 0.00025385464810345765, "loss": 0.0188, "step": 118680 }, { "epoch": 0.31, "learning_rate": 0.00025385075988708616, "loss": 0.0229, "step": 118690 }, { "epoch": 0.31, "learning_rate": 0.00025384687167071473, "loss": 0.0167, "step": 118700 }, { "epoch": 0.31, "learning_rate": 0.00025384298345434324, "loss": 0.019, "step": 118710 }, { "epoch": 0.31, "learning_rate": 0.00025383909523797176, "loss": 0.0179, "step": 118720 }, { "epoch": 0.31, "learning_rate": 0.00025383520702160033, "loss": 0.0163, "step": 118730 }, { "epoch": 0.31, "learning_rate": 0.00025383131880522884, "loss": 0.0211, "step": 118740 }, { "epoch": 0.31, "learning_rate": 0.0002538274305888574, "loss": 0.0199, "step": 118750 }, { "epoch": 0.31, "learning_rate": 0.0002538235423724859, "loss": 0.0213, "step": 118760 }, { "epoch": 0.31, "learning_rate": 0.0002538196541561145, "loss": 0.0189, "step": 118770 }, { "epoch": 0.31, "learning_rate": 0.000253815765939743, "loss": 0.016, "step": 118780 }, { "epoch": 0.31, "learning_rate": 0.0002538118777233715, "loss": 0.0246, "step": 118790 }, { "epoch": 0.31, "learning_rate": 0.00025380798950700004, "loss": 0.0209, "step": 118800 }, { "epoch": 0.31, "learning_rate": 0.0002538041012906286, "loss": 0.0209, "step": 118810 }, { "epoch": 0.31, "learning_rate": 0.0002538002130742571, "loss": 0.0254, "step": 118820 }, { "epoch": 0.31, "learning_rate": 0.0002537963248578857, "loss": 0.0237, "step": 118830 }, { "epoch": 0.31, "learning_rate": 0.0002537924366415142, "loss": 0.0206, "step": 118840 }, { "epoch": 0.31, "learning_rate": 0.0002537885484251427, "loss": 0.023, "step": 118850 }, { "epoch": 0.31, "learning_rate": 0.0002537846602087713, "loss": 0.0228, "step": 118860 }, { "epoch": 0.31, "learning_rate": 0.0002537807719923998, "loss": 0.0221, "step": 118870 }, { "epoch": 0.31, "learning_rate": 0.0002537768837760283, "loss": 0.0232, "step": 118880 }, { "epoch": 0.31, "learning_rate": 0.0002537729955596569, "loss": 0.022, "step": 118890 }, { "epoch": 0.31, "learning_rate": 0.00025376910734328545, "loss": 0.0168, "step": 118900 }, { "epoch": 0.31, "learning_rate": 0.00025376521912691397, "loss": 0.0212, "step": 118910 }, { "epoch": 0.31, "learning_rate": 0.0002537613309105425, "loss": 0.0207, "step": 118920 }, { "epoch": 0.31, "learning_rate": 0.000253757442694171, "loss": 0.0229, "step": 118930 }, { "epoch": 0.31, "learning_rate": 0.00025375355447779957, "loss": 0.0207, "step": 118940 }, { "epoch": 0.31, "learning_rate": 0.0002537496662614281, "loss": 0.0226, "step": 118950 }, { "epoch": 0.31, "learning_rate": 0.00025374577804505665, "loss": 0.0188, "step": 118960 }, { "epoch": 0.31, "learning_rate": 0.00025374188982868516, "loss": 0.0273, "step": 118970 }, { "epoch": 0.31, "learning_rate": 0.00025373800161231373, "loss": 0.018, "step": 118980 }, { "epoch": 0.31, "learning_rate": 0.00025373411339594225, "loss": 0.0232, "step": 118990 }, { "epoch": 0.31, "learning_rate": 0.00025373022517957076, "loss": 0.0183, "step": 119000 }, { "epoch": 0.31, "eval_cer": 0.8817894638130869, "eval_loss": 0.01590069569647312, "eval_runtime": 107.3244, "eval_samples_per_second": 18.635, "eval_steps_per_second": 4.659, "step": 119000 }, { "epoch": 0.31, "learning_rate": 0.0002537263369631993, "loss": 0.0201, "step": 119010 }, { "epoch": 0.31, "learning_rate": 0.00025372244874682784, "loss": 0.0195, "step": 119020 }, { "epoch": 0.31, "learning_rate": 0.00025371856053045636, "loss": 0.0243, "step": 119030 }, { "epoch": 0.31, "learning_rate": 0.00025371467231408493, "loss": 0.0203, "step": 119040 }, { "epoch": 0.31, "learning_rate": 0.00025371078409771344, "loss": 0.0212, "step": 119050 }, { "epoch": 0.31, "learning_rate": 0.000253706895881342, "loss": 0.021, "step": 119060 }, { "epoch": 0.31, "learning_rate": 0.0002537030076649705, "loss": 0.0214, "step": 119070 }, { "epoch": 0.31, "learning_rate": 0.00025369911944859904, "loss": 0.0175, "step": 119080 }, { "epoch": 0.31, "learning_rate": 0.00025369523123222756, "loss": 0.0196, "step": 119090 }, { "epoch": 0.31, "learning_rate": 0.0002536913430158561, "loss": 0.025, "step": 119100 }, { "epoch": 0.31, "learning_rate": 0.0002536874547994847, "loss": 0.0209, "step": 119110 }, { "epoch": 0.31, "learning_rate": 0.0002536835665831132, "loss": 0.0221, "step": 119120 }, { "epoch": 0.31, "learning_rate": 0.0002536796783667417, "loss": 0.0219, "step": 119130 }, { "epoch": 0.31, "learning_rate": 0.00025367579015037024, "loss": 0.0196, "step": 119140 }, { "epoch": 0.31, "learning_rate": 0.0002536719019339988, "loss": 0.0194, "step": 119150 }, { "epoch": 0.31, "learning_rate": 0.0002536680137176273, "loss": 0.0205, "step": 119160 }, { "epoch": 0.31, "learning_rate": 0.0002536641255012559, "loss": 0.0215, "step": 119170 }, { "epoch": 0.31, "learning_rate": 0.0002536602372848844, "loss": 0.0177, "step": 119180 }, { "epoch": 0.31, "learning_rate": 0.00025365634906851297, "loss": 0.0243, "step": 119190 }, { "epoch": 0.31, "learning_rate": 0.0002536524608521415, "loss": 0.0204, "step": 119200 }, { "epoch": 0.31, "learning_rate": 0.00025364857263577, "loss": 0.0201, "step": 119210 }, { "epoch": 0.31, "learning_rate": 0.0002536446844193985, "loss": 0.0267, "step": 119220 }, { "epoch": 0.31, "learning_rate": 0.0002536407962030271, "loss": 0.026, "step": 119230 }, { "epoch": 0.31, "learning_rate": 0.0002536369079866556, "loss": 0.0255, "step": 119240 }, { "epoch": 0.31, "learning_rate": 0.00025363301977028417, "loss": 0.0215, "step": 119250 }, { "epoch": 0.31, "learning_rate": 0.0002536291315539127, "loss": 0.0256, "step": 119260 }, { "epoch": 0.31, "learning_rate": 0.00025362524333754125, "loss": 0.0251, "step": 119270 }, { "epoch": 0.31, "learning_rate": 0.00025362135512116976, "loss": 0.0196, "step": 119280 }, { "epoch": 0.31, "learning_rate": 0.0002536174669047983, "loss": 0.019, "step": 119290 }, { "epoch": 0.31, "learning_rate": 0.00025361357868842685, "loss": 0.0174, "step": 119300 }, { "epoch": 0.31, "learning_rate": 0.00025360969047205536, "loss": 0.023, "step": 119310 }, { "epoch": 0.31, "learning_rate": 0.00025360580225568393, "loss": 0.0217, "step": 119320 }, { "epoch": 0.31, "learning_rate": 0.00025360191403931245, "loss": 0.0207, "step": 119330 }, { "epoch": 0.31, "learning_rate": 0.00025359802582294096, "loss": 0.0217, "step": 119340 }, { "epoch": 0.31, "learning_rate": 0.0002535941376065695, "loss": 0.0228, "step": 119350 }, { "epoch": 0.31, "learning_rate": 0.00025359024939019804, "loss": 0.0221, "step": 119360 }, { "epoch": 0.31, "learning_rate": 0.00025358636117382656, "loss": 0.019, "step": 119370 }, { "epoch": 0.31, "learning_rate": 0.0002535824729574551, "loss": 0.0182, "step": 119380 }, { "epoch": 0.31, "learning_rate": 0.00025357858474108364, "loss": 0.0196, "step": 119390 }, { "epoch": 0.31, "learning_rate": 0.0002535746965247122, "loss": 0.0273, "step": 119400 }, { "epoch": 0.31, "learning_rate": 0.0002535708083083407, "loss": 0.0263, "step": 119410 }, { "epoch": 0.31, "learning_rate": 0.00025356692009196924, "loss": 0.0232, "step": 119420 }, { "epoch": 0.31, "learning_rate": 0.00025356303187559775, "loss": 0.0197, "step": 119430 }, { "epoch": 0.31, "learning_rate": 0.0002535591436592263, "loss": 0.0188, "step": 119440 }, { "epoch": 0.31, "learning_rate": 0.0002535552554428549, "loss": 0.0196, "step": 119450 }, { "epoch": 0.31, "learning_rate": 0.0002535513672264834, "loss": 0.0199, "step": 119460 }, { "epoch": 0.31, "learning_rate": 0.0002535474790101119, "loss": 0.029, "step": 119470 }, { "epoch": 0.31, "learning_rate": 0.0002535435907937405, "loss": 0.0221, "step": 119480 }, { "epoch": 0.31, "learning_rate": 0.000253539702577369, "loss": 0.0217, "step": 119490 }, { "epoch": 0.31, "learning_rate": 0.0002535358143609975, "loss": 0.0198, "step": 119500 }, { "epoch": 0.31, "learning_rate": 0.0002535319261446261, "loss": 0.0203, "step": 119510 }, { "epoch": 0.31, "learning_rate": 0.0002535280379282546, "loss": 0.0198, "step": 119520 }, { "epoch": 0.31, "learning_rate": 0.00025352414971188317, "loss": 0.0197, "step": 119530 }, { "epoch": 0.31, "learning_rate": 0.0002535202614955117, "loss": 0.0214, "step": 119540 }, { "epoch": 0.31, "learning_rate": 0.0002535163732791402, "loss": 0.02, "step": 119550 }, { "epoch": 0.31, "learning_rate": 0.00025351248506276877, "loss": 0.0213, "step": 119560 }, { "epoch": 0.31, "learning_rate": 0.0002535085968463973, "loss": 0.0279, "step": 119570 }, { "epoch": 0.31, "learning_rate": 0.0002535047086300258, "loss": 0.0245, "step": 119580 }, { "epoch": 0.31, "learning_rate": 0.00025350082041365437, "loss": 0.0212, "step": 119590 }, { "epoch": 0.31, "learning_rate": 0.0002534969321972829, "loss": 0.0231, "step": 119600 }, { "epoch": 0.31, "learning_rate": 0.00025349304398091145, "loss": 0.0271, "step": 119610 }, { "epoch": 0.31, "learning_rate": 0.00025348915576453996, "loss": 0.0231, "step": 119620 }, { "epoch": 0.31, "learning_rate": 0.0002534852675481685, "loss": 0.0225, "step": 119630 }, { "epoch": 0.31, "learning_rate": 0.000253481379331797, "loss": 0.0233, "step": 119640 }, { "epoch": 0.31, "learning_rate": 0.00025347749111542556, "loss": 0.0263, "step": 119650 }, { "epoch": 0.31, "learning_rate": 0.00025347360289905413, "loss": 0.0222, "step": 119660 }, { "epoch": 0.31, "learning_rate": 0.00025346971468268264, "loss": 0.0228, "step": 119670 }, { "epoch": 0.31, "learning_rate": 0.00025346582646631116, "loss": 0.0186, "step": 119680 }, { "epoch": 0.31, "learning_rate": 0.00025346193824993973, "loss": 0.0223, "step": 119690 }, { "epoch": 0.31, "learning_rate": 0.00025345805003356824, "loss": 0.0225, "step": 119700 }, { "epoch": 0.31, "learning_rate": 0.00025345416181719676, "loss": 0.0237, "step": 119710 }, { "epoch": 0.31, "learning_rate": 0.0002534502736008253, "loss": 0.022, "step": 119720 }, { "epoch": 0.31, "learning_rate": 0.00025344638538445384, "loss": 0.0168, "step": 119730 }, { "epoch": 0.31, "learning_rate": 0.0002534424971680824, "loss": 0.0217, "step": 119740 }, { "epoch": 0.31, "learning_rate": 0.0002534386089517109, "loss": 0.0207, "step": 119750 }, { "epoch": 0.31, "learning_rate": 0.00025343472073533944, "loss": 0.0375, "step": 119760 }, { "epoch": 0.31, "learning_rate": 0.000253430832518968, "loss": 0.025, "step": 119770 }, { "epoch": 0.31, "learning_rate": 0.0002534269443025965, "loss": 0.0153, "step": 119780 }, { "epoch": 0.31, "learning_rate": 0.00025342305608622504, "loss": 0.0274, "step": 119790 }, { "epoch": 0.31, "learning_rate": 0.0002534191678698536, "loss": 0.0189, "step": 119800 }, { "epoch": 0.31, "learning_rate": 0.0002534152796534822, "loss": 0.0216, "step": 119810 }, { "epoch": 0.31, "learning_rate": 0.0002534113914371107, "loss": 0.0214, "step": 119820 }, { "epoch": 0.31, "learning_rate": 0.0002534075032207392, "loss": 0.0193, "step": 119830 }, { "epoch": 0.31, "learning_rate": 0.0002534036150043677, "loss": 0.0212, "step": 119840 }, { "epoch": 0.31, "learning_rate": 0.0002533997267879963, "loss": 0.0262, "step": 119850 }, { "epoch": 0.31, "learning_rate": 0.0002533958385716248, "loss": 0.0227, "step": 119860 }, { "epoch": 0.31, "learning_rate": 0.00025339195035525337, "loss": 0.0193, "step": 119870 }, { "epoch": 0.31, "learning_rate": 0.0002533880621388819, "loss": 0.0178, "step": 119880 }, { "epoch": 0.31, "learning_rate": 0.0002533841739225104, "loss": 0.0253, "step": 119890 }, { "epoch": 0.31, "learning_rate": 0.00025338028570613897, "loss": 0.0181, "step": 119900 }, { "epoch": 0.31, "learning_rate": 0.0002533763974897675, "loss": 0.0215, "step": 119910 }, { "epoch": 0.31, "learning_rate": 0.000253372509273396, "loss": 0.0196, "step": 119920 }, { "epoch": 0.31, "learning_rate": 0.00025336862105702456, "loss": 0.0246, "step": 119930 }, { "epoch": 0.31, "learning_rate": 0.0002533647328406531, "loss": 0.0221, "step": 119940 }, { "epoch": 0.31, "learning_rate": 0.00025336084462428165, "loss": 0.0208, "step": 119950 }, { "epoch": 0.31, "learning_rate": 0.00025335695640791016, "loss": 0.0248, "step": 119960 }, { "epoch": 0.31, "learning_rate": 0.0002533530681915387, "loss": 0.028, "step": 119970 }, { "epoch": 0.31, "learning_rate": 0.00025334917997516725, "loss": 0.0217, "step": 119980 }, { "epoch": 0.31, "learning_rate": 0.00025334529175879576, "loss": 0.0274, "step": 119990 }, { "epoch": 0.31, "learning_rate": 0.00025334140354242433, "loss": 0.0192, "step": 120000 }, { "epoch": 0.31, "eval_cer": 0.8818244547364413, "eval_loss": 0.015779657289385796, "eval_runtime": 107.2547, "eval_samples_per_second": 18.647, "eval_steps_per_second": 4.662, "step": 120000 }, { "epoch": 0.31, "learning_rate": 0.00025333751532605284, "loss": 0.0188, "step": 120010 }, { "epoch": 0.31, "learning_rate": 0.0002533336271096814, "loss": 0.0222, "step": 120020 }, { "epoch": 0.31, "learning_rate": 0.0002533297388933099, "loss": 0.0204, "step": 120030 }, { "epoch": 0.31, "learning_rate": 0.00025332585067693844, "loss": 0.0215, "step": 120040 }, { "epoch": 0.31, "learning_rate": 0.00025332196246056696, "loss": 0.0209, "step": 120050 }, { "epoch": 0.31, "learning_rate": 0.0002533180742441955, "loss": 0.023, "step": 120060 }, { "epoch": 0.31, "learning_rate": 0.00025331418602782404, "loss": 0.0249, "step": 120070 }, { "epoch": 0.31, "learning_rate": 0.0002533102978114526, "loss": 0.0184, "step": 120080 }, { "epoch": 0.31, "learning_rate": 0.0002533064095950811, "loss": 0.0216, "step": 120090 }, { "epoch": 0.31, "learning_rate": 0.00025330252137870964, "loss": 0.021, "step": 120100 }, { "epoch": 0.31, "learning_rate": 0.0002532986331623382, "loss": 0.0233, "step": 120110 }, { "epoch": 0.31, "learning_rate": 0.0002532947449459667, "loss": 0.0195, "step": 120120 }, { "epoch": 0.31, "learning_rate": 0.00025329085672959523, "loss": 0.021, "step": 120130 }, { "epoch": 0.31, "learning_rate": 0.0002532869685132238, "loss": 0.0314, "step": 120140 }, { "epoch": 0.31, "learning_rate": 0.00025328308029685237, "loss": 0.0195, "step": 120150 }, { "epoch": 0.31, "learning_rate": 0.0002532791920804809, "loss": 0.0249, "step": 120160 }, { "epoch": 0.31, "learning_rate": 0.0002532753038641094, "loss": 0.025, "step": 120170 }, { "epoch": 0.31, "learning_rate": 0.0002532714156477379, "loss": 0.0184, "step": 120180 }, { "epoch": 0.31, "learning_rate": 0.0002532675274313665, "loss": 0.0183, "step": 120190 }, { "epoch": 0.31, "learning_rate": 0.000253263639214995, "loss": 0.0205, "step": 120200 }, { "epoch": 0.31, "learning_rate": 0.00025325975099862357, "loss": 0.023, "step": 120210 }, { "epoch": 0.31, "learning_rate": 0.0002532558627822521, "loss": 0.0265, "step": 120220 }, { "epoch": 0.31, "learning_rate": 0.00025325197456588065, "loss": 0.0284, "step": 120230 }, { "epoch": 0.31, "learning_rate": 0.00025324808634950917, "loss": 0.0227, "step": 120240 }, { "epoch": 0.31, "learning_rate": 0.0002532441981331377, "loss": 0.0238, "step": 120250 }, { "epoch": 0.31, "learning_rate": 0.0002532403099167662, "loss": 0.0244, "step": 120260 }, { "epoch": 0.31, "learning_rate": 0.00025323642170039476, "loss": 0.0201, "step": 120270 }, { "epoch": 0.31, "learning_rate": 0.0002532325334840233, "loss": 0.0197, "step": 120280 }, { "epoch": 0.31, "learning_rate": 0.00025322864526765185, "loss": 0.0228, "step": 120290 }, { "epoch": 0.31, "learning_rate": 0.00025322475705128036, "loss": 0.0239, "step": 120300 }, { "epoch": 0.31, "learning_rate": 0.00025322086883490893, "loss": 0.0221, "step": 120310 }, { "epoch": 0.31, "learning_rate": 0.00025321698061853744, "loss": 0.0221, "step": 120320 }, { "epoch": 0.31, "learning_rate": 0.00025321309240216596, "loss": 0.0271, "step": 120330 }, { "epoch": 0.31, "learning_rate": 0.0002532092041857945, "loss": 0.0165, "step": 120340 }, { "epoch": 0.31, "learning_rate": 0.00025320531596942304, "loss": 0.0212, "step": 120350 }, { "epoch": 0.31, "learning_rate": 0.0002532014277530516, "loss": 0.0216, "step": 120360 }, { "epoch": 0.31, "learning_rate": 0.0002531975395366801, "loss": 0.0253, "step": 120370 }, { "epoch": 0.31, "learning_rate": 0.00025319365132030864, "loss": 0.0224, "step": 120380 }, { "epoch": 0.31, "learning_rate": 0.00025318976310393715, "loss": 0.0218, "step": 120390 }, { "epoch": 0.31, "learning_rate": 0.0002531858748875657, "loss": 0.0203, "step": 120400 }, { "epoch": 0.31, "learning_rate": 0.00025318198667119424, "loss": 0.0248, "step": 120410 }, { "epoch": 0.31, "learning_rate": 0.0002531780984548228, "loss": 0.0233, "step": 120420 }, { "epoch": 0.31, "learning_rate": 0.0002531742102384513, "loss": 0.0258, "step": 120430 }, { "epoch": 0.31, "learning_rate": 0.0002531703220220799, "loss": 0.0204, "step": 120440 }, { "epoch": 0.31, "learning_rate": 0.0002531664338057084, "loss": 0.0221, "step": 120450 }, { "epoch": 0.31, "learning_rate": 0.0002531625455893369, "loss": 0.0202, "step": 120460 }, { "epoch": 0.31, "learning_rate": 0.00025315865737296543, "loss": 0.0231, "step": 120470 }, { "epoch": 0.31, "learning_rate": 0.000253154769156594, "loss": 0.019, "step": 120480 }, { "epoch": 0.31, "learning_rate": 0.00025315088094022257, "loss": 0.0284, "step": 120490 }, { "epoch": 0.31, "learning_rate": 0.0002531469927238511, "loss": 0.021, "step": 120500 }, { "epoch": 0.31, "learning_rate": 0.0002531431045074796, "loss": 0.0211, "step": 120510 }, { "epoch": 0.31, "learning_rate": 0.00025313921629110817, "loss": 0.02, "step": 120520 }, { "epoch": 0.31, "learning_rate": 0.0002531353280747367, "loss": 0.0216, "step": 120530 }, { "epoch": 0.31, "learning_rate": 0.0002531314398583652, "loss": 0.02, "step": 120540 }, { "epoch": 0.31, "learning_rate": 0.00025312755164199377, "loss": 0.0221, "step": 120550 }, { "epoch": 0.31, "learning_rate": 0.0002531236634256223, "loss": 0.0222, "step": 120560 }, { "epoch": 0.31, "learning_rate": 0.00025311977520925085, "loss": 0.0253, "step": 120570 }, { "epoch": 0.31, "learning_rate": 0.00025311588699287936, "loss": 0.0226, "step": 120580 }, { "epoch": 0.31, "learning_rate": 0.0002531119987765079, "loss": 0.0218, "step": 120590 }, { "epoch": 0.31, "learning_rate": 0.0002531081105601364, "loss": 0.0267, "step": 120600 }, { "epoch": 0.31, "learning_rate": 0.00025310422234376496, "loss": 0.0252, "step": 120610 }, { "epoch": 0.31, "learning_rate": 0.0002531003341273935, "loss": 0.0192, "step": 120620 }, { "epoch": 0.31, "learning_rate": 0.00025309644591102205, "loss": 0.0202, "step": 120630 }, { "epoch": 0.31, "learning_rate": 0.00025309255769465056, "loss": 0.0211, "step": 120640 }, { "epoch": 0.31, "learning_rate": 0.00025308866947827913, "loss": 0.0169, "step": 120650 }, { "epoch": 0.31, "learning_rate": 0.00025308478126190764, "loss": 0.0209, "step": 120660 }, { "epoch": 0.31, "learning_rate": 0.00025308089304553616, "loss": 0.0205, "step": 120670 }, { "epoch": 0.31, "learning_rate": 0.00025307700482916467, "loss": 0.0186, "step": 120680 }, { "epoch": 0.31, "learning_rate": 0.00025307311661279324, "loss": 0.0213, "step": 120690 }, { "epoch": 0.31, "learning_rate": 0.0002530692283964218, "loss": 0.0186, "step": 120700 }, { "epoch": 0.31, "learning_rate": 0.0002530653401800503, "loss": 0.022, "step": 120710 }, { "epoch": 0.31, "learning_rate": 0.00025306145196367884, "loss": 0.0214, "step": 120720 }, { "epoch": 0.31, "learning_rate": 0.0002530575637473074, "loss": 0.018, "step": 120730 }, { "epoch": 0.31, "learning_rate": 0.0002530536755309359, "loss": 0.0217, "step": 120740 }, { "epoch": 0.31, "learning_rate": 0.00025304978731456444, "loss": 0.0224, "step": 120750 }, { "epoch": 0.31, "learning_rate": 0.000253045899098193, "loss": 0.0227, "step": 120760 }, { "epoch": 0.31, "learning_rate": 0.0002530420108818215, "loss": 0.026, "step": 120770 }, { "epoch": 0.31, "learning_rate": 0.0002530381226654501, "loss": 0.02, "step": 120780 }, { "epoch": 0.31, "learning_rate": 0.0002530342344490786, "loss": 0.0237, "step": 120790 }, { "epoch": 0.31, "learning_rate": 0.0002530303462327071, "loss": 0.0217, "step": 120800 }, { "epoch": 0.31, "learning_rate": 0.0002530264580163357, "loss": 0.022, "step": 120810 }, { "epoch": 0.31, "learning_rate": 0.0002530225697999642, "loss": 0.0209, "step": 120820 }, { "epoch": 0.31, "learning_rate": 0.0002530186815835927, "loss": 0.0259, "step": 120830 }, { "epoch": 0.31, "learning_rate": 0.0002530147933672213, "loss": 0.0202, "step": 120840 }, { "epoch": 0.31, "learning_rate": 0.0002530109051508498, "loss": 0.0181, "step": 120850 }, { "epoch": 0.31, "learning_rate": 0.00025300701693447837, "loss": 0.0178, "step": 120860 }, { "epoch": 0.31, "learning_rate": 0.0002530031287181069, "loss": 0.0198, "step": 120870 }, { "epoch": 0.31, "learning_rate": 0.0002529992405017354, "loss": 0.0252, "step": 120880 }, { "epoch": 0.31, "learning_rate": 0.00025299535228536397, "loss": 0.0201, "step": 120890 }, { "epoch": 0.31, "learning_rate": 0.0002529914640689925, "loss": 0.018, "step": 120900 }, { "epoch": 0.31, "learning_rate": 0.00025298757585262105, "loss": 0.0197, "step": 120910 }, { "epoch": 0.31, "learning_rate": 0.00025298368763624956, "loss": 0.0238, "step": 120920 }, { "epoch": 0.31, "learning_rate": 0.0002529797994198781, "loss": 0.0183, "step": 120930 }, { "epoch": 0.31, "learning_rate": 0.00025297591120350665, "loss": 0.0201, "step": 120940 }, { "epoch": 0.31, "learning_rate": 0.00025297202298713516, "loss": 0.0222, "step": 120950 }, { "epoch": 0.31, "learning_rate": 0.0002529681347707637, "loss": 0.0182, "step": 120960 }, { "epoch": 0.31, "learning_rate": 0.00025296424655439224, "loss": 0.0213, "step": 120970 }, { "epoch": 0.31, "learning_rate": 0.00025296035833802076, "loss": 0.0224, "step": 120980 }, { "epoch": 0.31, "learning_rate": 0.00025295647012164933, "loss": 0.0173, "step": 120990 }, { "epoch": 0.31, "learning_rate": 0.00025295258190527784, "loss": 0.0219, "step": 121000 }, { "epoch": 0.31, "eval_cer": 0.8817992612716261, "eval_loss": 0.015187835320830345, "eval_runtime": 107.3871, "eval_samples_per_second": 18.624, "eval_steps_per_second": 4.656, "step": 121000 }, { "epoch": 0.31, "learning_rate": 0.00025294869368890636, "loss": 0.0245, "step": 121010 }, { "epoch": 0.31, "learning_rate": 0.0002529448054725349, "loss": 0.0248, "step": 121020 }, { "epoch": 0.31, "learning_rate": 0.00025294091725616344, "loss": 0.0209, "step": 121030 }, { "epoch": 0.31, "learning_rate": 0.000252937029039792, "loss": 0.0217, "step": 121040 }, { "epoch": 0.31, "learning_rate": 0.0002529331408234205, "loss": 0.0222, "step": 121050 }, { "epoch": 0.31, "learning_rate": 0.0002529292526070491, "loss": 0.0213, "step": 121060 }, { "epoch": 0.31, "learning_rate": 0.0002529253643906776, "loss": 0.0208, "step": 121070 }, { "epoch": 0.31, "learning_rate": 0.0002529214761743061, "loss": 0.0194, "step": 121080 }, { "epoch": 0.31, "learning_rate": 0.00025291758795793464, "loss": 0.0206, "step": 121090 }, { "epoch": 0.31, "learning_rate": 0.0002529136997415632, "loss": 0.0216, "step": 121100 }, { "epoch": 0.31, "learning_rate": 0.0002529098115251917, "loss": 0.0208, "step": 121110 }, { "epoch": 0.31, "learning_rate": 0.0002529059233088203, "loss": 0.0183, "step": 121120 }, { "epoch": 0.31, "learning_rate": 0.0002529020350924488, "loss": 0.0198, "step": 121130 }, { "epoch": 0.31, "learning_rate": 0.0002528981468760773, "loss": 0.0227, "step": 121140 }, { "epoch": 0.31, "learning_rate": 0.0002528942586597059, "loss": 0.0174, "step": 121150 }, { "epoch": 0.31, "learning_rate": 0.0002528903704433344, "loss": 0.0201, "step": 121160 }, { "epoch": 0.31, "learning_rate": 0.0002528864822269629, "loss": 0.0207, "step": 121170 }, { "epoch": 0.31, "learning_rate": 0.0002528825940105915, "loss": 0.0196, "step": 121180 }, { "epoch": 0.31, "learning_rate": 0.00025287870579422005, "loss": 0.0244, "step": 121190 }, { "epoch": 0.31, "learning_rate": 0.00025287481757784857, "loss": 0.0205, "step": 121200 }, { "epoch": 0.31, "learning_rate": 0.0002528709293614771, "loss": 0.0209, "step": 121210 }, { "epoch": 0.31, "learning_rate": 0.0002528670411451056, "loss": 0.021, "step": 121220 }, { "epoch": 0.31, "learning_rate": 0.00025286315292873416, "loss": 0.0207, "step": 121230 }, { "epoch": 0.31, "learning_rate": 0.0002528592647123627, "loss": 0.0232, "step": 121240 }, { "epoch": 0.31, "learning_rate": 0.00025285537649599125, "loss": 0.0245, "step": 121250 }, { "epoch": 0.31, "learning_rate": 0.00025285148827961976, "loss": 0.0224, "step": 121260 }, { "epoch": 0.31, "learning_rate": 0.00025284760006324833, "loss": 0.0206, "step": 121270 }, { "epoch": 0.31, "learning_rate": 0.00025284371184687685, "loss": 0.0188, "step": 121280 }, { "epoch": 0.31, "learning_rate": 0.00025283982363050536, "loss": 0.0211, "step": 121290 }, { "epoch": 0.31, "learning_rate": 0.0002528359354141339, "loss": 0.0218, "step": 121300 }, { "epoch": 0.31, "learning_rate": 0.00025283204719776244, "loss": 0.0212, "step": 121310 }, { "epoch": 0.31, "learning_rate": 0.00025282815898139096, "loss": 0.0267, "step": 121320 }, { "epoch": 0.31, "learning_rate": 0.0002528242707650195, "loss": 0.0202, "step": 121330 }, { "epoch": 0.31, "learning_rate": 0.00025282038254864804, "loss": 0.0201, "step": 121340 }, { "epoch": 0.31, "learning_rate": 0.00025281649433227656, "loss": 0.0165, "step": 121350 }, { "epoch": 0.31, "learning_rate": 0.0002528126061159051, "loss": 0.0182, "step": 121360 }, { "epoch": 0.31, "learning_rate": 0.00025280871789953364, "loss": 0.0164, "step": 121370 }, { "epoch": 0.31, "learning_rate": 0.00025280482968316215, "loss": 0.0263, "step": 121380 }, { "epoch": 0.31, "learning_rate": 0.0002528009414667907, "loss": 0.0191, "step": 121390 }, { "epoch": 0.31, "learning_rate": 0.0002527970532504193, "loss": 0.018, "step": 121400 }, { "epoch": 0.31, "learning_rate": 0.0002527931650340478, "loss": 0.0179, "step": 121410 }, { "epoch": 0.31, "learning_rate": 0.0002527892768176763, "loss": 0.0237, "step": 121420 }, { "epoch": 0.31, "learning_rate": 0.00025278538860130483, "loss": 0.0168, "step": 121430 }, { "epoch": 0.31, "learning_rate": 0.0002527815003849334, "loss": 0.0226, "step": 121440 }, { "epoch": 0.31, "learning_rate": 0.0002527776121685619, "loss": 0.0178, "step": 121450 }, { "epoch": 0.31, "learning_rate": 0.0002527737239521905, "loss": 0.0236, "step": 121460 }, { "epoch": 0.31, "learning_rate": 0.000252769835735819, "loss": 0.0255, "step": 121470 }, { "epoch": 0.31, "learning_rate": 0.00025276594751944757, "loss": 0.0256, "step": 121480 }, { "epoch": 0.31, "learning_rate": 0.0002527620593030761, "loss": 0.0208, "step": 121490 }, { "epoch": 0.31, "learning_rate": 0.0002527581710867046, "loss": 0.0197, "step": 121500 }, { "epoch": 0.31, "learning_rate": 0.0002527542828703331, "loss": 0.0202, "step": 121510 }, { "epoch": 0.31, "learning_rate": 0.0002527503946539617, "loss": 0.0247, "step": 121520 }, { "epoch": 0.32, "learning_rate": 0.0002527465064375902, "loss": 0.0168, "step": 121530 }, { "epoch": 0.32, "learning_rate": 0.00025274261822121877, "loss": 0.0154, "step": 121540 }, { "epoch": 0.32, "learning_rate": 0.0002527387300048473, "loss": 0.0227, "step": 121550 }, { "epoch": 0.32, "learning_rate": 0.00025273484178847585, "loss": 0.0195, "step": 121560 }, { "epoch": 0.32, "learning_rate": 0.00025273095357210436, "loss": 0.0211, "step": 121570 }, { "epoch": 0.32, "learning_rate": 0.0002527270653557329, "loss": 0.0187, "step": 121580 }, { "epoch": 0.32, "learning_rate": 0.00025272317713936145, "loss": 0.0191, "step": 121590 }, { "epoch": 0.32, "learning_rate": 0.00025271928892298996, "loss": 0.0189, "step": 121600 }, { "epoch": 0.32, "learning_rate": 0.00025271540070661853, "loss": 0.0172, "step": 121610 }, { "epoch": 0.32, "learning_rate": 0.00025271151249024704, "loss": 0.0167, "step": 121620 }, { "epoch": 0.32, "learning_rate": 0.00025270762427387556, "loss": 0.027, "step": 121630 }, { "epoch": 0.32, "learning_rate": 0.0002527037360575041, "loss": 0.0156, "step": 121640 }, { "epoch": 0.32, "learning_rate": 0.00025269984784113264, "loss": 0.0225, "step": 121650 }, { "epoch": 0.32, "learning_rate": 0.00025269595962476116, "loss": 0.0206, "step": 121660 }, { "epoch": 0.32, "learning_rate": 0.0002526920714083897, "loss": 0.0227, "step": 121670 }, { "epoch": 0.32, "learning_rate": 0.00025268818319201824, "loss": 0.0271, "step": 121680 }, { "epoch": 0.32, "learning_rate": 0.0002526842949756468, "loss": 0.0195, "step": 121690 }, { "epoch": 0.32, "learning_rate": 0.0002526804067592753, "loss": 0.0181, "step": 121700 }, { "epoch": 0.32, "learning_rate": 0.00025267651854290384, "loss": 0.0248, "step": 121710 }, { "epoch": 0.32, "learning_rate": 0.00025267263032653235, "loss": 0.0211, "step": 121720 }, { "epoch": 0.32, "learning_rate": 0.0002526687421101609, "loss": 0.0165, "step": 121730 }, { "epoch": 0.32, "learning_rate": 0.0002526648538937895, "loss": 0.0188, "step": 121740 }, { "epoch": 0.32, "learning_rate": 0.000252660965677418, "loss": 0.0176, "step": 121750 }, { "epoch": 0.32, "learning_rate": 0.0002526570774610465, "loss": 0.0165, "step": 121760 }, { "epoch": 0.32, "learning_rate": 0.0002526531892446751, "loss": 0.0231, "step": 121770 }, { "epoch": 0.32, "learning_rate": 0.0002526493010283036, "loss": 0.0189, "step": 121780 }, { "epoch": 0.32, "learning_rate": 0.0002526454128119321, "loss": 0.0177, "step": 121790 }, { "epoch": 0.32, "learning_rate": 0.0002526415245955607, "loss": 0.0243, "step": 121800 }, { "epoch": 0.32, "learning_rate": 0.0002526376363791892, "loss": 0.0218, "step": 121810 }, { "epoch": 0.32, "learning_rate": 0.00025263374816281777, "loss": 0.022, "step": 121820 }, { "epoch": 0.32, "learning_rate": 0.0002526298599464463, "loss": 0.0189, "step": 121830 }, { "epoch": 0.32, "learning_rate": 0.0002526259717300748, "loss": 0.0157, "step": 121840 }, { "epoch": 0.32, "learning_rate": 0.0002526220835137033, "loss": 0.0208, "step": 121850 }, { "epoch": 0.32, "learning_rate": 0.0002526181952973319, "loss": 0.0236, "step": 121860 }, { "epoch": 0.32, "learning_rate": 0.0002526143070809604, "loss": 0.0174, "step": 121870 }, { "epoch": 0.32, "learning_rate": 0.00025261041886458896, "loss": 0.0222, "step": 121880 }, { "epoch": 0.32, "learning_rate": 0.0002526065306482175, "loss": 0.0222, "step": 121890 }, { "epoch": 0.32, "learning_rate": 0.00025260264243184605, "loss": 0.0183, "step": 121900 }, { "epoch": 0.32, "learning_rate": 0.00025259875421547456, "loss": 0.0179, "step": 121910 }, { "epoch": 0.32, "learning_rate": 0.0002525948659991031, "loss": 0.0251, "step": 121920 }, { "epoch": 0.32, "learning_rate": 0.0002525909777827316, "loss": 0.0172, "step": 121930 }, { "epoch": 0.32, "learning_rate": 0.00025258708956636016, "loss": 0.0188, "step": 121940 }, { "epoch": 0.32, "learning_rate": 0.00025258320134998873, "loss": 0.0169, "step": 121950 }, { "epoch": 0.32, "learning_rate": 0.00025257931313361724, "loss": 0.0192, "step": 121960 }, { "epoch": 0.32, "learning_rate": 0.00025257542491724576, "loss": 0.019, "step": 121970 }, { "epoch": 0.32, "learning_rate": 0.0002525715367008743, "loss": 0.0195, "step": 121980 }, { "epoch": 0.32, "learning_rate": 0.00025256764848450284, "loss": 0.0207, "step": 121990 }, { "epoch": 0.32, "learning_rate": 0.00025256376026813136, "loss": 0.022, "step": 122000 }, { "epoch": 0.32, "eval_cer": 0.8817992612716261, "eval_loss": 0.014596437104046345, "eval_runtime": 107.3326, "eval_samples_per_second": 18.634, "eval_steps_per_second": 4.658, "step": 122000 }, { "epoch": 0.32, "learning_rate": 0.0002525598720517599, "loss": 0.0222, "step": 122010 }, { "epoch": 0.32, "learning_rate": 0.00025255598383538844, "loss": 0.021, "step": 122020 }, { "epoch": 0.32, "learning_rate": 0.000252552095619017, "loss": 0.0211, "step": 122030 }, { "epoch": 0.32, "learning_rate": 0.0002525482074026455, "loss": 0.0231, "step": 122040 }, { "epoch": 0.32, "learning_rate": 0.00025254431918627404, "loss": 0.025, "step": 122050 }, { "epoch": 0.32, "learning_rate": 0.0002525404309699026, "loss": 0.0221, "step": 122060 }, { "epoch": 0.32, "learning_rate": 0.0002525365427535311, "loss": 0.0211, "step": 122070 }, { "epoch": 0.32, "learning_rate": 0.0002525326545371597, "loss": 0.0206, "step": 122080 }, { "epoch": 0.32, "learning_rate": 0.0002525287663207882, "loss": 0.0259, "step": 122090 }, { "epoch": 0.32, "learning_rate": 0.0002525248781044167, "loss": 0.0188, "step": 122100 }, { "epoch": 0.32, "learning_rate": 0.0002525209898880453, "loss": 0.0224, "step": 122110 }, { "epoch": 0.32, "learning_rate": 0.0002525171016716738, "loss": 0.0218, "step": 122120 }, { "epoch": 0.32, "learning_rate": 0.0002525132134553023, "loss": 0.0206, "step": 122130 }, { "epoch": 0.32, "learning_rate": 0.0002525093252389309, "loss": 0.028, "step": 122140 }, { "epoch": 0.32, "learning_rate": 0.0002525054370225594, "loss": 0.0221, "step": 122150 }, { "epoch": 0.32, "learning_rate": 0.00025250154880618797, "loss": 0.0199, "step": 122160 }, { "epoch": 0.32, "learning_rate": 0.0002524976605898165, "loss": 0.0213, "step": 122170 }, { "epoch": 0.32, "learning_rate": 0.000252493772373445, "loss": 0.0235, "step": 122180 }, { "epoch": 0.32, "learning_rate": 0.00025248988415707357, "loss": 0.0197, "step": 122190 }, { "epoch": 0.32, "learning_rate": 0.0002524859959407021, "loss": 0.0199, "step": 122200 }, { "epoch": 0.32, "learning_rate": 0.0002524821077243306, "loss": 0.0241, "step": 122210 }, { "epoch": 0.32, "learning_rate": 0.00025247821950795916, "loss": 0.0236, "step": 122220 }, { "epoch": 0.32, "learning_rate": 0.00025247433129158773, "loss": 0.021, "step": 122230 }, { "epoch": 0.32, "learning_rate": 0.00025247044307521625, "loss": 0.0214, "step": 122240 }, { "epoch": 0.32, "learning_rate": 0.00025246655485884476, "loss": 0.0242, "step": 122250 }, { "epoch": 0.32, "learning_rate": 0.0002524626666424733, "loss": 0.0202, "step": 122260 }, { "epoch": 0.32, "learning_rate": 0.00025245877842610184, "loss": 0.0181, "step": 122270 }, { "epoch": 0.32, "learning_rate": 0.00025245489020973036, "loss": 0.0225, "step": 122280 }, { "epoch": 0.32, "learning_rate": 0.00025245100199335893, "loss": 0.0226, "step": 122290 }, { "epoch": 0.32, "learning_rate": 0.00025244711377698744, "loss": 0.0238, "step": 122300 }, { "epoch": 0.32, "learning_rate": 0.000252443225560616, "loss": 0.0197, "step": 122310 }, { "epoch": 0.32, "learning_rate": 0.0002524393373442445, "loss": 0.0215, "step": 122320 }, { "epoch": 0.32, "learning_rate": 0.00025243544912787304, "loss": 0.0239, "step": 122330 }, { "epoch": 0.32, "learning_rate": 0.00025243156091150155, "loss": 0.0213, "step": 122340 }, { "epoch": 0.32, "learning_rate": 0.0002524276726951301, "loss": 0.0194, "step": 122350 }, { "epoch": 0.32, "learning_rate": 0.00025242378447875864, "loss": 0.0188, "step": 122360 }, { "epoch": 0.32, "learning_rate": 0.0002524198962623872, "loss": 0.0185, "step": 122370 }, { "epoch": 0.32, "learning_rate": 0.0002524160080460157, "loss": 0.0214, "step": 122380 }, { "epoch": 0.32, "learning_rate": 0.00025241211982964424, "loss": 0.0222, "step": 122390 }, { "epoch": 0.32, "learning_rate": 0.0002524082316132728, "loss": 0.0225, "step": 122400 }, { "epoch": 0.32, "learning_rate": 0.0002524043433969013, "loss": 0.02, "step": 122410 }, { "epoch": 0.32, "learning_rate": 0.00025240045518052983, "loss": 0.0207, "step": 122420 }, { "epoch": 0.32, "learning_rate": 0.0002523965669641584, "loss": 0.0228, "step": 122430 }, { "epoch": 0.32, "learning_rate": 0.00025239267874778697, "loss": 0.0216, "step": 122440 }, { "epoch": 0.32, "learning_rate": 0.0002523887905314155, "loss": 0.0292, "step": 122450 }, { "epoch": 0.32, "learning_rate": 0.000252384902315044, "loss": 0.0216, "step": 122460 }, { "epoch": 0.32, "learning_rate": 0.0002523810140986725, "loss": 0.0214, "step": 122470 }, { "epoch": 0.32, "learning_rate": 0.0002523771258823011, "loss": 0.0217, "step": 122480 }, { "epoch": 0.32, "learning_rate": 0.0002523732376659296, "loss": 0.0212, "step": 122490 }, { "epoch": 0.32, "learning_rate": 0.00025236934944955817, "loss": 0.0199, "step": 122500 }, { "epoch": 0.32, "learning_rate": 0.0002523654612331867, "loss": 0.0219, "step": 122510 }, { "epoch": 0.32, "learning_rate": 0.00025236157301681525, "loss": 0.0232, "step": 122520 }, { "epoch": 0.32, "learning_rate": 0.00025235768480044376, "loss": 0.0243, "step": 122530 }, { "epoch": 0.32, "learning_rate": 0.0002523537965840723, "loss": 0.0204, "step": 122540 }, { "epoch": 0.32, "learning_rate": 0.0002523499083677008, "loss": 0.0185, "step": 122550 }, { "epoch": 0.32, "learning_rate": 0.00025234602015132936, "loss": 0.0233, "step": 122560 }, { "epoch": 0.32, "learning_rate": 0.0002523421319349579, "loss": 0.0249, "step": 122570 }, { "epoch": 0.32, "learning_rate": 0.00025233824371858645, "loss": 0.0151, "step": 122580 }, { "epoch": 0.32, "learning_rate": 0.00025233435550221496, "loss": 0.0225, "step": 122590 }, { "epoch": 0.32, "learning_rate": 0.0002523304672858435, "loss": 0.0215, "step": 122600 }, { "epoch": 0.32, "learning_rate": 0.00025232657906947204, "loss": 0.0184, "step": 122610 }, { "epoch": 0.32, "learning_rate": 0.00025232269085310056, "loss": 0.0186, "step": 122620 }, { "epoch": 0.32, "learning_rate": 0.0002523188026367291, "loss": 0.0216, "step": 122630 }, { "epoch": 0.32, "learning_rate": 0.00025231491442035764, "loss": 0.0255, "step": 122640 }, { "epoch": 0.32, "learning_rate": 0.0002523110262039862, "loss": 0.0215, "step": 122650 }, { "epoch": 0.32, "learning_rate": 0.0002523071379876147, "loss": 0.0246, "step": 122660 }, { "epoch": 0.32, "learning_rate": 0.00025230324977124324, "loss": 0.025, "step": 122670 }, { "epoch": 0.32, "learning_rate": 0.00025229936155487175, "loss": 0.0224, "step": 122680 }, { "epoch": 0.32, "learning_rate": 0.0002522954733385003, "loss": 0.0175, "step": 122690 }, { "epoch": 0.32, "learning_rate": 0.00025229158512212884, "loss": 0.0198, "step": 122700 }, { "epoch": 0.32, "learning_rate": 0.0002522876969057574, "loss": 0.0201, "step": 122710 }, { "epoch": 0.32, "learning_rate": 0.0002522838086893859, "loss": 0.0172, "step": 122720 }, { "epoch": 0.32, "learning_rate": 0.0002522799204730145, "loss": 0.0209, "step": 122730 }, { "epoch": 0.32, "learning_rate": 0.000252276032256643, "loss": 0.0203, "step": 122740 }, { "epoch": 0.32, "learning_rate": 0.0002522721440402715, "loss": 0.0225, "step": 122750 }, { "epoch": 0.32, "learning_rate": 0.00025226825582390003, "loss": 0.023, "step": 122760 }, { "epoch": 0.32, "learning_rate": 0.0002522643676075286, "loss": 0.0218, "step": 122770 }, { "epoch": 0.32, "learning_rate": 0.00025226047939115717, "loss": 0.0203, "step": 122780 }, { "epoch": 0.32, "learning_rate": 0.0002522565911747857, "loss": 0.0195, "step": 122790 }, { "epoch": 0.32, "learning_rate": 0.0002522527029584142, "loss": 0.018, "step": 122800 }, { "epoch": 0.32, "learning_rate": 0.00025224881474204277, "loss": 0.0222, "step": 122810 }, { "epoch": 0.32, "learning_rate": 0.0002522449265256713, "loss": 0.0215, "step": 122820 }, { "epoch": 0.32, "learning_rate": 0.0002522410383092998, "loss": 0.0203, "step": 122830 }, { "epoch": 0.32, "learning_rate": 0.00025223715009292837, "loss": 0.0382, "step": 122840 }, { "epoch": 0.32, "learning_rate": 0.0002522332618765569, "loss": 0.021, "step": 122850 }, { "epoch": 0.32, "learning_rate": 0.00025222937366018545, "loss": 0.0275, "step": 122860 }, { "epoch": 0.32, "learning_rate": 0.00025222548544381396, "loss": 0.0171, "step": 122870 }, { "epoch": 0.32, "learning_rate": 0.0002522215972274425, "loss": 0.0314, "step": 122880 }, { "epoch": 0.32, "learning_rate": 0.000252217709011071, "loss": 0.0213, "step": 122890 }, { "epoch": 0.32, "learning_rate": 0.00025221382079469956, "loss": 0.0243, "step": 122900 }, { "epoch": 0.32, "learning_rate": 0.0002522099325783281, "loss": 0.0176, "step": 122910 }, { "epoch": 0.32, "learning_rate": 0.00025220604436195664, "loss": 0.0387, "step": 122920 }, { "epoch": 0.32, "learning_rate": 0.00025220215614558516, "loss": 0.038, "step": 122930 }, { "epoch": 0.32, "learning_rate": 0.00025219826792921373, "loss": 0.0198, "step": 122940 }, { "epoch": 0.32, "learning_rate": 0.00025219437971284224, "loss": 0.0229, "step": 122950 }, { "epoch": 0.32, "learning_rate": 0.00025219049149647076, "loss": 0.0242, "step": 122960 }, { "epoch": 0.32, "learning_rate": 0.00025218660328009927, "loss": 0.0191, "step": 122970 }, { "epoch": 0.32, "learning_rate": 0.00025218271506372784, "loss": 0.025, "step": 122980 }, { "epoch": 0.32, "learning_rate": 0.0002521788268473564, "loss": 0.0173, "step": 122990 }, { "epoch": 0.32, "learning_rate": 0.0002521749386309849, "loss": 0.0186, "step": 123000 }, { "epoch": 0.32, "eval_cer": 0.8817936627238894, "eval_loss": 0.014675342477858067, "eval_runtime": 107.4618, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 123000 }, { "epoch": 0.32, "learning_rate": 0.00025217105041461344, "loss": 0.0247, "step": 123010 }, { "epoch": 0.32, "learning_rate": 0.000252167162198242, "loss": 0.025, "step": 123020 }, { "epoch": 0.32, "learning_rate": 0.0002521632739818705, "loss": 0.0311, "step": 123030 }, { "epoch": 0.32, "learning_rate": 0.00025215938576549904, "loss": 0.0247, "step": 123040 }, { "epoch": 0.32, "learning_rate": 0.0002521554975491276, "loss": 0.022, "step": 123050 }, { "epoch": 0.32, "learning_rate": 0.0002521516093327561, "loss": 0.0219, "step": 123060 }, { "epoch": 0.32, "learning_rate": 0.0002521477211163847, "loss": 0.0271, "step": 123070 }, { "epoch": 0.32, "learning_rate": 0.0002521438329000132, "loss": 0.0209, "step": 123080 }, { "epoch": 0.32, "learning_rate": 0.0002521399446836417, "loss": 0.0216, "step": 123090 }, { "epoch": 0.32, "learning_rate": 0.00025213605646727023, "loss": 0.019, "step": 123100 }, { "epoch": 0.32, "learning_rate": 0.0002521321682508988, "loss": 0.0241, "step": 123110 }, { "epoch": 0.32, "learning_rate": 0.0002521282800345273, "loss": 0.0206, "step": 123120 }, { "epoch": 0.32, "learning_rate": 0.0002521243918181559, "loss": 0.0212, "step": 123130 }, { "epoch": 0.32, "learning_rate": 0.0002521205036017844, "loss": 0.0256, "step": 123140 }, { "epoch": 0.32, "learning_rate": 0.00025211661538541297, "loss": 0.0208, "step": 123150 }, { "epoch": 0.32, "learning_rate": 0.0002521127271690415, "loss": 0.0233, "step": 123160 }, { "epoch": 0.32, "learning_rate": 0.00025210883895267, "loss": 0.0223, "step": 123170 }, { "epoch": 0.32, "learning_rate": 0.00025210495073629856, "loss": 0.0203, "step": 123180 }, { "epoch": 0.32, "learning_rate": 0.0002521010625199271, "loss": 0.0176, "step": 123190 }, { "epoch": 0.32, "learning_rate": 0.00025209717430355565, "loss": 0.0208, "step": 123200 }, { "epoch": 0.32, "learning_rate": 0.00025209328608718416, "loss": 0.0216, "step": 123210 }, { "epoch": 0.32, "learning_rate": 0.0002520893978708127, "loss": 0.0249, "step": 123220 }, { "epoch": 0.32, "learning_rate": 0.00025208550965444125, "loss": 0.0181, "step": 123230 }, { "epoch": 0.32, "learning_rate": 0.00025208162143806976, "loss": 0.0198, "step": 123240 }, { "epoch": 0.32, "learning_rate": 0.0002520777332216983, "loss": 0.0192, "step": 123250 }, { "epoch": 0.32, "learning_rate": 0.00025207384500532684, "loss": 0.023, "step": 123260 }, { "epoch": 0.32, "learning_rate": 0.0002520699567889554, "loss": 0.0213, "step": 123270 }, { "epoch": 0.32, "learning_rate": 0.0002520660685725839, "loss": 0.0185, "step": 123280 }, { "epoch": 0.32, "learning_rate": 0.00025206218035621244, "loss": 0.0276, "step": 123290 }, { "epoch": 0.32, "learning_rate": 0.00025205829213984096, "loss": 0.0242, "step": 123300 }, { "epoch": 0.32, "learning_rate": 0.00025205440392346947, "loss": 0.0188, "step": 123310 }, { "epoch": 0.32, "learning_rate": 0.00025205051570709804, "loss": 0.0214, "step": 123320 }, { "epoch": 0.32, "learning_rate": 0.0002520466274907266, "loss": 0.0244, "step": 123330 }, { "epoch": 0.32, "learning_rate": 0.0002520427392743551, "loss": 0.0188, "step": 123340 }, { "epoch": 0.32, "learning_rate": 0.00025203885105798364, "loss": 0.0222, "step": 123350 }, { "epoch": 0.32, "learning_rate": 0.0002520349628416122, "loss": 0.0228, "step": 123360 }, { "epoch": 0.32, "learning_rate": 0.0002520310746252407, "loss": 0.0228, "step": 123370 }, { "epoch": 0.32, "learning_rate": 0.00025202718640886923, "loss": 0.0202, "step": 123380 }, { "epoch": 0.32, "learning_rate": 0.0002520232981924978, "loss": 0.025, "step": 123390 }, { "epoch": 0.32, "learning_rate": 0.0002520194099761263, "loss": 0.0188, "step": 123400 }, { "epoch": 0.32, "learning_rate": 0.0002520155217597549, "loss": 0.0209, "step": 123410 }, { "epoch": 0.32, "learning_rate": 0.0002520116335433834, "loss": 0.0214, "step": 123420 }, { "epoch": 0.32, "learning_rate": 0.0002520077453270119, "loss": 0.0203, "step": 123430 }, { "epoch": 0.32, "learning_rate": 0.0002520038571106405, "loss": 0.0194, "step": 123440 }, { "epoch": 0.32, "learning_rate": 0.000251999968894269, "loss": 0.0243, "step": 123450 }, { "epoch": 0.32, "learning_rate": 0.0002519960806778975, "loss": 0.0217, "step": 123460 }, { "epoch": 0.32, "learning_rate": 0.0002519921924615261, "loss": 0.0196, "step": 123470 }, { "epoch": 0.32, "learning_rate": 0.00025198830424515465, "loss": 0.017, "step": 123480 }, { "epoch": 0.32, "learning_rate": 0.00025198441602878317, "loss": 0.0212, "step": 123490 }, { "epoch": 0.32, "learning_rate": 0.0002519805278124117, "loss": 0.0238, "step": 123500 }, { "epoch": 0.32, "learning_rate": 0.0002519766395960402, "loss": 0.0215, "step": 123510 }, { "epoch": 0.32, "learning_rate": 0.00025197275137966876, "loss": 0.023, "step": 123520 }, { "epoch": 0.32, "learning_rate": 0.0002519688631632973, "loss": 0.0194, "step": 123530 }, { "epoch": 0.32, "learning_rate": 0.00025196497494692585, "loss": 0.0211, "step": 123540 }, { "epoch": 0.32, "learning_rate": 0.00025196108673055436, "loss": 0.0182, "step": 123550 }, { "epoch": 0.32, "learning_rate": 0.0002519571985141829, "loss": 0.0201, "step": 123560 }, { "epoch": 0.32, "learning_rate": 0.00025195331029781144, "loss": 0.0198, "step": 123570 }, { "epoch": 0.32, "learning_rate": 0.00025194942208143996, "loss": 0.0202, "step": 123580 }, { "epoch": 0.32, "learning_rate": 0.0002519455338650685, "loss": 0.022, "step": 123590 }, { "epoch": 0.32, "learning_rate": 0.00025194164564869704, "loss": 0.0167, "step": 123600 }, { "epoch": 0.32, "learning_rate": 0.00025193775743232556, "loss": 0.0187, "step": 123610 }, { "epoch": 0.32, "learning_rate": 0.0002519338692159541, "loss": 0.0217, "step": 123620 }, { "epoch": 0.32, "learning_rate": 0.00025192998099958264, "loss": 0.0202, "step": 123630 }, { "epoch": 0.32, "learning_rate": 0.00025192609278321115, "loss": 0.0227, "step": 123640 }, { "epoch": 0.32, "learning_rate": 0.0002519222045668397, "loss": 0.0162, "step": 123650 }, { "epoch": 0.32, "learning_rate": 0.00025191831635046824, "loss": 0.0172, "step": 123660 }, { "epoch": 0.32, "learning_rate": 0.0002519144281340968, "loss": 0.0285, "step": 123670 }, { "epoch": 0.32, "learning_rate": 0.0002519105399177253, "loss": 0.022, "step": 123680 }, { "epoch": 0.32, "learning_rate": 0.0002519066517013539, "loss": 0.0183, "step": 123690 }, { "epoch": 0.32, "learning_rate": 0.0002519027634849824, "loss": 0.0222, "step": 123700 }, { "epoch": 0.32, "learning_rate": 0.0002518988752686109, "loss": 0.021, "step": 123710 }, { "epoch": 0.32, "learning_rate": 0.00025189498705223943, "loss": 0.018, "step": 123720 }, { "epoch": 0.32, "learning_rate": 0.000251891098835868, "loss": 0.0232, "step": 123730 }, { "epoch": 0.32, "learning_rate": 0.0002518872106194965, "loss": 0.0166, "step": 123740 }, { "epoch": 0.32, "learning_rate": 0.0002518833224031251, "loss": 0.0203, "step": 123750 }, { "epoch": 0.32, "learning_rate": 0.0002518794341867536, "loss": 0.0287, "step": 123760 }, { "epoch": 0.32, "learning_rate": 0.00025187554597038217, "loss": 0.0179, "step": 123770 }, { "epoch": 0.32, "learning_rate": 0.0002518716577540107, "loss": 0.0211, "step": 123780 }, { "epoch": 0.32, "learning_rate": 0.0002518677695376392, "loss": 0.018, "step": 123790 }, { "epoch": 0.32, "learning_rate": 0.0002518638813212677, "loss": 0.0184, "step": 123800 }, { "epoch": 0.32, "learning_rate": 0.0002518599931048963, "loss": 0.028, "step": 123810 }, { "epoch": 0.32, "learning_rate": 0.00025185610488852485, "loss": 0.0213, "step": 123820 }, { "epoch": 0.32, "learning_rate": 0.00025185221667215336, "loss": 0.0255, "step": 123830 }, { "epoch": 0.32, "learning_rate": 0.0002518483284557819, "loss": 0.0208, "step": 123840 }, { "epoch": 0.32, "learning_rate": 0.0002518444402394104, "loss": 0.0195, "step": 123850 }, { "epoch": 0.32, "learning_rate": 0.00025184055202303896, "loss": 0.0225, "step": 123860 }, { "epoch": 0.32, "learning_rate": 0.0002518366638066675, "loss": 0.0196, "step": 123870 }, { "epoch": 0.32, "learning_rate": 0.00025183277559029605, "loss": 0.0244, "step": 123880 }, { "epoch": 0.32, "learning_rate": 0.00025182888737392456, "loss": 0.0204, "step": 123890 }, { "epoch": 0.32, "learning_rate": 0.00025182499915755313, "loss": 0.0255, "step": 123900 }, { "epoch": 0.32, "learning_rate": 0.00025182111094118164, "loss": 0.0199, "step": 123910 }, { "epoch": 0.32, "learning_rate": 0.00025181722272481016, "loss": 0.0199, "step": 123920 }, { "epoch": 0.32, "learning_rate": 0.00025181333450843867, "loss": 0.0196, "step": 123930 }, { "epoch": 0.32, "learning_rate": 0.00025180944629206724, "loss": 0.0216, "step": 123940 }, { "epoch": 0.32, "learning_rate": 0.00025180555807569576, "loss": 0.0196, "step": 123950 }, { "epoch": 0.32, "learning_rate": 0.0002518016698593243, "loss": 0.0168, "step": 123960 }, { "epoch": 0.32, "learning_rate": 0.00025179778164295284, "loss": 0.0189, "step": 123970 }, { "epoch": 0.32, "learning_rate": 0.0002517938934265814, "loss": 0.0192, "step": 123980 }, { "epoch": 0.32, "learning_rate": 0.0002517900052102099, "loss": 0.0225, "step": 123990 }, { "epoch": 0.32, "learning_rate": 0.00025178611699383844, "loss": 0.0202, "step": 124000 }, { "epoch": 0.32, "eval_cer": 0.8818104583670996, "eval_loss": 0.014676877297461033, "eval_runtime": 107.4759, "eval_samples_per_second": 18.609, "eval_steps_per_second": 4.652, "step": 124000 }, { "epoch": 0.32, "learning_rate": 0.00025178222877746695, "loss": 0.0221, "step": 124010 }, { "epoch": 0.32, "learning_rate": 0.0002517783405610955, "loss": 0.0261, "step": 124020 }, { "epoch": 0.32, "learning_rate": 0.0002517744523447241, "loss": 0.0192, "step": 124030 }, { "epoch": 0.32, "learning_rate": 0.0002517705641283526, "loss": 0.0195, "step": 124040 }, { "epoch": 0.32, "learning_rate": 0.0002517666759119811, "loss": 0.0262, "step": 124050 }, { "epoch": 0.32, "learning_rate": 0.00025176278769560963, "loss": 0.0215, "step": 124060 }, { "epoch": 0.32, "learning_rate": 0.0002517588994792382, "loss": 0.0199, "step": 124070 }, { "epoch": 0.32, "learning_rate": 0.0002517550112628667, "loss": 0.0188, "step": 124080 }, { "epoch": 0.32, "learning_rate": 0.0002517511230464953, "loss": 0.02, "step": 124090 }, { "epoch": 0.32, "learning_rate": 0.0002517472348301238, "loss": 0.0207, "step": 124100 }, { "epoch": 0.32, "learning_rate": 0.00025174334661375237, "loss": 0.0262, "step": 124110 }, { "epoch": 0.32, "learning_rate": 0.0002517394583973809, "loss": 0.0236, "step": 124120 }, { "epoch": 0.32, "learning_rate": 0.0002517355701810094, "loss": 0.0206, "step": 124130 }, { "epoch": 0.32, "learning_rate": 0.0002517316819646379, "loss": 0.0224, "step": 124140 }, { "epoch": 0.32, "learning_rate": 0.0002517277937482665, "loss": 0.0224, "step": 124150 }, { "epoch": 0.32, "learning_rate": 0.000251723905531895, "loss": 0.0225, "step": 124160 }, { "epoch": 0.32, "learning_rate": 0.00025172001731552356, "loss": 0.0191, "step": 124170 }, { "epoch": 0.32, "learning_rate": 0.0002517161290991521, "loss": 0.0218, "step": 124180 }, { "epoch": 0.32, "learning_rate": 0.00025171224088278065, "loss": 0.0212, "step": 124190 }, { "epoch": 0.32, "learning_rate": 0.00025170835266640916, "loss": 0.0253, "step": 124200 }, { "epoch": 0.32, "learning_rate": 0.0002517044644500377, "loss": 0.0269, "step": 124210 }, { "epoch": 0.32, "learning_rate": 0.00025170057623366624, "loss": 0.0265, "step": 124220 }, { "epoch": 0.32, "learning_rate": 0.00025169668801729476, "loss": 0.0196, "step": 124230 }, { "epoch": 0.32, "learning_rate": 0.00025169279980092333, "loss": 0.0232, "step": 124240 }, { "epoch": 0.32, "learning_rate": 0.00025168891158455184, "loss": 0.0222, "step": 124250 }, { "epoch": 0.32, "learning_rate": 0.00025168502336818036, "loss": 0.0178, "step": 124260 }, { "epoch": 0.32, "learning_rate": 0.0002516811351518089, "loss": 0.0208, "step": 124270 }, { "epoch": 0.32, "learning_rate": 0.00025167724693543744, "loss": 0.0233, "step": 124280 }, { "epoch": 0.32, "learning_rate": 0.00025167335871906595, "loss": 0.016, "step": 124290 }, { "epoch": 0.32, "learning_rate": 0.0002516694705026945, "loss": 0.0219, "step": 124300 }, { "epoch": 0.32, "learning_rate": 0.00025166558228632304, "loss": 0.0211, "step": 124310 }, { "epoch": 0.32, "learning_rate": 0.0002516616940699516, "loss": 0.0177, "step": 124320 }, { "epoch": 0.32, "learning_rate": 0.0002516578058535801, "loss": 0.023, "step": 124330 }, { "epoch": 0.32, "learning_rate": 0.00025165391763720864, "loss": 0.0228, "step": 124340 }, { "epoch": 0.32, "learning_rate": 0.00025165002942083715, "loss": 0.0186, "step": 124350 }, { "epoch": 0.32, "learning_rate": 0.0002516461412044657, "loss": 0.0283, "step": 124360 }, { "epoch": 0.32, "learning_rate": 0.0002516422529880943, "loss": 0.0212, "step": 124370 }, { "epoch": 0.32, "learning_rate": 0.0002516383647717228, "loss": 0.0202, "step": 124380 }, { "epoch": 0.32, "learning_rate": 0.0002516344765553513, "loss": 0.0259, "step": 124390 }, { "epoch": 0.32, "learning_rate": 0.0002516305883389799, "loss": 0.0225, "step": 124400 }, { "epoch": 0.32, "learning_rate": 0.0002516267001226084, "loss": 0.0201, "step": 124410 }, { "epoch": 0.32, "learning_rate": 0.0002516228119062369, "loss": 0.0157, "step": 124420 }, { "epoch": 0.32, "learning_rate": 0.0002516189236898655, "loss": 0.0159, "step": 124430 }, { "epoch": 0.32, "learning_rate": 0.000251615035473494, "loss": 0.0193, "step": 124440 }, { "epoch": 0.32, "learning_rate": 0.00025161114725712257, "loss": 0.0249, "step": 124450 }, { "epoch": 0.32, "learning_rate": 0.0002516072590407511, "loss": 0.019, "step": 124460 }, { "epoch": 0.32, "learning_rate": 0.0002516033708243796, "loss": 0.024, "step": 124470 }, { "epoch": 0.32, "learning_rate": 0.00025159948260800816, "loss": 0.0227, "step": 124480 }, { "epoch": 0.32, "learning_rate": 0.0002515955943916367, "loss": 0.0208, "step": 124490 }, { "epoch": 0.32, "learning_rate": 0.0002515917061752652, "loss": 0.0205, "step": 124500 }, { "epoch": 0.32, "learning_rate": 0.00025158781795889376, "loss": 0.022, "step": 124510 }, { "epoch": 0.32, "learning_rate": 0.00025158392974252233, "loss": 0.0238, "step": 124520 }, { "epoch": 0.32, "learning_rate": 0.00025158004152615085, "loss": 0.0198, "step": 124530 }, { "epoch": 0.32, "learning_rate": 0.00025157615330977936, "loss": 0.0205, "step": 124540 }, { "epoch": 0.32, "learning_rate": 0.0002515722650934079, "loss": 0.0181, "step": 124550 }, { "epoch": 0.32, "learning_rate": 0.0002515683768770364, "loss": 0.0204, "step": 124560 }, { "epoch": 0.32, "learning_rate": 0.00025156448866066496, "loss": 0.0172, "step": 124570 }, { "epoch": 0.32, "learning_rate": 0.0002515606004442935, "loss": 0.0179, "step": 124580 }, { "epoch": 0.32, "learning_rate": 0.00025155671222792204, "loss": 0.0209, "step": 124590 }, { "epoch": 0.32, "learning_rate": 0.00025155282401155056, "loss": 0.0255, "step": 124600 }, { "epoch": 0.32, "learning_rate": 0.0002515489357951791, "loss": 0.0176, "step": 124610 }, { "epoch": 0.32, "learning_rate": 0.00025154504757880764, "loss": 0.019, "step": 124620 }, { "epoch": 0.32, "learning_rate": 0.00025154115936243615, "loss": 0.0169, "step": 124630 }, { "epoch": 0.32, "learning_rate": 0.0002515372711460647, "loss": 0.0262, "step": 124640 }, { "epoch": 0.32, "learning_rate": 0.00025153338292969324, "loss": 0.0184, "step": 124650 }, { "epoch": 0.32, "learning_rate": 0.0002515294947133218, "loss": 0.0194, "step": 124660 }, { "epoch": 0.32, "learning_rate": 0.0002515256064969503, "loss": 0.0214, "step": 124670 }, { "epoch": 0.32, "learning_rate": 0.00025152171828057883, "loss": 0.0153, "step": 124680 }, { "epoch": 0.32, "learning_rate": 0.0002515178300642074, "loss": 0.0226, "step": 124690 }, { "epoch": 0.32, "learning_rate": 0.0002515139418478359, "loss": 0.0199, "step": 124700 }, { "epoch": 0.32, "learning_rate": 0.00025151005363146443, "loss": 0.0219, "step": 124710 }, { "epoch": 0.32, "learning_rate": 0.000251506165415093, "loss": 0.0261, "step": 124720 }, { "epoch": 0.32, "learning_rate": 0.00025150227719872157, "loss": 0.022, "step": 124730 }, { "epoch": 0.32, "learning_rate": 0.0002514983889823501, "loss": 0.0253, "step": 124740 }, { "epoch": 0.32, "learning_rate": 0.0002514945007659786, "loss": 0.0252, "step": 124750 }, { "epoch": 0.32, "learning_rate": 0.0002514906125496071, "loss": 0.018, "step": 124760 }, { "epoch": 0.32, "learning_rate": 0.0002514867243332357, "loss": 0.0213, "step": 124770 }, { "epoch": 0.32, "learning_rate": 0.0002514828361168642, "loss": 0.0212, "step": 124780 }, { "epoch": 0.32, "learning_rate": 0.00025147894790049276, "loss": 0.018, "step": 124790 }, { "epoch": 0.32, "learning_rate": 0.0002514750596841213, "loss": 0.0188, "step": 124800 }, { "epoch": 0.32, "learning_rate": 0.0002514711714677498, "loss": 0.0222, "step": 124810 }, { "epoch": 0.32, "learning_rate": 0.00025146728325137836, "loss": 0.0192, "step": 124820 }, { "epoch": 0.32, "learning_rate": 0.0002514633950350069, "loss": 0.0219, "step": 124830 }, { "epoch": 0.32, "learning_rate": 0.0002514595068186354, "loss": 0.0234, "step": 124840 }, { "epoch": 0.32, "learning_rate": 0.00025145561860226396, "loss": 0.0169, "step": 124850 }, { "epoch": 0.32, "learning_rate": 0.00025145173038589253, "loss": 0.021, "step": 124860 }, { "epoch": 0.32, "learning_rate": 0.00025144784216952104, "loss": 0.0215, "step": 124870 }, { "epoch": 0.32, "learning_rate": 0.00025144395395314956, "loss": 0.0225, "step": 124880 }, { "epoch": 0.32, "learning_rate": 0.0002514400657367781, "loss": 0.0195, "step": 124890 }, { "epoch": 0.32, "learning_rate": 0.00025143617752040664, "loss": 0.0213, "step": 124900 }, { "epoch": 0.32, "learning_rate": 0.00025143228930403516, "loss": 0.0206, "step": 124910 }, { "epoch": 0.32, "learning_rate": 0.0002514284010876637, "loss": 0.0211, "step": 124920 }, { "epoch": 0.32, "learning_rate": 0.00025142451287129224, "loss": 0.0205, "step": 124930 }, { "epoch": 0.32, "learning_rate": 0.0002514206246549208, "loss": 0.026, "step": 124940 }, { "epoch": 0.32, "learning_rate": 0.0002514167364385493, "loss": 0.062, "step": 124950 }, { "epoch": 0.32, "learning_rate": 0.00025141284822217784, "loss": 0.0207, "step": 124960 }, { "epoch": 0.32, "learning_rate": 0.00025140896000580635, "loss": 0.0191, "step": 124970 }, { "epoch": 0.32, "learning_rate": 0.0002514050717894349, "loss": 0.0331, "step": 124980 }, { "epoch": 0.32, "learning_rate": 0.00025140118357306344, "loss": 0.0186, "step": 124990 }, { "epoch": 0.32, "learning_rate": 0.000251397295356692, "loss": 0.0224, "step": 125000 }, { "epoch": 0.32, "eval_cer": 0.8818118580040337, "eval_loss": 0.01477042119950056, "eval_runtime": 107.7289, "eval_samples_per_second": 18.565, "eval_steps_per_second": 4.641, "step": 125000 }, { "epoch": 0.32, "learning_rate": 0.0002513934071403205, "loss": 0.0177, "step": 125010 }, { "epoch": 0.32, "learning_rate": 0.0002513895189239491, "loss": 0.0228, "step": 125020 }, { "epoch": 0.32, "learning_rate": 0.0002513856307075776, "loss": 0.02, "step": 125030 }, { "epoch": 0.32, "learning_rate": 0.0002513817424912061, "loss": 0.0206, "step": 125040 }, { "epoch": 0.32, "learning_rate": 0.00025137785427483463, "loss": 0.0192, "step": 125050 }, { "epoch": 0.32, "learning_rate": 0.0002513739660584632, "loss": 0.0262, "step": 125060 }, { "epoch": 0.32, "learning_rate": 0.00025137007784209177, "loss": 0.0206, "step": 125070 }, { "epoch": 0.32, "learning_rate": 0.0002513661896257203, "loss": 0.022, "step": 125080 }, { "epoch": 0.32, "learning_rate": 0.0002513623014093488, "loss": 0.0263, "step": 125090 }, { "epoch": 0.32, "learning_rate": 0.0002513584131929773, "loss": 0.0224, "step": 125100 }, { "epoch": 0.32, "learning_rate": 0.0002513545249766059, "loss": 0.023, "step": 125110 }, { "epoch": 0.32, "learning_rate": 0.0002513506367602344, "loss": 0.018, "step": 125120 }, { "epoch": 0.32, "learning_rate": 0.00025134674854386296, "loss": 0.0184, "step": 125130 }, { "epoch": 0.32, "learning_rate": 0.0002513428603274915, "loss": 0.0243, "step": 125140 }, { "epoch": 0.32, "learning_rate": 0.00025133897211112005, "loss": 0.0185, "step": 125150 }, { "epoch": 0.32, "learning_rate": 0.00025133508389474856, "loss": 0.0221, "step": 125160 }, { "epoch": 0.32, "learning_rate": 0.0002513311956783771, "loss": 0.0222, "step": 125170 }, { "epoch": 0.32, "learning_rate": 0.0002513273074620056, "loss": 0.0198, "step": 125180 }, { "epoch": 0.32, "learning_rate": 0.00025132341924563416, "loss": 0.0197, "step": 125190 }, { "epoch": 0.32, "learning_rate": 0.0002513195310292627, "loss": 0.018, "step": 125200 }, { "epoch": 0.32, "learning_rate": 0.00025131564281289124, "loss": 0.0199, "step": 125210 }, { "epoch": 0.32, "learning_rate": 0.00025131175459651976, "loss": 0.0224, "step": 125220 }, { "epoch": 0.32, "learning_rate": 0.0002513078663801483, "loss": 0.0217, "step": 125230 }, { "epoch": 0.32, "learning_rate": 0.00025130397816377684, "loss": 0.0217, "step": 125240 }, { "epoch": 0.32, "learning_rate": 0.00025130008994740536, "loss": 0.0231, "step": 125250 }, { "epoch": 0.32, "learning_rate": 0.0002512962017310339, "loss": 0.027, "step": 125260 }, { "epoch": 0.32, "learning_rate": 0.00025129231351466244, "loss": 0.0207, "step": 125270 }, { "epoch": 0.32, "learning_rate": 0.000251288425298291, "loss": 0.0191, "step": 125280 }, { "epoch": 0.32, "learning_rate": 0.0002512845370819195, "loss": 0.0158, "step": 125290 }, { "epoch": 0.32, "learning_rate": 0.00025128064886554804, "loss": 0.0265, "step": 125300 }, { "epoch": 0.32, "learning_rate": 0.00025127676064917655, "loss": 0.0198, "step": 125310 }, { "epoch": 0.32, "learning_rate": 0.0002512728724328051, "loss": 0.0228, "step": 125320 }, { "epoch": 0.32, "learning_rate": 0.00025126898421643363, "loss": 0.0218, "step": 125330 }, { "epoch": 0.32, "learning_rate": 0.0002512650960000622, "loss": 0.0233, "step": 125340 }, { "epoch": 0.32, "learning_rate": 0.0002512612077836907, "loss": 0.024, "step": 125350 }, { "epoch": 0.32, "learning_rate": 0.0002512573195673193, "loss": 0.021, "step": 125360 }, { "epoch": 0.32, "learning_rate": 0.0002512534313509478, "loss": 0.0163, "step": 125370 }, { "epoch": 0.33, "learning_rate": 0.0002512495431345763, "loss": 0.0362, "step": 125380 }, { "epoch": 0.33, "learning_rate": 0.00025124565491820483, "loss": 0.0203, "step": 125390 }, { "epoch": 0.33, "learning_rate": 0.0002512417667018334, "loss": 0.0207, "step": 125400 }, { "epoch": 0.33, "learning_rate": 0.00025123787848546197, "loss": 0.0197, "step": 125410 }, { "epoch": 0.33, "learning_rate": 0.0002512339902690905, "loss": 0.0175, "step": 125420 }, { "epoch": 0.33, "learning_rate": 0.000251230102052719, "loss": 0.0215, "step": 125430 }, { "epoch": 0.33, "learning_rate": 0.00025122621383634756, "loss": 0.0242, "step": 125440 }, { "epoch": 0.33, "learning_rate": 0.0002512223256199761, "loss": 0.023, "step": 125450 }, { "epoch": 0.33, "learning_rate": 0.0002512184374036046, "loss": 0.0194, "step": 125460 }, { "epoch": 0.33, "learning_rate": 0.00025121454918723316, "loss": 0.0221, "step": 125470 }, { "epoch": 0.33, "learning_rate": 0.0002512106609708617, "loss": 0.0176, "step": 125480 }, { "epoch": 0.33, "learning_rate": 0.00025120677275449025, "loss": 0.0173, "step": 125490 }, { "epoch": 0.33, "learning_rate": 0.00025120288453811876, "loss": 0.022, "step": 125500 }, { "epoch": 0.33, "learning_rate": 0.0002511989963217473, "loss": 0.0197, "step": 125510 }, { "epoch": 0.33, "learning_rate": 0.00025119510810537584, "loss": 0.0199, "step": 125520 }, { "epoch": 0.33, "learning_rate": 0.00025119121988900436, "loss": 0.0187, "step": 125530 }, { "epoch": 0.33, "learning_rate": 0.00025118733167263287, "loss": 0.0189, "step": 125540 }, { "epoch": 0.33, "learning_rate": 0.00025118344345626144, "loss": 0.0175, "step": 125550 }, { "epoch": 0.33, "learning_rate": 0.00025117955523988996, "loss": 0.0202, "step": 125560 }, { "epoch": 0.33, "learning_rate": 0.0002511756670235185, "loss": 0.0197, "step": 125570 }, { "epoch": 0.33, "learning_rate": 0.00025117177880714704, "loss": 0.026, "step": 125580 }, { "epoch": 0.33, "learning_rate": 0.00025116789059077555, "loss": 0.031, "step": 125590 }, { "epoch": 0.33, "learning_rate": 0.00025116400237440407, "loss": 0.022, "step": 125600 }, { "epoch": 0.33, "learning_rate": 0.00025116011415803264, "loss": 0.0219, "step": 125610 }, { "epoch": 0.33, "learning_rate": 0.0002511562259416612, "loss": 0.0194, "step": 125620 }, { "epoch": 0.33, "learning_rate": 0.0002511523377252897, "loss": 0.0225, "step": 125630 }, { "epoch": 0.33, "learning_rate": 0.00025114844950891823, "loss": 0.0212, "step": 125640 }, { "epoch": 0.33, "learning_rate": 0.0002511445612925468, "loss": 0.0187, "step": 125650 }, { "epoch": 0.33, "learning_rate": 0.0002511406730761753, "loss": 0.0243, "step": 125660 }, { "epoch": 0.33, "learning_rate": 0.00025113678485980383, "loss": 0.0213, "step": 125670 }, { "epoch": 0.33, "learning_rate": 0.0002511328966434324, "loss": 0.0213, "step": 125680 }, { "epoch": 0.33, "learning_rate": 0.0002511290084270609, "loss": 0.0262, "step": 125690 }, { "epoch": 0.33, "learning_rate": 0.0002511251202106895, "loss": 0.0268, "step": 125700 }, { "epoch": 0.33, "learning_rate": 0.000251121231994318, "loss": 0.0237, "step": 125710 }, { "epoch": 0.33, "learning_rate": 0.0002511173437779465, "loss": 0.0179, "step": 125720 }, { "epoch": 0.33, "learning_rate": 0.0002511134555615751, "loss": 0.0195, "step": 125730 }, { "epoch": 0.33, "learning_rate": 0.0002511095673452036, "loss": 0.0244, "step": 125740 }, { "epoch": 0.33, "learning_rate": 0.0002511056791288321, "loss": 0.0196, "step": 125750 }, { "epoch": 0.33, "learning_rate": 0.0002511017909124607, "loss": 0.0235, "step": 125760 }, { "epoch": 0.33, "learning_rate": 0.00025109790269608925, "loss": 0.0243, "step": 125770 }, { "epoch": 0.33, "learning_rate": 0.00025109401447971776, "loss": 0.0258, "step": 125780 }, { "epoch": 0.33, "learning_rate": 0.0002510901262633463, "loss": 0.0314, "step": 125790 }, { "epoch": 0.33, "learning_rate": 0.0002510862380469748, "loss": 0.0227, "step": 125800 }, { "epoch": 0.33, "learning_rate": 0.00025108234983060336, "loss": 0.0201, "step": 125810 }, { "epoch": 0.33, "learning_rate": 0.0002510784616142319, "loss": 0.0186, "step": 125820 }, { "epoch": 0.33, "learning_rate": 0.00025107457339786044, "loss": 0.0297, "step": 125830 }, { "epoch": 0.33, "learning_rate": 0.00025107068518148896, "loss": 0.0212, "step": 125840 }, { "epoch": 0.33, "learning_rate": 0.0002510667969651175, "loss": 0.0173, "step": 125850 }, { "epoch": 0.33, "learning_rate": 0.00025106290874874604, "loss": 0.0261, "step": 125860 }, { "epoch": 0.33, "learning_rate": 0.00025105902053237456, "loss": 0.0222, "step": 125870 }, { "epoch": 0.33, "learning_rate": 0.00025105513231600307, "loss": 0.0188, "step": 125880 }, { "epoch": 0.33, "learning_rate": 0.00025105124409963164, "loss": 0.0213, "step": 125890 }, { "epoch": 0.33, "learning_rate": 0.00025104735588326015, "loss": 0.0249, "step": 125900 }, { "epoch": 0.33, "learning_rate": 0.0002510434676668887, "loss": 0.0184, "step": 125910 }, { "epoch": 0.33, "learning_rate": 0.00025103957945051724, "loss": 0.0184, "step": 125920 }, { "epoch": 0.33, "learning_rate": 0.00025103569123414575, "loss": 0.0236, "step": 125930 }, { "epoch": 0.33, "learning_rate": 0.0002510318030177743, "loss": 0.02, "step": 125940 }, { "epoch": 0.33, "learning_rate": 0.00025102791480140284, "loss": 0.0239, "step": 125950 }, { "epoch": 0.33, "learning_rate": 0.0002510240265850314, "loss": 0.0223, "step": 125960 }, { "epoch": 0.33, "learning_rate": 0.0002510201383686599, "loss": 0.0183, "step": 125970 }, { "epoch": 0.33, "learning_rate": 0.0002510162501522885, "loss": 0.0225, "step": 125980 }, { "epoch": 0.33, "learning_rate": 0.000251012361935917, "loss": 0.0206, "step": 125990 }, { "epoch": 0.33, "learning_rate": 0.0002510084737195455, "loss": 0.0194, "step": 126000 }, { "epoch": 0.33, "eval_cer": 0.8818146572779021, "eval_loss": 0.014803457073867321, "eval_runtime": 107.7105, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 126000 }, { "epoch": 0.33, "learning_rate": 0.00025100458550317403, "loss": 0.0184, "step": 126010 }, { "epoch": 0.33, "learning_rate": 0.0002510006972868026, "loss": 0.0157, "step": 126020 }, { "epoch": 0.33, "learning_rate": 0.0002509968090704311, "loss": 0.0205, "step": 126030 }, { "epoch": 0.33, "learning_rate": 0.0002509929208540597, "loss": 0.0212, "step": 126040 }, { "epoch": 0.33, "learning_rate": 0.0002509890326376882, "loss": 0.017, "step": 126050 }, { "epoch": 0.33, "learning_rate": 0.0002509851444213167, "loss": 0.0213, "step": 126060 }, { "epoch": 0.33, "learning_rate": 0.0002509812562049453, "loss": 0.0203, "step": 126070 }, { "epoch": 0.33, "learning_rate": 0.0002509773679885738, "loss": 0.0206, "step": 126080 }, { "epoch": 0.33, "learning_rate": 0.0002509734797722023, "loss": 0.0189, "step": 126090 }, { "epoch": 0.33, "learning_rate": 0.0002509695915558309, "loss": 0.0177, "step": 126100 }, { "epoch": 0.33, "learning_rate": 0.00025096570333945945, "loss": 0.0171, "step": 126110 }, { "epoch": 0.33, "learning_rate": 0.00025096181512308796, "loss": 0.0227, "step": 126120 }, { "epoch": 0.33, "learning_rate": 0.0002509579269067165, "loss": 0.0209, "step": 126130 }, { "epoch": 0.33, "learning_rate": 0.000250954038690345, "loss": 0.0257, "step": 126140 }, { "epoch": 0.33, "learning_rate": 0.00025095015047397356, "loss": 0.0224, "step": 126150 }, { "epoch": 0.33, "learning_rate": 0.0002509462622576021, "loss": 0.0165, "step": 126160 }, { "epoch": 0.33, "learning_rate": 0.00025094237404123064, "loss": 0.0174, "step": 126170 }, { "epoch": 0.33, "learning_rate": 0.00025093848582485916, "loss": 0.0176, "step": 126180 }, { "epoch": 0.33, "learning_rate": 0.0002509345976084877, "loss": 0.0258, "step": 126190 }, { "epoch": 0.33, "learning_rate": 0.00025093070939211624, "loss": 0.0216, "step": 126200 }, { "epoch": 0.33, "learning_rate": 0.00025092682117574476, "loss": 0.0257, "step": 126210 }, { "epoch": 0.33, "learning_rate": 0.00025092293295937327, "loss": 0.0194, "step": 126220 }, { "epoch": 0.33, "learning_rate": 0.00025091904474300184, "loss": 0.0168, "step": 126230 }, { "epoch": 0.33, "learning_rate": 0.00025091515652663035, "loss": 0.0249, "step": 126240 }, { "epoch": 0.33, "learning_rate": 0.0002509112683102589, "loss": 0.0213, "step": 126250 }, { "epoch": 0.33, "learning_rate": 0.00025090738009388744, "loss": 0.0203, "step": 126260 }, { "epoch": 0.33, "learning_rate": 0.000250903491877516, "loss": 0.0185, "step": 126270 }, { "epoch": 0.33, "learning_rate": 0.0002508996036611445, "loss": 0.0283, "step": 126280 }, { "epoch": 0.33, "learning_rate": 0.00025089571544477303, "loss": 0.0175, "step": 126290 }, { "epoch": 0.33, "learning_rate": 0.00025089182722840155, "loss": 0.0197, "step": 126300 }, { "epoch": 0.33, "learning_rate": 0.0002508879390120301, "loss": 0.0209, "step": 126310 }, { "epoch": 0.33, "learning_rate": 0.0002508840507956587, "loss": 0.021, "step": 126320 }, { "epoch": 0.33, "learning_rate": 0.0002508801625792872, "loss": 0.0175, "step": 126330 }, { "epoch": 0.33, "learning_rate": 0.0002508762743629157, "loss": 0.0187, "step": 126340 }, { "epoch": 0.33, "learning_rate": 0.00025087238614654423, "loss": 0.0225, "step": 126350 }, { "epoch": 0.33, "learning_rate": 0.0002508684979301728, "loss": 0.0188, "step": 126360 }, { "epoch": 0.33, "learning_rate": 0.0002508646097138013, "loss": 0.0289, "step": 126370 }, { "epoch": 0.33, "learning_rate": 0.0002508607214974299, "loss": 0.0224, "step": 126380 }, { "epoch": 0.33, "learning_rate": 0.0002508568332810584, "loss": 0.0216, "step": 126390 }, { "epoch": 0.33, "learning_rate": 0.00025085294506468697, "loss": 0.0187, "step": 126400 }, { "epoch": 0.33, "learning_rate": 0.0002508490568483155, "loss": 0.0218, "step": 126410 }, { "epoch": 0.33, "learning_rate": 0.000250845168631944, "loss": 0.0185, "step": 126420 }, { "epoch": 0.33, "learning_rate": 0.0002508412804155725, "loss": 0.0188, "step": 126430 }, { "epoch": 0.33, "learning_rate": 0.0002508373921992011, "loss": 0.0202, "step": 126440 }, { "epoch": 0.33, "learning_rate": 0.00025083350398282965, "loss": 0.0198, "step": 126450 }, { "epoch": 0.33, "learning_rate": 0.00025082961576645816, "loss": 0.0237, "step": 126460 }, { "epoch": 0.33, "learning_rate": 0.0002508257275500867, "loss": 0.0255, "step": 126470 }, { "epoch": 0.33, "learning_rate": 0.00025082183933371524, "loss": 0.0248, "step": 126480 }, { "epoch": 0.33, "learning_rate": 0.00025081795111734376, "loss": 0.0199, "step": 126490 }, { "epoch": 0.33, "learning_rate": 0.0002508140629009723, "loss": 0.02, "step": 126500 }, { "epoch": 0.33, "learning_rate": 0.00025081017468460084, "loss": 0.0212, "step": 126510 }, { "epoch": 0.33, "learning_rate": 0.00025080628646822936, "loss": 0.0201, "step": 126520 }, { "epoch": 0.33, "learning_rate": 0.0002508023982518579, "loss": 0.0226, "step": 126530 }, { "epoch": 0.33, "learning_rate": 0.00025079851003548644, "loss": 0.0191, "step": 126540 }, { "epoch": 0.33, "learning_rate": 0.00025079462181911495, "loss": 0.0225, "step": 126550 }, { "epoch": 0.33, "learning_rate": 0.00025079073360274347, "loss": 0.0228, "step": 126560 }, { "epoch": 0.33, "learning_rate": 0.00025078684538637204, "loss": 0.0221, "step": 126570 }, { "epoch": 0.33, "learning_rate": 0.00025078295717000055, "loss": 0.0206, "step": 126580 }, { "epoch": 0.33, "learning_rate": 0.0002507790689536291, "loss": 0.0202, "step": 126590 }, { "epoch": 0.33, "learning_rate": 0.00025077518073725764, "loss": 0.0227, "step": 126600 }, { "epoch": 0.33, "learning_rate": 0.0002507712925208862, "loss": 0.0213, "step": 126610 }, { "epoch": 0.33, "learning_rate": 0.0002507674043045147, "loss": 0.0212, "step": 126620 }, { "epoch": 0.33, "learning_rate": 0.00025076351608814323, "loss": 0.021, "step": 126630 }, { "epoch": 0.33, "learning_rate": 0.00025075962787177175, "loss": 0.0206, "step": 126640 }, { "epoch": 0.33, "learning_rate": 0.0002507557396554003, "loss": 0.0207, "step": 126650 }, { "epoch": 0.33, "learning_rate": 0.0002507518514390289, "loss": 0.0216, "step": 126660 }, { "epoch": 0.33, "learning_rate": 0.0002507479632226574, "loss": 0.0213, "step": 126670 }, { "epoch": 0.33, "learning_rate": 0.0002507440750062859, "loss": 0.0198, "step": 126680 }, { "epoch": 0.33, "learning_rate": 0.0002507401867899145, "loss": 0.0192, "step": 126690 }, { "epoch": 0.33, "learning_rate": 0.000250736298573543, "loss": 0.0165, "step": 126700 }, { "epoch": 0.33, "learning_rate": 0.0002507324103571715, "loss": 0.0185, "step": 126710 }, { "epoch": 0.33, "learning_rate": 0.0002507285221408001, "loss": 0.0172, "step": 126720 }, { "epoch": 0.33, "learning_rate": 0.0002507246339244286, "loss": 0.0198, "step": 126730 }, { "epoch": 0.33, "learning_rate": 0.00025072074570805716, "loss": 0.0219, "step": 126740 }, { "epoch": 0.33, "learning_rate": 0.0002507168574916857, "loss": 0.0182, "step": 126750 }, { "epoch": 0.33, "learning_rate": 0.0002507129692753142, "loss": 0.0192, "step": 126760 }, { "epoch": 0.33, "learning_rate": 0.00025070908105894276, "loss": 0.0221, "step": 126770 }, { "epoch": 0.33, "learning_rate": 0.0002507051928425713, "loss": 0.0184, "step": 126780 }, { "epoch": 0.33, "learning_rate": 0.0002507013046261998, "loss": 0.0216, "step": 126790 }, { "epoch": 0.33, "learning_rate": 0.00025069741640982836, "loss": 0.0191, "step": 126800 }, { "epoch": 0.33, "learning_rate": 0.0002506935281934569, "loss": 0.0183, "step": 126810 }, { "epoch": 0.33, "learning_rate": 0.00025068963997708544, "loss": 0.0201, "step": 126820 }, { "epoch": 0.33, "learning_rate": 0.00025068575176071396, "loss": 0.0204, "step": 126830 }, { "epoch": 0.33, "learning_rate": 0.00025068186354434247, "loss": 0.019, "step": 126840 }, { "epoch": 0.33, "learning_rate": 0.00025067797532797104, "loss": 0.0197, "step": 126850 }, { "epoch": 0.33, "learning_rate": 0.00025067408711159956, "loss": 0.0196, "step": 126860 }, { "epoch": 0.33, "learning_rate": 0.0002506701988952281, "loss": 0.0257, "step": 126870 }, { "epoch": 0.33, "learning_rate": 0.00025066631067885664, "loss": 0.0209, "step": 126880 }, { "epoch": 0.33, "learning_rate": 0.00025066242246248515, "loss": 0.0198, "step": 126890 }, { "epoch": 0.33, "learning_rate": 0.0002506585342461137, "loss": 0.0192, "step": 126900 }, { "epoch": 0.33, "learning_rate": 0.00025065464602974224, "loss": 0.0201, "step": 126910 }, { "epoch": 0.33, "learning_rate": 0.00025065075781337075, "loss": 0.0198, "step": 126920 }, { "epoch": 0.33, "learning_rate": 0.0002506468695969993, "loss": 0.0202, "step": 126930 }, { "epoch": 0.33, "learning_rate": 0.00025064298138062783, "loss": 0.0201, "step": 126940 }, { "epoch": 0.33, "learning_rate": 0.0002506390931642564, "loss": 0.0191, "step": 126950 }, { "epoch": 0.33, "learning_rate": 0.0002506352049478849, "loss": 0.0179, "step": 126960 }, { "epoch": 0.33, "learning_rate": 0.00025063131673151343, "loss": 0.0231, "step": 126970 }, { "epoch": 0.33, "learning_rate": 0.000250627428515142, "loss": 0.0216, "step": 126980 }, { "epoch": 0.33, "learning_rate": 0.0002506235402987705, "loss": 0.0217, "step": 126990 }, { "epoch": 0.33, "learning_rate": 0.0002506196520823991, "loss": 0.025, "step": 127000 }, { "epoch": 0.33, "eval_cer": 0.8817880641761527, "eval_loss": 0.014219284057617188, "eval_runtime": 107.5382, "eval_samples_per_second": 18.598, "eval_steps_per_second": 4.65, "step": 127000 }, { "epoch": 0.33, "learning_rate": 0.0002506157638660276, "loss": 0.0177, "step": 127010 }, { "epoch": 0.33, "learning_rate": 0.00025061187564965617, "loss": 0.0191, "step": 127020 }, { "epoch": 0.33, "learning_rate": 0.0002506079874332847, "loss": 0.0191, "step": 127030 }, { "epoch": 0.33, "learning_rate": 0.0002506040992169132, "loss": 0.0264, "step": 127040 }, { "epoch": 0.33, "learning_rate": 0.0002506002110005417, "loss": 0.0173, "step": 127050 }, { "epoch": 0.33, "learning_rate": 0.0002505963227841703, "loss": 0.0218, "step": 127060 }, { "epoch": 0.33, "learning_rate": 0.0002505924345677988, "loss": 0.0217, "step": 127070 }, { "epoch": 0.33, "learning_rate": 0.00025058854635142736, "loss": 0.0215, "step": 127080 }, { "epoch": 0.33, "learning_rate": 0.0002505846581350559, "loss": 0.0159, "step": 127090 }, { "epoch": 0.33, "learning_rate": 0.0002505807699186844, "loss": 0.0215, "step": 127100 }, { "epoch": 0.33, "learning_rate": 0.00025057688170231296, "loss": 0.017, "step": 127110 }, { "epoch": 0.33, "learning_rate": 0.0002505729934859415, "loss": 0.02, "step": 127120 }, { "epoch": 0.33, "learning_rate": 0.00025056910526957, "loss": 0.0178, "step": 127130 }, { "epoch": 0.33, "learning_rate": 0.00025056521705319856, "loss": 0.0167, "step": 127140 }, { "epoch": 0.33, "learning_rate": 0.00025056132883682713, "loss": 0.025, "step": 127150 }, { "epoch": 0.33, "learning_rate": 0.00025055744062045564, "loss": 0.0197, "step": 127160 }, { "epoch": 0.33, "learning_rate": 0.00025055355240408416, "loss": 0.0211, "step": 127170 }, { "epoch": 0.33, "learning_rate": 0.00025054966418771267, "loss": 0.022, "step": 127180 }, { "epoch": 0.33, "learning_rate": 0.00025054577597134124, "loss": 0.025, "step": 127190 }, { "epoch": 0.33, "learning_rate": 0.00025054188775496975, "loss": 0.0424, "step": 127200 }, { "epoch": 0.33, "learning_rate": 0.0002505379995385983, "loss": 0.0212, "step": 127210 }, { "epoch": 0.33, "learning_rate": 0.00025053411132222684, "loss": 0.0181, "step": 127220 }, { "epoch": 0.33, "learning_rate": 0.0002505302231058554, "loss": 0.0205, "step": 127230 }, { "epoch": 0.33, "learning_rate": 0.0002505263348894839, "loss": 0.0221, "step": 127240 }, { "epoch": 0.33, "learning_rate": 0.00025052244667311244, "loss": 0.0223, "step": 127250 }, { "epoch": 0.33, "learning_rate": 0.00025051855845674095, "loss": 0.0235, "step": 127260 }, { "epoch": 0.33, "learning_rate": 0.0002505146702403695, "loss": 0.0272, "step": 127270 }, { "epoch": 0.33, "learning_rate": 0.00025051078202399803, "loss": 0.0237, "step": 127280 }, { "epoch": 0.33, "learning_rate": 0.0002505068938076266, "loss": 0.0257, "step": 127290 }, { "epoch": 0.33, "learning_rate": 0.0002505030055912551, "loss": 0.019, "step": 127300 }, { "epoch": 0.33, "learning_rate": 0.00025049911737488363, "loss": 0.021, "step": 127310 }, { "epoch": 0.33, "learning_rate": 0.0002504952291585122, "loss": 0.0188, "step": 127320 }, { "epoch": 0.33, "learning_rate": 0.0002504913409421407, "loss": 0.0188, "step": 127330 }, { "epoch": 0.33, "learning_rate": 0.00025048745272576923, "loss": 0.021, "step": 127340 }, { "epoch": 0.33, "learning_rate": 0.0002504835645093978, "loss": 0.0234, "step": 127350 }, { "epoch": 0.33, "learning_rate": 0.00025047967629302637, "loss": 0.0212, "step": 127360 }, { "epoch": 0.33, "learning_rate": 0.0002504757880766549, "loss": 0.0178, "step": 127370 }, { "epoch": 0.33, "learning_rate": 0.0002504718998602834, "loss": 0.0211, "step": 127380 }, { "epoch": 0.33, "learning_rate": 0.0002504680116439119, "loss": 0.0168, "step": 127390 }, { "epoch": 0.33, "learning_rate": 0.0002504641234275405, "loss": 0.0211, "step": 127400 }, { "epoch": 0.33, "learning_rate": 0.000250460235211169, "loss": 0.0196, "step": 127410 }, { "epoch": 0.33, "learning_rate": 0.00025045634699479756, "loss": 0.0209, "step": 127420 }, { "epoch": 0.33, "learning_rate": 0.0002504524587784261, "loss": 0.0173, "step": 127430 }, { "epoch": 0.33, "learning_rate": 0.00025044857056205465, "loss": 0.0191, "step": 127440 }, { "epoch": 0.33, "learning_rate": 0.00025044468234568316, "loss": 0.0209, "step": 127450 }, { "epoch": 0.33, "learning_rate": 0.0002504407941293117, "loss": 0.0201, "step": 127460 }, { "epoch": 0.33, "learning_rate": 0.0002504369059129402, "loss": 0.0207, "step": 127470 }, { "epoch": 0.33, "learning_rate": 0.00025043301769656876, "loss": 0.018, "step": 127480 }, { "epoch": 0.33, "learning_rate": 0.00025042912948019727, "loss": 0.0221, "step": 127490 }, { "epoch": 0.33, "learning_rate": 0.00025042524126382584, "loss": 0.0213, "step": 127500 }, { "epoch": 0.33, "learning_rate": 0.00025042135304745436, "loss": 0.0197, "step": 127510 }, { "epoch": 0.33, "learning_rate": 0.0002504174648310829, "loss": 0.0195, "step": 127520 }, { "epoch": 0.33, "learning_rate": 0.00025041357661471144, "loss": 0.0204, "step": 127530 }, { "epoch": 0.33, "learning_rate": 0.00025040968839833995, "loss": 0.0199, "step": 127540 }, { "epoch": 0.33, "learning_rate": 0.0002504058001819685, "loss": 0.0184, "step": 127550 }, { "epoch": 0.33, "learning_rate": 0.00025040191196559704, "loss": 0.0242, "step": 127560 }, { "epoch": 0.33, "learning_rate": 0.0002503980237492256, "loss": 0.0169, "step": 127570 }, { "epoch": 0.33, "learning_rate": 0.0002503941355328541, "loss": 0.0169, "step": 127580 }, { "epoch": 0.33, "learning_rate": 0.00025039024731648263, "loss": 0.0254, "step": 127590 }, { "epoch": 0.33, "learning_rate": 0.00025038635910011115, "loss": 0.0198, "step": 127600 }, { "epoch": 0.33, "learning_rate": 0.0002503824708837397, "loss": 0.0172, "step": 127610 }, { "epoch": 0.33, "learning_rate": 0.00025037858266736823, "loss": 0.0194, "step": 127620 }, { "epoch": 0.33, "learning_rate": 0.0002503746944509968, "loss": 0.0216, "step": 127630 }, { "epoch": 0.33, "learning_rate": 0.0002503708062346253, "loss": 0.019, "step": 127640 }, { "epoch": 0.33, "learning_rate": 0.0002503669180182539, "loss": 0.0207, "step": 127650 }, { "epoch": 0.33, "learning_rate": 0.0002503630298018824, "loss": 0.0209, "step": 127660 }, { "epoch": 0.33, "learning_rate": 0.0002503591415855109, "loss": 0.0203, "step": 127670 }, { "epoch": 0.33, "learning_rate": 0.00025035525336913943, "loss": 0.0189, "step": 127680 }, { "epoch": 0.33, "learning_rate": 0.000250351365152768, "loss": 0.0206, "step": 127690 }, { "epoch": 0.33, "learning_rate": 0.00025034747693639657, "loss": 0.0172, "step": 127700 }, { "epoch": 0.33, "learning_rate": 0.0002503435887200251, "loss": 0.0189, "step": 127710 }, { "epoch": 0.33, "learning_rate": 0.0002503397005036536, "loss": 0.0234, "step": 127720 }, { "epoch": 0.33, "learning_rate": 0.00025033581228728216, "loss": 0.0295, "step": 127730 }, { "epoch": 0.33, "learning_rate": 0.0002503319240709107, "loss": 0.0194, "step": 127740 }, { "epoch": 0.33, "learning_rate": 0.0002503280358545392, "loss": 0.0182, "step": 127750 }, { "epoch": 0.33, "learning_rate": 0.00025032414763816776, "loss": 0.0185, "step": 127760 }, { "epoch": 0.33, "learning_rate": 0.0002503202594217963, "loss": 0.0203, "step": 127770 }, { "epoch": 0.33, "learning_rate": 0.00025031637120542484, "loss": 0.0155, "step": 127780 }, { "epoch": 0.33, "learning_rate": 0.00025031248298905336, "loss": 0.0207, "step": 127790 }, { "epoch": 0.33, "learning_rate": 0.0002503085947726819, "loss": 0.0215, "step": 127800 }, { "epoch": 0.33, "learning_rate": 0.0002503047065563104, "loss": 0.0191, "step": 127810 }, { "epoch": 0.33, "learning_rate": 0.00025030081833993896, "loss": 0.0204, "step": 127820 }, { "epoch": 0.33, "learning_rate": 0.00025029693012356747, "loss": 0.0221, "step": 127830 }, { "epoch": 0.33, "learning_rate": 0.00025029304190719604, "loss": 0.0219, "step": 127840 }, { "epoch": 0.33, "learning_rate": 0.00025028915369082455, "loss": 0.0199, "step": 127850 }, { "epoch": 0.33, "learning_rate": 0.0002502852654744531, "loss": 0.0245, "step": 127860 }, { "epoch": 0.33, "learning_rate": 0.00025028137725808164, "loss": 0.0193, "step": 127870 }, { "epoch": 0.33, "learning_rate": 0.00025027748904171015, "loss": 0.0216, "step": 127880 }, { "epoch": 0.33, "learning_rate": 0.00025027360082533867, "loss": 0.0226, "step": 127890 }, { "epoch": 0.33, "learning_rate": 0.00025026971260896724, "loss": 0.0233, "step": 127900 }, { "epoch": 0.33, "learning_rate": 0.0002502658243925958, "loss": 0.0191, "step": 127910 }, { "epoch": 0.33, "learning_rate": 0.0002502619361762243, "loss": 0.0189, "step": 127920 }, { "epoch": 0.33, "learning_rate": 0.00025025804795985283, "loss": 0.0217, "step": 127930 }, { "epoch": 0.33, "learning_rate": 0.0002502541597434814, "loss": 0.0197, "step": 127940 }, { "epoch": 0.33, "learning_rate": 0.0002502502715271099, "loss": 0.0201, "step": 127950 }, { "epoch": 0.33, "learning_rate": 0.00025024638331073843, "loss": 0.0249, "step": 127960 }, { "epoch": 0.33, "learning_rate": 0.000250242495094367, "loss": 0.0215, "step": 127970 }, { "epoch": 0.33, "learning_rate": 0.0002502386068779955, "loss": 0.0176, "step": 127980 }, { "epoch": 0.33, "learning_rate": 0.0002502347186616241, "loss": 0.0257, "step": 127990 }, { "epoch": 0.33, "learning_rate": 0.0002502308304452526, "loss": 0.0264, "step": 128000 }, { "epoch": 0.33, "eval_cer": 0.8818188561887047, "eval_loss": 0.014465493150055408, "eval_runtime": 107.6927, "eval_samples_per_second": 18.571, "eval_steps_per_second": 4.643, "step": 128000 }, { "epoch": 0.33, "learning_rate": 0.0002502269422288811, "loss": 0.0197, "step": 128010 }, { "epoch": 0.33, "learning_rate": 0.0002502230540125097, "loss": 0.0175, "step": 128020 }, { "epoch": 0.33, "learning_rate": 0.0002502191657961382, "loss": 0.0189, "step": 128030 }, { "epoch": 0.33, "learning_rate": 0.00025021527757976676, "loss": 0.0171, "step": 128040 }, { "epoch": 0.33, "learning_rate": 0.0002502113893633953, "loss": 0.0202, "step": 128050 }, { "epoch": 0.33, "learning_rate": 0.0002502075011470238, "loss": 0.0208, "step": 128060 }, { "epoch": 0.33, "learning_rate": 0.00025020361293065236, "loss": 0.0198, "step": 128070 }, { "epoch": 0.33, "learning_rate": 0.0002501997247142809, "loss": 0.0223, "step": 128080 }, { "epoch": 0.33, "learning_rate": 0.0002501958364979094, "loss": 0.0223, "step": 128090 }, { "epoch": 0.33, "learning_rate": 0.00025019194828153796, "loss": 0.02, "step": 128100 }, { "epoch": 0.33, "learning_rate": 0.0002501880600651665, "loss": 0.0143, "step": 128110 }, { "epoch": 0.33, "learning_rate": 0.00025018417184879504, "loss": 0.0262, "step": 128120 }, { "epoch": 0.33, "learning_rate": 0.00025018028363242356, "loss": 0.0189, "step": 128130 }, { "epoch": 0.33, "learning_rate": 0.00025017639541605207, "loss": 0.0191, "step": 128140 }, { "epoch": 0.33, "learning_rate": 0.00025017250719968064, "loss": 0.0209, "step": 128150 }, { "epoch": 0.33, "learning_rate": 0.00025016861898330916, "loss": 0.0221, "step": 128160 }, { "epoch": 0.33, "learning_rate": 0.00025016473076693767, "loss": 0.0179, "step": 128170 }, { "epoch": 0.33, "learning_rate": 0.00025016084255056624, "loss": 0.0213, "step": 128180 }, { "epoch": 0.33, "learning_rate": 0.0002501569543341948, "loss": 0.0218, "step": 128190 }, { "epoch": 0.33, "learning_rate": 0.0002501530661178233, "loss": 0.0248, "step": 128200 }, { "epoch": 0.33, "learning_rate": 0.00025014917790145184, "loss": 0.0224, "step": 128210 }, { "epoch": 0.33, "learning_rate": 0.00025014528968508035, "loss": 0.0183, "step": 128220 }, { "epoch": 0.33, "learning_rate": 0.0002501414014687089, "loss": 0.0208, "step": 128230 }, { "epoch": 0.33, "learning_rate": 0.00025013751325233743, "loss": 0.0207, "step": 128240 }, { "epoch": 0.33, "learning_rate": 0.000250133625035966, "loss": 0.0201, "step": 128250 }, { "epoch": 0.33, "learning_rate": 0.0002501297368195945, "loss": 0.0189, "step": 128260 }, { "epoch": 0.33, "learning_rate": 0.0002501258486032231, "loss": 0.0241, "step": 128270 }, { "epoch": 0.33, "learning_rate": 0.0002501219603868516, "loss": 0.0173, "step": 128280 }, { "epoch": 0.33, "learning_rate": 0.0002501180721704801, "loss": 0.0243, "step": 128290 }, { "epoch": 0.33, "learning_rate": 0.00025011418395410863, "loss": 0.0201, "step": 128300 }, { "epoch": 0.33, "learning_rate": 0.0002501102957377372, "loss": 0.0202, "step": 128310 }, { "epoch": 0.33, "learning_rate": 0.0002501064075213657, "loss": 0.0185, "step": 128320 }, { "epoch": 0.33, "learning_rate": 0.0002501025193049943, "loss": 0.0246, "step": 128330 }, { "epoch": 0.33, "learning_rate": 0.0002500986310886228, "loss": 0.0218, "step": 128340 }, { "epoch": 0.33, "learning_rate": 0.0002500947428722513, "loss": 0.0248, "step": 128350 }, { "epoch": 0.33, "learning_rate": 0.0002500908546558799, "loss": 0.0222, "step": 128360 }, { "epoch": 0.33, "learning_rate": 0.0002500869664395084, "loss": 0.0159, "step": 128370 }, { "epoch": 0.33, "learning_rate": 0.0002500830782231369, "loss": 0.0207, "step": 128380 }, { "epoch": 0.33, "learning_rate": 0.0002500791900067655, "loss": 0.0187, "step": 128390 }, { "epoch": 0.33, "learning_rate": 0.00025007530179039405, "loss": 0.0243, "step": 128400 }, { "epoch": 0.33, "learning_rate": 0.00025007141357402256, "loss": 0.0262, "step": 128410 }, { "epoch": 0.33, "learning_rate": 0.0002500675253576511, "loss": 0.0252, "step": 128420 }, { "epoch": 0.33, "learning_rate": 0.0002500636371412796, "loss": 0.022, "step": 128430 }, { "epoch": 0.33, "learning_rate": 0.00025005974892490816, "loss": 0.0202, "step": 128440 }, { "epoch": 0.33, "learning_rate": 0.0002500558607085367, "loss": 0.0201, "step": 128450 }, { "epoch": 0.33, "learning_rate": 0.00025005197249216524, "loss": 0.024, "step": 128460 }, { "epoch": 0.33, "learning_rate": 0.00025004808427579376, "loss": 0.0218, "step": 128470 }, { "epoch": 0.33, "learning_rate": 0.0002500441960594223, "loss": 0.0173, "step": 128480 }, { "epoch": 0.33, "learning_rate": 0.00025004030784305084, "loss": 0.0176, "step": 128490 }, { "epoch": 0.33, "learning_rate": 0.00025003641962667935, "loss": 0.0137, "step": 128500 }, { "epoch": 0.33, "learning_rate": 0.00025003253141030787, "loss": 0.0233, "step": 128510 }, { "epoch": 0.33, "learning_rate": 0.00025002864319393644, "loss": 0.0206, "step": 128520 }, { "epoch": 0.33, "learning_rate": 0.00025002475497756495, "loss": 0.0226, "step": 128530 }, { "epoch": 0.33, "learning_rate": 0.0002500208667611935, "loss": 0.0214, "step": 128540 }, { "epoch": 0.33, "learning_rate": 0.00025001697854482204, "loss": 0.0179, "step": 128550 }, { "epoch": 0.33, "learning_rate": 0.00025001309032845055, "loss": 0.0236, "step": 128560 }, { "epoch": 0.33, "learning_rate": 0.0002500092021120791, "loss": 0.0265, "step": 128570 }, { "epoch": 0.33, "learning_rate": 0.00025000531389570763, "loss": 0.0375, "step": 128580 }, { "epoch": 0.33, "learning_rate": 0.0002500014256793362, "loss": 0.0272, "step": 128590 }, { "epoch": 0.33, "learning_rate": 0.0002499975374629647, "loss": 0.0224, "step": 128600 }, { "epoch": 0.33, "learning_rate": 0.0002499936492465933, "loss": 0.1259, "step": 128610 }, { "epoch": 0.33, "learning_rate": 0.0002499897610302218, "loss": 0.079, "step": 128620 }, { "epoch": 0.33, "learning_rate": 0.0002499858728138503, "loss": 0.0776, "step": 128630 }, { "epoch": 0.33, "learning_rate": 0.00024998198459747883, "loss": 0.0215, "step": 128640 }, { "epoch": 0.33, "learning_rate": 0.0002499780963811074, "loss": 0.0355, "step": 128650 }, { "epoch": 0.33, "learning_rate": 0.0002499742081647359, "loss": 0.0206, "step": 128660 }, { "epoch": 0.33, "learning_rate": 0.0002499703199483645, "loss": 0.0219, "step": 128670 }, { "epoch": 0.33, "learning_rate": 0.000249966431731993, "loss": 0.0319, "step": 128680 }, { "epoch": 0.33, "learning_rate": 0.00024996254351562156, "loss": 0.0222, "step": 128690 }, { "epoch": 0.33, "learning_rate": 0.0002499586552992501, "loss": 0.0281, "step": 128700 }, { "epoch": 0.33, "learning_rate": 0.0002499547670828786, "loss": 0.0226, "step": 128710 }, { "epoch": 0.33, "learning_rate": 0.0002499508788665071, "loss": 0.0225, "step": 128720 }, { "epoch": 0.33, "learning_rate": 0.0002499469906501357, "loss": 0.0233, "step": 128730 }, { "epoch": 0.33, "learning_rate": 0.00024994310243376425, "loss": 0.0173, "step": 128740 }, { "epoch": 0.33, "learning_rate": 0.00024993921421739276, "loss": 0.0192, "step": 128750 }, { "epoch": 0.33, "learning_rate": 0.0002499353260010213, "loss": 0.0218, "step": 128760 }, { "epoch": 0.33, "learning_rate": 0.0002499314377846498, "loss": 0.0216, "step": 128770 }, { "epoch": 0.33, "learning_rate": 0.00024992754956827836, "loss": 0.0174, "step": 128780 }, { "epoch": 0.33, "learning_rate": 0.00024992366135190687, "loss": 0.0178, "step": 128790 }, { "epoch": 0.33, "learning_rate": 0.00024991977313553544, "loss": 0.0205, "step": 128800 }, { "epoch": 0.33, "learning_rate": 0.00024991588491916396, "loss": 0.0251, "step": 128810 }, { "epoch": 0.33, "learning_rate": 0.0002499119967027925, "loss": 0.0253, "step": 128820 }, { "epoch": 0.33, "learning_rate": 0.00024990810848642104, "loss": 0.0201, "step": 128830 }, { "epoch": 0.33, "learning_rate": 0.00024990422027004955, "loss": 0.0284, "step": 128840 }, { "epoch": 0.33, "learning_rate": 0.00024990033205367807, "loss": 0.0311, "step": 128850 }, { "epoch": 0.33, "learning_rate": 0.00024989644383730664, "loss": 0.022, "step": 128860 }, { "epoch": 0.33, "learning_rate": 0.00024989255562093515, "loss": 0.0217, "step": 128870 }, { "epoch": 0.33, "learning_rate": 0.0002498886674045637, "loss": 0.0201, "step": 128880 }, { "epoch": 0.33, "learning_rate": 0.00024988477918819223, "loss": 0.0184, "step": 128890 }, { "epoch": 0.33, "learning_rate": 0.0002498808909718208, "loss": 0.0221, "step": 128900 }, { "epoch": 0.33, "learning_rate": 0.0002498770027554493, "loss": 0.0244, "step": 128910 }, { "epoch": 0.33, "learning_rate": 0.00024987311453907783, "loss": 0.021, "step": 128920 }, { "epoch": 0.33, "learning_rate": 0.00024986922632270635, "loss": 0.0218, "step": 128930 }, { "epoch": 0.33, "learning_rate": 0.0002498653381063349, "loss": 0.0191, "step": 128940 }, { "epoch": 0.33, "learning_rate": 0.0002498614498899635, "loss": 0.0182, "step": 128950 }, { "epoch": 0.33, "learning_rate": 0.000249857561673592, "loss": 0.0191, "step": 128960 }, { "epoch": 0.33, "learning_rate": 0.0002498536734572205, "loss": 0.0186, "step": 128970 }, { "epoch": 0.33, "learning_rate": 0.0002498497852408491, "loss": 0.0176, "step": 128980 }, { "epoch": 0.33, "learning_rate": 0.0002498458970244776, "loss": 0.0174, "step": 128990 }, { "epoch": 0.33, "learning_rate": 0.0002498420088081061, "loss": 0.0213, "step": 129000 }, { "epoch": 0.33, "eval_cer": 0.8818006609085604, "eval_loss": 0.014310148544609547, "eval_runtime": 107.6549, "eval_samples_per_second": 18.578, "eval_steps_per_second": 4.644, "step": 129000 }, { "epoch": 0.33, "learning_rate": 0.0002498381205917347, "loss": 0.0241, "step": 129010 }, { "epoch": 0.33, "learning_rate": 0.0002498342323753632, "loss": 0.0188, "step": 129020 }, { "epoch": 0.33, "learning_rate": 0.00024983034415899176, "loss": 0.0225, "step": 129030 }, { "epoch": 0.33, "learning_rate": 0.0002498264559426203, "loss": 0.0198, "step": 129040 }, { "epoch": 0.33, "learning_rate": 0.0002498225677262488, "loss": 0.0195, "step": 129050 }, { "epoch": 0.33, "learning_rate": 0.0002498186795098773, "loss": 0.0177, "step": 129060 }, { "epoch": 0.33, "learning_rate": 0.0002498147912935059, "loss": 0.0186, "step": 129070 }, { "epoch": 0.33, "learning_rate": 0.0002498109030771344, "loss": 0.0202, "step": 129080 }, { "epoch": 0.33, "learning_rate": 0.00024980701486076296, "loss": 0.0189, "step": 129090 }, { "epoch": 0.33, "learning_rate": 0.0002498031266443915, "loss": 0.0154, "step": 129100 }, { "epoch": 0.33, "learning_rate": 0.00024979923842802004, "loss": 0.0221, "step": 129110 }, { "epoch": 0.33, "learning_rate": 0.00024979535021164856, "loss": 0.021, "step": 129120 }, { "epoch": 0.33, "learning_rate": 0.00024979146199527707, "loss": 0.0163, "step": 129130 }, { "epoch": 0.33, "learning_rate": 0.00024978757377890564, "loss": 0.0226, "step": 129140 }, { "epoch": 0.33, "learning_rate": 0.00024978368556253415, "loss": 0.0169, "step": 129150 }, { "epoch": 0.33, "learning_rate": 0.0002497797973461627, "loss": 0.0202, "step": 129160 }, { "epoch": 0.33, "learning_rate": 0.00024977590912979124, "loss": 0.0197, "step": 129170 }, { "epoch": 0.33, "learning_rate": 0.00024977202091341975, "loss": 0.0182, "step": 129180 }, { "epoch": 0.33, "learning_rate": 0.0002497681326970483, "loss": 0.0222, "step": 129190 }, { "epoch": 0.33, "learning_rate": 0.00024976424448067684, "loss": 0.019, "step": 129200 }, { "epoch": 0.33, "learning_rate": 0.00024976035626430535, "loss": 0.0198, "step": 129210 }, { "epoch": 0.33, "learning_rate": 0.0002497564680479339, "loss": 0.0168, "step": 129220 }, { "epoch": 0.33, "learning_rate": 0.0002497525798315625, "loss": 0.0194, "step": 129230 }, { "epoch": 0.34, "learning_rate": 0.000249748691615191, "loss": 0.0175, "step": 129240 }, { "epoch": 0.34, "learning_rate": 0.0002497448033988195, "loss": 0.0208, "step": 129250 }, { "epoch": 0.34, "learning_rate": 0.00024974091518244803, "loss": 0.0208, "step": 129260 }, { "epoch": 0.34, "learning_rate": 0.00024973702696607655, "loss": 0.0189, "step": 129270 }, { "epoch": 0.34, "learning_rate": 0.0002497331387497051, "loss": 0.0232, "step": 129280 }, { "epoch": 0.34, "learning_rate": 0.0002497292505333337, "loss": 0.0241, "step": 129290 }, { "epoch": 0.34, "learning_rate": 0.0002497253623169622, "loss": 0.0191, "step": 129300 }, { "epoch": 0.34, "learning_rate": 0.0002497214741005907, "loss": 0.0222, "step": 129310 }, { "epoch": 0.34, "learning_rate": 0.0002497175858842193, "loss": 0.0175, "step": 129320 }, { "epoch": 0.34, "learning_rate": 0.0002497136976678478, "loss": 0.0217, "step": 129330 }, { "epoch": 0.34, "learning_rate": 0.0002497098094514763, "loss": 0.0167, "step": 129340 }, { "epoch": 0.34, "learning_rate": 0.0002497059212351049, "loss": 0.0196, "step": 129350 }, { "epoch": 0.34, "learning_rate": 0.0002497020330187334, "loss": 0.0204, "step": 129360 }, { "epoch": 0.34, "learning_rate": 0.00024969814480236196, "loss": 0.0202, "step": 129370 }, { "epoch": 0.34, "learning_rate": 0.0002496942565859905, "loss": 0.0174, "step": 129380 }, { "epoch": 0.34, "learning_rate": 0.000249690368369619, "loss": 0.02, "step": 129390 }, { "epoch": 0.34, "learning_rate": 0.00024968648015324756, "loss": 0.021, "step": 129400 }, { "epoch": 0.34, "learning_rate": 0.0002496825919368761, "loss": 0.0193, "step": 129410 }, { "epoch": 0.34, "learning_rate": 0.0002496787037205046, "loss": 0.0191, "step": 129420 }, { "epoch": 0.34, "learning_rate": 0.00024967481550413316, "loss": 0.0247, "step": 129430 }, { "epoch": 0.34, "learning_rate": 0.0002496709272877617, "loss": 0.0211, "step": 129440 }, { "epoch": 0.34, "learning_rate": 0.00024966703907139024, "loss": 0.0227, "step": 129450 }, { "epoch": 0.34, "learning_rate": 0.00024966315085501876, "loss": 0.0194, "step": 129460 }, { "epoch": 0.34, "learning_rate": 0.00024965926263864727, "loss": 0.0244, "step": 129470 }, { "epoch": 0.34, "learning_rate": 0.00024965537442227584, "loss": 0.0218, "step": 129480 }, { "epoch": 0.34, "learning_rate": 0.00024965148620590435, "loss": 0.0207, "step": 129490 }, { "epoch": 0.34, "learning_rate": 0.0002496475979895329, "loss": 0.024, "step": 129500 }, { "epoch": 0.34, "learning_rate": 0.00024964370977316144, "loss": 0.0211, "step": 129510 }, { "epoch": 0.34, "learning_rate": 0.00024963982155678995, "loss": 0.0178, "step": 129520 }, { "epoch": 0.34, "learning_rate": 0.0002496359333404185, "loss": 0.0166, "step": 129530 }, { "epoch": 0.34, "learning_rate": 0.00024963204512404703, "loss": 0.0151, "step": 129540 }, { "epoch": 0.34, "learning_rate": 0.00024962815690767555, "loss": 0.0205, "step": 129550 }, { "epoch": 0.34, "learning_rate": 0.0002496242686913041, "loss": 0.0232, "step": 129560 }, { "epoch": 0.34, "learning_rate": 0.00024962038047493263, "loss": 0.0232, "step": 129570 }, { "epoch": 0.34, "learning_rate": 0.0002496164922585612, "loss": 0.0257, "step": 129580 }, { "epoch": 0.34, "learning_rate": 0.0002496126040421897, "loss": 0.017, "step": 129590 }, { "epoch": 0.34, "learning_rate": 0.00024960871582581823, "loss": 0.0211, "step": 129600 }, { "epoch": 0.34, "learning_rate": 0.0002496048276094468, "loss": 0.0203, "step": 129610 }, { "epoch": 0.34, "learning_rate": 0.0002496009393930753, "loss": 0.02, "step": 129620 }, { "epoch": 0.34, "learning_rate": 0.0002495970511767039, "loss": 0.0193, "step": 129630 }, { "epoch": 0.34, "learning_rate": 0.0002495931629603324, "loss": 0.0181, "step": 129640 }, { "epoch": 0.34, "learning_rate": 0.00024958927474396097, "loss": 0.0218, "step": 129650 }, { "epoch": 0.34, "learning_rate": 0.0002495853865275895, "loss": 0.0191, "step": 129660 }, { "epoch": 0.34, "learning_rate": 0.000249581498311218, "loss": 0.0202, "step": 129670 }, { "epoch": 0.34, "learning_rate": 0.0002495776100948465, "loss": 0.016, "step": 129680 }, { "epoch": 0.34, "learning_rate": 0.0002495737218784751, "loss": 0.028, "step": 129690 }, { "epoch": 0.34, "learning_rate": 0.0002495698336621036, "loss": 0.0181, "step": 129700 }, { "epoch": 0.34, "learning_rate": 0.00024956594544573216, "loss": 0.0199, "step": 129710 }, { "epoch": 0.34, "learning_rate": 0.0002495620572293607, "loss": 0.0192, "step": 129720 }, { "epoch": 0.34, "learning_rate": 0.00024955816901298924, "loss": 0.0247, "step": 129730 }, { "epoch": 0.34, "learning_rate": 0.00024955428079661776, "loss": 0.021, "step": 129740 }, { "epoch": 0.34, "learning_rate": 0.0002495503925802463, "loss": 0.0299, "step": 129750 }, { "epoch": 0.34, "learning_rate": 0.0002495465043638748, "loss": 0.0207, "step": 129760 }, { "epoch": 0.34, "learning_rate": 0.00024954261614750336, "loss": 0.0235, "step": 129770 }, { "epoch": 0.34, "learning_rate": 0.0002495387279311319, "loss": 0.0247, "step": 129780 }, { "epoch": 0.34, "learning_rate": 0.00024953483971476044, "loss": 0.0201, "step": 129790 }, { "epoch": 0.34, "learning_rate": 0.00024953095149838895, "loss": 0.022, "step": 129800 }, { "epoch": 0.34, "learning_rate": 0.00024952706328201747, "loss": 0.0166, "step": 129810 }, { "epoch": 0.34, "learning_rate": 0.00024952317506564604, "loss": 0.0178, "step": 129820 }, { "epoch": 0.34, "learning_rate": 0.00024951928684927455, "loss": 0.0193, "step": 129830 }, { "epoch": 0.34, "learning_rate": 0.0002495153986329031, "loss": 0.0194, "step": 129840 }, { "epoch": 0.34, "learning_rate": 0.00024951151041653164, "loss": 0.0228, "step": 129850 }, { "epoch": 0.34, "learning_rate": 0.0002495076222001602, "loss": 0.0194, "step": 129860 }, { "epoch": 0.34, "learning_rate": 0.0002495037339837887, "loss": 0.02, "step": 129870 }, { "epoch": 0.34, "learning_rate": 0.00024949984576741723, "loss": 0.0243, "step": 129880 }, { "epoch": 0.34, "learning_rate": 0.00024949595755104575, "loss": 0.0251, "step": 129890 }, { "epoch": 0.34, "learning_rate": 0.0002494920693346743, "loss": 0.0214, "step": 129900 }, { "epoch": 0.34, "learning_rate": 0.00024948818111830283, "loss": 0.0245, "step": 129910 }, { "epoch": 0.34, "learning_rate": 0.0002494842929019314, "loss": 0.0192, "step": 129920 }, { "epoch": 0.34, "learning_rate": 0.0002494804046855599, "loss": 0.0215, "step": 129930 }, { "epoch": 0.34, "learning_rate": 0.0002494765164691885, "loss": 0.0212, "step": 129940 }, { "epoch": 0.34, "learning_rate": 0.000249472628252817, "loss": 0.0188, "step": 129950 }, { "epoch": 0.34, "learning_rate": 0.0002494687400364455, "loss": 0.0179, "step": 129960 }, { "epoch": 0.34, "learning_rate": 0.000249464851820074, "loss": 0.0188, "step": 129970 }, { "epoch": 0.34, "learning_rate": 0.0002494609636037026, "loss": 0.0214, "step": 129980 }, { "epoch": 0.34, "learning_rate": 0.00024945707538733116, "loss": 0.0201, "step": 129990 }, { "epoch": 0.34, "learning_rate": 0.0002494531871709597, "loss": 0.0232, "step": 130000 }, { "epoch": 0.34, "eval_cer": 0.8818048598193629, "eval_loss": 0.014468919485807419, "eval_runtime": 107.45, "eval_samples_per_second": 18.613, "eval_steps_per_second": 4.653, "step": 130000 }, { "epoch": 0.34, "learning_rate": 0.0002494492989545882, "loss": 0.0175, "step": 130010 }, { "epoch": 0.34, "learning_rate": 0.0002494454107382167, "loss": 0.0188, "step": 130020 }, { "epoch": 0.34, "learning_rate": 0.0002494415225218453, "loss": 0.0199, "step": 130030 }, { "epoch": 0.34, "learning_rate": 0.0002494376343054738, "loss": 0.0191, "step": 130040 }, { "epoch": 0.34, "learning_rate": 0.00024943374608910236, "loss": 0.0191, "step": 130050 }, { "epoch": 0.34, "learning_rate": 0.0002494298578727309, "loss": 0.0204, "step": 130060 }, { "epoch": 0.34, "learning_rate": 0.00024942596965635944, "loss": 0.0189, "step": 130070 }, { "epoch": 0.34, "learning_rate": 0.00024942208143998796, "loss": 0.0179, "step": 130080 }, { "epoch": 0.34, "learning_rate": 0.00024941819322361647, "loss": 0.0202, "step": 130090 }, { "epoch": 0.34, "learning_rate": 0.000249414305007245, "loss": 0.0166, "step": 130100 }, { "epoch": 0.34, "learning_rate": 0.00024941041679087356, "loss": 0.0184, "step": 130110 }, { "epoch": 0.34, "learning_rate": 0.00024940652857450207, "loss": 0.0193, "step": 130120 }, { "epoch": 0.34, "learning_rate": 0.00024940264035813064, "loss": 0.0198, "step": 130130 }, { "epoch": 0.34, "learning_rate": 0.00024939875214175915, "loss": 0.0192, "step": 130140 }, { "epoch": 0.34, "learning_rate": 0.0002493948639253877, "loss": 0.0172, "step": 130150 }, { "epoch": 0.34, "learning_rate": 0.00024939097570901624, "loss": 0.0215, "step": 130160 }, { "epoch": 0.34, "learning_rate": 0.00024938708749264475, "loss": 0.0212, "step": 130170 }, { "epoch": 0.34, "learning_rate": 0.0002493831992762733, "loss": 0.0207, "step": 130180 }, { "epoch": 0.34, "learning_rate": 0.00024937931105990183, "loss": 0.018, "step": 130190 }, { "epoch": 0.34, "learning_rate": 0.0002493754228435304, "loss": 0.0207, "step": 130200 }, { "epoch": 0.34, "learning_rate": 0.0002493715346271589, "loss": 0.0171, "step": 130210 }, { "epoch": 0.34, "learning_rate": 0.00024936764641078743, "loss": 0.0253, "step": 130220 }, { "epoch": 0.34, "learning_rate": 0.000249363758194416, "loss": 0.0208, "step": 130230 }, { "epoch": 0.34, "learning_rate": 0.0002493598699780445, "loss": 0.0219, "step": 130240 }, { "epoch": 0.34, "learning_rate": 0.00024935598176167303, "loss": 0.0166, "step": 130250 }, { "epoch": 0.34, "learning_rate": 0.0002493520935453016, "loss": 0.0195, "step": 130260 }, { "epoch": 0.34, "learning_rate": 0.0002493482053289301, "loss": 0.0231, "step": 130270 }, { "epoch": 0.34, "learning_rate": 0.0002493443171125587, "loss": 0.0214, "step": 130280 }, { "epoch": 0.34, "learning_rate": 0.0002493404288961872, "loss": 0.0206, "step": 130290 }, { "epoch": 0.34, "learning_rate": 0.0002493365406798157, "loss": 0.0252, "step": 130300 }, { "epoch": 0.34, "learning_rate": 0.0002493326524634442, "loss": 0.015, "step": 130310 }, { "epoch": 0.34, "learning_rate": 0.0002493287642470728, "loss": 0.0154, "step": 130320 }, { "epoch": 0.34, "learning_rate": 0.00024932487603070136, "loss": 0.0199, "step": 130330 }, { "epoch": 0.34, "learning_rate": 0.0002493209878143299, "loss": 0.0218, "step": 130340 }, { "epoch": 0.34, "learning_rate": 0.0002493170995979584, "loss": 0.0351, "step": 130350 }, { "epoch": 0.34, "learning_rate": 0.00024931321138158696, "loss": 0.0207, "step": 130360 }, { "epoch": 0.34, "learning_rate": 0.0002493093231652155, "loss": 0.0218, "step": 130370 }, { "epoch": 0.34, "learning_rate": 0.000249305434948844, "loss": 0.1019, "step": 130380 }, { "epoch": 0.34, "learning_rate": 0.00024930154673247256, "loss": 0.0271, "step": 130390 }, { "epoch": 0.34, "learning_rate": 0.0002492976585161011, "loss": 0.0184, "step": 130400 }, { "epoch": 0.34, "learning_rate": 0.00024929377029972964, "loss": 0.021, "step": 130410 }, { "epoch": 0.34, "learning_rate": 0.00024928988208335816, "loss": 0.0239, "step": 130420 }, { "epoch": 0.34, "learning_rate": 0.00024928599386698667, "loss": 0.0193, "step": 130430 }, { "epoch": 0.34, "learning_rate": 0.00024928210565061524, "loss": 0.0252, "step": 130440 }, { "epoch": 0.34, "learning_rate": 0.00024927821743424375, "loss": 0.0154, "step": 130450 }, { "epoch": 0.34, "learning_rate": 0.00024927432921787227, "loss": 0.0199, "step": 130460 }, { "epoch": 0.34, "learning_rate": 0.00024927044100150084, "loss": 0.0221, "step": 130470 }, { "epoch": 0.34, "learning_rate": 0.0002492665527851294, "loss": 0.0141, "step": 130480 }, { "epoch": 0.34, "learning_rate": 0.0002492626645687579, "loss": 0.0172, "step": 130490 }, { "epoch": 0.34, "learning_rate": 0.00024925877635238644, "loss": 0.0235, "step": 130500 }, { "epoch": 0.34, "learning_rate": 0.00024925488813601495, "loss": 0.0228, "step": 130510 }, { "epoch": 0.34, "learning_rate": 0.00024925099991964346, "loss": 0.0239, "step": 130520 }, { "epoch": 0.34, "learning_rate": 0.00024924711170327203, "loss": 0.0213, "step": 130530 }, { "epoch": 0.34, "learning_rate": 0.0002492432234869006, "loss": 0.0235, "step": 130540 }, { "epoch": 0.34, "learning_rate": 0.0002492393352705291, "loss": 0.0214, "step": 130550 }, { "epoch": 0.34, "learning_rate": 0.00024923544705415763, "loss": 0.0186, "step": 130560 }, { "epoch": 0.34, "learning_rate": 0.0002492315588377862, "loss": 0.018, "step": 130570 }, { "epoch": 0.34, "learning_rate": 0.0002492276706214147, "loss": 0.0197, "step": 130580 }, { "epoch": 0.34, "learning_rate": 0.00024922378240504323, "loss": 0.0252, "step": 130590 }, { "epoch": 0.34, "learning_rate": 0.0002492198941886718, "loss": 0.0204, "step": 130600 }, { "epoch": 0.34, "learning_rate": 0.0002492160059723003, "loss": 0.0194, "step": 130610 }, { "epoch": 0.34, "learning_rate": 0.0002492121177559289, "loss": 0.0211, "step": 130620 }, { "epoch": 0.34, "learning_rate": 0.0002492082295395574, "loss": 0.0193, "step": 130630 }, { "epoch": 0.34, "learning_rate": 0.0002492043413231859, "loss": 0.0243, "step": 130640 }, { "epoch": 0.34, "learning_rate": 0.0002492004531068145, "loss": 0.0162, "step": 130650 }, { "epoch": 0.34, "learning_rate": 0.000249196564890443, "loss": 0.0184, "step": 130660 }, { "epoch": 0.34, "learning_rate": 0.0002491926766740715, "loss": 0.0253, "step": 130670 }, { "epoch": 0.34, "learning_rate": 0.0002491887884577001, "loss": 0.0179, "step": 130680 }, { "epoch": 0.34, "learning_rate": 0.00024918490024132864, "loss": 0.0198, "step": 130690 }, { "epoch": 0.34, "learning_rate": 0.00024918101202495716, "loss": 0.0197, "step": 130700 }, { "epoch": 0.34, "learning_rate": 0.0002491771238085857, "loss": 0.0204, "step": 130710 }, { "epoch": 0.34, "learning_rate": 0.0002491732355922142, "loss": 0.0152, "step": 130720 }, { "epoch": 0.34, "learning_rate": 0.00024916934737584276, "loss": 0.0218, "step": 130730 }, { "epoch": 0.34, "learning_rate": 0.00024916545915947127, "loss": 0.021, "step": 130740 }, { "epoch": 0.34, "learning_rate": 0.00024916157094309984, "loss": 0.0208, "step": 130750 }, { "epoch": 0.34, "learning_rate": 0.00024915768272672836, "loss": 0.0204, "step": 130760 }, { "epoch": 0.34, "learning_rate": 0.00024915379451035687, "loss": 0.0194, "step": 130770 }, { "epoch": 0.34, "learning_rate": 0.00024914990629398544, "loss": 0.0173, "step": 130780 }, { "epoch": 0.34, "learning_rate": 0.00024914601807761395, "loss": 0.019, "step": 130790 }, { "epoch": 0.34, "learning_rate": 0.00024914212986124247, "loss": 0.0222, "step": 130800 }, { "epoch": 0.34, "learning_rate": 0.00024913824164487104, "loss": 0.0227, "step": 130810 }, { "epoch": 0.34, "learning_rate": 0.0002491343534284996, "loss": 0.0239, "step": 130820 }, { "epoch": 0.34, "learning_rate": 0.0002491304652121281, "loss": 0.0196, "step": 130830 }, { "epoch": 0.34, "learning_rate": 0.00024912657699575663, "loss": 0.0236, "step": 130840 }, { "epoch": 0.34, "learning_rate": 0.00024912268877938515, "loss": 0.0241, "step": 130850 }, { "epoch": 0.34, "learning_rate": 0.0002491188005630137, "loss": 0.0294, "step": 130860 }, { "epoch": 0.34, "learning_rate": 0.00024911491234664223, "loss": 0.0326, "step": 130870 }, { "epoch": 0.34, "learning_rate": 0.0002491110241302708, "loss": 0.0183, "step": 130880 }, { "epoch": 0.34, "learning_rate": 0.0002491071359138993, "loss": 0.0181, "step": 130890 }, { "epoch": 0.34, "learning_rate": 0.0002491032476975279, "loss": 0.0191, "step": 130900 }, { "epoch": 0.34, "learning_rate": 0.0002490993594811564, "loss": 0.0243, "step": 130910 }, { "epoch": 0.34, "learning_rate": 0.0002490954712647849, "loss": 0.0197, "step": 130920 }, { "epoch": 0.34, "learning_rate": 0.00024909158304841343, "loss": 0.0186, "step": 130930 }, { "epoch": 0.34, "learning_rate": 0.000249087694832042, "loss": 0.02, "step": 130940 }, { "epoch": 0.34, "learning_rate": 0.0002490838066156705, "loss": 0.0225, "step": 130950 }, { "epoch": 0.34, "learning_rate": 0.0002490799183992991, "loss": 0.0232, "step": 130960 }, { "epoch": 0.34, "learning_rate": 0.0002490760301829276, "loss": 0.0251, "step": 130970 }, { "epoch": 0.34, "learning_rate": 0.00024907214196655616, "loss": 0.0156, "step": 130980 }, { "epoch": 0.34, "learning_rate": 0.0002490682537501847, "loss": 0.023, "step": 130990 }, { "epoch": 0.34, "learning_rate": 0.0002490643655338132, "loss": 0.0232, "step": 131000 }, { "epoch": 0.34, "eval_cer": 0.8818034601824287, "eval_loss": 0.014057641848921776, "eval_runtime": 107.6812, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 131000 }, { "epoch": 0.34, "learning_rate": 0.0002490604773174417, "loss": 0.0197, "step": 131010 }, { "epoch": 0.34, "learning_rate": 0.0002490565891010703, "loss": 0.0217, "step": 131020 }, { "epoch": 0.34, "learning_rate": 0.00024905270088469884, "loss": 0.023, "step": 131030 }, { "epoch": 0.34, "learning_rate": 0.00024904881266832736, "loss": 0.0172, "step": 131040 }, { "epoch": 0.34, "learning_rate": 0.00024904492445195587, "loss": 0.0207, "step": 131050 }, { "epoch": 0.34, "learning_rate": 0.0002490410362355844, "loss": 0.0194, "step": 131060 }, { "epoch": 0.34, "learning_rate": 0.00024903714801921296, "loss": 0.022, "step": 131070 }, { "epoch": 0.34, "learning_rate": 0.00024903325980284147, "loss": 0.0248, "step": 131080 }, { "epoch": 0.34, "learning_rate": 0.00024902937158647004, "loss": 0.0176, "step": 131090 }, { "epoch": 0.34, "learning_rate": 0.00024902548337009855, "loss": 0.0179, "step": 131100 }, { "epoch": 0.34, "learning_rate": 0.0002490215951537271, "loss": 0.0191, "step": 131110 }, { "epoch": 0.34, "learning_rate": 0.00024901770693735564, "loss": 0.0238, "step": 131120 }, { "epoch": 0.34, "learning_rate": 0.00024901381872098415, "loss": 0.0221, "step": 131130 }, { "epoch": 0.34, "learning_rate": 0.00024900993050461267, "loss": 0.0194, "step": 131140 }, { "epoch": 0.34, "learning_rate": 0.00024900604228824124, "loss": 0.0202, "step": 131150 }, { "epoch": 0.34, "learning_rate": 0.00024900215407186975, "loss": 0.0243, "step": 131160 }, { "epoch": 0.34, "learning_rate": 0.0002489982658554983, "loss": 0.0246, "step": 131170 }, { "epoch": 0.34, "learning_rate": 0.00024899437763912683, "loss": 0.0236, "step": 131180 }, { "epoch": 0.34, "learning_rate": 0.0002489904894227554, "loss": 0.0231, "step": 131190 }, { "epoch": 0.34, "learning_rate": 0.0002489866012063839, "loss": 0.0265, "step": 131200 }, { "epoch": 0.34, "learning_rate": 0.00024898271299001243, "loss": 0.0243, "step": 131210 }, { "epoch": 0.34, "learning_rate": 0.000248978824773641, "loss": 0.0198, "step": 131220 }, { "epoch": 0.34, "learning_rate": 0.0002489749365572695, "loss": 0.02, "step": 131230 }, { "epoch": 0.34, "learning_rate": 0.0002489710483408981, "loss": 0.0212, "step": 131240 }, { "epoch": 0.34, "learning_rate": 0.0002489671601245266, "loss": 0.0206, "step": 131250 }, { "epoch": 0.34, "learning_rate": 0.0002489632719081551, "loss": 0.0242, "step": 131260 }, { "epoch": 0.34, "learning_rate": 0.0002489593836917836, "loss": 0.0182, "step": 131270 }, { "epoch": 0.34, "learning_rate": 0.0002489554954754122, "loss": 0.021, "step": 131280 }, { "epoch": 0.34, "learning_rate": 0.0002489516072590407, "loss": 0.0202, "step": 131290 }, { "epoch": 0.34, "learning_rate": 0.0002489477190426693, "loss": 0.0171, "step": 131300 }, { "epoch": 0.34, "learning_rate": 0.0002489438308262978, "loss": 0.0244, "step": 131310 }, { "epoch": 0.34, "learning_rate": 0.00024893994260992636, "loss": 0.0236, "step": 131320 }, { "epoch": 0.34, "learning_rate": 0.0002489360543935549, "loss": 0.0174, "step": 131330 }, { "epoch": 0.34, "learning_rate": 0.0002489321661771834, "loss": 0.021, "step": 131340 }, { "epoch": 0.34, "learning_rate": 0.0002489282779608119, "loss": 0.0309, "step": 131350 }, { "epoch": 0.34, "learning_rate": 0.0002489243897444405, "loss": 0.0274, "step": 131360 }, { "epoch": 0.34, "learning_rate": 0.00024892050152806904, "loss": 0.0248, "step": 131370 }, { "epoch": 0.34, "learning_rate": 0.00024891661331169756, "loss": 0.0181, "step": 131380 }, { "epoch": 0.34, "learning_rate": 0.00024891272509532607, "loss": 0.0198, "step": 131390 }, { "epoch": 0.34, "learning_rate": 0.00024890883687895464, "loss": 0.018, "step": 131400 }, { "epoch": 0.34, "learning_rate": 0.00024890494866258316, "loss": 0.0204, "step": 131410 }, { "epoch": 0.34, "learning_rate": 0.00024890106044621167, "loss": 0.0238, "step": 131420 }, { "epoch": 0.34, "learning_rate": 0.00024889717222984024, "loss": 0.0193, "step": 131430 }, { "epoch": 0.34, "learning_rate": 0.00024889328401346875, "loss": 0.0192, "step": 131440 }, { "epoch": 0.34, "learning_rate": 0.0002488893957970973, "loss": 0.0235, "step": 131450 }, { "epoch": 0.34, "learning_rate": 0.00024888550758072584, "loss": 0.0193, "step": 131460 }, { "epoch": 0.34, "learning_rate": 0.00024888161936435435, "loss": 0.0233, "step": 131470 }, { "epoch": 0.34, "learning_rate": 0.0002488777311479829, "loss": 0.0183, "step": 131480 }, { "epoch": 0.34, "learning_rate": 0.00024887384293161143, "loss": 0.0217, "step": 131490 }, { "epoch": 0.34, "learning_rate": 0.00024886995471523995, "loss": 0.0279, "step": 131500 }, { "epoch": 0.34, "learning_rate": 0.0002488660664988685, "loss": 0.0225, "step": 131510 }, { "epoch": 0.34, "learning_rate": 0.00024886217828249703, "loss": 0.0184, "step": 131520 }, { "epoch": 0.34, "learning_rate": 0.0002488582900661256, "loss": 0.022, "step": 131530 }, { "epoch": 0.34, "learning_rate": 0.0002488544018497541, "loss": 0.0161, "step": 131540 }, { "epoch": 0.34, "learning_rate": 0.00024885051363338263, "loss": 0.0215, "step": 131550 }, { "epoch": 0.34, "learning_rate": 0.00024884662541701114, "loss": 0.0188, "step": 131560 }, { "epoch": 0.34, "learning_rate": 0.0002488427372006397, "loss": 0.0204, "step": 131570 }, { "epoch": 0.34, "learning_rate": 0.0002488388489842683, "loss": 0.0186, "step": 131580 }, { "epoch": 0.34, "learning_rate": 0.0002488349607678968, "loss": 0.0233, "step": 131590 }, { "epoch": 0.34, "learning_rate": 0.0002488310725515253, "loss": 0.0213, "step": 131600 }, { "epoch": 0.34, "learning_rate": 0.0002488271843351539, "loss": 0.0195, "step": 131610 }, { "epoch": 0.34, "learning_rate": 0.0002488232961187824, "loss": 0.0191, "step": 131620 }, { "epoch": 0.34, "learning_rate": 0.0002488194079024109, "loss": 0.021, "step": 131630 }, { "epoch": 0.34, "learning_rate": 0.0002488155196860395, "loss": 0.0206, "step": 131640 }, { "epoch": 0.34, "learning_rate": 0.000248811631469668, "loss": 0.0297, "step": 131650 }, { "epoch": 0.34, "learning_rate": 0.00024880774325329656, "loss": 0.0209, "step": 131660 }, { "epoch": 0.34, "learning_rate": 0.0002488038550369251, "loss": 0.0245, "step": 131670 }, { "epoch": 0.34, "learning_rate": 0.0002487999668205536, "loss": 0.0215, "step": 131680 }, { "epoch": 0.34, "learning_rate": 0.00024879607860418216, "loss": 0.0237, "step": 131690 }, { "epoch": 0.34, "learning_rate": 0.00024879219038781067, "loss": 0.0248, "step": 131700 }, { "epoch": 0.34, "learning_rate": 0.0002487883021714392, "loss": 0.0216, "step": 131710 }, { "epoch": 0.34, "learning_rate": 0.00024878441395506776, "loss": 0.0255, "step": 131720 }, { "epoch": 0.34, "learning_rate": 0.0002487805257386963, "loss": 0.0177, "step": 131730 }, { "epoch": 0.34, "learning_rate": 0.00024877663752232484, "loss": 0.0201, "step": 131740 }, { "epoch": 0.34, "learning_rate": 0.00024877274930595335, "loss": 0.0216, "step": 131750 }, { "epoch": 0.34, "learning_rate": 0.00024876886108958187, "loss": 0.0192, "step": 131760 }, { "epoch": 0.34, "learning_rate": 0.00024876497287321044, "loss": 0.0173, "step": 131770 }, { "epoch": 0.34, "learning_rate": 0.00024876108465683895, "loss": 0.0177, "step": 131780 }, { "epoch": 0.34, "learning_rate": 0.0002487571964404675, "loss": 0.0171, "step": 131790 }, { "epoch": 0.34, "learning_rate": 0.00024875330822409603, "loss": 0.0196, "step": 131800 }, { "epoch": 0.34, "learning_rate": 0.00024874942000772455, "loss": 0.02, "step": 131810 }, { "epoch": 0.34, "learning_rate": 0.0002487455317913531, "loss": 0.0203, "step": 131820 }, { "epoch": 0.34, "learning_rate": 0.00024874164357498163, "loss": 0.0204, "step": 131830 }, { "epoch": 0.34, "learning_rate": 0.00024873775535861015, "loss": 0.0201, "step": 131840 }, { "epoch": 0.34, "learning_rate": 0.0002487338671422387, "loss": 0.0176, "step": 131850 }, { "epoch": 0.34, "learning_rate": 0.00024872997892586723, "loss": 0.0216, "step": 131860 }, { "epoch": 0.34, "learning_rate": 0.0002487260907094958, "loss": 0.0163, "step": 131870 }, { "epoch": 0.34, "learning_rate": 0.0002487222024931243, "loss": 0.0173, "step": 131880 }, { "epoch": 0.34, "learning_rate": 0.00024871831427675283, "loss": 0.025, "step": 131890 }, { "epoch": 0.34, "learning_rate": 0.0002487144260603814, "loss": 0.0205, "step": 131900 }, { "epoch": 0.34, "learning_rate": 0.0002487105378440099, "loss": 0.021, "step": 131910 }, { "epoch": 0.34, "learning_rate": 0.0002487066496276385, "loss": 0.0164, "step": 131920 }, { "epoch": 0.34, "learning_rate": 0.000248702761411267, "loss": 0.0203, "step": 131930 }, { "epoch": 0.34, "learning_rate": 0.00024869887319489556, "loss": 0.0201, "step": 131940 }, { "epoch": 0.34, "learning_rate": 0.0002486949849785241, "loss": 0.0176, "step": 131950 }, { "epoch": 0.34, "learning_rate": 0.0002486910967621526, "loss": 0.0203, "step": 131960 }, { "epoch": 0.34, "learning_rate": 0.0002486872085457811, "loss": 0.0196, "step": 131970 }, { "epoch": 0.34, "learning_rate": 0.0002486833203294097, "loss": 0.0183, "step": 131980 }, { "epoch": 0.34, "learning_rate": 0.0002486794321130382, "loss": 0.0199, "step": 131990 }, { "epoch": 0.34, "learning_rate": 0.00024867554389666676, "loss": 0.0186, "step": 132000 }, { "epoch": 0.34, "eval_cer": 0.8818034601824287, "eval_loss": 0.014384100213646889, "eval_runtime": 107.6844, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 132000 }, { "epoch": 0.34, "learning_rate": 0.0002486716556802953, "loss": 0.0219, "step": 132010 }, { "epoch": 0.34, "learning_rate": 0.0002486677674639238, "loss": 0.0215, "step": 132020 }, { "epoch": 0.34, "learning_rate": 0.00024866387924755236, "loss": 0.014, "step": 132030 }, { "epoch": 0.34, "learning_rate": 0.00024865999103118087, "loss": 0.0201, "step": 132040 }, { "epoch": 0.34, "learning_rate": 0.0002486561028148094, "loss": 0.0265, "step": 132050 }, { "epoch": 0.34, "learning_rate": 0.00024865221459843795, "loss": 0.0225, "step": 132060 }, { "epoch": 0.34, "learning_rate": 0.0002486483263820665, "loss": 0.0199, "step": 132070 }, { "epoch": 0.34, "learning_rate": 0.00024864443816569504, "loss": 0.0173, "step": 132080 }, { "epoch": 0.34, "learning_rate": 0.00024864054994932355, "loss": 0.0195, "step": 132090 }, { "epoch": 0.34, "learning_rate": 0.00024863666173295207, "loss": 0.0237, "step": 132100 }, { "epoch": 0.34, "learning_rate": 0.00024863277351658064, "loss": 0.0182, "step": 132110 }, { "epoch": 0.34, "learning_rate": 0.00024862888530020915, "loss": 0.0182, "step": 132120 }, { "epoch": 0.34, "learning_rate": 0.0002486249970838377, "loss": 0.0155, "step": 132130 }, { "epoch": 0.34, "learning_rate": 0.00024862110886746623, "loss": 0.0221, "step": 132140 }, { "epoch": 0.34, "learning_rate": 0.0002486172206510948, "loss": 0.0224, "step": 132150 }, { "epoch": 0.34, "learning_rate": 0.0002486133324347233, "loss": 0.0163, "step": 132160 }, { "epoch": 0.34, "learning_rate": 0.00024860944421835183, "loss": 0.0236, "step": 132170 }, { "epoch": 0.34, "learning_rate": 0.00024860555600198035, "loss": 0.0199, "step": 132180 }, { "epoch": 0.34, "learning_rate": 0.0002486016677856089, "loss": 0.0201, "step": 132190 }, { "epoch": 0.34, "learning_rate": 0.00024859777956923743, "loss": 0.0166, "step": 132200 }, { "epoch": 0.34, "learning_rate": 0.000248593891352866, "loss": 0.0163, "step": 132210 }, { "epoch": 0.34, "learning_rate": 0.0002485900031364945, "loss": 0.021, "step": 132220 }, { "epoch": 0.34, "learning_rate": 0.0002485861149201231, "loss": 0.0202, "step": 132230 }, { "epoch": 0.34, "learning_rate": 0.0002485822267037516, "loss": 0.0176, "step": 132240 }, { "epoch": 0.34, "learning_rate": 0.0002485783384873801, "loss": 0.0223, "step": 132250 }, { "epoch": 0.34, "learning_rate": 0.0002485744502710086, "loss": 0.0225, "step": 132260 }, { "epoch": 0.34, "learning_rate": 0.0002485705620546372, "loss": 0.0205, "step": 132270 }, { "epoch": 0.34, "learning_rate": 0.00024856667383826576, "loss": 0.0192, "step": 132280 }, { "epoch": 0.34, "learning_rate": 0.0002485627856218943, "loss": 0.0194, "step": 132290 }, { "epoch": 0.34, "learning_rate": 0.0002485588974055228, "loss": 0.0192, "step": 132300 }, { "epoch": 0.34, "learning_rate": 0.0002485550091891513, "loss": 0.0182, "step": 132310 }, { "epoch": 0.34, "learning_rate": 0.0002485511209727799, "loss": 0.0224, "step": 132320 }, { "epoch": 0.34, "learning_rate": 0.0002485472327564084, "loss": 0.02, "step": 132330 }, { "epoch": 0.34, "learning_rate": 0.00024854334454003696, "loss": 0.0202, "step": 132340 }, { "epoch": 0.34, "learning_rate": 0.00024853945632366547, "loss": 0.0181, "step": 132350 }, { "epoch": 0.34, "learning_rate": 0.00024853556810729404, "loss": 0.0209, "step": 132360 }, { "epoch": 0.34, "learning_rate": 0.00024853167989092256, "loss": 0.0193, "step": 132370 }, { "epoch": 0.34, "learning_rate": 0.00024852779167455107, "loss": 0.02, "step": 132380 }, { "epoch": 0.34, "learning_rate": 0.0002485239034581796, "loss": 0.0223, "step": 132390 }, { "epoch": 0.34, "learning_rate": 0.00024852001524180815, "loss": 0.0206, "step": 132400 }, { "epoch": 0.34, "learning_rate": 0.0002485161270254367, "loss": 0.0152, "step": 132410 }, { "epoch": 0.34, "learning_rate": 0.00024851223880906524, "loss": 0.0231, "step": 132420 }, { "epoch": 0.34, "learning_rate": 0.00024850835059269375, "loss": 0.0174, "step": 132430 }, { "epoch": 0.34, "learning_rate": 0.0002485044623763223, "loss": 0.0193, "step": 132440 }, { "epoch": 0.34, "learning_rate": 0.00024850057415995083, "loss": 0.0246, "step": 132450 }, { "epoch": 0.34, "learning_rate": 0.00024849668594357935, "loss": 0.0179, "step": 132460 }, { "epoch": 0.34, "learning_rate": 0.0002484927977272079, "loss": 0.0207, "step": 132470 }, { "epoch": 0.34, "learning_rate": 0.00024848890951083643, "loss": 0.0174, "step": 132480 }, { "epoch": 0.34, "learning_rate": 0.000248485021294465, "loss": 0.0222, "step": 132490 }, { "epoch": 0.34, "learning_rate": 0.0002484811330780935, "loss": 0.0167, "step": 132500 }, { "epoch": 0.34, "learning_rate": 0.00024847724486172203, "loss": 0.0165, "step": 132510 }, { "epoch": 0.34, "learning_rate": 0.00024847335664535054, "loss": 0.0196, "step": 132520 }, { "epoch": 0.34, "learning_rate": 0.0002484694684289791, "loss": 0.0184, "step": 132530 }, { "epoch": 0.34, "learning_rate": 0.00024846558021260763, "loss": 0.0199, "step": 132540 }, { "epoch": 0.34, "learning_rate": 0.0002484616919962362, "loss": 0.0226, "step": 132550 }, { "epoch": 0.34, "learning_rate": 0.0002484578037798647, "loss": 0.0185, "step": 132560 }, { "epoch": 0.34, "learning_rate": 0.0002484539155634933, "loss": 0.0163, "step": 132570 }, { "epoch": 0.34, "learning_rate": 0.0002484500273471218, "loss": 0.0295, "step": 132580 }, { "epoch": 0.34, "learning_rate": 0.0002484461391307503, "loss": 0.0218, "step": 132590 }, { "epoch": 0.34, "learning_rate": 0.0002484422509143788, "loss": 0.0221, "step": 132600 }, { "epoch": 0.34, "learning_rate": 0.0002484383626980074, "loss": 0.0211, "step": 132610 }, { "epoch": 0.34, "learning_rate": 0.00024843447448163596, "loss": 0.0205, "step": 132620 }, { "epoch": 0.34, "learning_rate": 0.0002484305862652645, "loss": 0.0191, "step": 132630 }, { "epoch": 0.34, "learning_rate": 0.000248426698048893, "loss": 0.0255, "step": 132640 }, { "epoch": 0.34, "learning_rate": 0.00024842280983252156, "loss": 0.0191, "step": 132650 }, { "epoch": 0.34, "learning_rate": 0.0002484189216161501, "loss": 0.0225, "step": 132660 }, { "epoch": 0.34, "learning_rate": 0.0002484150333997786, "loss": 0.0192, "step": 132670 }, { "epoch": 0.34, "learning_rate": 0.00024841114518340716, "loss": 0.0208, "step": 132680 }, { "epoch": 0.34, "learning_rate": 0.00024840725696703567, "loss": 0.0172, "step": 132690 }, { "epoch": 0.34, "learning_rate": 0.00024840336875066424, "loss": 0.0233, "step": 132700 }, { "epoch": 0.34, "learning_rate": 0.00024839948053429275, "loss": 0.0197, "step": 132710 }, { "epoch": 0.34, "learning_rate": 0.00024839559231792127, "loss": 0.0177, "step": 132720 }, { "epoch": 0.34, "learning_rate": 0.00024839170410154984, "loss": 0.0217, "step": 132730 }, { "epoch": 0.34, "learning_rate": 0.00024838781588517835, "loss": 0.0263, "step": 132740 }, { "epoch": 0.34, "learning_rate": 0.00024838392766880687, "loss": 0.0199, "step": 132750 }, { "epoch": 0.34, "learning_rate": 0.00024838003945243544, "loss": 0.024, "step": 132760 }, { "epoch": 0.34, "learning_rate": 0.00024837615123606395, "loss": 0.0186, "step": 132770 }, { "epoch": 0.34, "learning_rate": 0.0002483722630196925, "loss": 0.0164, "step": 132780 }, { "epoch": 0.34, "learning_rate": 0.00024836837480332103, "loss": 0.0183, "step": 132790 }, { "epoch": 0.34, "learning_rate": 0.00024836448658694955, "loss": 0.0205, "step": 132800 }, { "epoch": 0.34, "learning_rate": 0.0002483605983705781, "loss": 0.0255, "step": 132810 }, { "epoch": 0.34, "learning_rate": 0.00024835671015420663, "loss": 0.0201, "step": 132820 }, { "epoch": 0.34, "learning_rate": 0.0002483528219378352, "loss": 0.0171, "step": 132830 }, { "epoch": 0.34, "learning_rate": 0.0002483489337214637, "loss": 0.0185, "step": 132840 }, { "epoch": 0.34, "learning_rate": 0.00024834504550509223, "loss": 0.0183, "step": 132850 }, { "epoch": 0.34, "learning_rate": 0.0002483411572887208, "loss": 0.021, "step": 132860 }, { "epoch": 0.34, "learning_rate": 0.0002483372690723493, "loss": 0.0272, "step": 132870 }, { "epoch": 0.34, "learning_rate": 0.0002483333808559778, "loss": 0.0232, "step": 132880 }, { "epoch": 0.34, "learning_rate": 0.0002483294926396064, "loss": 0.0209, "step": 132890 }, { "epoch": 0.34, "learning_rate": 0.0002483256044232349, "loss": 0.0192, "step": 132900 }, { "epoch": 0.34, "learning_rate": 0.0002483217162068635, "loss": 0.0187, "step": 132910 }, { "epoch": 0.34, "learning_rate": 0.000248317827990492, "loss": 0.0169, "step": 132920 }, { "epoch": 0.34, "learning_rate": 0.0002483139397741205, "loss": 0.0193, "step": 132930 }, { "epoch": 0.34, "learning_rate": 0.0002483100515577491, "loss": 0.0233, "step": 132940 }, { "epoch": 0.34, "learning_rate": 0.0002483061633413776, "loss": 0.023, "step": 132950 }, { "epoch": 0.34, "learning_rate": 0.00024830227512500616, "loss": 0.02, "step": 132960 }, { "epoch": 0.34, "learning_rate": 0.0002482983869086347, "loss": 0.0231, "step": 132970 }, { "epoch": 0.34, "learning_rate": 0.00024829449869226324, "loss": 0.0239, "step": 132980 }, { "epoch": 0.34, "learning_rate": 0.00024829061047589176, "loss": 0.0284, "step": 132990 }, { "epoch": 0.34, "learning_rate": 0.00024828672225952027, "loss": 0.0241, "step": 133000 }, { "epoch": 0.34, "eval_cer": 0.8817880641761527, "eval_loss": 0.013718601316213608, "eval_runtime": 107.4626, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 133000 }, { "epoch": 0.34, "learning_rate": 0.0002482828340431488, "loss": 0.0189, "step": 133010 }, { "epoch": 0.34, "learning_rate": 0.00024827894582677736, "loss": 0.0176, "step": 133020 }, { "epoch": 0.34, "learning_rate": 0.00024827505761040587, "loss": 0.0176, "step": 133030 }, { "epoch": 0.34, "learning_rate": 0.00024827116939403444, "loss": 0.0172, "step": 133040 }, { "epoch": 0.34, "learning_rate": 0.00024826728117766295, "loss": 0.0291, "step": 133050 }, { "epoch": 0.34, "learning_rate": 0.00024826339296129147, "loss": 0.02, "step": 133060 }, { "epoch": 0.34, "learning_rate": 0.00024825950474492004, "loss": 0.0188, "step": 133070 }, { "epoch": 0.34, "learning_rate": 0.00024825561652854855, "loss": 0.0192, "step": 133080 }, { "epoch": 0.34, "learning_rate": 0.00024825172831217707, "loss": 0.0204, "step": 133090 }, { "epoch": 0.35, "learning_rate": 0.00024824784009580563, "loss": 0.0207, "step": 133100 }, { "epoch": 0.35, "learning_rate": 0.0002482439518794342, "loss": 0.0218, "step": 133110 }, { "epoch": 0.35, "learning_rate": 0.0002482400636630627, "loss": 0.0222, "step": 133120 }, { "epoch": 0.35, "learning_rate": 0.00024823617544669123, "loss": 0.0202, "step": 133130 }, { "epoch": 0.35, "learning_rate": 0.00024823228723031975, "loss": 0.0239, "step": 133140 }, { "epoch": 0.35, "learning_rate": 0.0002482283990139483, "loss": 0.0236, "step": 133150 }, { "epoch": 0.35, "learning_rate": 0.00024822451079757683, "loss": 0.0206, "step": 133160 }, { "epoch": 0.35, "learning_rate": 0.0002482206225812054, "loss": 0.0239, "step": 133170 }, { "epoch": 0.35, "learning_rate": 0.0002482167343648339, "loss": 0.0222, "step": 133180 }, { "epoch": 0.35, "learning_rate": 0.0002482128461484625, "loss": 0.0209, "step": 133190 }, { "epoch": 0.35, "learning_rate": 0.000248208957932091, "loss": 0.0202, "step": 133200 }, { "epoch": 0.35, "learning_rate": 0.0002482050697157195, "loss": 0.0233, "step": 133210 }, { "epoch": 0.35, "learning_rate": 0.000248201181499348, "loss": 0.0335, "step": 133220 }, { "epoch": 0.35, "learning_rate": 0.0002481972932829766, "loss": 0.0234, "step": 133230 }, { "epoch": 0.35, "learning_rate": 0.0002481934050666051, "loss": 0.0199, "step": 133240 }, { "epoch": 0.35, "learning_rate": 0.0002481895168502337, "loss": 0.0229, "step": 133250 }, { "epoch": 0.35, "learning_rate": 0.0002481856286338622, "loss": 0.0246, "step": 133260 }, { "epoch": 0.35, "learning_rate": 0.0002481817404174907, "loss": 0.0192, "step": 133270 }, { "epoch": 0.35, "learning_rate": 0.0002481778522011193, "loss": 0.0238, "step": 133280 }, { "epoch": 0.35, "learning_rate": 0.0002481739639847478, "loss": 0.0188, "step": 133290 }, { "epoch": 0.35, "learning_rate": 0.0002481700757683763, "loss": 0.0198, "step": 133300 }, { "epoch": 0.35, "learning_rate": 0.0002481661875520049, "loss": 0.0197, "step": 133310 }, { "epoch": 0.35, "learning_rate": 0.00024816229933563344, "loss": 0.0181, "step": 133320 }, { "epoch": 0.35, "learning_rate": 0.00024815841111926196, "loss": 0.02, "step": 133330 }, { "epoch": 0.35, "learning_rate": 0.00024815452290289047, "loss": 0.0222, "step": 133340 }, { "epoch": 0.35, "learning_rate": 0.000248150634686519, "loss": 0.0215, "step": 133350 }, { "epoch": 0.35, "learning_rate": 0.00024814674647014755, "loss": 0.019, "step": 133360 }, { "epoch": 0.35, "learning_rate": 0.00024814285825377607, "loss": 0.0203, "step": 133370 }, { "epoch": 0.35, "learning_rate": 0.00024813897003740464, "loss": 0.0188, "step": 133380 }, { "epoch": 0.35, "learning_rate": 0.00024813508182103315, "loss": 0.0169, "step": 133390 }, { "epoch": 0.35, "learning_rate": 0.0002481311936046617, "loss": 0.0201, "step": 133400 }, { "epoch": 0.35, "learning_rate": 0.00024812730538829024, "loss": 0.0274, "step": 133410 }, { "epoch": 0.35, "learning_rate": 0.00024812341717191875, "loss": 0.0221, "step": 133420 }, { "epoch": 0.35, "learning_rate": 0.00024811952895554726, "loss": 0.0216, "step": 133430 }, { "epoch": 0.35, "learning_rate": 0.00024811564073917583, "loss": 0.0192, "step": 133440 }, { "epoch": 0.35, "learning_rate": 0.00024811175252280435, "loss": 0.0176, "step": 133450 }, { "epoch": 0.35, "learning_rate": 0.0002481078643064329, "loss": 0.0193, "step": 133460 }, { "epoch": 0.35, "learning_rate": 0.00024810397609006143, "loss": 0.0204, "step": 133470 }, { "epoch": 0.35, "learning_rate": 0.00024810008787369, "loss": 0.0206, "step": 133480 }, { "epoch": 0.35, "learning_rate": 0.0002480961996573185, "loss": 0.025, "step": 133490 }, { "epoch": 0.35, "learning_rate": 0.00024809231144094703, "loss": 0.018, "step": 133500 }, { "epoch": 0.35, "learning_rate": 0.0002480884232245756, "loss": 0.0194, "step": 133510 }, { "epoch": 0.35, "learning_rate": 0.0002480845350082041, "loss": 0.0168, "step": 133520 }, { "epoch": 0.35, "learning_rate": 0.0002480806467918327, "loss": 0.0211, "step": 133530 }, { "epoch": 0.35, "learning_rate": 0.0002480767585754612, "loss": 0.02, "step": 133540 }, { "epoch": 0.35, "learning_rate": 0.0002480728703590897, "loss": 0.0183, "step": 133550 }, { "epoch": 0.35, "learning_rate": 0.0002480689821427182, "loss": 0.0205, "step": 133560 }, { "epoch": 0.35, "learning_rate": 0.0002480650939263468, "loss": 0.0154, "step": 133570 }, { "epoch": 0.35, "learning_rate": 0.0002480612057099753, "loss": 0.0229, "step": 133580 }, { "epoch": 0.35, "learning_rate": 0.0002480573174936039, "loss": 0.0167, "step": 133590 }, { "epoch": 0.35, "learning_rate": 0.0002480534292772324, "loss": 0.0184, "step": 133600 }, { "epoch": 0.35, "learning_rate": 0.00024804954106086096, "loss": 0.018, "step": 133610 }, { "epoch": 0.35, "learning_rate": 0.0002480456528444895, "loss": 0.018, "step": 133620 }, { "epoch": 0.35, "learning_rate": 0.000248041764628118, "loss": 0.0242, "step": 133630 }, { "epoch": 0.35, "learning_rate": 0.0002480378764117465, "loss": 0.0195, "step": 133640 }, { "epoch": 0.35, "learning_rate": 0.00024803398819537507, "loss": 0.0196, "step": 133650 }, { "epoch": 0.35, "learning_rate": 0.00024803009997900364, "loss": 0.0199, "step": 133660 }, { "epoch": 0.35, "learning_rate": 0.00024802621176263216, "loss": 0.0195, "step": 133670 }, { "epoch": 0.35, "learning_rate": 0.00024802232354626067, "loss": 0.0233, "step": 133680 }, { "epoch": 0.35, "learning_rate": 0.00024801843532988924, "loss": 0.0257, "step": 133690 }, { "epoch": 0.35, "learning_rate": 0.00024801454711351775, "loss": 0.0197, "step": 133700 }, { "epoch": 0.35, "learning_rate": 0.00024801065889714627, "loss": 0.0213, "step": 133710 }, { "epoch": 0.35, "learning_rate": 0.00024800677068077484, "loss": 0.0207, "step": 133720 }, { "epoch": 0.35, "learning_rate": 0.00024800288246440335, "loss": 0.0271, "step": 133730 }, { "epoch": 0.35, "learning_rate": 0.0002479989942480319, "loss": 0.0203, "step": 133740 }, { "epoch": 0.35, "learning_rate": 0.00024799510603166043, "loss": 0.0204, "step": 133750 }, { "epoch": 0.35, "learning_rate": 0.00024799121781528895, "loss": 0.0198, "step": 133760 }, { "epoch": 0.35, "learning_rate": 0.00024798732959891746, "loss": 0.0179, "step": 133770 }, { "epoch": 0.35, "learning_rate": 0.00024798344138254603, "loss": 0.0252, "step": 133780 }, { "epoch": 0.35, "learning_rate": 0.00024797955316617455, "loss": 0.0194, "step": 133790 }, { "epoch": 0.35, "learning_rate": 0.0002479756649498031, "loss": 0.0185, "step": 133800 }, { "epoch": 0.35, "learning_rate": 0.00024797177673343163, "loss": 0.0207, "step": 133810 }, { "epoch": 0.35, "learning_rate": 0.0002479678885170602, "loss": 0.0258, "step": 133820 }, { "epoch": 0.35, "learning_rate": 0.0002479640003006887, "loss": 0.0333, "step": 133830 }, { "epoch": 0.35, "learning_rate": 0.00024796011208431723, "loss": 0.0189, "step": 133840 }, { "epoch": 0.35, "learning_rate": 0.00024795622386794574, "loss": 0.0186, "step": 133850 }, { "epoch": 0.35, "learning_rate": 0.0002479523356515743, "loss": 0.0225, "step": 133860 }, { "epoch": 0.35, "learning_rate": 0.0002479484474352029, "loss": 0.096, "step": 133870 }, { "epoch": 0.35, "learning_rate": 0.0002479445592188314, "loss": 0.0277, "step": 133880 }, { "epoch": 0.35, "learning_rate": 0.0002479406710024599, "loss": 0.0213, "step": 133890 }, { "epoch": 0.35, "learning_rate": 0.0002479367827860885, "loss": 0.0272, "step": 133900 }, { "epoch": 0.35, "learning_rate": 0.000247932894569717, "loss": 0.024, "step": 133910 }, { "epoch": 0.35, "learning_rate": 0.0002479290063533455, "loss": 0.0212, "step": 133920 }, { "epoch": 0.35, "learning_rate": 0.0002479251181369741, "loss": 0.02, "step": 133930 }, { "epoch": 0.35, "learning_rate": 0.0002479212299206026, "loss": 0.0205, "step": 133940 }, { "epoch": 0.35, "learning_rate": 0.00024791734170423116, "loss": 0.0214, "step": 133950 }, { "epoch": 0.35, "learning_rate": 0.0002479134534878597, "loss": 0.018, "step": 133960 }, { "epoch": 0.35, "learning_rate": 0.0002479095652714882, "loss": 0.0302, "step": 133970 }, { "epoch": 0.35, "learning_rate": 0.0002479056770551167, "loss": 0.0189, "step": 133980 }, { "epoch": 0.35, "learning_rate": 0.00024790178883874527, "loss": 0.0169, "step": 133990 }, { "epoch": 0.35, "learning_rate": 0.00024789790062237384, "loss": 0.0197, "step": 134000 }, { "epoch": 0.35, "eval_cer": 0.8817558725266665, "eval_loss": 0.014305938966572285, "eval_runtime": 107.3575, "eval_samples_per_second": 18.629, "eval_steps_per_second": 4.657, "step": 134000 }, { "epoch": 0.35, "learning_rate": 0.00024789401240600235, "loss": 0.0234, "step": 134010 }, { "epoch": 0.35, "learning_rate": 0.00024789012418963087, "loss": 0.0222, "step": 134020 }, { "epoch": 0.35, "learning_rate": 0.00024788623597325944, "loss": 0.0188, "step": 134030 }, { "epoch": 0.35, "learning_rate": 0.00024788234775688795, "loss": 0.0258, "step": 134040 }, { "epoch": 0.35, "learning_rate": 0.00024787845954051647, "loss": 0.0175, "step": 134050 }, { "epoch": 0.35, "learning_rate": 0.00024787457132414504, "loss": 0.0185, "step": 134060 }, { "epoch": 0.35, "learning_rate": 0.00024787068310777355, "loss": 0.0167, "step": 134070 }, { "epoch": 0.35, "learning_rate": 0.0002478667948914021, "loss": 0.0151, "step": 134080 }, { "epoch": 0.35, "learning_rate": 0.00024786290667503063, "loss": 0.0213, "step": 134090 }, { "epoch": 0.35, "learning_rate": 0.00024785901845865915, "loss": 0.0181, "step": 134100 }, { "epoch": 0.35, "learning_rate": 0.0002478551302422877, "loss": 0.0192, "step": 134110 }, { "epoch": 0.35, "learning_rate": 0.00024785124202591623, "loss": 0.0191, "step": 134120 }, { "epoch": 0.35, "learning_rate": 0.00024784735380954475, "loss": 0.0223, "step": 134130 }, { "epoch": 0.35, "learning_rate": 0.0002478434655931733, "loss": 0.0249, "step": 134140 }, { "epoch": 0.35, "learning_rate": 0.0002478395773768019, "loss": 0.0263, "step": 134150 }, { "epoch": 0.35, "learning_rate": 0.0002478356891604304, "loss": 0.0172, "step": 134160 }, { "epoch": 0.35, "learning_rate": 0.0002478318009440589, "loss": 0.0192, "step": 134170 }, { "epoch": 0.35, "learning_rate": 0.0002478279127276874, "loss": 0.021, "step": 134180 }, { "epoch": 0.35, "learning_rate": 0.000247824024511316, "loss": 0.0197, "step": 134190 }, { "epoch": 0.35, "learning_rate": 0.0002478201362949445, "loss": 0.0251, "step": 134200 }, { "epoch": 0.35, "learning_rate": 0.0002478162480785731, "loss": 0.0189, "step": 134210 }, { "epoch": 0.35, "learning_rate": 0.0002478123598622016, "loss": 0.0208, "step": 134220 }, { "epoch": 0.35, "learning_rate": 0.0002478084716458301, "loss": 0.0239, "step": 134230 }, { "epoch": 0.35, "learning_rate": 0.0002478045834294587, "loss": 0.0206, "step": 134240 }, { "epoch": 0.35, "learning_rate": 0.0002478006952130872, "loss": 0.0227, "step": 134250 }, { "epoch": 0.35, "learning_rate": 0.0002477968069967157, "loss": 0.0201, "step": 134260 }, { "epoch": 0.35, "learning_rate": 0.0002477929187803443, "loss": 0.0173, "step": 134270 }, { "epoch": 0.35, "learning_rate": 0.0002477890305639728, "loss": 0.0236, "step": 134280 }, { "epoch": 0.35, "learning_rate": 0.00024778514234760136, "loss": 0.0223, "step": 134290 }, { "epoch": 0.35, "learning_rate": 0.00024778125413122987, "loss": 0.0169, "step": 134300 }, { "epoch": 0.35, "learning_rate": 0.0002477773659148584, "loss": 0.0148, "step": 134310 }, { "epoch": 0.35, "learning_rate": 0.00024777347769848696, "loss": 0.019, "step": 134320 }, { "epoch": 0.35, "learning_rate": 0.00024776958948211547, "loss": 0.021, "step": 134330 }, { "epoch": 0.35, "learning_rate": 0.000247765701265744, "loss": 0.0199, "step": 134340 }, { "epoch": 0.35, "learning_rate": 0.00024776181304937255, "loss": 0.0196, "step": 134350 }, { "epoch": 0.35, "learning_rate": 0.0002477579248330011, "loss": 0.0189, "step": 134360 }, { "epoch": 0.35, "learning_rate": 0.00024775403661662964, "loss": 0.0212, "step": 134370 }, { "epoch": 0.35, "learning_rate": 0.00024775014840025815, "loss": 0.0212, "step": 134380 }, { "epoch": 0.35, "learning_rate": 0.00024774626018388667, "loss": 0.0153, "step": 134390 }, { "epoch": 0.35, "learning_rate": 0.00024774237196751523, "loss": 0.019, "step": 134400 }, { "epoch": 0.35, "learning_rate": 0.00024773848375114375, "loss": 0.0214, "step": 134410 }, { "epoch": 0.35, "learning_rate": 0.0002477345955347723, "loss": 0.0176, "step": 134420 }, { "epoch": 0.35, "learning_rate": 0.00024773070731840083, "loss": 0.0231, "step": 134430 }, { "epoch": 0.35, "learning_rate": 0.0002477268191020294, "loss": 0.0193, "step": 134440 }, { "epoch": 0.35, "learning_rate": 0.0002477229308856579, "loss": 0.0196, "step": 134450 }, { "epoch": 0.35, "learning_rate": 0.00024771904266928643, "loss": 0.0195, "step": 134460 }, { "epoch": 0.35, "learning_rate": 0.00024771515445291494, "loss": 0.0208, "step": 134470 }, { "epoch": 0.35, "learning_rate": 0.0002477112662365435, "loss": 0.0219, "step": 134480 }, { "epoch": 0.35, "learning_rate": 0.00024770737802017203, "loss": 0.0233, "step": 134490 }, { "epoch": 0.35, "learning_rate": 0.0002477034898038006, "loss": 0.023, "step": 134500 }, { "epoch": 0.35, "learning_rate": 0.0002476996015874291, "loss": 0.0276, "step": 134510 }, { "epoch": 0.35, "learning_rate": 0.0002476957133710576, "loss": 0.019, "step": 134520 }, { "epoch": 0.35, "learning_rate": 0.0002476918251546862, "loss": 0.0204, "step": 134530 }, { "epoch": 0.35, "learning_rate": 0.0002476879369383147, "loss": 0.0204, "step": 134540 }, { "epoch": 0.35, "learning_rate": 0.0002476840487219433, "loss": 0.0237, "step": 134550 }, { "epoch": 0.35, "learning_rate": 0.0002476801605055718, "loss": 0.0187, "step": 134560 }, { "epoch": 0.35, "learning_rate": 0.00024767627228920036, "loss": 0.0149, "step": 134570 }, { "epoch": 0.35, "learning_rate": 0.0002476723840728289, "loss": 0.0172, "step": 134580 }, { "epoch": 0.35, "learning_rate": 0.0002476684958564574, "loss": 0.022, "step": 134590 }, { "epoch": 0.35, "learning_rate": 0.0002476646076400859, "loss": 0.0168, "step": 134600 }, { "epoch": 0.35, "learning_rate": 0.0002476607194237145, "loss": 0.0272, "step": 134610 }, { "epoch": 0.35, "learning_rate": 0.000247656831207343, "loss": 0.0198, "step": 134620 }, { "epoch": 0.35, "learning_rate": 0.00024765294299097156, "loss": 0.0221, "step": 134630 }, { "epoch": 0.35, "learning_rate": 0.00024764905477460007, "loss": 0.0182, "step": 134640 }, { "epoch": 0.35, "learning_rate": 0.00024764516655822864, "loss": 0.0162, "step": 134650 }, { "epoch": 0.35, "learning_rate": 0.00024764127834185715, "loss": 0.0194, "step": 134660 }, { "epoch": 0.35, "learning_rate": 0.00024763739012548567, "loss": 0.0161, "step": 134670 }, { "epoch": 0.35, "learning_rate": 0.0002476335019091142, "loss": 0.0225, "step": 134680 }, { "epoch": 0.35, "learning_rate": 0.00024762961369274275, "loss": 0.0176, "step": 134690 }, { "epoch": 0.35, "learning_rate": 0.0002476257254763713, "loss": 0.0228, "step": 134700 }, { "epoch": 0.35, "learning_rate": 0.00024762183725999984, "loss": 0.0216, "step": 134710 }, { "epoch": 0.35, "learning_rate": 0.00024761794904362835, "loss": 0.0204, "step": 134720 }, { "epoch": 0.35, "learning_rate": 0.00024761406082725686, "loss": 0.0236, "step": 134730 }, { "epoch": 0.35, "learning_rate": 0.00024761017261088543, "loss": 0.0191, "step": 134740 }, { "epoch": 0.35, "learning_rate": 0.00024760628439451395, "loss": 0.0188, "step": 134750 }, { "epoch": 0.35, "learning_rate": 0.0002476023961781425, "loss": 0.0197, "step": 134760 }, { "epoch": 0.35, "learning_rate": 0.00024759850796177103, "loss": 0.0197, "step": 134770 }, { "epoch": 0.35, "learning_rate": 0.0002475946197453996, "loss": 0.0255, "step": 134780 }, { "epoch": 0.35, "learning_rate": 0.0002475907315290281, "loss": 0.0158, "step": 134790 }, { "epoch": 0.35, "learning_rate": 0.00024758684331265663, "loss": 0.02, "step": 134800 }, { "epoch": 0.35, "learning_rate": 0.00024758295509628514, "loss": 0.0279, "step": 134810 }, { "epoch": 0.35, "learning_rate": 0.0002475790668799137, "loss": 0.0248, "step": 134820 }, { "epoch": 0.35, "learning_rate": 0.0002475751786635422, "loss": 0.0192, "step": 134830 }, { "epoch": 0.35, "learning_rate": 0.0002475712904471708, "loss": 0.0161, "step": 134840 }, { "epoch": 0.35, "learning_rate": 0.0002475674022307993, "loss": 0.0209, "step": 134850 }, { "epoch": 0.35, "learning_rate": 0.0002475635140144279, "loss": 0.0199, "step": 134860 }, { "epoch": 0.35, "learning_rate": 0.0002475596257980564, "loss": 0.0196, "step": 134870 }, { "epoch": 0.35, "learning_rate": 0.0002475557375816849, "loss": 0.0227, "step": 134880 }, { "epoch": 0.35, "learning_rate": 0.0002475518493653134, "loss": 0.0169, "step": 134890 }, { "epoch": 0.35, "learning_rate": 0.000247547961148942, "loss": 0.0208, "step": 134900 }, { "epoch": 0.35, "learning_rate": 0.00024754407293257056, "loss": 0.0254, "step": 134910 }, { "epoch": 0.35, "learning_rate": 0.0002475401847161991, "loss": 0.0204, "step": 134920 }, { "epoch": 0.35, "learning_rate": 0.0002475362964998276, "loss": 0.0184, "step": 134930 }, { "epoch": 0.35, "learning_rate": 0.00024753240828345616, "loss": 0.0191, "step": 134940 }, { "epoch": 0.35, "learning_rate": 0.00024752852006708467, "loss": 0.0216, "step": 134950 }, { "epoch": 0.35, "learning_rate": 0.0002475246318507132, "loss": 0.0157, "step": 134960 }, { "epoch": 0.35, "learning_rate": 0.00024752074363434176, "loss": 0.019, "step": 134970 }, { "epoch": 0.35, "learning_rate": 0.00024751685541797027, "loss": 0.0192, "step": 134980 }, { "epoch": 0.35, "learning_rate": 0.00024751296720159884, "loss": 0.0192, "step": 134990 }, { "epoch": 0.35, "learning_rate": 0.00024750907898522735, "loss": 0.0196, "step": 135000 }, { "epoch": 0.35, "eval_cer": 0.8818258543733756, "eval_loss": 0.014533363282680511, "eval_runtime": 107.3258, "eval_samples_per_second": 18.635, "eval_steps_per_second": 4.659, "step": 135000 }, { "epoch": 0.35, "learning_rate": 0.00024750519076885587, "loss": 0.0254, "step": 135010 }, { "epoch": 0.35, "learning_rate": 0.0002475013025524844, "loss": 0.019, "step": 135020 }, { "epoch": 0.35, "learning_rate": 0.00024749741433611295, "loss": 0.0226, "step": 135030 }, { "epoch": 0.35, "learning_rate": 0.00024749352611974147, "loss": 0.0187, "step": 135040 }, { "epoch": 0.35, "learning_rate": 0.00024748963790337003, "loss": 0.019, "step": 135050 }, { "epoch": 0.35, "learning_rate": 0.00024748574968699855, "loss": 0.0212, "step": 135060 }, { "epoch": 0.35, "learning_rate": 0.0002474818614706271, "loss": 0.0222, "step": 135070 }, { "epoch": 0.35, "learning_rate": 0.00024747797325425563, "loss": 0.0229, "step": 135080 }, { "epoch": 0.35, "learning_rate": 0.00024747408503788415, "loss": 0.0265, "step": 135090 }, { "epoch": 0.35, "learning_rate": 0.0002474701968215127, "loss": 0.0213, "step": 135100 }, { "epoch": 0.35, "learning_rate": 0.00024746630860514123, "loss": 0.0177, "step": 135110 }, { "epoch": 0.35, "learning_rate": 0.0002474624203887698, "loss": 0.0261, "step": 135120 }, { "epoch": 0.35, "learning_rate": 0.0002474585321723983, "loss": 0.0226, "step": 135130 }, { "epoch": 0.35, "learning_rate": 0.00024745464395602683, "loss": 0.0196, "step": 135140 }, { "epoch": 0.35, "learning_rate": 0.0002474507557396554, "loss": 0.0213, "step": 135150 }, { "epoch": 0.35, "learning_rate": 0.0002474468675232839, "loss": 0.0192, "step": 135160 }, { "epoch": 0.35, "learning_rate": 0.0002474429793069124, "loss": 0.0301, "step": 135170 }, { "epoch": 0.35, "learning_rate": 0.000247439091090541, "loss": 0.0226, "step": 135180 }, { "epoch": 0.35, "learning_rate": 0.0002474352028741695, "loss": 0.0235, "step": 135190 }, { "epoch": 0.35, "learning_rate": 0.0002474313146577981, "loss": 0.0198, "step": 135200 }, { "epoch": 0.35, "learning_rate": 0.0002474274264414266, "loss": 0.0214, "step": 135210 }, { "epoch": 0.35, "learning_rate": 0.0002474235382250551, "loss": 0.0174, "step": 135220 }, { "epoch": 0.35, "learning_rate": 0.0002474196500086836, "loss": 0.02, "step": 135230 }, { "epoch": 0.35, "learning_rate": 0.0002474157617923122, "loss": 0.0181, "step": 135240 }, { "epoch": 0.35, "learning_rate": 0.00024741187357594076, "loss": 0.018, "step": 135250 }, { "epoch": 0.35, "learning_rate": 0.0002474079853595693, "loss": 0.0198, "step": 135260 }, { "epoch": 0.35, "learning_rate": 0.0002474040971431978, "loss": 0.0225, "step": 135270 }, { "epoch": 0.35, "learning_rate": 0.00024740020892682636, "loss": 0.0236, "step": 135280 }, { "epoch": 0.35, "learning_rate": 0.00024739632071045487, "loss": 0.0175, "step": 135290 }, { "epoch": 0.35, "learning_rate": 0.0002473924324940834, "loss": 0.0161, "step": 135300 }, { "epoch": 0.35, "learning_rate": 0.00024738854427771195, "loss": 0.0263, "step": 135310 }, { "epoch": 0.35, "learning_rate": 0.00024738465606134047, "loss": 0.0182, "step": 135320 }, { "epoch": 0.35, "learning_rate": 0.00024738076784496904, "loss": 0.0192, "step": 135330 }, { "epoch": 0.35, "learning_rate": 0.00024737687962859755, "loss": 0.0229, "step": 135340 }, { "epoch": 0.35, "learning_rate": 0.00024737299141222607, "loss": 0.0315, "step": 135350 }, { "epoch": 0.35, "learning_rate": 0.00024736910319585464, "loss": 0.0268, "step": 135360 }, { "epoch": 0.35, "learning_rate": 0.00024736521497948315, "loss": 0.0181, "step": 135370 }, { "epoch": 0.35, "learning_rate": 0.00024736132676311166, "loss": 0.0164, "step": 135380 }, { "epoch": 0.35, "learning_rate": 0.00024735743854674023, "loss": 0.0188, "step": 135390 }, { "epoch": 0.35, "learning_rate": 0.0002473535503303688, "loss": 0.0198, "step": 135400 }, { "epoch": 0.35, "learning_rate": 0.0002473496621139973, "loss": 0.0185, "step": 135410 }, { "epoch": 0.35, "learning_rate": 0.00024734577389762583, "loss": 0.0196, "step": 135420 }, { "epoch": 0.35, "learning_rate": 0.00024734188568125435, "loss": 0.02, "step": 135430 }, { "epoch": 0.35, "learning_rate": 0.0002473379974648829, "loss": 0.0183, "step": 135440 }, { "epoch": 0.35, "learning_rate": 0.00024733410924851143, "loss": 0.0273, "step": 135450 }, { "epoch": 0.35, "learning_rate": 0.00024733022103214, "loss": 0.0256, "step": 135460 }, { "epoch": 0.35, "learning_rate": 0.0002473263328157685, "loss": 0.0197, "step": 135470 }, { "epoch": 0.35, "learning_rate": 0.000247322444599397, "loss": 0.0219, "step": 135480 }, { "epoch": 0.35, "learning_rate": 0.0002473185563830256, "loss": 0.0232, "step": 135490 }, { "epoch": 0.35, "learning_rate": 0.0002473146681666541, "loss": 0.0209, "step": 135500 }, { "epoch": 0.35, "learning_rate": 0.0002473107799502826, "loss": 0.0222, "step": 135510 }, { "epoch": 0.35, "learning_rate": 0.0002473068917339112, "loss": 0.0227, "step": 135520 }, { "epoch": 0.35, "learning_rate": 0.0002473030035175397, "loss": 0.0164, "step": 135530 }, { "epoch": 0.35, "learning_rate": 0.0002472991153011683, "loss": 0.0259, "step": 135540 }, { "epoch": 0.35, "learning_rate": 0.0002472952270847968, "loss": 0.0186, "step": 135550 }, { "epoch": 0.35, "learning_rate": 0.0002472913388684253, "loss": 0.0185, "step": 135560 }, { "epoch": 0.35, "learning_rate": 0.0002472874506520539, "loss": 0.0191, "step": 135570 }, { "epoch": 0.35, "learning_rate": 0.0002472835624356824, "loss": 0.0192, "step": 135580 }, { "epoch": 0.35, "learning_rate": 0.0002472796742193109, "loss": 0.0209, "step": 135590 }, { "epoch": 0.35, "learning_rate": 0.00024727578600293947, "loss": 0.0162, "step": 135600 }, { "epoch": 0.35, "learning_rate": 0.00024727189778656804, "loss": 0.0182, "step": 135610 }, { "epoch": 0.35, "learning_rate": 0.00024726800957019656, "loss": 0.0189, "step": 135620 }, { "epoch": 0.35, "learning_rate": 0.00024726412135382507, "loss": 0.027, "step": 135630 }, { "epoch": 0.35, "learning_rate": 0.0002472602331374536, "loss": 0.0158, "step": 135640 }, { "epoch": 0.35, "learning_rate": 0.00024725634492108215, "loss": 0.0216, "step": 135650 }, { "epoch": 0.35, "learning_rate": 0.00024725245670471067, "loss": 0.0161, "step": 135660 }, { "epoch": 0.35, "learning_rate": 0.00024724856848833924, "loss": 0.023, "step": 135670 }, { "epoch": 0.35, "learning_rate": 0.00024724468027196775, "loss": 0.0194, "step": 135680 }, { "epoch": 0.35, "learning_rate": 0.0002472407920555963, "loss": 0.0152, "step": 135690 }, { "epoch": 0.35, "learning_rate": 0.00024723690383922483, "loss": 0.0186, "step": 135700 }, { "epoch": 0.35, "learning_rate": 0.00024723301562285335, "loss": 0.0247, "step": 135710 }, { "epoch": 0.35, "learning_rate": 0.00024722912740648186, "loss": 0.0223, "step": 135720 }, { "epoch": 0.35, "learning_rate": 0.00024722523919011043, "loss": 0.018, "step": 135730 }, { "epoch": 0.35, "learning_rate": 0.000247221350973739, "loss": 0.019, "step": 135740 }, { "epoch": 0.35, "learning_rate": 0.0002472174627573675, "loss": 0.0253, "step": 135750 }, { "epoch": 0.35, "learning_rate": 0.00024721357454099603, "loss": 0.0202, "step": 135760 }, { "epoch": 0.35, "learning_rate": 0.00024720968632462454, "loss": 0.0213, "step": 135770 }, { "epoch": 0.35, "learning_rate": 0.0002472057981082531, "loss": 0.0212, "step": 135780 }, { "epoch": 0.35, "learning_rate": 0.00024720190989188163, "loss": 0.0192, "step": 135790 }, { "epoch": 0.35, "learning_rate": 0.0002471980216755102, "loss": 0.0169, "step": 135800 }, { "epoch": 0.35, "learning_rate": 0.0002471941334591387, "loss": 0.0173, "step": 135810 }, { "epoch": 0.35, "learning_rate": 0.0002471902452427673, "loss": 0.0198, "step": 135820 }, { "epoch": 0.35, "learning_rate": 0.0002471863570263958, "loss": 0.0205, "step": 135830 }, { "epoch": 0.35, "learning_rate": 0.0002471824688100243, "loss": 0.024, "step": 135840 }, { "epoch": 0.35, "learning_rate": 0.0002471785805936528, "loss": 0.0199, "step": 135850 }, { "epoch": 0.35, "learning_rate": 0.0002471746923772814, "loss": 0.0264, "step": 135860 }, { "epoch": 0.35, "learning_rate": 0.0002471708041609099, "loss": 0.0166, "step": 135870 }, { "epoch": 0.35, "learning_rate": 0.0002471669159445385, "loss": 0.0195, "step": 135880 }, { "epoch": 0.35, "learning_rate": 0.000247163027728167, "loss": 0.0234, "step": 135890 }, { "epoch": 0.35, "learning_rate": 0.00024715913951179556, "loss": 0.0211, "step": 135900 }, { "epoch": 0.35, "learning_rate": 0.0002471552512954241, "loss": 0.0157, "step": 135910 }, { "epoch": 0.35, "learning_rate": 0.0002471513630790526, "loss": 0.0195, "step": 135920 }, { "epoch": 0.35, "learning_rate": 0.0002471474748626811, "loss": 0.022, "step": 135930 }, { "epoch": 0.35, "learning_rate": 0.00024714358664630967, "loss": 0.0199, "step": 135940 }, { "epoch": 0.35, "learning_rate": 0.00024713969842993824, "loss": 0.0205, "step": 135950 }, { "epoch": 0.35, "learning_rate": 0.00024713581021356675, "loss": 0.0183, "step": 135960 }, { "epoch": 0.35, "learning_rate": 0.00024713192199719527, "loss": 0.0178, "step": 135970 }, { "epoch": 0.35, "learning_rate": 0.0002471280337808238, "loss": 0.0184, "step": 135980 }, { "epoch": 0.35, "learning_rate": 0.00024712414556445235, "loss": 0.0195, "step": 135990 }, { "epoch": 0.35, "learning_rate": 0.00024712025734808087, "loss": 0.0224, "step": 136000 }, { "epoch": 0.35, "eval_cer": 0.8818034601824287, "eval_loss": 0.013970781117677689, "eval_runtime": 107.2477, "eval_samples_per_second": 18.648, "eval_steps_per_second": 4.662, "step": 136000 }, { "epoch": 0.35, "learning_rate": 0.00024711636913170944, "loss": 0.0188, "step": 136010 }, { "epoch": 0.35, "learning_rate": 0.00024711248091533795, "loss": 0.021, "step": 136020 }, { "epoch": 0.35, "learning_rate": 0.0002471085926989665, "loss": 0.0186, "step": 136030 }, { "epoch": 0.35, "learning_rate": 0.00024710470448259503, "loss": 0.0191, "step": 136040 }, { "epoch": 0.35, "learning_rate": 0.00024710081626622355, "loss": 0.0254, "step": 136050 }, { "epoch": 0.35, "learning_rate": 0.00024709692804985206, "loss": 0.0232, "step": 136060 }, { "epoch": 0.35, "learning_rate": 0.00024709303983348063, "loss": 0.0216, "step": 136070 }, { "epoch": 0.35, "learning_rate": 0.00024708915161710915, "loss": 0.0212, "step": 136080 }, { "epoch": 0.35, "learning_rate": 0.0002470852634007377, "loss": 0.0164, "step": 136090 }, { "epoch": 0.35, "learning_rate": 0.00024708137518436623, "loss": 0.0183, "step": 136100 }, { "epoch": 0.35, "learning_rate": 0.0002470774869679948, "loss": 0.0187, "step": 136110 }, { "epoch": 0.35, "learning_rate": 0.0002470735987516233, "loss": 0.0187, "step": 136120 }, { "epoch": 0.35, "learning_rate": 0.0002470697105352518, "loss": 0.0157, "step": 136130 }, { "epoch": 0.35, "learning_rate": 0.0002470658223188804, "loss": 0.0174, "step": 136140 }, { "epoch": 0.35, "learning_rate": 0.0002470619341025089, "loss": 0.0138, "step": 136150 }, { "epoch": 0.35, "learning_rate": 0.0002470580458861375, "loss": 0.0188, "step": 136160 }, { "epoch": 0.35, "learning_rate": 0.000247054157669766, "loss": 0.0201, "step": 136170 }, { "epoch": 0.35, "learning_rate": 0.0002470502694533945, "loss": 0.017, "step": 136180 }, { "epoch": 0.35, "learning_rate": 0.0002470463812370231, "loss": 0.0185, "step": 136190 }, { "epoch": 0.35, "learning_rate": 0.0002470424930206516, "loss": 0.0238, "step": 136200 }, { "epoch": 0.35, "learning_rate": 0.0002470386048042801, "loss": 0.0228, "step": 136210 }, { "epoch": 0.35, "learning_rate": 0.0002470347165879087, "loss": 0.0263, "step": 136220 }, { "epoch": 0.35, "learning_rate": 0.0002470308283715372, "loss": 0.0205, "step": 136230 }, { "epoch": 0.35, "learning_rate": 0.00024702694015516576, "loss": 0.0233, "step": 136240 }, { "epoch": 0.35, "learning_rate": 0.00024702305193879427, "loss": 0.018, "step": 136250 }, { "epoch": 0.35, "learning_rate": 0.0002470191637224228, "loss": 0.0175, "step": 136260 }, { "epoch": 0.35, "learning_rate": 0.0002470152755060513, "loss": 0.0227, "step": 136270 }, { "epoch": 0.35, "learning_rate": 0.00024701138728967987, "loss": 0.0217, "step": 136280 }, { "epoch": 0.35, "learning_rate": 0.00024700749907330844, "loss": 0.0188, "step": 136290 }, { "epoch": 0.35, "learning_rate": 0.00024700361085693695, "loss": 0.0199, "step": 136300 }, { "epoch": 0.35, "learning_rate": 0.00024699972264056547, "loss": 0.0264, "step": 136310 }, { "epoch": 0.35, "learning_rate": 0.00024699583442419404, "loss": 0.0186, "step": 136320 }, { "epoch": 0.35, "learning_rate": 0.00024699194620782255, "loss": 0.0209, "step": 136330 }, { "epoch": 0.35, "learning_rate": 0.00024698805799145107, "loss": 0.0217, "step": 136340 }, { "epoch": 0.35, "learning_rate": 0.00024698416977507963, "loss": 0.0215, "step": 136350 }, { "epoch": 0.35, "learning_rate": 0.00024698028155870815, "loss": 0.0181, "step": 136360 }, { "epoch": 0.35, "learning_rate": 0.0002469763933423367, "loss": 0.0204, "step": 136370 }, { "epoch": 0.35, "learning_rate": 0.00024697250512596523, "loss": 0.0192, "step": 136380 }, { "epoch": 0.35, "learning_rate": 0.00024696861690959375, "loss": 0.0202, "step": 136390 }, { "epoch": 0.35, "learning_rate": 0.0002469647286932223, "loss": 0.0198, "step": 136400 }, { "epoch": 0.35, "learning_rate": 0.00024696084047685083, "loss": 0.021, "step": 136410 }, { "epoch": 0.35, "learning_rate": 0.00024695695226047934, "loss": 0.0192, "step": 136420 }, { "epoch": 0.35, "learning_rate": 0.0002469530640441079, "loss": 0.02, "step": 136430 }, { "epoch": 0.35, "learning_rate": 0.0002469491758277365, "loss": 0.0186, "step": 136440 }, { "epoch": 0.35, "learning_rate": 0.000246945287611365, "loss": 0.0255, "step": 136450 }, { "epoch": 0.35, "learning_rate": 0.0002469413993949935, "loss": 0.0192, "step": 136460 }, { "epoch": 0.35, "learning_rate": 0.000246937511178622, "loss": 0.0191, "step": 136470 }, { "epoch": 0.35, "learning_rate": 0.00024693362296225054, "loss": 0.0182, "step": 136480 }, { "epoch": 0.35, "learning_rate": 0.0002469297347458791, "loss": 0.0209, "step": 136490 }, { "epoch": 0.35, "learning_rate": 0.0002469258465295077, "loss": 0.0217, "step": 136500 }, { "epoch": 0.35, "learning_rate": 0.0002469219583131362, "loss": 0.022, "step": 136510 }, { "epoch": 0.35, "learning_rate": 0.0002469180700967647, "loss": 0.021, "step": 136520 }, { "epoch": 0.35, "learning_rate": 0.0002469141818803933, "loss": 0.0167, "step": 136530 }, { "epoch": 0.35, "learning_rate": 0.0002469102936640218, "loss": 0.0191, "step": 136540 }, { "epoch": 0.35, "learning_rate": 0.0002469064054476503, "loss": 0.021, "step": 136550 }, { "epoch": 0.35, "learning_rate": 0.0002469025172312789, "loss": 0.022, "step": 136560 }, { "epoch": 0.35, "learning_rate": 0.0002468986290149074, "loss": 0.0214, "step": 136570 }, { "epoch": 0.35, "learning_rate": 0.00024689474079853596, "loss": 0.0209, "step": 136580 }, { "epoch": 0.35, "learning_rate": 0.00024689085258216447, "loss": 0.0171, "step": 136590 }, { "epoch": 0.35, "learning_rate": 0.000246886964365793, "loss": 0.0187, "step": 136600 }, { "epoch": 0.35, "learning_rate": 0.00024688307614942155, "loss": 0.0168, "step": 136610 }, { "epoch": 0.35, "learning_rate": 0.00024687918793305007, "loss": 0.0266, "step": 136620 }, { "epoch": 0.35, "learning_rate": 0.0002468752997166786, "loss": 0.0191, "step": 136630 }, { "epoch": 0.35, "learning_rate": 0.00024687141150030715, "loss": 0.0212, "step": 136640 }, { "epoch": 0.35, "learning_rate": 0.0002468675232839357, "loss": 0.0217, "step": 136650 }, { "epoch": 0.35, "learning_rate": 0.00024686363506756424, "loss": 0.0259, "step": 136660 }, { "epoch": 0.35, "learning_rate": 0.00024685974685119275, "loss": 0.0219, "step": 136670 }, { "epoch": 0.35, "learning_rate": 0.00024685585863482126, "loss": 0.0205, "step": 136680 }, { "epoch": 0.35, "learning_rate": 0.00024685197041844983, "loss": 0.0196, "step": 136690 }, { "epoch": 0.35, "learning_rate": 0.00024684808220207835, "loss": 0.019, "step": 136700 }, { "epoch": 0.35, "learning_rate": 0.0002468441939857069, "loss": 0.0249, "step": 136710 }, { "epoch": 0.35, "learning_rate": 0.00024684030576933543, "loss": 0.0221, "step": 136720 }, { "epoch": 0.35, "learning_rate": 0.00024683641755296395, "loss": 0.0183, "step": 136730 }, { "epoch": 0.35, "learning_rate": 0.0002468325293365925, "loss": 0.0235, "step": 136740 }, { "epoch": 0.35, "learning_rate": 0.00024682864112022103, "loss": 0.0176, "step": 136750 }, { "epoch": 0.35, "learning_rate": 0.00024682475290384954, "loss": 0.0196, "step": 136760 }, { "epoch": 0.35, "learning_rate": 0.0002468208646874781, "loss": 0.023, "step": 136770 }, { "epoch": 0.35, "learning_rate": 0.0002468169764711066, "loss": 0.0164, "step": 136780 }, { "epoch": 0.35, "learning_rate": 0.0002468130882547352, "loss": 0.0252, "step": 136790 }, { "epoch": 0.35, "learning_rate": 0.0002468092000383637, "loss": 0.0229, "step": 136800 }, { "epoch": 0.35, "learning_rate": 0.0002468053118219922, "loss": 0.0198, "step": 136810 }, { "epoch": 0.35, "learning_rate": 0.0002468014236056208, "loss": 0.0225, "step": 136820 }, { "epoch": 0.35, "learning_rate": 0.0002467975353892493, "loss": 0.0171, "step": 136830 }, { "epoch": 0.35, "learning_rate": 0.0002467936471728779, "loss": 0.0171, "step": 136840 }, { "epoch": 0.35, "learning_rate": 0.0002467897589565064, "loss": 0.0238, "step": 136850 }, { "epoch": 0.35, "learning_rate": 0.00024678587074013496, "loss": 0.0194, "step": 136860 }, { "epoch": 0.35, "learning_rate": 0.0002467819825237635, "loss": 0.0233, "step": 136870 }, { "epoch": 0.35, "learning_rate": 0.000246778094307392, "loss": 0.0209, "step": 136880 }, { "epoch": 0.35, "learning_rate": 0.0002467742060910205, "loss": 0.0178, "step": 136890 }, { "epoch": 0.35, "learning_rate": 0.00024677031787464907, "loss": 0.0235, "step": 136900 }, { "epoch": 0.35, "learning_rate": 0.0002467664296582776, "loss": 0.0217, "step": 136910 }, { "epoch": 0.35, "learning_rate": 0.00024676254144190616, "loss": 0.0262, "step": 136920 }, { "epoch": 0.35, "learning_rate": 0.00024675865322553467, "loss": 0.0199, "step": 136930 }, { "epoch": 0.35, "learning_rate": 0.00024675476500916324, "loss": 0.017, "step": 136940 }, { "epoch": 0.35, "learning_rate": 0.00024675087679279175, "loss": 0.0197, "step": 136950 }, { "epoch": 0.36, "learning_rate": 0.00024674698857642027, "loss": 0.0187, "step": 136960 }, { "epoch": 0.36, "learning_rate": 0.0002467431003600488, "loss": 0.0239, "step": 136970 }, { "epoch": 0.36, "learning_rate": 0.00024673921214367735, "loss": 0.025, "step": 136980 }, { "epoch": 0.36, "learning_rate": 0.0002467353239273059, "loss": 0.0183, "step": 136990 }, { "epoch": 0.36, "learning_rate": 0.00024673143571093443, "loss": 0.0171, "step": 137000 }, { "epoch": 0.36, "eval_cer": 0.8817684692590742, "eval_loss": 0.014788404107093811, "eval_runtime": 107.1104, "eval_samples_per_second": 18.672, "eval_steps_per_second": 4.668, "step": 137000 }, { "epoch": 0.36, "learning_rate": 0.00024672754749456295, "loss": 0.0182, "step": 137010 }, { "epoch": 0.36, "learning_rate": 0.00024672365927819146, "loss": 0.0249, "step": 137020 }, { "epoch": 0.36, "learning_rate": 0.00024671977106182003, "loss": 0.0182, "step": 137030 }, { "epoch": 0.36, "learning_rate": 0.00024671588284544855, "loss": 0.0198, "step": 137040 }, { "epoch": 0.36, "learning_rate": 0.0002467119946290771, "loss": 0.019, "step": 137050 }, { "epoch": 0.36, "learning_rate": 0.00024670810641270563, "loss": 0.0227, "step": 137060 }, { "epoch": 0.36, "learning_rate": 0.0002467042181963342, "loss": 0.0217, "step": 137070 }, { "epoch": 0.36, "learning_rate": 0.0002467003299799627, "loss": 0.0237, "step": 137080 }, { "epoch": 0.36, "learning_rate": 0.00024669644176359123, "loss": 0.0211, "step": 137090 }, { "epoch": 0.36, "learning_rate": 0.00024669255354721974, "loss": 0.0221, "step": 137100 }, { "epoch": 0.36, "learning_rate": 0.0002466886653308483, "loss": 0.0206, "step": 137110 }, { "epoch": 0.36, "learning_rate": 0.0002466847771144768, "loss": 0.0215, "step": 137120 }, { "epoch": 0.36, "learning_rate": 0.0002466808888981054, "loss": 0.0209, "step": 137130 }, { "epoch": 0.36, "learning_rate": 0.0002466770006817339, "loss": 0.0268, "step": 137140 }, { "epoch": 0.36, "learning_rate": 0.0002466731124653625, "loss": 0.0247, "step": 137150 }, { "epoch": 0.36, "learning_rate": 0.000246669224248991, "loss": 0.02, "step": 137160 }, { "epoch": 0.36, "learning_rate": 0.0002466653360326195, "loss": 0.0155, "step": 137170 }, { "epoch": 0.36, "learning_rate": 0.000246661447816248, "loss": 0.0213, "step": 137180 }, { "epoch": 0.36, "learning_rate": 0.0002466575595998766, "loss": 0.0186, "step": 137190 }, { "epoch": 0.36, "learning_rate": 0.00024665367138350516, "loss": 0.0199, "step": 137200 }, { "epoch": 0.36, "learning_rate": 0.00024664978316713367, "loss": 0.0165, "step": 137210 }, { "epoch": 0.36, "learning_rate": 0.0002466458949507622, "loss": 0.0223, "step": 137220 }, { "epoch": 0.36, "learning_rate": 0.0002466420067343907, "loss": 0.0173, "step": 137230 }, { "epoch": 0.36, "learning_rate": 0.00024663811851801927, "loss": 0.022, "step": 137240 }, { "epoch": 0.36, "learning_rate": 0.0002466342303016478, "loss": 0.0213, "step": 137250 }, { "epoch": 0.36, "learning_rate": 0.00024663034208527635, "loss": 0.0254, "step": 137260 }, { "epoch": 0.36, "learning_rate": 0.00024662645386890487, "loss": 0.0207, "step": 137270 }, { "epoch": 0.36, "learning_rate": 0.00024662256565253344, "loss": 0.022, "step": 137280 }, { "epoch": 0.36, "learning_rate": 0.00024661867743616195, "loss": 0.0177, "step": 137290 }, { "epoch": 0.36, "learning_rate": 0.00024661478921979047, "loss": 0.0208, "step": 137300 }, { "epoch": 0.36, "learning_rate": 0.000246610901003419, "loss": 0.02, "step": 137310 }, { "epoch": 0.36, "learning_rate": 0.00024660701278704755, "loss": 0.0202, "step": 137320 }, { "epoch": 0.36, "learning_rate": 0.0002466031245706761, "loss": 0.0242, "step": 137330 }, { "epoch": 0.36, "learning_rate": 0.00024659923635430463, "loss": 0.0181, "step": 137340 }, { "epoch": 0.36, "learning_rate": 0.00024659534813793315, "loss": 0.0177, "step": 137350 }, { "epoch": 0.36, "learning_rate": 0.0002465914599215617, "loss": 0.0194, "step": 137360 }, { "epoch": 0.36, "learning_rate": 0.00024658757170519023, "loss": 0.0221, "step": 137370 }, { "epoch": 0.36, "learning_rate": 0.00024658368348881875, "loss": 0.0188, "step": 137380 }, { "epoch": 0.36, "learning_rate": 0.0002465797952724473, "loss": 0.0175, "step": 137390 }, { "epoch": 0.36, "learning_rate": 0.00024657590705607583, "loss": 0.016, "step": 137400 }, { "epoch": 0.36, "learning_rate": 0.0002465720188397044, "loss": 0.0196, "step": 137410 }, { "epoch": 0.36, "learning_rate": 0.0002465681306233329, "loss": 0.0167, "step": 137420 }, { "epoch": 0.36, "learning_rate": 0.0002465642424069614, "loss": 0.0236, "step": 137430 }, { "epoch": 0.36, "learning_rate": 0.00024656035419059, "loss": 0.0182, "step": 137440 }, { "epoch": 0.36, "learning_rate": 0.0002465564659742185, "loss": 0.0177, "step": 137450 }, { "epoch": 0.36, "learning_rate": 0.000246552577757847, "loss": 0.0224, "step": 137460 }, { "epoch": 0.36, "learning_rate": 0.0002465486895414756, "loss": 0.0223, "step": 137470 }, { "epoch": 0.36, "learning_rate": 0.0002465448013251041, "loss": 0.0168, "step": 137480 }, { "epoch": 0.36, "learning_rate": 0.0002465409131087327, "loss": 0.0205, "step": 137490 }, { "epoch": 0.36, "learning_rate": 0.0002465370248923612, "loss": 0.0188, "step": 137500 }, { "epoch": 0.36, "learning_rate": 0.0002465331366759897, "loss": 0.0169, "step": 137510 }, { "epoch": 0.36, "learning_rate": 0.0002465292484596182, "loss": 0.0165, "step": 137520 }, { "epoch": 0.36, "learning_rate": 0.0002465253602432468, "loss": 0.0172, "step": 137530 }, { "epoch": 0.36, "learning_rate": 0.00024652147202687536, "loss": 0.0214, "step": 137540 }, { "epoch": 0.36, "learning_rate": 0.00024651758381050387, "loss": 0.0186, "step": 137550 }, { "epoch": 0.36, "learning_rate": 0.0002465136955941324, "loss": 0.0241, "step": 137560 }, { "epoch": 0.36, "learning_rate": 0.00024650980737776095, "loss": 0.0189, "step": 137570 }, { "epoch": 0.36, "learning_rate": 0.00024650591916138947, "loss": 0.0223, "step": 137580 }, { "epoch": 0.36, "learning_rate": 0.000246502030945018, "loss": 0.0218, "step": 137590 }, { "epoch": 0.36, "learning_rate": 0.00024649814272864655, "loss": 0.0206, "step": 137600 }, { "epoch": 0.36, "learning_rate": 0.00024649425451227507, "loss": 0.0172, "step": 137610 }, { "epoch": 0.36, "learning_rate": 0.00024649036629590364, "loss": 0.0308, "step": 137620 }, { "epoch": 0.36, "learning_rate": 0.00024648647807953215, "loss": 0.0273, "step": 137630 }, { "epoch": 0.36, "learning_rate": 0.00024648258986316067, "loss": 0.0213, "step": 137640 }, { "epoch": 0.36, "learning_rate": 0.00024647870164678923, "loss": 0.0264, "step": 137650 }, { "epoch": 0.36, "learning_rate": 0.00024647481343041775, "loss": 0.017, "step": 137660 }, { "epoch": 0.36, "learning_rate": 0.00024647092521404626, "loss": 0.0193, "step": 137670 }, { "epoch": 0.36, "learning_rate": 0.00024646703699767483, "loss": 0.0182, "step": 137680 }, { "epoch": 0.36, "learning_rate": 0.0002464631487813034, "loss": 0.02, "step": 137690 }, { "epoch": 0.36, "learning_rate": 0.0002464592605649319, "loss": 0.0187, "step": 137700 }, { "epoch": 0.36, "learning_rate": 0.00024645537234856043, "loss": 0.0213, "step": 137710 }, { "epoch": 0.36, "learning_rate": 0.00024645148413218894, "loss": 0.0213, "step": 137720 }, { "epoch": 0.36, "learning_rate": 0.0002464475959158175, "loss": 0.0195, "step": 137730 }, { "epoch": 0.36, "learning_rate": 0.00024644370769944603, "loss": 0.0218, "step": 137740 }, { "epoch": 0.36, "learning_rate": 0.0002464398194830746, "loss": 0.0196, "step": 137750 }, { "epoch": 0.36, "learning_rate": 0.0002464359312667031, "loss": 0.0201, "step": 137760 }, { "epoch": 0.36, "learning_rate": 0.0002464320430503316, "loss": 0.0206, "step": 137770 }, { "epoch": 0.36, "learning_rate": 0.0002464281548339602, "loss": 0.0198, "step": 137780 }, { "epoch": 0.36, "learning_rate": 0.0002464242666175887, "loss": 0.0235, "step": 137790 }, { "epoch": 0.36, "learning_rate": 0.0002464203784012172, "loss": 0.0202, "step": 137800 }, { "epoch": 0.36, "learning_rate": 0.0002464164901848458, "loss": 0.0227, "step": 137810 }, { "epoch": 0.36, "learning_rate": 0.0002464126019684743, "loss": 0.021, "step": 137820 }, { "epoch": 0.36, "learning_rate": 0.0002464087137521029, "loss": 0.0181, "step": 137830 }, { "epoch": 0.36, "learning_rate": 0.0002464048255357314, "loss": 0.016, "step": 137840 }, { "epoch": 0.36, "learning_rate": 0.0002464009373193599, "loss": 0.0288, "step": 137850 }, { "epoch": 0.36, "learning_rate": 0.00024639704910298847, "loss": 0.0218, "step": 137860 }, { "epoch": 0.36, "learning_rate": 0.000246393160886617, "loss": 0.0156, "step": 137870 }, { "epoch": 0.36, "learning_rate": 0.00024638927267024556, "loss": 0.0209, "step": 137880 }, { "epoch": 0.36, "learning_rate": 0.00024638538445387407, "loss": 0.0216, "step": 137890 }, { "epoch": 0.36, "learning_rate": 0.00024638149623750264, "loss": 0.0212, "step": 137900 }, { "epoch": 0.36, "learning_rate": 0.00024637760802113115, "loss": 0.0215, "step": 137910 }, { "epoch": 0.36, "learning_rate": 0.00024637371980475967, "loss": 0.0198, "step": 137920 }, { "epoch": 0.36, "learning_rate": 0.0002463698315883882, "loss": 0.0178, "step": 137930 }, { "epoch": 0.36, "learning_rate": 0.00024636594337201675, "loss": 0.021, "step": 137940 }, { "epoch": 0.36, "learning_rate": 0.00024636205515564527, "loss": 0.017, "step": 137950 }, { "epoch": 0.36, "learning_rate": 0.00024635816693927383, "loss": 0.0229, "step": 137960 }, { "epoch": 0.36, "learning_rate": 0.00024635427872290235, "loss": 0.0217, "step": 137970 }, { "epoch": 0.36, "learning_rate": 0.00024635039050653086, "loss": 0.0227, "step": 137980 }, { "epoch": 0.36, "learning_rate": 0.00024634650229015943, "loss": 0.0214, "step": 137990 }, { "epoch": 0.36, "learning_rate": 0.00024634261407378795, "loss": 0.0189, "step": 138000 }, { "epoch": 0.36, "eval_cer": 0.8817936627238894, "eval_loss": 0.014577467925846577, "eval_runtime": 107.3326, "eval_samples_per_second": 18.634, "eval_steps_per_second": 4.658, "step": 138000 }, { "epoch": 0.36, "learning_rate": 0.00024633872585741646, "loss": 0.0155, "step": 138010 }, { "epoch": 0.36, "learning_rate": 0.00024633483764104503, "loss": 0.0157, "step": 138020 }, { "epoch": 0.36, "learning_rate": 0.0002463309494246736, "loss": 0.0175, "step": 138030 }, { "epoch": 0.36, "learning_rate": 0.0002463270612083021, "loss": 0.0184, "step": 138040 }, { "epoch": 0.36, "learning_rate": 0.00024632317299193063, "loss": 0.0183, "step": 138050 }, { "epoch": 0.36, "learning_rate": 0.00024631928477555914, "loss": 0.024, "step": 138060 }, { "epoch": 0.36, "learning_rate": 0.0002463153965591877, "loss": 0.0215, "step": 138070 }, { "epoch": 0.36, "learning_rate": 0.0002463115083428162, "loss": 0.0188, "step": 138080 }, { "epoch": 0.36, "learning_rate": 0.0002463076201264448, "loss": 0.0207, "step": 138090 }, { "epoch": 0.36, "learning_rate": 0.0002463037319100733, "loss": 0.0168, "step": 138100 }, { "epoch": 0.36, "learning_rate": 0.0002462998436937019, "loss": 0.0191, "step": 138110 }, { "epoch": 0.36, "learning_rate": 0.0002462959554773304, "loss": 0.0234, "step": 138120 }, { "epoch": 0.36, "learning_rate": 0.0002462920672609589, "loss": 0.0177, "step": 138130 }, { "epoch": 0.36, "learning_rate": 0.0002462881790445874, "loss": 0.0203, "step": 138140 }, { "epoch": 0.36, "learning_rate": 0.000246284290828216, "loss": 0.0191, "step": 138150 }, { "epoch": 0.36, "learning_rate": 0.0002462804026118445, "loss": 0.0174, "step": 138160 }, { "epoch": 0.36, "learning_rate": 0.0002462765143954731, "loss": 0.0203, "step": 138170 }, { "epoch": 0.36, "learning_rate": 0.0002462726261791016, "loss": 0.0222, "step": 138180 }, { "epoch": 0.36, "learning_rate": 0.00024626873796273016, "loss": 0.0224, "step": 138190 }, { "epoch": 0.36, "learning_rate": 0.00024626484974635867, "loss": 0.0207, "step": 138200 }, { "epoch": 0.36, "learning_rate": 0.0002462609615299872, "loss": 0.0205, "step": 138210 }, { "epoch": 0.36, "learning_rate": 0.0002462570733136157, "loss": 0.023, "step": 138220 }, { "epoch": 0.36, "learning_rate": 0.00024625318509724427, "loss": 0.0208, "step": 138230 }, { "epoch": 0.36, "learning_rate": 0.00024624929688087284, "loss": 0.0171, "step": 138240 }, { "epoch": 0.36, "learning_rate": 0.00024624540866450135, "loss": 0.0177, "step": 138250 }, { "epoch": 0.36, "learning_rate": 0.00024624152044812987, "loss": 0.0193, "step": 138260 }, { "epoch": 0.36, "learning_rate": 0.0002462376322317584, "loss": 0.021, "step": 138270 }, { "epoch": 0.36, "learning_rate": 0.00024623374401538695, "loss": 0.0188, "step": 138280 }, { "epoch": 0.36, "learning_rate": 0.00024622985579901546, "loss": 0.018, "step": 138290 }, { "epoch": 0.36, "learning_rate": 0.00024622596758264403, "loss": 0.0179, "step": 138300 }, { "epoch": 0.36, "learning_rate": 0.00024622207936627255, "loss": 0.0161, "step": 138310 }, { "epoch": 0.36, "learning_rate": 0.0002462181911499011, "loss": 0.0168, "step": 138320 }, { "epoch": 0.36, "learning_rate": 0.00024621430293352963, "loss": 0.0221, "step": 138330 }, { "epoch": 0.36, "learning_rate": 0.00024621041471715815, "loss": 0.0214, "step": 138340 }, { "epoch": 0.36, "learning_rate": 0.00024620652650078666, "loss": 0.0206, "step": 138350 }, { "epoch": 0.36, "learning_rate": 0.00024620263828441523, "loss": 0.0243, "step": 138360 }, { "epoch": 0.36, "learning_rate": 0.00024619875006804374, "loss": 0.02, "step": 138370 }, { "epoch": 0.36, "learning_rate": 0.0002461948618516723, "loss": 0.0298, "step": 138380 }, { "epoch": 0.36, "learning_rate": 0.00024619097363530083, "loss": 0.0176, "step": 138390 }, { "epoch": 0.36, "learning_rate": 0.0002461870854189294, "loss": 0.023, "step": 138400 }, { "epoch": 0.36, "learning_rate": 0.0002461831972025579, "loss": 0.0194, "step": 138410 }, { "epoch": 0.36, "learning_rate": 0.0002461793089861864, "loss": 0.0203, "step": 138420 }, { "epoch": 0.36, "learning_rate": 0.000246175420769815, "loss": 0.022, "step": 138430 }, { "epoch": 0.36, "learning_rate": 0.0002461715325534435, "loss": 0.0217, "step": 138440 }, { "epoch": 0.36, "learning_rate": 0.0002461676443370721, "loss": 0.031, "step": 138450 }, { "epoch": 0.36, "learning_rate": 0.0002461637561207006, "loss": 0.0164, "step": 138460 }, { "epoch": 0.36, "learning_rate": 0.0002461598679043291, "loss": 0.0178, "step": 138470 }, { "epoch": 0.36, "learning_rate": 0.0002461559796879576, "loss": 0.0205, "step": 138480 }, { "epoch": 0.36, "learning_rate": 0.0002461520914715862, "loss": 0.0215, "step": 138490 }, { "epoch": 0.36, "learning_rate": 0.0002461482032552147, "loss": 0.0215, "step": 138500 }, { "epoch": 0.36, "learning_rate": 0.00024614431503884327, "loss": 0.0217, "step": 138510 }, { "epoch": 0.36, "learning_rate": 0.0002461404268224718, "loss": 0.0188, "step": 138520 }, { "epoch": 0.36, "learning_rate": 0.00024613653860610036, "loss": 0.019, "step": 138530 }, { "epoch": 0.36, "learning_rate": 0.00024613265038972887, "loss": 0.0221, "step": 138540 }, { "epoch": 0.36, "learning_rate": 0.0002461287621733574, "loss": 0.0185, "step": 138550 }, { "epoch": 0.36, "learning_rate": 0.0002461248739569859, "loss": 0.0198, "step": 138560 }, { "epoch": 0.36, "learning_rate": 0.00024612098574061447, "loss": 0.0182, "step": 138570 }, { "epoch": 0.36, "learning_rate": 0.00024611709752424304, "loss": 0.0183, "step": 138580 }, { "epoch": 0.36, "learning_rate": 0.00024611320930787155, "loss": 0.0171, "step": 138590 }, { "epoch": 0.36, "learning_rate": 0.00024610932109150007, "loss": 0.0191, "step": 138600 }, { "epoch": 0.36, "learning_rate": 0.00024610543287512863, "loss": 0.0189, "step": 138610 }, { "epoch": 0.36, "learning_rate": 0.00024610154465875715, "loss": 0.023, "step": 138620 }, { "epoch": 0.36, "learning_rate": 0.00024609765644238566, "loss": 0.0185, "step": 138630 }, { "epoch": 0.36, "learning_rate": 0.00024609376822601423, "loss": 0.0194, "step": 138640 }, { "epoch": 0.36, "learning_rate": 0.00024608988000964275, "loss": 0.0241, "step": 138650 }, { "epoch": 0.36, "learning_rate": 0.0002460859917932713, "loss": 0.0221, "step": 138660 }, { "epoch": 0.36, "learning_rate": 0.00024608210357689983, "loss": 0.018, "step": 138670 }, { "epoch": 0.36, "learning_rate": 0.00024607821536052834, "loss": 0.028, "step": 138680 }, { "epoch": 0.36, "learning_rate": 0.0002460743271441569, "loss": 0.0193, "step": 138690 }, { "epoch": 0.36, "learning_rate": 0.00024607043892778543, "loss": 0.0266, "step": 138700 }, { "epoch": 0.36, "learning_rate": 0.00024606655071141394, "loss": 0.0242, "step": 138710 }, { "epoch": 0.36, "learning_rate": 0.0002460626624950425, "loss": 0.0157, "step": 138720 }, { "epoch": 0.36, "learning_rate": 0.000246058774278671, "loss": 0.0176, "step": 138730 }, { "epoch": 0.36, "learning_rate": 0.0002460548860622996, "loss": 0.0213, "step": 138740 }, { "epoch": 0.36, "learning_rate": 0.0002460509978459281, "loss": 0.0162, "step": 138750 }, { "epoch": 0.36, "learning_rate": 0.0002460471096295566, "loss": 0.0228, "step": 138760 }, { "epoch": 0.36, "learning_rate": 0.00024604322141318514, "loss": 0.0207, "step": 138770 }, { "epoch": 0.36, "learning_rate": 0.0002460393331968137, "loss": 0.0213, "step": 138780 }, { "epoch": 0.36, "learning_rate": 0.0002460354449804423, "loss": 0.02, "step": 138790 }, { "epoch": 0.36, "learning_rate": 0.0002460315567640708, "loss": 0.0229, "step": 138800 }, { "epoch": 0.36, "learning_rate": 0.0002460276685476993, "loss": 0.0216, "step": 138810 }, { "epoch": 0.36, "learning_rate": 0.0002460237803313279, "loss": 0.0185, "step": 138820 }, { "epoch": 0.36, "learning_rate": 0.0002460198921149564, "loss": 0.0204, "step": 138830 }, { "epoch": 0.36, "learning_rate": 0.0002460160038985849, "loss": 0.0205, "step": 138840 }, { "epoch": 0.36, "learning_rate": 0.00024601211568221347, "loss": 0.0166, "step": 138850 }, { "epoch": 0.36, "learning_rate": 0.000246008227465842, "loss": 0.0198, "step": 138860 }, { "epoch": 0.36, "learning_rate": 0.00024600433924947055, "loss": 0.0206, "step": 138870 }, { "epoch": 0.36, "learning_rate": 0.00024600045103309907, "loss": 0.0175, "step": 138880 }, { "epoch": 0.36, "learning_rate": 0.0002459965628167276, "loss": 0.0219, "step": 138890 }, { "epoch": 0.36, "learning_rate": 0.00024599267460035615, "loss": 0.018, "step": 138900 }, { "epoch": 0.36, "learning_rate": 0.00024598878638398467, "loss": 0.0213, "step": 138910 }, { "epoch": 0.36, "learning_rate": 0.00024598489816761324, "loss": 0.0194, "step": 138920 }, { "epoch": 0.36, "learning_rate": 0.00024598100995124175, "loss": 0.0229, "step": 138930 }, { "epoch": 0.36, "learning_rate": 0.00024597712173487026, "loss": 0.0224, "step": 138940 }, { "epoch": 0.36, "learning_rate": 0.00024597323351849883, "loss": 0.0201, "step": 138950 }, { "epoch": 0.36, "learning_rate": 0.00024596934530212735, "loss": 0.0205, "step": 138960 }, { "epoch": 0.36, "learning_rate": 0.00024596545708575586, "loss": 0.0233, "step": 138970 }, { "epoch": 0.36, "learning_rate": 0.00024596156886938443, "loss": 0.0196, "step": 138980 }, { "epoch": 0.36, "learning_rate": 0.00024595768065301295, "loss": 0.022, "step": 138990 }, { "epoch": 0.36, "learning_rate": 0.0002459537924366415, "loss": 0.026, "step": 139000 }, { "epoch": 0.36, "eval_cer": 0.8817642703482717, "eval_loss": 0.013596959412097931, "eval_runtime": 107.3644, "eval_samples_per_second": 18.628, "eval_steps_per_second": 4.657, "step": 139000 }, { "epoch": 0.36, "learning_rate": 0.00024594990422027003, "loss": 0.017, "step": 139010 }, { "epoch": 0.36, "learning_rate": 0.00024594601600389854, "loss": 0.0219, "step": 139020 }, { "epoch": 0.36, "learning_rate": 0.0002459421277875271, "loss": 0.0151, "step": 139030 }, { "epoch": 0.36, "learning_rate": 0.0002459382395711556, "loss": 0.0265, "step": 139040 }, { "epoch": 0.36, "learning_rate": 0.00024593435135478414, "loss": 0.0203, "step": 139050 }, { "epoch": 0.36, "learning_rate": 0.0002459304631384127, "loss": 0.0248, "step": 139060 }, { "epoch": 0.36, "learning_rate": 0.0002459265749220413, "loss": 0.0183, "step": 139070 }, { "epoch": 0.36, "learning_rate": 0.0002459226867056698, "loss": 0.0164, "step": 139080 }, { "epoch": 0.36, "learning_rate": 0.0002459187984892983, "loss": 0.0196, "step": 139090 }, { "epoch": 0.36, "learning_rate": 0.0002459149102729268, "loss": 0.0211, "step": 139100 }, { "epoch": 0.36, "learning_rate": 0.0002459110220565554, "loss": 0.0167, "step": 139110 }, { "epoch": 0.36, "learning_rate": 0.0002459071338401839, "loss": 0.0239, "step": 139120 }, { "epoch": 0.36, "learning_rate": 0.0002459032456238125, "loss": 0.0185, "step": 139130 }, { "epoch": 0.36, "learning_rate": 0.000245899357407441, "loss": 0.0204, "step": 139140 }, { "epoch": 0.36, "learning_rate": 0.00024589546919106956, "loss": 0.0242, "step": 139150 }, { "epoch": 0.36, "learning_rate": 0.00024589158097469807, "loss": 0.0273, "step": 139160 }, { "epoch": 0.36, "learning_rate": 0.0002458876927583266, "loss": 0.0193, "step": 139170 }, { "epoch": 0.36, "learning_rate": 0.0002458838045419551, "loss": 0.021, "step": 139180 }, { "epoch": 0.36, "learning_rate": 0.00024587991632558367, "loss": 0.0202, "step": 139190 }, { "epoch": 0.36, "learning_rate": 0.0002458760281092122, "loss": 0.0179, "step": 139200 }, { "epoch": 0.36, "learning_rate": 0.00024587213989284075, "loss": 0.0233, "step": 139210 }, { "epoch": 0.36, "learning_rate": 0.00024586825167646927, "loss": 0.0301, "step": 139220 }, { "epoch": 0.36, "learning_rate": 0.0002458643634600978, "loss": 0.0205, "step": 139230 }, { "epoch": 0.36, "learning_rate": 0.00024586047524372635, "loss": 0.0237, "step": 139240 }, { "epoch": 0.36, "learning_rate": 0.00024585658702735487, "loss": 0.0197, "step": 139250 }, { "epoch": 0.36, "learning_rate": 0.0002458526988109834, "loss": 0.0218, "step": 139260 }, { "epoch": 0.36, "learning_rate": 0.00024584881059461195, "loss": 0.0204, "step": 139270 }, { "epoch": 0.36, "learning_rate": 0.0002458449223782405, "loss": 0.0206, "step": 139280 }, { "epoch": 0.36, "learning_rate": 0.00024584103416186903, "loss": 0.0246, "step": 139290 }, { "epoch": 0.36, "learning_rate": 0.00024583714594549755, "loss": 0.0168, "step": 139300 }, { "epoch": 0.36, "learning_rate": 0.00024583325772912606, "loss": 0.0215, "step": 139310 }, { "epoch": 0.36, "learning_rate": 0.00024582936951275463, "loss": 0.0187, "step": 139320 }, { "epoch": 0.36, "learning_rate": 0.00024582548129638314, "loss": 0.0196, "step": 139330 }, { "epoch": 0.36, "learning_rate": 0.0002458215930800117, "loss": 0.0218, "step": 139340 }, { "epoch": 0.36, "learning_rate": 0.00024581770486364023, "loss": 0.0234, "step": 139350 }, { "epoch": 0.36, "learning_rate": 0.0002458138166472688, "loss": 0.017, "step": 139360 }, { "epoch": 0.36, "learning_rate": 0.0002458099284308973, "loss": 0.0214, "step": 139370 }, { "epoch": 0.36, "learning_rate": 0.0002458060402145258, "loss": 0.0184, "step": 139380 }, { "epoch": 0.36, "learning_rate": 0.00024580215199815434, "loss": 0.016, "step": 139390 }, { "epoch": 0.36, "learning_rate": 0.0002457982637817829, "loss": 0.0262, "step": 139400 }, { "epoch": 0.36, "learning_rate": 0.0002457943755654114, "loss": 0.0203, "step": 139410 }, { "epoch": 0.36, "learning_rate": 0.00024579048734904, "loss": 0.0191, "step": 139420 }, { "epoch": 0.36, "learning_rate": 0.0002457865991326685, "loss": 0.0213, "step": 139430 }, { "epoch": 0.36, "learning_rate": 0.000245782710916297, "loss": 0.0208, "step": 139440 }, { "epoch": 0.36, "learning_rate": 0.0002457788226999256, "loss": 0.0186, "step": 139450 }, { "epoch": 0.36, "learning_rate": 0.0002457749344835541, "loss": 0.0195, "step": 139460 }, { "epoch": 0.36, "learning_rate": 0.0002457710462671827, "loss": 0.0201, "step": 139470 }, { "epoch": 0.36, "learning_rate": 0.0002457671580508112, "loss": 0.0204, "step": 139480 }, { "epoch": 0.36, "learning_rate": 0.00024576326983443976, "loss": 0.019, "step": 139490 }, { "epoch": 0.36, "learning_rate": 0.00024575938161806827, "loss": 0.0231, "step": 139500 }, { "epoch": 0.36, "learning_rate": 0.0002457554934016968, "loss": 0.0213, "step": 139510 }, { "epoch": 0.36, "learning_rate": 0.0002457516051853253, "loss": 0.027, "step": 139520 }, { "epoch": 0.36, "learning_rate": 0.00024574771696895387, "loss": 0.0179, "step": 139530 }, { "epoch": 0.36, "learning_rate": 0.0002457438287525824, "loss": 0.0165, "step": 139540 }, { "epoch": 0.36, "learning_rate": 0.00024573994053621095, "loss": 0.0219, "step": 139550 }, { "epoch": 0.36, "learning_rate": 0.00024573605231983947, "loss": 0.0288, "step": 139560 }, { "epoch": 0.36, "learning_rate": 0.00024573216410346804, "loss": 0.0222, "step": 139570 }, { "epoch": 0.36, "learning_rate": 0.00024572827588709655, "loss": 0.0198, "step": 139580 }, { "epoch": 0.36, "learning_rate": 0.00024572438767072506, "loss": 0.027, "step": 139590 }, { "epoch": 0.36, "learning_rate": 0.0002457204994543536, "loss": 0.0204, "step": 139600 }, { "epoch": 0.36, "learning_rate": 0.00024571661123798215, "loss": 0.0223, "step": 139610 }, { "epoch": 0.36, "learning_rate": 0.0002457127230216107, "loss": 0.0211, "step": 139620 }, { "epoch": 0.36, "learning_rate": 0.00024570883480523923, "loss": 0.0189, "step": 139630 }, { "epoch": 0.36, "learning_rate": 0.00024570494658886775, "loss": 0.024, "step": 139640 }, { "epoch": 0.36, "learning_rate": 0.0002457010583724963, "loss": 0.0231, "step": 139650 }, { "epoch": 0.36, "learning_rate": 0.00024569717015612483, "loss": 0.0195, "step": 139660 }, { "epoch": 0.36, "learning_rate": 0.00024569328193975334, "loss": 0.0296, "step": 139670 }, { "epoch": 0.36, "learning_rate": 0.0002456893937233819, "loss": 0.018, "step": 139680 }, { "epoch": 0.36, "learning_rate": 0.0002456855055070104, "loss": 0.0211, "step": 139690 }, { "epoch": 0.36, "learning_rate": 0.000245681617290639, "loss": 0.0206, "step": 139700 }, { "epoch": 0.36, "learning_rate": 0.0002456777290742675, "loss": 0.0192, "step": 139710 }, { "epoch": 0.36, "learning_rate": 0.000245673840857896, "loss": 0.0212, "step": 139720 }, { "epoch": 0.36, "learning_rate": 0.00024566995264152454, "loss": 0.0192, "step": 139730 }, { "epoch": 0.36, "learning_rate": 0.0002456660644251531, "loss": 0.0259, "step": 139740 }, { "epoch": 0.36, "learning_rate": 0.0002456621762087816, "loss": 0.0363, "step": 139750 }, { "epoch": 0.36, "learning_rate": 0.0002456582879924102, "loss": 0.0213, "step": 139760 }, { "epoch": 0.36, "learning_rate": 0.0002456543997760387, "loss": 0.018, "step": 139770 }, { "epoch": 0.36, "learning_rate": 0.0002456505115596673, "loss": 0.0209, "step": 139780 }, { "epoch": 0.36, "learning_rate": 0.0002456466233432958, "loss": 0.021, "step": 139790 }, { "epoch": 0.36, "learning_rate": 0.0002456427351269243, "loss": 0.0205, "step": 139800 }, { "epoch": 0.36, "learning_rate": 0.0002456388469105528, "loss": 0.0195, "step": 139810 }, { "epoch": 0.36, "learning_rate": 0.0002456349586941814, "loss": 0.0216, "step": 139820 }, { "epoch": 0.36, "learning_rate": 0.00024563107047780996, "loss": 0.0244, "step": 139830 }, { "epoch": 0.36, "learning_rate": 0.00024562718226143847, "loss": 0.0234, "step": 139840 }, { "epoch": 0.36, "learning_rate": 0.000245623294045067, "loss": 0.0223, "step": 139850 }, { "epoch": 0.36, "learning_rate": 0.00024561940582869555, "loss": 0.0237, "step": 139860 }, { "epoch": 0.36, "learning_rate": 0.00024561551761232407, "loss": 0.0231, "step": 139870 }, { "epoch": 0.36, "learning_rate": 0.0002456116293959526, "loss": 0.0214, "step": 139880 }, { "epoch": 0.36, "learning_rate": 0.00024560774117958115, "loss": 0.0239, "step": 139890 }, { "epoch": 0.36, "learning_rate": 0.00024560385296320967, "loss": 0.0211, "step": 139900 }, { "epoch": 0.36, "learning_rate": 0.00024559996474683823, "loss": 0.018, "step": 139910 }, { "epoch": 0.36, "learning_rate": 0.00024559607653046675, "loss": 0.0256, "step": 139920 }, { "epoch": 0.36, "learning_rate": 0.00024559218831409526, "loss": 0.0214, "step": 139930 }, { "epoch": 0.36, "learning_rate": 0.0002455883000977238, "loss": 0.0214, "step": 139940 }, { "epoch": 0.36, "learning_rate": 0.00024558441188135235, "loss": 0.0225, "step": 139950 }, { "epoch": 0.36, "learning_rate": 0.00024558052366498086, "loss": 0.0226, "step": 139960 }, { "epoch": 0.36, "learning_rate": 0.00024557663544860943, "loss": 0.0175, "step": 139970 }, { "epoch": 0.36, "learning_rate": 0.00024557274723223794, "loss": 0.0215, "step": 139980 }, { "epoch": 0.36, "learning_rate": 0.0002455688590158665, "loss": 0.0247, "step": 139990 }, { "epoch": 0.36, "learning_rate": 0.00024556497079949503, "loss": 0.016, "step": 140000 }, { "epoch": 0.36, "eval_cer": 0.8817992612716261, "eval_loss": 0.013859533704817295, "eval_runtime": 107.2731, "eval_samples_per_second": 18.644, "eval_steps_per_second": 4.661, "step": 140000 }, { "epoch": 0.36, "learning_rate": 0.00024556108258312354, "loss": 0.0173, "step": 140010 }, { "epoch": 0.36, "learning_rate": 0.0002455571943667521, "loss": 0.0205, "step": 140020 }, { "epoch": 0.36, "learning_rate": 0.0002455533061503806, "loss": 0.0218, "step": 140030 }, { "epoch": 0.36, "learning_rate": 0.0002455494179340092, "loss": 0.018, "step": 140040 }, { "epoch": 0.36, "learning_rate": 0.0002455455297176377, "loss": 0.0199, "step": 140050 }, { "epoch": 0.36, "learning_rate": 0.0002455416415012662, "loss": 0.0196, "step": 140060 }, { "epoch": 0.36, "learning_rate": 0.0002455377532848948, "loss": 0.0162, "step": 140070 }, { "epoch": 0.36, "learning_rate": 0.0002455338650685233, "loss": 0.0223, "step": 140080 }, { "epoch": 0.36, "learning_rate": 0.0002455299768521518, "loss": 0.0172, "step": 140090 }, { "epoch": 0.36, "learning_rate": 0.0002455260886357804, "loss": 0.0185, "step": 140100 }, { "epoch": 0.36, "learning_rate": 0.00024552220041940896, "loss": 0.018, "step": 140110 }, { "epoch": 0.36, "learning_rate": 0.0002455183122030375, "loss": 0.019, "step": 140120 }, { "epoch": 0.36, "learning_rate": 0.000245514423986666, "loss": 0.0161, "step": 140130 }, { "epoch": 0.36, "learning_rate": 0.0002455105357702945, "loss": 0.0226, "step": 140140 }, { "epoch": 0.36, "learning_rate": 0.00024550664755392307, "loss": 0.0178, "step": 140150 }, { "epoch": 0.36, "learning_rate": 0.0002455027593375516, "loss": 0.0188, "step": 140160 }, { "epoch": 0.36, "learning_rate": 0.00024549887112118015, "loss": 0.0174, "step": 140170 }, { "epoch": 0.36, "learning_rate": 0.00024549498290480867, "loss": 0.0196, "step": 140180 }, { "epoch": 0.36, "learning_rate": 0.0002454910946884372, "loss": 0.0207, "step": 140190 }, { "epoch": 0.36, "learning_rate": 0.00024548720647206575, "loss": 0.0201, "step": 140200 }, { "epoch": 0.36, "learning_rate": 0.00024548331825569427, "loss": 0.0195, "step": 140210 }, { "epoch": 0.36, "learning_rate": 0.0002454794300393228, "loss": 0.0189, "step": 140220 }, { "epoch": 0.36, "learning_rate": 0.00024547554182295135, "loss": 0.0199, "step": 140230 }, { "epoch": 0.36, "learning_rate": 0.00024547165360657986, "loss": 0.0207, "step": 140240 }, { "epoch": 0.36, "learning_rate": 0.00024546776539020843, "loss": 0.0187, "step": 140250 }, { "epoch": 0.36, "learning_rate": 0.00024546387717383695, "loss": 0.0181, "step": 140260 }, { "epoch": 0.36, "learning_rate": 0.00024545998895746546, "loss": 0.0164, "step": 140270 }, { "epoch": 0.36, "learning_rate": 0.00024545610074109403, "loss": 0.0199, "step": 140280 }, { "epoch": 0.36, "learning_rate": 0.00024545221252472255, "loss": 0.0232, "step": 140290 }, { "epoch": 0.36, "learning_rate": 0.00024544832430835106, "loss": 0.0234, "step": 140300 }, { "epoch": 0.36, "learning_rate": 0.00024544443609197963, "loss": 0.0203, "step": 140310 }, { "epoch": 0.36, "learning_rate": 0.0002454405478756082, "loss": 0.0219, "step": 140320 }, { "epoch": 0.36, "learning_rate": 0.0002454366596592367, "loss": 0.0212, "step": 140330 }, { "epoch": 0.36, "learning_rate": 0.0002454327714428652, "loss": 0.0219, "step": 140340 }, { "epoch": 0.36, "learning_rate": 0.00024542888322649374, "loss": 0.0204, "step": 140350 }, { "epoch": 0.36, "learning_rate": 0.0002454249950101223, "loss": 0.0142, "step": 140360 }, { "epoch": 0.36, "learning_rate": 0.0002454211067937508, "loss": 0.0163, "step": 140370 }, { "epoch": 0.36, "learning_rate": 0.0002454172185773794, "loss": 0.0213, "step": 140380 }, { "epoch": 0.36, "learning_rate": 0.0002454133303610079, "loss": 0.018, "step": 140390 }, { "epoch": 0.36, "learning_rate": 0.0002454094421446365, "loss": 0.022, "step": 140400 }, { "epoch": 0.36, "learning_rate": 0.000245405553928265, "loss": 0.021, "step": 140410 }, { "epoch": 0.36, "learning_rate": 0.0002454016657118935, "loss": 0.015, "step": 140420 }, { "epoch": 0.36, "learning_rate": 0.000245397777495522, "loss": 0.0184, "step": 140430 }, { "epoch": 0.36, "learning_rate": 0.0002453938892791506, "loss": 0.0213, "step": 140440 }, { "epoch": 0.36, "learning_rate": 0.0002453900010627791, "loss": 0.016, "step": 140450 }, { "epoch": 0.36, "learning_rate": 0.00024538611284640767, "loss": 0.0191, "step": 140460 }, { "epoch": 0.36, "learning_rate": 0.0002453822246300362, "loss": 0.0165, "step": 140470 }, { "epoch": 0.36, "learning_rate": 0.0002453783364136647, "loss": 0.0198, "step": 140480 }, { "epoch": 0.36, "learning_rate": 0.00024537444819729327, "loss": 0.0172, "step": 140490 }, { "epoch": 0.36, "learning_rate": 0.0002453705599809218, "loss": 0.0207, "step": 140500 }, { "epoch": 0.36, "learning_rate": 0.00024536667176455035, "loss": 0.0188, "step": 140510 }, { "epoch": 0.36, "learning_rate": 0.00024536278354817887, "loss": 0.02, "step": 140520 }, { "epoch": 0.36, "learning_rate": 0.00024535889533180744, "loss": 0.0195, "step": 140530 }, { "epoch": 0.36, "learning_rate": 0.00024535500711543595, "loss": 0.0181, "step": 140540 }, { "epoch": 0.36, "learning_rate": 0.00024535111889906447, "loss": 0.0151, "step": 140550 }, { "epoch": 0.36, "learning_rate": 0.000245347230682693, "loss": 0.0159, "step": 140560 }, { "epoch": 0.36, "learning_rate": 0.00024534334246632155, "loss": 0.0195, "step": 140570 }, { "epoch": 0.36, "learning_rate": 0.00024533945424995006, "loss": 0.0189, "step": 140580 }, { "epoch": 0.36, "learning_rate": 0.00024533556603357863, "loss": 0.0239, "step": 140590 }, { "epoch": 0.36, "learning_rate": 0.00024533167781720715, "loss": 0.0194, "step": 140600 }, { "epoch": 0.36, "learning_rate": 0.0002453277896008357, "loss": 0.0218, "step": 140610 }, { "epoch": 0.36, "learning_rate": 0.00024532390138446423, "loss": 0.0195, "step": 140620 }, { "epoch": 0.36, "learning_rate": 0.00024532001316809274, "loss": 0.0216, "step": 140630 }, { "epoch": 0.36, "learning_rate": 0.00024531612495172126, "loss": 0.0172, "step": 140640 }, { "epoch": 0.36, "learning_rate": 0.00024531223673534983, "loss": 0.0194, "step": 140650 }, { "epoch": 0.36, "learning_rate": 0.0002453083485189784, "loss": 0.0193, "step": 140660 }, { "epoch": 0.36, "learning_rate": 0.0002453044603026069, "loss": 0.0199, "step": 140670 }, { "epoch": 0.36, "learning_rate": 0.0002453005720862354, "loss": 0.0194, "step": 140680 }, { "epoch": 0.36, "learning_rate": 0.00024529668386986394, "loss": 0.0172, "step": 140690 }, { "epoch": 0.36, "learning_rate": 0.0002452927956534925, "loss": 0.0183, "step": 140700 }, { "epoch": 0.36, "learning_rate": 0.000245288907437121, "loss": 0.022, "step": 140710 }, { "epoch": 0.36, "learning_rate": 0.0002452850192207496, "loss": 0.0168, "step": 140720 }, { "epoch": 0.36, "learning_rate": 0.0002452811310043781, "loss": 0.0171, "step": 140730 }, { "epoch": 0.36, "learning_rate": 0.0002452772427880067, "loss": 0.0241, "step": 140740 }, { "epoch": 0.36, "learning_rate": 0.0002452733545716352, "loss": 0.0196, "step": 140750 }, { "epoch": 0.36, "learning_rate": 0.0002452694663552637, "loss": 0.0224, "step": 140760 }, { "epoch": 0.36, "learning_rate": 0.0002452655781388922, "loss": 0.0205, "step": 140770 }, { "epoch": 0.36, "learning_rate": 0.0002452616899225208, "loss": 0.0209, "step": 140780 }, { "epoch": 0.36, "learning_rate": 0.0002452578017061493, "loss": 0.0185, "step": 140790 }, { "epoch": 0.36, "learning_rate": 0.00024525391348977787, "loss": 0.0212, "step": 140800 }, { "epoch": 0.36, "learning_rate": 0.0002452500252734064, "loss": 0.02, "step": 140810 }, { "epoch": 0.37, "learning_rate": 0.00024524613705703495, "loss": 0.0236, "step": 140820 }, { "epoch": 0.37, "learning_rate": 0.00024524224884066347, "loss": 0.0196, "step": 140830 }, { "epoch": 0.37, "learning_rate": 0.000245238360624292, "loss": 0.0249, "step": 140840 }, { "epoch": 0.37, "learning_rate": 0.0002452344724079205, "loss": 0.0203, "step": 140850 }, { "epoch": 0.37, "learning_rate": 0.00024523058419154907, "loss": 0.0232, "step": 140860 }, { "epoch": 0.37, "learning_rate": 0.00024522669597517764, "loss": 0.0229, "step": 140870 }, { "epoch": 0.37, "learning_rate": 0.00024522280775880615, "loss": 0.024, "step": 140880 }, { "epoch": 0.37, "learning_rate": 0.00024521891954243466, "loss": 0.0189, "step": 140890 }, { "epoch": 0.37, "learning_rate": 0.00024521503132606323, "loss": 0.0198, "step": 140900 }, { "epoch": 0.37, "learning_rate": 0.00024521114310969175, "loss": 0.0157, "step": 140910 }, { "epoch": 0.37, "learning_rate": 0.00024520725489332026, "loss": 0.0219, "step": 140920 }, { "epoch": 0.37, "learning_rate": 0.00024520336667694883, "loss": 0.0207, "step": 140930 }, { "epoch": 0.37, "learning_rate": 0.00024519947846057735, "loss": 0.0223, "step": 140940 }, { "epoch": 0.37, "learning_rate": 0.0002451955902442059, "loss": 0.0213, "step": 140950 }, { "epoch": 0.37, "learning_rate": 0.00024519170202783443, "loss": 0.0233, "step": 140960 }, { "epoch": 0.37, "learning_rate": 0.00024518781381146294, "loss": 0.0178, "step": 140970 }, { "epoch": 0.37, "learning_rate": 0.00024518392559509146, "loss": 0.0178, "step": 140980 }, { "epoch": 0.37, "learning_rate": 0.00024518003737872, "loss": 0.0191, "step": 140990 }, { "epoch": 0.37, "learning_rate": 0.00024517614916234854, "loss": 0.021, "step": 141000 }, { "epoch": 0.37, "eval_cer": 0.881751673615864, "eval_loss": 0.013707040809094906, "eval_runtime": 107.3675, "eval_samples_per_second": 18.628, "eval_steps_per_second": 4.657, "step": 141000 }, { "epoch": 0.37, "learning_rate": 0.0002451722609459771, "loss": 0.02, "step": 141010 }, { "epoch": 0.37, "learning_rate": 0.0002451683727296056, "loss": 0.025, "step": 141020 }, { "epoch": 0.37, "learning_rate": 0.0002451644845132342, "loss": 0.0184, "step": 141030 }, { "epoch": 0.37, "learning_rate": 0.0002451605962968627, "loss": 0.0201, "step": 141040 }, { "epoch": 0.37, "learning_rate": 0.0002451567080804912, "loss": 0.0246, "step": 141050 }, { "epoch": 0.37, "learning_rate": 0.0002451528198641198, "loss": 0.0242, "step": 141060 }, { "epoch": 0.37, "learning_rate": 0.0002451489316477483, "loss": 0.0196, "step": 141070 }, { "epoch": 0.37, "learning_rate": 0.0002451450434313769, "loss": 0.0184, "step": 141080 }, { "epoch": 0.37, "learning_rate": 0.0002451411552150054, "loss": 0.0204, "step": 141090 }, { "epoch": 0.37, "learning_rate": 0.0002451372669986339, "loss": 0.0174, "step": 141100 }, { "epoch": 0.37, "learning_rate": 0.00024513337878226247, "loss": 0.0163, "step": 141110 }, { "epoch": 0.37, "learning_rate": 0.000245129490565891, "loss": 0.025, "step": 141120 }, { "epoch": 0.37, "learning_rate": 0.0002451256023495195, "loss": 0.0191, "step": 141130 }, { "epoch": 0.37, "learning_rate": 0.00024512171413314807, "loss": 0.022, "step": 141140 }, { "epoch": 0.37, "learning_rate": 0.0002451178259167766, "loss": 0.0183, "step": 141150 }, { "epoch": 0.37, "learning_rate": 0.00024511393770040515, "loss": 0.0149, "step": 141160 }, { "epoch": 0.37, "learning_rate": 0.00024511004948403367, "loss": 0.0181, "step": 141170 }, { "epoch": 0.37, "learning_rate": 0.0002451061612676622, "loss": 0.0156, "step": 141180 }, { "epoch": 0.37, "learning_rate": 0.0002451022730512907, "loss": 0.0168, "step": 141190 }, { "epoch": 0.37, "learning_rate": 0.00024509838483491927, "loss": 0.0202, "step": 141200 }, { "epoch": 0.37, "learning_rate": 0.00024509449661854783, "loss": 0.0188, "step": 141210 }, { "epoch": 0.37, "learning_rate": 0.00024509060840217635, "loss": 0.0246, "step": 141220 }, { "epoch": 0.37, "learning_rate": 0.00024508672018580486, "loss": 0.0237, "step": 141230 }, { "epoch": 0.37, "learning_rate": 0.00024508283196943343, "loss": 0.0199, "step": 141240 }, { "epoch": 0.37, "learning_rate": 0.00024507894375306195, "loss": 0.0233, "step": 141250 }, { "epoch": 0.37, "learning_rate": 0.00024507505553669046, "loss": 0.0236, "step": 141260 }, { "epoch": 0.37, "learning_rate": 0.00024507116732031903, "loss": 0.0192, "step": 141270 }, { "epoch": 0.37, "learning_rate": 0.00024506727910394754, "loss": 0.0238, "step": 141280 }, { "epoch": 0.37, "learning_rate": 0.0002450633908875761, "loss": 0.0228, "step": 141290 }, { "epoch": 0.37, "learning_rate": 0.00024505950267120463, "loss": 0.016, "step": 141300 }, { "epoch": 0.37, "learning_rate": 0.00024505561445483314, "loss": 0.0178, "step": 141310 }, { "epoch": 0.37, "learning_rate": 0.0002450517262384617, "loss": 0.0259, "step": 141320 }, { "epoch": 0.37, "learning_rate": 0.0002450478380220902, "loss": 0.0133, "step": 141330 }, { "epoch": 0.37, "learning_rate": 0.00024504394980571874, "loss": 0.0183, "step": 141340 }, { "epoch": 0.37, "learning_rate": 0.0002450400615893473, "loss": 0.0212, "step": 141350 }, { "epoch": 0.37, "learning_rate": 0.0002450361733729759, "loss": 0.0233, "step": 141360 }, { "epoch": 0.37, "learning_rate": 0.0002450322851566044, "loss": 0.0202, "step": 141370 }, { "epoch": 0.37, "learning_rate": 0.0002450283969402329, "loss": 0.017, "step": 141380 }, { "epoch": 0.37, "learning_rate": 0.0002450245087238614, "loss": 0.0219, "step": 141390 }, { "epoch": 0.37, "learning_rate": 0.00024502062050749, "loss": 0.02, "step": 141400 }, { "epoch": 0.37, "learning_rate": 0.0002450167322911185, "loss": 0.0224, "step": 141410 }, { "epoch": 0.37, "learning_rate": 0.0002450128440747471, "loss": 0.0216, "step": 141420 }, { "epoch": 0.37, "learning_rate": 0.0002450089558583756, "loss": 0.0209, "step": 141430 }, { "epoch": 0.37, "learning_rate": 0.0002450050676420041, "loss": 0.0211, "step": 141440 }, { "epoch": 0.37, "learning_rate": 0.00024500117942563267, "loss": 0.0181, "step": 141450 }, { "epoch": 0.37, "learning_rate": 0.0002449972912092612, "loss": 0.0188, "step": 141460 }, { "epoch": 0.37, "learning_rate": 0.0002449934029928897, "loss": 0.0206, "step": 141470 }, { "epoch": 0.37, "learning_rate": 0.00024498951477651827, "loss": 0.0213, "step": 141480 }, { "epoch": 0.37, "learning_rate": 0.0002449856265601468, "loss": 0.02, "step": 141490 }, { "epoch": 0.37, "learning_rate": 0.00024498173834377535, "loss": 0.0202, "step": 141500 }, { "epoch": 0.37, "learning_rate": 0.00024497785012740387, "loss": 0.019, "step": 141510 }, { "epoch": 0.37, "learning_rate": 0.0002449739619110324, "loss": 0.0163, "step": 141520 }, { "epoch": 0.37, "learning_rate": 0.00024497007369466095, "loss": 0.0186, "step": 141530 }, { "epoch": 0.37, "learning_rate": 0.00024496618547828946, "loss": 0.0173, "step": 141540 }, { "epoch": 0.37, "learning_rate": 0.000244962297261918, "loss": 0.0164, "step": 141550 }, { "epoch": 0.37, "learning_rate": 0.00024495840904554655, "loss": 0.0176, "step": 141560 }, { "epoch": 0.37, "learning_rate": 0.0002449545208291751, "loss": 0.0175, "step": 141570 }, { "epoch": 0.37, "learning_rate": 0.00024495063261280363, "loss": 0.0247, "step": 141580 }, { "epoch": 0.37, "learning_rate": 0.00024494674439643215, "loss": 0.017, "step": 141590 }, { "epoch": 0.37, "learning_rate": 0.00024494285618006066, "loss": 0.0213, "step": 141600 }, { "epoch": 0.37, "learning_rate": 0.00024493896796368923, "loss": 0.0205, "step": 141610 }, { "epoch": 0.37, "learning_rate": 0.00024493507974731774, "loss": 0.0171, "step": 141620 }, { "epoch": 0.37, "learning_rate": 0.0002449311915309463, "loss": 0.0189, "step": 141630 }, { "epoch": 0.37, "learning_rate": 0.0002449273033145748, "loss": 0.0221, "step": 141640 }, { "epoch": 0.37, "learning_rate": 0.0002449234150982034, "loss": 0.0195, "step": 141650 }, { "epoch": 0.37, "learning_rate": 0.0002449195268818319, "loss": 0.0194, "step": 141660 }, { "epoch": 0.37, "learning_rate": 0.0002449156386654604, "loss": 0.0206, "step": 141670 }, { "epoch": 0.37, "learning_rate": 0.00024491175044908894, "loss": 0.0195, "step": 141680 }, { "epoch": 0.37, "learning_rate": 0.0002449078622327175, "loss": 0.0246, "step": 141690 }, { "epoch": 0.37, "learning_rate": 0.0002449039740163461, "loss": 0.0185, "step": 141700 }, { "epoch": 0.37, "learning_rate": 0.0002449000857999746, "loss": 0.0226, "step": 141710 }, { "epoch": 0.37, "learning_rate": 0.0002448961975836031, "loss": 0.021, "step": 141720 }, { "epoch": 0.37, "learning_rate": 0.0002448923093672316, "loss": 0.018, "step": 141730 }, { "epoch": 0.37, "learning_rate": 0.0002448884211508602, "loss": 0.0163, "step": 141740 }, { "epoch": 0.37, "learning_rate": 0.0002448845329344887, "loss": 0.0166, "step": 141750 }, { "epoch": 0.37, "learning_rate": 0.00024488064471811727, "loss": 0.0202, "step": 141760 }, { "epoch": 0.37, "learning_rate": 0.0002448767565017458, "loss": 0.0168, "step": 141770 }, { "epoch": 0.37, "learning_rate": 0.00024487286828537436, "loss": 0.0332, "step": 141780 }, { "epoch": 0.37, "learning_rate": 0.00024486898006900287, "loss": 0.0185, "step": 141790 }, { "epoch": 0.37, "learning_rate": 0.0002448650918526314, "loss": 0.0211, "step": 141800 }, { "epoch": 0.37, "learning_rate": 0.0002448612036362599, "loss": 0.0179, "step": 141810 }, { "epoch": 0.37, "learning_rate": 0.00024485731541988847, "loss": 0.0176, "step": 141820 }, { "epoch": 0.37, "learning_rate": 0.000244853427203517, "loss": 0.0204, "step": 141830 }, { "epoch": 0.37, "learning_rate": 0.00024484953898714555, "loss": 0.0216, "step": 141840 }, { "epoch": 0.37, "learning_rate": 0.00024484565077077407, "loss": 0.0211, "step": 141850 }, { "epoch": 0.37, "learning_rate": 0.00024484176255440263, "loss": 0.0224, "step": 141860 }, { "epoch": 0.37, "learning_rate": 0.00024483787433803115, "loss": 0.0162, "step": 141870 }, { "epoch": 0.37, "learning_rate": 0.00024483398612165966, "loss": 0.0216, "step": 141880 }, { "epoch": 0.37, "learning_rate": 0.0002448300979052882, "loss": 0.0207, "step": 141890 }, { "epoch": 0.37, "learning_rate": 0.00024482620968891675, "loss": 0.0189, "step": 141900 }, { "epoch": 0.37, "learning_rate": 0.0002448223214725453, "loss": 0.0212, "step": 141910 }, { "epoch": 0.37, "learning_rate": 0.00024481843325617383, "loss": 0.0225, "step": 141920 }, { "epoch": 0.37, "learning_rate": 0.00024481454503980234, "loss": 0.0201, "step": 141930 }, { "epoch": 0.37, "learning_rate": 0.00024481065682343086, "loss": 0.0171, "step": 141940 }, { "epoch": 0.37, "learning_rate": 0.00024480676860705943, "loss": 0.0159, "step": 141950 }, { "epoch": 0.37, "learning_rate": 0.00024480288039068794, "loss": 0.0184, "step": 141960 }, { "epoch": 0.37, "learning_rate": 0.0002447989921743165, "loss": 0.0179, "step": 141970 }, { "epoch": 0.37, "learning_rate": 0.000244795103957945, "loss": 0.0146, "step": 141980 }, { "epoch": 0.37, "learning_rate": 0.0002447912157415736, "loss": 0.0225, "step": 141990 }, { "epoch": 0.37, "learning_rate": 0.0002447873275252021, "loss": 0.0215, "step": 142000 }, { "epoch": 0.37, "eval_cer": 0.8817838652653501, "eval_loss": 0.013540214858949184, "eval_runtime": 107.2038, "eval_samples_per_second": 18.656, "eval_steps_per_second": 4.664, "step": 142000 }, { "epoch": 0.37, "learning_rate": 0.0002447834393088306, "loss": 0.0176, "step": 142010 }, { "epoch": 0.37, "learning_rate": 0.00024477955109245914, "loss": 0.0222, "step": 142020 }, { "epoch": 0.37, "learning_rate": 0.0002447756628760877, "loss": 0.023, "step": 142030 }, { "epoch": 0.37, "learning_rate": 0.0002447717746597162, "loss": 0.0215, "step": 142040 }, { "epoch": 0.37, "learning_rate": 0.0002447678864433448, "loss": 0.0245, "step": 142050 }, { "epoch": 0.37, "learning_rate": 0.0002447639982269733, "loss": 0.0216, "step": 142060 }, { "epoch": 0.37, "learning_rate": 0.0002447601100106019, "loss": 0.019, "step": 142070 }, { "epoch": 0.37, "learning_rate": 0.0002447562217942304, "loss": 0.0218, "step": 142080 }, { "epoch": 0.37, "learning_rate": 0.0002447523335778589, "loss": 0.032, "step": 142090 }, { "epoch": 0.37, "learning_rate": 0.00024474844536148747, "loss": 0.0201, "step": 142100 }, { "epoch": 0.37, "learning_rate": 0.000244744557145116, "loss": 0.017, "step": 142110 }, { "epoch": 0.37, "learning_rate": 0.00024474066892874455, "loss": 0.0207, "step": 142120 }, { "epoch": 0.37, "learning_rate": 0.00024473678071237307, "loss": 0.0204, "step": 142130 }, { "epoch": 0.37, "learning_rate": 0.0002447328924960016, "loss": 0.0184, "step": 142140 }, { "epoch": 0.37, "learning_rate": 0.00024472900427963015, "loss": 0.0174, "step": 142150 }, { "epoch": 0.37, "learning_rate": 0.00024472511606325867, "loss": 0.0207, "step": 142160 }, { "epoch": 0.37, "learning_rate": 0.0002447212278468872, "loss": 0.0221, "step": 142170 }, { "epoch": 0.37, "learning_rate": 0.00024471733963051575, "loss": 0.0201, "step": 142180 }, { "epoch": 0.37, "learning_rate": 0.00024471345141414426, "loss": 0.0194, "step": 142190 }, { "epoch": 0.37, "learning_rate": 0.00024470956319777283, "loss": 0.0194, "step": 142200 }, { "epoch": 0.37, "learning_rate": 0.00024470567498140135, "loss": 0.018, "step": 142210 }, { "epoch": 0.37, "learning_rate": 0.00024470178676502986, "loss": 0.0162, "step": 142220 }, { "epoch": 0.37, "learning_rate": 0.0002446978985486584, "loss": 0.019, "step": 142230 }, { "epoch": 0.37, "learning_rate": 0.00024469401033228695, "loss": 0.0166, "step": 142240 }, { "epoch": 0.37, "learning_rate": 0.0002446901221159155, "loss": 0.0193, "step": 142250 }, { "epoch": 0.37, "learning_rate": 0.00024468623389954403, "loss": 0.0223, "step": 142260 }, { "epoch": 0.37, "learning_rate": 0.00024468234568317254, "loss": 0.0235, "step": 142270 }, { "epoch": 0.37, "learning_rate": 0.0002446784574668011, "loss": 0.0162, "step": 142280 }, { "epoch": 0.37, "learning_rate": 0.0002446745692504296, "loss": 0.0191, "step": 142290 }, { "epoch": 0.37, "learning_rate": 0.00024467068103405814, "loss": 0.0178, "step": 142300 }, { "epoch": 0.37, "learning_rate": 0.0002446667928176867, "loss": 0.0229, "step": 142310 }, { "epoch": 0.37, "learning_rate": 0.0002446629046013152, "loss": 0.0271, "step": 142320 }, { "epoch": 0.37, "learning_rate": 0.0002446590163849438, "loss": 0.0199, "step": 142330 }, { "epoch": 0.37, "learning_rate": 0.0002446551281685723, "loss": 0.018, "step": 142340 }, { "epoch": 0.37, "learning_rate": 0.0002446512399522008, "loss": 0.0187, "step": 142350 }, { "epoch": 0.37, "learning_rate": 0.0002446473517358294, "loss": 0.0159, "step": 142360 }, { "epoch": 0.37, "learning_rate": 0.0002446434635194579, "loss": 0.0195, "step": 142370 }, { "epoch": 0.37, "learning_rate": 0.0002446395753030864, "loss": 0.0175, "step": 142380 }, { "epoch": 0.37, "learning_rate": 0.000244635687086715, "loss": 0.0208, "step": 142390 }, { "epoch": 0.37, "learning_rate": 0.00024463179887034356, "loss": 0.0201, "step": 142400 }, { "epoch": 0.37, "learning_rate": 0.00024462791065397207, "loss": 0.0211, "step": 142410 }, { "epoch": 0.37, "learning_rate": 0.0002446240224376006, "loss": 0.0238, "step": 142420 }, { "epoch": 0.37, "learning_rate": 0.0002446201342212291, "loss": 0.0168, "step": 142430 }, { "epoch": 0.37, "learning_rate": 0.0002446162460048576, "loss": 0.017, "step": 142440 }, { "epoch": 0.37, "learning_rate": 0.0002446123577884862, "loss": 0.0254, "step": 142450 }, { "epoch": 0.37, "learning_rate": 0.00024460846957211475, "loss": 0.0216, "step": 142460 }, { "epoch": 0.37, "learning_rate": 0.00024460458135574327, "loss": 0.0221, "step": 142470 }, { "epoch": 0.37, "learning_rate": 0.0002446006931393718, "loss": 0.0156, "step": 142480 }, { "epoch": 0.37, "learning_rate": 0.00024459680492300035, "loss": 0.0212, "step": 142490 }, { "epoch": 0.37, "learning_rate": 0.00024459291670662887, "loss": 0.023, "step": 142500 }, { "epoch": 0.37, "learning_rate": 0.0002445890284902574, "loss": 0.0181, "step": 142510 }, { "epoch": 0.37, "learning_rate": 0.00024458514027388595, "loss": 0.0197, "step": 142520 }, { "epoch": 0.37, "learning_rate": 0.00024458125205751446, "loss": 0.0222, "step": 142530 }, { "epoch": 0.37, "learning_rate": 0.00024457736384114303, "loss": 0.0186, "step": 142540 }, { "epoch": 0.37, "learning_rate": 0.00024457347562477155, "loss": 0.0189, "step": 142550 }, { "epoch": 0.37, "learning_rate": 0.00024456958740840006, "loss": 0.0155, "step": 142560 }, { "epoch": 0.37, "learning_rate": 0.00024456569919202863, "loss": 0.0171, "step": 142570 }, { "epoch": 0.37, "learning_rate": 0.00024456181097565714, "loss": 0.018, "step": 142580 }, { "epoch": 0.37, "learning_rate": 0.00024455792275928566, "loss": 0.0173, "step": 142590 }, { "epoch": 0.37, "learning_rate": 0.00024455403454291423, "loss": 0.0222, "step": 142600 }, { "epoch": 0.37, "learning_rate": 0.0002445501463265428, "loss": 0.0174, "step": 142610 }, { "epoch": 0.37, "learning_rate": 0.0002445462581101713, "loss": 0.0191, "step": 142620 }, { "epoch": 0.37, "learning_rate": 0.0002445423698937998, "loss": 0.0218, "step": 142630 }, { "epoch": 0.37, "learning_rate": 0.00024453848167742834, "loss": 0.0175, "step": 142640 }, { "epoch": 0.37, "learning_rate": 0.0002445345934610569, "loss": 0.0141, "step": 142650 }, { "epoch": 0.37, "learning_rate": 0.0002445307052446854, "loss": 0.0215, "step": 142660 }, { "epoch": 0.37, "learning_rate": 0.000244526817028314, "loss": 0.0164, "step": 142670 }, { "epoch": 0.37, "learning_rate": 0.0002445229288119425, "loss": 0.0214, "step": 142680 }, { "epoch": 0.37, "learning_rate": 0.000244519040595571, "loss": 0.0234, "step": 142690 }, { "epoch": 0.37, "learning_rate": 0.0002445151523791996, "loss": 0.018, "step": 142700 }, { "epoch": 0.37, "learning_rate": 0.0002445112641628281, "loss": 0.021, "step": 142710 }, { "epoch": 0.37, "learning_rate": 0.0002445073759464566, "loss": 0.0208, "step": 142720 }, { "epoch": 0.37, "learning_rate": 0.0002445034877300852, "loss": 0.0196, "step": 142730 }, { "epoch": 0.37, "learning_rate": 0.0002444995995137137, "loss": 0.0202, "step": 142740 }, { "epoch": 0.37, "learning_rate": 0.00024449571129734227, "loss": 0.0189, "step": 142750 }, { "epoch": 0.37, "learning_rate": 0.0002444918230809708, "loss": 0.0154, "step": 142760 }, { "epoch": 0.37, "learning_rate": 0.0002444879348645993, "loss": 0.0178, "step": 142770 }, { "epoch": 0.37, "learning_rate": 0.00024448404664822787, "loss": 0.0212, "step": 142780 }, { "epoch": 0.37, "learning_rate": 0.0002444801584318564, "loss": 0.0165, "step": 142790 }, { "epoch": 0.37, "learning_rate": 0.00024447627021548495, "loss": 0.0165, "step": 142800 }, { "epoch": 0.37, "learning_rate": 0.00024447238199911347, "loss": 0.0182, "step": 142810 }, { "epoch": 0.37, "learning_rate": 0.00024446849378274204, "loss": 0.0183, "step": 142820 }, { "epoch": 0.37, "learning_rate": 0.00024446460556637055, "loss": 0.0215, "step": 142830 }, { "epoch": 0.37, "learning_rate": 0.00024446071734999906, "loss": 0.0193, "step": 142840 }, { "epoch": 0.37, "learning_rate": 0.0002444568291336276, "loss": 0.0188, "step": 142850 }, { "epoch": 0.37, "learning_rate": 0.00024445294091725615, "loss": 0.0179, "step": 142860 }, { "epoch": 0.37, "learning_rate": 0.00024444905270088466, "loss": 0.0195, "step": 142870 }, { "epoch": 0.37, "learning_rate": 0.00024444516448451323, "loss": 0.0235, "step": 142880 }, { "epoch": 0.37, "learning_rate": 0.00024444127626814175, "loss": 0.0147, "step": 142890 }, { "epoch": 0.37, "learning_rate": 0.0002444373880517703, "loss": 0.019, "step": 142900 }, { "epoch": 0.37, "learning_rate": 0.00024443349983539883, "loss": 0.0204, "step": 142910 }, { "epoch": 0.37, "learning_rate": 0.00024442961161902734, "loss": 0.0167, "step": 142920 }, { "epoch": 0.37, "learning_rate": 0.00024442572340265586, "loss": 0.0155, "step": 142930 }, { "epoch": 0.37, "learning_rate": 0.0002444218351862844, "loss": 0.0229, "step": 142940 }, { "epoch": 0.37, "learning_rate": 0.000244417946969913, "loss": 0.0182, "step": 142950 }, { "epoch": 0.37, "learning_rate": 0.0002444140587535415, "loss": 0.0203, "step": 142960 }, { "epoch": 0.37, "learning_rate": 0.00024441017053717, "loss": 0.0189, "step": 142970 }, { "epoch": 0.37, "learning_rate": 0.00024440628232079854, "loss": 0.0207, "step": 142980 }, { "epoch": 0.37, "learning_rate": 0.0002444023941044271, "loss": 0.0215, "step": 142990 }, { "epoch": 0.37, "learning_rate": 0.0002443985058880556, "loss": 0.022, "step": 143000 }, { "epoch": 0.37, "eval_cer": 0.8818286536472439, "eval_loss": 0.013993228785693645, "eval_runtime": 107.6329, "eval_samples_per_second": 18.582, "eval_steps_per_second": 4.645, "step": 143000 }, { "epoch": 0.37, "learning_rate": 0.0002443946176716842, "loss": 0.0182, "step": 143010 }, { "epoch": 0.37, "learning_rate": 0.0002443907294553127, "loss": 0.0179, "step": 143020 }, { "epoch": 0.37, "learning_rate": 0.0002443868412389413, "loss": 0.0181, "step": 143030 }, { "epoch": 0.37, "learning_rate": 0.0002443829530225698, "loss": 0.016, "step": 143040 }, { "epoch": 0.37, "learning_rate": 0.0002443790648061983, "loss": 0.0215, "step": 143050 }, { "epoch": 0.37, "learning_rate": 0.0002443751765898268, "loss": 0.0219, "step": 143060 }, { "epoch": 0.37, "learning_rate": 0.0002443712883734554, "loss": 0.0195, "step": 143070 }, { "epoch": 0.37, "learning_rate": 0.0002443674001570839, "loss": 0.0209, "step": 143080 }, { "epoch": 0.37, "learning_rate": 0.00024436351194071247, "loss": 0.0194, "step": 143090 }, { "epoch": 0.37, "learning_rate": 0.000244359623724341, "loss": 0.0202, "step": 143100 }, { "epoch": 0.37, "learning_rate": 0.00024435573550796955, "loss": 0.017, "step": 143110 }, { "epoch": 0.37, "learning_rate": 0.00024435184729159807, "loss": 0.0219, "step": 143120 }, { "epoch": 0.37, "learning_rate": 0.0002443479590752266, "loss": 0.0197, "step": 143130 }, { "epoch": 0.37, "learning_rate": 0.0002443440708588551, "loss": 0.0221, "step": 143140 }, { "epoch": 0.37, "learning_rate": 0.00024434018264248367, "loss": 0.0189, "step": 143150 }, { "epoch": 0.37, "learning_rate": 0.00024433629442611223, "loss": 0.0175, "step": 143160 }, { "epoch": 0.37, "learning_rate": 0.00024433240620974075, "loss": 0.0202, "step": 143170 }, { "epoch": 0.37, "learning_rate": 0.00024432851799336926, "loss": 0.0215, "step": 143180 }, { "epoch": 0.37, "learning_rate": 0.0002443246297769978, "loss": 0.0135, "step": 143190 }, { "epoch": 0.37, "learning_rate": 0.00024432074156062635, "loss": 0.015, "step": 143200 }, { "epoch": 0.37, "learning_rate": 0.00024431685334425486, "loss": 0.0231, "step": 143210 }, { "epoch": 0.37, "learning_rate": 0.00024431296512788343, "loss": 0.0198, "step": 143220 }, { "epoch": 0.37, "learning_rate": 0.00024430907691151194, "loss": 0.0205, "step": 143230 }, { "epoch": 0.37, "learning_rate": 0.0002443051886951405, "loss": 0.0251, "step": 143240 }, { "epoch": 0.37, "learning_rate": 0.00024430130047876903, "loss": 0.0202, "step": 143250 }, { "epoch": 0.37, "learning_rate": 0.00024429741226239754, "loss": 0.0211, "step": 143260 }, { "epoch": 0.37, "learning_rate": 0.00024429352404602606, "loss": 0.0174, "step": 143270 }, { "epoch": 0.37, "learning_rate": 0.0002442896358296546, "loss": 0.0176, "step": 143280 }, { "epoch": 0.37, "learning_rate": 0.0002442857476132832, "loss": 0.0179, "step": 143290 }, { "epoch": 0.37, "learning_rate": 0.0002442818593969117, "loss": 0.0205, "step": 143300 }, { "epoch": 0.37, "learning_rate": 0.0002442779711805402, "loss": 0.0203, "step": 143310 }, { "epoch": 0.37, "learning_rate": 0.0002442740829641688, "loss": 0.0263, "step": 143320 }, { "epoch": 0.37, "learning_rate": 0.0002442701947477973, "loss": 0.0184, "step": 143330 }, { "epoch": 0.37, "learning_rate": 0.0002442663065314258, "loss": 0.0194, "step": 143340 }, { "epoch": 0.37, "learning_rate": 0.0002442624183150544, "loss": 0.0178, "step": 143350 }, { "epoch": 0.37, "learning_rate": 0.0002442585300986829, "loss": 0.022, "step": 143360 }, { "epoch": 0.37, "learning_rate": 0.00024425464188231147, "loss": 0.0241, "step": 143370 }, { "epoch": 0.37, "learning_rate": 0.00024425075366594, "loss": 0.0201, "step": 143380 }, { "epoch": 0.37, "learning_rate": 0.0002442468654495685, "loss": 0.0185, "step": 143390 }, { "epoch": 0.37, "learning_rate": 0.00024424297723319707, "loss": 0.0227, "step": 143400 }, { "epoch": 0.37, "learning_rate": 0.0002442390890168256, "loss": 0.0223, "step": 143410 }, { "epoch": 0.37, "learning_rate": 0.0002442352008004541, "loss": 0.0191, "step": 143420 }, { "epoch": 0.37, "learning_rate": 0.00024423131258408267, "loss": 0.02, "step": 143430 }, { "epoch": 0.37, "learning_rate": 0.0002442274243677112, "loss": 0.0191, "step": 143440 }, { "epoch": 0.37, "learning_rate": 0.00024422353615133975, "loss": 0.0204, "step": 143450 }, { "epoch": 0.37, "learning_rate": 0.00024421964793496827, "loss": 0.021, "step": 143460 }, { "epoch": 0.37, "learning_rate": 0.0002442157597185968, "loss": 0.0237, "step": 143470 }, { "epoch": 0.37, "learning_rate": 0.0002442118715022253, "loss": 0.0191, "step": 143480 }, { "epoch": 0.37, "learning_rate": 0.00024420798328585386, "loss": 0.0193, "step": 143490 }, { "epoch": 0.37, "learning_rate": 0.00024420409506948243, "loss": 0.0185, "step": 143500 }, { "epoch": 0.37, "learning_rate": 0.00024420020685311095, "loss": 0.0221, "step": 143510 }, { "epoch": 0.37, "learning_rate": 0.00024419631863673946, "loss": 0.0192, "step": 143520 }, { "epoch": 0.37, "learning_rate": 0.00024419243042036803, "loss": 0.0181, "step": 143530 }, { "epoch": 0.37, "learning_rate": 0.00024418854220399655, "loss": 0.0172, "step": 143540 }, { "epoch": 0.37, "learning_rate": 0.00024418465398762506, "loss": 0.0165, "step": 143550 }, { "epoch": 0.37, "learning_rate": 0.00024418076577125363, "loss": 0.0211, "step": 143560 }, { "epoch": 0.37, "learning_rate": 0.00024417687755488214, "loss": 0.0184, "step": 143570 }, { "epoch": 0.37, "learning_rate": 0.0002441729893385107, "loss": 0.0184, "step": 143580 }, { "epoch": 0.37, "learning_rate": 0.0002441691011221392, "loss": 0.0224, "step": 143590 }, { "epoch": 0.37, "learning_rate": 0.00024416521290576774, "loss": 0.0267, "step": 143600 }, { "epoch": 0.37, "learning_rate": 0.0002441613246893963, "loss": 0.0242, "step": 143610 }, { "epoch": 0.37, "learning_rate": 0.0002441574364730248, "loss": 0.0209, "step": 143620 }, { "epoch": 0.37, "learning_rate": 0.00024415354825665334, "loss": 0.0208, "step": 143630 }, { "epoch": 0.37, "learning_rate": 0.0002441496600402819, "loss": 0.0217, "step": 143640 }, { "epoch": 0.37, "learning_rate": 0.0002441457718239105, "loss": 0.0259, "step": 143650 }, { "epoch": 0.37, "learning_rate": 0.000244141883607539, "loss": 0.0221, "step": 143660 }, { "epoch": 0.37, "learning_rate": 0.0002441379953911675, "loss": 0.0188, "step": 143670 }, { "epoch": 0.37, "learning_rate": 0.00024413410717479605, "loss": 0.0222, "step": 143680 }, { "epoch": 0.37, "learning_rate": 0.00024413021895842456, "loss": 0.02, "step": 143690 }, { "epoch": 0.37, "learning_rate": 0.00024412633074205313, "loss": 0.0203, "step": 143700 }, { "epoch": 0.37, "learning_rate": 0.00024412244252568164, "loss": 0.0195, "step": 143710 }, { "epoch": 0.37, "learning_rate": 0.00024411855430931019, "loss": 0.0168, "step": 143720 }, { "epoch": 0.37, "learning_rate": 0.0002441146660929387, "loss": 0.0219, "step": 143730 }, { "epoch": 0.37, "learning_rate": 0.00024411077787656727, "loss": 0.0179, "step": 143740 }, { "epoch": 0.37, "learning_rate": 0.00024410688966019578, "loss": 0.0181, "step": 143750 }, { "epoch": 0.37, "learning_rate": 0.00024410300144382433, "loss": 0.0172, "step": 143760 }, { "epoch": 0.37, "learning_rate": 0.00024409911322745284, "loss": 0.0186, "step": 143770 }, { "epoch": 0.37, "learning_rate": 0.0002440952250110814, "loss": 0.0234, "step": 143780 }, { "epoch": 0.37, "learning_rate": 0.00024409133679470992, "loss": 0.0172, "step": 143790 }, { "epoch": 0.37, "learning_rate": 0.00024408744857833847, "loss": 0.0196, "step": 143800 }, { "epoch": 0.37, "learning_rate": 0.00024408356036196698, "loss": 0.0217, "step": 143810 }, { "epoch": 0.37, "learning_rate": 0.00024407967214559555, "loss": 0.0192, "step": 143820 }, { "epoch": 0.37, "learning_rate": 0.0002440757839292241, "loss": 0.0252, "step": 143830 }, { "epoch": 0.37, "learning_rate": 0.0002440718957128526, "loss": 0.0214, "step": 143840 }, { "epoch": 0.37, "learning_rate": 0.00024406800749648115, "loss": 0.0249, "step": 143850 }, { "epoch": 0.37, "learning_rate": 0.0002440641192801097, "loss": 0.0182, "step": 143860 }, { "epoch": 0.37, "learning_rate": 0.00024406023106373823, "loss": 0.0203, "step": 143870 }, { "epoch": 0.37, "learning_rate": 0.00024405634284736674, "loss": 0.0259, "step": 143880 }, { "epoch": 0.37, "learning_rate": 0.00024405245463099529, "loss": 0.02, "step": 143890 }, { "epoch": 0.37, "learning_rate": 0.00024404856641462383, "loss": 0.0193, "step": 143900 }, { "epoch": 0.37, "learning_rate": 0.00024404467819825237, "loss": 0.0215, "step": 143910 }, { "epoch": 0.37, "learning_rate": 0.00024404078998188088, "loss": 0.0187, "step": 143920 }, { "epoch": 0.37, "learning_rate": 0.00024403690176550943, "loss": 0.02, "step": 143930 }, { "epoch": 0.37, "learning_rate": 0.00024403301354913794, "loss": 0.0228, "step": 143940 }, { "epoch": 0.37, "learning_rate": 0.0002440291253327665, "loss": 0.0226, "step": 143950 }, { "epoch": 0.37, "learning_rate": 0.00024402523711639502, "loss": 0.0178, "step": 143960 }, { "epoch": 0.37, "learning_rate": 0.00024402134890002356, "loss": 0.0185, "step": 143970 }, { "epoch": 0.37, "learning_rate": 0.00024401746068365208, "loss": 0.0209, "step": 143980 }, { "epoch": 0.37, "learning_rate": 0.00024401357246728065, "loss": 0.0218, "step": 143990 }, { "epoch": 0.37, "learning_rate": 0.0002440096842509092, "loss": 0.0212, "step": 144000 }, { "epoch": 0.37, "eval_cer": 0.881806259456297, "eval_loss": 0.014057588763535023, "eval_runtime": 107.315, "eval_samples_per_second": 18.637, "eval_steps_per_second": 4.659, "step": 144000 }, { "epoch": 0.37, "learning_rate": 0.0002440057960345377, "loss": 0.023, "step": 144010 }, { "epoch": 0.37, "learning_rate": 0.00024400190781816622, "loss": 0.0212, "step": 144020 }, { "epoch": 0.37, "learning_rate": 0.0002439980196017948, "loss": 0.0209, "step": 144030 }, { "epoch": 0.37, "learning_rate": 0.00024399413138542333, "loss": 0.0195, "step": 144040 }, { "epoch": 0.37, "learning_rate": 0.00024399024316905184, "loss": 0.0245, "step": 144050 }, { "epoch": 0.37, "learning_rate": 0.00024398635495268039, "loss": 0.0192, "step": 144060 }, { "epoch": 0.37, "learning_rate": 0.00024398246673630893, "loss": 0.022, "step": 144070 }, { "epoch": 0.37, "learning_rate": 0.00024397857851993747, "loss": 0.0249, "step": 144080 }, { "epoch": 0.37, "learning_rate": 0.00024397469030356598, "loss": 0.0198, "step": 144090 }, { "epoch": 0.37, "learning_rate": 0.00024397080208719452, "loss": 0.0166, "step": 144100 }, { "epoch": 0.37, "learning_rate": 0.00024396691387082307, "loss": 0.0193, "step": 144110 }, { "epoch": 0.37, "learning_rate": 0.0002439630256544516, "loss": 0.0195, "step": 144120 }, { "epoch": 0.37, "learning_rate": 0.00024395913743808012, "loss": 0.0189, "step": 144130 }, { "epoch": 0.37, "learning_rate": 0.00024395524922170866, "loss": 0.0237, "step": 144140 }, { "epoch": 0.37, "learning_rate": 0.00024395136100533718, "loss": 0.0182, "step": 144150 }, { "epoch": 0.37, "learning_rate": 0.00024394747278896575, "loss": 0.0198, "step": 144160 }, { "epoch": 0.37, "learning_rate": 0.00024394358457259426, "loss": 0.0202, "step": 144170 }, { "epoch": 0.37, "learning_rate": 0.0002439396963562228, "loss": 0.0228, "step": 144180 }, { "epoch": 0.37, "learning_rate": 0.00024393580813985132, "loss": 0.0233, "step": 144190 }, { "epoch": 0.37, "learning_rate": 0.0002439319199234799, "loss": 0.0174, "step": 144200 }, { "epoch": 0.37, "learning_rate": 0.00024392803170710843, "loss": 0.0219, "step": 144210 }, { "epoch": 0.37, "learning_rate": 0.00024392414349073694, "loss": 0.0176, "step": 144220 }, { "epoch": 0.37, "learning_rate": 0.00024392025527436548, "loss": 0.0165, "step": 144230 }, { "epoch": 0.37, "learning_rate": 0.00024391636705799403, "loss": 0.0217, "step": 144240 }, { "epoch": 0.37, "learning_rate": 0.00024391247884162257, "loss": 0.0149, "step": 144250 }, { "epoch": 0.37, "learning_rate": 0.00024390859062525108, "loss": 0.0286, "step": 144260 }, { "epoch": 0.37, "learning_rate": 0.00024390470240887962, "loss": 0.0187, "step": 144270 }, { "epoch": 0.37, "learning_rate": 0.00024390081419250817, "loss": 0.0224, "step": 144280 }, { "epoch": 0.37, "learning_rate": 0.0002438969259761367, "loss": 0.0183, "step": 144290 }, { "epoch": 0.37, "learning_rate": 0.00024389303775976522, "loss": 0.0224, "step": 144300 }, { "epoch": 0.37, "learning_rate": 0.00024388914954339376, "loss": 0.0328, "step": 144310 }, { "epoch": 0.37, "learning_rate": 0.00024388526132702233, "loss": 0.0206, "step": 144320 }, { "epoch": 0.37, "learning_rate": 0.00024388137311065085, "loss": 0.0226, "step": 144330 }, { "epoch": 0.37, "learning_rate": 0.00024387748489427936, "loss": 0.026, "step": 144340 }, { "epoch": 0.37, "learning_rate": 0.0002438735966779079, "loss": 0.0238, "step": 144350 }, { "epoch": 0.37, "learning_rate": 0.00024386970846153647, "loss": 0.0215, "step": 144360 }, { "epoch": 0.37, "learning_rate": 0.00024386582024516499, "loss": 0.0233, "step": 144370 }, { "epoch": 0.37, "learning_rate": 0.00024386193202879353, "loss": 0.0296, "step": 144380 }, { "epoch": 0.37, "learning_rate": 0.00024385804381242204, "loss": 0.021, "step": 144390 }, { "epoch": 0.37, "learning_rate": 0.00024385415559605058, "loss": 0.0208, "step": 144400 }, { "epoch": 0.37, "learning_rate": 0.00024385026737967913, "loss": 0.0181, "step": 144410 }, { "epoch": 0.37, "learning_rate": 0.00024384637916330767, "loss": 0.0185, "step": 144420 }, { "epoch": 0.37, "learning_rate": 0.00024384249094693618, "loss": 0.0194, "step": 144430 }, { "epoch": 0.37, "learning_rate": 0.00024383860273056472, "loss": 0.0224, "step": 144440 }, { "epoch": 0.37, "learning_rate": 0.00024383471451419326, "loss": 0.0197, "step": 144450 }, { "epoch": 0.37, "learning_rate": 0.0002438308262978218, "loss": 0.0154, "step": 144460 }, { "epoch": 0.37, "learning_rate": 0.00024382693808145032, "loss": 0.0212, "step": 144470 }, { "epoch": 0.37, "learning_rate": 0.00024382304986507886, "loss": 0.0207, "step": 144480 }, { "epoch": 0.37, "learning_rate": 0.0002438191616487074, "loss": 0.0236, "step": 144490 }, { "epoch": 0.37, "learning_rate": 0.00024381527343233595, "loss": 0.0192, "step": 144500 }, { "epoch": 0.37, "learning_rate": 0.00024381138521596446, "loss": 0.0185, "step": 144510 }, { "epoch": 0.37, "learning_rate": 0.000243807496999593, "loss": 0.015, "step": 144520 }, { "epoch": 0.37, "learning_rate": 0.00024380360878322157, "loss": 0.0194, "step": 144530 }, { "epoch": 0.37, "learning_rate": 0.00024379972056685009, "loss": 0.0217, "step": 144540 }, { "epoch": 0.37, "learning_rate": 0.00024379583235047863, "loss": 0.0211, "step": 144550 }, { "epoch": 0.37, "learning_rate": 0.00024379194413410714, "loss": 0.022, "step": 144560 }, { "epoch": 0.37, "learning_rate": 0.0002437880559177357, "loss": 0.0211, "step": 144570 }, { "epoch": 0.37, "learning_rate": 0.00024378416770136422, "loss": 0.0248, "step": 144580 }, { "epoch": 0.37, "learning_rate": 0.00024378027948499277, "loss": 0.019, "step": 144590 }, { "epoch": 0.37, "learning_rate": 0.00024377639126862128, "loss": 0.0181, "step": 144600 }, { "epoch": 0.37, "learning_rate": 0.00024377250305224985, "loss": 0.0239, "step": 144610 }, { "epoch": 0.37, "learning_rate": 0.00024376861483587836, "loss": 0.0198, "step": 144620 }, { "epoch": 0.37, "learning_rate": 0.0002437647266195069, "loss": 0.0288, "step": 144630 }, { "epoch": 0.37, "learning_rate": 0.00024376083840313542, "loss": 0.0218, "step": 144640 }, { "epoch": 0.37, "learning_rate": 0.00024375695018676396, "loss": 0.019, "step": 144650 }, { "epoch": 0.37, "learning_rate": 0.0002437530619703925, "loss": 0.0176, "step": 144660 }, { "epoch": 0.38, "learning_rate": 0.00024374917375402105, "loss": 0.0231, "step": 144670 }, { "epoch": 0.38, "learning_rate": 0.00024374528553764956, "loss": 0.0169, "step": 144680 }, { "epoch": 0.38, "learning_rate": 0.0002437413973212781, "loss": 0.0212, "step": 144690 }, { "epoch": 0.38, "learning_rate": 0.00024373750910490667, "loss": 0.0247, "step": 144700 }, { "epoch": 0.38, "learning_rate": 0.00024373362088853518, "loss": 0.0245, "step": 144710 }, { "epoch": 0.38, "learning_rate": 0.00024372973267216373, "loss": 0.0174, "step": 144720 }, { "epoch": 0.38, "learning_rate": 0.00024372584445579224, "loss": 0.0208, "step": 144730 }, { "epoch": 0.38, "learning_rate": 0.0002437219562394208, "loss": 0.0191, "step": 144740 }, { "epoch": 0.38, "learning_rate": 0.00024371806802304932, "loss": 0.0173, "step": 144750 }, { "epoch": 0.38, "learning_rate": 0.00024371417980667787, "loss": 0.0211, "step": 144760 }, { "epoch": 0.38, "learning_rate": 0.00024371029159030638, "loss": 0.0189, "step": 144770 }, { "epoch": 0.38, "learning_rate": 0.00024370640337393495, "loss": 0.0184, "step": 144780 }, { "epoch": 0.38, "learning_rate": 0.00024370251515756346, "loss": 0.0195, "step": 144790 }, { "epoch": 0.38, "learning_rate": 0.000243698626941192, "loss": 0.0243, "step": 144800 }, { "epoch": 0.38, "learning_rate": 0.00024369473872482052, "loss": 0.0192, "step": 144810 }, { "epoch": 0.38, "learning_rate": 0.0002436908505084491, "loss": 0.0244, "step": 144820 }, { "epoch": 0.38, "learning_rate": 0.0002436869622920776, "loss": 0.0197, "step": 144830 }, { "epoch": 0.38, "learning_rate": 0.00024368307407570614, "loss": 0.0257, "step": 144840 }, { "epoch": 0.38, "learning_rate": 0.00024367918585933466, "loss": 0.017, "step": 144850 }, { "epoch": 0.38, "learning_rate": 0.00024367529764296323, "loss": 0.0299, "step": 144860 }, { "epoch": 0.38, "learning_rate": 0.00024367140942659177, "loss": 0.0194, "step": 144870 }, { "epoch": 0.38, "learning_rate": 0.00024366752121022028, "loss": 0.0217, "step": 144880 }, { "epoch": 0.38, "learning_rate": 0.0002436636329938488, "loss": 0.0205, "step": 144890 }, { "epoch": 0.38, "learning_rate": 0.00024365974477747734, "loss": 0.0273, "step": 144900 }, { "epoch": 0.38, "learning_rate": 0.0002436558565611059, "loss": 0.0214, "step": 144910 }, { "epoch": 0.38, "learning_rate": 0.00024365196834473442, "loss": 0.0197, "step": 144920 }, { "epoch": 0.38, "learning_rate": 0.00024364808012836297, "loss": 0.0215, "step": 144930 }, { "epoch": 0.38, "learning_rate": 0.00024364419191199148, "loss": 0.0182, "step": 144940 }, { "epoch": 0.38, "learning_rate": 0.00024364030369562005, "loss": 0.0226, "step": 144950 }, { "epoch": 0.38, "learning_rate": 0.00024363641547924856, "loss": 0.0177, "step": 144960 }, { "epoch": 0.38, "learning_rate": 0.0002436325272628771, "loss": 0.0187, "step": 144970 }, { "epoch": 0.38, "learning_rate": 0.00024362863904650562, "loss": 0.0195, "step": 144980 }, { "epoch": 0.38, "learning_rate": 0.0002436247508301342, "loss": 0.0241, "step": 144990 }, { "epoch": 0.38, "learning_rate": 0.0002436208626137627, "loss": 0.019, "step": 145000 }, { "epoch": 0.38, "eval_cer": 0.881751673615864, "eval_loss": 0.013631855137646198, "eval_runtime": 107.3251, "eval_samples_per_second": 18.635, "eval_steps_per_second": 4.659, "step": 145000 }, { "epoch": 0.38, "learning_rate": 0.00024361697439739124, "loss": 0.0184, "step": 145010 }, { "epoch": 0.38, "learning_rate": 0.00024361308618101976, "loss": 0.0243, "step": 145020 }, { "epoch": 0.38, "learning_rate": 0.00024360919796464833, "loss": 0.022, "step": 145030 }, { "epoch": 0.38, "learning_rate": 0.00024360530974827687, "loss": 0.0166, "step": 145040 }, { "epoch": 0.38, "learning_rate": 0.00024360142153190538, "loss": 0.0215, "step": 145050 }, { "epoch": 0.38, "learning_rate": 0.0002435975333155339, "loss": 0.0185, "step": 145060 }, { "epoch": 0.38, "learning_rate": 0.00024359364509916247, "loss": 0.0275, "step": 145070 }, { "epoch": 0.38, "learning_rate": 0.000243589756882791, "loss": 0.0207, "step": 145080 }, { "epoch": 0.38, "learning_rate": 0.00024358586866641952, "loss": 0.0248, "step": 145090 }, { "epoch": 0.38, "learning_rate": 0.00024358198045004806, "loss": 0.0264, "step": 145100 }, { "epoch": 0.38, "learning_rate": 0.0002435780922336766, "loss": 0.0247, "step": 145110 }, { "epoch": 0.38, "learning_rate": 0.00024357420401730515, "loss": 0.0189, "step": 145120 }, { "epoch": 0.38, "learning_rate": 0.00024357031580093366, "loss": 0.0253, "step": 145130 }, { "epoch": 0.38, "learning_rate": 0.0002435664275845622, "loss": 0.0188, "step": 145140 }, { "epoch": 0.38, "learning_rate": 0.00024356253936819072, "loss": 0.0186, "step": 145150 }, { "epoch": 0.38, "learning_rate": 0.0002435586511518193, "loss": 0.0215, "step": 145160 }, { "epoch": 0.38, "learning_rate": 0.0002435547629354478, "loss": 0.0196, "step": 145170 }, { "epoch": 0.38, "learning_rate": 0.00024355087471907634, "loss": 0.0212, "step": 145180 }, { "epoch": 0.38, "learning_rate": 0.00024354698650270486, "loss": 0.0189, "step": 145190 }, { "epoch": 0.38, "learning_rate": 0.00024354309828633343, "loss": 0.0186, "step": 145200 }, { "epoch": 0.38, "learning_rate": 0.00024353921006996194, "loss": 0.0184, "step": 145210 }, { "epoch": 0.38, "learning_rate": 0.00024353532185359048, "loss": 0.0231, "step": 145220 }, { "epoch": 0.38, "learning_rate": 0.000243531433637219, "loss": 0.0197, "step": 145230 }, { "epoch": 0.38, "learning_rate": 0.00024352754542084757, "loss": 0.019, "step": 145240 }, { "epoch": 0.38, "learning_rate": 0.0002435236572044761, "loss": 0.0169, "step": 145250 }, { "epoch": 0.38, "learning_rate": 0.00024351976898810462, "loss": 0.015, "step": 145260 }, { "epoch": 0.38, "learning_rate": 0.00024351588077173316, "loss": 0.0223, "step": 145270 }, { "epoch": 0.38, "learning_rate": 0.0002435119925553617, "loss": 0.0172, "step": 145280 }, { "epoch": 0.38, "learning_rate": 0.00024350810433899025, "loss": 0.0421, "step": 145290 }, { "epoch": 0.38, "learning_rate": 0.00024350421612261876, "loss": 0.0221, "step": 145300 }, { "epoch": 0.38, "learning_rate": 0.0002435003279062473, "loss": 0.0297, "step": 145310 }, { "epoch": 0.38, "learning_rate": 0.00024349643968987585, "loss": 0.0212, "step": 145320 }, { "epoch": 0.38, "learning_rate": 0.0002434925514735044, "loss": 0.03, "step": 145330 }, { "epoch": 0.38, "learning_rate": 0.0002434886632571329, "loss": 0.0266, "step": 145340 }, { "epoch": 0.38, "learning_rate": 0.00024348477504076144, "loss": 0.0174, "step": 145350 }, { "epoch": 0.38, "learning_rate": 0.00024348088682438998, "loss": 0.0342, "step": 145360 }, { "epoch": 0.38, "learning_rate": 0.00024347699860801853, "loss": 0.0269, "step": 145370 }, { "epoch": 0.38, "learning_rate": 0.00024347311039164704, "loss": 0.0198, "step": 145380 }, { "epoch": 0.38, "learning_rate": 0.00024346922217527558, "loss": 0.02, "step": 145390 }, { "epoch": 0.38, "learning_rate": 0.0002434653339589041, "loss": 0.0163, "step": 145400 }, { "epoch": 0.38, "learning_rate": 0.00024346144574253267, "loss": 0.0172, "step": 145410 }, { "epoch": 0.38, "learning_rate": 0.0002434575575261612, "loss": 0.0207, "step": 145420 }, { "epoch": 0.38, "learning_rate": 0.00024345366930978972, "loss": 0.0201, "step": 145430 }, { "epoch": 0.38, "learning_rate": 0.00024344978109341826, "loss": 0.0256, "step": 145440 }, { "epoch": 0.38, "learning_rate": 0.0002434458928770468, "loss": 0.0194, "step": 145450 }, { "epoch": 0.38, "learning_rate": 0.00024344200466067535, "loss": 0.0187, "step": 145460 }, { "epoch": 0.38, "learning_rate": 0.00024343811644430386, "loss": 0.0209, "step": 145470 }, { "epoch": 0.38, "learning_rate": 0.0002434342282279324, "loss": 0.0183, "step": 145480 }, { "epoch": 0.38, "learning_rate": 0.00024343034001156094, "loss": 0.0179, "step": 145490 }, { "epoch": 0.38, "learning_rate": 0.00024342645179518949, "loss": 0.0206, "step": 145500 }, { "epoch": 0.38, "learning_rate": 0.000243422563578818, "loss": 0.0194, "step": 145510 }, { "epoch": 0.38, "learning_rate": 0.00024341867536244654, "loss": 0.0194, "step": 145520 }, { "epoch": 0.38, "learning_rate": 0.00024341478714607508, "loss": 0.0269, "step": 145530 }, { "epoch": 0.38, "learning_rate": 0.00024341089892970363, "loss": 0.0195, "step": 145540 }, { "epoch": 0.38, "learning_rate": 0.00024340701071333214, "loss": 0.0213, "step": 145550 }, { "epoch": 0.38, "learning_rate": 0.00024340312249696068, "loss": 0.0207, "step": 145560 }, { "epoch": 0.38, "learning_rate": 0.00024339923428058925, "loss": 0.02, "step": 145570 }, { "epoch": 0.38, "learning_rate": 0.00024339534606421777, "loss": 0.0216, "step": 145580 }, { "epoch": 0.38, "learning_rate": 0.0002433914578478463, "loss": 0.0268, "step": 145590 }, { "epoch": 0.38, "learning_rate": 0.00024338756963147482, "loss": 0.0235, "step": 145600 }, { "epoch": 0.38, "learning_rate": 0.0002433836814151034, "loss": 0.0168, "step": 145610 }, { "epoch": 0.38, "learning_rate": 0.0002433797931987319, "loss": 0.0216, "step": 145620 }, { "epoch": 0.38, "learning_rate": 0.00024337590498236045, "loss": 0.0179, "step": 145630 }, { "epoch": 0.38, "learning_rate": 0.00024337201676598896, "loss": 0.0167, "step": 145640 }, { "epoch": 0.38, "learning_rate": 0.0002433681285496175, "loss": 0.0202, "step": 145650 }, { "epoch": 0.38, "learning_rate": 0.00024336424033324604, "loss": 0.0205, "step": 145660 }, { "epoch": 0.38, "learning_rate": 0.00024336035211687459, "loss": 0.019, "step": 145670 }, { "epoch": 0.38, "learning_rate": 0.0002433564639005031, "loss": 0.0192, "step": 145680 }, { "epoch": 0.38, "learning_rate": 0.00024335257568413164, "loss": 0.0148, "step": 145690 }, { "epoch": 0.38, "learning_rate": 0.00024334868746776018, "loss": 0.0165, "step": 145700 }, { "epoch": 0.38, "learning_rate": 0.00024334479925138873, "loss": 0.0164, "step": 145710 }, { "epoch": 0.38, "learning_rate": 0.00024334091103501724, "loss": 0.0201, "step": 145720 }, { "epoch": 0.38, "learning_rate": 0.00024333702281864578, "loss": 0.0184, "step": 145730 }, { "epoch": 0.38, "learning_rate": 0.00024333313460227435, "loss": 0.0222, "step": 145740 }, { "epoch": 0.38, "learning_rate": 0.00024332924638590286, "loss": 0.02, "step": 145750 }, { "epoch": 0.38, "learning_rate": 0.00024332535816953138, "loss": 0.0213, "step": 145760 }, { "epoch": 0.38, "learning_rate": 0.00024332146995315992, "loss": 0.0229, "step": 145770 }, { "epoch": 0.38, "learning_rate": 0.0002433175817367885, "loss": 0.024, "step": 145780 }, { "epoch": 0.38, "learning_rate": 0.000243313693520417, "loss": 0.0219, "step": 145790 }, { "epoch": 0.38, "learning_rate": 0.00024330980530404555, "loss": 0.0213, "step": 145800 }, { "epoch": 0.38, "learning_rate": 0.00024330591708767406, "loss": 0.0253, "step": 145810 }, { "epoch": 0.38, "learning_rate": 0.00024330202887130263, "loss": 0.0199, "step": 145820 }, { "epoch": 0.38, "learning_rate": 0.00024329814065493114, "loss": 0.0198, "step": 145830 }, { "epoch": 0.38, "learning_rate": 0.00024329425243855969, "loss": 0.0156, "step": 145840 }, { "epoch": 0.38, "learning_rate": 0.0002432903642221882, "loss": 0.0218, "step": 145850 }, { "epoch": 0.38, "learning_rate": 0.00024328647600581677, "loss": 0.018, "step": 145860 }, { "epoch": 0.38, "learning_rate": 0.00024328258778944528, "loss": 0.0215, "step": 145870 }, { "epoch": 0.38, "learning_rate": 0.00024327869957307382, "loss": 0.0181, "step": 145880 }, { "epoch": 0.38, "learning_rate": 0.00024327481135670234, "loss": 0.0169, "step": 145890 }, { "epoch": 0.38, "learning_rate": 0.00024327092314033088, "loss": 0.0169, "step": 145900 }, { "epoch": 0.38, "learning_rate": 0.00024326703492395945, "loss": 0.0192, "step": 145910 }, { "epoch": 0.38, "learning_rate": 0.00024326314670758796, "loss": 0.0229, "step": 145920 }, { "epoch": 0.38, "learning_rate": 0.00024325925849121648, "loss": 0.0207, "step": 145930 }, { "epoch": 0.38, "learning_rate": 0.00024325537027484502, "loss": 0.0191, "step": 145940 }, { "epoch": 0.38, "learning_rate": 0.0002432514820584736, "loss": 0.0205, "step": 145950 }, { "epoch": 0.38, "learning_rate": 0.0002432475938421021, "loss": 0.0161, "step": 145960 }, { "epoch": 0.38, "learning_rate": 0.00024324370562573065, "loss": 0.0197, "step": 145970 }, { "epoch": 0.38, "learning_rate": 0.00024323981740935916, "loss": 0.0213, "step": 145980 }, { "epoch": 0.38, "learning_rate": 0.00024323592919298773, "loss": 0.0208, "step": 145990 }, { "epoch": 0.38, "learning_rate": 0.00024323204097661624, "loss": 0.0181, "step": 146000 }, { "epoch": 0.38, "eval_cer": 0.8817628707113375, "eval_loss": 0.013447397388517857, "eval_runtime": 107.4268, "eval_samples_per_second": 18.617, "eval_steps_per_second": 4.654, "step": 146000 }, { "epoch": 0.38, "learning_rate": 0.00024322815276024478, "loss": 0.0197, "step": 146010 }, { "epoch": 0.38, "learning_rate": 0.0002432242645438733, "loss": 0.0184, "step": 146020 }, { "epoch": 0.38, "learning_rate": 0.00024322037632750187, "loss": 0.0296, "step": 146030 }, { "epoch": 0.38, "learning_rate": 0.00024321648811113038, "loss": 0.0268, "step": 146040 }, { "epoch": 0.38, "learning_rate": 0.00024321259989475892, "loss": 0.0156, "step": 146050 }, { "epoch": 0.38, "learning_rate": 0.00024320871167838744, "loss": 0.0191, "step": 146060 }, { "epoch": 0.38, "learning_rate": 0.000243204823462016, "loss": 0.0186, "step": 146070 }, { "epoch": 0.38, "learning_rate": 0.00024320093524564452, "loss": 0.0205, "step": 146080 }, { "epoch": 0.38, "learning_rate": 0.00024319704702927306, "loss": 0.0219, "step": 146090 }, { "epoch": 0.38, "learning_rate": 0.00024319315881290158, "loss": 0.0225, "step": 146100 }, { "epoch": 0.38, "learning_rate": 0.00024318927059653015, "loss": 0.0206, "step": 146110 }, { "epoch": 0.38, "learning_rate": 0.0002431853823801587, "loss": 0.0415, "step": 146120 }, { "epoch": 0.38, "learning_rate": 0.0002431814941637872, "loss": 0.0226, "step": 146130 }, { "epoch": 0.38, "learning_rate": 0.00024317760594741574, "loss": 0.022, "step": 146140 }, { "epoch": 0.38, "learning_rate": 0.00024317371773104426, "loss": 0.021, "step": 146150 }, { "epoch": 0.38, "learning_rate": 0.00024316982951467283, "loss": 0.0163, "step": 146160 }, { "epoch": 0.38, "learning_rate": 0.00024316594129830134, "loss": 0.0177, "step": 146170 }, { "epoch": 0.38, "learning_rate": 0.00024316205308192988, "loss": 0.0206, "step": 146180 }, { "epoch": 0.38, "learning_rate": 0.0002431581648655584, "loss": 0.0218, "step": 146190 }, { "epoch": 0.38, "learning_rate": 0.00024315427664918697, "loss": 0.0216, "step": 146200 }, { "epoch": 0.38, "learning_rate": 0.00024315038843281548, "loss": 0.0207, "step": 146210 }, { "epoch": 0.38, "learning_rate": 0.00024314650021644402, "loss": 0.0203, "step": 146220 }, { "epoch": 0.38, "learning_rate": 0.00024314261200007254, "loss": 0.0177, "step": 146230 }, { "epoch": 0.38, "learning_rate": 0.0002431387237837011, "loss": 0.0155, "step": 146240 }, { "epoch": 0.38, "learning_rate": 0.00024313483556732962, "loss": 0.0193, "step": 146250 }, { "epoch": 0.38, "learning_rate": 0.00024313094735095816, "loss": 0.0347, "step": 146260 }, { "epoch": 0.38, "learning_rate": 0.00024312705913458668, "loss": 0.021, "step": 146270 }, { "epoch": 0.38, "learning_rate": 0.00024312317091821525, "loss": 0.02, "step": 146280 }, { "epoch": 0.38, "learning_rate": 0.0002431192827018438, "loss": 0.0198, "step": 146290 }, { "epoch": 0.38, "learning_rate": 0.0002431153944854723, "loss": 0.0171, "step": 146300 }, { "epoch": 0.38, "learning_rate": 0.00024311150626910084, "loss": 0.019, "step": 146310 }, { "epoch": 0.38, "learning_rate": 0.00024310761805272939, "loss": 0.0218, "step": 146320 }, { "epoch": 0.38, "learning_rate": 0.00024310372983635793, "loss": 0.0185, "step": 146330 }, { "epoch": 0.38, "learning_rate": 0.00024309984161998644, "loss": 0.0225, "step": 146340 }, { "epoch": 0.38, "learning_rate": 0.00024309595340361498, "loss": 0.018, "step": 146350 }, { "epoch": 0.38, "learning_rate": 0.00024309206518724353, "loss": 0.0207, "step": 146360 }, { "epoch": 0.38, "learning_rate": 0.00024308817697087207, "loss": 0.0185, "step": 146370 }, { "epoch": 0.38, "learning_rate": 0.00024308428875450058, "loss": 0.0187, "step": 146380 }, { "epoch": 0.38, "learning_rate": 0.00024308040053812912, "loss": 0.0184, "step": 146390 }, { "epoch": 0.38, "learning_rate": 0.00024307651232175764, "loss": 0.0155, "step": 146400 }, { "epoch": 0.38, "learning_rate": 0.0002430726241053862, "loss": 0.0215, "step": 146410 }, { "epoch": 0.38, "learning_rate": 0.00024306873588901472, "loss": 0.0262, "step": 146420 }, { "epoch": 0.38, "learning_rate": 0.00024306484767264326, "loss": 0.0223, "step": 146430 }, { "epoch": 0.38, "learning_rate": 0.00024306095945627178, "loss": 0.0216, "step": 146440 }, { "epoch": 0.38, "learning_rate": 0.00024305707123990035, "loss": 0.0185, "step": 146450 }, { "epoch": 0.38, "learning_rate": 0.0002430531830235289, "loss": 0.0186, "step": 146460 }, { "epoch": 0.38, "learning_rate": 0.0002430492948071574, "loss": 0.0198, "step": 146470 }, { "epoch": 0.38, "learning_rate": 0.00024304540659078592, "loss": 0.0189, "step": 146480 }, { "epoch": 0.38, "learning_rate": 0.00024304151837441449, "loss": 0.0186, "step": 146490 }, { "epoch": 0.38, "learning_rate": 0.00024303763015804303, "loss": 0.0213, "step": 146500 }, { "epoch": 0.38, "learning_rate": 0.00024303374194167154, "loss": 0.0164, "step": 146510 }, { "epoch": 0.38, "learning_rate": 0.00024302985372530008, "loss": 0.017, "step": 146520 }, { "epoch": 0.38, "learning_rate": 0.00024302596550892862, "loss": 0.0216, "step": 146530 }, { "epoch": 0.38, "learning_rate": 0.00024302207729255717, "loss": 0.0189, "step": 146540 }, { "epoch": 0.38, "learning_rate": 0.00024301818907618568, "loss": 0.0205, "step": 146550 }, { "epoch": 0.38, "learning_rate": 0.00024301430085981422, "loss": 0.0169, "step": 146560 }, { "epoch": 0.38, "learning_rate": 0.00024301041264344276, "loss": 0.0188, "step": 146570 }, { "epoch": 0.38, "learning_rate": 0.0002430065244270713, "loss": 0.0178, "step": 146580 }, { "epoch": 0.38, "learning_rate": 0.00024300263621069982, "loss": 0.019, "step": 146590 }, { "epoch": 0.38, "learning_rate": 0.00024299874799432836, "loss": 0.0183, "step": 146600 }, { "epoch": 0.38, "learning_rate": 0.00024299485977795693, "loss": 0.0206, "step": 146610 }, { "epoch": 0.38, "learning_rate": 0.00024299097156158545, "loss": 0.0173, "step": 146620 }, { "epoch": 0.38, "learning_rate": 0.00024298708334521396, "loss": 0.0171, "step": 146630 }, { "epoch": 0.38, "learning_rate": 0.0002429831951288425, "loss": 0.0196, "step": 146640 }, { "epoch": 0.38, "learning_rate": 0.00024297930691247102, "loss": 0.0186, "step": 146650 }, { "epoch": 0.38, "learning_rate": 0.00024297541869609958, "loss": 0.0232, "step": 146660 }, { "epoch": 0.38, "learning_rate": 0.00024297153047972813, "loss": 0.0239, "step": 146670 }, { "epoch": 0.38, "learning_rate": 0.00024296764226335664, "loss": 0.0182, "step": 146680 }, { "epoch": 0.38, "learning_rate": 0.00024296375404698518, "loss": 0.0298, "step": 146690 }, { "epoch": 0.38, "learning_rate": 0.00024295986583061372, "loss": 0.0183, "step": 146700 }, { "epoch": 0.38, "learning_rate": 0.00024295597761424227, "loss": 0.0175, "step": 146710 }, { "epoch": 0.38, "learning_rate": 0.00024295208939787078, "loss": 0.025, "step": 146720 }, { "epoch": 0.38, "learning_rate": 0.00024294820118149932, "loss": 0.0187, "step": 146730 }, { "epoch": 0.38, "learning_rate": 0.00024294431296512786, "loss": 0.0251, "step": 146740 }, { "epoch": 0.38, "learning_rate": 0.0002429404247487564, "loss": 0.0278, "step": 146750 }, { "epoch": 0.38, "learning_rate": 0.00024293653653238492, "loss": 0.023, "step": 146760 }, { "epoch": 0.38, "learning_rate": 0.00024293264831601346, "loss": 0.018, "step": 146770 }, { "epoch": 0.38, "learning_rate": 0.00024292876009964203, "loss": 0.0179, "step": 146780 }, { "epoch": 0.38, "learning_rate": 0.00024292487188327054, "loss": 0.0224, "step": 146790 }, { "epoch": 0.38, "learning_rate": 0.00024292098366689906, "loss": 0.0198, "step": 146800 }, { "epoch": 0.38, "learning_rate": 0.0002429170954505276, "loss": 0.0178, "step": 146810 }, { "epoch": 0.38, "learning_rate": 0.00024291320723415617, "loss": 0.0212, "step": 146820 }, { "epoch": 0.38, "learning_rate": 0.00024290931901778468, "loss": 0.0179, "step": 146830 }, { "epoch": 0.38, "learning_rate": 0.00024290543080141323, "loss": 0.0164, "step": 146840 }, { "epoch": 0.38, "learning_rate": 0.00024290154258504174, "loss": 0.0181, "step": 146850 }, { "epoch": 0.38, "learning_rate": 0.0002428976543686703, "loss": 0.0171, "step": 146860 }, { "epoch": 0.38, "learning_rate": 0.00024289376615229882, "loss": 0.0169, "step": 146870 }, { "epoch": 0.38, "learning_rate": 0.00024288987793592737, "loss": 0.0197, "step": 146880 }, { "epoch": 0.38, "learning_rate": 0.00024288598971955588, "loss": 0.0194, "step": 146890 }, { "epoch": 0.38, "learning_rate": 0.00024288210150318442, "loss": 0.017, "step": 146900 }, { "epoch": 0.38, "learning_rate": 0.00024287821328681296, "loss": 0.0176, "step": 146910 }, { "epoch": 0.38, "learning_rate": 0.0002428743250704415, "loss": 0.016, "step": 146920 }, { "epoch": 0.38, "learning_rate": 0.00024287043685407002, "loss": 0.0171, "step": 146930 }, { "epoch": 0.38, "learning_rate": 0.00024286654863769856, "loss": 0.0226, "step": 146940 }, { "epoch": 0.38, "learning_rate": 0.0002428626604213271, "loss": 0.021, "step": 146950 }, { "epoch": 0.38, "learning_rate": 0.00024285877220495564, "loss": 0.0215, "step": 146960 }, { "epoch": 0.38, "learning_rate": 0.00024285488398858416, "loss": 0.0211, "step": 146970 }, { "epoch": 0.38, "learning_rate": 0.0002428509957722127, "loss": 0.0181, "step": 146980 }, { "epoch": 0.38, "learning_rate": 0.00024284710755584127, "loss": 0.0173, "step": 146990 }, { "epoch": 0.38, "learning_rate": 0.00024284321933946978, "loss": 0.0228, "step": 147000 }, { "epoch": 0.38, "eval_cer": 0.8817726681698768, "eval_loss": 0.013879619538784027, "eval_runtime": 107.3335, "eval_samples_per_second": 18.634, "eval_steps_per_second": 4.658, "step": 147000 }, { "epoch": 0.38, "learning_rate": 0.00024283933112309833, "loss": 0.0175, "step": 147010 }, { "epoch": 0.38, "learning_rate": 0.00024283544290672684, "loss": 0.0203, "step": 147020 }, { "epoch": 0.38, "learning_rate": 0.0002428315546903554, "loss": 0.0163, "step": 147030 }, { "epoch": 0.38, "learning_rate": 0.00024282766647398392, "loss": 0.0183, "step": 147040 }, { "epoch": 0.38, "learning_rate": 0.00024282377825761246, "loss": 0.0199, "step": 147050 }, { "epoch": 0.38, "learning_rate": 0.00024281989004124098, "loss": 0.0171, "step": 147060 }, { "epoch": 0.38, "learning_rate": 0.00024281600182486955, "loss": 0.0255, "step": 147070 }, { "epoch": 0.38, "learning_rate": 0.00024281211360849806, "loss": 0.0162, "step": 147080 }, { "epoch": 0.38, "learning_rate": 0.0002428082253921266, "loss": 0.0153, "step": 147090 }, { "epoch": 0.38, "learning_rate": 0.00024280433717575512, "loss": 0.0172, "step": 147100 }, { "epoch": 0.38, "learning_rate": 0.0002428004489593837, "loss": 0.0194, "step": 147110 }, { "epoch": 0.38, "learning_rate": 0.0002427965607430122, "loss": 0.0189, "step": 147120 }, { "epoch": 0.38, "learning_rate": 0.00024279267252664074, "loss": 0.0208, "step": 147130 }, { "epoch": 0.38, "learning_rate": 0.00024278878431026926, "loss": 0.0163, "step": 147140 }, { "epoch": 0.38, "learning_rate": 0.0002427848960938978, "loss": 0.0222, "step": 147150 }, { "epoch": 0.38, "learning_rate": 0.00024278100787752637, "loss": 0.0192, "step": 147160 }, { "epoch": 0.38, "learning_rate": 0.00024277711966115488, "loss": 0.0219, "step": 147170 }, { "epoch": 0.38, "learning_rate": 0.00024277323144478342, "loss": 0.0223, "step": 147180 }, { "epoch": 0.38, "learning_rate": 0.00024276934322841194, "loss": 0.0221, "step": 147190 }, { "epoch": 0.38, "learning_rate": 0.0002427654550120405, "loss": 0.0149, "step": 147200 }, { "epoch": 0.38, "learning_rate": 0.00024276156679566902, "loss": 0.0185, "step": 147210 }, { "epoch": 0.38, "learning_rate": 0.00024275767857929756, "loss": 0.0203, "step": 147220 }, { "epoch": 0.38, "learning_rate": 0.00024275379036292608, "loss": 0.021, "step": 147230 }, { "epoch": 0.38, "learning_rate": 0.00024274990214655465, "loss": 0.022, "step": 147240 }, { "epoch": 0.38, "learning_rate": 0.00024274601393018316, "loss": 0.0204, "step": 147250 }, { "epoch": 0.38, "learning_rate": 0.0002427421257138117, "loss": 0.0228, "step": 147260 }, { "epoch": 0.38, "learning_rate": 0.00024273823749744022, "loss": 0.0194, "step": 147270 }, { "epoch": 0.38, "learning_rate": 0.0002427343492810688, "loss": 0.0245, "step": 147280 }, { "epoch": 0.38, "learning_rate": 0.0002427304610646973, "loss": 0.0195, "step": 147290 }, { "epoch": 0.38, "learning_rate": 0.00024272657284832584, "loss": 0.0183, "step": 147300 }, { "epoch": 0.38, "learning_rate": 0.00024272268463195436, "loss": 0.0229, "step": 147310 }, { "epoch": 0.38, "learning_rate": 0.00024271879641558293, "loss": 0.0195, "step": 147320 }, { "epoch": 0.38, "learning_rate": 0.00024271490819921147, "loss": 0.0189, "step": 147330 }, { "epoch": 0.38, "learning_rate": 0.00024271101998283998, "loss": 0.0139, "step": 147340 }, { "epoch": 0.38, "learning_rate": 0.0002427071317664685, "loss": 0.0235, "step": 147350 }, { "epoch": 0.38, "learning_rate": 0.00024270324355009707, "loss": 0.0226, "step": 147360 }, { "epoch": 0.38, "learning_rate": 0.0002426993553337256, "loss": 0.0192, "step": 147370 }, { "epoch": 0.38, "learning_rate": 0.00024269546711735412, "loss": 0.0169, "step": 147380 }, { "epoch": 0.38, "learning_rate": 0.00024269157890098266, "loss": 0.0218, "step": 147390 }, { "epoch": 0.38, "learning_rate": 0.00024268769068461118, "loss": 0.0174, "step": 147400 }, { "epoch": 0.38, "learning_rate": 0.00024268380246823975, "loss": 0.0222, "step": 147410 }, { "epoch": 0.38, "learning_rate": 0.00024267991425186826, "loss": 0.0237, "step": 147420 }, { "epoch": 0.38, "learning_rate": 0.0002426760260354968, "loss": 0.0199, "step": 147430 }, { "epoch": 0.38, "learning_rate": 0.00024267213781912532, "loss": 0.0204, "step": 147440 }, { "epoch": 0.38, "learning_rate": 0.00024266824960275389, "loss": 0.0205, "step": 147450 }, { "epoch": 0.38, "learning_rate": 0.0002426643613863824, "loss": 0.0197, "step": 147460 }, { "epoch": 0.38, "learning_rate": 0.00024266047317001094, "loss": 0.0168, "step": 147470 }, { "epoch": 0.38, "learning_rate": 0.00024265658495363946, "loss": 0.0196, "step": 147480 }, { "epoch": 0.38, "learning_rate": 0.00024265269673726803, "loss": 0.0188, "step": 147490 }, { "epoch": 0.38, "learning_rate": 0.00024264880852089657, "loss": 0.016, "step": 147500 }, { "epoch": 0.38, "learning_rate": 0.00024264492030452508, "loss": 0.0176, "step": 147510 }, { "epoch": 0.38, "learning_rate": 0.0002426410320881536, "loss": 0.0207, "step": 147520 }, { "epoch": 0.38, "learning_rate": 0.00024263714387178216, "loss": 0.019, "step": 147530 }, { "epoch": 0.38, "learning_rate": 0.0002426332556554107, "loss": 0.0171, "step": 147540 }, { "epoch": 0.38, "learning_rate": 0.00024262936743903922, "loss": 0.0197, "step": 147550 }, { "epoch": 0.38, "learning_rate": 0.00024262547922266776, "loss": 0.0219, "step": 147560 }, { "epoch": 0.38, "learning_rate": 0.0002426215910062963, "loss": 0.0235, "step": 147570 }, { "epoch": 0.38, "learning_rate": 0.00024261770278992485, "loss": 0.0182, "step": 147580 }, { "epoch": 0.38, "learning_rate": 0.00024261381457355336, "loss": 0.0196, "step": 147590 }, { "epoch": 0.38, "learning_rate": 0.0002426099263571819, "loss": 0.0189, "step": 147600 }, { "epoch": 0.38, "learning_rate": 0.00024260603814081044, "loss": 0.0192, "step": 147610 }, { "epoch": 0.38, "learning_rate": 0.00024260214992443899, "loss": 0.0171, "step": 147620 }, { "epoch": 0.38, "learning_rate": 0.0002425982617080675, "loss": 0.0167, "step": 147630 }, { "epoch": 0.38, "learning_rate": 0.00024259437349169604, "loss": 0.0154, "step": 147640 }, { "epoch": 0.38, "learning_rate": 0.00024259048527532456, "loss": 0.0214, "step": 147650 }, { "epoch": 0.38, "learning_rate": 0.00024258659705895312, "loss": 0.0229, "step": 147660 }, { "epoch": 0.38, "learning_rate": 0.00024258270884258164, "loss": 0.0196, "step": 147670 }, { "epoch": 0.38, "learning_rate": 0.00024257882062621018, "loss": 0.0181, "step": 147680 }, { "epoch": 0.38, "learning_rate": 0.0002425749324098387, "loss": 0.018, "step": 147690 }, { "epoch": 0.38, "learning_rate": 0.00024257104419346726, "loss": 0.0187, "step": 147700 }, { "epoch": 0.38, "learning_rate": 0.0002425671559770958, "loss": 0.0196, "step": 147710 }, { "epoch": 0.38, "learning_rate": 0.00024256326776072432, "loss": 0.0192, "step": 147720 }, { "epoch": 0.38, "learning_rate": 0.00024255937954435286, "loss": 0.016, "step": 147730 }, { "epoch": 0.38, "learning_rate": 0.0002425554913279814, "loss": 0.0184, "step": 147740 }, { "epoch": 0.38, "learning_rate": 0.00024255160311160995, "loss": 0.0241, "step": 147750 }, { "epoch": 0.38, "learning_rate": 0.00024254771489523846, "loss": 0.0151, "step": 147760 }, { "epoch": 0.38, "learning_rate": 0.000242543826678867, "loss": 0.0191, "step": 147770 }, { "epoch": 0.38, "learning_rate": 0.00024253993846249554, "loss": 0.0155, "step": 147780 }, { "epoch": 0.38, "learning_rate": 0.00024253605024612408, "loss": 0.0166, "step": 147790 }, { "epoch": 0.38, "learning_rate": 0.0002425321620297526, "loss": 0.0171, "step": 147800 }, { "epoch": 0.38, "learning_rate": 0.00024252827381338114, "loss": 0.0203, "step": 147810 }, { "epoch": 0.38, "learning_rate": 0.00024252438559700968, "loss": 0.0194, "step": 147820 }, { "epoch": 0.38, "learning_rate": 0.00024252049738063822, "loss": 0.0197, "step": 147830 }, { "epoch": 0.38, "learning_rate": 0.00024251660916426674, "loss": 0.0192, "step": 147840 }, { "epoch": 0.38, "learning_rate": 0.00024251272094789528, "loss": 0.0207, "step": 147850 }, { "epoch": 0.38, "learning_rate": 0.00024250883273152385, "loss": 0.0198, "step": 147860 }, { "epoch": 0.38, "learning_rate": 0.00024250494451515236, "loss": 0.0177, "step": 147870 }, { "epoch": 0.38, "learning_rate": 0.0002425010562987809, "loss": 0.0227, "step": 147880 }, { "epoch": 0.38, "learning_rate": 0.00024249716808240942, "loss": 0.0198, "step": 147890 }, { "epoch": 0.38, "learning_rate": 0.00024249327986603796, "loss": 0.0229, "step": 147900 }, { "epoch": 0.38, "learning_rate": 0.0002424893916496665, "loss": 0.0161, "step": 147910 }, { "epoch": 0.38, "learning_rate": 0.00024248550343329504, "loss": 0.0201, "step": 147920 }, { "epoch": 0.38, "learning_rate": 0.00024248161521692356, "loss": 0.024, "step": 147930 }, { "epoch": 0.38, "learning_rate": 0.0002424777270005521, "loss": 0.0166, "step": 147940 }, { "epoch": 0.38, "learning_rate": 0.00024247383878418064, "loss": 0.0185, "step": 147950 }, { "epoch": 0.38, "learning_rate": 0.00024246995056780918, "loss": 0.0204, "step": 147960 }, { "epoch": 0.38, "learning_rate": 0.0002424660623514377, "loss": 0.0138, "step": 147970 }, { "epoch": 0.38, "learning_rate": 0.00024246217413506624, "loss": 0.0176, "step": 147980 }, { "epoch": 0.38, "learning_rate": 0.00024245828591869478, "loss": 0.0167, "step": 147990 }, { "epoch": 0.38, "learning_rate": 0.00024245439770232332, "loss": 0.0176, "step": 148000 }, { "epoch": 0.38, "eval_cer": 0.881782465628416, "eval_loss": 0.013744070194661617, "eval_runtime": 107.4219, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.655, "step": 148000 }, { "epoch": 0.38, "learning_rate": 0.00024245050948595184, "loss": 0.0171, "step": 148010 }, { "epoch": 0.38, "learning_rate": 0.00024244662126958038, "loss": 0.0143, "step": 148020 }, { "epoch": 0.38, "learning_rate": 0.00024244273305320895, "loss": 0.0181, "step": 148030 }, { "epoch": 0.38, "learning_rate": 0.00024243884483683746, "loss": 0.0167, "step": 148040 }, { "epoch": 0.38, "learning_rate": 0.000242434956620466, "loss": 0.0174, "step": 148050 }, { "epoch": 0.38, "learning_rate": 0.00024243106840409452, "loss": 0.0236, "step": 148060 }, { "epoch": 0.38, "learning_rate": 0.0002424271801877231, "loss": 0.0184, "step": 148070 }, { "epoch": 0.38, "learning_rate": 0.0002424232919713516, "loss": 0.0193, "step": 148080 }, { "epoch": 0.38, "learning_rate": 0.00024241940375498014, "loss": 0.0216, "step": 148090 }, { "epoch": 0.38, "learning_rate": 0.00024241551553860866, "loss": 0.021, "step": 148100 }, { "epoch": 0.38, "learning_rate": 0.00024241162732223723, "loss": 0.0228, "step": 148110 }, { "epoch": 0.38, "learning_rate": 0.00024240773910586574, "loss": 0.0188, "step": 148120 }, { "epoch": 0.38, "learning_rate": 0.00024240385088949428, "loss": 0.0199, "step": 148130 }, { "epoch": 0.38, "learning_rate": 0.0002423999626731228, "loss": 0.0226, "step": 148140 }, { "epoch": 0.38, "learning_rate": 0.00024239607445675134, "loss": 0.0202, "step": 148150 }, { "epoch": 0.38, "learning_rate": 0.00024239218624037988, "loss": 0.0192, "step": 148160 }, { "epoch": 0.38, "learning_rate": 0.00024238829802400842, "loss": 0.0168, "step": 148170 }, { "epoch": 0.38, "learning_rate": 0.00024238440980763694, "loss": 0.019, "step": 148180 }, { "epoch": 0.38, "learning_rate": 0.00024238052159126548, "loss": 0.0228, "step": 148190 }, { "epoch": 0.38, "learning_rate": 0.00024237663337489405, "loss": 0.0206, "step": 148200 }, { "epoch": 0.38, "learning_rate": 0.00024237274515852256, "loss": 0.0192, "step": 148210 }, { "epoch": 0.38, "learning_rate": 0.00024236885694215108, "loss": 0.0248, "step": 148220 }, { "epoch": 0.38, "learning_rate": 0.00024236496872577962, "loss": 0.025, "step": 148230 }, { "epoch": 0.38, "learning_rate": 0.0002423610805094082, "loss": 0.0178, "step": 148240 }, { "epoch": 0.38, "learning_rate": 0.0002423571922930367, "loss": 0.0205, "step": 148250 }, { "epoch": 0.38, "learning_rate": 0.00024235330407666524, "loss": 0.0227, "step": 148260 }, { "epoch": 0.38, "learning_rate": 0.00024234941586029376, "loss": 0.0205, "step": 148270 }, { "epoch": 0.38, "learning_rate": 0.00024234552764392233, "loss": 0.0186, "step": 148280 }, { "epoch": 0.38, "learning_rate": 0.00024234163942755084, "loss": 0.0214, "step": 148290 }, { "epoch": 0.38, "learning_rate": 0.00024233775121117938, "loss": 0.0202, "step": 148300 }, { "epoch": 0.38, "learning_rate": 0.0002423338629948079, "loss": 0.0185, "step": 148310 }, { "epoch": 0.38, "learning_rate": 0.00024232997477843647, "loss": 0.0241, "step": 148320 }, { "epoch": 0.38, "learning_rate": 0.00024232608656206498, "loss": 0.0224, "step": 148330 }, { "epoch": 0.38, "learning_rate": 0.00024232219834569352, "loss": 0.0219, "step": 148340 }, { "epoch": 0.38, "learning_rate": 0.00024231831012932204, "loss": 0.0234, "step": 148350 }, { "epoch": 0.38, "learning_rate": 0.0002423144219129506, "loss": 0.023, "step": 148360 }, { "epoch": 0.38, "learning_rate": 0.00024231053369657915, "loss": 0.0174, "step": 148370 }, { "epoch": 0.38, "learning_rate": 0.00024230664548020766, "loss": 0.0254, "step": 148380 }, { "epoch": 0.38, "learning_rate": 0.00024230275726383618, "loss": 0.0168, "step": 148390 }, { "epoch": 0.38, "learning_rate": 0.00024229886904746472, "loss": 0.0212, "step": 148400 }, { "epoch": 0.38, "learning_rate": 0.0002422949808310933, "loss": 0.023, "step": 148410 }, { "epoch": 0.38, "learning_rate": 0.0002422910926147218, "loss": 0.02, "step": 148420 }, { "epoch": 0.38, "learning_rate": 0.00024228720439835034, "loss": 0.0161, "step": 148430 }, { "epoch": 0.38, "learning_rate": 0.00024228331618197886, "loss": 0.0205, "step": 148440 }, { "epoch": 0.38, "learning_rate": 0.00024227942796560743, "loss": 0.0217, "step": 148450 }, { "epoch": 0.38, "learning_rate": 0.00024227553974923594, "loss": 0.0225, "step": 148460 }, { "epoch": 0.38, "learning_rate": 0.00024227165153286448, "loss": 0.0183, "step": 148470 }, { "epoch": 0.38, "learning_rate": 0.000242267763316493, "loss": 0.0182, "step": 148480 }, { "epoch": 0.38, "learning_rate": 0.00024226387510012157, "loss": 0.0218, "step": 148490 }, { "epoch": 0.38, "learning_rate": 0.00024225998688375008, "loss": 0.0204, "step": 148500 }, { "epoch": 0.38, "learning_rate": 0.00024225609866737862, "loss": 0.019, "step": 148510 }, { "epoch": 0.38, "learning_rate": 0.00024225221045100714, "loss": 0.0203, "step": 148520 }, { "epoch": 0.39, "learning_rate": 0.0002422483222346357, "loss": 0.0201, "step": 148530 }, { "epoch": 0.39, "learning_rate": 0.00024224443401826422, "loss": 0.0154, "step": 148540 }, { "epoch": 0.39, "learning_rate": 0.00024224054580189276, "loss": 0.0182, "step": 148550 }, { "epoch": 0.39, "learning_rate": 0.00024223665758552128, "loss": 0.022, "step": 148560 }, { "epoch": 0.39, "learning_rate": 0.00024223276936914984, "loss": 0.0198, "step": 148570 }, { "epoch": 0.39, "learning_rate": 0.00024222888115277839, "loss": 0.0213, "step": 148580 }, { "epoch": 0.39, "learning_rate": 0.0002422249929364069, "loss": 0.0234, "step": 148590 }, { "epoch": 0.39, "learning_rate": 0.00024222110472003544, "loss": 0.0174, "step": 148600 }, { "epoch": 0.39, "learning_rate": 0.00024221721650366398, "loss": 0.018, "step": 148610 }, { "epoch": 0.39, "learning_rate": 0.00024221332828729253, "loss": 0.0184, "step": 148620 }, { "epoch": 0.39, "learning_rate": 0.00024220944007092104, "loss": 0.0233, "step": 148630 }, { "epoch": 0.39, "learning_rate": 0.00024220555185454958, "loss": 0.0187, "step": 148640 }, { "epoch": 0.39, "learning_rate": 0.0002422016636381781, "loss": 0.0177, "step": 148650 }, { "epoch": 0.39, "learning_rate": 0.00024219777542180667, "loss": 0.02, "step": 148660 }, { "epoch": 0.39, "learning_rate": 0.00024219388720543518, "loss": 0.0184, "step": 148670 }, { "epoch": 0.39, "learning_rate": 0.00024218999898906372, "loss": 0.0229, "step": 148680 }, { "epoch": 0.39, "learning_rate": 0.00024218611077269224, "loss": 0.0194, "step": 148690 }, { "epoch": 0.39, "learning_rate": 0.0002421822225563208, "loss": 0.0246, "step": 148700 }, { "epoch": 0.39, "learning_rate": 0.00024217833433994932, "loss": 0.0209, "step": 148710 }, { "epoch": 0.39, "learning_rate": 0.00024217444612357786, "loss": 0.019, "step": 148720 }, { "epoch": 0.39, "learning_rate": 0.00024217055790720638, "loss": 0.0242, "step": 148730 }, { "epoch": 0.39, "learning_rate": 0.00024216666969083494, "loss": 0.0198, "step": 148740 }, { "epoch": 0.39, "learning_rate": 0.00024216278147446349, "loss": 0.0239, "step": 148750 }, { "epoch": 0.39, "learning_rate": 0.000242158893258092, "loss": 0.0196, "step": 148760 }, { "epoch": 0.39, "learning_rate": 0.00024215500504172054, "loss": 0.0171, "step": 148770 }, { "epoch": 0.39, "learning_rate": 0.00024215111682534908, "loss": 0.0198, "step": 148780 }, { "epoch": 0.39, "learning_rate": 0.00024214722860897763, "loss": 0.0196, "step": 148790 }, { "epoch": 0.39, "learning_rate": 0.00024214334039260614, "loss": 0.0163, "step": 148800 }, { "epoch": 0.39, "learning_rate": 0.00024213945217623468, "loss": 0.0217, "step": 148810 }, { "epoch": 0.39, "learning_rate": 0.00024213556395986322, "loss": 0.0201, "step": 148820 }, { "epoch": 0.39, "learning_rate": 0.00024213167574349176, "loss": 0.0173, "step": 148830 }, { "epoch": 0.39, "learning_rate": 0.00024212778752712028, "loss": 0.0146, "step": 148840 }, { "epoch": 0.39, "learning_rate": 0.00024212389931074882, "loss": 0.0231, "step": 148850 }, { "epoch": 0.39, "learning_rate": 0.00024212001109437736, "loss": 0.0252, "step": 148860 }, { "epoch": 0.39, "learning_rate": 0.0002421161228780059, "loss": 0.0196, "step": 148870 }, { "epoch": 0.39, "learning_rate": 0.00024211223466163442, "loss": 0.0187, "step": 148880 }, { "epoch": 0.39, "learning_rate": 0.00024210834644526296, "loss": 0.0165, "step": 148890 }, { "epoch": 0.39, "learning_rate": 0.00024210445822889147, "loss": 0.0169, "step": 148900 }, { "epoch": 0.39, "learning_rate": 0.00024210057001252004, "loss": 0.0169, "step": 148910 }, { "epoch": 0.39, "learning_rate": 0.00024209668179614859, "loss": 0.0189, "step": 148920 }, { "epoch": 0.39, "learning_rate": 0.0002420927935797771, "loss": 0.0217, "step": 148930 }, { "epoch": 0.39, "learning_rate": 0.00024208890536340561, "loss": 0.0185, "step": 148940 }, { "epoch": 0.39, "learning_rate": 0.00024208501714703418, "loss": 0.0166, "step": 148950 }, { "epoch": 0.39, "learning_rate": 0.00024208112893066272, "loss": 0.0183, "step": 148960 }, { "epoch": 0.39, "learning_rate": 0.00024207724071429124, "loss": 0.0195, "step": 148970 }, { "epoch": 0.39, "learning_rate": 0.00024207335249791978, "loss": 0.0149, "step": 148980 }, { "epoch": 0.39, "learning_rate": 0.00024206946428154832, "loss": 0.0185, "step": 148990 }, { "epoch": 0.39, "learning_rate": 0.00024206557606517686, "loss": 0.0198, "step": 149000 }, { "epoch": 0.39, "eval_cer": 0.8817642703482717, "eval_loss": 0.013767913915216923, "eval_runtime": 107.1271, "eval_samples_per_second": 18.669, "eval_steps_per_second": 4.667, "step": 149000 }, { "epoch": 0.39, "learning_rate": 0.00024206168784880538, "loss": 0.0155, "step": 149010 }, { "epoch": 0.39, "learning_rate": 0.00024205779963243392, "loss": 0.0183, "step": 149020 }, { "epoch": 0.39, "learning_rate": 0.00024205391141606246, "loss": 0.0186, "step": 149030 }, { "epoch": 0.39, "learning_rate": 0.000242050023199691, "loss": 0.0151, "step": 149040 }, { "epoch": 0.39, "learning_rate": 0.00024204613498331952, "loss": 0.0163, "step": 149050 }, { "epoch": 0.39, "learning_rate": 0.00024204224676694806, "loss": 0.025, "step": 149060 }, { "epoch": 0.39, "learning_rate": 0.00024203835855057663, "loss": 0.0172, "step": 149070 }, { "epoch": 0.39, "learning_rate": 0.00024203447033420514, "loss": 0.0188, "step": 149080 }, { "epoch": 0.39, "learning_rate": 0.00024203058211783368, "loss": 0.0281, "step": 149090 }, { "epoch": 0.39, "learning_rate": 0.0002420266939014622, "loss": 0.0243, "step": 149100 }, { "epoch": 0.39, "learning_rate": 0.00024202280568509077, "loss": 0.0232, "step": 149110 }, { "epoch": 0.39, "learning_rate": 0.00024201891746871928, "loss": 0.017, "step": 149120 }, { "epoch": 0.39, "learning_rate": 0.00024201502925234782, "loss": 0.0256, "step": 149130 }, { "epoch": 0.39, "learning_rate": 0.00024201114103597634, "loss": 0.0198, "step": 149140 }, { "epoch": 0.39, "learning_rate": 0.00024200725281960488, "loss": 0.0237, "step": 149150 }, { "epoch": 0.39, "learning_rate": 0.00024200336460323342, "loss": 0.0184, "step": 149160 }, { "epoch": 0.39, "learning_rate": 0.00024199947638686196, "loss": 0.0187, "step": 149170 }, { "epoch": 0.39, "learning_rate": 0.00024199558817049048, "loss": 0.0193, "step": 149180 }, { "epoch": 0.39, "learning_rate": 0.00024199169995411902, "loss": 0.017, "step": 149190 }, { "epoch": 0.39, "learning_rate": 0.00024198781173774756, "loss": 0.0265, "step": 149200 }, { "epoch": 0.39, "learning_rate": 0.0002419839235213761, "loss": 0.022, "step": 149210 }, { "epoch": 0.39, "learning_rate": 0.00024198003530500462, "loss": 0.0174, "step": 149220 }, { "epoch": 0.39, "learning_rate": 0.00024197614708863316, "loss": 0.016, "step": 149230 }, { "epoch": 0.39, "learning_rate": 0.00024197225887226173, "loss": 0.0184, "step": 149240 }, { "epoch": 0.39, "learning_rate": 0.00024196837065589024, "loss": 0.0168, "step": 149250 }, { "epoch": 0.39, "learning_rate": 0.00024196448243951876, "loss": 0.0184, "step": 149260 }, { "epoch": 0.39, "learning_rate": 0.0002419605942231473, "loss": 0.0174, "step": 149270 }, { "epoch": 0.39, "learning_rate": 0.00024195670600677587, "loss": 0.0175, "step": 149280 }, { "epoch": 0.39, "learning_rate": 0.00024195281779040438, "loss": 0.0159, "step": 149290 }, { "epoch": 0.39, "learning_rate": 0.00024194892957403292, "loss": 0.0197, "step": 149300 }, { "epoch": 0.39, "learning_rate": 0.00024194504135766144, "loss": 0.0186, "step": 149310 }, { "epoch": 0.39, "learning_rate": 0.00024194115314129, "loss": 0.0207, "step": 149320 }, { "epoch": 0.39, "learning_rate": 0.00024193726492491852, "loss": 0.0241, "step": 149330 }, { "epoch": 0.39, "learning_rate": 0.00024193337670854706, "loss": 0.0191, "step": 149340 }, { "epoch": 0.39, "learning_rate": 0.00024192948849217558, "loss": 0.017, "step": 149350 }, { "epoch": 0.39, "learning_rate": 0.00024192560027580415, "loss": 0.0164, "step": 149360 }, { "epoch": 0.39, "learning_rate": 0.00024192171205943266, "loss": 0.02, "step": 149370 }, { "epoch": 0.39, "learning_rate": 0.0002419178238430612, "loss": 0.0229, "step": 149380 }, { "epoch": 0.39, "learning_rate": 0.00024191393562668972, "loss": 0.0206, "step": 149390 }, { "epoch": 0.39, "learning_rate": 0.00024191004741031826, "loss": 0.0176, "step": 149400 }, { "epoch": 0.39, "learning_rate": 0.0002419061591939468, "loss": 0.0216, "step": 149410 }, { "epoch": 0.39, "learning_rate": 0.00024190227097757534, "loss": 0.0219, "step": 149420 }, { "epoch": 0.39, "learning_rate": 0.00024189838276120386, "loss": 0.0126, "step": 149430 }, { "epoch": 0.39, "learning_rate": 0.0002418944945448324, "loss": 0.0185, "step": 149440 }, { "epoch": 0.39, "learning_rate": 0.00024189060632846097, "loss": 0.0169, "step": 149450 }, { "epoch": 0.39, "learning_rate": 0.00024188671811208948, "loss": 0.0228, "step": 149460 }, { "epoch": 0.39, "learning_rate": 0.00024188282989571802, "loss": 0.0179, "step": 149470 }, { "epoch": 0.39, "learning_rate": 0.00024187894167934654, "loss": 0.0179, "step": 149480 }, { "epoch": 0.39, "learning_rate": 0.0002418750534629751, "loss": 0.0213, "step": 149490 }, { "epoch": 0.39, "learning_rate": 0.00024187116524660362, "loss": 0.0188, "step": 149500 }, { "epoch": 0.39, "learning_rate": 0.00024186727703023216, "loss": 0.0229, "step": 149510 }, { "epoch": 0.39, "learning_rate": 0.00024186338881386068, "loss": 0.018, "step": 149520 }, { "epoch": 0.39, "learning_rate": 0.00024185950059748925, "loss": 0.0181, "step": 149530 }, { "epoch": 0.39, "learning_rate": 0.00024185561238111776, "loss": 0.024, "step": 149540 }, { "epoch": 0.39, "learning_rate": 0.0002418517241647463, "loss": 0.0189, "step": 149550 }, { "epoch": 0.39, "learning_rate": 0.00024184783594837482, "loss": 0.0158, "step": 149560 }, { "epoch": 0.39, "learning_rate": 0.00024184394773200339, "loss": 0.0213, "step": 149570 }, { "epoch": 0.39, "learning_rate": 0.0002418400595156319, "loss": 0.017, "step": 149580 }, { "epoch": 0.39, "learning_rate": 0.00024183617129926044, "loss": 0.0161, "step": 149590 }, { "epoch": 0.39, "learning_rate": 0.00024183228308288896, "loss": 0.0158, "step": 149600 }, { "epoch": 0.39, "learning_rate": 0.0002418283948665175, "loss": 0.0202, "step": 149610 }, { "epoch": 0.39, "learning_rate": 0.00024182450665014607, "loss": 0.0202, "step": 149620 }, { "epoch": 0.39, "learning_rate": 0.00024182061843377458, "loss": 0.0172, "step": 149630 }, { "epoch": 0.39, "learning_rate": 0.00024181673021740312, "loss": 0.0196, "step": 149640 }, { "epoch": 0.39, "learning_rate": 0.00024181284200103164, "loss": 0.0196, "step": 149650 }, { "epoch": 0.39, "learning_rate": 0.0002418089537846602, "loss": 0.018, "step": 149660 }, { "epoch": 0.39, "learning_rate": 0.00024180506556828872, "loss": 0.0191, "step": 149670 }, { "epoch": 0.39, "learning_rate": 0.00024180117735191726, "loss": 0.0201, "step": 149680 }, { "epoch": 0.39, "learning_rate": 0.00024179728913554578, "loss": 0.0196, "step": 149690 }, { "epoch": 0.39, "learning_rate": 0.00024179340091917435, "loss": 0.0182, "step": 149700 }, { "epoch": 0.39, "learning_rate": 0.00024178951270280286, "loss": 0.0198, "step": 149710 }, { "epoch": 0.39, "learning_rate": 0.0002417856244864314, "loss": 0.017, "step": 149720 }, { "epoch": 0.39, "learning_rate": 0.00024178173627005992, "loss": 0.0162, "step": 149730 }, { "epoch": 0.39, "learning_rate": 0.00024177784805368848, "loss": 0.0191, "step": 149740 }, { "epoch": 0.39, "learning_rate": 0.000241773959837317, "loss": 0.0194, "step": 149750 }, { "epoch": 0.39, "learning_rate": 0.00024177007162094554, "loss": 0.0212, "step": 149760 }, { "epoch": 0.39, "learning_rate": 0.00024176618340457406, "loss": 0.0174, "step": 149770 }, { "epoch": 0.39, "learning_rate": 0.00024176229518820262, "loss": 0.0209, "step": 149780 }, { "epoch": 0.39, "learning_rate": 0.00024175840697183117, "loss": 0.0157, "step": 149790 }, { "epoch": 0.39, "learning_rate": 0.00024175451875545968, "loss": 0.0183, "step": 149800 }, { "epoch": 0.39, "learning_rate": 0.0002417506305390882, "loss": 0.0174, "step": 149810 }, { "epoch": 0.39, "learning_rate": 0.00024174674232271676, "loss": 0.019, "step": 149820 }, { "epoch": 0.39, "learning_rate": 0.0002417428541063453, "loss": 0.0222, "step": 149830 }, { "epoch": 0.39, "learning_rate": 0.00024173896588997382, "loss": 0.0179, "step": 149840 }, { "epoch": 0.39, "learning_rate": 0.00024173507767360236, "loss": 0.0152, "step": 149850 }, { "epoch": 0.39, "learning_rate": 0.00024173118945723088, "loss": 0.0192, "step": 149860 }, { "epoch": 0.39, "learning_rate": 0.00024172730124085944, "loss": 0.0188, "step": 149870 }, { "epoch": 0.39, "learning_rate": 0.00024172341302448796, "loss": 0.0205, "step": 149880 }, { "epoch": 0.39, "learning_rate": 0.0002417195248081165, "loss": 0.0219, "step": 149890 }, { "epoch": 0.39, "learning_rate": 0.00024171563659174502, "loss": 0.0183, "step": 149900 }, { "epoch": 0.39, "learning_rate": 0.00024171174837537358, "loss": 0.0199, "step": 149910 }, { "epoch": 0.39, "learning_rate": 0.0002417078601590021, "loss": 0.0219, "step": 149920 }, { "epoch": 0.39, "learning_rate": 0.00024170397194263064, "loss": 0.0151, "step": 149930 }, { "epoch": 0.39, "learning_rate": 0.00024170008372625915, "loss": 0.0218, "step": 149940 }, { "epoch": 0.39, "learning_rate": 0.00024169619550988772, "loss": 0.0186, "step": 149950 }, { "epoch": 0.39, "learning_rate": 0.00024169230729351627, "loss": 0.0194, "step": 149960 }, { "epoch": 0.39, "learning_rate": 0.00024168841907714478, "loss": 0.0216, "step": 149970 }, { "epoch": 0.39, "learning_rate": 0.0002416845308607733, "loss": 0.0188, "step": 149980 }, { "epoch": 0.39, "learning_rate": 0.00024168064264440186, "loss": 0.025, "step": 149990 }, { "epoch": 0.39, "learning_rate": 0.0002416767544280304, "loss": 0.0238, "step": 150000 }, { "epoch": 0.39, "eval_cer": 0.8817754674437451, "eval_loss": 0.013502559624612331, "eval_runtime": 107.4245, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.654, "step": 150000 }, { "epoch": 0.39, "learning_rate": 0.00024167286621165892, "loss": 0.0176, "step": 150010 }, { "epoch": 0.39, "learning_rate": 0.00024166897799528746, "loss": 0.0341, "step": 150020 }, { "epoch": 0.39, "learning_rate": 0.000241665089778916, "loss": 0.0205, "step": 150030 }, { "epoch": 0.39, "learning_rate": 0.00024166120156254454, "loss": 0.0226, "step": 150040 }, { "epoch": 0.39, "learning_rate": 0.00024165731334617306, "loss": 0.0161, "step": 150050 }, { "epoch": 0.39, "learning_rate": 0.0002416534251298016, "loss": 0.0308, "step": 150060 }, { "epoch": 0.39, "learning_rate": 0.00024164953691343014, "loss": 0.0184, "step": 150070 }, { "epoch": 0.39, "learning_rate": 0.00024164564869705868, "loss": 0.0197, "step": 150080 }, { "epoch": 0.39, "learning_rate": 0.0002416417604806872, "loss": 0.0215, "step": 150090 }, { "epoch": 0.39, "learning_rate": 0.00024163787226431574, "loss": 0.0169, "step": 150100 }, { "epoch": 0.39, "learning_rate": 0.00024163398404794425, "loss": 0.0251, "step": 150110 }, { "epoch": 0.39, "learning_rate": 0.00024163009583157282, "loss": 0.0158, "step": 150120 }, { "epoch": 0.39, "learning_rate": 0.00024162620761520134, "loss": 0.0179, "step": 150130 }, { "epoch": 0.39, "learning_rate": 0.00024162231939882988, "loss": 0.0196, "step": 150140 }, { "epoch": 0.39, "learning_rate": 0.0002416184311824584, "loss": 0.0172, "step": 150150 }, { "epoch": 0.39, "learning_rate": 0.00024161454296608696, "loss": 0.0204, "step": 150160 }, { "epoch": 0.39, "learning_rate": 0.0002416106547497155, "loss": 0.0239, "step": 150170 }, { "epoch": 0.39, "learning_rate": 0.00024160676653334402, "loss": 0.0191, "step": 150180 }, { "epoch": 0.39, "learning_rate": 0.00024160287831697256, "loss": 0.0205, "step": 150190 }, { "epoch": 0.39, "learning_rate": 0.0002415989901006011, "loss": 0.0229, "step": 150200 }, { "epoch": 0.39, "learning_rate": 0.00024159510188422964, "loss": 0.0258, "step": 150210 }, { "epoch": 0.39, "learning_rate": 0.00024159121366785816, "loss": 0.019, "step": 150220 }, { "epoch": 0.39, "learning_rate": 0.0002415873254514867, "loss": 0.0192, "step": 150230 }, { "epoch": 0.39, "learning_rate": 0.00024158343723511524, "loss": 0.0186, "step": 150240 }, { "epoch": 0.39, "learning_rate": 0.00024157954901874378, "loss": 0.0193, "step": 150250 }, { "epoch": 0.39, "learning_rate": 0.0002415756608023723, "loss": 0.0212, "step": 150260 }, { "epoch": 0.39, "learning_rate": 0.00024157177258600084, "loss": 0.0183, "step": 150270 }, { "epoch": 0.39, "learning_rate": 0.0002415678843696294, "loss": 0.0208, "step": 150280 }, { "epoch": 0.39, "learning_rate": 0.00024156399615325792, "loss": 0.0169, "step": 150290 }, { "epoch": 0.39, "learning_rate": 0.00024156010793688644, "loss": 0.0193, "step": 150300 }, { "epoch": 0.39, "learning_rate": 0.00024155621972051498, "loss": 0.017, "step": 150310 }, { "epoch": 0.39, "learning_rate": 0.00024155233150414355, "loss": 0.0218, "step": 150320 }, { "epoch": 0.39, "learning_rate": 0.00024154844328777206, "loss": 0.0178, "step": 150330 }, { "epoch": 0.39, "learning_rate": 0.0002415445550714006, "loss": 0.0217, "step": 150340 }, { "epoch": 0.39, "learning_rate": 0.00024154066685502912, "loss": 0.0173, "step": 150350 }, { "epoch": 0.39, "learning_rate": 0.00024153677863865766, "loss": 0.0231, "step": 150360 }, { "epoch": 0.39, "learning_rate": 0.0002415328904222862, "loss": 0.0197, "step": 150370 }, { "epoch": 0.39, "learning_rate": 0.00024152900220591474, "loss": 0.0168, "step": 150380 }, { "epoch": 0.39, "learning_rate": 0.00024152511398954326, "loss": 0.0149, "step": 150390 }, { "epoch": 0.39, "learning_rate": 0.0002415212257731718, "loss": 0.0185, "step": 150400 }, { "epoch": 0.39, "learning_rate": 0.00024151733755680034, "loss": 0.016, "step": 150410 }, { "epoch": 0.39, "learning_rate": 0.00024151344934042888, "loss": 0.0174, "step": 150420 }, { "epoch": 0.39, "learning_rate": 0.0002415095611240574, "loss": 0.0171, "step": 150430 }, { "epoch": 0.39, "learning_rate": 0.00024150567290768594, "loss": 0.0186, "step": 150440 }, { "epoch": 0.39, "learning_rate": 0.00024150178469131448, "loss": 0.0182, "step": 150450 }, { "epoch": 0.39, "learning_rate": 0.00024149789647494302, "loss": 0.0171, "step": 150460 }, { "epoch": 0.39, "learning_rate": 0.00024149400825857154, "loss": 0.0251, "step": 150470 }, { "epoch": 0.39, "learning_rate": 0.00024149012004220008, "loss": 0.0246, "step": 150480 }, { "epoch": 0.39, "learning_rate": 0.00024148623182582865, "loss": 0.0232, "step": 150490 }, { "epoch": 0.39, "learning_rate": 0.00024148234360945716, "loss": 0.0227, "step": 150500 }, { "epoch": 0.39, "learning_rate": 0.0002414784553930857, "loss": 0.0206, "step": 150510 }, { "epoch": 0.39, "learning_rate": 0.00024147456717671422, "loss": 0.0205, "step": 150520 }, { "epoch": 0.39, "learning_rate": 0.00024147067896034279, "loss": 0.0249, "step": 150530 }, { "epoch": 0.39, "learning_rate": 0.0002414667907439713, "loss": 0.0168, "step": 150540 }, { "epoch": 0.39, "learning_rate": 0.00024146290252759984, "loss": 0.0191, "step": 150550 }, { "epoch": 0.39, "learning_rate": 0.00024145901431122836, "loss": 0.0232, "step": 150560 }, { "epoch": 0.39, "learning_rate": 0.00024145512609485693, "loss": 0.0203, "step": 150570 }, { "epoch": 0.39, "learning_rate": 0.00024145123787848544, "loss": 0.015, "step": 150580 }, { "epoch": 0.39, "learning_rate": 0.00024144734966211398, "loss": 0.0203, "step": 150590 }, { "epoch": 0.39, "learning_rate": 0.0002414434614457425, "loss": 0.0185, "step": 150600 }, { "epoch": 0.39, "learning_rate": 0.00024143957322937104, "loss": 0.019, "step": 150610 }, { "epoch": 0.39, "learning_rate": 0.00024143568501299958, "loss": 0.0172, "step": 150620 }, { "epoch": 0.39, "learning_rate": 0.00024143179679662812, "loss": 0.0178, "step": 150630 }, { "epoch": 0.39, "learning_rate": 0.00024142790858025664, "loss": 0.0204, "step": 150640 }, { "epoch": 0.39, "learning_rate": 0.00024142402036388518, "loss": 0.0188, "step": 150650 }, { "epoch": 0.39, "learning_rate": 0.00024142013214751375, "loss": 0.0201, "step": 150660 }, { "epoch": 0.39, "learning_rate": 0.00024141624393114226, "loss": 0.0197, "step": 150670 }, { "epoch": 0.39, "learning_rate": 0.0002414123557147708, "loss": 0.0191, "step": 150680 }, { "epoch": 0.39, "learning_rate": 0.00024140846749839932, "loss": 0.0203, "step": 150690 }, { "epoch": 0.39, "learning_rate": 0.00024140457928202789, "loss": 0.0189, "step": 150700 }, { "epoch": 0.39, "learning_rate": 0.0002414006910656564, "loss": 0.0179, "step": 150710 }, { "epoch": 0.39, "learning_rate": 0.00024139680284928494, "loss": 0.0175, "step": 150720 }, { "epoch": 0.39, "learning_rate": 0.00024139291463291346, "loss": 0.019, "step": 150730 }, { "epoch": 0.39, "learning_rate": 0.00024138902641654202, "loss": 0.0149, "step": 150740 }, { "epoch": 0.39, "learning_rate": 0.00024138513820017054, "loss": 0.0164, "step": 150750 }, { "epoch": 0.39, "learning_rate": 0.00024138124998379908, "loss": 0.019, "step": 150760 }, { "epoch": 0.39, "learning_rate": 0.0002413773617674276, "loss": 0.0216, "step": 150770 }, { "epoch": 0.39, "learning_rate": 0.00024137347355105616, "loss": 0.0212, "step": 150780 }, { "epoch": 0.39, "learning_rate": 0.00024136958533468468, "loss": 0.0181, "step": 150790 }, { "epoch": 0.39, "learning_rate": 0.00024136569711831322, "loss": 0.0241, "step": 150800 }, { "epoch": 0.39, "learning_rate": 0.00024136180890194174, "loss": 0.0173, "step": 150810 }, { "epoch": 0.39, "learning_rate": 0.0002413579206855703, "loss": 0.0216, "step": 150820 }, { "epoch": 0.39, "learning_rate": 0.00024135403246919885, "loss": 0.017, "step": 150830 }, { "epoch": 0.39, "learning_rate": 0.00024135014425282736, "loss": 0.029, "step": 150840 }, { "epoch": 0.39, "learning_rate": 0.00024134625603645587, "loss": 0.0181, "step": 150850 }, { "epoch": 0.39, "learning_rate": 0.00024134236782008442, "loss": 0.0198, "step": 150860 }, { "epoch": 0.39, "learning_rate": 0.00024133847960371298, "loss": 0.0212, "step": 150870 }, { "epoch": 0.39, "learning_rate": 0.0002413345913873415, "loss": 0.0168, "step": 150880 }, { "epoch": 0.39, "learning_rate": 0.00024133070317097004, "loss": 0.0203, "step": 150890 }, { "epoch": 0.39, "learning_rate": 0.00024132681495459856, "loss": 0.0181, "step": 150900 }, { "epoch": 0.39, "learning_rate": 0.00024132292673822712, "loss": 0.0174, "step": 150910 }, { "epoch": 0.39, "learning_rate": 0.00024131903852185564, "loss": 0.0264, "step": 150920 }, { "epoch": 0.39, "learning_rate": 0.00024131515030548418, "loss": 0.0209, "step": 150930 }, { "epoch": 0.39, "learning_rate": 0.0002413112620891127, "loss": 0.0198, "step": 150940 }, { "epoch": 0.39, "learning_rate": 0.00024130737387274126, "loss": 0.0142, "step": 150950 }, { "epoch": 0.39, "learning_rate": 0.00024130348565636978, "loss": 0.0176, "step": 150960 }, { "epoch": 0.39, "learning_rate": 0.00024129959743999832, "loss": 0.0168, "step": 150970 }, { "epoch": 0.39, "learning_rate": 0.00024129570922362683, "loss": 0.0203, "step": 150980 }, { "epoch": 0.39, "learning_rate": 0.0002412918210072554, "loss": 0.0202, "step": 150990 }, { "epoch": 0.39, "learning_rate": 0.00024128793279088392, "loss": 0.0206, "step": 151000 }, { "epoch": 0.39, "eval_cer": 0.8817768670806793, "eval_loss": 0.013644468039274216, "eval_runtime": 107.4348, "eval_samples_per_second": 18.616, "eval_steps_per_second": 4.654, "step": 151000 }, { "epoch": 0.39, "learning_rate": 0.00024128404457451246, "loss": 0.0214, "step": 151010 }, { "epoch": 0.39, "learning_rate": 0.00024128015635814097, "loss": 0.0141, "step": 151020 }, { "epoch": 0.39, "learning_rate": 0.00024127626814176954, "loss": 0.0167, "step": 151030 }, { "epoch": 0.39, "learning_rate": 0.00024127237992539808, "loss": 0.0133, "step": 151040 }, { "epoch": 0.39, "learning_rate": 0.0002412684917090266, "loss": 0.0183, "step": 151050 }, { "epoch": 0.39, "learning_rate": 0.00024126460349265514, "loss": 0.0167, "step": 151060 }, { "epoch": 0.39, "learning_rate": 0.00024126071527628368, "loss": 0.0179, "step": 151070 }, { "epoch": 0.39, "learning_rate": 0.00024125682705991222, "loss": 0.0189, "step": 151080 }, { "epoch": 0.39, "learning_rate": 0.00024125293884354074, "loss": 0.0177, "step": 151090 }, { "epoch": 0.39, "learning_rate": 0.00024124905062716928, "loss": 0.0192, "step": 151100 }, { "epoch": 0.39, "learning_rate": 0.0002412451624107978, "loss": 0.0243, "step": 151110 }, { "epoch": 0.39, "learning_rate": 0.00024124127419442636, "loss": 0.0169, "step": 151120 }, { "epoch": 0.39, "learning_rate": 0.00024123738597805488, "loss": 0.0246, "step": 151130 }, { "epoch": 0.39, "learning_rate": 0.00024123349776168342, "loss": 0.0186, "step": 151140 }, { "epoch": 0.39, "learning_rate": 0.00024122960954531193, "loss": 0.0216, "step": 151150 }, { "epoch": 0.39, "learning_rate": 0.0002412257213289405, "loss": 0.0183, "step": 151160 }, { "epoch": 0.39, "learning_rate": 0.00024122183311256902, "loss": 0.0175, "step": 151170 }, { "epoch": 0.39, "learning_rate": 0.00024121794489619756, "loss": 0.018, "step": 151180 }, { "epoch": 0.39, "learning_rate": 0.00024121405667982607, "loss": 0.02, "step": 151190 }, { "epoch": 0.39, "learning_rate": 0.00024121016846345464, "loss": 0.0177, "step": 151200 }, { "epoch": 0.39, "learning_rate": 0.00024120628024708318, "loss": 0.0233, "step": 151210 }, { "epoch": 0.39, "learning_rate": 0.0002412023920307117, "loss": 0.0175, "step": 151220 }, { "epoch": 0.39, "learning_rate": 0.00024119850381434024, "loss": 0.0192, "step": 151230 }, { "epoch": 0.39, "learning_rate": 0.00024119461559796878, "loss": 0.0196, "step": 151240 }, { "epoch": 0.39, "learning_rate": 0.00024119072738159732, "loss": 0.0199, "step": 151250 }, { "epoch": 0.39, "learning_rate": 0.00024118683916522584, "loss": 0.0207, "step": 151260 }, { "epoch": 0.39, "learning_rate": 0.00024118295094885438, "loss": 0.0209, "step": 151270 }, { "epoch": 0.39, "learning_rate": 0.00024117906273248292, "loss": 0.0185, "step": 151280 }, { "epoch": 0.39, "learning_rate": 0.00024117517451611146, "loss": 0.0189, "step": 151290 }, { "epoch": 0.39, "learning_rate": 0.00024117128629973998, "loss": 0.0156, "step": 151300 }, { "epoch": 0.39, "learning_rate": 0.00024116739808336852, "loss": 0.016, "step": 151310 }, { "epoch": 0.39, "learning_rate": 0.00024116350986699706, "loss": 0.019, "step": 151320 }, { "epoch": 0.39, "learning_rate": 0.0002411596216506256, "loss": 0.0172, "step": 151330 }, { "epoch": 0.39, "learning_rate": 0.00024115573343425412, "loss": 0.0229, "step": 151340 }, { "epoch": 0.39, "learning_rate": 0.00024115184521788266, "loss": 0.0242, "step": 151350 }, { "epoch": 0.39, "learning_rate": 0.00024114795700151117, "loss": 0.0291, "step": 151360 }, { "epoch": 0.39, "learning_rate": 0.00024114406878513974, "loss": 0.0241, "step": 151370 }, { "epoch": 0.39, "learning_rate": 0.00024114018056876828, "loss": 0.0215, "step": 151380 }, { "epoch": 0.39, "learning_rate": 0.0002411362923523968, "loss": 0.0178, "step": 151390 }, { "epoch": 0.39, "learning_rate": 0.0002411324041360253, "loss": 0.018, "step": 151400 }, { "epoch": 0.39, "learning_rate": 0.00024112851591965388, "loss": 0.0203, "step": 151410 }, { "epoch": 0.39, "learning_rate": 0.00024112462770328242, "loss": 0.0197, "step": 151420 }, { "epoch": 0.39, "learning_rate": 0.00024112073948691094, "loss": 0.0217, "step": 151430 }, { "epoch": 0.39, "learning_rate": 0.00024111685127053948, "loss": 0.0219, "step": 151440 }, { "epoch": 0.39, "learning_rate": 0.00024111296305416802, "loss": 0.0179, "step": 151450 }, { "epoch": 0.39, "learning_rate": 0.00024110907483779656, "loss": 0.0168, "step": 151460 }, { "epoch": 0.39, "learning_rate": 0.00024110518662142508, "loss": 0.0168, "step": 151470 }, { "epoch": 0.39, "learning_rate": 0.00024110129840505362, "loss": 0.0189, "step": 151480 }, { "epoch": 0.39, "learning_rate": 0.00024109741018868216, "loss": 0.022, "step": 151490 }, { "epoch": 0.39, "learning_rate": 0.0002410935219723107, "loss": 0.0195, "step": 151500 }, { "epoch": 0.39, "learning_rate": 0.00024108963375593922, "loss": 0.02, "step": 151510 }, { "epoch": 0.39, "learning_rate": 0.00024108574553956776, "loss": 0.0189, "step": 151520 }, { "epoch": 0.39, "learning_rate": 0.00024108185732319633, "loss": 0.0182, "step": 151530 }, { "epoch": 0.39, "learning_rate": 0.00024107796910682484, "loss": 0.0229, "step": 151540 }, { "epoch": 0.39, "learning_rate": 0.00024107408089045338, "loss": 0.0214, "step": 151550 }, { "epoch": 0.39, "learning_rate": 0.0002410701926740819, "loss": 0.0196, "step": 151560 }, { "epoch": 0.39, "learning_rate": 0.00024106630445771047, "loss": 0.0223, "step": 151570 }, { "epoch": 0.39, "learning_rate": 0.00024106241624133898, "loss": 0.0199, "step": 151580 }, { "epoch": 0.39, "learning_rate": 0.00024105852802496752, "loss": 0.0212, "step": 151590 }, { "epoch": 0.39, "learning_rate": 0.00024105463980859604, "loss": 0.021, "step": 151600 }, { "epoch": 0.39, "learning_rate": 0.00024105075159222458, "loss": 0.0213, "step": 151610 }, { "epoch": 0.39, "learning_rate": 0.00024104686337585312, "loss": 0.0202, "step": 151620 }, { "epoch": 0.39, "learning_rate": 0.00024104297515948166, "loss": 0.0192, "step": 151630 }, { "epoch": 0.39, "learning_rate": 0.00024103908694311018, "loss": 0.0154, "step": 151640 }, { "epoch": 0.39, "learning_rate": 0.00024103519872673872, "loss": 0.0175, "step": 151650 }, { "epoch": 0.39, "learning_rate": 0.00024103131051036726, "loss": 0.0204, "step": 151660 }, { "epoch": 0.39, "learning_rate": 0.0002410274222939958, "loss": 0.0178, "step": 151670 }, { "epoch": 0.39, "learning_rate": 0.00024102353407762432, "loss": 0.0204, "step": 151680 }, { "epoch": 0.39, "learning_rate": 0.00024101964586125286, "loss": 0.0238, "step": 151690 }, { "epoch": 0.39, "learning_rate": 0.00024101575764488143, "loss": 0.023, "step": 151700 }, { "epoch": 0.39, "learning_rate": 0.00024101186942850994, "loss": 0.0191, "step": 151710 }, { "epoch": 0.39, "learning_rate": 0.00024100798121213845, "loss": 0.0182, "step": 151720 }, { "epoch": 0.39, "learning_rate": 0.000241004092995767, "loss": 0.0195, "step": 151730 }, { "epoch": 0.39, "learning_rate": 0.00024100020477939557, "loss": 0.022, "step": 151740 }, { "epoch": 0.39, "learning_rate": 0.00024099631656302408, "loss": 0.021, "step": 151750 }, { "epoch": 0.39, "learning_rate": 0.00024099242834665262, "loss": 0.0201, "step": 151760 }, { "epoch": 0.39, "learning_rate": 0.00024098854013028114, "loss": 0.0205, "step": 151770 }, { "epoch": 0.39, "learning_rate": 0.0002409846519139097, "loss": 0.0146, "step": 151780 }, { "epoch": 0.39, "learning_rate": 0.00024098076369753822, "loss": 0.0214, "step": 151790 }, { "epoch": 0.39, "learning_rate": 0.00024097687548116676, "loss": 0.0181, "step": 151800 }, { "epoch": 0.39, "learning_rate": 0.00024097298726479528, "loss": 0.021, "step": 151810 }, { "epoch": 0.39, "learning_rate": 0.00024096909904842384, "loss": 0.0163, "step": 151820 }, { "epoch": 0.39, "learning_rate": 0.00024096521083205236, "loss": 0.0233, "step": 151830 }, { "epoch": 0.39, "learning_rate": 0.0002409613226156809, "loss": 0.0209, "step": 151840 }, { "epoch": 0.39, "learning_rate": 0.00024095743439930941, "loss": 0.0198, "step": 151850 }, { "epoch": 0.39, "learning_rate": 0.00024095354618293796, "loss": 0.0184, "step": 151860 }, { "epoch": 0.39, "learning_rate": 0.00024094965796656653, "loss": 0.0179, "step": 151870 }, { "epoch": 0.39, "learning_rate": 0.00024094576975019504, "loss": 0.0202, "step": 151880 }, { "epoch": 0.39, "learning_rate": 0.00024094188153382355, "loss": 0.0237, "step": 151890 }, { "epoch": 0.39, "learning_rate": 0.0002409379933174521, "loss": 0.0259, "step": 151900 }, { "epoch": 0.39, "learning_rate": 0.00024093410510108066, "loss": 0.0211, "step": 151910 }, { "epoch": 0.39, "learning_rate": 0.00024093021688470918, "loss": 0.0242, "step": 151920 }, { "epoch": 0.39, "learning_rate": 0.00024092632866833772, "loss": 0.0167, "step": 151930 }, { "epoch": 0.39, "learning_rate": 0.00024092244045196624, "loss": 0.0157, "step": 151940 }, { "epoch": 0.39, "learning_rate": 0.0002409185522355948, "loss": 0.0192, "step": 151950 }, { "epoch": 0.39, "learning_rate": 0.00024091466401922332, "loss": 0.0178, "step": 151960 }, { "epoch": 0.39, "learning_rate": 0.00024091077580285186, "loss": 0.0163, "step": 151970 }, { "epoch": 0.39, "learning_rate": 0.00024090688758648037, "loss": 0.0229, "step": 151980 }, { "epoch": 0.39, "learning_rate": 0.00024090299937010894, "loss": 0.0192, "step": 151990 }, { "epoch": 0.39, "learning_rate": 0.00024089911115373746, "loss": 0.0169, "step": 152000 }, { "epoch": 0.39, "eval_cer": 0.8817950623608236, "eval_loss": 0.013452214188873768, "eval_runtime": 107.3551, "eval_samples_per_second": 18.63, "eval_steps_per_second": 4.657, "step": 152000 }, { "epoch": 0.39, "learning_rate": 0.000240895222937366, "loss": 0.0205, "step": 152010 }, { "epoch": 0.39, "learning_rate": 0.00024089133472099451, "loss": 0.0222, "step": 152020 }, { "epoch": 0.39, "learning_rate": 0.00024088744650462308, "loss": 0.0189, "step": 152030 }, { "epoch": 0.39, "learning_rate": 0.0002408835582882516, "loss": 0.0212, "step": 152040 }, { "epoch": 0.39, "learning_rate": 0.00024087967007188014, "loss": 0.0227, "step": 152050 }, { "epoch": 0.39, "learning_rate": 0.00024087578185550865, "loss": 0.0204, "step": 152060 }, { "epoch": 0.39, "learning_rate": 0.00024087189363913722, "loss": 0.0189, "step": 152070 }, { "epoch": 0.39, "learning_rate": 0.00024086800542276576, "loss": 0.018, "step": 152080 }, { "epoch": 0.39, "learning_rate": 0.00024086411720639428, "loss": 0.0217, "step": 152090 }, { "epoch": 0.39, "learning_rate": 0.00024086022899002282, "loss": 0.0205, "step": 152100 }, { "epoch": 0.39, "learning_rate": 0.00024085634077365133, "loss": 0.0212, "step": 152110 }, { "epoch": 0.39, "learning_rate": 0.0002408524525572799, "loss": 0.0205, "step": 152120 }, { "epoch": 0.39, "learning_rate": 0.00024084856434090842, "loss": 0.0284, "step": 152130 }, { "epoch": 0.39, "learning_rate": 0.00024084467612453696, "loss": 0.0207, "step": 152140 }, { "epoch": 0.39, "learning_rate": 0.00024084078790816547, "loss": 0.0164, "step": 152150 }, { "epoch": 0.39, "learning_rate": 0.00024083689969179404, "loss": 0.0189, "step": 152160 }, { "epoch": 0.39, "learning_rate": 0.00024083301147542256, "loss": 0.0172, "step": 152170 }, { "epoch": 0.39, "learning_rate": 0.0002408291232590511, "loss": 0.0194, "step": 152180 }, { "epoch": 0.39, "learning_rate": 0.00024082523504267961, "loss": 0.0237, "step": 152190 }, { "epoch": 0.39, "learning_rate": 0.00024082134682630818, "loss": 0.0167, "step": 152200 }, { "epoch": 0.39, "learning_rate": 0.0002408174586099367, "loss": 0.0203, "step": 152210 }, { "epoch": 0.39, "learning_rate": 0.00024081357039356524, "loss": 0.0267, "step": 152220 }, { "epoch": 0.39, "learning_rate": 0.00024080968217719375, "loss": 0.0219, "step": 152230 }, { "epoch": 0.39, "learning_rate": 0.00024080579396082232, "loss": 0.0188, "step": 152240 }, { "epoch": 0.39, "learning_rate": 0.00024080190574445086, "loss": 0.0183, "step": 152250 }, { "epoch": 0.39, "learning_rate": 0.00024079801752807938, "loss": 0.0217, "step": 152260 }, { "epoch": 0.39, "learning_rate": 0.00024079412931170792, "loss": 0.0181, "step": 152270 }, { "epoch": 0.39, "learning_rate": 0.00024079024109533646, "loss": 0.0265, "step": 152280 }, { "epoch": 0.39, "learning_rate": 0.000240786352878965, "loss": 0.0199, "step": 152290 }, { "epoch": 0.39, "learning_rate": 0.00024078246466259352, "loss": 0.0238, "step": 152300 }, { "epoch": 0.39, "learning_rate": 0.00024077857644622206, "loss": 0.0163, "step": 152310 }, { "epoch": 0.39, "learning_rate": 0.0002407746882298506, "loss": 0.0183, "step": 152320 }, { "epoch": 0.39, "learning_rate": 0.00024077080001347914, "loss": 0.0213, "step": 152330 }, { "epoch": 0.39, "learning_rate": 0.00024076691179710766, "loss": 0.0185, "step": 152340 }, { "epoch": 0.39, "learning_rate": 0.0002407630235807362, "loss": 0.0202, "step": 152350 }, { "epoch": 0.39, "learning_rate": 0.0002407591353643647, "loss": 0.0177, "step": 152360 }, { "epoch": 0.39, "learning_rate": 0.00024075524714799328, "loss": 0.0156, "step": 152370 }, { "epoch": 0.39, "learning_rate": 0.0002407513589316218, "loss": 0.0207, "step": 152380 }, { "epoch": 0.4, "learning_rate": 0.00024074747071525034, "loss": 0.0191, "step": 152390 }, { "epoch": 0.4, "learning_rate": 0.00024074358249887885, "loss": 0.0239, "step": 152400 }, { "epoch": 0.4, "learning_rate": 0.00024073969428250742, "loss": 0.0164, "step": 152410 }, { "epoch": 0.4, "learning_rate": 0.00024073580606613596, "loss": 0.0174, "step": 152420 }, { "epoch": 0.4, "learning_rate": 0.00024073191784976448, "loss": 0.0159, "step": 152430 }, { "epoch": 0.4, "learning_rate": 0.000240728029633393, "loss": 0.018, "step": 152440 }, { "epoch": 0.4, "learning_rate": 0.00024072414141702156, "loss": 0.019, "step": 152450 }, { "epoch": 0.4, "learning_rate": 0.0002407202532006501, "loss": 0.0291, "step": 152460 }, { "epoch": 0.4, "learning_rate": 0.00024071636498427862, "loss": 0.0212, "step": 152470 }, { "epoch": 0.4, "learning_rate": 0.00024071247676790716, "loss": 0.021, "step": 152480 }, { "epoch": 0.4, "learning_rate": 0.0002407085885515357, "loss": 0.0197, "step": 152490 }, { "epoch": 0.4, "learning_rate": 0.00024070470033516424, "loss": 0.0184, "step": 152500 }, { "epoch": 0.4, "learning_rate": 0.00024070081211879276, "loss": 0.0204, "step": 152510 }, { "epoch": 0.4, "learning_rate": 0.0002406969239024213, "loss": 0.0153, "step": 152520 }, { "epoch": 0.4, "learning_rate": 0.00024069303568604984, "loss": 0.0184, "step": 152530 }, { "epoch": 0.4, "learning_rate": 0.00024068914746967838, "loss": 0.019, "step": 152540 }, { "epoch": 0.4, "learning_rate": 0.0002406852592533069, "loss": 0.0198, "step": 152550 }, { "epoch": 0.4, "learning_rate": 0.00024068137103693544, "loss": 0.0248, "step": 152560 }, { "epoch": 0.4, "learning_rate": 0.000240677482820564, "loss": 0.0158, "step": 152570 }, { "epoch": 0.4, "learning_rate": 0.00024067359460419252, "loss": 0.0207, "step": 152580 }, { "epoch": 0.4, "learning_rate": 0.00024066970638782104, "loss": 0.0186, "step": 152590 }, { "epoch": 0.4, "learning_rate": 0.00024066581817144958, "loss": 0.0234, "step": 152600 }, { "epoch": 0.4, "learning_rate": 0.0002406619299550781, "loss": 0.0202, "step": 152610 }, { "epoch": 0.4, "learning_rate": 0.00024065804173870666, "loss": 0.0223, "step": 152620 }, { "epoch": 0.4, "learning_rate": 0.0002406541535223352, "loss": 0.0205, "step": 152630 }, { "epoch": 0.4, "learning_rate": 0.00024065026530596372, "loss": 0.0279, "step": 152640 }, { "epoch": 0.4, "learning_rate": 0.00024064637708959226, "loss": 0.0212, "step": 152650 }, { "epoch": 0.4, "learning_rate": 0.0002406424888732208, "loss": 0.0202, "step": 152660 }, { "epoch": 0.4, "learning_rate": 0.00024063860065684934, "loss": 0.0184, "step": 152670 }, { "epoch": 0.4, "learning_rate": 0.00024063471244047786, "loss": 0.0209, "step": 152680 }, { "epoch": 0.4, "learning_rate": 0.0002406308242241064, "loss": 0.0185, "step": 152690 }, { "epoch": 0.4, "learning_rate": 0.00024062693600773494, "loss": 0.0199, "step": 152700 }, { "epoch": 0.4, "learning_rate": 0.00024062304779136348, "loss": 0.0249, "step": 152710 }, { "epoch": 0.4, "learning_rate": 0.000240619159574992, "loss": 0.0193, "step": 152720 }, { "epoch": 0.4, "learning_rate": 0.00024061527135862054, "loss": 0.0219, "step": 152730 }, { "epoch": 0.4, "learning_rate": 0.0002406113831422491, "loss": 0.0218, "step": 152740 }, { "epoch": 0.4, "learning_rate": 0.00024060749492587762, "loss": 0.0188, "step": 152750 }, { "epoch": 0.4, "learning_rate": 0.00024060360670950613, "loss": 0.0164, "step": 152760 }, { "epoch": 0.4, "learning_rate": 0.00024059971849313468, "loss": 0.0167, "step": 152770 }, { "epoch": 0.4, "learning_rate": 0.00024059583027676325, "loss": 0.018, "step": 152780 }, { "epoch": 0.4, "learning_rate": 0.00024059194206039176, "loss": 0.021, "step": 152790 }, { "epoch": 0.4, "learning_rate": 0.0002405880538440203, "loss": 0.0228, "step": 152800 }, { "epoch": 0.4, "learning_rate": 0.00024058416562764882, "loss": 0.019, "step": 152810 }, { "epoch": 0.4, "learning_rate": 0.00024058027741127738, "loss": 0.0181, "step": 152820 }, { "epoch": 0.4, "learning_rate": 0.0002405763891949059, "loss": 0.0261, "step": 152830 }, { "epoch": 0.4, "learning_rate": 0.00024057250097853444, "loss": 0.0174, "step": 152840 }, { "epoch": 0.4, "learning_rate": 0.00024056861276216296, "loss": 0.0172, "step": 152850 }, { "epoch": 0.4, "learning_rate": 0.0002405647245457915, "loss": 0.0236, "step": 152860 }, { "epoch": 0.4, "learning_rate": 0.00024056083632942004, "loss": 0.0173, "step": 152870 }, { "epoch": 0.4, "learning_rate": 0.00024055694811304858, "loss": 0.0189, "step": 152880 }, { "epoch": 0.4, "learning_rate": 0.0002405530598966771, "loss": 0.0164, "step": 152890 }, { "epoch": 0.4, "learning_rate": 0.00024054917168030564, "loss": 0.0164, "step": 152900 }, { "epoch": 0.4, "learning_rate": 0.00024054528346393418, "loss": 0.0195, "step": 152910 }, { "epoch": 0.4, "learning_rate": 0.00024054139524756272, "loss": 0.0188, "step": 152920 }, { "epoch": 0.4, "learning_rate": 0.00024053750703119123, "loss": 0.0208, "step": 152930 }, { "epoch": 0.4, "learning_rate": 0.00024053361881481978, "loss": 0.0192, "step": 152940 }, { "epoch": 0.4, "learning_rate": 0.00024052973059844834, "loss": 0.0201, "step": 152950 }, { "epoch": 0.4, "learning_rate": 0.00024052584238207686, "loss": 0.0238, "step": 152960 }, { "epoch": 0.4, "learning_rate": 0.0002405219541657054, "loss": 0.0199, "step": 152970 }, { "epoch": 0.4, "learning_rate": 0.00024051806594933392, "loss": 0.0242, "step": 152980 }, { "epoch": 0.4, "learning_rate": 0.00024051417773296248, "loss": 0.0164, "step": 152990 }, { "epoch": 0.4, "learning_rate": 0.000240510289516591, "loss": 0.0165, "step": 153000 }, { "epoch": 0.4, "eval_cer": 0.881782465628416, "eval_loss": 0.013410561718046665, "eval_runtime": 107.4393, "eval_samples_per_second": 18.615, "eval_steps_per_second": 4.654, "step": 153000 }, { "epoch": 0.4, "learning_rate": 0.00024050640130021954, "loss": 0.0188, "step": 153010 }, { "epoch": 0.4, "learning_rate": 0.00024050251308384805, "loss": 0.0178, "step": 153020 }, { "epoch": 0.4, "learning_rate": 0.00024049862486747662, "loss": 0.0191, "step": 153030 }, { "epoch": 0.4, "learning_rate": 0.00024049473665110514, "loss": 0.0207, "step": 153040 }, { "epoch": 0.4, "learning_rate": 0.00024049084843473368, "loss": 0.0182, "step": 153050 }, { "epoch": 0.4, "learning_rate": 0.0002404869602183622, "loss": 0.0223, "step": 153060 }, { "epoch": 0.4, "learning_rate": 0.00024048307200199076, "loss": 0.0171, "step": 153070 }, { "epoch": 0.4, "learning_rate": 0.00024047918378561928, "loss": 0.0201, "step": 153080 }, { "epoch": 0.4, "learning_rate": 0.00024047529556924782, "loss": 0.0197, "step": 153090 }, { "epoch": 0.4, "learning_rate": 0.00024047140735287633, "loss": 0.0207, "step": 153100 }, { "epoch": 0.4, "learning_rate": 0.00024046751913650488, "loss": 0.0221, "step": 153110 }, { "epoch": 0.4, "learning_rate": 0.00024046363092013344, "loss": 0.0176, "step": 153120 }, { "epoch": 0.4, "learning_rate": 0.00024045974270376196, "loss": 0.0261, "step": 153130 }, { "epoch": 0.4, "learning_rate": 0.0002404558544873905, "loss": 0.019, "step": 153140 }, { "epoch": 0.4, "learning_rate": 0.00024045196627101901, "loss": 0.0173, "step": 153150 }, { "epoch": 0.4, "learning_rate": 0.00024044807805464758, "loss": 0.0199, "step": 153160 }, { "epoch": 0.4, "learning_rate": 0.0002404441898382761, "loss": 0.0196, "step": 153170 }, { "epoch": 0.4, "learning_rate": 0.00024044030162190464, "loss": 0.016, "step": 153180 }, { "epoch": 0.4, "learning_rate": 0.00024043641340553315, "loss": 0.0148, "step": 153190 }, { "epoch": 0.4, "learning_rate": 0.00024043252518916172, "loss": 0.0197, "step": 153200 }, { "epoch": 0.4, "learning_rate": 0.00024042863697279024, "loss": 0.0213, "step": 153210 }, { "epoch": 0.4, "learning_rate": 0.00024042474875641878, "loss": 0.0198, "step": 153220 }, { "epoch": 0.4, "learning_rate": 0.0002404208605400473, "loss": 0.0205, "step": 153230 }, { "epoch": 0.4, "learning_rate": 0.00024041697232367586, "loss": 0.0238, "step": 153240 }, { "epoch": 0.4, "learning_rate": 0.00024041308410730438, "loss": 0.0233, "step": 153250 }, { "epoch": 0.4, "learning_rate": 0.00024040919589093292, "loss": 0.0198, "step": 153260 }, { "epoch": 0.4, "learning_rate": 0.00024040530767456143, "loss": 0.0196, "step": 153270 }, { "epoch": 0.4, "learning_rate": 0.00024040141945819, "loss": 0.0206, "step": 153280 }, { "epoch": 0.4, "learning_rate": 0.00024039753124181854, "loss": 0.0193, "step": 153290 }, { "epoch": 0.4, "learning_rate": 0.00024039364302544706, "loss": 0.0203, "step": 153300 }, { "epoch": 0.4, "learning_rate": 0.00024038975480907557, "loss": 0.0212, "step": 153310 }, { "epoch": 0.4, "learning_rate": 0.00024038586659270414, "loss": 0.0184, "step": 153320 }, { "epoch": 0.4, "learning_rate": 0.00024038197837633268, "loss": 0.0194, "step": 153330 }, { "epoch": 0.4, "learning_rate": 0.0002403780901599612, "loss": 0.016, "step": 153340 }, { "epoch": 0.4, "learning_rate": 0.00024037420194358974, "loss": 0.0182, "step": 153350 }, { "epoch": 0.4, "learning_rate": 0.00024037031372721825, "loss": 0.0208, "step": 153360 }, { "epoch": 0.4, "learning_rate": 0.00024036642551084682, "loss": 0.0207, "step": 153370 }, { "epoch": 0.4, "learning_rate": 0.00024036253729447534, "loss": 0.0435, "step": 153380 }, { "epoch": 0.4, "learning_rate": 0.00024035864907810388, "loss": 0.0195, "step": 153390 }, { "epoch": 0.4, "learning_rate": 0.0002403547608617324, "loss": 0.0639, "step": 153400 }, { "epoch": 0.4, "learning_rate": 0.00024035087264536096, "loss": 0.0275, "step": 153410 }, { "epoch": 0.4, "learning_rate": 0.00024034698442898948, "loss": 0.0176, "step": 153420 }, { "epoch": 0.4, "learning_rate": 0.00024034309621261802, "loss": 0.0191, "step": 153430 }, { "epoch": 0.4, "learning_rate": 0.00024033920799624653, "loss": 0.0187, "step": 153440 }, { "epoch": 0.4, "learning_rate": 0.0002403353197798751, "loss": 0.0221, "step": 153450 }, { "epoch": 0.4, "learning_rate": 0.00024033143156350364, "loss": 0.0181, "step": 153460 }, { "epoch": 0.4, "learning_rate": 0.00024032754334713216, "loss": 0.02, "step": 153470 }, { "epoch": 0.4, "learning_rate": 0.00024032365513076067, "loss": 0.0193, "step": 153480 }, { "epoch": 0.4, "learning_rate": 0.00024031976691438924, "loss": 0.0174, "step": 153490 }, { "epoch": 0.4, "learning_rate": 0.00024031587869801778, "loss": 0.0208, "step": 153500 }, { "epoch": 0.4, "learning_rate": 0.0002403119904816463, "loss": 0.0218, "step": 153510 }, { "epoch": 0.4, "learning_rate": 0.00024030810226527484, "loss": 0.0221, "step": 153520 }, { "epoch": 0.4, "learning_rate": 0.00024030421404890338, "loss": 0.0238, "step": 153530 }, { "epoch": 0.4, "learning_rate": 0.00024030032583253192, "loss": 0.0215, "step": 153540 }, { "epoch": 0.4, "learning_rate": 0.00024029643761616044, "loss": 0.0229, "step": 153550 }, { "epoch": 0.4, "learning_rate": 0.00024029254939978898, "loss": 0.0206, "step": 153560 }, { "epoch": 0.4, "learning_rate": 0.00024028866118341752, "loss": 0.0204, "step": 153570 }, { "epoch": 0.4, "learning_rate": 0.00024028477296704606, "loss": 0.0187, "step": 153580 }, { "epoch": 0.4, "learning_rate": 0.00024028088475067458, "loss": 0.0206, "step": 153590 }, { "epoch": 0.4, "learning_rate": 0.00024027699653430312, "loss": 0.0372, "step": 153600 }, { "epoch": 0.4, "learning_rate": 0.00024027310831793163, "loss": 0.0185, "step": 153610 }, { "epoch": 0.4, "learning_rate": 0.0002402692201015602, "loss": 0.0205, "step": 153620 }, { "epoch": 0.4, "learning_rate": 0.00024026533188518872, "loss": 0.0197, "step": 153630 }, { "epoch": 0.4, "learning_rate": 0.00024026144366881726, "loss": 0.0178, "step": 153640 }, { "epoch": 0.4, "learning_rate": 0.00024025755545244577, "loss": 0.0201, "step": 153650 }, { "epoch": 0.4, "learning_rate": 0.00024025366723607434, "loss": 0.0194, "step": 153660 }, { "epoch": 0.4, "learning_rate": 0.00024024977901970288, "loss": 0.0182, "step": 153670 }, { "epoch": 0.4, "learning_rate": 0.0002402458908033314, "loss": 0.0262, "step": 153680 }, { "epoch": 0.4, "learning_rate": 0.00024024200258695994, "loss": 0.0213, "step": 153690 }, { "epoch": 0.4, "learning_rate": 0.00024023811437058848, "loss": 0.019, "step": 153700 }, { "epoch": 0.4, "learning_rate": 0.00024023422615421702, "loss": 0.019, "step": 153710 }, { "epoch": 0.4, "learning_rate": 0.00024023033793784554, "loss": 0.0234, "step": 153720 }, { "epoch": 0.4, "learning_rate": 0.00024022644972147408, "loss": 0.02, "step": 153730 }, { "epoch": 0.4, "learning_rate": 0.00024022256150510262, "loss": 0.0206, "step": 153740 }, { "epoch": 0.4, "learning_rate": 0.00024021867328873116, "loss": 0.0197, "step": 153750 }, { "epoch": 0.4, "learning_rate": 0.00024021478507235968, "loss": 0.0168, "step": 153760 }, { "epoch": 0.4, "learning_rate": 0.00024021089685598822, "loss": 0.0201, "step": 153770 }, { "epoch": 0.4, "learning_rate": 0.00024020700863961676, "loss": 0.0204, "step": 153780 }, { "epoch": 0.4, "learning_rate": 0.0002402031204232453, "loss": 0.015, "step": 153790 }, { "epoch": 0.4, "learning_rate": 0.00024019923220687381, "loss": 0.0151, "step": 153800 }, { "epoch": 0.4, "learning_rate": 0.00024019534399050236, "loss": 0.0208, "step": 153810 }, { "epoch": 0.4, "learning_rate": 0.00024019145577413092, "loss": 0.0139, "step": 153820 }, { "epoch": 0.4, "learning_rate": 0.00024018756755775944, "loss": 0.0166, "step": 153830 }, { "epoch": 0.4, "learning_rate": 0.00024018367934138798, "loss": 0.023, "step": 153840 }, { "epoch": 0.4, "learning_rate": 0.0002401797911250165, "loss": 0.0191, "step": 153850 }, { "epoch": 0.4, "learning_rate": 0.00024017590290864504, "loss": 0.0244, "step": 153860 }, { "epoch": 0.4, "learning_rate": 0.00024017201469227358, "loss": 0.0241, "step": 153870 }, { "epoch": 0.4, "learning_rate": 0.00024016812647590212, "loss": 0.0162, "step": 153880 }, { "epoch": 0.4, "learning_rate": 0.00024016423825953063, "loss": 0.0162, "step": 153890 }, { "epoch": 0.4, "learning_rate": 0.00024016035004315918, "loss": 0.0184, "step": 153900 }, { "epoch": 0.4, "learning_rate": 0.00024015646182678772, "loss": 0.0183, "step": 153910 }, { "epoch": 0.4, "learning_rate": 0.00024015257361041626, "loss": 0.0175, "step": 153920 }, { "epoch": 0.4, "learning_rate": 0.00024014868539404477, "loss": 0.017, "step": 153930 }, { "epoch": 0.4, "learning_rate": 0.00024014479717767332, "loss": 0.02, "step": 153940 }, { "epoch": 0.4, "learning_rate": 0.00024014090896130186, "loss": 0.0201, "step": 153950 }, { "epoch": 0.4, "learning_rate": 0.0002401370207449304, "loss": 0.0263, "step": 153960 }, { "epoch": 0.4, "learning_rate": 0.00024013313252855891, "loss": 0.0175, "step": 153970 }, { "epoch": 0.4, "learning_rate": 0.00024012924431218746, "loss": 0.0172, "step": 153980 }, { "epoch": 0.4, "learning_rate": 0.00024012535609581602, "loss": 0.0157, "step": 153990 }, { "epoch": 0.4, "learning_rate": 0.00024012146787944454, "loss": 0.0188, "step": 154000 }, { "epoch": 0.4, "eval_cer": 0.881782465628416, "eval_loss": 0.013507870957255363, "eval_runtime": 107.4654, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 154000 }, { "epoch": 0.4, "learning_rate": 0.00024011757966307308, "loss": 0.0161, "step": 154010 }, { "epoch": 0.4, "learning_rate": 0.0002401136914467016, "loss": 0.0192, "step": 154020 }, { "epoch": 0.4, "learning_rate": 0.00024010980323033016, "loss": 0.028, "step": 154030 }, { "epoch": 0.4, "learning_rate": 0.00024010591501395868, "loss": 0.0159, "step": 154040 }, { "epoch": 0.4, "learning_rate": 0.00024010202679758722, "loss": 0.0208, "step": 154050 }, { "epoch": 0.4, "learning_rate": 0.00024009813858121573, "loss": 0.0195, "step": 154060 }, { "epoch": 0.4, "learning_rate": 0.0002400942503648443, "loss": 0.0249, "step": 154070 }, { "epoch": 0.4, "learning_rate": 0.00024009036214847282, "loss": 0.018, "step": 154080 }, { "epoch": 0.4, "learning_rate": 0.00024008647393210136, "loss": 0.0182, "step": 154090 }, { "epoch": 0.4, "learning_rate": 0.00024008258571572987, "loss": 0.0196, "step": 154100 }, { "epoch": 0.4, "learning_rate": 0.00024007869749935842, "loss": 0.0205, "step": 154110 }, { "epoch": 0.4, "learning_rate": 0.00024007480928298696, "loss": 0.0203, "step": 154120 }, { "epoch": 0.4, "learning_rate": 0.0002400709210666155, "loss": 0.0191, "step": 154130 }, { "epoch": 0.4, "learning_rate": 0.000240067032850244, "loss": 0.0156, "step": 154140 }, { "epoch": 0.4, "learning_rate": 0.00024006314463387255, "loss": 0.0186, "step": 154150 }, { "epoch": 0.4, "learning_rate": 0.00024005925641750112, "loss": 0.0222, "step": 154160 }, { "epoch": 0.4, "learning_rate": 0.00024005536820112964, "loss": 0.0201, "step": 154170 }, { "epoch": 0.4, "learning_rate": 0.00024005147998475815, "loss": 0.0195, "step": 154180 }, { "epoch": 0.4, "learning_rate": 0.0002400475917683867, "loss": 0.0205, "step": 154190 }, { "epoch": 0.4, "learning_rate": 0.00024004370355201526, "loss": 0.0156, "step": 154200 }, { "epoch": 0.4, "learning_rate": 0.00024003981533564378, "loss": 0.0213, "step": 154210 }, { "epoch": 0.4, "learning_rate": 0.00024003592711927232, "loss": 0.0216, "step": 154220 }, { "epoch": 0.4, "learning_rate": 0.00024003203890290083, "loss": 0.0215, "step": 154230 }, { "epoch": 0.4, "learning_rate": 0.0002400281506865294, "loss": 0.0162, "step": 154240 }, { "epoch": 0.4, "learning_rate": 0.00024002426247015792, "loss": 0.0188, "step": 154250 }, { "epoch": 0.4, "learning_rate": 0.00024002037425378646, "loss": 0.0197, "step": 154260 }, { "epoch": 0.4, "learning_rate": 0.00024001648603741497, "loss": 0.0243, "step": 154270 }, { "epoch": 0.4, "learning_rate": 0.00024001259782104354, "loss": 0.0184, "step": 154280 }, { "epoch": 0.4, "learning_rate": 0.00024000870960467206, "loss": 0.0182, "step": 154290 }, { "epoch": 0.4, "learning_rate": 0.0002400048213883006, "loss": 0.0213, "step": 154300 }, { "epoch": 0.4, "learning_rate": 0.0002400009331719291, "loss": 0.0192, "step": 154310 }, { "epoch": 0.4, "learning_rate": 0.00023999704495555768, "loss": 0.0196, "step": 154320 }, { "epoch": 0.4, "learning_rate": 0.00023999315673918622, "loss": 0.0177, "step": 154330 }, { "epoch": 0.4, "learning_rate": 0.00023998926852281474, "loss": 0.02, "step": 154340 }, { "epoch": 0.4, "learning_rate": 0.00023998538030644325, "loss": 0.019, "step": 154350 }, { "epoch": 0.4, "learning_rate": 0.0002399814920900718, "loss": 0.0291, "step": 154360 }, { "epoch": 0.4, "learning_rate": 0.00023997760387370036, "loss": 0.0213, "step": 154370 }, { "epoch": 0.4, "learning_rate": 0.00023997371565732888, "loss": 0.0187, "step": 154380 }, { "epoch": 0.4, "learning_rate": 0.00023996982744095742, "loss": 0.0168, "step": 154390 }, { "epoch": 0.4, "learning_rate": 0.00023996593922458593, "loss": 0.0206, "step": 154400 }, { "epoch": 0.4, "learning_rate": 0.0002399620510082145, "loss": 0.0189, "step": 154410 }, { "epoch": 0.4, "learning_rate": 0.00023995816279184302, "loss": 0.0188, "step": 154420 }, { "epoch": 0.4, "learning_rate": 0.00023995427457547156, "loss": 0.0177, "step": 154430 }, { "epoch": 0.4, "learning_rate": 0.00023995038635910007, "loss": 0.0221, "step": 154440 }, { "epoch": 0.4, "learning_rate": 0.00023994649814272864, "loss": 0.0184, "step": 154450 }, { "epoch": 0.4, "learning_rate": 0.00023994260992635716, "loss": 0.0169, "step": 154460 }, { "epoch": 0.4, "learning_rate": 0.0002399387217099857, "loss": 0.0225, "step": 154470 }, { "epoch": 0.4, "learning_rate": 0.0002399348334936142, "loss": 0.018, "step": 154480 }, { "epoch": 0.4, "learning_rate": 0.00023993094527724278, "loss": 0.0175, "step": 154490 }, { "epoch": 0.4, "learning_rate": 0.0002399270570608713, "loss": 0.018, "step": 154500 }, { "epoch": 0.4, "learning_rate": 0.00023992316884449984, "loss": 0.0172, "step": 154510 }, { "epoch": 0.4, "learning_rate": 0.00023991928062812835, "loss": 0.0216, "step": 154520 }, { "epoch": 0.4, "learning_rate": 0.00023991539241175692, "loss": 0.0176, "step": 154530 }, { "epoch": 0.4, "learning_rate": 0.00023991150419538546, "loss": 0.0216, "step": 154540 }, { "epoch": 0.4, "learning_rate": 0.00023990761597901398, "loss": 0.0204, "step": 154550 }, { "epoch": 0.4, "learning_rate": 0.00023990372776264252, "loss": 0.0187, "step": 154560 }, { "epoch": 0.4, "learning_rate": 0.00023989983954627106, "loss": 0.0179, "step": 154570 }, { "epoch": 0.4, "learning_rate": 0.0002398959513298996, "loss": 0.0192, "step": 154580 }, { "epoch": 0.4, "learning_rate": 0.00023989206311352812, "loss": 0.0168, "step": 154590 }, { "epoch": 0.4, "learning_rate": 0.00023988817489715666, "loss": 0.0163, "step": 154600 }, { "epoch": 0.4, "learning_rate": 0.00023988428668078517, "loss": 0.0194, "step": 154610 }, { "epoch": 0.4, "learning_rate": 0.00023988039846441374, "loss": 0.016, "step": 154620 }, { "epoch": 0.4, "learning_rate": 0.00023987651024804226, "loss": 0.0188, "step": 154630 }, { "epoch": 0.4, "learning_rate": 0.0002398726220316708, "loss": 0.0145, "step": 154640 }, { "epoch": 0.4, "learning_rate": 0.0002398687338152993, "loss": 0.0206, "step": 154650 }, { "epoch": 0.4, "learning_rate": 0.00023986484559892788, "loss": 0.0242, "step": 154660 }, { "epoch": 0.4, "learning_rate": 0.0002398609573825564, "loss": 0.0242, "step": 154670 }, { "epoch": 0.4, "learning_rate": 0.00023985706916618494, "loss": 0.0187, "step": 154680 }, { "epoch": 0.4, "learning_rate": 0.00023985318094981345, "loss": 0.0158, "step": 154690 }, { "epoch": 0.4, "learning_rate": 0.00023984929273344202, "loss": 0.0173, "step": 154700 }, { "epoch": 0.4, "learning_rate": 0.00023984540451707056, "loss": 0.0183, "step": 154710 }, { "epoch": 0.4, "learning_rate": 0.00023984151630069908, "loss": 0.0207, "step": 154720 }, { "epoch": 0.4, "learning_rate": 0.00023983762808432762, "loss": 0.0167, "step": 154730 }, { "epoch": 0.4, "learning_rate": 0.00023983373986795616, "loss": 0.016, "step": 154740 }, { "epoch": 0.4, "learning_rate": 0.0002398298516515847, "loss": 0.0175, "step": 154750 }, { "epoch": 0.4, "learning_rate": 0.00023982596343521322, "loss": 0.018, "step": 154760 }, { "epoch": 0.4, "learning_rate": 0.00023982207521884176, "loss": 0.0179, "step": 154770 }, { "epoch": 0.4, "learning_rate": 0.0002398181870024703, "loss": 0.0197, "step": 154780 }, { "epoch": 0.4, "learning_rate": 0.00023981429878609884, "loss": 0.0184, "step": 154790 }, { "epoch": 0.4, "learning_rate": 0.00023981041056972735, "loss": 0.0186, "step": 154800 }, { "epoch": 0.4, "learning_rate": 0.0002398065223533559, "loss": 0.0181, "step": 154810 }, { "epoch": 0.4, "learning_rate": 0.0002398026341369844, "loss": 0.02, "step": 154820 }, { "epoch": 0.4, "learning_rate": 0.00023979874592061298, "loss": 0.0162, "step": 154830 }, { "epoch": 0.4, "learning_rate": 0.0002397948577042415, "loss": 0.0206, "step": 154840 }, { "epoch": 0.4, "learning_rate": 0.00023979096948787004, "loss": 0.0187, "step": 154850 }, { "epoch": 0.4, "learning_rate": 0.00023978708127149855, "loss": 0.0191, "step": 154860 }, { "epoch": 0.4, "learning_rate": 0.00023978319305512712, "loss": 0.0179, "step": 154870 }, { "epoch": 0.4, "learning_rate": 0.00023977930483875566, "loss": 0.0167, "step": 154880 }, { "epoch": 0.4, "learning_rate": 0.00023977541662238418, "loss": 0.0198, "step": 154890 }, { "epoch": 0.4, "learning_rate": 0.0002397715284060127, "loss": 0.0165, "step": 154900 }, { "epoch": 0.4, "learning_rate": 0.00023976764018964126, "loss": 0.0211, "step": 154910 }, { "epoch": 0.4, "learning_rate": 0.0002397637519732698, "loss": 0.0191, "step": 154920 }, { "epoch": 0.4, "learning_rate": 0.00023975986375689831, "loss": 0.0166, "step": 154930 }, { "epoch": 0.4, "learning_rate": 0.00023975597554052686, "loss": 0.0177, "step": 154940 }, { "epoch": 0.4, "learning_rate": 0.0002397520873241554, "loss": 0.0177, "step": 154950 }, { "epoch": 0.4, "learning_rate": 0.00023974819910778394, "loss": 0.0171, "step": 154960 }, { "epoch": 0.4, "learning_rate": 0.00023974431089141245, "loss": 0.0249, "step": 154970 }, { "epoch": 0.4, "learning_rate": 0.000239740422675041, "loss": 0.0234, "step": 154980 }, { "epoch": 0.4, "learning_rate": 0.00023973653445866954, "loss": 0.0175, "step": 154990 }, { "epoch": 0.4, "learning_rate": 0.00023973264624229808, "loss": 0.0185, "step": 155000 }, { "epoch": 0.4, "eval_cer": 0.8818146572779021, "eval_loss": 0.013523012399673462, "eval_runtime": 108.0058, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.629, "step": 155000 }, { "epoch": 0.4, "learning_rate": 0.0002397287580259266, "loss": 0.0183, "step": 155010 }, { "epoch": 0.4, "learning_rate": 0.00023972486980955514, "loss": 0.0213, "step": 155020 }, { "epoch": 0.4, "learning_rate": 0.0002397209815931837, "loss": 0.0215, "step": 155030 }, { "epoch": 0.4, "learning_rate": 0.00023971709337681222, "loss": 0.0207, "step": 155040 }, { "epoch": 0.4, "learning_rate": 0.00023971320516044073, "loss": 0.0167, "step": 155050 }, { "epoch": 0.4, "learning_rate": 0.00023970931694406927, "loss": 0.0144, "step": 155060 }, { "epoch": 0.4, "learning_rate": 0.0002397054287276978, "loss": 0.0368, "step": 155070 }, { "epoch": 0.4, "learning_rate": 0.00023970154051132636, "loss": 0.0214, "step": 155080 }, { "epoch": 0.4, "learning_rate": 0.0002396976522949549, "loss": 0.0182, "step": 155090 }, { "epoch": 0.4, "learning_rate": 0.00023969376407858341, "loss": 0.0177, "step": 155100 }, { "epoch": 0.4, "learning_rate": 0.00023968987586221196, "loss": 0.021, "step": 155110 }, { "epoch": 0.4, "learning_rate": 0.0002396859876458405, "loss": 0.021, "step": 155120 }, { "epoch": 0.4, "learning_rate": 0.00023968209942946904, "loss": 0.0173, "step": 155130 }, { "epoch": 0.4, "learning_rate": 0.00023967821121309755, "loss": 0.0214, "step": 155140 }, { "epoch": 0.4, "learning_rate": 0.0002396743229967261, "loss": 0.0217, "step": 155150 }, { "epoch": 0.4, "learning_rate": 0.00023967043478035464, "loss": 0.0186, "step": 155160 }, { "epoch": 0.4, "learning_rate": 0.00023966654656398318, "loss": 0.0176, "step": 155170 }, { "epoch": 0.4, "learning_rate": 0.0002396626583476117, "loss": 0.0191, "step": 155180 }, { "epoch": 0.4, "learning_rate": 0.00023965877013124023, "loss": 0.0183, "step": 155190 }, { "epoch": 0.4, "learning_rate": 0.0002396548819148688, "loss": 0.0165, "step": 155200 }, { "epoch": 0.4, "learning_rate": 0.00023965099369849732, "loss": 0.0181, "step": 155210 }, { "epoch": 0.4, "learning_rate": 0.00023964710548212583, "loss": 0.0229, "step": 155220 }, { "epoch": 0.4, "learning_rate": 0.00023964321726575437, "loss": 0.0224, "step": 155230 }, { "epoch": 0.4, "learning_rate": 0.00023963932904938294, "loss": 0.0214, "step": 155240 }, { "epoch": 0.4, "learning_rate": 0.00023963544083301146, "loss": 0.0202, "step": 155250 }, { "epoch": 0.4, "learning_rate": 0.00023963155261664, "loss": 0.0224, "step": 155260 }, { "epoch": 0.4, "learning_rate": 0.00023962766440026851, "loss": 0.0201, "step": 155270 }, { "epoch": 0.4, "learning_rate": 0.00023962377618389708, "loss": 0.0203, "step": 155280 }, { "epoch": 0.4, "learning_rate": 0.0002396198879675256, "loss": 0.0198, "step": 155290 }, { "epoch": 0.4, "learning_rate": 0.00023961599975115414, "loss": 0.0162, "step": 155300 }, { "epoch": 0.4, "learning_rate": 0.00023961211153478265, "loss": 0.0192, "step": 155310 }, { "epoch": 0.4, "learning_rate": 0.0002396082233184112, "loss": 0.022, "step": 155320 }, { "epoch": 0.4, "learning_rate": 0.00023960433510203974, "loss": 0.0201, "step": 155330 }, { "epoch": 0.4, "learning_rate": 0.00023960044688566828, "loss": 0.0169, "step": 155340 }, { "epoch": 0.4, "learning_rate": 0.0002395965586692968, "loss": 0.0224, "step": 155350 }, { "epoch": 0.4, "learning_rate": 0.00023959267045292533, "loss": 0.0215, "step": 155360 }, { "epoch": 0.4, "learning_rate": 0.00023958878223655388, "loss": 0.02, "step": 155370 }, { "epoch": 0.4, "learning_rate": 0.00023958489402018242, "loss": 0.0197, "step": 155380 }, { "epoch": 0.4, "learning_rate": 0.00023958100580381093, "loss": 0.0166, "step": 155390 }, { "epoch": 0.4, "learning_rate": 0.00023957711758743947, "loss": 0.0229, "step": 155400 }, { "epoch": 0.4, "learning_rate": 0.00023957322937106804, "loss": 0.021, "step": 155410 }, { "epoch": 0.4, "learning_rate": 0.00023956934115469656, "loss": 0.0202, "step": 155420 }, { "epoch": 0.4, "learning_rate": 0.0002395654529383251, "loss": 0.0176, "step": 155430 }, { "epoch": 0.4, "learning_rate": 0.0002395615647219536, "loss": 0.0203, "step": 155440 }, { "epoch": 0.4, "learning_rate": 0.00023955767650558218, "loss": 0.0265, "step": 155450 }, { "epoch": 0.4, "learning_rate": 0.0002395537882892107, "loss": 0.0187, "step": 155460 }, { "epoch": 0.4, "learning_rate": 0.00023954990007283924, "loss": 0.0186, "step": 155470 }, { "epoch": 0.4, "learning_rate": 0.00023954601185646775, "loss": 0.0186, "step": 155480 }, { "epoch": 0.4, "learning_rate": 0.00023954212364009632, "loss": 0.017, "step": 155490 }, { "epoch": 0.4, "learning_rate": 0.00023953823542372484, "loss": 0.0225, "step": 155500 }, { "epoch": 0.4, "learning_rate": 0.00023953434720735338, "loss": 0.0174, "step": 155510 }, { "epoch": 0.4, "learning_rate": 0.0002395304589909819, "loss": 0.0179, "step": 155520 }, { "epoch": 0.4, "learning_rate": 0.00023952657077461046, "loss": 0.0195, "step": 155530 }, { "epoch": 0.4, "learning_rate": 0.00023952268255823898, "loss": 0.0181, "step": 155540 }, { "epoch": 0.4, "learning_rate": 0.00023951879434186752, "loss": 0.018, "step": 155550 }, { "epoch": 0.4, "learning_rate": 0.00023951490612549603, "loss": 0.0175, "step": 155560 }, { "epoch": 0.4, "learning_rate": 0.00023951101790912457, "loss": 0.0238, "step": 155570 }, { "epoch": 0.4, "learning_rate": 0.00023950712969275314, "loss": 0.0156, "step": 155580 }, { "epoch": 0.4, "learning_rate": 0.00023950324147638166, "loss": 0.0188, "step": 155590 }, { "epoch": 0.4, "learning_rate": 0.0002394993532600102, "loss": 0.0184, "step": 155600 }, { "epoch": 0.4, "learning_rate": 0.0002394954650436387, "loss": 0.0165, "step": 155610 }, { "epoch": 0.4, "learning_rate": 0.00023949157682726728, "loss": 0.02, "step": 155620 }, { "epoch": 0.4, "learning_rate": 0.0002394876886108958, "loss": 0.015, "step": 155630 }, { "epoch": 0.4, "learning_rate": 0.00023948380039452434, "loss": 0.0192, "step": 155640 }, { "epoch": 0.4, "learning_rate": 0.00023947991217815285, "loss": 0.0141, "step": 155650 }, { "epoch": 0.4, "learning_rate": 0.00023947602396178142, "loss": 0.0228, "step": 155660 }, { "epoch": 0.4, "learning_rate": 0.00023947213574540994, "loss": 0.0184, "step": 155670 }, { "epoch": 0.4, "learning_rate": 0.00023946824752903848, "loss": 0.0205, "step": 155680 }, { "epoch": 0.4, "learning_rate": 0.000239464359312667, "loss": 0.0222, "step": 155690 }, { "epoch": 0.4, "learning_rate": 0.00023946047109629556, "loss": 0.0187, "step": 155700 }, { "epoch": 0.4, "learning_rate": 0.00023945658287992407, "loss": 0.0206, "step": 155710 }, { "epoch": 0.4, "learning_rate": 0.00023945269466355262, "loss": 0.0185, "step": 155720 }, { "epoch": 0.4, "learning_rate": 0.00023944880644718113, "loss": 0.0178, "step": 155730 }, { "epoch": 0.4, "learning_rate": 0.0002394449182308097, "loss": 0.0179, "step": 155740 }, { "epoch": 0.4, "learning_rate": 0.00023944103001443824, "loss": 0.0149, "step": 155750 }, { "epoch": 0.4, "learning_rate": 0.00023943714179806676, "loss": 0.0183, "step": 155760 }, { "epoch": 0.4, "learning_rate": 0.00023943325358169527, "loss": 0.0168, "step": 155770 }, { "epoch": 0.4, "learning_rate": 0.00023942936536532384, "loss": 0.0191, "step": 155780 }, { "epoch": 0.4, "learning_rate": 0.00023942547714895238, "loss": 0.0176, "step": 155790 }, { "epoch": 0.4, "learning_rate": 0.0002394215889325809, "loss": 0.0214, "step": 155800 }, { "epoch": 0.4, "learning_rate": 0.00023941770071620944, "loss": 0.022, "step": 155810 }, { "epoch": 0.4, "learning_rate": 0.00023941381249983795, "loss": 0.0261, "step": 155820 }, { "epoch": 0.4, "learning_rate": 0.00023940992428346652, "loss": 0.0239, "step": 155830 }, { "epoch": 0.4, "learning_rate": 0.00023940603606709503, "loss": 0.0182, "step": 155840 }, { "epoch": 0.4, "learning_rate": 0.00023940214785072358, "loss": 0.0191, "step": 155850 }, { "epoch": 0.4, "learning_rate": 0.0002393982596343521, "loss": 0.0212, "step": 155860 }, { "epoch": 0.4, "learning_rate": 0.00023939437141798066, "loss": 0.018, "step": 155870 }, { "epoch": 0.4, "learning_rate": 0.00023939048320160917, "loss": 0.019, "step": 155880 }, { "epoch": 0.4, "learning_rate": 0.00023938659498523772, "loss": 0.0239, "step": 155890 }, { "epoch": 0.4, "learning_rate": 0.00023938270676886623, "loss": 0.0233, "step": 155900 }, { "epoch": 0.4, "learning_rate": 0.0002393788185524948, "loss": 0.0176, "step": 155910 }, { "epoch": 0.4, "learning_rate": 0.00023937493033612334, "loss": 0.0239, "step": 155920 }, { "epoch": 0.4, "learning_rate": 0.00023937104211975186, "loss": 0.0206, "step": 155930 }, { "epoch": 0.4, "learning_rate": 0.00023936715390338037, "loss": 0.0213, "step": 155940 }, { "epoch": 0.4, "learning_rate": 0.00023936326568700894, "loss": 0.0252, "step": 155950 }, { "epoch": 0.4, "learning_rate": 0.00023935937747063748, "loss": 0.0237, "step": 155960 }, { "epoch": 0.4, "learning_rate": 0.000239355489254266, "loss": 0.0173, "step": 155970 }, { "epoch": 0.4, "learning_rate": 0.00023935160103789454, "loss": 0.0203, "step": 155980 }, { "epoch": 0.4, "learning_rate": 0.00023934771282152308, "loss": 0.021, "step": 155990 }, { "epoch": 0.4, "learning_rate": 0.00023934382460515162, "loss": 0.0229, "step": 156000 }, { "epoch": 0.4, "eval_cer": 0.8817740678068109, "eval_loss": 0.012980636209249496, "eval_runtime": 108.1448, "eval_samples_per_second": 18.494, "eval_steps_per_second": 4.623, "step": 156000 }, { "epoch": 0.4, "learning_rate": 0.00023933993638878013, "loss": 0.0183, "step": 156010 }, { "epoch": 0.4, "learning_rate": 0.00023933604817240868, "loss": 0.0206, "step": 156020 }, { "epoch": 0.4, "learning_rate": 0.00023933215995603722, "loss": 0.0172, "step": 156030 }, { "epoch": 0.4, "learning_rate": 0.00023932827173966576, "loss": 0.0202, "step": 156040 }, { "epoch": 0.4, "learning_rate": 0.00023932438352329427, "loss": 0.0173, "step": 156050 }, { "epoch": 0.4, "learning_rate": 0.00023932049530692282, "loss": 0.0174, "step": 156060 }, { "epoch": 0.4, "learning_rate": 0.00023931660709055133, "loss": 0.0168, "step": 156070 }, { "epoch": 0.4, "learning_rate": 0.0002393127188741799, "loss": 0.0176, "step": 156080 }, { "epoch": 0.4, "learning_rate": 0.0002393088306578084, "loss": 0.0172, "step": 156090 }, { "epoch": 0.4, "learning_rate": 0.00023930494244143695, "loss": 0.0344, "step": 156100 }, { "epoch": 0.4, "learning_rate": 0.00023930105422506547, "loss": 0.0204, "step": 156110 }, { "epoch": 0.4, "learning_rate": 0.00023929716600869404, "loss": 0.0174, "step": 156120 }, { "epoch": 0.4, "learning_rate": 0.00023929327779232258, "loss": 0.0237, "step": 156130 }, { "epoch": 0.4, "learning_rate": 0.0002392893895759511, "loss": 0.0183, "step": 156140 }, { "epoch": 0.4, "learning_rate": 0.00023928550135957964, "loss": 0.0171, "step": 156150 }, { "epoch": 0.4, "learning_rate": 0.00023928161314320818, "loss": 0.0204, "step": 156160 }, { "epoch": 0.4, "learning_rate": 0.00023927772492683672, "loss": 0.0189, "step": 156170 }, { "epoch": 0.4, "learning_rate": 0.00023927383671046523, "loss": 0.018, "step": 156180 }, { "epoch": 0.4, "learning_rate": 0.00023926994849409378, "loss": 0.0188, "step": 156190 }, { "epoch": 0.4, "learning_rate": 0.00023926606027772232, "loss": 0.0179, "step": 156200 }, { "epoch": 0.4, "learning_rate": 0.00023926217206135086, "loss": 0.0204, "step": 156210 }, { "epoch": 0.4, "learning_rate": 0.00023925828384497937, "loss": 0.016, "step": 156220 }, { "epoch": 0.4, "learning_rate": 0.00023925439562860791, "loss": 0.0231, "step": 156230 }, { "epoch": 0.4, "learning_rate": 0.00023925050741223646, "loss": 0.0208, "step": 156240 }, { "epoch": 0.41, "learning_rate": 0.000239246619195865, "loss": 0.0187, "step": 156250 }, { "epoch": 0.41, "learning_rate": 0.0002392427309794935, "loss": 0.0188, "step": 156260 }, { "epoch": 0.41, "learning_rate": 0.00023923884276312205, "loss": 0.0182, "step": 156270 }, { "epoch": 0.41, "learning_rate": 0.00023923495454675062, "loss": 0.016, "step": 156280 }, { "epoch": 0.41, "learning_rate": 0.00023923106633037914, "loss": 0.0178, "step": 156290 }, { "epoch": 0.41, "learning_rate": 0.00023922717811400768, "loss": 0.0213, "step": 156300 }, { "epoch": 0.41, "learning_rate": 0.0002392232898976362, "loss": 0.017, "step": 156310 }, { "epoch": 0.41, "learning_rate": 0.00023921940168126474, "loss": 0.0172, "step": 156320 }, { "epoch": 0.41, "learning_rate": 0.00023921551346489328, "loss": 0.0204, "step": 156330 }, { "epoch": 0.41, "learning_rate": 0.00023921162524852182, "loss": 0.022, "step": 156340 }, { "epoch": 0.41, "learning_rate": 0.00023920773703215033, "loss": 0.0146, "step": 156350 }, { "epoch": 0.41, "learning_rate": 0.00023920384881577887, "loss": 0.0179, "step": 156360 }, { "epoch": 0.41, "learning_rate": 0.00023919996059940742, "loss": 0.0221, "step": 156370 }, { "epoch": 0.41, "learning_rate": 0.00023919607238303596, "loss": 0.0237, "step": 156380 }, { "epoch": 0.41, "learning_rate": 0.00023919218416666447, "loss": 0.0208, "step": 156390 }, { "epoch": 0.41, "learning_rate": 0.00023918829595029301, "loss": 0.0185, "step": 156400 }, { "epoch": 0.41, "learning_rate": 0.00023918440773392156, "loss": 0.0183, "step": 156410 }, { "epoch": 0.41, "learning_rate": 0.0002391805195175501, "loss": 0.0202, "step": 156420 }, { "epoch": 0.41, "learning_rate": 0.0002391766313011786, "loss": 0.0159, "step": 156430 }, { "epoch": 0.41, "learning_rate": 0.00023917274308480715, "loss": 0.0161, "step": 156440 }, { "epoch": 0.41, "learning_rate": 0.00023916885486843572, "loss": 0.0226, "step": 156450 }, { "epoch": 0.41, "learning_rate": 0.00023916496665206424, "loss": 0.0211, "step": 156460 }, { "epoch": 0.41, "learning_rate": 0.00023916107843569278, "loss": 0.0181, "step": 156470 }, { "epoch": 0.41, "learning_rate": 0.0002391571902193213, "loss": 0.0193, "step": 156480 }, { "epoch": 0.41, "learning_rate": 0.00023915330200294986, "loss": 0.0152, "step": 156490 }, { "epoch": 0.41, "learning_rate": 0.00023914941378657838, "loss": 0.0191, "step": 156500 }, { "epoch": 0.41, "learning_rate": 0.00023914552557020692, "loss": 0.0196, "step": 156510 }, { "epoch": 0.41, "learning_rate": 0.00023914163735383543, "loss": 0.0212, "step": 156520 }, { "epoch": 0.41, "learning_rate": 0.000239137749137464, "loss": 0.016, "step": 156530 }, { "epoch": 0.41, "learning_rate": 0.00023913386092109252, "loss": 0.0192, "step": 156540 }, { "epoch": 0.41, "learning_rate": 0.00023912997270472106, "loss": 0.0242, "step": 156550 }, { "epoch": 0.41, "learning_rate": 0.00023912608448834957, "loss": 0.02, "step": 156560 }, { "epoch": 0.41, "learning_rate": 0.0002391221962719781, "loss": 0.0193, "step": 156570 }, { "epoch": 0.41, "learning_rate": 0.00023911830805560666, "loss": 0.0185, "step": 156580 }, { "epoch": 0.41, "learning_rate": 0.0002391144198392352, "loss": 0.0234, "step": 156590 }, { "epoch": 0.41, "learning_rate": 0.0002391105316228637, "loss": 0.019, "step": 156600 }, { "epoch": 0.41, "learning_rate": 0.00023910664340649225, "loss": 0.021, "step": 156610 }, { "epoch": 0.41, "learning_rate": 0.00023910275519012082, "loss": 0.0209, "step": 156620 }, { "epoch": 0.41, "learning_rate": 0.00023909886697374934, "loss": 0.025, "step": 156630 }, { "epoch": 0.41, "learning_rate": 0.00023909497875737785, "loss": 0.0263, "step": 156640 }, { "epoch": 0.41, "learning_rate": 0.0002390910905410064, "loss": 0.0198, "step": 156650 }, { "epoch": 0.41, "learning_rate": 0.00023908720232463496, "loss": 0.0239, "step": 156660 }, { "epoch": 0.41, "learning_rate": 0.00023908331410826348, "loss": 0.0206, "step": 156670 }, { "epoch": 0.41, "learning_rate": 0.00023907942589189202, "loss": 0.0163, "step": 156680 }, { "epoch": 0.41, "learning_rate": 0.00023907553767552053, "loss": 0.0221, "step": 156690 }, { "epoch": 0.41, "learning_rate": 0.0002390716494591491, "loss": 0.0209, "step": 156700 }, { "epoch": 0.41, "learning_rate": 0.00023906776124277762, "loss": 0.0182, "step": 156710 }, { "epoch": 0.41, "learning_rate": 0.00023906387302640616, "loss": 0.0154, "step": 156720 }, { "epoch": 0.41, "learning_rate": 0.00023905998481003467, "loss": 0.0194, "step": 156730 }, { "epoch": 0.41, "learning_rate": 0.00023905609659366324, "loss": 0.0212, "step": 156740 }, { "epoch": 0.41, "learning_rate": 0.00023905220837729175, "loss": 0.0174, "step": 156750 }, { "epoch": 0.41, "learning_rate": 0.0002390483201609203, "loss": 0.0159, "step": 156760 }, { "epoch": 0.41, "learning_rate": 0.0002390444319445488, "loss": 0.0171, "step": 156770 }, { "epoch": 0.41, "learning_rate": 0.00023904054372817738, "loss": 0.0176, "step": 156780 }, { "epoch": 0.41, "learning_rate": 0.00023903665551180592, "loss": 0.0203, "step": 156790 }, { "epoch": 0.41, "learning_rate": 0.00023903276729543444, "loss": 0.02, "step": 156800 }, { "epoch": 0.41, "learning_rate": 0.00023902887907906295, "loss": 0.0177, "step": 156810 }, { "epoch": 0.41, "learning_rate": 0.0002390249908626915, "loss": 0.0205, "step": 156820 }, { "epoch": 0.41, "learning_rate": 0.00023902110264632006, "loss": 0.0183, "step": 156830 }, { "epoch": 0.41, "learning_rate": 0.00023901721442994857, "loss": 0.018, "step": 156840 }, { "epoch": 0.41, "learning_rate": 0.00023901332621357712, "loss": 0.0218, "step": 156850 }, { "epoch": 0.41, "learning_rate": 0.00023900943799720563, "loss": 0.0224, "step": 156860 }, { "epoch": 0.41, "learning_rate": 0.0002390055497808342, "loss": 0.0215, "step": 156870 }, { "epoch": 0.41, "learning_rate": 0.00023900166156446271, "loss": 0.0195, "step": 156880 }, { "epoch": 0.41, "learning_rate": 0.00023899777334809126, "loss": 0.0167, "step": 156890 }, { "epoch": 0.41, "learning_rate": 0.00023899388513171977, "loss": 0.0191, "step": 156900 }, { "epoch": 0.41, "learning_rate": 0.00023898999691534834, "loss": 0.0187, "step": 156910 }, { "epoch": 0.41, "learning_rate": 0.00023898610869897685, "loss": 0.0182, "step": 156920 }, { "epoch": 0.41, "learning_rate": 0.0002389822204826054, "loss": 0.0212, "step": 156930 }, { "epoch": 0.41, "learning_rate": 0.0002389783322662339, "loss": 0.0185, "step": 156940 }, { "epoch": 0.41, "learning_rate": 0.00023897444404986248, "loss": 0.0167, "step": 156950 }, { "epoch": 0.41, "learning_rate": 0.000238970555833491, "loss": 0.0215, "step": 156960 }, { "epoch": 0.41, "learning_rate": 0.00023896666761711953, "loss": 0.0166, "step": 156970 }, { "epoch": 0.41, "learning_rate": 0.00023896277940074805, "loss": 0.02, "step": 156980 }, { "epoch": 0.41, "learning_rate": 0.00023895889118437662, "loss": 0.0134, "step": 156990 }, { "epoch": 0.41, "learning_rate": 0.00023895500296800516, "loss": 0.0189, "step": 157000 }, { "epoch": 0.41, "eval_cer": 0.8817852649022844, "eval_loss": 0.013182581402361393, "eval_runtime": 108.1899, "eval_samples_per_second": 18.486, "eval_steps_per_second": 4.622, "step": 157000 }, { "epoch": 0.41, "learning_rate": 0.00023895111475163367, "loss": 0.0227, "step": 157010 }, { "epoch": 0.41, "learning_rate": 0.00023894722653526222, "loss": 0.0176, "step": 157020 }, { "epoch": 0.41, "learning_rate": 0.00023894333831889076, "loss": 0.0164, "step": 157030 }, { "epoch": 0.41, "learning_rate": 0.0002389394501025193, "loss": 0.0157, "step": 157040 }, { "epoch": 0.41, "learning_rate": 0.00023893556188614781, "loss": 0.0199, "step": 157050 }, { "epoch": 0.41, "learning_rate": 0.00023893167366977636, "loss": 0.0196, "step": 157060 }, { "epoch": 0.41, "learning_rate": 0.00023892778545340487, "loss": 0.0202, "step": 157070 }, { "epoch": 0.41, "learning_rate": 0.00023892389723703344, "loss": 0.0184, "step": 157080 }, { "epoch": 0.41, "learning_rate": 0.00023892000902066195, "loss": 0.0199, "step": 157090 }, { "epoch": 0.41, "learning_rate": 0.0002389161208042905, "loss": 0.0177, "step": 157100 }, { "epoch": 0.41, "learning_rate": 0.000238912232587919, "loss": 0.0224, "step": 157110 }, { "epoch": 0.41, "learning_rate": 0.00023890834437154758, "loss": 0.0189, "step": 157120 }, { "epoch": 0.41, "learning_rate": 0.0002389044561551761, "loss": 0.0179, "step": 157130 }, { "epoch": 0.41, "learning_rate": 0.00023890056793880463, "loss": 0.0224, "step": 157140 }, { "epoch": 0.41, "learning_rate": 0.00023889667972243315, "loss": 0.0179, "step": 157150 }, { "epoch": 0.41, "learning_rate": 0.00023889279150606172, "loss": 0.0199, "step": 157160 }, { "epoch": 0.41, "learning_rate": 0.00023888890328969026, "loss": 0.0191, "step": 157170 }, { "epoch": 0.41, "learning_rate": 0.00023888501507331877, "loss": 0.0176, "step": 157180 }, { "epoch": 0.41, "learning_rate": 0.00023888112685694732, "loss": 0.0238, "step": 157190 }, { "epoch": 0.41, "learning_rate": 0.00023887723864057586, "loss": 0.0169, "step": 157200 }, { "epoch": 0.41, "learning_rate": 0.0002388733504242044, "loss": 0.0201, "step": 157210 }, { "epoch": 0.41, "learning_rate": 0.0002388694622078329, "loss": 0.0174, "step": 157220 }, { "epoch": 0.41, "learning_rate": 0.00023886557399146145, "loss": 0.0202, "step": 157230 }, { "epoch": 0.41, "learning_rate": 0.00023886168577509, "loss": 0.0172, "step": 157240 }, { "epoch": 0.41, "learning_rate": 0.00023885779755871854, "loss": 0.0188, "step": 157250 }, { "epoch": 0.41, "learning_rate": 0.00023885390934234705, "loss": 0.0184, "step": 157260 }, { "epoch": 0.41, "learning_rate": 0.0002388500211259756, "loss": 0.0183, "step": 157270 }, { "epoch": 0.41, "learning_rate": 0.00023884613290960414, "loss": 0.0225, "step": 157280 }, { "epoch": 0.41, "learning_rate": 0.00023884224469323268, "loss": 0.018, "step": 157290 }, { "epoch": 0.41, "learning_rate": 0.0002388383564768612, "loss": 0.0205, "step": 157300 }, { "epoch": 0.41, "learning_rate": 0.00023883446826048973, "loss": 0.021, "step": 157310 }, { "epoch": 0.41, "learning_rate": 0.00023883058004411825, "loss": 0.0163, "step": 157320 }, { "epoch": 0.41, "learning_rate": 0.00023882669182774682, "loss": 0.0182, "step": 157330 }, { "epoch": 0.41, "learning_rate": 0.00023882280361137536, "loss": 0.0161, "step": 157340 }, { "epoch": 0.41, "learning_rate": 0.00023881891539500387, "loss": 0.0206, "step": 157350 }, { "epoch": 0.41, "learning_rate": 0.0002388150271786324, "loss": 0.0166, "step": 157360 }, { "epoch": 0.41, "learning_rate": 0.00023881113896226096, "loss": 0.0212, "step": 157370 }, { "epoch": 0.41, "learning_rate": 0.0002388072507458895, "loss": 0.0132, "step": 157380 }, { "epoch": 0.41, "learning_rate": 0.000238803362529518, "loss": 0.0197, "step": 157390 }, { "epoch": 0.41, "learning_rate": 0.00023879947431314655, "loss": 0.0178, "step": 157400 }, { "epoch": 0.41, "learning_rate": 0.0002387955860967751, "loss": 0.0192, "step": 157410 }, { "epoch": 0.41, "learning_rate": 0.00023879169788040364, "loss": 0.018, "step": 157420 }, { "epoch": 0.41, "learning_rate": 0.00023878780966403215, "loss": 0.0172, "step": 157430 }, { "epoch": 0.41, "learning_rate": 0.0002387839214476607, "loss": 0.0158, "step": 157440 }, { "epoch": 0.41, "learning_rate": 0.00023878003323128924, "loss": 0.0231, "step": 157450 }, { "epoch": 0.41, "learning_rate": 0.00023877614501491778, "loss": 0.0205, "step": 157460 }, { "epoch": 0.41, "learning_rate": 0.0002387722567985463, "loss": 0.0174, "step": 157470 }, { "epoch": 0.41, "learning_rate": 0.00023876836858217483, "loss": 0.0153, "step": 157480 }, { "epoch": 0.41, "learning_rate": 0.0002387644803658034, "loss": 0.0176, "step": 157490 }, { "epoch": 0.41, "learning_rate": 0.00023876059214943192, "loss": 0.0184, "step": 157500 }, { "epoch": 0.41, "learning_rate": 0.00023875670393306046, "loss": 0.0207, "step": 157510 }, { "epoch": 0.41, "learning_rate": 0.00023875281571668897, "loss": 0.0201, "step": 157520 }, { "epoch": 0.41, "learning_rate": 0.00023874892750031754, "loss": 0.0188, "step": 157530 }, { "epoch": 0.41, "learning_rate": 0.00023874503928394606, "loss": 0.0216, "step": 157540 }, { "epoch": 0.41, "learning_rate": 0.0002387411510675746, "loss": 0.02, "step": 157550 }, { "epoch": 0.41, "learning_rate": 0.0002387372628512031, "loss": 0.0213, "step": 157560 }, { "epoch": 0.41, "learning_rate": 0.00023873337463483165, "loss": 0.0187, "step": 157570 }, { "epoch": 0.41, "learning_rate": 0.0002387294864184602, "loss": 0.0194, "step": 157580 }, { "epoch": 0.41, "learning_rate": 0.00023872559820208874, "loss": 0.0166, "step": 157590 }, { "epoch": 0.41, "learning_rate": 0.00023872170998571725, "loss": 0.0144, "step": 157600 }, { "epoch": 0.41, "learning_rate": 0.0002387178217693458, "loss": 0.0174, "step": 157610 }, { "epoch": 0.41, "learning_rate": 0.00023871393355297433, "loss": 0.0212, "step": 157620 }, { "epoch": 0.41, "learning_rate": 0.00023871004533660288, "loss": 0.0164, "step": 157630 }, { "epoch": 0.41, "learning_rate": 0.0002387061571202314, "loss": 0.0162, "step": 157640 }, { "epoch": 0.41, "learning_rate": 0.00023870226890385993, "loss": 0.0216, "step": 157650 }, { "epoch": 0.41, "learning_rate": 0.0002386983806874885, "loss": 0.022, "step": 157660 }, { "epoch": 0.41, "learning_rate": 0.00023869449247111702, "loss": 0.0192, "step": 157670 }, { "epoch": 0.41, "learning_rate": 0.00023869060425474553, "loss": 0.0206, "step": 157680 }, { "epoch": 0.41, "learning_rate": 0.00023868671603837407, "loss": 0.0154, "step": 157690 }, { "epoch": 0.41, "learning_rate": 0.00023868282782200264, "loss": 0.0189, "step": 157700 }, { "epoch": 0.41, "learning_rate": 0.00023867893960563116, "loss": 0.0197, "step": 157710 }, { "epoch": 0.41, "learning_rate": 0.0002386750513892597, "loss": 0.0236, "step": 157720 }, { "epoch": 0.41, "learning_rate": 0.0002386711631728882, "loss": 0.0222, "step": 157730 }, { "epoch": 0.41, "learning_rate": 0.00023866727495651678, "loss": 0.0198, "step": 157740 }, { "epoch": 0.41, "learning_rate": 0.0002386633867401453, "loss": 0.017, "step": 157750 }, { "epoch": 0.41, "learning_rate": 0.00023865949852377384, "loss": 0.0186, "step": 157760 }, { "epoch": 0.41, "learning_rate": 0.00023865561030740235, "loss": 0.0165, "step": 157770 }, { "epoch": 0.41, "learning_rate": 0.00023865172209103092, "loss": 0.0185, "step": 157780 }, { "epoch": 0.41, "learning_rate": 0.00023864783387465943, "loss": 0.0183, "step": 157790 }, { "epoch": 0.41, "learning_rate": 0.00023864394565828798, "loss": 0.0207, "step": 157800 }, { "epoch": 0.41, "learning_rate": 0.0002386400574419165, "loss": 0.0185, "step": 157810 }, { "epoch": 0.41, "learning_rate": 0.00023863616922554503, "loss": 0.0201, "step": 157820 }, { "epoch": 0.41, "learning_rate": 0.00023863228100917357, "loss": 0.0191, "step": 157830 }, { "epoch": 0.41, "learning_rate": 0.00023862839279280212, "loss": 0.0209, "step": 157840 }, { "epoch": 0.41, "learning_rate": 0.00023862450457643063, "loss": 0.0208, "step": 157850 }, { "epoch": 0.41, "learning_rate": 0.00023862061636005917, "loss": 0.0238, "step": 157860 }, { "epoch": 0.41, "learning_rate": 0.00023861672814368774, "loss": 0.0196, "step": 157870 }, { "epoch": 0.41, "learning_rate": 0.00023861283992731625, "loss": 0.0176, "step": 157880 }, { "epoch": 0.41, "learning_rate": 0.0002386089517109448, "loss": 0.0159, "step": 157890 }, { "epoch": 0.41, "learning_rate": 0.0002386050634945733, "loss": 0.0198, "step": 157900 }, { "epoch": 0.41, "learning_rate": 0.00023860117527820188, "loss": 0.0195, "step": 157910 }, { "epoch": 0.41, "learning_rate": 0.0002385972870618304, "loss": 0.0178, "step": 157920 }, { "epoch": 0.41, "learning_rate": 0.00023859339884545894, "loss": 0.021, "step": 157930 }, { "epoch": 0.41, "learning_rate": 0.00023858951062908745, "loss": 0.018, "step": 157940 }, { "epoch": 0.41, "learning_rate": 0.00023858562241271602, "loss": 0.0194, "step": 157950 }, { "epoch": 0.41, "learning_rate": 0.00023858173419634453, "loss": 0.0243, "step": 157960 }, { "epoch": 0.41, "learning_rate": 0.00023857784597997308, "loss": 0.0199, "step": 157970 }, { "epoch": 0.41, "learning_rate": 0.0002385739577636016, "loss": 0.0198, "step": 157980 }, { "epoch": 0.41, "learning_rate": 0.00023857006954723016, "loss": 0.0185, "step": 157990 }, { "epoch": 0.41, "learning_rate": 0.00023856618133085867, "loss": 0.0172, "step": 158000 }, { "epoch": 0.41, "eval_cer": 0.8817726681698768, "eval_loss": 0.012989984825253487, "eval_runtime": 107.5587, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 158000 }, { "epoch": 0.41, "learning_rate": 0.00023856229311448721, "loss": 0.0186, "step": 158010 }, { "epoch": 0.41, "learning_rate": 0.00023855840489811573, "loss": 0.0204, "step": 158020 }, { "epoch": 0.41, "learning_rate": 0.0002385545166817443, "loss": 0.0228, "step": 158030 }, { "epoch": 0.41, "learning_rate": 0.00023855062846537284, "loss": 0.0206, "step": 158040 }, { "epoch": 0.41, "learning_rate": 0.00023854674024900135, "loss": 0.0199, "step": 158050 }, { "epoch": 0.41, "learning_rate": 0.0002385428520326299, "loss": 0.018, "step": 158060 }, { "epoch": 0.41, "learning_rate": 0.0002385389638162584, "loss": 0.0179, "step": 158070 }, { "epoch": 0.41, "learning_rate": 0.00023853507559988698, "loss": 0.0219, "step": 158080 }, { "epoch": 0.41, "learning_rate": 0.0002385311873835155, "loss": 0.0166, "step": 158090 }, { "epoch": 0.41, "learning_rate": 0.00023852729916714404, "loss": 0.023, "step": 158100 }, { "epoch": 0.41, "learning_rate": 0.00023852341095077255, "loss": 0.0187, "step": 158110 }, { "epoch": 0.41, "learning_rate": 0.00023851952273440112, "loss": 0.0212, "step": 158120 }, { "epoch": 0.41, "learning_rate": 0.00023851563451802963, "loss": 0.0173, "step": 158130 }, { "epoch": 0.41, "learning_rate": 0.00023851174630165817, "loss": 0.0174, "step": 158140 }, { "epoch": 0.41, "learning_rate": 0.0002385078580852867, "loss": 0.0189, "step": 158150 }, { "epoch": 0.41, "learning_rate": 0.00023850396986891526, "loss": 0.0247, "step": 158160 }, { "epoch": 0.41, "learning_rate": 0.00023850008165254377, "loss": 0.0192, "step": 158170 }, { "epoch": 0.41, "learning_rate": 0.00023849619343617231, "loss": 0.0169, "step": 158180 }, { "epoch": 0.41, "learning_rate": 0.00023849230521980083, "loss": 0.018, "step": 158190 }, { "epoch": 0.41, "learning_rate": 0.0002384884170034294, "loss": 0.0185, "step": 158200 }, { "epoch": 0.41, "learning_rate": 0.00023848452878705794, "loss": 0.0306, "step": 158210 }, { "epoch": 0.41, "learning_rate": 0.00023848064057068645, "loss": 0.0165, "step": 158220 }, { "epoch": 0.41, "learning_rate": 0.00023847675235431497, "loss": 0.0181, "step": 158230 }, { "epoch": 0.41, "learning_rate": 0.00023847286413794354, "loss": 0.0169, "step": 158240 }, { "epoch": 0.41, "learning_rate": 0.00023846897592157208, "loss": 0.0166, "step": 158250 }, { "epoch": 0.41, "learning_rate": 0.0002384650877052006, "loss": 0.0196, "step": 158260 }, { "epoch": 0.41, "learning_rate": 0.00023846119948882913, "loss": 0.018, "step": 158270 }, { "epoch": 0.41, "learning_rate": 0.00023845731127245768, "loss": 0.0188, "step": 158280 }, { "epoch": 0.41, "learning_rate": 0.00023845342305608622, "loss": 0.0201, "step": 158290 }, { "epoch": 0.41, "learning_rate": 0.00023844953483971473, "loss": 0.019, "step": 158300 }, { "epoch": 0.41, "learning_rate": 0.00023844564662334327, "loss": 0.0227, "step": 158310 }, { "epoch": 0.41, "learning_rate": 0.0002384417584069718, "loss": 0.0196, "step": 158320 }, { "epoch": 0.41, "learning_rate": 0.00023843787019060036, "loss": 0.0229, "step": 158330 }, { "epoch": 0.41, "learning_rate": 0.00023843398197422887, "loss": 0.022, "step": 158340 }, { "epoch": 0.41, "learning_rate": 0.00023843009375785741, "loss": 0.0216, "step": 158350 }, { "epoch": 0.41, "learning_rate": 0.00023842620554148593, "loss": 0.0202, "step": 158360 }, { "epoch": 0.41, "learning_rate": 0.0002384223173251145, "loss": 0.0154, "step": 158370 }, { "epoch": 0.41, "learning_rate": 0.00023841842910874304, "loss": 0.0174, "step": 158380 }, { "epoch": 0.41, "learning_rate": 0.00023841454089237155, "loss": 0.0209, "step": 158390 }, { "epoch": 0.41, "learning_rate": 0.00023841065267600007, "loss": 0.0197, "step": 158400 }, { "epoch": 0.41, "learning_rate": 0.00023840676445962864, "loss": 0.0192, "step": 158410 }, { "epoch": 0.41, "learning_rate": 0.00023840287624325718, "loss": 0.0189, "step": 158420 }, { "epoch": 0.41, "learning_rate": 0.0002383989880268857, "loss": 0.0226, "step": 158430 }, { "epoch": 0.41, "learning_rate": 0.00023839509981051423, "loss": 0.0188, "step": 158440 }, { "epoch": 0.41, "learning_rate": 0.00023839121159414278, "loss": 0.0215, "step": 158450 }, { "epoch": 0.41, "learning_rate": 0.00023838732337777132, "loss": 0.0241, "step": 158460 }, { "epoch": 0.41, "learning_rate": 0.00023838343516139983, "loss": 0.0193, "step": 158470 }, { "epoch": 0.41, "learning_rate": 0.00023837954694502837, "loss": 0.02, "step": 158480 }, { "epoch": 0.41, "learning_rate": 0.00023837565872865692, "loss": 0.0174, "step": 158490 }, { "epoch": 0.41, "learning_rate": 0.00023837177051228546, "loss": 0.0202, "step": 158500 }, { "epoch": 0.41, "learning_rate": 0.00023836788229591397, "loss": 0.0269, "step": 158510 }, { "epoch": 0.41, "learning_rate": 0.0002383639940795425, "loss": 0.0192, "step": 158520 }, { "epoch": 0.41, "learning_rate": 0.00023836010586317108, "loss": 0.0182, "step": 158530 }, { "epoch": 0.41, "learning_rate": 0.0002383562176467996, "loss": 0.0193, "step": 158540 }, { "epoch": 0.41, "learning_rate": 0.0002383523294304281, "loss": 0.0182, "step": 158550 }, { "epoch": 0.41, "learning_rate": 0.00023834844121405665, "loss": 0.0175, "step": 158560 }, { "epoch": 0.41, "learning_rate": 0.00023834455299768517, "loss": 0.0236, "step": 158570 }, { "epoch": 0.41, "learning_rate": 0.00023834066478131374, "loss": 0.0223, "step": 158580 }, { "epoch": 0.41, "learning_rate": 0.00023833677656494228, "loss": 0.0136, "step": 158590 }, { "epoch": 0.41, "learning_rate": 0.0002383328883485708, "loss": 0.0177, "step": 158600 }, { "epoch": 0.41, "learning_rate": 0.00023832900013219933, "loss": 0.017, "step": 158610 }, { "epoch": 0.41, "learning_rate": 0.00023832511191582788, "loss": 0.0189, "step": 158620 }, { "epoch": 0.41, "learning_rate": 0.00023832122369945642, "loss": 0.0231, "step": 158630 }, { "epoch": 0.41, "learning_rate": 0.00023831733548308493, "loss": 0.02, "step": 158640 }, { "epoch": 0.41, "learning_rate": 0.00023831344726671347, "loss": 0.0169, "step": 158650 }, { "epoch": 0.41, "learning_rate": 0.00023830955905034201, "loss": 0.017, "step": 158660 }, { "epoch": 0.41, "learning_rate": 0.00023830567083397056, "loss": 0.0187, "step": 158670 }, { "epoch": 0.41, "learning_rate": 0.00023830178261759907, "loss": 0.0184, "step": 158680 }, { "epoch": 0.41, "learning_rate": 0.0002382978944012276, "loss": 0.0189, "step": 158690 }, { "epoch": 0.41, "learning_rate": 0.00023829400618485618, "loss": 0.0228, "step": 158700 }, { "epoch": 0.41, "learning_rate": 0.0002382901179684847, "loss": 0.0247, "step": 158710 }, { "epoch": 0.41, "learning_rate": 0.0002382862297521132, "loss": 0.0171, "step": 158720 }, { "epoch": 0.41, "learning_rate": 0.00023828234153574175, "loss": 0.0226, "step": 158730 }, { "epoch": 0.41, "learning_rate": 0.00023827845331937032, "loss": 0.0164, "step": 158740 }, { "epoch": 0.41, "learning_rate": 0.00023827456510299884, "loss": 0.0216, "step": 158750 }, { "epoch": 0.41, "learning_rate": 0.00023827067688662738, "loss": 0.0167, "step": 158760 }, { "epoch": 0.41, "learning_rate": 0.0002382667886702559, "loss": 0.0178, "step": 158770 }, { "epoch": 0.41, "learning_rate": 0.00023826290045388446, "loss": 0.0188, "step": 158780 }, { "epoch": 0.41, "learning_rate": 0.00023825901223751297, "loss": 0.021, "step": 158790 }, { "epoch": 0.41, "learning_rate": 0.00023825512402114152, "loss": 0.0195, "step": 158800 }, { "epoch": 0.41, "learning_rate": 0.00023825123580477003, "loss": 0.0191, "step": 158810 }, { "epoch": 0.41, "learning_rate": 0.00023824734758839857, "loss": 0.0184, "step": 158820 }, { "epoch": 0.41, "learning_rate": 0.00023824345937202711, "loss": 0.0227, "step": 158830 }, { "epoch": 0.41, "learning_rate": 0.00023823957115565566, "loss": 0.02, "step": 158840 }, { "epoch": 0.41, "learning_rate": 0.00023823568293928417, "loss": 0.0152, "step": 158850 }, { "epoch": 0.41, "learning_rate": 0.0002382317947229127, "loss": 0.0198, "step": 158860 }, { "epoch": 0.41, "learning_rate": 0.00023822790650654125, "loss": 0.0194, "step": 158870 }, { "epoch": 0.41, "learning_rate": 0.0002382240182901698, "loss": 0.0194, "step": 158880 }, { "epoch": 0.41, "learning_rate": 0.0002382201300737983, "loss": 0.0231, "step": 158890 }, { "epoch": 0.41, "learning_rate": 0.00023821624185742685, "loss": 0.0195, "step": 158900 }, { "epoch": 0.41, "learning_rate": 0.00023821235364105542, "loss": 0.0188, "step": 158910 }, { "epoch": 0.41, "learning_rate": 0.00023820846542468393, "loss": 0.0182, "step": 158920 }, { "epoch": 0.41, "learning_rate": 0.00023820457720831248, "loss": 0.0182, "step": 158930 }, { "epoch": 0.41, "learning_rate": 0.000238200688991941, "loss": 0.018, "step": 158940 }, { "epoch": 0.41, "learning_rate": 0.00023819680077556956, "loss": 0.0177, "step": 158950 }, { "epoch": 0.41, "learning_rate": 0.00023819291255919807, "loss": 0.0155, "step": 158960 }, { "epoch": 0.41, "learning_rate": 0.00023818902434282662, "loss": 0.0174, "step": 158970 }, { "epoch": 0.41, "learning_rate": 0.00023818513612645513, "loss": 0.018, "step": 158980 }, { "epoch": 0.41, "learning_rate": 0.0002381812479100837, "loss": 0.0165, "step": 158990 }, { "epoch": 0.41, "learning_rate": 0.0002381773596937122, "loss": 0.0168, "step": 159000 }, { "epoch": 0.41, "eval_cer": 0.8817796663545476, "eval_loss": 0.013127253390848637, "eval_runtime": 107.1652, "eval_samples_per_second": 18.663, "eval_steps_per_second": 4.666, "step": 159000 }, { "epoch": 0.41, "learning_rate": 0.00023817347147734076, "loss": 0.0213, "step": 159010 }, { "epoch": 0.41, "learning_rate": 0.00023816958326096927, "loss": 0.0207, "step": 159020 }, { "epoch": 0.41, "learning_rate": 0.00023816569504459784, "loss": 0.0185, "step": 159030 }, { "epoch": 0.41, "learning_rate": 0.00023816180682822635, "loss": 0.02, "step": 159040 }, { "epoch": 0.41, "learning_rate": 0.0002381579186118549, "loss": 0.0171, "step": 159050 }, { "epoch": 0.41, "learning_rate": 0.0002381540303954834, "loss": 0.0232, "step": 159060 }, { "epoch": 0.41, "learning_rate": 0.00023815014217911195, "loss": 0.0184, "step": 159070 }, { "epoch": 0.41, "learning_rate": 0.00023814625396274052, "loss": 0.0252, "step": 159080 }, { "epoch": 0.41, "learning_rate": 0.00023814236574636903, "loss": 0.0235, "step": 159090 }, { "epoch": 0.41, "learning_rate": 0.00023813847752999758, "loss": 0.0163, "step": 159100 }, { "epoch": 0.41, "learning_rate": 0.0002381345893136261, "loss": 0.0183, "step": 159110 }, { "epoch": 0.41, "learning_rate": 0.00023813070109725466, "loss": 0.0173, "step": 159120 }, { "epoch": 0.41, "learning_rate": 0.00023812681288088317, "loss": 0.0184, "step": 159130 }, { "epoch": 0.41, "learning_rate": 0.00023812292466451172, "loss": 0.0185, "step": 159140 }, { "epoch": 0.41, "learning_rate": 0.00023811903644814023, "loss": 0.0217, "step": 159150 }, { "epoch": 0.41, "learning_rate": 0.0002381151482317688, "loss": 0.0158, "step": 159160 }, { "epoch": 0.41, "learning_rate": 0.0002381112600153973, "loss": 0.0208, "step": 159170 }, { "epoch": 0.41, "learning_rate": 0.00023810737179902585, "loss": 0.0368, "step": 159180 }, { "epoch": 0.41, "learning_rate": 0.00023810348358265437, "loss": 0.0206, "step": 159190 }, { "epoch": 0.41, "learning_rate": 0.00023809959536628294, "loss": 0.0174, "step": 159200 }, { "epoch": 0.41, "learning_rate": 0.00023809570714991145, "loss": 0.0176, "step": 159210 }, { "epoch": 0.41, "learning_rate": 0.00023809181893354, "loss": 0.0194, "step": 159220 }, { "epoch": 0.41, "learning_rate": 0.0002380879307171685, "loss": 0.024, "step": 159230 }, { "epoch": 0.41, "learning_rate": 0.00023808404250079708, "loss": 0.0173, "step": 159240 }, { "epoch": 0.41, "learning_rate": 0.00023808015428442562, "loss": 0.0232, "step": 159250 }, { "epoch": 0.41, "learning_rate": 0.00023807626606805413, "loss": 0.0241, "step": 159260 }, { "epoch": 0.41, "learning_rate": 0.00023807237785168265, "loss": 0.0184, "step": 159270 }, { "epoch": 0.41, "learning_rate": 0.00023806848963531122, "loss": 0.0199, "step": 159280 }, { "epoch": 0.41, "learning_rate": 0.00023806460141893976, "loss": 0.0239, "step": 159290 }, { "epoch": 0.41, "learning_rate": 0.00023806071320256827, "loss": 0.0284, "step": 159300 }, { "epoch": 0.41, "learning_rate": 0.00023805682498619681, "loss": 0.0208, "step": 159310 }, { "epoch": 0.41, "learning_rate": 0.00023805293676982533, "loss": 0.0183, "step": 159320 }, { "epoch": 0.41, "learning_rate": 0.0002380490485534539, "loss": 0.0159, "step": 159330 }, { "epoch": 0.41, "learning_rate": 0.0002380451603370824, "loss": 0.0157, "step": 159340 }, { "epoch": 0.41, "learning_rate": 0.00023804127212071095, "loss": 0.018, "step": 159350 }, { "epoch": 0.41, "learning_rate": 0.00023803738390433947, "loss": 0.0186, "step": 159360 }, { "epoch": 0.41, "learning_rate": 0.00023803349568796804, "loss": 0.0165, "step": 159370 }, { "epoch": 0.41, "learning_rate": 0.00023802960747159655, "loss": 0.0152, "step": 159380 }, { "epoch": 0.41, "learning_rate": 0.0002380257192552251, "loss": 0.0148, "step": 159390 }, { "epoch": 0.41, "learning_rate": 0.0002380218310388536, "loss": 0.0193, "step": 159400 }, { "epoch": 0.41, "learning_rate": 0.00023801794282248218, "loss": 0.0163, "step": 159410 }, { "epoch": 0.41, "learning_rate": 0.0002380140546061107, "loss": 0.0199, "step": 159420 }, { "epoch": 0.41, "learning_rate": 0.00023801016638973923, "loss": 0.015, "step": 159430 }, { "epoch": 0.41, "learning_rate": 0.00023800627817336775, "loss": 0.0207, "step": 159440 }, { "epoch": 0.41, "learning_rate": 0.00023800238995699632, "loss": 0.014, "step": 159450 }, { "epoch": 0.41, "learning_rate": 0.00023799850174062486, "loss": 0.0194, "step": 159460 }, { "epoch": 0.41, "learning_rate": 0.00023799461352425337, "loss": 0.0143, "step": 159470 }, { "epoch": 0.41, "learning_rate": 0.00023799072530788191, "loss": 0.0255, "step": 159480 }, { "epoch": 0.41, "learning_rate": 0.00023798683709151046, "loss": 0.016, "step": 159490 }, { "epoch": 0.41, "learning_rate": 0.000237982948875139, "loss": 0.0207, "step": 159500 }, { "epoch": 0.41, "learning_rate": 0.0002379790606587675, "loss": 0.0186, "step": 159510 }, { "epoch": 0.41, "learning_rate": 0.00023797517244239605, "loss": 0.0204, "step": 159520 }, { "epoch": 0.41, "learning_rate": 0.0002379712842260246, "loss": 0.0184, "step": 159530 }, { "epoch": 0.41, "learning_rate": 0.00023796739600965314, "loss": 0.0167, "step": 159540 }, { "epoch": 0.41, "learning_rate": 0.00023796350779328165, "loss": 0.0207, "step": 159550 }, { "epoch": 0.41, "learning_rate": 0.0002379596195769102, "loss": 0.022, "step": 159560 }, { "epoch": 0.41, "learning_rate": 0.0002379557313605387, "loss": 0.0195, "step": 159570 }, { "epoch": 0.41, "learning_rate": 0.00023795184314416728, "loss": 0.019, "step": 159580 }, { "epoch": 0.41, "learning_rate": 0.0002379479549277958, "loss": 0.0175, "step": 159590 }, { "epoch": 0.41, "learning_rate": 0.00023794406671142433, "loss": 0.0236, "step": 159600 }, { "epoch": 0.41, "learning_rate": 0.00023794017849505285, "loss": 0.016, "step": 159610 }, { "epoch": 0.41, "learning_rate": 0.00023793629027868142, "loss": 0.0188, "step": 159620 }, { "epoch": 0.41, "learning_rate": 0.00023793240206230996, "loss": 0.0188, "step": 159630 }, { "epoch": 0.41, "learning_rate": 0.00023792851384593847, "loss": 0.0165, "step": 159640 }, { "epoch": 0.41, "learning_rate": 0.000237924625629567, "loss": 0.0147, "step": 159650 }, { "epoch": 0.41, "learning_rate": 0.00023792073741319556, "loss": 0.019, "step": 159660 }, { "epoch": 0.41, "learning_rate": 0.0002379168491968241, "loss": 0.0177, "step": 159670 }, { "epoch": 0.41, "learning_rate": 0.0002379129609804526, "loss": 0.0175, "step": 159680 }, { "epoch": 0.41, "learning_rate": 0.00023790907276408115, "loss": 0.0189, "step": 159690 }, { "epoch": 0.41, "learning_rate": 0.0002379051845477097, "loss": 0.0188, "step": 159700 }, { "epoch": 0.41, "learning_rate": 0.00023790129633133824, "loss": 0.0216, "step": 159710 }, { "epoch": 0.41, "learning_rate": 0.00023789740811496675, "loss": 0.0199, "step": 159720 }, { "epoch": 0.41, "learning_rate": 0.0002378935198985953, "loss": 0.0175, "step": 159730 }, { "epoch": 0.41, "learning_rate": 0.00023788963168222383, "loss": 0.0207, "step": 159740 }, { "epoch": 0.41, "learning_rate": 0.00023788574346585238, "loss": 0.0189, "step": 159750 }, { "epoch": 0.41, "learning_rate": 0.0002378818552494809, "loss": 0.0194, "step": 159760 }, { "epoch": 0.41, "learning_rate": 0.00023787796703310943, "loss": 0.0208, "step": 159770 }, { "epoch": 0.41, "learning_rate": 0.000237874078816738, "loss": 0.0177, "step": 159780 }, { "epoch": 0.41, "learning_rate": 0.00023787019060036651, "loss": 0.0162, "step": 159790 }, { "epoch": 0.41, "learning_rate": 0.00023786630238399506, "loss": 0.021, "step": 159800 }, { "epoch": 0.41, "learning_rate": 0.00023786241416762357, "loss": 0.0159, "step": 159810 }, { "epoch": 0.41, "learning_rate": 0.00023785852595125209, "loss": 0.0189, "step": 159820 }, { "epoch": 0.41, "learning_rate": 0.00023785463773488065, "loss": 0.0165, "step": 159830 }, { "epoch": 0.41, "learning_rate": 0.0002378507495185092, "loss": 0.0214, "step": 159840 }, { "epoch": 0.41, "learning_rate": 0.0002378468613021377, "loss": 0.0307, "step": 159850 }, { "epoch": 0.41, "learning_rate": 0.00023784297308576625, "loss": 0.0163, "step": 159860 }, { "epoch": 0.41, "learning_rate": 0.0002378390848693948, "loss": 0.02, "step": 159870 }, { "epoch": 0.41, "learning_rate": 0.00023783519665302334, "loss": 0.0188, "step": 159880 }, { "epoch": 0.41, "learning_rate": 0.00023783130843665185, "loss": 0.0199, "step": 159890 }, { "epoch": 0.41, "learning_rate": 0.0002378274202202804, "loss": 0.0213, "step": 159900 }, { "epoch": 0.41, "learning_rate": 0.00023782353200390893, "loss": 0.0202, "step": 159910 }, { "epoch": 0.41, "learning_rate": 0.00023781964378753747, "loss": 0.016, "step": 159920 }, { "epoch": 0.41, "learning_rate": 0.000237815755571166, "loss": 0.0176, "step": 159930 }, { "epoch": 0.41, "learning_rate": 0.00023781186735479453, "loss": 0.0165, "step": 159940 }, { "epoch": 0.41, "learning_rate": 0.0002378079791384231, "loss": 0.0203, "step": 159950 }, { "epoch": 0.41, "learning_rate": 0.00023780409092205161, "loss": 0.022, "step": 159960 }, { "epoch": 0.41, "learning_rate": 0.00023780020270568016, "loss": 0.022, "step": 159970 }, { "epoch": 0.41, "learning_rate": 0.00023779631448930867, "loss": 0.0208, "step": 159980 }, { "epoch": 0.41, "learning_rate": 0.00023779242627293724, "loss": 0.0165, "step": 159990 }, { "epoch": 0.41, "learning_rate": 0.00023778853805656575, "loss": 0.017, "step": 160000 }, { "epoch": 0.41, "eval_cer": 0.881806259456297, "eval_loss": 0.013189446181058884, "eval_runtime": 107.4253, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.654, "step": 160000 }, { "epoch": 0.41, "learning_rate": 0.0002377846498401943, "loss": 0.0176, "step": 160010 }, { "epoch": 0.41, "learning_rate": 0.0002377807616238228, "loss": 0.0175, "step": 160020 }, { "epoch": 0.41, "learning_rate": 0.00023777687340745135, "loss": 0.0178, "step": 160030 }, { "epoch": 0.41, "learning_rate": 0.0002377729851910799, "loss": 0.0178, "step": 160040 }, { "epoch": 0.41, "learning_rate": 0.00023776909697470843, "loss": 0.02, "step": 160050 }, { "epoch": 0.41, "learning_rate": 0.00023776520875833695, "loss": 0.0147, "step": 160060 }, { "epoch": 0.41, "learning_rate": 0.0002377613205419655, "loss": 0.0188, "step": 160070 }, { "epoch": 0.41, "learning_rate": 0.00023775743232559403, "loss": 0.0152, "step": 160080 }, { "epoch": 0.41, "learning_rate": 0.00023775354410922257, "loss": 0.0218, "step": 160090 }, { "epoch": 0.42, "learning_rate": 0.0002377496558928511, "loss": 0.0195, "step": 160100 }, { "epoch": 0.42, "learning_rate": 0.00023774576767647963, "loss": 0.0199, "step": 160110 }, { "epoch": 0.42, "learning_rate": 0.0002377418794601082, "loss": 0.0197, "step": 160120 }, { "epoch": 0.42, "learning_rate": 0.00023773799124373671, "loss": 0.0208, "step": 160130 }, { "epoch": 0.42, "learning_rate": 0.00023773410302736523, "loss": 0.0144, "step": 160140 }, { "epoch": 0.42, "learning_rate": 0.00023773021481099377, "loss": 0.0171, "step": 160150 }, { "epoch": 0.42, "learning_rate": 0.00023772632659462234, "loss": 0.018, "step": 160160 }, { "epoch": 0.42, "learning_rate": 0.00023772243837825085, "loss": 0.0189, "step": 160170 }, { "epoch": 0.42, "learning_rate": 0.0002377185501618794, "loss": 0.0174, "step": 160180 }, { "epoch": 0.42, "learning_rate": 0.0002377146619455079, "loss": 0.0198, "step": 160190 }, { "epoch": 0.42, "learning_rate": 0.00023771077372913648, "loss": 0.0163, "step": 160200 }, { "epoch": 0.42, "learning_rate": 0.000237706885512765, "loss": 0.0218, "step": 160210 }, { "epoch": 0.42, "learning_rate": 0.00023770299729639353, "loss": 0.0192, "step": 160220 }, { "epoch": 0.42, "learning_rate": 0.00023769910908002205, "loss": 0.0209, "step": 160230 }, { "epoch": 0.42, "learning_rate": 0.00023769522086365062, "loss": 0.0149, "step": 160240 }, { "epoch": 0.42, "learning_rate": 0.00023769133264727913, "loss": 0.0207, "step": 160250 }, { "epoch": 0.42, "learning_rate": 0.00023768744443090767, "loss": 0.0225, "step": 160260 }, { "epoch": 0.42, "learning_rate": 0.0002376835562145362, "loss": 0.0258, "step": 160270 }, { "epoch": 0.42, "learning_rate": 0.00023767966799816473, "loss": 0.0187, "step": 160280 }, { "epoch": 0.42, "learning_rate": 0.0002376757797817933, "loss": 0.0256, "step": 160290 }, { "epoch": 0.42, "learning_rate": 0.0002376718915654218, "loss": 0.0189, "step": 160300 }, { "epoch": 0.42, "learning_rate": 0.00023766800334905033, "loss": 0.0207, "step": 160310 }, { "epoch": 0.42, "learning_rate": 0.00023766411513267887, "loss": 0.0201, "step": 160320 }, { "epoch": 0.42, "learning_rate": 0.00023766022691630744, "loss": 0.0185, "step": 160330 }, { "epoch": 0.42, "learning_rate": 0.00023765633869993595, "loss": 0.0217, "step": 160340 }, { "epoch": 0.42, "learning_rate": 0.0002376524504835645, "loss": 0.018, "step": 160350 }, { "epoch": 0.42, "learning_rate": 0.000237648562267193, "loss": 0.016, "step": 160360 }, { "epoch": 0.42, "learning_rate": 0.00023764467405082158, "loss": 0.0187, "step": 160370 }, { "epoch": 0.42, "learning_rate": 0.0002376407858344501, "loss": 0.0174, "step": 160380 }, { "epoch": 0.42, "learning_rate": 0.00023763689761807863, "loss": 0.0204, "step": 160390 }, { "epoch": 0.42, "learning_rate": 0.00023763300940170715, "loss": 0.0157, "step": 160400 }, { "epoch": 0.42, "learning_rate": 0.00023762912118533572, "loss": 0.0213, "step": 160410 }, { "epoch": 0.42, "learning_rate": 0.00023762523296896423, "loss": 0.0181, "step": 160420 }, { "epoch": 0.42, "learning_rate": 0.00023762134475259277, "loss": 0.0188, "step": 160430 }, { "epoch": 0.42, "learning_rate": 0.0002376174565362213, "loss": 0.022, "step": 160440 }, { "epoch": 0.42, "learning_rate": 0.00023761356831984986, "loss": 0.0247, "step": 160450 }, { "epoch": 0.42, "learning_rate": 0.00023760968010347837, "loss": 0.0172, "step": 160460 }, { "epoch": 0.42, "learning_rate": 0.0002376057918871069, "loss": 0.0201, "step": 160470 }, { "epoch": 0.42, "learning_rate": 0.00023760190367073543, "loss": 0.0208, "step": 160480 }, { "epoch": 0.42, "learning_rate": 0.000237598015454364, "loss": 0.018, "step": 160490 }, { "epoch": 0.42, "learning_rate": 0.00023759412723799254, "loss": 0.0157, "step": 160500 }, { "epoch": 0.42, "learning_rate": 0.00023759023902162105, "loss": 0.0192, "step": 160510 }, { "epoch": 0.42, "learning_rate": 0.0002375863508052496, "loss": 0.0133, "step": 160520 }, { "epoch": 0.42, "learning_rate": 0.0002375824625888781, "loss": 0.0205, "step": 160530 }, { "epoch": 0.42, "learning_rate": 0.00023757857437250668, "loss": 0.0187, "step": 160540 }, { "epoch": 0.42, "learning_rate": 0.0002375746861561352, "loss": 0.0231, "step": 160550 }, { "epoch": 0.42, "learning_rate": 0.00023757079793976373, "loss": 0.0209, "step": 160560 }, { "epoch": 0.42, "learning_rate": 0.00023756690972339225, "loss": 0.023, "step": 160570 }, { "epoch": 0.42, "learning_rate": 0.00023756302150702082, "loss": 0.0212, "step": 160580 }, { "epoch": 0.42, "learning_rate": 0.00023755913329064933, "loss": 0.016, "step": 160590 }, { "epoch": 0.42, "learning_rate": 0.00023755524507427787, "loss": 0.0211, "step": 160600 }, { "epoch": 0.42, "learning_rate": 0.0002375513568579064, "loss": 0.0203, "step": 160610 }, { "epoch": 0.42, "learning_rate": 0.00023754746864153496, "loss": 0.0207, "step": 160620 }, { "epoch": 0.42, "learning_rate": 0.00023754358042516347, "loss": 0.019, "step": 160630 }, { "epoch": 0.42, "learning_rate": 0.000237539692208792, "loss": 0.0187, "step": 160640 }, { "epoch": 0.42, "learning_rate": 0.00023753580399242053, "loss": 0.0198, "step": 160650 }, { "epoch": 0.42, "learning_rate": 0.0002375319157760491, "loss": 0.0197, "step": 160660 }, { "epoch": 0.42, "learning_rate": 0.00023752802755967764, "loss": 0.0168, "step": 160670 }, { "epoch": 0.42, "learning_rate": 0.00023752413934330615, "loss": 0.0175, "step": 160680 }, { "epoch": 0.42, "learning_rate": 0.0002375202511269347, "loss": 0.0192, "step": 160690 }, { "epoch": 0.42, "learning_rate": 0.00023751636291056323, "loss": 0.0214, "step": 160700 }, { "epoch": 0.42, "learning_rate": 0.00023751247469419178, "loss": 0.0183, "step": 160710 }, { "epoch": 0.42, "learning_rate": 0.0002375085864778203, "loss": 0.0175, "step": 160720 }, { "epoch": 0.42, "learning_rate": 0.00023750469826144883, "loss": 0.0207, "step": 160730 }, { "epoch": 0.42, "learning_rate": 0.00023750081004507737, "loss": 0.0172, "step": 160740 }, { "epoch": 0.42, "learning_rate": 0.00023749692182870592, "loss": 0.018, "step": 160750 }, { "epoch": 0.42, "learning_rate": 0.00023749303361233443, "loss": 0.0172, "step": 160760 }, { "epoch": 0.42, "learning_rate": 0.00023748914539596297, "loss": 0.0187, "step": 160770 }, { "epoch": 0.42, "learning_rate": 0.0002374852571795915, "loss": 0.0224, "step": 160780 }, { "epoch": 0.42, "learning_rate": 0.00023748136896322006, "loss": 0.0221, "step": 160790 }, { "epoch": 0.42, "learning_rate": 0.00023747748074684857, "loss": 0.0215, "step": 160800 }, { "epoch": 0.42, "learning_rate": 0.0002374735925304771, "loss": 0.0192, "step": 160810 }, { "epoch": 0.42, "learning_rate": 0.00023746970431410563, "loss": 0.0178, "step": 160820 }, { "epoch": 0.42, "learning_rate": 0.0002374658160977342, "loss": 0.016, "step": 160830 }, { "epoch": 0.42, "learning_rate": 0.00023746192788136274, "loss": 0.0209, "step": 160840 }, { "epoch": 0.42, "learning_rate": 0.00023745803966499125, "loss": 0.0224, "step": 160850 }, { "epoch": 0.42, "learning_rate": 0.00023745415144861977, "loss": 0.0175, "step": 160860 }, { "epoch": 0.42, "learning_rate": 0.00023745026323224833, "loss": 0.0165, "step": 160870 }, { "epoch": 0.42, "learning_rate": 0.00023744637501587688, "loss": 0.0204, "step": 160880 }, { "epoch": 0.42, "learning_rate": 0.0002374424867995054, "loss": 0.017, "step": 160890 }, { "epoch": 0.42, "learning_rate": 0.00023743859858313393, "loss": 0.0281, "step": 160900 }, { "epoch": 0.42, "learning_rate": 0.00023743471036676247, "loss": 0.0252, "step": 160910 }, { "epoch": 0.42, "learning_rate": 0.00023743082215039102, "loss": 0.0156, "step": 160920 }, { "epoch": 0.42, "learning_rate": 0.00023742693393401953, "loss": 0.0192, "step": 160930 }, { "epoch": 0.42, "learning_rate": 0.00023742304571764807, "loss": 0.0176, "step": 160940 }, { "epoch": 0.42, "learning_rate": 0.0002374191575012766, "loss": 0.0188, "step": 160950 }, { "epoch": 0.42, "learning_rate": 0.00023741526928490515, "loss": 0.0222, "step": 160960 }, { "epoch": 0.42, "learning_rate": 0.00023741138106853367, "loss": 0.0193, "step": 160970 }, { "epoch": 0.42, "learning_rate": 0.0002374074928521622, "loss": 0.016, "step": 160980 }, { "epoch": 0.42, "learning_rate": 0.00023740360463579078, "loss": 0.0219, "step": 160990 }, { "epoch": 0.42, "learning_rate": 0.0002373997164194193, "loss": 0.018, "step": 161000 }, { "epoch": 0.42, "eval_cer": 0.88176706962214, "eval_loss": 0.012851111590862274, "eval_runtime": 107.3307, "eval_samples_per_second": 18.634, "eval_steps_per_second": 4.658, "step": 161000 }, { "epoch": 0.42, "learning_rate": 0.0002373958282030478, "loss": 0.0159, "step": 161010 }, { "epoch": 0.42, "learning_rate": 0.00023739193998667635, "loss": 0.0141, "step": 161020 }, { "epoch": 0.42, "learning_rate": 0.00023738805177030486, "loss": 0.0187, "step": 161030 }, { "epoch": 0.42, "learning_rate": 0.00023738416355393343, "loss": 0.0198, "step": 161040 }, { "epoch": 0.42, "learning_rate": 0.00023738027533756198, "loss": 0.0185, "step": 161050 }, { "epoch": 0.42, "learning_rate": 0.0002373763871211905, "loss": 0.0158, "step": 161060 }, { "epoch": 0.42, "learning_rate": 0.00023737249890481903, "loss": 0.0188, "step": 161070 }, { "epoch": 0.42, "learning_rate": 0.00023736861068844757, "loss": 0.022, "step": 161080 }, { "epoch": 0.42, "learning_rate": 0.00023736472247207611, "loss": 0.0219, "step": 161090 }, { "epoch": 0.42, "learning_rate": 0.00023736083425570463, "loss": 0.0175, "step": 161100 }, { "epoch": 0.42, "learning_rate": 0.00023735694603933317, "loss": 0.0195, "step": 161110 }, { "epoch": 0.42, "learning_rate": 0.0002373530578229617, "loss": 0.0182, "step": 161120 }, { "epoch": 0.42, "learning_rate": 0.00023734916960659025, "loss": 0.0212, "step": 161130 }, { "epoch": 0.42, "learning_rate": 0.00023734528139021877, "loss": 0.0173, "step": 161140 }, { "epoch": 0.42, "learning_rate": 0.0002373413931738473, "loss": 0.0182, "step": 161150 }, { "epoch": 0.42, "learning_rate": 0.00023733750495747588, "loss": 0.0187, "step": 161160 }, { "epoch": 0.42, "learning_rate": 0.0002373336167411044, "loss": 0.0186, "step": 161170 }, { "epoch": 0.42, "learning_rate": 0.0002373297285247329, "loss": 0.0163, "step": 161180 }, { "epoch": 0.42, "learning_rate": 0.00023732584030836145, "loss": 0.0195, "step": 161190 }, { "epoch": 0.42, "learning_rate": 0.00023732195209199002, "loss": 0.0171, "step": 161200 }, { "epoch": 0.42, "learning_rate": 0.00023731806387561853, "loss": 0.0153, "step": 161210 }, { "epoch": 0.42, "learning_rate": 0.00023731417565924707, "loss": 0.0153, "step": 161220 }, { "epoch": 0.42, "learning_rate": 0.0002373102874428756, "loss": 0.0149, "step": 161230 }, { "epoch": 0.42, "learning_rate": 0.00023730639922650416, "loss": 0.0158, "step": 161240 }, { "epoch": 0.42, "learning_rate": 0.00023730251101013267, "loss": 0.0179, "step": 161250 }, { "epoch": 0.42, "learning_rate": 0.00023729862279376121, "loss": 0.0216, "step": 161260 }, { "epoch": 0.42, "learning_rate": 0.00023729473457738973, "loss": 0.0198, "step": 161270 }, { "epoch": 0.42, "learning_rate": 0.00023729084636101827, "loss": 0.0159, "step": 161280 }, { "epoch": 0.42, "learning_rate": 0.0002372869581446468, "loss": 0.0299, "step": 161290 }, { "epoch": 0.42, "learning_rate": 0.00023728306992827535, "loss": 0.0184, "step": 161300 }, { "epoch": 0.42, "learning_rate": 0.00023727918171190387, "loss": 0.0135, "step": 161310 }, { "epoch": 0.42, "learning_rate": 0.0002372752934955324, "loss": 0.0184, "step": 161320 }, { "epoch": 0.42, "learning_rate": 0.00023727140527916095, "loss": 0.0224, "step": 161330 }, { "epoch": 0.42, "learning_rate": 0.0002372675170627895, "loss": 0.0215, "step": 161340 }, { "epoch": 0.42, "learning_rate": 0.000237263628846418, "loss": 0.0195, "step": 161350 }, { "epoch": 0.42, "learning_rate": 0.00023725974063004655, "loss": 0.0169, "step": 161360 }, { "epoch": 0.42, "learning_rate": 0.00023725585241367512, "loss": 0.0191, "step": 161370 }, { "epoch": 0.42, "learning_rate": 0.00023725196419730363, "loss": 0.0158, "step": 161380 }, { "epoch": 0.42, "learning_rate": 0.00023724807598093217, "loss": 0.0187, "step": 161390 }, { "epoch": 0.42, "learning_rate": 0.0002372441877645607, "loss": 0.0202, "step": 161400 }, { "epoch": 0.42, "learning_rate": 0.00023724029954818926, "loss": 0.0181, "step": 161410 }, { "epoch": 0.42, "learning_rate": 0.00023723641133181777, "loss": 0.0175, "step": 161420 }, { "epoch": 0.42, "learning_rate": 0.00023723252311544631, "loss": 0.0194, "step": 161430 }, { "epoch": 0.42, "learning_rate": 0.00023722863489907483, "loss": 0.0191, "step": 161440 }, { "epoch": 0.42, "learning_rate": 0.0002372247466827034, "loss": 0.0178, "step": 161450 }, { "epoch": 0.42, "learning_rate": 0.0002372208584663319, "loss": 0.0167, "step": 161460 }, { "epoch": 0.42, "learning_rate": 0.00023721697024996045, "loss": 0.0245, "step": 161470 }, { "epoch": 0.42, "learning_rate": 0.00023721308203358897, "loss": 0.0216, "step": 161480 }, { "epoch": 0.42, "learning_rate": 0.00023720919381721754, "loss": 0.0184, "step": 161490 }, { "epoch": 0.42, "learning_rate": 0.00023720530560084605, "loss": 0.0152, "step": 161500 }, { "epoch": 0.42, "learning_rate": 0.0002372014173844746, "loss": 0.0213, "step": 161510 }, { "epoch": 0.42, "learning_rate": 0.0002371975291681031, "loss": 0.0183, "step": 161520 }, { "epoch": 0.42, "learning_rate": 0.00023719364095173165, "loss": 0.0214, "step": 161530 }, { "epoch": 0.42, "learning_rate": 0.00023718975273536022, "loss": 0.028, "step": 161540 }, { "epoch": 0.42, "learning_rate": 0.00023718586451898873, "loss": 0.0254, "step": 161550 }, { "epoch": 0.42, "learning_rate": 0.00023718197630261727, "loss": 0.0172, "step": 161560 }, { "epoch": 0.42, "learning_rate": 0.0002371780880862458, "loss": 0.018, "step": 161570 }, { "epoch": 0.42, "learning_rate": 0.00023717419986987436, "loss": 0.0191, "step": 161580 }, { "epoch": 0.42, "learning_rate": 0.00023717031165350287, "loss": 0.016, "step": 161590 }, { "epoch": 0.42, "learning_rate": 0.0002371664234371314, "loss": 0.0216, "step": 161600 }, { "epoch": 0.42, "learning_rate": 0.00023716253522075993, "loss": 0.0156, "step": 161610 }, { "epoch": 0.42, "learning_rate": 0.0002371586470043885, "loss": 0.0167, "step": 161620 }, { "epoch": 0.42, "learning_rate": 0.000237154758788017, "loss": 0.0165, "step": 161630 }, { "epoch": 0.42, "learning_rate": 0.00023715087057164555, "loss": 0.0159, "step": 161640 }, { "epoch": 0.42, "learning_rate": 0.00023714698235527407, "loss": 0.0187, "step": 161650 }, { "epoch": 0.42, "learning_rate": 0.00023714309413890264, "loss": 0.0221, "step": 161660 }, { "epoch": 0.42, "learning_rate": 0.00023713920592253115, "loss": 0.0185, "step": 161670 }, { "epoch": 0.42, "learning_rate": 0.0002371353177061597, "loss": 0.0169, "step": 161680 }, { "epoch": 0.42, "learning_rate": 0.0002371314294897882, "loss": 0.0158, "step": 161690 }, { "epoch": 0.42, "learning_rate": 0.00023712754127341678, "loss": 0.0186, "step": 161700 }, { "epoch": 0.42, "learning_rate": 0.00023712365305704532, "loss": 0.0223, "step": 161710 }, { "epoch": 0.42, "learning_rate": 0.00023711976484067383, "loss": 0.0191, "step": 161720 }, { "epoch": 0.42, "learning_rate": 0.00023711587662430235, "loss": 0.0189, "step": 161730 }, { "epoch": 0.42, "learning_rate": 0.00023711198840793091, "loss": 0.0231, "step": 161740 }, { "epoch": 0.42, "learning_rate": 0.00023710810019155946, "loss": 0.0202, "step": 161750 }, { "epoch": 0.42, "learning_rate": 0.00023710421197518797, "loss": 0.0228, "step": 161760 }, { "epoch": 0.42, "learning_rate": 0.0002371003237588165, "loss": 0.0185, "step": 161770 }, { "epoch": 0.42, "learning_rate": 0.00023709643554244503, "loss": 0.0195, "step": 161780 }, { "epoch": 0.42, "learning_rate": 0.0002370925473260736, "loss": 0.0187, "step": 161790 }, { "epoch": 0.42, "learning_rate": 0.0002370886591097021, "loss": 0.0198, "step": 161800 }, { "epoch": 0.42, "learning_rate": 0.00023708477089333065, "loss": 0.0281, "step": 161810 }, { "epoch": 0.42, "learning_rate": 0.00023708088267695917, "loss": 0.0216, "step": 161820 }, { "epoch": 0.42, "learning_rate": 0.00023707699446058774, "loss": 0.0167, "step": 161830 }, { "epoch": 0.42, "learning_rate": 0.00023707310624421625, "loss": 0.0207, "step": 161840 }, { "epoch": 0.42, "learning_rate": 0.0002370692180278448, "loss": 0.0279, "step": 161850 }, { "epoch": 0.42, "learning_rate": 0.0002370653298114733, "loss": 0.0206, "step": 161860 }, { "epoch": 0.42, "learning_rate": 0.00023706144159510187, "loss": 0.0228, "step": 161870 }, { "epoch": 0.42, "learning_rate": 0.0002370575533787304, "loss": 0.0157, "step": 161880 }, { "epoch": 0.42, "learning_rate": 0.00023705366516235893, "loss": 0.0196, "step": 161890 }, { "epoch": 0.42, "learning_rate": 0.00023704977694598745, "loss": 0.0189, "step": 161900 }, { "epoch": 0.42, "learning_rate": 0.00023704588872961601, "loss": 0.0206, "step": 161910 }, { "epoch": 0.42, "learning_rate": 0.00023704200051324456, "loss": 0.0183, "step": 161920 }, { "epoch": 0.42, "learning_rate": 0.00023703811229687307, "loss": 0.0137, "step": 161930 }, { "epoch": 0.42, "learning_rate": 0.0002370342240805016, "loss": 0.0182, "step": 161940 }, { "epoch": 0.42, "learning_rate": 0.00023703033586413015, "loss": 0.0163, "step": 161950 }, { "epoch": 0.42, "learning_rate": 0.0002370264476477587, "loss": 0.0159, "step": 161960 }, { "epoch": 0.42, "learning_rate": 0.0002370225594313872, "loss": 0.0199, "step": 161970 }, { "epoch": 0.42, "learning_rate": 0.00023701867121501575, "loss": 0.0157, "step": 161980 }, { "epoch": 0.42, "learning_rate": 0.0002370147829986443, "loss": 0.0251, "step": 161990 }, { "epoch": 0.42, "learning_rate": 0.00023701089478227283, "loss": 0.0198, "step": 162000 }, { "epoch": 0.42, "eval_cer": 0.8817796663545476, "eval_loss": 0.012595619075000286, "eval_runtime": 107.3974, "eval_samples_per_second": 18.622, "eval_steps_per_second": 4.656, "step": 162000 }, { "epoch": 0.42, "learning_rate": 0.00023700700656590135, "loss": 0.0167, "step": 162010 }, { "epoch": 0.42, "learning_rate": 0.0002370031183495299, "loss": 0.0218, "step": 162020 }, { "epoch": 0.42, "learning_rate": 0.0002369992301331584, "loss": 0.0321, "step": 162030 }, { "epoch": 0.42, "learning_rate": 0.00023699534191678697, "loss": 0.0219, "step": 162040 }, { "epoch": 0.42, "learning_rate": 0.0002369914537004155, "loss": 0.0177, "step": 162050 }, { "epoch": 0.42, "learning_rate": 0.00023698756548404403, "loss": 0.0219, "step": 162060 }, { "epoch": 0.42, "learning_rate": 0.00023698367726767254, "loss": 0.0203, "step": 162070 }, { "epoch": 0.42, "learning_rate": 0.0002369797890513011, "loss": 0.0198, "step": 162080 }, { "epoch": 0.42, "learning_rate": 0.00023697590083492966, "loss": 0.0263, "step": 162090 }, { "epoch": 0.42, "learning_rate": 0.00023697201261855817, "loss": 0.0153, "step": 162100 }, { "epoch": 0.42, "learning_rate": 0.0002369681244021867, "loss": 0.013, "step": 162110 }, { "epoch": 0.42, "learning_rate": 0.00023696423618581525, "loss": 0.0223, "step": 162120 }, { "epoch": 0.42, "learning_rate": 0.0002369603479694438, "loss": 0.0169, "step": 162130 }, { "epoch": 0.42, "learning_rate": 0.0002369564597530723, "loss": 0.0222, "step": 162140 }, { "epoch": 0.42, "learning_rate": 0.00023695257153670085, "loss": 0.0173, "step": 162150 }, { "epoch": 0.42, "learning_rate": 0.0002369486833203294, "loss": 0.0154, "step": 162160 }, { "epoch": 0.42, "learning_rate": 0.00023694479510395793, "loss": 0.0193, "step": 162170 }, { "epoch": 0.42, "learning_rate": 0.00023694090688758645, "loss": 0.0164, "step": 162180 }, { "epoch": 0.42, "learning_rate": 0.000236937018671215, "loss": 0.0175, "step": 162190 }, { "epoch": 0.42, "learning_rate": 0.00023693313045484353, "loss": 0.0189, "step": 162200 }, { "epoch": 0.42, "learning_rate": 0.00023692924223847207, "loss": 0.0223, "step": 162210 }, { "epoch": 0.42, "learning_rate": 0.0002369253540221006, "loss": 0.0197, "step": 162220 }, { "epoch": 0.42, "learning_rate": 0.00023692146580572913, "loss": 0.0223, "step": 162230 }, { "epoch": 0.42, "learning_rate": 0.0002369175775893577, "loss": 0.018, "step": 162240 }, { "epoch": 0.42, "learning_rate": 0.0002369136893729862, "loss": 0.018, "step": 162250 }, { "epoch": 0.42, "learning_rate": 0.00023690980115661475, "loss": 0.0183, "step": 162260 }, { "epoch": 0.42, "learning_rate": 0.00023690591294024327, "loss": 0.023, "step": 162270 }, { "epoch": 0.42, "learning_rate": 0.0002369020247238718, "loss": 0.0161, "step": 162280 }, { "epoch": 0.42, "learning_rate": 0.00023689813650750035, "loss": 0.0163, "step": 162290 }, { "epoch": 0.42, "learning_rate": 0.0002368942482911289, "loss": 0.0289, "step": 162300 }, { "epoch": 0.42, "learning_rate": 0.0002368903600747574, "loss": 0.0202, "step": 162310 }, { "epoch": 0.42, "learning_rate": 0.00023688647185838595, "loss": 0.0181, "step": 162320 }, { "epoch": 0.42, "learning_rate": 0.0002368825836420145, "loss": 0.0181, "step": 162330 }, { "epoch": 0.42, "learning_rate": 0.00023687869542564303, "loss": 0.0193, "step": 162340 }, { "epoch": 0.42, "learning_rate": 0.00023687480720927155, "loss": 0.0175, "step": 162350 }, { "epoch": 0.42, "learning_rate": 0.0002368709189929001, "loss": 0.0187, "step": 162360 }, { "epoch": 0.42, "learning_rate": 0.00023686703077652863, "loss": 0.0156, "step": 162370 }, { "epoch": 0.42, "learning_rate": 0.00023686314256015717, "loss": 0.018, "step": 162380 }, { "epoch": 0.42, "learning_rate": 0.0002368592543437857, "loss": 0.017, "step": 162390 }, { "epoch": 0.42, "learning_rate": 0.00023685536612741423, "loss": 0.0183, "step": 162400 }, { "epoch": 0.42, "learning_rate": 0.0002368514779110428, "loss": 0.0217, "step": 162410 }, { "epoch": 0.42, "learning_rate": 0.0002368475896946713, "loss": 0.0199, "step": 162420 }, { "epoch": 0.42, "learning_rate": 0.00023684370147829985, "loss": 0.0227, "step": 162430 }, { "epoch": 0.42, "learning_rate": 0.00023683981326192837, "loss": 0.0173, "step": 162440 }, { "epoch": 0.42, "learning_rate": 0.00023683592504555694, "loss": 0.0197, "step": 162450 }, { "epoch": 0.42, "learning_rate": 0.00023683203682918545, "loss": 0.022, "step": 162460 }, { "epoch": 0.42, "learning_rate": 0.000236828148612814, "loss": 0.0161, "step": 162470 }, { "epoch": 0.42, "learning_rate": 0.0002368242603964425, "loss": 0.0236, "step": 162480 }, { "epoch": 0.42, "learning_rate": 0.00023682037218007108, "loss": 0.0208, "step": 162490 }, { "epoch": 0.42, "learning_rate": 0.0002368164839636996, "loss": 0.0205, "step": 162500 }, { "epoch": 0.42, "learning_rate": 0.00023681259574732813, "loss": 0.0173, "step": 162510 }, { "epoch": 0.42, "learning_rate": 0.00023680870753095665, "loss": 0.0154, "step": 162520 }, { "epoch": 0.42, "learning_rate": 0.0002368048193145852, "loss": 0.0197, "step": 162530 }, { "epoch": 0.42, "learning_rate": 0.00023680093109821373, "loss": 0.0185, "step": 162540 }, { "epoch": 0.42, "learning_rate": 0.00023679704288184227, "loss": 0.0145, "step": 162550 }, { "epoch": 0.42, "learning_rate": 0.0002367931546654708, "loss": 0.0218, "step": 162560 }, { "epoch": 0.42, "learning_rate": 0.00023678926644909933, "loss": 0.0184, "step": 162570 }, { "epoch": 0.42, "learning_rate": 0.0002367853782327279, "loss": 0.0169, "step": 162580 }, { "epoch": 0.42, "learning_rate": 0.0002367814900163564, "loss": 0.0229, "step": 162590 }, { "epoch": 0.42, "learning_rate": 0.00023677760179998493, "loss": 0.0197, "step": 162600 }, { "epoch": 0.42, "learning_rate": 0.00023677371358361347, "loss": 0.023, "step": 162610 }, { "epoch": 0.42, "learning_rate": 0.00023676982536724204, "loss": 0.0209, "step": 162620 }, { "epoch": 0.42, "learning_rate": 0.00023676593715087055, "loss": 0.0219, "step": 162630 }, { "epoch": 0.42, "learning_rate": 0.0002367620489344991, "loss": 0.0191, "step": 162640 }, { "epoch": 0.42, "learning_rate": 0.0002367581607181276, "loss": 0.0207, "step": 162650 }, { "epoch": 0.42, "learning_rate": 0.00023675427250175618, "loss": 0.0212, "step": 162660 }, { "epoch": 0.42, "learning_rate": 0.0002367503842853847, "loss": 0.0187, "step": 162670 }, { "epoch": 0.42, "learning_rate": 0.00023674649606901323, "loss": 0.0247, "step": 162680 }, { "epoch": 0.42, "learning_rate": 0.00023674260785264175, "loss": 0.0175, "step": 162690 }, { "epoch": 0.42, "learning_rate": 0.00023673871963627032, "loss": 0.0207, "step": 162700 }, { "epoch": 0.42, "learning_rate": 0.00023673483141989883, "loss": 0.0182, "step": 162710 }, { "epoch": 0.42, "learning_rate": 0.00023673094320352737, "loss": 0.0179, "step": 162720 }, { "epoch": 0.42, "learning_rate": 0.00023672705498715589, "loss": 0.0163, "step": 162730 }, { "epoch": 0.42, "learning_rate": 0.00023672316677078445, "loss": 0.0194, "step": 162740 }, { "epoch": 0.42, "learning_rate": 0.000236719278554413, "loss": 0.0165, "step": 162750 }, { "epoch": 0.42, "learning_rate": 0.0002367153903380415, "loss": 0.021, "step": 162760 }, { "epoch": 0.42, "learning_rate": 0.00023671150212167003, "loss": 0.0177, "step": 162770 }, { "epoch": 0.42, "learning_rate": 0.00023670761390529857, "loss": 0.017, "step": 162780 }, { "epoch": 0.42, "learning_rate": 0.00023670372568892714, "loss": 0.0203, "step": 162790 }, { "epoch": 0.42, "learning_rate": 0.00023669983747255565, "loss": 0.0228, "step": 162800 }, { "epoch": 0.42, "learning_rate": 0.0002366959492561842, "loss": 0.0177, "step": 162810 }, { "epoch": 0.42, "learning_rate": 0.0002366920610398127, "loss": 0.0179, "step": 162820 }, { "epoch": 0.42, "learning_rate": 0.00023668817282344128, "loss": 0.0198, "step": 162830 }, { "epoch": 0.42, "learning_rate": 0.0002366842846070698, "loss": 0.022, "step": 162840 }, { "epoch": 0.42, "learning_rate": 0.00023668039639069833, "loss": 0.0181, "step": 162850 }, { "epoch": 0.42, "learning_rate": 0.00023667650817432685, "loss": 0.0171, "step": 162860 }, { "epoch": 0.42, "learning_rate": 0.00023667261995795541, "loss": 0.0181, "step": 162870 }, { "epoch": 0.42, "learning_rate": 0.00023666873174158393, "loss": 0.0295, "step": 162880 }, { "epoch": 0.42, "learning_rate": 0.00023666484352521247, "loss": 0.0184, "step": 162890 }, { "epoch": 0.42, "learning_rate": 0.00023666095530884099, "loss": 0.0212, "step": 162900 }, { "epoch": 0.42, "learning_rate": 0.00023665706709246955, "loss": 0.0166, "step": 162910 }, { "epoch": 0.42, "learning_rate": 0.00023665317887609807, "loss": 0.0225, "step": 162920 }, { "epoch": 0.42, "learning_rate": 0.0002366492906597266, "loss": 0.0189, "step": 162930 }, { "epoch": 0.42, "learning_rate": 0.00023664540244335513, "loss": 0.0202, "step": 162940 }, { "epoch": 0.42, "learning_rate": 0.0002366415142269837, "loss": 0.0198, "step": 162950 }, { "epoch": 0.42, "learning_rate": 0.00023663762601061224, "loss": 0.016, "step": 162960 }, { "epoch": 0.42, "learning_rate": 0.00023663373779424075, "loss": 0.0164, "step": 162970 }, { "epoch": 0.42, "learning_rate": 0.0002366298495778693, "loss": 0.0193, "step": 162980 }, { "epoch": 0.42, "learning_rate": 0.00023662596136149783, "loss": 0.023, "step": 162990 }, { "epoch": 0.42, "learning_rate": 0.00023662207314512637, "loss": 0.0169, "step": 163000 }, { "epoch": 0.42, "eval_cer": 0.8817838652653501, "eval_loss": 0.01325357798486948, "eval_runtime": 107.3603, "eval_samples_per_second": 18.629, "eval_steps_per_second": 4.657, "step": 163000 }, { "epoch": 0.42, "learning_rate": 0.0002366181849287549, "loss": 0.0191, "step": 163010 }, { "epoch": 0.42, "learning_rate": 0.00023661429671238343, "loss": 0.0161, "step": 163020 }, { "epoch": 0.42, "learning_rate": 0.00023661040849601195, "loss": 0.0211, "step": 163030 }, { "epoch": 0.42, "learning_rate": 0.00023660652027964051, "loss": 0.0191, "step": 163040 }, { "epoch": 0.42, "learning_rate": 0.00023660263206326903, "loss": 0.017, "step": 163050 }, { "epoch": 0.42, "learning_rate": 0.00023659874384689757, "loss": 0.0187, "step": 163060 }, { "epoch": 0.42, "learning_rate": 0.00023659485563052609, "loss": 0.0173, "step": 163070 }, { "epoch": 0.42, "learning_rate": 0.00023659096741415465, "loss": 0.0223, "step": 163080 }, { "epoch": 0.42, "learning_rate": 0.00023658707919778317, "loss": 0.0185, "step": 163090 }, { "epoch": 0.42, "learning_rate": 0.0002365831909814117, "loss": 0.0164, "step": 163100 }, { "epoch": 0.42, "learning_rate": 0.00023657930276504022, "loss": 0.0178, "step": 163110 }, { "epoch": 0.42, "learning_rate": 0.0002365754145486688, "loss": 0.0162, "step": 163120 }, { "epoch": 0.42, "learning_rate": 0.00023657152633229733, "loss": 0.0199, "step": 163130 }, { "epoch": 0.42, "learning_rate": 0.00023656763811592585, "loss": 0.0185, "step": 163140 }, { "epoch": 0.42, "learning_rate": 0.0002365637498995544, "loss": 0.0191, "step": 163150 }, { "epoch": 0.42, "learning_rate": 0.00023655986168318293, "loss": 0.0176, "step": 163160 }, { "epoch": 0.42, "learning_rate": 0.00023655597346681147, "loss": 0.021, "step": 163170 }, { "epoch": 0.42, "learning_rate": 0.00023655208525044, "loss": 0.0187, "step": 163180 }, { "epoch": 0.42, "learning_rate": 0.00023654819703406853, "loss": 0.02, "step": 163190 }, { "epoch": 0.42, "learning_rate": 0.00023654430881769707, "loss": 0.0199, "step": 163200 }, { "epoch": 0.42, "learning_rate": 0.00023654042060132561, "loss": 0.0216, "step": 163210 }, { "epoch": 0.42, "learning_rate": 0.00023653653238495413, "loss": 0.0217, "step": 163220 }, { "epoch": 0.42, "learning_rate": 0.00023653264416858267, "loss": 0.0178, "step": 163230 }, { "epoch": 0.42, "learning_rate": 0.0002365287559522112, "loss": 0.0177, "step": 163240 }, { "epoch": 0.42, "learning_rate": 0.00023652486773583975, "loss": 0.0188, "step": 163250 }, { "epoch": 0.42, "learning_rate": 0.00023652097951946827, "loss": 0.015, "step": 163260 }, { "epoch": 0.42, "learning_rate": 0.0002365170913030968, "loss": 0.0195, "step": 163270 }, { "epoch": 0.42, "learning_rate": 0.00023651320308672532, "loss": 0.018, "step": 163280 }, { "epoch": 0.42, "learning_rate": 0.0002365093148703539, "loss": 0.0173, "step": 163290 }, { "epoch": 0.42, "learning_rate": 0.00023650542665398243, "loss": 0.0207, "step": 163300 }, { "epoch": 0.42, "learning_rate": 0.00023650153843761095, "loss": 0.018, "step": 163310 }, { "epoch": 0.42, "learning_rate": 0.00023649765022123946, "loss": 0.0202, "step": 163320 }, { "epoch": 0.42, "learning_rate": 0.00023649376200486803, "loss": 0.0223, "step": 163330 }, { "epoch": 0.42, "learning_rate": 0.00023648987378849657, "loss": 0.0199, "step": 163340 }, { "epoch": 0.42, "learning_rate": 0.0002364859855721251, "loss": 0.0181, "step": 163350 }, { "epoch": 0.42, "learning_rate": 0.00023648209735575363, "loss": 0.0219, "step": 163360 }, { "epoch": 0.42, "learning_rate": 0.00023647820913938217, "loss": 0.0181, "step": 163370 }, { "epoch": 0.42, "learning_rate": 0.0002364743209230107, "loss": 0.0191, "step": 163380 }, { "epoch": 0.42, "learning_rate": 0.00023647043270663923, "loss": 0.0176, "step": 163390 }, { "epoch": 0.42, "learning_rate": 0.00023646654449026777, "loss": 0.0225, "step": 163400 }, { "epoch": 0.42, "learning_rate": 0.0002364626562738963, "loss": 0.0244, "step": 163410 }, { "epoch": 0.42, "learning_rate": 0.00023645876805752485, "loss": 0.0147, "step": 163420 }, { "epoch": 0.42, "learning_rate": 0.00023645487984115337, "loss": 0.0217, "step": 163430 }, { "epoch": 0.42, "learning_rate": 0.0002364509916247819, "loss": 0.0198, "step": 163440 }, { "epoch": 0.42, "learning_rate": 0.00023644710340841048, "loss": 0.0204, "step": 163450 }, { "epoch": 0.42, "learning_rate": 0.000236443215192039, "loss": 0.0188, "step": 163460 }, { "epoch": 0.42, "learning_rate": 0.0002364393269756675, "loss": 0.0245, "step": 163470 }, { "epoch": 0.42, "learning_rate": 0.00023643543875929605, "loss": 0.0248, "step": 163480 }, { "epoch": 0.42, "learning_rate": 0.00023643155054292462, "loss": 0.0224, "step": 163490 }, { "epoch": 0.42, "learning_rate": 0.00023642766232655313, "loss": 0.0174, "step": 163500 }, { "epoch": 0.42, "learning_rate": 0.00023642377411018167, "loss": 0.0202, "step": 163510 }, { "epoch": 0.42, "learning_rate": 0.0002364198858938102, "loss": 0.0213, "step": 163520 }, { "epoch": 0.42, "learning_rate": 0.00023641599767743873, "loss": 0.0194, "step": 163530 }, { "epoch": 0.42, "learning_rate": 0.00023641210946106727, "loss": 0.0191, "step": 163540 }, { "epoch": 0.42, "learning_rate": 0.0002364082212446958, "loss": 0.0247, "step": 163550 }, { "epoch": 0.42, "learning_rate": 0.00023640433302832433, "loss": 0.0207, "step": 163560 }, { "epoch": 0.42, "learning_rate": 0.00023640044481195287, "loss": 0.0187, "step": 163570 }, { "epoch": 0.42, "learning_rate": 0.0002363965565955814, "loss": 0.02, "step": 163580 }, { "epoch": 0.42, "learning_rate": 0.00023639266837920995, "loss": 0.0221, "step": 163590 }, { "epoch": 0.42, "learning_rate": 0.00023638878016283847, "loss": 0.0211, "step": 163600 }, { "epoch": 0.42, "learning_rate": 0.000236384891946467, "loss": 0.0171, "step": 163610 }, { "epoch": 0.42, "learning_rate": 0.00023638100373009558, "loss": 0.032, "step": 163620 }, { "epoch": 0.42, "learning_rate": 0.0002363771155137241, "loss": 0.0301, "step": 163630 }, { "epoch": 0.42, "learning_rate": 0.0002363732272973526, "loss": 0.0198, "step": 163640 }, { "epoch": 0.42, "learning_rate": 0.00023636933908098115, "loss": 0.014, "step": 163650 }, { "epoch": 0.42, "learning_rate": 0.00023636545086460972, "loss": 0.0197, "step": 163660 }, { "epoch": 0.42, "learning_rate": 0.00023636156264823823, "loss": 0.0213, "step": 163670 }, { "epoch": 0.42, "learning_rate": 0.00023635767443186677, "loss": 0.0198, "step": 163680 }, { "epoch": 0.42, "learning_rate": 0.0002363537862154953, "loss": 0.0191, "step": 163690 }, { "epoch": 0.42, "learning_rate": 0.00023634989799912386, "loss": 0.0169, "step": 163700 }, { "epoch": 0.42, "learning_rate": 0.00023634600978275237, "loss": 0.0214, "step": 163710 }, { "epoch": 0.42, "learning_rate": 0.0002363421215663809, "loss": 0.0211, "step": 163720 }, { "epoch": 0.42, "learning_rate": 0.00023633823335000943, "loss": 0.018, "step": 163730 }, { "epoch": 0.42, "learning_rate": 0.000236334345133638, "loss": 0.0208, "step": 163740 }, { "epoch": 0.42, "learning_rate": 0.0002363304569172665, "loss": 0.0175, "step": 163750 }, { "epoch": 0.42, "learning_rate": 0.00023632656870089505, "loss": 0.0211, "step": 163760 }, { "epoch": 0.42, "learning_rate": 0.00023632268048452357, "loss": 0.0181, "step": 163770 }, { "epoch": 0.42, "learning_rate": 0.0002363187922681521, "loss": 0.0223, "step": 163780 }, { "epoch": 0.42, "learning_rate": 0.00023631490405178065, "loss": 0.0177, "step": 163790 }, { "epoch": 0.42, "learning_rate": 0.0002363110158354092, "loss": 0.0194, "step": 163800 }, { "epoch": 0.42, "learning_rate": 0.0002363071276190377, "loss": 0.0203, "step": 163810 }, { "epoch": 0.42, "learning_rate": 0.00023630323940266625, "loss": 0.0139, "step": 163820 }, { "epoch": 0.42, "learning_rate": 0.00023629935118629482, "loss": 0.0236, "step": 163830 }, { "epoch": 0.42, "learning_rate": 0.00023629546296992333, "loss": 0.02, "step": 163840 }, { "epoch": 0.42, "learning_rate": 0.00023629157475355187, "loss": 0.0163, "step": 163850 }, { "epoch": 0.42, "learning_rate": 0.0002362876865371804, "loss": 0.0183, "step": 163860 }, { "epoch": 0.42, "learning_rate": 0.00023628379832080896, "loss": 0.0223, "step": 163870 }, { "epoch": 0.42, "learning_rate": 0.00023627991010443747, "loss": 0.0246, "step": 163880 }, { "epoch": 0.42, "learning_rate": 0.000236276021888066, "loss": 0.0154, "step": 163890 }, { "epoch": 0.42, "learning_rate": 0.00023627213367169453, "loss": 0.0198, "step": 163900 }, { "epoch": 0.42, "learning_rate": 0.0002362682454553231, "loss": 0.0202, "step": 163910 }, { "epoch": 0.42, "learning_rate": 0.0002362643572389516, "loss": 0.0222, "step": 163920 }, { "epoch": 0.42, "learning_rate": 0.00023626046902258015, "loss": 0.0203, "step": 163930 }, { "epoch": 0.42, "learning_rate": 0.00023625658080620867, "loss": 0.0202, "step": 163940 }, { "epoch": 0.42, "learning_rate": 0.00023625269258983723, "loss": 0.0308, "step": 163950 }, { "epoch": 0.43, "learning_rate": 0.00023624880437346575, "loss": 0.0221, "step": 163960 }, { "epoch": 0.43, "learning_rate": 0.0002362449161570943, "loss": 0.0198, "step": 163970 }, { "epoch": 0.43, "learning_rate": 0.0002362410279407228, "loss": 0.02, "step": 163980 }, { "epoch": 0.43, "learning_rate": 0.00023623713972435137, "loss": 0.0207, "step": 163990 }, { "epoch": 0.43, "learning_rate": 0.00023623325150797992, "loss": 0.0232, "step": 164000 }, { "epoch": 0.43, "eval_cer": 0.8817880641761527, "eval_loss": 0.012865516357123852, "eval_runtime": 107.376, "eval_samples_per_second": 18.626, "eval_steps_per_second": 4.657, "step": 164000 }, { "epoch": 0.43, "learning_rate": 0.00023622936329160843, "loss": 0.0242, "step": 164010 }, { "epoch": 0.43, "learning_rate": 0.00023622547507523697, "loss": 0.0177, "step": 164020 }, { "epoch": 0.43, "learning_rate": 0.00023622158685886549, "loss": 0.0212, "step": 164030 }, { "epoch": 0.43, "learning_rate": 0.00023621769864249405, "loss": 0.0168, "step": 164040 }, { "epoch": 0.43, "learning_rate": 0.00023621381042612257, "loss": 0.0172, "step": 164050 }, { "epoch": 0.43, "learning_rate": 0.0002362099222097511, "loss": 0.0189, "step": 164060 }, { "epoch": 0.43, "learning_rate": 0.00023620603399337963, "loss": 0.0159, "step": 164070 }, { "epoch": 0.43, "learning_rate": 0.0002362021457770082, "loss": 0.017, "step": 164080 }, { "epoch": 0.43, "learning_rate": 0.0002361982575606367, "loss": 0.0186, "step": 164090 }, { "epoch": 0.43, "learning_rate": 0.00023619436934426525, "loss": 0.0181, "step": 164100 }, { "epoch": 0.43, "learning_rate": 0.00023619048112789376, "loss": 0.0147, "step": 164110 }, { "epoch": 0.43, "learning_rate": 0.00023618659291152233, "loss": 0.0163, "step": 164120 }, { "epoch": 0.43, "learning_rate": 0.00023618270469515085, "loss": 0.0173, "step": 164130 }, { "epoch": 0.43, "learning_rate": 0.0002361788164787794, "loss": 0.0176, "step": 164140 }, { "epoch": 0.43, "learning_rate": 0.0002361749282624079, "loss": 0.0204, "step": 164150 }, { "epoch": 0.43, "learning_rate": 0.00023617104004603647, "loss": 0.0195, "step": 164160 }, { "epoch": 0.43, "learning_rate": 0.00023616715182966501, "loss": 0.0208, "step": 164170 }, { "epoch": 0.43, "learning_rate": 0.00023616326361329353, "loss": 0.02, "step": 164180 }, { "epoch": 0.43, "learning_rate": 0.00023615937539692204, "loss": 0.0198, "step": 164190 }, { "epoch": 0.43, "learning_rate": 0.0002361554871805506, "loss": 0.0178, "step": 164200 }, { "epoch": 0.43, "learning_rate": 0.00023615159896417915, "loss": 0.0147, "step": 164210 }, { "epoch": 0.43, "learning_rate": 0.00023614771074780767, "loss": 0.0185, "step": 164220 }, { "epoch": 0.43, "learning_rate": 0.0002361438225314362, "loss": 0.0192, "step": 164230 }, { "epoch": 0.43, "learning_rate": 0.00023613993431506475, "loss": 0.0231, "step": 164240 }, { "epoch": 0.43, "learning_rate": 0.0002361360460986933, "loss": 0.0197, "step": 164250 }, { "epoch": 0.43, "learning_rate": 0.0002361321578823218, "loss": 0.0159, "step": 164260 }, { "epoch": 0.43, "learning_rate": 0.00023612826966595035, "loss": 0.0188, "step": 164270 }, { "epoch": 0.43, "learning_rate": 0.00023612438144957886, "loss": 0.0216, "step": 164280 }, { "epoch": 0.43, "learning_rate": 0.00023612049323320743, "loss": 0.0205, "step": 164290 }, { "epoch": 0.43, "learning_rate": 0.00023611660501683595, "loss": 0.0206, "step": 164300 }, { "epoch": 0.43, "learning_rate": 0.0002361127168004645, "loss": 0.016, "step": 164310 }, { "epoch": 0.43, "learning_rate": 0.000236108828584093, "loss": 0.0152, "step": 164320 }, { "epoch": 0.43, "learning_rate": 0.00023610494036772157, "loss": 0.0216, "step": 164330 }, { "epoch": 0.43, "learning_rate": 0.00023610105215135011, "loss": 0.0196, "step": 164340 }, { "epoch": 0.43, "learning_rate": 0.00023609716393497863, "loss": 0.0174, "step": 164350 }, { "epoch": 0.43, "learning_rate": 0.00023609327571860714, "loss": 0.0198, "step": 164360 }, { "epoch": 0.43, "learning_rate": 0.0002360893875022357, "loss": 0.0209, "step": 164370 }, { "epoch": 0.43, "learning_rate": 0.00023608549928586425, "loss": 0.0196, "step": 164380 }, { "epoch": 0.43, "learning_rate": 0.00023608161106949277, "loss": 0.0195, "step": 164390 }, { "epoch": 0.43, "learning_rate": 0.0002360777228531213, "loss": 0.0191, "step": 164400 }, { "epoch": 0.43, "learning_rate": 0.00023607383463674985, "loss": 0.0145, "step": 164410 }, { "epoch": 0.43, "learning_rate": 0.0002360699464203784, "loss": 0.0182, "step": 164420 }, { "epoch": 0.43, "learning_rate": 0.0002360660582040069, "loss": 0.0206, "step": 164430 }, { "epoch": 0.43, "learning_rate": 0.00023606216998763545, "loss": 0.0152, "step": 164440 }, { "epoch": 0.43, "learning_rate": 0.000236058281771264, "loss": 0.0185, "step": 164450 }, { "epoch": 0.43, "learning_rate": 0.00023605439355489253, "loss": 0.019, "step": 164460 }, { "epoch": 0.43, "learning_rate": 0.00023605050533852105, "loss": 0.0172, "step": 164470 }, { "epoch": 0.43, "learning_rate": 0.0002360466171221496, "loss": 0.0165, "step": 164480 }, { "epoch": 0.43, "learning_rate": 0.00023604272890577816, "loss": 0.0197, "step": 164490 }, { "epoch": 0.43, "learning_rate": 0.00023603884068940667, "loss": 0.0176, "step": 164500 }, { "epoch": 0.43, "learning_rate": 0.0002360349524730352, "loss": 0.0171, "step": 164510 }, { "epoch": 0.43, "learning_rate": 0.00023603106425666373, "loss": 0.0199, "step": 164520 }, { "epoch": 0.43, "learning_rate": 0.00023602717604029224, "loss": 0.0158, "step": 164530 }, { "epoch": 0.43, "learning_rate": 0.0002360232878239208, "loss": 0.0179, "step": 164540 }, { "epoch": 0.43, "learning_rate": 0.00023601939960754935, "loss": 0.0195, "step": 164550 }, { "epoch": 0.43, "learning_rate": 0.00023601551139117787, "loss": 0.0164, "step": 164560 }, { "epoch": 0.43, "learning_rate": 0.0002360116231748064, "loss": 0.0142, "step": 164570 }, { "epoch": 0.43, "learning_rate": 0.00023600773495843495, "loss": 0.0159, "step": 164580 }, { "epoch": 0.43, "learning_rate": 0.0002360038467420635, "loss": 0.0182, "step": 164590 }, { "epoch": 0.43, "learning_rate": 0.000235999958525692, "loss": 0.0196, "step": 164600 }, { "epoch": 0.43, "learning_rate": 0.00023599607030932055, "loss": 0.0216, "step": 164610 }, { "epoch": 0.43, "learning_rate": 0.0002359921820929491, "loss": 0.0217, "step": 164620 }, { "epoch": 0.43, "learning_rate": 0.00023598829387657763, "loss": 0.0224, "step": 164630 }, { "epoch": 0.43, "learning_rate": 0.00023598440566020615, "loss": 0.0166, "step": 164640 }, { "epoch": 0.43, "learning_rate": 0.0002359805174438347, "loss": 0.0206, "step": 164650 }, { "epoch": 0.43, "learning_rate": 0.00023597662922746323, "loss": 0.0191, "step": 164660 }, { "epoch": 0.43, "learning_rate": 0.00023597274101109177, "loss": 0.0213, "step": 164670 }, { "epoch": 0.43, "learning_rate": 0.00023596885279472029, "loss": 0.0157, "step": 164680 }, { "epoch": 0.43, "learning_rate": 0.00023596496457834883, "loss": 0.0219, "step": 164690 }, { "epoch": 0.43, "learning_rate": 0.0002359610763619774, "loss": 0.0183, "step": 164700 }, { "epoch": 0.43, "learning_rate": 0.0002359571881456059, "loss": 0.0186, "step": 164710 }, { "epoch": 0.43, "learning_rate": 0.00023595329992923445, "loss": 0.027, "step": 164720 }, { "epoch": 0.43, "learning_rate": 0.00023594941171286297, "loss": 0.02, "step": 164730 }, { "epoch": 0.43, "learning_rate": 0.00023594552349649154, "loss": 0.0167, "step": 164740 }, { "epoch": 0.43, "learning_rate": 0.00023594163528012005, "loss": 0.017, "step": 164750 }, { "epoch": 0.43, "learning_rate": 0.0002359377470637486, "loss": 0.0214, "step": 164760 }, { "epoch": 0.43, "learning_rate": 0.0002359338588473771, "loss": 0.0223, "step": 164770 }, { "epoch": 0.43, "learning_rate": 0.00023592997063100565, "loss": 0.0245, "step": 164780 }, { "epoch": 0.43, "learning_rate": 0.0002359260824146342, "loss": 0.0188, "step": 164790 }, { "epoch": 0.43, "learning_rate": 0.00023592219419826273, "loss": 0.0228, "step": 164800 }, { "epoch": 0.43, "learning_rate": 0.00023591830598189125, "loss": 0.018, "step": 164810 }, { "epoch": 0.43, "learning_rate": 0.0002359144177655198, "loss": 0.0189, "step": 164820 }, { "epoch": 0.43, "learning_rate": 0.00023591052954914833, "loss": 0.0187, "step": 164830 }, { "epoch": 0.43, "learning_rate": 0.00023590664133277687, "loss": 0.0205, "step": 164840 }, { "epoch": 0.43, "learning_rate": 0.00023590275311640539, "loss": 0.0218, "step": 164850 }, { "epoch": 0.43, "learning_rate": 0.00023589886490003393, "loss": 0.0211, "step": 164860 }, { "epoch": 0.43, "learning_rate": 0.0002358949766836625, "loss": 0.0211, "step": 164870 }, { "epoch": 0.43, "learning_rate": 0.000235891088467291, "loss": 0.0174, "step": 164880 }, { "epoch": 0.43, "learning_rate": 0.00023588720025091955, "loss": 0.0201, "step": 164890 }, { "epoch": 0.43, "learning_rate": 0.00023588331203454807, "loss": 0.0188, "step": 164900 }, { "epoch": 0.43, "learning_rate": 0.00023587942381817664, "loss": 0.0188, "step": 164910 }, { "epoch": 0.43, "learning_rate": 0.00023587553560180515, "loss": 0.0241, "step": 164920 }, { "epoch": 0.43, "learning_rate": 0.0002358716473854337, "loss": 0.0192, "step": 164930 }, { "epoch": 0.43, "learning_rate": 0.0002358677591690622, "loss": 0.024, "step": 164940 }, { "epoch": 0.43, "learning_rate": 0.00023586387095269077, "loss": 0.0158, "step": 164950 }, { "epoch": 0.43, "learning_rate": 0.0002358599827363193, "loss": 0.0174, "step": 164960 }, { "epoch": 0.43, "learning_rate": 0.00023585609451994783, "loss": 0.0197, "step": 164970 }, { "epoch": 0.43, "learning_rate": 0.00023585220630357635, "loss": 0.0201, "step": 164980 }, { "epoch": 0.43, "learning_rate": 0.00023584831808720491, "loss": 0.0168, "step": 164990 }, { "epoch": 0.43, "learning_rate": 0.00023584442987083343, "loss": 0.0178, "step": 165000 }, { "epoch": 0.43, "eval_cer": 0.8818048598193629, "eval_loss": 0.013063205406069756, "eval_runtime": 107.4075, "eval_samples_per_second": 18.621, "eval_steps_per_second": 4.655, "step": 165000 }, { "epoch": 0.43, "learning_rate": 0.00023584054165446197, "loss": 0.0151, "step": 165010 }, { "epoch": 0.43, "learning_rate": 0.00023583665343809048, "loss": 0.0214, "step": 165020 }, { "epoch": 0.43, "learning_rate": 0.00023583276522171903, "loss": 0.0214, "step": 165030 }, { "epoch": 0.43, "learning_rate": 0.0002358288770053476, "loss": 0.018, "step": 165040 }, { "epoch": 0.43, "learning_rate": 0.0002358249887889761, "loss": 0.0195, "step": 165050 }, { "epoch": 0.43, "learning_rate": 0.00023582110057260462, "loss": 0.02, "step": 165060 }, { "epoch": 0.43, "learning_rate": 0.00023581721235623317, "loss": 0.0251, "step": 165070 }, { "epoch": 0.43, "learning_rate": 0.00023581332413986173, "loss": 0.019, "step": 165080 }, { "epoch": 0.43, "learning_rate": 0.00023580943592349025, "loss": 0.0247, "step": 165090 }, { "epoch": 0.43, "learning_rate": 0.0002358055477071188, "loss": 0.0161, "step": 165100 }, { "epoch": 0.43, "learning_rate": 0.0002358016594907473, "loss": 0.0223, "step": 165110 }, { "epoch": 0.43, "learning_rate": 0.00023579777127437587, "loss": 0.0181, "step": 165120 }, { "epoch": 0.43, "learning_rate": 0.0002357938830580044, "loss": 0.0173, "step": 165130 }, { "epoch": 0.43, "learning_rate": 0.00023578999484163293, "loss": 0.0205, "step": 165140 }, { "epoch": 0.43, "learning_rate": 0.00023578610662526144, "loss": 0.0191, "step": 165150 }, { "epoch": 0.43, "learning_rate": 0.00023578221840889, "loss": 0.016, "step": 165160 }, { "epoch": 0.43, "learning_rate": 0.00023577833019251853, "loss": 0.0187, "step": 165170 }, { "epoch": 0.43, "learning_rate": 0.00023577444197614707, "loss": 0.0209, "step": 165180 }, { "epoch": 0.43, "learning_rate": 0.00023577055375977558, "loss": 0.0234, "step": 165190 }, { "epoch": 0.43, "learning_rate": 0.00023576666554340415, "loss": 0.0176, "step": 165200 }, { "epoch": 0.43, "learning_rate": 0.0002357627773270327, "loss": 0.0174, "step": 165210 }, { "epoch": 0.43, "learning_rate": 0.0002357588891106612, "loss": 0.0178, "step": 165220 }, { "epoch": 0.43, "learning_rate": 0.00023575500089428972, "loss": 0.0185, "step": 165230 }, { "epoch": 0.43, "learning_rate": 0.00023575111267791827, "loss": 0.0173, "step": 165240 }, { "epoch": 0.43, "learning_rate": 0.00023574722446154683, "loss": 0.0176, "step": 165250 }, { "epoch": 0.43, "learning_rate": 0.00023574333624517535, "loss": 0.0193, "step": 165260 }, { "epoch": 0.43, "learning_rate": 0.0002357394480288039, "loss": 0.0219, "step": 165270 }, { "epoch": 0.43, "learning_rate": 0.0002357355598124324, "loss": 0.02, "step": 165280 }, { "epoch": 0.43, "learning_rate": 0.00023573167159606097, "loss": 0.0199, "step": 165290 }, { "epoch": 0.43, "learning_rate": 0.0002357277833796895, "loss": 0.0185, "step": 165300 }, { "epoch": 0.43, "learning_rate": 0.00023572389516331803, "loss": 0.0228, "step": 165310 }, { "epoch": 0.43, "learning_rate": 0.00023572000694694654, "loss": 0.0217, "step": 165320 }, { "epoch": 0.43, "learning_rate": 0.0002357161187305751, "loss": 0.0228, "step": 165330 }, { "epoch": 0.43, "learning_rate": 0.00023571223051420363, "loss": 0.0172, "step": 165340 }, { "epoch": 0.43, "learning_rate": 0.00023570834229783217, "loss": 0.0168, "step": 165350 }, { "epoch": 0.43, "learning_rate": 0.00023570445408146068, "loss": 0.0174, "step": 165360 }, { "epoch": 0.43, "learning_rate": 0.00023570056586508925, "loss": 0.0258, "step": 165370 }, { "epoch": 0.43, "learning_rate": 0.00023569667764871777, "loss": 0.0146, "step": 165380 }, { "epoch": 0.43, "learning_rate": 0.0002356927894323463, "loss": 0.0167, "step": 165390 }, { "epoch": 0.43, "learning_rate": 0.00023568890121597482, "loss": 0.0177, "step": 165400 }, { "epoch": 0.43, "learning_rate": 0.0002356850129996034, "loss": 0.0147, "step": 165410 }, { "epoch": 0.43, "learning_rate": 0.00023568112478323193, "loss": 0.0166, "step": 165420 }, { "epoch": 0.43, "learning_rate": 0.00023567723656686045, "loss": 0.0205, "step": 165430 }, { "epoch": 0.43, "learning_rate": 0.000235673348350489, "loss": 0.0204, "step": 165440 }, { "epoch": 0.43, "learning_rate": 0.00023566946013411753, "loss": 0.0186, "step": 165450 }, { "epoch": 0.43, "learning_rate": 0.00023566557191774607, "loss": 0.0138, "step": 165460 }, { "epoch": 0.43, "learning_rate": 0.0002356616837013746, "loss": 0.015, "step": 165470 }, { "epoch": 0.43, "learning_rate": 0.00023565779548500313, "loss": 0.0178, "step": 165480 }, { "epoch": 0.43, "learning_rate": 0.00023565390726863164, "loss": 0.0237, "step": 165490 }, { "epoch": 0.43, "learning_rate": 0.0002356500190522602, "loss": 0.0173, "step": 165500 }, { "epoch": 0.43, "learning_rate": 0.00023564613083588873, "loss": 0.0191, "step": 165510 }, { "epoch": 0.43, "learning_rate": 0.00023564224261951727, "loss": 0.0223, "step": 165520 }, { "epoch": 0.43, "learning_rate": 0.00023563835440314578, "loss": 0.0236, "step": 165530 }, { "epoch": 0.43, "learning_rate": 0.00023563446618677435, "loss": 0.0214, "step": 165540 }, { "epoch": 0.43, "learning_rate": 0.00023563057797040287, "loss": 0.0201, "step": 165550 }, { "epoch": 0.43, "learning_rate": 0.0002356266897540314, "loss": 0.0189, "step": 165560 }, { "epoch": 0.43, "learning_rate": 0.00023562280153765992, "loss": 0.0194, "step": 165570 }, { "epoch": 0.43, "learning_rate": 0.0002356189133212885, "loss": 0.0153, "step": 165580 }, { "epoch": 0.43, "learning_rate": 0.00023561502510491703, "loss": 0.0171, "step": 165590 }, { "epoch": 0.43, "learning_rate": 0.00023561113688854555, "loss": 0.0172, "step": 165600 }, { "epoch": 0.43, "learning_rate": 0.0002356072486721741, "loss": 0.0217, "step": 165610 }, { "epoch": 0.43, "learning_rate": 0.00023560336045580263, "loss": 0.0167, "step": 165620 }, { "epoch": 0.43, "learning_rate": 0.00023559947223943117, "loss": 0.015, "step": 165630 }, { "epoch": 0.43, "learning_rate": 0.0002355955840230597, "loss": 0.0194, "step": 165640 }, { "epoch": 0.43, "learning_rate": 0.00023559169580668823, "loss": 0.0203, "step": 165650 }, { "epoch": 0.43, "learning_rate": 0.00023558780759031677, "loss": 0.0207, "step": 165660 }, { "epoch": 0.43, "learning_rate": 0.0002355839193739453, "loss": 0.0175, "step": 165670 }, { "epoch": 0.43, "learning_rate": 0.00023558003115757383, "loss": 0.021, "step": 165680 }, { "epoch": 0.43, "learning_rate": 0.00023557614294120237, "loss": 0.0191, "step": 165690 }, { "epoch": 0.43, "learning_rate": 0.0002355722547248309, "loss": 0.02, "step": 165700 }, { "epoch": 0.43, "learning_rate": 0.00023556836650845945, "loss": 0.0192, "step": 165710 }, { "epoch": 0.43, "learning_rate": 0.00023556447829208797, "loss": 0.0195, "step": 165720 }, { "epoch": 0.43, "learning_rate": 0.0002355605900757165, "loss": 0.0201, "step": 165730 }, { "epoch": 0.43, "learning_rate": 0.00023555670185934502, "loss": 0.0187, "step": 165740 }, { "epoch": 0.43, "learning_rate": 0.0002355528136429736, "loss": 0.0194, "step": 165750 }, { "epoch": 0.43, "learning_rate": 0.00023554892542660213, "loss": 0.021, "step": 165760 }, { "epoch": 0.43, "learning_rate": 0.00023554503721023065, "loss": 0.0194, "step": 165770 }, { "epoch": 0.43, "learning_rate": 0.00023554114899385916, "loss": 0.0143, "step": 165780 }, { "epoch": 0.43, "learning_rate": 0.00023553726077748773, "loss": 0.0205, "step": 165790 }, { "epoch": 0.43, "learning_rate": 0.00023553337256111627, "loss": 0.0194, "step": 165800 }, { "epoch": 0.43, "learning_rate": 0.00023552948434474479, "loss": 0.0189, "step": 165810 }, { "epoch": 0.43, "learning_rate": 0.00023552559612837333, "loss": 0.0227, "step": 165820 }, { "epoch": 0.43, "learning_rate": 0.00023552170791200187, "loss": 0.02, "step": 165830 }, { "epoch": 0.43, "learning_rate": 0.0002355178196956304, "loss": 0.0151, "step": 165840 }, { "epoch": 0.43, "learning_rate": 0.00023551393147925893, "loss": 0.0193, "step": 165850 }, { "epoch": 0.43, "learning_rate": 0.00023551004326288747, "loss": 0.0189, "step": 165860 }, { "epoch": 0.43, "learning_rate": 0.000235506155046516, "loss": 0.0204, "step": 165870 }, { "epoch": 0.43, "learning_rate": 0.00023550226683014455, "loss": 0.0178, "step": 165880 }, { "epoch": 0.43, "learning_rate": 0.00023549837861377307, "loss": 0.0166, "step": 165890 }, { "epoch": 0.43, "learning_rate": 0.0002354944903974016, "loss": 0.0166, "step": 165900 }, { "epoch": 0.43, "learning_rate": 0.00023549060218103018, "loss": 0.0185, "step": 165910 }, { "epoch": 0.43, "learning_rate": 0.0002354867139646587, "loss": 0.0174, "step": 165920 }, { "epoch": 0.43, "learning_rate": 0.00023548282574828723, "loss": 0.0181, "step": 165930 }, { "epoch": 0.43, "learning_rate": 0.00023547893753191575, "loss": 0.0222, "step": 165940 }, { "epoch": 0.43, "learning_rate": 0.00023547504931554431, "loss": 0.019, "step": 165950 }, { "epoch": 0.43, "learning_rate": 0.00023547116109917283, "loss": 0.0192, "step": 165960 }, { "epoch": 0.43, "learning_rate": 0.00023546727288280137, "loss": 0.02, "step": 165970 }, { "epoch": 0.43, "learning_rate": 0.00023546338466642989, "loss": 0.0243, "step": 165980 }, { "epoch": 0.43, "learning_rate": 0.00023545949645005843, "loss": 0.0174, "step": 165990 }, { "epoch": 0.43, "learning_rate": 0.00023545560823368697, "loss": 0.0213, "step": 166000 }, { "epoch": 0.43, "eval_cer": 0.8817446754311932, "eval_loss": 0.012856963090598583, "eval_runtime": 107.8453, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 166000 }, { "epoch": 0.43, "learning_rate": 0.0002354517200173155, "loss": 0.0203, "step": 166010 }, { "epoch": 0.43, "learning_rate": 0.00023544783180094403, "loss": 0.0207, "step": 166020 }, { "epoch": 0.43, "learning_rate": 0.00023544394358457257, "loss": 0.0172, "step": 166030 }, { "epoch": 0.43, "learning_rate": 0.0002354400553682011, "loss": 0.0168, "step": 166040 }, { "epoch": 0.43, "learning_rate": 0.00023543616715182965, "loss": 0.0186, "step": 166050 }, { "epoch": 0.43, "learning_rate": 0.00023543227893545816, "loss": 0.0168, "step": 166060 }, { "epoch": 0.43, "learning_rate": 0.0002354283907190867, "loss": 0.0195, "step": 166070 }, { "epoch": 0.43, "learning_rate": 0.00023542450250271527, "loss": 0.0168, "step": 166080 }, { "epoch": 0.43, "learning_rate": 0.0002354206142863438, "loss": 0.0193, "step": 166090 }, { "epoch": 0.43, "learning_rate": 0.0002354167260699723, "loss": 0.0205, "step": 166100 }, { "epoch": 0.43, "learning_rate": 0.00023541283785360085, "loss": 0.0181, "step": 166110 }, { "epoch": 0.43, "learning_rate": 0.00023540894963722941, "loss": 0.0176, "step": 166120 }, { "epoch": 0.43, "learning_rate": 0.00023540506142085793, "loss": 0.0183, "step": 166130 }, { "epoch": 0.43, "learning_rate": 0.00023540117320448647, "loss": 0.0207, "step": 166140 }, { "epoch": 0.43, "learning_rate": 0.00023539728498811499, "loss": 0.0202, "step": 166150 }, { "epoch": 0.43, "learning_rate": 0.00023539339677174355, "loss": 0.0177, "step": 166160 }, { "epoch": 0.43, "learning_rate": 0.00023538950855537207, "loss": 0.0202, "step": 166170 }, { "epoch": 0.43, "learning_rate": 0.0002353856203390006, "loss": 0.0221, "step": 166180 }, { "epoch": 0.43, "learning_rate": 0.00023538173212262912, "loss": 0.019, "step": 166190 }, { "epoch": 0.43, "learning_rate": 0.0002353778439062577, "loss": 0.0145, "step": 166200 }, { "epoch": 0.43, "learning_rate": 0.0002353739556898862, "loss": 0.0186, "step": 166210 }, { "epoch": 0.43, "learning_rate": 0.00023537006747351475, "loss": 0.0208, "step": 166220 }, { "epoch": 0.43, "learning_rate": 0.00023536617925714326, "loss": 0.0167, "step": 166230 }, { "epoch": 0.43, "learning_rate": 0.0002353622910407718, "loss": 0.0217, "step": 166240 }, { "epoch": 0.43, "learning_rate": 0.00023535840282440035, "loss": 0.018, "step": 166250 }, { "epoch": 0.43, "learning_rate": 0.0002353545146080289, "loss": 0.0183, "step": 166260 }, { "epoch": 0.43, "learning_rate": 0.0002353506263916574, "loss": 0.021, "step": 166270 }, { "epoch": 0.43, "learning_rate": 0.00023534673817528595, "loss": 0.021, "step": 166280 }, { "epoch": 0.43, "learning_rate": 0.00023534284995891451, "loss": 0.0223, "step": 166290 }, { "epoch": 0.43, "learning_rate": 0.00023533896174254303, "loss": 0.016, "step": 166300 }, { "epoch": 0.43, "learning_rate": 0.00023533507352617157, "loss": 0.023, "step": 166310 }, { "epoch": 0.43, "learning_rate": 0.00023533118530980008, "loss": 0.0202, "step": 166320 }, { "epoch": 0.43, "learning_rate": 0.00023532729709342865, "loss": 0.0243, "step": 166330 }, { "epoch": 0.43, "learning_rate": 0.00023532340887705717, "loss": 0.021, "step": 166340 }, { "epoch": 0.43, "learning_rate": 0.0002353195206606857, "loss": 0.0187, "step": 166350 }, { "epoch": 0.43, "learning_rate": 0.00023531563244431422, "loss": 0.0183, "step": 166360 }, { "epoch": 0.43, "learning_rate": 0.0002353117442279428, "loss": 0.0194, "step": 166370 }, { "epoch": 0.43, "learning_rate": 0.0002353078560115713, "loss": 0.0169, "step": 166380 }, { "epoch": 0.43, "learning_rate": 0.00023530396779519985, "loss": 0.0204, "step": 166390 }, { "epoch": 0.43, "learning_rate": 0.00023530007957882836, "loss": 0.0155, "step": 166400 }, { "epoch": 0.43, "learning_rate": 0.00023529619136245693, "loss": 0.0207, "step": 166410 }, { "epoch": 0.43, "learning_rate": 0.00023529230314608545, "loss": 0.0175, "step": 166420 }, { "epoch": 0.43, "learning_rate": 0.000235288414929714, "loss": 0.0144, "step": 166430 }, { "epoch": 0.43, "learning_rate": 0.0002352845267133425, "loss": 0.0174, "step": 166440 }, { "epoch": 0.43, "learning_rate": 0.00023528063849697107, "loss": 0.0189, "step": 166450 }, { "epoch": 0.43, "learning_rate": 0.0002352767502805996, "loss": 0.0158, "step": 166460 }, { "epoch": 0.43, "learning_rate": 0.00023527286206422813, "loss": 0.0222, "step": 166470 }, { "epoch": 0.43, "learning_rate": 0.00023526897384785667, "loss": 0.0178, "step": 166480 }, { "epoch": 0.43, "learning_rate": 0.00023526508563148518, "loss": 0.0158, "step": 166490 }, { "epoch": 0.43, "learning_rate": 0.00023526119741511375, "loss": 0.016, "step": 166500 }, { "epoch": 0.43, "learning_rate": 0.00023525730919874227, "loss": 0.021, "step": 166510 }, { "epoch": 0.43, "learning_rate": 0.0002352534209823708, "loss": 0.0175, "step": 166520 }, { "epoch": 0.43, "learning_rate": 0.00023524953276599932, "loss": 0.0175, "step": 166530 }, { "epoch": 0.43, "learning_rate": 0.0002352456445496279, "loss": 0.0188, "step": 166540 }, { "epoch": 0.43, "learning_rate": 0.0002352417563332564, "loss": 0.0161, "step": 166550 }, { "epoch": 0.43, "learning_rate": 0.00023523786811688495, "loss": 0.0197, "step": 166560 }, { "epoch": 0.43, "learning_rate": 0.00023523397990051346, "loss": 0.0221, "step": 166570 }, { "epoch": 0.43, "learning_rate": 0.00023523009168414203, "loss": 0.0185, "step": 166580 }, { "epoch": 0.43, "learning_rate": 0.00023522620346777055, "loss": 0.0177, "step": 166590 }, { "epoch": 0.43, "learning_rate": 0.0002352223152513991, "loss": 0.0145, "step": 166600 }, { "epoch": 0.43, "learning_rate": 0.0002352184270350276, "loss": 0.0219, "step": 166610 }, { "epoch": 0.43, "learning_rate": 0.00023521453881865617, "loss": 0.0244, "step": 166620 }, { "epoch": 0.43, "learning_rate": 0.0002352106506022847, "loss": 0.0174, "step": 166630 }, { "epoch": 0.43, "learning_rate": 0.00023520676238591323, "loss": 0.0184, "step": 166640 }, { "epoch": 0.43, "learning_rate": 0.00023520287416954174, "loss": 0.019, "step": 166650 }, { "epoch": 0.43, "learning_rate": 0.0002351989859531703, "loss": 0.0248, "step": 166660 }, { "epoch": 0.43, "learning_rate": 0.00023519509773679885, "loss": 0.0202, "step": 166670 }, { "epoch": 0.43, "learning_rate": 0.00023519120952042737, "loss": 0.0193, "step": 166680 }, { "epoch": 0.43, "learning_rate": 0.0002351873213040559, "loss": 0.0175, "step": 166690 }, { "epoch": 0.43, "learning_rate": 0.00023518343308768445, "loss": 0.0185, "step": 166700 }, { "epoch": 0.43, "learning_rate": 0.000235179544871313, "loss": 0.0206, "step": 166710 }, { "epoch": 0.43, "learning_rate": 0.0002351756566549415, "loss": 0.0219, "step": 166720 }, { "epoch": 0.43, "learning_rate": 0.00023517176843857005, "loss": 0.0228, "step": 166730 }, { "epoch": 0.43, "learning_rate": 0.00023516788022219856, "loss": 0.0198, "step": 166740 }, { "epoch": 0.43, "learning_rate": 0.00023516399200582713, "loss": 0.0181, "step": 166750 }, { "epoch": 0.43, "learning_rate": 0.00023516010378945565, "loss": 0.0204, "step": 166760 }, { "epoch": 0.43, "learning_rate": 0.0002351562155730842, "loss": 0.0183, "step": 166770 }, { "epoch": 0.43, "learning_rate": 0.0002351523273567127, "loss": 0.0188, "step": 166780 }, { "epoch": 0.43, "learning_rate": 0.00023514843914034127, "loss": 0.0202, "step": 166790 }, { "epoch": 0.43, "learning_rate": 0.0002351445509239698, "loss": 0.0162, "step": 166800 }, { "epoch": 0.43, "learning_rate": 0.00023514066270759833, "loss": 0.0157, "step": 166810 }, { "epoch": 0.43, "learning_rate": 0.00023513677449122684, "loss": 0.0139, "step": 166820 }, { "epoch": 0.43, "learning_rate": 0.0002351328862748554, "loss": 0.0174, "step": 166830 }, { "epoch": 0.43, "learning_rate": 0.00023512899805848395, "loss": 0.0224, "step": 166840 }, { "epoch": 0.43, "learning_rate": 0.00023512510984211247, "loss": 0.0176, "step": 166850 }, { "epoch": 0.43, "learning_rate": 0.000235121221625741, "loss": 0.0199, "step": 166860 }, { "epoch": 0.43, "learning_rate": 0.00023511733340936955, "loss": 0.0158, "step": 166870 }, { "epoch": 0.43, "learning_rate": 0.0002351134451929981, "loss": 0.0181, "step": 166880 }, { "epoch": 0.43, "learning_rate": 0.0002351095569766266, "loss": 0.0226, "step": 166890 }, { "epoch": 0.43, "learning_rate": 0.00023510566876025515, "loss": 0.0175, "step": 166900 }, { "epoch": 0.43, "learning_rate": 0.0002351017805438837, "loss": 0.021, "step": 166910 }, { "epoch": 0.43, "learning_rate": 0.00023509789232751223, "loss": 0.0185, "step": 166920 }, { "epoch": 0.43, "learning_rate": 0.00023509400411114074, "loss": 0.0173, "step": 166930 }, { "epoch": 0.43, "learning_rate": 0.0002350901158947693, "loss": 0.0199, "step": 166940 }, { "epoch": 0.43, "learning_rate": 0.00023508622767839786, "loss": 0.0185, "step": 166950 }, { "epoch": 0.43, "learning_rate": 0.00023508233946202637, "loss": 0.0168, "step": 166960 }, { "epoch": 0.43, "learning_rate": 0.00023507845124565488, "loss": 0.0202, "step": 166970 }, { "epoch": 0.43, "learning_rate": 0.00023507456302928343, "loss": 0.0175, "step": 166980 }, { "epoch": 0.43, "learning_rate": 0.00023507067481291194, "loss": 0.0194, "step": 166990 }, { "epoch": 0.43, "learning_rate": 0.0002350667865965405, "loss": 0.018, "step": 167000 }, { "epoch": 0.43, "eval_cer": 0.8817306790618513, "eval_loss": 0.012466521002352238, "eval_runtime": 107.3379, "eval_samples_per_second": 18.633, "eval_steps_per_second": 4.658, "step": 167000 }, { "epoch": 0.43, "learning_rate": 0.00023506289838016905, "loss": 0.0156, "step": 167010 }, { "epoch": 0.43, "learning_rate": 0.00023505901016379757, "loss": 0.0195, "step": 167020 }, { "epoch": 0.43, "learning_rate": 0.0002350551219474261, "loss": 0.0149, "step": 167030 }, { "epoch": 0.43, "learning_rate": 0.00023505123373105465, "loss": 0.0177, "step": 167040 }, { "epoch": 0.43, "learning_rate": 0.0002350473455146832, "loss": 0.0217, "step": 167050 }, { "epoch": 0.43, "learning_rate": 0.0002350434572983117, "loss": 0.0217, "step": 167060 }, { "epoch": 0.43, "learning_rate": 0.00023503956908194025, "loss": 0.0146, "step": 167070 }, { "epoch": 0.43, "learning_rate": 0.0002350356808655688, "loss": 0.0151, "step": 167080 }, { "epoch": 0.43, "learning_rate": 0.00023503179264919733, "loss": 0.0157, "step": 167090 }, { "epoch": 0.43, "learning_rate": 0.00023502790443282584, "loss": 0.0196, "step": 167100 }, { "epoch": 0.43, "learning_rate": 0.00023502401621645439, "loss": 0.0191, "step": 167110 }, { "epoch": 0.43, "learning_rate": 0.00023502012800008295, "loss": 0.0181, "step": 167120 }, { "epoch": 0.43, "learning_rate": 0.00023501623978371147, "loss": 0.018, "step": 167130 }, { "epoch": 0.43, "learning_rate": 0.00023501235156733998, "loss": 0.0175, "step": 167140 }, { "epoch": 0.43, "learning_rate": 0.00023500846335096853, "loss": 0.0197, "step": 167150 }, { "epoch": 0.43, "learning_rate": 0.0002350045751345971, "loss": 0.0229, "step": 167160 }, { "epoch": 0.43, "learning_rate": 0.0002350006869182256, "loss": 0.0199, "step": 167170 }, { "epoch": 0.43, "learning_rate": 0.00023499679870185415, "loss": 0.016, "step": 167180 }, { "epoch": 0.43, "learning_rate": 0.00023499291048548266, "loss": 0.0165, "step": 167190 }, { "epoch": 0.43, "learning_rate": 0.00023498902226911123, "loss": 0.0178, "step": 167200 }, { "epoch": 0.43, "learning_rate": 0.00023498513405273975, "loss": 0.0208, "step": 167210 }, { "epoch": 0.43, "learning_rate": 0.0002349812458363683, "loss": 0.0187, "step": 167220 }, { "epoch": 0.43, "learning_rate": 0.0002349773576199968, "loss": 0.0175, "step": 167230 }, { "epoch": 0.43, "learning_rate": 0.00023497346940362535, "loss": 0.0169, "step": 167240 }, { "epoch": 0.43, "learning_rate": 0.0002349695811872539, "loss": 0.0151, "step": 167250 }, { "epoch": 0.43, "learning_rate": 0.00023496569297088243, "loss": 0.0179, "step": 167260 }, { "epoch": 0.43, "learning_rate": 0.00023496180475451094, "loss": 0.0202, "step": 167270 }, { "epoch": 0.43, "learning_rate": 0.00023495791653813949, "loss": 0.0199, "step": 167280 }, { "epoch": 0.43, "learning_rate": 0.00023495402832176803, "loss": 0.0146, "step": 167290 }, { "epoch": 0.43, "learning_rate": 0.00023495014010539657, "loss": 0.0184, "step": 167300 }, { "epoch": 0.43, "learning_rate": 0.00023494625188902508, "loss": 0.0203, "step": 167310 }, { "epoch": 0.43, "learning_rate": 0.00023494236367265362, "loss": 0.0162, "step": 167320 }, { "epoch": 0.43, "learning_rate": 0.0002349384754562822, "loss": 0.0152, "step": 167330 }, { "epoch": 0.43, "learning_rate": 0.0002349345872399107, "loss": 0.0218, "step": 167340 }, { "epoch": 0.43, "learning_rate": 0.00023493069902353925, "loss": 0.0172, "step": 167350 }, { "epoch": 0.43, "learning_rate": 0.00023492681080716776, "loss": 0.0216, "step": 167360 }, { "epoch": 0.43, "learning_rate": 0.00023492292259079633, "loss": 0.0203, "step": 167370 }, { "epoch": 0.43, "learning_rate": 0.00023491903437442485, "loss": 0.0159, "step": 167380 }, { "epoch": 0.43, "learning_rate": 0.0002349151461580534, "loss": 0.0406, "step": 167390 }, { "epoch": 0.43, "learning_rate": 0.0002349112579416819, "loss": 0.0167, "step": 167400 }, { "epoch": 0.43, "learning_rate": 0.00023490736972531047, "loss": 0.0235, "step": 167410 }, { "epoch": 0.43, "learning_rate": 0.000234903481508939, "loss": 0.0204, "step": 167420 }, { "epoch": 0.43, "learning_rate": 0.00023489959329256753, "loss": 0.0216, "step": 167430 }, { "epoch": 0.43, "learning_rate": 0.00023489570507619604, "loss": 0.0165, "step": 167440 }, { "epoch": 0.43, "learning_rate": 0.0002348918168598246, "loss": 0.02, "step": 167450 }, { "epoch": 0.43, "learning_rate": 0.00023488792864345313, "loss": 0.0201, "step": 167460 }, { "epoch": 0.43, "learning_rate": 0.00023488404042708167, "loss": 0.0163, "step": 167470 }, { "epoch": 0.43, "learning_rate": 0.00023488015221071018, "loss": 0.0182, "step": 167480 }, { "epoch": 0.43, "learning_rate": 0.00023487626399433872, "loss": 0.0203, "step": 167490 }, { "epoch": 0.43, "learning_rate": 0.0002348723757779673, "loss": 0.0232, "step": 167500 }, { "epoch": 0.43, "learning_rate": 0.0002348684875615958, "loss": 0.0168, "step": 167510 }, { "epoch": 0.43, "learning_rate": 0.00023486459934522435, "loss": 0.0191, "step": 167520 }, { "epoch": 0.43, "learning_rate": 0.00023486071112885286, "loss": 0.0204, "step": 167530 }, { "epoch": 0.43, "learning_rate": 0.00023485682291248143, "loss": 0.0194, "step": 167540 }, { "epoch": 0.43, "learning_rate": 0.00023485293469610995, "loss": 0.0185, "step": 167550 }, { "epoch": 0.43, "learning_rate": 0.0002348490464797385, "loss": 0.0213, "step": 167560 }, { "epoch": 0.43, "learning_rate": 0.000234845158263367, "loss": 0.0211, "step": 167570 }, { "epoch": 0.43, "learning_rate": 0.00023484127004699557, "loss": 0.0163, "step": 167580 }, { "epoch": 0.43, "learning_rate": 0.00023483738183062409, "loss": 0.019, "step": 167590 }, { "epoch": 0.43, "learning_rate": 0.00023483349361425263, "loss": 0.0172, "step": 167600 }, { "epoch": 0.43, "learning_rate": 0.00023482960539788114, "loss": 0.0181, "step": 167610 }, { "epoch": 0.43, "learning_rate": 0.0002348257171815097, "loss": 0.0198, "step": 167620 }, { "epoch": 0.43, "learning_rate": 0.00023482182896513823, "loss": 0.0219, "step": 167630 }, { "epoch": 0.43, "learning_rate": 0.00023481794074876677, "loss": 0.0195, "step": 167640 }, { "epoch": 0.43, "learning_rate": 0.00023481405253239528, "loss": 0.0179, "step": 167650 }, { "epoch": 0.43, "learning_rate": 0.00023481016431602385, "loss": 0.0186, "step": 167660 }, { "epoch": 0.43, "learning_rate": 0.0002348062760996524, "loss": 0.0187, "step": 167670 }, { "epoch": 0.43, "learning_rate": 0.0002348023878832809, "loss": 0.0152, "step": 167680 }, { "epoch": 0.43, "learning_rate": 0.00023479849966690942, "loss": 0.0175, "step": 167690 }, { "epoch": 0.43, "learning_rate": 0.000234794611450538, "loss": 0.0208, "step": 167700 }, { "epoch": 0.43, "learning_rate": 0.00023479072323416653, "loss": 0.0173, "step": 167710 }, { "epoch": 0.43, "learning_rate": 0.00023478683501779505, "loss": 0.0174, "step": 167720 }, { "epoch": 0.43, "learning_rate": 0.0002347829468014236, "loss": 0.0188, "step": 167730 }, { "epoch": 0.43, "learning_rate": 0.0002347790585850521, "loss": 0.0153, "step": 167740 }, { "epoch": 0.43, "learning_rate": 0.00023477517036868067, "loss": 0.0168, "step": 167750 }, { "epoch": 0.43, "learning_rate": 0.00023477128215230919, "loss": 0.0162, "step": 167760 }, { "epoch": 0.43, "learning_rate": 0.00023476739393593773, "loss": 0.0169, "step": 167770 }, { "epoch": 0.43, "learning_rate": 0.00023476350571956624, "loss": 0.0188, "step": 167780 }, { "epoch": 0.43, "learning_rate": 0.0002347596175031948, "loss": 0.0285, "step": 167790 }, { "epoch": 0.43, "learning_rate": 0.00023475572928682333, "loss": 0.0203, "step": 167800 }, { "epoch": 0.43, "learning_rate": 0.00023475184107045187, "loss": 0.0143, "step": 167810 }, { "epoch": 0.44, "learning_rate": 0.00023474795285408038, "loss": 0.0195, "step": 167820 }, { "epoch": 0.44, "learning_rate": 0.00023474406463770895, "loss": 0.0175, "step": 167830 }, { "epoch": 0.44, "learning_rate": 0.00023474017642133746, "loss": 0.0228, "step": 167840 }, { "epoch": 0.44, "learning_rate": 0.000234736288204966, "loss": 0.0219, "step": 167850 }, { "epoch": 0.44, "learning_rate": 0.00023473239998859452, "loss": 0.0163, "step": 167860 }, { "epoch": 0.44, "learning_rate": 0.0002347285117722231, "loss": 0.0189, "step": 167870 }, { "epoch": 0.44, "learning_rate": 0.00023472462355585163, "loss": 0.0163, "step": 167880 }, { "epoch": 0.44, "learning_rate": 0.00023472073533948015, "loss": 0.0164, "step": 167890 }, { "epoch": 0.44, "learning_rate": 0.0002347168471231087, "loss": 0.0205, "step": 167900 }, { "epoch": 0.44, "learning_rate": 0.00023471295890673723, "loss": 0.0203, "step": 167910 }, { "epoch": 0.44, "learning_rate": 0.00023470907069036577, "loss": 0.02, "step": 167920 }, { "epoch": 0.44, "learning_rate": 0.00023470518247399429, "loss": 0.0196, "step": 167930 }, { "epoch": 0.44, "learning_rate": 0.00023470129425762283, "loss": 0.0192, "step": 167940 }, { "epoch": 0.44, "learning_rate": 0.00023469740604125137, "loss": 0.0167, "step": 167950 }, { "epoch": 0.44, "learning_rate": 0.0002346935178248799, "loss": 0.0205, "step": 167960 }, { "epoch": 0.44, "learning_rate": 0.00023468962960850842, "loss": 0.0177, "step": 167970 }, { "epoch": 0.44, "learning_rate": 0.00023468574139213697, "loss": 0.0223, "step": 167980 }, { "epoch": 0.44, "learning_rate": 0.00023468185317576548, "loss": 0.0186, "step": 167990 }, { "epoch": 0.44, "learning_rate": 0.00023467796495939405, "loss": 0.0226, "step": 168000 }, { "epoch": 0.44, "eval_cer": 0.8817390768834564, "eval_loss": 0.012735070660710335, "eval_runtime": 108.0118, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 168000 }, { "epoch": 0.44, "learning_rate": 0.00023467407674302256, "loss": 0.0206, "step": 168010 }, { "epoch": 0.44, "learning_rate": 0.0002346701885266511, "loss": 0.0255, "step": 168020 }, { "epoch": 0.44, "learning_rate": 0.00023466630031027962, "loss": 0.0213, "step": 168030 }, { "epoch": 0.44, "learning_rate": 0.0002346624120939082, "loss": 0.021, "step": 168040 }, { "epoch": 0.44, "learning_rate": 0.00023465852387753673, "loss": 0.0168, "step": 168050 }, { "epoch": 0.44, "learning_rate": 0.00023465463566116525, "loss": 0.0206, "step": 168060 }, { "epoch": 0.44, "learning_rate": 0.0002346507474447938, "loss": 0.0258, "step": 168070 }, { "epoch": 0.44, "learning_rate": 0.00023464685922842233, "loss": 0.0183, "step": 168080 }, { "epoch": 0.44, "learning_rate": 0.00023464297101205087, "loss": 0.0211, "step": 168090 }, { "epoch": 0.44, "learning_rate": 0.00023463908279567938, "loss": 0.0181, "step": 168100 }, { "epoch": 0.44, "learning_rate": 0.00023463519457930793, "loss": 0.0167, "step": 168110 }, { "epoch": 0.44, "learning_rate": 0.00023463130636293647, "loss": 0.0176, "step": 168120 }, { "epoch": 0.44, "learning_rate": 0.000234627418146565, "loss": 0.0184, "step": 168130 }, { "epoch": 0.44, "learning_rate": 0.00023462352993019352, "loss": 0.0184, "step": 168140 }, { "epoch": 0.44, "learning_rate": 0.00023461964171382207, "loss": 0.0173, "step": 168150 }, { "epoch": 0.44, "learning_rate": 0.0002346157534974506, "loss": 0.0201, "step": 168160 }, { "epoch": 0.44, "learning_rate": 0.00023461186528107915, "loss": 0.0165, "step": 168170 }, { "epoch": 0.44, "learning_rate": 0.00023460797706470766, "loss": 0.0196, "step": 168180 }, { "epoch": 0.44, "learning_rate": 0.0002346040888483362, "loss": 0.0156, "step": 168190 }, { "epoch": 0.44, "learning_rate": 0.00023460020063196477, "loss": 0.0314, "step": 168200 }, { "epoch": 0.44, "learning_rate": 0.0002345963124155933, "loss": 0.0201, "step": 168210 }, { "epoch": 0.44, "learning_rate": 0.00023459242419922183, "loss": 0.0186, "step": 168220 }, { "epoch": 0.44, "learning_rate": 0.00023458853598285034, "loss": 0.0179, "step": 168230 }, { "epoch": 0.44, "learning_rate": 0.00023458464776647886, "loss": 0.0204, "step": 168240 }, { "epoch": 0.44, "learning_rate": 0.00023458075955010743, "loss": 0.0164, "step": 168250 }, { "epoch": 0.44, "learning_rate": 0.00023457687133373597, "loss": 0.0212, "step": 168260 }, { "epoch": 0.44, "learning_rate": 0.00023457298311736448, "loss": 0.0148, "step": 168270 }, { "epoch": 0.44, "learning_rate": 0.00023456909490099303, "loss": 0.0153, "step": 168280 }, { "epoch": 0.44, "learning_rate": 0.00023456520668462157, "loss": 0.0176, "step": 168290 }, { "epoch": 0.44, "learning_rate": 0.0002345613184682501, "loss": 0.0172, "step": 168300 }, { "epoch": 0.44, "learning_rate": 0.00023455743025187862, "loss": 0.0193, "step": 168310 }, { "epoch": 0.44, "learning_rate": 0.00023455354203550717, "loss": 0.0137, "step": 168320 }, { "epoch": 0.44, "learning_rate": 0.0002345496538191357, "loss": 0.0208, "step": 168330 }, { "epoch": 0.44, "learning_rate": 0.00023454576560276425, "loss": 0.0176, "step": 168340 }, { "epoch": 0.44, "learning_rate": 0.00023454187738639276, "loss": 0.0226, "step": 168350 }, { "epoch": 0.44, "learning_rate": 0.0002345379891700213, "loss": 0.0159, "step": 168360 }, { "epoch": 0.44, "learning_rate": 0.00023453410095364987, "loss": 0.0186, "step": 168370 }, { "epoch": 0.44, "learning_rate": 0.0002345302127372784, "loss": 0.0267, "step": 168380 }, { "epoch": 0.44, "learning_rate": 0.00023452632452090693, "loss": 0.0174, "step": 168390 }, { "epoch": 0.44, "learning_rate": 0.00023452243630453544, "loss": 0.0216, "step": 168400 }, { "epoch": 0.44, "learning_rate": 0.000234518548088164, "loss": 0.0219, "step": 168410 }, { "epoch": 0.44, "learning_rate": 0.00023451465987179253, "loss": 0.0184, "step": 168420 }, { "epoch": 0.44, "learning_rate": 0.00023451077165542107, "loss": 0.0245, "step": 168430 }, { "epoch": 0.44, "learning_rate": 0.00023450688343904958, "loss": 0.0203, "step": 168440 }, { "epoch": 0.44, "learning_rate": 0.00023450299522267815, "loss": 0.0194, "step": 168450 }, { "epoch": 0.44, "learning_rate": 0.00023449910700630667, "loss": 0.0187, "step": 168460 }, { "epoch": 0.44, "learning_rate": 0.0002344952187899352, "loss": 0.0209, "step": 168470 }, { "epoch": 0.44, "learning_rate": 0.00023449133057356372, "loss": 0.0175, "step": 168480 }, { "epoch": 0.44, "learning_rate": 0.00023448744235719226, "loss": 0.0179, "step": 168490 }, { "epoch": 0.44, "learning_rate": 0.0002344835541408208, "loss": 0.0212, "step": 168500 }, { "epoch": 0.44, "learning_rate": 0.00023447966592444935, "loss": 0.018, "step": 168510 }, { "epoch": 0.44, "learning_rate": 0.00023447577770807786, "loss": 0.0165, "step": 168520 }, { "epoch": 0.44, "learning_rate": 0.0002344718894917064, "loss": 0.019, "step": 168530 }, { "epoch": 0.44, "learning_rate": 0.00023446800127533497, "loss": 0.0205, "step": 168540 }, { "epoch": 0.44, "learning_rate": 0.0002344641130589635, "loss": 0.0181, "step": 168550 }, { "epoch": 0.44, "learning_rate": 0.000234460224842592, "loss": 0.019, "step": 168560 }, { "epoch": 0.44, "learning_rate": 0.00023445633662622054, "loss": 0.0241, "step": 168570 }, { "epoch": 0.44, "learning_rate": 0.0002344524484098491, "loss": 0.0182, "step": 168580 }, { "epoch": 0.44, "learning_rate": 0.00023444856019347763, "loss": 0.0198, "step": 168590 }, { "epoch": 0.44, "learning_rate": 0.00023444467197710617, "loss": 0.0218, "step": 168600 }, { "epoch": 0.44, "learning_rate": 0.00023444078376073468, "loss": 0.0165, "step": 168610 }, { "epoch": 0.44, "learning_rate": 0.00023443689554436325, "loss": 0.0184, "step": 168620 }, { "epoch": 0.44, "learning_rate": 0.00023443300732799177, "loss": 0.0172, "step": 168630 }, { "epoch": 0.44, "learning_rate": 0.0002344291191116203, "loss": 0.0146, "step": 168640 }, { "epoch": 0.44, "learning_rate": 0.00023442523089524882, "loss": 0.0166, "step": 168650 }, { "epoch": 0.44, "learning_rate": 0.0002344213426788774, "loss": 0.0249, "step": 168660 }, { "epoch": 0.44, "learning_rate": 0.0002344174544625059, "loss": 0.0162, "step": 168670 }, { "epoch": 0.44, "learning_rate": 0.00023441356624613445, "loss": 0.0189, "step": 168680 }, { "epoch": 0.44, "learning_rate": 0.00023440967802976296, "loss": 0.0193, "step": 168690 }, { "epoch": 0.44, "learning_rate": 0.00023440578981339153, "loss": 0.0209, "step": 168700 }, { "epoch": 0.44, "learning_rate": 0.00023440190159702007, "loss": 0.0192, "step": 168710 }, { "epoch": 0.44, "learning_rate": 0.0002343980133806486, "loss": 0.0184, "step": 168720 }, { "epoch": 0.44, "learning_rate": 0.0002343941251642771, "loss": 0.0216, "step": 168730 }, { "epoch": 0.44, "learning_rate": 0.00023439023694790564, "loss": 0.0212, "step": 168740 }, { "epoch": 0.44, "learning_rate": 0.0002343863487315342, "loss": 0.0165, "step": 168750 }, { "epoch": 0.44, "learning_rate": 0.00023438246051516273, "loss": 0.018, "step": 168760 }, { "epoch": 0.44, "learning_rate": 0.00023437857229879127, "loss": 0.0173, "step": 168770 }, { "epoch": 0.44, "learning_rate": 0.00023437468408241978, "loss": 0.0207, "step": 168780 }, { "epoch": 0.44, "learning_rate": 0.00023437079586604835, "loss": 0.0215, "step": 168790 }, { "epoch": 0.44, "learning_rate": 0.00023436690764967687, "loss": 0.0201, "step": 168800 }, { "epoch": 0.44, "learning_rate": 0.0002343630194333054, "loss": 0.0187, "step": 168810 }, { "epoch": 0.44, "learning_rate": 0.00023435913121693392, "loss": 0.0181, "step": 168820 }, { "epoch": 0.44, "learning_rate": 0.0002343552430005625, "loss": 0.0197, "step": 168830 }, { "epoch": 0.44, "learning_rate": 0.000234351354784191, "loss": 0.021, "step": 168840 }, { "epoch": 0.44, "learning_rate": 0.00023434746656781955, "loss": 0.0182, "step": 168850 }, { "epoch": 0.44, "learning_rate": 0.00023434357835144806, "loss": 0.0238, "step": 168860 }, { "epoch": 0.44, "learning_rate": 0.00023433969013507663, "loss": 0.021, "step": 168870 }, { "epoch": 0.44, "learning_rate": 0.00023433580191870514, "loss": 0.0163, "step": 168880 }, { "epoch": 0.44, "learning_rate": 0.00023433191370233369, "loss": 0.0128, "step": 168890 }, { "epoch": 0.44, "learning_rate": 0.0002343280254859622, "loss": 0.0204, "step": 168900 }, { "epoch": 0.44, "learning_rate": 0.00023432413726959077, "loss": 0.0208, "step": 168910 }, { "epoch": 0.44, "learning_rate": 0.0002343202490532193, "loss": 0.0195, "step": 168920 }, { "epoch": 0.44, "learning_rate": 0.00023431636083684783, "loss": 0.0181, "step": 168930 }, { "epoch": 0.44, "learning_rate": 0.00023431247262047637, "loss": 0.02, "step": 168940 }, { "epoch": 0.44, "learning_rate": 0.0002343085844041049, "loss": 0.0192, "step": 168950 }, { "epoch": 0.44, "learning_rate": 0.00023430469618773345, "loss": 0.0191, "step": 168960 }, { "epoch": 0.44, "learning_rate": 0.00023430080797136197, "loss": 0.0175, "step": 168970 }, { "epoch": 0.44, "learning_rate": 0.0002342969197549905, "loss": 0.0195, "step": 168980 }, { "epoch": 0.44, "learning_rate": 0.00023429303153861902, "loss": 0.0192, "step": 168990 }, { "epoch": 0.44, "learning_rate": 0.0002342891433222476, "loss": 0.0192, "step": 169000 }, { "epoch": 0.44, "eval_cer": 0.88176706962214, "eval_loss": 0.012475664727389812, "eval_runtime": 107.3738, "eval_samples_per_second": 18.627, "eval_steps_per_second": 4.657, "step": 169000 }, { "epoch": 0.44, "learning_rate": 0.0002342852551058761, "loss": 0.022, "step": 169010 }, { "epoch": 0.44, "learning_rate": 0.00023428136688950465, "loss": 0.014, "step": 169020 }, { "epoch": 0.44, "learning_rate": 0.00023427747867313316, "loss": 0.0267, "step": 169030 }, { "epoch": 0.44, "learning_rate": 0.00023427359045676173, "loss": 0.0186, "step": 169040 }, { "epoch": 0.44, "learning_rate": 0.00023426970224039024, "loss": 0.0232, "step": 169050 }, { "epoch": 0.44, "learning_rate": 0.00023426581402401879, "loss": 0.0162, "step": 169060 }, { "epoch": 0.44, "learning_rate": 0.0002342619258076473, "loss": 0.0181, "step": 169070 }, { "epoch": 0.44, "learning_rate": 0.00023425803759127587, "loss": 0.0147, "step": 169080 }, { "epoch": 0.44, "learning_rate": 0.0002342541493749044, "loss": 0.02, "step": 169090 }, { "epoch": 0.44, "learning_rate": 0.00023425026115853293, "loss": 0.0189, "step": 169100 }, { "epoch": 0.44, "learning_rate": 0.00023424637294216147, "loss": 0.0212, "step": 169110 }, { "epoch": 0.44, "learning_rate": 0.00023424248472579, "loss": 0.0184, "step": 169120 }, { "epoch": 0.44, "learning_rate": 0.00023423859650941855, "loss": 0.0178, "step": 169130 }, { "epoch": 0.44, "learning_rate": 0.00023423470829304706, "loss": 0.0161, "step": 169140 }, { "epoch": 0.44, "learning_rate": 0.0002342308200766756, "loss": 0.0158, "step": 169150 }, { "epoch": 0.44, "learning_rate": 0.00023422693186030415, "loss": 0.0187, "step": 169160 }, { "epoch": 0.44, "learning_rate": 0.0002342230436439327, "loss": 0.0195, "step": 169170 }, { "epoch": 0.44, "learning_rate": 0.0002342191554275612, "loss": 0.0163, "step": 169180 }, { "epoch": 0.44, "learning_rate": 0.00023421526721118975, "loss": 0.0216, "step": 169190 }, { "epoch": 0.44, "learning_rate": 0.0002342113789948183, "loss": 0.0173, "step": 169200 }, { "epoch": 0.44, "learning_rate": 0.00023420749077844683, "loss": 0.0158, "step": 169210 }, { "epoch": 0.44, "learning_rate": 0.00023420360256207534, "loss": 0.0177, "step": 169220 }, { "epoch": 0.44, "learning_rate": 0.00023419971434570389, "loss": 0.0196, "step": 169230 }, { "epoch": 0.44, "learning_rate": 0.0002341958261293324, "loss": 0.0208, "step": 169240 }, { "epoch": 0.44, "learning_rate": 0.00023419193791296097, "loss": 0.0206, "step": 169250 }, { "epoch": 0.44, "learning_rate": 0.0002341880496965895, "loss": 0.0187, "step": 169260 }, { "epoch": 0.44, "learning_rate": 0.00023418416148021802, "loss": 0.0161, "step": 169270 }, { "epoch": 0.44, "learning_rate": 0.00023418027326384654, "loss": 0.0201, "step": 169280 }, { "epoch": 0.44, "learning_rate": 0.0002341763850474751, "loss": 0.0129, "step": 169290 }, { "epoch": 0.44, "learning_rate": 0.00023417249683110365, "loss": 0.0171, "step": 169300 }, { "epoch": 0.44, "learning_rate": 0.00023416860861473216, "loss": 0.02, "step": 169310 }, { "epoch": 0.44, "learning_rate": 0.0002341647203983607, "loss": 0.0167, "step": 169320 }, { "epoch": 0.44, "learning_rate": 0.00023416083218198925, "loss": 0.02, "step": 169330 }, { "epoch": 0.44, "learning_rate": 0.0002341569439656178, "loss": 0.0173, "step": 169340 }, { "epoch": 0.44, "learning_rate": 0.0002341530557492463, "loss": 0.0182, "step": 169350 }, { "epoch": 0.44, "learning_rate": 0.00023414916753287485, "loss": 0.0185, "step": 169360 }, { "epoch": 0.44, "learning_rate": 0.0002341452793165034, "loss": 0.0225, "step": 169370 }, { "epoch": 0.44, "learning_rate": 0.00023414139110013193, "loss": 0.0192, "step": 169380 }, { "epoch": 0.44, "learning_rate": 0.00023413750288376044, "loss": 0.0207, "step": 169390 }, { "epoch": 0.44, "learning_rate": 0.00023413361466738898, "loss": 0.0221, "step": 169400 }, { "epoch": 0.44, "learning_rate": 0.00023412972645101755, "loss": 0.0207, "step": 169410 }, { "epoch": 0.44, "learning_rate": 0.00023412583823464607, "loss": 0.0184, "step": 169420 }, { "epoch": 0.44, "learning_rate": 0.00023412195001827458, "loss": 0.0158, "step": 169430 }, { "epoch": 0.44, "learning_rate": 0.00023411806180190312, "loss": 0.0194, "step": 169440 }, { "epoch": 0.44, "learning_rate": 0.0002341141735855317, "loss": 0.0155, "step": 169450 }, { "epoch": 0.44, "learning_rate": 0.0002341102853691602, "loss": 0.0202, "step": 169460 }, { "epoch": 0.44, "learning_rate": 0.00023410639715278875, "loss": 0.0193, "step": 169470 }, { "epoch": 0.44, "learning_rate": 0.00023410250893641726, "loss": 0.0196, "step": 169480 }, { "epoch": 0.44, "learning_rate": 0.0002340986207200458, "loss": 0.0282, "step": 169490 }, { "epoch": 0.44, "learning_rate": 0.00023409473250367435, "loss": 0.0189, "step": 169500 }, { "epoch": 0.44, "learning_rate": 0.0002340908442873029, "loss": 0.0204, "step": 169510 }, { "epoch": 0.44, "learning_rate": 0.0002340869560709314, "loss": 0.0203, "step": 169520 }, { "epoch": 0.44, "learning_rate": 0.00023408306785455994, "loss": 0.0203, "step": 169530 }, { "epoch": 0.44, "learning_rate": 0.00023407917963818849, "loss": 0.0157, "step": 169540 }, { "epoch": 0.44, "learning_rate": 0.00023407529142181703, "loss": 0.0179, "step": 169550 }, { "epoch": 0.44, "learning_rate": 0.00023407140320544554, "loss": 0.0159, "step": 169560 }, { "epoch": 0.44, "learning_rate": 0.00023406751498907408, "loss": 0.0187, "step": 169570 }, { "epoch": 0.44, "learning_rate": 0.00023406362677270265, "loss": 0.0203, "step": 169580 }, { "epoch": 0.44, "learning_rate": 0.00023405973855633117, "loss": 0.0162, "step": 169590 }, { "epoch": 0.44, "learning_rate": 0.00023405585033995968, "loss": 0.0168, "step": 169600 }, { "epoch": 0.44, "learning_rate": 0.00023405196212358822, "loss": 0.0181, "step": 169610 }, { "epoch": 0.44, "learning_rate": 0.0002340480739072168, "loss": 0.023, "step": 169620 }, { "epoch": 0.44, "learning_rate": 0.0002340441856908453, "loss": 0.0201, "step": 169630 }, { "epoch": 0.44, "learning_rate": 0.00023404029747447385, "loss": 0.0167, "step": 169640 }, { "epoch": 0.44, "learning_rate": 0.00023403640925810236, "loss": 0.02, "step": 169650 }, { "epoch": 0.44, "learning_rate": 0.00023403252104173093, "loss": 0.0183, "step": 169660 }, { "epoch": 0.44, "learning_rate": 0.00023402863282535945, "loss": 0.0184, "step": 169670 }, { "epoch": 0.44, "learning_rate": 0.000234024744608988, "loss": 0.0148, "step": 169680 }, { "epoch": 0.44, "learning_rate": 0.0002340208563926165, "loss": 0.0166, "step": 169690 }, { "epoch": 0.44, "learning_rate": 0.00023401696817624507, "loss": 0.0152, "step": 169700 }, { "epoch": 0.44, "learning_rate": 0.00023401307995987359, "loss": 0.0147, "step": 169710 }, { "epoch": 0.44, "learning_rate": 0.00023400919174350213, "loss": 0.0174, "step": 169720 }, { "epoch": 0.44, "learning_rate": 0.00023400530352713064, "loss": 0.016, "step": 169730 }, { "epoch": 0.44, "learning_rate": 0.00023400141531075918, "loss": 0.0174, "step": 169740 }, { "epoch": 0.44, "learning_rate": 0.00023399752709438772, "loss": 0.019, "step": 169750 }, { "epoch": 0.44, "learning_rate": 0.00023399363887801627, "loss": 0.0173, "step": 169760 }, { "epoch": 0.44, "learning_rate": 0.00023398975066164478, "loss": 0.0212, "step": 169770 }, { "epoch": 0.44, "learning_rate": 0.00023398586244527332, "loss": 0.0175, "step": 169780 }, { "epoch": 0.44, "learning_rate": 0.0002339819742289019, "loss": 0.0227, "step": 169790 }, { "epoch": 0.44, "learning_rate": 0.0002339780860125304, "loss": 0.019, "step": 169800 }, { "epoch": 0.44, "learning_rate": 0.00023397419779615895, "loss": 0.017, "step": 169810 }, { "epoch": 0.44, "learning_rate": 0.00023397030957978746, "loss": 0.0182, "step": 169820 }, { "epoch": 0.44, "learning_rate": 0.00023396642136341603, "loss": 0.0214, "step": 169830 }, { "epoch": 0.44, "learning_rate": 0.00023396253314704455, "loss": 0.0194, "step": 169840 }, { "epoch": 0.44, "learning_rate": 0.0002339586449306731, "loss": 0.0211, "step": 169850 }, { "epoch": 0.44, "learning_rate": 0.0002339547567143016, "loss": 0.0182, "step": 169860 }, { "epoch": 0.44, "learning_rate": 0.00023395086849793017, "loss": 0.0221, "step": 169870 }, { "epoch": 0.44, "learning_rate": 0.00023394698028155868, "loss": 0.0209, "step": 169880 }, { "epoch": 0.44, "learning_rate": 0.00023394309206518723, "loss": 0.0178, "step": 169890 }, { "epoch": 0.44, "learning_rate": 0.00023393920384881574, "loss": 0.0232, "step": 169900 }, { "epoch": 0.44, "learning_rate": 0.0002339353156324443, "loss": 0.0169, "step": 169910 }, { "epoch": 0.44, "learning_rate": 0.00023393142741607282, "loss": 0.0169, "step": 169920 }, { "epoch": 0.44, "learning_rate": 0.00023392753919970137, "loss": 0.0188, "step": 169930 }, { "epoch": 0.44, "learning_rate": 0.00023392365098332988, "loss": 0.0168, "step": 169940 }, { "epoch": 0.44, "learning_rate": 0.00023391976276695845, "loss": 0.0165, "step": 169950 }, { "epoch": 0.44, "learning_rate": 0.000233915874550587, "loss": 0.0146, "step": 169960 }, { "epoch": 0.44, "learning_rate": 0.0002339119863342155, "loss": 0.017, "step": 169970 }, { "epoch": 0.44, "learning_rate": 0.00023390809811784405, "loss": 0.0311, "step": 169980 }, { "epoch": 0.44, "learning_rate": 0.00023390420990147256, "loss": 0.0195, "step": 169990 }, { "epoch": 0.44, "learning_rate": 0.00023390032168510113, "loss": 0.0191, "step": 170000 }, { "epoch": 0.44, "eval_cer": 0.8818048598193629, "eval_loss": 0.01211427990347147, "eval_runtime": 107.8438, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 170000 }, { "epoch": 0.44, "learning_rate": 0.00023389643346872964, "loss": 0.0174, "step": 170010 }, { "epoch": 0.44, "learning_rate": 0.0002338925452523582, "loss": 0.0151, "step": 170020 }, { "epoch": 0.44, "learning_rate": 0.0002338886570359867, "loss": 0.0167, "step": 170030 }, { "epoch": 0.44, "learning_rate": 0.00023388476881961527, "loss": 0.0189, "step": 170040 }, { "epoch": 0.44, "learning_rate": 0.00023388088060324378, "loss": 0.0237, "step": 170050 }, { "epoch": 0.44, "learning_rate": 0.00023387699238687233, "loss": 0.0173, "step": 170060 }, { "epoch": 0.44, "learning_rate": 0.00023387310417050084, "loss": 0.0172, "step": 170070 }, { "epoch": 0.44, "learning_rate": 0.0002338692159541294, "loss": 0.016, "step": 170080 }, { "epoch": 0.44, "learning_rate": 0.00023386532773775792, "loss": 0.0175, "step": 170090 }, { "epoch": 0.44, "learning_rate": 0.00023386143952138647, "loss": 0.0199, "step": 170100 }, { "epoch": 0.44, "learning_rate": 0.00023385755130501498, "loss": 0.0167, "step": 170110 }, { "epoch": 0.44, "learning_rate": 0.00023385366308864355, "loss": 0.0184, "step": 170120 }, { "epoch": 0.44, "learning_rate": 0.0002338497748722721, "loss": 0.0154, "step": 170130 }, { "epoch": 0.44, "learning_rate": 0.0002338458866559006, "loss": 0.0207, "step": 170140 }, { "epoch": 0.44, "learning_rate": 0.00023384199843952912, "loss": 0.0185, "step": 170150 }, { "epoch": 0.44, "learning_rate": 0.0002338381102231577, "loss": 0.018, "step": 170160 }, { "epoch": 0.44, "learning_rate": 0.00023383422200678623, "loss": 0.0164, "step": 170170 }, { "epoch": 0.44, "learning_rate": 0.00023383033379041474, "loss": 0.0177, "step": 170180 }, { "epoch": 0.44, "learning_rate": 0.00023382644557404329, "loss": 0.0172, "step": 170190 }, { "epoch": 0.44, "learning_rate": 0.00023382255735767183, "loss": 0.0185, "step": 170200 }, { "epoch": 0.44, "learning_rate": 0.00023381866914130037, "loss": 0.0146, "step": 170210 }, { "epoch": 0.44, "learning_rate": 0.00023381478092492888, "loss": 0.0182, "step": 170220 }, { "epoch": 0.44, "learning_rate": 0.00023381089270855743, "loss": 0.0141, "step": 170230 }, { "epoch": 0.44, "learning_rate": 0.00023380700449218594, "loss": 0.0144, "step": 170240 }, { "epoch": 0.44, "learning_rate": 0.0002338031162758145, "loss": 0.0196, "step": 170250 }, { "epoch": 0.44, "learning_rate": 0.00023379922805944302, "loss": 0.0168, "step": 170260 }, { "epoch": 0.44, "learning_rate": 0.00023379533984307156, "loss": 0.0169, "step": 170270 }, { "epoch": 0.44, "learning_rate": 0.00023379145162670008, "loss": 0.0179, "step": 170280 }, { "epoch": 0.44, "learning_rate": 0.00023378756341032865, "loss": 0.0182, "step": 170290 }, { "epoch": 0.44, "learning_rate": 0.00023378367519395716, "loss": 0.0171, "step": 170300 }, { "epoch": 0.44, "learning_rate": 0.0002337797869775857, "loss": 0.0175, "step": 170310 }, { "epoch": 0.44, "learning_rate": 0.00023377589876121422, "loss": 0.0202, "step": 170320 }, { "epoch": 0.44, "learning_rate": 0.0002337720105448428, "loss": 0.0165, "step": 170330 }, { "epoch": 0.44, "learning_rate": 0.00023376812232847133, "loss": 0.0155, "step": 170340 }, { "epoch": 0.44, "learning_rate": 0.00023376423411209984, "loss": 0.0217, "step": 170350 }, { "epoch": 0.44, "learning_rate": 0.00023376034589572839, "loss": 0.018, "step": 170360 }, { "epoch": 0.44, "learning_rate": 0.00023375645767935693, "loss": 0.016, "step": 170370 }, { "epoch": 0.44, "learning_rate": 0.00023375256946298547, "loss": 0.016, "step": 170380 }, { "epoch": 0.44, "learning_rate": 0.00023374868124661398, "loss": 0.0164, "step": 170390 }, { "epoch": 0.44, "learning_rate": 0.00023374479303024252, "loss": 0.0213, "step": 170400 }, { "epoch": 0.44, "learning_rate": 0.00023374090481387107, "loss": 0.0196, "step": 170410 }, { "epoch": 0.44, "learning_rate": 0.0002337370165974996, "loss": 0.0149, "step": 170420 }, { "epoch": 0.44, "learning_rate": 0.00023373312838112812, "loss": 0.0172, "step": 170430 }, { "epoch": 0.44, "learning_rate": 0.00023372924016475666, "loss": 0.023, "step": 170440 }, { "epoch": 0.44, "learning_rate": 0.00023372535194838518, "loss": 0.0173, "step": 170450 }, { "epoch": 0.44, "learning_rate": 0.00023372146373201375, "loss": 0.0164, "step": 170460 }, { "epoch": 0.44, "learning_rate": 0.00023371757551564226, "loss": 0.0203, "step": 170470 }, { "epoch": 0.44, "learning_rate": 0.0002337136872992708, "loss": 0.016, "step": 170480 }, { "epoch": 0.44, "learning_rate": 0.00023370979908289932, "loss": 0.0178, "step": 170490 }, { "epoch": 0.44, "learning_rate": 0.0002337059108665279, "loss": 0.016, "step": 170500 }, { "epoch": 0.44, "learning_rate": 0.00023370202265015643, "loss": 0.0178, "step": 170510 }, { "epoch": 0.44, "learning_rate": 0.00023369813443378494, "loss": 0.0127, "step": 170520 }, { "epoch": 0.44, "learning_rate": 0.00023369424621741348, "loss": 0.0203, "step": 170530 }, { "epoch": 0.44, "learning_rate": 0.00023369035800104203, "loss": 0.0152, "step": 170540 }, { "epoch": 0.44, "learning_rate": 0.00023368646978467057, "loss": 0.0173, "step": 170550 }, { "epoch": 0.44, "learning_rate": 0.00023368258156829908, "loss": 0.0164, "step": 170560 }, { "epoch": 0.44, "learning_rate": 0.00023367869335192762, "loss": 0.0188, "step": 170570 }, { "epoch": 0.44, "learning_rate": 0.00023367480513555617, "loss": 0.0243, "step": 170580 }, { "epoch": 0.44, "learning_rate": 0.0002336709169191847, "loss": 0.015, "step": 170590 }, { "epoch": 0.44, "learning_rate": 0.00023366702870281322, "loss": 0.0187, "step": 170600 }, { "epoch": 0.44, "learning_rate": 0.00023366314048644176, "loss": 0.0203, "step": 170610 }, { "epoch": 0.44, "learning_rate": 0.0002336592522700703, "loss": 0.0165, "step": 170620 }, { "epoch": 0.44, "learning_rate": 0.00023365536405369885, "loss": 0.0216, "step": 170630 }, { "epoch": 0.44, "learning_rate": 0.00023365147583732736, "loss": 0.0196, "step": 170640 }, { "epoch": 0.44, "learning_rate": 0.0002336475876209559, "loss": 0.0161, "step": 170650 }, { "epoch": 0.44, "learning_rate": 0.00023364369940458447, "loss": 0.0215, "step": 170660 }, { "epoch": 0.44, "learning_rate": 0.00023363981118821299, "loss": 0.0151, "step": 170670 }, { "epoch": 0.44, "learning_rate": 0.00023363592297184153, "loss": 0.0158, "step": 170680 }, { "epoch": 0.44, "learning_rate": 0.00023363203475547004, "loss": 0.0197, "step": 170690 }, { "epoch": 0.44, "learning_rate": 0.00023362814653909858, "loss": 0.0171, "step": 170700 }, { "epoch": 0.44, "learning_rate": 0.00023362425832272713, "loss": 0.0188, "step": 170710 }, { "epoch": 0.44, "learning_rate": 0.00023362037010635567, "loss": 0.0202, "step": 170720 }, { "epoch": 0.44, "learning_rate": 0.00023361648188998418, "loss": 0.0228, "step": 170730 }, { "epoch": 0.44, "learning_rate": 0.00023361259367361272, "loss": 0.0191, "step": 170740 }, { "epoch": 0.44, "learning_rate": 0.00023360870545724127, "loss": 0.0186, "step": 170750 }, { "epoch": 0.44, "learning_rate": 0.0002336048172408698, "loss": 0.0246, "step": 170760 }, { "epoch": 0.44, "learning_rate": 0.00023360092902449832, "loss": 0.0233, "step": 170770 }, { "epoch": 0.44, "learning_rate": 0.00023359704080812686, "loss": 0.0202, "step": 170780 }, { "epoch": 0.44, "learning_rate": 0.0002335931525917554, "loss": 0.0181, "step": 170790 }, { "epoch": 0.44, "learning_rate": 0.00023358926437538395, "loss": 0.0171, "step": 170800 }, { "epoch": 0.44, "learning_rate": 0.00023358537615901246, "loss": 0.0248, "step": 170810 }, { "epoch": 0.44, "learning_rate": 0.000233581487942641, "loss": 0.0182, "step": 170820 }, { "epoch": 0.44, "learning_rate": 0.00023357759972626957, "loss": 0.0139, "step": 170830 }, { "epoch": 0.44, "learning_rate": 0.00023357371150989809, "loss": 0.0191, "step": 170840 }, { "epoch": 0.44, "learning_rate": 0.00023356982329352663, "loss": 0.0144, "step": 170850 }, { "epoch": 0.44, "learning_rate": 0.00023356593507715514, "loss": 0.0172, "step": 170860 }, { "epoch": 0.44, "learning_rate": 0.0002335620468607837, "loss": 0.0173, "step": 170870 }, { "epoch": 0.44, "learning_rate": 0.00023355815864441223, "loss": 0.0141, "step": 170880 }, { "epoch": 0.44, "learning_rate": 0.00023355427042804077, "loss": 0.0195, "step": 170890 }, { "epoch": 0.44, "learning_rate": 0.00023355038221166928, "loss": 0.0196, "step": 170900 }, { "epoch": 0.44, "learning_rate": 0.00023354649399529785, "loss": 0.0181, "step": 170910 }, { "epoch": 0.44, "learning_rate": 0.00023354260577892636, "loss": 0.0169, "step": 170920 }, { "epoch": 0.44, "learning_rate": 0.0002335387175625549, "loss": 0.0175, "step": 170930 }, { "epoch": 0.44, "learning_rate": 0.00023353482934618342, "loss": 0.0145, "step": 170940 }, { "epoch": 0.44, "learning_rate": 0.00023353094112981196, "loss": 0.0165, "step": 170950 }, { "epoch": 0.44, "learning_rate": 0.0002335270529134405, "loss": 0.0284, "step": 170960 }, { "epoch": 0.44, "learning_rate": 0.00023352316469706905, "loss": 0.0172, "step": 170970 }, { "epoch": 0.44, "learning_rate": 0.00023351927648069756, "loss": 0.0187, "step": 170980 }, { "epoch": 0.44, "learning_rate": 0.0002335153882643261, "loss": 0.017, "step": 170990 }, { "epoch": 0.44, "learning_rate": 0.00023351150004795467, "loss": 0.026, "step": 171000 }, { "epoch": 0.44, "eval_cer": 0.8818006609085604, "eval_loss": 0.01254571508616209, "eval_runtime": 108.0306, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 171000 }, { "epoch": 0.44, "learning_rate": 0.00023350761183158319, "loss": 0.0176, "step": 171010 }, { "epoch": 0.44, "learning_rate": 0.0002335037236152117, "loss": 0.0204, "step": 171020 }, { "epoch": 0.44, "learning_rate": 0.00023349983539884024, "loss": 0.0178, "step": 171030 }, { "epoch": 0.44, "learning_rate": 0.0002334959471824688, "loss": 0.0205, "step": 171040 }, { "epoch": 0.44, "learning_rate": 0.00023349205896609732, "loss": 0.0237, "step": 171050 }, { "epoch": 0.44, "learning_rate": 0.00023348817074972587, "loss": 0.0196, "step": 171060 }, { "epoch": 0.44, "learning_rate": 0.00023348428253335438, "loss": 0.0188, "step": 171070 }, { "epoch": 0.44, "learning_rate": 0.00023348039431698295, "loss": 0.0146, "step": 171080 }, { "epoch": 0.44, "learning_rate": 0.00023347650610061146, "loss": 0.0247, "step": 171090 }, { "epoch": 0.44, "learning_rate": 0.00023347261788424, "loss": 0.0167, "step": 171100 }, { "epoch": 0.44, "learning_rate": 0.00023346872966786852, "loss": 0.018, "step": 171110 }, { "epoch": 0.44, "learning_rate": 0.0002334648414514971, "loss": 0.0149, "step": 171120 }, { "epoch": 0.44, "learning_rate": 0.0002334609532351256, "loss": 0.018, "step": 171130 }, { "epoch": 0.44, "learning_rate": 0.00023345706501875415, "loss": 0.0203, "step": 171140 }, { "epoch": 0.44, "learning_rate": 0.00023345317680238266, "loss": 0.0205, "step": 171150 }, { "epoch": 0.44, "learning_rate": 0.00023344928858601123, "loss": 0.0176, "step": 171160 }, { "epoch": 0.44, "learning_rate": 0.00023344540036963977, "loss": 0.0144, "step": 171170 }, { "epoch": 0.44, "learning_rate": 0.00023344151215326828, "loss": 0.0222, "step": 171180 }, { "epoch": 0.44, "learning_rate": 0.0002334376239368968, "loss": 0.0179, "step": 171190 }, { "epoch": 0.44, "learning_rate": 0.00023343373572052534, "loss": 0.024, "step": 171200 }, { "epoch": 0.44, "learning_rate": 0.0002334298475041539, "loss": 0.0185, "step": 171210 }, { "epoch": 0.44, "learning_rate": 0.00023342595928778242, "loss": 0.0163, "step": 171220 }, { "epoch": 0.44, "learning_rate": 0.00023342207107141097, "loss": 0.0166, "step": 171230 }, { "epoch": 0.44, "learning_rate": 0.00023341818285503948, "loss": 0.0162, "step": 171240 }, { "epoch": 0.44, "learning_rate": 0.00023341429463866805, "loss": 0.0183, "step": 171250 }, { "epoch": 0.44, "learning_rate": 0.00023341040642229656, "loss": 0.0174, "step": 171260 }, { "epoch": 0.44, "learning_rate": 0.0002334065182059251, "loss": 0.0166, "step": 171270 }, { "epoch": 0.44, "learning_rate": 0.00023340262998955362, "loss": 0.0172, "step": 171280 }, { "epoch": 0.44, "learning_rate": 0.0002333987417731822, "loss": 0.0289, "step": 171290 }, { "epoch": 0.44, "learning_rate": 0.0002333948535568107, "loss": 0.0197, "step": 171300 }, { "epoch": 0.44, "learning_rate": 0.00023339096534043924, "loss": 0.0199, "step": 171310 }, { "epoch": 0.44, "learning_rate": 0.00023338707712406776, "loss": 0.0169, "step": 171320 }, { "epoch": 0.44, "learning_rate": 0.00023338318890769633, "loss": 0.0207, "step": 171330 }, { "epoch": 0.44, "learning_rate": 0.00023337930069132484, "loss": 0.0185, "step": 171340 }, { "epoch": 0.44, "learning_rate": 0.00023337541247495338, "loss": 0.0221, "step": 171350 }, { "epoch": 0.44, "learning_rate": 0.0002333715242585819, "loss": 0.0223, "step": 171360 }, { "epoch": 0.44, "learning_rate": 0.00023336763604221047, "loss": 0.0229, "step": 171370 }, { "epoch": 0.44, "learning_rate": 0.000233363747825839, "loss": 0.0209, "step": 171380 }, { "epoch": 0.44, "learning_rate": 0.00023335985960946752, "loss": 0.023, "step": 171390 }, { "epoch": 0.44, "learning_rate": 0.00023335597139309607, "loss": 0.0182, "step": 171400 }, { "epoch": 0.44, "learning_rate": 0.0002333520831767246, "loss": 0.0183, "step": 171410 }, { "epoch": 0.44, "learning_rate": 0.00023334819496035315, "loss": 0.0161, "step": 171420 }, { "epoch": 0.44, "learning_rate": 0.00023334430674398166, "loss": 0.0153, "step": 171430 }, { "epoch": 0.44, "learning_rate": 0.0002333404185276102, "loss": 0.0218, "step": 171440 }, { "epoch": 0.44, "learning_rate": 0.00023333653031123872, "loss": 0.0181, "step": 171450 }, { "epoch": 0.44, "learning_rate": 0.0002333326420948673, "loss": 0.0193, "step": 171460 }, { "epoch": 0.44, "learning_rate": 0.0002333287538784958, "loss": 0.0195, "step": 171470 }, { "epoch": 0.44, "learning_rate": 0.00023332486566212434, "loss": 0.0167, "step": 171480 }, { "epoch": 0.44, "learning_rate": 0.00023332097744575286, "loss": 0.0185, "step": 171490 }, { "epoch": 0.44, "learning_rate": 0.00023331708922938143, "loss": 0.0195, "step": 171500 }, { "epoch": 0.44, "learning_rate": 0.00023331320101300994, "loss": 0.018, "step": 171510 }, { "epoch": 0.44, "learning_rate": 0.00023330931279663848, "loss": 0.0159, "step": 171520 }, { "epoch": 0.44, "learning_rate": 0.000233305424580267, "loss": 0.0195, "step": 171530 }, { "epoch": 0.44, "learning_rate": 0.00023330153636389557, "loss": 0.0143, "step": 171540 }, { "epoch": 0.44, "learning_rate": 0.0002332976481475241, "loss": 0.0152, "step": 171550 }, { "epoch": 0.44, "learning_rate": 0.00023329375993115262, "loss": 0.014, "step": 171560 }, { "epoch": 0.44, "learning_rate": 0.00023328987171478116, "loss": 0.0214, "step": 171570 }, { "epoch": 0.44, "learning_rate": 0.0002332859834984097, "loss": 0.017, "step": 171580 }, { "epoch": 0.44, "learning_rate": 0.00023328209528203825, "loss": 0.0199, "step": 171590 }, { "epoch": 0.44, "learning_rate": 0.00023327820706566676, "loss": 0.0138, "step": 171600 }, { "epoch": 0.44, "learning_rate": 0.0002332743188492953, "loss": 0.0182, "step": 171610 }, { "epoch": 0.44, "learning_rate": 0.00023327043063292385, "loss": 0.0169, "step": 171620 }, { "epoch": 0.44, "learning_rate": 0.0002332665424165524, "loss": 0.0187, "step": 171630 }, { "epoch": 0.44, "learning_rate": 0.0002332626542001809, "loss": 0.0198, "step": 171640 }, { "epoch": 0.44, "learning_rate": 0.00023325876598380944, "loss": 0.0174, "step": 171650 }, { "epoch": 0.44, "learning_rate": 0.00023325487776743799, "loss": 0.0166, "step": 171660 }, { "epoch": 0.44, "learning_rate": 0.00023325098955106653, "loss": 0.0188, "step": 171670 }, { "epoch": 0.45, "learning_rate": 0.00023324710133469504, "loss": 0.0259, "step": 171680 }, { "epoch": 0.45, "learning_rate": 0.00023324321311832358, "loss": 0.0181, "step": 171690 }, { "epoch": 0.45, "learning_rate": 0.0002332393249019521, "loss": 0.0199, "step": 171700 }, { "epoch": 0.45, "learning_rate": 0.00023323543668558067, "loss": 0.018, "step": 171710 }, { "epoch": 0.45, "learning_rate": 0.0002332315484692092, "loss": 0.0171, "step": 171720 }, { "epoch": 0.45, "learning_rate": 0.00023322766025283772, "loss": 0.0203, "step": 171730 }, { "epoch": 0.45, "learning_rate": 0.00023322377203646624, "loss": 0.0241, "step": 171740 }, { "epoch": 0.45, "learning_rate": 0.0002332198838200948, "loss": 0.0197, "step": 171750 }, { "epoch": 0.45, "learning_rate": 0.00023321599560372335, "loss": 0.0187, "step": 171760 }, { "epoch": 0.45, "learning_rate": 0.00023321210738735186, "loss": 0.0182, "step": 171770 }, { "epoch": 0.45, "learning_rate": 0.0002332082191709804, "loss": 0.0185, "step": 171780 }, { "epoch": 0.45, "learning_rate": 0.00023320433095460895, "loss": 0.0159, "step": 171790 }, { "epoch": 0.45, "learning_rate": 0.0002332004427382375, "loss": 0.0182, "step": 171800 }, { "epoch": 0.45, "learning_rate": 0.000233196554521866, "loss": 0.0174, "step": 171810 }, { "epoch": 0.45, "learning_rate": 0.00023319266630549454, "loss": 0.0169, "step": 171820 }, { "epoch": 0.45, "learning_rate": 0.00023318877808912308, "loss": 0.0164, "step": 171830 }, { "epoch": 0.45, "learning_rate": 0.00023318488987275163, "loss": 0.0165, "step": 171840 }, { "epoch": 0.45, "learning_rate": 0.00023318100165638014, "loss": 0.0163, "step": 171850 }, { "epoch": 0.45, "learning_rate": 0.00023317711344000868, "loss": 0.021, "step": 171860 }, { "epoch": 0.45, "learning_rate": 0.00023317322522363725, "loss": 0.0171, "step": 171870 }, { "epoch": 0.45, "learning_rate": 0.00023316933700726577, "loss": 0.0175, "step": 171880 }, { "epoch": 0.45, "learning_rate": 0.00023316544879089428, "loss": 0.0202, "step": 171890 }, { "epoch": 0.45, "learning_rate": 0.00023316156057452282, "loss": 0.0198, "step": 171900 }, { "epoch": 0.45, "learning_rate": 0.0002331576723581514, "loss": 0.0214, "step": 171910 }, { "epoch": 0.45, "learning_rate": 0.0002331537841417799, "loss": 0.0177, "step": 171920 }, { "epoch": 0.45, "learning_rate": 0.00023314989592540845, "loss": 0.0156, "step": 171930 }, { "epoch": 0.45, "learning_rate": 0.00023314600770903696, "loss": 0.0187, "step": 171940 }, { "epoch": 0.45, "learning_rate": 0.0002331421194926655, "loss": 0.0184, "step": 171950 }, { "epoch": 0.45, "learning_rate": 0.00023313823127629404, "loss": 0.0213, "step": 171960 }, { "epoch": 0.45, "learning_rate": 0.00023313434305992259, "loss": 0.0183, "step": 171970 }, { "epoch": 0.45, "learning_rate": 0.0002331304548435511, "loss": 0.0243, "step": 171980 }, { "epoch": 0.45, "learning_rate": 0.00023312656662717964, "loss": 0.0199, "step": 171990 }, { "epoch": 0.45, "learning_rate": 0.00023312267841080818, "loss": 0.0185, "step": 172000 }, { "epoch": 0.45, "eval_cer": 0.881782465628416, "eval_loss": 0.012556556612253189, "eval_runtime": 107.2056, "eval_samples_per_second": 18.656, "eval_steps_per_second": 4.664, "step": 172000 }, { "epoch": 0.45, "learning_rate": 0.00023311879019443673, "loss": 0.0217, "step": 172010 }, { "epoch": 0.45, "learning_rate": 0.00023311490197806524, "loss": 0.0176, "step": 172020 }, { "epoch": 0.45, "learning_rate": 0.00023311101376169378, "loss": 0.0182, "step": 172030 }, { "epoch": 0.45, "learning_rate": 0.00023310712554532235, "loss": 0.0225, "step": 172040 }, { "epoch": 0.45, "learning_rate": 0.00023310323732895087, "loss": 0.0164, "step": 172050 }, { "epoch": 0.45, "learning_rate": 0.00023309934911257938, "loss": 0.0172, "step": 172060 }, { "epoch": 0.45, "learning_rate": 0.00023309546089620792, "loss": 0.0199, "step": 172070 }, { "epoch": 0.45, "learning_rate": 0.0002330915726798365, "loss": 0.021, "step": 172080 }, { "epoch": 0.45, "learning_rate": 0.000233087684463465, "loss": 0.0174, "step": 172090 }, { "epoch": 0.45, "learning_rate": 0.00023308379624709355, "loss": 0.0191, "step": 172100 }, { "epoch": 0.45, "learning_rate": 0.00023307990803072206, "loss": 0.0152, "step": 172110 }, { "epoch": 0.45, "learning_rate": 0.00023307601981435063, "loss": 0.0177, "step": 172120 }, { "epoch": 0.45, "learning_rate": 0.00023307213159797914, "loss": 0.0183, "step": 172130 }, { "epoch": 0.45, "learning_rate": 0.00023306824338160769, "loss": 0.0203, "step": 172140 }, { "epoch": 0.45, "learning_rate": 0.0002330643551652362, "loss": 0.0175, "step": 172150 }, { "epoch": 0.45, "learning_rate": 0.00023306046694886477, "loss": 0.0183, "step": 172160 }, { "epoch": 0.45, "learning_rate": 0.00023305657873249328, "loss": 0.0215, "step": 172170 }, { "epoch": 0.45, "learning_rate": 0.00023305269051612183, "loss": 0.0185, "step": 172180 }, { "epoch": 0.45, "learning_rate": 0.00023304880229975034, "loss": 0.0155, "step": 172190 }, { "epoch": 0.45, "learning_rate": 0.00023304491408337888, "loss": 0.0203, "step": 172200 }, { "epoch": 0.45, "learning_rate": 0.00023304102586700742, "loss": 0.0216, "step": 172210 }, { "epoch": 0.45, "learning_rate": 0.00023303713765063596, "loss": 0.0205, "step": 172220 }, { "epoch": 0.45, "learning_rate": 0.00023303324943426448, "loss": 0.0165, "step": 172230 }, { "epoch": 0.45, "learning_rate": 0.00023302936121789302, "loss": 0.0181, "step": 172240 }, { "epoch": 0.45, "learning_rate": 0.0002330254730015216, "loss": 0.0171, "step": 172250 }, { "epoch": 0.45, "learning_rate": 0.0002330215847851501, "loss": 0.0163, "step": 172260 }, { "epoch": 0.45, "learning_rate": 0.00023301769656877865, "loss": 0.0189, "step": 172270 }, { "epoch": 0.45, "learning_rate": 0.00023301380835240716, "loss": 0.019, "step": 172280 }, { "epoch": 0.45, "learning_rate": 0.00023300992013603573, "loss": 0.0148, "step": 172290 }, { "epoch": 0.45, "learning_rate": 0.00023300603191966424, "loss": 0.0196, "step": 172300 }, { "epoch": 0.45, "learning_rate": 0.00023300214370329279, "loss": 0.0196, "step": 172310 }, { "epoch": 0.45, "learning_rate": 0.0002329982554869213, "loss": 0.0189, "step": 172320 }, { "epoch": 0.45, "learning_rate": 0.00023299436727054987, "loss": 0.0174, "step": 172330 }, { "epoch": 0.45, "learning_rate": 0.00023299047905417838, "loss": 0.0191, "step": 172340 }, { "epoch": 0.45, "learning_rate": 0.00023298659083780692, "loss": 0.0222, "step": 172350 }, { "epoch": 0.45, "learning_rate": 0.00023298270262143544, "loss": 0.0213, "step": 172360 }, { "epoch": 0.45, "learning_rate": 0.000232978814405064, "loss": 0.0175, "step": 172370 }, { "epoch": 0.45, "learning_rate": 0.00023297492618869252, "loss": 0.0186, "step": 172380 }, { "epoch": 0.45, "learning_rate": 0.00023297103797232106, "loss": 0.0182, "step": 172390 }, { "epoch": 0.45, "learning_rate": 0.00023296714975594958, "loss": 0.0208, "step": 172400 }, { "epoch": 0.45, "learning_rate": 0.00023296326153957815, "loss": 0.02, "step": 172410 }, { "epoch": 0.45, "learning_rate": 0.0002329593733232067, "loss": 0.0149, "step": 172420 }, { "epoch": 0.45, "learning_rate": 0.0002329554851068352, "loss": 0.0174, "step": 172430 }, { "epoch": 0.45, "learning_rate": 0.00023295159689046374, "loss": 0.0218, "step": 172440 }, { "epoch": 0.45, "learning_rate": 0.00023294770867409226, "loss": 0.0181, "step": 172450 }, { "epoch": 0.45, "learning_rate": 0.00023294382045772083, "loss": 0.0166, "step": 172460 }, { "epoch": 0.45, "learning_rate": 0.00023293993224134934, "loss": 0.0174, "step": 172470 }, { "epoch": 0.45, "learning_rate": 0.00023293604402497788, "loss": 0.0167, "step": 172480 }, { "epoch": 0.45, "learning_rate": 0.0002329321558086064, "loss": 0.0162, "step": 172490 }, { "epoch": 0.45, "learning_rate": 0.00023292826759223497, "loss": 0.0159, "step": 172500 }, { "epoch": 0.45, "learning_rate": 0.00023292437937586348, "loss": 0.0159, "step": 172510 }, { "epoch": 0.45, "learning_rate": 0.00023292049115949202, "loss": 0.0188, "step": 172520 }, { "epoch": 0.45, "learning_rate": 0.00023291660294312054, "loss": 0.0213, "step": 172530 }, { "epoch": 0.45, "learning_rate": 0.0002329127147267491, "loss": 0.018, "step": 172540 }, { "epoch": 0.45, "learning_rate": 0.00023290882651037762, "loss": 0.0167, "step": 172550 }, { "epoch": 0.45, "learning_rate": 0.00023290493829400616, "loss": 0.0201, "step": 172560 }, { "epoch": 0.45, "learning_rate": 0.00023290105007763468, "loss": 0.0186, "step": 172570 }, { "epoch": 0.45, "learning_rate": 0.00023289716186126325, "loss": 0.0165, "step": 172580 }, { "epoch": 0.45, "learning_rate": 0.0002328932736448918, "loss": 0.021, "step": 172590 }, { "epoch": 0.45, "learning_rate": 0.0002328893854285203, "loss": 0.0157, "step": 172600 }, { "epoch": 0.45, "learning_rate": 0.00023288549721214882, "loss": 0.0164, "step": 172610 }, { "epoch": 0.45, "learning_rate": 0.00023288160899577739, "loss": 0.0198, "step": 172620 }, { "epoch": 0.45, "learning_rate": 0.00023287772077940593, "loss": 0.0312, "step": 172630 }, { "epoch": 0.45, "learning_rate": 0.00023287383256303444, "loss": 0.017, "step": 172640 }, { "epoch": 0.45, "learning_rate": 0.00023286994434666298, "loss": 0.0199, "step": 172650 }, { "epoch": 0.45, "learning_rate": 0.00023286605613029153, "loss": 0.0209, "step": 172660 }, { "epoch": 0.45, "learning_rate": 0.00023286216791392007, "loss": 0.0205, "step": 172670 }, { "epoch": 0.45, "learning_rate": 0.00023285827969754858, "loss": 0.0233, "step": 172680 }, { "epoch": 0.45, "learning_rate": 0.00023285439148117712, "loss": 0.0148, "step": 172690 }, { "epoch": 0.45, "learning_rate": 0.00023285050326480564, "loss": 0.02, "step": 172700 }, { "epoch": 0.45, "learning_rate": 0.0002328466150484342, "loss": 0.019, "step": 172710 }, { "epoch": 0.45, "learning_rate": 0.00023284272683206272, "loss": 0.0178, "step": 172720 }, { "epoch": 0.45, "learning_rate": 0.00023283883861569126, "loss": 0.0187, "step": 172730 }, { "epoch": 0.45, "learning_rate": 0.00023283495039931978, "loss": 0.017, "step": 172740 }, { "epoch": 0.45, "learning_rate": 0.00023283106218294835, "loss": 0.0281, "step": 172750 }, { "epoch": 0.45, "learning_rate": 0.0002328271739665769, "loss": 0.0165, "step": 172760 }, { "epoch": 0.45, "learning_rate": 0.0002328232857502054, "loss": 0.0168, "step": 172770 }, { "epoch": 0.45, "learning_rate": 0.00023281939753383392, "loss": 0.0176, "step": 172780 }, { "epoch": 0.45, "learning_rate": 0.00023281550931746249, "loss": 0.0187, "step": 172790 }, { "epoch": 0.45, "learning_rate": 0.00023281162110109103, "loss": 0.0162, "step": 172800 }, { "epoch": 0.45, "learning_rate": 0.00023280773288471954, "loss": 0.018, "step": 172810 }, { "epoch": 0.45, "learning_rate": 0.00023280384466834808, "loss": 0.0198, "step": 172820 }, { "epoch": 0.45, "learning_rate": 0.00023279995645197662, "loss": 0.0167, "step": 172830 }, { "epoch": 0.45, "learning_rate": 0.00023279606823560517, "loss": 0.0204, "step": 172840 }, { "epoch": 0.45, "learning_rate": 0.00023279218001923368, "loss": 0.0231, "step": 172850 }, { "epoch": 0.45, "learning_rate": 0.00023278829180286222, "loss": 0.0175, "step": 172860 }, { "epoch": 0.45, "learning_rate": 0.00023278440358649076, "loss": 0.0185, "step": 172870 }, { "epoch": 0.45, "learning_rate": 0.0002327805153701193, "loss": 0.0189, "step": 172880 }, { "epoch": 0.45, "learning_rate": 0.00023277662715374782, "loss": 0.0204, "step": 172890 }, { "epoch": 0.45, "learning_rate": 0.00023277273893737636, "loss": 0.0194, "step": 172900 }, { "epoch": 0.45, "learning_rate": 0.00023276885072100493, "loss": 0.0232, "step": 172910 }, { "epoch": 0.45, "learning_rate": 0.00023276496250463345, "loss": 0.0182, "step": 172920 }, { "epoch": 0.45, "learning_rate": 0.00023276107428826196, "loss": 0.0191, "step": 172930 }, { "epoch": 0.45, "learning_rate": 0.0002327571860718905, "loss": 0.019, "step": 172940 }, { "epoch": 0.45, "learning_rate": 0.00023275329785551902, "loss": 0.0198, "step": 172950 }, { "epoch": 0.45, "learning_rate": 0.00023274940963914758, "loss": 0.0182, "step": 172960 }, { "epoch": 0.45, "learning_rate": 0.00023274552142277613, "loss": 0.0166, "step": 172970 }, { "epoch": 0.45, "learning_rate": 0.00023274163320640464, "loss": 0.019, "step": 172980 }, { "epoch": 0.45, "learning_rate": 0.00023273774499003318, "loss": 0.0215, "step": 172990 }, { "epoch": 0.45, "learning_rate": 0.00023273385677366172, "loss": 0.0188, "step": 173000 }, { "epoch": 0.45, "eval_cer": 0.8818034601824287, "eval_loss": 0.012683995999395847, "eval_runtime": 108.0649, "eval_samples_per_second": 18.507, "eval_steps_per_second": 4.627, "step": 173000 }, { "epoch": 0.45, "learning_rate": 0.00023272996855729027, "loss": 0.0206, "step": 173010 }, { "epoch": 0.45, "learning_rate": 0.00023272608034091878, "loss": 0.0142, "step": 173020 }, { "epoch": 0.45, "learning_rate": 0.00023272219212454732, "loss": 0.0215, "step": 173030 }, { "epoch": 0.45, "learning_rate": 0.00023271830390817586, "loss": 0.0168, "step": 173040 }, { "epoch": 0.45, "learning_rate": 0.0002327144156918044, "loss": 0.0201, "step": 173050 }, { "epoch": 0.45, "learning_rate": 0.00023271052747543292, "loss": 0.019, "step": 173060 }, { "epoch": 0.45, "learning_rate": 0.00023270663925906146, "loss": 0.0171, "step": 173070 }, { "epoch": 0.45, "learning_rate": 0.00023270275104269, "loss": 0.0198, "step": 173080 }, { "epoch": 0.45, "learning_rate": 0.00023269886282631854, "loss": 0.018, "step": 173090 }, { "epoch": 0.45, "learning_rate": 0.00023269497460994706, "loss": 0.0503, "step": 173100 }, { "epoch": 0.45, "learning_rate": 0.0002326910863935756, "loss": 0.0203, "step": 173110 }, { "epoch": 0.45, "learning_rate": 0.00023268719817720417, "loss": 0.0205, "step": 173120 }, { "epoch": 0.45, "learning_rate": 0.00023268330996083268, "loss": 0.0172, "step": 173130 }, { "epoch": 0.45, "learning_rate": 0.00023267942174446123, "loss": 0.0181, "step": 173140 }, { "epoch": 0.45, "learning_rate": 0.00023267553352808974, "loss": 0.0167, "step": 173150 }, { "epoch": 0.45, "learning_rate": 0.0002326716453117183, "loss": 0.0181, "step": 173160 }, { "epoch": 0.45, "learning_rate": 0.00023266775709534682, "loss": 0.0169, "step": 173170 }, { "epoch": 0.45, "learning_rate": 0.00023266386887897537, "loss": 0.019, "step": 173180 }, { "epoch": 0.45, "learning_rate": 0.00023265998066260388, "loss": 0.0198, "step": 173190 }, { "epoch": 0.45, "learning_rate": 0.00023265609244623242, "loss": 0.0179, "step": 173200 }, { "epoch": 0.45, "learning_rate": 0.00023265220422986096, "loss": 0.0185, "step": 173210 }, { "epoch": 0.45, "learning_rate": 0.0002326483160134895, "loss": 0.0216, "step": 173220 }, { "epoch": 0.45, "learning_rate": 0.00023264442779711802, "loss": 0.0185, "step": 173230 }, { "epoch": 0.45, "learning_rate": 0.00023264053958074656, "loss": 0.0161, "step": 173240 }, { "epoch": 0.45, "learning_rate": 0.0002326366513643751, "loss": 0.0188, "step": 173250 }, { "epoch": 0.45, "learning_rate": 0.00023263276314800364, "loss": 0.0205, "step": 173260 }, { "epoch": 0.45, "learning_rate": 0.00023262887493163216, "loss": 0.0172, "step": 173270 }, { "epoch": 0.45, "learning_rate": 0.0002326249867152607, "loss": 0.014, "step": 173280 }, { "epoch": 0.45, "learning_rate": 0.00023262109849888927, "loss": 0.0181, "step": 173290 }, { "epoch": 0.45, "learning_rate": 0.00023261721028251778, "loss": 0.0177, "step": 173300 }, { "epoch": 0.45, "learning_rate": 0.00023261332206614633, "loss": 0.0165, "step": 173310 }, { "epoch": 0.45, "learning_rate": 0.00023260943384977484, "loss": 0.0182, "step": 173320 }, { "epoch": 0.45, "learning_rate": 0.0002326055456334034, "loss": 0.0162, "step": 173330 }, { "epoch": 0.45, "learning_rate": 0.00023260165741703192, "loss": 0.0194, "step": 173340 }, { "epoch": 0.45, "learning_rate": 0.00023259776920066046, "loss": 0.0171, "step": 173350 }, { "epoch": 0.45, "learning_rate": 0.00023259388098428898, "loss": 0.0191, "step": 173360 }, { "epoch": 0.45, "learning_rate": 0.00023258999276791755, "loss": 0.0188, "step": 173370 }, { "epoch": 0.45, "learning_rate": 0.00023258610455154606, "loss": 0.0165, "step": 173380 }, { "epoch": 0.45, "learning_rate": 0.0002325822163351746, "loss": 0.0176, "step": 173390 }, { "epoch": 0.45, "learning_rate": 0.00023257832811880312, "loss": 0.0171, "step": 173400 }, { "epoch": 0.45, "learning_rate": 0.0002325744399024317, "loss": 0.0211, "step": 173410 }, { "epoch": 0.45, "learning_rate": 0.0002325705516860602, "loss": 0.0199, "step": 173420 }, { "epoch": 0.45, "learning_rate": 0.00023256666346968874, "loss": 0.0156, "step": 173430 }, { "epoch": 0.45, "learning_rate": 0.00023256277525331726, "loss": 0.0203, "step": 173440 }, { "epoch": 0.45, "learning_rate": 0.0002325588870369458, "loss": 0.0208, "step": 173450 }, { "epoch": 0.45, "learning_rate": 0.00023255499882057437, "loss": 0.0227, "step": 173460 }, { "epoch": 0.45, "learning_rate": 0.00023255111060420288, "loss": 0.0188, "step": 173470 }, { "epoch": 0.45, "learning_rate": 0.0002325472223878314, "loss": 0.0134, "step": 173480 }, { "epoch": 0.45, "learning_rate": 0.00023254333417145994, "loss": 0.016, "step": 173490 }, { "epoch": 0.45, "learning_rate": 0.0002325394459550885, "loss": 0.016, "step": 173500 }, { "epoch": 0.45, "learning_rate": 0.00023253555773871702, "loss": 0.0186, "step": 173510 }, { "epoch": 0.45, "learning_rate": 0.00023253166952234556, "loss": 0.0208, "step": 173520 }, { "epoch": 0.45, "learning_rate": 0.00023252778130597408, "loss": 0.0171, "step": 173530 }, { "epoch": 0.45, "learning_rate": 0.00023252389308960265, "loss": 0.0172, "step": 173540 }, { "epoch": 0.45, "learning_rate": 0.00023252000487323116, "loss": 0.0198, "step": 173550 }, { "epoch": 0.45, "learning_rate": 0.0002325161166568597, "loss": 0.0193, "step": 173560 }, { "epoch": 0.45, "learning_rate": 0.00023251222844048822, "loss": 0.0227, "step": 173570 }, { "epoch": 0.45, "learning_rate": 0.0002325083402241168, "loss": 0.017, "step": 173580 }, { "epoch": 0.45, "learning_rate": 0.0002325044520077453, "loss": 0.0239, "step": 173590 }, { "epoch": 0.45, "learning_rate": 0.00023250056379137384, "loss": 0.0177, "step": 173600 }, { "epoch": 0.45, "learning_rate": 0.00023249667557500236, "loss": 0.0245, "step": 173610 }, { "epoch": 0.45, "learning_rate": 0.00023249278735863093, "loss": 0.0166, "step": 173620 }, { "epoch": 0.45, "learning_rate": 0.00023248889914225947, "loss": 0.0201, "step": 173630 }, { "epoch": 0.45, "learning_rate": 0.00023248501092588798, "loss": 0.0167, "step": 173640 }, { "epoch": 0.45, "learning_rate": 0.0002324811227095165, "loss": 0.016, "step": 173650 }, { "epoch": 0.45, "learning_rate": 0.00023247723449314507, "loss": 0.0185, "step": 173660 }, { "epoch": 0.45, "learning_rate": 0.0002324733462767736, "loss": 0.018, "step": 173670 }, { "epoch": 0.45, "learning_rate": 0.00023246945806040212, "loss": 0.018, "step": 173680 }, { "epoch": 0.45, "learning_rate": 0.00023246556984403066, "loss": 0.0172, "step": 173690 }, { "epoch": 0.45, "learning_rate": 0.00023246168162765918, "loss": 0.0192, "step": 173700 }, { "epoch": 0.45, "learning_rate": 0.00023245779341128775, "loss": 0.022, "step": 173710 }, { "epoch": 0.45, "learning_rate": 0.00023245390519491626, "loss": 0.0183, "step": 173720 }, { "epoch": 0.45, "learning_rate": 0.0002324500169785448, "loss": 0.0176, "step": 173730 }, { "epoch": 0.45, "learning_rate": 0.00023244612876217332, "loss": 0.0163, "step": 173740 }, { "epoch": 0.45, "learning_rate": 0.00023244224054580189, "loss": 0.0171, "step": 173750 }, { "epoch": 0.45, "learning_rate": 0.0002324383523294304, "loss": 0.0154, "step": 173760 }, { "epoch": 0.45, "learning_rate": 0.00023243446411305894, "loss": 0.0194, "step": 173770 }, { "epoch": 0.45, "learning_rate": 0.00023243057589668746, "loss": 0.0172, "step": 173780 }, { "epoch": 0.45, "learning_rate": 0.00023242668768031603, "loss": 0.0186, "step": 173790 }, { "epoch": 0.45, "learning_rate": 0.00023242279946394454, "loss": 0.017, "step": 173800 }, { "epoch": 0.45, "learning_rate": 0.00023241891124757308, "loss": 0.0189, "step": 173810 }, { "epoch": 0.45, "learning_rate": 0.0002324150230312016, "loss": 0.0149, "step": 173820 }, { "epoch": 0.45, "learning_rate": 0.00023241113481483017, "loss": 0.0181, "step": 173830 }, { "epoch": 0.45, "learning_rate": 0.0002324072465984587, "loss": 0.0245, "step": 173840 }, { "epoch": 0.45, "learning_rate": 0.00023240335838208722, "loss": 0.0163, "step": 173850 }, { "epoch": 0.45, "learning_rate": 0.00023239947016571576, "loss": 0.0176, "step": 173860 }, { "epoch": 0.45, "learning_rate": 0.0002323955819493443, "loss": 0.0196, "step": 173870 }, { "epoch": 0.45, "learning_rate": 0.00023239169373297285, "loss": 0.0186, "step": 173880 }, { "epoch": 0.45, "learning_rate": 0.00023238780551660136, "loss": 0.0161, "step": 173890 }, { "epoch": 0.45, "learning_rate": 0.0002323839173002299, "loss": 0.0188, "step": 173900 }, { "epoch": 0.45, "learning_rate": 0.00023238002908385844, "loss": 0.0216, "step": 173910 }, { "epoch": 0.45, "learning_rate": 0.00023237614086748699, "loss": 0.0148, "step": 173920 }, { "epoch": 0.45, "learning_rate": 0.0002323722526511155, "loss": 0.019, "step": 173930 }, { "epoch": 0.45, "learning_rate": 0.00023236836443474404, "loss": 0.021, "step": 173940 }, { "epoch": 0.45, "learning_rate": 0.00023236447621837256, "loss": 0.0169, "step": 173950 }, { "epoch": 0.45, "learning_rate": 0.00023236058800200113, "loss": 0.0119, "step": 173960 }, { "epoch": 0.45, "learning_rate": 0.00023235669978562964, "loss": 0.0181, "step": 173970 }, { "epoch": 0.45, "learning_rate": 0.00023235281156925818, "loss": 0.0174, "step": 173980 }, { "epoch": 0.45, "learning_rate": 0.0002323489233528867, "loss": 0.0195, "step": 173990 }, { "epoch": 0.45, "learning_rate": 0.00023234503513651526, "loss": 0.0179, "step": 174000 }, { "epoch": 0.45, "eval_cer": 0.8817922630869552, "eval_loss": 0.012246196158230305, "eval_runtime": 108.0303, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 174000 }, { "epoch": 0.45, "learning_rate": 0.0002323411469201438, "loss": 0.0174, "step": 174010 }, { "epoch": 0.45, "learning_rate": 0.00023233725870377232, "loss": 0.0171, "step": 174020 }, { "epoch": 0.45, "learning_rate": 0.00023233337048740086, "loss": 0.016, "step": 174030 }, { "epoch": 0.45, "learning_rate": 0.0002323294822710294, "loss": 0.0179, "step": 174040 }, { "epoch": 0.45, "learning_rate": 0.00023232559405465795, "loss": 0.0215, "step": 174050 }, { "epoch": 0.45, "learning_rate": 0.00023232170583828646, "loss": 0.0227, "step": 174060 }, { "epoch": 0.45, "learning_rate": 0.000232317817621915, "loss": 0.0187, "step": 174070 }, { "epoch": 0.45, "learning_rate": 0.00023231392940554354, "loss": 0.0179, "step": 174080 }, { "epoch": 0.45, "learning_rate": 0.00023231004118917209, "loss": 0.0169, "step": 174090 }, { "epoch": 0.45, "learning_rate": 0.0002323061529728006, "loss": 0.0211, "step": 174100 }, { "epoch": 0.45, "learning_rate": 0.00023230226475642914, "loss": 0.0183, "step": 174110 }, { "epoch": 0.45, "learning_rate": 0.00023229837654005768, "loss": 0.0167, "step": 174120 }, { "epoch": 0.45, "learning_rate": 0.00023229448832368622, "loss": 0.0233, "step": 174130 }, { "epoch": 0.45, "learning_rate": 0.00023229060010731474, "loss": 0.0187, "step": 174140 }, { "epoch": 0.45, "learning_rate": 0.00023228671189094328, "loss": 0.0199, "step": 174150 }, { "epoch": 0.45, "learning_rate": 0.00023228282367457185, "loss": 0.0201, "step": 174160 }, { "epoch": 0.45, "learning_rate": 0.00023227893545820036, "loss": 0.0183, "step": 174170 }, { "epoch": 0.45, "learning_rate": 0.0002322750472418289, "loss": 0.0211, "step": 174180 }, { "epoch": 0.45, "learning_rate": 0.00023227115902545742, "loss": 0.0209, "step": 174190 }, { "epoch": 0.45, "learning_rate": 0.00023226727080908593, "loss": 0.0183, "step": 174200 }, { "epoch": 0.45, "learning_rate": 0.0002322633825927145, "loss": 0.016, "step": 174210 }, { "epoch": 0.45, "learning_rate": 0.00023225949437634305, "loss": 0.0218, "step": 174220 }, { "epoch": 0.45, "learning_rate": 0.00023225560615997156, "loss": 0.0185, "step": 174230 }, { "epoch": 0.45, "learning_rate": 0.0002322517179436001, "loss": 0.02, "step": 174240 }, { "epoch": 0.45, "learning_rate": 0.00023224782972722864, "loss": 0.0144, "step": 174250 }, { "epoch": 0.45, "learning_rate": 0.00023224394151085718, "loss": 0.0167, "step": 174260 }, { "epoch": 0.45, "learning_rate": 0.0002322400532944857, "loss": 0.0176, "step": 174270 }, { "epoch": 0.45, "learning_rate": 0.00023223616507811424, "loss": 0.0179, "step": 174280 }, { "epoch": 0.45, "learning_rate": 0.00023223227686174278, "loss": 0.0166, "step": 174290 }, { "epoch": 0.45, "learning_rate": 0.00023222838864537132, "loss": 0.0161, "step": 174300 }, { "epoch": 0.45, "learning_rate": 0.00023222450042899984, "loss": 0.0183, "step": 174310 }, { "epoch": 0.45, "learning_rate": 0.00023222061221262838, "loss": 0.0227, "step": 174320 }, { "epoch": 0.45, "learning_rate": 0.00023221672399625695, "loss": 0.0145, "step": 174330 }, { "epoch": 0.45, "learning_rate": 0.00023221283577988546, "loss": 0.0182, "step": 174340 }, { "epoch": 0.45, "learning_rate": 0.000232208947563514, "loss": 0.0165, "step": 174350 }, { "epoch": 0.45, "learning_rate": 0.00023220505934714252, "loss": 0.0182, "step": 174360 }, { "epoch": 0.45, "learning_rate": 0.0002322011711307711, "loss": 0.0192, "step": 174370 }, { "epoch": 0.45, "learning_rate": 0.0002321972829143996, "loss": 0.0174, "step": 174380 }, { "epoch": 0.45, "learning_rate": 0.00023219339469802814, "loss": 0.0188, "step": 174390 }, { "epoch": 0.45, "learning_rate": 0.00023218950648165666, "loss": 0.0166, "step": 174400 }, { "epoch": 0.45, "learning_rate": 0.00023218561826528523, "loss": 0.0156, "step": 174410 }, { "epoch": 0.45, "learning_rate": 0.00023218173004891374, "loss": 0.018, "step": 174420 }, { "epoch": 0.45, "learning_rate": 0.00023217784183254228, "loss": 0.0165, "step": 174430 }, { "epoch": 0.45, "learning_rate": 0.0002321739536161708, "loss": 0.0189, "step": 174440 }, { "epoch": 0.45, "learning_rate": 0.00023217006539979934, "loss": 0.0147, "step": 174450 }, { "epoch": 0.45, "learning_rate": 0.00023216617718342788, "loss": 0.0177, "step": 174460 }, { "epoch": 0.45, "learning_rate": 0.00023216228896705642, "loss": 0.0144, "step": 174470 }, { "epoch": 0.45, "learning_rate": 0.00023215840075068494, "loss": 0.0149, "step": 174480 }, { "epoch": 0.45, "learning_rate": 0.00023215451253431348, "loss": 0.0183, "step": 174490 }, { "epoch": 0.45, "learning_rate": 0.00023215062431794205, "loss": 0.0206, "step": 174500 }, { "epoch": 0.45, "learning_rate": 0.00023214673610157056, "loss": 0.0188, "step": 174510 }, { "epoch": 0.45, "learning_rate": 0.00023214284788519908, "loss": 0.0176, "step": 174520 }, { "epoch": 0.45, "learning_rate": 0.00023213895966882762, "loss": 0.0243, "step": 174530 }, { "epoch": 0.45, "learning_rate": 0.0002321350714524562, "loss": 0.0175, "step": 174540 }, { "epoch": 0.45, "learning_rate": 0.0002321311832360847, "loss": 0.0183, "step": 174550 }, { "epoch": 0.45, "learning_rate": 0.00023212729501971324, "loss": 0.0169, "step": 174560 }, { "epoch": 0.45, "learning_rate": 0.00023212340680334176, "loss": 0.0205, "step": 174570 }, { "epoch": 0.45, "learning_rate": 0.00023211951858697033, "loss": 0.0156, "step": 174580 }, { "epoch": 0.45, "learning_rate": 0.00023211563037059884, "loss": 0.0149, "step": 174590 }, { "epoch": 0.45, "learning_rate": 0.00023211174215422738, "loss": 0.0162, "step": 174600 }, { "epoch": 0.45, "learning_rate": 0.0002321078539378559, "loss": 0.027, "step": 174610 }, { "epoch": 0.45, "learning_rate": 0.00023210396572148447, "loss": 0.0198, "step": 174620 }, { "epoch": 0.45, "learning_rate": 0.00023210007750511298, "loss": 0.0172, "step": 174630 }, { "epoch": 0.45, "learning_rate": 0.00023209618928874152, "loss": 0.0188, "step": 174640 }, { "epoch": 0.45, "learning_rate": 0.00023209230107237004, "loss": 0.0186, "step": 174650 }, { "epoch": 0.45, "learning_rate": 0.0002320884128559986, "loss": 0.0164, "step": 174660 }, { "epoch": 0.45, "learning_rate": 0.00023208452463962712, "loss": 0.0193, "step": 174670 }, { "epoch": 0.45, "learning_rate": 0.00023208063642325566, "loss": 0.0174, "step": 174680 }, { "epoch": 0.45, "learning_rate": 0.00023207674820688418, "loss": 0.0166, "step": 174690 }, { "epoch": 0.45, "learning_rate": 0.00023207285999051272, "loss": 0.0176, "step": 174700 }, { "epoch": 0.45, "learning_rate": 0.0002320689717741413, "loss": 0.0182, "step": 174710 }, { "epoch": 0.45, "learning_rate": 0.0002320650835577698, "loss": 0.0176, "step": 174720 }, { "epoch": 0.45, "learning_rate": 0.00023206119534139834, "loss": 0.0187, "step": 174730 }, { "epoch": 0.45, "learning_rate": 0.00023205730712502686, "loss": 0.0256, "step": 174740 }, { "epoch": 0.45, "learning_rate": 0.00023205341890865543, "loss": 0.0181, "step": 174750 }, { "epoch": 0.45, "learning_rate": 0.00023204953069228394, "loss": 0.0141, "step": 174760 }, { "epoch": 0.45, "learning_rate": 0.00023204564247591248, "loss": 0.0171, "step": 174770 }, { "epoch": 0.45, "learning_rate": 0.000232041754259541, "loss": 0.0195, "step": 174780 }, { "epoch": 0.45, "learning_rate": 0.00023203786604316957, "loss": 0.017, "step": 174790 }, { "epoch": 0.45, "learning_rate": 0.00023203397782679808, "loss": 0.0199, "step": 174800 }, { "epoch": 0.45, "learning_rate": 0.00023203008961042662, "loss": 0.0208, "step": 174810 }, { "epoch": 0.45, "learning_rate": 0.00023202620139405514, "loss": 0.0183, "step": 174820 }, { "epoch": 0.45, "learning_rate": 0.0002320223131776837, "loss": 0.0206, "step": 174830 }, { "epoch": 0.45, "learning_rate": 0.00023201842496131222, "loss": 0.0192, "step": 174840 }, { "epoch": 0.45, "learning_rate": 0.00023201453674494076, "loss": 0.0178, "step": 174850 }, { "epoch": 0.45, "learning_rate": 0.00023201064852856928, "loss": 0.0174, "step": 174860 }, { "epoch": 0.45, "learning_rate": 0.00023200676031219785, "loss": 0.018, "step": 174870 }, { "epoch": 0.45, "learning_rate": 0.0002320028720958264, "loss": 0.0158, "step": 174880 }, { "epoch": 0.45, "learning_rate": 0.0002319989838794549, "loss": 0.0164, "step": 174890 }, { "epoch": 0.45, "learning_rate": 0.00023199509566308344, "loss": 0.0203, "step": 174900 }, { "epoch": 0.45, "learning_rate": 0.00023199120744671198, "loss": 0.0195, "step": 174910 }, { "epoch": 0.45, "learning_rate": 0.00023198731923034053, "loss": 0.0212, "step": 174920 }, { "epoch": 0.45, "learning_rate": 0.00023198343101396904, "loss": 0.0156, "step": 174930 }, { "epoch": 0.45, "learning_rate": 0.00023197954279759758, "loss": 0.0142, "step": 174940 }, { "epoch": 0.45, "learning_rate": 0.0002319756545812261, "loss": 0.0186, "step": 174950 }, { "epoch": 0.45, "learning_rate": 0.00023197176636485467, "loss": 0.0185, "step": 174960 }, { "epoch": 0.45, "learning_rate": 0.00023196787814848318, "loss": 0.0166, "step": 174970 }, { "epoch": 0.45, "learning_rate": 0.00023196398993211172, "loss": 0.0162, "step": 174980 }, { "epoch": 0.45, "learning_rate": 0.00023196010171574024, "loss": 0.018, "step": 174990 }, { "epoch": 0.45, "learning_rate": 0.0002319562134993688, "loss": 0.019, "step": 175000 }, { "epoch": 0.45, "eval_cer": 0.8818048598193629, "eval_loss": 0.012664512731134892, "eval_runtime": 107.9478, "eval_samples_per_second": 18.527, "eval_steps_per_second": 4.632, "step": 175000 }, { "epoch": 0.45, "learning_rate": 0.00023195232528299732, "loss": 0.0157, "step": 175010 }, { "epoch": 0.45, "learning_rate": 0.00023194843706662586, "loss": 0.0172, "step": 175020 }, { "epoch": 0.45, "learning_rate": 0.00023194454885025438, "loss": 0.0217, "step": 175030 }, { "epoch": 0.45, "learning_rate": 0.00023194066063388294, "loss": 0.0169, "step": 175040 }, { "epoch": 0.45, "learning_rate": 0.00023193677241751149, "loss": 0.0177, "step": 175050 }, { "epoch": 0.45, "learning_rate": 0.00023193288420114, "loss": 0.0178, "step": 175060 }, { "epoch": 0.45, "learning_rate": 0.00023192899598476852, "loss": 0.0228, "step": 175070 }, { "epoch": 0.45, "learning_rate": 0.00023192510776839708, "loss": 0.0175, "step": 175080 }, { "epoch": 0.45, "learning_rate": 0.00023192121955202563, "loss": 0.0186, "step": 175090 }, { "epoch": 0.45, "learning_rate": 0.00023191733133565414, "loss": 0.0205, "step": 175100 }, { "epoch": 0.45, "learning_rate": 0.00023191344311928268, "loss": 0.0218, "step": 175110 }, { "epoch": 0.45, "learning_rate": 0.00023190955490291122, "loss": 0.0162, "step": 175120 }, { "epoch": 0.45, "learning_rate": 0.00023190566668653977, "loss": 0.02, "step": 175130 }, { "epoch": 0.45, "learning_rate": 0.00023190177847016828, "loss": 0.0217, "step": 175140 }, { "epoch": 0.45, "learning_rate": 0.00023189789025379682, "loss": 0.0161, "step": 175150 }, { "epoch": 0.45, "learning_rate": 0.00023189400203742536, "loss": 0.0178, "step": 175160 }, { "epoch": 0.45, "learning_rate": 0.0002318901138210539, "loss": 0.021, "step": 175170 }, { "epoch": 0.45, "learning_rate": 0.00023188622560468242, "loss": 0.0231, "step": 175180 }, { "epoch": 0.45, "learning_rate": 0.00023188233738831096, "loss": 0.017, "step": 175190 }, { "epoch": 0.45, "learning_rate": 0.00023187844917193948, "loss": 0.0187, "step": 175200 }, { "epoch": 0.45, "learning_rate": 0.00023187456095556804, "loss": 0.0165, "step": 175210 }, { "epoch": 0.45, "learning_rate": 0.00023187067273919659, "loss": 0.0158, "step": 175220 }, { "epoch": 0.45, "learning_rate": 0.0002318667845228251, "loss": 0.0172, "step": 175230 }, { "epoch": 0.45, "learning_rate": 0.00023186289630645361, "loss": 0.0166, "step": 175240 }, { "epoch": 0.45, "learning_rate": 0.00023185900809008218, "loss": 0.0196, "step": 175250 }, { "epoch": 0.45, "learning_rate": 0.00023185511987371073, "loss": 0.0217, "step": 175260 }, { "epoch": 0.45, "learning_rate": 0.00023185123165733924, "loss": 0.0163, "step": 175270 }, { "epoch": 0.45, "learning_rate": 0.00023184734344096778, "loss": 0.0219, "step": 175280 }, { "epoch": 0.45, "learning_rate": 0.00023184345522459632, "loss": 0.0164, "step": 175290 }, { "epoch": 0.45, "learning_rate": 0.00023183956700822486, "loss": 0.0207, "step": 175300 }, { "epoch": 0.45, "learning_rate": 0.00023183567879185338, "loss": 0.0198, "step": 175310 }, { "epoch": 0.45, "learning_rate": 0.00023183179057548192, "loss": 0.0166, "step": 175320 }, { "epoch": 0.45, "learning_rate": 0.00023182790235911046, "loss": 0.017, "step": 175330 }, { "epoch": 0.45, "learning_rate": 0.000231824014142739, "loss": 0.0186, "step": 175340 }, { "epoch": 0.45, "learning_rate": 0.00023182012592636752, "loss": 0.0207, "step": 175350 }, { "epoch": 0.45, "learning_rate": 0.00023181623770999606, "loss": 0.0203, "step": 175360 }, { "epoch": 0.45, "learning_rate": 0.00023181234949362463, "loss": 0.0154, "step": 175370 }, { "epoch": 0.45, "learning_rate": 0.00023180846127725314, "loss": 0.0182, "step": 175380 }, { "epoch": 0.45, "learning_rate": 0.00023180457306088166, "loss": 0.0222, "step": 175390 }, { "epoch": 0.45, "learning_rate": 0.0002318006848445102, "loss": 0.0174, "step": 175400 }, { "epoch": 0.45, "learning_rate": 0.00023179679662813877, "loss": 0.0163, "step": 175410 }, { "epoch": 0.45, "learning_rate": 0.00023179290841176728, "loss": 0.0158, "step": 175420 }, { "epoch": 0.45, "learning_rate": 0.00023178902019539582, "loss": 0.0187, "step": 175430 }, { "epoch": 0.45, "learning_rate": 0.00023178513197902434, "loss": 0.0243, "step": 175440 }, { "epoch": 0.45, "learning_rate": 0.00023178124376265288, "loss": 0.0211, "step": 175450 }, { "epoch": 0.45, "learning_rate": 0.00023177735554628142, "loss": 0.0296, "step": 175460 }, { "epoch": 0.45, "learning_rate": 0.00023177346732990996, "loss": 0.0217, "step": 175470 }, { "epoch": 0.45, "learning_rate": 0.00023176957911353848, "loss": 0.0162, "step": 175480 }, { "epoch": 0.45, "learning_rate": 0.00023176569089716702, "loss": 0.0186, "step": 175490 }, { "epoch": 0.45, "learning_rate": 0.00023176180268079556, "loss": 0.0185, "step": 175500 }, { "epoch": 0.45, "learning_rate": 0.0002317579144644241, "loss": 0.0192, "step": 175510 }, { "epoch": 0.45, "learning_rate": 0.00023175402624805262, "loss": 0.0166, "step": 175520 }, { "epoch": 0.45, "learning_rate": 0.00023175013803168116, "loss": 0.0171, "step": 175530 }, { "epoch": 0.46, "learning_rate": 0.00023174624981530973, "loss": 0.019, "step": 175540 }, { "epoch": 0.46, "learning_rate": 0.00023174236159893824, "loss": 0.0172, "step": 175550 }, { "epoch": 0.46, "learning_rate": 0.00023173847338256676, "loss": 0.0183, "step": 175560 }, { "epoch": 0.46, "learning_rate": 0.0002317345851661953, "loss": 0.0166, "step": 175570 }, { "epoch": 0.46, "learning_rate": 0.00023173069694982387, "loss": 0.0222, "step": 175580 }, { "epoch": 0.46, "learning_rate": 0.00023172680873345238, "loss": 0.017, "step": 175590 }, { "epoch": 0.46, "learning_rate": 0.00023172292051708092, "loss": 0.0174, "step": 175600 }, { "epoch": 0.46, "learning_rate": 0.00023171903230070944, "loss": 0.0212, "step": 175610 }, { "epoch": 0.46, "learning_rate": 0.000231715144084338, "loss": 0.0177, "step": 175620 }, { "epoch": 0.46, "learning_rate": 0.00023171125586796652, "loss": 0.0184, "step": 175630 }, { "epoch": 0.46, "learning_rate": 0.00023170736765159506, "loss": 0.0172, "step": 175640 }, { "epoch": 0.46, "learning_rate": 0.00023170347943522358, "loss": 0.0194, "step": 175650 }, { "epoch": 0.46, "learning_rate": 0.00023169959121885212, "loss": 0.0154, "step": 175660 }, { "epoch": 0.46, "learning_rate": 0.00023169570300248066, "loss": 0.0185, "step": 175670 }, { "epoch": 0.46, "learning_rate": 0.0002316918147861092, "loss": 0.0214, "step": 175680 }, { "epoch": 0.46, "learning_rate": 0.00023168792656973772, "loss": 0.0171, "step": 175690 }, { "epoch": 0.46, "learning_rate": 0.00023168403835336626, "loss": 0.0196, "step": 175700 }, { "epoch": 0.46, "learning_rate": 0.0002316801501369948, "loss": 0.02, "step": 175710 }, { "epoch": 0.46, "learning_rate": 0.00023167626192062334, "loss": 0.0192, "step": 175720 }, { "epoch": 0.46, "learning_rate": 0.00023167237370425186, "loss": 0.0163, "step": 175730 }, { "epoch": 0.46, "learning_rate": 0.0002316684854878804, "loss": 0.0194, "step": 175740 }, { "epoch": 0.46, "learning_rate": 0.00023166459727150897, "loss": 0.0192, "step": 175750 }, { "epoch": 0.46, "learning_rate": 0.00023166070905513748, "loss": 0.0186, "step": 175760 }, { "epoch": 0.46, "learning_rate": 0.00023165682083876602, "loss": 0.0174, "step": 175770 }, { "epoch": 0.46, "learning_rate": 0.00023165293262239454, "loss": 0.0218, "step": 175780 }, { "epoch": 0.46, "learning_rate": 0.0002316490444060231, "loss": 0.0169, "step": 175790 }, { "epoch": 0.46, "learning_rate": 0.00023164515618965162, "loss": 0.0201, "step": 175800 }, { "epoch": 0.46, "learning_rate": 0.00023164126797328016, "loss": 0.0226, "step": 175810 }, { "epoch": 0.46, "learning_rate": 0.00023163737975690868, "loss": 0.0259, "step": 175820 }, { "epoch": 0.46, "learning_rate": 0.00023163349154053725, "loss": 0.019, "step": 175830 }, { "epoch": 0.46, "learning_rate": 0.00023162960332416576, "loss": 0.023, "step": 175840 }, { "epoch": 0.46, "learning_rate": 0.0002316257151077943, "loss": 0.0178, "step": 175850 }, { "epoch": 0.46, "learning_rate": 0.00023162182689142282, "loss": 0.0238, "step": 175860 }, { "epoch": 0.46, "learning_rate": 0.00023161793867505139, "loss": 0.0181, "step": 175870 }, { "epoch": 0.46, "learning_rate": 0.0002316140504586799, "loss": 0.0177, "step": 175880 }, { "epoch": 0.46, "learning_rate": 0.00023161016224230844, "loss": 0.0169, "step": 175890 }, { "epoch": 0.46, "learning_rate": 0.00023160627402593696, "loss": 0.0159, "step": 175900 }, { "epoch": 0.46, "learning_rate": 0.0002316023858095655, "loss": 0.0234, "step": 175910 }, { "epoch": 0.46, "learning_rate": 0.00023159849759319407, "loss": 0.023, "step": 175920 }, { "epoch": 0.46, "learning_rate": 0.00023159460937682258, "loss": 0.0238, "step": 175930 }, { "epoch": 0.46, "learning_rate": 0.00023159072116045112, "loss": 0.016, "step": 175940 }, { "epoch": 0.46, "learning_rate": 0.00023158683294407964, "loss": 0.0185, "step": 175950 }, { "epoch": 0.46, "learning_rate": 0.0002315829447277082, "loss": 0.0174, "step": 175960 }, { "epoch": 0.46, "learning_rate": 0.00023157905651133672, "loss": 0.016, "step": 175970 }, { "epoch": 0.46, "learning_rate": 0.00023157516829496526, "loss": 0.0187, "step": 175980 }, { "epoch": 0.46, "learning_rate": 0.00023157128007859378, "loss": 0.0173, "step": 175990 }, { "epoch": 0.46, "learning_rate": 0.00023156739186222235, "loss": 0.0156, "step": 176000 }, { "epoch": 0.46, "eval_cer": 0.8817838652653501, "eval_loss": 0.012811483815312386, "eval_runtime": 107.6031, "eval_samples_per_second": 18.587, "eval_steps_per_second": 4.647, "step": 176000 }, { "epoch": 0.46, "learning_rate": 0.00023156350364585086, "loss": 0.0194, "step": 176010 }, { "epoch": 0.46, "learning_rate": 0.0002315596154294794, "loss": 0.0152, "step": 176020 }, { "epoch": 0.46, "learning_rate": 0.00023155572721310792, "loss": 0.0193, "step": 176030 }, { "epoch": 0.46, "learning_rate": 0.00023155183899673648, "loss": 0.0154, "step": 176040 }, { "epoch": 0.46, "learning_rate": 0.000231547950780365, "loss": 0.0254, "step": 176050 }, { "epoch": 0.46, "learning_rate": 0.00023154406256399354, "loss": 0.0169, "step": 176060 }, { "epoch": 0.46, "learning_rate": 0.00023154017434762206, "loss": 0.021, "step": 176070 }, { "epoch": 0.46, "learning_rate": 0.00023153628613125062, "loss": 0.0196, "step": 176080 }, { "epoch": 0.46, "learning_rate": 0.00023153239791487917, "loss": 0.0208, "step": 176090 }, { "epoch": 0.46, "learning_rate": 0.00023152850969850768, "loss": 0.0189, "step": 176100 }, { "epoch": 0.46, "learning_rate": 0.0002315246214821362, "loss": 0.0183, "step": 176110 }, { "epoch": 0.46, "learning_rate": 0.00023152073326576476, "loss": 0.0167, "step": 176120 }, { "epoch": 0.46, "learning_rate": 0.0002315168450493933, "loss": 0.0156, "step": 176130 }, { "epoch": 0.46, "learning_rate": 0.00023151295683302182, "loss": 0.0215, "step": 176140 }, { "epoch": 0.46, "learning_rate": 0.00023150906861665036, "loss": 0.0168, "step": 176150 }, { "epoch": 0.46, "learning_rate": 0.00023150518040027888, "loss": 0.0204, "step": 176160 }, { "epoch": 0.46, "learning_rate": 0.00023150129218390744, "loss": 0.0204, "step": 176170 }, { "epoch": 0.46, "learning_rate": 0.00023149740396753596, "loss": 0.0213, "step": 176180 }, { "epoch": 0.46, "learning_rate": 0.0002314935157511645, "loss": 0.0187, "step": 176190 }, { "epoch": 0.46, "learning_rate": 0.00023148962753479302, "loss": 0.0197, "step": 176200 }, { "epoch": 0.46, "learning_rate": 0.00023148573931842158, "loss": 0.0181, "step": 176210 }, { "epoch": 0.46, "learning_rate": 0.0002314818511020501, "loss": 0.0183, "step": 176220 }, { "epoch": 0.46, "learning_rate": 0.00023147796288567864, "loss": 0.0245, "step": 176230 }, { "epoch": 0.46, "learning_rate": 0.00023147407466930715, "loss": 0.0196, "step": 176240 }, { "epoch": 0.46, "learning_rate": 0.00023147018645293572, "loss": 0.0165, "step": 176250 }, { "epoch": 0.46, "learning_rate": 0.00023146629823656424, "loss": 0.018, "step": 176260 }, { "epoch": 0.46, "learning_rate": 0.00023146241002019278, "loss": 0.0158, "step": 176270 }, { "epoch": 0.46, "learning_rate": 0.0002314585218038213, "loss": 0.0176, "step": 176280 }, { "epoch": 0.46, "learning_rate": 0.00023145463358744986, "loss": 0.0213, "step": 176290 }, { "epoch": 0.46, "learning_rate": 0.0002314507453710784, "loss": 0.0163, "step": 176300 }, { "epoch": 0.46, "learning_rate": 0.00023144685715470692, "loss": 0.0215, "step": 176310 }, { "epoch": 0.46, "learning_rate": 0.00023144296893833546, "loss": 0.0158, "step": 176320 }, { "epoch": 0.46, "learning_rate": 0.000231439080721964, "loss": 0.0163, "step": 176330 }, { "epoch": 0.46, "learning_rate": 0.00023143519250559254, "loss": 0.0168, "step": 176340 }, { "epoch": 0.46, "learning_rate": 0.00023143130428922106, "loss": 0.0158, "step": 176350 }, { "epoch": 0.46, "learning_rate": 0.0002314274160728496, "loss": 0.0174, "step": 176360 }, { "epoch": 0.46, "learning_rate": 0.00023142352785647814, "loss": 0.0162, "step": 176370 }, { "epoch": 0.46, "learning_rate": 0.00023141963964010668, "loss": 0.0206, "step": 176380 }, { "epoch": 0.46, "learning_rate": 0.0002314157514237352, "loss": 0.0201, "step": 176390 }, { "epoch": 0.46, "learning_rate": 0.00023141186320736374, "loss": 0.0167, "step": 176400 }, { "epoch": 0.46, "learning_rate": 0.00023140797499099225, "loss": 0.0149, "step": 176410 }, { "epoch": 0.46, "learning_rate": 0.00023140408677462082, "loss": 0.0186, "step": 176420 }, { "epoch": 0.46, "learning_rate": 0.00023140019855824934, "loss": 0.0184, "step": 176430 }, { "epoch": 0.46, "learning_rate": 0.00023139631034187788, "loss": 0.0187, "step": 176440 }, { "epoch": 0.46, "learning_rate": 0.0002313924221255064, "loss": 0.019, "step": 176450 }, { "epoch": 0.46, "learning_rate": 0.00023138853390913496, "loss": 0.0169, "step": 176460 }, { "epoch": 0.46, "learning_rate": 0.0002313846456927635, "loss": 0.0177, "step": 176470 }, { "epoch": 0.46, "learning_rate": 0.00023138075747639202, "loss": 0.0149, "step": 176480 }, { "epoch": 0.46, "learning_rate": 0.00023137686926002056, "loss": 0.0204, "step": 176490 }, { "epoch": 0.46, "learning_rate": 0.0002313729810436491, "loss": 0.0144, "step": 176500 }, { "epoch": 0.46, "learning_rate": 0.00023136909282727764, "loss": 0.0195, "step": 176510 }, { "epoch": 0.46, "learning_rate": 0.00023136520461090616, "loss": 0.0251, "step": 176520 }, { "epoch": 0.46, "learning_rate": 0.0002313613163945347, "loss": 0.0276, "step": 176530 }, { "epoch": 0.46, "learning_rate": 0.00023135742817816324, "loss": 0.014, "step": 176540 }, { "epoch": 0.46, "learning_rate": 0.00023135353996179178, "loss": 0.0192, "step": 176550 }, { "epoch": 0.46, "learning_rate": 0.0002313496517454203, "loss": 0.0204, "step": 176560 }, { "epoch": 0.46, "learning_rate": 0.00023134576352904884, "loss": 0.0233, "step": 176570 }, { "epoch": 0.46, "learning_rate": 0.00023134187531267738, "loss": 0.0176, "step": 176580 }, { "epoch": 0.46, "learning_rate": 0.00023133798709630592, "loss": 0.0288, "step": 176590 }, { "epoch": 0.46, "learning_rate": 0.00023133409887993444, "loss": 0.0176, "step": 176600 }, { "epoch": 0.46, "learning_rate": 0.00023133021066356298, "loss": 0.0155, "step": 176610 }, { "epoch": 0.46, "learning_rate": 0.00023132632244719155, "loss": 0.0169, "step": 176620 }, { "epoch": 0.46, "learning_rate": 0.00023132243423082006, "loss": 0.0171, "step": 176630 }, { "epoch": 0.46, "learning_rate": 0.0002313185460144486, "loss": 0.0153, "step": 176640 }, { "epoch": 0.46, "learning_rate": 0.00023131465779807712, "loss": 0.0169, "step": 176650 }, { "epoch": 0.46, "learning_rate": 0.00023131076958170563, "loss": 0.0208, "step": 176660 }, { "epoch": 0.46, "learning_rate": 0.0002313068813653342, "loss": 0.0256, "step": 176670 }, { "epoch": 0.46, "learning_rate": 0.00023130299314896274, "loss": 0.0194, "step": 176680 }, { "epoch": 0.46, "learning_rate": 0.00023129910493259126, "loss": 0.0176, "step": 176690 }, { "epoch": 0.46, "learning_rate": 0.0002312952167162198, "loss": 0.0181, "step": 176700 }, { "epoch": 0.46, "learning_rate": 0.00023129132849984834, "loss": 0.0137, "step": 176710 }, { "epoch": 0.46, "learning_rate": 0.00023128744028347688, "loss": 0.0165, "step": 176720 }, { "epoch": 0.46, "learning_rate": 0.0002312835520671054, "loss": 0.0145, "step": 176730 }, { "epoch": 0.46, "learning_rate": 0.00023127966385073394, "loss": 0.0159, "step": 176740 }, { "epoch": 0.46, "learning_rate": 0.00023127577563436248, "loss": 0.0171, "step": 176750 }, { "epoch": 0.46, "learning_rate": 0.00023127188741799102, "loss": 0.0172, "step": 176760 }, { "epoch": 0.46, "learning_rate": 0.00023126799920161954, "loss": 0.0161, "step": 176770 }, { "epoch": 0.46, "learning_rate": 0.00023126411098524808, "loss": 0.0193, "step": 176780 }, { "epoch": 0.46, "learning_rate": 0.00023126022276887665, "loss": 0.0193, "step": 176790 }, { "epoch": 0.46, "learning_rate": 0.00023125633455250516, "loss": 0.0201, "step": 176800 }, { "epoch": 0.46, "learning_rate": 0.0002312524463361337, "loss": 0.021, "step": 176810 }, { "epoch": 0.46, "learning_rate": 0.00023124855811976222, "loss": 0.0152, "step": 176820 }, { "epoch": 0.46, "learning_rate": 0.00023124466990339079, "loss": 0.0168, "step": 176830 }, { "epoch": 0.46, "learning_rate": 0.0002312407816870193, "loss": 0.0207, "step": 176840 }, { "epoch": 0.46, "learning_rate": 0.00023123689347064784, "loss": 0.0151, "step": 176850 }, { "epoch": 0.46, "learning_rate": 0.00023123300525427636, "loss": 0.0174, "step": 176860 }, { "epoch": 0.46, "learning_rate": 0.00023122911703790493, "loss": 0.0206, "step": 176870 }, { "epoch": 0.46, "learning_rate": 0.00023122522882153344, "loss": 0.0305, "step": 176880 }, { "epoch": 0.46, "learning_rate": 0.00023122134060516198, "loss": 0.0193, "step": 176890 }, { "epoch": 0.46, "learning_rate": 0.0002312174523887905, "loss": 0.0227, "step": 176900 }, { "epoch": 0.46, "learning_rate": 0.00023121356417241904, "loss": 0.0175, "step": 176910 }, { "epoch": 0.46, "learning_rate": 0.00023120967595604758, "loss": 0.0167, "step": 176920 }, { "epoch": 0.46, "learning_rate": 0.00023120578773967612, "loss": 0.0246, "step": 176930 }, { "epoch": 0.46, "learning_rate": 0.00023120189952330464, "loss": 0.0182, "step": 176940 }, { "epoch": 0.46, "learning_rate": 0.00023119801130693318, "loss": 0.0146, "step": 176950 }, { "epoch": 0.46, "learning_rate": 0.00023119412309056175, "loss": 0.019, "step": 176960 }, { "epoch": 0.46, "learning_rate": 0.00023119023487419026, "loss": 0.0165, "step": 176970 }, { "epoch": 0.46, "learning_rate": 0.00023118634665781878, "loss": 0.0148, "step": 176980 }, { "epoch": 0.46, "learning_rate": 0.00023118245844144732, "loss": 0.018, "step": 176990 }, { "epoch": 0.46, "learning_rate": 0.00023117857022507589, "loss": 0.0189, "step": 177000 }, { "epoch": 0.46, "eval_cer": 0.8818174565517705, "eval_loss": 0.012291929684579372, "eval_runtime": 107.4295, "eval_samples_per_second": 18.617, "eval_steps_per_second": 4.654, "step": 177000 }, { "epoch": 0.46, "learning_rate": 0.0002311746820087044, "loss": 0.0188, "step": 177010 }, { "epoch": 0.46, "learning_rate": 0.00023117079379233294, "loss": 0.019, "step": 177020 }, { "epoch": 0.46, "learning_rate": 0.00023116690557596146, "loss": 0.0171, "step": 177030 }, { "epoch": 0.46, "learning_rate": 0.00023116301735959003, "loss": 0.016, "step": 177040 }, { "epoch": 0.46, "learning_rate": 0.00023115912914321854, "loss": 0.0188, "step": 177050 }, { "epoch": 0.46, "learning_rate": 0.00023115524092684708, "loss": 0.0175, "step": 177060 }, { "epoch": 0.46, "learning_rate": 0.0002311513527104756, "loss": 0.0175, "step": 177070 }, { "epoch": 0.46, "learning_rate": 0.00023114746449410416, "loss": 0.0163, "step": 177080 }, { "epoch": 0.46, "learning_rate": 0.00023114357627773268, "loss": 0.0168, "step": 177090 }, { "epoch": 0.46, "learning_rate": 0.00023113968806136122, "loss": 0.0147, "step": 177100 }, { "epoch": 0.46, "learning_rate": 0.00023113579984498974, "loss": 0.0208, "step": 177110 }, { "epoch": 0.46, "learning_rate": 0.0002311319116286183, "loss": 0.0163, "step": 177120 }, { "epoch": 0.46, "learning_rate": 0.00023112802341224682, "loss": 0.0193, "step": 177130 }, { "epoch": 0.46, "learning_rate": 0.00023112413519587536, "loss": 0.0142, "step": 177140 }, { "epoch": 0.46, "learning_rate": 0.00023112024697950387, "loss": 0.0232, "step": 177150 }, { "epoch": 0.46, "learning_rate": 0.00023111635876313242, "loss": 0.0194, "step": 177160 }, { "epoch": 0.46, "learning_rate": 0.00023111247054676099, "loss": 0.0161, "step": 177170 }, { "epoch": 0.46, "learning_rate": 0.0002311085823303895, "loss": 0.0209, "step": 177180 }, { "epoch": 0.46, "learning_rate": 0.00023110469411401804, "loss": 0.017, "step": 177190 }, { "epoch": 0.46, "learning_rate": 0.00023110080589764656, "loss": 0.016, "step": 177200 }, { "epoch": 0.46, "learning_rate": 0.00023109691768127512, "loss": 0.02, "step": 177210 }, { "epoch": 0.46, "learning_rate": 0.00023109302946490364, "loss": 0.0143, "step": 177220 }, { "epoch": 0.46, "learning_rate": 0.00023108914124853218, "loss": 0.0188, "step": 177230 }, { "epoch": 0.46, "learning_rate": 0.0002310852530321607, "loss": 0.0174, "step": 177240 }, { "epoch": 0.46, "learning_rate": 0.00023108136481578926, "loss": 0.0157, "step": 177250 }, { "epoch": 0.46, "learning_rate": 0.00023107747659941778, "loss": 0.0236, "step": 177260 }, { "epoch": 0.46, "learning_rate": 0.00023107358838304632, "loss": 0.0224, "step": 177270 }, { "epoch": 0.46, "learning_rate": 0.00023106970016667483, "loss": 0.0243, "step": 177280 }, { "epoch": 0.46, "learning_rate": 0.0002310658119503034, "loss": 0.0238, "step": 177290 }, { "epoch": 0.46, "learning_rate": 0.00023106192373393192, "loss": 0.0156, "step": 177300 }, { "epoch": 0.46, "learning_rate": 0.00023105803551756046, "loss": 0.0168, "step": 177310 }, { "epoch": 0.46, "learning_rate": 0.00023105414730118897, "loss": 0.0166, "step": 177320 }, { "epoch": 0.46, "learning_rate": 0.00023105025908481754, "loss": 0.0173, "step": 177330 }, { "epoch": 0.46, "learning_rate": 0.00023104637086844608, "loss": 0.0244, "step": 177340 }, { "epoch": 0.46, "learning_rate": 0.0002310424826520746, "loss": 0.0164, "step": 177350 }, { "epoch": 0.46, "learning_rate": 0.00023103859443570314, "loss": 0.0201, "step": 177360 }, { "epoch": 0.46, "learning_rate": 0.00023103470621933168, "loss": 0.0168, "step": 177370 }, { "epoch": 0.46, "learning_rate": 0.00023103081800296022, "loss": 0.022, "step": 177380 }, { "epoch": 0.46, "learning_rate": 0.00023102692978658874, "loss": 0.0291, "step": 177390 }, { "epoch": 0.46, "learning_rate": 0.00023102304157021728, "loss": 0.0238, "step": 177400 }, { "epoch": 0.46, "learning_rate": 0.0002310191533538458, "loss": 0.0196, "step": 177410 }, { "epoch": 0.46, "learning_rate": 0.00023101526513747436, "loss": 0.029, "step": 177420 }, { "epoch": 0.46, "learning_rate": 0.00023101137692110288, "loss": 0.027, "step": 177430 }, { "epoch": 0.46, "learning_rate": 0.00023100748870473142, "loss": 0.0157, "step": 177440 }, { "epoch": 0.46, "learning_rate": 0.00023100360048835993, "loss": 0.0147, "step": 177450 }, { "epoch": 0.46, "learning_rate": 0.0002309997122719885, "loss": 0.015, "step": 177460 }, { "epoch": 0.46, "learning_rate": 0.00023099582405561702, "loss": 0.0377, "step": 177470 }, { "epoch": 0.46, "learning_rate": 0.00023099193583924556, "loss": 0.0661, "step": 177480 }, { "epoch": 0.46, "learning_rate": 0.00023098804762287407, "loss": 0.0178, "step": 177490 }, { "epoch": 0.46, "learning_rate": 0.00023098415940650264, "loss": 0.0147, "step": 177500 }, { "epoch": 0.46, "learning_rate": 0.00023098027119013118, "loss": 0.014, "step": 177510 }, { "epoch": 0.46, "learning_rate": 0.0002309763829737597, "loss": 0.0189, "step": 177520 }, { "epoch": 0.46, "learning_rate": 0.00023097249475738824, "loss": 0.0175, "step": 177530 }, { "epoch": 0.46, "learning_rate": 0.00023096860654101678, "loss": 0.0194, "step": 177540 }, { "epoch": 0.46, "learning_rate": 0.00023096471832464532, "loss": 0.0175, "step": 177550 }, { "epoch": 0.46, "learning_rate": 0.00023096083010827384, "loss": 0.015, "step": 177560 }, { "epoch": 0.46, "learning_rate": 0.00023095694189190238, "loss": 0.0151, "step": 177570 }, { "epoch": 0.46, "learning_rate": 0.00023095305367553092, "loss": 0.0206, "step": 177580 }, { "epoch": 0.46, "learning_rate": 0.00023094916545915946, "loss": 0.0188, "step": 177590 }, { "epoch": 0.46, "learning_rate": 0.00023094527724278798, "loss": 0.0227, "step": 177600 }, { "epoch": 0.46, "learning_rate": 0.00023094138902641652, "loss": 0.0259, "step": 177610 }, { "epoch": 0.46, "learning_rate": 0.00023093750081004506, "loss": 0.0185, "step": 177620 }, { "epoch": 0.46, "learning_rate": 0.0002309336125936736, "loss": 0.02, "step": 177630 }, { "epoch": 0.46, "learning_rate": 0.00023092972437730212, "loss": 0.0212, "step": 177640 }, { "epoch": 0.46, "learning_rate": 0.00023092583616093066, "loss": 0.0175, "step": 177650 }, { "epoch": 0.46, "learning_rate": 0.00023092194794455917, "loss": 0.0176, "step": 177660 }, { "epoch": 0.46, "learning_rate": 0.00023091805972818774, "loss": 0.0188, "step": 177670 }, { "epoch": 0.46, "learning_rate": 0.00023091417151181628, "loss": 0.0175, "step": 177680 }, { "epoch": 0.46, "learning_rate": 0.0002309102832954448, "loss": 0.0167, "step": 177690 }, { "epoch": 0.46, "learning_rate": 0.0002309063950790733, "loss": 0.0149, "step": 177700 }, { "epoch": 0.46, "learning_rate": 0.00023090250686270188, "loss": 0.0167, "step": 177710 }, { "epoch": 0.46, "learning_rate": 0.00023089861864633042, "loss": 0.0154, "step": 177720 }, { "epoch": 0.46, "learning_rate": 0.00023089473042995894, "loss": 0.0165, "step": 177730 }, { "epoch": 0.46, "learning_rate": 0.00023089084221358748, "loss": 0.0153, "step": 177740 }, { "epoch": 0.46, "learning_rate": 0.00023088695399721602, "loss": 0.0181, "step": 177750 }, { "epoch": 0.46, "learning_rate": 0.00023088306578084456, "loss": 0.021, "step": 177760 }, { "epoch": 0.46, "learning_rate": 0.00023087917756447308, "loss": 0.0199, "step": 177770 }, { "epoch": 0.46, "learning_rate": 0.00023087528934810162, "loss": 0.0179, "step": 177780 }, { "epoch": 0.46, "learning_rate": 0.00023087140113173016, "loss": 0.0164, "step": 177790 }, { "epoch": 0.46, "learning_rate": 0.0002308675129153587, "loss": 0.0189, "step": 177800 }, { "epoch": 0.46, "learning_rate": 0.00023086362469898722, "loss": 0.018, "step": 177810 }, { "epoch": 0.46, "learning_rate": 0.00023085973648261576, "loss": 0.022, "step": 177820 }, { "epoch": 0.46, "learning_rate": 0.00023085584826624433, "loss": 0.0193, "step": 177830 }, { "epoch": 0.46, "learning_rate": 0.00023085196004987284, "loss": 0.0152, "step": 177840 }, { "epoch": 0.46, "learning_rate": 0.00023084807183350136, "loss": 0.0175, "step": 177850 }, { "epoch": 0.46, "learning_rate": 0.0002308441836171299, "loss": 0.0161, "step": 177860 }, { "epoch": 0.46, "learning_rate": 0.00023084029540075847, "loss": 0.018, "step": 177870 }, { "epoch": 0.46, "learning_rate": 0.00023083640718438698, "loss": 0.0157, "step": 177880 }, { "epoch": 0.46, "learning_rate": 0.00023083251896801552, "loss": 0.0174, "step": 177890 }, { "epoch": 0.46, "learning_rate": 0.00023082863075164404, "loss": 0.0158, "step": 177900 }, { "epoch": 0.46, "learning_rate": 0.00023082474253527258, "loss": 0.0157, "step": 177910 }, { "epoch": 0.46, "learning_rate": 0.00023082085431890112, "loss": 0.012, "step": 177920 }, { "epoch": 0.46, "learning_rate": 0.00023081696610252966, "loss": 0.0153, "step": 177930 }, { "epoch": 0.46, "learning_rate": 0.00023081307788615818, "loss": 0.0143, "step": 177940 }, { "epoch": 0.46, "learning_rate": 0.00023080918966978672, "loss": 0.0185, "step": 177950 }, { "epoch": 0.46, "learning_rate": 0.00023080530145341526, "loss": 0.0155, "step": 177960 }, { "epoch": 0.46, "learning_rate": 0.0002308014132370438, "loss": 0.0145, "step": 177970 }, { "epoch": 0.46, "learning_rate": 0.00023079752502067232, "loss": 0.0178, "step": 177980 }, { "epoch": 0.46, "learning_rate": 0.00023079363680430086, "loss": 0.0188, "step": 177990 }, { "epoch": 0.46, "learning_rate": 0.00023078974858792943, "loss": 0.0162, "step": 178000 }, { "epoch": 0.46, "eval_cer": 0.8817698688960084, "eval_loss": 0.012205556035041809, "eval_runtime": 108.0603, "eval_samples_per_second": 18.508, "eval_steps_per_second": 4.627, "step": 178000 }, { "epoch": 0.46, "learning_rate": 0.00023078586037155794, "loss": 0.0186, "step": 178010 }, { "epoch": 0.46, "learning_rate": 0.00023078197215518646, "loss": 0.0161, "step": 178020 }, { "epoch": 0.46, "learning_rate": 0.000230778083938815, "loss": 0.021, "step": 178030 }, { "epoch": 0.46, "learning_rate": 0.00023077419572244357, "loss": 0.0192, "step": 178040 }, { "epoch": 0.46, "learning_rate": 0.00023077030750607208, "loss": 0.0163, "step": 178050 }, { "epoch": 0.46, "learning_rate": 0.00023076641928970062, "loss": 0.0176, "step": 178060 }, { "epoch": 0.46, "learning_rate": 0.00023076253107332914, "loss": 0.018, "step": 178070 }, { "epoch": 0.46, "learning_rate": 0.0002307586428569577, "loss": 0.0179, "step": 178080 }, { "epoch": 0.46, "learning_rate": 0.00023075475464058622, "loss": 0.018, "step": 178090 }, { "epoch": 0.46, "learning_rate": 0.00023075086642421476, "loss": 0.0154, "step": 178100 }, { "epoch": 0.46, "learning_rate": 0.00023074697820784328, "loss": 0.0198, "step": 178110 }, { "epoch": 0.46, "learning_rate": 0.00023074308999147184, "loss": 0.0348, "step": 178120 }, { "epoch": 0.46, "learning_rate": 0.00023073920177510036, "loss": 0.019, "step": 178130 }, { "epoch": 0.46, "learning_rate": 0.0002307353135587289, "loss": 0.0224, "step": 178140 }, { "epoch": 0.46, "learning_rate": 0.00023073142534235742, "loss": 0.0216, "step": 178150 }, { "epoch": 0.46, "learning_rate": 0.00023072753712598596, "loss": 0.0172, "step": 178160 }, { "epoch": 0.46, "learning_rate": 0.0002307236489096145, "loss": 0.0143, "step": 178170 }, { "epoch": 0.46, "learning_rate": 0.00023071976069324304, "loss": 0.0223, "step": 178180 }, { "epoch": 0.46, "learning_rate": 0.00023071587247687155, "loss": 0.0182, "step": 178190 }, { "epoch": 0.46, "learning_rate": 0.0002307119842605001, "loss": 0.0173, "step": 178200 }, { "epoch": 0.46, "learning_rate": 0.00023070809604412867, "loss": 0.0213, "step": 178210 }, { "epoch": 0.46, "learning_rate": 0.00023070420782775718, "loss": 0.0195, "step": 178220 }, { "epoch": 0.46, "learning_rate": 0.00023070031961138572, "loss": 0.0156, "step": 178230 }, { "epoch": 0.46, "learning_rate": 0.00023069643139501424, "loss": 0.0213, "step": 178240 }, { "epoch": 0.46, "learning_rate": 0.0002306925431786428, "loss": 0.0241, "step": 178250 }, { "epoch": 0.46, "learning_rate": 0.00023068865496227132, "loss": 0.0165, "step": 178260 }, { "epoch": 0.46, "learning_rate": 0.00023068476674589986, "loss": 0.0162, "step": 178270 }, { "epoch": 0.46, "learning_rate": 0.00023068087852952838, "loss": 0.0222, "step": 178280 }, { "epoch": 0.46, "learning_rate": 0.00023067699031315694, "loss": 0.0125, "step": 178290 }, { "epoch": 0.46, "learning_rate": 0.00023067310209678546, "loss": 0.0184, "step": 178300 }, { "epoch": 0.46, "learning_rate": 0.000230669213880414, "loss": 0.0156, "step": 178310 }, { "epoch": 0.46, "learning_rate": 0.00023066532566404251, "loss": 0.0161, "step": 178320 }, { "epoch": 0.46, "learning_rate": 0.00023066143744767108, "loss": 0.0137, "step": 178330 }, { "epoch": 0.46, "learning_rate": 0.0002306575492312996, "loss": 0.0228, "step": 178340 }, { "epoch": 0.46, "learning_rate": 0.00023065366101492814, "loss": 0.0265, "step": 178350 }, { "epoch": 0.46, "learning_rate": 0.00023064977279855665, "loss": 0.0169, "step": 178360 }, { "epoch": 0.46, "learning_rate": 0.00023064588458218522, "loss": 0.0174, "step": 178370 }, { "epoch": 0.46, "learning_rate": 0.00023064199636581376, "loss": 0.0237, "step": 178380 }, { "epoch": 0.46, "learning_rate": 0.00023063810814944228, "loss": 0.015, "step": 178390 }, { "epoch": 0.46, "learning_rate": 0.00023063421993307082, "loss": 0.017, "step": 178400 }, { "epoch": 0.46, "learning_rate": 0.00023063033171669934, "loss": 0.0204, "step": 178410 }, { "epoch": 0.46, "learning_rate": 0.0002306264435003279, "loss": 0.0179, "step": 178420 }, { "epoch": 0.46, "learning_rate": 0.00023062255528395642, "loss": 0.0163, "step": 178430 }, { "epoch": 0.46, "learning_rate": 0.00023061866706758496, "loss": 0.015, "step": 178440 }, { "epoch": 0.46, "learning_rate": 0.00023061477885121347, "loss": 0.0226, "step": 178450 }, { "epoch": 0.46, "learning_rate": 0.00023061089063484204, "loss": 0.0232, "step": 178460 }, { "epoch": 0.46, "learning_rate": 0.00023060700241847056, "loss": 0.0203, "step": 178470 }, { "epoch": 0.46, "learning_rate": 0.0002306031142020991, "loss": 0.0138, "step": 178480 }, { "epoch": 0.46, "learning_rate": 0.00023059922598572761, "loss": 0.0187, "step": 178490 }, { "epoch": 0.46, "learning_rate": 0.00023059533776935618, "loss": 0.0148, "step": 178500 }, { "epoch": 0.46, "learning_rate": 0.0002305914495529847, "loss": 0.0155, "step": 178510 }, { "epoch": 0.46, "learning_rate": 0.00023058756133661324, "loss": 0.0157, "step": 178520 }, { "epoch": 0.46, "learning_rate": 0.00023058367312024175, "loss": 0.0191, "step": 178530 }, { "epoch": 0.46, "learning_rate": 0.00023057978490387032, "loss": 0.0177, "step": 178540 }, { "epoch": 0.46, "learning_rate": 0.00023057589668749886, "loss": 0.0128, "step": 178550 }, { "epoch": 0.46, "learning_rate": 0.00023057200847112738, "loss": 0.0155, "step": 178560 }, { "epoch": 0.46, "learning_rate": 0.0002305681202547559, "loss": 0.0184, "step": 178570 }, { "epoch": 0.46, "learning_rate": 0.00023056423203838446, "loss": 0.0172, "step": 178580 }, { "epoch": 0.46, "learning_rate": 0.000230560343822013, "loss": 0.0193, "step": 178590 }, { "epoch": 0.46, "learning_rate": 0.00023055645560564152, "loss": 0.0177, "step": 178600 }, { "epoch": 0.46, "learning_rate": 0.00023055256738927006, "loss": 0.0179, "step": 178610 }, { "epoch": 0.46, "learning_rate": 0.0002305486791728986, "loss": 0.0209, "step": 178620 }, { "epoch": 0.46, "learning_rate": 0.00023054479095652714, "loss": 0.0197, "step": 178630 }, { "epoch": 0.46, "learning_rate": 0.00023054090274015566, "loss": 0.0171, "step": 178640 }, { "epoch": 0.46, "learning_rate": 0.0002305370145237842, "loss": 0.0192, "step": 178650 }, { "epoch": 0.46, "learning_rate": 0.0002305331263074127, "loss": 0.0181, "step": 178660 }, { "epoch": 0.46, "learning_rate": 0.00023052923809104128, "loss": 0.0172, "step": 178670 }, { "epoch": 0.46, "learning_rate": 0.0002305253498746698, "loss": 0.0187, "step": 178680 }, { "epoch": 0.46, "learning_rate": 0.00023052146165829834, "loss": 0.0199, "step": 178690 }, { "epoch": 0.46, "learning_rate": 0.00023051757344192685, "loss": 0.0156, "step": 178700 }, { "epoch": 0.46, "learning_rate": 0.00023051368522555542, "loss": 0.0206, "step": 178710 }, { "epoch": 0.46, "learning_rate": 0.00023050979700918394, "loss": 0.0161, "step": 178720 }, { "epoch": 0.46, "learning_rate": 0.00023050590879281248, "loss": 0.0167, "step": 178730 }, { "epoch": 0.46, "learning_rate": 0.000230502020576441, "loss": 0.0187, "step": 178740 }, { "epoch": 0.46, "learning_rate": 0.00023049813236006956, "loss": 0.0207, "step": 178750 }, { "epoch": 0.46, "learning_rate": 0.0002304942441436981, "loss": 0.0168, "step": 178760 }, { "epoch": 0.46, "learning_rate": 0.00023049035592732662, "loss": 0.0234, "step": 178770 }, { "epoch": 0.46, "learning_rate": 0.00023048646771095516, "loss": 0.0169, "step": 178780 }, { "epoch": 0.46, "learning_rate": 0.0002304825794945837, "loss": 0.0163, "step": 178790 }, { "epoch": 0.46, "learning_rate": 0.00023047869127821224, "loss": 0.0151, "step": 178800 }, { "epoch": 0.46, "learning_rate": 0.00023047480306184076, "loss": 0.0164, "step": 178810 }, { "epoch": 0.46, "learning_rate": 0.0002304709148454693, "loss": 0.0136, "step": 178820 }, { "epoch": 0.46, "learning_rate": 0.00023046702662909784, "loss": 0.0201, "step": 178830 }, { "epoch": 0.46, "learning_rate": 0.00023046313841272638, "loss": 0.0149, "step": 178840 }, { "epoch": 0.46, "learning_rate": 0.0002304592501963549, "loss": 0.0172, "step": 178850 }, { "epoch": 0.46, "learning_rate": 0.00023045536197998344, "loss": 0.0168, "step": 178860 }, { "epoch": 0.46, "learning_rate": 0.000230451473763612, "loss": 0.022, "step": 178870 }, { "epoch": 0.46, "learning_rate": 0.00023044758554724052, "loss": 0.0174, "step": 178880 }, { "epoch": 0.46, "learning_rate": 0.00023044369733086904, "loss": 0.0209, "step": 178890 }, { "epoch": 0.46, "learning_rate": 0.00023043980911449758, "loss": 0.0179, "step": 178900 }, { "epoch": 0.46, "learning_rate": 0.0002304359208981261, "loss": 0.0188, "step": 178910 }, { "epoch": 0.46, "learning_rate": 0.00023043203268175466, "loss": 0.0172, "step": 178920 }, { "epoch": 0.46, "learning_rate": 0.0002304281444653832, "loss": 0.0202, "step": 178930 }, { "epoch": 0.46, "learning_rate": 0.00023042425624901172, "loss": 0.0203, "step": 178940 }, { "epoch": 0.46, "learning_rate": 0.00023042036803264026, "loss": 0.0182, "step": 178950 }, { "epoch": 0.46, "learning_rate": 0.0002304164798162688, "loss": 0.0284, "step": 178960 }, { "epoch": 0.46, "learning_rate": 0.00023041259159989734, "loss": 0.0226, "step": 178970 }, { "epoch": 0.46, "learning_rate": 0.00023040870338352586, "loss": 0.0167, "step": 178980 }, { "epoch": 0.46, "learning_rate": 0.0002304048151671544, "loss": 0.0144, "step": 178990 }, { "epoch": 0.46, "learning_rate": 0.00023040092695078294, "loss": 0.0166, "step": 179000 }, { "epoch": 0.46, "eval_cer": 0.8817880641761527, "eval_loss": 0.012226469814777374, "eval_runtime": 108.116, "eval_samples_per_second": 18.499, "eval_steps_per_second": 4.625, "step": 179000 }, { "epoch": 0.46, "learning_rate": 0.00023039703873441148, "loss": 0.0176, "step": 179010 }, { "epoch": 0.46, "learning_rate": 0.00023039315051804, "loss": 0.0151, "step": 179020 }, { "epoch": 0.46, "learning_rate": 0.00023038926230166854, "loss": 0.021, "step": 179030 }, { "epoch": 0.46, "learning_rate": 0.00023038537408529708, "loss": 0.0225, "step": 179040 }, { "epoch": 0.46, "learning_rate": 0.00023038148586892562, "loss": 0.0185, "step": 179050 }, { "epoch": 0.46, "learning_rate": 0.00023037759765255414, "loss": 0.0163, "step": 179060 }, { "epoch": 0.46, "learning_rate": 0.00023037370943618268, "loss": 0.0141, "step": 179070 }, { "epoch": 0.46, "learning_rate": 0.00023036982121981125, "loss": 0.0185, "step": 179080 }, { "epoch": 0.46, "learning_rate": 0.00023036593300343976, "loss": 0.0155, "step": 179090 }, { "epoch": 0.46, "learning_rate": 0.0002303620447870683, "loss": 0.0151, "step": 179100 }, { "epoch": 0.46, "learning_rate": 0.00023035815657069682, "loss": 0.0149, "step": 179110 }, { "epoch": 0.46, "learning_rate": 0.00023035426835432538, "loss": 0.0195, "step": 179120 }, { "epoch": 0.46, "learning_rate": 0.0002303503801379539, "loss": 0.0186, "step": 179130 }, { "epoch": 0.46, "learning_rate": 0.00023034649192158244, "loss": 0.0196, "step": 179140 }, { "epoch": 0.46, "learning_rate": 0.00023034260370521096, "loss": 0.0166, "step": 179150 }, { "epoch": 0.46, "learning_rate": 0.0002303387154888395, "loss": 0.019, "step": 179160 }, { "epoch": 0.46, "learning_rate": 0.00023033482727246804, "loss": 0.0222, "step": 179170 }, { "epoch": 0.46, "learning_rate": 0.00023033093905609658, "loss": 0.0189, "step": 179180 }, { "epoch": 0.46, "learning_rate": 0.0002303270508397251, "loss": 0.0173, "step": 179190 }, { "epoch": 0.46, "learning_rate": 0.00023032316262335364, "loss": 0.0197, "step": 179200 }, { "epoch": 0.46, "learning_rate": 0.00023031927440698218, "loss": 0.0209, "step": 179210 }, { "epoch": 0.46, "learning_rate": 0.00023031538619061072, "loss": 0.0207, "step": 179220 }, { "epoch": 0.46, "learning_rate": 0.00023031149797423923, "loss": 0.0193, "step": 179230 }, { "epoch": 0.46, "learning_rate": 0.00023030760975786778, "loss": 0.0139, "step": 179240 }, { "epoch": 0.46, "learning_rate": 0.00023030372154149634, "loss": 0.02, "step": 179250 }, { "epoch": 0.46, "learning_rate": 0.00023029983332512486, "loss": 0.0165, "step": 179260 }, { "epoch": 0.46, "learning_rate": 0.0002302959451087534, "loss": 0.018, "step": 179270 }, { "epoch": 0.46, "learning_rate": 0.00023029205689238192, "loss": 0.0149, "step": 179280 }, { "epoch": 0.46, "learning_rate": 0.00023028816867601048, "loss": 0.0134, "step": 179290 }, { "epoch": 0.46, "learning_rate": 0.000230284280459639, "loss": 0.0178, "step": 179300 }, { "epoch": 0.46, "learning_rate": 0.00023028039224326754, "loss": 0.0158, "step": 179310 }, { "epoch": 0.46, "learning_rate": 0.00023027650402689605, "loss": 0.0164, "step": 179320 }, { "epoch": 0.46, "learning_rate": 0.00023027261581052462, "loss": 0.021, "step": 179330 }, { "epoch": 0.46, "learning_rate": 0.00023026872759415314, "loss": 0.0153, "step": 179340 }, { "epoch": 0.46, "learning_rate": 0.00023026483937778168, "loss": 0.0206, "step": 179350 }, { "epoch": 0.46, "learning_rate": 0.0002302609511614102, "loss": 0.0175, "step": 179360 }, { "epoch": 0.46, "learning_rate": 0.00023025706294503876, "loss": 0.0168, "step": 179370 }, { "epoch": 0.46, "learning_rate": 0.00023025317472866728, "loss": 0.0231, "step": 179380 }, { "epoch": 0.47, "learning_rate": 0.00023024928651229582, "loss": 0.0155, "step": 179390 }, { "epoch": 0.47, "learning_rate": 0.00023024539829592433, "loss": 0.0149, "step": 179400 }, { "epoch": 0.47, "learning_rate": 0.00023024151007955288, "loss": 0.0138, "step": 179410 }, { "epoch": 0.47, "learning_rate": 0.00023023762186318144, "loss": 0.0166, "step": 179420 }, { "epoch": 0.47, "learning_rate": 0.00023023373364680996, "loss": 0.0213, "step": 179430 }, { "epoch": 0.47, "learning_rate": 0.00023022984543043847, "loss": 0.0194, "step": 179440 }, { "epoch": 0.47, "learning_rate": 0.00023022595721406701, "loss": 0.0174, "step": 179450 }, { "epoch": 0.47, "learning_rate": 0.00023022206899769558, "loss": 0.0183, "step": 179460 }, { "epoch": 0.47, "learning_rate": 0.0002302181807813241, "loss": 0.0178, "step": 179470 }, { "epoch": 0.47, "learning_rate": 0.00023021429256495264, "loss": 0.0156, "step": 179480 }, { "epoch": 0.47, "learning_rate": 0.00023021040434858115, "loss": 0.0175, "step": 179490 }, { "epoch": 0.47, "learning_rate": 0.00023020651613220972, "loss": 0.0212, "step": 179500 }, { "epoch": 0.47, "learning_rate": 0.00023020262791583824, "loss": 0.017, "step": 179510 }, { "epoch": 0.47, "learning_rate": 0.00023019873969946678, "loss": 0.0177, "step": 179520 }, { "epoch": 0.47, "learning_rate": 0.0002301948514830953, "loss": 0.0193, "step": 179530 }, { "epoch": 0.47, "learning_rate": 0.00023019096326672386, "loss": 0.0166, "step": 179540 }, { "epoch": 0.47, "learning_rate": 0.00023018707505035238, "loss": 0.0182, "step": 179550 }, { "epoch": 0.47, "learning_rate": 0.00023018318683398092, "loss": 0.0203, "step": 179560 }, { "epoch": 0.47, "learning_rate": 0.00023017929861760943, "loss": 0.0155, "step": 179570 }, { "epoch": 0.47, "learning_rate": 0.000230175410401238, "loss": 0.0186, "step": 179580 }, { "epoch": 0.47, "learning_rate": 0.00023017152218486654, "loss": 0.0168, "step": 179590 }, { "epoch": 0.47, "learning_rate": 0.00023016763396849506, "loss": 0.0186, "step": 179600 }, { "epoch": 0.47, "learning_rate": 0.00023016374575212357, "loss": 0.0195, "step": 179610 }, { "epoch": 0.47, "learning_rate": 0.00023015985753575214, "loss": 0.0196, "step": 179620 }, { "epoch": 0.47, "learning_rate": 0.00023015596931938068, "loss": 0.0212, "step": 179630 }, { "epoch": 0.47, "learning_rate": 0.0002301520811030092, "loss": 0.0136, "step": 179640 }, { "epoch": 0.47, "learning_rate": 0.00023014819288663774, "loss": 0.0197, "step": 179650 }, { "epoch": 0.47, "learning_rate": 0.00023014430467026625, "loss": 0.0141, "step": 179660 }, { "epoch": 0.47, "learning_rate": 0.00023014041645389482, "loss": 0.0187, "step": 179670 }, { "epoch": 0.47, "learning_rate": 0.00023013652823752334, "loss": 0.0141, "step": 179680 }, { "epoch": 0.47, "learning_rate": 0.00023013264002115188, "loss": 0.0209, "step": 179690 }, { "epoch": 0.47, "learning_rate": 0.0002301287518047804, "loss": 0.0221, "step": 179700 }, { "epoch": 0.47, "learning_rate": 0.00023012486358840896, "loss": 0.0166, "step": 179710 }, { "epoch": 0.47, "learning_rate": 0.00023012097537203748, "loss": 0.0177, "step": 179720 }, { "epoch": 0.47, "learning_rate": 0.00023011708715566602, "loss": 0.0195, "step": 179730 }, { "epoch": 0.47, "learning_rate": 0.00023011319893929453, "loss": 0.0176, "step": 179740 }, { "epoch": 0.47, "learning_rate": 0.0002301093107229231, "loss": 0.0188, "step": 179750 }, { "epoch": 0.47, "learning_rate": 0.00023010542250655162, "loss": 0.0225, "step": 179760 }, { "epoch": 0.47, "learning_rate": 0.00023010153429018016, "loss": 0.0221, "step": 179770 }, { "epoch": 0.47, "learning_rate": 0.00023009764607380867, "loss": 0.0183, "step": 179780 }, { "epoch": 0.47, "learning_rate": 0.00023009375785743724, "loss": 0.0176, "step": 179790 }, { "epoch": 0.47, "learning_rate": 0.00023008986964106578, "loss": 0.0215, "step": 179800 }, { "epoch": 0.47, "learning_rate": 0.0002300859814246943, "loss": 0.0224, "step": 179810 }, { "epoch": 0.47, "learning_rate": 0.00023008209320832284, "loss": 0.0189, "step": 179820 }, { "epoch": 0.47, "learning_rate": 0.00023007820499195138, "loss": 0.0172, "step": 179830 }, { "epoch": 0.47, "learning_rate": 0.00023007431677557992, "loss": 0.0181, "step": 179840 }, { "epoch": 0.47, "learning_rate": 0.00023007042855920844, "loss": 0.0143, "step": 179850 }, { "epoch": 0.47, "learning_rate": 0.00023006654034283698, "loss": 0.0141, "step": 179860 }, { "epoch": 0.47, "learning_rate": 0.00023006265212646552, "loss": 0.0173, "step": 179870 }, { "epoch": 0.47, "learning_rate": 0.00023005876391009406, "loss": 0.0183, "step": 179880 }, { "epoch": 0.47, "learning_rate": 0.00023005487569372258, "loss": 0.0153, "step": 179890 }, { "epoch": 0.47, "learning_rate": 0.00023005098747735112, "loss": 0.0153, "step": 179900 }, { "epoch": 0.47, "learning_rate": 0.00023004709926097963, "loss": 0.0174, "step": 179910 }, { "epoch": 0.47, "learning_rate": 0.0002300432110446082, "loss": 0.0193, "step": 179920 }, { "epoch": 0.47, "learning_rate": 0.00023003932282823672, "loss": 0.0169, "step": 179930 }, { "epoch": 0.47, "learning_rate": 0.00023003543461186526, "loss": 0.0147, "step": 179940 }, { "epoch": 0.47, "learning_rate": 0.00023003154639549377, "loss": 0.0146, "step": 179950 }, { "epoch": 0.47, "learning_rate": 0.00023002765817912234, "loss": 0.0161, "step": 179960 }, { "epoch": 0.47, "learning_rate": 0.00023002376996275088, "loss": 0.0184, "step": 179970 }, { "epoch": 0.47, "learning_rate": 0.0002300198817463794, "loss": 0.0213, "step": 179980 }, { "epoch": 0.47, "learning_rate": 0.00023001599353000794, "loss": 0.0198, "step": 179990 }, { "epoch": 0.47, "learning_rate": 0.00023001210531363648, "loss": 0.0192, "step": 180000 }, { "epoch": 0.47, "eval_cer": 0.881821655462573, "eval_loss": 0.012280810624361038, "eval_runtime": 108.0099, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 180000 }, { "epoch": 0.47, "learning_rate": 0.00023000821709726502, "loss": 0.0165, "step": 180010 }, { "epoch": 0.47, "learning_rate": 0.00023000432888089354, "loss": 0.0186, "step": 180020 }, { "epoch": 0.47, "learning_rate": 0.00023000044066452208, "loss": 0.0208, "step": 180030 }, { "epoch": 0.47, "learning_rate": 0.00022999655244815062, "loss": 0.0213, "step": 180040 }, { "epoch": 0.47, "learning_rate": 0.00022999266423177916, "loss": 0.0197, "step": 180050 }, { "epoch": 0.47, "learning_rate": 0.00022998877601540768, "loss": 0.0195, "step": 180060 }, { "epoch": 0.47, "learning_rate": 0.00022998488779903622, "loss": 0.0176, "step": 180070 }, { "epoch": 0.47, "learning_rate": 0.00022998099958266476, "loss": 0.0195, "step": 180080 }, { "epoch": 0.47, "learning_rate": 0.0002299771113662933, "loss": 0.0199, "step": 180090 }, { "epoch": 0.47, "learning_rate": 0.00022997322314992181, "loss": 0.0144, "step": 180100 }, { "epoch": 0.47, "learning_rate": 0.00022996933493355036, "loss": 0.0158, "step": 180110 }, { "epoch": 0.47, "learning_rate": 0.00022996544671717893, "loss": 0.0175, "step": 180120 }, { "epoch": 0.47, "learning_rate": 0.00022996155850080744, "loss": 0.0186, "step": 180130 }, { "epoch": 0.47, "learning_rate": 0.00022995767028443598, "loss": 0.0203, "step": 180140 }, { "epoch": 0.47, "learning_rate": 0.0002299537820680645, "loss": 0.0167, "step": 180150 }, { "epoch": 0.47, "learning_rate": 0.000229949893851693, "loss": 0.018, "step": 180160 }, { "epoch": 0.47, "learning_rate": 0.00022994600563532158, "loss": 0.0169, "step": 180170 }, { "epoch": 0.47, "learning_rate": 0.00022994211741895012, "loss": 0.0217, "step": 180180 }, { "epoch": 0.47, "learning_rate": 0.00022993822920257864, "loss": 0.0166, "step": 180190 }, { "epoch": 0.47, "learning_rate": 0.00022993434098620718, "loss": 0.018, "step": 180200 }, { "epoch": 0.47, "learning_rate": 0.00022993045276983572, "loss": 0.0148, "step": 180210 }, { "epoch": 0.47, "learning_rate": 0.00022992656455346426, "loss": 0.016, "step": 180220 }, { "epoch": 0.47, "learning_rate": 0.00022992267633709277, "loss": 0.0169, "step": 180230 }, { "epoch": 0.47, "learning_rate": 0.00022991878812072132, "loss": 0.0167, "step": 180240 }, { "epoch": 0.47, "learning_rate": 0.00022991489990434986, "loss": 0.0179, "step": 180250 }, { "epoch": 0.47, "learning_rate": 0.0002299110116879784, "loss": 0.0163, "step": 180260 }, { "epoch": 0.47, "learning_rate": 0.00022990712347160691, "loss": 0.0177, "step": 180270 }, { "epoch": 0.47, "learning_rate": 0.00022990323525523546, "loss": 0.0167, "step": 180280 }, { "epoch": 0.47, "learning_rate": 0.00022989934703886402, "loss": 0.0173, "step": 180290 }, { "epoch": 0.47, "learning_rate": 0.00022989545882249254, "loss": 0.0237, "step": 180300 }, { "epoch": 0.47, "learning_rate": 0.00022989157060612105, "loss": 0.0175, "step": 180310 }, { "epoch": 0.47, "learning_rate": 0.0002298876823897496, "loss": 0.0195, "step": 180320 }, { "epoch": 0.47, "learning_rate": 0.00022988379417337816, "loss": 0.0191, "step": 180330 }, { "epoch": 0.47, "learning_rate": 0.00022987990595700668, "loss": 0.0174, "step": 180340 }, { "epoch": 0.47, "learning_rate": 0.00022987601774063522, "loss": 0.0159, "step": 180350 }, { "epoch": 0.47, "learning_rate": 0.00022987212952426373, "loss": 0.0174, "step": 180360 }, { "epoch": 0.47, "learning_rate": 0.0002298682413078923, "loss": 0.0166, "step": 180370 }, { "epoch": 0.47, "learning_rate": 0.00022986435309152082, "loss": 0.0183, "step": 180380 }, { "epoch": 0.47, "learning_rate": 0.00022986046487514936, "loss": 0.0182, "step": 180390 }, { "epoch": 0.47, "learning_rate": 0.00022985657665877787, "loss": 0.0178, "step": 180400 }, { "epoch": 0.47, "learning_rate": 0.00022985268844240642, "loss": 0.0183, "step": 180410 }, { "epoch": 0.47, "learning_rate": 0.00022984880022603496, "loss": 0.019, "step": 180420 }, { "epoch": 0.47, "learning_rate": 0.0002298449120096635, "loss": 0.0168, "step": 180430 }, { "epoch": 0.47, "learning_rate": 0.00022984102379329201, "loss": 0.018, "step": 180440 }, { "epoch": 0.47, "learning_rate": 0.00022983713557692056, "loss": 0.0181, "step": 180450 }, { "epoch": 0.47, "learning_rate": 0.00022983324736054912, "loss": 0.0195, "step": 180460 }, { "epoch": 0.47, "learning_rate": 0.00022982935914417764, "loss": 0.0163, "step": 180470 }, { "epoch": 0.47, "learning_rate": 0.00022982547092780615, "loss": 0.0173, "step": 180480 }, { "epoch": 0.47, "learning_rate": 0.0002298215827114347, "loss": 0.0179, "step": 180490 }, { "epoch": 0.47, "learning_rate": 0.00022981769449506326, "loss": 0.0207, "step": 180500 }, { "epoch": 0.47, "learning_rate": 0.00022981380627869178, "loss": 0.0189, "step": 180510 }, { "epoch": 0.47, "learning_rate": 0.00022980991806232032, "loss": 0.0218, "step": 180520 }, { "epoch": 0.47, "learning_rate": 0.00022980602984594883, "loss": 0.0193, "step": 180530 }, { "epoch": 0.47, "learning_rate": 0.0002298021416295774, "loss": 0.0193, "step": 180540 }, { "epoch": 0.47, "learning_rate": 0.00022979825341320592, "loss": 0.0199, "step": 180550 }, { "epoch": 0.47, "learning_rate": 0.00022979436519683446, "loss": 0.0225, "step": 180560 }, { "epoch": 0.47, "learning_rate": 0.00022979047698046297, "loss": 0.0231, "step": 180570 }, { "epoch": 0.47, "learning_rate": 0.00022978658876409154, "loss": 0.0154, "step": 180580 }, { "epoch": 0.47, "learning_rate": 0.00022978270054772006, "loss": 0.0166, "step": 180590 }, { "epoch": 0.47, "learning_rate": 0.0002297788123313486, "loss": 0.0203, "step": 180600 }, { "epoch": 0.47, "learning_rate": 0.0002297749241149771, "loss": 0.0172, "step": 180610 }, { "epoch": 0.47, "learning_rate": 0.00022977103589860568, "loss": 0.019, "step": 180620 }, { "epoch": 0.47, "learning_rate": 0.0002297671476822342, "loss": 0.0181, "step": 180630 }, { "epoch": 0.47, "learning_rate": 0.00022976325946586274, "loss": 0.0166, "step": 180640 }, { "epoch": 0.47, "learning_rate": 0.00022975937124949125, "loss": 0.0162, "step": 180650 }, { "epoch": 0.47, "learning_rate": 0.0002297554830331198, "loss": 0.0193, "step": 180660 }, { "epoch": 0.47, "learning_rate": 0.00022975159481674836, "loss": 0.0182, "step": 180670 }, { "epoch": 0.47, "learning_rate": 0.00022974770660037688, "loss": 0.0207, "step": 180680 }, { "epoch": 0.47, "learning_rate": 0.00022974381838400542, "loss": 0.0158, "step": 180690 }, { "epoch": 0.47, "learning_rate": 0.00022973993016763393, "loss": 0.0162, "step": 180700 }, { "epoch": 0.47, "learning_rate": 0.0002297360419512625, "loss": 0.0204, "step": 180710 }, { "epoch": 0.47, "learning_rate": 0.00022973215373489102, "loss": 0.0172, "step": 180720 }, { "epoch": 0.47, "learning_rate": 0.00022972826551851956, "loss": 0.0257, "step": 180730 }, { "epoch": 0.47, "learning_rate": 0.00022972437730214807, "loss": 0.0185, "step": 180740 }, { "epoch": 0.47, "learning_rate": 0.00022972048908577664, "loss": 0.0172, "step": 180750 }, { "epoch": 0.47, "learning_rate": 0.00022971660086940516, "loss": 0.0214, "step": 180760 }, { "epoch": 0.47, "learning_rate": 0.0002297127126530337, "loss": 0.02, "step": 180770 }, { "epoch": 0.47, "learning_rate": 0.0002297088244366622, "loss": 0.0184, "step": 180780 }, { "epoch": 0.47, "learning_rate": 0.00022970493622029078, "loss": 0.0206, "step": 180790 }, { "epoch": 0.47, "learning_rate": 0.0002297010480039193, "loss": 0.0179, "step": 180800 }, { "epoch": 0.47, "learning_rate": 0.00022969715978754784, "loss": 0.0173, "step": 180810 }, { "epoch": 0.47, "learning_rate": 0.00022969327157117635, "loss": 0.0186, "step": 180820 }, { "epoch": 0.47, "learning_rate": 0.00022968938335480492, "loss": 0.018, "step": 180830 }, { "epoch": 0.47, "learning_rate": 0.00022968549513843346, "loss": 0.0158, "step": 180840 }, { "epoch": 0.47, "learning_rate": 0.00022968160692206198, "loss": 0.019, "step": 180850 }, { "epoch": 0.47, "learning_rate": 0.00022967771870569052, "loss": 0.0206, "step": 180860 }, { "epoch": 0.47, "learning_rate": 0.00022967383048931903, "loss": 0.0214, "step": 180870 }, { "epoch": 0.47, "learning_rate": 0.0002296699422729476, "loss": 0.0155, "step": 180880 }, { "epoch": 0.47, "learning_rate": 0.00022966605405657612, "loss": 0.0221, "step": 180890 }, { "epoch": 0.47, "learning_rate": 0.00022966216584020466, "loss": 0.0189, "step": 180900 }, { "epoch": 0.47, "learning_rate": 0.00022965827762383317, "loss": 0.0156, "step": 180910 }, { "epoch": 0.47, "learning_rate": 0.00022965438940746174, "loss": 0.0173, "step": 180920 }, { "epoch": 0.47, "learning_rate": 0.00022965050119109026, "loss": 0.0162, "step": 180930 }, { "epoch": 0.47, "learning_rate": 0.0002296466129747188, "loss": 0.0203, "step": 180940 }, { "epoch": 0.47, "learning_rate": 0.0002296427247583473, "loss": 0.0179, "step": 180950 }, { "epoch": 0.47, "learning_rate": 0.00022963883654197588, "loss": 0.0212, "step": 180960 }, { "epoch": 0.47, "learning_rate": 0.0002296349483256044, "loss": 0.0187, "step": 180970 }, { "epoch": 0.47, "learning_rate": 0.00022963106010923294, "loss": 0.0162, "step": 180980 }, { "epoch": 0.47, "learning_rate": 0.00022962717189286145, "loss": 0.0156, "step": 180990 }, { "epoch": 0.47, "learning_rate": 0.00022962328367649002, "loss": 0.025, "step": 181000 }, { "epoch": 0.47, "eval_cer": 0.881782465628416, "eval_loss": 0.012816259637475014, "eval_runtime": 107.9694, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 181000 }, { "epoch": 0.47, "learning_rate": 0.00022961939546011856, "loss": 0.018, "step": 181010 }, { "epoch": 0.47, "learning_rate": 0.00022961550724374708, "loss": 0.0241, "step": 181020 }, { "epoch": 0.47, "learning_rate": 0.0002296116190273756, "loss": 0.0196, "step": 181030 }, { "epoch": 0.47, "learning_rate": 0.00022960773081100416, "loss": 0.0194, "step": 181040 }, { "epoch": 0.47, "learning_rate": 0.0002296038425946327, "loss": 0.0173, "step": 181050 }, { "epoch": 0.47, "learning_rate": 0.00022959995437826122, "loss": 0.0203, "step": 181060 }, { "epoch": 0.47, "learning_rate": 0.00022959606616188976, "loss": 0.0193, "step": 181070 }, { "epoch": 0.47, "learning_rate": 0.0002295921779455183, "loss": 0.0178, "step": 181080 }, { "epoch": 0.47, "learning_rate": 0.00022958828972914684, "loss": 0.0145, "step": 181090 }, { "epoch": 0.47, "learning_rate": 0.00022958440151277536, "loss": 0.0201, "step": 181100 }, { "epoch": 0.47, "learning_rate": 0.0002295805132964039, "loss": 0.0185, "step": 181110 }, { "epoch": 0.47, "learning_rate": 0.0002295766250800324, "loss": 0.0237, "step": 181120 }, { "epoch": 0.47, "learning_rate": 0.00022957273686366098, "loss": 0.0197, "step": 181130 }, { "epoch": 0.47, "learning_rate": 0.0002295688486472895, "loss": 0.0172, "step": 181140 }, { "epoch": 0.47, "learning_rate": 0.00022956496043091804, "loss": 0.0174, "step": 181150 }, { "epoch": 0.47, "learning_rate": 0.00022956107221454655, "loss": 0.0147, "step": 181160 }, { "epoch": 0.47, "learning_rate": 0.00022955718399817512, "loss": 0.0202, "step": 181170 }, { "epoch": 0.47, "learning_rate": 0.00022955329578180366, "loss": 0.0177, "step": 181180 }, { "epoch": 0.47, "learning_rate": 0.00022954940756543218, "loss": 0.0153, "step": 181190 }, { "epoch": 0.47, "learning_rate": 0.0002295455193490607, "loss": 0.0192, "step": 181200 }, { "epoch": 0.47, "learning_rate": 0.00022954163113268926, "loss": 0.0227, "step": 181210 }, { "epoch": 0.47, "learning_rate": 0.0002295377429163178, "loss": 0.0203, "step": 181220 }, { "epoch": 0.47, "learning_rate": 0.00022953385469994632, "loss": 0.0187, "step": 181230 }, { "epoch": 0.47, "learning_rate": 0.00022952996648357486, "loss": 0.0194, "step": 181240 }, { "epoch": 0.47, "learning_rate": 0.0002295260782672034, "loss": 0.0235, "step": 181250 }, { "epoch": 0.47, "learning_rate": 0.00022952219005083194, "loss": 0.014, "step": 181260 }, { "epoch": 0.47, "learning_rate": 0.00022951830183446045, "loss": 0.017, "step": 181270 }, { "epoch": 0.47, "learning_rate": 0.000229514413618089, "loss": 0.0171, "step": 181280 }, { "epoch": 0.47, "learning_rate": 0.00022951052540171754, "loss": 0.017, "step": 181290 }, { "epoch": 0.47, "learning_rate": 0.00022950663718534608, "loss": 0.0158, "step": 181300 }, { "epoch": 0.47, "learning_rate": 0.0002295027489689746, "loss": 0.0194, "step": 181310 }, { "epoch": 0.47, "learning_rate": 0.00022949886075260314, "loss": 0.0164, "step": 181320 }, { "epoch": 0.47, "learning_rate": 0.0002294949725362317, "loss": 0.02, "step": 181330 }, { "epoch": 0.47, "learning_rate": 0.00022949108431986022, "loss": 0.0224, "step": 181340 }, { "epoch": 0.47, "learning_rate": 0.00022948719610348873, "loss": 0.0163, "step": 181350 }, { "epoch": 0.47, "learning_rate": 0.00022948330788711728, "loss": 0.019, "step": 181360 }, { "epoch": 0.47, "learning_rate": 0.0002294794196707458, "loss": 0.0125, "step": 181370 }, { "epoch": 0.47, "learning_rate": 0.00022947553145437436, "loss": 0.0208, "step": 181380 }, { "epoch": 0.47, "learning_rate": 0.0002294716432380029, "loss": 0.0167, "step": 181390 }, { "epoch": 0.47, "learning_rate": 0.00022946775502163141, "loss": 0.0155, "step": 181400 }, { "epoch": 0.47, "learning_rate": 0.00022946386680525996, "loss": 0.0178, "step": 181410 }, { "epoch": 0.47, "learning_rate": 0.0002294599785888885, "loss": 0.0177, "step": 181420 }, { "epoch": 0.47, "learning_rate": 0.00022945609037251704, "loss": 0.0159, "step": 181430 }, { "epoch": 0.47, "learning_rate": 0.00022945220215614555, "loss": 0.0223, "step": 181440 }, { "epoch": 0.47, "learning_rate": 0.0002294483139397741, "loss": 0.0148, "step": 181450 }, { "epoch": 0.47, "learning_rate": 0.00022944442572340264, "loss": 0.0259, "step": 181460 }, { "epoch": 0.47, "learning_rate": 0.00022944053750703118, "loss": 0.0211, "step": 181470 }, { "epoch": 0.47, "learning_rate": 0.0002294366492906597, "loss": 0.0227, "step": 181480 }, { "epoch": 0.47, "learning_rate": 0.00022943276107428824, "loss": 0.0206, "step": 181490 }, { "epoch": 0.47, "learning_rate": 0.00022942887285791678, "loss": 0.017, "step": 181500 }, { "epoch": 0.47, "learning_rate": 0.00022942498464154532, "loss": 0.0145, "step": 181510 }, { "epoch": 0.47, "learning_rate": 0.00022942109642517383, "loss": 0.016, "step": 181520 }, { "epoch": 0.47, "learning_rate": 0.00022941720820880237, "loss": 0.018, "step": 181530 }, { "epoch": 0.47, "learning_rate": 0.00022941331999243094, "loss": 0.0173, "step": 181540 }, { "epoch": 0.47, "learning_rate": 0.00022940943177605946, "loss": 0.0168, "step": 181550 }, { "epoch": 0.47, "learning_rate": 0.000229405543559688, "loss": 0.0179, "step": 181560 }, { "epoch": 0.47, "learning_rate": 0.00022940165534331651, "loss": 0.0163, "step": 181570 }, { "epoch": 0.47, "learning_rate": 0.00022939776712694508, "loss": 0.0174, "step": 181580 }, { "epoch": 0.47, "learning_rate": 0.0002293938789105736, "loss": 0.0177, "step": 181590 }, { "epoch": 0.47, "learning_rate": 0.00022938999069420214, "loss": 0.0153, "step": 181600 }, { "epoch": 0.47, "learning_rate": 0.00022938610247783065, "loss": 0.0201, "step": 181610 }, { "epoch": 0.47, "learning_rate": 0.0002293822142614592, "loss": 0.0159, "step": 181620 }, { "epoch": 0.47, "learning_rate": 0.00022937832604508774, "loss": 0.0178, "step": 181630 }, { "epoch": 0.47, "learning_rate": 0.00022937443782871628, "loss": 0.016, "step": 181640 }, { "epoch": 0.47, "learning_rate": 0.0002293705496123448, "loss": 0.0158, "step": 181650 }, { "epoch": 0.47, "learning_rate": 0.00022936666139597333, "loss": 0.0182, "step": 181660 }, { "epoch": 0.47, "learning_rate": 0.00022936277317960188, "loss": 0.0217, "step": 181670 }, { "epoch": 0.47, "learning_rate": 0.00022935888496323042, "loss": 0.0231, "step": 181680 }, { "epoch": 0.47, "learning_rate": 0.00022935499674685893, "loss": 0.0179, "step": 181690 }, { "epoch": 0.47, "learning_rate": 0.00022935110853048747, "loss": 0.0196, "step": 181700 }, { "epoch": 0.47, "learning_rate": 0.00022934722031411604, "loss": 0.0159, "step": 181710 }, { "epoch": 0.47, "learning_rate": 0.00022934333209774456, "loss": 0.0153, "step": 181720 }, { "epoch": 0.47, "learning_rate": 0.0002293394438813731, "loss": 0.0185, "step": 181730 }, { "epoch": 0.47, "learning_rate": 0.0002293355556650016, "loss": 0.018, "step": 181740 }, { "epoch": 0.47, "learning_rate": 0.00022933166744863018, "loss": 0.0176, "step": 181750 }, { "epoch": 0.47, "learning_rate": 0.0002293277792322587, "loss": 0.0241, "step": 181760 }, { "epoch": 0.47, "learning_rate": 0.00022932389101588724, "loss": 0.0181, "step": 181770 }, { "epoch": 0.47, "learning_rate": 0.00022932000279951575, "loss": 0.0191, "step": 181780 }, { "epoch": 0.47, "learning_rate": 0.00022931611458314432, "loss": 0.0169, "step": 181790 }, { "epoch": 0.47, "learning_rate": 0.00022931222636677284, "loss": 0.0182, "step": 181800 }, { "epoch": 0.47, "learning_rate": 0.00022930833815040138, "loss": 0.0137, "step": 181810 }, { "epoch": 0.47, "learning_rate": 0.0002293044499340299, "loss": 0.0223, "step": 181820 }, { "epoch": 0.47, "learning_rate": 0.00022930056171765846, "loss": 0.0169, "step": 181830 }, { "epoch": 0.47, "learning_rate": 0.00022929667350128698, "loss": 0.0195, "step": 181840 }, { "epoch": 0.47, "learning_rate": 0.00022929278528491552, "loss": 0.0164, "step": 181850 }, { "epoch": 0.47, "learning_rate": 0.00022928889706854403, "loss": 0.02, "step": 181860 }, { "epoch": 0.47, "learning_rate": 0.00022928500885217257, "loss": 0.0197, "step": 181870 }, { "epoch": 0.47, "learning_rate": 0.00022928112063580114, "loss": 0.0224, "step": 181880 }, { "epoch": 0.47, "learning_rate": 0.00022927723241942966, "loss": 0.0188, "step": 181890 }, { "epoch": 0.47, "learning_rate": 0.00022927334420305817, "loss": 0.018, "step": 181900 }, { "epoch": 0.47, "learning_rate": 0.0002292694559866867, "loss": 0.0189, "step": 181910 }, { "epoch": 0.47, "learning_rate": 0.00022926556777031528, "loss": 0.0193, "step": 181920 }, { "epoch": 0.47, "learning_rate": 0.0002292616795539438, "loss": 0.0144, "step": 181930 }, { "epoch": 0.47, "learning_rate": 0.00022925779133757234, "loss": 0.017, "step": 181940 }, { "epoch": 0.47, "learning_rate": 0.00022925390312120085, "loss": 0.0192, "step": 181950 }, { "epoch": 0.47, "learning_rate": 0.00022925001490482942, "loss": 0.0208, "step": 181960 }, { "epoch": 0.47, "learning_rate": 0.00022924612668845794, "loss": 0.021, "step": 181970 }, { "epoch": 0.47, "learning_rate": 0.00022924223847208648, "loss": 0.0162, "step": 181980 }, { "epoch": 0.47, "learning_rate": 0.000229238350255715, "loss": 0.0151, "step": 181990 }, { "epoch": 0.47, "learning_rate": 0.00022923446203934356, "loss": 0.018, "step": 182000 }, { "epoch": 0.47, "eval_cer": 0.8817740678068109, "eval_loss": 0.012949470430612564, "eval_runtime": 108.1298, "eval_samples_per_second": 18.496, "eval_steps_per_second": 4.624, "step": 182000 }, { "epoch": 0.47, "learning_rate": 0.00022923057382297208, "loss": 0.0161, "step": 182010 }, { "epoch": 0.47, "learning_rate": 0.00022922668560660062, "loss": 0.0174, "step": 182020 }, { "epoch": 0.47, "learning_rate": 0.00022922279739022913, "loss": 0.024, "step": 182030 }, { "epoch": 0.47, "learning_rate": 0.0002292189091738577, "loss": 0.0201, "step": 182040 }, { "epoch": 0.47, "learning_rate": 0.00022921502095748624, "loss": 0.0182, "step": 182050 }, { "epoch": 0.47, "learning_rate": 0.00022921113274111476, "loss": 0.0183, "step": 182060 }, { "epoch": 0.47, "learning_rate": 0.00022920724452474327, "loss": 0.02, "step": 182070 }, { "epoch": 0.47, "learning_rate": 0.00022920335630837184, "loss": 0.0218, "step": 182080 }, { "epoch": 0.47, "learning_rate": 0.00022919946809200038, "loss": 0.0166, "step": 182090 }, { "epoch": 0.47, "learning_rate": 0.0002291955798756289, "loss": 0.015, "step": 182100 }, { "epoch": 0.47, "learning_rate": 0.00022919169165925744, "loss": 0.0169, "step": 182110 }, { "epoch": 0.47, "learning_rate": 0.00022918780344288595, "loss": 0.0181, "step": 182120 }, { "epoch": 0.47, "learning_rate": 0.00022918391522651452, "loss": 0.024, "step": 182130 }, { "epoch": 0.47, "learning_rate": 0.00022918002701014303, "loss": 0.0142, "step": 182140 }, { "epoch": 0.47, "learning_rate": 0.00022917613879377158, "loss": 0.0245, "step": 182150 }, { "epoch": 0.47, "learning_rate": 0.0002291722505774001, "loss": 0.014, "step": 182160 }, { "epoch": 0.47, "learning_rate": 0.00022916836236102866, "loss": 0.0199, "step": 182170 }, { "epoch": 0.47, "learning_rate": 0.00022916447414465717, "loss": 0.0221, "step": 182180 }, { "epoch": 0.47, "learning_rate": 0.00022916058592828572, "loss": 0.0221, "step": 182190 }, { "epoch": 0.47, "learning_rate": 0.00022915669771191423, "loss": 0.0216, "step": 182200 }, { "epoch": 0.47, "learning_rate": 0.0002291528094955428, "loss": 0.0171, "step": 182210 }, { "epoch": 0.47, "learning_rate": 0.00022914892127917131, "loss": 0.0159, "step": 182220 }, { "epoch": 0.47, "learning_rate": 0.00022914503306279986, "loss": 0.0154, "step": 182230 }, { "epoch": 0.47, "learning_rate": 0.00022914114484642837, "loss": 0.0202, "step": 182240 }, { "epoch": 0.47, "learning_rate": 0.00022913725663005694, "loss": 0.0167, "step": 182250 }, { "epoch": 0.47, "learning_rate": 0.00022913336841368548, "loss": 0.0182, "step": 182260 }, { "epoch": 0.47, "learning_rate": 0.000229129480197314, "loss": 0.0182, "step": 182270 }, { "epoch": 0.47, "learning_rate": 0.00022912559198094254, "loss": 0.0222, "step": 182280 }, { "epoch": 0.47, "learning_rate": 0.00022912170376457108, "loss": 0.0257, "step": 182290 }, { "epoch": 0.47, "learning_rate": 0.00022911781554819962, "loss": 0.0185, "step": 182300 }, { "epoch": 0.47, "learning_rate": 0.00022911392733182813, "loss": 0.0185, "step": 182310 }, { "epoch": 0.47, "learning_rate": 0.00022911003911545668, "loss": 0.0191, "step": 182320 }, { "epoch": 0.47, "learning_rate": 0.00022910615089908522, "loss": 0.0168, "step": 182330 }, { "epoch": 0.47, "learning_rate": 0.00022910226268271376, "loss": 0.0185, "step": 182340 }, { "epoch": 0.47, "learning_rate": 0.00022909837446634227, "loss": 0.0201, "step": 182350 }, { "epoch": 0.47, "learning_rate": 0.00022909448624997082, "loss": 0.0142, "step": 182360 }, { "epoch": 0.47, "learning_rate": 0.00022909059803359933, "loss": 0.0233, "step": 182370 }, { "epoch": 0.47, "learning_rate": 0.0002290867098172279, "loss": 0.015, "step": 182380 }, { "epoch": 0.47, "learning_rate": 0.0002290828216008564, "loss": 0.0189, "step": 182390 }, { "epoch": 0.47, "learning_rate": 0.00022907893338448495, "loss": 0.0215, "step": 182400 }, { "epoch": 0.47, "learning_rate": 0.00022907504516811347, "loss": 0.0181, "step": 182410 }, { "epoch": 0.47, "learning_rate": 0.00022907115695174204, "loss": 0.0162, "step": 182420 }, { "epoch": 0.47, "learning_rate": 0.00022906726873537058, "loss": 0.0189, "step": 182430 }, { "epoch": 0.47, "learning_rate": 0.0002290633805189991, "loss": 0.0238, "step": 182440 }, { "epoch": 0.47, "learning_rate": 0.00022905949230262764, "loss": 0.0191, "step": 182450 }, { "epoch": 0.47, "learning_rate": 0.00022905560408625618, "loss": 0.0188, "step": 182460 }, { "epoch": 0.47, "learning_rate": 0.00022905171586988472, "loss": 0.0178, "step": 182470 }, { "epoch": 0.47, "learning_rate": 0.00022904782765351323, "loss": 0.0187, "step": 182480 }, { "epoch": 0.47, "learning_rate": 0.00022904393943714178, "loss": 0.0183, "step": 182490 }, { "epoch": 0.47, "learning_rate": 0.00022904005122077032, "loss": 0.0165, "step": 182500 }, { "epoch": 0.47, "learning_rate": 0.00022903616300439886, "loss": 0.0174, "step": 182510 }, { "epoch": 0.47, "learning_rate": 0.00022903227478802737, "loss": 0.0182, "step": 182520 }, { "epoch": 0.47, "learning_rate": 0.00022902838657165591, "loss": 0.0147, "step": 182530 }, { "epoch": 0.47, "learning_rate": 0.00022902449835528446, "loss": 0.0224, "step": 182540 }, { "epoch": 0.47, "learning_rate": 0.000229020610138913, "loss": 0.0195, "step": 182550 }, { "epoch": 0.47, "learning_rate": 0.0002290167219225415, "loss": 0.0169, "step": 182560 }, { "epoch": 0.47, "learning_rate": 0.00022901283370617005, "loss": 0.0175, "step": 182570 }, { "epoch": 0.47, "learning_rate": 0.00022900894548979862, "loss": 0.018, "step": 182580 }, { "epoch": 0.47, "learning_rate": 0.00022900505727342714, "loss": 0.0183, "step": 182590 }, { "epoch": 0.47, "learning_rate": 0.00022900116905705568, "loss": 0.015, "step": 182600 }, { "epoch": 0.47, "learning_rate": 0.0002289972808406842, "loss": 0.0247, "step": 182610 }, { "epoch": 0.47, "learning_rate": 0.0002289933926243127, "loss": 0.0181, "step": 182620 }, { "epoch": 0.47, "learning_rate": 0.00022898950440794128, "loss": 0.0222, "step": 182630 }, { "epoch": 0.47, "learning_rate": 0.00022898561619156982, "loss": 0.0157, "step": 182640 }, { "epoch": 0.47, "learning_rate": 0.00022898172797519833, "loss": 0.0206, "step": 182650 }, { "epoch": 0.47, "learning_rate": 0.00022897783975882687, "loss": 0.0138, "step": 182660 }, { "epoch": 0.47, "learning_rate": 0.00022897395154245542, "loss": 0.0152, "step": 182670 }, { "epoch": 0.47, "learning_rate": 0.00022897006332608396, "loss": 0.0162, "step": 182680 }, { "epoch": 0.47, "learning_rate": 0.00022896617510971247, "loss": 0.0155, "step": 182690 }, { "epoch": 0.47, "learning_rate": 0.00022896228689334101, "loss": 0.0163, "step": 182700 }, { "epoch": 0.47, "learning_rate": 0.00022895839867696956, "loss": 0.0177, "step": 182710 }, { "epoch": 0.47, "learning_rate": 0.0002289545104605981, "loss": 0.0195, "step": 182720 }, { "epoch": 0.47, "learning_rate": 0.0002289506222442266, "loss": 0.0182, "step": 182730 }, { "epoch": 0.47, "learning_rate": 0.00022894673402785515, "loss": 0.0155, "step": 182740 }, { "epoch": 0.47, "learning_rate": 0.00022894284581148372, "loss": 0.0166, "step": 182750 }, { "epoch": 0.47, "learning_rate": 0.00022893895759511224, "loss": 0.0181, "step": 182760 }, { "epoch": 0.47, "learning_rate": 0.00022893506937874078, "loss": 0.0217, "step": 182770 }, { "epoch": 0.47, "learning_rate": 0.0002289311811623693, "loss": 0.0184, "step": 182780 }, { "epoch": 0.47, "learning_rate": 0.00022892729294599786, "loss": 0.0147, "step": 182790 }, { "epoch": 0.47, "learning_rate": 0.00022892340472962638, "loss": 0.0178, "step": 182800 }, { "epoch": 0.47, "learning_rate": 0.00022891951651325492, "loss": 0.015, "step": 182810 }, { "epoch": 0.47, "learning_rate": 0.00022891562829688343, "loss": 0.018, "step": 182820 }, { "epoch": 0.47, "learning_rate": 0.000228911740080512, "loss": 0.0191, "step": 182830 }, { "epoch": 0.47, "learning_rate": 0.00022890785186414052, "loss": 0.0145, "step": 182840 }, { "epoch": 0.47, "learning_rate": 0.00022890396364776906, "loss": 0.0149, "step": 182850 }, { "epoch": 0.47, "learning_rate": 0.00022890007543139757, "loss": 0.0203, "step": 182860 }, { "epoch": 0.47, "learning_rate": 0.00022889618721502611, "loss": 0.0216, "step": 182870 }, { "epoch": 0.47, "learning_rate": 0.00022889229899865466, "loss": 0.0132, "step": 182880 }, { "epoch": 0.47, "learning_rate": 0.0002288884107822832, "loss": 0.0192, "step": 182890 }, { "epoch": 0.47, "learning_rate": 0.0002288845225659117, "loss": 0.0156, "step": 182900 }, { "epoch": 0.47, "learning_rate": 0.00022888063434954025, "loss": 0.0163, "step": 182910 }, { "epoch": 0.47, "learning_rate": 0.00022887674613316882, "loss": 0.0152, "step": 182920 }, { "epoch": 0.47, "learning_rate": 0.00022887285791679734, "loss": 0.0204, "step": 182930 }, { "epoch": 0.47, "learning_rate": 0.00022886896970042585, "loss": 0.0181, "step": 182940 }, { "epoch": 0.47, "learning_rate": 0.0002288650814840544, "loss": 0.0182, "step": 182950 }, { "epoch": 0.47, "learning_rate": 0.00022886119326768296, "loss": 0.0229, "step": 182960 }, { "epoch": 0.47, "learning_rate": 0.00022885730505131148, "loss": 0.0249, "step": 182970 }, { "epoch": 0.47, "learning_rate": 0.00022885341683494002, "loss": 0.0163, "step": 182980 }, { "epoch": 0.47, "learning_rate": 0.00022884952861856853, "loss": 0.0155, "step": 182990 }, { "epoch": 0.47, "learning_rate": 0.0002288456404021971, "loss": 0.0191, "step": 183000 }, { "epoch": 0.47, "eval_cer": 0.8817992612716261, "eval_loss": 0.012429905124008656, "eval_runtime": 108.0004, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.63, "step": 183000 }, { "epoch": 0.47, "learning_rate": 0.00022884175218582562, "loss": 0.0171, "step": 183010 }, { "epoch": 0.47, "learning_rate": 0.00022883786396945416, "loss": 0.0166, "step": 183020 }, { "epoch": 0.47, "learning_rate": 0.00022883397575308267, "loss": 0.016, "step": 183030 }, { "epoch": 0.47, "learning_rate": 0.00022883008753671124, "loss": 0.0215, "step": 183040 }, { "epoch": 0.47, "learning_rate": 0.00022882619932033975, "loss": 0.0163, "step": 183050 }, { "epoch": 0.47, "learning_rate": 0.0002288223111039683, "loss": 0.0202, "step": 183060 }, { "epoch": 0.47, "learning_rate": 0.0002288184228875968, "loss": 0.0281, "step": 183070 }, { "epoch": 0.47, "learning_rate": 0.00022881453467122538, "loss": 0.0182, "step": 183080 }, { "epoch": 0.47, "learning_rate": 0.0002288106464548539, "loss": 0.0171, "step": 183090 }, { "epoch": 0.47, "learning_rate": 0.00022880675823848244, "loss": 0.0202, "step": 183100 }, { "epoch": 0.47, "learning_rate": 0.00022880287002211095, "loss": 0.0167, "step": 183110 }, { "epoch": 0.47, "learning_rate": 0.0002287989818057395, "loss": 0.0193, "step": 183120 }, { "epoch": 0.47, "learning_rate": 0.00022879509358936806, "loss": 0.0147, "step": 183130 }, { "epoch": 0.47, "learning_rate": 0.00022879120537299658, "loss": 0.0162, "step": 183140 }, { "epoch": 0.47, "learning_rate": 0.00022878731715662512, "loss": 0.0167, "step": 183150 }, { "epoch": 0.47, "learning_rate": 0.00022878342894025363, "loss": 0.0168, "step": 183160 }, { "epoch": 0.47, "learning_rate": 0.0002287795407238822, "loss": 0.0169, "step": 183170 }, { "epoch": 0.47, "learning_rate": 0.00022877565250751071, "loss": 0.0151, "step": 183180 }, { "epoch": 0.47, "learning_rate": 0.00022877176429113926, "loss": 0.0224, "step": 183190 }, { "epoch": 0.47, "learning_rate": 0.00022876787607476777, "loss": 0.0184, "step": 183200 }, { "epoch": 0.47, "learning_rate": 0.00022876398785839634, "loss": 0.0187, "step": 183210 }, { "epoch": 0.47, "learning_rate": 0.00022876009964202485, "loss": 0.0183, "step": 183220 }, { "epoch": 0.47, "learning_rate": 0.0002287562114256534, "loss": 0.0135, "step": 183230 }, { "epoch": 0.47, "learning_rate": 0.0002287523232092819, "loss": 0.0153, "step": 183240 }, { "epoch": 0.48, "learning_rate": 0.00022874843499291048, "loss": 0.0201, "step": 183250 }, { "epoch": 0.48, "learning_rate": 0.000228744546776539, "loss": 0.0169, "step": 183260 }, { "epoch": 0.48, "learning_rate": 0.00022874065856016754, "loss": 0.0157, "step": 183270 }, { "epoch": 0.48, "learning_rate": 0.00022873677034379605, "loss": 0.0244, "step": 183280 }, { "epoch": 0.48, "learning_rate": 0.00022873288212742462, "loss": 0.0182, "step": 183290 }, { "epoch": 0.48, "learning_rate": 0.00022872899391105316, "loss": 0.0175, "step": 183300 }, { "epoch": 0.48, "learning_rate": 0.00022872510569468167, "loss": 0.0234, "step": 183310 }, { "epoch": 0.48, "learning_rate": 0.00022872121747831022, "loss": 0.0155, "step": 183320 }, { "epoch": 0.48, "learning_rate": 0.00022871732926193876, "loss": 0.018, "step": 183330 }, { "epoch": 0.48, "learning_rate": 0.0002287134410455673, "loss": 0.0234, "step": 183340 }, { "epoch": 0.48, "learning_rate": 0.00022870955282919581, "loss": 0.017, "step": 183350 }, { "epoch": 0.48, "learning_rate": 0.00022870566461282436, "loss": 0.0183, "step": 183360 }, { "epoch": 0.48, "learning_rate": 0.00022870177639645287, "loss": 0.0195, "step": 183370 }, { "epoch": 0.48, "learning_rate": 0.00022869788818008144, "loss": 0.0228, "step": 183380 }, { "epoch": 0.48, "learning_rate": 0.00022869399996370995, "loss": 0.0192, "step": 183390 }, { "epoch": 0.48, "learning_rate": 0.0002286901117473385, "loss": 0.0195, "step": 183400 }, { "epoch": 0.48, "learning_rate": 0.000228686223530967, "loss": 0.0173, "step": 183410 }, { "epoch": 0.48, "learning_rate": 0.00022868233531459558, "loss": 0.0162, "step": 183420 }, { "epoch": 0.48, "learning_rate": 0.0002286784470982241, "loss": 0.0242, "step": 183430 }, { "epoch": 0.48, "learning_rate": 0.00022867455888185263, "loss": 0.0168, "step": 183440 }, { "epoch": 0.48, "learning_rate": 0.00022867067066548115, "loss": 0.0153, "step": 183450 }, { "epoch": 0.48, "learning_rate": 0.00022866678244910972, "loss": 0.0174, "step": 183460 }, { "epoch": 0.48, "learning_rate": 0.00022866289423273826, "loss": 0.0195, "step": 183470 }, { "epoch": 0.48, "learning_rate": 0.00022865900601636677, "loss": 0.0162, "step": 183480 }, { "epoch": 0.48, "learning_rate": 0.0002286551177999953, "loss": 0.0181, "step": 183490 }, { "epoch": 0.48, "learning_rate": 0.00022865122958362386, "loss": 0.0177, "step": 183500 }, { "epoch": 0.48, "learning_rate": 0.0002286473413672524, "loss": 0.0165, "step": 183510 }, { "epoch": 0.48, "learning_rate": 0.00022864345315088091, "loss": 0.0184, "step": 183520 }, { "epoch": 0.48, "learning_rate": 0.00022863956493450946, "loss": 0.013, "step": 183530 }, { "epoch": 0.48, "learning_rate": 0.000228635676718138, "loss": 0.0131, "step": 183540 }, { "epoch": 0.48, "learning_rate": 0.00022863178850176654, "loss": 0.0182, "step": 183550 }, { "epoch": 0.48, "learning_rate": 0.00022862790028539505, "loss": 0.0162, "step": 183560 }, { "epoch": 0.48, "learning_rate": 0.0002286240120690236, "loss": 0.019, "step": 183570 }, { "epoch": 0.48, "learning_rate": 0.00022862012385265214, "loss": 0.0154, "step": 183580 }, { "epoch": 0.48, "learning_rate": 0.00022861623563628068, "loss": 0.0169, "step": 183590 }, { "epoch": 0.48, "learning_rate": 0.0002286123474199092, "loss": 0.0188, "step": 183600 }, { "epoch": 0.48, "learning_rate": 0.00022860845920353773, "loss": 0.0161, "step": 183610 }, { "epoch": 0.48, "learning_rate": 0.00022860457098716625, "loss": 0.0177, "step": 183620 }, { "epoch": 0.48, "learning_rate": 0.00022860068277079482, "loss": 0.0164, "step": 183630 }, { "epoch": 0.48, "learning_rate": 0.00022859679455442336, "loss": 0.0157, "step": 183640 }, { "epoch": 0.48, "learning_rate": 0.00022859290633805187, "loss": 0.0148, "step": 183650 }, { "epoch": 0.48, "learning_rate": 0.0002285890181216804, "loss": 0.0167, "step": 183660 }, { "epoch": 0.48, "learning_rate": 0.00022858512990530896, "loss": 0.0178, "step": 183670 }, { "epoch": 0.48, "learning_rate": 0.0002285812416889375, "loss": 0.017, "step": 183680 }, { "epoch": 0.48, "learning_rate": 0.000228577353472566, "loss": 0.02, "step": 183690 }, { "epoch": 0.48, "learning_rate": 0.00022857346525619455, "loss": 0.0153, "step": 183700 }, { "epoch": 0.48, "learning_rate": 0.0002285695770398231, "loss": 0.0185, "step": 183710 }, { "epoch": 0.48, "learning_rate": 0.00022856568882345164, "loss": 0.0247, "step": 183720 }, { "epoch": 0.48, "learning_rate": 0.00022856180060708015, "loss": 0.0234, "step": 183730 }, { "epoch": 0.48, "learning_rate": 0.0002285579123907087, "loss": 0.018, "step": 183740 }, { "epoch": 0.48, "learning_rate": 0.00022855402417433724, "loss": 0.019, "step": 183750 }, { "epoch": 0.48, "learning_rate": 0.00022855013595796578, "loss": 0.0157, "step": 183760 }, { "epoch": 0.48, "learning_rate": 0.0002285462477415943, "loss": 0.021, "step": 183770 }, { "epoch": 0.48, "learning_rate": 0.00022854235952522283, "loss": 0.0217, "step": 183780 }, { "epoch": 0.48, "learning_rate": 0.0002285384713088514, "loss": 0.0218, "step": 183790 }, { "epoch": 0.48, "learning_rate": 0.00022853458309247992, "loss": 0.0271, "step": 183800 }, { "epoch": 0.48, "learning_rate": 0.00022853069487610843, "loss": 0.0169, "step": 183810 }, { "epoch": 0.48, "learning_rate": 0.00022852680665973697, "loss": 0.0187, "step": 183820 }, { "epoch": 0.48, "learning_rate": 0.00022852291844336554, "loss": 0.0164, "step": 183830 }, { "epoch": 0.48, "learning_rate": 0.00022851903022699406, "loss": 0.0224, "step": 183840 }, { "epoch": 0.48, "learning_rate": 0.0002285151420106226, "loss": 0.0183, "step": 183850 }, { "epoch": 0.48, "learning_rate": 0.0002285112537942511, "loss": 0.0151, "step": 183860 }, { "epoch": 0.48, "learning_rate": 0.00022850736557787965, "loss": 0.0183, "step": 183870 }, { "epoch": 0.48, "learning_rate": 0.0002285034773615082, "loss": 0.0229, "step": 183880 }, { "epoch": 0.48, "learning_rate": 0.00022849958914513674, "loss": 0.0209, "step": 183890 }, { "epoch": 0.48, "learning_rate": 0.00022849570092876525, "loss": 0.037, "step": 183900 }, { "epoch": 0.48, "learning_rate": 0.0002284918127123938, "loss": 0.0236, "step": 183910 }, { "epoch": 0.48, "learning_rate": 0.00022848792449602234, "loss": 0.0194, "step": 183920 }, { "epoch": 0.48, "learning_rate": 0.00022848403627965088, "loss": 0.0197, "step": 183930 }, { "epoch": 0.48, "learning_rate": 0.0002284801480632794, "loss": 0.0233, "step": 183940 }, { "epoch": 0.48, "learning_rate": 0.00022847625984690793, "loss": 0.0178, "step": 183950 }, { "epoch": 0.48, "learning_rate": 0.00022847237163053647, "loss": 0.0197, "step": 183960 }, { "epoch": 0.48, "learning_rate": 0.00022846848341416502, "loss": 0.0154, "step": 183970 }, { "epoch": 0.48, "learning_rate": 0.00022846459519779353, "loss": 0.0155, "step": 183980 }, { "epoch": 0.48, "learning_rate": 0.00022846070698142207, "loss": 0.0206, "step": 183990 }, { "epoch": 0.48, "learning_rate": 0.00022845681876505064, "loss": 0.021, "step": 184000 }, { "epoch": 0.48, "eval_cer": 0.8817712685329425, "eval_loss": 0.012564102187752724, "eval_runtime": 108.043, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 184000 }, { "epoch": 0.48, "learning_rate": 0.00022845293054867916, "loss": 0.0193, "step": 184010 }, { "epoch": 0.48, "learning_rate": 0.0002284490423323077, "loss": 0.0184, "step": 184020 }, { "epoch": 0.48, "learning_rate": 0.0002284451541159362, "loss": 0.0251, "step": 184030 }, { "epoch": 0.48, "learning_rate": 0.00022844126589956478, "loss": 0.0248, "step": 184040 }, { "epoch": 0.48, "learning_rate": 0.0002284373776831933, "loss": 0.0146, "step": 184050 }, { "epoch": 0.48, "learning_rate": 0.00022843348946682184, "loss": 0.0184, "step": 184060 }, { "epoch": 0.48, "learning_rate": 0.00022842960125045035, "loss": 0.0198, "step": 184070 }, { "epoch": 0.48, "learning_rate": 0.00022842571303407892, "loss": 0.0143, "step": 184080 }, { "epoch": 0.48, "learning_rate": 0.00022842182481770743, "loss": 0.0214, "step": 184090 }, { "epoch": 0.48, "learning_rate": 0.00022841793660133598, "loss": 0.0181, "step": 184100 }, { "epoch": 0.48, "learning_rate": 0.0002284140483849645, "loss": 0.0179, "step": 184110 }, { "epoch": 0.48, "learning_rate": 0.00022841016016859303, "loss": 0.0183, "step": 184120 }, { "epoch": 0.48, "learning_rate": 0.00022840627195222157, "loss": 0.0171, "step": 184130 }, { "epoch": 0.48, "learning_rate": 0.00022840238373585012, "loss": 0.0186, "step": 184140 }, { "epoch": 0.48, "learning_rate": 0.00022839849551947863, "loss": 0.0143, "step": 184150 }, { "epoch": 0.48, "learning_rate": 0.00022839460730310717, "loss": 0.0148, "step": 184160 }, { "epoch": 0.48, "learning_rate": 0.00022839071908673574, "loss": 0.0158, "step": 184170 }, { "epoch": 0.48, "learning_rate": 0.00022838683087036426, "loss": 0.0134, "step": 184180 }, { "epoch": 0.48, "learning_rate": 0.0002283829426539928, "loss": 0.0179, "step": 184190 }, { "epoch": 0.48, "learning_rate": 0.0002283790544376213, "loss": 0.017, "step": 184200 }, { "epoch": 0.48, "learning_rate": 0.00022837516622124988, "loss": 0.0172, "step": 184210 }, { "epoch": 0.48, "learning_rate": 0.0002283712780048784, "loss": 0.016, "step": 184220 }, { "epoch": 0.48, "learning_rate": 0.00022836738978850694, "loss": 0.0148, "step": 184230 }, { "epoch": 0.48, "learning_rate": 0.00022836350157213545, "loss": 0.0182, "step": 184240 }, { "epoch": 0.48, "learning_rate": 0.00022835961335576402, "loss": 0.0172, "step": 184250 }, { "epoch": 0.48, "learning_rate": 0.00022835572513939253, "loss": 0.0159, "step": 184260 }, { "epoch": 0.48, "learning_rate": 0.00022835183692302108, "loss": 0.0164, "step": 184270 }, { "epoch": 0.48, "learning_rate": 0.0002283479487066496, "loss": 0.0224, "step": 184280 }, { "epoch": 0.48, "learning_rate": 0.00022834406049027816, "loss": 0.0218, "step": 184290 }, { "epoch": 0.48, "learning_rate": 0.00022834017227390667, "loss": 0.0139, "step": 184300 }, { "epoch": 0.48, "learning_rate": 0.00022833628405753522, "loss": 0.0212, "step": 184310 }, { "epoch": 0.48, "learning_rate": 0.00022833239584116373, "loss": 0.0153, "step": 184320 }, { "epoch": 0.48, "learning_rate": 0.0002283285076247923, "loss": 0.02, "step": 184330 }, { "epoch": 0.48, "learning_rate": 0.00022832461940842084, "loss": 0.0202, "step": 184340 }, { "epoch": 0.48, "learning_rate": 0.00022832073119204935, "loss": 0.0225, "step": 184350 }, { "epoch": 0.48, "learning_rate": 0.0002283168429756779, "loss": 0.022, "step": 184360 }, { "epoch": 0.48, "learning_rate": 0.0002283129547593064, "loss": 0.0142, "step": 184370 }, { "epoch": 0.48, "learning_rate": 0.00022830906654293498, "loss": 0.0177, "step": 184380 }, { "epoch": 0.48, "learning_rate": 0.0002283051783265635, "loss": 0.0173, "step": 184390 }, { "epoch": 0.48, "learning_rate": 0.00022830129011019204, "loss": 0.0153, "step": 184400 }, { "epoch": 0.48, "learning_rate": 0.00022829740189382055, "loss": 0.0197, "step": 184410 }, { "epoch": 0.48, "learning_rate": 0.00022829351367744912, "loss": 0.0178, "step": 184420 }, { "epoch": 0.48, "learning_rate": 0.00022828962546107763, "loss": 0.0172, "step": 184430 }, { "epoch": 0.48, "learning_rate": 0.00022828573724470618, "loss": 0.0153, "step": 184440 }, { "epoch": 0.48, "learning_rate": 0.0002282818490283347, "loss": 0.0195, "step": 184450 }, { "epoch": 0.48, "learning_rate": 0.00022827796081196326, "loss": 0.0173, "step": 184460 }, { "epoch": 0.48, "learning_rate": 0.00022827407259559177, "loss": 0.017, "step": 184470 }, { "epoch": 0.48, "learning_rate": 0.00022827018437922031, "loss": 0.0178, "step": 184480 }, { "epoch": 0.48, "learning_rate": 0.00022826629616284883, "loss": 0.0128, "step": 184490 }, { "epoch": 0.48, "learning_rate": 0.0002282624079464774, "loss": 0.0185, "step": 184500 }, { "epoch": 0.48, "learning_rate": 0.00022825851973010594, "loss": 0.0255, "step": 184510 }, { "epoch": 0.48, "learning_rate": 0.00022825463151373445, "loss": 0.0163, "step": 184520 }, { "epoch": 0.48, "learning_rate": 0.00022825074329736297, "loss": 0.0171, "step": 184530 }, { "epoch": 0.48, "learning_rate": 0.00022824685508099154, "loss": 0.0155, "step": 184540 }, { "epoch": 0.48, "learning_rate": 0.00022824296686462008, "loss": 0.0167, "step": 184550 }, { "epoch": 0.48, "learning_rate": 0.0002282390786482486, "loss": 0.015, "step": 184560 }, { "epoch": 0.48, "learning_rate": 0.00022823519043187714, "loss": 0.021, "step": 184570 }, { "epoch": 0.48, "learning_rate": 0.00022823130221550568, "loss": 0.0172, "step": 184580 }, { "epoch": 0.48, "learning_rate": 0.00022822741399913422, "loss": 0.0199, "step": 184590 }, { "epoch": 0.48, "learning_rate": 0.00022822352578276273, "loss": 0.0155, "step": 184600 }, { "epoch": 0.48, "learning_rate": 0.00022821963756639127, "loss": 0.0175, "step": 184610 }, { "epoch": 0.48, "learning_rate": 0.0002282157493500198, "loss": 0.0205, "step": 184620 }, { "epoch": 0.48, "learning_rate": 0.00022821186113364836, "loss": 0.0183, "step": 184630 }, { "epoch": 0.48, "learning_rate": 0.00022820797291727687, "loss": 0.0179, "step": 184640 }, { "epoch": 0.48, "learning_rate": 0.00022820408470090541, "loss": 0.0165, "step": 184650 }, { "epoch": 0.48, "learning_rate": 0.00022820019648453393, "loss": 0.0177, "step": 184660 }, { "epoch": 0.48, "learning_rate": 0.0002281963082681625, "loss": 0.0197, "step": 184670 }, { "epoch": 0.48, "learning_rate": 0.000228192420051791, "loss": 0.0217, "step": 184680 }, { "epoch": 0.48, "learning_rate": 0.00022818853183541955, "loss": 0.018, "step": 184690 }, { "epoch": 0.48, "learning_rate": 0.00022818464361904807, "loss": 0.0169, "step": 184700 }, { "epoch": 0.48, "learning_rate": 0.00022818075540267664, "loss": 0.0159, "step": 184710 }, { "epoch": 0.48, "learning_rate": 0.00022817686718630518, "loss": 0.0168, "step": 184720 }, { "epoch": 0.48, "learning_rate": 0.0002281729789699337, "loss": 0.0214, "step": 184730 }, { "epoch": 0.48, "learning_rate": 0.00022816909075356223, "loss": 0.02, "step": 184740 }, { "epoch": 0.48, "learning_rate": 0.00022816520253719078, "loss": 0.0169, "step": 184750 }, { "epoch": 0.48, "learning_rate": 0.00022816131432081932, "loss": 0.0211, "step": 184760 }, { "epoch": 0.48, "learning_rate": 0.00022815742610444783, "loss": 0.0156, "step": 184770 }, { "epoch": 0.48, "learning_rate": 0.00022815353788807637, "loss": 0.0216, "step": 184780 }, { "epoch": 0.48, "learning_rate": 0.00022814964967170492, "loss": 0.019, "step": 184790 }, { "epoch": 0.48, "learning_rate": 0.00022814576145533346, "loss": 0.0187, "step": 184800 }, { "epoch": 0.48, "learning_rate": 0.00022814187323896197, "loss": 0.0188, "step": 184810 }, { "epoch": 0.48, "learning_rate": 0.0002281379850225905, "loss": 0.0161, "step": 184820 }, { "epoch": 0.48, "learning_rate": 0.00022813409680621908, "loss": 0.0196, "step": 184830 }, { "epoch": 0.48, "learning_rate": 0.0002281302085898476, "loss": 0.0189, "step": 184840 }, { "epoch": 0.48, "learning_rate": 0.0002281263203734761, "loss": 0.0225, "step": 184850 }, { "epoch": 0.48, "learning_rate": 0.00022812243215710465, "loss": 0.0191, "step": 184860 }, { "epoch": 0.48, "learning_rate": 0.00022811854394073317, "loss": 0.0166, "step": 184870 }, { "epoch": 0.48, "learning_rate": 0.00022811465572436174, "loss": 0.0141, "step": 184880 }, { "epoch": 0.48, "learning_rate": 0.00022811076750799028, "loss": 0.0202, "step": 184890 }, { "epoch": 0.48, "learning_rate": 0.0002281068792916188, "loss": 0.0207, "step": 184900 }, { "epoch": 0.48, "learning_rate": 0.00022810299107524733, "loss": 0.0214, "step": 184910 }, { "epoch": 0.48, "learning_rate": 0.00022809910285887588, "loss": 0.0155, "step": 184920 }, { "epoch": 0.48, "learning_rate": 0.00022809521464250442, "loss": 0.0165, "step": 184930 }, { "epoch": 0.48, "learning_rate": 0.00022809132642613293, "loss": 0.0167, "step": 184940 }, { "epoch": 0.48, "learning_rate": 0.00022808743820976147, "loss": 0.016, "step": 184950 }, { "epoch": 0.48, "learning_rate": 0.00022808354999339002, "loss": 0.0156, "step": 184960 }, { "epoch": 0.48, "learning_rate": 0.00022807966177701856, "loss": 0.025, "step": 184970 }, { "epoch": 0.48, "learning_rate": 0.00022807577356064707, "loss": 0.018, "step": 184980 }, { "epoch": 0.48, "learning_rate": 0.0002280718853442756, "loss": 0.0206, "step": 184990 }, { "epoch": 0.48, "learning_rate": 0.00022806799712790415, "loss": 0.0197, "step": 185000 }, { "epoch": 0.48, "eval_cer": 0.8817614710744033, "eval_loss": 0.01203981600701809, "eval_runtime": 108.1177, "eval_samples_per_second": 18.498, "eval_steps_per_second": 4.625, "step": 185000 }, { "epoch": 0.48, "learning_rate": 0.0002280641089115327, "loss": 0.0149, "step": 185010 }, { "epoch": 0.48, "learning_rate": 0.0002280602206951612, "loss": 0.0135, "step": 185020 }, { "epoch": 0.48, "learning_rate": 0.00022805633247878975, "loss": 0.0166, "step": 185030 }, { "epoch": 0.48, "learning_rate": 0.00022805244426241832, "loss": 0.0182, "step": 185040 }, { "epoch": 0.48, "learning_rate": 0.00022804855604604684, "loss": 0.0178, "step": 185050 }, { "epoch": 0.48, "learning_rate": 0.00022804466782967538, "loss": 0.0176, "step": 185060 }, { "epoch": 0.48, "learning_rate": 0.0002280407796133039, "loss": 0.0178, "step": 185070 }, { "epoch": 0.48, "learning_rate": 0.00022803689139693246, "loss": 0.0207, "step": 185080 }, { "epoch": 0.48, "learning_rate": 0.00022803300318056097, "loss": 0.0163, "step": 185090 }, { "epoch": 0.48, "learning_rate": 0.00022802911496418952, "loss": 0.017, "step": 185100 }, { "epoch": 0.48, "learning_rate": 0.00022802522674781803, "loss": 0.0147, "step": 185110 }, { "epoch": 0.48, "learning_rate": 0.00022802133853144657, "loss": 0.0204, "step": 185120 }, { "epoch": 0.48, "learning_rate": 0.00022801745031507511, "loss": 0.0174, "step": 185130 }, { "epoch": 0.48, "learning_rate": 0.00022801356209870366, "loss": 0.0138, "step": 185140 }, { "epoch": 0.48, "learning_rate": 0.00022800967388233217, "loss": 0.0171, "step": 185150 }, { "epoch": 0.48, "learning_rate": 0.0002280057856659607, "loss": 0.0171, "step": 185160 }, { "epoch": 0.48, "learning_rate": 0.00022800189744958925, "loss": 0.0173, "step": 185170 }, { "epoch": 0.48, "learning_rate": 0.0002279980092332178, "loss": 0.0207, "step": 185180 }, { "epoch": 0.48, "learning_rate": 0.0002279941210168463, "loss": 0.0171, "step": 185190 }, { "epoch": 0.48, "learning_rate": 0.00022799023280047485, "loss": 0.0227, "step": 185200 }, { "epoch": 0.48, "learning_rate": 0.00022798634458410342, "loss": 0.0162, "step": 185210 }, { "epoch": 0.48, "learning_rate": 0.00022798245636773193, "loss": 0.0169, "step": 185220 }, { "epoch": 0.48, "learning_rate": 0.00022797856815136048, "loss": 0.0186, "step": 185230 }, { "epoch": 0.48, "learning_rate": 0.000227974679934989, "loss": 0.0226, "step": 185240 }, { "epoch": 0.48, "learning_rate": 0.00022797079171861756, "loss": 0.0177, "step": 185250 }, { "epoch": 0.48, "learning_rate": 0.00022796690350224607, "loss": 0.0134, "step": 185260 }, { "epoch": 0.48, "learning_rate": 0.00022796301528587462, "loss": 0.017, "step": 185270 }, { "epoch": 0.48, "learning_rate": 0.00022795912706950313, "loss": 0.0205, "step": 185280 }, { "epoch": 0.48, "learning_rate": 0.0002279552388531317, "loss": 0.0156, "step": 185290 }, { "epoch": 0.48, "learning_rate": 0.00022795135063676021, "loss": 0.0201, "step": 185300 }, { "epoch": 0.48, "learning_rate": 0.00022794746242038876, "loss": 0.0184, "step": 185310 }, { "epoch": 0.48, "learning_rate": 0.00022794357420401727, "loss": 0.0169, "step": 185320 }, { "epoch": 0.48, "learning_rate": 0.00022793968598764584, "loss": 0.0167, "step": 185330 }, { "epoch": 0.48, "learning_rate": 0.00022793579777127435, "loss": 0.0174, "step": 185340 }, { "epoch": 0.48, "learning_rate": 0.0002279319095549029, "loss": 0.0208, "step": 185350 }, { "epoch": 0.48, "learning_rate": 0.0002279280213385314, "loss": 0.0157, "step": 185360 }, { "epoch": 0.48, "learning_rate": 0.00022792413312215995, "loss": 0.017, "step": 185370 }, { "epoch": 0.48, "learning_rate": 0.00022792024490578852, "loss": 0.0165, "step": 185380 }, { "epoch": 0.48, "learning_rate": 0.00022791635668941703, "loss": 0.0163, "step": 185390 }, { "epoch": 0.48, "learning_rate": 0.00022791246847304555, "loss": 0.0187, "step": 185400 }, { "epoch": 0.48, "learning_rate": 0.0002279085802566741, "loss": 0.0163, "step": 185410 }, { "epoch": 0.48, "learning_rate": 0.00022790469204030266, "loss": 0.0151, "step": 185420 }, { "epoch": 0.48, "learning_rate": 0.00022790080382393117, "loss": 0.0153, "step": 185430 }, { "epoch": 0.48, "learning_rate": 0.00022789691560755972, "loss": 0.0227, "step": 185440 }, { "epoch": 0.48, "learning_rate": 0.00022789302739118823, "loss": 0.0177, "step": 185450 }, { "epoch": 0.48, "learning_rate": 0.0002278891391748168, "loss": 0.0154, "step": 185460 }, { "epoch": 0.48, "learning_rate": 0.0002278852509584453, "loss": 0.0246, "step": 185470 }, { "epoch": 0.48, "learning_rate": 0.00022788136274207385, "loss": 0.0154, "step": 185480 }, { "epoch": 0.48, "learning_rate": 0.00022787747452570237, "loss": 0.0181, "step": 185490 }, { "epoch": 0.48, "learning_rate": 0.00022787358630933094, "loss": 0.0189, "step": 185500 }, { "epoch": 0.48, "learning_rate": 0.00022786969809295945, "loss": 0.0256, "step": 185510 }, { "epoch": 0.48, "learning_rate": 0.000227865809876588, "loss": 0.0211, "step": 185520 }, { "epoch": 0.48, "learning_rate": 0.0002278619216602165, "loss": 0.017, "step": 185530 }, { "epoch": 0.48, "learning_rate": 0.00022785803344384508, "loss": 0.0169, "step": 185540 }, { "epoch": 0.48, "learning_rate": 0.0002278541452274736, "loss": 0.0152, "step": 185550 }, { "epoch": 0.48, "learning_rate": 0.00022785025701110213, "loss": 0.02, "step": 185560 }, { "epoch": 0.48, "learning_rate": 0.00022784636879473065, "loss": 0.0194, "step": 185570 }, { "epoch": 0.48, "learning_rate": 0.00022784248057835922, "loss": 0.0173, "step": 185580 }, { "epoch": 0.48, "learning_rate": 0.00022783859236198776, "loss": 0.0182, "step": 185590 }, { "epoch": 0.48, "learning_rate": 0.00022783470414561627, "loss": 0.0175, "step": 185600 }, { "epoch": 0.48, "learning_rate": 0.00022783081592924481, "loss": 0.0172, "step": 185610 }, { "epoch": 0.48, "learning_rate": 0.00022782692771287333, "loss": 0.0182, "step": 185620 }, { "epoch": 0.48, "learning_rate": 0.0002278230394965019, "loss": 0.0167, "step": 185630 }, { "epoch": 0.48, "learning_rate": 0.0002278191512801304, "loss": 0.019, "step": 185640 }, { "epoch": 0.48, "learning_rate": 0.00022781526306375895, "loss": 0.0182, "step": 185650 }, { "epoch": 0.48, "learning_rate": 0.00022781137484738747, "loss": 0.0177, "step": 185660 }, { "epoch": 0.48, "learning_rate": 0.00022780748663101604, "loss": 0.0154, "step": 185670 }, { "epoch": 0.48, "learning_rate": 0.00022780359841464455, "loss": 0.0215, "step": 185680 }, { "epoch": 0.48, "learning_rate": 0.0002277997101982731, "loss": 0.0165, "step": 185690 }, { "epoch": 0.48, "learning_rate": 0.0002277958219819016, "loss": 0.019, "step": 185700 }, { "epoch": 0.48, "learning_rate": 0.00022779193376553018, "loss": 0.0186, "step": 185710 }, { "epoch": 0.48, "learning_rate": 0.0002277880455491587, "loss": 0.0144, "step": 185720 }, { "epoch": 0.48, "learning_rate": 0.00022778415733278723, "loss": 0.0182, "step": 185730 }, { "epoch": 0.48, "learning_rate": 0.00022778026911641575, "loss": 0.0178, "step": 185740 }, { "epoch": 0.48, "learning_rate": 0.00022777638090004432, "loss": 0.0159, "step": 185750 }, { "epoch": 0.48, "learning_rate": 0.00022777249268367286, "loss": 0.0205, "step": 185760 }, { "epoch": 0.48, "learning_rate": 0.00022776860446730137, "loss": 0.017, "step": 185770 }, { "epoch": 0.48, "learning_rate": 0.00022776471625092991, "loss": 0.0225, "step": 185780 }, { "epoch": 0.48, "learning_rate": 0.00022776082803455846, "loss": 0.015, "step": 185790 }, { "epoch": 0.48, "learning_rate": 0.000227756939818187, "loss": 0.0185, "step": 185800 }, { "epoch": 0.48, "learning_rate": 0.0002277530516018155, "loss": 0.0193, "step": 185810 }, { "epoch": 0.48, "learning_rate": 0.00022774916338544405, "loss": 0.0139, "step": 185820 }, { "epoch": 0.48, "learning_rate": 0.0002277452751690726, "loss": 0.0157, "step": 185830 }, { "epoch": 0.48, "learning_rate": 0.00022774138695270114, "loss": 0.016, "step": 185840 }, { "epoch": 0.48, "learning_rate": 0.00022773749873632965, "loss": 0.0212, "step": 185850 }, { "epoch": 0.48, "learning_rate": 0.0002277336105199582, "loss": 0.0161, "step": 185860 }, { "epoch": 0.48, "learning_rate": 0.0002277297223035867, "loss": 0.017, "step": 185870 }, { "epoch": 0.48, "learning_rate": 0.00022772583408721528, "loss": 0.017, "step": 185880 }, { "epoch": 0.48, "learning_rate": 0.0002277219458708438, "loss": 0.0168, "step": 185890 }, { "epoch": 0.48, "learning_rate": 0.00022771805765447233, "loss": 0.0166, "step": 185900 }, { "epoch": 0.48, "learning_rate": 0.00022771416943810085, "loss": 0.0174, "step": 185910 }, { "epoch": 0.48, "learning_rate": 0.00022771028122172942, "loss": 0.0178, "step": 185920 }, { "epoch": 0.48, "learning_rate": 0.00022770639300535796, "loss": 0.0171, "step": 185930 }, { "epoch": 0.48, "learning_rate": 0.00022770250478898647, "loss": 0.0175, "step": 185940 }, { "epoch": 0.48, "learning_rate": 0.00022769861657261501, "loss": 0.0173, "step": 185950 }, { "epoch": 0.48, "learning_rate": 0.00022769472835624356, "loss": 0.018, "step": 185960 }, { "epoch": 0.48, "learning_rate": 0.0002276908401398721, "loss": 0.0178, "step": 185970 }, { "epoch": 0.48, "learning_rate": 0.0002276869519235006, "loss": 0.0134, "step": 185980 }, { "epoch": 0.48, "learning_rate": 0.00022768306370712915, "loss": 0.0168, "step": 185990 }, { "epoch": 0.48, "learning_rate": 0.0002276791754907577, "loss": 0.0172, "step": 186000 }, { "epoch": 0.48, "eval_cer": 0.8818188561887047, "eval_loss": 0.012164667248725891, "eval_runtime": 107.6778, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 186000 }, { "epoch": 0.48, "learning_rate": 0.00022767528727438624, "loss": 0.0175, "step": 186010 }, { "epoch": 0.48, "learning_rate": 0.00022767139905801475, "loss": 0.0145, "step": 186020 }, { "epoch": 0.48, "learning_rate": 0.0002276675108416433, "loss": 0.0205, "step": 186030 }, { "epoch": 0.48, "learning_rate": 0.00022766362262527183, "loss": 0.0171, "step": 186040 }, { "epoch": 0.48, "learning_rate": 0.00022765973440890038, "loss": 0.0157, "step": 186050 }, { "epoch": 0.48, "learning_rate": 0.0002276558461925289, "loss": 0.0181, "step": 186060 }, { "epoch": 0.48, "learning_rate": 0.00022765195797615743, "loss": 0.0179, "step": 186070 }, { "epoch": 0.48, "learning_rate": 0.00022764806975978595, "loss": 0.0172, "step": 186080 }, { "epoch": 0.48, "learning_rate": 0.00022764418154341452, "loss": 0.0225, "step": 186090 }, { "epoch": 0.48, "learning_rate": 0.00022764029332704306, "loss": 0.0223, "step": 186100 }, { "epoch": 0.48, "learning_rate": 0.00022763640511067157, "loss": 0.0181, "step": 186110 }, { "epoch": 0.48, "learning_rate": 0.00022763251689430009, "loss": 0.0131, "step": 186120 }, { "epoch": 0.48, "learning_rate": 0.00022762862867792865, "loss": 0.0188, "step": 186130 }, { "epoch": 0.48, "learning_rate": 0.0002276247404615572, "loss": 0.0203, "step": 186140 }, { "epoch": 0.48, "learning_rate": 0.0002276208522451857, "loss": 0.0185, "step": 186150 }, { "epoch": 0.48, "learning_rate": 0.00022761696402881425, "loss": 0.0139, "step": 186160 }, { "epoch": 0.48, "learning_rate": 0.0002276130758124428, "loss": 0.0175, "step": 186170 }, { "epoch": 0.48, "learning_rate": 0.00022760918759607134, "loss": 0.0156, "step": 186180 }, { "epoch": 0.48, "learning_rate": 0.00022760529937969985, "loss": 0.0221, "step": 186190 }, { "epoch": 0.48, "learning_rate": 0.0002276014111633284, "loss": 0.0163, "step": 186200 }, { "epoch": 0.48, "learning_rate": 0.00022759752294695693, "loss": 0.0141, "step": 186210 }, { "epoch": 0.48, "learning_rate": 0.00022759363473058548, "loss": 0.0197, "step": 186220 }, { "epoch": 0.48, "learning_rate": 0.000227589746514214, "loss": 0.0169, "step": 186230 }, { "epoch": 0.48, "learning_rate": 0.00022758585829784253, "loss": 0.0183, "step": 186240 }, { "epoch": 0.48, "learning_rate": 0.0002275819700814711, "loss": 0.0164, "step": 186250 }, { "epoch": 0.48, "learning_rate": 0.00022757808186509961, "loss": 0.0191, "step": 186260 }, { "epoch": 0.48, "learning_rate": 0.00022757419364872813, "loss": 0.016, "step": 186270 }, { "epoch": 0.48, "learning_rate": 0.00022757030543235667, "loss": 0.0161, "step": 186280 }, { "epoch": 0.48, "learning_rate": 0.00022756641721598524, "loss": 0.0179, "step": 186290 }, { "epoch": 0.48, "learning_rate": 0.00022756252899961375, "loss": 0.0165, "step": 186300 }, { "epoch": 0.48, "learning_rate": 0.0002275586407832423, "loss": 0.0166, "step": 186310 }, { "epoch": 0.48, "learning_rate": 0.0002275547525668708, "loss": 0.0172, "step": 186320 }, { "epoch": 0.48, "learning_rate": 0.00022755086435049935, "loss": 0.018, "step": 186330 }, { "epoch": 0.48, "learning_rate": 0.0002275469761341279, "loss": 0.0174, "step": 186340 }, { "epoch": 0.48, "learning_rate": 0.00022754308791775644, "loss": 0.0177, "step": 186350 }, { "epoch": 0.48, "learning_rate": 0.00022753919970138495, "loss": 0.0165, "step": 186360 }, { "epoch": 0.48, "learning_rate": 0.0002275353114850135, "loss": 0.0153, "step": 186370 }, { "epoch": 0.48, "learning_rate": 0.00022753142326864203, "loss": 0.0159, "step": 186380 }, { "epoch": 0.48, "learning_rate": 0.00022752753505227057, "loss": 0.0221, "step": 186390 }, { "epoch": 0.48, "learning_rate": 0.0002275236468358991, "loss": 0.019, "step": 186400 }, { "epoch": 0.48, "learning_rate": 0.00022751975861952763, "loss": 0.0155, "step": 186410 }, { "epoch": 0.48, "learning_rate": 0.0002275158704031562, "loss": 0.0136, "step": 186420 }, { "epoch": 0.48, "learning_rate": 0.00022751198218678471, "loss": 0.0206, "step": 186430 }, { "epoch": 0.48, "learning_rate": 0.00022750809397041323, "loss": 0.0208, "step": 186440 }, { "epoch": 0.48, "learning_rate": 0.00022750420575404177, "loss": 0.0189, "step": 186450 }, { "epoch": 0.48, "learning_rate": 0.00022750031753767034, "loss": 0.0209, "step": 186460 }, { "epoch": 0.48, "learning_rate": 0.00022749642932129885, "loss": 0.0167, "step": 186470 }, { "epoch": 0.48, "learning_rate": 0.0002274925411049274, "loss": 0.0181, "step": 186480 }, { "epoch": 0.48, "learning_rate": 0.0002274886528885559, "loss": 0.0177, "step": 186490 }, { "epoch": 0.48, "learning_rate": 0.00022748476467218448, "loss": 0.0198, "step": 186500 }, { "epoch": 0.48, "learning_rate": 0.000227480876455813, "loss": 0.0165, "step": 186510 }, { "epoch": 0.48, "learning_rate": 0.00022747698823944153, "loss": 0.0137, "step": 186520 }, { "epoch": 0.48, "learning_rate": 0.00022747310002307005, "loss": 0.015, "step": 186530 }, { "epoch": 0.48, "learning_rate": 0.00022746921180669862, "loss": 0.0191, "step": 186540 }, { "epoch": 0.48, "learning_rate": 0.00022746532359032713, "loss": 0.0202, "step": 186550 }, { "epoch": 0.48, "learning_rate": 0.00022746143537395567, "loss": 0.0176, "step": 186560 }, { "epoch": 0.48, "learning_rate": 0.0002274575471575842, "loss": 0.0184, "step": 186570 }, { "epoch": 0.48, "learning_rate": 0.00022745365894121273, "loss": 0.0186, "step": 186580 }, { "epoch": 0.48, "learning_rate": 0.00022744977072484127, "loss": 0.0178, "step": 186590 }, { "epoch": 0.48, "learning_rate": 0.00022744588250846981, "loss": 0.0192, "step": 186600 }, { "epoch": 0.48, "learning_rate": 0.00022744199429209833, "loss": 0.0164, "step": 186610 }, { "epoch": 0.48, "learning_rate": 0.00022743810607572687, "loss": 0.0174, "step": 186620 }, { "epoch": 0.48, "learning_rate": 0.00022743421785935544, "loss": 0.0204, "step": 186630 }, { "epoch": 0.48, "learning_rate": 0.00022743032964298395, "loss": 0.0152, "step": 186640 }, { "epoch": 0.48, "learning_rate": 0.0002274264414266125, "loss": 0.0194, "step": 186650 }, { "epoch": 0.48, "learning_rate": 0.000227422553210241, "loss": 0.0277, "step": 186660 }, { "epoch": 0.48, "learning_rate": 0.00022741866499386958, "loss": 0.0201, "step": 186670 }, { "epoch": 0.48, "learning_rate": 0.0002274147767774981, "loss": 0.0146, "step": 186680 }, { "epoch": 0.48, "learning_rate": 0.00022741088856112663, "loss": 0.018, "step": 186690 }, { "epoch": 0.48, "learning_rate": 0.00022740700034475515, "loss": 0.0154, "step": 186700 }, { "epoch": 0.48, "learning_rate": 0.00022740311212838372, "loss": 0.0199, "step": 186710 }, { "epoch": 0.48, "learning_rate": 0.00022739922391201223, "loss": 0.019, "step": 186720 }, { "epoch": 0.48, "learning_rate": 0.00022739533569564077, "loss": 0.0158, "step": 186730 }, { "epoch": 0.48, "learning_rate": 0.0002273914474792693, "loss": 0.0203, "step": 186740 }, { "epoch": 0.48, "learning_rate": 0.00022738755926289786, "loss": 0.02, "step": 186750 }, { "epoch": 0.48, "learning_rate": 0.00022738367104652637, "loss": 0.0169, "step": 186760 }, { "epoch": 0.48, "learning_rate": 0.0002273797828301549, "loss": 0.0239, "step": 186770 }, { "epoch": 0.48, "learning_rate": 0.00022737589461378343, "loss": 0.0175, "step": 186780 }, { "epoch": 0.48, "learning_rate": 0.000227372006397412, "loss": 0.0174, "step": 186790 }, { "epoch": 0.48, "learning_rate": 0.00022736811818104054, "loss": 0.0169, "step": 186800 }, { "epoch": 0.48, "learning_rate": 0.00022736422996466905, "loss": 0.0185, "step": 186810 }, { "epoch": 0.48, "learning_rate": 0.0002273603417482976, "loss": 0.0154, "step": 186820 }, { "epoch": 0.48, "learning_rate": 0.0002273564535319261, "loss": 0.0193, "step": 186830 }, { "epoch": 0.48, "learning_rate": 0.00022735256531555468, "loss": 0.0279, "step": 186840 }, { "epoch": 0.48, "learning_rate": 0.0002273486770991832, "loss": 0.0169, "step": 186850 }, { "epoch": 0.48, "learning_rate": 0.00022734478888281173, "loss": 0.0222, "step": 186860 }, { "epoch": 0.48, "learning_rate": 0.00022734090066644025, "loss": 0.0135, "step": 186870 }, { "epoch": 0.48, "learning_rate": 0.00022733701245006882, "loss": 0.0186, "step": 186880 }, { "epoch": 0.48, "learning_rate": 0.00022733312423369733, "loss": 0.016, "step": 186890 }, { "epoch": 0.48, "learning_rate": 0.00022732923601732587, "loss": 0.0248, "step": 186900 }, { "epoch": 0.48, "learning_rate": 0.0002273253478009544, "loss": 0.0158, "step": 186910 }, { "epoch": 0.48, "learning_rate": 0.00022732145958458296, "loss": 0.018, "step": 186920 }, { "epoch": 0.48, "learning_rate": 0.00022731757136821147, "loss": 0.0163, "step": 186930 }, { "epoch": 0.48, "learning_rate": 0.00022731368315184, "loss": 0.0312, "step": 186940 }, { "epoch": 0.48, "learning_rate": 0.00022730979493546853, "loss": 0.0182, "step": 186950 }, { "epoch": 0.48, "learning_rate": 0.0002273059067190971, "loss": 0.0152, "step": 186960 }, { "epoch": 0.48, "learning_rate": 0.00022730201850272564, "loss": 0.0179, "step": 186970 }, { "epoch": 0.48, "learning_rate": 0.00022729813028635415, "loss": 0.0194, "step": 186980 }, { "epoch": 0.48, "learning_rate": 0.00022729424206998267, "loss": 0.0162, "step": 186990 }, { "epoch": 0.48, "learning_rate": 0.00022729035385361124, "loss": 0.0229, "step": 187000 }, { "epoch": 0.48, "eval_cer": 0.8818174565517705, "eval_loss": 0.01267703715711832, "eval_runtime": 107.8484, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 187000 }, { "epoch": 0.48, "learning_rate": 0.00022728646563723978, "loss": 0.0177, "step": 187010 }, { "epoch": 0.48, "learning_rate": 0.0002272825774208683, "loss": 0.0146, "step": 187020 }, { "epoch": 0.48, "learning_rate": 0.00022727868920449683, "loss": 0.0159, "step": 187030 }, { "epoch": 0.48, "learning_rate": 0.00022727480098812537, "loss": 0.0196, "step": 187040 }, { "epoch": 0.48, "learning_rate": 0.00022727091277175392, "loss": 0.0188, "step": 187050 }, { "epoch": 0.48, "learning_rate": 0.00022726702455538243, "loss": 0.0213, "step": 187060 }, { "epoch": 0.48, "learning_rate": 0.00022726313633901097, "loss": 0.02, "step": 187070 }, { "epoch": 0.48, "learning_rate": 0.0002272592481226395, "loss": 0.0169, "step": 187080 }, { "epoch": 0.48, "learning_rate": 0.00022725535990626806, "loss": 0.018, "step": 187090 }, { "epoch": 0.48, "learning_rate": 0.00022725147168989657, "loss": 0.016, "step": 187100 }, { "epoch": 0.49, "learning_rate": 0.0002272475834735251, "loss": 0.0275, "step": 187110 }, { "epoch": 0.49, "learning_rate": 0.00022724369525715363, "loss": 0.0154, "step": 187120 }, { "epoch": 0.49, "learning_rate": 0.0002272398070407822, "loss": 0.0194, "step": 187130 }, { "epoch": 0.49, "learning_rate": 0.0002272359188244107, "loss": 0.0182, "step": 187140 }, { "epoch": 0.49, "learning_rate": 0.00022723203060803925, "loss": 0.0164, "step": 187150 }, { "epoch": 0.49, "learning_rate": 0.00022722814239166777, "loss": 0.016, "step": 187160 }, { "epoch": 0.49, "learning_rate": 0.00022722425417529633, "loss": 0.019, "step": 187170 }, { "epoch": 0.49, "learning_rate": 0.00022722036595892488, "loss": 0.0182, "step": 187180 }, { "epoch": 0.49, "learning_rate": 0.0002272164777425534, "loss": 0.0171, "step": 187190 }, { "epoch": 0.49, "learning_rate": 0.00022721258952618193, "loss": 0.0215, "step": 187200 }, { "epoch": 0.49, "learning_rate": 0.00022720870130981047, "loss": 0.0157, "step": 187210 }, { "epoch": 0.49, "learning_rate": 0.00022720481309343902, "loss": 0.0202, "step": 187220 }, { "epoch": 0.49, "learning_rate": 0.00022720092487706753, "loss": 0.0175, "step": 187230 }, { "epoch": 0.49, "learning_rate": 0.00022719703666069607, "loss": 0.0197, "step": 187240 }, { "epoch": 0.49, "learning_rate": 0.0002271931484443246, "loss": 0.0178, "step": 187250 }, { "epoch": 0.49, "learning_rate": 0.00022718926022795316, "loss": 0.0194, "step": 187260 }, { "epoch": 0.49, "learning_rate": 0.00022718537201158167, "loss": 0.0149, "step": 187270 }, { "epoch": 0.49, "learning_rate": 0.0002271814837952102, "loss": 0.0188, "step": 187280 }, { "epoch": 0.49, "learning_rate": 0.00022717759557883878, "loss": 0.0171, "step": 187290 }, { "epoch": 0.49, "learning_rate": 0.0002271737073624673, "loss": 0.019, "step": 187300 }, { "epoch": 0.49, "learning_rate": 0.0002271698191460958, "loss": 0.0211, "step": 187310 }, { "epoch": 0.49, "learning_rate": 0.00022716593092972435, "loss": 0.0176, "step": 187320 }, { "epoch": 0.49, "learning_rate": 0.00022716204271335287, "loss": 0.0164, "step": 187330 }, { "epoch": 0.49, "learning_rate": 0.00022715815449698143, "loss": 0.0157, "step": 187340 }, { "epoch": 0.49, "learning_rate": 0.00022715426628060998, "loss": 0.0192, "step": 187350 }, { "epoch": 0.49, "learning_rate": 0.0002271503780642385, "loss": 0.0148, "step": 187360 }, { "epoch": 0.49, "learning_rate": 0.00022714648984786703, "loss": 0.0164, "step": 187370 }, { "epoch": 0.49, "learning_rate": 0.00022714260163149557, "loss": 0.0143, "step": 187380 }, { "epoch": 0.49, "learning_rate": 0.00022713871341512412, "loss": 0.02, "step": 187390 }, { "epoch": 0.49, "learning_rate": 0.00022713482519875263, "loss": 0.0196, "step": 187400 }, { "epoch": 0.49, "learning_rate": 0.00022713093698238117, "loss": 0.0164, "step": 187410 }, { "epoch": 0.49, "learning_rate": 0.0002271270487660097, "loss": 0.0192, "step": 187420 }, { "epoch": 0.49, "learning_rate": 0.00022712316054963825, "loss": 0.0182, "step": 187430 }, { "epoch": 0.49, "learning_rate": 0.00022711927233326677, "loss": 0.0192, "step": 187440 }, { "epoch": 0.49, "learning_rate": 0.0002271153841168953, "loss": 0.0182, "step": 187450 }, { "epoch": 0.49, "learning_rate": 0.00022711149590052385, "loss": 0.0141, "step": 187460 }, { "epoch": 0.49, "learning_rate": 0.0002271076076841524, "loss": 0.0245, "step": 187470 }, { "epoch": 0.49, "learning_rate": 0.0002271037194677809, "loss": 0.0191, "step": 187480 }, { "epoch": 0.49, "learning_rate": 0.00022709983125140945, "loss": 0.0182, "step": 187490 }, { "epoch": 0.49, "learning_rate": 0.00022709594303503802, "loss": 0.0175, "step": 187500 }, { "epoch": 0.49, "learning_rate": 0.00022709205481866653, "loss": 0.0189, "step": 187510 }, { "epoch": 0.49, "learning_rate": 0.00022708816660229508, "loss": 0.0139, "step": 187520 }, { "epoch": 0.49, "learning_rate": 0.0002270842783859236, "loss": 0.0211, "step": 187530 }, { "epoch": 0.49, "learning_rate": 0.00022708039016955216, "loss": 0.0238, "step": 187540 }, { "epoch": 0.49, "learning_rate": 0.00022707650195318067, "loss": 0.0162, "step": 187550 }, { "epoch": 0.49, "learning_rate": 0.00022707261373680921, "loss": 0.0181, "step": 187560 }, { "epoch": 0.49, "learning_rate": 0.00022706872552043773, "loss": 0.0171, "step": 187570 }, { "epoch": 0.49, "learning_rate": 0.00022706483730406627, "loss": 0.0198, "step": 187580 }, { "epoch": 0.49, "learning_rate": 0.0002270609490876948, "loss": 0.0191, "step": 187590 }, { "epoch": 0.49, "learning_rate": 0.00022705706087132335, "loss": 0.0167, "step": 187600 }, { "epoch": 0.49, "learning_rate": 0.00022705317265495187, "loss": 0.0183, "step": 187610 }, { "epoch": 0.49, "learning_rate": 0.0002270492844385804, "loss": 0.0157, "step": 187620 }, { "epoch": 0.49, "learning_rate": 0.00022704539622220895, "loss": 0.0163, "step": 187630 }, { "epoch": 0.49, "learning_rate": 0.0002270415080058375, "loss": 0.0151, "step": 187640 }, { "epoch": 0.49, "learning_rate": 0.000227037619789466, "loss": 0.0183, "step": 187650 }, { "epoch": 0.49, "learning_rate": 0.00022703373157309455, "loss": 0.0198, "step": 187660 }, { "epoch": 0.49, "learning_rate": 0.00022702984335672312, "loss": 0.0175, "step": 187670 }, { "epoch": 0.49, "learning_rate": 0.00022702595514035163, "loss": 0.0218, "step": 187680 }, { "epoch": 0.49, "learning_rate": 0.00022702206692398017, "loss": 0.0203, "step": 187690 }, { "epoch": 0.49, "learning_rate": 0.0002270181787076087, "loss": 0.0183, "step": 187700 }, { "epoch": 0.49, "learning_rate": 0.00022701429049123726, "loss": 0.0148, "step": 187710 }, { "epoch": 0.49, "learning_rate": 0.00022701040227486577, "loss": 0.018, "step": 187720 }, { "epoch": 0.49, "learning_rate": 0.00022700651405849431, "loss": 0.0174, "step": 187730 }, { "epoch": 0.49, "learning_rate": 0.00022700262584212283, "loss": 0.0189, "step": 187740 }, { "epoch": 0.49, "learning_rate": 0.0002269987376257514, "loss": 0.0142, "step": 187750 }, { "epoch": 0.49, "learning_rate": 0.0002269948494093799, "loss": 0.0244, "step": 187760 }, { "epoch": 0.49, "learning_rate": 0.00022699096119300845, "loss": 0.0181, "step": 187770 }, { "epoch": 0.49, "learning_rate": 0.00022698707297663697, "loss": 0.0186, "step": 187780 }, { "epoch": 0.49, "learning_rate": 0.00022698318476026554, "loss": 0.0164, "step": 187790 }, { "epoch": 0.49, "learning_rate": 0.00022697929654389405, "loss": 0.0214, "step": 187800 }, { "epoch": 0.49, "learning_rate": 0.0002269754083275226, "loss": 0.014, "step": 187810 }, { "epoch": 0.49, "learning_rate": 0.0002269715201111511, "loss": 0.0142, "step": 187820 }, { "epoch": 0.49, "learning_rate": 0.00022696763189477965, "loss": 0.0169, "step": 187830 }, { "epoch": 0.49, "learning_rate": 0.00022696374367840822, "loss": 0.0181, "step": 187840 }, { "epoch": 0.49, "learning_rate": 0.00022695985546203673, "loss": 0.0198, "step": 187850 }, { "epoch": 0.49, "learning_rate": 0.00022695596724566525, "loss": 0.0173, "step": 187860 }, { "epoch": 0.49, "learning_rate": 0.0002269520790292938, "loss": 0.0196, "step": 187870 }, { "epoch": 0.49, "learning_rate": 0.00022694819081292236, "loss": 0.0214, "step": 187880 }, { "epoch": 0.49, "learning_rate": 0.00022694430259655087, "loss": 0.0255, "step": 187890 }, { "epoch": 0.49, "learning_rate": 0.0002269404143801794, "loss": 0.0138, "step": 187900 }, { "epoch": 0.49, "learning_rate": 0.00022693652616380793, "loss": 0.0194, "step": 187910 }, { "epoch": 0.49, "learning_rate": 0.0002269326379474365, "loss": 0.0142, "step": 187920 }, { "epoch": 0.49, "learning_rate": 0.000226928749731065, "loss": 0.0195, "step": 187930 }, { "epoch": 0.49, "learning_rate": 0.00022692486151469355, "loss": 0.027, "step": 187940 }, { "epoch": 0.49, "learning_rate": 0.00022692097329832207, "loss": 0.0178, "step": 187950 }, { "epoch": 0.49, "learning_rate": 0.00022691708508195064, "loss": 0.0208, "step": 187960 }, { "epoch": 0.49, "learning_rate": 0.00022691319686557915, "loss": 0.021, "step": 187970 }, { "epoch": 0.49, "learning_rate": 0.0002269093086492077, "loss": 0.0188, "step": 187980 }, { "epoch": 0.49, "learning_rate": 0.0002269054204328362, "loss": 0.017, "step": 187990 }, { "epoch": 0.49, "learning_rate": 0.00022690153221646478, "loss": 0.0159, "step": 188000 }, { "epoch": 0.49, "eval_cer": 0.8818286536472439, "eval_loss": 0.012727465480566025, "eval_runtime": 108.1818, "eval_samples_per_second": 18.487, "eval_steps_per_second": 4.622, "step": 188000 }, { "epoch": 0.49, "learning_rate": 0.00022689764400009332, "loss": 0.0225, "step": 188010 }, { "epoch": 0.49, "learning_rate": 0.00022689375578372183, "loss": 0.021, "step": 188020 }, { "epoch": 0.49, "learning_rate": 0.00022688986756735035, "loss": 0.0155, "step": 188030 }, { "epoch": 0.49, "learning_rate": 0.00022688597935097891, "loss": 0.0185, "step": 188040 }, { "epoch": 0.49, "learning_rate": 0.00022688209113460746, "loss": 0.0184, "step": 188050 }, { "epoch": 0.49, "learning_rate": 0.00022687820291823597, "loss": 0.0232, "step": 188060 }, { "epoch": 0.49, "learning_rate": 0.0002268743147018645, "loss": 0.0157, "step": 188070 }, { "epoch": 0.49, "learning_rate": 0.00022687042648549303, "loss": 0.0272, "step": 188080 }, { "epoch": 0.49, "learning_rate": 0.0002268665382691216, "loss": 0.0194, "step": 188090 }, { "epoch": 0.49, "learning_rate": 0.0002268626500527501, "loss": 0.024, "step": 188100 }, { "epoch": 0.49, "learning_rate": 0.00022685876183637865, "loss": 0.0192, "step": 188110 }, { "epoch": 0.49, "learning_rate": 0.00022685487362000717, "loss": 0.0222, "step": 188120 }, { "epoch": 0.49, "learning_rate": 0.00022685098540363574, "loss": 0.0156, "step": 188130 }, { "epoch": 0.49, "learning_rate": 0.00022684709718726425, "loss": 0.0211, "step": 188140 }, { "epoch": 0.49, "learning_rate": 0.0002268432089708928, "loss": 0.0176, "step": 188150 }, { "epoch": 0.49, "learning_rate": 0.0002268393207545213, "loss": 0.0195, "step": 188160 }, { "epoch": 0.49, "learning_rate": 0.00022683543253814987, "loss": 0.0188, "step": 188170 }, { "epoch": 0.49, "learning_rate": 0.0002268315443217784, "loss": 0.0177, "step": 188180 }, { "epoch": 0.49, "learning_rate": 0.00022682765610540693, "loss": 0.0152, "step": 188190 }, { "epoch": 0.49, "learning_rate": 0.00022682376788903545, "loss": 0.0135, "step": 188200 }, { "epoch": 0.49, "learning_rate": 0.00022681987967266401, "loss": 0.0257, "step": 188210 }, { "epoch": 0.49, "learning_rate": 0.00022681599145629256, "loss": 0.0191, "step": 188220 }, { "epoch": 0.49, "learning_rate": 0.00022681210323992107, "loss": 0.0179, "step": 188230 }, { "epoch": 0.49, "learning_rate": 0.0002268082150235496, "loss": 0.0185, "step": 188240 }, { "epoch": 0.49, "learning_rate": 0.00022680432680717815, "loss": 0.0169, "step": 188250 }, { "epoch": 0.49, "learning_rate": 0.0002268004385908067, "loss": 0.0173, "step": 188260 }, { "epoch": 0.49, "learning_rate": 0.0002267965503744352, "loss": 0.0178, "step": 188270 }, { "epoch": 0.49, "learning_rate": 0.00022679266215806375, "loss": 0.021, "step": 188280 }, { "epoch": 0.49, "learning_rate": 0.0002267887739416923, "loss": 0.0199, "step": 188290 }, { "epoch": 0.49, "learning_rate": 0.00022678488572532083, "loss": 0.0155, "step": 188300 }, { "epoch": 0.49, "learning_rate": 0.00022678099750894935, "loss": 0.0155, "step": 188310 }, { "epoch": 0.49, "learning_rate": 0.0002267771092925779, "loss": 0.0162, "step": 188320 }, { "epoch": 0.49, "learning_rate": 0.0002267732210762064, "loss": 0.0186, "step": 188330 }, { "epoch": 0.49, "learning_rate": 0.00022676933285983497, "loss": 0.0181, "step": 188340 }, { "epoch": 0.49, "learning_rate": 0.0002267654446434635, "loss": 0.0178, "step": 188350 }, { "epoch": 0.49, "learning_rate": 0.00022676155642709203, "loss": 0.0199, "step": 188360 }, { "epoch": 0.49, "learning_rate": 0.00022675766821072055, "loss": 0.0148, "step": 188370 }, { "epoch": 0.49, "learning_rate": 0.00022675377999434911, "loss": 0.0195, "step": 188380 }, { "epoch": 0.49, "learning_rate": 0.00022674989177797766, "loss": 0.0161, "step": 188390 }, { "epoch": 0.49, "learning_rate": 0.00022674600356160617, "loss": 0.0153, "step": 188400 }, { "epoch": 0.49, "learning_rate": 0.0002267421153452347, "loss": 0.0189, "step": 188410 }, { "epoch": 0.49, "learning_rate": 0.00022673822712886325, "loss": 0.024, "step": 188420 }, { "epoch": 0.49, "learning_rate": 0.0002267343389124918, "loss": 0.0157, "step": 188430 }, { "epoch": 0.49, "learning_rate": 0.0002267304506961203, "loss": 0.0217, "step": 188440 }, { "epoch": 0.49, "learning_rate": 0.00022672656247974885, "loss": 0.0173, "step": 188450 }, { "epoch": 0.49, "learning_rate": 0.0002267226742633774, "loss": 0.0182, "step": 188460 }, { "epoch": 0.49, "learning_rate": 0.00022671878604700593, "loss": 0.0208, "step": 188470 }, { "epoch": 0.49, "learning_rate": 0.00022671489783063445, "loss": 0.0155, "step": 188480 }, { "epoch": 0.49, "learning_rate": 0.000226711009614263, "loss": 0.0214, "step": 188490 }, { "epoch": 0.49, "learning_rate": 0.00022670712139789153, "loss": 0.0165, "step": 188500 }, { "epoch": 0.49, "learning_rate": 0.00022670323318152007, "loss": 0.0148, "step": 188510 }, { "epoch": 0.49, "learning_rate": 0.0002266993449651486, "loss": 0.0177, "step": 188520 }, { "epoch": 0.49, "learning_rate": 0.00022669545674877713, "loss": 0.0231, "step": 188530 }, { "epoch": 0.49, "learning_rate": 0.0002266915685324057, "loss": 0.0152, "step": 188540 }, { "epoch": 0.49, "learning_rate": 0.0002266876803160342, "loss": 0.0154, "step": 188550 }, { "epoch": 0.49, "learning_rate": 0.00022668379209966275, "loss": 0.0202, "step": 188560 }, { "epoch": 0.49, "learning_rate": 0.00022667990388329127, "loss": 0.0223, "step": 188570 }, { "epoch": 0.49, "learning_rate": 0.00022667601566691978, "loss": 0.0194, "step": 188580 }, { "epoch": 0.49, "learning_rate": 0.00022667212745054835, "loss": 0.0176, "step": 188590 }, { "epoch": 0.49, "learning_rate": 0.0002266682392341769, "loss": 0.0196, "step": 188600 }, { "epoch": 0.49, "learning_rate": 0.0002266643510178054, "loss": 0.026, "step": 188610 }, { "epoch": 0.49, "learning_rate": 0.00022666046280143395, "loss": 0.0162, "step": 188620 }, { "epoch": 0.49, "learning_rate": 0.0002266565745850625, "loss": 0.0174, "step": 188630 }, { "epoch": 0.49, "learning_rate": 0.00022665268636869103, "loss": 0.0159, "step": 188640 }, { "epoch": 0.49, "learning_rate": 0.00022664879815231955, "loss": 0.0171, "step": 188650 }, { "epoch": 0.49, "learning_rate": 0.0002266449099359481, "loss": 0.0162, "step": 188660 }, { "epoch": 0.49, "learning_rate": 0.00022664102171957663, "loss": 0.0178, "step": 188670 }, { "epoch": 0.49, "learning_rate": 0.00022663713350320517, "loss": 0.0189, "step": 188680 }, { "epoch": 0.49, "learning_rate": 0.0002266332452868337, "loss": 0.0182, "step": 188690 }, { "epoch": 0.49, "learning_rate": 0.00022662935707046223, "loss": 0.0207, "step": 188700 }, { "epoch": 0.49, "learning_rate": 0.0002266254688540908, "loss": 0.02, "step": 188710 }, { "epoch": 0.49, "learning_rate": 0.0002266215806377193, "loss": 0.0136, "step": 188720 }, { "epoch": 0.49, "learning_rate": 0.00022661769242134783, "loss": 0.0174, "step": 188730 }, { "epoch": 0.49, "learning_rate": 0.00022661380420497637, "loss": 0.0237, "step": 188740 }, { "epoch": 0.49, "learning_rate": 0.00022660991598860494, "loss": 0.0172, "step": 188750 }, { "epoch": 0.49, "learning_rate": 0.00022660602777223345, "loss": 0.0236, "step": 188760 }, { "epoch": 0.49, "learning_rate": 0.000226602139555862, "loss": 0.0171, "step": 188770 }, { "epoch": 0.49, "learning_rate": 0.0002265982513394905, "loss": 0.0186, "step": 188780 }, { "epoch": 0.49, "learning_rate": 0.00022659436312311908, "loss": 0.0206, "step": 188790 }, { "epoch": 0.49, "learning_rate": 0.0002265904749067476, "loss": 0.0192, "step": 188800 }, { "epoch": 0.49, "learning_rate": 0.00022658658669037613, "loss": 0.0163, "step": 188810 }, { "epoch": 0.49, "learning_rate": 0.00022658269847400465, "loss": 0.0201, "step": 188820 }, { "epoch": 0.49, "learning_rate": 0.0002265788102576332, "loss": 0.0179, "step": 188830 }, { "epoch": 0.49, "learning_rate": 0.00022657492204126173, "loss": 0.0171, "step": 188840 }, { "epoch": 0.49, "learning_rate": 0.00022657103382489027, "loss": 0.0156, "step": 188850 }, { "epoch": 0.49, "learning_rate": 0.0002265671456085188, "loss": 0.017, "step": 188860 }, { "epoch": 0.49, "learning_rate": 0.00022656325739214733, "loss": 0.0167, "step": 188870 }, { "epoch": 0.49, "learning_rate": 0.0002265593691757759, "loss": 0.0197, "step": 188880 }, { "epoch": 0.49, "learning_rate": 0.0002265554809594044, "loss": 0.0194, "step": 188890 }, { "epoch": 0.49, "learning_rate": 0.00022655159274303293, "loss": 0.0192, "step": 188900 }, { "epoch": 0.49, "learning_rate": 0.00022654770452666147, "loss": 0.018, "step": 188910 }, { "epoch": 0.49, "learning_rate": 0.00022654381631029004, "loss": 0.0182, "step": 188920 }, { "epoch": 0.49, "learning_rate": 0.00022653992809391855, "loss": 0.0242, "step": 188930 }, { "epoch": 0.49, "learning_rate": 0.0002265360398775471, "loss": 0.0183, "step": 188940 }, { "epoch": 0.49, "learning_rate": 0.0002265321516611756, "loss": 0.0257, "step": 188950 }, { "epoch": 0.49, "learning_rate": 0.00022652826344480418, "loss": 0.0172, "step": 188960 }, { "epoch": 0.49, "learning_rate": 0.0002265243752284327, "loss": 0.0141, "step": 188970 }, { "epoch": 0.49, "learning_rate": 0.00022652048701206123, "loss": 0.0169, "step": 188980 }, { "epoch": 0.49, "learning_rate": 0.00022651659879568975, "loss": 0.0193, "step": 188990 }, { "epoch": 0.49, "learning_rate": 0.00022651271057931832, "loss": 0.0195, "step": 189000 }, { "epoch": 0.49, "eval_cer": 0.8818104583670996, "eval_loss": 0.012447088025510311, "eval_runtime": 108.0069, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 189000 }, { "epoch": 0.49, "learning_rate": 0.00022650882236294683, "loss": 0.0172, "step": 189010 }, { "epoch": 0.49, "learning_rate": 0.00022650493414657537, "loss": 0.0156, "step": 189020 }, { "epoch": 0.49, "learning_rate": 0.0002265010459302039, "loss": 0.0192, "step": 189030 }, { "epoch": 0.49, "learning_rate": 0.00022649715771383246, "loss": 0.0197, "step": 189040 }, { "epoch": 0.49, "learning_rate": 0.00022649326949746097, "loss": 0.0157, "step": 189050 }, { "epoch": 0.49, "learning_rate": 0.0002264893812810895, "loss": 0.0168, "step": 189060 }, { "epoch": 0.49, "learning_rate": 0.00022648549306471803, "loss": 0.0237, "step": 189070 }, { "epoch": 0.49, "learning_rate": 0.00022648160484834657, "loss": 0.0191, "step": 189080 }, { "epoch": 0.49, "learning_rate": 0.00022647771663197514, "loss": 0.0166, "step": 189090 }, { "epoch": 0.49, "learning_rate": 0.00022647382841560365, "loss": 0.0166, "step": 189100 }, { "epoch": 0.49, "learning_rate": 0.0002264699401992322, "loss": 0.0231, "step": 189110 }, { "epoch": 0.49, "learning_rate": 0.0002264660519828607, "loss": 0.0157, "step": 189120 }, { "epoch": 0.49, "learning_rate": 0.00022646216376648928, "loss": 0.0156, "step": 189130 }, { "epoch": 0.49, "learning_rate": 0.0002264582755501178, "loss": 0.0182, "step": 189140 }, { "epoch": 0.49, "learning_rate": 0.00022645438733374633, "loss": 0.0185, "step": 189150 }, { "epoch": 0.49, "learning_rate": 0.00022645049911737485, "loss": 0.018, "step": 189160 }, { "epoch": 0.49, "learning_rate": 0.00022644661090100342, "loss": 0.0176, "step": 189170 }, { "epoch": 0.49, "learning_rate": 0.00022644272268463193, "loss": 0.0159, "step": 189180 }, { "epoch": 0.49, "learning_rate": 0.00022643883446826047, "loss": 0.0163, "step": 189190 }, { "epoch": 0.49, "learning_rate": 0.00022643494625188899, "loss": 0.0168, "step": 189200 }, { "epoch": 0.49, "learning_rate": 0.00022643105803551755, "loss": 0.0176, "step": 189210 }, { "epoch": 0.49, "learning_rate": 0.00022642716981914607, "loss": 0.0258, "step": 189220 }, { "epoch": 0.49, "learning_rate": 0.0002264232816027746, "loss": 0.0156, "step": 189230 }, { "epoch": 0.49, "learning_rate": 0.00022641939338640313, "loss": 0.0214, "step": 189240 }, { "epoch": 0.49, "learning_rate": 0.0002264155051700317, "loss": 0.0164, "step": 189250 }, { "epoch": 0.49, "learning_rate": 0.00022641161695366024, "loss": 0.0171, "step": 189260 }, { "epoch": 0.49, "learning_rate": 0.00022640772873728875, "loss": 0.0173, "step": 189270 }, { "epoch": 0.49, "learning_rate": 0.0002264038405209173, "loss": 0.0181, "step": 189280 }, { "epoch": 0.49, "learning_rate": 0.00022639995230454583, "loss": 0.016, "step": 189290 }, { "epoch": 0.49, "learning_rate": 0.00022639606408817438, "loss": 0.0222, "step": 189300 }, { "epoch": 0.49, "learning_rate": 0.0002263921758718029, "loss": 0.0154, "step": 189310 }, { "epoch": 0.49, "learning_rate": 0.00022638828765543143, "loss": 0.0194, "step": 189320 }, { "epoch": 0.49, "learning_rate": 0.00022638439943905995, "loss": 0.0337, "step": 189330 }, { "epoch": 0.49, "learning_rate": 0.00022638051122268851, "loss": 0.0191, "step": 189340 }, { "epoch": 0.49, "learning_rate": 0.00022637662300631703, "loss": 0.0146, "step": 189350 }, { "epoch": 0.49, "learning_rate": 0.00022637273478994557, "loss": 0.0184, "step": 189360 }, { "epoch": 0.49, "learning_rate": 0.00022636884657357409, "loss": 0.0175, "step": 189370 }, { "epoch": 0.49, "learning_rate": 0.00022636495835720265, "loss": 0.0163, "step": 189380 }, { "epoch": 0.49, "learning_rate": 0.00022636107014083117, "loss": 0.017, "step": 189390 }, { "epoch": 0.49, "learning_rate": 0.0002263571819244597, "loss": 0.014, "step": 189400 }, { "epoch": 0.49, "learning_rate": 0.00022635329370808822, "loss": 0.0201, "step": 189410 }, { "epoch": 0.49, "learning_rate": 0.0002263494054917168, "loss": 0.0186, "step": 189420 }, { "epoch": 0.49, "learning_rate": 0.00022634551727534534, "loss": 0.0183, "step": 189430 }, { "epoch": 0.49, "learning_rate": 0.00022634162905897385, "loss": 0.0222, "step": 189440 }, { "epoch": 0.49, "learning_rate": 0.00022633774084260236, "loss": 0.0156, "step": 189450 }, { "epoch": 0.49, "learning_rate": 0.00022633385262623093, "loss": 0.0155, "step": 189460 }, { "epoch": 0.49, "learning_rate": 0.00022632996440985947, "loss": 0.0159, "step": 189470 }, { "epoch": 0.49, "learning_rate": 0.000226326076193488, "loss": 0.0202, "step": 189480 }, { "epoch": 0.49, "learning_rate": 0.00022632218797711653, "loss": 0.0144, "step": 189490 }, { "epoch": 0.49, "learning_rate": 0.00022631829976074507, "loss": 0.0163, "step": 189500 }, { "epoch": 0.49, "learning_rate": 0.00022631441154437361, "loss": 0.0174, "step": 189510 }, { "epoch": 0.49, "learning_rate": 0.00022631052332800213, "loss": 0.0182, "step": 189520 }, { "epoch": 0.49, "learning_rate": 0.00022630663511163067, "loss": 0.018, "step": 189530 }, { "epoch": 0.49, "learning_rate": 0.0002263027468952592, "loss": 0.0192, "step": 189540 }, { "epoch": 0.49, "learning_rate": 0.00022629885867888775, "loss": 0.019, "step": 189550 }, { "epoch": 0.49, "learning_rate": 0.00022629497046251627, "loss": 0.0145, "step": 189560 }, { "epoch": 0.49, "learning_rate": 0.0002262910822461448, "loss": 0.021, "step": 189570 }, { "epoch": 0.49, "learning_rate": 0.00022628719402977332, "loss": 0.0143, "step": 189580 }, { "epoch": 0.49, "learning_rate": 0.0002262833058134019, "loss": 0.0171, "step": 189590 }, { "epoch": 0.49, "learning_rate": 0.00022627941759703043, "loss": 0.0146, "step": 189600 }, { "epoch": 0.49, "learning_rate": 0.00022627552938065895, "loss": 0.0159, "step": 189610 }, { "epoch": 0.49, "learning_rate": 0.00022627164116428746, "loss": 0.0156, "step": 189620 }, { "epoch": 0.49, "learning_rate": 0.00022626775294791603, "loss": 0.0165, "step": 189630 }, { "epoch": 0.49, "learning_rate": 0.00022626386473154457, "loss": 0.0146, "step": 189640 }, { "epoch": 0.49, "learning_rate": 0.0002262599765151731, "loss": 0.0168, "step": 189650 }, { "epoch": 0.49, "learning_rate": 0.00022625608829880163, "loss": 0.0143, "step": 189660 }, { "epoch": 0.49, "learning_rate": 0.00022625220008243017, "loss": 0.0195, "step": 189670 }, { "epoch": 0.49, "learning_rate": 0.00022624831186605871, "loss": 0.0218, "step": 189680 }, { "epoch": 0.49, "learning_rate": 0.00022624442364968723, "loss": 0.0154, "step": 189690 }, { "epoch": 0.49, "learning_rate": 0.00022624053543331577, "loss": 0.0177, "step": 189700 }, { "epoch": 0.49, "learning_rate": 0.0002262366472169443, "loss": 0.0207, "step": 189710 }, { "epoch": 0.49, "learning_rate": 0.00022623275900057285, "loss": 0.0165, "step": 189720 }, { "epoch": 0.49, "learning_rate": 0.00022622887078420137, "loss": 0.0188, "step": 189730 }, { "epoch": 0.49, "learning_rate": 0.0002262249825678299, "loss": 0.0173, "step": 189740 }, { "epoch": 0.49, "learning_rate": 0.00022622109435145848, "loss": 0.0207, "step": 189750 }, { "epoch": 0.49, "learning_rate": 0.000226217206135087, "loss": 0.0183, "step": 189760 }, { "epoch": 0.49, "learning_rate": 0.0002262133179187155, "loss": 0.017, "step": 189770 }, { "epoch": 0.49, "learning_rate": 0.00022620942970234405, "loss": 0.0175, "step": 189780 }, { "epoch": 0.49, "learning_rate": 0.00022620554148597262, "loss": 0.0208, "step": 189790 }, { "epoch": 0.49, "learning_rate": 0.00022620165326960113, "loss": 0.0169, "step": 189800 }, { "epoch": 0.49, "learning_rate": 0.00022619776505322967, "loss": 0.0183, "step": 189810 }, { "epoch": 0.49, "learning_rate": 0.0002261938768368582, "loss": 0.0228, "step": 189820 }, { "epoch": 0.49, "learning_rate": 0.00022618998862048673, "loss": 0.0166, "step": 189830 }, { "epoch": 0.49, "learning_rate": 0.00022618610040411527, "loss": 0.0206, "step": 189840 }, { "epoch": 0.49, "learning_rate": 0.0002261822121877438, "loss": 0.0226, "step": 189850 }, { "epoch": 0.49, "learning_rate": 0.00022617832397137233, "loss": 0.018, "step": 189860 }, { "epoch": 0.49, "learning_rate": 0.00022617443575500087, "loss": 0.0158, "step": 189870 }, { "epoch": 0.49, "learning_rate": 0.0002261705475386294, "loss": 0.0188, "step": 189880 }, { "epoch": 0.49, "learning_rate": 0.00022616665932225795, "loss": 0.0179, "step": 189890 }, { "epoch": 0.49, "learning_rate": 0.00022616277110588647, "loss": 0.0162, "step": 189900 }, { "epoch": 0.49, "learning_rate": 0.000226158882889515, "loss": 0.0147, "step": 189910 }, { "epoch": 0.49, "learning_rate": 0.00022615499467314355, "loss": 0.0192, "step": 189920 }, { "epoch": 0.49, "learning_rate": 0.0002261511064567721, "loss": 0.0198, "step": 189930 }, { "epoch": 0.49, "learning_rate": 0.0002261472182404006, "loss": 0.0176, "step": 189940 }, { "epoch": 0.49, "learning_rate": 0.00022614333002402915, "loss": 0.0178, "step": 189950 }, { "epoch": 0.49, "learning_rate": 0.00022613944180765772, "loss": 0.0161, "step": 189960 }, { "epoch": 0.49, "learning_rate": 0.00022613555359128623, "loss": 0.0195, "step": 189970 }, { "epoch": 0.49, "learning_rate": 0.00022613166537491477, "loss": 0.0185, "step": 189980 }, { "epoch": 0.49, "learning_rate": 0.0002261277771585433, "loss": 0.0233, "step": 189990 }, { "epoch": 0.49, "learning_rate": 0.00022612388894217186, "loss": 0.0184, "step": 190000 }, { "epoch": 0.49, "eval_cer": 0.8817894638130869, "eval_loss": 0.01178650464862585, "eval_runtime": 107.62, "eval_samples_per_second": 18.584, "eval_steps_per_second": 4.646, "step": 190000 }, { "epoch": 0.49, "learning_rate": 0.00022612000072580037, "loss": 0.0157, "step": 190010 }, { "epoch": 0.49, "learning_rate": 0.0002261161125094289, "loss": 0.0139, "step": 190020 }, { "epoch": 0.49, "learning_rate": 0.00022611222429305743, "loss": 0.0165, "step": 190030 }, { "epoch": 0.49, "learning_rate": 0.000226108336076686, "loss": 0.0176, "step": 190040 }, { "epoch": 0.49, "learning_rate": 0.0002261044478603145, "loss": 0.0134, "step": 190050 }, { "epoch": 0.49, "learning_rate": 0.00022610055964394305, "loss": 0.0154, "step": 190060 }, { "epoch": 0.49, "learning_rate": 0.00022609667142757157, "loss": 0.0162, "step": 190070 }, { "epoch": 0.49, "learning_rate": 0.0002260927832112001, "loss": 0.0177, "step": 190080 }, { "epoch": 0.49, "learning_rate": 0.00022608889499482865, "loss": 0.0165, "step": 190090 }, { "epoch": 0.49, "learning_rate": 0.0002260850067784572, "loss": 0.0159, "step": 190100 }, { "epoch": 0.49, "learning_rate": 0.0002260811185620857, "loss": 0.0164, "step": 190110 }, { "epoch": 0.49, "learning_rate": 0.00022607723034571425, "loss": 0.0188, "step": 190120 }, { "epoch": 0.49, "learning_rate": 0.00022607334212934282, "loss": 0.0153, "step": 190130 }, { "epoch": 0.49, "learning_rate": 0.00022606945391297133, "loss": 0.0182, "step": 190140 }, { "epoch": 0.49, "learning_rate": 0.00022606556569659987, "loss": 0.0145, "step": 190150 }, { "epoch": 0.49, "learning_rate": 0.0002260616774802284, "loss": 0.0173, "step": 190160 }, { "epoch": 0.49, "learning_rate": 0.00022605778926385696, "loss": 0.0145, "step": 190170 }, { "epoch": 0.49, "learning_rate": 0.00022605390104748547, "loss": 0.0188, "step": 190180 }, { "epoch": 0.49, "learning_rate": 0.000226050012831114, "loss": 0.0167, "step": 190190 }, { "epoch": 0.49, "learning_rate": 0.00022604612461474253, "loss": 0.0193, "step": 190200 }, { "epoch": 0.49, "learning_rate": 0.0002260422363983711, "loss": 0.0194, "step": 190210 }, { "epoch": 0.49, "learning_rate": 0.0002260383481819996, "loss": 0.0138, "step": 190220 }, { "epoch": 0.49, "learning_rate": 0.00022603445996562815, "loss": 0.0165, "step": 190230 }, { "epoch": 0.49, "learning_rate": 0.00022603057174925667, "loss": 0.0153, "step": 190240 }, { "epoch": 0.49, "learning_rate": 0.00022602668353288523, "loss": 0.0202, "step": 190250 }, { "epoch": 0.49, "learning_rate": 0.00022602279531651375, "loss": 0.0155, "step": 190260 }, { "epoch": 0.49, "learning_rate": 0.0002260189071001423, "loss": 0.0193, "step": 190270 }, { "epoch": 0.49, "learning_rate": 0.0002260150188837708, "loss": 0.0205, "step": 190280 }, { "epoch": 0.49, "learning_rate": 0.00022601113066739937, "loss": 0.0186, "step": 190290 }, { "epoch": 0.49, "learning_rate": 0.00022600724245102792, "loss": 0.0158, "step": 190300 }, { "epoch": 0.49, "learning_rate": 0.00022600335423465643, "loss": 0.0177, "step": 190310 }, { "epoch": 0.49, "learning_rate": 0.00022599946601828494, "loss": 0.0161, "step": 190320 }, { "epoch": 0.49, "learning_rate": 0.00022599557780191349, "loss": 0.0164, "step": 190330 }, { "epoch": 0.49, "learning_rate": 0.00022599168958554206, "loss": 0.0169, "step": 190340 }, { "epoch": 0.49, "learning_rate": 0.00022598780136917057, "loss": 0.0189, "step": 190350 }, { "epoch": 0.49, "learning_rate": 0.0002259839131527991, "loss": 0.0186, "step": 190360 }, { "epoch": 0.49, "learning_rate": 0.00022598002493642763, "loss": 0.0174, "step": 190370 }, { "epoch": 0.49, "learning_rate": 0.0002259761367200562, "loss": 0.0237, "step": 190380 }, { "epoch": 0.49, "learning_rate": 0.0002259722485036847, "loss": 0.0225, "step": 190390 }, { "epoch": 0.49, "learning_rate": 0.00022596836028731325, "loss": 0.0152, "step": 190400 }, { "epoch": 0.49, "learning_rate": 0.00022596447207094177, "loss": 0.0172, "step": 190410 }, { "epoch": 0.49, "learning_rate": 0.00022596058385457033, "loss": 0.0171, "step": 190420 }, { "epoch": 0.49, "learning_rate": 0.00022595669563819885, "loss": 0.0201, "step": 190430 }, { "epoch": 0.49, "learning_rate": 0.0002259528074218274, "loss": 0.014, "step": 190440 }, { "epoch": 0.49, "learning_rate": 0.0002259489192054559, "loss": 0.0207, "step": 190450 }, { "epoch": 0.49, "learning_rate": 0.00022594503098908447, "loss": 0.0164, "step": 190460 }, { "epoch": 0.49, "learning_rate": 0.00022594114277271302, "loss": 0.016, "step": 190470 }, { "epoch": 0.49, "learning_rate": 0.00022593725455634153, "loss": 0.0341, "step": 190480 }, { "epoch": 0.49, "learning_rate": 0.00022593336633997004, "loss": 0.0191, "step": 190490 }, { "epoch": 0.49, "learning_rate": 0.0002259294781235986, "loss": 0.016, "step": 190500 }, { "epoch": 0.49, "learning_rate": 0.00022592558990722715, "loss": 0.0212, "step": 190510 }, { "epoch": 0.49, "learning_rate": 0.00022592170169085567, "loss": 0.0186, "step": 190520 }, { "epoch": 0.49, "learning_rate": 0.0002259178134744842, "loss": 0.0185, "step": 190530 }, { "epoch": 0.49, "learning_rate": 0.00022591392525811275, "loss": 0.0189, "step": 190540 }, { "epoch": 0.49, "learning_rate": 0.0002259100370417413, "loss": 0.0157, "step": 190550 }, { "epoch": 0.49, "learning_rate": 0.0002259061488253698, "loss": 0.0184, "step": 190560 }, { "epoch": 0.49, "learning_rate": 0.00022590226060899835, "loss": 0.0184, "step": 190570 }, { "epoch": 0.49, "learning_rate": 0.00022589837239262686, "loss": 0.0189, "step": 190580 }, { "epoch": 0.49, "learning_rate": 0.00022589448417625543, "loss": 0.0184, "step": 190590 }, { "epoch": 0.49, "learning_rate": 0.00022589059595988395, "loss": 0.0173, "step": 190600 }, { "epoch": 0.49, "learning_rate": 0.0002258867077435125, "loss": 0.0189, "step": 190610 }, { "epoch": 0.49, "learning_rate": 0.000225882819527141, "loss": 0.0127, "step": 190620 }, { "epoch": 0.49, "learning_rate": 0.00022587893131076957, "loss": 0.016, "step": 190630 }, { "epoch": 0.49, "learning_rate": 0.0002258750430943981, "loss": 0.0175, "step": 190640 }, { "epoch": 0.49, "learning_rate": 0.00022587115487802663, "loss": 0.0163, "step": 190650 }, { "epoch": 0.49, "learning_rate": 0.00022586726666165514, "loss": 0.0155, "step": 190660 }, { "epoch": 0.49, "learning_rate": 0.0002258633784452837, "loss": 0.0214, "step": 190670 }, { "epoch": 0.49, "learning_rate": 0.00022585949022891225, "loss": 0.0182, "step": 190680 }, { "epoch": 0.49, "learning_rate": 0.00022585560201254077, "loss": 0.0211, "step": 190690 }, { "epoch": 0.49, "learning_rate": 0.0002258517137961693, "loss": 0.0142, "step": 190700 }, { "epoch": 0.49, "learning_rate": 0.00022584782557979785, "loss": 0.0182, "step": 190710 }, { "epoch": 0.49, "learning_rate": 0.0002258439373634264, "loss": 0.0195, "step": 190720 }, { "epoch": 0.49, "learning_rate": 0.0002258400491470549, "loss": 0.0182, "step": 190730 }, { "epoch": 0.49, "learning_rate": 0.00022583616093068345, "loss": 0.0171, "step": 190740 }, { "epoch": 0.49, "learning_rate": 0.000225832272714312, "loss": 0.0161, "step": 190750 }, { "epoch": 0.49, "learning_rate": 0.00022582838449794053, "loss": 0.0144, "step": 190760 }, { "epoch": 0.49, "learning_rate": 0.00022582449628156905, "loss": 0.0265, "step": 190770 }, { "epoch": 0.49, "learning_rate": 0.0002258206080651976, "loss": 0.0155, "step": 190780 }, { "epoch": 0.49, "learning_rate": 0.00022581671984882616, "loss": 0.0161, "step": 190790 }, { "epoch": 0.49, "learning_rate": 0.00022581283163245467, "loss": 0.0141, "step": 190800 }, { "epoch": 0.49, "learning_rate": 0.0002258089434160832, "loss": 0.0164, "step": 190810 }, { "epoch": 0.49, "learning_rate": 0.00022580505519971173, "loss": 0.0191, "step": 190820 }, { "epoch": 0.49, "learning_rate": 0.00022580116698334024, "loss": 0.0202, "step": 190830 }, { "epoch": 0.49, "learning_rate": 0.0002257972787669688, "loss": 0.0206, "step": 190840 }, { "epoch": 0.49, "learning_rate": 0.00022579339055059735, "loss": 0.0181, "step": 190850 }, { "epoch": 0.49, "learning_rate": 0.00022578950233422587, "loss": 0.0202, "step": 190860 }, { "epoch": 0.49, "learning_rate": 0.0002257856141178544, "loss": 0.0312, "step": 190870 }, { "epoch": 0.49, "learning_rate": 0.00022578172590148295, "loss": 0.0134, "step": 190880 }, { "epoch": 0.49, "learning_rate": 0.0002257778376851115, "loss": 0.0152, "step": 190890 }, { "epoch": 0.49, "learning_rate": 0.00022577394946874, "loss": 0.0157, "step": 190900 }, { "epoch": 0.49, "learning_rate": 0.00022577006125236855, "loss": 0.0152, "step": 190910 }, { "epoch": 0.49, "learning_rate": 0.0002257661730359971, "loss": 0.0197, "step": 190920 }, { "epoch": 0.49, "learning_rate": 0.00022576228481962563, "loss": 0.0199, "step": 190930 }, { "epoch": 0.49, "learning_rate": 0.00022575839660325415, "loss": 0.0204, "step": 190940 }, { "epoch": 0.49, "learning_rate": 0.0002257545083868827, "loss": 0.0242, "step": 190950 }, { "epoch": 0.49, "learning_rate": 0.00022575062017051123, "loss": 0.0165, "step": 190960 }, { "epoch": 0.5, "learning_rate": 0.00022574673195413977, "loss": 0.018, "step": 190970 }, { "epoch": 0.5, "learning_rate": 0.00022574284373776829, "loss": 0.0175, "step": 190980 }, { "epoch": 0.5, "learning_rate": 0.00022573895552139683, "loss": 0.0174, "step": 190990 }, { "epoch": 0.5, "learning_rate": 0.0002257350673050254, "loss": 0.0218, "step": 191000 }, { "epoch": 0.5, "eval_cer": 0.8817964619977577, "eval_loss": 0.01211930438876152, "eval_runtime": 107.8599, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 191000 }, { "epoch": 0.5, "learning_rate": 0.0002257311790886539, "loss": 0.0167, "step": 191010 }, { "epoch": 0.5, "learning_rate": 0.00022572729087228245, "loss": 0.0167, "step": 191020 }, { "epoch": 0.5, "learning_rate": 0.00022572340265591097, "loss": 0.0185, "step": 191030 }, { "epoch": 0.5, "learning_rate": 0.00022571951443953954, "loss": 0.0151, "step": 191040 }, { "epoch": 0.5, "learning_rate": 0.00022571562622316805, "loss": 0.0177, "step": 191050 }, { "epoch": 0.5, "learning_rate": 0.0002257117380067966, "loss": 0.0188, "step": 191060 }, { "epoch": 0.5, "learning_rate": 0.0002257078497904251, "loss": 0.0203, "step": 191070 }, { "epoch": 0.5, "learning_rate": 0.00022570396157405365, "loss": 0.0205, "step": 191080 }, { "epoch": 0.5, "learning_rate": 0.0002257000733576822, "loss": 0.0177, "step": 191090 }, { "epoch": 0.5, "learning_rate": 0.00022569618514131073, "loss": 0.0242, "step": 191100 }, { "epoch": 0.5, "learning_rate": 0.00022569229692493925, "loss": 0.0136, "step": 191110 }, { "epoch": 0.5, "learning_rate": 0.0002256884087085678, "loss": 0.021, "step": 191120 }, { "epoch": 0.5, "learning_rate": 0.00022568452049219633, "loss": 0.0241, "step": 191130 }, { "epoch": 0.5, "learning_rate": 0.00022568063227582487, "loss": 0.0181, "step": 191140 }, { "epoch": 0.5, "learning_rate": 0.00022567674405945339, "loss": 0.0193, "step": 191150 }, { "epoch": 0.5, "learning_rate": 0.00022567285584308193, "loss": 0.0201, "step": 191160 }, { "epoch": 0.5, "learning_rate": 0.0002256689676267105, "loss": 0.0184, "step": 191170 }, { "epoch": 0.5, "learning_rate": 0.000225665079410339, "loss": 0.0258, "step": 191180 }, { "epoch": 0.5, "learning_rate": 0.00022566119119396755, "loss": 0.0159, "step": 191190 }, { "epoch": 0.5, "learning_rate": 0.00022565730297759607, "loss": 0.0195, "step": 191200 }, { "epoch": 0.5, "learning_rate": 0.00022565341476122464, "loss": 0.0178, "step": 191210 }, { "epoch": 0.5, "learning_rate": 0.00022564952654485315, "loss": 0.0153, "step": 191220 }, { "epoch": 0.5, "learning_rate": 0.0002256456383284817, "loss": 0.0174, "step": 191230 }, { "epoch": 0.5, "learning_rate": 0.0002256417501121102, "loss": 0.017, "step": 191240 }, { "epoch": 0.5, "learning_rate": 0.00022563786189573877, "loss": 0.0241, "step": 191250 }, { "epoch": 0.5, "learning_rate": 0.0002256339736793673, "loss": 0.0183, "step": 191260 }, { "epoch": 0.5, "learning_rate": 0.00022563008546299583, "loss": 0.0211, "step": 191270 }, { "epoch": 0.5, "learning_rate": 0.00022562619724662435, "loss": 0.0192, "step": 191280 }, { "epoch": 0.5, "learning_rate": 0.00022562230903025291, "loss": 0.0183, "step": 191290 }, { "epoch": 0.5, "learning_rate": 0.00022561842081388143, "loss": 0.0176, "step": 191300 }, { "epoch": 0.5, "learning_rate": 0.00022561453259750997, "loss": 0.0182, "step": 191310 }, { "epoch": 0.5, "learning_rate": 0.00022561064438113849, "loss": 0.0128, "step": 191320 }, { "epoch": 0.5, "learning_rate": 0.00022560675616476703, "loss": 0.0117, "step": 191330 }, { "epoch": 0.5, "learning_rate": 0.0002256028679483956, "loss": 0.0254, "step": 191340 }, { "epoch": 0.5, "learning_rate": 0.0002255989797320241, "loss": 0.0169, "step": 191350 }, { "epoch": 0.5, "learning_rate": 0.00022559509151565262, "loss": 0.0166, "step": 191360 }, { "epoch": 0.5, "learning_rate": 0.00022559120329928117, "loss": 0.0185, "step": 191370 }, { "epoch": 0.5, "learning_rate": 0.00022558731508290973, "loss": 0.0175, "step": 191380 }, { "epoch": 0.5, "learning_rate": 0.00022558342686653825, "loss": 0.0156, "step": 191390 }, { "epoch": 0.5, "learning_rate": 0.0002255795386501668, "loss": 0.0189, "step": 191400 }, { "epoch": 0.5, "learning_rate": 0.0002255756504337953, "loss": 0.0242, "step": 191410 }, { "epoch": 0.5, "learning_rate": 0.00022557176221742387, "loss": 0.0176, "step": 191420 }, { "epoch": 0.5, "learning_rate": 0.0002255678740010524, "loss": 0.0204, "step": 191430 }, { "epoch": 0.5, "learning_rate": 0.00022556398578468093, "loss": 0.0232, "step": 191440 }, { "epoch": 0.5, "learning_rate": 0.00022556009756830945, "loss": 0.0199, "step": 191450 }, { "epoch": 0.5, "learning_rate": 0.00022555620935193801, "loss": 0.0179, "step": 191460 }, { "epoch": 0.5, "learning_rate": 0.00022555232113556653, "loss": 0.0216, "step": 191470 }, { "epoch": 0.5, "learning_rate": 0.00022554843291919507, "loss": 0.0176, "step": 191480 }, { "epoch": 0.5, "learning_rate": 0.00022554454470282358, "loss": 0.0185, "step": 191490 }, { "epoch": 0.5, "learning_rate": 0.00022554065648645215, "loss": 0.0219, "step": 191500 }, { "epoch": 0.5, "learning_rate": 0.00022553676827008067, "loss": 0.0168, "step": 191510 }, { "epoch": 0.5, "learning_rate": 0.0002255328800537092, "loss": 0.0185, "step": 191520 }, { "epoch": 0.5, "learning_rate": 0.00022552899183733772, "loss": 0.017, "step": 191530 }, { "epoch": 0.5, "learning_rate": 0.00022552510362096627, "loss": 0.0176, "step": 191540 }, { "epoch": 0.5, "learning_rate": 0.00022552121540459483, "loss": 0.017, "step": 191550 }, { "epoch": 0.5, "learning_rate": 0.00022551732718822335, "loss": 0.0169, "step": 191560 }, { "epoch": 0.5, "learning_rate": 0.0002255134389718519, "loss": 0.0159, "step": 191570 }, { "epoch": 0.5, "learning_rate": 0.0002255095507554804, "loss": 0.0202, "step": 191580 }, { "epoch": 0.5, "learning_rate": 0.00022550566253910897, "loss": 0.0173, "step": 191590 }, { "epoch": 0.5, "learning_rate": 0.0002255017743227375, "loss": 0.0221, "step": 191600 }, { "epoch": 0.5, "learning_rate": 0.00022549788610636603, "loss": 0.0164, "step": 191610 }, { "epoch": 0.5, "learning_rate": 0.00022549399788999454, "loss": 0.018, "step": 191620 }, { "epoch": 0.5, "learning_rate": 0.0002254901096736231, "loss": 0.0212, "step": 191630 }, { "epoch": 0.5, "learning_rate": 0.00022548622145725163, "loss": 0.0197, "step": 191640 }, { "epoch": 0.5, "learning_rate": 0.00022548233324088017, "loss": 0.0178, "step": 191650 }, { "epoch": 0.5, "learning_rate": 0.00022547844502450868, "loss": 0.0191, "step": 191660 }, { "epoch": 0.5, "learning_rate": 0.00022547455680813725, "loss": 0.0163, "step": 191670 }, { "epoch": 0.5, "learning_rate": 0.00022547066859176577, "loss": 0.019, "step": 191680 }, { "epoch": 0.5, "learning_rate": 0.0002254667803753943, "loss": 0.0166, "step": 191690 }, { "epoch": 0.5, "learning_rate": 0.00022546289215902282, "loss": 0.0165, "step": 191700 }, { "epoch": 0.5, "learning_rate": 0.0002254590039426514, "loss": 0.0153, "step": 191710 }, { "epoch": 0.5, "learning_rate": 0.00022545511572627993, "loss": 0.0172, "step": 191720 }, { "epoch": 0.5, "learning_rate": 0.00022545122750990845, "loss": 0.013, "step": 191730 }, { "epoch": 0.5, "learning_rate": 0.000225447339293537, "loss": 0.0136, "step": 191740 }, { "epoch": 0.5, "learning_rate": 0.00022544345107716553, "loss": 0.0124, "step": 191750 }, { "epoch": 0.5, "learning_rate": 0.00022543956286079407, "loss": 0.0182, "step": 191760 }, { "epoch": 0.5, "learning_rate": 0.0002254356746444226, "loss": 0.016, "step": 191770 }, { "epoch": 0.5, "learning_rate": 0.00022543178642805113, "loss": 0.0184, "step": 191780 }, { "epoch": 0.5, "learning_rate": 0.00022542789821167964, "loss": 0.0142, "step": 191790 }, { "epoch": 0.5, "learning_rate": 0.0002254240099953082, "loss": 0.0131, "step": 191800 }, { "epoch": 0.5, "learning_rate": 0.00022542012177893673, "loss": 0.0189, "step": 191810 }, { "epoch": 0.5, "learning_rate": 0.00022541623356256527, "loss": 0.0145, "step": 191820 }, { "epoch": 0.5, "learning_rate": 0.00022541234534619378, "loss": 0.0169, "step": 191830 }, { "epoch": 0.5, "learning_rate": 0.00022540845712982235, "loss": 0.0191, "step": 191840 }, { "epoch": 0.5, "learning_rate": 0.00022540456891345087, "loss": 0.0144, "step": 191850 }, { "epoch": 0.5, "learning_rate": 0.0002254006806970794, "loss": 0.0191, "step": 191860 }, { "epoch": 0.5, "learning_rate": 0.00022539679248070792, "loss": 0.0146, "step": 191870 }, { "epoch": 0.5, "learning_rate": 0.0002253929042643365, "loss": 0.0201, "step": 191880 }, { "epoch": 0.5, "learning_rate": 0.00022538901604796503, "loss": 0.0185, "step": 191890 }, { "epoch": 0.5, "learning_rate": 0.00022538512783159355, "loss": 0.0191, "step": 191900 }, { "epoch": 0.5, "learning_rate": 0.00022538123961522206, "loss": 0.0163, "step": 191910 }, { "epoch": 0.5, "learning_rate": 0.00022537735139885063, "loss": 0.0197, "step": 191920 }, { "epoch": 0.5, "learning_rate": 0.00022537346318247917, "loss": 0.0192, "step": 191930 }, { "epoch": 0.5, "learning_rate": 0.0002253695749661077, "loss": 0.0205, "step": 191940 }, { "epoch": 0.5, "learning_rate": 0.00022536568674973623, "loss": 0.0181, "step": 191950 }, { "epoch": 0.5, "learning_rate": 0.00022536179853336477, "loss": 0.0172, "step": 191960 }, { "epoch": 0.5, "learning_rate": 0.0002253579103169933, "loss": 0.0187, "step": 191970 }, { "epoch": 0.5, "learning_rate": 0.00022535402210062183, "loss": 0.022, "step": 191980 }, { "epoch": 0.5, "learning_rate": 0.00022535013388425037, "loss": 0.0179, "step": 191990 }, { "epoch": 0.5, "learning_rate": 0.0002253462456678789, "loss": 0.0161, "step": 192000 }, { "epoch": 0.5, "eval_cer": 0.8818188561887047, "eval_loss": 0.012052525766193867, "eval_runtime": 108.244, "eval_samples_per_second": 18.477, "eval_steps_per_second": 4.619, "step": 192000 }, { "epoch": 0.5, "learning_rate": 0.00022534235745150745, "loss": 0.0164, "step": 192010 }, { "epoch": 0.5, "learning_rate": 0.00022533846923513597, "loss": 0.0162, "step": 192020 }, { "epoch": 0.5, "learning_rate": 0.0002253345810187645, "loss": 0.0144, "step": 192030 }, { "epoch": 0.5, "learning_rate": 0.00022533069280239302, "loss": 0.0217, "step": 192040 }, { "epoch": 0.5, "learning_rate": 0.0002253268045860216, "loss": 0.0189, "step": 192050 }, { "epoch": 0.5, "learning_rate": 0.00022532291636965013, "loss": 0.0167, "step": 192060 }, { "epoch": 0.5, "learning_rate": 0.00022531902815327865, "loss": 0.0193, "step": 192070 }, { "epoch": 0.5, "learning_rate": 0.00022531513993690716, "loss": 0.0212, "step": 192080 }, { "epoch": 0.5, "learning_rate": 0.00022531125172053573, "loss": 0.0168, "step": 192090 }, { "epoch": 0.5, "learning_rate": 0.00022530736350416427, "loss": 0.0196, "step": 192100 }, { "epoch": 0.5, "learning_rate": 0.0002253034752877928, "loss": 0.018, "step": 192110 }, { "epoch": 0.5, "learning_rate": 0.00022529958707142133, "loss": 0.0241, "step": 192120 }, { "epoch": 0.5, "learning_rate": 0.00022529569885504987, "loss": 0.0176, "step": 192130 }, { "epoch": 0.5, "learning_rate": 0.0002252918106386784, "loss": 0.0175, "step": 192140 }, { "epoch": 0.5, "learning_rate": 0.00022528792242230693, "loss": 0.019, "step": 192150 }, { "epoch": 0.5, "learning_rate": 0.00022528403420593547, "loss": 0.0202, "step": 192160 }, { "epoch": 0.5, "learning_rate": 0.000225280145989564, "loss": 0.018, "step": 192170 }, { "epoch": 0.5, "learning_rate": 0.00022527625777319255, "loss": 0.0175, "step": 192180 }, { "epoch": 0.5, "learning_rate": 0.00022527236955682107, "loss": 0.0182, "step": 192190 }, { "epoch": 0.5, "learning_rate": 0.0002252684813404496, "loss": 0.0132, "step": 192200 }, { "epoch": 0.5, "learning_rate": 0.00022526459312407818, "loss": 0.0191, "step": 192210 }, { "epoch": 0.5, "learning_rate": 0.0002252607049077067, "loss": 0.0192, "step": 192220 }, { "epoch": 0.5, "learning_rate": 0.0002252568166913352, "loss": 0.0173, "step": 192230 }, { "epoch": 0.5, "learning_rate": 0.00022525292847496375, "loss": 0.0194, "step": 192240 }, { "epoch": 0.5, "learning_rate": 0.00022524904025859232, "loss": 0.014, "step": 192250 }, { "epoch": 0.5, "learning_rate": 0.00022524515204222083, "loss": 0.0161, "step": 192260 }, { "epoch": 0.5, "learning_rate": 0.00022524126382584937, "loss": 0.0149, "step": 192270 }, { "epoch": 0.5, "learning_rate": 0.00022523737560947789, "loss": 0.0164, "step": 192280 }, { "epoch": 0.5, "learning_rate": 0.00022523348739310643, "loss": 0.0148, "step": 192290 }, { "epoch": 0.5, "learning_rate": 0.00022522959917673497, "loss": 0.0152, "step": 192300 }, { "epoch": 0.5, "learning_rate": 0.0002252257109603635, "loss": 0.0177, "step": 192310 }, { "epoch": 0.5, "learning_rate": 0.00022522182274399203, "loss": 0.0218, "step": 192320 }, { "epoch": 0.5, "learning_rate": 0.00022521793452762057, "loss": 0.0176, "step": 192330 }, { "epoch": 0.5, "learning_rate": 0.0002252140463112491, "loss": 0.0173, "step": 192340 }, { "epoch": 0.5, "learning_rate": 0.00022521015809487765, "loss": 0.0173, "step": 192350 }, { "epoch": 0.5, "learning_rate": 0.00022520626987850616, "loss": 0.0191, "step": 192360 }, { "epoch": 0.5, "learning_rate": 0.0002252023816621347, "loss": 0.0146, "step": 192370 }, { "epoch": 0.5, "learning_rate": 0.00022519849344576325, "loss": 0.0201, "step": 192380 }, { "epoch": 0.5, "learning_rate": 0.0002251946052293918, "loss": 0.0148, "step": 192390 }, { "epoch": 0.5, "learning_rate": 0.0002251907170130203, "loss": 0.0177, "step": 192400 }, { "epoch": 0.5, "learning_rate": 0.00022518682879664885, "loss": 0.0167, "step": 192410 }, { "epoch": 0.5, "learning_rate": 0.00022518294058027741, "loss": 0.0156, "step": 192420 }, { "epoch": 0.5, "learning_rate": 0.00022517905236390593, "loss": 0.0145, "step": 192430 }, { "epoch": 0.5, "learning_rate": 0.00022517516414753447, "loss": 0.0156, "step": 192440 }, { "epoch": 0.5, "learning_rate": 0.00022517127593116299, "loss": 0.0226, "step": 192450 }, { "epoch": 0.5, "learning_rate": 0.00022516738771479155, "loss": 0.0207, "step": 192460 }, { "epoch": 0.5, "learning_rate": 0.00022516349949842007, "loss": 0.0185, "step": 192470 }, { "epoch": 0.5, "learning_rate": 0.0002251596112820486, "loss": 0.0191, "step": 192480 }, { "epoch": 0.5, "learning_rate": 0.00022515572306567712, "loss": 0.0182, "step": 192490 }, { "epoch": 0.5, "learning_rate": 0.0002251518348493057, "loss": 0.0167, "step": 192500 }, { "epoch": 0.5, "learning_rate": 0.0002251479466329342, "loss": 0.0167, "step": 192510 }, { "epoch": 0.5, "learning_rate": 0.00022514405841656275, "loss": 0.0159, "step": 192520 }, { "epoch": 0.5, "learning_rate": 0.00022514017020019126, "loss": 0.0176, "step": 192530 }, { "epoch": 0.5, "learning_rate": 0.0002251362819838198, "loss": 0.0165, "step": 192540 }, { "epoch": 0.5, "learning_rate": 0.00022513239376744835, "loss": 0.0199, "step": 192550 }, { "epoch": 0.5, "learning_rate": 0.0002251285055510769, "loss": 0.0181, "step": 192560 }, { "epoch": 0.5, "learning_rate": 0.0002251246173347054, "loss": 0.0173, "step": 192570 }, { "epoch": 0.5, "learning_rate": 0.00022512072911833395, "loss": 0.0151, "step": 192580 }, { "epoch": 0.5, "learning_rate": 0.00022511684090196251, "loss": 0.0214, "step": 192590 }, { "epoch": 0.5, "learning_rate": 0.00022511295268559103, "loss": 0.0255, "step": 192600 }, { "epoch": 0.5, "learning_rate": 0.00022510906446921957, "loss": 0.0172, "step": 192610 }, { "epoch": 0.5, "learning_rate": 0.00022510517625284808, "loss": 0.0148, "step": 192620 }, { "epoch": 0.5, "learning_rate": 0.00022510128803647665, "loss": 0.017, "step": 192630 }, { "epoch": 0.5, "learning_rate": 0.00022509739982010517, "loss": 0.0227, "step": 192640 }, { "epoch": 0.5, "learning_rate": 0.0002250935116037337, "loss": 0.0161, "step": 192650 }, { "epoch": 0.5, "learning_rate": 0.00022508962338736222, "loss": 0.0181, "step": 192660 }, { "epoch": 0.5, "learning_rate": 0.0002250857351709908, "loss": 0.0174, "step": 192670 }, { "epoch": 0.5, "learning_rate": 0.0002250818469546193, "loss": 0.0202, "step": 192680 }, { "epoch": 0.5, "learning_rate": 0.00022507795873824785, "loss": 0.0178, "step": 192690 }, { "epoch": 0.5, "learning_rate": 0.00022507407052187636, "loss": 0.0183, "step": 192700 }, { "epoch": 0.5, "learning_rate": 0.00022507018230550493, "loss": 0.0237, "step": 192710 }, { "epoch": 0.5, "learning_rate": 0.00022506629408913345, "loss": 0.0165, "step": 192720 }, { "epoch": 0.5, "learning_rate": 0.000225062405872762, "loss": 0.0258, "step": 192730 }, { "epoch": 0.5, "learning_rate": 0.0002250585176563905, "loss": 0.0201, "step": 192740 }, { "epoch": 0.5, "learning_rate": 0.00022505462944001907, "loss": 0.0226, "step": 192750 }, { "epoch": 0.5, "learning_rate": 0.00022505074122364761, "loss": 0.0196, "step": 192760 }, { "epoch": 0.5, "learning_rate": 0.00022504685300727613, "loss": 0.0212, "step": 192770 }, { "epoch": 0.5, "learning_rate": 0.00022504296479090467, "loss": 0.0192, "step": 192780 }, { "epoch": 0.5, "learning_rate": 0.00022503907657453318, "loss": 0.0163, "step": 192790 }, { "epoch": 0.5, "learning_rate": 0.00022503518835816175, "loss": 0.0191, "step": 192800 }, { "epoch": 0.5, "learning_rate": 0.00022503130014179027, "loss": 0.0183, "step": 192810 }, { "epoch": 0.5, "learning_rate": 0.0002250274119254188, "loss": 0.0183, "step": 192820 }, { "epoch": 0.5, "learning_rate": 0.00022502352370904732, "loss": 0.0185, "step": 192830 }, { "epoch": 0.5, "learning_rate": 0.0002250196354926759, "loss": 0.0236, "step": 192840 }, { "epoch": 0.5, "learning_rate": 0.0002250157472763044, "loss": 0.0191, "step": 192850 }, { "epoch": 0.5, "learning_rate": 0.00022501185905993295, "loss": 0.016, "step": 192860 }, { "epoch": 0.5, "learning_rate": 0.00022500797084356146, "loss": 0.0146, "step": 192870 }, { "epoch": 0.5, "learning_rate": 0.00022500408262719003, "loss": 0.0177, "step": 192880 }, { "epoch": 0.5, "learning_rate": 0.00022500019441081855, "loss": 0.0156, "step": 192890 }, { "epoch": 0.5, "learning_rate": 0.0002249963061944471, "loss": 0.0171, "step": 192900 }, { "epoch": 0.5, "learning_rate": 0.0002249924179780756, "loss": 0.0178, "step": 192910 }, { "epoch": 0.5, "learning_rate": 0.00022498852976170417, "loss": 0.0154, "step": 192920 }, { "epoch": 0.5, "learning_rate": 0.0002249846415453327, "loss": 0.0204, "step": 192930 }, { "epoch": 0.5, "learning_rate": 0.00022498075332896123, "loss": 0.0214, "step": 192940 }, { "epoch": 0.5, "learning_rate": 0.00022497686511258974, "loss": 0.023, "step": 192950 }, { "epoch": 0.5, "learning_rate": 0.0002249729768962183, "loss": 0.0152, "step": 192960 }, { "epoch": 0.5, "learning_rate": 0.00022496908867984685, "loss": 0.0155, "step": 192970 }, { "epoch": 0.5, "learning_rate": 0.00022496520046347537, "loss": 0.0185, "step": 192980 }, { "epoch": 0.5, "learning_rate": 0.0002249613122471039, "loss": 0.022, "step": 192990 }, { "epoch": 0.5, "learning_rate": 0.00022495742403073245, "loss": 0.0187, "step": 193000 }, { "epoch": 0.5, "eval_cer": 0.8818286536472439, "eval_loss": 0.012139668688178062, "eval_runtime": 108.0099, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 193000 }, { "epoch": 0.5, "learning_rate": 0.000224953535814361, "loss": 0.02, "step": 193010 }, { "epoch": 0.5, "learning_rate": 0.0002249496475979895, "loss": 0.0183, "step": 193020 }, { "epoch": 0.5, "learning_rate": 0.00022494575938161805, "loss": 0.0223, "step": 193030 }, { "epoch": 0.5, "learning_rate": 0.00022494187116524656, "loss": 0.0189, "step": 193040 }, { "epoch": 0.5, "learning_rate": 0.00022493798294887513, "loss": 0.018, "step": 193050 }, { "epoch": 0.5, "learning_rate": 0.00022493409473250365, "loss": 0.0212, "step": 193060 }, { "epoch": 0.5, "learning_rate": 0.0002249302065161322, "loss": 0.0206, "step": 193070 }, { "epoch": 0.5, "learning_rate": 0.0002249263182997607, "loss": 0.0182, "step": 193080 }, { "epoch": 0.5, "learning_rate": 0.00022492243008338927, "loss": 0.018, "step": 193090 }, { "epoch": 0.5, "learning_rate": 0.00022491854186701779, "loss": 0.0207, "step": 193100 }, { "epoch": 0.5, "learning_rate": 0.00022491465365064633, "loss": 0.0244, "step": 193110 }, { "epoch": 0.5, "learning_rate": 0.00022491076543427484, "loss": 0.018, "step": 193120 }, { "epoch": 0.5, "learning_rate": 0.0002249068772179034, "loss": 0.0194, "step": 193130 }, { "epoch": 0.5, "learning_rate": 0.00022490298900153195, "loss": 0.0173, "step": 193140 }, { "epoch": 0.5, "learning_rate": 0.00022489910078516047, "loss": 0.0192, "step": 193150 }, { "epoch": 0.5, "learning_rate": 0.000224895212568789, "loss": 0.015, "step": 193160 }, { "epoch": 0.5, "learning_rate": 0.00022489132435241755, "loss": 0.0149, "step": 193170 }, { "epoch": 0.5, "learning_rate": 0.0002248874361360461, "loss": 0.0198, "step": 193180 }, { "epoch": 0.5, "learning_rate": 0.0002248835479196746, "loss": 0.0187, "step": 193190 }, { "epoch": 0.5, "learning_rate": 0.00022487965970330315, "loss": 0.0157, "step": 193200 }, { "epoch": 0.5, "learning_rate": 0.0002248757714869317, "loss": 0.0207, "step": 193210 }, { "epoch": 0.5, "learning_rate": 0.00022487188327056023, "loss": 0.0228, "step": 193220 }, { "epoch": 0.5, "learning_rate": 0.00022486799505418875, "loss": 0.0184, "step": 193230 }, { "epoch": 0.5, "learning_rate": 0.0002248641068378173, "loss": 0.0178, "step": 193240 }, { "epoch": 0.5, "learning_rate": 0.00022486021862144586, "loss": 0.0164, "step": 193250 }, { "epoch": 0.5, "learning_rate": 0.00022485633040507437, "loss": 0.0156, "step": 193260 }, { "epoch": 0.5, "learning_rate": 0.00022485244218870288, "loss": 0.0157, "step": 193270 }, { "epoch": 0.5, "learning_rate": 0.00022484855397233143, "loss": 0.0184, "step": 193280 }, { "epoch": 0.5, "learning_rate": 0.00022484466575595994, "loss": 0.0198, "step": 193290 }, { "epoch": 0.5, "learning_rate": 0.0002248407775395885, "loss": 0.0162, "step": 193300 }, { "epoch": 0.5, "learning_rate": 0.00022483688932321705, "loss": 0.0208, "step": 193310 }, { "epoch": 0.5, "learning_rate": 0.00022483300110684557, "loss": 0.0167, "step": 193320 }, { "epoch": 0.5, "learning_rate": 0.0002248291128904741, "loss": 0.0132, "step": 193330 }, { "epoch": 0.5, "learning_rate": 0.00022482522467410265, "loss": 0.0154, "step": 193340 }, { "epoch": 0.5, "learning_rate": 0.0002248213364577312, "loss": 0.018, "step": 193350 }, { "epoch": 0.5, "learning_rate": 0.0002248174482413597, "loss": 0.0173, "step": 193360 }, { "epoch": 0.5, "learning_rate": 0.00022481356002498825, "loss": 0.0193, "step": 193370 }, { "epoch": 0.5, "learning_rate": 0.0002248096718086168, "loss": 0.0152, "step": 193380 }, { "epoch": 0.5, "learning_rate": 0.00022480578359224533, "loss": 0.0167, "step": 193390 }, { "epoch": 0.5, "learning_rate": 0.00022480189537587384, "loss": 0.0213, "step": 193400 }, { "epoch": 0.5, "learning_rate": 0.00022479800715950239, "loss": 0.0185, "step": 193410 }, { "epoch": 0.5, "learning_rate": 0.00022479411894313093, "loss": 0.0153, "step": 193420 }, { "epoch": 0.5, "learning_rate": 0.00022479023072675947, "loss": 0.0171, "step": 193430 }, { "epoch": 0.5, "learning_rate": 0.00022478634251038798, "loss": 0.0194, "step": 193440 }, { "epoch": 0.5, "learning_rate": 0.00022478245429401653, "loss": 0.0143, "step": 193450 }, { "epoch": 0.5, "learning_rate": 0.0002247785660776451, "loss": 0.0223, "step": 193460 }, { "epoch": 0.5, "learning_rate": 0.0002247746778612736, "loss": 0.0202, "step": 193470 }, { "epoch": 0.5, "learning_rate": 0.00022477078964490215, "loss": 0.0149, "step": 193480 }, { "epoch": 0.5, "learning_rate": 0.00022476690142853067, "loss": 0.0143, "step": 193490 }, { "epoch": 0.5, "learning_rate": 0.00022476301321215923, "loss": 0.0161, "step": 193500 }, { "epoch": 0.5, "learning_rate": 0.00022475912499578775, "loss": 0.016, "step": 193510 }, { "epoch": 0.5, "learning_rate": 0.0002247552367794163, "loss": 0.0197, "step": 193520 }, { "epoch": 0.5, "learning_rate": 0.0002247513485630448, "loss": 0.017, "step": 193530 }, { "epoch": 0.5, "learning_rate": 0.00022474746034667335, "loss": 0.0184, "step": 193540 }, { "epoch": 0.5, "learning_rate": 0.0002247435721303019, "loss": 0.0188, "step": 193550 }, { "epoch": 0.5, "learning_rate": 0.00022473968391393043, "loss": 0.0229, "step": 193560 }, { "epoch": 0.5, "learning_rate": 0.00022473579569755894, "loss": 0.0186, "step": 193570 }, { "epoch": 0.5, "learning_rate": 0.00022473190748118749, "loss": 0.0146, "step": 193580 }, { "epoch": 0.5, "learning_rate": 0.00022472801926481603, "loss": 0.0184, "step": 193590 }, { "epoch": 0.5, "learning_rate": 0.00022472413104844457, "loss": 0.017, "step": 193600 }, { "epoch": 0.5, "learning_rate": 0.00022472024283207308, "loss": 0.0188, "step": 193610 }, { "epoch": 0.5, "learning_rate": 0.00022471635461570163, "loss": 0.0202, "step": 193620 }, { "epoch": 0.5, "learning_rate": 0.0002247124663993302, "loss": 0.0214, "step": 193630 }, { "epoch": 0.5, "learning_rate": 0.0002247085781829587, "loss": 0.0228, "step": 193640 }, { "epoch": 0.5, "learning_rate": 0.00022470468996658725, "loss": 0.0209, "step": 193650 }, { "epoch": 0.5, "learning_rate": 0.00022470080175021576, "loss": 0.0183, "step": 193660 }, { "epoch": 0.5, "learning_rate": 0.00022469691353384433, "loss": 0.0173, "step": 193670 }, { "epoch": 0.5, "learning_rate": 0.00022469302531747285, "loss": 0.0178, "step": 193680 }, { "epoch": 0.5, "learning_rate": 0.0002246891371011014, "loss": 0.0204, "step": 193690 }, { "epoch": 0.5, "learning_rate": 0.0002246852488847299, "loss": 0.0166, "step": 193700 }, { "epoch": 0.5, "learning_rate": 0.00022468136066835847, "loss": 0.0152, "step": 193710 }, { "epoch": 0.5, "learning_rate": 0.000224677472451987, "loss": 0.0137, "step": 193720 }, { "epoch": 0.5, "learning_rate": 0.00022467358423561553, "loss": 0.0165, "step": 193730 }, { "epoch": 0.5, "learning_rate": 0.00022466969601924404, "loss": 0.0182, "step": 193740 }, { "epoch": 0.5, "learning_rate": 0.0002246658078028726, "loss": 0.0167, "step": 193750 }, { "epoch": 0.5, "learning_rate": 0.00022466191958650113, "loss": 0.0131, "step": 193760 }, { "epoch": 0.5, "learning_rate": 0.00022465803137012967, "loss": 0.0181, "step": 193770 }, { "epoch": 0.5, "learning_rate": 0.00022465414315375818, "loss": 0.0186, "step": 193780 }, { "epoch": 0.5, "learning_rate": 0.00022465025493738672, "loss": 0.0199, "step": 193790 }, { "epoch": 0.5, "learning_rate": 0.0002246463667210153, "loss": 0.0205, "step": 193800 }, { "epoch": 0.5, "learning_rate": 0.0002246424785046438, "loss": 0.0178, "step": 193810 }, { "epoch": 0.5, "learning_rate": 0.00022463859028827232, "loss": 0.0186, "step": 193820 }, { "epoch": 0.5, "learning_rate": 0.00022463470207190086, "loss": 0.0176, "step": 193830 }, { "epoch": 0.5, "learning_rate": 0.00022463081385552943, "loss": 0.018, "step": 193840 }, { "epoch": 0.5, "learning_rate": 0.00022462692563915795, "loss": 0.0182, "step": 193850 }, { "epoch": 0.5, "learning_rate": 0.0002246230374227865, "loss": 0.0174, "step": 193860 }, { "epoch": 0.5, "learning_rate": 0.000224619149206415, "loss": 0.0206, "step": 193870 }, { "epoch": 0.5, "learning_rate": 0.00022461526099004357, "loss": 0.0193, "step": 193880 }, { "epoch": 0.5, "learning_rate": 0.0002246113727736721, "loss": 0.0166, "step": 193890 }, { "epoch": 0.5, "learning_rate": 0.00022460748455730063, "loss": 0.0177, "step": 193900 }, { "epoch": 0.5, "learning_rate": 0.00022460359634092914, "loss": 0.0184, "step": 193910 }, { "epoch": 0.5, "learning_rate": 0.0002245997081245577, "loss": 0.0194, "step": 193920 }, { "epoch": 0.5, "learning_rate": 0.00022459581990818623, "loss": 0.0191, "step": 193930 }, { "epoch": 0.5, "learning_rate": 0.00022459193169181477, "loss": 0.0232, "step": 193940 }, { "epoch": 0.5, "learning_rate": 0.00022458804347544328, "loss": 0.016, "step": 193950 }, { "epoch": 0.5, "learning_rate": 0.00022458415525907185, "loss": 0.0116, "step": 193960 }, { "epoch": 0.5, "learning_rate": 0.00022458026704270037, "loss": 0.0209, "step": 193970 }, { "epoch": 0.5, "learning_rate": 0.0002245763788263289, "loss": 0.018, "step": 193980 }, { "epoch": 0.5, "learning_rate": 0.00022457249060995742, "loss": 0.0169, "step": 193990 }, { "epoch": 0.5, "learning_rate": 0.000224568602393586, "loss": 0.0127, "step": 194000 }, { "epoch": 0.5, "eval_cer": 0.8817992612716261, "eval_loss": 0.012113718315958977, "eval_runtime": 108.1959, "eval_samples_per_second": 18.485, "eval_steps_per_second": 4.621, "step": 194000 }, { "epoch": 0.5, "learning_rate": 0.00022456471417721453, "loss": 0.0165, "step": 194010 }, { "epoch": 0.5, "learning_rate": 0.00022456082596084305, "loss": 0.0167, "step": 194020 }, { "epoch": 0.5, "learning_rate": 0.0002245569377444716, "loss": 0.0252, "step": 194030 }, { "epoch": 0.5, "learning_rate": 0.0002245530495281001, "loss": 0.0184, "step": 194040 }, { "epoch": 0.5, "learning_rate": 0.00022454916131172867, "loss": 0.022, "step": 194050 }, { "epoch": 0.5, "learning_rate": 0.00022454527309535719, "loss": 0.0152, "step": 194060 }, { "epoch": 0.5, "learning_rate": 0.00022454138487898573, "loss": 0.0152, "step": 194070 }, { "epoch": 0.5, "learning_rate": 0.00022453749666261424, "loss": 0.0147, "step": 194080 }, { "epoch": 0.5, "learning_rate": 0.0002245336084462428, "loss": 0.0146, "step": 194090 }, { "epoch": 0.5, "learning_rate": 0.00022452972022987133, "loss": 0.0203, "step": 194100 }, { "epoch": 0.5, "learning_rate": 0.00022452583201349987, "loss": 0.0177, "step": 194110 }, { "epoch": 0.5, "learning_rate": 0.00022452194379712838, "loss": 0.0196, "step": 194120 }, { "epoch": 0.5, "learning_rate": 0.00022451805558075695, "loss": 0.0168, "step": 194130 }, { "epoch": 0.5, "learning_rate": 0.00022451416736438547, "loss": 0.0202, "step": 194140 }, { "epoch": 0.5, "learning_rate": 0.000224510279148014, "loss": 0.015, "step": 194150 }, { "epoch": 0.5, "learning_rate": 0.00022450639093164252, "loss": 0.0176, "step": 194160 }, { "epoch": 0.5, "learning_rate": 0.0002245025027152711, "loss": 0.0177, "step": 194170 }, { "epoch": 0.5, "learning_rate": 0.00022449861449889963, "loss": 0.0179, "step": 194180 }, { "epoch": 0.5, "learning_rate": 0.00022449472628252815, "loss": 0.0176, "step": 194190 }, { "epoch": 0.5, "learning_rate": 0.0002244908380661567, "loss": 0.0152, "step": 194200 }, { "epoch": 0.5, "learning_rate": 0.00022448694984978523, "loss": 0.0166, "step": 194210 }, { "epoch": 0.5, "learning_rate": 0.00022448306163341377, "loss": 0.0144, "step": 194220 }, { "epoch": 0.5, "learning_rate": 0.00022447917341704229, "loss": 0.0247, "step": 194230 }, { "epoch": 0.5, "learning_rate": 0.00022447528520067083, "loss": 0.0166, "step": 194240 }, { "epoch": 0.5, "learning_rate": 0.00022447139698429937, "loss": 0.0166, "step": 194250 }, { "epoch": 0.5, "learning_rate": 0.0002244675087679279, "loss": 0.0285, "step": 194260 }, { "epoch": 0.5, "learning_rate": 0.00022446362055155643, "loss": 0.0176, "step": 194270 }, { "epoch": 0.5, "learning_rate": 0.00022445973233518497, "loss": 0.019, "step": 194280 }, { "epoch": 0.5, "learning_rate": 0.00022445584411881348, "loss": 0.019, "step": 194290 }, { "epoch": 0.5, "learning_rate": 0.00022445195590244205, "loss": 0.0163, "step": 194300 }, { "epoch": 0.5, "learning_rate": 0.00022444806768607056, "loss": 0.018, "step": 194310 }, { "epoch": 0.5, "learning_rate": 0.0002244441794696991, "loss": 0.0183, "step": 194320 }, { "epoch": 0.5, "learning_rate": 0.00022444029125332762, "loss": 0.0163, "step": 194330 }, { "epoch": 0.5, "learning_rate": 0.0002244364030369562, "loss": 0.0142, "step": 194340 }, { "epoch": 0.5, "learning_rate": 0.00022443251482058473, "loss": 0.0166, "step": 194350 }, { "epoch": 0.5, "learning_rate": 0.00022442862660421325, "loss": 0.0221, "step": 194360 }, { "epoch": 0.5, "learning_rate": 0.0002244247383878418, "loss": 0.0226, "step": 194370 }, { "epoch": 0.5, "learning_rate": 0.00022442085017147033, "loss": 0.0152, "step": 194380 }, { "epoch": 0.5, "learning_rate": 0.00022441696195509887, "loss": 0.0188, "step": 194390 }, { "epoch": 0.5, "learning_rate": 0.00022441307373872739, "loss": 0.0152, "step": 194400 }, { "epoch": 0.5, "learning_rate": 0.00022440918552235593, "loss": 0.0192, "step": 194410 }, { "epoch": 0.5, "learning_rate": 0.00022440529730598447, "loss": 0.0174, "step": 194420 }, { "epoch": 0.5, "learning_rate": 0.000224401409089613, "loss": 0.0165, "step": 194430 }, { "epoch": 0.5, "learning_rate": 0.00022439752087324152, "loss": 0.0172, "step": 194440 }, { "epoch": 0.5, "learning_rate": 0.00022439363265687007, "loss": 0.0173, "step": 194450 }, { "epoch": 0.5, "learning_rate": 0.0002243897444404986, "loss": 0.0182, "step": 194460 }, { "epoch": 0.5, "learning_rate": 0.00022438585622412715, "loss": 0.012, "step": 194470 }, { "epoch": 0.5, "learning_rate": 0.00022438196800775566, "loss": 0.0156, "step": 194480 }, { "epoch": 0.5, "learning_rate": 0.0002243780797913842, "loss": 0.0193, "step": 194490 }, { "epoch": 0.5, "learning_rate": 0.00022437419157501277, "loss": 0.0189, "step": 194500 }, { "epoch": 0.5, "learning_rate": 0.0002243703033586413, "loss": 0.0154, "step": 194510 }, { "epoch": 0.5, "learning_rate": 0.00022436641514226983, "loss": 0.0126, "step": 194520 }, { "epoch": 0.5, "learning_rate": 0.00022436252692589835, "loss": 0.0172, "step": 194530 }, { "epoch": 0.5, "learning_rate": 0.00022435863870952686, "loss": 0.0166, "step": 194540 }, { "epoch": 0.5, "learning_rate": 0.00022435475049315543, "loss": 0.0155, "step": 194550 }, { "epoch": 0.5, "learning_rate": 0.00022435086227678397, "loss": 0.0189, "step": 194560 }, { "epoch": 0.5, "learning_rate": 0.00022434697406041248, "loss": 0.0171, "step": 194570 }, { "epoch": 0.5, "learning_rate": 0.00022434308584404103, "loss": 0.0118, "step": 194580 }, { "epoch": 0.5, "learning_rate": 0.00022433919762766957, "loss": 0.0138, "step": 194590 }, { "epoch": 0.5, "learning_rate": 0.0002243353094112981, "loss": 0.0161, "step": 194600 }, { "epoch": 0.5, "learning_rate": 0.00022433142119492662, "loss": 0.0218, "step": 194610 }, { "epoch": 0.5, "learning_rate": 0.00022432753297855517, "loss": 0.0197, "step": 194620 }, { "epoch": 0.5, "learning_rate": 0.0002243236447621837, "loss": 0.0161, "step": 194630 }, { "epoch": 0.5, "learning_rate": 0.00022431975654581225, "loss": 0.017, "step": 194640 }, { "epoch": 0.5, "learning_rate": 0.00022431586832944076, "loss": 0.0169, "step": 194650 }, { "epoch": 0.5, "learning_rate": 0.0002243119801130693, "loss": 0.0195, "step": 194660 }, { "epoch": 0.5, "learning_rate": 0.00022430809189669787, "loss": 0.0206, "step": 194670 }, { "epoch": 0.5, "learning_rate": 0.0002243042036803264, "loss": 0.0161, "step": 194680 }, { "epoch": 0.5, "learning_rate": 0.0002243003154639549, "loss": 0.0151, "step": 194690 }, { "epoch": 0.5, "learning_rate": 0.00022429642724758344, "loss": 0.0157, "step": 194700 }, { "epoch": 0.5, "learning_rate": 0.000224292539031212, "loss": 0.0176, "step": 194710 }, { "epoch": 0.5, "learning_rate": 0.00022428865081484053, "loss": 0.0151, "step": 194720 }, { "epoch": 0.5, "learning_rate": 0.00022428476259846907, "loss": 0.0166, "step": 194730 }, { "epoch": 0.5, "learning_rate": 0.00022428087438209758, "loss": 0.02, "step": 194740 }, { "epoch": 0.5, "learning_rate": 0.00022427698616572615, "loss": 0.0177, "step": 194750 }, { "epoch": 0.5, "learning_rate": 0.00022427309794935467, "loss": 0.0201, "step": 194760 }, { "epoch": 0.5, "learning_rate": 0.0002242692097329832, "loss": 0.0189, "step": 194770 }, { "epoch": 0.5, "learning_rate": 0.00022426532151661172, "loss": 0.0226, "step": 194780 }, { "epoch": 0.5, "learning_rate": 0.00022426143330024026, "loss": 0.0243, "step": 194790 }, { "epoch": 0.5, "learning_rate": 0.0002242575450838688, "loss": 0.0151, "step": 194800 }, { "epoch": 0.5, "learning_rate": 0.00022425365686749735, "loss": 0.0165, "step": 194810 }, { "epoch": 0.51, "learning_rate": 0.00022424976865112586, "loss": 0.0152, "step": 194820 }, { "epoch": 0.51, "learning_rate": 0.0002242458804347544, "loss": 0.0162, "step": 194830 }, { "epoch": 0.51, "learning_rate": 0.00022424199221838297, "loss": 0.0168, "step": 194840 }, { "epoch": 0.51, "learning_rate": 0.0002242381040020115, "loss": 0.0172, "step": 194850 }, { "epoch": 0.51, "learning_rate": 0.00022423421578564, "loss": 0.0129, "step": 194860 }, { "epoch": 0.51, "learning_rate": 0.00022423032756926854, "loss": 0.0209, "step": 194870 }, { "epoch": 0.51, "learning_rate": 0.0002242264393528971, "loss": 0.019, "step": 194880 }, { "epoch": 0.51, "learning_rate": 0.00022422255113652563, "loss": 0.0177, "step": 194890 }, { "epoch": 0.51, "learning_rate": 0.00022421866292015417, "loss": 0.0168, "step": 194900 }, { "epoch": 0.51, "learning_rate": 0.00022421477470378268, "loss": 0.0197, "step": 194910 }, { "epoch": 0.51, "learning_rate": 0.00022421088648741125, "loss": 0.0141, "step": 194920 }, { "epoch": 0.51, "learning_rate": 0.00022420699827103977, "loss": 0.0183, "step": 194930 }, { "epoch": 0.51, "learning_rate": 0.0002242031100546683, "loss": 0.0176, "step": 194940 }, { "epoch": 0.51, "learning_rate": 0.00022419922183829682, "loss": 0.0166, "step": 194950 }, { "epoch": 0.51, "learning_rate": 0.0002241953336219254, "loss": 0.0129, "step": 194960 }, { "epoch": 0.51, "learning_rate": 0.0002241914454055539, "loss": 0.0168, "step": 194970 }, { "epoch": 0.51, "learning_rate": 0.00022418755718918245, "loss": 0.014, "step": 194980 }, { "epoch": 0.51, "learning_rate": 0.00022418366897281096, "loss": 0.016, "step": 194990 }, { "epoch": 0.51, "learning_rate": 0.00022417978075643953, "loss": 0.0182, "step": 195000 }, { "epoch": 0.51, "eval_cer": 0.8817726681698768, "eval_loss": 0.012146620079874992, "eval_runtime": 108.1358, "eval_samples_per_second": 18.495, "eval_steps_per_second": 4.624, "step": 195000 }, { "epoch": 0.51, "learning_rate": 0.00022417589254006805, "loss": 0.0212, "step": 195010 }, { "epoch": 0.51, "learning_rate": 0.0002241720043236966, "loss": 0.0181, "step": 195020 }, { "epoch": 0.51, "learning_rate": 0.0002241681161073251, "loss": 0.0192, "step": 195030 }, { "epoch": 0.51, "learning_rate": 0.00022416422789095364, "loss": 0.0177, "step": 195040 }, { "epoch": 0.51, "learning_rate": 0.0002241603396745822, "loss": 0.0194, "step": 195050 }, { "epoch": 0.51, "learning_rate": 0.00022415645145821073, "loss": 0.0192, "step": 195060 }, { "epoch": 0.51, "learning_rate": 0.00022415256324183927, "loss": 0.018, "step": 195070 }, { "epoch": 0.51, "learning_rate": 0.00022414867502546778, "loss": 0.0203, "step": 195080 }, { "epoch": 0.51, "learning_rate": 0.00022414478680909635, "loss": 0.023, "step": 195090 }, { "epoch": 0.51, "learning_rate": 0.00022414089859272487, "loss": 0.0159, "step": 195100 }, { "epoch": 0.51, "learning_rate": 0.0002241370103763534, "loss": 0.0168, "step": 195110 }, { "epoch": 0.51, "learning_rate": 0.00022413312215998192, "loss": 0.0222, "step": 195120 }, { "epoch": 0.51, "learning_rate": 0.0002241292339436105, "loss": 0.0131, "step": 195130 }, { "epoch": 0.51, "learning_rate": 0.000224125345727239, "loss": 0.0172, "step": 195140 }, { "epoch": 0.51, "learning_rate": 0.00022412145751086755, "loss": 0.026, "step": 195150 }, { "epoch": 0.51, "learning_rate": 0.00022411756929449606, "loss": 0.0171, "step": 195160 }, { "epoch": 0.51, "learning_rate": 0.00022411368107812463, "loss": 0.0179, "step": 195170 }, { "epoch": 0.51, "learning_rate": 0.00022410979286175314, "loss": 0.0146, "step": 195180 }, { "epoch": 0.51, "learning_rate": 0.0002241059046453817, "loss": 0.0203, "step": 195190 }, { "epoch": 0.51, "learning_rate": 0.0002241020164290102, "loss": 0.0163, "step": 195200 }, { "epoch": 0.51, "learning_rate": 0.00022409812821263877, "loss": 0.017, "step": 195210 }, { "epoch": 0.51, "learning_rate": 0.0002240942399962673, "loss": 0.0172, "step": 195220 }, { "epoch": 0.51, "learning_rate": 0.00022409035177989583, "loss": 0.0186, "step": 195230 }, { "epoch": 0.51, "learning_rate": 0.00022408646356352437, "loss": 0.0195, "step": 195240 }, { "epoch": 0.51, "learning_rate": 0.0002240825753471529, "loss": 0.0173, "step": 195250 }, { "epoch": 0.51, "learning_rate": 0.00022407868713078145, "loss": 0.0207, "step": 195260 }, { "epoch": 0.51, "learning_rate": 0.00022407479891440997, "loss": 0.0195, "step": 195270 }, { "epoch": 0.51, "learning_rate": 0.0002240709106980385, "loss": 0.0152, "step": 195280 }, { "epoch": 0.51, "learning_rate": 0.00022406702248166702, "loss": 0.0163, "step": 195290 }, { "epoch": 0.51, "learning_rate": 0.0002240631342652956, "loss": 0.0212, "step": 195300 }, { "epoch": 0.51, "learning_rate": 0.0002240592460489241, "loss": 0.0208, "step": 195310 }, { "epoch": 0.51, "learning_rate": 0.00022405535783255265, "loss": 0.0158, "step": 195320 }, { "epoch": 0.51, "learning_rate": 0.00022405146961618116, "loss": 0.017, "step": 195330 }, { "epoch": 0.51, "learning_rate": 0.00022404758139980973, "loss": 0.0183, "step": 195340 }, { "epoch": 0.51, "learning_rate": 0.00022404369318343824, "loss": 0.0131, "step": 195350 }, { "epoch": 0.51, "learning_rate": 0.00022403980496706679, "loss": 0.0163, "step": 195360 }, { "epoch": 0.51, "learning_rate": 0.0002240359167506953, "loss": 0.02, "step": 195370 }, { "epoch": 0.51, "learning_rate": 0.00022403202853432387, "loss": 0.0198, "step": 195380 }, { "epoch": 0.51, "learning_rate": 0.0002240281403179524, "loss": 0.0188, "step": 195390 }, { "epoch": 0.51, "learning_rate": 0.00022402425210158093, "loss": 0.0184, "step": 195400 }, { "epoch": 0.51, "learning_rate": 0.00022402036388520944, "loss": 0.0206, "step": 195410 }, { "epoch": 0.51, "learning_rate": 0.000224016475668838, "loss": 0.0189, "step": 195420 }, { "epoch": 0.51, "learning_rate": 0.00022401258745246655, "loss": 0.0155, "step": 195430 }, { "epoch": 0.51, "learning_rate": 0.00022400869923609506, "loss": 0.0215, "step": 195440 }, { "epoch": 0.51, "learning_rate": 0.0002240048110197236, "loss": 0.0152, "step": 195450 }, { "epoch": 0.51, "learning_rate": 0.00022400092280335215, "loss": 0.0169, "step": 195460 }, { "epoch": 0.51, "learning_rate": 0.0002239970345869807, "loss": 0.0201, "step": 195470 }, { "epoch": 0.51, "learning_rate": 0.0002239931463706092, "loss": 0.0208, "step": 195480 }, { "epoch": 0.51, "learning_rate": 0.00022398925815423775, "loss": 0.0219, "step": 195490 }, { "epoch": 0.51, "learning_rate": 0.0002239853699378663, "loss": 0.0349, "step": 195500 }, { "epoch": 0.51, "learning_rate": 0.00022398148172149483, "loss": 0.0163, "step": 195510 }, { "epoch": 0.51, "learning_rate": 0.00022397759350512334, "loss": 0.0181, "step": 195520 }, { "epoch": 0.51, "learning_rate": 0.00022397370528875189, "loss": 0.0157, "step": 195530 }, { "epoch": 0.51, "learning_rate": 0.0002239698170723804, "loss": 0.0141, "step": 195540 }, { "epoch": 0.51, "learning_rate": 0.00022396592885600897, "loss": 0.0164, "step": 195550 }, { "epoch": 0.51, "learning_rate": 0.00022396204063963748, "loss": 0.0193, "step": 195560 }, { "epoch": 0.51, "learning_rate": 0.00022395815242326602, "loss": 0.0216, "step": 195570 }, { "epoch": 0.51, "learning_rate": 0.00022395426420689454, "loss": 0.0164, "step": 195580 }, { "epoch": 0.51, "learning_rate": 0.0002239503759905231, "loss": 0.0191, "step": 195590 }, { "epoch": 0.51, "learning_rate": 0.00022394648777415165, "loss": 0.0168, "step": 195600 }, { "epoch": 0.51, "learning_rate": 0.00022394259955778016, "loss": 0.02, "step": 195610 }, { "epoch": 0.51, "learning_rate": 0.0002239387113414087, "loss": 0.0172, "step": 195620 }, { "epoch": 0.51, "learning_rate": 0.00022393482312503725, "loss": 0.0174, "step": 195630 }, { "epoch": 0.51, "learning_rate": 0.0002239309349086658, "loss": 0.0162, "step": 195640 }, { "epoch": 0.51, "learning_rate": 0.0002239270466922943, "loss": 0.0139, "step": 195650 }, { "epoch": 0.51, "learning_rate": 0.00022392315847592285, "loss": 0.0176, "step": 195660 }, { "epoch": 0.51, "learning_rate": 0.0002239192702595514, "loss": 0.0154, "step": 195670 }, { "epoch": 0.51, "learning_rate": 0.00022391538204317993, "loss": 0.0157, "step": 195680 }, { "epoch": 0.51, "learning_rate": 0.00022391149382680844, "loss": 0.0465, "step": 195690 }, { "epoch": 0.51, "learning_rate": 0.00022390760561043698, "loss": 0.0235, "step": 195700 }, { "epoch": 0.51, "learning_rate": 0.00022390371739406555, "loss": 0.0192, "step": 195710 }, { "epoch": 0.51, "learning_rate": 0.00022389982917769407, "loss": 0.02, "step": 195720 }, { "epoch": 0.51, "learning_rate": 0.00022389594096132258, "loss": 0.0176, "step": 195730 }, { "epoch": 0.51, "learning_rate": 0.00022389205274495112, "loss": 0.0214, "step": 195740 }, { "epoch": 0.51, "learning_rate": 0.0002238881645285797, "loss": 0.0203, "step": 195750 }, { "epoch": 0.51, "learning_rate": 0.0002238842763122082, "loss": 0.0405, "step": 195760 }, { "epoch": 0.51, "learning_rate": 0.00022388038809583675, "loss": 0.0177, "step": 195770 }, { "epoch": 0.51, "learning_rate": 0.00022387649987946526, "loss": 0.0172, "step": 195780 }, { "epoch": 0.51, "learning_rate": 0.0002238726116630938, "loss": 0.0189, "step": 195790 }, { "epoch": 0.51, "learning_rate": 0.00022386872344672235, "loss": 0.0168, "step": 195800 }, { "epoch": 0.51, "learning_rate": 0.0002238648352303509, "loss": 0.0244, "step": 195810 }, { "epoch": 0.51, "learning_rate": 0.0002238609470139794, "loss": 0.0133, "step": 195820 }, { "epoch": 0.51, "learning_rate": 0.00022385705879760794, "loss": 0.0157, "step": 195830 }, { "epoch": 0.51, "learning_rate": 0.00022385317058123649, "loss": 0.0177, "step": 195840 }, { "epoch": 0.51, "learning_rate": 0.00022384928236486503, "loss": 0.0185, "step": 195850 }, { "epoch": 0.51, "learning_rate": 0.00022384539414849354, "loss": 0.0156, "step": 195860 }, { "epoch": 0.51, "learning_rate": 0.00022384150593212208, "loss": 0.0215, "step": 195870 }, { "epoch": 0.51, "learning_rate": 0.00022383761771575063, "loss": 0.0199, "step": 195880 }, { "epoch": 0.51, "learning_rate": 0.00022383372949937917, "loss": 0.0179, "step": 195890 }, { "epoch": 0.51, "learning_rate": 0.00022382984128300768, "loss": 0.0207, "step": 195900 }, { "epoch": 0.51, "learning_rate": 0.00022382595306663622, "loss": 0.0162, "step": 195910 }, { "epoch": 0.51, "learning_rate": 0.0002238220648502648, "loss": 0.0188, "step": 195920 }, { "epoch": 0.51, "learning_rate": 0.0002238181766338933, "loss": 0.0157, "step": 195930 }, { "epoch": 0.51, "learning_rate": 0.00022381428841752185, "loss": 0.0175, "step": 195940 }, { "epoch": 0.51, "learning_rate": 0.00022381040020115036, "loss": 0.0153, "step": 195950 }, { "epoch": 0.51, "learning_rate": 0.00022380651198477893, "loss": 0.0214, "step": 195960 }, { "epoch": 0.51, "learning_rate": 0.00022380262376840745, "loss": 0.0178, "step": 195970 }, { "epoch": 0.51, "learning_rate": 0.000223798735552036, "loss": 0.0208, "step": 195980 }, { "epoch": 0.51, "learning_rate": 0.0002237948473356645, "loss": 0.019, "step": 195990 }, { "epoch": 0.51, "learning_rate": 0.00022379095911929307, "loss": 0.0157, "step": 196000 }, { "epoch": 0.51, "eval_cer": 0.8817740678068109, "eval_loss": 0.012171548791229725, "eval_runtime": 107.9343, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.632, "step": 196000 }, { "epoch": 0.51, "learning_rate": 0.00022378707090292159, "loss": 0.0186, "step": 196010 }, { "epoch": 0.51, "learning_rate": 0.00022378318268655013, "loss": 0.0173, "step": 196020 }, { "epoch": 0.51, "learning_rate": 0.00022377929447017864, "loss": 0.0196, "step": 196030 }, { "epoch": 0.51, "learning_rate": 0.00022377540625380718, "loss": 0.0192, "step": 196040 }, { "epoch": 0.51, "learning_rate": 0.00022377151803743573, "loss": 0.0177, "step": 196050 }, { "epoch": 0.51, "learning_rate": 0.00022376762982106427, "loss": 0.0166, "step": 196060 }, { "epoch": 0.51, "learning_rate": 0.00022376374160469278, "loss": 0.0195, "step": 196070 }, { "epoch": 0.51, "learning_rate": 0.00022375985338832132, "loss": 0.0172, "step": 196080 }, { "epoch": 0.51, "learning_rate": 0.0002237559651719499, "loss": 0.018, "step": 196090 }, { "epoch": 0.51, "learning_rate": 0.0002237520769555784, "loss": 0.0148, "step": 196100 }, { "epoch": 0.51, "learning_rate": 0.00022374818873920695, "loss": 0.0175, "step": 196110 }, { "epoch": 0.51, "learning_rate": 0.00022374430052283546, "loss": 0.0185, "step": 196120 }, { "epoch": 0.51, "learning_rate": 0.00022374041230646403, "loss": 0.018, "step": 196130 }, { "epoch": 0.51, "learning_rate": 0.00022373652409009255, "loss": 0.017, "step": 196140 }, { "epoch": 0.51, "learning_rate": 0.0002237326358737211, "loss": 0.0149, "step": 196150 }, { "epoch": 0.51, "learning_rate": 0.0002237287476573496, "loss": 0.0178, "step": 196160 }, { "epoch": 0.51, "learning_rate": 0.00022372485944097817, "loss": 0.0155, "step": 196170 }, { "epoch": 0.51, "learning_rate": 0.00022372097122460669, "loss": 0.0177, "step": 196180 }, { "epoch": 0.51, "learning_rate": 0.00022371708300823523, "loss": 0.0231, "step": 196190 }, { "epoch": 0.51, "learning_rate": 0.00022371319479186374, "loss": 0.0169, "step": 196200 }, { "epoch": 0.51, "learning_rate": 0.0002237093065754923, "loss": 0.0196, "step": 196210 }, { "epoch": 0.51, "learning_rate": 0.00022370541835912082, "loss": 0.0176, "step": 196220 }, { "epoch": 0.51, "learning_rate": 0.00022370153014274937, "loss": 0.0184, "step": 196230 }, { "epoch": 0.51, "learning_rate": 0.00022369764192637788, "loss": 0.0205, "step": 196240 }, { "epoch": 0.51, "learning_rate": 0.00022369375371000645, "loss": 0.0155, "step": 196250 }, { "epoch": 0.51, "learning_rate": 0.000223689865493635, "loss": 0.0211, "step": 196260 }, { "epoch": 0.51, "learning_rate": 0.0002236859772772635, "loss": 0.0165, "step": 196270 }, { "epoch": 0.51, "learning_rate": 0.00022368208906089202, "loss": 0.0131, "step": 196280 }, { "epoch": 0.51, "learning_rate": 0.00022367820084452056, "loss": 0.0165, "step": 196290 }, { "epoch": 0.51, "learning_rate": 0.00022367431262814913, "loss": 0.0169, "step": 196300 }, { "epoch": 0.51, "learning_rate": 0.00022367042441177765, "loss": 0.022, "step": 196310 }, { "epoch": 0.51, "learning_rate": 0.0002236665361954062, "loss": 0.018, "step": 196320 }, { "epoch": 0.51, "learning_rate": 0.0002236626479790347, "loss": 0.0244, "step": 196330 }, { "epoch": 0.51, "learning_rate": 0.00022365875976266327, "loss": 0.018, "step": 196340 }, { "epoch": 0.51, "learning_rate": 0.00022365487154629178, "loss": 0.0196, "step": 196350 }, { "epoch": 0.51, "learning_rate": 0.00022365098332992033, "loss": 0.0157, "step": 196360 }, { "epoch": 0.51, "learning_rate": 0.00022364709511354884, "loss": 0.0202, "step": 196370 }, { "epoch": 0.51, "learning_rate": 0.0002236432068971774, "loss": 0.0152, "step": 196380 }, { "epoch": 0.51, "learning_rate": 0.00022363931868080592, "loss": 0.0218, "step": 196390 }, { "epoch": 0.51, "learning_rate": 0.00022363543046443447, "loss": 0.0185, "step": 196400 }, { "epoch": 0.51, "learning_rate": 0.00022363154224806298, "loss": 0.0143, "step": 196410 }, { "epoch": 0.51, "learning_rate": 0.00022362765403169155, "loss": 0.0161, "step": 196420 }, { "epoch": 0.51, "learning_rate": 0.0002236237658153201, "loss": 0.0198, "step": 196430 }, { "epoch": 0.51, "learning_rate": 0.0002236198775989486, "loss": 0.0204, "step": 196440 }, { "epoch": 0.51, "learning_rate": 0.00022361598938257712, "loss": 0.0183, "step": 196450 }, { "epoch": 0.51, "learning_rate": 0.0002236121011662057, "loss": 0.0178, "step": 196460 }, { "epoch": 0.51, "learning_rate": 0.00022360821294983423, "loss": 0.0182, "step": 196470 }, { "epoch": 0.51, "learning_rate": 0.00022360432473346274, "loss": 0.0161, "step": 196480 }, { "epoch": 0.51, "learning_rate": 0.00022360043651709129, "loss": 0.0189, "step": 196490 }, { "epoch": 0.51, "learning_rate": 0.00022359654830071983, "loss": 0.0142, "step": 196500 }, { "epoch": 0.51, "learning_rate": 0.00022359266008434837, "loss": 0.017, "step": 196510 }, { "epoch": 0.51, "learning_rate": 0.00022358877186797688, "loss": 0.0174, "step": 196520 }, { "epoch": 0.51, "learning_rate": 0.00022358488365160543, "loss": 0.0167, "step": 196530 }, { "epoch": 0.51, "learning_rate": 0.00022358099543523394, "loss": 0.0161, "step": 196540 }, { "epoch": 0.51, "learning_rate": 0.0002235771072188625, "loss": 0.0155, "step": 196550 }, { "epoch": 0.51, "learning_rate": 0.00022357321900249102, "loss": 0.0221, "step": 196560 }, { "epoch": 0.51, "learning_rate": 0.00022356933078611957, "loss": 0.0151, "step": 196570 }, { "epoch": 0.51, "learning_rate": 0.00022356544256974808, "loss": 0.0145, "step": 196580 }, { "epoch": 0.51, "learning_rate": 0.00022356155435337665, "loss": 0.0154, "step": 196590 }, { "epoch": 0.51, "learning_rate": 0.00022355766613700516, "loss": 0.0163, "step": 196600 }, { "epoch": 0.51, "learning_rate": 0.0002235537779206337, "loss": 0.0153, "step": 196610 }, { "epoch": 0.51, "learning_rate": 0.00022354988970426222, "loss": 0.0167, "step": 196620 }, { "epoch": 0.51, "learning_rate": 0.0002235460014878908, "loss": 0.0173, "step": 196630 }, { "epoch": 0.51, "learning_rate": 0.00022354211327151933, "loss": 0.0137, "step": 196640 }, { "epoch": 0.51, "learning_rate": 0.00022353822505514784, "loss": 0.0149, "step": 196650 }, { "epoch": 0.51, "learning_rate": 0.00022353433683877639, "loss": 0.0174, "step": 196660 }, { "epoch": 0.51, "learning_rate": 0.00022353044862240493, "loss": 0.018, "step": 196670 }, { "epoch": 0.51, "learning_rate": 0.00022352656040603347, "loss": 0.0174, "step": 196680 }, { "epoch": 0.51, "learning_rate": 0.00022352267218966198, "loss": 0.0193, "step": 196690 }, { "epoch": 0.51, "learning_rate": 0.00022351878397329053, "loss": 0.0168, "step": 196700 }, { "epoch": 0.51, "learning_rate": 0.00022351489575691907, "loss": 0.0172, "step": 196710 }, { "epoch": 0.51, "learning_rate": 0.0002235110075405476, "loss": 0.0167, "step": 196720 }, { "epoch": 0.51, "learning_rate": 0.00022350711932417612, "loss": 0.0175, "step": 196730 }, { "epoch": 0.51, "learning_rate": 0.00022350323110780466, "loss": 0.019, "step": 196740 }, { "epoch": 0.51, "learning_rate": 0.00022349934289143318, "loss": 0.0175, "step": 196750 }, { "epoch": 0.51, "learning_rate": 0.00022349545467506175, "loss": 0.0226, "step": 196760 }, { "epoch": 0.51, "learning_rate": 0.00022349156645869026, "loss": 0.0158, "step": 196770 }, { "epoch": 0.51, "learning_rate": 0.0002234876782423188, "loss": 0.0138, "step": 196780 }, { "epoch": 0.51, "learning_rate": 0.00022348379002594732, "loss": 0.0168, "step": 196790 }, { "epoch": 0.51, "learning_rate": 0.0002234799018095759, "loss": 0.0174, "step": 196800 }, { "epoch": 0.51, "learning_rate": 0.00022347601359320443, "loss": 0.0159, "step": 196810 }, { "epoch": 0.51, "learning_rate": 0.00022347212537683294, "loss": 0.0182, "step": 196820 }, { "epoch": 0.51, "learning_rate": 0.00022346823716046149, "loss": 0.0173, "step": 196830 }, { "epoch": 0.51, "learning_rate": 0.00022346434894409003, "loss": 0.0193, "step": 196840 }, { "epoch": 0.51, "learning_rate": 0.00022346046072771857, "loss": 0.0169, "step": 196850 }, { "epoch": 0.51, "learning_rate": 0.00022345657251134708, "loss": 0.0202, "step": 196860 }, { "epoch": 0.51, "learning_rate": 0.00022345268429497562, "loss": 0.0223, "step": 196870 }, { "epoch": 0.51, "learning_rate": 0.00022344879607860417, "loss": 0.0175, "step": 196880 }, { "epoch": 0.51, "learning_rate": 0.0002234449078622327, "loss": 0.0167, "step": 196890 }, { "epoch": 0.51, "learning_rate": 0.00022344101964586122, "loss": 0.0146, "step": 196900 }, { "epoch": 0.51, "learning_rate": 0.00022343713142948976, "loss": 0.0171, "step": 196910 }, { "epoch": 0.51, "learning_rate": 0.0002234332432131183, "loss": 0.0171, "step": 196920 }, { "epoch": 0.51, "learning_rate": 0.00022342935499674685, "loss": 0.0125, "step": 196930 }, { "epoch": 0.51, "learning_rate": 0.00022342546678037536, "loss": 0.0182, "step": 196940 }, { "epoch": 0.51, "learning_rate": 0.0002234215785640039, "loss": 0.0189, "step": 196950 }, { "epoch": 0.51, "learning_rate": 0.00022341769034763247, "loss": 0.0157, "step": 196960 }, { "epoch": 0.51, "learning_rate": 0.000223413802131261, "loss": 0.0172, "step": 196970 }, { "epoch": 0.51, "learning_rate": 0.00022340991391488953, "loss": 0.0164, "step": 196980 }, { "epoch": 0.51, "learning_rate": 0.00022340602569851804, "loss": 0.014, "step": 196990 }, { "epoch": 0.51, "learning_rate": 0.00022340213748214656, "loss": 0.0163, "step": 197000 }, { "epoch": 0.51, "eval_cer": 0.8818160569148363, "eval_loss": 0.011719505302608013, "eval_runtime": 107.9068, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 197000 }, { "epoch": 0.51, "learning_rate": 0.00022339824926577513, "loss": 0.0164, "step": 197010 }, { "epoch": 0.51, "learning_rate": 0.00022339436104940367, "loss": 0.0196, "step": 197020 }, { "epoch": 0.51, "learning_rate": 0.00022339047283303218, "loss": 0.0201, "step": 197030 }, { "epoch": 0.51, "learning_rate": 0.00022338658461666072, "loss": 0.0158, "step": 197040 }, { "epoch": 0.51, "learning_rate": 0.00022338269640028927, "loss": 0.0208, "step": 197050 }, { "epoch": 0.51, "learning_rate": 0.0002233788081839178, "loss": 0.0196, "step": 197060 }, { "epoch": 0.51, "learning_rate": 0.00022337491996754632, "loss": 0.0179, "step": 197070 }, { "epoch": 0.51, "learning_rate": 0.00022337103175117486, "loss": 0.0175, "step": 197080 }, { "epoch": 0.51, "learning_rate": 0.0002233671435348034, "loss": 0.0174, "step": 197090 }, { "epoch": 0.51, "learning_rate": 0.00022336325531843195, "loss": 0.0177, "step": 197100 }, { "epoch": 0.51, "learning_rate": 0.00022335936710206046, "loss": 0.0206, "step": 197110 }, { "epoch": 0.51, "learning_rate": 0.000223355478885689, "loss": 0.0142, "step": 197120 }, { "epoch": 0.51, "learning_rate": 0.00022335159066931757, "loss": 0.0141, "step": 197130 }, { "epoch": 0.51, "learning_rate": 0.00022334770245294609, "loss": 0.0178, "step": 197140 }, { "epoch": 0.51, "learning_rate": 0.0002233438142365746, "loss": 0.0161, "step": 197150 }, { "epoch": 0.51, "learning_rate": 0.00022333992602020314, "loss": 0.0143, "step": 197160 }, { "epoch": 0.51, "learning_rate": 0.0002233360378038317, "loss": 0.0168, "step": 197170 }, { "epoch": 0.51, "learning_rate": 0.00022333214958746023, "loss": 0.0171, "step": 197180 }, { "epoch": 0.51, "learning_rate": 0.00022332826137108877, "loss": 0.0165, "step": 197190 }, { "epoch": 0.51, "learning_rate": 0.00022332437315471728, "loss": 0.0194, "step": 197200 }, { "epoch": 0.51, "learning_rate": 0.00022332048493834585, "loss": 0.0176, "step": 197210 }, { "epoch": 0.51, "learning_rate": 0.00022331659672197437, "loss": 0.0182, "step": 197220 }, { "epoch": 0.51, "learning_rate": 0.0002233127085056029, "loss": 0.0211, "step": 197230 }, { "epoch": 0.51, "learning_rate": 0.00022330882028923142, "loss": 0.0167, "step": 197240 }, { "epoch": 0.51, "learning_rate": 0.00022330493207285996, "loss": 0.0167, "step": 197250 }, { "epoch": 0.51, "learning_rate": 0.0002233010438564885, "loss": 0.0156, "step": 197260 }, { "epoch": 0.51, "learning_rate": 0.00022329715564011705, "loss": 0.0175, "step": 197270 }, { "epoch": 0.51, "learning_rate": 0.00022329326742374556, "loss": 0.0145, "step": 197280 }, { "epoch": 0.51, "learning_rate": 0.0002232893792073741, "loss": 0.0178, "step": 197290 }, { "epoch": 0.51, "learning_rate": 0.00022328549099100267, "loss": 0.0147, "step": 197300 }, { "epoch": 0.51, "learning_rate": 0.00022328160277463119, "loss": 0.0144, "step": 197310 }, { "epoch": 0.51, "learning_rate": 0.0002232777145582597, "loss": 0.0159, "step": 197320 }, { "epoch": 0.51, "learning_rate": 0.00022327382634188824, "loss": 0.0172, "step": 197330 }, { "epoch": 0.51, "learning_rate": 0.0002232699381255168, "loss": 0.0166, "step": 197340 }, { "epoch": 0.51, "learning_rate": 0.00022326604990914533, "loss": 0.0153, "step": 197350 }, { "epoch": 0.51, "learning_rate": 0.00022326216169277387, "loss": 0.0174, "step": 197360 }, { "epoch": 0.51, "learning_rate": 0.00022325827347640238, "loss": 0.0163, "step": 197370 }, { "epoch": 0.51, "learning_rate": 0.00022325438526003095, "loss": 0.0159, "step": 197380 }, { "epoch": 0.51, "learning_rate": 0.00022325049704365946, "loss": 0.0174, "step": 197390 }, { "epoch": 0.51, "learning_rate": 0.000223246608827288, "loss": 0.0156, "step": 197400 }, { "epoch": 0.51, "learning_rate": 0.00022324272061091652, "loss": 0.0225, "step": 197410 }, { "epoch": 0.51, "learning_rate": 0.0002232388323945451, "loss": 0.0176, "step": 197420 }, { "epoch": 0.51, "learning_rate": 0.0002232349441781736, "loss": 0.0211, "step": 197430 }, { "epoch": 0.51, "learning_rate": 0.00022323105596180215, "loss": 0.016, "step": 197440 }, { "epoch": 0.51, "learning_rate": 0.00022322716774543066, "loss": 0.0153, "step": 197450 }, { "epoch": 0.51, "learning_rate": 0.00022322327952905923, "loss": 0.0143, "step": 197460 }, { "epoch": 0.51, "learning_rate": 0.00022321939131268774, "loss": 0.0132, "step": 197470 }, { "epoch": 0.51, "learning_rate": 0.00022321550309631629, "loss": 0.0166, "step": 197480 }, { "epoch": 0.51, "learning_rate": 0.0002232116148799448, "loss": 0.0166, "step": 197490 }, { "epoch": 0.51, "learning_rate": 0.00022320772666357334, "loss": 0.0165, "step": 197500 }, { "epoch": 0.51, "learning_rate": 0.0002232038384472019, "loss": 0.0196, "step": 197510 }, { "epoch": 0.51, "learning_rate": 0.00022319995023083042, "loss": 0.0185, "step": 197520 }, { "epoch": 0.51, "learning_rate": 0.00022319606201445897, "loss": 0.016, "step": 197530 }, { "epoch": 0.51, "learning_rate": 0.00022319217379808748, "loss": 0.0149, "step": 197540 }, { "epoch": 0.51, "learning_rate": 0.00022318828558171605, "loss": 0.016, "step": 197550 }, { "epoch": 0.51, "learning_rate": 0.00022318439736534456, "loss": 0.0195, "step": 197560 }, { "epoch": 0.51, "learning_rate": 0.0002231805091489731, "loss": 0.0255, "step": 197570 }, { "epoch": 0.51, "learning_rate": 0.00022317662093260162, "loss": 0.0231, "step": 197580 }, { "epoch": 0.51, "learning_rate": 0.0002231727327162302, "loss": 0.0153, "step": 197590 }, { "epoch": 0.51, "learning_rate": 0.0002231688444998587, "loss": 0.0148, "step": 197600 }, { "epoch": 0.51, "learning_rate": 0.00022316495628348725, "loss": 0.0179, "step": 197610 }, { "epoch": 0.51, "learning_rate": 0.00022316106806711576, "loss": 0.0162, "step": 197620 }, { "epoch": 0.51, "learning_rate": 0.00022315717985074433, "loss": 0.0182, "step": 197630 }, { "epoch": 0.51, "learning_rate": 0.00022315329163437284, "loss": 0.0218, "step": 197640 }, { "epoch": 0.51, "learning_rate": 0.00022314940341800138, "loss": 0.0153, "step": 197650 }, { "epoch": 0.51, "learning_rate": 0.0002231455152016299, "loss": 0.0183, "step": 197660 }, { "epoch": 0.51, "learning_rate": 0.00022314162698525847, "loss": 0.0176, "step": 197670 }, { "epoch": 0.51, "learning_rate": 0.000223137738768887, "loss": 0.0187, "step": 197680 }, { "epoch": 0.51, "learning_rate": 0.00022313385055251552, "loss": 0.016, "step": 197690 }, { "epoch": 0.51, "learning_rate": 0.00022312996233614407, "loss": 0.0176, "step": 197700 }, { "epoch": 0.51, "learning_rate": 0.0002231260741197726, "loss": 0.02, "step": 197710 }, { "epoch": 0.51, "learning_rate": 0.00022312218590340115, "loss": 0.0234, "step": 197720 }, { "epoch": 0.51, "learning_rate": 0.00022311829768702966, "loss": 0.018, "step": 197730 }, { "epoch": 0.51, "learning_rate": 0.0002231144094706582, "loss": 0.0165, "step": 197740 }, { "epoch": 0.51, "learning_rate": 0.00022311052125428672, "loss": 0.0195, "step": 197750 }, { "epoch": 0.51, "learning_rate": 0.0002231066330379153, "loss": 0.0179, "step": 197760 }, { "epoch": 0.51, "learning_rate": 0.0002231027448215438, "loss": 0.0159, "step": 197770 }, { "epoch": 0.51, "learning_rate": 0.00022309885660517234, "loss": 0.0126, "step": 197780 }, { "epoch": 0.51, "learning_rate": 0.00022309496838880086, "loss": 0.0162, "step": 197790 }, { "epoch": 0.51, "learning_rate": 0.00022309108017242943, "loss": 0.0172, "step": 197800 }, { "epoch": 0.51, "learning_rate": 0.00022308719195605794, "loss": 0.0194, "step": 197810 }, { "epoch": 0.51, "learning_rate": 0.00022308330373968648, "loss": 0.0181, "step": 197820 }, { "epoch": 0.51, "learning_rate": 0.000223079415523315, "loss": 0.0191, "step": 197830 }, { "epoch": 0.51, "learning_rate": 0.00022307552730694357, "loss": 0.0193, "step": 197840 }, { "epoch": 0.51, "learning_rate": 0.0002230716390905721, "loss": 0.0223, "step": 197850 }, { "epoch": 0.51, "learning_rate": 0.00022306775087420062, "loss": 0.0153, "step": 197860 }, { "epoch": 0.51, "learning_rate": 0.00022306386265782914, "loss": 0.0202, "step": 197870 }, { "epoch": 0.51, "learning_rate": 0.0002230599744414577, "loss": 0.0157, "step": 197880 }, { "epoch": 0.51, "learning_rate": 0.00022305608622508625, "loss": 0.0172, "step": 197890 }, { "epoch": 0.51, "learning_rate": 0.00022305219800871476, "loss": 0.0197, "step": 197900 }, { "epoch": 0.51, "learning_rate": 0.0002230483097923433, "loss": 0.0177, "step": 197910 }, { "epoch": 0.51, "learning_rate": 0.00022304442157597185, "loss": 0.02, "step": 197920 }, { "epoch": 0.51, "learning_rate": 0.0002230405333596004, "loss": 0.0171, "step": 197930 }, { "epoch": 0.51, "learning_rate": 0.0002230366451432289, "loss": 0.0185, "step": 197940 }, { "epoch": 0.51, "learning_rate": 0.00022303275692685744, "loss": 0.0162, "step": 197950 }, { "epoch": 0.51, "learning_rate": 0.00022302886871048599, "loss": 0.0172, "step": 197960 }, { "epoch": 0.51, "learning_rate": 0.00022302498049411453, "loss": 0.0163, "step": 197970 }, { "epoch": 0.51, "learning_rate": 0.00022302109227774304, "loss": 0.0201, "step": 197980 }, { "epoch": 0.51, "learning_rate": 0.00022301720406137158, "loss": 0.0158, "step": 197990 }, { "epoch": 0.51, "learning_rate": 0.0002230133158450001, "loss": 0.0157, "step": 198000 }, { "epoch": 0.51, "eval_cer": 0.8818356518319148, "eval_loss": 0.011476157233119011, "eval_runtime": 107.9405, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 198000 }, { "epoch": 0.51, "learning_rate": 0.00022300942762862867, "loss": 0.0173, "step": 198010 }, { "epoch": 0.51, "learning_rate": 0.0002230055394122572, "loss": 0.0132, "step": 198020 }, { "epoch": 0.51, "learning_rate": 0.00022300165119588572, "loss": 0.0172, "step": 198030 }, { "epoch": 0.51, "learning_rate": 0.00022299776297951424, "loss": 0.0177, "step": 198040 }, { "epoch": 0.51, "learning_rate": 0.0002229938747631428, "loss": 0.0204, "step": 198050 }, { "epoch": 0.51, "learning_rate": 0.00022298998654677135, "loss": 0.0165, "step": 198060 }, { "epoch": 0.51, "learning_rate": 0.00022298609833039986, "loss": 0.0208, "step": 198070 }, { "epoch": 0.51, "learning_rate": 0.0002229822101140284, "loss": 0.0165, "step": 198080 }, { "epoch": 0.51, "learning_rate": 0.00022297832189765695, "loss": 0.0182, "step": 198090 }, { "epoch": 0.51, "learning_rate": 0.0002229744336812855, "loss": 0.018, "step": 198100 }, { "epoch": 0.51, "learning_rate": 0.000222970545464914, "loss": 0.0174, "step": 198110 }, { "epoch": 0.51, "learning_rate": 0.00022296665724854254, "loss": 0.0179, "step": 198120 }, { "epoch": 0.51, "learning_rate": 0.00022296276903217108, "loss": 0.0202, "step": 198130 }, { "epoch": 0.51, "learning_rate": 0.00022295888081579963, "loss": 0.0211, "step": 198140 }, { "epoch": 0.51, "learning_rate": 0.00022295499259942814, "loss": 0.0166, "step": 198150 }, { "epoch": 0.51, "learning_rate": 0.00022295110438305668, "loss": 0.0158, "step": 198160 }, { "epoch": 0.51, "learning_rate": 0.00022294721616668525, "loss": 0.0176, "step": 198170 }, { "epoch": 0.51, "learning_rate": 0.00022294332795031377, "loss": 0.0164, "step": 198180 }, { "epoch": 0.51, "learning_rate": 0.00022293943973394228, "loss": 0.0162, "step": 198190 }, { "epoch": 0.51, "learning_rate": 0.00022293555151757082, "loss": 0.0196, "step": 198200 }, { "epoch": 0.51, "learning_rate": 0.0002229316633011994, "loss": 0.0165, "step": 198210 }, { "epoch": 0.51, "learning_rate": 0.0002229277750848279, "loss": 0.0251, "step": 198220 }, { "epoch": 0.51, "learning_rate": 0.00022292388686845645, "loss": 0.0219, "step": 198230 }, { "epoch": 0.51, "learning_rate": 0.00022291999865208496, "loss": 0.0182, "step": 198240 }, { "epoch": 0.51, "learning_rate": 0.0002229161104357135, "loss": 0.0158, "step": 198250 }, { "epoch": 0.51, "learning_rate": 0.00022291222221934204, "loss": 0.0154, "step": 198260 }, { "epoch": 0.51, "learning_rate": 0.0002229083340029706, "loss": 0.0152, "step": 198270 }, { "epoch": 0.51, "learning_rate": 0.0002229044457865991, "loss": 0.0158, "step": 198280 }, { "epoch": 0.51, "learning_rate": 0.00022290055757022764, "loss": 0.0161, "step": 198290 }, { "epoch": 0.51, "learning_rate": 0.00022289666935385618, "loss": 0.0193, "step": 198300 }, { "epoch": 0.51, "learning_rate": 0.00022289278113748473, "loss": 0.0181, "step": 198310 }, { "epoch": 0.51, "learning_rate": 0.00022288889292111324, "loss": 0.0189, "step": 198320 }, { "epoch": 0.51, "learning_rate": 0.00022288500470474178, "loss": 0.014, "step": 198330 }, { "epoch": 0.51, "learning_rate": 0.00022288111648837032, "loss": 0.0167, "step": 198340 }, { "epoch": 0.51, "learning_rate": 0.00022287722827199887, "loss": 0.0161, "step": 198350 }, { "epoch": 0.51, "learning_rate": 0.00022287334005562738, "loss": 0.0198, "step": 198360 }, { "epoch": 0.51, "learning_rate": 0.00022286945183925592, "loss": 0.0143, "step": 198370 }, { "epoch": 0.51, "learning_rate": 0.0002228655636228845, "loss": 0.0139, "step": 198380 }, { "epoch": 0.51, "learning_rate": 0.000222861675406513, "loss": 0.0189, "step": 198390 }, { "epoch": 0.51, "learning_rate": 0.00022285778719014155, "loss": 0.0262, "step": 198400 }, { "epoch": 0.51, "learning_rate": 0.00022285389897377006, "loss": 0.0191, "step": 198410 }, { "epoch": 0.51, "learning_rate": 0.00022285001075739863, "loss": 0.0195, "step": 198420 }, { "epoch": 0.51, "learning_rate": 0.00022284612254102714, "loss": 0.0175, "step": 198430 }, { "epoch": 0.51, "learning_rate": 0.00022284223432465569, "loss": 0.0143, "step": 198440 }, { "epoch": 0.51, "learning_rate": 0.0002228383461082842, "loss": 0.0163, "step": 198450 }, { "epoch": 0.51, "learning_rate": 0.00022283445789191277, "loss": 0.0202, "step": 198460 }, { "epoch": 0.51, "learning_rate": 0.00022283056967554128, "loss": 0.0151, "step": 198470 }, { "epoch": 0.51, "learning_rate": 0.00022282668145916983, "loss": 0.0167, "step": 198480 }, { "epoch": 0.51, "learning_rate": 0.00022282279324279834, "loss": 0.018, "step": 198490 }, { "epoch": 0.51, "learning_rate": 0.00022281890502642688, "loss": 0.0183, "step": 198500 }, { "epoch": 0.51, "learning_rate": 0.00022281501681005542, "loss": 0.0228, "step": 198510 }, { "epoch": 0.51, "learning_rate": 0.00022281112859368396, "loss": 0.0176, "step": 198520 }, { "epoch": 0.51, "learning_rate": 0.00022280724037731248, "loss": 0.0166, "step": 198530 }, { "epoch": 0.51, "learning_rate": 0.00022280335216094102, "loss": 0.0168, "step": 198540 }, { "epoch": 0.51, "learning_rate": 0.0002227994639445696, "loss": 0.0184, "step": 198550 }, { "epoch": 0.51, "learning_rate": 0.0002227955757281981, "loss": 0.0168, "step": 198560 }, { "epoch": 0.51, "learning_rate": 0.00022279168751182665, "loss": 0.0187, "step": 198570 }, { "epoch": 0.51, "learning_rate": 0.00022278779929545516, "loss": 0.0135, "step": 198580 }, { "epoch": 0.51, "learning_rate": 0.00022278391107908373, "loss": 0.0212, "step": 198590 }, { "epoch": 0.51, "learning_rate": 0.00022278002286271224, "loss": 0.0187, "step": 198600 }, { "epoch": 0.51, "learning_rate": 0.00022277613464634079, "loss": 0.017, "step": 198610 }, { "epoch": 0.51, "learning_rate": 0.0002227722464299693, "loss": 0.0198, "step": 198620 }, { "epoch": 0.51, "learning_rate": 0.00022276835821359787, "loss": 0.0175, "step": 198630 }, { "epoch": 0.51, "learning_rate": 0.00022276446999722638, "loss": 0.0175, "step": 198640 }, { "epoch": 0.51, "learning_rate": 0.00022276058178085492, "loss": 0.0168, "step": 198650 }, { "epoch": 0.51, "learning_rate": 0.00022275669356448344, "loss": 0.0174, "step": 198660 }, { "epoch": 0.51, "learning_rate": 0.000222752805348112, "loss": 0.0167, "step": 198670 }, { "epoch": 0.52, "learning_rate": 0.00022274891713174052, "loss": 0.0178, "step": 198680 }, { "epoch": 0.52, "learning_rate": 0.00022274502891536906, "loss": 0.0145, "step": 198690 }, { "epoch": 0.52, "learning_rate": 0.00022274114069899758, "loss": 0.0183, "step": 198700 }, { "epoch": 0.52, "learning_rate": 0.00022273725248262615, "loss": 0.015, "step": 198710 }, { "epoch": 0.52, "learning_rate": 0.0002227333642662547, "loss": 0.0199, "step": 198720 }, { "epoch": 0.52, "learning_rate": 0.0002227294760498832, "loss": 0.0205, "step": 198730 }, { "epoch": 0.52, "learning_rate": 0.00022272558783351172, "loss": 0.0177, "step": 198740 }, { "epoch": 0.52, "learning_rate": 0.00022272169961714026, "loss": 0.0152, "step": 198750 }, { "epoch": 0.52, "learning_rate": 0.00022271781140076883, "loss": 0.0213, "step": 198760 }, { "epoch": 0.52, "learning_rate": 0.00022271392318439734, "loss": 0.0164, "step": 198770 }, { "epoch": 0.52, "learning_rate": 0.00022271003496802588, "loss": 0.0171, "step": 198780 }, { "epoch": 0.52, "learning_rate": 0.0002227061467516544, "loss": 0.0234, "step": 198790 }, { "epoch": 0.52, "learning_rate": 0.00022270225853528297, "loss": 0.021, "step": 198800 }, { "epoch": 0.52, "learning_rate": 0.00022269837031891148, "loss": 0.0175, "step": 198810 }, { "epoch": 0.52, "learning_rate": 0.00022269448210254002, "loss": 0.0179, "step": 198820 }, { "epoch": 0.52, "learning_rate": 0.00022269059388616854, "loss": 0.0166, "step": 198830 }, { "epoch": 0.52, "learning_rate": 0.0002226867056697971, "loss": 0.0189, "step": 198840 }, { "epoch": 0.52, "learning_rate": 0.00022268281745342562, "loss": 0.0187, "step": 198850 }, { "epoch": 0.52, "learning_rate": 0.00022267892923705416, "loss": 0.0185, "step": 198860 }, { "epoch": 0.52, "learning_rate": 0.00022267504102068268, "loss": 0.0163, "step": 198870 }, { "epoch": 0.52, "learning_rate": 0.00022267115280431125, "loss": 0.0137, "step": 198880 }, { "epoch": 0.52, "learning_rate": 0.0002226672645879398, "loss": 0.0205, "step": 198890 }, { "epoch": 0.52, "learning_rate": 0.0002226633763715683, "loss": 0.0175, "step": 198900 }, { "epoch": 0.52, "learning_rate": 0.00022265948815519682, "loss": 0.0138, "step": 198910 }, { "epoch": 0.52, "learning_rate": 0.00022265559993882539, "loss": 0.0154, "step": 198920 }, { "epoch": 0.52, "learning_rate": 0.00022265171172245393, "loss": 0.0156, "step": 198930 }, { "epoch": 0.52, "learning_rate": 0.00022264782350608244, "loss": 0.0165, "step": 198940 }, { "epoch": 0.52, "learning_rate": 0.00022264393528971098, "loss": 0.0198, "step": 198950 }, { "epoch": 0.52, "learning_rate": 0.00022264004707333953, "loss": 0.0208, "step": 198960 }, { "epoch": 0.52, "learning_rate": 0.00022263615885696807, "loss": 0.0168, "step": 198970 }, { "epoch": 0.52, "learning_rate": 0.00022263227064059658, "loss": 0.0174, "step": 198980 }, { "epoch": 0.52, "learning_rate": 0.00022262838242422512, "loss": 0.0187, "step": 198990 }, { "epoch": 0.52, "learning_rate": 0.00022262449420785364, "loss": 0.0176, "step": 199000 }, { "epoch": 0.52, "eval_cer": 0.8817992612716261, "eval_loss": 0.012197881937026978, "eval_runtime": 107.9744, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 199000 }, { "epoch": 0.52, "learning_rate": 0.0002226206059914822, "loss": 0.0189, "step": 199010 }, { "epoch": 0.52, "learning_rate": 0.00022261671777511072, "loss": 0.0175, "step": 199020 }, { "epoch": 0.52, "learning_rate": 0.00022261282955873926, "loss": 0.0192, "step": 199030 }, { "epoch": 0.52, "learning_rate": 0.00022260894134236778, "loss": 0.0169, "step": 199040 }, { "epoch": 0.52, "learning_rate": 0.00022260505312599635, "loss": 0.0182, "step": 199050 }, { "epoch": 0.52, "learning_rate": 0.00022260116490962486, "loss": 0.017, "step": 199060 }, { "epoch": 0.52, "learning_rate": 0.0002225972766932534, "loss": 0.0141, "step": 199070 }, { "epoch": 0.52, "learning_rate": 0.00022259338847688192, "loss": 0.0136, "step": 199080 }, { "epoch": 0.52, "learning_rate": 0.00022258950026051049, "loss": 0.018, "step": 199090 }, { "epoch": 0.52, "learning_rate": 0.00022258561204413903, "loss": 0.0148, "step": 199100 }, { "epoch": 0.52, "learning_rate": 0.00022258172382776754, "loss": 0.0197, "step": 199110 }, { "epoch": 0.52, "learning_rate": 0.00022257783561139608, "loss": 0.0169, "step": 199120 }, { "epoch": 0.52, "learning_rate": 0.00022257394739502463, "loss": 0.0187, "step": 199130 }, { "epoch": 0.52, "learning_rate": 0.00022257005917865317, "loss": 0.019, "step": 199140 }, { "epoch": 0.52, "learning_rate": 0.00022256617096228168, "loss": 0.0192, "step": 199150 }, { "epoch": 0.52, "learning_rate": 0.00022256228274591022, "loss": 0.0161, "step": 199160 }, { "epoch": 0.52, "learning_rate": 0.00022255839452953876, "loss": 0.0146, "step": 199170 }, { "epoch": 0.52, "learning_rate": 0.0002225545063131673, "loss": 0.0201, "step": 199180 }, { "epoch": 0.52, "learning_rate": 0.00022255061809679582, "loss": 0.0196, "step": 199190 }, { "epoch": 0.52, "learning_rate": 0.00022254672988042436, "loss": 0.0162, "step": 199200 }, { "epoch": 0.52, "learning_rate": 0.0002225428416640529, "loss": 0.0199, "step": 199210 }, { "epoch": 0.52, "learning_rate": 0.00022253895344768145, "loss": 0.0189, "step": 199220 }, { "epoch": 0.52, "learning_rate": 0.00022253506523130996, "loss": 0.0214, "step": 199230 }, { "epoch": 0.52, "learning_rate": 0.0002225311770149385, "loss": 0.0196, "step": 199240 }, { "epoch": 0.52, "learning_rate": 0.00022252728879856702, "loss": 0.0143, "step": 199250 }, { "epoch": 0.52, "learning_rate": 0.00022252340058219559, "loss": 0.018, "step": 199260 }, { "epoch": 0.52, "learning_rate": 0.00022251951236582413, "loss": 0.0171, "step": 199270 }, { "epoch": 0.52, "learning_rate": 0.00022251562414945264, "loss": 0.0173, "step": 199280 }, { "epoch": 0.52, "learning_rate": 0.00022251173593308118, "loss": 0.0153, "step": 199290 }, { "epoch": 0.52, "learning_rate": 0.00022250784771670972, "loss": 0.0207, "step": 199300 }, { "epoch": 0.52, "learning_rate": 0.00022250395950033827, "loss": 0.0165, "step": 199310 }, { "epoch": 0.52, "learning_rate": 0.00022250007128396678, "loss": 0.0176, "step": 199320 }, { "epoch": 0.52, "learning_rate": 0.00022249618306759532, "loss": 0.014, "step": 199330 }, { "epoch": 0.52, "learning_rate": 0.00022249229485122386, "loss": 0.0171, "step": 199340 }, { "epoch": 0.52, "learning_rate": 0.0002224884066348524, "loss": 0.0161, "step": 199350 }, { "epoch": 0.52, "learning_rate": 0.00022248451841848092, "loss": 0.0155, "step": 199360 }, { "epoch": 0.52, "learning_rate": 0.00022248063020210946, "loss": 0.0178, "step": 199370 }, { "epoch": 0.52, "learning_rate": 0.000222476741985738, "loss": 0.0155, "step": 199380 }, { "epoch": 0.52, "learning_rate": 0.00022247285376936655, "loss": 0.0212, "step": 199390 }, { "epoch": 0.52, "learning_rate": 0.00022246896555299506, "loss": 0.0204, "step": 199400 }, { "epoch": 0.52, "learning_rate": 0.0002224650773366236, "loss": 0.0158, "step": 199410 }, { "epoch": 0.52, "learning_rate": 0.00022246118912025217, "loss": 0.0128, "step": 199420 }, { "epoch": 0.52, "learning_rate": 0.00022245730090388068, "loss": 0.0158, "step": 199430 }, { "epoch": 0.52, "learning_rate": 0.00022245341268750923, "loss": 0.0205, "step": 199440 }, { "epoch": 0.52, "learning_rate": 0.00022244952447113774, "loss": 0.0217, "step": 199450 }, { "epoch": 0.52, "learning_rate": 0.0002224456362547663, "loss": 0.0194, "step": 199460 }, { "epoch": 0.52, "learning_rate": 0.00022244174803839482, "loss": 0.0179, "step": 199470 }, { "epoch": 0.52, "learning_rate": 0.00022243785982202337, "loss": 0.0189, "step": 199480 }, { "epoch": 0.52, "learning_rate": 0.00022243397160565188, "loss": 0.0162, "step": 199490 }, { "epoch": 0.52, "learning_rate": 0.00022243008338928042, "loss": 0.0151, "step": 199500 }, { "epoch": 0.52, "learning_rate": 0.00022242619517290896, "loss": 0.018, "step": 199510 }, { "epoch": 0.52, "learning_rate": 0.0002224223069565375, "loss": 0.0196, "step": 199520 }, { "epoch": 0.52, "learning_rate": 0.00022241841874016602, "loss": 0.0167, "step": 199530 }, { "epoch": 0.52, "learning_rate": 0.00022241453052379456, "loss": 0.0188, "step": 199540 }, { "epoch": 0.52, "learning_rate": 0.0002224106423074231, "loss": 0.0193, "step": 199550 }, { "epoch": 0.52, "learning_rate": 0.00022240675409105164, "loss": 0.0175, "step": 199560 }, { "epoch": 0.52, "learning_rate": 0.00022240286587468016, "loss": 0.0233, "step": 199570 }, { "epoch": 0.52, "learning_rate": 0.0002223989776583087, "loss": 0.023, "step": 199580 }, { "epoch": 0.52, "learning_rate": 0.00022239508944193727, "loss": 0.0167, "step": 199590 }, { "epoch": 0.52, "learning_rate": 0.00022239120122556578, "loss": 0.0191, "step": 199600 }, { "epoch": 0.52, "learning_rate": 0.00022238731300919433, "loss": 0.0137, "step": 199610 }, { "epoch": 0.52, "learning_rate": 0.00022238342479282284, "loss": 0.0151, "step": 199620 }, { "epoch": 0.52, "learning_rate": 0.0002223795365764514, "loss": 0.0183, "step": 199630 }, { "epoch": 0.52, "learning_rate": 0.00022237564836007992, "loss": 0.0207, "step": 199640 }, { "epoch": 0.52, "learning_rate": 0.00022237176014370847, "loss": 0.0188, "step": 199650 }, { "epoch": 0.52, "learning_rate": 0.00022236787192733698, "loss": 0.019, "step": 199660 }, { "epoch": 0.52, "learning_rate": 0.00022236398371096555, "loss": 0.018, "step": 199670 }, { "epoch": 0.52, "learning_rate": 0.00022236009549459406, "loss": 0.0173, "step": 199680 }, { "epoch": 0.52, "learning_rate": 0.0002223562072782226, "loss": 0.0174, "step": 199690 }, { "epoch": 0.52, "learning_rate": 0.00022235231906185112, "loss": 0.0166, "step": 199700 }, { "epoch": 0.52, "learning_rate": 0.0002223484308454797, "loss": 0.0192, "step": 199710 }, { "epoch": 0.52, "learning_rate": 0.0002223445426291082, "loss": 0.0154, "step": 199720 }, { "epoch": 0.52, "learning_rate": 0.00022234065441273674, "loss": 0.0207, "step": 199730 }, { "epoch": 0.52, "learning_rate": 0.00022233676619636526, "loss": 0.0192, "step": 199740 }, { "epoch": 0.52, "learning_rate": 0.0002223328779799938, "loss": 0.0154, "step": 199750 }, { "epoch": 0.52, "learning_rate": 0.00022232898976362237, "loss": 0.0225, "step": 199760 }, { "epoch": 0.52, "learning_rate": 0.00022232510154725088, "loss": 0.02, "step": 199770 }, { "epoch": 0.52, "learning_rate": 0.0002223212133308794, "loss": 0.0164, "step": 199780 }, { "epoch": 0.52, "learning_rate": 0.00022231732511450794, "loss": 0.0162, "step": 199790 }, { "epoch": 0.52, "learning_rate": 0.0002223134368981365, "loss": 0.0176, "step": 199800 }, { "epoch": 0.52, "learning_rate": 0.00022230954868176502, "loss": 0.0165, "step": 199810 }, { "epoch": 0.52, "learning_rate": 0.00022230566046539356, "loss": 0.02, "step": 199820 }, { "epoch": 0.52, "learning_rate": 0.00022230177224902208, "loss": 0.016, "step": 199830 }, { "epoch": 0.52, "learning_rate": 0.00022229788403265065, "loss": 0.015, "step": 199840 }, { "epoch": 0.52, "learning_rate": 0.00022229399581627916, "loss": 0.0201, "step": 199850 }, { "epoch": 0.52, "learning_rate": 0.0002222901075999077, "loss": 0.0214, "step": 199860 }, { "epoch": 0.52, "learning_rate": 0.00022228621938353622, "loss": 0.024, "step": 199870 }, { "epoch": 0.52, "learning_rate": 0.0002222823311671648, "loss": 0.0152, "step": 199880 }, { "epoch": 0.52, "learning_rate": 0.0002222784429507933, "loss": 0.018, "step": 199890 }, { "epoch": 0.52, "learning_rate": 0.00022227455473442184, "loss": 0.0154, "step": 199900 }, { "epoch": 0.52, "learning_rate": 0.00022227066651805036, "loss": 0.0183, "step": 199910 }, { "epoch": 0.52, "learning_rate": 0.00022226677830167893, "loss": 0.0169, "step": 199920 }, { "epoch": 0.52, "learning_rate": 0.00022226289008530744, "loss": 0.0183, "step": 199930 }, { "epoch": 0.52, "learning_rate": 0.00022225900186893598, "loss": 0.0151, "step": 199940 }, { "epoch": 0.52, "learning_rate": 0.0002222551136525645, "loss": 0.0181, "step": 199950 }, { "epoch": 0.52, "learning_rate": 0.00022225122543619307, "loss": 0.0179, "step": 199960 }, { "epoch": 0.52, "learning_rate": 0.0002222473372198216, "loss": 0.0153, "step": 199970 }, { "epoch": 0.52, "learning_rate": 0.00022224344900345012, "loss": 0.0164, "step": 199980 }, { "epoch": 0.52, "learning_rate": 0.00022223956078707866, "loss": 0.0148, "step": 199990 }, { "epoch": 0.52, "learning_rate": 0.00022223567257070718, "loss": 0.0183, "step": 200000 }, { "epoch": 0.52, "eval_cer": 0.8817880641761527, "eval_loss": 0.012208198197185993, "eval_runtime": 108.0565, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 200000 }, { "epoch": 0.52, "learning_rate": 0.00022223178435433575, "loss": 0.0196, "step": 200010 }, { "epoch": 0.52, "learning_rate": 0.00022222789613796426, "loss": 0.021, "step": 200020 }, { "epoch": 0.52, "learning_rate": 0.0002222240079215928, "loss": 0.016, "step": 200030 }, { "epoch": 0.52, "learning_rate": 0.00022222011970522132, "loss": 0.0178, "step": 200040 }, { "epoch": 0.52, "learning_rate": 0.0002222162314888499, "loss": 0.0136, "step": 200050 }, { "epoch": 0.52, "learning_rate": 0.0002222123432724784, "loss": 0.0163, "step": 200060 }, { "epoch": 0.52, "learning_rate": 0.00022220845505610694, "loss": 0.0175, "step": 200070 }, { "epoch": 0.52, "learning_rate": 0.00022220456683973546, "loss": 0.0194, "step": 200080 }, { "epoch": 0.52, "learning_rate": 0.00022220067862336403, "loss": 0.0196, "step": 200090 }, { "epoch": 0.52, "learning_rate": 0.00022219679040699254, "loss": 0.0191, "step": 200100 }, { "epoch": 0.52, "learning_rate": 0.00022219290219062108, "loss": 0.0164, "step": 200110 }, { "epoch": 0.52, "learning_rate": 0.0002221890139742496, "loss": 0.0188, "step": 200120 }, { "epoch": 0.52, "learning_rate": 0.00022218512575787817, "loss": 0.0189, "step": 200130 }, { "epoch": 0.52, "learning_rate": 0.0002221812375415067, "loss": 0.0172, "step": 200140 }, { "epoch": 0.52, "learning_rate": 0.00022217734932513522, "loss": 0.0166, "step": 200150 }, { "epoch": 0.52, "learning_rate": 0.00022217346110876376, "loss": 0.0209, "step": 200160 }, { "epoch": 0.52, "learning_rate": 0.0002221695728923923, "loss": 0.0152, "step": 200170 }, { "epoch": 0.52, "learning_rate": 0.00022216568467602085, "loss": 0.0198, "step": 200180 }, { "epoch": 0.52, "learning_rate": 0.00022216179645964936, "loss": 0.0181, "step": 200190 }, { "epoch": 0.52, "learning_rate": 0.0002221579082432779, "loss": 0.0168, "step": 200200 }, { "epoch": 0.52, "learning_rate": 0.00022215402002690644, "loss": 0.0184, "step": 200210 }, { "epoch": 0.52, "learning_rate": 0.00022215013181053499, "loss": 0.024, "step": 200220 }, { "epoch": 0.52, "learning_rate": 0.0002221462435941635, "loss": 0.0496, "step": 200230 }, { "epoch": 0.52, "learning_rate": 0.00022214235537779204, "loss": 0.0284, "step": 200240 }, { "epoch": 0.52, "learning_rate": 0.00022213846716142056, "loss": 0.016, "step": 200250 }, { "epoch": 0.52, "learning_rate": 0.00022213457894504913, "loss": 0.0203, "step": 200260 }, { "epoch": 0.52, "learning_rate": 0.00022213069072867764, "loss": 0.0208, "step": 200270 }, { "epoch": 0.52, "learning_rate": 0.00022212680251230618, "loss": 0.0184, "step": 200280 }, { "epoch": 0.52, "learning_rate": 0.0002221229142959347, "loss": 0.0161, "step": 200290 }, { "epoch": 0.52, "learning_rate": 0.00022211902607956327, "loss": 0.0209, "step": 200300 }, { "epoch": 0.52, "learning_rate": 0.0002221151378631918, "loss": 0.0183, "step": 200310 }, { "epoch": 0.52, "learning_rate": 0.00022211124964682032, "loss": 0.0181, "step": 200320 }, { "epoch": 0.52, "learning_rate": 0.00022210736143044884, "loss": 0.019, "step": 200330 }, { "epoch": 0.52, "learning_rate": 0.0002221034732140774, "loss": 0.0152, "step": 200340 }, { "epoch": 0.52, "learning_rate": 0.00022209958499770595, "loss": 0.0183, "step": 200350 }, { "epoch": 0.52, "learning_rate": 0.00022209569678133446, "loss": 0.0164, "step": 200360 }, { "epoch": 0.52, "learning_rate": 0.000222091808564963, "loss": 0.0239, "step": 200370 }, { "epoch": 0.52, "learning_rate": 0.00022208792034859154, "loss": 0.0138, "step": 200380 }, { "epoch": 0.52, "learning_rate": 0.00022208403213222009, "loss": 0.0192, "step": 200390 }, { "epoch": 0.52, "learning_rate": 0.0002220801439158486, "loss": 0.0154, "step": 200400 }, { "epoch": 0.52, "learning_rate": 0.00022207625569947714, "loss": 0.0181, "step": 200410 }, { "epoch": 0.52, "learning_rate": 0.00022207236748310568, "loss": 0.018, "step": 200420 }, { "epoch": 0.52, "learning_rate": 0.00022206847926673423, "loss": 0.0235, "step": 200430 }, { "epoch": 0.52, "learning_rate": 0.00022206459105036274, "loss": 0.023, "step": 200440 }, { "epoch": 0.52, "learning_rate": 0.00022206070283399128, "loss": 0.0251, "step": 200450 }, { "epoch": 0.52, "learning_rate": 0.00022205681461761985, "loss": 0.0182, "step": 200460 }, { "epoch": 0.52, "learning_rate": 0.00022205292640124836, "loss": 0.0168, "step": 200470 }, { "epoch": 0.52, "learning_rate": 0.0002220490381848769, "loss": 0.0182, "step": 200480 }, { "epoch": 0.52, "learning_rate": 0.00022204514996850542, "loss": 0.0203, "step": 200490 }, { "epoch": 0.52, "learning_rate": 0.00022204126175213394, "loss": 0.0189, "step": 200500 }, { "epoch": 0.52, "learning_rate": 0.0002220373735357625, "loss": 0.0145, "step": 200510 }, { "epoch": 0.52, "learning_rate": 0.00022203348531939105, "loss": 0.0162, "step": 200520 }, { "epoch": 0.52, "learning_rate": 0.00022202959710301956, "loss": 0.0197, "step": 200530 }, { "epoch": 0.52, "learning_rate": 0.0002220257088866481, "loss": 0.0184, "step": 200540 }, { "epoch": 0.52, "learning_rate": 0.00022202182067027664, "loss": 0.0228, "step": 200550 }, { "epoch": 0.52, "learning_rate": 0.00022201793245390519, "loss": 0.0123, "step": 200560 }, { "epoch": 0.52, "learning_rate": 0.0002220140442375337, "loss": 0.0186, "step": 200570 }, { "epoch": 0.52, "learning_rate": 0.00022201015602116224, "loss": 0.0172, "step": 200580 }, { "epoch": 0.52, "learning_rate": 0.00022200626780479078, "loss": 0.0153, "step": 200590 }, { "epoch": 0.52, "learning_rate": 0.00022200237958841932, "loss": 0.0225, "step": 200600 }, { "epoch": 0.52, "learning_rate": 0.00022199849137204784, "loss": 0.0175, "step": 200610 }, { "epoch": 0.52, "learning_rate": 0.00022199460315567638, "loss": 0.019, "step": 200620 }, { "epoch": 0.52, "learning_rate": 0.00022199071493930495, "loss": 0.0189, "step": 200630 }, { "epoch": 0.52, "learning_rate": 0.00022198682672293346, "loss": 0.0162, "step": 200640 }, { "epoch": 0.52, "learning_rate": 0.00022198293850656198, "loss": 0.0165, "step": 200650 }, { "epoch": 0.52, "learning_rate": 0.00022197905029019052, "loss": 0.0181, "step": 200660 }, { "epoch": 0.52, "learning_rate": 0.0002219751620738191, "loss": 0.0239, "step": 200670 }, { "epoch": 0.52, "learning_rate": 0.0002219712738574476, "loss": 0.0181, "step": 200680 }, { "epoch": 0.52, "learning_rate": 0.00022196738564107614, "loss": 0.0207, "step": 200690 }, { "epoch": 0.52, "learning_rate": 0.00022196349742470466, "loss": 0.0178, "step": 200700 }, { "epoch": 0.52, "learning_rate": 0.00022195960920833323, "loss": 0.0156, "step": 200710 }, { "epoch": 0.52, "learning_rate": 0.00022195572099196174, "loss": 0.0135, "step": 200720 }, { "epoch": 0.52, "learning_rate": 0.00022195183277559028, "loss": 0.0214, "step": 200730 }, { "epoch": 0.52, "learning_rate": 0.0002219479445592188, "loss": 0.0165, "step": 200740 }, { "epoch": 0.52, "learning_rate": 0.00022194405634284734, "loss": 0.0142, "step": 200750 }, { "epoch": 0.52, "learning_rate": 0.00022194016812647588, "loss": 0.0159, "step": 200760 }, { "epoch": 0.52, "learning_rate": 0.00022193627991010442, "loss": 0.0215, "step": 200770 }, { "epoch": 0.52, "learning_rate": 0.00022193239169373294, "loss": 0.0219, "step": 200780 }, { "epoch": 0.52, "learning_rate": 0.00022192850347736148, "loss": 0.0185, "step": 200790 }, { "epoch": 0.52, "learning_rate": 0.00022192461526099002, "loss": 0.0192, "step": 200800 }, { "epoch": 0.52, "learning_rate": 0.00022192072704461856, "loss": 0.0179, "step": 200810 }, { "epoch": 0.52, "learning_rate": 0.00022191683882824708, "loss": 0.0156, "step": 200820 }, { "epoch": 0.52, "learning_rate": 0.00022191295061187562, "loss": 0.0168, "step": 200830 }, { "epoch": 0.52, "learning_rate": 0.0002219090623955042, "loss": 0.0167, "step": 200840 }, { "epoch": 0.52, "learning_rate": 0.0002219051741791327, "loss": 0.0259, "step": 200850 }, { "epoch": 0.52, "learning_rate": 0.00022190128596276124, "loss": 0.0182, "step": 200860 }, { "epoch": 0.52, "learning_rate": 0.00022189739774638976, "loss": 0.0175, "step": 200870 }, { "epoch": 0.52, "learning_rate": 0.00022189350953001833, "loss": 0.0175, "step": 200880 }, { "epoch": 0.52, "learning_rate": 0.00022188962131364684, "loss": 0.0151, "step": 200890 }, { "epoch": 0.52, "learning_rate": 0.00022188573309727538, "loss": 0.0176, "step": 200900 }, { "epoch": 0.52, "learning_rate": 0.0002218818448809039, "loss": 0.015, "step": 200910 }, { "epoch": 0.52, "learning_rate": 0.00022187795666453247, "loss": 0.0207, "step": 200920 }, { "epoch": 0.52, "learning_rate": 0.00022187406844816098, "loss": 0.0207, "step": 200930 }, { "epoch": 0.52, "learning_rate": 0.00022187018023178952, "loss": 0.0206, "step": 200940 }, { "epoch": 0.52, "learning_rate": 0.00022186629201541804, "loss": 0.0171, "step": 200950 }, { "epoch": 0.52, "learning_rate": 0.0002218624037990466, "loss": 0.0172, "step": 200960 }, { "epoch": 0.52, "learning_rate": 0.00022185851558267512, "loss": 0.0187, "step": 200970 }, { "epoch": 0.52, "learning_rate": 0.00022185462736630366, "loss": 0.0195, "step": 200980 }, { "epoch": 0.52, "learning_rate": 0.00022185073914993218, "loss": 0.0185, "step": 200990 }, { "epoch": 0.52, "learning_rate": 0.00022184685093356072, "loss": 0.0169, "step": 201000 }, { "epoch": 0.52, "eval_cer": 0.8817600714374692, "eval_loss": 0.011896415613591671, "eval_runtime": 108.2669, "eval_samples_per_second": 18.473, "eval_steps_per_second": 4.618, "step": 201000 }, { "epoch": 0.52, "learning_rate": 0.0002218429627171893, "loss": 0.0207, "step": 201010 }, { "epoch": 0.52, "learning_rate": 0.0002218390745008178, "loss": 0.028, "step": 201020 }, { "epoch": 0.52, "learning_rate": 0.00022183518628444634, "loss": 0.0166, "step": 201030 }, { "epoch": 0.52, "learning_rate": 0.00022183129806807486, "loss": 0.017, "step": 201040 }, { "epoch": 0.52, "learning_rate": 0.00022182740985170343, "loss": 0.0207, "step": 201050 }, { "epoch": 0.52, "learning_rate": 0.00022182352163533194, "loss": 0.0169, "step": 201060 }, { "epoch": 0.52, "learning_rate": 0.00022181963341896048, "loss": 0.0153, "step": 201070 }, { "epoch": 0.52, "learning_rate": 0.000221815745202589, "loss": 0.0116, "step": 201080 }, { "epoch": 0.52, "learning_rate": 0.00022181185698621757, "loss": 0.0135, "step": 201090 }, { "epoch": 0.52, "learning_rate": 0.00022180796876984608, "loss": 0.0184, "step": 201100 }, { "epoch": 0.52, "learning_rate": 0.00022180408055347462, "loss": 0.0157, "step": 201110 }, { "epoch": 0.52, "learning_rate": 0.00022180019233710314, "loss": 0.0191, "step": 201120 }, { "epoch": 0.52, "learning_rate": 0.0002217963041207317, "loss": 0.0149, "step": 201130 }, { "epoch": 0.52, "learning_rate": 0.00022179241590436022, "loss": 0.0159, "step": 201140 }, { "epoch": 0.52, "learning_rate": 0.00022178852768798876, "loss": 0.017, "step": 201150 }, { "epoch": 0.52, "learning_rate": 0.00022178463947161728, "loss": 0.0182, "step": 201160 }, { "epoch": 0.52, "learning_rate": 0.00022178075125524585, "loss": 0.0161, "step": 201170 }, { "epoch": 0.52, "learning_rate": 0.0002217768630388744, "loss": 0.0169, "step": 201180 }, { "epoch": 0.52, "learning_rate": 0.0002217729748225029, "loss": 0.0142, "step": 201190 }, { "epoch": 0.52, "learning_rate": 0.00022176908660613144, "loss": 0.0165, "step": 201200 }, { "epoch": 0.52, "learning_rate": 0.00022176519838975998, "loss": 0.0138, "step": 201210 }, { "epoch": 0.52, "learning_rate": 0.00022176131017338853, "loss": 0.0174, "step": 201220 }, { "epoch": 0.52, "learning_rate": 0.00022175742195701704, "loss": 0.0131, "step": 201230 }, { "epoch": 0.52, "learning_rate": 0.00022175353374064558, "loss": 0.021, "step": 201240 }, { "epoch": 0.52, "learning_rate": 0.0002217496455242741, "loss": 0.0198, "step": 201250 }, { "epoch": 0.52, "learning_rate": 0.00022174575730790267, "loss": 0.0176, "step": 201260 }, { "epoch": 0.52, "learning_rate": 0.00022174186909153118, "loss": 0.0157, "step": 201270 }, { "epoch": 0.52, "learning_rate": 0.00022173798087515972, "loss": 0.0172, "step": 201280 }, { "epoch": 0.52, "learning_rate": 0.00022173409265878824, "loss": 0.0243, "step": 201290 }, { "epoch": 0.52, "learning_rate": 0.0002217302044424168, "loss": 0.0173, "step": 201300 }, { "epoch": 0.52, "learning_rate": 0.00022172631622604532, "loss": 0.0169, "step": 201310 }, { "epoch": 0.52, "learning_rate": 0.00022172242800967386, "loss": 0.0192, "step": 201320 }, { "epoch": 0.52, "learning_rate": 0.00022171853979330238, "loss": 0.02, "step": 201330 }, { "epoch": 0.52, "learning_rate": 0.00022171465157693094, "loss": 0.0189, "step": 201340 }, { "epoch": 0.52, "learning_rate": 0.0002217107633605595, "loss": 0.0142, "step": 201350 }, { "epoch": 0.52, "learning_rate": 0.000221706875144188, "loss": 0.0197, "step": 201360 }, { "epoch": 0.52, "learning_rate": 0.00022170298692781652, "loss": 0.0196, "step": 201370 }, { "epoch": 0.52, "learning_rate": 0.00022169909871144508, "loss": 0.0146, "step": 201380 }, { "epoch": 0.52, "learning_rate": 0.00022169521049507363, "loss": 0.0147, "step": 201390 }, { "epoch": 0.52, "learning_rate": 0.00022169132227870214, "loss": 0.0175, "step": 201400 }, { "epoch": 0.52, "learning_rate": 0.00022168743406233068, "loss": 0.0181, "step": 201410 }, { "epoch": 0.52, "learning_rate": 0.00022168354584595922, "loss": 0.0148, "step": 201420 }, { "epoch": 0.52, "learning_rate": 0.00022167965762958777, "loss": 0.0188, "step": 201430 }, { "epoch": 0.52, "learning_rate": 0.00022167576941321628, "loss": 0.0184, "step": 201440 }, { "epoch": 0.52, "learning_rate": 0.00022167188119684482, "loss": 0.0174, "step": 201450 }, { "epoch": 0.52, "learning_rate": 0.00022166799298047336, "loss": 0.018, "step": 201460 }, { "epoch": 0.52, "learning_rate": 0.0002216641047641019, "loss": 0.0196, "step": 201470 }, { "epoch": 0.52, "learning_rate": 0.00022166021654773042, "loss": 0.0168, "step": 201480 }, { "epoch": 0.52, "learning_rate": 0.00022165632833135896, "loss": 0.0195, "step": 201490 }, { "epoch": 0.52, "learning_rate": 0.00022165244011498748, "loss": 0.0158, "step": 201500 }, { "epoch": 0.52, "learning_rate": 0.00022164855189861604, "loss": 0.0183, "step": 201510 }, { "epoch": 0.52, "learning_rate": 0.00022164466368224456, "loss": 0.0186, "step": 201520 }, { "epoch": 0.52, "learning_rate": 0.0002216407754658731, "loss": 0.017, "step": 201530 }, { "epoch": 0.52, "learning_rate": 0.00022163688724950161, "loss": 0.0204, "step": 201540 }, { "epoch": 0.52, "learning_rate": 0.00022163299903313018, "loss": 0.0152, "step": 201550 }, { "epoch": 0.52, "learning_rate": 0.00022162911081675873, "loss": 0.03, "step": 201560 }, { "epoch": 0.52, "learning_rate": 0.00022162522260038724, "loss": 0.0166, "step": 201570 }, { "epoch": 0.52, "learning_rate": 0.00022162133438401578, "loss": 0.0193, "step": 201580 }, { "epoch": 0.52, "learning_rate": 0.00022161744616764432, "loss": 0.0355, "step": 201590 }, { "epoch": 0.52, "learning_rate": 0.00022161355795127286, "loss": 0.0154, "step": 201600 }, { "epoch": 0.52, "learning_rate": 0.00022160966973490138, "loss": 0.0166, "step": 201610 }, { "epoch": 0.52, "learning_rate": 0.00022160578151852992, "loss": 0.0142, "step": 201620 }, { "epoch": 0.52, "learning_rate": 0.00022160189330215846, "loss": 0.0162, "step": 201630 }, { "epoch": 0.52, "learning_rate": 0.000221598005085787, "loss": 0.0181, "step": 201640 }, { "epoch": 0.52, "learning_rate": 0.00022159411686941552, "loss": 0.0184, "step": 201650 }, { "epoch": 0.52, "learning_rate": 0.00022159022865304406, "loss": 0.0197, "step": 201660 }, { "epoch": 0.52, "learning_rate": 0.00022158634043667263, "loss": 0.0167, "step": 201670 }, { "epoch": 0.52, "learning_rate": 0.00022158245222030114, "loss": 0.0184, "step": 201680 }, { "epoch": 0.52, "learning_rate": 0.00022157856400392966, "loss": 0.018, "step": 201690 }, { "epoch": 0.52, "learning_rate": 0.0002215746757875582, "loss": 0.0155, "step": 201700 }, { "epoch": 0.52, "learning_rate": 0.00022157078757118677, "loss": 0.0171, "step": 201710 }, { "epoch": 0.52, "learning_rate": 0.00022156689935481528, "loss": 0.0152, "step": 201720 }, { "epoch": 0.52, "learning_rate": 0.00022156301113844382, "loss": 0.0196, "step": 201730 }, { "epoch": 0.52, "learning_rate": 0.00022155912292207234, "loss": 0.0183, "step": 201740 }, { "epoch": 0.52, "learning_rate": 0.00022155523470570088, "loss": 0.0167, "step": 201750 }, { "epoch": 0.52, "learning_rate": 0.00022155134648932942, "loss": 0.0176, "step": 201760 }, { "epoch": 0.52, "learning_rate": 0.00022154745827295796, "loss": 0.0151, "step": 201770 }, { "epoch": 0.52, "learning_rate": 0.00022154357005658648, "loss": 0.0138, "step": 201780 }, { "epoch": 0.52, "learning_rate": 0.00022153968184021502, "loss": 0.0168, "step": 201790 }, { "epoch": 0.52, "learning_rate": 0.00022153579362384356, "loss": 0.0159, "step": 201800 }, { "epoch": 0.52, "learning_rate": 0.0002215319054074721, "loss": 0.0159, "step": 201810 }, { "epoch": 0.52, "learning_rate": 0.00022152801719110062, "loss": 0.0166, "step": 201820 }, { "epoch": 0.52, "learning_rate": 0.00022152412897472916, "loss": 0.0177, "step": 201830 }, { "epoch": 0.52, "learning_rate": 0.0002215202407583577, "loss": 0.0156, "step": 201840 }, { "epoch": 0.52, "learning_rate": 0.00022151635254198624, "loss": 0.0202, "step": 201850 }, { "epoch": 0.52, "learning_rate": 0.00022151246432561476, "loss": 0.0173, "step": 201860 }, { "epoch": 0.52, "learning_rate": 0.0002215085761092433, "loss": 0.0174, "step": 201870 }, { "epoch": 0.52, "learning_rate": 0.00022150468789287187, "loss": 0.0183, "step": 201880 }, { "epoch": 0.52, "learning_rate": 0.00022150079967650038, "loss": 0.0208, "step": 201890 }, { "epoch": 0.52, "learning_rate": 0.00022149691146012892, "loss": 0.0155, "step": 201900 }, { "epoch": 0.52, "learning_rate": 0.00022149302324375744, "loss": 0.0185, "step": 201910 }, { "epoch": 0.52, "learning_rate": 0.000221489135027386, "loss": 0.0158, "step": 201920 }, { "epoch": 0.52, "learning_rate": 0.00022148524681101452, "loss": 0.0185, "step": 201930 }, { "epoch": 0.52, "learning_rate": 0.00022148135859464306, "loss": 0.0179, "step": 201940 }, { "epoch": 0.52, "learning_rate": 0.00022147747037827158, "loss": 0.0138, "step": 201950 }, { "epoch": 0.52, "learning_rate": 0.00022147358216190012, "loss": 0.0157, "step": 201960 }, { "epoch": 0.52, "learning_rate": 0.00022146969394552866, "loss": 0.0132, "step": 201970 }, { "epoch": 0.52, "learning_rate": 0.0002214658057291572, "loss": 0.0147, "step": 201980 }, { "epoch": 0.52, "learning_rate": 0.00022146191751278572, "loss": 0.0142, "step": 201990 }, { "epoch": 0.52, "learning_rate": 0.00022145802929641426, "loss": 0.0185, "step": 202000 }, { "epoch": 0.52, "eval_cer": 0.8818104583670996, "eval_loss": 0.011379092931747437, "eval_runtime": 107.8594, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 202000 }, { "epoch": 0.52, "learning_rate": 0.0002214541410800428, "loss": 0.0207, "step": 202010 }, { "epoch": 0.52, "learning_rate": 0.00022145025286367134, "loss": 0.015, "step": 202020 }, { "epoch": 0.52, "learning_rate": 0.00022144636464729986, "loss": 0.0144, "step": 202030 }, { "epoch": 0.52, "learning_rate": 0.0002214424764309284, "loss": 0.0168, "step": 202040 }, { "epoch": 0.52, "learning_rate": 0.00022143858821455697, "loss": 0.014, "step": 202050 }, { "epoch": 0.52, "learning_rate": 0.00022143469999818548, "loss": 0.0175, "step": 202060 }, { "epoch": 0.52, "learning_rate": 0.00022143081178181402, "loss": 0.0181, "step": 202070 }, { "epoch": 0.52, "learning_rate": 0.00022142692356544254, "loss": 0.0131, "step": 202080 }, { "epoch": 0.52, "learning_rate": 0.0002214230353490711, "loss": 0.0222, "step": 202090 }, { "epoch": 0.52, "learning_rate": 0.00022141914713269962, "loss": 0.018, "step": 202100 }, { "epoch": 0.52, "learning_rate": 0.00022141525891632816, "loss": 0.0162, "step": 202110 }, { "epoch": 0.52, "learning_rate": 0.00022141137069995668, "loss": 0.0148, "step": 202120 }, { "epoch": 0.52, "learning_rate": 0.00022140748248358525, "loss": 0.0136, "step": 202130 }, { "epoch": 0.52, "learning_rate": 0.00022140359426721376, "loss": 0.0191, "step": 202140 }, { "epoch": 0.52, "learning_rate": 0.0002213997060508423, "loss": 0.0174, "step": 202150 }, { "epoch": 0.52, "learning_rate": 0.00022139581783447082, "loss": 0.0158, "step": 202160 }, { "epoch": 0.52, "learning_rate": 0.00022139192961809939, "loss": 0.018, "step": 202170 }, { "epoch": 0.52, "learning_rate": 0.0002213880414017279, "loss": 0.0213, "step": 202180 }, { "epoch": 0.52, "learning_rate": 0.00022138415318535644, "loss": 0.0162, "step": 202190 }, { "epoch": 0.52, "learning_rate": 0.00022138026496898496, "loss": 0.0227, "step": 202200 }, { "epoch": 0.52, "learning_rate": 0.0002213763767526135, "loss": 0.0216, "step": 202210 }, { "epoch": 0.52, "learning_rate": 0.00022137248853624207, "loss": 0.0169, "step": 202220 }, { "epoch": 0.52, "learning_rate": 0.00022136860031987058, "loss": 0.0166, "step": 202230 }, { "epoch": 0.52, "learning_rate": 0.0002213647121034991, "loss": 0.0232, "step": 202240 }, { "epoch": 0.52, "learning_rate": 0.00022136082388712764, "loss": 0.0207, "step": 202250 }, { "epoch": 0.52, "learning_rate": 0.0002213569356707562, "loss": 0.0146, "step": 202260 }, { "epoch": 0.52, "learning_rate": 0.00022135304745438472, "loss": 0.0155, "step": 202270 }, { "epoch": 0.52, "learning_rate": 0.00022134915923801326, "loss": 0.0162, "step": 202280 }, { "epoch": 0.52, "learning_rate": 0.00022134527102164178, "loss": 0.0177, "step": 202290 }, { "epoch": 0.52, "learning_rate": 0.00022134138280527035, "loss": 0.0146, "step": 202300 }, { "epoch": 0.52, "learning_rate": 0.00022133749458889886, "loss": 0.0133, "step": 202310 }, { "epoch": 0.52, "learning_rate": 0.0002213336063725274, "loss": 0.015, "step": 202320 }, { "epoch": 0.52, "learning_rate": 0.00022132971815615592, "loss": 0.0186, "step": 202330 }, { "epoch": 0.52, "learning_rate": 0.00022132582993978449, "loss": 0.0219, "step": 202340 }, { "epoch": 0.52, "learning_rate": 0.000221321941723413, "loss": 0.0171, "step": 202350 }, { "epoch": 0.52, "learning_rate": 0.00022131805350704154, "loss": 0.0205, "step": 202360 }, { "epoch": 0.52, "learning_rate": 0.00022131416529067006, "loss": 0.0154, "step": 202370 }, { "epoch": 0.52, "learning_rate": 0.00022131027707429862, "loss": 0.0182, "step": 202380 }, { "epoch": 0.52, "learning_rate": 0.00022130638885792714, "loss": 0.017, "step": 202390 }, { "epoch": 0.52, "learning_rate": 0.00022130250064155568, "loss": 0.0166, "step": 202400 }, { "epoch": 0.52, "learning_rate": 0.0002212986124251842, "loss": 0.0176, "step": 202410 }, { "epoch": 0.52, "learning_rate": 0.00022129472420881276, "loss": 0.0218, "step": 202420 }, { "epoch": 0.52, "learning_rate": 0.0002212908359924413, "loss": 0.0218, "step": 202430 }, { "epoch": 0.52, "learning_rate": 0.00022128694777606982, "loss": 0.0193, "step": 202440 }, { "epoch": 0.52, "learning_rate": 0.00022128305955969836, "loss": 0.0202, "step": 202450 }, { "epoch": 0.52, "learning_rate": 0.00022127917134332688, "loss": 0.0216, "step": 202460 }, { "epoch": 0.52, "learning_rate": 0.00022127528312695545, "loss": 0.0183, "step": 202470 }, { "epoch": 0.52, "learning_rate": 0.00022127139491058396, "loss": 0.0132, "step": 202480 }, { "epoch": 0.52, "learning_rate": 0.0002212675066942125, "loss": 0.0229, "step": 202490 }, { "epoch": 0.52, "learning_rate": 0.00022126361847784102, "loss": 0.0224, "step": 202500 }, { "epoch": 0.52, "learning_rate": 0.00022125973026146958, "loss": 0.0206, "step": 202510 }, { "epoch": 0.52, "learning_rate": 0.0002212558420450981, "loss": 0.0163, "step": 202520 }, { "epoch": 0.52, "learning_rate": 0.00022125195382872664, "loss": 0.0214, "step": 202530 }, { "epoch": 0.53, "learning_rate": 0.00022124806561235516, "loss": 0.0169, "step": 202540 }, { "epoch": 0.53, "learning_rate": 0.00022124417739598372, "loss": 0.019, "step": 202550 }, { "epoch": 0.53, "learning_rate": 0.00022124028917961224, "loss": 0.0175, "step": 202560 }, { "epoch": 0.53, "learning_rate": 0.00022123640096324078, "loss": 0.0176, "step": 202570 }, { "epoch": 0.53, "learning_rate": 0.0002212325127468693, "loss": 0.0225, "step": 202580 }, { "epoch": 0.53, "learning_rate": 0.00022122862453049786, "loss": 0.0151, "step": 202590 }, { "epoch": 0.53, "learning_rate": 0.0002212247363141264, "loss": 0.0151, "step": 202600 }, { "epoch": 0.53, "learning_rate": 0.00022122084809775492, "loss": 0.0197, "step": 202610 }, { "epoch": 0.53, "learning_rate": 0.00022121695988138346, "loss": 0.0174, "step": 202620 }, { "epoch": 0.53, "learning_rate": 0.000221213071665012, "loss": 0.0175, "step": 202630 }, { "epoch": 0.53, "learning_rate": 0.00022120918344864054, "loss": 0.0161, "step": 202640 }, { "epoch": 0.53, "learning_rate": 0.00022120529523226906, "loss": 0.0157, "step": 202650 }, { "epoch": 0.53, "learning_rate": 0.0002212014070158976, "loss": 0.0161, "step": 202660 }, { "epoch": 0.53, "learning_rate": 0.00022119751879952614, "loss": 0.019, "step": 202670 }, { "epoch": 0.53, "learning_rate": 0.00022119363058315468, "loss": 0.0176, "step": 202680 }, { "epoch": 0.53, "learning_rate": 0.0002211897423667832, "loss": 0.0193, "step": 202690 }, { "epoch": 0.53, "learning_rate": 0.00022118585415041174, "loss": 0.0152, "step": 202700 }, { "epoch": 0.53, "learning_rate": 0.00022118196593404025, "loss": 0.0177, "step": 202710 }, { "epoch": 0.53, "learning_rate": 0.00022117807771766882, "loss": 0.0188, "step": 202720 }, { "epoch": 0.53, "learning_rate": 0.00022117418950129734, "loss": 0.0173, "step": 202730 }, { "epoch": 0.53, "learning_rate": 0.00022117030128492588, "loss": 0.0166, "step": 202740 }, { "epoch": 0.53, "learning_rate": 0.0002211664130685544, "loss": 0.0151, "step": 202750 }, { "epoch": 0.53, "learning_rate": 0.00022116252485218296, "loss": 0.0185, "step": 202760 }, { "epoch": 0.53, "learning_rate": 0.0002211586366358115, "loss": 0.0134, "step": 202770 }, { "epoch": 0.53, "learning_rate": 0.00022115474841944002, "loss": 0.0177, "step": 202780 }, { "epoch": 0.53, "learning_rate": 0.00022115086020306856, "loss": 0.0134, "step": 202790 }, { "epoch": 0.53, "learning_rate": 0.0002211469719866971, "loss": 0.0159, "step": 202800 }, { "epoch": 0.53, "learning_rate": 0.00022114308377032564, "loss": 0.0213, "step": 202810 }, { "epoch": 0.53, "learning_rate": 0.00022113919555395416, "loss": 0.0207, "step": 202820 }, { "epoch": 0.53, "learning_rate": 0.0002211353073375827, "loss": 0.0201, "step": 202830 }, { "epoch": 0.53, "learning_rate": 0.00022113141912121124, "loss": 0.0167, "step": 202840 }, { "epoch": 0.53, "learning_rate": 0.00022112753090483978, "loss": 0.0165, "step": 202850 }, { "epoch": 0.53, "learning_rate": 0.0002211236426884683, "loss": 0.0191, "step": 202860 }, { "epoch": 0.53, "learning_rate": 0.00022111975447209684, "loss": 0.0185, "step": 202870 }, { "epoch": 0.53, "learning_rate": 0.00022111586625572538, "loss": 0.0191, "step": 202880 }, { "epoch": 0.53, "learning_rate": 0.00022111197803935392, "loss": 0.0241, "step": 202890 }, { "epoch": 0.53, "learning_rate": 0.00022110808982298244, "loss": 0.0172, "step": 202900 }, { "epoch": 0.53, "learning_rate": 0.00022110420160661098, "loss": 0.0184, "step": 202910 }, { "epoch": 0.53, "learning_rate": 0.00022110031339023955, "loss": 0.0182, "step": 202920 }, { "epoch": 0.53, "learning_rate": 0.00022109642517386806, "loss": 0.0161, "step": 202930 }, { "epoch": 0.53, "learning_rate": 0.0002210925369574966, "loss": 0.0154, "step": 202940 }, { "epoch": 0.53, "learning_rate": 0.00022108864874112512, "loss": 0.0136, "step": 202950 }, { "epoch": 0.53, "learning_rate": 0.00022108476052475363, "loss": 0.0157, "step": 202960 }, { "epoch": 0.53, "learning_rate": 0.0002210808723083822, "loss": 0.0189, "step": 202970 }, { "epoch": 0.53, "learning_rate": 0.00022107698409201074, "loss": 0.0197, "step": 202980 }, { "epoch": 0.53, "learning_rate": 0.00022107309587563926, "loss": 0.0154, "step": 202990 }, { "epoch": 0.53, "learning_rate": 0.0002210692076592678, "loss": 0.0149, "step": 203000 }, { "epoch": 0.53, "eval_cer": 0.8817866645392185, "eval_loss": 0.011468823999166489, "eval_runtime": 107.5391, "eval_samples_per_second": 18.598, "eval_steps_per_second": 4.649, "step": 203000 }, { "epoch": 0.53, "learning_rate": 0.00022106531944289634, "loss": 0.02, "step": 203010 }, { "epoch": 0.53, "learning_rate": 0.00022106143122652488, "loss": 0.0127, "step": 203020 }, { "epoch": 0.53, "learning_rate": 0.0002210575430101534, "loss": 0.019, "step": 203030 }, { "epoch": 0.53, "learning_rate": 0.00022105365479378194, "loss": 0.0138, "step": 203040 }, { "epoch": 0.53, "learning_rate": 0.00022104976657741048, "loss": 0.016, "step": 203050 }, { "epoch": 0.53, "learning_rate": 0.00022104587836103902, "loss": 0.0183, "step": 203060 }, { "epoch": 0.53, "learning_rate": 0.00022104199014466754, "loss": 0.0164, "step": 203070 }, { "epoch": 0.53, "learning_rate": 0.00022103810192829608, "loss": 0.0179, "step": 203080 }, { "epoch": 0.53, "learning_rate": 0.00022103421371192465, "loss": 0.0173, "step": 203090 }, { "epoch": 0.53, "learning_rate": 0.00022103032549555316, "loss": 0.0193, "step": 203100 }, { "epoch": 0.53, "learning_rate": 0.00022102643727918168, "loss": 0.0225, "step": 203110 }, { "epoch": 0.53, "learning_rate": 0.00022102254906281022, "loss": 0.0158, "step": 203120 }, { "epoch": 0.53, "learning_rate": 0.0002210186608464388, "loss": 0.0169, "step": 203130 }, { "epoch": 0.53, "learning_rate": 0.0002210147726300673, "loss": 0.0273, "step": 203140 }, { "epoch": 0.53, "learning_rate": 0.00022101088441369584, "loss": 0.0196, "step": 203150 }, { "epoch": 0.53, "learning_rate": 0.00022100699619732436, "loss": 0.0126, "step": 203160 }, { "epoch": 0.53, "learning_rate": 0.00022100310798095293, "loss": 0.0133, "step": 203170 }, { "epoch": 0.53, "learning_rate": 0.00022099921976458144, "loss": 0.0187, "step": 203180 }, { "epoch": 0.53, "learning_rate": 0.00022099533154820998, "loss": 0.0183, "step": 203190 }, { "epoch": 0.53, "learning_rate": 0.0002209914433318385, "loss": 0.0174, "step": 203200 }, { "epoch": 0.53, "learning_rate": 0.00022098755511546704, "loss": 0.0171, "step": 203210 }, { "epoch": 0.53, "learning_rate": 0.00022098366689909558, "loss": 0.0161, "step": 203220 }, { "epoch": 0.53, "learning_rate": 0.00022097977868272412, "loss": 0.0141, "step": 203230 }, { "epoch": 0.53, "learning_rate": 0.00022097589046635264, "loss": 0.0164, "step": 203240 }, { "epoch": 0.53, "learning_rate": 0.00022097200224998118, "loss": 0.0217, "step": 203250 }, { "epoch": 0.53, "learning_rate": 0.00022096811403360975, "loss": 0.0207, "step": 203260 }, { "epoch": 0.53, "learning_rate": 0.00022096422581723826, "loss": 0.0187, "step": 203270 }, { "epoch": 0.53, "learning_rate": 0.00022096033760086678, "loss": 0.0193, "step": 203280 }, { "epoch": 0.53, "learning_rate": 0.00022095644938449532, "loss": 0.0174, "step": 203290 }, { "epoch": 0.53, "learning_rate": 0.00022095256116812389, "loss": 0.0162, "step": 203300 }, { "epoch": 0.53, "learning_rate": 0.0002209486729517524, "loss": 0.014, "step": 203310 }, { "epoch": 0.53, "learning_rate": 0.00022094478473538094, "loss": 0.014, "step": 203320 }, { "epoch": 0.53, "learning_rate": 0.00022094089651900946, "loss": 0.0205, "step": 203330 }, { "epoch": 0.53, "learning_rate": 0.00022093700830263803, "loss": 0.0188, "step": 203340 }, { "epoch": 0.53, "learning_rate": 0.00022093312008626654, "loss": 0.0212, "step": 203350 }, { "epoch": 0.53, "learning_rate": 0.00022092923186989508, "loss": 0.0195, "step": 203360 }, { "epoch": 0.53, "learning_rate": 0.0002209253436535236, "loss": 0.0118, "step": 203370 }, { "epoch": 0.53, "learning_rate": 0.00022092145543715217, "loss": 0.0157, "step": 203380 }, { "epoch": 0.53, "learning_rate": 0.00022091756722078068, "loss": 0.0169, "step": 203390 }, { "epoch": 0.53, "learning_rate": 0.00022091367900440922, "loss": 0.0154, "step": 203400 }, { "epoch": 0.53, "learning_rate": 0.00022090979078803774, "loss": 0.0164, "step": 203410 }, { "epoch": 0.53, "learning_rate": 0.0002209059025716663, "loss": 0.0164, "step": 203420 }, { "epoch": 0.53, "learning_rate": 0.00022090201435529482, "loss": 0.0243, "step": 203430 }, { "epoch": 0.53, "learning_rate": 0.00022089812613892336, "loss": 0.0247, "step": 203440 }, { "epoch": 0.53, "learning_rate": 0.00022089423792255188, "loss": 0.022, "step": 203450 }, { "epoch": 0.53, "learning_rate": 0.00022089034970618042, "loss": 0.0153, "step": 203460 }, { "epoch": 0.53, "learning_rate": 0.00022088646148980899, "loss": 0.0162, "step": 203470 }, { "epoch": 0.53, "learning_rate": 0.0002208825732734375, "loss": 0.022, "step": 203480 }, { "epoch": 0.53, "learning_rate": 0.00022087868505706604, "loss": 0.0156, "step": 203490 }, { "epoch": 0.53, "learning_rate": 0.00022087479684069456, "loss": 0.0227, "step": 203500 }, { "epoch": 0.53, "learning_rate": 0.00022087090862432313, "loss": 0.0156, "step": 203510 }, { "epoch": 0.53, "learning_rate": 0.00022086702040795164, "loss": 0.0137, "step": 203520 }, { "epoch": 0.53, "learning_rate": 0.00022086313219158018, "loss": 0.0186, "step": 203530 }, { "epoch": 0.53, "learning_rate": 0.0002208592439752087, "loss": 0.0172, "step": 203540 }, { "epoch": 0.53, "learning_rate": 0.00022085535575883726, "loss": 0.0187, "step": 203550 }, { "epoch": 0.53, "learning_rate": 0.00022085146754246578, "loss": 0.0182, "step": 203560 }, { "epoch": 0.53, "learning_rate": 0.00022084757932609432, "loss": 0.0176, "step": 203570 }, { "epoch": 0.53, "learning_rate": 0.00022084369110972284, "loss": 0.0183, "step": 203580 }, { "epoch": 0.53, "learning_rate": 0.0002208398028933514, "loss": 0.0145, "step": 203590 }, { "epoch": 0.53, "learning_rate": 0.00022083591467697992, "loss": 0.0226, "step": 203600 }, { "epoch": 0.53, "learning_rate": 0.00022083202646060846, "loss": 0.0149, "step": 203610 }, { "epoch": 0.53, "learning_rate": 0.00022082813824423697, "loss": 0.013, "step": 203620 }, { "epoch": 0.53, "learning_rate": 0.00022082425002786554, "loss": 0.0212, "step": 203630 }, { "epoch": 0.53, "learning_rate": 0.00022082036181149408, "loss": 0.0159, "step": 203640 }, { "epoch": 0.53, "learning_rate": 0.0002208164735951226, "loss": 0.016, "step": 203650 }, { "epoch": 0.53, "learning_rate": 0.00022081258537875114, "loss": 0.0151, "step": 203660 }, { "epoch": 0.53, "learning_rate": 0.00022080869716237968, "loss": 0.0171, "step": 203670 }, { "epoch": 0.53, "learning_rate": 0.00022080480894600822, "loss": 0.0134, "step": 203680 }, { "epoch": 0.53, "learning_rate": 0.00022080092072963674, "loss": 0.017, "step": 203690 }, { "epoch": 0.53, "learning_rate": 0.00022079703251326528, "loss": 0.0188, "step": 203700 }, { "epoch": 0.53, "learning_rate": 0.0002207931442968938, "loss": 0.0191, "step": 203710 }, { "epoch": 0.53, "learning_rate": 0.00022078925608052236, "loss": 0.0182, "step": 203720 }, { "epoch": 0.53, "learning_rate": 0.00022078536786415088, "loss": 0.0128, "step": 203730 }, { "epoch": 0.53, "learning_rate": 0.00022078147964777942, "loss": 0.0155, "step": 203740 }, { "epoch": 0.53, "learning_rate": 0.00022077759143140793, "loss": 0.0169, "step": 203750 }, { "epoch": 0.53, "learning_rate": 0.0002207737032150365, "loss": 0.0156, "step": 203760 }, { "epoch": 0.53, "learning_rate": 0.00022076981499866502, "loss": 0.0172, "step": 203770 }, { "epoch": 0.53, "learning_rate": 0.00022076592678229356, "loss": 0.019, "step": 203780 }, { "epoch": 0.53, "learning_rate": 0.00022076203856592207, "loss": 0.0208, "step": 203790 }, { "epoch": 0.53, "learning_rate": 0.00022075815034955064, "loss": 0.0195, "step": 203800 }, { "epoch": 0.53, "learning_rate": 0.00022075426213317918, "loss": 0.0125, "step": 203810 }, { "epoch": 0.53, "learning_rate": 0.0002207503739168077, "loss": 0.0169, "step": 203820 }, { "epoch": 0.53, "learning_rate": 0.0002207464857004362, "loss": 0.0156, "step": 203830 }, { "epoch": 0.53, "learning_rate": 0.00022074259748406478, "loss": 0.016, "step": 203840 }, { "epoch": 0.53, "learning_rate": 0.00022073870926769332, "loss": 0.0174, "step": 203850 }, { "epoch": 0.53, "learning_rate": 0.00022073482105132184, "loss": 0.0182, "step": 203860 }, { "epoch": 0.53, "learning_rate": 0.00022073093283495038, "loss": 0.0151, "step": 203870 }, { "epoch": 0.53, "learning_rate": 0.00022072704461857892, "loss": 0.0167, "step": 203880 }, { "epoch": 0.53, "learning_rate": 0.00022072315640220746, "loss": 0.0153, "step": 203890 }, { "epoch": 0.53, "learning_rate": 0.00022071926818583598, "loss": 0.0167, "step": 203900 }, { "epoch": 0.53, "learning_rate": 0.00022071537996946452, "loss": 0.0152, "step": 203910 }, { "epoch": 0.53, "learning_rate": 0.00022071149175309306, "loss": 0.0166, "step": 203920 }, { "epoch": 0.53, "learning_rate": 0.0002207076035367216, "loss": 0.0173, "step": 203930 }, { "epoch": 0.53, "learning_rate": 0.00022070371532035012, "loss": 0.0204, "step": 203940 }, { "epoch": 0.53, "learning_rate": 0.00022069982710397866, "loss": 0.0142, "step": 203950 }, { "epoch": 0.53, "learning_rate": 0.00022069593888760717, "loss": 0.0164, "step": 203960 }, { "epoch": 0.53, "learning_rate": 0.00022069205067123574, "loss": 0.0158, "step": 203970 }, { "epoch": 0.53, "learning_rate": 0.00022068816245486426, "loss": 0.017, "step": 203980 }, { "epoch": 0.53, "learning_rate": 0.0002206842742384928, "loss": 0.0134, "step": 203990 }, { "epoch": 0.53, "learning_rate": 0.0002206803860221213, "loss": 0.0158, "step": 204000 }, { "epoch": 0.53, "eval_cer": 0.8817334783357197, "eval_loss": 0.01144192460924387, "eval_runtime": 107.6151, "eval_samples_per_second": 18.585, "eval_steps_per_second": 4.646, "step": 204000 }, { "epoch": 0.53, "learning_rate": 0.00022067649780574988, "loss": 0.0132, "step": 204010 }, { "epoch": 0.53, "learning_rate": 0.00022067260958937842, "loss": 0.0235, "step": 204020 }, { "epoch": 0.53, "learning_rate": 0.00022066872137300694, "loss": 0.022, "step": 204030 }, { "epoch": 0.53, "learning_rate": 0.00022066483315663548, "loss": 0.0167, "step": 204040 }, { "epoch": 0.53, "learning_rate": 0.00022066094494026402, "loss": 0.016, "step": 204050 }, { "epoch": 0.53, "learning_rate": 0.00022065705672389256, "loss": 0.0141, "step": 204060 }, { "epoch": 0.53, "learning_rate": 0.00022065316850752108, "loss": 0.0168, "step": 204070 }, { "epoch": 0.53, "learning_rate": 0.00022064928029114962, "loss": 0.0184, "step": 204080 }, { "epoch": 0.53, "learning_rate": 0.00022064539207477816, "loss": 0.0174, "step": 204090 }, { "epoch": 0.53, "learning_rate": 0.0002206415038584067, "loss": 0.0167, "step": 204100 }, { "epoch": 0.53, "learning_rate": 0.00022063761564203522, "loss": 0.0183, "step": 204110 }, { "epoch": 0.53, "learning_rate": 0.00022063372742566376, "loss": 0.017, "step": 204120 }, { "epoch": 0.53, "learning_rate": 0.00022062983920929233, "loss": 0.0145, "step": 204130 }, { "epoch": 0.53, "learning_rate": 0.00022062595099292084, "loss": 0.0191, "step": 204140 }, { "epoch": 0.53, "learning_rate": 0.00022062206277654936, "loss": 0.0284, "step": 204150 }, { "epoch": 0.53, "learning_rate": 0.0002206181745601779, "loss": 0.0155, "step": 204160 }, { "epoch": 0.53, "learning_rate": 0.00022061428634380647, "loss": 0.0172, "step": 204170 }, { "epoch": 0.53, "learning_rate": 0.00022061039812743498, "loss": 0.0156, "step": 204180 }, { "epoch": 0.53, "learning_rate": 0.00022060650991106352, "loss": 0.018, "step": 204190 }, { "epoch": 0.53, "learning_rate": 0.00022060262169469204, "loss": 0.0153, "step": 204200 }, { "epoch": 0.53, "learning_rate": 0.00022059873347832058, "loss": 0.0164, "step": 204210 }, { "epoch": 0.53, "learning_rate": 0.00022059484526194912, "loss": 0.0182, "step": 204220 }, { "epoch": 0.53, "learning_rate": 0.00022059095704557766, "loss": 0.0133, "step": 204230 }, { "epoch": 0.53, "learning_rate": 0.00022058706882920618, "loss": 0.0154, "step": 204240 }, { "epoch": 0.53, "learning_rate": 0.00022058318061283472, "loss": 0.0161, "step": 204250 }, { "epoch": 0.53, "learning_rate": 0.00022057929239646326, "loss": 0.0173, "step": 204260 }, { "epoch": 0.53, "learning_rate": 0.0002205754041800918, "loss": 0.0166, "step": 204270 }, { "epoch": 0.53, "learning_rate": 0.00022057151596372032, "loss": 0.0169, "step": 204280 }, { "epoch": 0.53, "learning_rate": 0.00022056762774734886, "loss": 0.0153, "step": 204290 }, { "epoch": 0.53, "learning_rate": 0.0002205637395309774, "loss": 0.0161, "step": 204300 }, { "epoch": 0.53, "learning_rate": 0.00022055985131460594, "loss": 0.0208, "step": 204310 }, { "epoch": 0.53, "learning_rate": 0.00022055596309823446, "loss": 0.0164, "step": 204320 }, { "epoch": 0.53, "learning_rate": 0.000220552074881863, "loss": 0.0197, "step": 204330 }, { "epoch": 0.53, "learning_rate": 0.00022054818666549157, "loss": 0.0141, "step": 204340 }, { "epoch": 0.53, "learning_rate": 0.00022054429844912008, "loss": 0.0166, "step": 204350 }, { "epoch": 0.53, "learning_rate": 0.00022054041023274862, "loss": 0.0168, "step": 204360 }, { "epoch": 0.53, "learning_rate": 0.00022053652201637714, "loss": 0.0143, "step": 204370 }, { "epoch": 0.53, "learning_rate": 0.0002205326338000057, "loss": 0.0196, "step": 204380 }, { "epoch": 0.53, "learning_rate": 0.00022052874558363422, "loss": 0.0134, "step": 204390 }, { "epoch": 0.53, "learning_rate": 0.00022052485736726276, "loss": 0.0143, "step": 204400 }, { "epoch": 0.53, "learning_rate": 0.00022052096915089128, "loss": 0.0163, "step": 204410 }, { "epoch": 0.53, "learning_rate": 0.00022051708093451984, "loss": 0.0184, "step": 204420 }, { "epoch": 0.53, "learning_rate": 0.00022051319271814836, "loss": 0.0153, "step": 204430 }, { "epoch": 0.53, "learning_rate": 0.0002205093045017769, "loss": 0.0186, "step": 204440 }, { "epoch": 0.53, "learning_rate": 0.00022050541628540542, "loss": 0.0147, "step": 204450 }, { "epoch": 0.53, "learning_rate": 0.00022050152806903396, "loss": 0.0153, "step": 204460 }, { "epoch": 0.53, "learning_rate": 0.0002204976398526625, "loss": 0.0219, "step": 204470 }, { "epoch": 0.53, "learning_rate": 0.00022049375163629104, "loss": 0.0161, "step": 204480 }, { "epoch": 0.53, "learning_rate": 0.00022048986341991955, "loss": 0.0153, "step": 204490 }, { "epoch": 0.53, "learning_rate": 0.0002204859752035481, "loss": 0.0218, "step": 204500 }, { "epoch": 0.53, "learning_rate": 0.00022048208698717667, "loss": 0.0184, "step": 204510 }, { "epoch": 0.53, "learning_rate": 0.00022047819877080518, "loss": 0.0219, "step": 204520 }, { "epoch": 0.53, "learning_rate": 0.00022047431055443372, "loss": 0.0202, "step": 204530 }, { "epoch": 0.53, "learning_rate": 0.00022047042233806224, "loss": 0.0232, "step": 204540 }, { "epoch": 0.53, "learning_rate": 0.0002204665341216908, "loss": 0.0133, "step": 204550 }, { "epoch": 0.53, "learning_rate": 0.00022046264590531932, "loss": 0.015, "step": 204560 }, { "epoch": 0.53, "learning_rate": 0.00022045875768894786, "loss": 0.0151, "step": 204570 }, { "epoch": 0.53, "learning_rate": 0.00022045486947257638, "loss": 0.0198, "step": 204580 }, { "epoch": 0.53, "learning_rate": 0.00022045098125620494, "loss": 0.0172, "step": 204590 }, { "epoch": 0.53, "learning_rate": 0.00022044709303983346, "loss": 0.0209, "step": 204600 }, { "epoch": 0.53, "learning_rate": 0.000220443204823462, "loss": 0.0154, "step": 204610 }, { "epoch": 0.53, "learning_rate": 0.00022043931660709051, "loss": 0.0209, "step": 204620 }, { "epoch": 0.53, "learning_rate": 0.00022043542839071908, "loss": 0.0241, "step": 204630 }, { "epoch": 0.53, "learning_rate": 0.0002204315401743476, "loss": 0.0161, "step": 204640 }, { "epoch": 0.53, "learning_rate": 0.00022042765195797614, "loss": 0.0179, "step": 204650 }, { "epoch": 0.53, "learning_rate": 0.00022042376374160465, "loss": 0.0167, "step": 204660 }, { "epoch": 0.53, "learning_rate": 0.00022041987552523322, "loss": 0.0153, "step": 204670 }, { "epoch": 0.53, "learning_rate": 0.00022041598730886176, "loss": 0.0202, "step": 204680 }, { "epoch": 0.53, "learning_rate": 0.00022041209909249028, "loss": 0.0149, "step": 204690 }, { "epoch": 0.53, "learning_rate": 0.0002204082108761188, "loss": 0.0164, "step": 204700 }, { "epoch": 0.53, "learning_rate": 0.00022040432265974734, "loss": 0.0177, "step": 204710 }, { "epoch": 0.53, "learning_rate": 0.0002204004344433759, "loss": 0.0155, "step": 204720 }, { "epoch": 0.53, "learning_rate": 0.00022039654622700442, "loss": 0.0176, "step": 204730 }, { "epoch": 0.53, "learning_rate": 0.00022039265801063296, "loss": 0.014, "step": 204740 }, { "epoch": 0.53, "learning_rate": 0.00022038876979426147, "loss": 0.0158, "step": 204750 }, { "epoch": 0.53, "learning_rate": 0.00022038488157789004, "loss": 0.0163, "step": 204760 }, { "epoch": 0.53, "learning_rate": 0.00022038099336151856, "loss": 0.0143, "step": 204770 }, { "epoch": 0.53, "learning_rate": 0.0002203771051451471, "loss": 0.0172, "step": 204780 }, { "epoch": 0.53, "learning_rate": 0.00022037321692877561, "loss": 0.0167, "step": 204790 }, { "epoch": 0.53, "learning_rate": 0.00022036932871240418, "loss": 0.0159, "step": 204800 }, { "epoch": 0.53, "learning_rate": 0.0002203654404960327, "loss": 0.0177, "step": 204810 }, { "epoch": 0.53, "learning_rate": 0.00022036155227966124, "loss": 0.0177, "step": 204820 }, { "epoch": 0.53, "learning_rate": 0.00022035766406328975, "loss": 0.0193, "step": 204830 }, { "epoch": 0.53, "learning_rate": 0.00022035377584691832, "loss": 0.0174, "step": 204840 }, { "epoch": 0.53, "learning_rate": 0.00022034988763054686, "loss": 0.0179, "step": 204850 }, { "epoch": 0.53, "learning_rate": 0.00022034599941417538, "loss": 0.0165, "step": 204860 }, { "epoch": 0.53, "learning_rate": 0.0002203421111978039, "loss": 0.0208, "step": 204870 }, { "epoch": 0.53, "learning_rate": 0.00022033822298143246, "loss": 0.0178, "step": 204880 }, { "epoch": 0.53, "learning_rate": 0.000220334334765061, "loss": 0.0195, "step": 204890 }, { "epoch": 0.53, "learning_rate": 0.00022033044654868952, "loss": 0.0177, "step": 204900 }, { "epoch": 0.53, "learning_rate": 0.00022032655833231806, "loss": 0.0155, "step": 204910 }, { "epoch": 0.53, "learning_rate": 0.0002203226701159466, "loss": 0.019, "step": 204920 }, { "epoch": 0.53, "learning_rate": 0.00022031878189957514, "loss": 0.0114, "step": 204930 }, { "epoch": 0.53, "learning_rate": 0.00022031489368320366, "loss": 0.0178, "step": 204940 }, { "epoch": 0.53, "learning_rate": 0.0002203110054668322, "loss": 0.0142, "step": 204950 }, { "epoch": 0.53, "learning_rate": 0.00022030711725046071, "loss": 0.0147, "step": 204960 }, { "epoch": 0.53, "learning_rate": 0.00022030322903408928, "loss": 0.0167, "step": 204970 }, { "epoch": 0.53, "learning_rate": 0.0002202993408177178, "loss": 0.0163, "step": 204980 }, { "epoch": 0.53, "learning_rate": 0.00022029545260134634, "loss": 0.016, "step": 204990 }, { "epoch": 0.53, "learning_rate": 0.00022029156438497485, "loss": 0.021, "step": 205000 }, { "epoch": 0.53, "eval_cer": 0.8817810659914818, "eval_loss": 0.011213579215109348, "eval_runtime": 107.384, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 205000 }, { "epoch": 0.53, "learning_rate": 0.00022028767616860342, "loss": 0.0162, "step": 205010 }, { "epoch": 0.53, "learning_rate": 0.00022028378795223194, "loss": 0.0163, "step": 205020 }, { "epoch": 0.53, "learning_rate": 0.00022027989973586048, "loss": 0.018, "step": 205030 }, { "epoch": 0.53, "learning_rate": 0.000220276011519489, "loss": 0.0197, "step": 205040 }, { "epoch": 0.53, "learning_rate": 0.00022027212330311756, "loss": 0.0169, "step": 205050 }, { "epoch": 0.53, "learning_rate": 0.0002202682350867461, "loss": 0.0147, "step": 205060 }, { "epoch": 0.53, "learning_rate": 0.00022026434687037462, "loss": 0.014, "step": 205070 }, { "epoch": 0.53, "learning_rate": 0.00022026045865400316, "loss": 0.0181, "step": 205080 }, { "epoch": 0.53, "learning_rate": 0.0002202565704376317, "loss": 0.0184, "step": 205090 }, { "epoch": 0.53, "learning_rate": 0.00022025268222126024, "loss": 0.0179, "step": 205100 }, { "epoch": 0.53, "learning_rate": 0.00022024879400488876, "loss": 0.0103, "step": 205110 }, { "epoch": 0.53, "learning_rate": 0.0002202449057885173, "loss": 0.0176, "step": 205120 }, { "epoch": 0.53, "learning_rate": 0.00022024101757214584, "loss": 0.0137, "step": 205130 }, { "epoch": 0.53, "learning_rate": 0.00022023712935577438, "loss": 0.0173, "step": 205140 }, { "epoch": 0.53, "learning_rate": 0.0002202332411394029, "loss": 0.0205, "step": 205150 }, { "epoch": 0.53, "learning_rate": 0.00022022935292303144, "loss": 0.0159, "step": 205160 }, { "epoch": 0.53, "learning_rate": 0.00022022546470665998, "loss": 0.0166, "step": 205170 }, { "epoch": 0.53, "learning_rate": 0.00022022157649028852, "loss": 0.0155, "step": 205180 }, { "epoch": 0.53, "learning_rate": 0.00022021768827391704, "loss": 0.0119, "step": 205190 }, { "epoch": 0.53, "learning_rate": 0.00022021380005754558, "loss": 0.0137, "step": 205200 }, { "epoch": 0.53, "learning_rate": 0.0002202099118411741, "loss": 0.0188, "step": 205210 }, { "epoch": 0.53, "learning_rate": 0.00022020602362480266, "loss": 0.0164, "step": 205220 }, { "epoch": 0.53, "learning_rate": 0.0002202021354084312, "loss": 0.0205, "step": 205230 }, { "epoch": 0.53, "learning_rate": 0.00022019824719205972, "loss": 0.0222, "step": 205240 }, { "epoch": 0.53, "learning_rate": 0.00022019435897568826, "loss": 0.0308, "step": 205250 }, { "epoch": 0.53, "learning_rate": 0.0002201904707593168, "loss": 0.0202, "step": 205260 }, { "epoch": 0.53, "learning_rate": 0.00022018658254294534, "loss": 0.017, "step": 205270 }, { "epoch": 0.53, "learning_rate": 0.00022018269432657386, "loss": 0.0187, "step": 205280 }, { "epoch": 0.53, "learning_rate": 0.0002201788061102024, "loss": 0.0216, "step": 205290 }, { "epoch": 0.53, "learning_rate": 0.00022017491789383094, "loss": 0.0177, "step": 205300 }, { "epoch": 0.53, "learning_rate": 0.00022017102967745948, "loss": 0.0161, "step": 205310 }, { "epoch": 0.53, "learning_rate": 0.000220167141461088, "loss": 0.0183, "step": 205320 }, { "epoch": 0.53, "learning_rate": 0.00022016325324471654, "loss": 0.0183, "step": 205330 }, { "epoch": 0.53, "learning_rate": 0.00022015936502834508, "loss": 0.0177, "step": 205340 }, { "epoch": 0.53, "learning_rate": 0.00022015547681197362, "loss": 0.0194, "step": 205350 }, { "epoch": 0.53, "learning_rate": 0.00022015158859560214, "loss": 0.0169, "step": 205360 }, { "epoch": 0.53, "learning_rate": 0.00022014770037923068, "loss": 0.0159, "step": 205370 }, { "epoch": 0.53, "learning_rate": 0.00022014381216285925, "loss": 0.0188, "step": 205380 }, { "epoch": 0.53, "learning_rate": 0.00022013992394648776, "loss": 0.0188, "step": 205390 }, { "epoch": 0.53, "learning_rate": 0.0002201360357301163, "loss": 0.0172, "step": 205400 }, { "epoch": 0.53, "learning_rate": 0.00022013214751374482, "loss": 0.0186, "step": 205410 }, { "epoch": 0.53, "learning_rate": 0.00022012825929737339, "loss": 0.0195, "step": 205420 }, { "epoch": 0.53, "learning_rate": 0.0002201243710810019, "loss": 0.025, "step": 205430 }, { "epoch": 0.53, "learning_rate": 0.00022012048286463044, "loss": 0.0184, "step": 205440 }, { "epoch": 0.53, "learning_rate": 0.00022011659464825896, "loss": 0.0203, "step": 205450 }, { "epoch": 0.53, "learning_rate": 0.0002201127064318875, "loss": 0.0212, "step": 205460 }, { "epoch": 0.53, "learning_rate": 0.00022010881821551604, "loss": 0.0222, "step": 205470 }, { "epoch": 0.53, "learning_rate": 0.00022010492999914458, "loss": 0.0172, "step": 205480 }, { "epoch": 0.53, "learning_rate": 0.0002201010417827731, "loss": 0.0152, "step": 205490 }, { "epoch": 0.53, "learning_rate": 0.00022009715356640164, "loss": 0.0187, "step": 205500 }, { "epoch": 0.53, "learning_rate": 0.00022009326535003018, "loss": 0.0189, "step": 205510 }, { "epoch": 0.53, "learning_rate": 0.00022008937713365872, "loss": 0.0175, "step": 205520 }, { "epoch": 0.53, "learning_rate": 0.00022008548891728723, "loss": 0.0198, "step": 205530 }, { "epoch": 0.53, "learning_rate": 0.00022008160070091578, "loss": 0.02, "step": 205540 }, { "epoch": 0.53, "learning_rate": 0.00022007771248454435, "loss": 0.0192, "step": 205550 }, { "epoch": 0.53, "learning_rate": 0.00022007382426817286, "loss": 0.0197, "step": 205560 }, { "epoch": 0.53, "learning_rate": 0.00022006993605180137, "loss": 0.0194, "step": 205570 }, { "epoch": 0.53, "learning_rate": 0.00022006604783542992, "loss": 0.0173, "step": 205580 }, { "epoch": 0.53, "learning_rate": 0.00022006215961905848, "loss": 0.0142, "step": 205590 }, { "epoch": 0.53, "learning_rate": 0.000220058271402687, "loss": 0.0159, "step": 205600 }, { "epoch": 0.53, "learning_rate": 0.00022005438318631554, "loss": 0.0197, "step": 205610 }, { "epoch": 0.53, "learning_rate": 0.00022005049496994406, "loss": 0.0195, "step": 205620 }, { "epoch": 0.53, "learning_rate": 0.00022004660675357262, "loss": 0.0181, "step": 205630 }, { "epoch": 0.53, "learning_rate": 0.00022004271853720114, "loss": 0.0146, "step": 205640 }, { "epoch": 0.53, "learning_rate": 0.00022003883032082968, "loss": 0.0205, "step": 205650 }, { "epoch": 0.53, "learning_rate": 0.0002200349421044582, "loss": 0.0164, "step": 205660 }, { "epoch": 0.53, "learning_rate": 0.00022003105388808676, "loss": 0.0157, "step": 205670 }, { "epoch": 0.53, "learning_rate": 0.00022002716567171528, "loss": 0.016, "step": 205680 }, { "epoch": 0.53, "learning_rate": 0.00022002327745534382, "loss": 0.015, "step": 205690 }, { "epoch": 0.53, "learning_rate": 0.00022001938923897233, "loss": 0.0174, "step": 205700 }, { "epoch": 0.53, "learning_rate": 0.00022001550102260088, "loss": 0.0192, "step": 205710 }, { "epoch": 0.53, "learning_rate": 0.00022001161280622944, "loss": 0.0172, "step": 205720 }, { "epoch": 0.53, "learning_rate": 0.00022000772458985796, "loss": 0.0188, "step": 205730 }, { "epoch": 0.53, "learning_rate": 0.00022000383637348647, "loss": 0.0198, "step": 205740 }, { "epoch": 0.53, "learning_rate": 0.00021999994815711502, "loss": 0.0175, "step": 205750 }, { "epoch": 0.53, "learning_rate": 0.00021999605994074358, "loss": 0.0176, "step": 205760 }, { "epoch": 0.53, "learning_rate": 0.0002199921717243721, "loss": 0.0205, "step": 205770 }, { "epoch": 0.53, "learning_rate": 0.00021998828350800064, "loss": 0.0195, "step": 205780 }, { "epoch": 0.53, "learning_rate": 0.00021998439529162915, "loss": 0.0208, "step": 205790 }, { "epoch": 0.53, "learning_rate": 0.00021998050707525772, "loss": 0.0174, "step": 205800 }, { "epoch": 0.53, "learning_rate": 0.00021997661885888624, "loss": 0.0184, "step": 205810 }, { "epoch": 0.53, "learning_rate": 0.00021997273064251478, "loss": 0.0223, "step": 205820 }, { "epoch": 0.53, "learning_rate": 0.0002199688424261433, "loss": 0.0148, "step": 205830 }, { "epoch": 0.53, "learning_rate": 0.00021996495420977186, "loss": 0.0155, "step": 205840 }, { "epoch": 0.53, "learning_rate": 0.00021996106599340038, "loss": 0.0188, "step": 205850 }, { "epoch": 0.53, "learning_rate": 0.00021995717777702892, "loss": 0.0187, "step": 205860 }, { "epoch": 0.53, "learning_rate": 0.00021995328956065743, "loss": 0.0178, "step": 205870 }, { "epoch": 0.53, "learning_rate": 0.000219949401344286, "loss": 0.0131, "step": 205880 }, { "epoch": 0.53, "learning_rate": 0.00021994551312791452, "loss": 0.02, "step": 205890 }, { "epoch": 0.53, "learning_rate": 0.00021994162491154306, "loss": 0.0178, "step": 205900 }, { "epoch": 0.53, "learning_rate": 0.00021993773669517157, "loss": 0.0195, "step": 205910 }, { "epoch": 0.53, "learning_rate": 0.00021993384847880014, "loss": 0.0196, "step": 205920 }, { "epoch": 0.53, "learning_rate": 0.00021992996026242868, "loss": 0.0177, "step": 205930 }, { "epoch": 0.53, "learning_rate": 0.0002199260720460572, "loss": 0.0195, "step": 205940 }, { "epoch": 0.53, "learning_rate": 0.00021992218382968574, "loss": 0.0174, "step": 205950 }, { "epoch": 0.53, "learning_rate": 0.00021991829561331425, "loss": 0.0162, "step": 205960 }, { "epoch": 0.53, "learning_rate": 0.00021991440739694282, "loss": 0.014, "step": 205970 }, { "epoch": 0.53, "learning_rate": 0.00021991051918057134, "loss": 0.0143, "step": 205980 }, { "epoch": 0.53, "learning_rate": 0.00021990663096419988, "loss": 0.0159, "step": 205990 }, { "epoch": 0.53, "learning_rate": 0.0002199027427478284, "loss": 0.0159, "step": 206000 }, { "epoch": 0.53, "eval_cer": 0.8817754674437451, "eval_loss": 0.011567558161914349, "eval_runtime": 107.5415, "eval_samples_per_second": 18.597, "eval_steps_per_second": 4.649, "step": 206000 }, { "epoch": 0.53, "learning_rate": 0.00021989885453145696, "loss": 0.0163, "step": 206010 }, { "epoch": 0.53, "learning_rate": 0.00021989496631508548, "loss": 0.0139, "step": 206020 }, { "epoch": 0.53, "learning_rate": 0.00021989107809871402, "loss": 0.02, "step": 206030 }, { "epoch": 0.53, "learning_rate": 0.00021988718988234253, "loss": 0.0173, "step": 206040 }, { "epoch": 0.53, "learning_rate": 0.0002198833016659711, "loss": 0.0161, "step": 206050 }, { "epoch": 0.53, "learning_rate": 0.00021987941344959962, "loss": 0.0148, "step": 206060 }, { "epoch": 0.53, "learning_rate": 0.00021987552523322816, "loss": 0.0142, "step": 206070 }, { "epoch": 0.53, "learning_rate": 0.00021987163701685667, "loss": 0.0211, "step": 206080 }, { "epoch": 0.53, "learning_rate": 0.00021986774880048524, "loss": 0.0182, "step": 206090 }, { "epoch": 0.53, "learning_rate": 0.00021986386058411378, "loss": 0.0127, "step": 206100 }, { "epoch": 0.53, "learning_rate": 0.0002198599723677423, "loss": 0.0173, "step": 206110 }, { "epoch": 0.53, "learning_rate": 0.00021985608415137084, "loss": 0.0228, "step": 206120 }, { "epoch": 0.53, "learning_rate": 0.00021985219593499938, "loss": 0.0155, "step": 206130 }, { "epoch": 0.53, "learning_rate": 0.00021984830771862792, "loss": 0.0194, "step": 206140 }, { "epoch": 0.53, "learning_rate": 0.00021984441950225644, "loss": 0.0175, "step": 206150 }, { "epoch": 0.53, "learning_rate": 0.00021984053128588498, "loss": 0.02, "step": 206160 }, { "epoch": 0.53, "learning_rate": 0.00021983664306951352, "loss": 0.0172, "step": 206170 }, { "epoch": 0.53, "learning_rate": 0.00021983275485314206, "loss": 0.0179, "step": 206180 }, { "epoch": 0.53, "learning_rate": 0.00021982886663677058, "loss": 0.019, "step": 206190 }, { "epoch": 0.53, "learning_rate": 0.00021982497842039912, "loss": 0.0195, "step": 206200 }, { "epoch": 0.53, "learning_rate": 0.00021982109020402763, "loss": 0.017, "step": 206210 }, { "epoch": 0.53, "learning_rate": 0.0002198172019876562, "loss": 0.0202, "step": 206220 }, { "epoch": 0.53, "learning_rate": 0.00021981331377128472, "loss": 0.0177, "step": 206230 }, { "epoch": 0.53, "learning_rate": 0.00021980942555491326, "loss": 0.0188, "step": 206240 }, { "epoch": 0.53, "learning_rate": 0.00021980553733854177, "loss": 0.0215, "step": 206250 }, { "epoch": 0.53, "learning_rate": 0.00021980164912217034, "loss": 0.0151, "step": 206260 }, { "epoch": 0.53, "learning_rate": 0.00021979776090579888, "loss": 0.0154, "step": 206270 }, { "epoch": 0.53, "learning_rate": 0.0002197938726894274, "loss": 0.0174, "step": 206280 }, { "epoch": 0.53, "learning_rate": 0.0002197899844730559, "loss": 0.0161, "step": 206290 }, { "epoch": 0.53, "learning_rate": 0.00021978609625668448, "loss": 0.0171, "step": 206300 }, { "epoch": 0.53, "learning_rate": 0.00021978220804031302, "loss": 0.016, "step": 206310 }, { "epoch": 0.53, "learning_rate": 0.00021977831982394154, "loss": 0.0225, "step": 206320 }, { "epoch": 0.53, "learning_rate": 0.00021977443160757008, "loss": 0.0194, "step": 206330 }, { "epoch": 0.53, "learning_rate": 0.00021977054339119862, "loss": 0.0196, "step": 206340 }, { "epoch": 0.53, "learning_rate": 0.00021976665517482716, "loss": 0.0187, "step": 206350 }, { "epoch": 0.53, "learning_rate": 0.00021976276695845568, "loss": 0.0166, "step": 206360 }, { "epoch": 0.53, "learning_rate": 0.00021975887874208422, "loss": 0.0151, "step": 206370 }, { "epoch": 0.53, "learning_rate": 0.00021975499052571276, "loss": 0.0144, "step": 206380 }, { "epoch": 0.53, "learning_rate": 0.0002197511023093413, "loss": 0.0114, "step": 206390 }, { "epoch": 0.54, "learning_rate": 0.00021974721409296982, "loss": 0.0199, "step": 206400 }, { "epoch": 0.54, "learning_rate": 0.00021974332587659836, "loss": 0.0175, "step": 206410 }, { "epoch": 0.54, "learning_rate": 0.00021973943766022693, "loss": 0.0127, "step": 206420 }, { "epoch": 0.54, "learning_rate": 0.00021973554944385544, "loss": 0.0169, "step": 206430 }, { "epoch": 0.54, "learning_rate": 0.00021973166122748398, "loss": 0.0158, "step": 206440 }, { "epoch": 0.54, "learning_rate": 0.0002197277730111125, "loss": 0.0131, "step": 206450 }, { "epoch": 0.54, "learning_rate": 0.000219723884794741, "loss": 0.019, "step": 206460 }, { "epoch": 0.54, "learning_rate": 0.00021971999657836958, "loss": 0.0168, "step": 206470 }, { "epoch": 0.54, "learning_rate": 0.00021971610836199812, "loss": 0.0154, "step": 206480 }, { "epoch": 0.54, "learning_rate": 0.00021971222014562664, "loss": 0.0165, "step": 206490 }, { "epoch": 0.54, "learning_rate": 0.00021970833192925518, "loss": 0.0155, "step": 206500 }, { "epoch": 0.54, "learning_rate": 0.00021970444371288372, "loss": 0.0156, "step": 206510 }, { "epoch": 0.54, "learning_rate": 0.00021970055549651226, "loss": 0.0154, "step": 206520 }, { "epoch": 0.54, "learning_rate": 0.00021969666728014078, "loss": 0.0153, "step": 206530 }, { "epoch": 0.54, "learning_rate": 0.00021969277906376932, "loss": 0.0161, "step": 206540 }, { "epoch": 0.54, "learning_rate": 0.00021968889084739786, "loss": 0.0212, "step": 206550 }, { "epoch": 0.54, "learning_rate": 0.0002196850026310264, "loss": 0.0192, "step": 206560 }, { "epoch": 0.54, "learning_rate": 0.00021968111441465491, "loss": 0.0208, "step": 206570 }, { "epoch": 0.54, "learning_rate": 0.00021967722619828346, "loss": 0.0232, "step": 206580 }, { "epoch": 0.54, "learning_rate": 0.00021967333798191202, "loss": 0.0189, "step": 206590 }, { "epoch": 0.54, "learning_rate": 0.00021966944976554054, "loss": 0.0161, "step": 206600 }, { "epoch": 0.54, "learning_rate": 0.00021966556154916905, "loss": 0.0151, "step": 206610 }, { "epoch": 0.54, "learning_rate": 0.0002196616733327976, "loss": 0.0153, "step": 206620 }, { "epoch": 0.54, "learning_rate": 0.00021965778511642616, "loss": 0.0157, "step": 206630 }, { "epoch": 0.54, "learning_rate": 0.00021965389690005468, "loss": 0.0132, "step": 206640 }, { "epoch": 0.54, "learning_rate": 0.00021965000868368322, "loss": 0.0168, "step": 206650 }, { "epoch": 0.54, "learning_rate": 0.00021964612046731174, "loss": 0.0176, "step": 206660 }, { "epoch": 0.54, "learning_rate": 0.0002196422322509403, "loss": 0.0154, "step": 206670 }, { "epoch": 0.54, "learning_rate": 0.00021963834403456882, "loss": 0.0154, "step": 206680 }, { "epoch": 0.54, "learning_rate": 0.00021963445581819736, "loss": 0.0141, "step": 206690 }, { "epoch": 0.54, "learning_rate": 0.00021963056760182587, "loss": 0.0194, "step": 206700 }, { "epoch": 0.54, "learning_rate": 0.00021962667938545442, "loss": 0.0174, "step": 206710 }, { "epoch": 0.54, "learning_rate": 0.00021962279116908296, "loss": 0.0155, "step": 206720 }, { "epoch": 0.54, "learning_rate": 0.0002196189029527115, "loss": 0.0129, "step": 206730 }, { "epoch": 0.54, "learning_rate": 0.00021961501473634001, "loss": 0.0152, "step": 206740 }, { "epoch": 0.54, "learning_rate": 0.00021961112651996856, "loss": 0.0189, "step": 206750 }, { "epoch": 0.54, "learning_rate": 0.0002196072383035971, "loss": 0.0208, "step": 206760 }, { "epoch": 0.54, "learning_rate": 0.00021960335008722564, "loss": 0.0174, "step": 206770 }, { "epoch": 0.54, "learning_rate": 0.00021959946187085415, "loss": 0.019, "step": 206780 }, { "epoch": 0.54, "learning_rate": 0.0002195955736544827, "loss": 0.02, "step": 206790 }, { "epoch": 0.54, "learning_rate": 0.00021959168543811126, "loss": 0.0192, "step": 206800 }, { "epoch": 0.54, "learning_rate": 0.00021958779722173978, "loss": 0.0186, "step": 206810 }, { "epoch": 0.54, "learning_rate": 0.00021958390900536832, "loss": 0.0167, "step": 206820 }, { "epoch": 0.54, "learning_rate": 0.00021958002078899683, "loss": 0.0134, "step": 206830 }, { "epoch": 0.54, "learning_rate": 0.0002195761325726254, "loss": 0.0175, "step": 206840 }, { "epoch": 0.54, "learning_rate": 0.00021957224435625392, "loss": 0.0164, "step": 206850 }, { "epoch": 0.54, "learning_rate": 0.00021956835613988246, "loss": 0.0182, "step": 206860 }, { "epoch": 0.54, "learning_rate": 0.00021956446792351097, "loss": 0.0142, "step": 206870 }, { "epoch": 0.54, "learning_rate": 0.00021956057970713954, "loss": 0.0138, "step": 206880 }, { "epoch": 0.54, "learning_rate": 0.00021955669149076806, "loss": 0.0135, "step": 206890 }, { "epoch": 0.54, "learning_rate": 0.0002195528032743966, "loss": 0.0183, "step": 206900 }, { "epoch": 0.54, "learning_rate": 0.0002195489150580251, "loss": 0.0115, "step": 206910 }, { "epoch": 0.54, "learning_rate": 0.00021954502684165368, "loss": 0.0168, "step": 206920 }, { "epoch": 0.54, "learning_rate": 0.0002195411386252822, "loss": 0.0187, "step": 206930 }, { "epoch": 0.54, "learning_rate": 0.00021953725040891074, "loss": 0.0177, "step": 206940 }, { "epoch": 0.54, "learning_rate": 0.00021953336219253925, "loss": 0.0154, "step": 206950 }, { "epoch": 0.54, "learning_rate": 0.0002195294739761678, "loss": 0.0157, "step": 206960 }, { "epoch": 0.54, "learning_rate": 0.00021952558575979636, "loss": 0.0168, "step": 206970 }, { "epoch": 0.54, "learning_rate": 0.00021952169754342488, "loss": 0.0146, "step": 206980 }, { "epoch": 0.54, "learning_rate": 0.00021951780932705342, "loss": 0.0163, "step": 206990 }, { "epoch": 0.54, "learning_rate": 0.00021951392111068193, "loss": 0.0188, "step": 207000 }, { "epoch": 0.54, "eval_cer": 0.8817614710744033, "eval_loss": 0.011343833990395069, "eval_runtime": 107.8464, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 207000 }, { "epoch": 0.54, "learning_rate": 0.0002195100328943105, "loss": 0.017, "step": 207010 }, { "epoch": 0.54, "learning_rate": 0.00021950614467793902, "loss": 0.0183, "step": 207020 }, { "epoch": 0.54, "learning_rate": 0.00021950225646156756, "loss": 0.0125, "step": 207030 }, { "epoch": 0.54, "learning_rate": 0.00021949836824519607, "loss": 0.0171, "step": 207040 }, { "epoch": 0.54, "learning_rate": 0.00021949448002882464, "loss": 0.0192, "step": 207050 }, { "epoch": 0.54, "learning_rate": 0.00021949059181245316, "loss": 0.0168, "step": 207060 }, { "epoch": 0.54, "learning_rate": 0.0002194867035960817, "loss": 0.0241, "step": 207070 }, { "epoch": 0.54, "learning_rate": 0.0002194828153797102, "loss": 0.017, "step": 207080 }, { "epoch": 0.54, "learning_rate": 0.00021947892716333878, "loss": 0.0142, "step": 207090 }, { "epoch": 0.54, "learning_rate": 0.0002194750389469673, "loss": 0.0146, "step": 207100 }, { "epoch": 0.54, "learning_rate": 0.00021947115073059584, "loss": 0.0179, "step": 207110 }, { "epoch": 0.54, "learning_rate": 0.00021946726251422435, "loss": 0.0164, "step": 207120 }, { "epoch": 0.54, "learning_rate": 0.00021946337429785292, "loss": 0.0191, "step": 207130 }, { "epoch": 0.54, "learning_rate": 0.00021945948608148146, "loss": 0.0168, "step": 207140 }, { "epoch": 0.54, "learning_rate": 0.00021945559786510998, "loss": 0.0136, "step": 207150 }, { "epoch": 0.54, "learning_rate": 0.0002194517096487385, "loss": 0.0152, "step": 207160 }, { "epoch": 0.54, "learning_rate": 0.00021944782143236703, "loss": 0.016, "step": 207170 }, { "epoch": 0.54, "learning_rate": 0.0002194439332159956, "loss": 0.0189, "step": 207180 }, { "epoch": 0.54, "learning_rate": 0.00021944004499962412, "loss": 0.0148, "step": 207190 }, { "epoch": 0.54, "learning_rate": 0.00021943615678325266, "loss": 0.0119, "step": 207200 }, { "epoch": 0.54, "learning_rate": 0.00021943226856688117, "loss": 0.0195, "step": 207210 }, { "epoch": 0.54, "learning_rate": 0.00021942838035050974, "loss": 0.0176, "step": 207220 }, { "epoch": 0.54, "learning_rate": 0.00021942449213413826, "loss": 0.0187, "step": 207230 }, { "epoch": 0.54, "learning_rate": 0.0002194206039177668, "loss": 0.015, "step": 207240 }, { "epoch": 0.54, "learning_rate": 0.0002194167157013953, "loss": 0.0212, "step": 207250 }, { "epoch": 0.54, "learning_rate": 0.00021941282748502388, "loss": 0.0142, "step": 207260 }, { "epoch": 0.54, "learning_rate": 0.0002194089392686524, "loss": 0.0153, "step": 207270 }, { "epoch": 0.54, "learning_rate": 0.00021940505105228094, "loss": 0.0161, "step": 207280 }, { "epoch": 0.54, "learning_rate": 0.00021940116283590945, "loss": 0.0147, "step": 207290 }, { "epoch": 0.54, "learning_rate": 0.00021939727461953802, "loss": 0.0169, "step": 207300 }, { "epoch": 0.54, "learning_rate": 0.00021939338640316656, "loss": 0.0158, "step": 207310 }, { "epoch": 0.54, "learning_rate": 0.00021938949818679508, "loss": 0.0153, "step": 207320 }, { "epoch": 0.54, "learning_rate": 0.0002193856099704236, "loss": 0.019, "step": 207330 }, { "epoch": 0.54, "learning_rate": 0.00021938172175405216, "loss": 0.0178, "step": 207340 }, { "epoch": 0.54, "learning_rate": 0.0002193778335376807, "loss": 0.0173, "step": 207350 }, { "epoch": 0.54, "learning_rate": 0.00021937394532130922, "loss": 0.0169, "step": 207360 }, { "epoch": 0.54, "learning_rate": 0.00021937005710493776, "loss": 0.019, "step": 207370 }, { "epoch": 0.54, "learning_rate": 0.0002193661688885663, "loss": 0.0154, "step": 207380 }, { "epoch": 0.54, "learning_rate": 0.00021936228067219484, "loss": 0.0172, "step": 207390 }, { "epoch": 0.54, "learning_rate": 0.00021935839245582336, "loss": 0.0139, "step": 207400 }, { "epoch": 0.54, "learning_rate": 0.0002193545042394519, "loss": 0.0156, "step": 207410 }, { "epoch": 0.54, "learning_rate": 0.0002193506160230804, "loss": 0.0176, "step": 207420 }, { "epoch": 0.54, "learning_rate": 0.00021934672780670898, "loss": 0.0347, "step": 207430 }, { "epoch": 0.54, "learning_rate": 0.0002193428395903375, "loss": 0.0158, "step": 207440 }, { "epoch": 0.54, "learning_rate": 0.00021933895137396604, "loss": 0.018, "step": 207450 }, { "epoch": 0.54, "learning_rate": 0.00021933506315759455, "loss": 0.0166, "step": 207460 }, { "epoch": 0.54, "learning_rate": 0.00021933117494122312, "loss": 0.0169, "step": 207470 }, { "epoch": 0.54, "learning_rate": 0.00021932728672485163, "loss": 0.0202, "step": 207480 }, { "epoch": 0.54, "learning_rate": 0.00021932339850848018, "loss": 0.0148, "step": 207490 }, { "epoch": 0.54, "learning_rate": 0.0002193195102921087, "loss": 0.0227, "step": 207500 }, { "epoch": 0.54, "learning_rate": 0.00021931562207573726, "loss": 0.0187, "step": 207510 }, { "epoch": 0.54, "learning_rate": 0.0002193117338593658, "loss": 0.0155, "step": 207520 }, { "epoch": 0.54, "learning_rate": 0.00021930784564299432, "loss": 0.0134, "step": 207530 }, { "epoch": 0.54, "learning_rate": 0.00021930395742662286, "loss": 0.0158, "step": 207540 }, { "epoch": 0.54, "learning_rate": 0.0002193000692102514, "loss": 0.0142, "step": 207550 }, { "epoch": 0.54, "learning_rate": 0.00021929618099387994, "loss": 0.0169, "step": 207560 }, { "epoch": 0.54, "learning_rate": 0.00021929229277750845, "loss": 0.0116, "step": 207570 }, { "epoch": 0.54, "learning_rate": 0.000219288404561137, "loss": 0.0156, "step": 207580 }, { "epoch": 0.54, "learning_rate": 0.00021928451634476554, "loss": 0.0187, "step": 207590 }, { "epoch": 0.54, "learning_rate": 0.00021928062812839408, "loss": 0.0271, "step": 207600 }, { "epoch": 0.54, "learning_rate": 0.0002192767399120226, "loss": 0.0172, "step": 207610 }, { "epoch": 0.54, "learning_rate": 0.00021927285169565114, "loss": 0.0154, "step": 207620 }, { "epoch": 0.54, "learning_rate": 0.00021926896347927968, "loss": 0.022, "step": 207630 }, { "epoch": 0.54, "learning_rate": 0.00021926507526290822, "loss": 0.0182, "step": 207640 }, { "epoch": 0.54, "learning_rate": 0.00021926118704653673, "loss": 0.0139, "step": 207650 }, { "epoch": 0.54, "learning_rate": 0.00021925729883016528, "loss": 0.0167, "step": 207660 }, { "epoch": 0.54, "learning_rate": 0.0002192534106137938, "loss": 0.0161, "step": 207670 }, { "epoch": 0.54, "learning_rate": 0.00021924952239742236, "loss": 0.0187, "step": 207680 }, { "epoch": 0.54, "learning_rate": 0.0002192456341810509, "loss": 0.0202, "step": 207690 }, { "epoch": 0.54, "learning_rate": 0.00021924174596467941, "loss": 0.0177, "step": 207700 }, { "epoch": 0.54, "learning_rate": 0.00021923785774830796, "loss": 0.0171, "step": 207710 }, { "epoch": 0.54, "learning_rate": 0.0002192339695319365, "loss": 0.0165, "step": 207720 }, { "epoch": 0.54, "learning_rate": 0.00021923008131556504, "loss": 0.0144, "step": 207730 }, { "epoch": 0.54, "learning_rate": 0.00021922619309919355, "loss": 0.0125, "step": 207740 }, { "epoch": 0.54, "learning_rate": 0.0002192223048828221, "loss": 0.0156, "step": 207750 }, { "epoch": 0.54, "learning_rate": 0.00021921841666645064, "loss": 0.0147, "step": 207760 }, { "epoch": 0.54, "learning_rate": 0.00021921452845007918, "loss": 0.0231, "step": 207770 }, { "epoch": 0.54, "learning_rate": 0.0002192106402337077, "loss": 0.0166, "step": 207780 }, { "epoch": 0.54, "learning_rate": 0.00021920675201733624, "loss": 0.0153, "step": 207790 }, { "epoch": 0.54, "learning_rate": 0.00021920286380096478, "loss": 0.0155, "step": 207800 }, { "epoch": 0.54, "learning_rate": 0.00021919897558459332, "loss": 0.0168, "step": 207810 }, { "epoch": 0.54, "learning_rate": 0.00021919508736822183, "loss": 0.0161, "step": 207820 }, { "epoch": 0.54, "learning_rate": 0.00021919119915185037, "loss": 0.0254, "step": 207830 }, { "epoch": 0.54, "learning_rate": 0.00021918731093547894, "loss": 0.0152, "step": 207840 }, { "epoch": 0.54, "learning_rate": 0.00021918342271910746, "loss": 0.0177, "step": 207850 }, { "epoch": 0.54, "learning_rate": 0.000219179534502736, "loss": 0.0184, "step": 207860 }, { "epoch": 0.54, "learning_rate": 0.00021917564628636451, "loss": 0.0187, "step": 207870 }, { "epoch": 0.54, "learning_rate": 0.00021917175806999308, "loss": 0.0158, "step": 207880 }, { "epoch": 0.54, "learning_rate": 0.0002191678698536216, "loss": 0.0181, "step": 207890 }, { "epoch": 0.54, "learning_rate": 0.00021916398163725014, "loss": 0.016, "step": 207900 }, { "epoch": 0.54, "learning_rate": 0.00021916009342087865, "loss": 0.0181, "step": 207910 }, { "epoch": 0.54, "learning_rate": 0.0002191562052045072, "loss": 0.0194, "step": 207920 }, { "epoch": 0.54, "learning_rate": 0.00021915231698813574, "loss": 0.0166, "step": 207930 }, { "epoch": 0.54, "learning_rate": 0.00021914842877176428, "loss": 0.0134, "step": 207940 }, { "epoch": 0.54, "learning_rate": 0.0002191445405553928, "loss": 0.0167, "step": 207950 }, { "epoch": 0.54, "learning_rate": 0.00021914065233902133, "loss": 0.0225, "step": 207960 }, { "epoch": 0.54, "learning_rate": 0.00021913676412264988, "loss": 0.0157, "step": 207970 }, { "epoch": 0.54, "learning_rate": 0.00021913287590627842, "loss": 0.0178, "step": 207980 }, { "epoch": 0.54, "learning_rate": 0.00021912898768990693, "loss": 0.0149, "step": 207990 }, { "epoch": 0.54, "learning_rate": 0.00021912509947353547, "loss": 0.0187, "step": 208000 }, { "epoch": 0.54, "eval_cer": 0.8817726681698768, "eval_loss": 0.011146793141961098, "eval_runtime": 108.0067, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 208000 }, { "epoch": 0.54, "learning_rate": 0.00021912121125716404, "loss": 0.0137, "step": 208010 }, { "epoch": 0.54, "learning_rate": 0.00021911732304079256, "loss": 0.0167, "step": 208020 }, { "epoch": 0.54, "learning_rate": 0.0002191134348244211, "loss": 0.0143, "step": 208030 }, { "epoch": 0.54, "learning_rate": 0.00021910954660804961, "loss": 0.0174, "step": 208040 }, { "epoch": 0.54, "learning_rate": 0.00021910565839167818, "loss": 0.0166, "step": 208050 }, { "epoch": 0.54, "learning_rate": 0.0002191017701753067, "loss": 0.0151, "step": 208060 }, { "epoch": 0.54, "learning_rate": 0.00021909788195893524, "loss": 0.0177, "step": 208070 }, { "epoch": 0.54, "learning_rate": 0.00021909399374256375, "loss": 0.0164, "step": 208080 }, { "epoch": 0.54, "learning_rate": 0.00021909010552619232, "loss": 0.021, "step": 208090 }, { "epoch": 0.54, "learning_rate": 0.00021908621730982084, "loss": 0.0135, "step": 208100 }, { "epoch": 0.54, "learning_rate": 0.00021908232909344938, "loss": 0.016, "step": 208110 }, { "epoch": 0.54, "learning_rate": 0.0002190784408770779, "loss": 0.0168, "step": 208120 }, { "epoch": 0.54, "learning_rate": 0.00021907455266070646, "loss": 0.0148, "step": 208130 }, { "epoch": 0.54, "learning_rate": 0.00021907066444433498, "loss": 0.0151, "step": 208140 }, { "epoch": 0.54, "learning_rate": 0.00021906677622796352, "loss": 0.0177, "step": 208150 }, { "epoch": 0.54, "learning_rate": 0.00021906288801159203, "loss": 0.0155, "step": 208160 }, { "epoch": 0.54, "learning_rate": 0.00021905899979522057, "loss": 0.0165, "step": 208170 }, { "epoch": 0.54, "learning_rate": 0.00021905511157884914, "loss": 0.0168, "step": 208180 }, { "epoch": 0.54, "learning_rate": 0.00021905122336247766, "loss": 0.0135, "step": 208190 }, { "epoch": 0.54, "learning_rate": 0.00021904733514610617, "loss": 0.017, "step": 208200 }, { "epoch": 0.54, "learning_rate": 0.0002190434469297347, "loss": 0.0173, "step": 208210 }, { "epoch": 0.54, "learning_rate": 0.00021903955871336328, "loss": 0.0154, "step": 208220 }, { "epoch": 0.54, "learning_rate": 0.0002190356704969918, "loss": 0.0167, "step": 208230 }, { "epoch": 0.54, "learning_rate": 0.00021903178228062034, "loss": 0.0184, "step": 208240 }, { "epoch": 0.54, "learning_rate": 0.00021902789406424885, "loss": 0.0189, "step": 208250 }, { "epoch": 0.54, "learning_rate": 0.00021902400584787742, "loss": 0.0166, "step": 208260 }, { "epoch": 0.54, "learning_rate": 0.00021902011763150594, "loss": 0.0173, "step": 208270 }, { "epoch": 0.54, "learning_rate": 0.00021901622941513448, "loss": 0.0174, "step": 208280 }, { "epoch": 0.54, "learning_rate": 0.000219012341198763, "loss": 0.0165, "step": 208290 }, { "epoch": 0.54, "learning_rate": 0.00021900845298239156, "loss": 0.0141, "step": 208300 }, { "epoch": 0.54, "learning_rate": 0.00021900456476602008, "loss": 0.0185, "step": 208310 }, { "epoch": 0.54, "learning_rate": 0.00021900067654964862, "loss": 0.0152, "step": 208320 }, { "epoch": 0.54, "learning_rate": 0.00021899678833327713, "loss": 0.0175, "step": 208330 }, { "epoch": 0.54, "learning_rate": 0.0002189929001169057, "loss": 0.0161, "step": 208340 }, { "epoch": 0.54, "learning_rate": 0.00021898901190053421, "loss": 0.0178, "step": 208350 }, { "epoch": 0.54, "learning_rate": 0.00021898512368416276, "loss": 0.0162, "step": 208360 }, { "epoch": 0.54, "learning_rate": 0.00021898123546779127, "loss": 0.0138, "step": 208370 }, { "epoch": 0.54, "learning_rate": 0.00021897734725141984, "loss": 0.0211, "step": 208380 }, { "epoch": 0.54, "learning_rate": 0.00021897345903504838, "loss": 0.0176, "step": 208390 }, { "epoch": 0.54, "learning_rate": 0.0002189695708186769, "loss": 0.0172, "step": 208400 }, { "epoch": 0.54, "learning_rate": 0.00021896568260230544, "loss": 0.0136, "step": 208410 }, { "epoch": 0.54, "learning_rate": 0.00021896179438593395, "loss": 0.0159, "step": 208420 }, { "epoch": 0.54, "learning_rate": 0.00021895790616956252, "loss": 0.0176, "step": 208430 }, { "epoch": 0.54, "learning_rate": 0.00021895401795319104, "loss": 0.017, "step": 208440 }, { "epoch": 0.54, "learning_rate": 0.00021895012973681958, "loss": 0.0133, "step": 208450 }, { "epoch": 0.54, "learning_rate": 0.0002189462415204481, "loss": 0.0185, "step": 208460 }, { "epoch": 0.54, "learning_rate": 0.00021894235330407666, "loss": 0.0152, "step": 208470 }, { "epoch": 0.54, "learning_rate": 0.00021893846508770517, "loss": 0.0211, "step": 208480 }, { "epoch": 0.54, "learning_rate": 0.00021893457687133372, "loss": 0.0172, "step": 208490 }, { "epoch": 0.54, "learning_rate": 0.00021893068865496223, "loss": 0.0158, "step": 208500 }, { "epoch": 0.54, "learning_rate": 0.0002189268004385908, "loss": 0.0197, "step": 208510 }, { "epoch": 0.54, "learning_rate": 0.00021892291222221931, "loss": 0.0171, "step": 208520 }, { "epoch": 0.54, "learning_rate": 0.00021891902400584786, "loss": 0.0175, "step": 208530 }, { "epoch": 0.54, "learning_rate": 0.00021891513578947637, "loss": 0.0162, "step": 208540 }, { "epoch": 0.54, "learning_rate": 0.00021891124757310494, "loss": 0.0157, "step": 208550 }, { "epoch": 0.54, "learning_rate": 0.00021890735935673348, "loss": 0.0166, "step": 208560 }, { "epoch": 0.54, "learning_rate": 0.000218903471140362, "loss": 0.0186, "step": 208570 }, { "epoch": 0.54, "learning_rate": 0.00021889958292399054, "loss": 0.0161, "step": 208580 }, { "epoch": 0.54, "learning_rate": 0.00021889569470761908, "loss": 0.0154, "step": 208590 }, { "epoch": 0.54, "learning_rate": 0.00021889180649124762, "loss": 0.0189, "step": 208600 }, { "epoch": 0.54, "learning_rate": 0.00021888791827487613, "loss": 0.0156, "step": 208610 }, { "epoch": 0.54, "learning_rate": 0.00021888403005850468, "loss": 0.016, "step": 208620 }, { "epoch": 0.54, "learning_rate": 0.00021888014184213322, "loss": 0.0213, "step": 208630 }, { "epoch": 0.54, "learning_rate": 0.00021887625362576176, "loss": 0.0207, "step": 208640 }, { "epoch": 0.54, "learning_rate": 0.00021887236540939027, "loss": 0.014, "step": 208650 }, { "epoch": 0.54, "learning_rate": 0.00021886847719301882, "loss": 0.0157, "step": 208660 }, { "epoch": 0.54, "learning_rate": 0.00021886458897664733, "loss": 0.0189, "step": 208670 }, { "epoch": 0.54, "learning_rate": 0.0002188607007602759, "loss": 0.0158, "step": 208680 }, { "epoch": 0.54, "learning_rate": 0.00021885681254390441, "loss": 0.0135, "step": 208690 }, { "epoch": 0.54, "learning_rate": 0.00021885292432753296, "loss": 0.0144, "step": 208700 }, { "epoch": 0.54, "learning_rate": 0.00021884903611116147, "loss": 0.0196, "step": 208710 }, { "epoch": 0.54, "learning_rate": 0.00021884514789479004, "loss": 0.0218, "step": 208720 }, { "epoch": 0.54, "learning_rate": 0.00021884125967841858, "loss": 0.0161, "step": 208730 }, { "epoch": 0.54, "learning_rate": 0.0002188373714620471, "loss": 0.0131, "step": 208740 }, { "epoch": 0.54, "learning_rate": 0.0002188334832456756, "loss": 0.0147, "step": 208750 }, { "epoch": 0.54, "learning_rate": 0.00021882959502930418, "loss": 0.0159, "step": 208760 }, { "epoch": 0.54, "learning_rate": 0.00021882570681293272, "loss": 0.0172, "step": 208770 }, { "epoch": 0.54, "learning_rate": 0.00021882181859656123, "loss": 0.0169, "step": 208780 }, { "epoch": 0.54, "learning_rate": 0.00021881793038018978, "loss": 0.0162, "step": 208790 }, { "epoch": 0.54, "learning_rate": 0.00021881404216381832, "loss": 0.0148, "step": 208800 }, { "epoch": 0.54, "learning_rate": 0.00021881015394744686, "loss": 0.0189, "step": 208810 }, { "epoch": 0.54, "learning_rate": 0.00021880626573107537, "loss": 0.0146, "step": 208820 }, { "epoch": 0.54, "learning_rate": 0.00021880237751470392, "loss": 0.0176, "step": 208830 }, { "epoch": 0.54, "learning_rate": 0.00021879848929833246, "loss": 0.0227, "step": 208840 }, { "epoch": 0.54, "learning_rate": 0.000218794601081961, "loss": 0.0174, "step": 208850 }, { "epoch": 0.54, "learning_rate": 0.0002187907128655895, "loss": 0.018, "step": 208860 }, { "epoch": 0.54, "learning_rate": 0.00021878682464921805, "loss": 0.0189, "step": 208870 }, { "epoch": 0.54, "learning_rate": 0.00021878293643284662, "loss": 0.0184, "step": 208880 }, { "epoch": 0.54, "learning_rate": 0.00021877904821647514, "loss": 0.0168, "step": 208890 }, { "epoch": 0.54, "learning_rate": 0.00021877516000010368, "loss": 0.0174, "step": 208900 }, { "epoch": 0.54, "learning_rate": 0.0002187712717837322, "loss": 0.0142, "step": 208910 }, { "epoch": 0.54, "learning_rate": 0.0002187673835673607, "loss": 0.0185, "step": 208920 }, { "epoch": 0.54, "learning_rate": 0.00021876349535098928, "loss": 0.0177, "step": 208930 }, { "epoch": 0.54, "learning_rate": 0.00021875960713461782, "loss": 0.0166, "step": 208940 }, { "epoch": 0.54, "learning_rate": 0.00021875571891824633, "loss": 0.0142, "step": 208950 }, { "epoch": 0.54, "learning_rate": 0.00021875183070187488, "loss": 0.0142, "step": 208960 }, { "epoch": 0.54, "learning_rate": 0.00021874794248550342, "loss": 0.0184, "step": 208970 }, { "epoch": 0.54, "learning_rate": 0.00021874405426913196, "loss": 0.0192, "step": 208980 }, { "epoch": 0.54, "learning_rate": 0.00021874016605276047, "loss": 0.0176, "step": 208990 }, { "epoch": 0.54, "learning_rate": 0.00021873627783638901, "loss": 0.0197, "step": 209000 }, { "epoch": 0.54, "eval_cer": 0.8817362776095881, "eval_loss": 0.011807015165686607, "eval_runtime": 107.3317, "eval_samples_per_second": 18.634, "eval_steps_per_second": 4.658, "step": 209000 }, { "epoch": 0.54, "learning_rate": 0.00021873238962001756, "loss": 0.0188, "step": 209010 }, { "epoch": 0.54, "learning_rate": 0.0002187285014036461, "loss": 0.016, "step": 209020 }, { "epoch": 0.54, "learning_rate": 0.0002187246131872746, "loss": 0.0207, "step": 209030 }, { "epoch": 0.54, "learning_rate": 0.00021872072497090315, "loss": 0.0159, "step": 209040 }, { "epoch": 0.54, "learning_rate": 0.00021871683675453172, "loss": 0.0173, "step": 209050 }, { "epoch": 0.54, "learning_rate": 0.00021871294853816024, "loss": 0.0207, "step": 209060 }, { "epoch": 0.54, "learning_rate": 0.00021870906032178875, "loss": 0.0154, "step": 209070 }, { "epoch": 0.54, "learning_rate": 0.0002187051721054173, "loss": 0.0165, "step": 209080 }, { "epoch": 0.54, "learning_rate": 0.00021870128388904586, "loss": 0.0142, "step": 209090 }, { "epoch": 0.54, "learning_rate": 0.00021869739567267438, "loss": 0.0173, "step": 209100 }, { "epoch": 0.54, "learning_rate": 0.00021869350745630292, "loss": 0.0206, "step": 209110 }, { "epoch": 0.54, "learning_rate": 0.00021868961923993143, "loss": 0.0246, "step": 209120 }, { "epoch": 0.54, "learning_rate": 0.00021868573102356, "loss": 0.0159, "step": 209130 }, { "epoch": 0.54, "learning_rate": 0.00021868184280718852, "loss": 0.0179, "step": 209140 }, { "epoch": 0.54, "learning_rate": 0.00021867795459081706, "loss": 0.0208, "step": 209150 }, { "epoch": 0.54, "learning_rate": 0.00021867406637444557, "loss": 0.0214, "step": 209160 }, { "epoch": 0.54, "learning_rate": 0.00021867017815807411, "loss": 0.0167, "step": 209170 }, { "epoch": 0.54, "learning_rate": 0.00021866628994170266, "loss": 0.0189, "step": 209180 }, { "epoch": 0.54, "learning_rate": 0.0002186624017253312, "loss": 0.0188, "step": 209190 }, { "epoch": 0.54, "learning_rate": 0.0002186585135089597, "loss": 0.0206, "step": 209200 }, { "epoch": 0.54, "learning_rate": 0.00021865462529258825, "loss": 0.0254, "step": 209210 }, { "epoch": 0.54, "learning_rate": 0.0002186507370762168, "loss": 0.0152, "step": 209220 }, { "epoch": 0.54, "learning_rate": 0.00021864684885984534, "loss": 0.0186, "step": 209230 }, { "epoch": 0.54, "learning_rate": 0.00021864296064347385, "loss": 0.0189, "step": 209240 }, { "epoch": 0.54, "learning_rate": 0.0002186390724271024, "loss": 0.0144, "step": 209250 }, { "epoch": 0.54, "learning_rate": 0.00021863518421073096, "loss": 0.0173, "step": 209260 }, { "epoch": 0.54, "learning_rate": 0.00021863129599435948, "loss": 0.0169, "step": 209270 }, { "epoch": 0.54, "learning_rate": 0.00021862740777798802, "loss": 0.0191, "step": 209280 }, { "epoch": 0.54, "learning_rate": 0.00021862351956161653, "loss": 0.0184, "step": 209290 }, { "epoch": 0.54, "learning_rate": 0.0002186196313452451, "loss": 0.0173, "step": 209300 }, { "epoch": 0.54, "learning_rate": 0.00021861574312887362, "loss": 0.0209, "step": 209310 }, { "epoch": 0.54, "learning_rate": 0.00021861185491250216, "loss": 0.0165, "step": 209320 }, { "epoch": 0.54, "learning_rate": 0.00021860796669613067, "loss": 0.0151, "step": 209330 }, { "epoch": 0.54, "learning_rate": 0.00021860407847975924, "loss": 0.0145, "step": 209340 }, { "epoch": 0.54, "learning_rate": 0.00021860019026338776, "loss": 0.0229, "step": 209350 }, { "epoch": 0.54, "learning_rate": 0.0002185963020470163, "loss": 0.0176, "step": 209360 }, { "epoch": 0.54, "learning_rate": 0.0002185924138306448, "loss": 0.0174, "step": 209370 }, { "epoch": 0.54, "learning_rate": 0.00021858852561427338, "loss": 0.0163, "step": 209380 }, { "epoch": 0.54, "learning_rate": 0.0002185846373979019, "loss": 0.0155, "step": 209390 }, { "epoch": 0.54, "learning_rate": 0.00021858074918153044, "loss": 0.0176, "step": 209400 }, { "epoch": 0.54, "learning_rate": 0.00021857686096515895, "loss": 0.0187, "step": 209410 }, { "epoch": 0.54, "learning_rate": 0.0002185729727487875, "loss": 0.0198, "step": 209420 }, { "epoch": 0.54, "learning_rate": 0.00021856908453241606, "loss": 0.0155, "step": 209430 }, { "epoch": 0.54, "learning_rate": 0.00021856519631604458, "loss": 0.0188, "step": 209440 }, { "epoch": 0.54, "learning_rate": 0.00021856130809967312, "loss": 0.0175, "step": 209450 }, { "epoch": 0.54, "learning_rate": 0.00021855741988330163, "loss": 0.0162, "step": 209460 }, { "epoch": 0.54, "learning_rate": 0.0002185535316669302, "loss": 0.016, "step": 209470 }, { "epoch": 0.54, "learning_rate": 0.00021854964345055872, "loss": 0.0132, "step": 209480 }, { "epoch": 0.54, "learning_rate": 0.00021854575523418726, "loss": 0.0118, "step": 209490 }, { "epoch": 0.54, "learning_rate": 0.00021854186701781577, "loss": 0.0187, "step": 209500 }, { "epoch": 0.54, "learning_rate": 0.00021853797880144434, "loss": 0.0108, "step": 209510 }, { "epoch": 0.54, "learning_rate": 0.00021853409058507285, "loss": 0.0167, "step": 209520 }, { "epoch": 0.54, "learning_rate": 0.0002185302023687014, "loss": 0.0128, "step": 209530 }, { "epoch": 0.54, "learning_rate": 0.0002185263141523299, "loss": 0.0185, "step": 209540 }, { "epoch": 0.54, "learning_rate": 0.00021852242593595848, "loss": 0.0115, "step": 209550 }, { "epoch": 0.54, "learning_rate": 0.000218518537719587, "loss": 0.0183, "step": 209560 }, { "epoch": 0.54, "learning_rate": 0.00021851464950321554, "loss": 0.0164, "step": 209570 }, { "epoch": 0.54, "learning_rate": 0.00021851076128684405, "loss": 0.0231, "step": 209580 }, { "epoch": 0.54, "learning_rate": 0.00021850687307047262, "loss": 0.0159, "step": 209590 }, { "epoch": 0.54, "learning_rate": 0.00021850298485410116, "loss": 0.0175, "step": 209600 }, { "epoch": 0.54, "learning_rate": 0.00021849909663772968, "loss": 0.0158, "step": 209610 }, { "epoch": 0.54, "learning_rate": 0.00021849520842135822, "loss": 0.0196, "step": 209620 }, { "epoch": 0.54, "learning_rate": 0.00021849132020498676, "loss": 0.0139, "step": 209630 }, { "epoch": 0.54, "learning_rate": 0.0002184874319886153, "loss": 0.0198, "step": 209640 }, { "epoch": 0.54, "learning_rate": 0.00021848354377224381, "loss": 0.0157, "step": 209650 }, { "epoch": 0.54, "learning_rate": 0.00021847965555587236, "loss": 0.0227, "step": 209660 }, { "epoch": 0.54, "learning_rate": 0.00021847576733950087, "loss": 0.0155, "step": 209670 }, { "epoch": 0.54, "learning_rate": 0.00021847187912312944, "loss": 0.0142, "step": 209680 }, { "epoch": 0.54, "learning_rate": 0.00021846799090675795, "loss": 0.0161, "step": 209690 }, { "epoch": 0.54, "learning_rate": 0.0002184641026903865, "loss": 0.0183, "step": 209700 }, { "epoch": 0.54, "learning_rate": 0.000218460214474015, "loss": 0.0166, "step": 209710 }, { "epoch": 0.54, "learning_rate": 0.00021845632625764358, "loss": 0.0193, "step": 209720 }, { "epoch": 0.54, "learning_rate": 0.0002184524380412721, "loss": 0.0155, "step": 209730 }, { "epoch": 0.54, "learning_rate": 0.00021844854982490064, "loss": 0.0175, "step": 209740 }, { "epoch": 0.54, "learning_rate": 0.00021844466160852915, "loss": 0.016, "step": 209750 }, { "epoch": 0.54, "learning_rate": 0.00021844077339215772, "loss": 0.0167, "step": 209760 }, { "epoch": 0.54, "learning_rate": 0.00021843688517578626, "loss": 0.0127, "step": 209770 }, { "epoch": 0.54, "learning_rate": 0.00021843299695941477, "loss": 0.0161, "step": 209780 }, { "epoch": 0.54, "learning_rate": 0.0002184291087430433, "loss": 0.015, "step": 209790 }, { "epoch": 0.54, "learning_rate": 0.00021842522052667186, "loss": 0.0151, "step": 209800 }, { "epoch": 0.54, "learning_rate": 0.0002184213323103004, "loss": 0.0123, "step": 209810 }, { "epoch": 0.54, "learning_rate": 0.00021841744409392891, "loss": 0.0175, "step": 209820 }, { "epoch": 0.54, "learning_rate": 0.00021841355587755746, "loss": 0.0197, "step": 209830 }, { "epoch": 0.54, "learning_rate": 0.000218409667661186, "loss": 0.0215, "step": 209840 }, { "epoch": 0.54, "learning_rate": 0.00021840577944481454, "loss": 0.0196, "step": 209850 }, { "epoch": 0.54, "learning_rate": 0.00021840189122844305, "loss": 0.0145, "step": 209860 }, { "epoch": 0.54, "learning_rate": 0.0002183980030120716, "loss": 0.0141, "step": 209870 }, { "epoch": 0.54, "learning_rate": 0.00021839411479570014, "loss": 0.0181, "step": 209880 }, { "epoch": 0.54, "learning_rate": 0.00021839022657932868, "loss": 0.0124, "step": 209890 }, { "epoch": 0.54, "learning_rate": 0.0002183863383629572, "loss": 0.0185, "step": 209900 }, { "epoch": 0.54, "learning_rate": 0.00021838245014658573, "loss": 0.0191, "step": 209910 }, { "epoch": 0.54, "learning_rate": 0.00021837856193021425, "loss": 0.0193, "step": 209920 }, { "epoch": 0.54, "learning_rate": 0.00021837467371384282, "loss": 0.0153, "step": 209930 }, { "epoch": 0.54, "learning_rate": 0.00021837078549747133, "loss": 0.014, "step": 209940 }, { "epoch": 0.54, "learning_rate": 0.00021836689728109987, "loss": 0.0179, "step": 209950 }, { "epoch": 0.54, "learning_rate": 0.0002183630090647284, "loss": 0.0153, "step": 209960 }, { "epoch": 0.54, "learning_rate": 0.00021835912084835696, "loss": 0.0175, "step": 209970 }, { "epoch": 0.54, "learning_rate": 0.0002183552326319855, "loss": 0.0163, "step": 209980 }, { "epoch": 0.54, "learning_rate": 0.000218351344415614, "loss": 0.0202, "step": 209990 }, { "epoch": 0.54, "learning_rate": 0.00021834745619924256, "loss": 0.0165, "step": 210000 }, { "epoch": 0.54, "eval_cer": 0.8817362776095881, "eval_loss": 0.011167431250214577, "eval_runtime": 108.0029, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.63, "step": 210000 }, { "epoch": 0.54, "learning_rate": 0.0002183435679828711, "loss": 0.018, "step": 210010 }, { "epoch": 0.54, "learning_rate": 0.00021833967976649964, "loss": 0.0149, "step": 210020 }, { "epoch": 0.54, "learning_rate": 0.00021833579155012815, "loss": 0.016, "step": 210030 }, { "epoch": 0.54, "learning_rate": 0.0002183319033337567, "loss": 0.0151, "step": 210040 }, { "epoch": 0.54, "learning_rate": 0.00021832801511738524, "loss": 0.0152, "step": 210050 }, { "epoch": 0.54, "learning_rate": 0.00021832412690101378, "loss": 0.019, "step": 210060 }, { "epoch": 0.54, "learning_rate": 0.0002183202386846423, "loss": 0.0211, "step": 210070 }, { "epoch": 0.54, "learning_rate": 0.00021831635046827083, "loss": 0.0162, "step": 210080 }, { "epoch": 0.54, "learning_rate": 0.0002183124622518994, "loss": 0.0307, "step": 210090 }, { "epoch": 0.54, "learning_rate": 0.00021830857403552792, "loss": 0.0206, "step": 210100 }, { "epoch": 0.54, "learning_rate": 0.00021830468581915643, "loss": 0.0198, "step": 210110 }, { "epoch": 0.54, "learning_rate": 0.00021830079760278497, "loss": 0.0153, "step": 210120 }, { "epoch": 0.54, "learning_rate": 0.00021829690938641354, "loss": 0.014, "step": 210130 }, { "epoch": 0.54, "learning_rate": 0.00021829302117004206, "loss": 0.0169, "step": 210140 }, { "epoch": 0.54, "learning_rate": 0.0002182891329536706, "loss": 0.0287, "step": 210150 }, { "epoch": 0.54, "learning_rate": 0.0002182852447372991, "loss": 0.0176, "step": 210160 }, { "epoch": 0.54, "learning_rate": 0.00021828135652092765, "loss": 0.0178, "step": 210170 }, { "epoch": 0.54, "learning_rate": 0.0002182774683045562, "loss": 0.0176, "step": 210180 }, { "epoch": 0.54, "learning_rate": 0.00021827358008818474, "loss": 0.0193, "step": 210190 }, { "epoch": 0.54, "learning_rate": 0.00021826969187181325, "loss": 0.0175, "step": 210200 }, { "epoch": 0.54, "learning_rate": 0.0002182658036554418, "loss": 0.0181, "step": 210210 }, { "epoch": 0.54, "learning_rate": 0.00021826191543907034, "loss": 0.0207, "step": 210220 }, { "epoch": 0.54, "learning_rate": 0.00021825802722269888, "loss": 0.0158, "step": 210230 }, { "epoch": 0.54, "learning_rate": 0.0002182541390063274, "loss": 0.0178, "step": 210240 }, { "epoch": 0.54, "learning_rate": 0.00021825025078995593, "loss": 0.0141, "step": 210250 }, { "epoch": 0.55, "learning_rate": 0.00021824636257358448, "loss": 0.0158, "step": 210260 }, { "epoch": 0.55, "learning_rate": 0.00021824247435721302, "loss": 0.0184, "step": 210270 }, { "epoch": 0.55, "learning_rate": 0.00021823858614084153, "loss": 0.0175, "step": 210280 }, { "epoch": 0.55, "learning_rate": 0.00021823469792447007, "loss": 0.015, "step": 210290 }, { "epoch": 0.55, "learning_rate": 0.00021823080970809864, "loss": 0.0178, "step": 210300 }, { "epoch": 0.55, "learning_rate": 0.00021822692149172716, "loss": 0.022, "step": 210310 }, { "epoch": 0.55, "learning_rate": 0.0002182230332753557, "loss": 0.016, "step": 210320 }, { "epoch": 0.55, "learning_rate": 0.0002182191450589842, "loss": 0.0162, "step": 210330 }, { "epoch": 0.55, "learning_rate": 0.00021821525684261278, "loss": 0.0184, "step": 210340 }, { "epoch": 0.55, "learning_rate": 0.0002182113686262413, "loss": 0.0161, "step": 210350 }, { "epoch": 0.55, "learning_rate": 0.00021820748040986984, "loss": 0.0178, "step": 210360 }, { "epoch": 0.55, "learning_rate": 0.00021820359219349835, "loss": 0.0171, "step": 210370 }, { "epoch": 0.55, "learning_rate": 0.00021819970397712692, "loss": 0.0232, "step": 210380 }, { "epoch": 0.55, "learning_rate": 0.00021819581576075543, "loss": 0.0169, "step": 210390 }, { "epoch": 0.55, "learning_rate": 0.00021819192754438398, "loss": 0.0153, "step": 210400 }, { "epoch": 0.55, "learning_rate": 0.0002181880393280125, "loss": 0.0244, "step": 210410 }, { "epoch": 0.55, "learning_rate": 0.00021818415111164103, "loss": 0.0186, "step": 210420 }, { "epoch": 0.55, "learning_rate": 0.00021818026289526957, "loss": 0.0306, "step": 210430 }, { "epoch": 0.55, "learning_rate": 0.00021817637467889812, "loss": 0.0153, "step": 210440 }, { "epoch": 0.55, "learning_rate": 0.00021817248646252663, "loss": 0.0207, "step": 210450 }, { "epoch": 0.55, "learning_rate": 0.00021816859824615517, "loss": 0.0149, "step": 210460 }, { "epoch": 0.55, "learning_rate": 0.00021816471002978374, "loss": 0.0227, "step": 210470 }, { "epoch": 0.55, "learning_rate": 0.00021816082181341226, "loss": 0.0203, "step": 210480 }, { "epoch": 0.55, "learning_rate": 0.0002181569335970408, "loss": 0.0188, "step": 210490 }, { "epoch": 0.55, "learning_rate": 0.0002181530453806693, "loss": 0.0183, "step": 210500 }, { "epoch": 0.55, "learning_rate": 0.00021814915716429788, "loss": 0.0183, "step": 210510 }, { "epoch": 0.55, "learning_rate": 0.0002181452689479264, "loss": 0.0127, "step": 210520 }, { "epoch": 0.55, "learning_rate": 0.00021814138073155494, "loss": 0.0204, "step": 210530 }, { "epoch": 0.55, "learning_rate": 0.00021813749251518345, "loss": 0.0157, "step": 210540 }, { "epoch": 0.55, "learning_rate": 0.00021813360429881202, "loss": 0.0172, "step": 210550 }, { "epoch": 0.55, "learning_rate": 0.00021812971608244053, "loss": 0.0163, "step": 210560 }, { "epoch": 0.55, "learning_rate": 0.00021812582786606908, "loss": 0.0155, "step": 210570 }, { "epoch": 0.55, "learning_rate": 0.0002181219396496976, "loss": 0.0176, "step": 210580 }, { "epoch": 0.55, "learning_rate": 0.00021811805143332616, "loss": 0.0161, "step": 210590 }, { "epoch": 0.55, "learning_rate": 0.00021811416321695467, "loss": 0.0155, "step": 210600 }, { "epoch": 0.55, "learning_rate": 0.00021811027500058322, "loss": 0.0162, "step": 210610 }, { "epoch": 0.55, "learning_rate": 0.00021810638678421173, "loss": 0.0199, "step": 210620 }, { "epoch": 0.55, "learning_rate": 0.0002181024985678403, "loss": 0.0205, "step": 210630 }, { "epoch": 0.55, "learning_rate": 0.00021809861035146884, "loss": 0.0201, "step": 210640 }, { "epoch": 0.55, "learning_rate": 0.00021809472213509735, "loss": 0.0118, "step": 210650 }, { "epoch": 0.55, "learning_rate": 0.00021809083391872587, "loss": 0.0191, "step": 210660 }, { "epoch": 0.55, "learning_rate": 0.0002180869457023544, "loss": 0.0165, "step": 210670 }, { "epoch": 0.55, "learning_rate": 0.00021808305748598298, "loss": 0.0153, "step": 210680 }, { "epoch": 0.55, "learning_rate": 0.0002180791692696115, "loss": 0.0127, "step": 210690 }, { "epoch": 0.55, "learning_rate": 0.00021807528105324004, "loss": 0.0164, "step": 210700 }, { "epoch": 0.55, "learning_rate": 0.00021807139283686855, "loss": 0.0138, "step": 210710 }, { "epoch": 0.55, "learning_rate": 0.00021806750462049712, "loss": 0.0207, "step": 210720 }, { "epoch": 0.55, "learning_rate": 0.00021806361640412563, "loss": 0.0201, "step": 210730 }, { "epoch": 0.55, "learning_rate": 0.00021805972818775418, "loss": 0.0181, "step": 210740 }, { "epoch": 0.55, "learning_rate": 0.0002180558399713827, "loss": 0.0206, "step": 210750 }, { "epoch": 0.55, "learning_rate": 0.00021805195175501126, "loss": 0.0131, "step": 210760 }, { "epoch": 0.55, "learning_rate": 0.00021804806353863977, "loss": 0.0141, "step": 210770 }, { "epoch": 0.55, "learning_rate": 0.00021804417532226831, "loss": 0.0152, "step": 210780 }, { "epoch": 0.55, "learning_rate": 0.00021804028710589683, "loss": 0.0172, "step": 210790 }, { "epoch": 0.55, "learning_rate": 0.0002180363988895254, "loss": 0.0206, "step": 210800 }, { "epoch": 0.55, "learning_rate": 0.0002180325106731539, "loss": 0.0148, "step": 210810 }, { "epoch": 0.55, "learning_rate": 0.00021802862245678245, "loss": 0.0201, "step": 210820 }, { "epoch": 0.55, "learning_rate": 0.00021802473424041097, "loss": 0.0172, "step": 210830 }, { "epoch": 0.55, "learning_rate": 0.00021802084602403954, "loss": 0.0144, "step": 210840 }, { "epoch": 0.55, "learning_rate": 0.00021801695780766808, "loss": 0.0207, "step": 210850 }, { "epoch": 0.55, "learning_rate": 0.0002180130695912966, "loss": 0.0167, "step": 210860 }, { "epoch": 0.55, "learning_rate": 0.00021800918137492514, "loss": 0.0239, "step": 210870 }, { "epoch": 0.55, "learning_rate": 0.00021800529315855368, "loss": 0.017, "step": 210880 }, { "epoch": 0.55, "learning_rate": 0.00021800140494218222, "loss": 0.017, "step": 210890 }, { "epoch": 0.55, "learning_rate": 0.00021799751672581073, "loss": 0.0154, "step": 210900 }, { "epoch": 0.55, "learning_rate": 0.00021799362850943927, "loss": 0.0132, "step": 210910 }, { "epoch": 0.55, "learning_rate": 0.0002179897402930678, "loss": 0.0162, "step": 210920 }, { "epoch": 0.55, "learning_rate": 0.00021798585207669636, "loss": 0.0175, "step": 210930 }, { "epoch": 0.55, "learning_rate": 0.00021798196386032487, "loss": 0.0119, "step": 210940 }, { "epoch": 0.55, "learning_rate": 0.00021797807564395341, "loss": 0.0165, "step": 210950 }, { "epoch": 0.55, "learning_rate": 0.00021797418742758193, "loss": 0.0221, "step": 210960 }, { "epoch": 0.55, "learning_rate": 0.0002179702992112105, "loss": 0.0133, "step": 210970 }, { "epoch": 0.55, "learning_rate": 0.000217966410994839, "loss": 0.0173, "step": 210980 }, { "epoch": 0.55, "learning_rate": 0.00021796252277846755, "loss": 0.0183, "step": 210990 }, { "epoch": 0.55, "learning_rate": 0.00021795863456209607, "loss": 0.015, "step": 211000 }, { "epoch": 0.55, "eval_cer": 0.8817600714374692, "eval_loss": 0.011309986002743244, "eval_runtime": 107.7403, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 211000 }, { "epoch": 0.55, "learning_rate": 0.00021795474634572464, "loss": 0.016, "step": 211010 }, { "epoch": 0.55, "learning_rate": 0.00021795085812935318, "loss": 0.0133, "step": 211020 }, { "epoch": 0.55, "learning_rate": 0.0002179469699129817, "loss": 0.0176, "step": 211030 }, { "epoch": 0.55, "learning_rate": 0.00021794308169661023, "loss": 0.0176, "step": 211040 }, { "epoch": 0.55, "learning_rate": 0.00021793919348023878, "loss": 0.0149, "step": 211050 }, { "epoch": 0.55, "learning_rate": 0.00021793530526386732, "loss": 0.02, "step": 211060 }, { "epoch": 0.55, "learning_rate": 0.00021793141704749583, "loss": 0.0199, "step": 211070 }, { "epoch": 0.55, "learning_rate": 0.00021792752883112437, "loss": 0.019, "step": 211080 }, { "epoch": 0.55, "learning_rate": 0.00021792364061475292, "loss": 0.0177, "step": 211090 }, { "epoch": 0.55, "learning_rate": 0.00021791975239838146, "loss": 0.019, "step": 211100 }, { "epoch": 0.55, "learning_rate": 0.00021791586418200997, "loss": 0.022, "step": 211110 }, { "epoch": 0.55, "learning_rate": 0.00021791197596563851, "loss": 0.0188, "step": 211120 }, { "epoch": 0.55, "learning_rate": 0.00021790808774926706, "loss": 0.017, "step": 211130 }, { "epoch": 0.55, "learning_rate": 0.0002179041995328956, "loss": 0.0182, "step": 211140 }, { "epoch": 0.55, "learning_rate": 0.0002179003113165241, "loss": 0.0125, "step": 211150 }, { "epoch": 0.55, "learning_rate": 0.00021789642310015265, "loss": 0.0171, "step": 211160 }, { "epoch": 0.55, "learning_rate": 0.00021789253488378117, "loss": 0.0148, "step": 211170 }, { "epoch": 0.55, "learning_rate": 0.00021788864666740974, "loss": 0.0191, "step": 211180 }, { "epoch": 0.55, "learning_rate": 0.00021788475845103828, "loss": 0.0156, "step": 211190 }, { "epoch": 0.55, "learning_rate": 0.0002178808702346668, "loss": 0.0189, "step": 211200 }, { "epoch": 0.55, "learning_rate": 0.00021787698201829533, "loss": 0.0165, "step": 211210 }, { "epoch": 0.55, "learning_rate": 0.00021787309380192388, "loss": 0.0203, "step": 211220 }, { "epoch": 0.55, "learning_rate": 0.00021786920558555242, "loss": 0.0145, "step": 211230 }, { "epoch": 0.55, "learning_rate": 0.00021786531736918093, "loss": 0.017, "step": 211240 }, { "epoch": 0.55, "learning_rate": 0.00021786142915280947, "loss": 0.0188, "step": 211250 }, { "epoch": 0.55, "learning_rate": 0.00021785754093643802, "loss": 0.0156, "step": 211260 }, { "epoch": 0.55, "learning_rate": 0.00021785365272006656, "loss": 0.0145, "step": 211270 }, { "epoch": 0.55, "learning_rate": 0.00021784976450369507, "loss": 0.015, "step": 211280 }, { "epoch": 0.55, "learning_rate": 0.0002178458762873236, "loss": 0.0171, "step": 211290 }, { "epoch": 0.55, "learning_rate": 0.00021784198807095215, "loss": 0.0158, "step": 211300 }, { "epoch": 0.55, "learning_rate": 0.0002178380998545807, "loss": 0.016, "step": 211310 }, { "epoch": 0.55, "learning_rate": 0.0002178342116382092, "loss": 0.021, "step": 211320 }, { "epoch": 0.55, "learning_rate": 0.00021783032342183775, "loss": 0.0162, "step": 211330 }, { "epoch": 0.55, "learning_rate": 0.00021782643520546632, "loss": 0.018, "step": 211340 }, { "epoch": 0.55, "learning_rate": 0.00021782254698909484, "loss": 0.0149, "step": 211350 }, { "epoch": 0.55, "learning_rate": 0.00021781865877272338, "loss": 0.0185, "step": 211360 }, { "epoch": 0.55, "learning_rate": 0.0002178147705563519, "loss": 0.0177, "step": 211370 }, { "epoch": 0.55, "learning_rate": 0.00021781088233998046, "loss": 0.0128, "step": 211380 }, { "epoch": 0.55, "learning_rate": 0.00021780699412360898, "loss": 0.018, "step": 211390 }, { "epoch": 0.55, "learning_rate": 0.00021780310590723752, "loss": 0.0176, "step": 211400 }, { "epoch": 0.55, "learning_rate": 0.00021779921769086603, "loss": 0.0137, "step": 211410 }, { "epoch": 0.55, "learning_rate": 0.00021779532947449457, "loss": 0.0185, "step": 211420 }, { "epoch": 0.55, "learning_rate": 0.00021779144125812311, "loss": 0.0161, "step": 211430 }, { "epoch": 0.55, "learning_rate": 0.00021778755304175166, "loss": 0.0161, "step": 211440 }, { "epoch": 0.55, "learning_rate": 0.00021778366482538017, "loss": 0.0195, "step": 211450 }, { "epoch": 0.55, "learning_rate": 0.0002177797766090087, "loss": 0.0153, "step": 211460 }, { "epoch": 0.55, "learning_rate": 0.00021777588839263725, "loss": 0.0148, "step": 211470 }, { "epoch": 0.55, "learning_rate": 0.0002177720001762658, "loss": 0.0186, "step": 211480 }, { "epoch": 0.55, "learning_rate": 0.0002177681119598943, "loss": 0.0162, "step": 211490 }, { "epoch": 0.55, "learning_rate": 0.00021776422374352285, "loss": 0.0173, "step": 211500 }, { "epoch": 0.55, "learning_rate": 0.00021776033552715142, "loss": 0.0184, "step": 211510 }, { "epoch": 0.55, "learning_rate": 0.00021775644731077994, "loss": 0.0148, "step": 211520 }, { "epoch": 0.55, "learning_rate": 0.00021775255909440845, "loss": 0.0192, "step": 211530 }, { "epoch": 0.55, "learning_rate": 0.000217748670878037, "loss": 0.0172, "step": 211540 }, { "epoch": 0.55, "learning_rate": 0.00021774478266166556, "loss": 0.0181, "step": 211550 }, { "epoch": 0.55, "learning_rate": 0.00021774089444529407, "loss": 0.0181, "step": 211560 }, { "epoch": 0.55, "learning_rate": 0.00021773700622892262, "loss": 0.0129, "step": 211570 }, { "epoch": 0.55, "learning_rate": 0.00021773311801255113, "loss": 0.0164, "step": 211580 }, { "epoch": 0.55, "learning_rate": 0.0002177292297961797, "loss": 0.0157, "step": 211590 }, { "epoch": 0.55, "learning_rate": 0.00021772534157980821, "loss": 0.0154, "step": 211600 }, { "epoch": 0.55, "learning_rate": 0.00021772145336343676, "loss": 0.0188, "step": 211610 }, { "epoch": 0.55, "learning_rate": 0.00021771756514706527, "loss": 0.0172, "step": 211620 }, { "epoch": 0.55, "learning_rate": 0.00021771367693069384, "loss": 0.0198, "step": 211630 }, { "epoch": 0.55, "learning_rate": 0.00021770978871432235, "loss": 0.0188, "step": 211640 }, { "epoch": 0.55, "learning_rate": 0.0002177059004979509, "loss": 0.0155, "step": 211650 }, { "epoch": 0.55, "learning_rate": 0.0002177020122815794, "loss": 0.0196, "step": 211660 }, { "epoch": 0.55, "learning_rate": 0.00021769812406520795, "loss": 0.0171, "step": 211670 }, { "epoch": 0.55, "learning_rate": 0.00021769423584883652, "loss": 0.0173, "step": 211680 }, { "epoch": 0.55, "learning_rate": 0.00021769034763246503, "loss": 0.021, "step": 211690 }, { "epoch": 0.55, "learning_rate": 0.00021768645941609355, "loss": 0.0173, "step": 211700 }, { "epoch": 0.55, "learning_rate": 0.0002176825711997221, "loss": 0.0194, "step": 211710 }, { "epoch": 0.55, "learning_rate": 0.00021767868298335066, "loss": 0.0184, "step": 211720 }, { "epoch": 0.55, "learning_rate": 0.00021767479476697917, "loss": 0.0197, "step": 211730 }, { "epoch": 0.55, "learning_rate": 0.00021767090655060772, "loss": 0.0162, "step": 211740 }, { "epoch": 0.55, "learning_rate": 0.00021766701833423623, "loss": 0.018, "step": 211750 }, { "epoch": 0.55, "learning_rate": 0.0002176631301178648, "loss": 0.0165, "step": 211760 }, { "epoch": 0.55, "learning_rate": 0.00021765924190149331, "loss": 0.0151, "step": 211770 }, { "epoch": 0.55, "learning_rate": 0.00021765535368512186, "loss": 0.0145, "step": 211780 }, { "epoch": 0.55, "learning_rate": 0.00021765146546875037, "loss": 0.0158, "step": 211790 }, { "epoch": 0.55, "learning_rate": 0.00021764757725237894, "loss": 0.0183, "step": 211800 }, { "epoch": 0.55, "learning_rate": 0.00021764368903600745, "loss": 0.0208, "step": 211810 }, { "epoch": 0.55, "learning_rate": 0.000217639800819636, "loss": 0.0153, "step": 211820 }, { "epoch": 0.55, "learning_rate": 0.0002176359126032645, "loss": 0.0181, "step": 211830 }, { "epoch": 0.55, "learning_rate": 0.00021763202438689308, "loss": 0.0157, "step": 211840 }, { "epoch": 0.55, "learning_rate": 0.0002176281361705216, "loss": 0.0134, "step": 211850 }, { "epoch": 0.55, "learning_rate": 0.00021762424795415013, "loss": 0.0181, "step": 211860 }, { "epoch": 0.55, "learning_rate": 0.00021762035973777865, "loss": 0.0192, "step": 211870 }, { "epoch": 0.55, "learning_rate": 0.00021761647152140722, "loss": 0.0159, "step": 211880 }, { "epoch": 0.55, "learning_rate": 0.00021761258330503576, "loss": 0.0139, "step": 211890 }, { "epoch": 0.55, "learning_rate": 0.00021760869508866427, "loss": 0.0138, "step": 211900 }, { "epoch": 0.55, "learning_rate": 0.00021760480687229282, "loss": 0.0175, "step": 211910 }, { "epoch": 0.55, "learning_rate": 0.00021760091865592133, "loss": 0.0146, "step": 211920 }, { "epoch": 0.55, "learning_rate": 0.0002175970304395499, "loss": 0.0169, "step": 211930 }, { "epoch": 0.55, "learning_rate": 0.0002175931422231784, "loss": 0.0178, "step": 211940 }, { "epoch": 0.55, "learning_rate": 0.00021758925400680695, "loss": 0.0181, "step": 211950 }, { "epoch": 0.55, "learning_rate": 0.00021758536579043547, "loss": 0.0169, "step": 211960 }, { "epoch": 0.55, "learning_rate": 0.00021758147757406404, "loss": 0.0172, "step": 211970 }, { "epoch": 0.55, "learning_rate": 0.00021757758935769255, "loss": 0.0165, "step": 211980 }, { "epoch": 0.55, "learning_rate": 0.0002175737011413211, "loss": 0.0224, "step": 211990 }, { "epoch": 0.55, "learning_rate": 0.0002175698129249496, "loss": 0.0168, "step": 212000 }, { "epoch": 0.55, "eval_cer": 0.8817446754311932, "eval_loss": 0.011121110990643501, "eval_runtime": 107.2308, "eval_samples_per_second": 18.651, "eval_steps_per_second": 4.663, "step": 212000 }, { "epoch": 0.55, "learning_rate": 0.00021756592470857818, "loss": 0.0188, "step": 212010 }, { "epoch": 0.55, "learning_rate": 0.0002175620364922067, "loss": 0.0154, "step": 212020 }, { "epoch": 0.55, "learning_rate": 0.00021755814827583523, "loss": 0.0143, "step": 212030 }, { "epoch": 0.55, "learning_rate": 0.00021755426005946375, "loss": 0.0141, "step": 212040 }, { "epoch": 0.55, "learning_rate": 0.00021755037184309232, "loss": 0.0171, "step": 212050 }, { "epoch": 0.55, "learning_rate": 0.00021754648362672086, "loss": 0.0209, "step": 212060 }, { "epoch": 0.55, "learning_rate": 0.00021754259541034937, "loss": 0.0235, "step": 212070 }, { "epoch": 0.55, "learning_rate": 0.00021753870719397791, "loss": 0.0169, "step": 212080 }, { "epoch": 0.55, "learning_rate": 0.00021753481897760646, "loss": 0.0176, "step": 212090 }, { "epoch": 0.55, "learning_rate": 0.000217530930761235, "loss": 0.0141, "step": 212100 }, { "epoch": 0.55, "learning_rate": 0.0002175270425448635, "loss": 0.018, "step": 212110 }, { "epoch": 0.55, "learning_rate": 0.00021752315432849205, "loss": 0.0165, "step": 212120 }, { "epoch": 0.55, "learning_rate": 0.0002175192661121206, "loss": 0.017, "step": 212130 }, { "epoch": 0.55, "learning_rate": 0.00021751537789574914, "loss": 0.016, "step": 212140 }, { "epoch": 0.55, "learning_rate": 0.00021751148967937765, "loss": 0.0176, "step": 212150 }, { "epoch": 0.55, "learning_rate": 0.0002175076014630062, "loss": 0.0189, "step": 212160 }, { "epoch": 0.55, "learning_rate": 0.0002175037132466347, "loss": 0.0157, "step": 212170 }, { "epoch": 0.55, "learning_rate": 0.00021749982503026328, "loss": 0.016, "step": 212180 }, { "epoch": 0.55, "learning_rate": 0.0002174959368138918, "loss": 0.0188, "step": 212190 }, { "epoch": 0.55, "learning_rate": 0.00021749204859752033, "loss": 0.0154, "step": 212200 }, { "epoch": 0.55, "learning_rate": 0.00021748816038114885, "loss": 0.0158, "step": 212210 }, { "epoch": 0.55, "learning_rate": 0.00021748427216477742, "loss": 0.0134, "step": 212220 }, { "epoch": 0.55, "learning_rate": 0.00021748038394840596, "loss": 0.0188, "step": 212230 }, { "epoch": 0.55, "learning_rate": 0.00021747649573203447, "loss": 0.016, "step": 212240 }, { "epoch": 0.55, "learning_rate": 0.000217472607515663, "loss": 0.0153, "step": 212250 }, { "epoch": 0.55, "learning_rate": 0.00021746871929929156, "loss": 0.0188, "step": 212260 }, { "epoch": 0.55, "learning_rate": 0.0002174648310829201, "loss": 0.0165, "step": 212270 }, { "epoch": 0.55, "learning_rate": 0.0002174609428665486, "loss": 0.0174, "step": 212280 }, { "epoch": 0.55, "learning_rate": 0.00021745705465017715, "loss": 0.0203, "step": 212290 }, { "epoch": 0.55, "learning_rate": 0.0002174531664338057, "loss": 0.0201, "step": 212300 }, { "epoch": 0.55, "learning_rate": 0.00021744927821743424, "loss": 0.0196, "step": 212310 }, { "epoch": 0.55, "learning_rate": 0.00021744539000106275, "loss": 0.0208, "step": 212320 }, { "epoch": 0.55, "learning_rate": 0.0002174415017846913, "loss": 0.0173, "step": 212330 }, { "epoch": 0.55, "learning_rate": 0.00021743761356831983, "loss": 0.011, "step": 212340 }, { "epoch": 0.55, "learning_rate": 0.00021743372535194838, "loss": 0.0181, "step": 212350 }, { "epoch": 0.55, "learning_rate": 0.0002174298371355769, "loss": 0.0183, "step": 212360 }, { "epoch": 0.55, "learning_rate": 0.00021742594891920543, "loss": 0.0152, "step": 212370 }, { "epoch": 0.55, "learning_rate": 0.00021742206070283395, "loss": 0.0177, "step": 212380 }, { "epoch": 0.55, "learning_rate": 0.00021741817248646252, "loss": 0.0164, "step": 212390 }, { "epoch": 0.55, "learning_rate": 0.00021741428427009103, "loss": 0.022, "step": 212400 }, { "epoch": 0.55, "learning_rate": 0.00021741039605371957, "loss": 0.0193, "step": 212410 }, { "epoch": 0.55, "learning_rate": 0.00021740650783734809, "loss": 0.0173, "step": 212420 }, { "epoch": 0.55, "learning_rate": 0.00021740261962097666, "loss": 0.0208, "step": 212430 }, { "epoch": 0.55, "learning_rate": 0.0002173987314046052, "loss": 0.0136, "step": 212440 }, { "epoch": 0.55, "learning_rate": 0.0002173948431882337, "loss": 0.0165, "step": 212450 }, { "epoch": 0.55, "learning_rate": 0.00021739095497186225, "loss": 0.0199, "step": 212460 }, { "epoch": 0.55, "learning_rate": 0.0002173870667554908, "loss": 0.0111, "step": 212470 }, { "epoch": 0.55, "learning_rate": 0.00021738317853911934, "loss": 0.0149, "step": 212480 }, { "epoch": 0.55, "learning_rate": 0.00021737929032274785, "loss": 0.0176, "step": 212490 }, { "epoch": 0.55, "learning_rate": 0.0002173754021063764, "loss": 0.0162, "step": 212500 }, { "epoch": 0.55, "learning_rate": 0.00021737151389000493, "loss": 0.0179, "step": 212510 }, { "epoch": 0.55, "learning_rate": 0.00021736762567363348, "loss": 0.0162, "step": 212520 }, { "epoch": 0.55, "learning_rate": 0.000217363737457262, "loss": 0.0166, "step": 212530 }, { "epoch": 0.55, "learning_rate": 0.00021735984924089053, "loss": 0.0149, "step": 212540 }, { "epoch": 0.55, "learning_rate": 0.0002173559610245191, "loss": 0.0167, "step": 212550 }, { "epoch": 0.55, "learning_rate": 0.00021735207280814762, "loss": 0.0189, "step": 212560 }, { "epoch": 0.55, "learning_rate": 0.00021734818459177613, "loss": 0.0149, "step": 212570 }, { "epoch": 0.55, "learning_rate": 0.00021734429637540467, "loss": 0.0155, "step": 212580 }, { "epoch": 0.55, "learning_rate": 0.00021734040815903324, "loss": 0.0148, "step": 212590 }, { "epoch": 0.55, "learning_rate": 0.00021733651994266175, "loss": 0.0162, "step": 212600 }, { "epoch": 0.55, "learning_rate": 0.0002173326317262903, "loss": 0.0184, "step": 212610 }, { "epoch": 0.55, "learning_rate": 0.0002173287435099188, "loss": 0.0165, "step": 212620 }, { "epoch": 0.55, "learning_rate": 0.00021732485529354735, "loss": 0.0175, "step": 212630 }, { "epoch": 0.55, "learning_rate": 0.0002173209670771759, "loss": 0.0178, "step": 212640 }, { "epoch": 0.55, "learning_rate": 0.00021731707886080444, "loss": 0.0183, "step": 212650 }, { "epoch": 0.55, "learning_rate": 0.00021731319064443295, "loss": 0.0139, "step": 212660 }, { "epoch": 0.55, "learning_rate": 0.0002173093024280615, "loss": 0.0216, "step": 212670 }, { "epoch": 0.55, "learning_rate": 0.00021730541421169003, "loss": 0.0168, "step": 212680 }, { "epoch": 0.55, "learning_rate": 0.00021730152599531858, "loss": 0.0176, "step": 212690 }, { "epoch": 0.55, "learning_rate": 0.0002172976377789471, "loss": 0.0181, "step": 212700 }, { "epoch": 0.55, "learning_rate": 0.00021729374956257563, "loss": 0.0179, "step": 212710 }, { "epoch": 0.55, "learning_rate": 0.00021728986134620417, "loss": 0.0122, "step": 212720 }, { "epoch": 0.55, "learning_rate": 0.00021728597312983271, "loss": 0.0116, "step": 212730 }, { "epoch": 0.55, "learning_rate": 0.00021728208491346123, "loss": 0.0154, "step": 212740 }, { "epoch": 0.55, "learning_rate": 0.00021727819669708977, "loss": 0.0135, "step": 212750 }, { "epoch": 0.55, "learning_rate": 0.00021727430848071834, "loss": 0.0159, "step": 212760 }, { "epoch": 0.55, "learning_rate": 0.00021727042026434685, "loss": 0.0199, "step": 212770 }, { "epoch": 0.55, "learning_rate": 0.0002172665320479754, "loss": 0.0156, "step": 212780 }, { "epoch": 0.55, "learning_rate": 0.0002172626438316039, "loss": 0.0147, "step": 212790 }, { "epoch": 0.55, "learning_rate": 0.00021725875561523248, "loss": 0.0157, "step": 212800 }, { "epoch": 0.55, "learning_rate": 0.000217254867398861, "loss": 0.0214, "step": 212810 }, { "epoch": 0.55, "learning_rate": 0.00021725097918248954, "loss": 0.0143, "step": 212820 }, { "epoch": 0.55, "learning_rate": 0.00021724709096611805, "loss": 0.0207, "step": 212830 }, { "epoch": 0.55, "learning_rate": 0.00021724320274974662, "loss": 0.0172, "step": 212840 }, { "epoch": 0.55, "learning_rate": 0.00021723931453337513, "loss": 0.0162, "step": 212850 }, { "epoch": 0.55, "learning_rate": 0.00021723542631700367, "loss": 0.0164, "step": 212860 }, { "epoch": 0.55, "learning_rate": 0.0002172315381006322, "loss": 0.023, "step": 212870 }, { "epoch": 0.55, "learning_rate": 0.00021722764988426073, "loss": 0.0188, "step": 212880 }, { "epoch": 0.55, "learning_rate": 0.00021722376166788927, "loss": 0.0131, "step": 212890 }, { "epoch": 0.55, "learning_rate": 0.00021721987345151781, "loss": 0.0155, "step": 212900 }, { "epoch": 0.55, "learning_rate": 0.00021721598523514633, "loss": 0.0168, "step": 212910 }, { "epoch": 0.55, "learning_rate": 0.00021721209701877487, "loss": 0.0152, "step": 212920 }, { "epoch": 0.55, "learning_rate": 0.00021720820880240344, "loss": 0.0168, "step": 212930 }, { "epoch": 0.55, "learning_rate": 0.00021720432058603195, "loss": 0.02, "step": 212940 }, { "epoch": 0.55, "learning_rate": 0.0002172004323696605, "loss": 0.0149, "step": 212950 }, { "epoch": 0.55, "learning_rate": 0.000217196544153289, "loss": 0.016, "step": 212960 }, { "epoch": 0.55, "learning_rate": 0.00021719265593691758, "loss": 0.0228, "step": 212970 }, { "epoch": 0.55, "learning_rate": 0.0002171887677205461, "loss": 0.0157, "step": 212980 }, { "epoch": 0.55, "learning_rate": 0.00021718487950417463, "loss": 0.0197, "step": 212990 }, { "epoch": 0.55, "learning_rate": 0.00021718099128780315, "loss": 0.018, "step": 213000 }, { "epoch": 0.55, "eval_cer": 0.8817586718005349, "eval_loss": 0.01114367600530386, "eval_runtime": 107.9769, "eval_samples_per_second": 18.522, "eval_steps_per_second": 4.631, "step": 213000 }, { "epoch": 0.55, "learning_rate": 0.00021717710307143172, "loss": 0.0153, "step": 213010 }, { "epoch": 0.55, "learning_rate": 0.00021717321485506023, "loss": 0.0135, "step": 213020 }, { "epoch": 0.55, "learning_rate": 0.00021716932663868877, "loss": 0.0158, "step": 213030 }, { "epoch": 0.55, "learning_rate": 0.0002171654384223173, "loss": 0.0152, "step": 213040 }, { "epoch": 0.55, "learning_rate": 0.00021716155020594586, "loss": 0.0231, "step": 213050 }, { "epoch": 0.55, "learning_rate": 0.00021715766198957437, "loss": 0.0182, "step": 213060 }, { "epoch": 0.55, "learning_rate": 0.0002171537737732029, "loss": 0.0122, "step": 213070 }, { "epoch": 0.55, "learning_rate": 0.00021714988555683143, "loss": 0.0183, "step": 213080 }, { "epoch": 0.55, "learning_rate": 0.00021714599734046, "loss": 0.0146, "step": 213090 }, { "epoch": 0.55, "learning_rate": 0.00021714210912408854, "loss": 0.0211, "step": 213100 }, { "epoch": 0.55, "learning_rate": 0.00021713822090771705, "loss": 0.015, "step": 213110 }, { "epoch": 0.55, "learning_rate": 0.00021713433269134557, "loss": 0.0161, "step": 213120 }, { "epoch": 0.55, "learning_rate": 0.0002171304444749741, "loss": 0.0148, "step": 213130 }, { "epoch": 0.55, "learning_rate": 0.00021712655625860268, "loss": 0.0153, "step": 213140 }, { "epoch": 0.55, "learning_rate": 0.0002171226680422312, "loss": 0.0135, "step": 213150 }, { "epoch": 0.55, "learning_rate": 0.00021711877982585973, "loss": 0.0201, "step": 213160 }, { "epoch": 0.55, "learning_rate": 0.00021711489160948825, "loss": 0.0158, "step": 213170 }, { "epoch": 0.55, "learning_rate": 0.00021711100339311682, "loss": 0.0183, "step": 213180 }, { "epoch": 0.55, "learning_rate": 0.00021710711517674533, "loss": 0.0127, "step": 213190 }, { "epoch": 0.55, "learning_rate": 0.00021710322696037387, "loss": 0.0172, "step": 213200 }, { "epoch": 0.55, "learning_rate": 0.0002170993387440024, "loss": 0.0212, "step": 213210 }, { "epoch": 0.55, "learning_rate": 0.00021709545052763096, "loss": 0.0175, "step": 213220 }, { "epoch": 0.55, "learning_rate": 0.00021709156231125947, "loss": 0.0169, "step": 213230 }, { "epoch": 0.55, "learning_rate": 0.000217087674094888, "loss": 0.0178, "step": 213240 }, { "epoch": 0.55, "learning_rate": 0.00021708378587851653, "loss": 0.0139, "step": 213250 }, { "epoch": 0.55, "learning_rate": 0.0002170798976621451, "loss": 0.0214, "step": 213260 }, { "epoch": 0.55, "learning_rate": 0.00021707600944577364, "loss": 0.0176, "step": 213270 }, { "epoch": 0.55, "learning_rate": 0.00021707212122940215, "loss": 0.017, "step": 213280 }, { "epoch": 0.55, "learning_rate": 0.00021706823301303067, "loss": 0.0142, "step": 213290 }, { "epoch": 0.55, "learning_rate": 0.00021706434479665924, "loss": 0.0139, "step": 213300 }, { "epoch": 0.55, "learning_rate": 0.00021706045658028778, "loss": 0.0138, "step": 213310 }, { "epoch": 0.55, "learning_rate": 0.0002170565683639163, "loss": 0.017, "step": 213320 }, { "epoch": 0.55, "learning_rate": 0.00021705268014754483, "loss": 0.0164, "step": 213330 }, { "epoch": 0.55, "learning_rate": 0.00021704879193117337, "loss": 0.0198, "step": 213340 }, { "epoch": 0.55, "learning_rate": 0.00021704490371480192, "loss": 0.0163, "step": 213350 }, { "epoch": 0.55, "learning_rate": 0.00021704101549843043, "loss": 0.0162, "step": 213360 }, { "epoch": 0.55, "learning_rate": 0.00021703712728205897, "loss": 0.0157, "step": 213370 }, { "epoch": 0.55, "learning_rate": 0.0002170332390656875, "loss": 0.0173, "step": 213380 }, { "epoch": 0.55, "learning_rate": 0.00021702935084931606, "loss": 0.0162, "step": 213390 }, { "epoch": 0.55, "learning_rate": 0.00021702546263294457, "loss": 0.0166, "step": 213400 }, { "epoch": 0.55, "learning_rate": 0.0002170215744165731, "loss": 0.0176, "step": 213410 }, { "epoch": 0.55, "learning_rate": 0.00021701768620020163, "loss": 0.0155, "step": 213420 }, { "epoch": 0.55, "learning_rate": 0.0002170137979838302, "loss": 0.0189, "step": 213430 }, { "epoch": 0.55, "learning_rate": 0.0002170099097674587, "loss": 0.0168, "step": 213440 }, { "epoch": 0.55, "learning_rate": 0.00021700602155108725, "loss": 0.0148, "step": 213450 }, { "epoch": 0.55, "learning_rate": 0.00021700213333471577, "loss": 0.0151, "step": 213460 }, { "epoch": 0.55, "learning_rate": 0.00021699824511834433, "loss": 0.0142, "step": 213470 }, { "epoch": 0.55, "learning_rate": 0.00021699435690197288, "loss": 0.0159, "step": 213480 }, { "epoch": 0.55, "learning_rate": 0.0002169904686856014, "loss": 0.0168, "step": 213490 }, { "epoch": 0.55, "learning_rate": 0.00021698658046922993, "loss": 0.0154, "step": 213500 }, { "epoch": 0.55, "learning_rate": 0.00021698269225285847, "loss": 0.0151, "step": 213510 }, { "epoch": 0.55, "learning_rate": 0.00021697880403648702, "loss": 0.0125, "step": 213520 }, { "epoch": 0.55, "learning_rate": 0.00021697491582011553, "loss": 0.0157, "step": 213530 }, { "epoch": 0.55, "learning_rate": 0.00021697102760374407, "loss": 0.0175, "step": 213540 }, { "epoch": 0.55, "learning_rate": 0.00021696713938737261, "loss": 0.0126, "step": 213550 }, { "epoch": 0.55, "learning_rate": 0.00021696325117100116, "loss": 0.0179, "step": 213560 }, { "epoch": 0.55, "learning_rate": 0.00021695936295462967, "loss": 0.0178, "step": 213570 }, { "epoch": 0.55, "learning_rate": 0.0002169554747382582, "loss": 0.0195, "step": 213580 }, { "epoch": 0.55, "learning_rate": 0.00021695158652188675, "loss": 0.0172, "step": 213590 }, { "epoch": 0.55, "learning_rate": 0.0002169476983055153, "loss": 0.0138, "step": 213600 }, { "epoch": 0.55, "learning_rate": 0.0002169438100891438, "loss": 0.0192, "step": 213610 }, { "epoch": 0.55, "learning_rate": 0.00021693992187277235, "loss": 0.017, "step": 213620 }, { "epoch": 0.55, "learning_rate": 0.00021693603365640087, "loss": 0.0172, "step": 213630 }, { "epoch": 0.55, "learning_rate": 0.00021693214544002943, "loss": 0.0141, "step": 213640 }, { "epoch": 0.55, "learning_rate": 0.00021692825722365798, "loss": 0.0137, "step": 213650 }, { "epoch": 0.55, "learning_rate": 0.0002169243690072865, "loss": 0.0146, "step": 213660 }, { "epoch": 0.55, "learning_rate": 0.00021692048079091503, "loss": 0.0139, "step": 213670 }, { "epoch": 0.55, "learning_rate": 0.00021691659257454357, "loss": 0.0143, "step": 213680 }, { "epoch": 0.55, "learning_rate": 0.00021691270435817212, "loss": 0.0177, "step": 213690 }, { "epoch": 0.55, "learning_rate": 0.00021690881614180063, "loss": 0.0148, "step": 213700 }, { "epoch": 0.55, "learning_rate": 0.00021690492792542917, "loss": 0.0181, "step": 213710 }, { "epoch": 0.55, "learning_rate": 0.0002169010397090577, "loss": 0.0162, "step": 213720 }, { "epoch": 0.55, "learning_rate": 0.00021689715149268625, "loss": 0.0164, "step": 213730 }, { "epoch": 0.55, "learning_rate": 0.00021689326327631477, "loss": 0.0163, "step": 213740 }, { "epoch": 0.55, "learning_rate": 0.0002168893750599433, "loss": 0.0151, "step": 213750 }, { "epoch": 0.55, "learning_rate": 0.00021688548684357185, "loss": 0.0172, "step": 213760 }, { "epoch": 0.55, "learning_rate": 0.0002168815986272004, "loss": 0.0184, "step": 213770 }, { "epoch": 0.55, "learning_rate": 0.0002168777104108289, "loss": 0.0119, "step": 213780 }, { "epoch": 0.55, "learning_rate": 0.00021687382219445745, "loss": 0.0241, "step": 213790 }, { "epoch": 0.55, "learning_rate": 0.00021686993397808602, "loss": 0.0164, "step": 213800 }, { "epoch": 0.55, "learning_rate": 0.00021686604576171453, "loss": 0.0145, "step": 213810 }, { "epoch": 0.55, "learning_rate": 0.00021686215754534308, "loss": 0.0145, "step": 213820 }, { "epoch": 0.55, "learning_rate": 0.0002168582693289716, "loss": 0.0144, "step": 213830 }, { "epoch": 0.55, "learning_rate": 0.00021685438111260016, "loss": 0.014, "step": 213840 }, { "epoch": 0.55, "learning_rate": 0.00021685049289622867, "loss": 0.0156, "step": 213850 }, { "epoch": 0.55, "learning_rate": 0.00021684660467985721, "loss": 0.0186, "step": 213860 }, { "epoch": 0.55, "learning_rate": 0.00021684271646348573, "loss": 0.0183, "step": 213870 }, { "epoch": 0.55, "learning_rate": 0.00021683882824711427, "loss": 0.0344, "step": 213880 }, { "epoch": 0.55, "learning_rate": 0.0002168349400307428, "loss": 0.0184, "step": 213890 }, { "epoch": 0.55, "learning_rate": 0.00021683105181437135, "loss": 0.0183, "step": 213900 }, { "epoch": 0.55, "learning_rate": 0.00021682716359799987, "loss": 0.0184, "step": 213910 }, { "epoch": 0.55, "learning_rate": 0.0002168232753816284, "loss": 0.0158, "step": 213920 }, { "epoch": 0.55, "learning_rate": 0.00021681938716525695, "loss": 0.0132, "step": 213930 }, { "epoch": 0.55, "learning_rate": 0.0002168154989488855, "loss": 0.0166, "step": 213940 }, { "epoch": 0.55, "learning_rate": 0.000216811610732514, "loss": 0.0205, "step": 213950 }, { "epoch": 0.55, "learning_rate": 0.00021680772251614255, "loss": 0.0173, "step": 213960 }, { "epoch": 0.55, "learning_rate": 0.00021680383429977112, "loss": 0.0186, "step": 213970 }, { "epoch": 0.55, "learning_rate": 0.00021679994608339963, "loss": 0.0197, "step": 213980 }, { "epoch": 0.55, "learning_rate": 0.00021679605786702815, "loss": 0.0146, "step": 213990 }, { "epoch": 0.55, "learning_rate": 0.0002167921696506567, "loss": 0.0189, "step": 214000 }, { "epoch": 0.55, "eval_cer": 0.8817418761573248, "eval_loss": 0.01149623654782772, "eval_runtime": 107.8487, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 214000 }, { "epoch": 0.55, "learning_rate": 0.00021678828143428526, "loss": 0.0176, "step": 214010 }, { "epoch": 0.55, "learning_rate": 0.00021678439321791377, "loss": 0.0185, "step": 214020 }, { "epoch": 0.55, "learning_rate": 0.00021678050500154231, "loss": 0.0148, "step": 214030 }, { "epoch": 0.55, "learning_rate": 0.00021677661678517083, "loss": 0.0218, "step": 214040 }, { "epoch": 0.55, "learning_rate": 0.0002167727285687994, "loss": 0.0146, "step": 214050 }, { "epoch": 0.55, "learning_rate": 0.0002167688403524279, "loss": 0.0157, "step": 214060 }, { "epoch": 0.55, "learning_rate": 0.00021676495213605645, "loss": 0.0136, "step": 214070 }, { "epoch": 0.55, "learning_rate": 0.00021676106391968497, "loss": 0.0162, "step": 214080 }, { "epoch": 0.55, "learning_rate": 0.00021675717570331354, "loss": 0.0186, "step": 214090 }, { "epoch": 0.55, "learning_rate": 0.00021675328748694205, "loss": 0.0148, "step": 214100 }, { "epoch": 0.56, "learning_rate": 0.0002167493992705706, "loss": 0.0162, "step": 214110 }, { "epoch": 0.56, "learning_rate": 0.0002167455110541991, "loss": 0.0184, "step": 214120 }, { "epoch": 0.56, "learning_rate": 0.00021674162283782765, "loss": 0.0185, "step": 214130 }, { "epoch": 0.56, "learning_rate": 0.00021673773462145622, "loss": 0.0155, "step": 214140 }, { "epoch": 0.56, "learning_rate": 0.00021673384640508473, "loss": 0.0198, "step": 214150 }, { "epoch": 0.56, "learning_rate": 0.00021672995818871325, "loss": 0.0214, "step": 214160 }, { "epoch": 0.56, "learning_rate": 0.0002167260699723418, "loss": 0.0177, "step": 214170 }, { "epoch": 0.56, "learning_rate": 0.00021672218175597036, "loss": 0.0154, "step": 214180 }, { "epoch": 0.56, "learning_rate": 0.00021671829353959887, "loss": 0.0162, "step": 214190 }, { "epoch": 0.56, "learning_rate": 0.00021671440532322741, "loss": 0.0169, "step": 214200 }, { "epoch": 0.56, "learning_rate": 0.00021671051710685593, "loss": 0.0231, "step": 214210 }, { "epoch": 0.56, "learning_rate": 0.0002167066288904845, "loss": 0.0166, "step": 214220 }, { "epoch": 0.56, "learning_rate": 0.000216702740674113, "loss": 0.0165, "step": 214230 }, { "epoch": 0.56, "learning_rate": 0.00021669885245774155, "loss": 0.0181, "step": 214240 }, { "epoch": 0.56, "learning_rate": 0.00021669496424137007, "loss": 0.0158, "step": 214250 }, { "epoch": 0.56, "learning_rate": 0.00021669107602499864, "loss": 0.0229, "step": 214260 }, { "epoch": 0.56, "learning_rate": 0.00021668718780862715, "loss": 0.0194, "step": 214270 }, { "epoch": 0.56, "learning_rate": 0.0002166832995922557, "loss": 0.0161, "step": 214280 }, { "epoch": 0.56, "learning_rate": 0.0002166794113758842, "loss": 0.0161, "step": 214290 }, { "epoch": 0.56, "learning_rate": 0.00021667552315951278, "loss": 0.018, "step": 214300 }, { "epoch": 0.56, "learning_rate": 0.0002166716349431413, "loss": 0.0168, "step": 214310 }, { "epoch": 0.56, "learning_rate": 0.00021666774672676983, "loss": 0.0163, "step": 214320 }, { "epoch": 0.56, "learning_rate": 0.00021666385851039835, "loss": 0.0173, "step": 214330 }, { "epoch": 0.56, "learning_rate": 0.00021665997029402692, "loss": 0.0145, "step": 214340 }, { "epoch": 0.56, "learning_rate": 0.00021665608207765546, "loss": 0.0169, "step": 214350 }, { "epoch": 0.56, "learning_rate": 0.00021665219386128397, "loss": 0.0136, "step": 214360 }, { "epoch": 0.56, "learning_rate": 0.0002166483056449125, "loss": 0.0151, "step": 214370 }, { "epoch": 0.56, "learning_rate": 0.00021664441742854103, "loss": 0.0172, "step": 214380 }, { "epoch": 0.56, "learning_rate": 0.0002166405292121696, "loss": 0.0235, "step": 214390 }, { "epoch": 0.56, "learning_rate": 0.0002166366409957981, "loss": 0.017, "step": 214400 }, { "epoch": 0.56, "learning_rate": 0.00021663275277942665, "loss": 0.0196, "step": 214410 }, { "epoch": 0.56, "learning_rate": 0.00021662886456305517, "loss": 0.019, "step": 214420 }, { "epoch": 0.56, "learning_rate": 0.00021662497634668374, "loss": 0.0193, "step": 214430 }, { "epoch": 0.56, "learning_rate": 0.00021662108813031225, "loss": 0.0147, "step": 214440 }, { "epoch": 0.56, "learning_rate": 0.0002166171999139408, "loss": 0.0169, "step": 214450 }, { "epoch": 0.56, "learning_rate": 0.0002166133116975693, "loss": 0.0152, "step": 214460 }, { "epoch": 0.56, "learning_rate": 0.00021660942348119788, "loss": 0.0175, "step": 214470 }, { "epoch": 0.56, "learning_rate": 0.0002166055352648264, "loss": 0.0202, "step": 214480 }, { "epoch": 0.56, "learning_rate": 0.00021660164704845493, "loss": 0.02, "step": 214490 }, { "epoch": 0.56, "learning_rate": 0.00021659775883208345, "loss": 0.017, "step": 214500 }, { "epoch": 0.56, "learning_rate": 0.00021659387061571201, "loss": 0.0166, "step": 214510 }, { "epoch": 0.56, "learning_rate": 0.00021658998239934056, "loss": 0.0263, "step": 214520 }, { "epoch": 0.56, "learning_rate": 0.00021658609418296907, "loss": 0.0191, "step": 214530 }, { "epoch": 0.56, "learning_rate": 0.0002165822059665976, "loss": 0.0155, "step": 214540 }, { "epoch": 0.56, "learning_rate": 0.00021657831775022615, "loss": 0.0204, "step": 214550 }, { "epoch": 0.56, "learning_rate": 0.0002165744295338547, "loss": 0.0172, "step": 214560 }, { "epoch": 0.56, "learning_rate": 0.0002165705413174832, "loss": 0.0176, "step": 214570 }, { "epoch": 0.56, "learning_rate": 0.00021656665310111175, "loss": 0.018, "step": 214580 }, { "epoch": 0.56, "learning_rate": 0.0002165627648847403, "loss": 0.0171, "step": 214590 }, { "epoch": 0.56, "learning_rate": 0.00021655887666836884, "loss": 0.0218, "step": 214600 }, { "epoch": 0.56, "learning_rate": 0.00021655498845199735, "loss": 0.0154, "step": 214610 }, { "epoch": 0.56, "learning_rate": 0.0002165511002356259, "loss": 0.0166, "step": 214620 }, { "epoch": 0.56, "learning_rate": 0.0002165472120192544, "loss": 0.0182, "step": 214630 }, { "epoch": 0.56, "learning_rate": 0.00021654332380288297, "loss": 0.0181, "step": 214640 }, { "epoch": 0.56, "learning_rate": 0.0002165394355865115, "loss": 0.0155, "step": 214650 }, { "epoch": 0.56, "learning_rate": 0.00021653554737014003, "loss": 0.0149, "step": 214660 }, { "epoch": 0.56, "learning_rate": 0.00021653165915376855, "loss": 0.0175, "step": 214670 }, { "epoch": 0.56, "learning_rate": 0.00021652777093739711, "loss": 0.0202, "step": 214680 }, { "epoch": 0.56, "learning_rate": 0.00021652388272102566, "loss": 0.0122, "step": 214690 }, { "epoch": 0.56, "learning_rate": 0.00021651999450465417, "loss": 0.0191, "step": 214700 }, { "epoch": 0.56, "learning_rate": 0.00021651610628828268, "loss": 0.0125, "step": 214710 }, { "epoch": 0.56, "learning_rate": 0.00021651221807191125, "loss": 0.0153, "step": 214720 }, { "epoch": 0.56, "learning_rate": 0.0002165083298555398, "loss": 0.0138, "step": 214730 }, { "epoch": 0.56, "learning_rate": 0.0002165044416391683, "loss": 0.0172, "step": 214740 }, { "epoch": 0.56, "learning_rate": 0.00021650055342279685, "loss": 0.0165, "step": 214750 }, { "epoch": 0.56, "learning_rate": 0.0002164966652064254, "loss": 0.0161, "step": 214760 }, { "epoch": 0.56, "learning_rate": 0.00021649277699005393, "loss": 0.0198, "step": 214770 }, { "epoch": 0.56, "learning_rate": 0.00021648888877368245, "loss": 0.0179, "step": 214780 }, { "epoch": 0.56, "learning_rate": 0.000216485000557311, "loss": 0.013, "step": 214790 }, { "epoch": 0.56, "learning_rate": 0.00021648111234093953, "loss": 0.0169, "step": 214800 }, { "epoch": 0.56, "learning_rate": 0.00021647722412456807, "loss": 0.0184, "step": 214810 }, { "epoch": 0.56, "learning_rate": 0.0002164733359081966, "loss": 0.0209, "step": 214820 }, { "epoch": 0.56, "learning_rate": 0.00021646944769182513, "loss": 0.0179, "step": 214830 }, { "epoch": 0.56, "learning_rate": 0.0002164655594754537, "loss": 0.0149, "step": 214840 }, { "epoch": 0.56, "learning_rate": 0.00021646167125908221, "loss": 0.0164, "step": 214850 }, { "epoch": 0.56, "learning_rate": 0.00021645778304271076, "loss": 0.0137, "step": 214860 }, { "epoch": 0.56, "learning_rate": 0.00021645389482633927, "loss": 0.0142, "step": 214870 }, { "epoch": 0.56, "learning_rate": 0.00021645000660996778, "loss": 0.0179, "step": 214880 }, { "epoch": 0.56, "learning_rate": 0.00021644611839359635, "loss": 0.0156, "step": 214890 }, { "epoch": 0.56, "learning_rate": 0.0002164422301772249, "loss": 0.0143, "step": 214900 }, { "epoch": 0.56, "learning_rate": 0.0002164383419608534, "loss": 0.0188, "step": 214910 }, { "epoch": 0.56, "learning_rate": 0.00021643445374448195, "loss": 0.0142, "step": 214920 }, { "epoch": 0.56, "learning_rate": 0.0002164305655281105, "loss": 0.0165, "step": 214930 }, { "epoch": 0.56, "learning_rate": 0.00021642667731173903, "loss": 0.0185, "step": 214940 }, { "epoch": 0.56, "learning_rate": 0.00021642278909536755, "loss": 0.0132, "step": 214950 }, { "epoch": 0.56, "learning_rate": 0.0002164189008789961, "loss": 0.0207, "step": 214960 }, { "epoch": 0.56, "learning_rate": 0.00021641501266262463, "loss": 0.0184, "step": 214970 }, { "epoch": 0.56, "learning_rate": 0.00021641112444625317, "loss": 0.0213, "step": 214980 }, { "epoch": 0.56, "learning_rate": 0.0002164072362298817, "loss": 0.0148, "step": 214990 }, { "epoch": 0.56, "learning_rate": 0.00021640334801351023, "loss": 0.0152, "step": 215000 }, { "epoch": 0.56, "eval_cer": 0.8817292794249172, "eval_loss": 0.011770045384764671, "eval_runtime": 107.7843, "eval_samples_per_second": 18.556, "eval_steps_per_second": 4.639, "step": 215000 }, { "epoch": 0.56, "learning_rate": 0.0002163994597971388, "loss": 0.0123, "step": 215010 }, { "epoch": 0.56, "learning_rate": 0.0002163955715807673, "loss": 0.0195, "step": 215020 }, { "epoch": 0.56, "learning_rate": 0.00021639168336439583, "loss": 0.0231, "step": 215030 }, { "epoch": 0.56, "learning_rate": 0.00021638779514802437, "loss": 0.0146, "step": 215040 }, { "epoch": 0.56, "learning_rate": 0.00021638390693165294, "loss": 0.015, "step": 215050 }, { "epoch": 0.56, "learning_rate": 0.00021638001871528145, "loss": 0.0146, "step": 215060 }, { "epoch": 0.56, "learning_rate": 0.00021637613049891, "loss": 0.0158, "step": 215070 }, { "epoch": 0.56, "learning_rate": 0.0002163722422825385, "loss": 0.0238, "step": 215080 }, { "epoch": 0.56, "learning_rate": 0.00021636835406616708, "loss": 0.0197, "step": 215090 }, { "epoch": 0.56, "learning_rate": 0.0002163644658497956, "loss": 0.0186, "step": 215100 }, { "epoch": 0.56, "learning_rate": 0.00021636057763342413, "loss": 0.0187, "step": 215110 }, { "epoch": 0.56, "learning_rate": 0.00021635668941705265, "loss": 0.0184, "step": 215120 }, { "epoch": 0.56, "learning_rate": 0.0002163528012006812, "loss": 0.0169, "step": 215130 }, { "epoch": 0.56, "learning_rate": 0.00021634891298430973, "loss": 0.0151, "step": 215140 }, { "epoch": 0.56, "learning_rate": 0.00021634502476793827, "loss": 0.0169, "step": 215150 }, { "epoch": 0.56, "learning_rate": 0.0002163411365515668, "loss": 0.0213, "step": 215160 }, { "epoch": 0.56, "learning_rate": 0.00021633724833519533, "loss": 0.0193, "step": 215170 }, { "epoch": 0.56, "learning_rate": 0.00021633336011882387, "loss": 0.0173, "step": 215180 }, { "epoch": 0.56, "learning_rate": 0.0002163294719024524, "loss": 0.0164, "step": 215190 }, { "epoch": 0.56, "learning_rate": 0.00021632558368608093, "loss": 0.0142, "step": 215200 }, { "epoch": 0.56, "learning_rate": 0.00021632169546970947, "loss": 0.0129, "step": 215210 }, { "epoch": 0.56, "learning_rate": 0.00021631780725333804, "loss": 0.0167, "step": 215220 }, { "epoch": 0.56, "learning_rate": 0.00021631391903696655, "loss": 0.0128, "step": 215230 }, { "epoch": 0.56, "learning_rate": 0.0002163100308205951, "loss": 0.0187, "step": 215240 }, { "epoch": 0.56, "learning_rate": 0.0002163061426042236, "loss": 0.0167, "step": 215250 }, { "epoch": 0.56, "learning_rate": 0.00021630225438785218, "loss": 0.0154, "step": 215260 }, { "epoch": 0.56, "learning_rate": 0.0002162983661714807, "loss": 0.017, "step": 215270 }, { "epoch": 0.56, "learning_rate": 0.00021629447795510923, "loss": 0.0157, "step": 215280 }, { "epoch": 0.56, "learning_rate": 0.00021629058973873775, "loss": 0.0153, "step": 215290 }, { "epoch": 0.56, "learning_rate": 0.00021628670152236632, "loss": 0.0158, "step": 215300 }, { "epoch": 0.56, "learning_rate": 0.00021628281330599483, "loss": 0.0137, "step": 215310 }, { "epoch": 0.56, "learning_rate": 0.00021627892508962337, "loss": 0.0192, "step": 215320 }, { "epoch": 0.56, "learning_rate": 0.0002162750368732519, "loss": 0.0133, "step": 215330 }, { "epoch": 0.56, "learning_rate": 0.00021627114865688046, "loss": 0.0158, "step": 215340 }, { "epoch": 0.56, "learning_rate": 0.00021626726044050897, "loss": 0.0126, "step": 215350 }, { "epoch": 0.56, "learning_rate": 0.0002162633722241375, "loss": 0.0137, "step": 215360 }, { "epoch": 0.56, "learning_rate": 0.00021625948400776603, "loss": 0.0178, "step": 215370 }, { "epoch": 0.56, "learning_rate": 0.00021625559579139457, "loss": 0.0203, "step": 215380 }, { "epoch": 0.56, "learning_rate": 0.00021625170757502314, "loss": 0.0195, "step": 215390 }, { "epoch": 0.56, "learning_rate": 0.00021624781935865165, "loss": 0.0129, "step": 215400 }, { "epoch": 0.56, "learning_rate": 0.0002162439311422802, "loss": 0.016, "step": 215410 }, { "epoch": 0.56, "learning_rate": 0.0002162400429259087, "loss": 0.0162, "step": 215420 }, { "epoch": 0.56, "learning_rate": 0.00021623615470953728, "loss": 0.0141, "step": 215430 }, { "epoch": 0.56, "learning_rate": 0.0002162322664931658, "loss": 0.0139, "step": 215440 }, { "epoch": 0.56, "learning_rate": 0.00021622837827679433, "loss": 0.0155, "step": 215450 }, { "epoch": 0.56, "learning_rate": 0.00021622449006042285, "loss": 0.0199, "step": 215460 }, { "epoch": 0.56, "learning_rate": 0.00021622060184405142, "loss": 0.0144, "step": 215470 }, { "epoch": 0.56, "learning_rate": 0.00021621671362767993, "loss": 0.0215, "step": 215480 }, { "epoch": 0.56, "learning_rate": 0.00021621282541130847, "loss": 0.0156, "step": 215490 }, { "epoch": 0.56, "learning_rate": 0.00021620893719493699, "loss": 0.0153, "step": 215500 }, { "epoch": 0.56, "learning_rate": 0.00021620504897856556, "loss": 0.0157, "step": 215510 }, { "epoch": 0.56, "learning_rate": 0.00021620116076219407, "loss": 0.0168, "step": 215520 }, { "epoch": 0.56, "learning_rate": 0.0002161972725458226, "loss": 0.0218, "step": 215530 }, { "epoch": 0.56, "learning_rate": 0.00021619338432945113, "loss": 0.0199, "step": 215540 }, { "epoch": 0.56, "learning_rate": 0.0002161894961130797, "loss": 0.017, "step": 215550 }, { "epoch": 0.56, "learning_rate": 0.00021618560789670824, "loss": 0.0174, "step": 215560 }, { "epoch": 0.56, "learning_rate": 0.00021618171968033675, "loss": 0.0189, "step": 215570 }, { "epoch": 0.56, "learning_rate": 0.00021617783146396527, "loss": 0.019, "step": 215580 }, { "epoch": 0.56, "learning_rate": 0.00021617394324759383, "loss": 0.0153, "step": 215590 }, { "epoch": 0.56, "learning_rate": 0.00021617005503122238, "loss": 0.0119, "step": 215600 }, { "epoch": 0.56, "learning_rate": 0.0002161661668148509, "loss": 0.0186, "step": 215610 }, { "epoch": 0.56, "learning_rate": 0.00021616227859847943, "loss": 0.0146, "step": 215620 }, { "epoch": 0.56, "learning_rate": 0.00021615839038210795, "loss": 0.0141, "step": 215630 }, { "epoch": 0.56, "learning_rate": 0.00021615450216573652, "loss": 0.0173, "step": 215640 }, { "epoch": 0.56, "learning_rate": 0.00021615061394936503, "loss": 0.0139, "step": 215650 }, { "epoch": 0.56, "learning_rate": 0.00021614672573299357, "loss": 0.0157, "step": 215660 }, { "epoch": 0.56, "learning_rate": 0.00021614283751662209, "loss": 0.0155, "step": 215670 }, { "epoch": 0.56, "learning_rate": 0.00021613894930025065, "loss": 0.0178, "step": 215680 }, { "epoch": 0.56, "learning_rate": 0.00021613506108387917, "loss": 0.0159, "step": 215690 }, { "epoch": 0.56, "learning_rate": 0.0002161311728675077, "loss": 0.0185, "step": 215700 }, { "epoch": 0.56, "learning_rate": 0.00021612728465113623, "loss": 0.0139, "step": 215710 }, { "epoch": 0.56, "learning_rate": 0.0002161233964347648, "loss": 0.0175, "step": 215720 }, { "epoch": 0.56, "learning_rate": 0.00021611950821839334, "loss": 0.0151, "step": 215730 }, { "epoch": 0.56, "learning_rate": 0.00021611562000202185, "loss": 0.0189, "step": 215740 }, { "epoch": 0.56, "learning_rate": 0.00021611173178565036, "loss": 0.0131, "step": 215750 }, { "epoch": 0.56, "learning_rate": 0.00021610784356927893, "loss": 0.0191, "step": 215760 }, { "epoch": 0.56, "learning_rate": 0.00021610395535290748, "loss": 0.0182, "step": 215770 }, { "epoch": 0.56, "learning_rate": 0.000216100067136536, "loss": 0.0162, "step": 215780 }, { "epoch": 0.56, "learning_rate": 0.00021609617892016453, "loss": 0.0149, "step": 215790 }, { "epoch": 0.56, "learning_rate": 0.00021609229070379307, "loss": 0.0164, "step": 215800 }, { "epoch": 0.56, "learning_rate": 0.00021608840248742161, "loss": 0.0155, "step": 215810 }, { "epoch": 0.56, "learning_rate": 0.00021608451427105013, "loss": 0.0145, "step": 215820 }, { "epoch": 0.56, "learning_rate": 0.00021608062605467867, "loss": 0.0143, "step": 215830 }, { "epoch": 0.56, "learning_rate": 0.0002160767378383072, "loss": 0.0165, "step": 215840 }, { "epoch": 0.56, "learning_rate": 0.00021607284962193575, "loss": 0.0139, "step": 215850 }, { "epoch": 0.56, "learning_rate": 0.00021606896140556427, "loss": 0.0141, "step": 215860 }, { "epoch": 0.56, "learning_rate": 0.0002160650731891928, "loss": 0.0154, "step": 215870 }, { "epoch": 0.56, "learning_rate": 0.00021606118497282132, "loss": 0.0187, "step": 215880 }, { "epoch": 0.56, "learning_rate": 0.0002160572967564499, "loss": 0.0146, "step": 215890 }, { "epoch": 0.56, "learning_rate": 0.0002160534085400784, "loss": 0.0146, "step": 215900 }, { "epoch": 0.56, "learning_rate": 0.00021604952032370695, "loss": 0.0144, "step": 215910 }, { "epoch": 0.56, "learning_rate": 0.00021604563210733546, "loss": 0.0162, "step": 215920 }, { "epoch": 0.56, "learning_rate": 0.00021604174389096403, "loss": 0.0204, "step": 215930 }, { "epoch": 0.56, "learning_rate": 0.00021603785567459257, "loss": 0.0179, "step": 215940 }, { "epoch": 0.56, "learning_rate": 0.0002160339674582211, "loss": 0.0167, "step": 215950 }, { "epoch": 0.56, "learning_rate": 0.00021603007924184963, "loss": 0.0194, "step": 215960 }, { "epoch": 0.56, "learning_rate": 0.00021602619102547817, "loss": 0.0174, "step": 215970 }, { "epoch": 0.56, "learning_rate": 0.00021602230280910671, "loss": 0.022, "step": 215980 }, { "epoch": 0.56, "learning_rate": 0.00021601841459273523, "loss": 0.0158, "step": 215990 }, { "epoch": 0.56, "learning_rate": 0.00021601452637636377, "loss": 0.0189, "step": 216000 }, { "epoch": 0.56, "eval_cer": 0.8817712685329425, "eval_loss": 0.011435981839895248, "eval_runtime": 108.0861, "eval_samples_per_second": 18.504, "eval_steps_per_second": 4.626, "step": 216000 }, { "epoch": 0.56, "learning_rate": 0.0002160106381599923, "loss": 0.0162, "step": 216010 }, { "epoch": 0.56, "learning_rate": 0.00021600674994362085, "loss": 0.0178, "step": 216020 }, { "epoch": 0.56, "learning_rate": 0.00021600286172724937, "loss": 0.0162, "step": 216030 }, { "epoch": 0.56, "learning_rate": 0.0002159989735108779, "loss": 0.0152, "step": 216040 }, { "epoch": 0.56, "learning_rate": 0.00021599508529450645, "loss": 0.016, "step": 216050 }, { "epoch": 0.56, "learning_rate": 0.000215991197078135, "loss": 0.0154, "step": 216060 }, { "epoch": 0.56, "learning_rate": 0.0002159873088617635, "loss": 0.0139, "step": 216070 }, { "epoch": 0.56, "learning_rate": 0.00021598342064539205, "loss": 0.0188, "step": 216080 }, { "epoch": 0.56, "learning_rate": 0.00021597953242902062, "loss": 0.0194, "step": 216090 }, { "epoch": 0.56, "learning_rate": 0.00021597564421264913, "loss": 0.0159, "step": 216100 }, { "epoch": 0.56, "learning_rate": 0.00021597175599627767, "loss": 0.0159, "step": 216110 }, { "epoch": 0.56, "learning_rate": 0.0002159678677799062, "loss": 0.017, "step": 216120 }, { "epoch": 0.56, "learning_rate": 0.00021596397956353473, "loss": 0.0148, "step": 216130 }, { "epoch": 0.56, "learning_rate": 0.00021596009134716327, "loss": 0.0176, "step": 216140 }, { "epoch": 0.56, "learning_rate": 0.0002159562031307918, "loss": 0.0171, "step": 216150 }, { "epoch": 0.56, "learning_rate": 0.00021595231491442033, "loss": 0.0158, "step": 216160 }, { "epoch": 0.56, "learning_rate": 0.00021594842669804887, "loss": 0.0202, "step": 216170 }, { "epoch": 0.56, "learning_rate": 0.0002159445384816774, "loss": 0.0155, "step": 216180 }, { "epoch": 0.56, "learning_rate": 0.00021594065026530595, "loss": 0.0147, "step": 216190 }, { "epoch": 0.56, "learning_rate": 0.00021593676204893447, "loss": 0.0213, "step": 216200 }, { "epoch": 0.56, "learning_rate": 0.000215932873832563, "loss": 0.0169, "step": 216210 }, { "epoch": 0.56, "learning_rate": 0.00021592898561619155, "loss": 0.0203, "step": 216220 }, { "epoch": 0.56, "learning_rate": 0.0002159250973998201, "loss": 0.0192, "step": 216230 }, { "epoch": 0.56, "learning_rate": 0.0002159212091834486, "loss": 0.0175, "step": 216240 }, { "epoch": 0.56, "learning_rate": 0.00021591732096707715, "loss": 0.016, "step": 216250 }, { "epoch": 0.56, "learning_rate": 0.00021591343275070572, "loss": 0.0241, "step": 216260 }, { "epoch": 0.56, "learning_rate": 0.00021590954453433423, "loss": 0.0153, "step": 216270 }, { "epoch": 0.56, "learning_rate": 0.00021590565631796277, "loss": 0.0167, "step": 216280 }, { "epoch": 0.56, "learning_rate": 0.0002159017681015913, "loss": 0.0158, "step": 216290 }, { "epoch": 0.56, "learning_rate": 0.00021589787988521986, "loss": 0.0149, "step": 216300 }, { "epoch": 0.56, "learning_rate": 0.00021589399166884837, "loss": 0.0212, "step": 216310 }, { "epoch": 0.56, "learning_rate": 0.0002158901034524769, "loss": 0.0153, "step": 216320 }, { "epoch": 0.56, "learning_rate": 0.00021588621523610543, "loss": 0.0177, "step": 216330 }, { "epoch": 0.56, "learning_rate": 0.000215882327019734, "loss": 0.0144, "step": 216340 }, { "epoch": 0.56, "learning_rate": 0.0002158784388033625, "loss": 0.0143, "step": 216350 }, { "epoch": 0.56, "learning_rate": 0.00021587455058699105, "loss": 0.021, "step": 216360 }, { "epoch": 0.56, "learning_rate": 0.00021587066237061957, "loss": 0.016, "step": 216370 }, { "epoch": 0.56, "learning_rate": 0.0002158667741542481, "loss": 0.0164, "step": 216380 }, { "epoch": 0.56, "learning_rate": 0.00021586288593787665, "loss": 0.0159, "step": 216390 }, { "epoch": 0.56, "learning_rate": 0.0002158589977215052, "loss": 0.019, "step": 216400 }, { "epoch": 0.56, "learning_rate": 0.0002158551095051337, "loss": 0.0173, "step": 216410 }, { "epoch": 0.56, "learning_rate": 0.00021585122128876225, "loss": 0.0177, "step": 216420 }, { "epoch": 0.56, "learning_rate": 0.00021584733307239082, "loss": 0.0165, "step": 216430 }, { "epoch": 0.56, "learning_rate": 0.00021584344485601933, "loss": 0.0168, "step": 216440 }, { "epoch": 0.56, "learning_rate": 0.00021583955663964787, "loss": 0.0225, "step": 216450 }, { "epoch": 0.56, "learning_rate": 0.0002158356684232764, "loss": 0.0191, "step": 216460 }, { "epoch": 0.56, "learning_rate": 0.00021583178020690496, "loss": 0.02, "step": 216470 }, { "epoch": 0.56, "learning_rate": 0.00021582789199053347, "loss": 0.015, "step": 216480 }, { "epoch": 0.56, "learning_rate": 0.000215824003774162, "loss": 0.0189, "step": 216490 }, { "epoch": 0.56, "learning_rate": 0.00021582011555779053, "loss": 0.0147, "step": 216500 }, { "epoch": 0.56, "learning_rate": 0.0002158162273414191, "loss": 0.0164, "step": 216510 }, { "epoch": 0.56, "learning_rate": 0.0002158123391250476, "loss": 0.0144, "step": 216520 }, { "epoch": 0.56, "learning_rate": 0.00021580845090867615, "loss": 0.0142, "step": 216530 }, { "epoch": 0.56, "learning_rate": 0.00021580456269230467, "loss": 0.0132, "step": 216540 }, { "epoch": 0.56, "learning_rate": 0.00021580067447593323, "loss": 0.0212, "step": 216550 }, { "epoch": 0.56, "learning_rate": 0.00021579678625956175, "loss": 0.0174, "step": 216560 }, { "epoch": 0.56, "learning_rate": 0.0002157928980431903, "loss": 0.0172, "step": 216570 }, { "epoch": 0.56, "learning_rate": 0.0002157890098268188, "loss": 0.0221, "step": 216580 }, { "epoch": 0.56, "learning_rate": 0.00021578512161044737, "loss": 0.0162, "step": 216590 }, { "epoch": 0.56, "learning_rate": 0.00021578123339407592, "loss": 0.016, "step": 216600 }, { "epoch": 0.56, "learning_rate": 0.00021577734517770443, "loss": 0.0289, "step": 216610 }, { "epoch": 0.56, "learning_rate": 0.00021577345696133295, "loss": 0.0193, "step": 216620 }, { "epoch": 0.56, "learning_rate": 0.0002157695687449615, "loss": 0.0157, "step": 216630 }, { "epoch": 0.56, "learning_rate": 0.00021576568052859006, "loss": 0.0191, "step": 216640 }, { "epoch": 0.56, "learning_rate": 0.00021576179231221857, "loss": 0.0185, "step": 216650 }, { "epoch": 0.56, "learning_rate": 0.0002157579040958471, "loss": 0.0271, "step": 216660 }, { "epoch": 0.56, "learning_rate": 0.00021575401587947563, "loss": 0.019, "step": 216670 }, { "epoch": 0.56, "learning_rate": 0.0002157501276631042, "loss": 0.0181, "step": 216680 }, { "epoch": 0.56, "learning_rate": 0.0002157462394467327, "loss": 0.0167, "step": 216690 }, { "epoch": 0.56, "learning_rate": 0.00021574235123036125, "loss": 0.0199, "step": 216700 }, { "epoch": 0.56, "learning_rate": 0.00021573846301398977, "loss": 0.0188, "step": 216710 }, { "epoch": 0.56, "learning_rate": 0.00021573457479761833, "loss": 0.02, "step": 216720 }, { "epoch": 0.56, "learning_rate": 0.00021573068658124685, "loss": 0.0182, "step": 216730 }, { "epoch": 0.56, "learning_rate": 0.0002157267983648754, "loss": 0.0152, "step": 216740 }, { "epoch": 0.56, "learning_rate": 0.0002157229101485039, "loss": 0.0123, "step": 216750 }, { "epoch": 0.56, "learning_rate": 0.00021571902193213247, "loss": 0.0177, "step": 216760 }, { "epoch": 0.56, "learning_rate": 0.000215715133715761, "loss": 0.017, "step": 216770 }, { "epoch": 0.56, "learning_rate": 0.00021571124549938953, "loss": 0.0205, "step": 216780 }, { "epoch": 0.56, "learning_rate": 0.00021570735728301804, "loss": 0.016, "step": 216790 }, { "epoch": 0.56, "learning_rate": 0.0002157034690666466, "loss": 0.0148, "step": 216800 }, { "epoch": 0.56, "learning_rate": 0.00021569958085027515, "loss": 0.0143, "step": 216810 }, { "epoch": 0.56, "learning_rate": 0.00021569569263390367, "loss": 0.0207, "step": 216820 }, { "epoch": 0.56, "learning_rate": 0.0002156918044175322, "loss": 0.0192, "step": 216830 }, { "epoch": 0.56, "learning_rate": 0.00021568791620116075, "loss": 0.0218, "step": 216840 }, { "epoch": 0.56, "learning_rate": 0.0002156840279847893, "loss": 0.0191, "step": 216850 }, { "epoch": 0.56, "learning_rate": 0.0002156801397684178, "loss": 0.0153, "step": 216860 }, { "epoch": 0.56, "learning_rate": 0.00021567625155204635, "loss": 0.0123, "step": 216870 }, { "epoch": 0.56, "learning_rate": 0.00021567236333567487, "loss": 0.0201, "step": 216880 }, { "epoch": 0.56, "learning_rate": 0.00021566847511930343, "loss": 0.0178, "step": 216890 }, { "epoch": 0.56, "learning_rate": 0.00021566458690293195, "loss": 0.0165, "step": 216900 }, { "epoch": 0.56, "learning_rate": 0.0002156606986865605, "loss": 0.0176, "step": 216910 }, { "epoch": 0.56, "learning_rate": 0.000215656810470189, "loss": 0.0151, "step": 216920 }, { "epoch": 0.56, "learning_rate": 0.00021565292225381757, "loss": 0.0121, "step": 216930 }, { "epoch": 0.56, "learning_rate": 0.0002156490340374461, "loss": 0.0157, "step": 216940 }, { "epoch": 0.56, "learning_rate": 0.00021564514582107463, "loss": 0.0154, "step": 216950 }, { "epoch": 0.56, "learning_rate": 0.00021564125760470314, "loss": 0.0197, "step": 216960 }, { "epoch": 0.56, "learning_rate": 0.0002156373693883317, "loss": 0.0195, "step": 216970 }, { "epoch": 0.56, "learning_rate": 0.00021563348117196025, "loss": 0.016, "step": 216980 }, { "epoch": 0.56, "learning_rate": 0.00021562959295558877, "loss": 0.0164, "step": 216990 }, { "epoch": 0.56, "learning_rate": 0.0002156257047392173, "loss": 0.0129, "step": 217000 }, { "epoch": 0.56, "eval_cer": 0.8817432757942589, "eval_loss": 0.011607037857174873, "eval_runtime": 107.7722, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.639, "step": 217000 }, { "epoch": 0.56, "learning_rate": 0.00021562181652284585, "loss": 0.0165, "step": 217010 }, { "epoch": 0.56, "learning_rate": 0.0002156179283064744, "loss": 0.0174, "step": 217020 }, { "epoch": 0.56, "learning_rate": 0.0002156140400901029, "loss": 0.0235, "step": 217030 }, { "epoch": 0.56, "learning_rate": 0.00021561015187373145, "loss": 0.0158, "step": 217040 }, { "epoch": 0.56, "learning_rate": 0.00021560626365736, "loss": 0.0167, "step": 217050 }, { "epoch": 0.56, "learning_rate": 0.00021560237544098853, "loss": 0.017, "step": 217060 }, { "epoch": 0.56, "learning_rate": 0.00021559848722461705, "loss": 0.0194, "step": 217070 }, { "epoch": 0.56, "learning_rate": 0.0002155945990082456, "loss": 0.0157, "step": 217080 }, { "epoch": 0.56, "learning_rate": 0.00021559071079187413, "loss": 0.0183, "step": 217090 }, { "epoch": 0.56, "learning_rate": 0.00021558682257550267, "loss": 0.0169, "step": 217100 }, { "epoch": 0.56, "learning_rate": 0.0002155829343591312, "loss": 0.0164, "step": 217110 }, { "epoch": 0.56, "learning_rate": 0.00021557904614275973, "loss": 0.017, "step": 217120 }, { "epoch": 0.56, "learning_rate": 0.00021557515792638824, "loss": 0.0141, "step": 217130 }, { "epoch": 0.56, "learning_rate": 0.0002155712697100168, "loss": 0.0162, "step": 217140 }, { "epoch": 0.56, "learning_rate": 0.00021556738149364535, "loss": 0.0151, "step": 217150 }, { "epoch": 0.56, "learning_rate": 0.00021556349327727387, "loss": 0.0174, "step": 217160 }, { "epoch": 0.56, "learning_rate": 0.00021555960506090238, "loss": 0.0167, "step": 217170 }, { "epoch": 0.56, "learning_rate": 0.00021555571684453095, "loss": 0.0148, "step": 217180 }, { "epoch": 0.56, "learning_rate": 0.0002155518286281595, "loss": 0.0151, "step": 217190 }, { "epoch": 0.56, "learning_rate": 0.000215547940411788, "loss": 0.0167, "step": 217200 }, { "epoch": 0.56, "learning_rate": 0.00021554405219541655, "loss": 0.0209, "step": 217210 }, { "epoch": 0.56, "learning_rate": 0.0002155401639790451, "loss": 0.0179, "step": 217220 }, { "epoch": 0.56, "learning_rate": 0.00021553627576267363, "loss": 0.018, "step": 217230 }, { "epoch": 0.56, "learning_rate": 0.00021553238754630215, "loss": 0.0174, "step": 217240 }, { "epoch": 0.56, "learning_rate": 0.0002155284993299307, "loss": 0.0145, "step": 217250 }, { "epoch": 0.56, "learning_rate": 0.00021552461111355923, "loss": 0.0149, "step": 217260 }, { "epoch": 0.56, "learning_rate": 0.00021552072289718777, "loss": 0.0172, "step": 217270 }, { "epoch": 0.56, "learning_rate": 0.0002155168346808163, "loss": 0.0215, "step": 217280 }, { "epoch": 0.56, "learning_rate": 0.00021551294646444483, "loss": 0.02, "step": 217290 }, { "epoch": 0.56, "learning_rate": 0.0002155090582480734, "loss": 0.0152, "step": 217300 }, { "epoch": 0.56, "learning_rate": 0.0002155051700317019, "loss": 0.0184, "step": 217310 }, { "epoch": 0.56, "learning_rate": 0.00021550128181533045, "loss": 0.0154, "step": 217320 }, { "epoch": 0.56, "learning_rate": 0.00021549739359895897, "loss": 0.0168, "step": 217330 }, { "epoch": 0.56, "learning_rate": 0.00021549350538258754, "loss": 0.0238, "step": 217340 }, { "epoch": 0.56, "learning_rate": 0.00021548961716621605, "loss": 0.0175, "step": 217350 }, { "epoch": 0.56, "learning_rate": 0.0002154857289498446, "loss": 0.0177, "step": 217360 }, { "epoch": 0.56, "learning_rate": 0.0002154818407334731, "loss": 0.0164, "step": 217370 }, { "epoch": 0.56, "learning_rate": 0.00021547795251710165, "loss": 0.0156, "step": 217380 }, { "epoch": 0.56, "learning_rate": 0.0002154740643007302, "loss": 0.0146, "step": 217390 }, { "epoch": 0.56, "learning_rate": 0.00021547017608435873, "loss": 0.0162, "step": 217400 }, { "epoch": 0.56, "learning_rate": 0.00021546628786798725, "loss": 0.0151, "step": 217410 }, { "epoch": 0.56, "learning_rate": 0.0002154623996516158, "loss": 0.0173, "step": 217420 }, { "epoch": 0.56, "learning_rate": 0.00021545851143524433, "loss": 0.0197, "step": 217430 }, { "epoch": 0.56, "learning_rate": 0.00021545462321887287, "loss": 0.0146, "step": 217440 }, { "epoch": 0.56, "learning_rate": 0.00021545073500250139, "loss": 0.0147, "step": 217450 }, { "epoch": 0.56, "learning_rate": 0.00021544684678612993, "loss": 0.0187, "step": 217460 }, { "epoch": 0.56, "learning_rate": 0.0002154429585697585, "loss": 0.0134, "step": 217470 }, { "epoch": 0.56, "learning_rate": 0.000215439070353387, "loss": 0.0157, "step": 217480 }, { "epoch": 0.56, "learning_rate": 0.00021543518213701553, "loss": 0.0159, "step": 217490 }, { "epoch": 0.56, "learning_rate": 0.00021543129392064407, "loss": 0.0148, "step": 217500 }, { "epoch": 0.56, "learning_rate": 0.00021542740570427264, "loss": 0.0175, "step": 217510 }, { "epoch": 0.56, "learning_rate": 0.00021542351748790115, "loss": 0.0139, "step": 217520 }, { "epoch": 0.56, "learning_rate": 0.0002154196292715297, "loss": 0.0183, "step": 217530 }, { "epoch": 0.56, "learning_rate": 0.0002154157410551582, "loss": 0.02, "step": 217540 }, { "epoch": 0.56, "learning_rate": 0.00021541185283878678, "loss": 0.0161, "step": 217550 }, { "epoch": 0.56, "learning_rate": 0.0002154079646224153, "loss": 0.0159, "step": 217560 }, { "epoch": 0.56, "learning_rate": 0.00021540407640604383, "loss": 0.0162, "step": 217570 }, { "epoch": 0.56, "learning_rate": 0.00021540018818967235, "loss": 0.0136, "step": 217580 }, { "epoch": 0.56, "learning_rate": 0.0002153962999733009, "loss": 0.0209, "step": 217590 }, { "epoch": 0.56, "learning_rate": 0.00021539241175692943, "loss": 0.0162, "step": 217600 }, { "epoch": 0.56, "learning_rate": 0.00021538852354055797, "loss": 0.0188, "step": 217610 }, { "epoch": 0.56, "learning_rate": 0.00021538463532418649, "loss": 0.0204, "step": 217620 }, { "epoch": 0.56, "learning_rate": 0.00021538074710781503, "loss": 0.017, "step": 217630 }, { "epoch": 0.56, "learning_rate": 0.00021537685889144357, "loss": 0.0159, "step": 217640 }, { "epoch": 0.56, "learning_rate": 0.0002153729706750721, "loss": 0.0187, "step": 217650 }, { "epoch": 0.56, "learning_rate": 0.00021536908245870062, "loss": 0.0166, "step": 217660 }, { "epoch": 0.56, "learning_rate": 0.00021536519424232917, "loss": 0.0184, "step": 217670 }, { "epoch": 0.56, "learning_rate": 0.00021536130602595774, "loss": 0.0187, "step": 217680 }, { "epoch": 0.56, "learning_rate": 0.00021535741780958625, "loss": 0.0211, "step": 217690 }, { "epoch": 0.56, "learning_rate": 0.0002153535295932148, "loss": 0.0223, "step": 217700 }, { "epoch": 0.56, "learning_rate": 0.0002153496413768433, "loss": 0.0299, "step": 217710 }, { "epoch": 0.56, "learning_rate": 0.00021534575316047187, "loss": 0.021, "step": 217720 }, { "epoch": 0.56, "learning_rate": 0.0002153418649441004, "loss": 0.0138, "step": 217730 }, { "epoch": 0.56, "learning_rate": 0.00021533797672772893, "loss": 0.0155, "step": 217740 }, { "epoch": 0.56, "learning_rate": 0.00021533408851135745, "loss": 0.0154, "step": 217750 }, { "epoch": 0.56, "learning_rate": 0.00021533020029498601, "loss": 0.0165, "step": 217760 }, { "epoch": 0.56, "learning_rate": 0.00021532631207861453, "loss": 0.0183, "step": 217770 }, { "epoch": 0.56, "learning_rate": 0.00021532242386224307, "loss": 0.0151, "step": 217780 }, { "epoch": 0.56, "learning_rate": 0.00021531853564587158, "loss": 0.0171, "step": 217790 }, { "epoch": 0.56, "learning_rate": 0.00021531464742950015, "loss": 0.0183, "step": 217800 }, { "epoch": 0.56, "learning_rate": 0.00021531075921312867, "loss": 0.0176, "step": 217810 }, { "epoch": 0.56, "learning_rate": 0.0002153068709967572, "loss": 0.0161, "step": 217820 }, { "epoch": 0.56, "learning_rate": 0.00021530298278038572, "loss": 0.014, "step": 217830 }, { "epoch": 0.56, "learning_rate": 0.00021529909456401427, "loss": 0.0134, "step": 217840 }, { "epoch": 0.56, "learning_rate": 0.00021529520634764283, "loss": 0.0169, "step": 217850 }, { "epoch": 0.56, "learning_rate": 0.00021529131813127135, "loss": 0.0183, "step": 217860 }, { "epoch": 0.56, "learning_rate": 0.0002152874299148999, "loss": 0.0251, "step": 217870 }, { "epoch": 0.56, "learning_rate": 0.0002152835416985284, "loss": 0.0201, "step": 217880 }, { "epoch": 0.56, "learning_rate": 0.00021527965348215697, "loss": 0.0177, "step": 217890 }, { "epoch": 0.56, "learning_rate": 0.0002152757652657855, "loss": 0.0168, "step": 217900 }, { "epoch": 0.56, "learning_rate": 0.00021527187704941403, "loss": 0.0141, "step": 217910 }, { "epoch": 0.56, "learning_rate": 0.00021526798883304254, "loss": 0.0157, "step": 217920 }, { "epoch": 0.56, "learning_rate": 0.00021526410061667111, "loss": 0.0162, "step": 217930 }, { "epoch": 0.56, "learning_rate": 0.00021526021240029963, "loss": 0.0155, "step": 217940 }, { "epoch": 0.56, "learning_rate": 0.00021525632418392817, "loss": 0.0151, "step": 217950 }, { "epoch": 0.56, "learning_rate": 0.00021525243596755668, "loss": 0.0183, "step": 217960 }, { "epoch": 0.57, "learning_rate": 0.00021524854775118525, "loss": 0.0192, "step": 217970 }, { "epoch": 0.57, "learning_rate": 0.00021524465953481377, "loss": 0.0186, "step": 217980 }, { "epoch": 0.57, "learning_rate": 0.0002152407713184423, "loss": 0.017, "step": 217990 }, { "epoch": 0.57, "learning_rate": 0.00021523688310207082, "loss": 0.0165, "step": 218000 }, { "epoch": 0.57, "eval_cer": 0.8817376772465223, "eval_loss": 0.011108589358627796, "eval_runtime": 107.5987, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 218000 }, { "epoch": 0.57, "learning_rate": 0.0002152329948856994, "loss": 0.0141, "step": 218010 }, { "epoch": 0.57, "learning_rate": 0.00021522910666932793, "loss": 0.0193, "step": 218020 }, { "epoch": 0.57, "learning_rate": 0.00021522521845295645, "loss": 0.0171, "step": 218030 }, { "epoch": 0.57, "learning_rate": 0.000215221330236585, "loss": 0.0147, "step": 218040 }, { "epoch": 0.57, "learning_rate": 0.00021521744202021353, "loss": 0.0178, "step": 218050 }, { "epoch": 0.57, "learning_rate": 0.00021521355380384207, "loss": 0.0191, "step": 218060 }, { "epoch": 0.57, "learning_rate": 0.0002152096655874706, "loss": 0.0162, "step": 218070 }, { "epoch": 0.57, "learning_rate": 0.00021520577737109913, "loss": 0.0183, "step": 218080 }, { "epoch": 0.57, "learning_rate": 0.00021520188915472764, "loss": 0.0162, "step": 218090 }, { "epoch": 0.57, "learning_rate": 0.0002151980009383562, "loss": 0.0168, "step": 218100 }, { "epoch": 0.57, "learning_rate": 0.00021519411272198473, "loss": 0.0159, "step": 218110 }, { "epoch": 0.57, "learning_rate": 0.00021519022450561327, "loss": 0.0161, "step": 218120 }, { "epoch": 0.57, "learning_rate": 0.00021518633628924178, "loss": 0.0159, "step": 218130 }, { "epoch": 0.57, "learning_rate": 0.00021518244807287035, "loss": 0.0128, "step": 218140 }, { "epoch": 0.57, "learning_rate": 0.00021517855985649887, "loss": 0.0141, "step": 218150 }, { "epoch": 0.57, "learning_rate": 0.0002151746716401274, "loss": 0.0129, "step": 218160 }, { "epoch": 0.57, "learning_rate": 0.00021517078342375592, "loss": 0.0138, "step": 218170 }, { "epoch": 0.57, "learning_rate": 0.0002151668952073845, "loss": 0.0182, "step": 218180 }, { "epoch": 0.57, "learning_rate": 0.00021516300699101303, "loss": 0.0135, "step": 218190 }, { "epoch": 0.57, "learning_rate": 0.00021515911877464155, "loss": 0.019, "step": 218200 }, { "epoch": 0.57, "learning_rate": 0.00021515523055827006, "loss": 0.0143, "step": 218210 }, { "epoch": 0.57, "learning_rate": 0.00021515134234189863, "loss": 0.02, "step": 218220 }, { "epoch": 0.57, "learning_rate": 0.00021514745412552717, "loss": 0.0185, "step": 218230 }, { "epoch": 0.57, "learning_rate": 0.0002151435659091557, "loss": 0.0191, "step": 218240 }, { "epoch": 0.57, "learning_rate": 0.00021513967769278423, "loss": 0.0146, "step": 218250 }, { "epoch": 0.57, "learning_rate": 0.00021513578947641277, "loss": 0.0168, "step": 218260 }, { "epoch": 0.57, "learning_rate": 0.0002151319012600413, "loss": 0.0172, "step": 218270 }, { "epoch": 0.57, "learning_rate": 0.00021512801304366983, "loss": 0.0158, "step": 218280 }, { "epoch": 0.57, "learning_rate": 0.00021512412482729837, "loss": 0.0167, "step": 218290 }, { "epoch": 0.57, "learning_rate": 0.0002151202366109269, "loss": 0.0159, "step": 218300 }, { "epoch": 0.57, "learning_rate": 0.00021511634839455545, "loss": 0.0157, "step": 218310 }, { "epoch": 0.57, "learning_rate": 0.00021511246017818397, "loss": 0.0123, "step": 218320 }, { "epoch": 0.57, "learning_rate": 0.0002151085719618125, "loss": 0.0163, "step": 218330 }, { "epoch": 0.57, "learning_rate": 0.00021510468374544102, "loss": 0.0146, "step": 218340 }, { "epoch": 0.57, "learning_rate": 0.0002151007955290696, "loss": 0.0212, "step": 218350 }, { "epoch": 0.57, "learning_rate": 0.0002150969073126981, "loss": 0.0174, "step": 218360 }, { "epoch": 0.57, "learning_rate": 0.00021509301909632665, "loss": 0.0143, "step": 218370 }, { "epoch": 0.57, "learning_rate": 0.00021508913087995516, "loss": 0.0175, "step": 218380 }, { "epoch": 0.57, "learning_rate": 0.00021508524266358373, "loss": 0.017, "step": 218390 }, { "epoch": 0.57, "learning_rate": 0.00021508135444721227, "loss": 0.013, "step": 218400 }, { "epoch": 0.57, "learning_rate": 0.0002150774662308408, "loss": 0.0179, "step": 218410 }, { "epoch": 0.57, "learning_rate": 0.00021507357801446933, "loss": 0.0142, "step": 218420 }, { "epoch": 0.57, "learning_rate": 0.00021506968979809787, "loss": 0.0175, "step": 218430 }, { "epoch": 0.57, "learning_rate": 0.0002150658015817264, "loss": 0.0183, "step": 218440 }, { "epoch": 0.57, "learning_rate": 0.00021506191336535493, "loss": 0.0201, "step": 218450 }, { "epoch": 0.57, "learning_rate": 0.00021505802514898347, "loss": 0.0169, "step": 218460 }, { "epoch": 0.57, "learning_rate": 0.000215054136932612, "loss": 0.0195, "step": 218470 }, { "epoch": 0.57, "learning_rate": 0.00021505024871624055, "loss": 0.015, "step": 218480 }, { "epoch": 0.57, "learning_rate": 0.00021504636049986907, "loss": 0.0174, "step": 218490 }, { "epoch": 0.57, "learning_rate": 0.0002150424722834976, "loss": 0.022, "step": 218500 }, { "epoch": 0.57, "learning_rate": 0.00021503858406712618, "loss": 0.0162, "step": 218510 }, { "epoch": 0.57, "learning_rate": 0.0002150346958507547, "loss": 0.0161, "step": 218520 }, { "epoch": 0.57, "learning_rate": 0.0002150308076343832, "loss": 0.0162, "step": 218530 }, { "epoch": 0.57, "learning_rate": 0.00021502691941801175, "loss": 0.0142, "step": 218540 }, { "epoch": 0.57, "learning_rate": 0.00021502303120164032, "loss": 0.0183, "step": 218550 }, { "epoch": 0.57, "learning_rate": 0.00021501914298526883, "loss": 0.02, "step": 218560 }, { "epoch": 0.57, "learning_rate": 0.00021501525476889737, "loss": 0.0216, "step": 218570 }, { "epoch": 0.57, "learning_rate": 0.00021501136655252589, "loss": 0.0168, "step": 218580 }, { "epoch": 0.57, "learning_rate": 0.00021500747833615443, "loss": 0.0164, "step": 218590 }, { "epoch": 0.57, "learning_rate": 0.00021500359011978297, "loss": 0.0165, "step": 218600 }, { "epoch": 0.57, "learning_rate": 0.0002149997019034115, "loss": 0.0116, "step": 218610 }, { "epoch": 0.57, "learning_rate": 0.00021499581368704003, "loss": 0.0143, "step": 218620 }, { "epoch": 0.57, "learning_rate": 0.00021499192547066857, "loss": 0.0192, "step": 218630 }, { "epoch": 0.57, "learning_rate": 0.0002149880372542971, "loss": 0.0201, "step": 218640 }, { "epoch": 0.57, "learning_rate": 0.00021498414903792565, "loss": 0.0153, "step": 218650 }, { "epoch": 0.57, "learning_rate": 0.00021498026082155417, "loss": 0.0197, "step": 218660 }, { "epoch": 0.57, "learning_rate": 0.0002149763726051827, "loss": 0.017, "step": 218670 }, { "epoch": 0.57, "learning_rate": 0.00021497248438881125, "loss": 0.0166, "step": 218680 }, { "epoch": 0.57, "learning_rate": 0.0002149685961724398, "loss": 0.0217, "step": 218690 }, { "epoch": 0.57, "learning_rate": 0.0002149647079560683, "loss": 0.0192, "step": 218700 }, { "epoch": 0.57, "learning_rate": 0.00021496081973969685, "loss": 0.0217, "step": 218710 }, { "epoch": 0.57, "learning_rate": 0.00021495693152332542, "loss": 0.0168, "step": 218720 }, { "epoch": 0.57, "learning_rate": 0.00021495304330695393, "loss": 0.0155, "step": 218730 }, { "epoch": 0.57, "learning_rate": 0.00021494915509058247, "loss": 0.0147, "step": 218740 }, { "epoch": 0.57, "learning_rate": 0.00021494526687421099, "loss": 0.0182, "step": 218750 }, { "epoch": 0.57, "learning_rate": 0.00021494137865783955, "loss": 0.0183, "step": 218760 }, { "epoch": 0.57, "learning_rate": 0.00021493749044146807, "loss": 0.0177, "step": 218770 }, { "epoch": 0.57, "learning_rate": 0.0002149336022250966, "loss": 0.0176, "step": 218780 }, { "epoch": 0.57, "learning_rate": 0.00021492971400872513, "loss": 0.0195, "step": 218790 }, { "epoch": 0.57, "learning_rate": 0.0002149258257923537, "loss": 0.0147, "step": 218800 }, { "epoch": 0.57, "learning_rate": 0.0002149219375759822, "loss": 0.0178, "step": 218810 }, { "epoch": 0.57, "learning_rate": 0.00021491804935961075, "loss": 0.0161, "step": 218820 }, { "epoch": 0.57, "learning_rate": 0.00021491416114323926, "loss": 0.0165, "step": 218830 }, { "epoch": 0.57, "learning_rate": 0.0002149102729268678, "loss": 0.0242, "step": 218840 }, { "epoch": 0.57, "learning_rate": 0.00021490638471049635, "loss": 0.0185, "step": 218850 }, { "epoch": 0.57, "learning_rate": 0.0002149024964941249, "loss": 0.0172, "step": 218860 }, { "epoch": 0.57, "learning_rate": 0.0002148986082777534, "loss": 0.0164, "step": 218870 }, { "epoch": 0.57, "learning_rate": 0.00021489472006138195, "loss": 0.0172, "step": 218880 }, { "epoch": 0.57, "learning_rate": 0.00021489083184501051, "loss": 0.0194, "step": 218890 }, { "epoch": 0.57, "learning_rate": 0.00021488694362863903, "loss": 0.0205, "step": 218900 }, { "epoch": 0.57, "learning_rate": 0.00021488305541226757, "loss": 0.0191, "step": 218910 }, { "epoch": 0.57, "learning_rate": 0.00021487916719589609, "loss": 0.0147, "step": 218920 }, { "epoch": 0.57, "learning_rate": 0.00021487527897952465, "loss": 0.0144, "step": 218930 }, { "epoch": 0.57, "learning_rate": 0.00021487139076315317, "loss": 0.0179, "step": 218940 }, { "epoch": 0.57, "learning_rate": 0.0002148675025467817, "loss": 0.018, "step": 218950 }, { "epoch": 0.57, "learning_rate": 0.00021486361433041022, "loss": 0.0157, "step": 218960 }, { "epoch": 0.57, "learning_rate": 0.0002148597261140388, "loss": 0.0165, "step": 218970 }, { "epoch": 0.57, "learning_rate": 0.0002148558378976673, "loss": 0.0161, "step": 218980 }, { "epoch": 0.57, "learning_rate": 0.00021485194968129585, "loss": 0.0162, "step": 218990 }, { "epoch": 0.57, "learning_rate": 0.00021484806146492436, "loss": 0.019, "step": 219000 }, { "epoch": 0.57, "eval_cer": 0.8817684692590742, "eval_loss": 0.011217095889151096, "eval_runtime": 107.9572, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.631, "step": 219000 }, { "epoch": 0.57, "learning_rate": 0.00021484417324855293, "loss": 0.0152, "step": 219010 }, { "epoch": 0.57, "learning_rate": 0.00021484028503218145, "loss": 0.0155, "step": 219020 }, { "epoch": 0.57, "learning_rate": 0.00021483639681581, "loss": 0.0171, "step": 219030 }, { "epoch": 0.57, "learning_rate": 0.0002148325085994385, "loss": 0.0151, "step": 219040 }, { "epoch": 0.57, "learning_rate": 0.00021482862038306707, "loss": 0.0145, "step": 219050 }, { "epoch": 0.57, "learning_rate": 0.00021482473216669561, "loss": 0.0152, "step": 219060 }, { "epoch": 0.57, "learning_rate": 0.00021482084395032413, "loss": 0.0168, "step": 219070 }, { "epoch": 0.57, "learning_rate": 0.00021481695573395264, "loss": 0.0165, "step": 219080 }, { "epoch": 0.57, "learning_rate": 0.00021481306751758118, "loss": 0.0169, "step": 219090 }, { "epoch": 0.57, "learning_rate": 0.00021480917930120975, "loss": 0.0129, "step": 219100 }, { "epoch": 0.57, "learning_rate": 0.00021480529108483827, "loss": 0.0174, "step": 219110 }, { "epoch": 0.57, "learning_rate": 0.0002148014028684668, "loss": 0.0184, "step": 219120 }, { "epoch": 0.57, "learning_rate": 0.00021479751465209532, "loss": 0.0156, "step": 219130 }, { "epoch": 0.57, "learning_rate": 0.0002147936264357239, "loss": 0.0159, "step": 219140 }, { "epoch": 0.57, "learning_rate": 0.0002147897382193524, "loss": 0.0157, "step": 219150 }, { "epoch": 0.57, "learning_rate": 0.00021478585000298095, "loss": 0.0145, "step": 219160 }, { "epoch": 0.57, "learning_rate": 0.00021478196178660946, "loss": 0.0112, "step": 219170 }, { "epoch": 0.57, "learning_rate": 0.00021477807357023803, "loss": 0.0163, "step": 219180 }, { "epoch": 0.57, "learning_rate": 0.00021477418535386655, "loss": 0.0149, "step": 219190 }, { "epoch": 0.57, "learning_rate": 0.0002147702971374951, "loss": 0.0162, "step": 219200 }, { "epoch": 0.57, "learning_rate": 0.0002147664089211236, "loss": 0.0204, "step": 219210 }, { "epoch": 0.57, "learning_rate": 0.00021476252070475217, "loss": 0.0149, "step": 219220 }, { "epoch": 0.57, "learning_rate": 0.00021475863248838069, "loss": 0.0153, "step": 219230 }, { "epoch": 0.57, "learning_rate": 0.00021475474427200923, "loss": 0.0174, "step": 219240 }, { "epoch": 0.57, "learning_rate": 0.00021475085605563774, "loss": 0.0177, "step": 219250 }, { "epoch": 0.57, "learning_rate": 0.0002147469678392663, "loss": 0.0176, "step": 219260 }, { "epoch": 0.57, "learning_rate": 0.00021474307962289485, "loss": 0.016, "step": 219270 }, { "epoch": 0.57, "learning_rate": 0.00021473919140652337, "loss": 0.0185, "step": 219280 }, { "epoch": 0.57, "learning_rate": 0.0002147353031901519, "loss": 0.0129, "step": 219290 }, { "epoch": 0.57, "learning_rate": 0.00021473141497378045, "loss": 0.0181, "step": 219300 }, { "epoch": 0.57, "learning_rate": 0.000214727526757409, "loss": 0.0162, "step": 219310 }, { "epoch": 0.57, "learning_rate": 0.0002147236385410375, "loss": 0.0182, "step": 219320 }, { "epoch": 0.57, "learning_rate": 0.00021471975032466605, "loss": 0.0168, "step": 219330 }, { "epoch": 0.57, "learning_rate": 0.00021471586210829456, "loss": 0.0185, "step": 219340 }, { "epoch": 0.57, "learning_rate": 0.00021471197389192313, "loss": 0.0162, "step": 219350 }, { "epoch": 0.57, "learning_rate": 0.00021470808567555165, "loss": 0.0164, "step": 219360 }, { "epoch": 0.57, "learning_rate": 0.0002147041974591802, "loss": 0.016, "step": 219370 }, { "epoch": 0.57, "learning_rate": 0.0002147003092428087, "loss": 0.0169, "step": 219380 }, { "epoch": 0.57, "learning_rate": 0.00021469642102643727, "loss": 0.0171, "step": 219390 }, { "epoch": 0.57, "learning_rate": 0.00021469253281006579, "loss": 0.0209, "step": 219400 }, { "epoch": 0.57, "learning_rate": 0.00021468864459369433, "loss": 0.0215, "step": 219410 }, { "epoch": 0.57, "learning_rate": 0.00021468475637732284, "loss": 0.0136, "step": 219420 }, { "epoch": 0.57, "learning_rate": 0.0002146808681609514, "loss": 0.0143, "step": 219430 }, { "epoch": 0.57, "learning_rate": 0.00021467697994457995, "loss": 0.0159, "step": 219440 }, { "epoch": 0.57, "learning_rate": 0.00021467309172820847, "loss": 0.0164, "step": 219450 }, { "epoch": 0.57, "learning_rate": 0.000214669203511837, "loss": 0.0134, "step": 219460 }, { "epoch": 0.57, "learning_rate": 0.00021466531529546555, "loss": 0.0172, "step": 219470 }, { "epoch": 0.57, "learning_rate": 0.0002146614270790941, "loss": 0.0196, "step": 219480 }, { "epoch": 0.57, "learning_rate": 0.0002146575388627226, "loss": 0.0168, "step": 219490 }, { "epoch": 0.57, "learning_rate": 0.00021465365064635115, "loss": 0.0168, "step": 219500 }, { "epoch": 0.57, "learning_rate": 0.0002146497624299797, "loss": 0.0172, "step": 219510 }, { "epoch": 0.57, "learning_rate": 0.00021464587421360823, "loss": 0.0215, "step": 219520 }, { "epoch": 0.57, "learning_rate": 0.00021464198599723675, "loss": 0.0189, "step": 219530 }, { "epoch": 0.57, "learning_rate": 0.0002146380977808653, "loss": 0.0185, "step": 219540 }, { "epoch": 0.57, "learning_rate": 0.00021463420956449383, "loss": 0.0155, "step": 219550 }, { "epoch": 0.57, "learning_rate": 0.00021463032134812237, "loss": 0.0189, "step": 219560 }, { "epoch": 0.57, "learning_rate": 0.00021462643313175089, "loss": 0.0193, "step": 219570 }, { "epoch": 0.57, "learning_rate": 0.00021462254491537943, "loss": 0.0165, "step": 219580 }, { "epoch": 0.57, "learning_rate": 0.00021461865669900794, "loss": 0.0168, "step": 219590 }, { "epoch": 0.57, "learning_rate": 0.0002146147684826365, "loss": 0.0152, "step": 219600 }, { "epoch": 0.57, "learning_rate": 0.00021461088026626505, "loss": 0.0158, "step": 219610 }, { "epoch": 0.57, "learning_rate": 0.00021460699204989357, "loss": 0.0169, "step": 219620 }, { "epoch": 0.57, "learning_rate": 0.0002146031038335221, "loss": 0.0152, "step": 219630 }, { "epoch": 0.57, "learning_rate": 0.00021459921561715065, "loss": 0.0156, "step": 219640 }, { "epoch": 0.57, "learning_rate": 0.0002145953274007792, "loss": 0.0156, "step": 219650 }, { "epoch": 0.57, "learning_rate": 0.0002145914391844077, "loss": 0.0188, "step": 219660 }, { "epoch": 0.57, "learning_rate": 0.00021458755096803625, "loss": 0.0211, "step": 219670 }, { "epoch": 0.57, "learning_rate": 0.0002145836627516648, "loss": 0.0168, "step": 219680 }, { "epoch": 0.57, "learning_rate": 0.00021457977453529333, "loss": 0.0209, "step": 219690 }, { "epoch": 0.57, "learning_rate": 0.00021457588631892185, "loss": 0.0131, "step": 219700 }, { "epoch": 0.57, "learning_rate": 0.0002145719981025504, "loss": 0.0164, "step": 219710 }, { "epoch": 0.57, "learning_rate": 0.00021456810988617893, "loss": 0.0163, "step": 219720 }, { "epoch": 0.57, "learning_rate": 0.00021456422166980747, "loss": 0.0142, "step": 219730 }, { "epoch": 0.57, "learning_rate": 0.00021456033345343598, "loss": 0.0177, "step": 219740 }, { "epoch": 0.57, "learning_rate": 0.00021455644523706453, "loss": 0.0147, "step": 219750 }, { "epoch": 0.57, "learning_rate": 0.0002145525570206931, "loss": 0.0148, "step": 219760 }, { "epoch": 0.57, "learning_rate": 0.0002145486688043216, "loss": 0.0139, "step": 219770 }, { "epoch": 0.57, "learning_rate": 0.00021454478058795015, "loss": 0.0129, "step": 219780 }, { "epoch": 0.57, "learning_rate": 0.00021454089237157867, "loss": 0.018, "step": 219790 }, { "epoch": 0.57, "learning_rate": 0.00021453700415520723, "loss": 0.0174, "step": 219800 }, { "epoch": 0.57, "learning_rate": 0.00021453311593883575, "loss": 0.0172, "step": 219810 }, { "epoch": 0.57, "learning_rate": 0.0002145292277224643, "loss": 0.0167, "step": 219820 }, { "epoch": 0.57, "learning_rate": 0.0002145253395060928, "loss": 0.0183, "step": 219830 }, { "epoch": 0.57, "learning_rate": 0.00021452145128972135, "loss": 0.0179, "step": 219840 }, { "epoch": 0.57, "learning_rate": 0.0002145175630733499, "loss": 0.0148, "step": 219850 }, { "epoch": 0.57, "learning_rate": 0.00021451367485697843, "loss": 0.0166, "step": 219860 }, { "epoch": 0.57, "learning_rate": 0.00021450978664060694, "loss": 0.0178, "step": 219870 }, { "epoch": 0.57, "learning_rate": 0.00021450589842423549, "loss": 0.0177, "step": 219880 }, { "epoch": 0.57, "learning_rate": 0.00021450201020786403, "loss": 0.0195, "step": 219890 }, { "epoch": 0.57, "learning_rate": 0.00021449812199149257, "loss": 0.0133, "step": 219900 }, { "epoch": 0.57, "learning_rate": 0.00021449423377512108, "loss": 0.015, "step": 219910 }, { "epoch": 0.57, "learning_rate": 0.00021449034555874963, "loss": 0.0169, "step": 219920 }, { "epoch": 0.57, "learning_rate": 0.0002144864573423782, "loss": 0.0139, "step": 219930 }, { "epoch": 0.57, "learning_rate": 0.0002144825691260067, "loss": 0.0149, "step": 219940 }, { "epoch": 0.57, "learning_rate": 0.00021447868090963522, "loss": 0.0141, "step": 219950 }, { "epoch": 0.57, "learning_rate": 0.00021447479269326377, "loss": 0.0193, "step": 219960 }, { "epoch": 0.57, "learning_rate": 0.00021447090447689233, "loss": 0.0144, "step": 219970 }, { "epoch": 0.57, "learning_rate": 0.00021446701626052085, "loss": 0.0131, "step": 219980 }, { "epoch": 0.57, "learning_rate": 0.0002144631280441494, "loss": 0.0141, "step": 219990 }, { "epoch": 0.57, "learning_rate": 0.0002144592398277779, "loss": 0.0245, "step": 220000 }, { "epoch": 0.57, "eval_cer": 0.8817306790618513, "eval_loss": 0.011034357361495495, "eval_runtime": 107.3096, "eval_samples_per_second": 18.638, "eval_steps_per_second": 4.659, "step": 220000 }, { "epoch": 0.57, "learning_rate": 0.00021445535161140647, "loss": 0.0137, "step": 220010 }, { "epoch": 0.57, "learning_rate": 0.000214451463395035, "loss": 0.0172, "step": 220020 }, { "epoch": 0.57, "learning_rate": 0.00021444757517866353, "loss": 0.0136, "step": 220030 }, { "epoch": 0.57, "learning_rate": 0.00021444368696229204, "loss": 0.016, "step": 220040 }, { "epoch": 0.57, "learning_rate": 0.0002144397987459206, "loss": 0.0216, "step": 220050 }, { "epoch": 0.57, "learning_rate": 0.00021443591052954913, "loss": 0.0157, "step": 220060 }, { "epoch": 0.57, "learning_rate": 0.00021443202231317767, "loss": 0.0204, "step": 220070 }, { "epoch": 0.57, "learning_rate": 0.00021442813409680618, "loss": 0.0219, "step": 220080 }, { "epoch": 0.57, "learning_rate": 0.00021442424588043472, "loss": 0.0156, "step": 220090 }, { "epoch": 0.57, "learning_rate": 0.0002144203576640633, "loss": 0.0173, "step": 220100 }, { "epoch": 0.57, "learning_rate": 0.0002144164694476918, "loss": 0.0164, "step": 220110 }, { "epoch": 0.57, "learning_rate": 0.00021441258123132032, "loss": 0.0168, "step": 220120 }, { "epoch": 0.57, "learning_rate": 0.00021440869301494886, "loss": 0.0161, "step": 220130 }, { "epoch": 0.57, "learning_rate": 0.00021440480479857743, "loss": 0.0172, "step": 220140 }, { "epoch": 0.57, "learning_rate": 0.00021440091658220595, "loss": 0.0172, "step": 220150 }, { "epoch": 0.57, "learning_rate": 0.0002143970283658345, "loss": 0.0171, "step": 220160 }, { "epoch": 0.57, "learning_rate": 0.000214393140149463, "loss": 0.0181, "step": 220170 }, { "epoch": 0.57, "learning_rate": 0.00021438925193309157, "loss": 0.0153, "step": 220180 }, { "epoch": 0.57, "learning_rate": 0.0002143853637167201, "loss": 0.015, "step": 220190 }, { "epoch": 0.57, "learning_rate": 0.00021438147550034863, "loss": 0.0249, "step": 220200 }, { "epoch": 0.57, "learning_rate": 0.00021437758728397714, "loss": 0.0227, "step": 220210 }, { "epoch": 0.57, "learning_rate": 0.0002143736990676057, "loss": 0.0157, "step": 220220 }, { "epoch": 0.57, "learning_rate": 0.00021436981085123423, "loss": 0.0156, "step": 220230 }, { "epoch": 0.57, "learning_rate": 0.00021436592263486277, "loss": 0.0168, "step": 220240 }, { "epoch": 0.57, "learning_rate": 0.00021436203441849128, "loss": 0.0148, "step": 220250 }, { "epoch": 0.57, "learning_rate": 0.00021435814620211985, "loss": 0.0157, "step": 220260 }, { "epoch": 0.57, "learning_rate": 0.00021435425798574837, "loss": 0.0154, "step": 220270 }, { "epoch": 0.57, "learning_rate": 0.0002143503697693769, "loss": 0.0131, "step": 220280 }, { "epoch": 0.57, "learning_rate": 0.00021434648155300542, "loss": 0.0184, "step": 220290 }, { "epoch": 0.57, "learning_rate": 0.000214342593336634, "loss": 0.0134, "step": 220300 }, { "epoch": 0.57, "learning_rate": 0.00021433870512026253, "loss": 0.0173, "step": 220310 }, { "epoch": 0.57, "learning_rate": 0.00021433481690389105, "loss": 0.0188, "step": 220320 }, { "epoch": 0.57, "learning_rate": 0.0002143309286875196, "loss": 0.0158, "step": 220330 }, { "epoch": 0.57, "learning_rate": 0.0002143270404711481, "loss": 0.0179, "step": 220340 }, { "epoch": 0.57, "learning_rate": 0.00021432315225477667, "loss": 0.0183, "step": 220350 }, { "epoch": 0.57, "learning_rate": 0.0002143192640384052, "loss": 0.0163, "step": 220360 }, { "epoch": 0.57, "learning_rate": 0.00021431537582203373, "loss": 0.0139, "step": 220370 }, { "epoch": 0.57, "learning_rate": 0.00021431148760566224, "loss": 0.0144, "step": 220380 }, { "epoch": 0.57, "learning_rate": 0.0002143075993892908, "loss": 0.0169, "step": 220390 }, { "epoch": 0.57, "learning_rate": 0.00021430371117291933, "loss": 0.0136, "step": 220400 }, { "epoch": 0.57, "learning_rate": 0.00021429982295654787, "loss": 0.0167, "step": 220410 }, { "epoch": 0.57, "learning_rate": 0.00021429593474017638, "loss": 0.0161, "step": 220420 }, { "epoch": 0.57, "learning_rate": 0.00021429204652380495, "loss": 0.0161, "step": 220430 }, { "epoch": 0.57, "learning_rate": 0.00021428815830743347, "loss": 0.0182, "step": 220440 }, { "epoch": 0.57, "learning_rate": 0.000214284270091062, "loss": 0.0182, "step": 220450 }, { "epoch": 0.57, "learning_rate": 0.00021428038187469052, "loss": 0.0187, "step": 220460 }, { "epoch": 0.57, "learning_rate": 0.0002142764936583191, "loss": 0.0166, "step": 220470 }, { "epoch": 0.57, "learning_rate": 0.00021427260544194763, "loss": 0.0157, "step": 220480 }, { "epoch": 0.57, "learning_rate": 0.00021426871722557615, "loss": 0.0129, "step": 220490 }, { "epoch": 0.57, "learning_rate": 0.0002142648290092047, "loss": 0.0188, "step": 220500 }, { "epoch": 0.57, "learning_rate": 0.00021426094079283323, "loss": 0.0157, "step": 220510 }, { "epoch": 0.57, "learning_rate": 0.00021425705257646177, "loss": 0.0135, "step": 220520 }, { "epoch": 0.57, "learning_rate": 0.00021425316436009029, "loss": 0.0304, "step": 220530 }, { "epoch": 0.57, "learning_rate": 0.00021424927614371883, "loss": 0.0189, "step": 220540 }, { "epoch": 0.57, "learning_rate": 0.00021424538792734737, "loss": 0.0166, "step": 220550 }, { "epoch": 0.57, "learning_rate": 0.0002142414997109759, "loss": 0.015, "step": 220560 }, { "epoch": 0.57, "learning_rate": 0.00021423761149460443, "loss": 0.0194, "step": 220570 }, { "epoch": 0.57, "learning_rate": 0.00021423372327823297, "loss": 0.0166, "step": 220580 }, { "epoch": 0.57, "learning_rate": 0.00021422983506186148, "loss": 0.0187, "step": 220590 }, { "epoch": 0.57, "learning_rate": 0.00021422594684549005, "loss": 0.0162, "step": 220600 }, { "epoch": 0.57, "learning_rate": 0.00021422205862911856, "loss": 0.0156, "step": 220610 }, { "epoch": 0.57, "learning_rate": 0.0002142181704127471, "loss": 0.0201, "step": 220620 }, { "epoch": 0.57, "learning_rate": 0.00021421428219637562, "loss": 0.0156, "step": 220630 }, { "epoch": 0.57, "learning_rate": 0.0002142103939800042, "loss": 0.0161, "step": 220640 }, { "epoch": 0.57, "learning_rate": 0.00021420650576363273, "loss": 0.0183, "step": 220650 }, { "epoch": 0.57, "learning_rate": 0.00021420261754726125, "loss": 0.0186, "step": 220660 }, { "epoch": 0.57, "learning_rate": 0.00021419872933088976, "loss": 0.0219, "step": 220670 }, { "epoch": 0.57, "learning_rate": 0.00021419484111451833, "loss": 0.0147, "step": 220680 }, { "epoch": 0.57, "learning_rate": 0.00021419095289814687, "loss": 0.0179, "step": 220690 }, { "epoch": 0.57, "learning_rate": 0.00021418706468177539, "loss": 0.0204, "step": 220700 }, { "epoch": 0.57, "learning_rate": 0.00021418317646540393, "loss": 0.0188, "step": 220710 }, { "epoch": 0.57, "learning_rate": 0.00021417928824903247, "loss": 0.018, "step": 220720 }, { "epoch": 0.57, "learning_rate": 0.000214175400032661, "loss": 0.019, "step": 220730 }, { "epoch": 0.57, "learning_rate": 0.00021417151181628952, "loss": 0.0176, "step": 220740 }, { "epoch": 0.57, "learning_rate": 0.00021416762359991807, "loss": 0.0158, "step": 220750 }, { "epoch": 0.57, "learning_rate": 0.0002141637353835466, "loss": 0.0175, "step": 220760 }, { "epoch": 0.57, "learning_rate": 0.00021415984716717515, "loss": 0.0188, "step": 220770 }, { "epoch": 0.57, "learning_rate": 0.00021415595895080366, "loss": 0.0165, "step": 220780 }, { "epoch": 0.57, "learning_rate": 0.0002141520707344322, "loss": 0.0158, "step": 220790 }, { "epoch": 0.57, "learning_rate": 0.00021414818251806077, "loss": 0.0175, "step": 220800 }, { "epoch": 0.57, "learning_rate": 0.0002141442943016893, "loss": 0.0182, "step": 220810 }, { "epoch": 0.57, "learning_rate": 0.0002141404060853178, "loss": 0.0186, "step": 220820 }, { "epoch": 0.57, "learning_rate": 0.00021413651786894635, "loss": 0.02, "step": 220830 }, { "epoch": 0.57, "learning_rate": 0.00021413262965257486, "loss": 0.0163, "step": 220840 }, { "epoch": 0.57, "learning_rate": 0.00021412874143620343, "loss": 0.0141, "step": 220850 }, { "epoch": 0.57, "learning_rate": 0.00021412485321983197, "loss": 0.0159, "step": 220860 }, { "epoch": 0.57, "learning_rate": 0.00021412096500346048, "loss": 0.0179, "step": 220870 }, { "epoch": 0.57, "learning_rate": 0.00021411707678708903, "loss": 0.019, "step": 220880 }, { "epoch": 0.57, "learning_rate": 0.00021411318857071757, "loss": 0.0157, "step": 220890 }, { "epoch": 0.57, "learning_rate": 0.0002141093003543461, "loss": 0.0154, "step": 220900 }, { "epoch": 0.57, "learning_rate": 0.00021410541213797462, "loss": 0.0168, "step": 220910 }, { "epoch": 0.57, "learning_rate": 0.00021410152392160317, "loss": 0.017, "step": 220920 }, { "epoch": 0.57, "learning_rate": 0.0002140976357052317, "loss": 0.0145, "step": 220930 }, { "epoch": 0.57, "learning_rate": 0.00021409374748886025, "loss": 0.016, "step": 220940 }, { "epoch": 0.57, "learning_rate": 0.00021408985927248876, "loss": 0.0151, "step": 220950 }, { "epoch": 0.57, "learning_rate": 0.0002140859710561173, "loss": 0.0167, "step": 220960 }, { "epoch": 0.57, "learning_rate": 0.00021408208283974587, "loss": 0.0141, "step": 220970 }, { "epoch": 0.57, "learning_rate": 0.0002140781946233744, "loss": 0.0195, "step": 220980 }, { "epoch": 0.57, "learning_rate": 0.0002140743064070029, "loss": 0.0174, "step": 220990 }, { "epoch": 0.57, "learning_rate": 0.00021407041819063144, "loss": 0.0136, "step": 221000 }, { "epoch": 0.57, "eval_cer": 0.8817754674437451, "eval_loss": 0.011082570999860764, "eval_runtime": 107.259, "eval_samples_per_second": 18.646, "eval_steps_per_second": 4.662, "step": 221000 }, { "epoch": 0.57, "learning_rate": 0.00021406652997426001, "loss": 0.0179, "step": 221010 }, { "epoch": 0.57, "learning_rate": 0.00021406264175788853, "loss": 0.0198, "step": 221020 }, { "epoch": 0.57, "learning_rate": 0.00021405875354151707, "loss": 0.0141, "step": 221030 }, { "epoch": 0.57, "learning_rate": 0.00021405486532514558, "loss": 0.0174, "step": 221040 }, { "epoch": 0.57, "learning_rate": 0.00021405097710877415, "loss": 0.0184, "step": 221050 }, { "epoch": 0.57, "learning_rate": 0.00021404708889240267, "loss": 0.0134, "step": 221060 }, { "epoch": 0.57, "learning_rate": 0.0002140432006760312, "loss": 0.0165, "step": 221070 }, { "epoch": 0.57, "learning_rate": 0.00021403931245965972, "loss": 0.0162, "step": 221080 }, { "epoch": 0.57, "learning_rate": 0.00021403542424328827, "loss": 0.0165, "step": 221090 }, { "epoch": 0.57, "learning_rate": 0.0002140315360269168, "loss": 0.0138, "step": 221100 }, { "epoch": 0.57, "learning_rate": 0.00021402764781054535, "loss": 0.0155, "step": 221110 }, { "epoch": 0.57, "learning_rate": 0.00021402375959417386, "loss": 0.0162, "step": 221120 }, { "epoch": 0.57, "learning_rate": 0.0002140198713778024, "loss": 0.016, "step": 221130 }, { "epoch": 0.57, "learning_rate": 0.00021401598316143095, "loss": 0.0145, "step": 221140 }, { "epoch": 0.57, "learning_rate": 0.0002140120949450595, "loss": 0.0157, "step": 221150 }, { "epoch": 0.57, "learning_rate": 0.000214008206728688, "loss": 0.0159, "step": 221160 }, { "epoch": 0.57, "learning_rate": 0.00021400431851231654, "loss": 0.0166, "step": 221170 }, { "epoch": 0.57, "learning_rate": 0.0002140004302959451, "loss": 0.0143, "step": 221180 }, { "epoch": 0.57, "learning_rate": 0.00021399654207957363, "loss": 0.0164, "step": 221190 }, { "epoch": 0.57, "learning_rate": 0.00021399265386320217, "loss": 0.0199, "step": 221200 }, { "epoch": 0.57, "learning_rate": 0.00021398876564683068, "loss": 0.0198, "step": 221210 }, { "epoch": 0.57, "learning_rate": 0.00021398487743045925, "loss": 0.0207, "step": 221220 }, { "epoch": 0.57, "learning_rate": 0.00021398098921408777, "loss": 0.0119, "step": 221230 }, { "epoch": 0.57, "learning_rate": 0.0002139771009977163, "loss": 0.0175, "step": 221240 }, { "epoch": 0.57, "learning_rate": 0.00021397321278134482, "loss": 0.0151, "step": 221250 }, { "epoch": 0.57, "learning_rate": 0.0002139693245649734, "loss": 0.0164, "step": 221260 }, { "epoch": 0.57, "learning_rate": 0.0002139654363486019, "loss": 0.0174, "step": 221270 }, { "epoch": 0.57, "learning_rate": 0.00021396154813223045, "loss": 0.0153, "step": 221280 }, { "epoch": 0.57, "learning_rate": 0.00021395765991585896, "loss": 0.0212, "step": 221290 }, { "epoch": 0.57, "learning_rate": 0.00021395377169948753, "loss": 0.017, "step": 221300 }, { "epoch": 0.57, "learning_rate": 0.00021394988348311605, "loss": 0.0139, "step": 221310 }, { "epoch": 0.57, "learning_rate": 0.0002139459952667446, "loss": 0.0152, "step": 221320 }, { "epoch": 0.57, "learning_rate": 0.0002139421070503731, "loss": 0.0148, "step": 221330 }, { "epoch": 0.57, "learning_rate": 0.00021393821883400164, "loss": 0.0147, "step": 221340 }, { "epoch": 0.57, "learning_rate": 0.0002139343306176302, "loss": 0.0146, "step": 221350 }, { "epoch": 0.57, "learning_rate": 0.00021393044240125873, "loss": 0.0143, "step": 221360 }, { "epoch": 0.57, "learning_rate": 0.00021392655418488727, "loss": 0.0147, "step": 221370 }, { "epoch": 0.57, "learning_rate": 0.00021392266596851578, "loss": 0.0156, "step": 221380 }, { "epoch": 0.57, "learning_rate": 0.00021391877775214435, "loss": 0.0165, "step": 221390 }, { "epoch": 0.57, "learning_rate": 0.00021391488953577287, "loss": 0.0153, "step": 221400 }, { "epoch": 0.57, "learning_rate": 0.0002139110013194014, "loss": 0.015, "step": 221410 }, { "epoch": 0.57, "learning_rate": 0.00021390711310302992, "loss": 0.0158, "step": 221420 }, { "epoch": 0.57, "learning_rate": 0.0002139032248866585, "loss": 0.0167, "step": 221430 }, { "epoch": 0.57, "learning_rate": 0.000213899336670287, "loss": 0.0206, "step": 221440 }, { "epoch": 0.57, "learning_rate": 0.00021389544845391555, "loss": 0.0145, "step": 221450 }, { "epoch": 0.57, "learning_rate": 0.00021389156023754406, "loss": 0.0147, "step": 221460 }, { "epoch": 0.57, "learning_rate": 0.00021388767202117263, "loss": 0.0135, "step": 221470 }, { "epoch": 0.57, "learning_rate": 0.00021388378380480115, "loss": 0.0129, "step": 221480 }, { "epoch": 0.57, "learning_rate": 0.0002138798955884297, "loss": 0.0121, "step": 221490 }, { "epoch": 0.57, "learning_rate": 0.0002138760073720582, "loss": 0.0173, "step": 221500 }, { "epoch": 0.57, "learning_rate": 0.00021387211915568677, "loss": 0.0198, "step": 221510 }, { "epoch": 0.57, "learning_rate": 0.0002138682309393153, "loss": 0.0193, "step": 221520 }, { "epoch": 0.57, "learning_rate": 0.00021386434272294383, "loss": 0.016, "step": 221530 }, { "epoch": 0.57, "learning_rate": 0.00021386045450657234, "loss": 0.0155, "step": 221540 }, { "epoch": 0.57, "learning_rate": 0.0002138565662902009, "loss": 0.017, "step": 221550 }, { "epoch": 0.57, "learning_rate": 0.00021385267807382945, "loss": 0.0169, "step": 221560 }, { "epoch": 0.57, "learning_rate": 0.00021384878985745797, "loss": 0.0187, "step": 221570 }, { "epoch": 0.57, "learning_rate": 0.0002138449016410865, "loss": 0.0189, "step": 221580 }, { "epoch": 0.57, "learning_rate": 0.00021384101342471502, "loss": 0.0152, "step": 221590 }, { "epoch": 0.57, "learning_rate": 0.0002138371252083436, "loss": 0.0175, "step": 221600 }, { "epoch": 0.57, "learning_rate": 0.0002138332369919721, "loss": 0.0148, "step": 221610 }, { "epoch": 0.57, "learning_rate": 0.00021382934877560065, "loss": 0.0158, "step": 221620 }, { "epoch": 0.57, "learning_rate": 0.00021382546055922916, "loss": 0.0188, "step": 221630 }, { "epoch": 0.57, "learning_rate": 0.00021382157234285773, "loss": 0.0141, "step": 221640 }, { "epoch": 0.57, "learning_rate": 0.00021381768412648624, "loss": 0.0149, "step": 221650 }, { "epoch": 0.57, "learning_rate": 0.00021381379591011479, "loss": 0.0157, "step": 221660 }, { "epoch": 0.57, "learning_rate": 0.0002138099076937433, "loss": 0.0194, "step": 221670 }, { "epoch": 0.57, "learning_rate": 0.00021380601947737187, "loss": 0.0182, "step": 221680 }, { "epoch": 0.57, "learning_rate": 0.0002138021312610004, "loss": 0.0175, "step": 221690 }, { "epoch": 0.57, "learning_rate": 0.00021379824304462893, "loss": 0.0137, "step": 221700 }, { "epoch": 0.57, "learning_rate": 0.00021379435482825744, "loss": 0.0174, "step": 221710 }, { "epoch": 0.57, "learning_rate": 0.000213790466611886, "loss": 0.0172, "step": 221720 }, { "epoch": 0.57, "learning_rate": 0.00021378657839551455, "loss": 0.0174, "step": 221730 }, { "epoch": 0.57, "learning_rate": 0.00021378269017914307, "loss": 0.017, "step": 221740 }, { "epoch": 0.57, "learning_rate": 0.0002137788019627716, "loss": 0.0149, "step": 221750 }, { "epoch": 0.57, "learning_rate": 0.00021377491374640015, "loss": 0.0226, "step": 221760 }, { "epoch": 0.57, "learning_rate": 0.0002137710255300287, "loss": 0.0146, "step": 221770 }, { "epoch": 0.57, "learning_rate": 0.0002137671373136572, "loss": 0.017, "step": 221780 }, { "epoch": 0.57, "learning_rate": 0.00021376324909728575, "loss": 0.0134, "step": 221790 }, { "epoch": 0.57, "learning_rate": 0.0002137593608809143, "loss": 0.0154, "step": 221800 }, { "epoch": 0.57, "learning_rate": 0.00021375547266454283, "loss": 0.0192, "step": 221810 }, { "epoch": 0.57, "learning_rate": 0.00021375158444817134, "loss": 0.0129, "step": 221820 }, { "epoch": 0.58, "learning_rate": 0.00021374769623179989, "loss": 0.019, "step": 221830 }, { "epoch": 0.58, "learning_rate": 0.0002137438080154284, "loss": 0.0162, "step": 221840 }, { "epoch": 0.58, "learning_rate": 0.00021373991979905697, "loss": 0.0189, "step": 221850 }, { "epoch": 0.58, "learning_rate": 0.00021373603158268548, "loss": 0.0153, "step": 221860 }, { "epoch": 0.58, "learning_rate": 0.00021373214336631403, "loss": 0.0142, "step": 221870 }, { "epoch": 0.58, "learning_rate": 0.00021372825514994254, "loss": 0.0184, "step": 221880 }, { "epoch": 0.58, "learning_rate": 0.0002137243669335711, "loss": 0.0182, "step": 221890 }, { "epoch": 0.58, "learning_rate": 0.00021372047871719965, "loss": 0.0164, "step": 221900 }, { "epoch": 0.58, "learning_rate": 0.00021371659050082816, "loss": 0.0161, "step": 221910 }, { "epoch": 0.58, "learning_rate": 0.0002137127022844567, "loss": 0.0167, "step": 221920 }, { "epoch": 0.58, "learning_rate": 0.00021370881406808525, "loss": 0.0204, "step": 221930 }, { "epoch": 0.58, "learning_rate": 0.0002137049258517138, "loss": 0.019, "step": 221940 }, { "epoch": 0.58, "learning_rate": 0.0002137010376353423, "loss": 0.0186, "step": 221950 }, { "epoch": 0.58, "learning_rate": 0.00021369714941897085, "loss": 0.0164, "step": 221960 }, { "epoch": 0.58, "learning_rate": 0.0002136932612025994, "loss": 0.018, "step": 221970 }, { "epoch": 0.58, "learning_rate": 0.00021368937298622793, "loss": 0.0183, "step": 221980 }, { "epoch": 0.58, "learning_rate": 0.00021368548476985644, "loss": 0.0156, "step": 221990 }, { "epoch": 0.58, "learning_rate": 0.00021368159655348499, "loss": 0.0141, "step": 222000 }, { "epoch": 0.58, "eval_cer": 0.8817600714374692, "eval_loss": 0.011201182380318642, "eval_runtime": 107.2894, "eval_samples_per_second": 18.641, "eval_steps_per_second": 4.66, "step": 222000 }, { "epoch": 0.58, "learning_rate": 0.00021367770833711353, "loss": 0.0159, "step": 222010 }, { "epoch": 0.58, "learning_rate": 0.00021367382012074207, "loss": 0.0171, "step": 222020 }, { "epoch": 0.58, "learning_rate": 0.00021366993190437058, "loss": 0.0216, "step": 222030 }, { "epoch": 0.58, "learning_rate": 0.00021366604368799912, "loss": 0.0186, "step": 222040 }, { "epoch": 0.58, "learning_rate": 0.0002136621554716277, "loss": 0.0166, "step": 222050 }, { "epoch": 0.58, "learning_rate": 0.0002136582672552562, "loss": 0.0178, "step": 222060 }, { "epoch": 0.58, "learning_rate": 0.00021365437903888475, "loss": 0.0164, "step": 222070 }, { "epoch": 0.58, "learning_rate": 0.00021365049082251326, "loss": 0.0161, "step": 222080 }, { "epoch": 0.58, "learning_rate": 0.0002136466026061418, "loss": 0.016, "step": 222090 }, { "epoch": 0.58, "learning_rate": 0.00021364271438977035, "loss": 0.0152, "step": 222100 }, { "epoch": 0.58, "learning_rate": 0.0002136388261733989, "loss": 0.0156, "step": 222110 }, { "epoch": 0.58, "learning_rate": 0.0002136349379570274, "loss": 0.0197, "step": 222120 }, { "epoch": 0.58, "learning_rate": 0.00021363104974065595, "loss": 0.0166, "step": 222130 }, { "epoch": 0.58, "learning_rate": 0.0002136271615242845, "loss": 0.0171, "step": 222140 }, { "epoch": 0.58, "learning_rate": 0.00021362327330791303, "loss": 0.0189, "step": 222150 }, { "epoch": 0.58, "learning_rate": 0.00021361938509154154, "loss": 0.0159, "step": 222160 }, { "epoch": 0.58, "learning_rate": 0.00021361549687517008, "loss": 0.0224, "step": 222170 }, { "epoch": 0.58, "learning_rate": 0.00021361160865879863, "loss": 0.0177, "step": 222180 }, { "epoch": 0.58, "learning_rate": 0.00021360772044242717, "loss": 0.0156, "step": 222190 }, { "epoch": 0.58, "learning_rate": 0.00021360383222605568, "loss": 0.0176, "step": 222200 }, { "epoch": 0.58, "learning_rate": 0.00021359994400968422, "loss": 0.0161, "step": 222210 }, { "epoch": 0.58, "learning_rate": 0.0002135960557933128, "loss": 0.0174, "step": 222220 }, { "epoch": 0.58, "learning_rate": 0.0002135921675769413, "loss": 0.0137, "step": 222230 }, { "epoch": 0.58, "learning_rate": 0.00021358827936056985, "loss": 0.0147, "step": 222240 }, { "epoch": 0.58, "learning_rate": 0.00021358439114419836, "loss": 0.0148, "step": 222250 }, { "epoch": 0.58, "learning_rate": 0.00021358050292782693, "loss": 0.0201, "step": 222260 }, { "epoch": 0.58, "learning_rate": 0.00021357661471145545, "loss": 0.0176, "step": 222270 }, { "epoch": 0.58, "learning_rate": 0.000213572726495084, "loss": 0.0158, "step": 222280 }, { "epoch": 0.58, "learning_rate": 0.0002135688382787125, "loss": 0.0216, "step": 222290 }, { "epoch": 0.58, "learning_rate": 0.00021356495006234107, "loss": 0.0187, "step": 222300 }, { "epoch": 0.58, "learning_rate": 0.00021356106184596959, "loss": 0.0156, "step": 222310 }, { "epoch": 0.58, "learning_rate": 0.00021355717362959813, "loss": 0.017, "step": 222320 }, { "epoch": 0.58, "learning_rate": 0.00021355328541322664, "loss": 0.0184, "step": 222330 }, { "epoch": 0.58, "learning_rate": 0.00021354939719685518, "loss": 0.0167, "step": 222340 }, { "epoch": 0.58, "learning_rate": 0.00021354550898048373, "loss": 0.0186, "step": 222350 }, { "epoch": 0.58, "learning_rate": 0.00021354162076411227, "loss": 0.0243, "step": 222360 }, { "epoch": 0.58, "learning_rate": 0.00021353773254774078, "loss": 0.0173, "step": 222370 }, { "epoch": 0.58, "learning_rate": 0.00021353384433136932, "loss": 0.0157, "step": 222380 }, { "epoch": 0.58, "learning_rate": 0.0002135299561149979, "loss": 0.0151, "step": 222390 }, { "epoch": 0.58, "learning_rate": 0.0002135260678986264, "loss": 0.0205, "step": 222400 }, { "epoch": 0.58, "learning_rate": 0.00021352217968225492, "loss": 0.0164, "step": 222410 }, { "epoch": 0.58, "learning_rate": 0.00021351829146588346, "loss": 0.0137, "step": 222420 }, { "epoch": 0.58, "learning_rate": 0.00021351440324951203, "loss": 0.0218, "step": 222430 }, { "epoch": 0.58, "learning_rate": 0.00021351051503314055, "loss": 0.0186, "step": 222440 }, { "epoch": 0.58, "learning_rate": 0.0002135066268167691, "loss": 0.0147, "step": 222450 }, { "epoch": 0.58, "learning_rate": 0.0002135027386003976, "loss": 0.0158, "step": 222460 }, { "epoch": 0.58, "learning_rate": 0.00021349885038402617, "loss": 0.0154, "step": 222470 }, { "epoch": 0.58, "learning_rate": 0.00021349496216765469, "loss": 0.0221, "step": 222480 }, { "epoch": 0.58, "learning_rate": 0.00021349107395128323, "loss": 0.0159, "step": 222490 }, { "epoch": 0.58, "learning_rate": 0.00021348718573491174, "loss": 0.0163, "step": 222500 }, { "epoch": 0.58, "learning_rate": 0.0002134832975185403, "loss": 0.0162, "step": 222510 }, { "epoch": 0.58, "learning_rate": 0.00021347940930216883, "loss": 0.0148, "step": 222520 }, { "epoch": 0.58, "learning_rate": 0.00021347552108579737, "loss": 0.0167, "step": 222530 }, { "epoch": 0.58, "learning_rate": 0.00021347163286942588, "loss": 0.0195, "step": 222540 }, { "epoch": 0.58, "learning_rate": 0.00021346774465305445, "loss": 0.0131, "step": 222550 }, { "epoch": 0.58, "learning_rate": 0.000213463856436683, "loss": 0.0159, "step": 222560 }, { "epoch": 0.58, "learning_rate": 0.0002134599682203115, "loss": 0.0165, "step": 222570 }, { "epoch": 0.58, "learning_rate": 0.00021345608000394002, "loss": 0.0156, "step": 222580 }, { "epoch": 0.58, "learning_rate": 0.00021345219178756856, "loss": 0.0169, "step": 222590 }, { "epoch": 0.58, "learning_rate": 0.00021344830357119713, "loss": 0.015, "step": 222600 }, { "epoch": 0.58, "learning_rate": 0.00021344441535482565, "loss": 0.016, "step": 222610 }, { "epoch": 0.58, "learning_rate": 0.0002134405271384542, "loss": 0.0252, "step": 222620 }, { "epoch": 0.58, "learning_rate": 0.0002134366389220827, "loss": 0.0642, "step": 222630 }, { "epoch": 0.58, "learning_rate": 0.00021343275070571127, "loss": 0.0169, "step": 222640 }, { "epoch": 0.58, "learning_rate": 0.00021342886248933979, "loss": 0.0138, "step": 222650 }, { "epoch": 0.58, "learning_rate": 0.00021342497427296833, "loss": 0.0194, "step": 222660 }, { "epoch": 0.58, "learning_rate": 0.00021342108605659684, "loss": 0.0156, "step": 222670 }, { "epoch": 0.58, "learning_rate": 0.0002134171978402254, "loss": 0.0163, "step": 222680 }, { "epoch": 0.58, "learning_rate": 0.00021341330962385392, "loss": 0.0155, "step": 222690 }, { "epoch": 0.58, "learning_rate": 0.00021340942140748247, "loss": 0.0117, "step": 222700 }, { "epoch": 0.58, "learning_rate": 0.00021340553319111098, "loss": 0.018, "step": 222710 }, { "epoch": 0.58, "learning_rate": 0.00021340164497473955, "loss": 0.0186, "step": 222720 }, { "epoch": 0.58, "learning_rate": 0.00021339775675836806, "loss": 0.0152, "step": 222730 }, { "epoch": 0.58, "learning_rate": 0.0002133938685419966, "loss": 0.0152, "step": 222740 }, { "epoch": 0.58, "learning_rate": 0.00021338998032562512, "loss": 0.0125, "step": 222750 }, { "epoch": 0.58, "learning_rate": 0.0002133860921092537, "loss": 0.0168, "step": 222760 }, { "epoch": 0.58, "learning_rate": 0.00021338220389288223, "loss": 0.0173, "step": 222770 }, { "epoch": 0.58, "learning_rate": 0.00021337831567651075, "loss": 0.018, "step": 222780 }, { "epoch": 0.58, "learning_rate": 0.0002133744274601393, "loss": 0.0187, "step": 222790 }, { "epoch": 0.58, "learning_rate": 0.0002133705392437678, "loss": 0.0164, "step": 222800 }, { "epoch": 0.58, "learning_rate": 0.00021336665102739637, "loss": 0.015, "step": 222810 }, { "epoch": 0.58, "learning_rate": 0.00021336276281102488, "loss": 0.0146, "step": 222820 }, { "epoch": 0.58, "learning_rate": 0.00021335887459465343, "loss": 0.012, "step": 222830 }, { "epoch": 0.58, "learning_rate": 0.00021335498637828194, "loss": 0.0222, "step": 222840 }, { "epoch": 0.58, "learning_rate": 0.0002133510981619105, "loss": 0.0164, "step": 222850 }, { "epoch": 0.58, "learning_rate": 0.00021334720994553902, "loss": 0.0172, "step": 222860 }, { "epoch": 0.58, "learning_rate": 0.00021334332172916757, "loss": 0.0213, "step": 222870 }, { "epoch": 0.58, "learning_rate": 0.00021333943351279608, "loss": 0.0153, "step": 222880 }, { "epoch": 0.58, "learning_rate": 0.00021333554529642465, "loss": 0.0264, "step": 222890 }, { "epoch": 0.58, "learning_rate": 0.00021333165708005316, "loss": 0.0198, "step": 222900 }, { "epoch": 0.58, "learning_rate": 0.0002133277688636817, "loss": 0.0173, "step": 222910 }, { "epoch": 0.58, "learning_rate": 0.00021332388064731022, "loss": 0.0166, "step": 222920 }, { "epoch": 0.58, "learning_rate": 0.0002133199924309388, "loss": 0.0212, "step": 222930 }, { "epoch": 0.58, "learning_rate": 0.00021331610421456733, "loss": 0.017, "step": 222940 }, { "epoch": 0.58, "learning_rate": 0.00021331221599819584, "loss": 0.0178, "step": 222950 }, { "epoch": 0.58, "learning_rate": 0.00021330832778182439, "loss": 0.0201, "step": 222960 }, { "epoch": 0.58, "learning_rate": 0.00021330443956545293, "loss": 0.0148, "step": 222970 }, { "epoch": 0.58, "learning_rate": 0.00021330055134908147, "loss": 0.0187, "step": 222980 }, { "epoch": 0.58, "learning_rate": 0.00021329666313270998, "loss": 0.0185, "step": 222990 }, { "epoch": 0.58, "learning_rate": 0.00021329277491633853, "loss": 0.0171, "step": 223000 }, { "epoch": 0.58, "eval_cer": 0.8817726681698768, "eval_loss": 0.010963888838887215, "eval_runtime": 107.1777, "eval_samples_per_second": 18.661, "eval_steps_per_second": 4.665, "step": 223000 }, { "epoch": 0.58, "learning_rate": 0.00021328888669996707, "loss": 0.0147, "step": 223010 }, { "epoch": 0.58, "learning_rate": 0.0002132849984835956, "loss": 0.0208, "step": 223020 }, { "epoch": 0.58, "learning_rate": 0.00021328111026722412, "loss": 0.014, "step": 223030 }, { "epoch": 0.58, "learning_rate": 0.00021327722205085266, "loss": 0.0171, "step": 223040 }, { "epoch": 0.58, "learning_rate": 0.00021327333383448118, "loss": 0.021, "step": 223050 }, { "epoch": 0.58, "learning_rate": 0.00021326944561810975, "loss": 0.0131, "step": 223060 }, { "epoch": 0.58, "learning_rate": 0.00021326555740173826, "loss": 0.0159, "step": 223070 }, { "epoch": 0.58, "learning_rate": 0.0002132616691853668, "loss": 0.0185, "step": 223080 }, { "epoch": 0.58, "learning_rate": 0.00021325778096899532, "loss": 0.0158, "step": 223090 }, { "epoch": 0.58, "learning_rate": 0.0002132538927526239, "loss": 0.0222, "step": 223100 }, { "epoch": 0.58, "learning_rate": 0.00021325000453625243, "loss": 0.0224, "step": 223110 }, { "epoch": 0.58, "learning_rate": 0.00021324611631988094, "loss": 0.0179, "step": 223120 }, { "epoch": 0.58, "learning_rate": 0.00021324222810350946, "loss": 0.0141, "step": 223130 }, { "epoch": 0.58, "learning_rate": 0.00021323833988713803, "loss": 0.016, "step": 223140 }, { "epoch": 0.58, "learning_rate": 0.00021323445167076657, "loss": 0.0198, "step": 223150 }, { "epoch": 0.58, "learning_rate": 0.00021323056345439508, "loss": 0.0177, "step": 223160 }, { "epoch": 0.58, "learning_rate": 0.00021322667523802362, "loss": 0.0139, "step": 223170 }, { "epoch": 0.58, "learning_rate": 0.00021322278702165217, "loss": 0.0173, "step": 223180 }, { "epoch": 0.58, "learning_rate": 0.0002132188988052807, "loss": 0.0158, "step": 223190 }, { "epoch": 0.58, "learning_rate": 0.00021321501058890922, "loss": 0.0153, "step": 223200 }, { "epoch": 0.58, "learning_rate": 0.00021321112237253776, "loss": 0.0159, "step": 223210 }, { "epoch": 0.58, "learning_rate": 0.0002132072341561663, "loss": 0.0177, "step": 223220 }, { "epoch": 0.58, "learning_rate": 0.00021320334593979485, "loss": 0.0174, "step": 223230 }, { "epoch": 0.58, "learning_rate": 0.00021319945772342336, "loss": 0.0129, "step": 223240 }, { "epoch": 0.58, "learning_rate": 0.0002131955695070519, "loss": 0.0144, "step": 223250 }, { "epoch": 0.58, "learning_rate": 0.00021319168129068047, "loss": 0.0162, "step": 223260 }, { "epoch": 0.58, "learning_rate": 0.000213187793074309, "loss": 0.0148, "step": 223270 }, { "epoch": 0.58, "learning_rate": 0.00021318390485793753, "loss": 0.0146, "step": 223280 }, { "epoch": 0.58, "learning_rate": 0.00021318001664156604, "loss": 0.015, "step": 223290 }, { "epoch": 0.58, "learning_rate": 0.00021317612842519456, "loss": 0.0145, "step": 223300 }, { "epoch": 0.58, "learning_rate": 0.00021317224020882313, "loss": 0.0185, "step": 223310 }, { "epoch": 0.58, "learning_rate": 0.00021316835199245167, "loss": 0.0146, "step": 223320 }, { "epoch": 0.58, "learning_rate": 0.00021316446377608018, "loss": 0.0161, "step": 223330 }, { "epoch": 0.58, "learning_rate": 0.00021316057555970872, "loss": 0.0136, "step": 223340 }, { "epoch": 0.58, "learning_rate": 0.00021315668734333727, "loss": 0.0137, "step": 223350 }, { "epoch": 0.58, "learning_rate": 0.0002131527991269658, "loss": 0.0146, "step": 223360 }, { "epoch": 0.58, "learning_rate": 0.00021314891091059432, "loss": 0.0202, "step": 223370 }, { "epoch": 0.58, "learning_rate": 0.00021314502269422286, "loss": 0.0123, "step": 223380 }, { "epoch": 0.58, "learning_rate": 0.0002131411344778514, "loss": 0.0152, "step": 223390 }, { "epoch": 0.58, "learning_rate": 0.00021313724626147995, "loss": 0.0165, "step": 223400 }, { "epoch": 0.58, "learning_rate": 0.00021313335804510846, "loss": 0.0162, "step": 223410 }, { "epoch": 0.58, "learning_rate": 0.000213129469828737, "loss": 0.0163, "step": 223420 }, { "epoch": 0.58, "learning_rate": 0.00021312558161236557, "loss": 0.0159, "step": 223430 }, { "epoch": 0.58, "learning_rate": 0.0002131216933959941, "loss": 0.0183, "step": 223440 }, { "epoch": 0.58, "learning_rate": 0.0002131178051796226, "loss": 0.0147, "step": 223450 }, { "epoch": 0.58, "learning_rate": 0.00021311391696325114, "loss": 0.0175, "step": 223460 }, { "epoch": 0.58, "learning_rate": 0.0002131100287468797, "loss": 0.015, "step": 223470 }, { "epoch": 0.58, "learning_rate": 0.00021310614053050823, "loss": 0.015, "step": 223480 }, { "epoch": 0.58, "learning_rate": 0.00021310225231413677, "loss": 0.0163, "step": 223490 }, { "epoch": 0.58, "learning_rate": 0.00021309836409776528, "loss": 0.0173, "step": 223500 }, { "epoch": 0.58, "learning_rate": 0.00021309447588139385, "loss": 0.0168, "step": 223510 }, { "epoch": 0.58, "learning_rate": 0.00021309058766502237, "loss": 0.0153, "step": 223520 }, { "epoch": 0.58, "learning_rate": 0.0002130866994486509, "loss": 0.0167, "step": 223530 }, { "epoch": 0.58, "learning_rate": 0.00021308281123227942, "loss": 0.0187, "step": 223540 }, { "epoch": 0.58, "learning_rate": 0.00021307892301590796, "loss": 0.0187, "step": 223550 }, { "epoch": 0.58, "learning_rate": 0.0002130750347995365, "loss": 0.016, "step": 223560 }, { "epoch": 0.58, "learning_rate": 0.00021307114658316505, "loss": 0.0182, "step": 223570 }, { "epoch": 0.58, "learning_rate": 0.00021306725836679356, "loss": 0.0152, "step": 223580 }, { "epoch": 0.58, "learning_rate": 0.0002130633701504221, "loss": 0.0139, "step": 223590 }, { "epoch": 0.58, "learning_rate": 0.00021305948193405064, "loss": 0.0211, "step": 223600 }, { "epoch": 0.58, "learning_rate": 0.00021305559371767919, "loss": 0.0184, "step": 223610 }, { "epoch": 0.58, "learning_rate": 0.0002130517055013077, "loss": 0.0187, "step": 223620 }, { "epoch": 0.58, "learning_rate": 0.00021304781728493624, "loss": 0.0157, "step": 223630 }, { "epoch": 0.58, "learning_rate": 0.0002130439290685648, "loss": 0.0182, "step": 223640 }, { "epoch": 0.58, "learning_rate": 0.00021304004085219333, "loss": 0.0201, "step": 223650 }, { "epoch": 0.58, "learning_rate": 0.00021303615263582187, "loss": 0.0188, "step": 223660 }, { "epoch": 0.58, "learning_rate": 0.00021303226441945038, "loss": 0.0164, "step": 223670 }, { "epoch": 0.58, "learning_rate": 0.00021302837620307895, "loss": 0.0165, "step": 223680 }, { "epoch": 0.58, "learning_rate": 0.00021302448798670746, "loss": 0.0141, "step": 223690 }, { "epoch": 0.58, "learning_rate": 0.000213020599770336, "loss": 0.0143, "step": 223700 }, { "epoch": 0.58, "learning_rate": 0.00021301671155396452, "loss": 0.016, "step": 223710 }, { "epoch": 0.58, "learning_rate": 0.0002130128233375931, "loss": 0.016, "step": 223720 }, { "epoch": 0.58, "learning_rate": 0.0002130089351212216, "loss": 0.0143, "step": 223730 }, { "epoch": 0.58, "learning_rate": 0.00021300504690485015, "loss": 0.0119, "step": 223740 }, { "epoch": 0.58, "learning_rate": 0.00021300115868847866, "loss": 0.0162, "step": 223750 }, { "epoch": 0.58, "learning_rate": 0.00021299727047210723, "loss": 0.0177, "step": 223760 }, { "epoch": 0.58, "learning_rate": 0.00021299338225573574, "loss": 0.0158, "step": 223770 }, { "epoch": 0.58, "learning_rate": 0.00021298949403936429, "loss": 0.0183, "step": 223780 }, { "epoch": 0.58, "learning_rate": 0.0002129856058229928, "loss": 0.0146, "step": 223790 }, { "epoch": 0.58, "learning_rate": 0.00021298171760662134, "loss": 0.0179, "step": 223800 }, { "epoch": 0.58, "learning_rate": 0.0002129778293902499, "loss": 0.015, "step": 223810 }, { "epoch": 0.58, "learning_rate": 0.00021297394117387842, "loss": 0.0182, "step": 223820 }, { "epoch": 0.58, "learning_rate": 0.00021297005295750697, "loss": 0.0155, "step": 223830 }, { "epoch": 0.58, "learning_rate": 0.00021296616474113548, "loss": 0.0159, "step": 223840 }, { "epoch": 0.58, "learning_rate": 0.00021296227652476405, "loss": 0.0145, "step": 223850 }, { "epoch": 0.58, "learning_rate": 0.00021295838830839256, "loss": 0.0163, "step": 223860 }, { "epoch": 0.58, "learning_rate": 0.0002129545000920211, "loss": 0.0135, "step": 223870 }, { "epoch": 0.58, "learning_rate": 0.00021295061187564962, "loss": 0.0191, "step": 223880 }, { "epoch": 0.58, "learning_rate": 0.0002129467236592782, "loss": 0.0199, "step": 223890 }, { "epoch": 0.58, "learning_rate": 0.0002129428354429067, "loss": 0.0164, "step": 223900 }, { "epoch": 0.58, "learning_rate": 0.00021293894722653525, "loss": 0.0184, "step": 223910 }, { "epoch": 0.58, "learning_rate": 0.00021293505901016376, "loss": 0.0166, "step": 223920 }, { "epoch": 0.58, "learning_rate": 0.00021293117079379233, "loss": 0.0189, "step": 223930 }, { "epoch": 0.58, "learning_rate": 0.00021292728257742084, "loss": 0.017, "step": 223940 }, { "epoch": 0.58, "learning_rate": 0.00021292339436104938, "loss": 0.0172, "step": 223950 }, { "epoch": 0.58, "learning_rate": 0.0002129195061446779, "loss": 0.0177, "step": 223960 }, { "epoch": 0.58, "learning_rate": 0.00021291561792830647, "loss": 0.0165, "step": 223970 }, { "epoch": 0.58, "learning_rate": 0.000212911729711935, "loss": 0.0172, "step": 223980 }, { "epoch": 0.58, "learning_rate": 0.00021290784149556352, "loss": 0.0211, "step": 223990 }, { "epoch": 0.58, "learning_rate": 0.00021290395327919204, "loss": 0.0137, "step": 224000 }, { "epoch": 0.58, "eval_cer": 0.8817502739789299, "eval_loss": 0.010993575677275658, "eval_runtime": 107.4094, "eval_samples_per_second": 18.62, "eval_steps_per_second": 4.655, "step": 224000 }, { "epoch": 0.58, "learning_rate": 0.0002129000650628206, "loss": 0.0216, "step": 224010 }, { "epoch": 0.58, "learning_rate": 0.00021289617684644915, "loss": 0.0132, "step": 224020 }, { "epoch": 0.58, "learning_rate": 0.00021289228863007766, "loss": 0.0245, "step": 224030 }, { "epoch": 0.58, "learning_rate": 0.0002128884004137062, "loss": 0.0217, "step": 224040 }, { "epoch": 0.58, "learning_rate": 0.00021288451219733472, "loss": 0.0149, "step": 224050 }, { "epoch": 0.58, "learning_rate": 0.0002128806239809633, "loss": 0.0179, "step": 224060 }, { "epoch": 0.58, "learning_rate": 0.0002128767357645918, "loss": 0.0162, "step": 224070 }, { "epoch": 0.58, "learning_rate": 0.00021287284754822034, "loss": 0.0169, "step": 224080 }, { "epoch": 0.58, "learning_rate": 0.00021286895933184886, "loss": 0.0115, "step": 224090 }, { "epoch": 0.58, "learning_rate": 0.00021286507111547743, "loss": 0.015, "step": 224100 }, { "epoch": 0.58, "learning_rate": 0.00021286118289910594, "loss": 0.0178, "step": 224110 }, { "epoch": 0.58, "learning_rate": 0.00021285729468273448, "loss": 0.0186, "step": 224120 }, { "epoch": 0.58, "learning_rate": 0.000212853406466363, "loss": 0.0169, "step": 224130 }, { "epoch": 0.58, "learning_rate": 0.00021284951824999157, "loss": 0.0132, "step": 224140 }, { "epoch": 0.58, "learning_rate": 0.0002128456300336201, "loss": 0.0301, "step": 224150 }, { "epoch": 0.58, "learning_rate": 0.00021284174181724862, "loss": 0.0339, "step": 224160 }, { "epoch": 0.58, "learning_rate": 0.00021283785360087714, "loss": 0.0134, "step": 224170 }, { "epoch": 0.58, "learning_rate": 0.0002128339653845057, "loss": 0.0199, "step": 224180 }, { "epoch": 0.58, "learning_rate": 0.00021283007716813425, "loss": 0.0174, "step": 224190 }, { "epoch": 0.58, "learning_rate": 0.00021282618895176276, "loss": 0.015, "step": 224200 }, { "epoch": 0.58, "learning_rate": 0.0002128223007353913, "loss": 0.0178, "step": 224210 }, { "epoch": 0.58, "learning_rate": 0.00021281841251901985, "loss": 0.0193, "step": 224220 }, { "epoch": 0.58, "learning_rate": 0.0002128145243026484, "loss": 0.0225, "step": 224230 }, { "epoch": 0.58, "learning_rate": 0.0002128106360862769, "loss": 0.0129, "step": 224240 }, { "epoch": 0.58, "learning_rate": 0.00021280674786990544, "loss": 0.0185, "step": 224250 }, { "epoch": 0.58, "learning_rate": 0.00021280285965353399, "loss": 0.0165, "step": 224260 }, { "epoch": 0.58, "learning_rate": 0.00021279897143716253, "loss": 0.017, "step": 224270 }, { "epoch": 0.58, "learning_rate": 0.00021279508322079104, "loss": 0.018, "step": 224280 }, { "epoch": 0.58, "learning_rate": 0.00021279119500441958, "loss": 0.0162, "step": 224290 }, { "epoch": 0.58, "learning_rate": 0.0002127873067880481, "loss": 0.0185, "step": 224300 }, { "epoch": 0.58, "learning_rate": 0.00021278341857167667, "loss": 0.0153, "step": 224310 }, { "epoch": 0.58, "learning_rate": 0.00021277953035530518, "loss": 0.017, "step": 224320 }, { "epoch": 0.58, "learning_rate": 0.00021277564213893372, "loss": 0.016, "step": 224330 }, { "epoch": 0.58, "learning_rate": 0.00021277175392256224, "loss": 0.0189, "step": 224340 }, { "epoch": 0.58, "learning_rate": 0.0002127678657061908, "loss": 0.0153, "step": 224350 }, { "epoch": 0.58, "learning_rate": 0.00021276397748981935, "loss": 0.015, "step": 224360 }, { "epoch": 0.58, "learning_rate": 0.00021276008927344786, "loss": 0.0184, "step": 224370 }, { "epoch": 0.58, "learning_rate": 0.0002127562010570764, "loss": 0.0187, "step": 224380 }, { "epoch": 0.58, "learning_rate": 0.00021275231284070495, "loss": 0.0154, "step": 224390 }, { "epoch": 0.58, "learning_rate": 0.0002127484246243335, "loss": 0.0143, "step": 224400 }, { "epoch": 0.58, "learning_rate": 0.000212744536407962, "loss": 0.0148, "step": 224410 }, { "epoch": 0.58, "learning_rate": 0.00021274064819159054, "loss": 0.0175, "step": 224420 }, { "epoch": 0.58, "learning_rate": 0.00021273675997521909, "loss": 0.0159, "step": 224430 }, { "epoch": 0.58, "learning_rate": 0.00021273287175884763, "loss": 0.0152, "step": 224440 }, { "epoch": 0.58, "learning_rate": 0.00021272898354247614, "loss": 0.0177, "step": 224450 }, { "epoch": 0.58, "learning_rate": 0.00021272509532610468, "loss": 0.0158, "step": 224460 }, { "epoch": 0.58, "learning_rate": 0.00021272120710973322, "loss": 0.018, "step": 224470 }, { "epoch": 0.58, "learning_rate": 0.00021271731889336177, "loss": 0.0203, "step": 224480 }, { "epoch": 0.58, "learning_rate": 0.00021271343067699028, "loss": 0.0161, "step": 224490 }, { "epoch": 0.58, "learning_rate": 0.00021270954246061882, "loss": 0.0172, "step": 224500 }, { "epoch": 0.58, "learning_rate": 0.0002127056542442474, "loss": 0.0172, "step": 224510 }, { "epoch": 0.58, "learning_rate": 0.0002127017660278759, "loss": 0.0144, "step": 224520 }, { "epoch": 0.58, "learning_rate": 0.00021269787781150445, "loss": 0.0196, "step": 224530 }, { "epoch": 0.58, "learning_rate": 0.00021269398959513296, "loss": 0.0168, "step": 224540 }, { "epoch": 0.58, "learning_rate": 0.0002126901013787615, "loss": 0.0185, "step": 224550 }, { "epoch": 0.58, "learning_rate": 0.00021268621316239005, "loss": 0.0213, "step": 224560 }, { "epoch": 0.58, "learning_rate": 0.0002126823249460186, "loss": 0.018, "step": 224570 }, { "epoch": 0.58, "learning_rate": 0.0002126784367296471, "loss": 0.0142, "step": 224580 }, { "epoch": 0.58, "learning_rate": 0.00021267454851327564, "loss": 0.0172, "step": 224590 }, { "epoch": 0.58, "learning_rate": 0.00021267066029690418, "loss": 0.014, "step": 224600 }, { "epoch": 0.58, "learning_rate": 0.00021266677208053273, "loss": 0.0158, "step": 224610 }, { "epoch": 0.58, "learning_rate": 0.00021266288386416124, "loss": 0.0144, "step": 224620 }, { "epoch": 0.58, "learning_rate": 0.00021265899564778978, "loss": 0.0166, "step": 224630 }, { "epoch": 0.58, "learning_rate": 0.00021265510743141832, "loss": 0.0169, "step": 224640 }, { "epoch": 0.58, "learning_rate": 0.00021265121921504687, "loss": 0.0169, "step": 224650 }, { "epoch": 0.58, "learning_rate": 0.00021264733099867538, "loss": 0.0165, "step": 224660 }, { "epoch": 0.58, "learning_rate": 0.00021264344278230392, "loss": 0.0176, "step": 224670 }, { "epoch": 0.58, "learning_rate": 0.0002126395545659325, "loss": 0.0154, "step": 224680 }, { "epoch": 0.58, "learning_rate": 0.000212635666349561, "loss": 0.0128, "step": 224690 }, { "epoch": 0.58, "learning_rate": 0.00021263177813318955, "loss": 0.0151, "step": 224700 }, { "epoch": 0.58, "learning_rate": 0.00021262788991681806, "loss": 0.0154, "step": 224710 }, { "epoch": 0.58, "learning_rate": 0.00021262400170044663, "loss": 0.0186, "step": 224720 }, { "epoch": 0.58, "learning_rate": 0.00021262011348407514, "loss": 0.0136, "step": 224730 }, { "epoch": 0.58, "learning_rate": 0.00021261622526770369, "loss": 0.016, "step": 224740 }, { "epoch": 0.58, "learning_rate": 0.0002126123370513322, "loss": 0.0178, "step": 224750 }, { "epoch": 0.58, "learning_rate": 0.00021260844883496077, "loss": 0.0132, "step": 224760 }, { "epoch": 0.58, "learning_rate": 0.00021260456061858928, "loss": 0.0128, "step": 224770 }, { "epoch": 0.58, "learning_rate": 0.00021260067240221783, "loss": 0.0171, "step": 224780 }, { "epoch": 0.58, "learning_rate": 0.00021259678418584634, "loss": 0.0142, "step": 224790 }, { "epoch": 0.58, "learning_rate": 0.00021259289596947488, "loss": 0.0143, "step": 224800 }, { "epoch": 0.58, "learning_rate": 0.00021258900775310342, "loss": 0.0144, "step": 224810 }, { "epoch": 0.58, "learning_rate": 0.00021258511953673197, "loss": 0.016, "step": 224820 }, { "epoch": 0.58, "learning_rate": 0.00021258123132036048, "loss": 0.0147, "step": 224830 }, { "epoch": 0.58, "learning_rate": 0.00021257734310398902, "loss": 0.0138, "step": 224840 }, { "epoch": 0.58, "learning_rate": 0.0002125734548876176, "loss": 0.0187, "step": 224850 }, { "epoch": 0.58, "learning_rate": 0.0002125695666712461, "loss": 0.0173, "step": 224860 }, { "epoch": 0.58, "learning_rate": 0.00021256567845487465, "loss": 0.0188, "step": 224870 }, { "epoch": 0.58, "learning_rate": 0.00021256179023850316, "loss": 0.0164, "step": 224880 }, { "epoch": 0.58, "learning_rate": 0.00021255790202213173, "loss": 0.0108, "step": 224890 }, { "epoch": 0.58, "learning_rate": 0.00021255401380576024, "loss": 0.0145, "step": 224900 }, { "epoch": 0.58, "learning_rate": 0.00021255012558938879, "loss": 0.0195, "step": 224910 }, { "epoch": 0.58, "learning_rate": 0.0002125462373730173, "loss": 0.0159, "step": 224920 }, { "epoch": 0.58, "learning_rate": 0.00021254234915664587, "loss": 0.016, "step": 224930 }, { "epoch": 0.58, "learning_rate": 0.00021253846094027438, "loss": 0.0192, "step": 224940 }, { "epoch": 0.58, "learning_rate": 0.00021253457272390293, "loss": 0.017, "step": 224950 }, { "epoch": 0.58, "learning_rate": 0.00021253068450753144, "loss": 0.0178, "step": 224960 }, { "epoch": 0.58, "learning_rate": 0.00021252679629116, "loss": 0.0191, "step": 224970 }, { "epoch": 0.58, "learning_rate": 0.00021252290807478852, "loss": 0.0184, "step": 224980 }, { "epoch": 0.58, "learning_rate": 0.00021251901985841706, "loss": 0.0144, "step": 224990 }, { "epoch": 0.58, "learning_rate": 0.00021251513164204558, "loss": 0.0136, "step": 225000 }, { "epoch": 0.58, "eval_cer": 0.8817684692590742, "eval_loss": 0.01163857989013195, "eval_runtime": 107.3494, "eval_samples_per_second": 18.631, "eval_steps_per_second": 4.658, "step": 225000 }, { "epoch": 0.58, "learning_rate": 0.00021251124342567415, "loss": 0.0174, "step": 225010 }, { "epoch": 0.58, "learning_rate": 0.0002125073552093027, "loss": 0.0186, "step": 225020 }, { "epoch": 0.58, "learning_rate": 0.0002125034669929312, "loss": 0.0146, "step": 225030 }, { "epoch": 0.58, "learning_rate": 0.00021249957877655972, "loss": 0.0133, "step": 225040 }, { "epoch": 0.58, "learning_rate": 0.00021249569056018826, "loss": 0.0163, "step": 225050 }, { "epoch": 0.58, "learning_rate": 0.00021249180234381683, "loss": 0.0183, "step": 225060 }, { "epoch": 0.58, "learning_rate": 0.00021248791412744534, "loss": 0.0141, "step": 225070 }, { "epoch": 0.58, "learning_rate": 0.00021248402591107389, "loss": 0.0192, "step": 225080 }, { "epoch": 0.58, "learning_rate": 0.0002124801376947024, "loss": 0.0142, "step": 225090 }, { "epoch": 0.58, "learning_rate": 0.00021247624947833097, "loss": 0.0186, "step": 225100 }, { "epoch": 0.58, "learning_rate": 0.00021247236126195948, "loss": 0.0144, "step": 225110 }, { "epoch": 0.58, "learning_rate": 0.00021246847304558802, "loss": 0.0191, "step": 225120 }, { "epoch": 0.58, "learning_rate": 0.00021246458482921654, "loss": 0.0245, "step": 225130 }, { "epoch": 0.58, "learning_rate": 0.0002124606966128451, "loss": 0.0208, "step": 225140 }, { "epoch": 0.58, "learning_rate": 0.00021245680839647362, "loss": 0.0188, "step": 225150 }, { "epoch": 0.58, "learning_rate": 0.00021245292018010216, "loss": 0.0157, "step": 225160 }, { "epoch": 0.58, "learning_rate": 0.00021244903196373068, "loss": 0.0217, "step": 225170 }, { "epoch": 0.58, "learning_rate": 0.00021244514374735925, "loss": 0.0142, "step": 225180 }, { "epoch": 0.58, "learning_rate": 0.00021244125553098776, "loss": 0.0177, "step": 225190 }, { "epoch": 0.58, "learning_rate": 0.0002124373673146163, "loss": 0.0191, "step": 225200 }, { "epoch": 0.58, "learning_rate": 0.00021243347909824482, "loss": 0.0201, "step": 225210 }, { "epoch": 0.58, "learning_rate": 0.0002124295908818734, "loss": 0.0134, "step": 225220 }, { "epoch": 0.58, "learning_rate": 0.00021242570266550193, "loss": 0.0142, "step": 225230 }, { "epoch": 0.58, "learning_rate": 0.00021242181444913044, "loss": 0.0158, "step": 225240 }, { "epoch": 0.58, "learning_rate": 0.00021241792623275898, "loss": 0.018, "step": 225250 }, { "epoch": 0.58, "learning_rate": 0.00021241403801638753, "loss": 0.0182, "step": 225260 }, { "epoch": 0.58, "learning_rate": 0.00021241014980001607, "loss": 0.0146, "step": 225270 }, { "epoch": 0.58, "learning_rate": 0.00021240626158364458, "loss": 0.0174, "step": 225280 }, { "epoch": 0.58, "learning_rate": 0.00021240237336727312, "loss": 0.0163, "step": 225290 }, { "epoch": 0.58, "learning_rate": 0.00021239848515090164, "loss": 0.0137, "step": 225300 }, { "epoch": 0.58, "learning_rate": 0.0002123945969345302, "loss": 0.0152, "step": 225310 }, { "epoch": 0.58, "learning_rate": 0.00021239070871815872, "loss": 0.0132, "step": 225320 }, { "epoch": 0.58, "learning_rate": 0.00021238682050178726, "loss": 0.0157, "step": 225330 }, { "epoch": 0.58, "learning_rate": 0.00021238293228541578, "loss": 0.0182, "step": 225340 }, { "epoch": 0.58, "learning_rate": 0.00021237904406904435, "loss": 0.0158, "step": 225350 }, { "epoch": 0.58, "learning_rate": 0.00021237515585267286, "loss": 0.02, "step": 225360 }, { "epoch": 0.58, "learning_rate": 0.0002123712676363014, "loss": 0.0197, "step": 225370 }, { "epoch": 0.58, "learning_rate": 0.00021236737941992992, "loss": 0.0157, "step": 225380 }, { "epoch": 0.58, "learning_rate": 0.00021236349120355849, "loss": 0.0176, "step": 225390 }, { "epoch": 0.58, "learning_rate": 0.00021235960298718703, "loss": 0.0125, "step": 225400 }, { "epoch": 0.58, "learning_rate": 0.00021235571477081554, "loss": 0.0177, "step": 225410 }, { "epoch": 0.58, "learning_rate": 0.00021235182655444408, "loss": 0.0259, "step": 225420 }, { "epoch": 0.58, "learning_rate": 0.00021234793833807263, "loss": 0.0169, "step": 225430 }, { "epoch": 0.58, "learning_rate": 0.00021234405012170117, "loss": 0.0159, "step": 225440 }, { "epoch": 0.58, "learning_rate": 0.00021234016190532968, "loss": 0.0211, "step": 225450 }, { "epoch": 0.58, "learning_rate": 0.00021233627368895822, "loss": 0.0155, "step": 225460 }, { "epoch": 0.58, "learning_rate": 0.00021233238547258677, "loss": 0.0168, "step": 225470 }, { "epoch": 0.58, "learning_rate": 0.0002123284972562153, "loss": 0.0185, "step": 225480 }, { "epoch": 0.58, "learning_rate": 0.00021232460903984382, "loss": 0.0141, "step": 225490 }, { "epoch": 0.58, "learning_rate": 0.00021232072082347236, "loss": 0.0177, "step": 225500 }, { "epoch": 0.58, "learning_rate": 0.0002123168326071009, "loss": 0.0213, "step": 225510 }, { "epoch": 0.58, "learning_rate": 0.00021231294439072945, "loss": 0.0155, "step": 225520 }, { "epoch": 0.58, "learning_rate": 0.00021230905617435796, "loss": 0.0163, "step": 225530 }, { "epoch": 0.58, "learning_rate": 0.0002123051679579865, "loss": 0.02, "step": 225540 }, { "epoch": 0.58, "learning_rate": 0.00021230127974161502, "loss": 0.0153, "step": 225550 }, { "epoch": 0.58, "learning_rate": 0.00021229739152524359, "loss": 0.0141, "step": 225560 }, { "epoch": 0.58, "learning_rate": 0.00021229350330887213, "loss": 0.0188, "step": 225570 }, { "epoch": 0.58, "learning_rate": 0.00021228961509250064, "loss": 0.0148, "step": 225580 }, { "epoch": 0.58, "learning_rate": 0.00021228572687612916, "loss": 0.0134, "step": 225590 }, { "epoch": 0.58, "learning_rate": 0.00021228183865975773, "loss": 0.0157, "step": 225600 }, { "epoch": 0.58, "learning_rate": 0.00021227795044338627, "loss": 0.0128, "step": 225610 }, { "epoch": 0.58, "learning_rate": 0.00021227406222701478, "loss": 0.0149, "step": 225620 }, { "epoch": 0.58, "learning_rate": 0.00021227017401064332, "loss": 0.0149, "step": 225630 }, { "epoch": 0.58, "learning_rate": 0.00021226628579427186, "loss": 0.0173, "step": 225640 }, { "epoch": 0.58, "learning_rate": 0.0002122623975779004, "loss": 0.0148, "step": 225650 }, { "epoch": 0.58, "learning_rate": 0.00021225850936152892, "loss": 0.0156, "step": 225660 }, { "epoch": 0.58, "learning_rate": 0.00021225462114515746, "loss": 0.0163, "step": 225670 }, { "epoch": 0.58, "learning_rate": 0.000212250732928786, "loss": 0.0151, "step": 225680 }, { "epoch": 0.59, "learning_rate": 0.00021224684471241455, "loss": 0.0168, "step": 225690 }, { "epoch": 0.59, "learning_rate": 0.00021224295649604306, "loss": 0.0145, "step": 225700 }, { "epoch": 0.59, "learning_rate": 0.0002122390682796716, "loss": 0.0178, "step": 225710 }, { "epoch": 0.59, "learning_rate": 0.00021223518006330017, "loss": 0.0193, "step": 225720 }, { "epoch": 0.59, "learning_rate": 0.00021223129184692869, "loss": 0.0142, "step": 225730 }, { "epoch": 0.59, "learning_rate": 0.00021222740363055723, "loss": 0.0184, "step": 225740 }, { "epoch": 0.59, "learning_rate": 0.00021222351541418574, "loss": 0.0163, "step": 225750 }, { "epoch": 0.59, "learning_rate": 0.0002122196271978143, "loss": 0.0126, "step": 225760 }, { "epoch": 0.59, "learning_rate": 0.00021221573898144282, "loss": 0.0142, "step": 225770 }, { "epoch": 0.59, "learning_rate": 0.00021221185076507137, "loss": 0.0192, "step": 225780 }, { "epoch": 0.59, "learning_rate": 0.00021220796254869988, "loss": 0.018, "step": 225790 }, { "epoch": 0.59, "learning_rate": 0.00021220407433232842, "loss": 0.0152, "step": 225800 }, { "epoch": 0.59, "learning_rate": 0.00021220018611595696, "loss": 0.0168, "step": 225810 }, { "epoch": 0.59, "learning_rate": 0.0002121962978995855, "loss": 0.0182, "step": 225820 }, { "epoch": 0.59, "learning_rate": 0.00021219240968321402, "loss": 0.0179, "step": 225830 }, { "epoch": 0.59, "learning_rate": 0.00021218852146684256, "loss": 0.0142, "step": 225840 }, { "epoch": 0.59, "learning_rate": 0.0002121846332504711, "loss": 0.0151, "step": 225850 }, { "epoch": 0.59, "learning_rate": 0.00021218074503409965, "loss": 0.0146, "step": 225860 }, { "epoch": 0.59, "learning_rate": 0.00021217685681772816, "loss": 0.0197, "step": 225870 }, { "epoch": 0.59, "learning_rate": 0.0002121729686013567, "loss": 0.0161, "step": 225880 }, { "epoch": 0.59, "learning_rate": 0.00021216908038498527, "loss": 0.0204, "step": 225890 }, { "epoch": 0.59, "learning_rate": 0.00021216519216861378, "loss": 0.0177, "step": 225900 }, { "epoch": 0.59, "learning_rate": 0.0002121613039522423, "loss": 0.015, "step": 225910 }, { "epoch": 0.59, "learning_rate": 0.00021215741573587084, "loss": 0.0241, "step": 225920 }, { "epoch": 0.59, "learning_rate": 0.0002121535275194994, "loss": 0.0239, "step": 225930 }, { "epoch": 0.59, "learning_rate": 0.00021214963930312792, "loss": 0.0159, "step": 225940 }, { "epoch": 0.59, "learning_rate": 0.00021214575108675647, "loss": 0.0156, "step": 225950 }, { "epoch": 0.59, "learning_rate": 0.00021214186287038498, "loss": 0.012, "step": 225960 }, { "epoch": 0.59, "learning_rate": 0.00021213797465401355, "loss": 0.0237, "step": 225970 }, { "epoch": 0.59, "learning_rate": 0.00021213408643764206, "loss": 0.0188, "step": 225980 }, { "epoch": 0.59, "learning_rate": 0.0002121301982212706, "loss": 0.0184, "step": 225990 }, { "epoch": 0.59, "learning_rate": 0.00021212631000489912, "loss": 0.0158, "step": 226000 }, { "epoch": 0.59, "eval_cer": 0.881821655462573, "eval_loss": 0.01118859276175499, "eval_runtime": 107.4296, "eval_samples_per_second": 18.617, "eval_steps_per_second": 4.654, "step": 226000 }, { "epoch": 0.59, "learning_rate": 0.0002121224217885277, "loss": 0.0214, "step": 226010 }, { "epoch": 0.59, "learning_rate": 0.0002121185335721562, "loss": 0.0145, "step": 226020 }, { "epoch": 0.59, "learning_rate": 0.00021211464535578474, "loss": 0.0178, "step": 226030 }, { "epoch": 0.59, "learning_rate": 0.00021211075713941326, "loss": 0.0156, "step": 226040 }, { "epoch": 0.59, "learning_rate": 0.0002121068689230418, "loss": 0.013, "step": 226050 }, { "epoch": 0.59, "learning_rate": 0.00021210298070667034, "loss": 0.0163, "step": 226060 }, { "epoch": 0.59, "learning_rate": 0.00021209909249029888, "loss": 0.0157, "step": 226070 }, { "epoch": 0.59, "learning_rate": 0.0002120952042739274, "loss": 0.0165, "step": 226080 }, { "epoch": 0.59, "learning_rate": 0.00021209131605755594, "loss": 0.0164, "step": 226090 }, { "epoch": 0.59, "learning_rate": 0.0002120874278411845, "loss": 0.0149, "step": 226100 }, { "epoch": 0.59, "learning_rate": 0.00021208353962481302, "loss": 0.0149, "step": 226110 }, { "epoch": 0.59, "learning_rate": 0.00021207965140844156, "loss": 0.0157, "step": 226120 }, { "epoch": 0.59, "learning_rate": 0.00021207576319207008, "loss": 0.0134, "step": 226130 }, { "epoch": 0.59, "learning_rate": 0.00021207187497569865, "loss": 0.014, "step": 226140 }, { "epoch": 0.59, "learning_rate": 0.00021206798675932716, "loss": 0.0178, "step": 226150 }, { "epoch": 0.59, "learning_rate": 0.0002120640985429557, "loss": 0.0214, "step": 226160 }, { "epoch": 0.59, "learning_rate": 0.00021206021032658422, "loss": 0.0141, "step": 226170 }, { "epoch": 0.59, "learning_rate": 0.0002120563221102128, "loss": 0.014, "step": 226180 }, { "epoch": 0.59, "learning_rate": 0.0002120524338938413, "loss": 0.0198, "step": 226190 }, { "epoch": 0.59, "learning_rate": 0.00021204854567746984, "loss": 0.0176, "step": 226200 }, { "epoch": 0.59, "learning_rate": 0.00021204465746109836, "loss": 0.0181, "step": 226210 }, { "epoch": 0.59, "learning_rate": 0.00021204076924472693, "loss": 0.015, "step": 226220 }, { "epoch": 0.59, "learning_rate": 0.00021203688102835544, "loss": 0.0163, "step": 226230 }, { "epoch": 0.59, "learning_rate": 0.00021203299281198398, "loss": 0.0154, "step": 226240 }, { "epoch": 0.59, "learning_rate": 0.0002120291045956125, "loss": 0.0145, "step": 226250 }, { "epoch": 0.59, "learning_rate": 0.00021202521637924107, "loss": 0.0203, "step": 226260 }, { "epoch": 0.59, "learning_rate": 0.0002120213281628696, "loss": 0.0292, "step": 226270 }, { "epoch": 0.59, "learning_rate": 0.00021201743994649812, "loss": 0.0227, "step": 226280 }, { "epoch": 0.59, "learning_rate": 0.00021201355173012666, "loss": 0.0148, "step": 226290 }, { "epoch": 0.59, "learning_rate": 0.00021200966351375518, "loss": 0.02, "step": 226300 }, { "epoch": 0.59, "learning_rate": 0.00021200577529738375, "loss": 0.0181, "step": 226310 }, { "epoch": 0.59, "learning_rate": 0.00021200188708101226, "loss": 0.0165, "step": 226320 }, { "epoch": 0.59, "learning_rate": 0.0002119979988646408, "loss": 0.0153, "step": 226330 }, { "epoch": 0.59, "learning_rate": 0.00021199411064826932, "loss": 0.0141, "step": 226340 }, { "epoch": 0.59, "learning_rate": 0.0002119902224318979, "loss": 0.0167, "step": 226350 }, { "epoch": 0.59, "learning_rate": 0.0002119863342155264, "loss": 0.0187, "step": 226360 }, { "epoch": 0.59, "learning_rate": 0.00021198244599915494, "loss": 0.0157, "step": 226370 }, { "epoch": 0.59, "learning_rate": 0.00021197855778278346, "loss": 0.0164, "step": 226380 }, { "epoch": 0.59, "learning_rate": 0.00021197466956641203, "loss": 0.0158, "step": 226390 }, { "epoch": 0.59, "learning_rate": 0.00021197078135004054, "loss": 0.0183, "step": 226400 }, { "epoch": 0.59, "learning_rate": 0.00021196689313366908, "loss": 0.0178, "step": 226410 }, { "epoch": 0.59, "learning_rate": 0.0002119630049172976, "loss": 0.018, "step": 226420 }, { "epoch": 0.59, "learning_rate": 0.00021195911670092617, "loss": 0.0238, "step": 226430 }, { "epoch": 0.59, "learning_rate": 0.0002119552284845547, "loss": 0.016, "step": 226440 }, { "epoch": 0.59, "learning_rate": 0.00021195134026818322, "loss": 0.0145, "step": 226450 }, { "epoch": 0.59, "learning_rate": 0.00021194745205181176, "loss": 0.0176, "step": 226460 }, { "epoch": 0.59, "learning_rate": 0.0002119435638354403, "loss": 0.0123, "step": 226470 }, { "epoch": 0.59, "learning_rate": 0.00021193967561906885, "loss": 0.0136, "step": 226480 }, { "epoch": 0.59, "learning_rate": 0.00021193578740269736, "loss": 0.0191, "step": 226490 }, { "epoch": 0.59, "learning_rate": 0.0002119318991863259, "loss": 0.0149, "step": 226500 }, { "epoch": 0.59, "learning_rate": 0.00021192801096995444, "loss": 0.0169, "step": 226510 }, { "epoch": 0.59, "learning_rate": 0.000211924122753583, "loss": 0.0111, "step": 226520 }, { "epoch": 0.59, "learning_rate": 0.0002119202345372115, "loss": 0.0153, "step": 226530 }, { "epoch": 0.59, "learning_rate": 0.00021191634632084004, "loss": 0.016, "step": 226540 }, { "epoch": 0.59, "learning_rate": 0.00021191245810446856, "loss": 0.0151, "step": 226550 }, { "epoch": 0.59, "learning_rate": 0.00021190856988809713, "loss": 0.0168, "step": 226560 }, { "epoch": 0.59, "learning_rate": 0.00021190468167172564, "loss": 0.013, "step": 226570 }, { "epoch": 0.59, "learning_rate": 0.00021190079345535418, "loss": 0.0172, "step": 226580 }, { "epoch": 0.59, "learning_rate": 0.0002118969052389827, "loss": 0.0164, "step": 226590 }, { "epoch": 0.59, "learning_rate": 0.00021189301702261127, "loss": 0.0166, "step": 226600 }, { "epoch": 0.59, "learning_rate": 0.0002118891288062398, "loss": 0.0141, "step": 226610 }, { "epoch": 0.59, "learning_rate": 0.00021188524058986832, "loss": 0.0132, "step": 226620 }, { "epoch": 0.59, "learning_rate": 0.00021188135237349684, "loss": 0.0159, "step": 226630 }, { "epoch": 0.59, "learning_rate": 0.0002118774641571254, "loss": 0.02, "step": 226640 }, { "epoch": 0.59, "learning_rate": 0.00021187357594075395, "loss": 0.0134, "step": 226650 }, { "epoch": 0.59, "learning_rate": 0.00021186968772438246, "loss": 0.018, "step": 226660 }, { "epoch": 0.59, "learning_rate": 0.000211865799508011, "loss": 0.021, "step": 226670 }, { "epoch": 0.59, "learning_rate": 0.00021186191129163954, "loss": 0.0145, "step": 226680 }, { "epoch": 0.59, "learning_rate": 0.00021185802307526809, "loss": 0.0165, "step": 226690 }, { "epoch": 0.59, "learning_rate": 0.0002118541348588966, "loss": 0.016, "step": 226700 }, { "epoch": 0.59, "learning_rate": 0.00021185024664252514, "loss": 0.0177, "step": 226710 }, { "epoch": 0.59, "learning_rate": 0.00021184635842615368, "loss": 0.0167, "step": 226720 }, { "epoch": 0.59, "learning_rate": 0.00021184247020978223, "loss": 0.0169, "step": 226730 }, { "epoch": 0.59, "learning_rate": 0.00021183858199341074, "loss": 0.0134, "step": 226740 }, { "epoch": 0.59, "learning_rate": 0.00021183469377703928, "loss": 0.0157, "step": 226750 }, { "epoch": 0.59, "learning_rate": 0.00021183080556066785, "loss": 0.0203, "step": 226760 }, { "epoch": 0.59, "learning_rate": 0.00021182691734429636, "loss": 0.0136, "step": 226770 }, { "epoch": 0.59, "learning_rate": 0.00021182302912792488, "loss": 0.0204, "step": 226780 }, { "epoch": 0.59, "learning_rate": 0.00021181914091155342, "loss": 0.0129, "step": 226790 }, { "epoch": 0.59, "learning_rate": 0.00021181525269518194, "loss": 0.0184, "step": 226800 }, { "epoch": 0.59, "learning_rate": 0.0002118113644788105, "loss": 0.015, "step": 226810 }, { "epoch": 0.59, "learning_rate": 0.00021180747626243905, "loss": 0.0153, "step": 226820 }, { "epoch": 0.59, "learning_rate": 0.00021180358804606756, "loss": 0.0147, "step": 226830 }, { "epoch": 0.59, "learning_rate": 0.0002117996998296961, "loss": 0.0159, "step": 226840 }, { "epoch": 0.59, "learning_rate": 0.00021179581161332464, "loss": 0.0151, "step": 226850 }, { "epoch": 0.59, "learning_rate": 0.00021179192339695319, "loss": 0.0178, "step": 226860 }, { "epoch": 0.59, "learning_rate": 0.0002117880351805817, "loss": 0.0176, "step": 226870 }, { "epoch": 0.59, "learning_rate": 0.00021178414696421024, "loss": 0.0225, "step": 226880 }, { "epoch": 0.59, "learning_rate": 0.00021178025874783878, "loss": 0.0137, "step": 226890 }, { "epoch": 0.59, "learning_rate": 0.00021177637053146732, "loss": 0.0204, "step": 226900 }, { "epoch": 0.59, "learning_rate": 0.00021177248231509584, "loss": 0.0175, "step": 226910 }, { "epoch": 0.59, "learning_rate": 0.00021176859409872438, "loss": 0.0201, "step": 226920 }, { "epoch": 0.59, "learning_rate": 0.00021176470588235295, "loss": 0.0173, "step": 226930 }, { "epoch": 0.59, "learning_rate": 0.00021176081766598146, "loss": 0.0164, "step": 226940 }, { "epoch": 0.59, "learning_rate": 0.00021175692944960998, "loss": 0.0161, "step": 226950 }, { "epoch": 0.59, "learning_rate": 0.00021175304123323852, "loss": 0.0164, "step": 226960 }, { "epoch": 0.59, "learning_rate": 0.0002117491530168671, "loss": 0.0198, "step": 226970 }, { "epoch": 0.59, "learning_rate": 0.0002117452648004956, "loss": 0.0211, "step": 226980 }, { "epoch": 0.59, "learning_rate": 0.00021174137658412415, "loss": 0.0149, "step": 226990 }, { "epoch": 0.59, "learning_rate": 0.00021173748836775266, "loss": 0.0163, "step": 227000 }, { "epoch": 0.59, "eval_cer": 0.8817964619977577, "eval_loss": 0.011157948523759842, "eval_runtime": 107.4259, "eval_samples_per_second": 18.617, "eval_steps_per_second": 4.654, "step": 227000 }, { "epoch": 0.59, "learning_rate": 0.00021173360015138123, "loss": 0.0156, "step": 227010 }, { "epoch": 0.59, "learning_rate": 0.00021172971193500974, "loss": 0.0143, "step": 227020 }, { "epoch": 0.59, "learning_rate": 0.00021172582371863828, "loss": 0.0142, "step": 227030 }, { "epoch": 0.59, "learning_rate": 0.0002117219355022668, "loss": 0.0143, "step": 227040 }, { "epoch": 0.59, "learning_rate": 0.00021171804728589534, "loss": 0.0182, "step": 227050 }, { "epoch": 0.59, "learning_rate": 0.00021171415906952388, "loss": 0.0156, "step": 227060 }, { "epoch": 0.59, "learning_rate": 0.00021171027085315242, "loss": 0.0184, "step": 227070 }, { "epoch": 0.59, "learning_rate": 0.00021170638263678094, "loss": 0.0165, "step": 227080 }, { "epoch": 0.59, "learning_rate": 0.00021170249442040948, "loss": 0.0149, "step": 227090 }, { "epoch": 0.59, "learning_rate": 0.00021169860620403802, "loss": 0.0135, "step": 227100 }, { "epoch": 0.59, "learning_rate": 0.00021169471798766656, "loss": 0.0147, "step": 227110 }, { "epoch": 0.59, "learning_rate": 0.00021169082977129508, "loss": 0.0169, "step": 227120 }, { "epoch": 0.59, "learning_rate": 0.00021168694155492362, "loss": 0.0152, "step": 227130 }, { "epoch": 0.59, "learning_rate": 0.0002116830533385522, "loss": 0.0165, "step": 227140 }, { "epoch": 0.59, "learning_rate": 0.0002116791651221807, "loss": 0.0145, "step": 227150 }, { "epoch": 0.59, "learning_rate": 0.00021167527690580924, "loss": 0.0152, "step": 227160 }, { "epoch": 0.59, "learning_rate": 0.00021167138868943776, "loss": 0.0171, "step": 227170 }, { "epoch": 0.59, "learning_rate": 0.00021166750047306633, "loss": 0.0199, "step": 227180 }, { "epoch": 0.59, "learning_rate": 0.00021166361225669484, "loss": 0.0168, "step": 227190 }, { "epoch": 0.59, "learning_rate": 0.00021165972404032338, "loss": 0.0141, "step": 227200 }, { "epoch": 0.59, "learning_rate": 0.0002116558358239519, "loss": 0.0135, "step": 227210 }, { "epoch": 0.59, "learning_rate": 0.00021165194760758047, "loss": 0.0165, "step": 227220 }, { "epoch": 0.59, "learning_rate": 0.00021164805939120898, "loss": 0.0176, "step": 227230 }, { "epoch": 0.59, "learning_rate": 0.00021164417117483752, "loss": 0.0176, "step": 227240 }, { "epoch": 0.59, "learning_rate": 0.00021164028295846604, "loss": 0.0134, "step": 227250 }, { "epoch": 0.59, "learning_rate": 0.0002116363947420946, "loss": 0.0201, "step": 227260 }, { "epoch": 0.59, "learning_rate": 0.00021163250652572312, "loss": 0.0146, "step": 227270 }, { "epoch": 0.59, "learning_rate": 0.00021162861830935166, "loss": 0.0176, "step": 227280 }, { "epoch": 0.59, "learning_rate": 0.00021162473009298018, "loss": 0.0153, "step": 227290 }, { "epoch": 0.59, "learning_rate": 0.00021162084187660872, "loss": 0.0124, "step": 227300 }, { "epoch": 0.59, "learning_rate": 0.0002116169536602373, "loss": 0.0146, "step": 227310 }, { "epoch": 0.59, "learning_rate": 0.0002116130654438658, "loss": 0.0163, "step": 227320 }, { "epoch": 0.59, "learning_rate": 0.00021160917722749434, "loss": 0.0167, "step": 227330 }, { "epoch": 0.59, "learning_rate": 0.00021160528901112286, "loss": 0.0146, "step": 227340 }, { "epoch": 0.59, "learning_rate": 0.00021160140079475143, "loss": 0.0179, "step": 227350 }, { "epoch": 0.59, "learning_rate": 0.00021159751257837994, "loss": 0.0146, "step": 227360 }, { "epoch": 0.59, "learning_rate": 0.00021159362436200848, "loss": 0.0146, "step": 227370 }, { "epoch": 0.59, "learning_rate": 0.000211589736145637, "loss": 0.0168, "step": 227380 }, { "epoch": 0.59, "learning_rate": 0.00021158584792926557, "loss": 0.0153, "step": 227390 }, { "epoch": 0.59, "learning_rate": 0.00021158195971289408, "loss": 0.0199, "step": 227400 }, { "epoch": 0.59, "learning_rate": 0.00021157807149652262, "loss": 0.0155, "step": 227410 }, { "epoch": 0.59, "learning_rate": 0.00021157418328015114, "loss": 0.0162, "step": 227420 }, { "epoch": 0.59, "learning_rate": 0.0002115702950637797, "loss": 0.0142, "step": 227430 }, { "epoch": 0.59, "learning_rate": 0.00021156640684740822, "loss": 0.02, "step": 227440 }, { "epoch": 0.59, "learning_rate": 0.00021156251863103676, "loss": 0.0164, "step": 227450 }, { "epoch": 0.59, "learning_rate": 0.00021155863041466528, "loss": 0.0134, "step": 227460 }, { "epoch": 0.59, "learning_rate": 0.00021155474219829385, "loss": 0.0125, "step": 227470 }, { "epoch": 0.59, "learning_rate": 0.0002115508539819224, "loss": 0.0188, "step": 227480 }, { "epoch": 0.59, "learning_rate": 0.0002115469657655509, "loss": 0.0131, "step": 227490 }, { "epoch": 0.59, "learning_rate": 0.00021154307754917942, "loss": 0.0183, "step": 227500 }, { "epoch": 0.59, "learning_rate": 0.00021153918933280799, "loss": 0.0157, "step": 227510 }, { "epoch": 0.59, "learning_rate": 0.00021153530111643653, "loss": 0.0136, "step": 227520 }, { "epoch": 0.59, "learning_rate": 0.00021153141290006504, "loss": 0.0274, "step": 227530 }, { "epoch": 0.59, "learning_rate": 0.00021152752468369358, "loss": 0.0154, "step": 227540 }, { "epoch": 0.59, "learning_rate": 0.0002115236364673221, "loss": 0.0177, "step": 227550 }, { "epoch": 0.59, "learning_rate": 0.00021151974825095067, "loss": 0.0154, "step": 227560 }, { "epoch": 0.59, "learning_rate": 0.00021151586003457918, "loss": 0.0115, "step": 227570 }, { "epoch": 0.59, "learning_rate": 0.00021151197181820772, "loss": 0.0156, "step": 227580 }, { "epoch": 0.59, "learning_rate": 0.00021150808360183624, "loss": 0.0174, "step": 227590 }, { "epoch": 0.59, "learning_rate": 0.0002115041953854648, "loss": 0.0174, "step": 227600 }, { "epoch": 0.59, "learning_rate": 0.00021150030716909332, "loss": 0.0197, "step": 227610 }, { "epoch": 0.59, "learning_rate": 0.00021149641895272186, "loss": 0.0173, "step": 227620 }, { "epoch": 0.59, "learning_rate": 0.00021149253073635038, "loss": 0.0152, "step": 227630 }, { "epoch": 0.59, "learning_rate": 0.00021148864251997895, "loss": 0.0199, "step": 227640 }, { "epoch": 0.59, "learning_rate": 0.00021148475430360746, "loss": 0.0133, "step": 227650 }, { "epoch": 0.59, "learning_rate": 0.000211480866087236, "loss": 0.0142, "step": 227660 }, { "epoch": 0.59, "learning_rate": 0.00021147697787086452, "loss": 0.0117, "step": 227670 }, { "epoch": 0.59, "learning_rate": 0.00021147308965449308, "loss": 0.0177, "step": 227680 }, { "epoch": 0.59, "learning_rate": 0.00021146920143812163, "loss": 0.0141, "step": 227690 }, { "epoch": 0.59, "learning_rate": 0.00021146531322175014, "loss": 0.0155, "step": 227700 }, { "epoch": 0.59, "learning_rate": 0.00021146142500537868, "loss": 0.0201, "step": 227710 }, { "epoch": 0.59, "learning_rate": 0.00021145753678900722, "loss": 0.0142, "step": 227720 }, { "epoch": 0.59, "learning_rate": 0.00021145364857263577, "loss": 0.0135, "step": 227730 }, { "epoch": 0.59, "learning_rate": 0.00021144976035626428, "loss": 0.0136, "step": 227740 }, { "epoch": 0.59, "learning_rate": 0.00021144587213989282, "loss": 0.0158, "step": 227750 }, { "epoch": 0.59, "learning_rate": 0.00021144198392352136, "loss": 0.0176, "step": 227760 }, { "epoch": 0.59, "learning_rate": 0.0002114380957071499, "loss": 0.0167, "step": 227770 }, { "epoch": 0.59, "learning_rate": 0.00021143420749077842, "loss": 0.0147, "step": 227780 }, { "epoch": 0.59, "learning_rate": 0.00021143031927440696, "loss": 0.0136, "step": 227790 }, { "epoch": 0.59, "learning_rate": 0.00021142643105803548, "loss": 0.0148, "step": 227800 }, { "epoch": 0.59, "learning_rate": 0.00021142254284166404, "loss": 0.0142, "step": 227810 }, { "epoch": 0.59, "learning_rate": 0.00021141865462529256, "loss": 0.0166, "step": 227820 }, { "epoch": 0.59, "learning_rate": 0.0002114147664089211, "loss": 0.0132, "step": 227830 }, { "epoch": 0.59, "learning_rate": 0.00021141087819254962, "loss": 0.0153, "step": 227840 }, { "epoch": 0.59, "learning_rate": 0.00021140698997617818, "loss": 0.0165, "step": 227850 }, { "epoch": 0.59, "learning_rate": 0.00021140310175980673, "loss": 0.0171, "step": 227860 }, { "epoch": 0.59, "learning_rate": 0.00021139921354343524, "loss": 0.017, "step": 227870 }, { "epoch": 0.59, "learning_rate": 0.00021139532532706378, "loss": 0.0151, "step": 227880 }, { "epoch": 0.59, "learning_rate": 0.00021139143711069232, "loss": 0.015, "step": 227890 }, { "epoch": 0.59, "learning_rate": 0.00021138754889432087, "loss": 0.0125, "step": 227900 }, { "epoch": 0.59, "learning_rate": 0.00021138366067794938, "loss": 0.0138, "step": 227910 }, { "epoch": 0.59, "learning_rate": 0.00021137977246157792, "loss": 0.0154, "step": 227920 }, { "epoch": 0.59, "learning_rate": 0.00021137588424520646, "loss": 0.0159, "step": 227930 }, { "epoch": 0.59, "learning_rate": 0.000211371996028835, "loss": 0.0154, "step": 227940 }, { "epoch": 0.59, "learning_rate": 0.00021136810781246352, "loss": 0.0166, "step": 227950 }, { "epoch": 0.59, "learning_rate": 0.00021136421959609206, "loss": 0.0177, "step": 227960 }, { "epoch": 0.59, "learning_rate": 0.0002113603313797206, "loss": 0.0145, "step": 227970 }, { "epoch": 0.59, "learning_rate": 0.00021135644316334914, "loss": 0.0181, "step": 227980 }, { "epoch": 0.59, "learning_rate": 0.00021135255494697766, "loss": 0.019, "step": 227990 }, { "epoch": 0.59, "learning_rate": 0.0002113486667306062, "loss": 0.015, "step": 228000 }, { "epoch": 0.59, "eval_cer": 0.8818006609085604, "eval_loss": 0.011607250198721886, "eval_runtime": 107.2928, "eval_samples_per_second": 18.641, "eval_steps_per_second": 4.66, "step": 228000 }, { "epoch": 0.59, "learning_rate": 0.00021134477851423471, "loss": 0.0233, "step": 228010 }, { "epoch": 0.59, "learning_rate": 0.00021134089029786328, "loss": 0.0157, "step": 228020 }, { "epoch": 0.59, "learning_rate": 0.00021133700208149183, "loss": 0.0207, "step": 228030 }, { "epoch": 0.59, "learning_rate": 0.00021133311386512034, "loss": 0.0184, "step": 228040 }, { "epoch": 0.59, "learning_rate": 0.00021132922564874885, "loss": 0.0155, "step": 228050 }, { "epoch": 0.59, "learning_rate": 0.00021132533743237742, "loss": 0.0172, "step": 228060 }, { "epoch": 0.59, "learning_rate": 0.00021132144921600596, "loss": 0.0148, "step": 228070 }, { "epoch": 0.59, "learning_rate": 0.00021131756099963448, "loss": 0.0179, "step": 228080 }, { "epoch": 0.59, "learning_rate": 0.00021131367278326302, "loss": 0.0176, "step": 228090 }, { "epoch": 0.59, "learning_rate": 0.00021130978456689156, "loss": 0.0151, "step": 228100 }, { "epoch": 0.59, "learning_rate": 0.0002113058963505201, "loss": 0.0191, "step": 228110 }, { "epoch": 0.59, "learning_rate": 0.00021130200813414862, "loss": 0.0152, "step": 228120 }, { "epoch": 0.59, "learning_rate": 0.00021129811991777716, "loss": 0.0171, "step": 228130 }, { "epoch": 0.59, "learning_rate": 0.0002112942317014057, "loss": 0.0146, "step": 228140 }, { "epoch": 0.59, "learning_rate": 0.00021129034348503424, "loss": 0.0153, "step": 228150 }, { "epoch": 0.59, "learning_rate": 0.00021128645526866276, "loss": 0.0171, "step": 228160 }, { "epoch": 0.59, "learning_rate": 0.0002112825670522913, "loss": 0.0163, "step": 228170 }, { "epoch": 0.59, "learning_rate": 0.00021127867883591987, "loss": 0.0207, "step": 228180 }, { "epoch": 0.59, "learning_rate": 0.00021127479061954838, "loss": 0.016, "step": 228190 }, { "epoch": 0.59, "learning_rate": 0.00021127090240317692, "loss": 0.0169, "step": 228200 }, { "epoch": 0.59, "learning_rate": 0.00021126701418680544, "loss": 0.0145, "step": 228210 }, { "epoch": 0.59, "learning_rate": 0.000211263125970434, "loss": 0.0205, "step": 228220 }, { "epoch": 0.59, "learning_rate": 0.00021125923775406252, "loss": 0.016, "step": 228230 }, { "epoch": 0.59, "learning_rate": 0.00021125534953769106, "loss": 0.017, "step": 228240 }, { "epoch": 0.59, "learning_rate": 0.00021125146132131958, "loss": 0.0139, "step": 228250 }, { "epoch": 0.59, "learning_rate": 0.00021124757310494812, "loss": 0.0147, "step": 228260 }, { "epoch": 0.59, "learning_rate": 0.00021124368488857666, "loss": 0.0151, "step": 228270 }, { "epoch": 0.59, "learning_rate": 0.0002112397966722052, "loss": 0.0198, "step": 228280 }, { "epoch": 0.59, "learning_rate": 0.00021123590845583372, "loss": 0.0159, "step": 228290 }, { "epoch": 0.59, "learning_rate": 0.00021123202023946226, "loss": 0.0183, "step": 228300 }, { "epoch": 0.59, "learning_rate": 0.0002112281320230908, "loss": 0.0178, "step": 228310 }, { "epoch": 0.59, "learning_rate": 0.00021122424380671934, "loss": 0.0176, "step": 228320 }, { "epoch": 0.59, "learning_rate": 0.00021122035559034786, "loss": 0.0162, "step": 228330 }, { "epoch": 0.59, "learning_rate": 0.0002112164673739764, "loss": 0.0166, "step": 228340 }, { "epoch": 0.59, "learning_rate": 0.00021121257915760497, "loss": 0.0225, "step": 228350 }, { "epoch": 0.59, "learning_rate": 0.00021120869094123348, "loss": 0.0156, "step": 228360 }, { "epoch": 0.59, "learning_rate": 0.000211204802724862, "loss": 0.0176, "step": 228370 }, { "epoch": 0.59, "learning_rate": 0.00021120091450849054, "loss": 0.0129, "step": 228380 }, { "epoch": 0.59, "learning_rate": 0.0002111970262921191, "loss": 0.0171, "step": 228390 }, { "epoch": 0.59, "learning_rate": 0.00021119313807574762, "loss": 0.0189, "step": 228400 }, { "epoch": 0.59, "learning_rate": 0.00021118924985937616, "loss": 0.0121, "step": 228410 }, { "epoch": 0.59, "learning_rate": 0.00021118536164300468, "loss": 0.0134, "step": 228420 }, { "epoch": 0.59, "learning_rate": 0.00021118147342663325, "loss": 0.015, "step": 228430 }, { "epoch": 0.59, "learning_rate": 0.00021117758521026176, "loss": 0.0159, "step": 228440 }, { "epoch": 0.59, "learning_rate": 0.0002111736969938903, "loss": 0.0157, "step": 228450 }, { "epoch": 0.59, "learning_rate": 0.00021116980877751882, "loss": 0.015, "step": 228460 }, { "epoch": 0.59, "learning_rate": 0.00021116592056114739, "loss": 0.0129, "step": 228470 }, { "epoch": 0.59, "learning_rate": 0.0002111620323447759, "loss": 0.0161, "step": 228480 }, { "epoch": 0.59, "learning_rate": 0.00021115814412840444, "loss": 0.0151, "step": 228490 }, { "epoch": 0.59, "learning_rate": 0.00021115425591203296, "loss": 0.02, "step": 228500 }, { "epoch": 0.59, "learning_rate": 0.0002111503676956615, "loss": 0.0153, "step": 228510 }, { "epoch": 0.59, "learning_rate": 0.00021114647947929007, "loss": 0.0161, "step": 228520 }, { "epoch": 0.59, "learning_rate": 0.00021114259126291858, "loss": 0.0162, "step": 228530 }, { "epoch": 0.59, "learning_rate": 0.0002111387030465471, "loss": 0.0176, "step": 228540 }, { "epoch": 0.59, "learning_rate": 0.00021113481483017564, "loss": 0.0205, "step": 228550 }, { "epoch": 0.59, "learning_rate": 0.0002111309266138042, "loss": 0.0143, "step": 228560 }, { "epoch": 0.59, "learning_rate": 0.00021112703839743272, "loss": 0.0142, "step": 228570 }, { "epoch": 0.59, "learning_rate": 0.00021112315018106126, "loss": 0.014, "step": 228580 }, { "epoch": 0.59, "learning_rate": 0.00021111926196468978, "loss": 0.0158, "step": 228590 }, { "epoch": 0.59, "learning_rate": 0.00021111537374831835, "loss": 0.0159, "step": 228600 }, { "epoch": 0.59, "learning_rate": 0.00021111148553194686, "loss": 0.0113, "step": 228610 }, { "epoch": 0.59, "learning_rate": 0.0002111075973155754, "loss": 0.015, "step": 228620 }, { "epoch": 0.59, "learning_rate": 0.00021110370909920392, "loss": 0.0181, "step": 228630 }, { "epoch": 0.59, "learning_rate": 0.00021109982088283249, "loss": 0.0142, "step": 228640 }, { "epoch": 0.59, "learning_rate": 0.000211095932666461, "loss": 0.0143, "step": 228650 }, { "epoch": 0.59, "learning_rate": 0.00021109204445008954, "loss": 0.0212, "step": 228660 }, { "epoch": 0.59, "learning_rate": 0.00021108815623371806, "loss": 0.0176, "step": 228670 }, { "epoch": 0.59, "learning_rate": 0.00021108426801734663, "loss": 0.0176, "step": 228680 }, { "epoch": 0.59, "learning_rate": 0.00021108037980097514, "loss": 0.0174, "step": 228690 }, { "epoch": 0.59, "learning_rate": 0.00021107649158460368, "loss": 0.0165, "step": 228700 }, { "epoch": 0.59, "learning_rate": 0.0002110726033682322, "loss": 0.0166, "step": 228710 }, { "epoch": 0.59, "learning_rate": 0.00021106871515186076, "loss": 0.0225, "step": 228720 }, { "epoch": 0.59, "learning_rate": 0.0002110648269354893, "loss": 0.0146, "step": 228730 }, { "epoch": 0.59, "learning_rate": 0.00021106093871911782, "loss": 0.0175, "step": 228740 }, { "epoch": 0.59, "learning_rate": 0.00021105705050274636, "loss": 0.0161, "step": 228750 }, { "epoch": 0.59, "learning_rate": 0.00021105316228637488, "loss": 0.014, "step": 228760 }, { "epoch": 0.59, "learning_rate": 0.00021104927407000345, "loss": 0.0192, "step": 228770 }, { "epoch": 0.59, "learning_rate": 0.00021104538585363196, "loss": 0.0134, "step": 228780 }, { "epoch": 0.59, "learning_rate": 0.0002110414976372605, "loss": 0.0155, "step": 228790 }, { "epoch": 0.59, "learning_rate": 0.00021103760942088902, "loss": 0.0209, "step": 228800 }, { "epoch": 0.59, "learning_rate": 0.00021103372120451759, "loss": 0.0188, "step": 228810 }, { "epoch": 0.59, "learning_rate": 0.0002110298329881461, "loss": 0.0176, "step": 228820 }, { "epoch": 0.59, "learning_rate": 0.00021102594477177464, "loss": 0.0153, "step": 228830 }, { "epoch": 0.59, "learning_rate": 0.00021102205655540316, "loss": 0.0163, "step": 228840 }, { "epoch": 0.59, "learning_rate": 0.00021101816833903172, "loss": 0.0202, "step": 228850 }, { "epoch": 0.59, "learning_rate": 0.00021101428012266024, "loss": 0.0137, "step": 228860 }, { "epoch": 0.59, "learning_rate": 0.00021101039190628878, "loss": 0.016, "step": 228870 }, { "epoch": 0.59, "learning_rate": 0.0002110065036899173, "loss": 0.0159, "step": 228880 }, { "epoch": 0.59, "learning_rate": 0.00021100261547354586, "loss": 0.0156, "step": 228890 }, { "epoch": 0.59, "learning_rate": 0.0002109987272571744, "loss": 0.0161, "step": 228900 }, { "epoch": 0.59, "learning_rate": 0.00021099483904080292, "loss": 0.0146, "step": 228910 }, { "epoch": 0.59, "learning_rate": 0.00021099095082443146, "loss": 0.0124, "step": 228920 }, { "epoch": 0.59, "learning_rate": 0.00021098706260806, "loss": 0.015, "step": 228930 }, { "epoch": 0.59, "learning_rate": 0.00021098317439168854, "loss": 0.0182, "step": 228940 }, { "epoch": 0.59, "learning_rate": 0.00021097928617531706, "loss": 0.0137, "step": 228950 }, { "epoch": 0.59, "learning_rate": 0.0002109753979589456, "loss": 0.0238, "step": 228960 }, { "epoch": 0.59, "learning_rate": 0.00021097150974257414, "loss": 0.0203, "step": 228970 }, { "epoch": 0.59, "learning_rate": 0.00021096762152620268, "loss": 0.0172, "step": 228980 }, { "epoch": 0.59, "learning_rate": 0.0002109637333098312, "loss": 0.0136, "step": 228990 }, { "epoch": 0.59, "learning_rate": 0.00021095984509345974, "loss": 0.0171, "step": 229000 }, { "epoch": 0.59, "eval_cer": 0.8817838652653501, "eval_loss": 0.011135715059936047, "eval_runtime": 107.4098, "eval_samples_per_second": 18.62, "eval_steps_per_second": 4.655, "step": 229000 }, { "epoch": 0.59, "learning_rate": 0.00021095595687708826, "loss": 0.0183, "step": 229010 }, { "epoch": 0.59, "learning_rate": 0.00021095206866071682, "loss": 0.0166, "step": 229020 }, { "epoch": 0.59, "learning_rate": 0.00021094818044434534, "loss": 0.0164, "step": 229030 }, { "epoch": 0.59, "learning_rate": 0.00021094429222797388, "loss": 0.0171, "step": 229040 }, { "epoch": 0.59, "learning_rate": 0.0002109404040116024, "loss": 0.0128, "step": 229050 }, { "epoch": 0.59, "learning_rate": 0.00021093651579523096, "loss": 0.0175, "step": 229060 }, { "epoch": 0.59, "learning_rate": 0.0002109326275788595, "loss": 0.0183, "step": 229070 }, { "epoch": 0.59, "learning_rate": 0.00021092873936248802, "loss": 0.0165, "step": 229080 }, { "epoch": 0.59, "learning_rate": 0.00021092485114611653, "loss": 0.0143, "step": 229090 }, { "epoch": 0.59, "learning_rate": 0.0002109209629297451, "loss": 0.0138, "step": 229100 }, { "epoch": 0.59, "learning_rate": 0.00021091707471337364, "loss": 0.0137, "step": 229110 }, { "epoch": 0.59, "learning_rate": 0.00021091318649700216, "loss": 0.0123, "step": 229120 }, { "epoch": 0.59, "learning_rate": 0.0002109092982806307, "loss": 0.0145, "step": 229130 }, { "epoch": 0.59, "learning_rate": 0.00021090541006425924, "loss": 0.0162, "step": 229140 }, { "epoch": 0.59, "learning_rate": 0.00021090152184788778, "loss": 0.0162, "step": 229150 }, { "epoch": 0.59, "learning_rate": 0.0002108976336315163, "loss": 0.0177, "step": 229160 }, { "epoch": 0.59, "learning_rate": 0.00021089374541514484, "loss": 0.0146, "step": 229170 }, { "epoch": 0.59, "learning_rate": 0.00021088985719877338, "loss": 0.0152, "step": 229180 }, { "epoch": 0.59, "learning_rate": 0.00021088596898240192, "loss": 0.0182, "step": 229190 }, { "epoch": 0.59, "learning_rate": 0.00021088208076603044, "loss": 0.0145, "step": 229200 }, { "epoch": 0.59, "learning_rate": 0.00021087819254965898, "loss": 0.0153, "step": 229210 }, { "epoch": 0.59, "learning_rate": 0.00021087430433328755, "loss": 0.0165, "step": 229220 }, { "epoch": 0.59, "learning_rate": 0.00021087041611691606, "loss": 0.0169, "step": 229230 }, { "epoch": 0.59, "learning_rate": 0.00021086652790054458, "loss": 0.0157, "step": 229240 }, { "epoch": 0.59, "learning_rate": 0.00021086263968417312, "loss": 0.0147, "step": 229250 }, { "epoch": 0.59, "learning_rate": 0.00021085875146780163, "loss": 0.0155, "step": 229260 }, { "epoch": 0.59, "learning_rate": 0.0002108548632514302, "loss": 0.015, "step": 229270 }, { "epoch": 0.59, "learning_rate": 0.00021085097503505874, "loss": 0.0182, "step": 229280 }, { "epoch": 0.59, "learning_rate": 0.00021084708681868726, "loss": 0.0208, "step": 229290 }, { "epoch": 0.59, "learning_rate": 0.0002108431986023158, "loss": 0.0184, "step": 229300 }, { "epoch": 0.59, "learning_rate": 0.00021083931038594434, "loss": 0.0171, "step": 229310 }, { "epoch": 0.59, "learning_rate": 0.00021083542216957288, "loss": 0.0189, "step": 229320 }, { "epoch": 0.59, "learning_rate": 0.0002108315339532014, "loss": 0.014, "step": 229330 }, { "epoch": 0.59, "learning_rate": 0.00021082764573682994, "loss": 0.0202, "step": 229340 }, { "epoch": 0.59, "learning_rate": 0.00021082375752045848, "loss": 0.0188, "step": 229350 }, { "epoch": 0.59, "learning_rate": 0.00021081986930408702, "loss": 0.022, "step": 229360 }, { "epoch": 0.59, "learning_rate": 0.00021081598108771554, "loss": 0.0143, "step": 229370 }, { "epoch": 0.59, "learning_rate": 0.00021081209287134408, "loss": 0.0175, "step": 229380 }, { "epoch": 0.59, "learning_rate": 0.00021080820465497265, "loss": 0.0165, "step": 229390 }, { "epoch": 0.59, "learning_rate": 0.00021080431643860116, "loss": 0.0136, "step": 229400 }, { "epoch": 0.59, "learning_rate": 0.00021080042822222968, "loss": 0.0139, "step": 229410 }, { "epoch": 0.59, "learning_rate": 0.00021079654000585822, "loss": 0.0135, "step": 229420 }, { "epoch": 0.59, "learning_rate": 0.0002107926517894868, "loss": 0.0159, "step": 229430 }, { "epoch": 0.59, "learning_rate": 0.0002107887635731153, "loss": 0.0178, "step": 229440 }, { "epoch": 0.59, "learning_rate": 0.00021078487535674384, "loss": 0.0184, "step": 229450 }, { "epoch": 0.59, "learning_rate": 0.00021078098714037236, "loss": 0.0186, "step": 229460 }, { "epoch": 0.59, "learning_rate": 0.00021077709892400093, "loss": 0.0166, "step": 229470 }, { "epoch": 0.59, "learning_rate": 0.00021077321070762944, "loss": 0.017, "step": 229480 }, { "epoch": 0.59, "learning_rate": 0.00021076932249125798, "loss": 0.0162, "step": 229490 }, { "epoch": 0.59, "learning_rate": 0.0002107654342748865, "loss": 0.0146, "step": 229500 }, { "epoch": 0.59, "learning_rate": 0.00021076154605851504, "loss": 0.0153, "step": 229510 }, { "epoch": 0.59, "learning_rate": 0.00021075765784214358, "loss": 0.0196, "step": 229520 }, { "epoch": 0.59, "learning_rate": 0.00021075376962577212, "loss": 0.0157, "step": 229530 }, { "epoch": 0.6, "learning_rate": 0.00021074988140940064, "loss": 0.019, "step": 229540 }, { "epoch": 0.6, "learning_rate": 0.00021074599319302918, "loss": 0.0152, "step": 229550 }, { "epoch": 0.6, "learning_rate": 0.00021074210497665772, "loss": 0.0134, "step": 229560 }, { "epoch": 0.6, "learning_rate": 0.00021073821676028626, "loss": 0.015, "step": 229570 }, { "epoch": 0.6, "learning_rate": 0.00021073432854391478, "loss": 0.0148, "step": 229580 }, { "epoch": 0.6, "learning_rate": 0.00021073044032754332, "loss": 0.0167, "step": 229590 }, { "epoch": 0.6, "learning_rate": 0.0002107265521111719, "loss": 0.0144, "step": 229600 }, { "epoch": 0.6, "learning_rate": 0.0002107226638948004, "loss": 0.0177, "step": 229610 }, { "epoch": 0.6, "learning_rate": 0.00021071877567842894, "loss": 0.0152, "step": 229620 }, { "epoch": 0.6, "learning_rate": 0.00021071488746205746, "loss": 0.0134, "step": 229630 }, { "epoch": 0.6, "learning_rate": 0.00021071099924568603, "loss": 0.0155, "step": 229640 }, { "epoch": 0.6, "learning_rate": 0.00021070711102931454, "loss": 0.0183, "step": 229650 }, { "epoch": 0.6, "learning_rate": 0.00021070322281294308, "loss": 0.0175, "step": 229660 }, { "epoch": 0.6, "learning_rate": 0.0002106993345965716, "loss": 0.0175, "step": 229670 }, { "epoch": 0.6, "learning_rate": 0.00021069544638020017, "loss": 0.0161, "step": 229680 }, { "epoch": 0.6, "learning_rate": 0.00021069155816382868, "loss": 0.0181, "step": 229690 }, { "epoch": 0.6, "learning_rate": 0.00021068766994745722, "loss": 0.0174, "step": 229700 }, { "epoch": 0.6, "learning_rate": 0.00021068378173108574, "loss": 0.0205, "step": 229710 }, { "epoch": 0.6, "learning_rate": 0.0002106798935147143, "loss": 0.0163, "step": 229720 }, { "epoch": 0.6, "learning_rate": 0.00021067600529834282, "loss": 0.0183, "step": 229730 }, { "epoch": 0.6, "learning_rate": 0.00021067211708197136, "loss": 0.0153, "step": 229740 }, { "epoch": 0.6, "learning_rate": 0.00021066822886559988, "loss": 0.0147, "step": 229750 }, { "epoch": 0.6, "learning_rate": 0.00021066434064922842, "loss": 0.0202, "step": 229760 }, { "epoch": 0.6, "learning_rate": 0.00021066045243285699, "loss": 0.0162, "step": 229770 }, { "epoch": 0.6, "learning_rate": 0.0002106565642164855, "loss": 0.0183, "step": 229780 }, { "epoch": 0.6, "learning_rate": 0.00021065267600011404, "loss": 0.0175, "step": 229790 }, { "epoch": 0.6, "learning_rate": 0.00021064878778374256, "loss": 0.0154, "step": 229800 }, { "epoch": 0.6, "learning_rate": 0.00021064489956737113, "loss": 0.0166, "step": 229810 }, { "epoch": 0.6, "learning_rate": 0.00021064101135099964, "loss": 0.0151, "step": 229820 }, { "epoch": 0.6, "learning_rate": 0.00021063712313462818, "loss": 0.0163, "step": 229830 }, { "epoch": 0.6, "learning_rate": 0.0002106332349182567, "loss": 0.0169, "step": 229840 }, { "epoch": 0.6, "learning_rate": 0.00021062934670188526, "loss": 0.0192, "step": 229850 }, { "epoch": 0.6, "learning_rate": 0.00021062545848551378, "loss": 0.0138, "step": 229860 }, { "epoch": 0.6, "learning_rate": 0.00021062157026914232, "loss": 0.0147, "step": 229870 }, { "epoch": 0.6, "learning_rate": 0.00021061768205277084, "loss": 0.0162, "step": 229880 }, { "epoch": 0.6, "learning_rate": 0.0002106137938363994, "loss": 0.0152, "step": 229890 }, { "epoch": 0.6, "learning_rate": 0.00021060990562002792, "loss": 0.0173, "step": 229900 }, { "epoch": 0.6, "learning_rate": 0.00021060601740365646, "loss": 0.0175, "step": 229910 }, { "epoch": 0.6, "learning_rate": 0.00021060212918728497, "loss": 0.0175, "step": 229920 }, { "epoch": 0.6, "learning_rate": 0.00021059824097091354, "loss": 0.0197, "step": 229930 }, { "epoch": 0.6, "learning_rate": 0.00021059435275454209, "loss": 0.0173, "step": 229940 }, { "epoch": 0.6, "learning_rate": 0.0002105904645381706, "loss": 0.0173, "step": 229950 }, { "epoch": 0.6, "learning_rate": 0.00021058657632179911, "loss": 0.0142, "step": 229960 }, { "epoch": 0.6, "learning_rate": 0.00021058268810542768, "loss": 0.0154, "step": 229970 }, { "epoch": 0.6, "learning_rate": 0.00021057879988905622, "loss": 0.0176, "step": 229980 }, { "epoch": 0.6, "learning_rate": 0.00021057491167268474, "loss": 0.0161, "step": 229990 }, { "epoch": 0.6, "learning_rate": 0.00021057102345631328, "loss": 0.0179, "step": 230000 }, { "epoch": 0.6, "eval_cer": 0.8817558725266665, "eval_loss": 0.011123710311949253, "eval_runtime": 107.2187, "eval_samples_per_second": 18.653, "eval_steps_per_second": 4.663, "step": 230000 }, { "epoch": 0.6, "learning_rate": 0.0002105671352399418, "loss": 0.0188, "step": 230010 }, { "epoch": 0.6, "learning_rate": 0.00021056324702357036, "loss": 0.0195, "step": 230020 }, { "epoch": 0.6, "learning_rate": 0.00021055935880719888, "loss": 0.0151, "step": 230030 }, { "epoch": 0.6, "learning_rate": 0.00021055547059082742, "loss": 0.0143, "step": 230040 }, { "epoch": 0.6, "learning_rate": 0.00021055158237445593, "loss": 0.0153, "step": 230050 }, { "epoch": 0.6, "learning_rate": 0.0002105476941580845, "loss": 0.0164, "step": 230060 }, { "epoch": 0.6, "learning_rate": 0.00021054380594171302, "loss": 0.0166, "step": 230070 }, { "epoch": 0.6, "learning_rate": 0.00021053991772534156, "loss": 0.0156, "step": 230080 }, { "epoch": 0.6, "learning_rate": 0.00021053602950897007, "loss": 0.012, "step": 230090 }, { "epoch": 0.6, "learning_rate": 0.00021053214129259864, "loss": 0.0153, "step": 230100 }, { "epoch": 0.6, "learning_rate": 0.00021052825307622718, "loss": 0.0209, "step": 230110 }, { "epoch": 0.6, "learning_rate": 0.0002105243648598557, "loss": 0.0167, "step": 230120 }, { "epoch": 0.6, "learning_rate": 0.00021052047664348421, "loss": 0.0151, "step": 230130 }, { "epoch": 0.6, "learning_rate": 0.00021051658842711278, "loss": 0.0137, "step": 230140 }, { "epoch": 0.6, "learning_rate": 0.00021051270021074132, "loss": 0.0147, "step": 230150 }, { "epoch": 0.6, "learning_rate": 0.00021050881199436984, "loss": 0.0142, "step": 230160 }, { "epoch": 0.6, "learning_rate": 0.00021050492377799838, "loss": 0.0167, "step": 230170 }, { "epoch": 0.6, "learning_rate": 0.00021050103556162692, "loss": 0.0151, "step": 230180 }, { "epoch": 0.6, "learning_rate": 0.00021049714734525546, "loss": 0.0181, "step": 230190 }, { "epoch": 0.6, "learning_rate": 0.00021049325912888398, "loss": 0.0168, "step": 230200 }, { "epoch": 0.6, "learning_rate": 0.00021048937091251252, "loss": 0.0122, "step": 230210 }, { "epoch": 0.6, "learning_rate": 0.00021048548269614106, "loss": 0.0156, "step": 230220 }, { "epoch": 0.6, "learning_rate": 0.0002104815944797696, "loss": 0.0183, "step": 230230 }, { "epoch": 0.6, "learning_rate": 0.00021047770626339812, "loss": 0.0158, "step": 230240 }, { "epoch": 0.6, "learning_rate": 0.00021047381804702666, "loss": 0.0163, "step": 230250 }, { "epoch": 0.6, "learning_rate": 0.00021046992983065517, "loss": 0.0219, "step": 230260 }, { "epoch": 0.6, "learning_rate": 0.00021046604161428374, "loss": 0.0192, "step": 230270 }, { "epoch": 0.6, "learning_rate": 0.00021046215339791226, "loss": 0.0146, "step": 230280 }, { "epoch": 0.6, "learning_rate": 0.0002104582651815408, "loss": 0.0188, "step": 230290 }, { "epoch": 0.6, "learning_rate": 0.0002104543769651693, "loss": 0.0118, "step": 230300 }, { "epoch": 0.6, "learning_rate": 0.00021045048874879788, "loss": 0.016, "step": 230310 }, { "epoch": 0.6, "learning_rate": 0.00021044660053242642, "loss": 0.0162, "step": 230320 }, { "epoch": 0.6, "learning_rate": 0.00021044271231605494, "loss": 0.015, "step": 230330 }, { "epoch": 0.6, "learning_rate": 0.00021043882409968348, "loss": 0.0183, "step": 230340 }, { "epoch": 0.6, "learning_rate": 0.00021043493588331202, "loss": 0.0145, "step": 230350 }, { "epoch": 0.6, "learning_rate": 0.00021043104766694056, "loss": 0.0178, "step": 230360 }, { "epoch": 0.6, "learning_rate": 0.00021042715945056908, "loss": 0.0179, "step": 230370 }, { "epoch": 0.6, "learning_rate": 0.00021042327123419762, "loss": 0.0188, "step": 230380 }, { "epoch": 0.6, "learning_rate": 0.00021041938301782616, "loss": 0.0188, "step": 230390 }, { "epoch": 0.6, "learning_rate": 0.0002104154948014547, "loss": 0.0139, "step": 230400 }, { "epoch": 0.6, "learning_rate": 0.00021041160658508322, "loss": 0.0167, "step": 230410 }, { "epoch": 0.6, "learning_rate": 0.00021040771836871176, "loss": 0.0211, "step": 230420 }, { "epoch": 0.6, "learning_rate": 0.0002104038301523403, "loss": 0.0171, "step": 230430 }, { "epoch": 0.6, "learning_rate": 0.00021039994193596884, "loss": 0.0114, "step": 230440 }, { "epoch": 0.6, "learning_rate": 0.00021039605371959736, "loss": 0.0186, "step": 230450 }, { "epoch": 0.6, "learning_rate": 0.0002103921655032259, "loss": 0.0131, "step": 230460 }, { "epoch": 0.6, "learning_rate": 0.00021038827728685447, "loss": 0.014, "step": 230470 }, { "epoch": 0.6, "learning_rate": 0.00021038438907048298, "loss": 0.0212, "step": 230480 }, { "epoch": 0.6, "learning_rate": 0.00021038050085411152, "loss": 0.0142, "step": 230490 }, { "epoch": 0.6, "learning_rate": 0.00021037661263774004, "loss": 0.0151, "step": 230500 }, { "epoch": 0.6, "learning_rate": 0.00021037272442136858, "loss": 0.0187, "step": 230510 }, { "epoch": 0.6, "learning_rate": 0.00021036883620499712, "loss": 0.0156, "step": 230520 }, { "epoch": 0.6, "learning_rate": 0.00021036494798862566, "loss": 0.0149, "step": 230530 }, { "epoch": 0.6, "learning_rate": 0.00021036105977225418, "loss": 0.0125, "step": 230540 }, { "epoch": 0.6, "learning_rate": 0.00021035717155588272, "loss": 0.0135, "step": 230550 }, { "epoch": 0.6, "learning_rate": 0.00021035328333951126, "loss": 0.0144, "step": 230560 }, { "epoch": 0.6, "learning_rate": 0.0002103493951231398, "loss": 0.0205, "step": 230570 }, { "epoch": 0.6, "learning_rate": 0.00021034550690676832, "loss": 0.0164, "step": 230580 }, { "epoch": 0.6, "learning_rate": 0.00021034161869039686, "loss": 0.0197, "step": 230590 }, { "epoch": 0.6, "learning_rate": 0.0002103377304740254, "loss": 0.0164, "step": 230600 }, { "epoch": 0.6, "learning_rate": 0.00021033384225765394, "loss": 0.0196, "step": 230610 }, { "epoch": 0.6, "learning_rate": 0.00021032995404128246, "loss": 0.0173, "step": 230620 }, { "epoch": 0.6, "learning_rate": 0.000210326065824911, "loss": 0.0152, "step": 230630 }, { "epoch": 0.6, "learning_rate": 0.00021032217760853957, "loss": 0.0156, "step": 230640 }, { "epoch": 0.6, "learning_rate": 0.00021031828939216808, "loss": 0.011, "step": 230650 }, { "epoch": 0.6, "learning_rate": 0.00021031440117579662, "loss": 0.0141, "step": 230660 }, { "epoch": 0.6, "learning_rate": 0.00021031051295942514, "loss": 0.0134, "step": 230670 }, { "epoch": 0.6, "learning_rate": 0.0002103066247430537, "loss": 0.0136, "step": 230680 }, { "epoch": 0.6, "learning_rate": 0.00021030273652668222, "loss": 0.0177, "step": 230690 }, { "epoch": 0.6, "learning_rate": 0.00021029884831031076, "loss": 0.0184, "step": 230700 }, { "epoch": 0.6, "learning_rate": 0.00021029496009393928, "loss": 0.0171, "step": 230710 }, { "epoch": 0.6, "learning_rate": 0.00021029107187756785, "loss": 0.0136, "step": 230720 }, { "epoch": 0.6, "learning_rate": 0.00021028718366119636, "loss": 0.0169, "step": 230730 }, { "epoch": 0.6, "learning_rate": 0.0002102832954448249, "loss": 0.0153, "step": 230740 }, { "epoch": 0.6, "learning_rate": 0.00021027940722845342, "loss": 0.0164, "step": 230750 }, { "epoch": 0.6, "learning_rate": 0.00021027551901208196, "loss": 0.0169, "step": 230760 }, { "epoch": 0.6, "learning_rate": 0.0002102716307957105, "loss": 0.0164, "step": 230770 }, { "epoch": 0.6, "learning_rate": 0.00021026774257933904, "loss": 0.0134, "step": 230780 }, { "epoch": 0.6, "learning_rate": 0.00021026385436296756, "loss": 0.0152, "step": 230790 }, { "epoch": 0.6, "learning_rate": 0.0002102599661465961, "loss": 0.0157, "step": 230800 }, { "epoch": 0.6, "learning_rate": 0.00021025607793022467, "loss": 0.0152, "step": 230810 }, { "epoch": 0.6, "learning_rate": 0.00021025218971385318, "loss": 0.0163, "step": 230820 }, { "epoch": 0.6, "learning_rate": 0.0002102483014974817, "loss": 0.018, "step": 230830 }, { "epoch": 0.6, "learning_rate": 0.00021024441328111024, "loss": 0.0206, "step": 230840 }, { "epoch": 0.6, "learning_rate": 0.0002102405250647388, "loss": 0.0153, "step": 230850 }, { "epoch": 0.6, "learning_rate": 0.00021023663684836732, "loss": 0.021, "step": 230860 }, { "epoch": 0.6, "learning_rate": 0.00021023274863199586, "loss": 0.0223, "step": 230870 }, { "epoch": 0.6, "learning_rate": 0.00021022886041562438, "loss": 0.0169, "step": 230880 }, { "epoch": 0.6, "learning_rate": 0.00021022497219925294, "loss": 0.0159, "step": 230890 }, { "epoch": 0.6, "learning_rate": 0.00021022108398288146, "loss": 0.0201, "step": 230900 }, { "epoch": 0.6, "learning_rate": 0.00021021719576651, "loss": 0.019, "step": 230910 }, { "epoch": 0.6, "learning_rate": 0.00021021330755013852, "loss": 0.0151, "step": 230920 }, { "epoch": 0.6, "learning_rate": 0.00021020941933376708, "loss": 0.0169, "step": 230930 }, { "epoch": 0.6, "learning_rate": 0.0002102055311173956, "loss": 0.0168, "step": 230940 }, { "epoch": 0.6, "learning_rate": 0.00021020164290102414, "loss": 0.0158, "step": 230950 }, { "epoch": 0.6, "learning_rate": 0.00021019775468465265, "loss": 0.0172, "step": 230960 }, { "epoch": 0.6, "learning_rate": 0.00021019386646828122, "loss": 0.0187, "step": 230970 }, { "epoch": 0.6, "learning_rate": 0.00021018997825190977, "loss": 0.0152, "step": 230980 }, { "epoch": 0.6, "learning_rate": 0.00021018609003553828, "loss": 0.0149, "step": 230990 }, { "epoch": 0.6, "learning_rate": 0.0002101822018191668, "loss": 0.0201, "step": 231000 }, { "epoch": 0.6, "eval_cer": 0.8817656699852059, "eval_loss": 0.010918508283793926, "eval_runtime": 107.5234, "eval_samples_per_second": 18.601, "eval_steps_per_second": 4.65, "step": 231000 }, { "epoch": 0.6, "learning_rate": 0.00021017831360279534, "loss": 0.0149, "step": 231010 }, { "epoch": 0.6, "learning_rate": 0.0002101744253864239, "loss": 0.0154, "step": 231020 }, { "epoch": 0.6, "learning_rate": 0.00021017053717005242, "loss": 0.0152, "step": 231030 }, { "epoch": 0.6, "learning_rate": 0.00021016664895368096, "loss": 0.0205, "step": 231040 }, { "epoch": 0.6, "learning_rate": 0.00021016276073730948, "loss": 0.0252, "step": 231050 }, { "epoch": 0.6, "learning_rate": 0.00021015887252093804, "loss": 0.0171, "step": 231060 }, { "epoch": 0.6, "learning_rate": 0.00021015498430456656, "loss": 0.0152, "step": 231070 }, { "epoch": 0.6, "learning_rate": 0.0002101510960881951, "loss": 0.0117, "step": 231080 }, { "epoch": 0.6, "learning_rate": 0.00021014720787182361, "loss": 0.0147, "step": 231090 }, { "epoch": 0.6, "learning_rate": 0.00021014331965545218, "loss": 0.0149, "step": 231100 }, { "epoch": 0.6, "learning_rate": 0.0002101394314390807, "loss": 0.0162, "step": 231110 }, { "epoch": 0.6, "learning_rate": 0.00021013554322270924, "loss": 0.0148, "step": 231120 }, { "epoch": 0.6, "learning_rate": 0.00021013165500633775, "loss": 0.0118, "step": 231130 }, { "epoch": 0.6, "learning_rate": 0.00021012776678996632, "loss": 0.0169, "step": 231140 }, { "epoch": 0.6, "learning_rate": 0.00021012387857359484, "loss": 0.0157, "step": 231150 }, { "epoch": 0.6, "learning_rate": 0.00021011999035722338, "loss": 0.018, "step": 231160 }, { "epoch": 0.6, "learning_rate": 0.0002101161021408519, "loss": 0.0165, "step": 231170 }, { "epoch": 0.6, "learning_rate": 0.00021011221392448046, "loss": 0.0174, "step": 231180 }, { "epoch": 0.6, "learning_rate": 0.000210108325708109, "loss": 0.0137, "step": 231190 }, { "epoch": 0.6, "learning_rate": 0.00021010443749173752, "loss": 0.0247, "step": 231200 }, { "epoch": 0.6, "learning_rate": 0.00021010054927536606, "loss": 0.0136, "step": 231210 }, { "epoch": 0.6, "learning_rate": 0.0002100966610589946, "loss": 0.0158, "step": 231220 }, { "epoch": 0.6, "learning_rate": 0.00021009277284262314, "loss": 0.0195, "step": 231230 }, { "epoch": 0.6, "learning_rate": 0.00021008888462625166, "loss": 0.0251, "step": 231240 }, { "epoch": 0.6, "learning_rate": 0.0002100849964098802, "loss": 0.0148, "step": 231250 }, { "epoch": 0.6, "learning_rate": 0.00021008110819350871, "loss": 0.0125, "step": 231260 }, { "epoch": 0.6, "learning_rate": 0.00021007721997713728, "loss": 0.015, "step": 231270 }, { "epoch": 0.6, "learning_rate": 0.0002100733317607658, "loss": 0.018, "step": 231280 }, { "epoch": 0.6, "learning_rate": 0.00021006944354439434, "loss": 0.0181, "step": 231290 }, { "epoch": 0.6, "learning_rate": 0.00021006555532802285, "loss": 0.0173, "step": 231300 }, { "epoch": 0.6, "learning_rate": 0.00021006166711165142, "loss": 0.0134, "step": 231310 }, { "epoch": 0.6, "learning_rate": 0.00021005777889527994, "loss": 0.0172, "step": 231320 }, { "epoch": 0.6, "learning_rate": 0.00021005389067890848, "loss": 0.0128, "step": 231330 }, { "epoch": 0.6, "learning_rate": 0.000210050002462537, "loss": 0.0138, "step": 231340 }, { "epoch": 0.6, "learning_rate": 0.00021004611424616556, "loss": 0.018, "step": 231350 }, { "epoch": 0.6, "learning_rate": 0.0002100422260297941, "loss": 0.015, "step": 231360 }, { "epoch": 0.6, "learning_rate": 0.00021003833781342262, "loss": 0.0194, "step": 231370 }, { "epoch": 0.6, "learning_rate": 0.00021003444959705116, "loss": 0.0156, "step": 231380 }, { "epoch": 0.6, "learning_rate": 0.0002100305613806797, "loss": 0.0162, "step": 231390 }, { "epoch": 0.6, "learning_rate": 0.00021002667316430824, "loss": 0.0157, "step": 231400 }, { "epoch": 0.6, "learning_rate": 0.00021002278494793676, "loss": 0.0187, "step": 231410 }, { "epoch": 0.6, "learning_rate": 0.0002100188967315653, "loss": 0.0154, "step": 231420 }, { "epoch": 0.6, "learning_rate": 0.00021001500851519384, "loss": 0.0176, "step": 231430 }, { "epoch": 0.6, "learning_rate": 0.00021001112029882238, "loss": 0.0187, "step": 231440 }, { "epoch": 0.6, "learning_rate": 0.0002100072320824509, "loss": 0.0142, "step": 231450 }, { "epoch": 0.6, "learning_rate": 0.00021000334386607944, "loss": 0.0147, "step": 231460 }, { "epoch": 0.6, "learning_rate": 0.00020999945564970798, "loss": 0.0153, "step": 231470 }, { "epoch": 0.6, "learning_rate": 0.00020999556743333652, "loss": 0.015, "step": 231480 }, { "epoch": 0.6, "learning_rate": 0.00020999167921696504, "loss": 0.0176, "step": 231490 }, { "epoch": 0.6, "learning_rate": 0.00020998779100059358, "loss": 0.0149, "step": 231500 }, { "epoch": 0.6, "learning_rate": 0.0002099839027842221, "loss": 0.0215, "step": 231510 }, { "epoch": 0.6, "learning_rate": 0.00020998001456785066, "loss": 0.0161, "step": 231520 }, { "epoch": 0.6, "learning_rate": 0.0002099761263514792, "loss": 0.0123, "step": 231530 }, { "epoch": 0.6, "learning_rate": 0.00020997223813510772, "loss": 0.0175, "step": 231540 }, { "epoch": 0.6, "learning_rate": 0.00020996834991873623, "loss": 0.0183, "step": 231550 }, { "epoch": 0.6, "learning_rate": 0.0002099644617023648, "loss": 0.0153, "step": 231560 }, { "epoch": 0.6, "learning_rate": 0.00020996057348599334, "loss": 0.0224, "step": 231570 }, { "epoch": 0.6, "learning_rate": 0.00020995668526962186, "loss": 0.016, "step": 231580 }, { "epoch": 0.6, "learning_rate": 0.0002099527970532504, "loss": 0.0153, "step": 231590 }, { "epoch": 0.6, "learning_rate": 0.00020994890883687894, "loss": 0.0172, "step": 231600 }, { "epoch": 0.6, "learning_rate": 0.00020994502062050748, "loss": 0.0185, "step": 231610 }, { "epoch": 0.6, "learning_rate": 0.000209941132404136, "loss": 0.0127, "step": 231620 }, { "epoch": 0.6, "learning_rate": 0.00020993724418776454, "loss": 0.0175, "step": 231630 }, { "epoch": 0.6, "learning_rate": 0.00020993335597139308, "loss": 0.0188, "step": 231640 }, { "epoch": 0.6, "learning_rate": 0.00020992946775502162, "loss": 0.0144, "step": 231650 }, { "epoch": 0.6, "learning_rate": 0.00020992557953865014, "loss": 0.0208, "step": 231660 }, { "epoch": 0.6, "learning_rate": 0.00020992169132227868, "loss": 0.0175, "step": 231670 }, { "epoch": 0.6, "learning_rate": 0.00020991780310590725, "loss": 0.0157, "step": 231680 }, { "epoch": 0.6, "learning_rate": 0.00020991391488953576, "loss": 0.0155, "step": 231690 }, { "epoch": 0.6, "learning_rate": 0.0002099100266731643, "loss": 0.018, "step": 231700 }, { "epoch": 0.6, "learning_rate": 0.00020990613845679282, "loss": 0.0158, "step": 231710 }, { "epoch": 0.6, "learning_rate": 0.00020990225024042139, "loss": 0.0164, "step": 231720 }, { "epoch": 0.6, "learning_rate": 0.0002098983620240499, "loss": 0.0148, "step": 231730 }, { "epoch": 0.6, "learning_rate": 0.00020989447380767844, "loss": 0.0189, "step": 231740 }, { "epoch": 0.6, "learning_rate": 0.00020989058559130696, "loss": 0.0152, "step": 231750 }, { "epoch": 0.6, "learning_rate": 0.0002098866973749355, "loss": 0.0171, "step": 231760 }, { "epoch": 0.6, "learning_rate": 0.00020988280915856404, "loss": 0.0144, "step": 231770 }, { "epoch": 0.6, "learning_rate": 0.00020987892094219258, "loss": 0.0189, "step": 231780 }, { "epoch": 0.6, "learning_rate": 0.0002098750327258211, "loss": 0.0211, "step": 231790 }, { "epoch": 0.6, "learning_rate": 0.00020987114450944964, "loss": 0.0156, "step": 231800 }, { "epoch": 0.6, "learning_rate": 0.00020986725629307818, "loss": 0.0116, "step": 231810 }, { "epoch": 0.6, "learning_rate": 0.00020986336807670672, "loss": 0.0173, "step": 231820 }, { "epoch": 0.6, "learning_rate": 0.00020985947986033524, "loss": 0.0186, "step": 231830 }, { "epoch": 0.6, "learning_rate": 0.00020985559164396378, "loss": 0.0179, "step": 231840 }, { "epoch": 0.6, "learning_rate": 0.00020985170342759235, "loss": 0.0143, "step": 231850 }, { "epoch": 0.6, "learning_rate": 0.00020984781521122086, "loss": 0.0204, "step": 231860 }, { "epoch": 0.6, "learning_rate": 0.00020984392699484937, "loss": 0.0159, "step": 231870 }, { "epoch": 0.6, "learning_rate": 0.00020984003877847792, "loss": 0.0186, "step": 231880 }, { "epoch": 0.6, "learning_rate": 0.00020983615056210648, "loss": 0.0148, "step": 231890 }, { "epoch": 0.6, "learning_rate": 0.000209832262345735, "loss": 0.0124, "step": 231900 }, { "epoch": 0.6, "learning_rate": 0.00020982837412936354, "loss": 0.0154, "step": 231910 }, { "epoch": 0.6, "learning_rate": 0.00020982448591299206, "loss": 0.0155, "step": 231920 }, { "epoch": 0.6, "learning_rate": 0.00020982059769662062, "loss": 0.02, "step": 231930 }, { "epoch": 0.6, "learning_rate": 0.00020981670948024914, "loss": 0.0138, "step": 231940 }, { "epoch": 0.6, "learning_rate": 0.00020981282126387768, "loss": 0.0178, "step": 231950 }, { "epoch": 0.6, "learning_rate": 0.0002098089330475062, "loss": 0.0191, "step": 231960 }, { "epoch": 0.6, "learning_rate": 0.00020980504483113476, "loss": 0.0147, "step": 231970 }, { "epoch": 0.6, "learning_rate": 0.00020980115661476328, "loss": 0.0202, "step": 231980 }, { "epoch": 0.6, "learning_rate": 0.00020979726839839182, "loss": 0.0165, "step": 231990 }, { "epoch": 0.6, "learning_rate": 0.00020979338018202033, "loss": 0.02, "step": 232000 }, { "epoch": 0.6, "eval_cer": 0.8817768670806793, "eval_loss": 0.010772459208965302, "eval_runtime": 107.4987, "eval_samples_per_second": 18.605, "eval_steps_per_second": 4.651, "step": 232000 }, { "epoch": 0.6, "learning_rate": 0.00020978949196564888, "loss": 0.0152, "step": 232010 }, { "epoch": 0.6, "learning_rate": 0.00020978560374927742, "loss": 0.0174, "step": 232020 }, { "epoch": 0.6, "learning_rate": 0.00020978171553290596, "loss": 0.0168, "step": 232030 }, { "epoch": 0.6, "learning_rate": 0.00020977782731653447, "loss": 0.0178, "step": 232040 }, { "epoch": 0.6, "learning_rate": 0.00020977393910016302, "loss": 0.0159, "step": 232050 }, { "epoch": 0.6, "learning_rate": 0.00020977005088379158, "loss": 0.0132, "step": 232060 }, { "epoch": 0.6, "learning_rate": 0.0002097661626674201, "loss": 0.0144, "step": 232070 }, { "epoch": 0.6, "learning_rate": 0.00020976227445104864, "loss": 0.0163, "step": 232080 }, { "epoch": 0.6, "learning_rate": 0.00020975838623467716, "loss": 0.0154, "step": 232090 }, { "epoch": 0.6, "learning_rate": 0.00020975449801830572, "loss": 0.0155, "step": 232100 }, { "epoch": 0.6, "learning_rate": 0.00020975060980193424, "loss": 0.0178, "step": 232110 }, { "epoch": 0.6, "learning_rate": 0.00020974672158556278, "loss": 0.0178, "step": 232120 }, { "epoch": 0.6, "learning_rate": 0.0002097428333691913, "loss": 0.0192, "step": 232130 }, { "epoch": 0.6, "learning_rate": 0.00020973894515281986, "loss": 0.0172, "step": 232140 }, { "epoch": 0.6, "learning_rate": 0.00020973505693644838, "loss": 0.0239, "step": 232150 }, { "epoch": 0.6, "learning_rate": 0.00020973116872007692, "loss": 0.0184, "step": 232160 }, { "epoch": 0.6, "learning_rate": 0.00020972728050370543, "loss": 0.0171, "step": 232170 }, { "epoch": 0.6, "learning_rate": 0.000209723392287334, "loss": 0.0149, "step": 232180 }, { "epoch": 0.6, "learning_rate": 0.00020971950407096252, "loss": 0.0157, "step": 232190 }, { "epoch": 0.6, "learning_rate": 0.00020971561585459106, "loss": 0.0184, "step": 232200 }, { "epoch": 0.6, "learning_rate": 0.00020971172763821957, "loss": 0.0184, "step": 232210 }, { "epoch": 0.6, "learning_rate": 0.00020970783942184814, "loss": 0.0184, "step": 232220 }, { "epoch": 0.6, "learning_rate": 0.00020970395120547668, "loss": 0.0149, "step": 232230 }, { "epoch": 0.6, "learning_rate": 0.0002097000629891052, "loss": 0.0141, "step": 232240 }, { "epoch": 0.6, "learning_rate": 0.00020969617477273374, "loss": 0.0199, "step": 232250 }, { "epoch": 0.6, "learning_rate": 0.00020969228655636225, "loss": 0.0155, "step": 232260 }, { "epoch": 0.6, "learning_rate": 0.00020968839833999082, "loss": 0.0156, "step": 232270 }, { "epoch": 0.6, "learning_rate": 0.00020968451012361934, "loss": 0.0156, "step": 232280 }, { "epoch": 0.6, "learning_rate": 0.00020968062190724788, "loss": 0.0171, "step": 232290 }, { "epoch": 0.6, "learning_rate": 0.0002096767336908764, "loss": 0.0226, "step": 232300 }, { "epoch": 0.6, "learning_rate": 0.00020967284547450496, "loss": 0.0144, "step": 232310 }, { "epoch": 0.6, "learning_rate": 0.00020966895725813348, "loss": 0.0153, "step": 232320 }, { "epoch": 0.6, "learning_rate": 0.00020966506904176202, "loss": 0.0173, "step": 232330 }, { "epoch": 0.6, "learning_rate": 0.00020966118082539053, "loss": 0.0139, "step": 232340 }, { "epoch": 0.6, "learning_rate": 0.0002096572926090191, "loss": 0.0164, "step": 232350 }, { "epoch": 0.6, "learning_rate": 0.00020965340439264762, "loss": 0.0163, "step": 232360 }, { "epoch": 0.6, "learning_rate": 0.00020964951617627616, "loss": 0.0153, "step": 232370 }, { "epoch": 0.6, "learning_rate": 0.00020964562795990467, "loss": 0.0147, "step": 232380 }, { "epoch": 0.6, "learning_rate": 0.00020964173974353324, "loss": 0.0164, "step": 232390 }, { "epoch": 0.6, "learning_rate": 0.00020963785152716178, "loss": 0.0155, "step": 232400 }, { "epoch": 0.6, "learning_rate": 0.0002096339633107903, "loss": 0.0127, "step": 232410 }, { "epoch": 0.6, "learning_rate": 0.0002096300750944188, "loss": 0.016, "step": 232420 }, { "epoch": 0.6, "learning_rate": 0.00020962618687804738, "loss": 0.014, "step": 232430 }, { "epoch": 0.6, "learning_rate": 0.00020962229866167592, "loss": 0.0196, "step": 232440 }, { "epoch": 0.6, "learning_rate": 0.00020961841044530444, "loss": 0.0118, "step": 232450 }, { "epoch": 0.6, "learning_rate": 0.00020961452222893298, "loss": 0.0181, "step": 232460 }, { "epoch": 0.6, "learning_rate": 0.00020961063401256152, "loss": 0.0154, "step": 232470 }, { "epoch": 0.6, "learning_rate": 0.00020960674579619006, "loss": 0.0202, "step": 232480 }, { "epoch": 0.6, "learning_rate": 0.00020960285757981858, "loss": 0.017, "step": 232490 }, { "epoch": 0.6, "learning_rate": 0.00020959896936344712, "loss": 0.0177, "step": 232500 }, { "epoch": 0.6, "learning_rate": 0.00020959508114707563, "loss": 0.0154, "step": 232510 }, { "epoch": 0.6, "learning_rate": 0.0002095911929307042, "loss": 0.0137, "step": 232520 }, { "epoch": 0.6, "learning_rate": 0.00020958730471433272, "loss": 0.0194, "step": 232530 }, { "epoch": 0.6, "learning_rate": 0.00020958341649796126, "loss": 0.0166, "step": 232540 }, { "epoch": 0.6, "learning_rate": 0.00020957952828158977, "loss": 0.0148, "step": 232550 }, { "epoch": 0.6, "learning_rate": 0.00020957564006521834, "loss": 0.0169, "step": 232560 }, { "epoch": 0.6, "learning_rate": 0.00020957175184884688, "loss": 0.0163, "step": 232570 }, { "epoch": 0.6, "learning_rate": 0.0002095678636324754, "loss": 0.0137, "step": 232580 }, { "epoch": 0.6, "learning_rate": 0.0002095639754161039, "loss": 0.0142, "step": 232590 }, { "epoch": 0.6, "learning_rate": 0.00020956008719973248, "loss": 0.0192, "step": 232600 }, { "epoch": 0.6, "learning_rate": 0.00020955619898336102, "loss": 0.0144, "step": 232610 }, { "epoch": 0.6, "learning_rate": 0.00020955231076698954, "loss": 0.0202, "step": 232620 }, { "epoch": 0.6, "learning_rate": 0.00020954842255061808, "loss": 0.0156, "step": 232630 }, { "epoch": 0.6, "learning_rate": 0.00020954453433424662, "loss": 0.0144, "step": 232640 }, { "epoch": 0.6, "learning_rate": 0.00020954064611787516, "loss": 0.0169, "step": 232650 }, { "epoch": 0.6, "learning_rate": 0.00020953675790150368, "loss": 0.0164, "step": 232660 }, { "epoch": 0.6, "learning_rate": 0.00020953286968513222, "loss": 0.015, "step": 232670 }, { "epoch": 0.6, "learning_rate": 0.00020952898146876076, "loss": 0.0131, "step": 232680 }, { "epoch": 0.6, "learning_rate": 0.0002095250932523893, "loss": 0.0167, "step": 232690 }, { "epoch": 0.6, "learning_rate": 0.00020952120503601782, "loss": 0.0175, "step": 232700 }, { "epoch": 0.6, "learning_rate": 0.00020951731681964636, "loss": 0.0119, "step": 232710 }, { "epoch": 0.6, "learning_rate": 0.00020951342860327493, "loss": 0.0158, "step": 232720 }, { "epoch": 0.6, "learning_rate": 0.00020950954038690344, "loss": 0.017, "step": 232730 }, { "epoch": 0.6, "learning_rate": 0.00020950565217053195, "loss": 0.0156, "step": 232740 }, { "epoch": 0.6, "learning_rate": 0.0002095017639541605, "loss": 0.0225, "step": 232750 }, { "epoch": 0.6, "learning_rate": 0.000209497875737789, "loss": 0.0156, "step": 232760 }, { "epoch": 0.6, "learning_rate": 0.00020949398752141758, "loss": 0.014, "step": 232770 }, { "epoch": 0.6, "learning_rate": 0.00020949009930504612, "loss": 0.0164, "step": 232780 }, { "epoch": 0.6, "learning_rate": 0.00020948621108867464, "loss": 0.013, "step": 232790 }, { "epoch": 0.6, "learning_rate": 0.00020948232287230318, "loss": 0.0214, "step": 232800 }, { "epoch": 0.6, "learning_rate": 0.00020947843465593172, "loss": 0.0145, "step": 232810 }, { "epoch": 0.6, "learning_rate": 0.00020947454643956026, "loss": 0.019, "step": 232820 }, { "epoch": 0.6, "learning_rate": 0.00020947065822318878, "loss": 0.0156, "step": 232830 }, { "epoch": 0.6, "learning_rate": 0.00020946677000681732, "loss": 0.013, "step": 232840 }, { "epoch": 0.6, "learning_rate": 0.00020946288179044586, "loss": 0.0162, "step": 232850 }, { "epoch": 0.6, "learning_rate": 0.0002094589935740744, "loss": 0.0157, "step": 232860 }, { "epoch": 0.6, "learning_rate": 0.00020945510535770291, "loss": 0.0167, "step": 232870 }, { "epoch": 0.6, "learning_rate": 0.00020945121714133146, "loss": 0.0162, "step": 232880 }, { "epoch": 0.6, "learning_rate": 0.00020944732892496, "loss": 0.0148, "step": 232890 }, { "epoch": 0.6, "learning_rate": 0.00020944344070858854, "loss": 0.015, "step": 232900 }, { "epoch": 0.6, "learning_rate": 0.00020943955249221705, "loss": 0.015, "step": 232910 }, { "epoch": 0.6, "learning_rate": 0.0002094356642758456, "loss": 0.014, "step": 232920 }, { "epoch": 0.6, "learning_rate": 0.00020943177605947416, "loss": 0.0182, "step": 232930 }, { "epoch": 0.6, "learning_rate": 0.00020942788784310268, "loss": 0.0251, "step": 232940 }, { "epoch": 0.6, "learning_rate": 0.00020942399962673122, "loss": 0.0151, "step": 232950 }, { "epoch": 0.6, "learning_rate": 0.00020942011141035974, "loss": 0.0164, "step": 232960 }, { "epoch": 0.6, "learning_rate": 0.0002094162231939883, "loss": 0.0203, "step": 232970 }, { "epoch": 0.6, "learning_rate": 0.00020941233497761682, "loss": 0.0191, "step": 232980 }, { "epoch": 0.6, "learning_rate": 0.00020940844676124536, "loss": 0.0161, "step": 232990 }, { "epoch": 0.6, "learning_rate": 0.00020940455854487387, "loss": 0.0171, "step": 233000 }, { "epoch": 0.6, "eval_cer": 0.8817292794249172, "eval_loss": 0.011502685025334358, "eval_runtime": 107.4531, "eval_samples_per_second": 18.613, "eval_steps_per_second": 4.653, "step": 233000 }, { "epoch": 0.6, "learning_rate": 0.00020940067032850242, "loss": 0.0146, "step": 233010 }, { "epoch": 0.6, "learning_rate": 0.00020939678211213096, "loss": 0.0184, "step": 233020 }, { "epoch": 0.6, "learning_rate": 0.0002093928938957595, "loss": 0.0181, "step": 233030 }, { "epoch": 0.6, "learning_rate": 0.00020938900567938801, "loss": 0.016, "step": 233040 }, { "epoch": 0.6, "learning_rate": 0.00020938511746301656, "loss": 0.0144, "step": 233050 }, { "epoch": 0.6, "learning_rate": 0.0002093812292466451, "loss": 0.0158, "step": 233060 }, { "epoch": 0.6, "learning_rate": 0.00020937734103027364, "loss": 0.0174, "step": 233070 }, { "epoch": 0.6, "learning_rate": 0.00020937345281390215, "loss": 0.0149, "step": 233080 }, { "epoch": 0.6, "learning_rate": 0.0002093695645975307, "loss": 0.0181, "step": 233090 }, { "epoch": 0.6, "learning_rate": 0.00020936567638115926, "loss": 0.0174, "step": 233100 }, { "epoch": 0.6, "learning_rate": 0.00020936178816478778, "loss": 0.013, "step": 233110 }, { "epoch": 0.6, "learning_rate": 0.00020935789994841632, "loss": 0.0147, "step": 233120 }, { "epoch": 0.6, "learning_rate": 0.00020935401173204483, "loss": 0.0169, "step": 233130 }, { "epoch": 0.6, "learning_rate": 0.0002093501235156734, "loss": 0.0199, "step": 233140 }, { "epoch": 0.6, "learning_rate": 0.00020934623529930192, "loss": 0.0171, "step": 233150 }, { "epoch": 0.6, "learning_rate": 0.00020934234708293046, "loss": 0.0234, "step": 233160 }, { "epoch": 0.6, "learning_rate": 0.00020933845886655897, "loss": 0.0179, "step": 233170 }, { "epoch": 0.6, "learning_rate": 0.00020933457065018754, "loss": 0.0154, "step": 233180 }, { "epoch": 0.6, "learning_rate": 0.00020933068243381606, "loss": 0.0186, "step": 233190 }, { "epoch": 0.6, "learning_rate": 0.0002093267942174446, "loss": 0.0167, "step": 233200 }, { "epoch": 0.6, "learning_rate": 0.00020932290600107311, "loss": 0.0176, "step": 233210 }, { "epoch": 0.6, "learning_rate": 0.00020931901778470168, "loss": 0.0331, "step": 233220 }, { "epoch": 0.6, "learning_rate": 0.0002093151295683302, "loss": 0.0127, "step": 233230 }, { "epoch": 0.6, "learning_rate": 0.00020931124135195874, "loss": 0.0152, "step": 233240 }, { "epoch": 0.6, "learning_rate": 0.00020930735313558725, "loss": 0.0173, "step": 233250 }, { "epoch": 0.6, "learning_rate": 0.0002093034649192158, "loss": 0.0211, "step": 233260 }, { "epoch": 0.6, "learning_rate": 0.00020929957670284436, "loss": 0.0139, "step": 233270 }, { "epoch": 0.6, "learning_rate": 0.00020929568848647288, "loss": 0.0176, "step": 233280 }, { "epoch": 0.6, "learning_rate": 0.00020929180027010142, "loss": 0.0173, "step": 233290 }, { "epoch": 0.6, "learning_rate": 0.00020928791205372993, "loss": 0.0179, "step": 233300 }, { "epoch": 0.6, "learning_rate": 0.0002092840238373585, "loss": 0.0162, "step": 233310 }, { "epoch": 0.6, "learning_rate": 0.00020928013562098702, "loss": 0.0143, "step": 233320 }, { "epoch": 0.6, "learning_rate": 0.00020927624740461556, "loss": 0.0164, "step": 233330 }, { "epoch": 0.6, "learning_rate": 0.00020927235918824407, "loss": 0.0194, "step": 233340 }, { "epoch": 0.6, "learning_rate": 0.00020926847097187264, "loss": 0.015, "step": 233350 }, { "epoch": 0.6, "learning_rate": 0.00020926458275550116, "loss": 0.014, "step": 233360 }, { "epoch": 0.6, "learning_rate": 0.0002092606945391297, "loss": 0.0163, "step": 233370 }, { "epoch": 0.6, "learning_rate": 0.0002092568063227582, "loss": 0.0112, "step": 233380 }, { "epoch": 0.6, "learning_rate": 0.00020925291810638678, "loss": 0.0156, "step": 233390 }, { "epoch": 0.61, "learning_rate": 0.0002092490298900153, "loss": 0.0159, "step": 233400 }, { "epoch": 0.61, "learning_rate": 0.00020924514167364384, "loss": 0.0179, "step": 233410 }, { "epoch": 0.61, "learning_rate": 0.00020924125345727235, "loss": 0.0157, "step": 233420 }, { "epoch": 0.61, "learning_rate": 0.00020923736524090092, "loss": 0.0165, "step": 233430 }, { "epoch": 0.61, "learning_rate": 0.00020923347702452946, "loss": 0.0139, "step": 233440 }, { "epoch": 0.61, "learning_rate": 0.00020922958880815798, "loss": 0.015, "step": 233450 }, { "epoch": 0.61, "learning_rate": 0.0002092257005917865, "loss": 0.0157, "step": 233460 }, { "epoch": 0.61, "learning_rate": 0.00020922181237541503, "loss": 0.0146, "step": 233470 }, { "epoch": 0.61, "learning_rate": 0.0002092179241590436, "loss": 0.0194, "step": 233480 }, { "epoch": 0.61, "learning_rate": 0.00020921403594267212, "loss": 0.0147, "step": 233490 }, { "epoch": 0.61, "learning_rate": 0.00020921014772630066, "loss": 0.0156, "step": 233500 }, { "epoch": 0.61, "learning_rate": 0.00020920625950992917, "loss": 0.0129, "step": 233510 }, { "epoch": 0.61, "learning_rate": 0.00020920237129355774, "loss": 0.0167, "step": 233520 }, { "epoch": 0.61, "learning_rate": 0.00020919848307718626, "loss": 0.0115, "step": 233530 }, { "epoch": 0.61, "learning_rate": 0.0002091945948608148, "loss": 0.0189, "step": 233540 }, { "epoch": 0.61, "learning_rate": 0.0002091907066444433, "loss": 0.0172, "step": 233550 }, { "epoch": 0.61, "learning_rate": 0.00020918681842807188, "loss": 0.0152, "step": 233560 }, { "epoch": 0.61, "learning_rate": 0.0002091829302117004, "loss": 0.0192, "step": 233570 }, { "epoch": 0.61, "learning_rate": 0.00020917904199532894, "loss": 0.0163, "step": 233580 }, { "epoch": 0.61, "learning_rate": 0.00020917515377895745, "loss": 0.0165, "step": 233590 }, { "epoch": 0.61, "learning_rate": 0.00020917126556258602, "loss": 0.0187, "step": 233600 }, { "epoch": 0.61, "learning_rate": 0.00020916737734621454, "loss": 0.0167, "step": 233610 }, { "epoch": 0.61, "learning_rate": 0.00020916348912984308, "loss": 0.0176, "step": 233620 }, { "epoch": 0.61, "learning_rate": 0.0002091596009134716, "loss": 0.0141, "step": 233630 }, { "epoch": 0.61, "learning_rate": 0.00020915571269710016, "loss": 0.017, "step": 233640 }, { "epoch": 0.61, "learning_rate": 0.0002091518244807287, "loss": 0.0225, "step": 233650 }, { "epoch": 0.61, "learning_rate": 0.00020914793626435722, "loss": 0.0203, "step": 233660 }, { "epoch": 0.61, "learning_rate": 0.00020914404804798576, "loss": 0.017, "step": 233670 }, { "epoch": 0.61, "learning_rate": 0.0002091401598316143, "loss": 0.016, "step": 233680 }, { "epoch": 0.61, "learning_rate": 0.00020913627161524284, "loss": 0.0202, "step": 233690 }, { "epoch": 0.61, "learning_rate": 0.00020913238339887136, "loss": 0.0132, "step": 233700 }, { "epoch": 0.61, "learning_rate": 0.0002091284951824999, "loss": 0.0137, "step": 233710 }, { "epoch": 0.61, "learning_rate": 0.0002091246069661284, "loss": 0.0122, "step": 233720 }, { "epoch": 0.61, "learning_rate": 0.00020912071874975698, "loss": 0.0146, "step": 233730 }, { "epoch": 0.61, "learning_rate": 0.0002091168305333855, "loss": 0.015, "step": 233740 }, { "epoch": 0.61, "learning_rate": 0.00020911294231701404, "loss": 0.0152, "step": 233750 }, { "epoch": 0.61, "learning_rate": 0.00020910905410064255, "loss": 0.0136, "step": 233760 }, { "epoch": 0.61, "learning_rate": 0.00020910516588427112, "loss": 0.0148, "step": 233770 }, { "epoch": 0.61, "learning_rate": 0.00020910127766789963, "loss": 0.0164, "step": 233780 }, { "epoch": 0.61, "learning_rate": 0.00020909738945152818, "loss": 0.0179, "step": 233790 }, { "epoch": 0.61, "learning_rate": 0.0002090935012351567, "loss": 0.0167, "step": 233800 }, { "epoch": 0.61, "learning_rate": 0.00020908961301878526, "loss": 0.0162, "step": 233810 }, { "epoch": 0.61, "learning_rate": 0.0002090857248024138, "loss": 0.0157, "step": 233820 }, { "epoch": 0.61, "learning_rate": 0.00020908183658604232, "loss": 0.0153, "step": 233830 }, { "epoch": 0.61, "learning_rate": 0.00020907794836967086, "loss": 0.0272, "step": 233840 }, { "epoch": 0.61, "learning_rate": 0.0002090740601532994, "loss": 0.0107, "step": 233850 }, { "epoch": 0.61, "learning_rate": 0.00020907017193692794, "loss": 0.0169, "step": 233860 }, { "epoch": 0.61, "learning_rate": 0.00020906628372055646, "loss": 0.0123, "step": 233870 }, { "epoch": 0.61, "learning_rate": 0.000209062395504185, "loss": 0.0198, "step": 233880 }, { "epoch": 0.61, "learning_rate": 0.00020905850728781354, "loss": 0.0155, "step": 233890 }, { "epoch": 0.61, "learning_rate": 0.00020905461907144208, "loss": 0.0162, "step": 233900 }, { "epoch": 0.61, "learning_rate": 0.0002090507308550706, "loss": 0.0166, "step": 233910 }, { "epoch": 0.61, "learning_rate": 0.00020904684263869914, "loss": 0.0173, "step": 233920 }, { "epoch": 0.61, "learning_rate": 0.00020904295442232768, "loss": 0.0161, "step": 233930 }, { "epoch": 0.61, "learning_rate": 0.00020903906620595622, "loss": 0.0166, "step": 233940 }, { "epoch": 0.61, "learning_rate": 0.00020903517798958473, "loss": 0.0197, "step": 233950 }, { "epoch": 0.61, "learning_rate": 0.00020903128977321328, "loss": 0.0165, "step": 233960 }, { "epoch": 0.61, "learning_rate": 0.0002090274015568418, "loss": 0.0195, "step": 233970 }, { "epoch": 0.61, "learning_rate": 0.00020902351334047036, "loss": 0.0158, "step": 233980 }, { "epoch": 0.61, "learning_rate": 0.0002090196251240989, "loss": 0.0127, "step": 233990 }, { "epoch": 0.61, "learning_rate": 0.00020901573690772742, "loss": 0.0187, "step": 234000 }, { "epoch": 0.61, "eval_cer": 0.8817306790618513, "eval_loss": 0.011547002010047436, "eval_runtime": 107.3826, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 234000 }, { "epoch": 0.61, "learning_rate": 0.00020901184869135593, "loss": 0.0155, "step": 234010 }, { "epoch": 0.61, "learning_rate": 0.0002090079604749845, "loss": 0.0163, "step": 234020 }, { "epoch": 0.61, "learning_rate": 0.00020900407225861304, "loss": 0.0171, "step": 234030 }, { "epoch": 0.61, "learning_rate": 0.00020900018404224155, "loss": 0.0206, "step": 234040 }, { "epoch": 0.61, "learning_rate": 0.0002089962958258701, "loss": 0.015, "step": 234050 }, { "epoch": 0.61, "learning_rate": 0.00020899240760949864, "loss": 0.0134, "step": 234060 }, { "epoch": 0.61, "learning_rate": 0.00020898851939312718, "loss": 0.0202, "step": 234070 }, { "epoch": 0.61, "learning_rate": 0.0002089846311767557, "loss": 0.0189, "step": 234080 }, { "epoch": 0.61, "learning_rate": 0.00020898074296038424, "loss": 0.0156, "step": 234090 }, { "epoch": 0.61, "learning_rate": 0.00020897685474401278, "loss": 0.0193, "step": 234100 }, { "epoch": 0.61, "learning_rate": 0.00020897296652764132, "loss": 0.0163, "step": 234110 }, { "epoch": 0.61, "learning_rate": 0.00020896907831126983, "loss": 0.0211, "step": 234120 }, { "epoch": 0.61, "learning_rate": 0.00020896519009489838, "loss": 0.0175, "step": 234130 }, { "epoch": 0.61, "learning_rate": 0.00020896130187852694, "loss": 0.0158, "step": 234140 }, { "epoch": 0.61, "learning_rate": 0.00020895741366215546, "loss": 0.0141, "step": 234150 }, { "epoch": 0.61, "learning_rate": 0.000208953525445784, "loss": 0.0147, "step": 234160 }, { "epoch": 0.61, "learning_rate": 0.00020894963722941251, "loss": 0.017, "step": 234170 }, { "epoch": 0.61, "learning_rate": 0.00020894574901304108, "loss": 0.0198, "step": 234180 }, { "epoch": 0.61, "learning_rate": 0.0002089418607966696, "loss": 0.0139, "step": 234190 }, { "epoch": 0.61, "learning_rate": 0.00020893797258029814, "loss": 0.0175, "step": 234200 }, { "epoch": 0.61, "learning_rate": 0.00020893408436392665, "loss": 0.0138, "step": 234210 }, { "epoch": 0.61, "learning_rate": 0.0002089301961475552, "loss": 0.0136, "step": 234220 }, { "epoch": 0.61, "learning_rate": 0.00020892630793118374, "loss": 0.0177, "step": 234230 }, { "epoch": 0.61, "learning_rate": 0.00020892241971481228, "loss": 0.0137, "step": 234240 }, { "epoch": 0.61, "learning_rate": 0.0002089185314984408, "loss": 0.0145, "step": 234250 }, { "epoch": 0.61, "learning_rate": 0.00020891464328206934, "loss": 0.0165, "step": 234260 }, { "epoch": 0.61, "learning_rate": 0.00020891075506569788, "loss": 0.0154, "step": 234270 }, { "epoch": 0.61, "learning_rate": 0.00020890686684932642, "loss": 0.0167, "step": 234280 }, { "epoch": 0.61, "learning_rate": 0.00020890297863295493, "loss": 0.0146, "step": 234290 }, { "epoch": 0.61, "learning_rate": 0.00020889909041658347, "loss": 0.0182, "step": 234300 }, { "epoch": 0.61, "learning_rate": 0.00020889520220021204, "loss": 0.0159, "step": 234310 }, { "epoch": 0.61, "learning_rate": 0.00020889131398384056, "loss": 0.017, "step": 234320 }, { "epoch": 0.61, "learning_rate": 0.00020888742576746907, "loss": 0.015, "step": 234330 }, { "epoch": 0.61, "learning_rate": 0.00020888353755109761, "loss": 0.0148, "step": 234340 }, { "epoch": 0.61, "learning_rate": 0.00020887964933472618, "loss": 0.0171, "step": 234350 }, { "epoch": 0.61, "learning_rate": 0.0002088757611183547, "loss": 0.0146, "step": 234360 }, { "epoch": 0.61, "learning_rate": 0.00020887187290198324, "loss": 0.0176, "step": 234370 }, { "epoch": 0.61, "learning_rate": 0.00020886798468561175, "loss": 0.0137, "step": 234380 }, { "epoch": 0.61, "learning_rate": 0.00020886409646924032, "loss": 0.0166, "step": 234390 }, { "epoch": 0.61, "learning_rate": 0.00020886020825286884, "loss": 0.016, "step": 234400 }, { "epoch": 0.61, "learning_rate": 0.00020885632003649738, "loss": 0.0161, "step": 234410 }, { "epoch": 0.61, "learning_rate": 0.0002088524318201259, "loss": 0.0185, "step": 234420 }, { "epoch": 0.61, "learning_rate": 0.00020884854360375446, "loss": 0.014, "step": 234430 }, { "epoch": 0.61, "learning_rate": 0.00020884465538738298, "loss": 0.0163, "step": 234440 }, { "epoch": 0.61, "learning_rate": 0.00020884076717101152, "loss": 0.0149, "step": 234450 }, { "epoch": 0.61, "learning_rate": 0.00020883687895464003, "loss": 0.0162, "step": 234460 }, { "epoch": 0.61, "learning_rate": 0.00020883299073826857, "loss": 0.0177, "step": 234470 }, { "epoch": 0.61, "learning_rate": 0.00020882910252189712, "loss": 0.0169, "step": 234480 }, { "epoch": 0.61, "learning_rate": 0.00020882521430552566, "loss": 0.0171, "step": 234490 }, { "epoch": 0.61, "learning_rate": 0.00020882132608915417, "loss": 0.0156, "step": 234500 }, { "epoch": 0.61, "learning_rate": 0.00020881743787278271, "loss": 0.0177, "step": 234510 }, { "epoch": 0.61, "learning_rate": 0.00020881354965641128, "loss": 0.0194, "step": 234520 }, { "epoch": 0.61, "learning_rate": 0.0002088096614400398, "loss": 0.0235, "step": 234530 }, { "epoch": 0.61, "learning_rate": 0.00020880577322366834, "loss": 0.0154, "step": 234540 }, { "epoch": 0.61, "learning_rate": 0.00020880188500729685, "loss": 0.0189, "step": 234550 }, { "epoch": 0.61, "learning_rate": 0.00020879799679092542, "loss": 0.0161, "step": 234560 }, { "epoch": 0.61, "learning_rate": 0.00020879410857455394, "loss": 0.0121, "step": 234570 }, { "epoch": 0.61, "learning_rate": 0.00020879022035818248, "loss": 0.0189, "step": 234580 }, { "epoch": 0.61, "learning_rate": 0.000208786332141811, "loss": 0.0193, "step": 234590 }, { "epoch": 0.61, "learning_rate": 0.00020878244392543956, "loss": 0.0173, "step": 234600 }, { "epoch": 0.61, "learning_rate": 0.00020877855570906808, "loss": 0.0148, "step": 234610 }, { "epoch": 0.61, "learning_rate": 0.00020877466749269662, "loss": 0.0142, "step": 234620 }, { "epoch": 0.61, "learning_rate": 0.00020877077927632513, "loss": 0.0159, "step": 234630 }, { "epoch": 0.61, "learning_rate": 0.0002087668910599537, "loss": 0.0164, "step": 234640 }, { "epoch": 0.61, "learning_rate": 0.00020876300284358222, "loss": 0.0142, "step": 234650 }, { "epoch": 0.61, "learning_rate": 0.00020875911462721076, "loss": 0.0176, "step": 234660 }, { "epoch": 0.61, "learning_rate": 0.00020875522641083927, "loss": 0.0136, "step": 234670 }, { "epoch": 0.61, "learning_rate": 0.00020875133819446784, "loss": 0.0167, "step": 234680 }, { "epoch": 0.61, "learning_rate": 0.00020874744997809638, "loss": 0.0182, "step": 234690 }, { "epoch": 0.61, "learning_rate": 0.0002087435617617249, "loss": 0.017, "step": 234700 }, { "epoch": 0.61, "learning_rate": 0.00020873967354535344, "loss": 0.0184, "step": 234710 }, { "epoch": 0.61, "learning_rate": 0.00020873578532898195, "loss": 0.0181, "step": 234720 }, { "epoch": 0.61, "learning_rate": 0.00020873189711261052, "loss": 0.013, "step": 234730 }, { "epoch": 0.61, "learning_rate": 0.00020872800889623904, "loss": 0.0168, "step": 234740 }, { "epoch": 0.61, "learning_rate": 0.00020872412067986758, "loss": 0.0165, "step": 234750 }, { "epoch": 0.61, "learning_rate": 0.0002087202324634961, "loss": 0.0163, "step": 234760 }, { "epoch": 0.61, "learning_rate": 0.00020871634424712466, "loss": 0.015, "step": 234770 }, { "epoch": 0.61, "learning_rate": 0.00020871245603075318, "loss": 0.018, "step": 234780 }, { "epoch": 0.61, "learning_rate": 0.00020870856781438172, "loss": 0.0165, "step": 234790 }, { "epoch": 0.61, "learning_rate": 0.00020870467959801023, "loss": 0.0141, "step": 234800 }, { "epoch": 0.61, "learning_rate": 0.0002087007913816388, "loss": 0.0165, "step": 234810 }, { "epoch": 0.61, "learning_rate": 0.00020869690316526731, "loss": 0.0173, "step": 234820 }, { "epoch": 0.61, "learning_rate": 0.00020869301494889586, "loss": 0.0147, "step": 234830 }, { "epoch": 0.61, "learning_rate": 0.00020868912673252437, "loss": 0.0171, "step": 234840 }, { "epoch": 0.61, "learning_rate": 0.00020868523851615294, "loss": 0.0198, "step": 234850 }, { "epoch": 0.61, "learning_rate": 0.00020868135029978148, "loss": 0.0167, "step": 234860 }, { "epoch": 0.61, "learning_rate": 0.00020867746208341, "loss": 0.0169, "step": 234870 }, { "epoch": 0.61, "learning_rate": 0.0002086735738670385, "loss": 0.0135, "step": 234880 }, { "epoch": 0.61, "learning_rate": 0.00020866968565066708, "loss": 0.0173, "step": 234890 }, { "epoch": 0.61, "learning_rate": 0.00020866579743429562, "loss": 0.016, "step": 234900 }, { "epoch": 0.61, "learning_rate": 0.00020866190921792414, "loss": 0.0171, "step": 234910 }, { "epoch": 0.61, "learning_rate": 0.00020865802100155268, "loss": 0.021, "step": 234920 }, { "epoch": 0.61, "learning_rate": 0.00020865413278518122, "loss": 0.0159, "step": 234930 }, { "epoch": 0.61, "learning_rate": 0.00020865024456880976, "loss": 0.0168, "step": 234940 }, { "epoch": 0.61, "learning_rate": 0.00020864635635243827, "loss": 0.0193, "step": 234950 }, { "epoch": 0.61, "learning_rate": 0.00020864246813606682, "loss": 0.0177, "step": 234960 }, { "epoch": 0.61, "learning_rate": 0.00020863857991969533, "loss": 0.0151, "step": 234970 }, { "epoch": 0.61, "learning_rate": 0.0002086346917033239, "loss": 0.0158, "step": 234980 }, { "epoch": 0.61, "learning_rate": 0.00020863080348695241, "loss": 0.0198, "step": 234990 }, { "epoch": 0.61, "learning_rate": 0.00020862691527058096, "loss": 0.0213, "step": 235000 }, { "epoch": 0.61, "eval_cer": 0.881704085960102, "eval_loss": 0.010831459425389767, "eval_runtime": 107.169, "eval_samples_per_second": 18.662, "eval_steps_per_second": 4.666, "step": 235000 }, { "epoch": 0.61, "learning_rate": 0.00020862302705420947, "loss": 0.015, "step": 235010 }, { "epoch": 0.61, "learning_rate": 0.00020861913883783804, "loss": 0.0163, "step": 235020 }, { "epoch": 0.61, "learning_rate": 0.00020861525062146658, "loss": 0.0177, "step": 235030 }, { "epoch": 0.61, "learning_rate": 0.0002086113624050951, "loss": 0.0129, "step": 235040 }, { "epoch": 0.61, "learning_rate": 0.0002086074741887236, "loss": 0.0149, "step": 235050 }, { "epoch": 0.61, "learning_rate": 0.00020860358597235218, "loss": 0.0162, "step": 235060 }, { "epoch": 0.61, "learning_rate": 0.00020859969775598072, "loss": 0.0159, "step": 235070 }, { "epoch": 0.61, "learning_rate": 0.00020859580953960923, "loss": 0.0171, "step": 235080 }, { "epoch": 0.61, "learning_rate": 0.00020859192132323778, "loss": 0.0138, "step": 235090 }, { "epoch": 0.61, "learning_rate": 0.00020858803310686632, "loss": 0.0185, "step": 235100 }, { "epoch": 0.61, "learning_rate": 0.00020858414489049486, "loss": 0.0146, "step": 235110 }, { "epoch": 0.61, "learning_rate": 0.00020858025667412337, "loss": 0.0128, "step": 235120 }, { "epoch": 0.61, "learning_rate": 0.00020857636845775192, "loss": 0.0142, "step": 235130 }, { "epoch": 0.61, "learning_rate": 0.00020857248024138046, "loss": 0.0141, "step": 235140 }, { "epoch": 0.61, "learning_rate": 0.000208568592025009, "loss": 0.0214, "step": 235150 }, { "epoch": 0.61, "learning_rate": 0.0002085647038086375, "loss": 0.0149, "step": 235160 }, { "epoch": 0.61, "learning_rate": 0.00020856081559226606, "loss": 0.0167, "step": 235170 }, { "epoch": 0.61, "learning_rate": 0.00020855692737589462, "loss": 0.0168, "step": 235180 }, { "epoch": 0.61, "learning_rate": 0.00020855303915952314, "loss": 0.0157, "step": 235190 }, { "epoch": 0.61, "learning_rate": 0.00020854915094315165, "loss": 0.0156, "step": 235200 }, { "epoch": 0.61, "learning_rate": 0.0002085452627267802, "loss": 0.015, "step": 235210 }, { "epoch": 0.61, "learning_rate": 0.0002085413745104087, "loss": 0.0183, "step": 235220 }, { "epoch": 0.61, "learning_rate": 0.00020853748629403728, "loss": 0.0161, "step": 235230 }, { "epoch": 0.61, "learning_rate": 0.00020853359807766582, "loss": 0.014, "step": 235240 }, { "epoch": 0.61, "learning_rate": 0.00020852970986129433, "loss": 0.0192, "step": 235250 }, { "epoch": 0.61, "learning_rate": 0.00020852582164492288, "loss": 0.0152, "step": 235260 }, { "epoch": 0.61, "learning_rate": 0.00020852193342855142, "loss": 0.0162, "step": 235270 }, { "epoch": 0.61, "learning_rate": 0.00020851804521217996, "loss": 0.015, "step": 235280 }, { "epoch": 0.61, "learning_rate": 0.00020851415699580847, "loss": 0.0145, "step": 235290 }, { "epoch": 0.61, "learning_rate": 0.00020851026877943702, "loss": 0.0149, "step": 235300 }, { "epoch": 0.61, "learning_rate": 0.00020850638056306556, "loss": 0.0171, "step": 235310 }, { "epoch": 0.61, "learning_rate": 0.0002085024923466941, "loss": 0.0137, "step": 235320 }, { "epoch": 0.61, "learning_rate": 0.0002084986041303226, "loss": 0.0189, "step": 235330 }, { "epoch": 0.61, "learning_rate": 0.00020849471591395115, "loss": 0.0139, "step": 235340 }, { "epoch": 0.61, "learning_rate": 0.00020849082769757972, "loss": 0.0126, "step": 235350 }, { "epoch": 0.61, "learning_rate": 0.00020848693948120824, "loss": 0.0153, "step": 235360 }, { "epoch": 0.61, "learning_rate": 0.00020848305126483675, "loss": 0.0159, "step": 235370 }, { "epoch": 0.61, "learning_rate": 0.0002084791630484653, "loss": 0.016, "step": 235380 }, { "epoch": 0.61, "learning_rate": 0.00020847527483209386, "loss": 0.0156, "step": 235390 }, { "epoch": 0.61, "learning_rate": 0.00020847138661572238, "loss": 0.0178, "step": 235400 }, { "epoch": 0.61, "learning_rate": 0.00020846749839935092, "loss": 0.0137, "step": 235410 }, { "epoch": 0.61, "learning_rate": 0.00020846361018297943, "loss": 0.0182, "step": 235420 }, { "epoch": 0.61, "learning_rate": 0.000208459721966608, "loss": 0.0175, "step": 235430 }, { "epoch": 0.61, "learning_rate": 0.00020845583375023652, "loss": 0.0165, "step": 235440 }, { "epoch": 0.61, "learning_rate": 0.00020845194553386506, "loss": 0.0179, "step": 235450 }, { "epoch": 0.61, "learning_rate": 0.00020844805731749357, "loss": 0.0164, "step": 235460 }, { "epoch": 0.61, "learning_rate": 0.00020844416910112211, "loss": 0.0155, "step": 235470 }, { "epoch": 0.61, "learning_rate": 0.00020844028088475066, "loss": 0.0193, "step": 235480 }, { "epoch": 0.61, "learning_rate": 0.0002084363926683792, "loss": 0.0152, "step": 235490 }, { "epoch": 0.61, "learning_rate": 0.0002084325044520077, "loss": 0.0146, "step": 235500 }, { "epoch": 0.61, "learning_rate": 0.00020842861623563625, "loss": 0.0233, "step": 235510 }, { "epoch": 0.61, "learning_rate": 0.0002084247280192648, "loss": 0.0148, "step": 235520 }, { "epoch": 0.61, "learning_rate": 0.00020842083980289334, "loss": 0.0204, "step": 235530 }, { "epoch": 0.61, "learning_rate": 0.00020841695158652185, "loss": 0.0157, "step": 235540 }, { "epoch": 0.61, "learning_rate": 0.0002084130633701504, "loss": 0.0183, "step": 235550 }, { "epoch": 0.61, "learning_rate": 0.00020840917515377896, "loss": 0.0162, "step": 235560 }, { "epoch": 0.61, "learning_rate": 0.00020840528693740748, "loss": 0.016, "step": 235570 }, { "epoch": 0.61, "learning_rate": 0.00020840139872103602, "loss": 0.0193, "step": 235580 }, { "epoch": 0.61, "learning_rate": 0.00020839751050466453, "loss": 0.0156, "step": 235590 }, { "epoch": 0.61, "learning_rate": 0.0002083936222882931, "loss": 0.0192, "step": 235600 }, { "epoch": 0.61, "learning_rate": 0.00020838973407192162, "loss": 0.0197, "step": 235610 }, { "epoch": 0.61, "learning_rate": 0.00020838584585555016, "loss": 0.0125, "step": 235620 }, { "epoch": 0.61, "learning_rate": 0.00020838195763917867, "loss": 0.0161, "step": 235630 }, { "epoch": 0.61, "learning_rate": 0.00020837806942280724, "loss": 0.0215, "step": 235640 }, { "epoch": 0.61, "learning_rate": 0.00020837418120643576, "loss": 0.0176, "step": 235650 }, { "epoch": 0.61, "learning_rate": 0.0002083702929900643, "loss": 0.0162, "step": 235660 }, { "epoch": 0.61, "learning_rate": 0.0002083664047736928, "loss": 0.0136, "step": 235670 }, { "epoch": 0.61, "learning_rate": 0.00020836251655732138, "loss": 0.0145, "step": 235680 }, { "epoch": 0.61, "learning_rate": 0.0002083586283409499, "loss": 0.016, "step": 235690 }, { "epoch": 0.61, "learning_rate": 0.00020835474012457844, "loss": 0.015, "step": 235700 }, { "epoch": 0.61, "learning_rate": 0.00020835085190820695, "loss": 0.015, "step": 235710 }, { "epoch": 0.61, "learning_rate": 0.0002083469636918355, "loss": 0.0139, "step": 235720 }, { "epoch": 0.61, "learning_rate": 0.00020834307547546406, "loss": 0.0143, "step": 235730 }, { "epoch": 0.61, "learning_rate": 0.00020833918725909258, "loss": 0.0166, "step": 235740 }, { "epoch": 0.61, "learning_rate": 0.00020833529904272112, "loss": 0.0159, "step": 235750 }, { "epoch": 0.61, "learning_rate": 0.00020833141082634963, "loss": 0.0182, "step": 235760 }, { "epoch": 0.61, "learning_rate": 0.0002083275226099782, "loss": 0.0153, "step": 235770 }, { "epoch": 0.61, "learning_rate": 0.00020832363439360672, "loss": 0.0172, "step": 235780 }, { "epoch": 0.61, "learning_rate": 0.00020831974617723526, "loss": 0.0156, "step": 235790 }, { "epoch": 0.61, "learning_rate": 0.00020831585796086377, "loss": 0.0234, "step": 235800 }, { "epoch": 0.61, "learning_rate": 0.00020831196974449234, "loss": 0.0152, "step": 235810 }, { "epoch": 0.61, "learning_rate": 0.00020830808152812085, "loss": 0.0164, "step": 235820 }, { "epoch": 0.61, "learning_rate": 0.0002083041933117494, "loss": 0.0189, "step": 235830 }, { "epoch": 0.61, "learning_rate": 0.0002083003050953779, "loss": 0.0159, "step": 235840 }, { "epoch": 0.61, "learning_rate": 0.00020829641687900648, "loss": 0.0152, "step": 235850 }, { "epoch": 0.61, "learning_rate": 0.000208292528662635, "loss": 0.0164, "step": 235860 }, { "epoch": 0.61, "learning_rate": 0.00020828864044626354, "loss": 0.0138, "step": 235870 }, { "epoch": 0.61, "learning_rate": 0.00020828475222989205, "loss": 0.0178, "step": 235880 }, { "epoch": 0.61, "learning_rate": 0.00020828086401352062, "loss": 0.0195, "step": 235890 }, { "epoch": 0.61, "learning_rate": 0.00020827697579714916, "loss": 0.0145, "step": 235900 }, { "epoch": 0.61, "learning_rate": 0.00020827308758077768, "loss": 0.0134, "step": 235910 }, { "epoch": 0.61, "learning_rate": 0.0002082691993644062, "loss": 0.0168, "step": 235920 }, { "epoch": 0.61, "learning_rate": 0.00020826531114803476, "loss": 0.0191, "step": 235930 }, { "epoch": 0.61, "learning_rate": 0.0002082614229316633, "loss": 0.0144, "step": 235940 }, { "epoch": 0.61, "learning_rate": 0.00020825753471529181, "loss": 0.0139, "step": 235950 }, { "epoch": 0.61, "learning_rate": 0.00020825364649892036, "loss": 0.0177, "step": 235960 }, { "epoch": 0.61, "learning_rate": 0.00020824975828254887, "loss": 0.0175, "step": 235970 }, { "epoch": 0.61, "learning_rate": 0.00020824587006617744, "loss": 0.0199, "step": 235980 }, { "epoch": 0.61, "learning_rate": 0.00020824198184980595, "loss": 0.0114, "step": 235990 }, { "epoch": 0.61, "learning_rate": 0.0002082380936334345, "loss": 0.0142, "step": 236000 }, { "epoch": 0.61, "eval_cer": 0.8817376772465223, "eval_loss": 0.011257501319050789, "eval_runtime": 107.2888, "eval_samples_per_second": 18.641, "eval_steps_per_second": 4.66, "step": 236000 }, { "epoch": 0.61, "learning_rate": 0.000208234205417063, "loss": 0.015, "step": 236010 }, { "epoch": 0.61, "learning_rate": 0.00020823031720069158, "loss": 0.0134, "step": 236020 }, { "epoch": 0.61, "learning_rate": 0.0002082264289843201, "loss": 0.0176, "step": 236030 }, { "epoch": 0.61, "learning_rate": 0.00020822254076794864, "loss": 0.0177, "step": 236040 }, { "epoch": 0.61, "learning_rate": 0.00020821865255157715, "loss": 0.0164, "step": 236050 }, { "epoch": 0.61, "learning_rate": 0.00020821476433520572, "loss": 0.0142, "step": 236060 }, { "epoch": 0.61, "learning_rate": 0.00020821087611883423, "loss": 0.0172, "step": 236070 }, { "epoch": 0.61, "learning_rate": 0.00020820698790246277, "loss": 0.0155, "step": 236080 }, { "epoch": 0.61, "learning_rate": 0.0002082030996860913, "loss": 0.0167, "step": 236090 }, { "epoch": 0.61, "learning_rate": 0.00020819921146971986, "loss": 0.0177, "step": 236100 }, { "epoch": 0.61, "learning_rate": 0.0002081953232533484, "loss": 0.0201, "step": 236110 }, { "epoch": 0.61, "learning_rate": 0.00020819143503697691, "loss": 0.0192, "step": 236120 }, { "epoch": 0.61, "learning_rate": 0.00020818754682060546, "loss": 0.0185, "step": 236130 }, { "epoch": 0.61, "learning_rate": 0.000208183658604234, "loss": 0.0148, "step": 236140 }, { "epoch": 0.61, "learning_rate": 0.00020817977038786254, "loss": 0.0174, "step": 236150 }, { "epoch": 0.61, "learning_rate": 0.00020817588217149105, "loss": 0.015, "step": 236160 }, { "epoch": 0.61, "learning_rate": 0.0002081719939551196, "loss": 0.0202, "step": 236170 }, { "epoch": 0.61, "learning_rate": 0.00020816810573874814, "loss": 0.0147, "step": 236180 }, { "epoch": 0.61, "learning_rate": 0.00020816421752237668, "loss": 0.0117, "step": 236190 }, { "epoch": 0.61, "learning_rate": 0.0002081603293060052, "loss": 0.0135, "step": 236200 }, { "epoch": 0.61, "learning_rate": 0.00020815644108963373, "loss": 0.0152, "step": 236210 }, { "epoch": 0.61, "learning_rate": 0.00020815255287326225, "loss": 0.0143, "step": 236220 }, { "epoch": 0.61, "learning_rate": 0.00020814866465689082, "loss": 0.0158, "step": 236230 }, { "epoch": 0.61, "learning_rate": 0.00020814477644051933, "loss": 0.0139, "step": 236240 }, { "epoch": 0.61, "learning_rate": 0.00020814088822414787, "loss": 0.0179, "step": 236250 }, { "epoch": 0.61, "learning_rate": 0.0002081370000077764, "loss": 0.0164, "step": 236260 }, { "epoch": 0.61, "learning_rate": 0.00020813311179140496, "loss": 0.0185, "step": 236270 }, { "epoch": 0.61, "learning_rate": 0.0002081292235750335, "loss": 0.0151, "step": 236280 }, { "epoch": 0.61, "learning_rate": 0.00020812533535866201, "loss": 0.0189, "step": 236290 }, { "epoch": 0.61, "learning_rate": 0.00020812144714229056, "loss": 0.0205, "step": 236300 }, { "epoch": 0.61, "learning_rate": 0.0002081175589259191, "loss": 0.0183, "step": 236310 }, { "epoch": 0.61, "learning_rate": 0.00020811367070954764, "loss": 0.013, "step": 236320 }, { "epoch": 0.61, "learning_rate": 0.00020810978249317615, "loss": 0.0135, "step": 236330 }, { "epoch": 0.61, "learning_rate": 0.0002081058942768047, "loss": 0.0164, "step": 236340 }, { "epoch": 0.61, "learning_rate": 0.00020810200606043324, "loss": 0.0161, "step": 236350 }, { "epoch": 0.61, "learning_rate": 0.00020809811784406178, "loss": 0.0128, "step": 236360 }, { "epoch": 0.61, "learning_rate": 0.0002080942296276903, "loss": 0.0182, "step": 236370 }, { "epoch": 0.61, "learning_rate": 0.00020809034141131883, "loss": 0.0131, "step": 236380 }, { "epoch": 0.61, "learning_rate": 0.00020808645319494738, "loss": 0.0136, "step": 236390 }, { "epoch": 0.61, "learning_rate": 0.00020808256497857592, "loss": 0.016, "step": 236400 }, { "epoch": 0.61, "learning_rate": 0.00020807867676220443, "loss": 0.0137, "step": 236410 }, { "epoch": 0.61, "learning_rate": 0.00020807478854583297, "loss": 0.0166, "step": 236420 }, { "epoch": 0.61, "learning_rate": 0.00020807090032946154, "loss": 0.0136, "step": 236430 }, { "epoch": 0.61, "learning_rate": 0.00020806701211309006, "loss": 0.0132, "step": 236440 }, { "epoch": 0.61, "learning_rate": 0.0002080631238967186, "loss": 0.0152, "step": 236450 }, { "epoch": 0.61, "learning_rate": 0.0002080592356803471, "loss": 0.0168, "step": 236460 }, { "epoch": 0.61, "learning_rate": 0.00020805534746397563, "loss": 0.0138, "step": 236470 }, { "epoch": 0.61, "learning_rate": 0.0002080514592476042, "loss": 0.0127, "step": 236480 }, { "epoch": 0.61, "learning_rate": 0.00020804757103123274, "loss": 0.0157, "step": 236490 }, { "epoch": 0.61, "learning_rate": 0.00020804368281486125, "loss": 0.0161, "step": 236500 }, { "epoch": 0.61, "learning_rate": 0.0002080397945984898, "loss": 0.017, "step": 236510 }, { "epoch": 0.61, "learning_rate": 0.00020803590638211834, "loss": 0.0132, "step": 236520 }, { "epoch": 0.61, "learning_rate": 0.00020803201816574688, "loss": 0.013, "step": 236530 }, { "epoch": 0.61, "learning_rate": 0.0002080281299493754, "loss": 0.0197, "step": 236540 }, { "epoch": 0.61, "learning_rate": 0.00020802424173300393, "loss": 0.0182, "step": 236550 }, { "epoch": 0.61, "learning_rate": 0.00020802035351663248, "loss": 0.0172, "step": 236560 }, { "epoch": 0.61, "learning_rate": 0.00020801646530026102, "loss": 0.0132, "step": 236570 }, { "epoch": 0.61, "learning_rate": 0.00020801257708388953, "loss": 0.0159, "step": 236580 }, { "epoch": 0.61, "learning_rate": 0.00020800868886751807, "loss": 0.0149, "step": 236590 }, { "epoch": 0.61, "learning_rate": 0.00020800480065114664, "loss": 0.02, "step": 236600 }, { "epoch": 0.61, "learning_rate": 0.00020800091243477516, "loss": 0.0144, "step": 236610 }, { "epoch": 0.61, "learning_rate": 0.0002079970242184037, "loss": 0.0133, "step": 236620 }, { "epoch": 0.61, "learning_rate": 0.0002079931360020322, "loss": 0.016, "step": 236630 }, { "epoch": 0.61, "learning_rate": 0.00020798924778566078, "loss": 0.0158, "step": 236640 }, { "epoch": 0.61, "learning_rate": 0.0002079853595692893, "loss": 0.0151, "step": 236650 }, { "epoch": 0.61, "learning_rate": 0.00020798147135291784, "loss": 0.0151, "step": 236660 }, { "epoch": 0.61, "learning_rate": 0.00020797758313654635, "loss": 0.0161, "step": 236670 }, { "epoch": 0.61, "learning_rate": 0.00020797369492017492, "loss": 0.019, "step": 236680 }, { "epoch": 0.61, "learning_rate": 0.00020796980670380344, "loss": 0.0125, "step": 236690 }, { "epoch": 0.61, "learning_rate": 0.00020796591848743198, "loss": 0.0132, "step": 236700 }, { "epoch": 0.61, "learning_rate": 0.0002079620302710605, "loss": 0.0148, "step": 236710 }, { "epoch": 0.61, "learning_rate": 0.00020795814205468903, "loss": 0.0166, "step": 236720 }, { "epoch": 0.61, "learning_rate": 0.00020795425383831757, "loss": 0.0125, "step": 236730 }, { "epoch": 0.61, "learning_rate": 0.00020795036562194612, "loss": 0.0172, "step": 236740 }, { "epoch": 0.61, "learning_rate": 0.00020794647740557463, "loss": 0.0158, "step": 236750 }, { "epoch": 0.61, "learning_rate": 0.00020794258918920317, "loss": 0.0186, "step": 236760 }, { "epoch": 0.61, "learning_rate": 0.00020793870097283174, "loss": 0.0167, "step": 236770 }, { "epoch": 0.61, "learning_rate": 0.00020793481275646026, "loss": 0.0188, "step": 236780 }, { "epoch": 0.61, "learning_rate": 0.00020793092454008877, "loss": 0.0151, "step": 236790 }, { "epoch": 0.61, "learning_rate": 0.0002079270363237173, "loss": 0.0147, "step": 236800 }, { "epoch": 0.61, "learning_rate": 0.00020792314810734588, "loss": 0.0122, "step": 236810 }, { "epoch": 0.61, "learning_rate": 0.0002079192598909744, "loss": 0.0174, "step": 236820 }, { "epoch": 0.61, "learning_rate": 0.00020791537167460294, "loss": 0.0157, "step": 236830 }, { "epoch": 0.61, "learning_rate": 0.00020791148345823145, "loss": 0.0143, "step": 236840 }, { "epoch": 0.61, "learning_rate": 0.00020790759524186002, "loss": 0.0129, "step": 236850 }, { "epoch": 0.61, "learning_rate": 0.00020790370702548853, "loss": 0.0192, "step": 236860 }, { "epoch": 0.61, "learning_rate": 0.00020789981880911708, "loss": 0.019, "step": 236870 }, { "epoch": 0.61, "learning_rate": 0.0002078959305927456, "loss": 0.0179, "step": 236880 }, { "epoch": 0.61, "learning_rate": 0.00020789204237637416, "loss": 0.0189, "step": 236890 }, { "epoch": 0.61, "learning_rate": 0.00020788815416000267, "loss": 0.0164, "step": 236900 }, { "epoch": 0.61, "learning_rate": 0.00020788426594363122, "loss": 0.0134, "step": 236910 }, { "epoch": 0.61, "learning_rate": 0.00020788037772725973, "loss": 0.0159, "step": 236920 }, { "epoch": 0.61, "learning_rate": 0.0002078764895108883, "loss": 0.018, "step": 236930 }, { "epoch": 0.61, "learning_rate": 0.00020787260129451684, "loss": 0.0144, "step": 236940 }, { "epoch": 0.61, "learning_rate": 0.00020786871307814536, "loss": 0.0177, "step": 236950 }, { "epoch": 0.61, "learning_rate": 0.00020786482486177387, "loss": 0.0158, "step": 236960 }, { "epoch": 0.61, "learning_rate": 0.0002078609366454024, "loss": 0.0177, "step": 236970 }, { "epoch": 0.61, "learning_rate": 0.00020785704842903098, "loss": 0.0151, "step": 236980 }, { "epoch": 0.61, "learning_rate": 0.0002078531602126595, "loss": 0.0203, "step": 236990 }, { "epoch": 0.61, "learning_rate": 0.00020784927199628804, "loss": 0.0132, "step": 237000 }, { "epoch": 0.61, "eval_cer": 0.8817908634500211, "eval_loss": 0.011273314245045185, "eval_runtime": 107.1971, "eval_samples_per_second": 18.657, "eval_steps_per_second": 4.664, "step": 237000 }, { "epoch": 0.61, "learning_rate": 0.00020784538377991655, "loss": 0.0184, "step": 237010 }, { "epoch": 0.61, "learning_rate": 0.00020784149556354512, "loss": 0.0164, "step": 237020 }, { "epoch": 0.61, "learning_rate": 0.00020783760734717363, "loss": 0.0196, "step": 237030 }, { "epoch": 0.61, "learning_rate": 0.00020783371913080218, "loss": 0.0176, "step": 237040 }, { "epoch": 0.61, "learning_rate": 0.0002078298309144307, "loss": 0.0153, "step": 237050 }, { "epoch": 0.61, "learning_rate": 0.00020782594269805926, "loss": 0.0163, "step": 237060 }, { "epoch": 0.61, "learning_rate": 0.00020782205448168777, "loss": 0.0149, "step": 237070 }, { "epoch": 0.61, "learning_rate": 0.00020781816626531632, "loss": 0.0181, "step": 237080 }, { "epoch": 0.61, "learning_rate": 0.00020781427804894483, "loss": 0.0136, "step": 237090 }, { "epoch": 0.61, "learning_rate": 0.0002078103898325734, "loss": 0.0215, "step": 237100 }, { "epoch": 0.61, "learning_rate": 0.0002078065016162019, "loss": 0.0142, "step": 237110 }, { "epoch": 0.61, "learning_rate": 0.00020780261339983045, "loss": 0.0179, "step": 237120 }, { "epoch": 0.61, "learning_rate": 0.00020779872518345897, "loss": 0.0206, "step": 237130 }, { "epoch": 0.61, "learning_rate": 0.00020779483696708754, "loss": 0.0134, "step": 237140 }, { "epoch": 0.61, "learning_rate": 0.00020779094875071608, "loss": 0.017, "step": 237150 }, { "epoch": 0.61, "learning_rate": 0.0002077870605343446, "loss": 0.0202, "step": 237160 }, { "epoch": 0.61, "learning_rate": 0.00020778317231797314, "loss": 0.0167, "step": 237170 }, { "epoch": 0.61, "learning_rate": 0.00020777928410160168, "loss": 0.0147, "step": 237180 }, { "epoch": 0.61, "learning_rate": 0.00020777539588523022, "loss": 0.0198, "step": 237190 }, { "epoch": 0.61, "learning_rate": 0.00020777150766885873, "loss": 0.0188, "step": 237200 }, { "epoch": 0.61, "learning_rate": 0.00020776761945248728, "loss": 0.0152, "step": 237210 }, { "epoch": 0.61, "learning_rate": 0.0002077637312361158, "loss": 0.0217, "step": 237220 }, { "epoch": 0.61, "learning_rate": 0.00020775984301974436, "loss": 0.0177, "step": 237230 }, { "epoch": 0.61, "learning_rate": 0.00020775595480337287, "loss": 0.0179, "step": 237240 }, { "epoch": 0.61, "learning_rate": 0.00020775206658700141, "loss": 0.0174, "step": 237250 }, { "epoch": 0.62, "learning_rate": 0.00020774817837062993, "loss": 0.0154, "step": 237260 }, { "epoch": 0.62, "learning_rate": 0.0002077442901542585, "loss": 0.0177, "step": 237270 }, { "epoch": 0.62, "learning_rate": 0.000207740401937887, "loss": 0.0133, "step": 237280 }, { "epoch": 0.62, "learning_rate": 0.00020773651372151555, "loss": 0.0163, "step": 237290 }, { "epoch": 0.62, "learning_rate": 0.00020773262550514407, "loss": 0.0136, "step": 237300 }, { "epoch": 0.62, "learning_rate": 0.00020772873728877264, "loss": 0.0145, "step": 237310 }, { "epoch": 0.62, "learning_rate": 0.00020772484907240118, "loss": 0.0143, "step": 237320 }, { "epoch": 0.62, "learning_rate": 0.0002077209608560297, "loss": 0.0147, "step": 237330 }, { "epoch": 0.62, "learning_rate": 0.00020771707263965824, "loss": 0.0192, "step": 237340 }, { "epoch": 0.62, "learning_rate": 0.00020771318442328678, "loss": 0.0156, "step": 237350 }, { "epoch": 0.62, "learning_rate": 0.00020770929620691532, "loss": 0.0174, "step": 237360 }, { "epoch": 0.62, "learning_rate": 0.00020770540799054383, "loss": 0.0151, "step": 237370 }, { "epoch": 0.62, "learning_rate": 0.00020770151977417237, "loss": 0.0175, "step": 237380 }, { "epoch": 0.62, "learning_rate": 0.00020769763155780092, "loss": 0.0184, "step": 237390 }, { "epoch": 0.62, "learning_rate": 0.00020769374334142946, "loss": 0.02, "step": 237400 }, { "epoch": 0.62, "learning_rate": 0.00020768985512505797, "loss": 0.0147, "step": 237410 }, { "epoch": 0.62, "learning_rate": 0.00020768596690868651, "loss": 0.0147, "step": 237420 }, { "epoch": 0.62, "learning_rate": 0.00020768207869231506, "loss": 0.0162, "step": 237430 }, { "epoch": 0.62, "learning_rate": 0.0002076781904759436, "loss": 0.0178, "step": 237440 }, { "epoch": 0.62, "learning_rate": 0.0002076743022595721, "loss": 0.0188, "step": 237450 }, { "epoch": 0.62, "learning_rate": 0.00020767041404320065, "loss": 0.0158, "step": 237460 }, { "epoch": 0.62, "learning_rate": 0.00020766652582682917, "loss": 0.0171, "step": 237470 }, { "epoch": 0.62, "learning_rate": 0.00020766263761045774, "loss": 0.0135, "step": 237480 }, { "epoch": 0.62, "learning_rate": 0.00020765874939408628, "loss": 0.018, "step": 237490 }, { "epoch": 0.62, "learning_rate": 0.0002076548611777148, "loss": 0.0115, "step": 237500 }, { "epoch": 0.62, "learning_rate": 0.0002076509729613433, "loss": 0.0193, "step": 237510 }, { "epoch": 0.62, "learning_rate": 0.00020764708474497188, "loss": 0.0169, "step": 237520 }, { "epoch": 0.62, "learning_rate": 0.00020764319652860042, "loss": 0.0165, "step": 237530 }, { "epoch": 0.62, "learning_rate": 0.00020763930831222893, "loss": 0.016, "step": 237540 }, { "epoch": 0.62, "learning_rate": 0.00020763542009585747, "loss": 0.0167, "step": 237550 }, { "epoch": 0.62, "learning_rate": 0.00020763153187948602, "loss": 0.0224, "step": 237560 }, { "epoch": 0.62, "learning_rate": 0.00020762764366311456, "loss": 0.0151, "step": 237570 }, { "epoch": 0.62, "learning_rate": 0.00020762375544674307, "loss": 0.0125, "step": 237580 }, { "epoch": 0.62, "learning_rate": 0.0002076198672303716, "loss": 0.0156, "step": 237590 }, { "epoch": 0.62, "learning_rate": 0.00020761597901400016, "loss": 0.018, "step": 237600 }, { "epoch": 0.62, "learning_rate": 0.0002076120907976287, "loss": 0.0155, "step": 237610 }, { "epoch": 0.62, "learning_rate": 0.0002076082025812572, "loss": 0.0158, "step": 237620 }, { "epoch": 0.62, "learning_rate": 0.00020760431436488575, "loss": 0.0155, "step": 237630 }, { "epoch": 0.62, "learning_rate": 0.00020760042614851432, "loss": 0.0173, "step": 237640 }, { "epoch": 0.62, "learning_rate": 0.00020759653793214284, "loss": 0.0198, "step": 237650 }, { "epoch": 0.62, "learning_rate": 0.00020759264971577135, "loss": 0.0182, "step": 237660 }, { "epoch": 0.62, "learning_rate": 0.0002075887614993999, "loss": 0.0211, "step": 237670 }, { "epoch": 0.62, "learning_rate": 0.00020758487328302846, "loss": 0.015, "step": 237680 }, { "epoch": 0.62, "learning_rate": 0.00020758098506665698, "loss": 0.0156, "step": 237690 }, { "epoch": 0.62, "learning_rate": 0.00020757709685028552, "loss": 0.0172, "step": 237700 }, { "epoch": 0.62, "learning_rate": 0.00020757320863391403, "loss": 0.0136, "step": 237710 }, { "epoch": 0.62, "learning_rate": 0.00020756932041754257, "loss": 0.0148, "step": 237720 }, { "epoch": 0.62, "learning_rate": 0.00020756543220117112, "loss": 0.0158, "step": 237730 }, { "epoch": 0.62, "learning_rate": 0.00020756154398479966, "loss": 0.0169, "step": 237740 }, { "epoch": 0.62, "learning_rate": 0.00020755765576842817, "loss": 0.0127, "step": 237750 }, { "epoch": 0.62, "learning_rate": 0.0002075537675520567, "loss": 0.0146, "step": 237760 }, { "epoch": 0.62, "learning_rate": 0.00020754987933568525, "loss": 0.0174, "step": 237770 }, { "epoch": 0.62, "learning_rate": 0.0002075459911193138, "loss": 0.0169, "step": 237780 }, { "epoch": 0.62, "learning_rate": 0.0002075421029029423, "loss": 0.0166, "step": 237790 }, { "epoch": 0.62, "learning_rate": 0.00020753821468657085, "loss": 0.0161, "step": 237800 }, { "epoch": 0.62, "learning_rate": 0.00020753432647019942, "loss": 0.0141, "step": 237810 }, { "epoch": 0.62, "learning_rate": 0.00020753043825382794, "loss": 0.0146, "step": 237820 }, { "epoch": 0.62, "learning_rate": 0.00020752655003745645, "loss": 0.0148, "step": 237830 }, { "epoch": 0.62, "learning_rate": 0.000207522661821085, "loss": 0.013, "step": 237840 }, { "epoch": 0.62, "learning_rate": 0.00020751877360471356, "loss": 0.0121, "step": 237850 }, { "epoch": 0.62, "learning_rate": 0.00020751488538834208, "loss": 0.0161, "step": 237860 }, { "epoch": 0.62, "learning_rate": 0.00020751099717197062, "loss": 0.0184, "step": 237870 }, { "epoch": 0.62, "learning_rate": 0.00020750710895559913, "loss": 0.0162, "step": 237880 }, { "epoch": 0.62, "learning_rate": 0.0002075032207392277, "loss": 0.0142, "step": 237890 }, { "epoch": 0.62, "learning_rate": 0.00020749933252285621, "loss": 0.0163, "step": 237900 }, { "epoch": 0.62, "learning_rate": 0.00020749544430648476, "loss": 0.0137, "step": 237910 }, { "epoch": 0.62, "learning_rate": 0.00020749155609011327, "loss": 0.0207, "step": 237920 }, { "epoch": 0.62, "learning_rate": 0.00020748766787374184, "loss": 0.0163, "step": 237930 }, { "epoch": 0.62, "learning_rate": 0.00020748377965737035, "loss": 0.0193, "step": 237940 }, { "epoch": 0.62, "learning_rate": 0.0002074798914409989, "loss": 0.0161, "step": 237950 }, { "epoch": 0.62, "learning_rate": 0.0002074760032246274, "loss": 0.0155, "step": 237960 }, { "epoch": 0.62, "learning_rate": 0.00020747211500825595, "loss": 0.0198, "step": 237970 }, { "epoch": 0.62, "learning_rate": 0.0002074682267918845, "loss": 0.016, "step": 237980 }, { "epoch": 0.62, "learning_rate": 0.00020746433857551304, "loss": 0.0142, "step": 237990 }, { "epoch": 0.62, "learning_rate": 0.00020746045035914155, "loss": 0.0152, "step": 238000 }, { "epoch": 0.62, "eval_cer": 0.8817488743419957, "eval_loss": 0.01096505206078291, "eval_runtime": 107.3808, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 238000 }, { "epoch": 0.62, "learning_rate": 0.0002074565621427701, "loss": 0.0163, "step": 238010 }, { "epoch": 0.62, "learning_rate": 0.00020745267392639866, "loss": 0.0175, "step": 238020 }, { "epoch": 0.62, "learning_rate": 0.00020744878571002717, "loss": 0.0179, "step": 238030 }, { "epoch": 0.62, "learning_rate": 0.00020744489749365572, "loss": 0.0163, "step": 238040 }, { "epoch": 0.62, "learning_rate": 0.00020744100927728423, "loss": 0.0147, "step": 238050 }, { "epoch": 0.62, "learning_rate": 0.0002074371210609128, "loss": 0.0256, "step": 238060 }, { "epoch": 0.62, "learning_rate": 0.00020743323284454131, "loss": 0.0223, "step": 238070 }, { "epoch": 0.62, "learning_rate": 0.00020742934462816986, "loss": 0.0172, "step": 238080 }, { "epoch": 0.62, "learning_rate": 0.00020742545641179837, "loss": 0.0153, "step": 238090 }, { "epoch": 0.62, "learning_rate": 0.00020742156819542694, "loss": 0.0157, "step": 238100 }, { "epoch": 0.62, "learning_rate": 0.00020741767997905545, "loss": 0.0158, "step": 238110 }, { "epoch": 0.62, "learning_rate": 0.000207413791762684, "loss": 0.0131, "step": 238120 }, { "epoch": 0.62, "learning_rate": 0.0002074099035463125, "loss": 0.0155, "step": 238130 }, { "epoch": 0.62, "learning_rate": 0.00020740601532994108, "loss": 0.0161, "step": 238140 }, { "epoch": 0.62, "learning_rate": 0.0002074021271135696, "loss": 0.0182, "step": 238150 }, { "epoch": 0.62, "learning_rate": 0.00020739823889719813, "loss": 0.0186, "step": 238160 }, { "epoch": 0.62, "learning_rate": 0.00020739435068082665, "loss": 0.0176, "step": 238170 }, { "epoch": 0.62, "learning_rate": 0.00020739046246445522, "loss": 0.0168, "step": 238180 }, { "epoch": 0.62, "learning_rate": 0.00020738657424808376, "loss": 0.0153, "step": 238190 }, { "epoch": 0.62, "learning_rate": 0.00020738268603171227, "loss": 0.0147, "step": 238200 }, { "epoch": 0.62, "learning_rate": 0.00020737879781534082, "loss": 0.0165, "step": 238210 }, { "epoch": 0.62, "learning_rate": 0.00020737490959896933, "loss": 0.0179, "step": 238220 }, { "epoch": 0.62, "learning_rate": 0.0002073710213825979, "loss": 0.0146, "step": 238230 }, { "epoch": 0.62, "learning_rate": 0.0002073671331662264, "loss": 0.0174, "step": 238240 }, { "epoch": 0.62, "learning_rate": 0.00020736324494985496, "loss": 0.0138, "step": 238250 }, { "epoch": 0.62, "learning_rate": 0.00020735935673348347, "loss": 0.0124, "step": 238260 }, { "epoch": 0.62, "learning_rate": 0.00020735546851711204, "loss": 0.0167, "step": 238270 }, { "epoch": 0.62, "learning_rate": 0.00020735158030074055, "loss": 0.0171, "step": 238280 }, { "epoch": 0.62, "learning_rate": 0.0002073476920843691, "loss": 0.0147, "step": 238290 }, { "epoch": 0.62, "learning_rate": 0.0002073438038679976, "loss": 0.0151, "step": 238300 }, { "epoch": 0.62, "learning_rate": 0.00020733991565162618, "loss": 0.0145, "step": 238310 }, { "epoch": 0.62, "learning_rate": 0.0002073360274352547, "loss": 0.0186, "step": 238320 }, { "epoch": 0.62, "learning_rate": 0.00020733213921888323, "loss": 0.02, "step": 238330 }, { "epoch": 0.62, "learning_rate": 0.00020732825100251175, "loss": 0.0177, "step": 238340 }, { "epoch": 0.62, "learning_rate": 0.00020732436278614032, "loss": 0.0168, "step": 238350 }, { "epoch": 0.62, "learning_rate": 0.00020732047456976886, "loss": 0.0124, "step": 238360 }, { "epoch": 0.62, "learning_rate": 0.00020731658635339737, "loss": 0.0166, "step": 238370 }, { "epoch": 0.62, "learning_rate": 0.0002073126981370259, "loss": 0.0106, "step": 238380 }, { "epoch": 0.62, "learning_rate": 0.00020730880992065446, "loss": 0.018, "step": 238390 }, { "epoch": 0.62, "learning_rate": 0.000207304921704283, "loss": 0.0165, "step": 238400 }, { "epoch": 0.62, "learning_rate": 0.0002073010334879115, "loss": 0.0175, "step": 238410 }, { "epoch": 0.62, "learning_rate": 0.00020729714527154005, "loss": 0.0172, "step": 238420 }, { "epoch": 0.62, "learning_rate": 0.0002072932570551686, "loss": 0.0213, "step": 238430 }, { "epoch": 0.62, "learning_rate": 0.00020728936883879714, "loss": 0.0167, "step": 238440 }, { "epoch": 0.62, "learning_rate": 0.00020728548062242565, "loss": 0.0139, "step": 238450 }, { "epoch": 0.62, "learning_rate": 0.0002072815924060542, "loss": 0.0189, "step": 238460 }, { "epoch": 0.62, "learning_rate": 0.0002072777041896827, "loss": 0.0136, "step": 238470 }, { "epoch": 0.62, "learning_rate": 0.00020727381597331128, "loss": 0.0181, "step": 238480 }, { "epoch": 0.62, "learning_rate": 0.0002072699277569398, "loss": 0.0169, "step": 238490 }, { "epoch": 0.62, "learning_rate": 0.00020726603954056833, "loss": 0.0149, "step": 238500 }, { "epoch": 0.62, "learning_rate": 0.00020726215132419685, "loss": 0.0157, "step": 238510 }, { "epoch": 0.62, "learning_rate": 0.00020725826310782542, "loss": 0.0139, "step": 238520 }, { "epoch": 0.62, "learning_rate": 0.00020725437489145396, "loss": 0.0153, "step": 238530 }, { "epoch": 0.62, "learning_rate": 0.00020725048667508247, "loss": 0.0112, "step": 238540 }, { "epoch": 0.62, "learning_rate": 0.000207246598458711, "loss": 0.0126, "step": 238550 }, { "epoch": 0.62, "learning_rate": 0.00020724271024233956, "loss": 0.0189, "step": 238560 }, { "epoch": 0.62, "learning_rate": 0.0002072388220259681, "loss": 0.0143, "step": 238570 }, { "epoch": 0.62, "learning_rate": 0.0002072349338095966, "loss": 0.0157, "step": 238580 }, { "epoch": 0.62, "learning_rate": 0.00020723104559322515, "loss": 0.0127, "step": 238590 }, { "epoch": 0.62, "learning_rate": 0.0002072271573768537, "loss": 0.0206, "step": 238600 }, { "epoch": 0.62, "learning_rate": 0.00020722326916048224, "loss": 0.0168, "step": 238610 }, { "epoch": 0.62, "learning_rate": 0.00020721938094411075, "loss": 0.0131, "step": 238620 }, { "epoch": 0.62, "learning_rate": 0.0002072154927277393, "loss": 0.0129, "step": 238630 }, { "epoch": 0.62, "learning_rate": 0.00020721160451136783, "loss": 0.0146, "step": 238640 }, { "epoch": 0.62, "learning_rate": 0.00020720771629499638, "loss": 0.0104, "step": 238650 }, { "epoch": 0.62, "learning_rate": 0.0002072038280786249, "loss": 0.0157, "step": 238660 }, { "epoch": 0.62, "learning_rate": 0.00020719993986225343, "loss": 0.0151, "step": 238670 }, { "epoch": 0.62, "learning_rate": 0.00020719605164588195, "loss": 0.0214, "step": 238680 }, { "epoch": 0.62, "learning_rate": 0.00020719216342951052, "loss": 0.0167, "step": 238690 }, { "epoch": 0.62, "learning_rate": 0.00020718827521313903, "loss": 0.0163, "step": 238700 }, { "epoch": 0.62, "learning_rate": 0.00020718438699676757, "loss": 0.0166, "step": 238710 }, { "epoch": 0.62, "learning_rate": 0.0002071804987803961, "loss": 0.0189, "step": 238720 }, { "epoch": 0.62, "learning_rate": 0.00020717661056402466, "loss": 0.0168, "step": 238730 }, { "epoch": 0.62, "learning_rate": 0.0002071727223476532, "loss": 0.014, "step": 238740 }, { "epoch": 0.62, "learning_rate": 0.0002071688341312817, "loss": 0.0184, "step": 238750 }, { "epoch": 0.62, "learning_rate": 0.00020716494591491025, "loss": 0.0132, "step": 238760 }, { "epoch": 0.62, "learning_rate": 0.0002071610576985388, "loss": 0.0194, "step": 238770 }, { "epoch": 0.62, "learning_rate": 0.00020715716948216734, "loss": 0.0154, "step": 238780 }, { "epoch": 0.62, "learning_rate": 0.00020715328126579585, "loss": 0.0195, "step": 238790 }, { "epoch": 0.62, "learning_rate": 0.0002071493930494244, "loss": 0.018, "step": 238800 }, { "epoch": 0.62, "learning_rate": 0.00020714550483305293, "loss": 0.014, "step": 238810 }, { "epoch": 0.62, "learning_rate": 0.00020714161661668148, "loss": 0.0128, "step": 238820 }, { "epoch": 0.62, "learning_rate": 0.00020713772840031, "loss": 0.0149, "step": 238830 }, { "epoch": 0.62, "learning_rate": 0.00020713384018393853, "loss": 0.0185, "step": 238840 }, { "epoch": 0.62, "learning_rate": 0.00020712995196756707, "loss": 0.0187, "step": 238850 }, { "epoch": 0.62, "learning_rate": 0.00020712606375119562, "loss": 0.0177, "step": 238860 }, { "epoch": 0.62, "learning_rate": 0.00020712217553482413, "loss": 0.0138, "step": 238870 }, { "epoch": 0.62, "learning_rate": 0.00020711828731845267, "loss": 0.0162, "step": 238880 }, { "epoch": 0.62, "learning_rate": 0.00020711439910208124, "loss": 0.0146, "step": 238890 }, { "epoch": 0.62, "learning_rate": 0.00020711051088570975, "loss": 0.016, "step": 238900 }, { "epoch": 0.62, "learning_rate": 0.0002071066226693383, "loss": 0.0137, "step": 238910 }, { "epoch": 0.62, "learning_rate": 0.0002071027344529668, "loss": 0.0151, "step": 238920 }, { "epoch": 0.62, "learning_rate": 0.00020709884623659535, "loss": 0.0152, "step": 238930 }, { "epoch": 0.62, "learning_rate": 0.0002070949580202239, "loss": 0.0196, "step": 238940 }, { "epoch": 0.62, "learning_rate": 0.00020709106980385244, "loss": 0.0142, "step": 238950 }, { "epoch": 0.62, "learning_rate": 0.00020708718158748095, "loss": 0.0158, "step": 238960 }, { "epoch": 0.62, "learning_rate": 0.0002070832933711095, "loss": 0.0182, "step": 238970 }, { "epoch": 0.62, "learning_rate": 0.00020707940515473803, "loss": 0.0156, "step": 238980 }, { "epoch": 0.62, "learning_rate": 0.00020707551693836658, "loss": 0.0147, "step": 238990 }, { "epoch": 0.62, "learning_rate": 0.0002070716287219951, "loss": 0.0146, "step": 239000 }, { "epoch": 0.62, "eval_cer": 0.8817236808771804, "eval_loss": 0.011040524579584599, "eval_runtime": 107.4536, "eval_samples_per_second": 18.613, "eval_steps_per_second": 4.653, "step": 239000 }, { "epoch": 0.62, "learning_rate": 0.00020706774050562363, "loss": 0.0144, "step": 239010 }, { "epoch": 0.62, "learning_rate": 0.00020706385228925217, "loss": 0.0217, "step": 239020 }, { "epoch": 0.62, "learning_rate": 0.00020705996407288071, "loss": 0.0157, "step": 239030 }, { "epoch": 0.62, "learning_rate": 0.00020705607585650923, "loss": 0.0138, "step": 239040 }, { "epoch": 0.62, "learning_rate": 0.00020705218764013777, "loss": 0.0167, "step": 239050 }, { "epoch": 0.62, "learning_rate": 0.00020704829942376634, "loss": 0.0188, "step": 239060 }, { "epoch": 0.62, "learning_rate": 0.00020704441120739485, "loss": 0.0139, "step": 239070 }, { "epoch": 0.62, "learning_rate": 0.0002070405229910234, "loss": 0.0108, "step": 239080 }, { "epoch": 0.62, "learning_rate": 0.0002070366347746519, "loss": 0.015, "step": 239090 }, { "epoch": 0.62, "learning_rate": 0.00020703274655828048, "loss": 0.017, "step": 239100 }, { "epoch": 0.62, "learning_rate": 0.000207028858341909, "loss": 0.0127, "step": 239110 }, { "epoch": 0.62, "learning_rate": 0.00020702497012553754, "loss": 0.0187, "step": 239120 }, { "epoch": 0.62, "learning_rate": 0.00020702108190916605, "loss": 0.0178, "step": 239130 }, { "epoch": 0.62, "learning_rate": 0.00020701719369279462, "loss": 0.0116, "step": 239140 }, { "epoch": 0.62, "learning_rate": 0.00020701330547642313, "loss": 0.018, "step": 239150 }, { "epoch": 0.62, "learning_rate": 0.00020700941726005167, "loss": 0.0163, "step": 239160 }, { "epoch": 0.62, "learning_rate": 0.0002070055290436802, "loss": 0.0118, "step": 239170 }, { "epoch": 0.62, "learning_rate": 0.00020700164082730873, "loss": 0.0171, "step": 239180 }, { "epoch": 0.62, "learning_rate": 0.00020699775261093727, "loss": 0.0176, "step": 239190 }, { "epoch": 0.62, "learning_rate": 0.00020699386439456581, "loss": 0.0148, "step": 239200 }, { "epoch": 0.62, "learning_rate": 0.00020698997617819433, "loss": 0.0154, "step": 239210 }, { "epoch": 0.62, "learning_rate": 0.00020698608796182287, "loss": 0.0136, "step": 239220 }, { "epoch": 0.62, "learning_rate": 0.00020698219974545144, "loss": 0.0136, "step": 239230 }, { "epoch": 0.62, "learning_rate": 0.00020697831152907995, "loss": 0.0143, "step": 239240 }, { "epoch": 0.62, "learning_rate": 0.00020697442331270847, "loss": 0.0135, "step": 239250 }, { "epoch": 0.62, "learning_rate": 0.000206970535096337, "loss": 0.0133, "step": 239260 }, { "epoch": 0.62, "learning_rate": 0.00020696664687996558, "loss": 0.0211, "step": 239270 }, { "epoch": 0.62, "learning_rate": 0.0002069627586635941, "loss": 0.0163, "step": 239280 }, { "epoch": 0.62, "learning_rate": 0.00020695887044722263, "loss": 0.0158, "step": 239290 }, { "epoch": 0.62, "learning_rate": 0.00020695498223085115, "loss": 0.0159, "step": 239300 }, { "epoch": 0.62, "learning_rate": 0.00020695109401447972, "loss": 0.0187, "step": 239310 }, { "epoch": 0.62, "learning_rate": 0.00020694720579810823, "loss": 0.0158, "step": 239320 }, { "epoch": 0.62, "learning_rate": 0.00020694331758173677, "loss": 0.0164, "step": 239330 }, { "epoch": 0.62, "learning_rate": 0.0002069394293653653, "loss": 0.0194, "step": 239340 }, { "epoch": 0.62, "learning_rate": 0.00020693554114899386, "loss": 0.014, "step": 239350 }, { "epoch": 0.62, "learning_rate": 0.00020693165293262237, "loss": 0.0163, "step": 239360 }, { "epoch": 0.62, "learning_rate": 0.00020692776471625091, "loss": 0.0197, "step": 239370 }, { "epoch": 0.62, "learning_rate": 0.00020692387649987943, "loss": 0.0155, "step": 239380 }, { "epoch": 0.62, "learning_rate": 0.000206919988283508, "loss": 0.0142, "step": 239390 }, { "epoch": 0.62, "learning_rate": 0.00020691610006713654, "loss": 0.0175, "step": 239400 }, { "epoch": 0.62, "learning_rate": 0.00020691221185076505, "loss": 0.0135, "step": 239410 }, { "epoch": 0.62, "learning_rate": 0.00020690832363439357, "loss": 0.0155, "step": 239420 }, { "epoch": 0.62, "learning_rate": 0.0002069044354180221, "loss": 0.0189, "step": 239430 }, { "epoch": 0.62, "learning_rate": 0.00020690054720165068, "loss": 0.0175, "step": 239440 }, { "epoch": 0.62, "learning_rate": 0.0002068966589852792, "loss": 0.0157, "step": 239450 }, { "epoch": 0.62, "learning_rate": 0.00020689277076890773, "loss": 0.0183, "step": 239460 }, { "epoch": 0.62, "learning_rate": 0.00020688888255253625, "loss": 0.0159, "step": 239470 }, { "epoch": 0.62, "learning_rate": 0.00020688499433616482, "loss": 0.0165, "step": 239480 }, { "epoch": 0.62, "learning_rate": 0.00020688110611979333, "loss": 0.0156, "step": 239490 }, { "epoch": 0.62, "learning_rate": 0.00020687721790342187, "loss": 0.0189, "step": 239500 }, { "epoch": 0.62, "learning_rate": 0.0002068733296870504, "loss": 0.0172, "step": 239510 }, { "epoch": 0.62, "learning_rate": 0.00020686944147067896, "loss": 0.016, "step": 239520 }, { "epoch": 0.62, "learning_rate": 0.00020686555325430747, "loss": 0.0191, "step": 239530 }, { "epoch": 0.62, "learning_rate": 0.000206861665037936, "loss": 0.0171, "step": 239540 }, { "epoch": 0.62, "learning_rate": 0.00020685777682156453, "loss": 0.011, "step": 239550 }, { "epoch": 0.62, "learning_rate": 0.0002068538886051931, "loss": 0.0122, "step": 239560 }, { "epoch": 0.62, "learning_rate": 0.0002068500003888216, "loss": 0.0125, "step": 239570 }, { "epoch": 0.62, "learning_rate": 0.00020684611217245015, "loss": 0.0137, "step": 239580 }, { "epoch": 0.62, "learning_rate": 0.00020684222395607867, "loss": 0.0164, "step": 239590 }, { "epoch": 0.62, "learning_rate": 0.00020683833573970724, "loss": 0.0172, "step": 239600 }, { "epoch": 0.62, "learning_rate": 0.00020683444752333578, "loss": 0.0152, "step": 239610 }, { "epoch": 0.62, "learning_rate": 0.0002068305593069643, "loss": 0.0162, "step": 239620 }, { "epoch": 0.62, "learning_rate": 0.00020682667109059283, "loss": 0.0141, "step": 239630 }, { "epoch": 0.62, "learning_rate": 0.00020682278287422138, "loss": 0.0127, "step": 239640 }, { "epoch": 0.62, "learning_rate": 0.00020681889465784992, "loss": 0.0135, "step": 239650 }, { "epoch": 0.62, "learning_rate": 0.00020681500644147843, "loss": 0.016, "step": 239660 }, { "epoch": 0.62, "learning_rate": 0.00020681111822510697, "loss": 0.0126, "step": 239670 }, { "epoch": 0.62, "learning_rate": 0.0002068072300087355, "loss": 0.0137, "step": 239680 }, { "epoch": 0.62, "learning_rate": 0.00020680334179236406, "loss": 0.017, "step": 239690 }, { "epoch": 0.62, "learning_rate": 0.00020679945357599257, "loss": 0.0165, "step": 239700 }, { "epoch": 0.62, "learning_rate": 0.0002067955653596211, "loss": 0.0149, "step": 239710 }, { "epoch": 0.62, "learning_rate": 0.00020679167714324963, "loss": 0.0142, "step": 239720 }, { "epoch": 0.62, "learning_rate": 0.0002067877889268782, "loss": 0.0146, "step": 239730 }, { "epoch": 0.62, "learning_rate": 0.0002067839007105067, "loss": 0.0156, "step": 239740 }, { "epoch": 0.62, "learning_rate": 0.00020678001249413525, "loss": 0.0186, "step": 239750 }, { "epoch": 0.62, "learning_rate": 0.00020677612427776377, "loss": 0.0155, "step": 239760 }, { "epoch": 0.62, "learning_rate": 0.00020677223606139234, "loss": 0.0148, "step": 239770 }, { "epoch": 0.62, "learning_rate": 0.00020676834784502088, "loss": 0.0152, "step": 239780 }, { "epoch": 0.62, "learning_rate": 0.0002067644596286494, "loss": 0.0158, "step": 239790 }, { "epoch": 0.62, "learning_rate": 0.00020676057141227793, "loss": 0.0197, "step": 239800 }, { "epoch": 0.62, "learning_rate": 0.00020675668319590647, "loss": 0.0191, "step": 239810 }, { "epoch": 0.62, "learning_rate": 0.00020675279497953502, "loss": 0.0168, "step": 239820 }, { "epoch": 0.62, "learning_rate": 0.00020674890676316353, "loss": 0.0154, "step": 239830 }, { "epoch": 0.62, "learning_rate": 0.00020674501854679207, "loss": 0.0127, "step": 239840 }, { "epoch": 0.62, "learning_rate": 0.00020674113033042061, "loss": 0.0219, "step": 239850 }, { "epoch": 0.62, "learning_rate": 0.00020673724211404916, "loss": 0.0139, "step": 239860 }, { "epoch": 0.62, "learning_rate": 0.00020673335389767767, "loss": 0.0151, "step": 239870 }, { "epoch": 0.62, "learning_rate": 0.0002067294656813062, "loss": 0.0134, "step": 239880 }, { "epoch": 0.62, "learning_rate": 0.00020672557746493475, "loss": 0.0188, "step": 239890 }, { "epoch": 0.62, "learning_rate": 0.0002067216892485633, "loss": 0.0134, "step": 239900 }, { "epoch": 0.62, "learning_rate": 0.0002067178010321918, "loss": 0.0166, "step": 239910 }, { "epoch": 0.62, "learning_rate": 0.00020671391281582035, "loss": 0.0186, "step": 239920 }, { "epoch": 0.62, "learning_rate": 0.00020671002459944887, "loss": 0.0171, "step": 239930 }, { "epoch": 0.62, "learning_rate": 0.00020670613638307743, "loss": 0.0179, "step": 239940 }, { "epoch": 0.62, "learning_rate": 0.00020670224816670598, "loss": 0.0135, "step": 239950 }, { "epoch": 0.62, "learning_rate": 0.0002066983599503345, "loss": 0.0156, "step": 239960 }, { "epoch": 0.62, "learning_rate": 0.000206694471733963, "loss": 0.0138, "step": 239970 }, { "epoch": 0.62, "learning_rate": 0.00020669058351759157, "loss": 0.0134, "step": 239980 }, { "epoch": 0.62, "learning_rate": 0.00020668669530122012, "loss": 0.0257, "step": 239990 }, { "epoch": 0.62, "learning_rate": 0.00020668280708484863, "loss": 0.0143, "step": 240000 }, { "epoch": 0.62, "eval_cer": 0.8817922630869552, "eval_loss": 0.011038198135793209, "eval_runtime": 107.238, "eval_samples_per_second": 18.65, "eval_steps_per_second": 4.663, "step": 240000 }, { "epoch": 0.62, "learning_rate": 0.00020667891886847717, "loss": 0.0135, "step": 240010 }, { "epoch": 0.62, "learning_rate": 0.00020667503065210571, "loss": 0.0155, "step": 240020 }, { "epoch": 0.62, "learning_rate": 0.00020667114243573426, "loss": 0.0183, "step": 240030 }, { "epoch": 0.62, "learning_rate": 0.00020666725421936277, "loss": 0.0184, "step": 240040 }, { "epoch": 0.62, "learning_rate": 0.0002066633660029913, "loss": 0.0147, "step": 240050 }, { "epoch": 0.62, "learning_rate": 0.00020665947778661985, "loss": 0.0173, "step": 240060 }, { "epoch": 0.62, "learning_rate": 0.0002066555895702484, "loss": 0.0188, "step": 240070 }, { "epoch": 0.62, "learning_rate": 0.0002066517013538769, "loss": 0.0161, "step": 240080 }, { "epoch": 0.62, "learning_rate": 0.00020664781313750545, "loss": 0.017, "step": 240090 }, { "epoch": 0.62, "learning_rate": 0.00020664392492113402, "loss": 0.0173, "step": 240100 }, { "epoch": 0.62, "learning_rate": 0.00020664003670476253, "loss": 0.0111, "step": 240110 }, { "epoch": 0.62, "learning_rate": 0.00020663614848839108, "loss": 0.0131, "step": 240120 }, { "epoch": 0.62, "learning_rate": 0.0002066322602720196, "loss": 0.0159, "step": 240130 }, { "epoch": 0.62, "learning_rate": 0.00020662837205564816, "loss": 0.0142, "step": 240140 }, { "epoch": 0.62, "learning_rate": 0.00020662448383927667, "loss": 0.0157, "step": 240150 }, { "epoch": 0.62, "learning_rate": 0.00020662059562290522, "loss": 0.0148, "step": 240160 }, { "epoch": 0.62, "learning_rate": 0.00020661670740653373, "loss": 0.0166, "step": 240170 }, { "epoch": 0.62, "learning_rate": 0.00020661281919016227, "loss": 0.016, "step": 240180 }, { "epoch": 0.62, "learning_rate": 0.0002066089309737908, "loss": 0.0165, "step": 240190 }, { "epoch": 0.62, "learning_rate": 0.00020660504275741935, "loss": 0.0119, "step": 240200 }, { "epoch": 0.62, "learning_rate": 0.00020660115454104787, "loss": 0.0158, "step": 240210 }, { "epoch": 0.62, "learning_rate": 0.0002065972663246764, "loss": 0.015, "step": 240220 }, { "epoch": 0.62, "learning_rate": 0.00020659337810830495, "loss": 0.0155, "step": 240230 }, { "epoch": 0.62, "learning_rate": 0.0002065894898919335, "loss": 0.02, "step": 240240 }, { "epoch": 0.62, "learning_rate": 0.000206585601675562, "loss": 0.0176, "step": 240250 }, { "epoch": 0.62, "learning_rate": 0.00020658171345919055, "loss": 0.0152, "step": 240260 }, { "epoch": 0.62, "learning_rate": 0.00020657782524281912, "loss": 0.0154, "step": 240270 }, { "epoch": 0.62, "learning_rate": 0.00020657393702644763, "loss": 0.0199, "step": 240280 }, { "epoch": 0.62, "learning_rate": 0.00020657004881007615, "loss": 0.0153, "step": 240290 }, { "epoch": 0.62, "learning_rate": 0.0002065661605937047, "loss": 0.0146, "step": 240300 }, { "epoch": 0.62, "learning_rate": 0.00020656227237733326, "loss": 0.0175, "step": 240310 }, { "epoch": 0.62, "learning_rate": 0.00020655838416096177, "loss": 0.0146, "step": 240320 }, { "epoch": 0.62, "learning_rate": 0.00020655449594459031, "loss": 0.0195, "step": 240330 }, { "epoch": 0.62, "learning_rate": 0.00020655060772821883, "loss": 0.0152, "step": 240340 }, { "epoch": 0.62, "learning_rate": 0.0002065467195118474, "loss": 0.0177, "step": 240350 }, { "epoch": 0.62, "learning_rate": 0.0002065428312954759, "loss": 0.0174, "step": 240360 }, { "epoch": 0.62, "learning_rate": 0.00020653894307910445, "loss": 0.0143, "step": 240370 }, { "epoch": 0.62, "learning_rate": 0.00020653505486273297, "loss": 0.0142, "step": 240380 }, { "epoch": 0.62, "learning_rate": 0.00020653116664636154, "loss": 0.0143, "step": 240390 }, { "epoch": 0.62, "learning_rate": 0.00020652727842999005, "loss": 0.0176, "step": 240400 }, { "epoch": 0.62, "learning_rate": 0.0002065233902136186, "loss": 0.0199, "step": 240410 }, { "epoch": 0.62, "learning_rate": 0.0002065195019972471, "loss": 0.0164, "step": 240420 }, { "epoch": 0.62, "learning_rate": 0.00020651561378087565, "loss": 0.0173, "step": 240430 }, { "epoch": 0.62, "learning_rate": 0.0002065117255645042, "loss": 0.0169, "step": 240440 }, { "epoch": 0.62, "learning_rate": 0.00020650783734813273, "loss": 0.0159, "step": 240450 }, { "epoch": 0.62, "learning_rate": 0.00020650394913176125, "loss": 0.0192, "step": 240460 }, { "epoch": 0.62, "learning_rate": 0.0002065000609153898, "loss": 0.0149, "step": 240470 }, { "epoch": 0.62, "learning_rate": 0.00020649617269901836, "loss": 0.0154, "step": 240480 }, { "epoch": 0.62, "learning_rate": 0.00020649228448264687, "loss": 0.0163, "step": 240490 }, { "epoch": 0.62, "learning_rate": 0.00020648839626627541, "loss": 0.0141, "step": 240500 }, { "epoch": 0.62, "learning_rate": 0.00020648450804990393, "loss": 0.0234, "step": 240510 }, { "epoch": 0.62, "learning_rate": 0.0002064806198335325, "loss": 0.0148, "step": 240520 }, { "epoch": 0.62, "learning_rate": 0.000206476731617161, "loss": 0.0214, "step": 240530 }, { "epoch": 0.62, "learning_rate": 0.00020647284340078955, "loss": 0.0149, "step": 240540 }, { "epoch": 0.62, "learning_rate": 0.00020646895518441807, "loss": 0.0157, "step": 240550 }, { "epoch": 0.62, "learning_rate": 0.00020646506696804664, "loss": 0.0153, "step": 240560 }, { "epoch": 0.62, "learning_rate": 0.00020646117875167515, "loss": 0.0168, "step": 240570 }, { "epoch": 0.62, "learning_rate": 0.0002064572905353037, "loss": 0.0155, "step": 240580 }, { "epoch": 0.62, "learning_rate": 0.0002064534023189322, "loss": 0.0117, "step": 240590 }, { "epoch": 0.62, "learning_rate": 0.00020644951410256078, "loss": 0.014, "step": 240600 }, { "epoch": 0.62, "learning_rate": 0.0002064456258861893, "loss": 0.0156, "step": 240610 }, { "epoch": 0.62, "learning_rate": 0.00020644173766981783, "loss": 0.0146, "step": 240620 }, { "epoch": 0.62, "learning_rate": 0.00020643784945344635, "loss": 0.0133, "step": 240630 }, { "epoch": 0.62, "learning_rate": 0.00020643396123707492, "loss": 0.0129, "step": 240640 }, { "epoch": 0.62, "learning_rate": 0.00020643007302070346, "loss": 0.0157, "step": 240650 }, { "epoch": 0.62, "learning_rate": 0.00020642618480433197, "loss": 0.0161, "step": 240660 }, { "epoch": 0.62, "learning_rate": 0.0002064222965879605, "loss": 0.0185, "step": 240670 }, { "epoch": 0.62, "learning_rate": 0.00020641840837158903, "loss": 0.0147, "step": 240680 }, { "epoch": 0.62, "learning_rate": 0.0002064145201552176, "loss": 0.0129, "step": 240690 }, { "epoch": 0.62, "learning_rate": 0.0002064106319388461, "loss": 0.0129, "step": 240700 }, { "epoch": 0.62, "learning_rate": 0.00020640674372247465, "loss": 0.0162, "step": 240710 }, { "epoch": 0.62, "learning_rate": 0.00020640285550610317, "loss": 0.0175, "step": 240720 }, { "epoch": 0.62, "learning_rate": 0.00020639896728973174, "loss": 0.0162, "step": 240730 }, { "epoch": 0.62, "learning_rate": 0.00020639507907336025, "loss": 0.0172, "step": 240740 }, { "epoch": 0.62, "learning_rate": 0.0002063911908569888, "loss": 0.0194, "step": 240750 }, { "epoch": 0.62, "learning_rate": 0.0002063873026406173, "loss": 0.015, "step": 240760 }, { "epoch": 0.62, "learning_rate": 0.00020638341442424588, "loss": 0.0179, "step": 240770 }, { "epoch": 0.62, "learning_rate": 0.0002063795262078744, "loss": 0.0183, "step": 240780 }, { "epoch": 0.62, "learning_rate": 0.00020637563799150293, "loss": 0.0159, "step": 240790 }, { "epoch": 0.62, "learning_rate": 0.00020637174977513145, "loss": 0.0176, "step": 240800 }, { "epoch": 0.62, "learning_rate": 0.00020636786155876002, "loss": 0.0145, "step": 240810 }, { "epoch": 0.62, "learning_rate": 0.00020636397334238856, "loss": 0.0115, "step": 240820 }, { "epoch": 0.62, "learning_rate": 0.00020636008512601707, "loss": 0.0157, "step": 240830 }, { "epoch": 0.62, "learning_rate": 0.00020635619690964559, "loss": 0.0163, "step": 240840 }, { "epoch": 0.62, "learning_rate": 0.00020635230869327415, "loss": 0.0117, "step": 240850 }, { "epoch": 0.62, "learning_rate": 0.0002063484204769027, "loss": 0.0129, "step": 240860 }, { "epoch": 0.62, "learning_rate": 0.0002063445322605312, "loss": 0.0224, "step": 240870 }, { "epoch": 0.62, "learning_rate": 0.00020634064404415975, "loss": 0.0163, "step": 240880 }, { "epoch": 0.62, "learning_rate": 0.0002063367558277883, "loss": 0.0175, "step": 240890 }, { "epoch": 0.62, "learning_rate": 0.00020633286761141684, "loss": 0.018, "step": 240900 }, { "epoch": 0.62, "learning_rate": 0.00020632897939504535, "loss": 0.0153, "step": 240910 }, { "epoch": 0.62, "learning_rate": 0.0002063250911786739, "loss": 0.0154, "step": 240920 }, { "epoch": 0.62, "learning_rate": 0.0002063212029623024, "loss": 0.0161, "step": 240930 }, { "epoch": 0.62, "learning_rate": 0.00020631731474593098, "loss": 0.0188, "step": 240940 }, { "epoch": 0.62, "learning_rate": 0.0002063134265295595, "loss": 0.0177, "step": 240950 }, { "epoch": 0.62, "learning_rate": 0.00020630953831318803, "loss": 0.013, "step": 240960 }, { "epoch": 0.62, "learning_rate": 0.00020630565009681655, "loss": 0.0143, "step": 240970 }, { "epoch": 0.62, "learning_rate": 0.00020630176188044511, "loss": 0.0178, "step": 240980 }, { "epoch": 0.62, "learning_rate": 0.00020629787366407366, "loss": 0.0134, "step": 240990 }, { "epoch": 0.62, "learning_rate": 0.00020629398544770217, "loss": 0.0174, "step": 241000 }, { "epoch": 0.62, "eval_cer": 0.8818048598193629, "eval_loss": 0.011126725003123283, "eval_runtime": 107.3943, "eval_samples_per_second": 18.623, "eval_steps_per_second": 4.656, "step": 241000 }, { "epoch": 0.62, "learning_rate": 0.00020629009723133069, "loss": 0.0134, "step": 241010 }, { "epoch": 0.62, "learning_rate": 0.00020628620901495925, "loss": 0.0136, "step": 241020 }, { "epoch": 0.62, "learning_rate": 0.0002062823207985878, "loss": 0.0128, "step": 241030 }, { "epoch": 0.62, "learning_rate": 0.0002062784325822163, "loss": 0.0169, "step": 241040 }, { "epoch": 0.62, "learning_rate": 0.00020627454436584485, "loss": 0.0188, "step": 241050 }, { "epoch": 0.62, "learning_rate": 0.0002062706561494734, "loss": 0.0141, "step": 241060 }, { "epoch": 0.62, "learning_rate": 0.00020626676793310194, "loss": 0.0154, "step": 241070 }, { "epoch": 0.62, "learning_rate": 0.00020626287971673045, "loss": 0.0203, "step": 241080 }, { "epoch": 0.62, "learning_rate": 0.000206258991500359, "loss": 0.016, "step": 241090 }, { "epoch": 0.62, "learning_rate": 0.00020625510328398753, "loss": 0.0196, "step": 241100 }, { "epoch": 0.62, "learning_rate": 0.00020625121506761607, "loss": 0.0176, "step": 241110 }, { "epoch": 0.63, "learning_rate": 0.0002062473268512446, "loss": 0.0185, "step": 241120 }, { "epoch": 0.63, "learning_rate": 0.00020624343863487313, "loss": 0.018, "step": 241130 }, { "epoch": 0.63, "learning_rate": 0.0002062395504185017, "loss": 0.0121, "step": 241140 }, { "epoch": 0.63, "learning_rate": 0.00020623566220213021, "loss": 0.026, "step": 241150 }, { "epoch": 0.63, "learning_rate": 0.00020623177398575873, "loss": 0.0126, "step": 241160 }, { "epoch": 0.63, "learning_rate": 0.00020622788576938727, "loss": 0.014, "step": 241170 }, { "epoch": 0.63, "learning_rate": 0.00020622399755301578, "loss": 0.0172, "step": 241180 }, { "epoch": 0.63, "learning_rate": 0.00020622010933664435, "loss": 0.0178, "step": 241190 }, { "epoch": 0.63, "learning_rate": 0.0002062162211202729, "loss": 0.0151, "step": 241200 }, { "epoch": 0.63, "learning_rate": 0.0002062123329039014, "loss": 0.0196, "step": 241210 }, { "epoch": 0.63, "learning_rate": 0.00020620844468752995, "loss": 0.0151, "step": 241220 }, { "epoch": 0.63, "learning_rate": 0.0002062045564711585, "loss": 0.0195, "step": 241230 }, { "epoch": 0.63, "learning_rate": 0.00020620066825478703, "loss": 0.0163, "step": 241240 }, { "epoch": 0.63, "learning_rate": 0.00020619678003841555, "loss": 0.0163, "step": 241250 }, { "epoch": 0.63, "learning_rate": 0.0002061928918220441, "loss": 0.016, "step": 241260 }, { "epoch": 0.63, "learning_rate": 0.00020618900360567263, "loss": 0.0164, "step": 241270 }, { "epoch": 0.63, "learning_rate": 0.00020618511538930117, "loss": 0.0124, "step": 241280 }, { "epoch": 0.63, "learning_rate": 0.0002061812271729297, "loss": 0.0178, "step": 241290 }, { "epoch": 0.63, "learning_rate": 0.00020617733895655823, "loss": 0.0176, "step": 241300 }, { "epoch": 0.63, "learning_rate": 0.00020617345074018677, "loss": 0.0151, "step": 241310 }, { "epoch": 0.63, "learning_rate": 0.0002061695625238153, "loss": 0.0168, "step": 241320 }, { "epoch": 0.63, "learning_rate": 0.00020616567430744383, "loss": 0.0135, "step": 241330 }, { "epoch": 0.63, "learning_rate": 0.00020616178609107237, "loss": 0.019, "step": 241340 }, { "epoch": 0.63, "learning_rate": 0.00020615789787470094, "loss": 0.0141, "step": 241350 }, { "epoch": 0.63, "learning_rate": 0.00020615400965832945, "loss": 0.0167, "step": 241360 }, { "epoch": 0.63, "learning_rate": 0.000206150121441958, "loss": 0.0167, "step": 241370 }, { "epoch": 0.63, "learning_rate": 0.0002061462332255865, "loss": 0.016, "step": 241380 }, { "epoch": 0.63, "learning_rate": 0.00020614234500921508, "loss": 0.0141, "step": 241390 }, { "epoch": 0.63, "learning_rate": 0.0002061384567928436, "loss": 0.0223, "step": 241400 }, { "epoch": 0.63, "learning_rate": 0.00020613456857647213, "loss": 0.014, "step": 241410 }, { "epoch": 0.63, "learning_rate": 0.00020613068036010065, "loss": 0.0135, "step": 241420 }, { "epoch": 0.63, "learning_rate": 0.0002061267921437292, "loss": 0.0158, "step": 241430 }, { "epoch": 0.63, "learning_rate": 0.00020612290392735773, "loss": 0.0163, "step": 241440 }, { "epoch": 0.63, "learning_rate": 0.00020611901571098627, "loss": 0.0213, "step": 241450 }, { "epoch": 0.63, "learning_rate": 0.0002061151274946148, "loss": 0.0159, "step": 241460 }, { "epoch": 0.63, "learning_rate": 0.00020611123927824333, "loss": 0.0146, "step": 241470 }, { "epoch": 0.63, "learning_rate": 0.00020610735106187187, "loss": 0.0205, "step": 241480 }, { "epoch": 0.63, "learning_rate": 0.0002061034628455004, "loss": 0.0115, "step": 241490 }, { "epoch": 0.63, "learning_rate": 0.00020609957462912893, "loss": 0.0131, "step": 241500 }, { "epoch": 0.63, "learning_rate": 0.00020609568641275747, "loss": 0.0151, "step": 241510 }, { "epoch": 0.63, "learning_rate": 0.00020609179819638604, "loss": 0.017, "step": 241520 }, { "epoch": 0.63, "learning_rate": 0.00020608790998001455, "loss": 0.0163, "step": 241530 }, { "epoch": 0.63, "learning_rate": 0.0002060840217636431, "loss": 0.0137, "step": 241540 }, { "epoch": 0.63, "learning_rate": 0.0002060801335472716, "loss": 0.0183, "step": 241550 }, { "epoch": 0.63, "learning_rate": 0.00020607624533090018, "loss": 0.0152, "step": 241560 }, { "epoch": 0.63, "learning_rate": 0.0002060723571145287, "loss": 0.0157, "step": 241570 }, { "epoch": 0.63, "learning_rate": 0.00020606846889815723, "loss": 0.0126, "step": 241580 }, { "epoch": 0.63, "learning_rate": 0.00020606458068178575, "loss": 0.0203, "step": 241590 }, { "epoch": 0.63, "learning_rate": 0.00020606069246541432, "loss": 0.0163, "step": 241600 }, { "epoch": 0.63, "learning_rate": 0.00020605680424904283, "loss": 0.0146, "step": 241610 }, { "epoch": 0.63, "learning_rate": 0.00020605291603267137, "loss": 0.019, "step": 241620 }, { "epoch": 0.63, "learning_rate": 0.0002060490278162999, "loss": 0.0192, "step": 241630 }, { "epoch": 0.63, "learning_rate": 0.00020604513959992846, "loss": 0.0182, "step": 241640 }, { "epoch": 0.63, "learning_rate": 0.00020604125138355697, "loss": 0.0146, "step": 241650 }, { "epoch": 0.63, "learning_rate": 0.0002060373631671855, "loss": 0.0196, "step": 241660 }, { "epoch": 0.63, "learning_rate": 0.00020603347495081403, "loss": 0.0129, "step": 241670 }, { "epoch": 0.63, "learning_rate": 0.00020602958673444257, "loss": 0.0174, "step": 241680 }, { "epoch": 0.63, "learning_rate": 0.00020602569851807114, "loss": 0.0175, "step": 241690 }, { "epoch": 0.63, "learning_rate": 0.00020602181030169965, "loss": 0.015, "step": 241700 }, { "epoch": 0.63, "learning_rate": 0.0002060179220853282, "loss": 0.0128, "step": 241710 }, { "epoch": 0.63, "learning_rate": 0.0002060140338689567, "loss": 0.0153, "step": 241720 }, { "epoch": 0.63, "learning_rate": 0.00020601014565258528, "loss": 0.0178, "step": 241730 }, { "epoch": 0.63, "learning_rate": 0.0002060062574362138, "loss": 0.0243, "step": 241740 }, { "epoch": 0.63, "learning_rate": 0.00020600236921984233, "loss": 0.0232, "step": 241750 }, { "epoch": 0.63, "learning_rate": 0.00020599848100347085, "loss": 0.0209, "step": 241760 }, { "epoch": 0.63, "learning_rate": 0.00020599459278709942, "loss": 0.0178, "step": 241770 }, { "epoch": 0.63, "learning_rate": 0.00020599070457072793, "loss": 0.0201, "step": 241780 }, { "epoch": 0.63, "learning_rate": 0.00020598681635435647, "loss": 0.0181, "step": 241790 }, { "epoch": 0.63, "learning_rate": 0.000205982928137985, "loss": 0.0158, "step": 241800 }, { "epoch": 0.63, "learning_rate": 0.00020597903992161356, "loss": 0.0188, "step": 241810 }, { "epoch": 0.63, "learning_rate": 0.00020597515170524207, "loss": 0.0163, "step": 241820 }, { "epoch": 0.63, "learning_rate": 0.0002059712634888706, "loss": 0.0154, "step": 241830 }, { "epoch": 0.63, "learning_rate": 0.00020596737527249913, "loss": 0.0144, "step": 241840 }, { "epoch": 0.63, "learning_rate": 0.0002059634870561277, "loss": 0.0169, "step": 241850 }, { "epoch": 0.63, "learning_rate": 0.00020595959883975624, "loss": 0.0137, "step": 241860 }, { "epoch": 0.63, "learning_rate": 0.00020595571062338475, "loss": 0.0121, "step": 241870 }, { "epoch": 0.63, "learning_rate": 0.00020595182240701327, "loss": 0.018, "step": 241880 }, { "epoch": 0.63, "learning_rate": 0.00020594793419064183, "loss": 0.0164, "step": 241890 }, { "epoch": 0.63, "learning_rate": 0.00020594404597427038, "loss": 0.0181, "step": 241900 }, { "epoch": 0.63, "learning_rate": 0.0002059401577578989, "loss": 0.0195, "step": 241910 }, { "epoch": 0.63, "learning_rate": 0.00020593626954152743, "loss": 0.0182, "step": 241920 }, { "epoch": 0.63, "learning_rate": 0.00020593238132515595, "loss": 0.0152, "step": 241930 }, { "epoch": 0.63, "learning_rate": 0.00020592849310878452, "loss": 0.0173, "step": 241940 }, { "epoch": 0.63, "learning_rate": 0.00020592460489241303, "loss": 0.0198, "step": 241950 }, { "epoch": 0.63, "learning_rate": 0.00020592071667604157, "loss": 0.0147, "step": 241960 }, { "epoch": 0.63, "learning_rate": 0.00020591682845967009, "loss": 0.0147, "step": 241970 }, { "epoch": 0.63, "learning_rate": 0.00020591294024329865, "loss": 0.0153, "step": 241980 }, { "epoch": 0.63, "learning_rate": 0.00020590905202692717, "loss": 0.0152, "step": 241990 }, { "epoch": 0.63, "learning_rate": 0.0002059051638105557, "loss": 0.0165, "step": 242000 }, { "epoch": 0.63, "eval_cer": 0.8818272540103097, "eval_loss": 0.0112527534365654, "eval_runtime": 107.4809, "eval_samples_per_second": 18.608, "eval_steps_per_second": 4.652, "step": 242000 }, { "epoch": 0.63, "learning_rate": 0.00020590127559418423, "loss": 0.0226, "step": 242010 }, { "epoch": 0.63, "learning_rate": 0.0002058973873778128, "loss": 0.0165, "step": 242020 }, { "epoch": 0.63, "learning_rate": 0.0002058934991614413, "loss": 0.0154, "step": 242030 }, { "epoch": 0.63, "learning_rate": 0.00020588961094506985, "loss": 0.0167, "step": 242040 }, { "epoch": 0.63, "learning_rate": 0.00020588572272869837, "loss": 0.0152, "step": 242050 }, { "epoch": 0.63, "learning_rate": 0.00020588183451232693, "loss": 0.0181, "step": 242060 }, { "epoch": 0.63, "learning_rate": 0.00020587794629595548, "loss": 0.0157, "step": 242070 }, { "epoch": 0.63, "learning_rate": 0.000205874058079584, "loss": 0.0145, "step": 242080 }, { "epoch": 0.63, "learning_rate": 0.00020587016986321253, "loss": 0.0125, "step": 242090 }, { "epoch": 0.63, "learning_rate": 0.00020586628164684107, "loss": 0.0173, "step": 242100 }, { "epoch": 0.63, "learning_rate": 0.00020586239343046961, "loss": 0.0182, "step": 242110 }, { "epoch": 0.63, "learning_rate": 0.00020585850521409813, "loss": 0.0125, "step": 242120 }, { "epoch": 0.63, "learning_rate": 0.00020585461699772667, "loss": 0.0155, "step": 242130 }, { "epoch": 0.63, "learning_rate": 0.0002058507287813552, "loss": 0.0209, "step": 242140 }, { "epoch": 0.63, "learning_rate": 0.00020584684056498375, "loss": 0.015, "step": 242150 }, { "epoch": 0.63, "learning_rate": 0.00020584295234861227, "loss": 0.0167, "step": 242160 }, { "epoch": 0.63, "learning_rate": 0.0002058390641322408, "loss": 0.0138, "step": 242170 }, { "epoch": 0.63, "learning_rate": 0.00020583517591586933, "loss": 0.0173, "step": 242180 }, { "epoch": 0.63, "learning_rate": 0.0002058312876994979, "loss": 0.0158, "step": 242190 }, { "epoch": 0.63, "learning_rate": 0.0002058273994831264, "loss": 0.0178, "step": 242200 }, { "epoch": 0.63, "learning_rate": 0.00020582351126675495, "loss": 0.0154, "step": 242210 }, { "epoch": 0.63, "learning_rate": 0.00020581962305038346, "loss": 0.0185, "step": 242220 }, { "epoch": 0.63, "learning_rate": 0.00020581573483401203, "loss": 0.0133, "step": 242230 }, { "epoch": 0.63, "learning_rate": 0.00020581184661764057, "loss": 0.0146, "step": 242240 }, { "epoch": 0.63, "learning_rate": 0.0002058079584012691, "loss": 0.0137, "step": 242250 }, { "epoch": 0.63, "learning_rate": 0.00020580407018489763, "loss": 0.0206, "step": 242260 }, { "epoch": 0.63, "learning_rate": 0.00020580018196852617, "loss": 0.0133, "step": 242270 }, { "epoch": 0.63, "learning_rate": 0.00020579629375215471, "loss": 0.0139, "step": 242280 }, { "epoch": 0.63, "learning_rate": 0.00020579240553578323, "loss": 0.0128, "step": 242290 }, { "epoch": 0.63, "learning_rate": 0.00020578851731941177, "loss": 0.0153, "step": 242300 }, { "epoch": 0.63, "learning_rate": 0.0002057846291030403, "loss": 0.013, "step": 242310 }, { "epoch": 0.63, "learning_rate": 0.00020578074088666885, "loss": 0.0169, "step": 242320 }, { "epoch": 0.63, "learning_rate": 0.00020577685267029737, "loss": 0.0126, "step": 242330 }, { "epoch": 0.63, "learning_rate": 0.0002057729644539259, "loss": 0.0138, "step": 242340 }, { "epoch": 0.63, "learning_rate": 0.00020576907623755445, "loss": 0.018, "step": 242350 }, { "epoch": 0.63, "learning_rate": 0.000205765188021183, "loss": 0.0191, "step": 242360 }, { "epoch": 0.63, "learning_rate": 0.0002057612998048115, "loss": 0.015, "step": 242370 }, { "epoch": 0.63, "learning_rate": 0.00020575741158844005, "loss": 0.0169, "step": 242380 }, { "epoch": 0.63, "learning_rate": 0.00020575352337206862, "loss": 0.0169, "step": 242390 }, { "epoch": 0.63, "learning_rate": 0.00020574963515569713, "loss": 0.0198, "step": 242400 }, { "epoch": 0.63, "learning_rate": 0.00020574574693932567, "loss": 0.0141, "step": 242410 }, { "epoch": 0.63, "learning_rate": 0.0002057418587229542, "loss": 0.0117, "step": 242420 }, { "epoch": 0.63, "learning_rate": 0.0002057379705065827, "loss": 0.0194, "step": 242430 }, { "epoch": 0.63, "learning_rate": 0.00020573408229021127, "loss": 0.0165, "step": 242440 }, { "epoch": 0.63, "learning_rate": 0.00020573019407383981, "loss": 0.017, "step": 242450 }, { "epoch": 0.63, "learning_rate": 0.00020572630585746833, "loss": 0.0344, "step": 242460 }, { "epoch": 0.63, "learning_rate": 0.00020572241764109687, "loss": 0.0155, "step": 242470 }, { "epoch": 0.63, "learning_rate": 0.0002057185294247254, "loss": 0.0158, "step": 242480 }, { "epoch": 0.63, "learning_rate": 0.00020571464120835395, "loss": 0.0152, "step": 242490 }, { "epoch": 0.63, "learning_rate": 0.00020571075299198247, "loss": 0.0152, "step": 242500 }, { "epoch": 0.63, "learning_rate": 0.000205706864775611, "loss": 0.0156, "step": 242510 }, { "epoch": 0.63, "learning_rate": 0.00020570297655923955, "loss": 0.015, "step": 242520 }, { "epoch": 0.63, "learning_rate": 0.0002056990883428681, "loss": 0.0155, "step": 242530 }, { "epoch": 0.63, "learning_rate": 0.0002056952001264966, "loss": 0.014, "step": 242540 }, { "epoch": 0.63, "learning_rate": 0.00020569131191012515, "loss": 0.0154, "step": 242550 }, { "epoch": 0.63, "learning_rate": 0.00020568742369375372, "loss": 0.0168, "step": 242560 }, { "epoch": 0.63, "learning_rate": 0.00020568353547738223, "loss": 0.0172, "step": 242570 }, { "epoch": 0.63, "learning_rate": 0.00020567964726101077, "loss": 0.0166, "step": 242580 }, { "epoch": 0.63, "learning_rate": 0.0002056757590446393, "loss": 0.0128, "step": 242590 }, { "epoch": 0.63, "learning_rate": 0.00020567187082826786, "loss": 0.0132, "step": 242600 }, { "epoch": 0.63, "learning_rate": 0.00020566798261189637, "loss": 0.0126, "step": 242610 }, { "epoch": 0.63, "learning_rate": 0.0002056640943955249, "loss": 0.0199, "step": 242620 }, { "epoch": 0.63, "learning_rate": 0.00020566020617915343, "loss": 0.0158, "step": 242630 }, { "epoch": 0.63, "learning_rate": 0.000205656317962782, "loss": 0.0187, "step": 242640 }, { "epoch": 0.63, "learning_rate": 0.0002056524297464105, "loss": 0.0183, "step": 242650 }, { "epoch": 0.63, "learning_rate": 0.00020564854153003905, "loss": 0.0167, "step": 242660 }, { "epoch": 0.63, "learning_rate": 0.00020564465331366757, "loss": 0.0189, "step": 242670 }, { "epoch": 0.63, "learning_rate": 0.0002056407650972961, "loss": 0.0171, "step": 242680 }, { "epoch": 0.63, "learning_rate": 0.00020563687688092465, "loss": 0.0163, "step": 242690 }, { "epoch": 0.63, "learning_rate": 0.0002056329886645532, "loss": 0.0118, "step": 242700 }, { "epoch": 0.63, "learning_rate": 0.0002056291004481817, "loss": 0.0134, "step": 242710 }, { "epoch": 0.63, "learning_rate": 0.00020562521223181025, "loss": 0.0128, "step": 242720 }, { "epoch": 0.63, "learning_rate": 0.00020562132401543882, "loss": 0.015, "step": 242730 }, { "epoch": 0.63, "learning_rate": 0.00020561743579906733, "loss": 0.0152, "step": 242740 }, { "epoch": 0.63, "learning_rate": 0.00020561354758269585, "loss": 0.0212, "step": 242750 }, { "epoch": 0.63, "learning_rate": 0.0002056096593663244, "loss": 0.0129, "step": 242760 }, { "epoch": 0.63, "learning_rate": 0.00020560577114995296, "loss": 0.0122, "step": 242770 }, { "epoch": 0.63, "learning_rate": 0.00020560188293358147, "loss": 0.0183, "step": 242780 }, { "epoch": 0.63, "learning_rate": 0.00020559799471721, "loss": 0.0134, "step": 242790 }, { "epoch": 0.63, "learning_rate": 0.00020559410650083853, "loss": 0.0133, "step": 242800 }, { "epoch": 0.63, "learning_rate": 0.0002055902182844671, "loss": 0.0137, "step": 242810 }, { "epoch": 0.63, "learning_rate": 0.0002055863300680956, "loss": 0.0183, "step": 242820 }, { "epoch": 0.63, "learning_rate": 0.00020558244185172415, "loss": 0.0145, "step": 242830 }, { "epoch": 0.63, "learning_rate": 0.00020557855363535267, "loss": 0.0158, "step": 242840 }, { "epoch": 0.63, "learning_rate": 0.00020557466541898124, "loss": 0.0122, "step": 242850 }, { "epoch": 0.63, "learning_rate": 0.00020557077720260975, "loss": 0.0147, "step": 242860 }, { "epoch": 0.63, "learning_rate": 0.0002055668889862383, "loss": 0.0176, "step": 242870 }, { "epoch": 0.63, "learning_rate": 0.0002055630007698668, "loss": 0.0196, "step": 242880 }, { "epoch": 0.63, "learning_rate": 0.00020555911255349537, "loss": 0.0166, "step": 242890 }, { "epoch": 0.63, "learning_rate": 0.0002055552243371239, "loss": 0.0171, "step": 242900 }, { "epoch": 0.63, "learning_rate": 0.00020555133612075243, "loss": 0.0137, "step": 242910 }, { "epoch": 0.63, "learning_rate": 0.00020554744790438095, "loss": 0.017, "step": 242920 }, { "epoch": 0.63, "learning_rate": 0.0002055435596880095, "loss": 0.0164, "step": 242930 }, { "epoch": 0.63, "learning_rate": 0.00020553967147163806, "loss": 0.0127, "step": 242940 }, { "epoch": 0.63, "learning_rate": 0.00020553578325526657, "loss": 0.0168, "step": 242950 }, { "epoch": 0.63, "learning_rate": 0.0002055318950388951, "loss": 0.017, "step": 242960 }, { "epoch": 0.63, "learning_rate": 0.00020552800682252363, "loss": 0.0168, "step": 242970 }, { "epoch": 0.63, "learning_rate": 0.0002055241186061522, "loss": 0.0144, "step": 242980 }, { "epoch": 0.63, "learning_rate": 0.0002055202303897807, "loss": 0.0154, "step": 242990 }, { "epoch": 0.63, "learning_rate": 0.00020551634217340925, "loss": 0.0139, "step": 243000 }, { "epoch": 0.63, "eval_cer": 0.8818188561887047, "eval_loss": 0.011068116873502731, "eval_runtime": 107.3469, "eval_samples_per_second": 18.631, "eval_steps_per_second": 4.658, "step": 243000 }, { "epoch": 0.63, "learning_rate": 0.00020551245395703777, "loss": 0.0149, "step": 243010 }, { "epoch": 0.63, "learning_rate": 0.00020550856574066633, "loss": 0.0138, "step": 243020 }, { "epoch": 0.63, "learning_rate": 0.00020550467752429485, "loss": 0.0134, "step": 243030 }, { "epoch": 0.63, "learning_rate": 0.0002055007893079234, "loss": 0.0177, "step": 243040 }, { "epoch": 0.63, "learning_rate": 0.0002054969010915519, "loss": 0.0183, "step": 243050 }, { "epoch": 0.63, "learning_rate": 0.00020549301287518047, "loss": 0.0157, "step": 243060 }, { "epoch": 0.63, "learning_rate": 0.000205489124658809, "loss": 0.0169, "step": 243070 }, { "epoch": 0.63, "learning_rate": 0.00020548523644243753, "loss": 0.0158, "step": 243080 }, { "epoch": 0.63, "learning_rate": 0.00020548134822606604, "loss": 0.0157, "step": 243090 }, { "epoch": 0.63, "learning_rate": 0.00020547746000969461, "loss": 0.0145, "step": 243100 }, { "epoch": 0.63, "learning_rate": 0.00020547357179332316, "loss": 0.0175, "step": 243110 }, { "epoch": 0.63, "learning_rate": 0.00020546968357695167, "loss": 0.0141, "step": 243120 }, { "epoch": 0.63, "learning_rate": 0.0002054657953605802, "loss": 0.0179, "step": 243130 }, { "epoch": 0.63, "learning_rate": 0.00020546190714420875, "loss": 0.0147, "step": 243140 }, { "epoch": 0.63, "learning_rate": 0.0002054580189278373, "loss": 0.015, "step": 243150 }, { "epoch": 0.63, "learning_rate": 0.0002054541307114658, "loss": 0.0142, "step": 243160 }, { "epoch": 0.63, "learning_rate": 0.00020545024249509435, "loss": 0.02, "step": 243170 }, { "epoch": 0.63, "learning_rate": 0.00020544635427872287, "loss": 0.0202, "step": 243180 }, { "epoch": 0.63, "learning_rate": 0.00020544246606235143, "loss": 0.0137, "step": 243190 }, { "epoch": 0.63, "learning_rate": 0.00020543857784597995, "loss": 0.0162, "step": 243200 }, { "epoch": 0.63, "learning_rate": 0.0002054346896296085, "loss": 0.0188, "step": 243210 }, { "epoch": 0.63, "learning_rate": 0.000205430801413237, "loss": 0.013, "step": 243220 }, { "epoch": 0.63, "learning_rate": 0.00020542691319686557, "loss": 0.015, "step": 243230 }, { "epoch": 0.63, "learning_rate": 0.0002054230249804941, "loss": 0.0154, "step": 243240 }, { "epoch": 0.63, "learning_rate": 0.00020541913676412263, "loss": 0.0177, "step": 243250 }, { "epoch": 0.63, "learning_rate": 0.00020541524854775114, "loss": 0.0194, "step": 243260 }, { "epoch": 0.63, "learning_rate": 0.0002054113603313797, "loss": 0.0137, "step": 243270 }, { "epoch": 0.63, "learning_rate": 0.00020540747211500825, "loss": 0.0125, "step": 243280 }, { "epoch": 0.63, "learning_rate": 0.00020540358389863677, "loss": 0.0155, "step": 243290 }, { "epoch": 0.63, "learning_rate": 0.00020539969568226528, "loss": 0.0158, "step": 243300 }, { "epoch": 0.63, "learning_rate": 0.00020539580746589385, "loss": 0.0199, "step": 243310 }, { "epoch": 0.63, "learning_rate": 0.0002053919192495224, "loss": 0.0143, "step": 243320 }, { "epoch": 0.63, "learning_rate": 0.0002053880310331509, "loss": 0.0169, "step": 243330 }, { "epoch": 0.63, "learning_rate": 0.00020538414281677945, "loss": 0.0136, "step": 243340 }, { "epoch": 0.63, "learning_rate": 0.000205380254600408, "loss": 0.0134, "step": 243350 }, { "epoch": 0.63, "learning_rate": 0.00020537636638403653, "loss": 0.0124, "step": 243360 }, { "epoch": 0.63, "learning_rate": 0.00020537247816766505, "loss": 0.0171, "step": 243370 }, { "epoch": 0.63, "learning_rate": 0.0002053685899512936, "loss": 0.0154, "step": 243380 }, { "epoch": 0.63, "learning_rate": 0.00020536470173492213, "loss": 0.0146, "step": 243390 }, { "epoch": 0.63, "learning_rate": 0.00020536081351855067, "loss": 0.0154, "step": 243400 }, { "epoch": 0.63, "learning_rate": 0.0002053569253021792, "loss": 0.0156, "step": 243410 }, { "epoch": 0.63, "learning_rate": 0.00020535303708580773, "loss": 0.0155, "step": 243420 }, { "epoch": 0.63, "learning_rate": 0.00020534914886943624, "loss": 0.0158, "step": 243430 }, { "epoch": 0.63, "learning_rate": 0.0002053452606530648, "loss": 0.0172, "step": 243440 }, { "epoch": 0.63, "learning_rate": 0.00020534137243669335, "loss": 0.0126, "step": 243450 }, { "epoch": 0.63, "learning_rate": 0.00020533748422032187, "loss": 0.0171, "step": 243460 }, { "epoch": 0.63, "learning_rate": 0.00020533359600395038, "loss": 0.0155, "step": 243470 }, { "epoch": 0.63, "learning_rate": 0.00020532970778757895, "loss": 0.0161, "step": 243480 }, { "epoch": 0.63, "learning_rate": 0.0002053258195712075, "loss": 0.0121, "step": 243490 }, { "epoch": 0.63, "learning_rate": 0.000205321931354836, "loss": 0.0191, "step": 243500 }, { "epoch": 0.63, "learning_rate": 0.00020531804313846455, "loss": 0.0172, "step": 243510 }, { "epoch": 0.63, "learning_rate": 0.0002053141549220931, "loss": 0.0149, "step": 243520 }, { "epoch": 0.63, "learning_rate": 0.00020531026670572163, "loss": 0.0164, "step": 243530 }, { "epoch": 0.63, "learning_rate": 0.00020530637848935015, "loss": 0.0129, "step": 243540 }, { "epoch": 0.63, "learning_rate": 0.0002053024902729787, "loss": 0.012, "step": 243550 }, { "epoch": 0.63, "learning_rate": 0.00020529860205660723, "loss": 0.0151, "step": 243560 }, { "epoch": 0.63, "learning_rate": 0.00020529471384023577, "loss": 0.0152, "step": 243570 }, { "epoch": 0.63, "learning_rate": 0.0002052908256238643, "loss": 0.0149, "step": 243580 }, { "epoch": 0.63, "learning_rate": 0.00020528693740749283, "loss": 0.0158, "step": 243590 }, { "epoch": 0.63, "learning_rate": 0.0002052830491911214, "loss": 0.0167, "step": 243600 }, { "epoch": 0.63, "learning_rate": 0.0002052791609747499, "loss": 0.0145, "step": 243610 }, { "epoch": 0.63, "learning_rate": 0.00020527527275837843, "loss": 0.0171, "step": 243620 }, { "epoch": 0.63, "learning_rate": 0.00020527138454200697, "loss": 0.0154, "step": 243630 }, { "epoch": 0.63, "learning_rate": 0.00020526749632563554, "loss": 0.0131, "step": 243640 }, { "epoch": 0.63, "learning_rate": 0.00020526360810926405, "loss": 0.0143, "step": 243650 }, { "epoch": 0.63, "learning_rate": 0.0002052597198928926, "loss": 0.0197, "step": 243660 }, { "epoch": 0.63, "learning_rate": 0.0002052558316765211, "loss": 0.0201, "step": 243670 }, { "epoch": 0.63, "learning_rate": 0.00020525194346014965, "loss": 0.0165, "step": 243680 }, { "epoch": 0.63, "learning_rate": 0.0002052480552437782, "loss": 0.0161, "step": 243690 }, { "epoch": 0.63, "learning_rate": 0.00020524416702740673, "loss": 0.0209, "step": 243700 }, { "epoch": 0.63, "learning_rate": 0.00020524027881103525, "loss": 0.0152, "step": 243710 }, { "epoch": 0.63, "learning_rate": 0.0002052363905946638, "loss": 0.0157, "step": 243720 }, { "epoch": 0.63, "learning_rate": 0.00020523250237829233, "loss": 0.0136, "step": 243730 }, { "epoch": 0.63, "learning_rate": 0.00020522861416192087, "loss": 0.0137, "step": 243740 }, { "epoch": 0.63, "learning_rate": 0.00020522472594554939, "loss": 0.0159, "step": 243750 }, { "epoch": 0.63, "learning_rate": 0.00020522083772917793, "loss": 0.0144, "step": 243760 }, { "epoch": 0.63, "learning_rate": 0.0002052169495128065, "loss": 0.0141, "step": 243770 }, { "epoch": 0.63, "learning_rate": 0.000205213061296435, "loss": 0.0157, "step": 243780 }, { "epoch": 0.63, "learning_rate": 0.00020520917308006353, "loss": 0.0235, "step": 243790 }, { "epoch": 0.63, "learning_rate": 0.00020520528486369207, "loss": 0.0147, "step": 243800 }, { "epoch": 0.63, "learning_rate": 0.00020520139664732064, "loss": 0.0179, "step": 243810 }, { "epoch": 0.63, "learning_rate": 0.00020519750843094915, "loss": 0.0112, "step": 243820 }, { "epoch": 0.63, "learning_rate": 0.0002051936202145777, "loss": 0.0166, "step": 243830 }, { "epoch": 0.63, "learning_rate": 0.0002051897319982062, "loss": 0.0192, "step": 243840 }, { "epoch": 0.63, "learning_rate": 0.00020518584378183478, "loss": 0.0196, "step": 243850 }, { "epoch": 0.63, "learning_rate": 0.0002051819555654633, "loss": 0.018, "step": 243860 }, { "epoch": 0.63, "learning_rate": 0.00020517806734909183, "loss": 0.0127, "step": 243870 }, { "epoch": 0.63, "learning_rate": 0.00020517417913272035, "loss": 0.0117, "step": 243880 }, { "epoch": 0.63, "learning_rate": 0.0002051702909163489, "loss": 0.013, "step": 243890 }, { "epoch": 0.63, "learning_rate": 0.00020516640269997743, "loss": 0.0196, "step": 243900 }, { "epoch": 0.63, "learning_rate": 0.00020516251448360597, "loss": 0.0129, "step": 243910 }, { "epoch": 0.63, "learning_rate": 0.00020515862626723449, "loss": 0.0168, "step": 243920 }, { "epoch": 0.63, "learning_rate": 0.00020515473805086303, "loss": 0.0134, "step": 243930 }, { "epoch": 0.63, "learning_rate": 0.00020515084983449157, "loss": 0.0148, "step": 243940 }, { "epoch": 0.63, "learning_rate": 0.0002051469616181201, "loss": 0.0114, "step": 243950 }, { "epoch": 0.63, "learning_rate": 0.00020514307340174863, "loss": 0.0182, "step": 243960 }, { "epoch": 0.63, "learning_rate": 0.00020513918518537717, "loss": 0.0138, "step": 243970 }, { "epoch": 0.63, "learning_rate": 0.00020513529696900574, "loss": 0.0138, "step": 243980 }, { "epoch": 0.63, "learning_rate": 0.00020513140875263425, "loss": 0.013, "step": 243990 }, { "epoch": 0.63, "learning_rate": 0.0002051275205362628, "loss": 0.0155, "step": 244000 }, { "epoch": 0.63, "eval_cer": 0.881782465628416, "eval_loss": 0.01116818655282259, "eval_runtime": 107.1197, "eval_samples_per_second": 18.671, "eval_steps_per_second": 4.668, "step": 244000 }, { "epoch": 0.63, "learning_rate": 0.0002051236323198913, "loss": 0.0135, "step": 244010 }, { "epoch": 0.63, "learning_rate": 0.00020511974410351988, "loss": 0.0152, "step": 244020 }, { "epoch": 0.63, "learning_rate": 0.0002051158558871484, "loss": 0.0132, "step": 244030 }, { "epoch": 0.63, "learning_rate": 0.00020511196767077693, "loss": 0.0167, "step": 244040 }, { "epoch": 0.63, "learning_rate": 0.00020510807945440545, "loss": 0.0162, "step": 244050 }, { "epoch": 0.63, "learning_rate": 0.00020510419123803401, "loss": 0.0139, "step": 244060 }, { "epoch": 0.63, "learning_rate": 0.00020510030302166253, "loss": 0.0149, "step": 244070 }, { "epoch": 0.63, "learning_rate": 0.00020509641480529107, "loss": 0.0151, "step": 244080 }, { "epoch": 0.63, "learning_rate": 0.00020509252658891959, "loss": 0.0172, "step": 244090 }, { "epoch": 0.63, "learning_rate": 0.00020508863837254815, "loss": 0.0158, "step": 244100 }, { "epoch": 0.63, "learning_rate": 0.00020508475015617667, "loss": 0.0193, "step": 244110 }, { "epoch": 0.63, "learning_rate": 0.0002050808619398052, "loss": 0.0132, "step": 244120 }, { "epoch": 0.63, "learning_rate": 0.00020507697372343372, "loss": 0.0142, "step": 244130 }, { "epoch": 0.63, "learning_rate": 0.00020507308550706227, "loss": 0.0164, "step": 244140 }, { "epoch": 0.63, "learning_rate": 0.00020506919729069084, "loss": 0.0165, "step": 244150 }, { "epoch": 0.63, "learning_rate": 0.00020506530907431935, "loss": 0.0157, "step": 244160 }, { "epoch": 0.63, "learning_rate": 0.0002050614208579479, "loss": 0.0251, "step": 244170 }, { "epoch": 0.63, "learning_rate": 0.0002050575326415764, "loss": 0.0166, "step": 244180 }, { "epoch": 0.63, "learning_rate": 0.00020505364442520497, "loss": 0.0128, "step": 244190 }, { "epoch": 0.63, "learning_rate": 0.0002050497562088335, "loss": 0.0135, "step": 244200 }, { "epoch": 0.63, "learning_rate": 0.00020504586799246203, "loss": 0.0133, "step": 244210 }, { "epoch": 0.63, "learning_rate": 0.00020504197977609055, "loss": 0.0218, "step": 244220 }, { "epoch": 0.63, "learning_rate": 0.00020503809155971911, "loss": 0.0167, "step": 244230 }, { "epoch": 0.63, "learning_rate": 0.00020503420334334763, "loss": 0.0185, "step": 244240 }, { "epoch": 0.63, "learning_rate": 0.00020503031512697617, "loss": 0.016, "step": 244250 }, { "epoch": 0.63, "learning_rate": 0.00020502642691060468, "loss": 0.0167, "step": 244260 }, { "epoch": 0.63, "learning_rate": 0.00020502253869423325, "loss": 0.0114, "step": 244270 }, { "epoch": 0.63, "learning_rate": 0.00020501865047786177, "loss": 0.0182, "step": 244280 }, { "epoch": 0.63, "learning_rate": 0.0002050147622614903, "loss": 0.0128, "step": 244290 }, { "epoch": 0.63, "learning_rate": 0.00020501087404511882, "loss": 0.0167, "step": 244300 }, { "epoch": 0.63, "learning_rate": 0.0002050069858287474, "loss": 0.014, "step": 244310 }, { "epoch": 0.63, "learning_rate": 0.00020500309761237593, "loss": 0.0161, "step": 244320 }, { "epoch": 0.63, "learning_rate": 0.00020499920939600445, "loss": 0.0175, "step": 244330 }, { "epoch": 0.63, "learning_rate": 0.00020499532117963296, "loss": 0.0182, "step": 244340 }, { "epoch": 0.63, "learning_rate": 0.00020499143296326153, "loss": 0.0172, "step": 244350 }, { "epoch": 0.63, "learning_rate": 0.00020498754474689007, "loss": 0.0168, "step": 244360 }, { "epoch": 0.63, "learning_rate": 0.0002049836565305186, "loss": 0.015, "step": 244370 }, { "epoch": 0.63, "learning_rate": 0.00020497976831414713, "loss": 0.0141, "step": 244380 }, { "epoch": 0.63, "learning_rate": 0.00020497588009777564, "loss": 0.0128, "step": 244390 }, { "epoch": 0.63, "learning_rate": 0.0002049719918814042, "loss": 0.0159, "step": 244400 }, { "epoch": 0.63, "learning_rate": 0.00020496810366503273, "loss": 0.0137, "step": 244410 }, { "epoch": 0.63, "learning_rate": 0.00020496421544866127, "loss": 0.0142, "step": 244420 }, { "epoch": 0.63, "learning_rate": 0.00020496032723228978, "loss": 0.0127, "step": 244430 }, { "epoch": 0.63, "learning_rate": 0.00020495643901591835, "loss": 0.0114, "step": 244440 }, { "epoch": 0.63, "learning_rate": 0.00020495255079954687, "loss": 0.0125, "step": 244450 }, { "epoch": 0.63, "learning_rate": 0.0002049486625831754, "loss": 0.013, "step": 244460 }, { "epoch": 0.63, "learning_rate": 0.00020494477436680392, "loss": 0.0176, "step": 244470 }, { "epoch": 0.63, "learning_rate": 0.0002049408861504325, "loss": 0.0137, "step": 244480 }, { "epoch": 0.63, "learning_rate": 0.000204936997934061, "loss": 0.0197, "step": 244490 }, { "epoch": 0.63, "learning_rate": 0.00020493310971768955, "loss": 0.0124, "step": 244500 }, { "epoch": 0.63, "learning_rate": 0.00020492922150131806, "loss": 0.0165, "step": 244510 }, { "epoch": 0.63, "learning_rate": 0.00020492533328494663, "loss": 0.0146, "step": 244520 }, { "epoch": 0.63, "learning_rate": 0.00020492144506857517, "loss": 0.014, "step": 244530 }, { "epoch": 0.63, "learning_rate": 0.0002049175568522037, "loss": 0.0146, "step": 244540 }, { "epoch": 0.63, "learning_rate": 0.00020491366863583223, "loss": 0.0212, "step": 244550 }, { "epoch": 0.63, "learning_rate": 0.00020490978041946077, "loss": 0.0142, "step": 244560 }, { "epoch": 0.63, "learning_rate": 0.0002049058922030893, "loss": 0.0166, "step": 244570 }, { "epoch": 0.63, "learning_rate": 0.00020490200398671783, "loss": 0.0132, "step": 244580 }, { "epoch": 0.63, "learning_rate": 0.00020489811577034637, "loss": 0.0154, "step": 244590 }, { "epoch": 0.63, "learning_rate": 0.0002048942275539749, "loss": 0.0128, "step": 244600 }, { "epoch": 0.63, "learning_rate": 0.00020489033933760345, "loss": 0.0154, "step": 244610 }, { "epoch": 0.63, "learning_rate": 0.00020488645112123197, "loss": 0.0151, "step": 244620 }, { "epoch": 0.63, "learning_rate": 0.0002048825629048605, "loss": 0.0138, "step": 244630 }, { "epoch": 0.63, "learning_rate": 0.00020487867468848902, "loss": 0.0169, "step": 244640 }, { "epoch": 0.63, "learning_rate": 0.0002048747864721176, "loss": 0.0171, "step": 244650 }, { "epoch": 0.63, "learning_rate": 0.0002048708982557461, "loss": 0.018, "step": 244660 }, { "epoch": 0.63, "learning_rate": 0.00020486701003937465, "loss": 0.0181, "step": 244670 }, { "epoch": 0.63, "learning_rate": 0.00020486312182300316, "loss": 0.0249, "step": 244680 }, { "epoch": 0.63, "learning_rate": 0.00020485923360663173, "loss": 0.012, "step": 244690 }, { "epoch": 0.63, "learning_rate": 0.00020485534539026027, "loss": 0.0156, "step": 244700 }, { "epoch": 0.63, "learning_rate": 0.0002048514571738888, "loss": 0.014, "step": 244710 }, { "epoch": 0.63, "learning_rate": 0.00020484756895751733, "loss": 0.0159, "step": 244720 }, { "epoch": 0.63, "learning_rate": 0.00020484368074114587, "loss": 0.0196, "step": 244730 }, { "epoch": 0.63, "learning_rate": 0.0002048397925247744, "loss": 0.0195, "step": 244740 }, { "epoch": 0.63, "learning_rate": 0.00020483590430840293, "loss": 0.0127, "step": 244750 }, { "epoch": 0.63, "learning_rate": 0.00020483201609203147, "loss": 0.0154, "step": 244760 }, { "epoch": 0.63, "learning_rate": 0.00020482812787566, "loss": 0.0216, "step": 244770 }, { "epoch": 0.63, "learning_rate": 0.00020482423965928855, "loss": 0.015, "step": 244780 }, { "epoch": 0.63, "learning_rate": 0.00020482035144291707, "loss": 0.017, "step": 244790 }, { "epoch": 0.63, "learning_rate": 0.0002048164632265456, "loss": 0.018, "step": 244800 }, { "epoch": 0.63, "learning_rate": 0.00020481257501017415, "loss": 0.0169, "step": 244810 }, { "epoch": 0.63, "learning_rate": 0.0002048086867938027, "loss": 0.0145, "step": 244820 }, { "epoch": 0.63, "learning_rate": 0.0002048047985774312, "loss": 0.0245, "step": 244830 }, { "epoch": 0.63, "learning_rate": 0.00020480091036105975, "loss": 0.0175, "step": 244840 }, { "epoch": 0.63, "learning_rate": 0.00020479702214468832, "loss": 0.0145, "step": 244850 }, { "epoch": 0.63, "learning_rate": 0.00020479313392831683, "loss": 0.0165, "step": 244860 }, { "epoch": 0.63, "learning_rate": 0.00020478924571194537, "loss": 0.0128, "step": 244870 }, { "epoch": 0.63, "learning_rate": 0.0002047853574955739, "loss": 0.0171, "step": 244880 }, { "epoch": 0.63, "learning_rate": 0.0002047814692792024, "loss": 0.0132, "step": 244890 }, { "epoch": 0.63, "learning_rate": 0.00020477758106283097, "loss": 0.015, "step": 244900 }, { "epoch": 0.63, "learning_rate": 0.0002047736928464595, "loss": 0.0155, "step": 244910 }, { "epoch": 0.63, "learning_rate": 0.00020476980463008803, "loss": 0.0154, "step": 244920 }, { "epoch": 0.63, "learning_rate": 0.00020476591641371657, "loss": 0.014, "step": 244930 }, { "epoch": 0.63, "learning_rate": 0.0002047620281973451, "loss": 0.021, "step": 244940 }, { "epoch": 0.63, "learning_rate": 0.00020475813998097365, "loss": 0.0161, "step": 244950 }, { "epoch": 0.63, "learning_rate": 0.00020475425176460217, "loss": 0.0181, "step": 244960 }, { "epoch": 0.63, "learning_rate": 0.0002047503635482307, "loss": 0.0152, "step": 244970 }, { "epoch": 0.64, "learning_rate": 0.00020474647533185925, "loss": 0.0167, "step": 244980 }, { "epoch": 0.64, "learning_rate": 0.0002047425871154878, "loss": 0.0157, "step": 244990 }, { "epoch": 0.64, "learning_rate": 0.0002047386988991163, "loss": 0.0122, "step": 245000 }, { "epoch": 0.64, "eval_cer": 0.8817726681698768, "eval_loss": 0.011478559114038944, "eval_runtime": 107.2432, "eval_samples_per_second": 18.649, "eval_steps_per_second": 4.662, "step": 245000 }, { "epoch": 0.64, "learning_rate": 0.00020473481068274485, "loss": 0.0153, "step": 245010 }, { "epoch": 0.64, "learning_rate": 0.00020473092246637342, "loss": 0.0166, "step": 245020 }, { "epoch": 0.64, "learning_rate": 0.00020472703425000193, "loss": 0.0161, "step": 245030 }, { "epoch": 0.64, "learning_rate": 0.00020472314603363047, "loss": 0.0147, "step": 245040 }, { "epoch": 0.64, "learning_rate": 0.00020471925781725899, "loss": 0.014, "step": 245050 }, { "epoch": 0.64, "learning_rate": 0.00020471536960088755, "loss": 0.0186, "step": 245060 }, { "epoch": 0.64, "learning_rate": 0.00020471148138451607, "loss": 0.0169, "step": 245070 }, { "epoch": 0.64, "learning_rate": 0.0002047075931681446, "loss": 0.0161, "step": 245080 }, { "epoch": 0.64, "learning_rate": 0.00020470370495177313, "loss": 0.0151, "step": 245090 }, { "epoch": 0.64, "learning_rate": 0.0002046998167354017, "loss": 0.0149, "step": 245100 }, { "epoch": 0.64, "learning_rate": 0.0002046959285190302, "loss": 0.0182, "step": 245110 }, { "epoch": 0.64, "learning_rate": 0.00020469204030265875, "loss": 0.0186, "step": 245120 }, { "epoch": 0.64, "learning_rate": 0.00020468815208628727, "loss": 0.0185, "step": 245130 }, { "epoch": 0.64, "learning_rate": 0.0002046842638699158, "loss": 0.0187, "step": 245140 }, { "epoch": 0.64, "learning_rate": 0.00020468037565354435, "loss": 0.014, "step": 245150 }, { "epoch": 0.64, "learning_rate": 0.0002046764874371729, "loss": 0.0187, "step": 245160 }, { "epoch": 0.64, "learning_rate": 0.0002046725992208014, "loss": 0.0198, "step": 245170 }, { "epoch": 0.64, "learning_rate": 0.00020466871100442995, "loss": 0.0141, "step": 245180 }, { "epoch": 0.64, "learning_rate": 0.00020466482278805851, "loss": 0.0184, "step": 245190 }, { "epoch": 0.64, "learning_rate": 0.00020466093457168703, "loss": 0.0189, "step": 245200 }, { "epoch": 0.64, "learning_rate": 0.00020465704635531554, "loss": 0.0163, "step": 245210 }, { "epoch": 0.64, "learning_rate": 0.00020465315813894409, "loss": 0.0161, "step": 245220 }, { "epoch": 0.64, "learning_rate": 0.00020464926992257265, "loss": 0.015, "step": 245230 }, { "epoch": 0.64, "learning_rate": 0.00020464538170620117, "loss": 0.0133, "step": 245240 }, { "epoch": 0.64, "learning_rate": 0.0002046414934898297, "loss": 0.0112, "step": 245250 }, { "epoch": 0.64, "learning_rate": 0.00020463760527345823, "loss": 0.0164, "step": 245260 }, { "epoch": 0.64, "learning_rate": 0.0002046337170570868, "loss": 0.0141, "step": 245270 }, { "epoch": 0.64, "learning_rate": 0.0002046298288407153, "loss": 0.014, "step": 245280 }, { "epoch": 0.64, "learning_rate": 0.00020462594062434385, "loss": 0.0188, "step": 245290 }, { "epoch": 0.64, "learning_rate": 0.00020462205240797236, "loss": 0.0184, "step": 245300 }, { "epoch": 0.64, "learning_rate": 0.00020461816419160093, "loss": 0.0157, "step": 245310 }, { "epoch": 0.64, "learning_rate": 0.00020461427597522945, "loss": 0.0158, "step": 245320 }, { "epoch": 0.64, "learning_rate": 0.000204610387758858, "loss": 0.017, "step": 245330 }, { "epoch": 0.64, "learning_rate": 0.0002046064995424865, "loss": 0.0173, "step": 245340 }, { "epoch": 0.64, "learning_rate": 0.00020460261132611507, "loss": 0.0132, "step": 245350 }, { "epoch": 0.64, "learning_rate": 0.00020459872310974361, "loss": 0.0146, "step": 245360 }, { "epoch": 0.64, "learning_rate": 0.00020459483489337213, "loss": 0.0158, "step": 245370 }, { "epoch": 0.64, "learning_rate": 0.00020459094667700064, "loss": 0.0142, "step": 245380 }, { "epoch": 0.64, "learning_rate": 0.00020458705846062918, "loss": 0.0132, "step": 245390 }, { "epoch": 0.64, "learning_rate": 0.00020458317024425775, "loss": 0.0148, "step": 245400 }, { "epoch": 0.64, "learning_rate": 0.00020457928202788627, "loss": 0.0305, "step": 245410 }, { "epoch": 0.64, "learning_rate": 0.0002045753938115148, "loss": 0.0171, "step": 245420 }, { "epoch": 0.64, "learning_rate": 0.00020457150559514332, "loss": 0.0151, "step": 245430 }, { "epoch": 0.64, "learning_rate": 0.0002045676173787719, "loss": 0.0135, "step": 245440 }, { "epoch": 0.64, "learning_rate": 0.0002045637291624004, "loss": 0.0151, "step": 245450 }, { "epoch": 0.64, "learning_rate": 0.00020455984094602895, "loss": 0.0169, "step": 245460 }, { "epoch": 0.64, "learning_rate": 0.00020455595272965746, "loss": 0.0175, "step": 245470 }, { "epoch": 0.64, "learning_rate": 0.00020455206451328603, "loss": 0.0179, "step": 245480 }, { "epoch": 0.64, "learning_rate": 0.00020454817629691455, "loss": 0.0182, "step": 245490 }, { "epoch": 0.64, "learning_rate": 0.0002045442880805431, "loss": 0.0139, "step": 245500 }, { "epoch": 0.64, "learning_rate": 0.0002045403998641716, "loss": 0.0186, "step": 245510 }, { "epoch": 0.64, "learning_rate": 0.00020453651164780017, "loss": 0.0185, "step": 245520 }, { "epoch": 0.64, "learning_rate": 0.0002045326234314287, "loss": 0.0174, "step": 245530 }, { "epoch": 0.64, "learning_rate": 0.00020452873521505723, "loss": 0.0161, "step": 245540 }, { "epoch": 0.64, "learning_rate": 0.00020452484699868574, "loss": 0.0115, "step": 245550 }, { "epoch": 0.64, "learning_rate": 0.0002045209587823143, "loss": 0.0181, "step": 245560 }, { "epoch": 0.64, "learning_rate": 0.00020451707056594285, "loss": 0.0155, "step": 245570 }, { "epoch": 0.64, "learning_rate": 0.00020451318234957137, "loss": 0.0162, "step": 245580 }, { "epoch": 0.64, "learning_rate": 0.0002045092941331999, "loss": 0.015, "step": 245590 }, { "epoch": 0.64, "learning_rate": 0.00020450540591682845, "loss": 0.02, "step": 245600 }, { "epoch": 0.64, "learning_rate": 0.000204501517700457, "loss": 0.0177, "step": 245610 }, { "epoch": 0.64, "learning_rate": 0.0002044976294840855, "loss": 0.0164, "step": 245620 }, { "epoch": 0.64, "learning_rate": 0.00020449374126771405, "loss": 0.0188, "step": 245630 }, { "epoch": 0.64, "learning_rate": 0.00020448985305134256, "loss": 0.0167, "step": 245640 }, { "epoch": 0.64, "learning_rate": 0.00020448596483497113, "loss": 0.0144, "step": 245650 }, { "epoch": 0.64, "learning_rate": 0.00020448207661859965, "loss": 0.0153, "step": 245660 }, { "epoch": 0.64, "learning_rate": 0.0002044781884022282, "loss": 0.0201, "step": 245670 }, { "epoch": 0.64, "learning_rate": 0.0002044743001858567, "loss": 0.0141, "step": 245680 }, { "epoch": 0.64, "learning_rate": 0.00020447041196948527, "loss": 0.0148, "step": 245690 }, { "epoch": 0.64, "learning_rate": 0.00020446652375311379, "loss": 0.0188, "step": 245700 }, { "epoch": 0.64, "learning_rate": 0.00020446263553674233, "loss": 0.0184, "step": 245710 }, { "epoch": 0.64, "learning_rate": 0.00020445874732037084, "loss": 0.0158, "step": 245720 }, { "epoch": 0.64, "learning_rate": 0.0002044548591039994, "loss": 0.0145, "step": 245730 }, { "epoch": 0.64, "learning_rate": 0.00020445097088762795, "loss": 0.016, "step": 245740 }, { "epoch": 0.64, "learning_rate": 0.00020444708267125647, "loss": 0.0117, "step": 245750 }, { "epoch": 0.64, "learning_rate": 0.000204443194454885, "loss": 0.0168, "step": 245760 }, { "epoch": 0.64, "learning_rate": 0.00020443930623851355, "loss": 0.0152, "step": 245770 }, { "epoch": 0.64, "learning_rate": 0.0002044354180221421, "loss": 0.0194, "step": 245780 }, { "epoch": 0.64, "learning_rate": 0.0002044315298057706, "loss": 0.0176, "step": 245790 }, { "epoch": 0.64, "learning_rate": 0.00020442764158939915, "loss": 0.0145, "step": 245800 }, { "epoch": 0.64, "learning_rate": 0.0002044237533730277, "loss": 0.0159, "step": 245810 }, { "epoch": 0.64, "learning_rate": 0.00020441986515665623, "loss": 0.0129, "step": 245820 }, { "epoch": 0.64, "learning_rate": 0.00020441597694028475, "loss": 0.0123, "step": 245830 }, { "epoch": 0.64, "learning_rate": 0.0002044120887239133, "loss": 0.0149, "step": 245840 }, { "epoch": 0.64, "learning_rate": 0.00020440820050754183, "loss": 0.0126, "step": 245850 }, { "epoch": 0.64, "learning_rate": 0.00020440431229117037, "loss": 0.0149, "step": 245860 }, { "epoch": 0.64, "learning_rate": 0.00020440042407479889, "loss": 0.0203, "step": 245870 }, { "epoch": 0.64, "learning_rate": 0.00020439653585842743, "loss": 0.0178, "step": 245880 }, { "epoch": 0.64, "learning_rate": 0.00020439264764205594, "loss": 0.0139, "step": 245890 }, { "epoch": 0.64, "learning_rate": 0.0002043887594256845, "loss": 0.0165, "step": 245900 }, { "epoch": 0.64, "learning_rate": 0.00020438487120931305, "loss": 0.0207, "step": 245910 }, { "epoch": 0.64, "learning_rate": 0.00020438098299294157, "loss": 0.0173, "step": 245920 }, { "epoch": 0.64, "learning_rate": 0.00020437709477657008, "loss": 0.0154, "step": 245930 }, { "epoch": 0.64, "learning_rate": 0.00020437320656019865, "loss": 0.0181, "step": 245940 }, { "epoch": 0.64, "learning_rate": 0.0002043693183438272, "loss": 0.0189, "step": 245950 }, { "epoch": 0.64, "learning_rate": 0.0002043654301274557, "loss": 0.0149, "step": 245960 }, { "epoch": 0.64, "learning_rate": 0.00020436154191108425, "loss": 0.0143, "step": 245970 }, { "epoch": 0.64, "learning_rate": 0.0002043576536947128, "loss": 0.0128, "step": 245980 }, { "epoch": 0.64, "learning_rate": 0.00020435376547834133, "loss": 0.0153, "step": 245990 }, { "epoch": 0.64, "learning_rate": 0.00020434987726196985, "loss": 0.0153, "step": 246000 }, { "epoch": 0.64, "eval_cer": 0.8817628707113375, "eval_loss": 0.011506488546729088, "eval_runtime": 107.342, "eval_samples_per_second": 18.632, "eval_steps_per_second": 4.658, "step": 246000 }, { "epoch": 0.64, "learning_rate": 0.0002043459890455984, "loss": 0.0135, "step": 246010 }, { "epoch": 0.64, "learning_rate": 0.00020434210082922693, "loss": 0.0135, "step": 246020 }, { "epoch": 0.64, "learning_rate": 0.00020433821261285547, "loss": 0.018, "step": 246030 }, { "epoch": 0.64, "learning_rate": 0.00020433432439648398, "loss": 0.0146, "step": 246040 }, { "epoch": 0.64, "learning_rate": 0.00020433043618011253, "loss": 0.0136, "step": 246050 }, { "epoch": 0.64, "learning_rate": 0.0002043265479637411, "loss": 0.0145, "step": 246060 }, { "epoch": 0.64, "learning_rate": 0.0002043226597473696, "loss": 0.017, "step": 246070 }, { "epoch": 0.64, "learning_rate": 0.00020431877153099812, "loss": 0.0216, "step": 246080 }, { "epoch": 0.64, "learning_rate": 0.00020431488331462667, "loss": 0.0151, "step": 246090 }, { "epoch": 0.64, "learning_rate": 0.00020431099509825523, "loss": 0.014, "step": 246100 }, { "epoch": 0.64, "learning_rate": 0.00020430710688188375, "loss": 0.0177, "step": 246110 }, { "epoch": 0.64, "learning_rate": 0.0002043032186655123, "loss": 0.0147, "step": 246120 }, { "epoch": 0.64, "learning_rate": 0.0002042993304491408, "loss": 0.0142, "step": 246130 }, { "epoch": 0.64, "learning_rate": 0.00020429544223276935, "loss": 0.016, "step": 246140 }, { "epoch": 0.64, "learning_rate": 0.0002042915540163979, "loss": 0.0143, "step": 246150 }, { "epoch": 0.64, "learning_rate": 0.00020428766580002643, "loss": 0.0172, "step": 246160 }, { "epoch": 0.64, "learning_rate": 0.00020428377758365494, "loss": 0.0115, "step": 246170 }, { "epoch": 0.64, "learning_rate": 0.0002042798893672835, "loss": 0.0169, "step": 246180 }, { "epoch": 0.64, "learning_rate": 0.00020427600115091203, "loss": 0.0147, "step": 246190 }, { "epoch": 0.64, "learning_rate": 0.00020427211293454057, "loss": 0.0184, "step": 246200 }, { "epoch": 0.64, "learning_rate": 0.00020426822471816908, "loss": 0.0138, "step": 246210 }, { "epoch": 0.64, "learning_rate": 0.00020426433650179763, "loss": 0.0151, "step": 246220 }, { "epoch": 0.64, "learning_rate": 0.0002042604482854262, "loss": 0.0135, "step": 246230 }, { "epoch": 0.64, "learning_rate": 0.0002042565600690547, "loss": 0.0151, "step": 246240 }, { "epoch": 0.64, "learning_rate": 0.00020425267185268322, "loss": 0.0198, "step": 246250 }, { "epoch": 0.64, "learning_rate": 0.00020424878363631177, "loss": 0.0169, "step": 246260 }, { "epoch": 0.64, "learning_rate": 0.00020424489541994033, "loss": 0.0185, "step": 246270 }, { "epoch": 0.64, "learning_rate": 0.00020424100720356885, "loss": 0.0188, "step": 246280 }, { "epoch": 0.64, "learning_rate": 0.0002042371189871974, "loss": 0.0148, "step": 246290 }, { "epoch": 0.64, "learning_rate": 0.0002042332307708259, "loss": 0.0135, "step": 246300 }, { "epoch": 0.64, "learning_rate": 0.00020422934255445447, "loss": 0.0154, "step": 246310 }, { "epoch": 0.64, "learning_rate": 0.000204225454338083, "loss": 0.0181, "step": 246320 }, { "epoch": 0.64, "learning_rate": 0.00020422156612171153, "loss": 0.0155, "step": 246330 }, { "epoch": 0.64, "learning_rate": 0.00020421767790534004, "loss": 0.0141, "step": 246340 }, { "epoch": 0.64, "learning_rate": 0.0002042137896889686, "loss": 0.0144, "step": 246350 }, { "epoch": 0.64, "learning_rate": 0.00020420990147259713, "loss": 0.0142, "step": 246360 }, { "epoch": 0.64, "learning_rate": 0.00020420601325622567, "loss": 0.0156, "step": 246370 }, { "epoch": 0.64, "learning_rate": 0.00020420212503985418, "loss": 0.0169, "step": 246380 }, { "epoch": 0.64, "learning_rate": 0.00020419823682348273, "loss": 0.0131, "step": 246390 }, { "epoch": 0.64, "learning_rate": 0.00020419434860711127, "loss": 0.0162, "step": 246400 }, { "epoch": 0.64, "learning_rate": 0.0002041904603907398, "loss": 0.0138, "step": 246410 }, { "epoch": 0.64, "learning_rate": 0.00020418657217436832, "loss": 0.0153, "step": 246420 }, { "epoch": 0.64, "learning_rate": 0.00020418268395799686, "loss": 0.0131, "step": 246430 }, { "epoch": 0.64, "learning_rate": 0.00020417879574162543, "loss": 0.0127, "step": 246440 }, { "epoch": 0.64, "learning_rate": 0.00020417490752525395, "loss": 0.0167, "step": 246450 }, { "epoch": 0.64, "learning_rate": 0.0002041710193088825, "loss": 0.015, "step": 246460 }, { "epoch": 0.64, "learning_rate": 0.000204167131092511, "loss": 0.0145, "step": 246470 }, { "epoch": 0.64, "learning_rate": 0.00020416324287613957, "loss": 0.0146, "step": 246480 }, { "epoch": 0.64, "learning_rate": 0.0002041593546597681, "loss": 0.0136, "step": 246490 }, { "epoch": 0.64, "learning_rate": 0.00020415546644339663, "loss": 0.0156, "step": 246500 }, { "epoch": 0.64, "learning_rate": 0.00020415157822702514, "loss": 0.0162, "step": 246510 }, { "epoch": 0.64, "learning_rate": 0.0002041476900106537, "loss": 0.0163, "step": 246520 }, { "epoch": 0.64, "learning_rate": 0.00020414380179428223, "loss": 0.0172, "step": 246530 }, { "epoch": 0.64, "learning_rate": 0.00020413991357791077, "loss": 0.0157, "step": 246540 }, { "epoch": 0.64, "learning_rate": 0.00020413602536153928, "loss": 0.013, "step": 246550 }, { "epoch": 0.64, "learning_rate": 0.00020413213714516785, "loss": 0.0184, "step": 246560 }, { "epoch": 0.64, "learning_rate": 0.00020412824892879637, "loss": 0.0153, "step": 246570 }, { "epoch": 0.64, "learning_rate": 0.0002041243607124249, "loss": 0.0177, "step": 246580 }, { "epoch": 0.64, "learning_rate": 0.00020412047249605342, "loss": 0.0156, "step": 246590 }, { "epoch": 0.64, "learning_rate": 0.000204116584279682, "loss": 0.0156, "step": 246600 }, { "epoch": 0.64, "learning_rate": 0.00020411269606331053, "loss": 0.0165, "step": 246610 }, { "epoch": 0.64, "learning_rate": 0.00020410880784693905, "loss": 0.0165, "step": 246620 }, { "epoch": 0.64, "learning_rate": 0.0002041049196305676, "loss": 0.0146, "step": 246630 }, { "epoch": 0.64, "learning_rate": 0.0002041010314141961, "loss": 0.0157, "step": 246640 }, { "epoch": 0.64, "learning_rate": 0.00020409714319782467, "loss": 0.0212, "step": 246650 }, { "epoch": 0.64, "learning_rate": 0.0002040932549814532, "loss": 0.0142, "step": 246660 }, { "epoch": 0.64, "learning_rate": 0.00020408936676508173, "loss": 0.0138, "step": 246670 }, { "epoch": 0.64, "learning_rate": 0.00020408547854871024, "loss": 0.0155, "step": 246680 }, { "epoch": 0.64, "learning_rate": 0.0002040815903323388, "loss": 0.0147, "step": 246690 }, { "epoch": 0.64, "learning_rate": 0.00020407770211596733, "loss": 0.0129, "step": 246700 }, { "epoch": 0.64, "learning_rate": 0.00020407381389959587, "loss": 0.0202, "step": 246710 }, { "epoch": 0.64, "learning_rate": 0.00020406992568322438, "loss": 0.0138, "step": 246720 }, { "epoch": 0.64, "learning_rate": 0.00020406603746685295, "loss": 0.0155, "step": 246730 }, { "epoch": 0.64, "learning_rate": 0.00020406214925048147, "loss": 0.0143, "step": 246740 }, { "epoch": 0.64, "learning_rate": 0.00020405826103411, "loss": 0.0133, "step": 246750 }, { "epoch": 0.64, "learning_rate": 0.00020405437281773852, "loss": 0.0155, "step": 246760 }, { "epoch": 0.64, "learning_rate": 0.0002040504846013671, "loss": 0.0132, "step": 246770 }, { "epoch": 0.64, "learning_rate": 0.00020404659638499563, "loss": 0.0177, "step": 246780 }, { "epoch": 0.64, "learning_rate": 0.00020404270816862415, "loss": 0.0146, "step": 246790 }, { "epoch": 0.64, "learning_rate": 0.00020403881995225266, "loss": 0.0144, "step": 246800 }, { "epoch": 0.64, "learning_rate": 0.00020403493173588123, "loss": 0.0141, "step": 246810 }, { "epoch": 0.64, "learning_rate": 0.00020403104351950977, "loss": 0.0197, "step": 246820 }, { "epoch": 0.64, "learning_rate": 0.00020402715530313829, "loss": 0.0156, "step": 246830 }, { "epoch": 0.64, "learning_rate": 0.00020402326708676683, "loss": 0.0179, "step": 246840 }, { "epoch": 0.64, "learning_rate": 0.00020401937887039537, "loss": 0.0171, "step": 246850 }, { "epoch": 0.64, "learning_rate": 0.0002040154906540239, "loss": 0.0153, "step": 246860 }, { "epoch": 0.64, "learning_rate": 0.00020401160243765243, "loss": 0.014, "step": 246870 }, { "epoch": 0.64, "learning_rate": 0.00020400771422128097, "loss": 0.0168, "step": 246880 }, { "epoch": 0.64, "learning_rate": 0.00020400382600490948, "loss": 0.0132, "step": 246890 }, { "epoch": 0.64, "learning_rate": 0.00020399993778853805, "loss": 0.0167, "step": 246900 }, { "epoch": 0.64, "learning_rate": 0.00020399604957216657, "loss": 0.0185, "step": 246910 }, { "epoch": 0.64, "learning_rate": 0.0002039921613557951, "loss": 0.0171, "step": 246920 }, { "epoch": 0.64, "learning_rate": 0.00020398827313942362, "loss": 0.0124, "step": 246930 }, { "epoch": 0.64, "learning_rate": 0.0002039843849230522, "loss": 0.0142, "step": 246940 }, { "epoch": 0.64, "learning_rate": 0.00020398049670668073, "loss": 0.0141, "step": 246950 }, { "epoch": 0.64, "learning_rate": 0.00020397660849030925, "loss": 0.0164, "step": 246960 }, { "epoch": 0.64, "learning_rate": 0.00020397272027393776, "loss": 0.016, "step": 246970 }, { "epoch": 0.64, "learning_rate": 0.00020396883205756633, "loss": 0.0165, "step": 246980 }, { "epoch": 0.64, "learning_rate": 0.00020396494384119487, "loss": 0.0137, "step": 246990 }, { "epoch": 0.64, "learning_rate": 0.00020396105562482339, "loss": 0.0184, "step": 247000 }, { "epoch": 0.64, "eval_cer": 0.8817614710744033, "eval_loss": 0.01131850853562355, "eval_runtime": 107.4227, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.655, "step": 247000 }, { "epoch": 0.64, "learning_rate": 0.00020395716740845193, "loss": 0.0158, "step": 247010 }, { "epoch": 0.64, "learning_rate": 0.00020395327919208047, "loss": 0.0169, "step": 247020 }, { "epoch": 0.64, "learning_rate": 0.000203949390975709, "loss": 0.0142, "step": 247030 }, { "epoch": 0.64, "learning_rate": 0.00020394550275933753, "loss": 0.0142, "step": 247040 }, { "epoch": 0.64, "learning_rate": 0.00020394161454296607, "loss": 0.0199, "step": 247050 }, { "epoch": 0.64, "learning_rate": 0.0002039377263265946, "loss": 0.02, "step": 247060 }, { "epoch": 0.64, "learning_rate": 0.00020393383811022315, "loss": 0.0165, "step": 247070 }, { "epoch": 0.64, "learning_rate": 0.00020392994989385166, "loss": 0.0178, "step": 247080 }, { "epoch": 0.64, "learning_rate": 0.0002039260616774802, "loss": 0.0123, "step": 247090 }, { "epoch": 0.64, "learning_rate": 0.00020392217346110878, "loss": 0.016, "step": 247100 }, { "epoch": 0.64, "learning_rate": 0.0002039182852447373, "loss": 0.0165, "step": 247110 }, { "epoch": 0.64, "learning_rate": 0.0002039143970283658, "loss": 0.0141, "step": 247120 }, { "epoch": 0.64, "learning_rate": 0.00020391050881199435, "loss": 0.0162, "step": 247130 }, { "epoch": 0.64, "learning_rate": 0.00020390662059562286, "loss": 0.0126, "step": 247140 }, { "epoch": 0.64, "learning_rate": 0.00020390273237925143, "loss": 0.0151, "step": 247150 }, { "epoch": 0.64, "learning_rate": 0.00020389884416287997, "loss": 0.0125, "step": 247160 }, { "epoch": 0.64, "learning_rate": 0.00020389495594650849, "loss": 0.0157, "step": 247170 }, { "epoch": 0.64, "learning_rate": 0.00020389106773013703, "loss": 0.0188, "step": 247180 }, { "epoch": 0.64, "learning_rate": 0.00020388717951376557, "loss": 0.0155, "step": 247190 }, { "epoch": 0.64, "learning_rate": 0.0002038832912973941, "loss": 0.0135, "step": 247200 }, { "epoch": 0.64, "learning_rate": 0.00020387940308102262, "loss": 0.0131, "step": 247210 }, { "epoch": 0.64, "learning_rate": 0.00020387551486465117, "loss": 0.013, "step": 247220 }, { "epoch": 0.64, "learning_rate": 0.0002038716266482797, "loss": 0.0181, "step": 247230 }, { "epoch": 0.64, "learning_rate": 0.00020386773843190825, "loss": 0.0176, "step": 247240 }, { "epoch": 0.64, "learning_rate": 0.00020386385021553676, "loss": 0.0132, "step": 247250 }, { "epoch": 0.64, "learning_rate": 0.0002038599619991653, "loss": 0.0237, "step": 247260 }, { "epoch": 0.64, "learning_rate": 0.00020385607378279385, "loss": 0.0177, "step": 247270 }, { "epoch": 0.64, "learning_rate": 0.0002038521855664224, "loss": 0.0139, "step": 247280 }, { "epoch": 0.64, "learning_rate": 0.0002038482973500509, "loss": 0.0179, "step": 247290 }, { "epoch": 0.64, "learning_rate": 0.00020384440913367945, "loss": 0.0158, "step": 247300 }, { "epoch": 0.64, "learning_rate": 0.00020384052091730801, "loss": 0.0178, "step": 247310 }, { "epoch": 0.64, "learning_rate": 0.00020383663270093653, "loss": 0.0196, "step": 247320 }, { "epoch": 0.64, "learning_rate": 0.00020383274448456507, "loss": 0.0115, "step": 247330 }, { "epoch": 0.64, "learning_rate": 0.00020382885626819358, "loss": 0.0156, "step": 247340 }, { "epoch": 0.64, "learning_rate": 0.00020382496805182215, "loss": 0.0142, "step": 247350 }, { "epoch": 0.64, "learning_rate": 0.00020382107983545067, "loss": 0.0144, "step": 247360 }, { "epoch": 0.64, "learning_rate": 0.0002038171916190792, "loss": 0.0184, "step": 247370 }, { "epoch": 0.64, "learning_rate": 0.00020381330340270772, "loss": 0.0143, "step": 247380 }, { "epoch": 0.64, "learning_rate": 0.00020380941518633627, "loss": 0.0211, "step": 247390 }, { "epoch": 0.64, "learning_rate": 0.0002038055269699648, "loss": 0.0194, "step": 247400 }, { "epoch": 0.64, "learning_rate": 0.00020380163875359335, "loss": 0.013, "step": 247410 }, { "epoch": 0.64, "learning_rate": 0.00020379775053722186, "loss": 0.0122, "step": 247420 }, { "epoch": 0.64, "learning_rate": 0.0002037938623208504, "loss": 0.0178, "step": 247430 }, { "epoch": 0.64, "learning_rate": 0.00020378997410447895, "loss": 0.0121, "step": 247440 }, { "epoch": 0.64, "learning_rate": 0.0002037860858881075, "loss": 0.0165, "step": 247450 }, { "epoch": 0.64, "learning_rate": 0.000203782197671736, "loss": 0.0141, "step": 247460 }, { "epoch": 0.64, "learning_rate": 0.00020377830945536454, "loss": 0.0133, "step": 247470 }, { "epoch": 0.64, "learning_rate": 0.0002037744212389931, "loss": 0.0151, "step": 247480 }, { "epoch": 0.64, "learning_rate": 0.00020377053302262163, "loss": 0.0154, "step": 247490 }, { "epoch": 0.64, "learning_rate": 0.00020376664480625017, "loss": 0.0229, "step": 247500 }, { "epoch": 0.64, "learning_rate": 0.00020376275658987868, "loss": 0.0154, "step": 247510 }, { "epoch": 0.64, "learning_rate": 0.00020375886837350725, "loss": 0.0148, "step": 247520 }, { "epoch": 0.64, "learning_rate": 0.00020375498015713577, "loss": 0.0144, "step": 247530 }, { "epoch": 0.64, "learning_rate": 0.0002037510919407643, "loss": 0.0148, "step": 247540 }, { "epoch": 0.64, "learning_rate": 0.00020374720372439282, "loss": 0.0106, "step": 247550 }, { "epoch": 0.64, "learning_rate": 0.0002037433155080214, "loss": 0.0144, "step": 247560 }, { "epoch": 0.64, "learning_rate": 0.0002037394272916499, "loss": 0.0206, "step": 247570 }, { "epoch": 0.64, "learning_rate": 0.00020373553907527845, "loss": 0.014, "step": 247580 }, { "epoch": 0.64, "learning_rate": 0.00020373165085890696, "loss": 0.0136, "step": 247590 }, { "epoch": 0.64, "learning_rate": 0.00020372776264253553, "loss": 0.0192, "step": 247600 }, { "epoch": 0.64, "learning_rate": 0.00020372387442616405, "loss": 0.0211, "step": 247610 }, { "epoch": 0.64, "learning_rate": 0.0002037199862097926, "loss": 0.0148, "step": 247620 }, { "epoch": 0.64, "learning_rate": 0.0002037160979934211, "loss": 0.0176, "step": 247630 }, { "epoch": 0.64, "learning_rate": 0.00020371220977704964, "loss": 0.0166, "step": 247640 }, { "epoch": 0.64, "learning_rate": 0.0002037083215606782, "loss": 0.0136, "step": 247650 }, { "epoch": 0.64, "learning_rate": 0.00020370443334430673, "loss": 0.0188, "step": 247660 }, { "epoch": 0.64, "learning_rate": 0.00020370054512793524, "loss": 0.015, "step": 247670 }, { "epoch": 0.64, "learning_rate": 0.00020369665691156378, "loss": 0.0145, "step": 247680 }, { "epoch": 0.64, "learning_rate": 0.00020369276869519235, "loss": 0.0129, "step": 247690 }, { "epoch": 0.64, "learning_rate": 0.00020368888047882087, "loss": 0.0157, "step": 247700 }, { "epoch": 0.64, "learning_rate": 0.0002036849922624494, "loss": 0.0194, "step": 247710 }, { "epoch": 0.64, "learning_rate": 0.00020368110404607792, "loss": 0.0171, "step": 247720 }, { "epoch": 0.64, "learning_rate": 0.0002036772158297065, "loss": 0.0133, "step": 247730 }, { "epoch": 0.64, "learning_rate": 0.000203673327613335, "loss": 0.0194, "step": 247740 }, { "epoch": 0.64, "learning_rate": 0.00020366943939696355, "loss": 0.0175, "step": 247750 }, { "epoch": 0.64, "learning_rate": 0.00020366555118059206, "loss": 0.0208, "step": 247760 }, { "epoch": 0.64, "learning_rate": 0.00020366166296422063, "loss": 0.0169, "step": 247770 }, { "epoch": 0.64, "learning_rate": 0.00020365777474784915, "loss": 0.0147, "step": 247780 }, { "epoch": 0.64, "learning_rate": 0.0002036538865314777, "loss": 0.0194, "step": 247790 }, { "epoch": 0.64, "learning_rate": 0.0002036499983151062, "loss": 0.0217, "step": 247800 }, { "epoch": 0.64, "learning_rate": 0.00020364611009873477, "loss": 0.0149, "step": 247810 }, { "epoch": 0.64, "learning_rate": 0.0002036422218823633, "loss": 0.0134, "step": 247820 }, { "epoch": 0.64, "learning_rate": 0.00020363833366599183, "loss": 0.0152, "step": 247830 }, { "epoch": 0.64, "learning_rate": 0.00020363444544962034, "loss": 0.0139, "step": 247840 }, { "epoch": 0.64, "learning_rate": 0.0002036305572332489, "loss": 0.0204, "step": 247850 }, { "epoch": 0.64, "learning_rate": 0.00020362666901687745, "loss": 0.0137, "step": 247860 }, { "epoch": 0.64, "learning_rate": 0.00020362278080050597, "loss": 0.0187, "step": 247870 }, { "epoch": 0.64, "learning_rate": 0.0002036188925841345, "loss": 0.0137, "step": 247880 }, { "epoch": 0.64, "learning_rate": 0.00020361500436776302, "loss": 0.0145, "step": 247890 }, { "epoch": 0.64, "learning_rate": 0.0002036111161513916, "loss": 0.015, "step": 247900 }, { "epoch": 0.64, "learning_rate": 0.0002036072279350201, "loss": 0.0172, "step": 247910 }, { "epoch": 0.64, "learning_rate": 0.00020360333971864865, "loss": 0.0162, "step": 247920 }, { "epoch": 0.64, "learning_rate": 0.00020359945150227716, "loss": 0.0152, "step": 247930 }, { "epoch": 0.64, "learning_rate": 0.00020359556328590573, "loss": 0.0166, "step": 247940 }, { "epoch": 0.64, "learning_rate": 0.00020359167506953425, "loss": 0.0151, "step": 247950 }, { "epoch": 0.64, "learning_rate": 0.0002035877868531628, "loss": 0.0137, "step": 247960 }, { "epoch": 0.64, "learning_rate": 0.0002035838986367913, "loss": 0.0139, "step": 247970 }, { "epoch": 0.64, "learning_rate": 0.00020358001042041987, "loss": 0.0153, "step": 247980 }, { "epoch": 0.64, "learning_rate": 0.00020357612220404838, "loss": 0.0156, "step": 247990 }, { "epoch": 0.64, "learning_rate": 0.00020357223398767693, "loss": 0.0167, "step": 248000 }, { "epoch": 0.64, "eval_cer": 0.8818244547364413, "eval_loss": 0.010956432670354843, "eval_runtime": 107.4182, "eval_samples_per_second": 18.619, "eval_steps_per_second": 4.655, "step": 248000 }, { "epoch": 0.64, "learning_rate": 0.00020356834577130544, "loss": 0.0128, "step": 248010 }, { "epoch": 0.64, "learning_rate": 0.000203564457554934, "loss": 0.018, "step": 248020 }, { "epoch": 0.64, "learning_rate": 0.00020356056933856255, "loss": 0.016, "step": 248030 }, { "epoch": 0.64, "learning_rate": 0.00020355668112219107, "loss": 0.0149, "step": 248040 }, { "epoch": 0.64, "learning_rate": 0.0002035527929058196, "loss": 0.0159, "step": 248050 }, { "epoch": 0.64, "learning_rate": 0.00020354890468944815, "loss": 0.016, "step": 248060 }, { "epoch": 0.64, "learning_rate": 0.0002035450164730767, "loss": 0.0149, "step": 248070 }, { "epoch": 0.64, "learning_rate": 0.0002035411282567052, "loss": 0.0139, "step": 248080 }, { "epoch": 0.64, "learning_rate": 0.00020353724004033375, "loss": 0.016, "step": 248090 }, { "epoch": 0.64, "learning_rate": 0.0002035333518239623, "loss": 0.016, "step": 248100 }, { "epoch": 0.64, "learning_rate": 0.00020352946360759083, "loss": 0.0153, "step": 248110 }, { "epoch": 0.64, "learning_rate": 0.00020352557539121934, "loss": 0.0231, "step": 248120 }, { "epoch": 0.64, "learning_rate": 0.00020352168717484789, "loss": 0.0148, "step": 248130 }, { "epoch": 0.64, "learning_rate": 0.0002035177989584764, "loss": 0.0139, "step": 248140 }, { "epoch": 0.64, "learning_rate": 0.00020351391074210497, "loss": 0.0151, "step": 248150 }, { "epoch": 0.64, "learning_rate": 0.00020351002252573348, "loss": 0.0125, "step": 248160 }, { "epoch": 0.64, "learning_rate": 0.00020350613430936203, "loss": 0.0156, "step": 248170 }, { "epoch": 0.64, "learning_rate": 0.00020350224609299054, "loss": 0.0159, "step": 248180 }, { "epoch": 0.64, "learning_rate": 0.0002034983578766191, "loss": 0.018, "step": 248190 }, { "epoch": 0.64, "learning_rate": 0.00020349446966024765, "loss": 0.0171, "step": 248200 }, { "epoch": 0.64, "learning_rate": 0.00020349058144387617, "loss": 0.0154, "step": 248210 }, { "epoch": 0.64, "learning_rate": 0.0002034866932275047, "loss": 0.0157, "step": 248220 }, { "epoch": 0.64, "learning_rate": 0.00020348280501113325, "loss": 0.0163, "step": 248230 }, { "epoch": 0.64, "learning_rate": 0.0002034789167947618, "loss": 0.0162, "step": 248240 }, { "epoch": 0.64, "learning_rate": 0.0002034750285783903, "loss": 0.0154, "step": 248250 }, { "epoch": 0.64, "learning_rate": 0.00020347114036201885, "loss": 0.0207, "step": 248260 }, { "epoch": 0.64, "learning_rate": 0.0002034672521456474, "loss": 0.0157, "step": 248270 }, { "epoch": 0.64, "learning_rate": 0.00020346336392927593, "loss": 0.0145, "step": 248280 }, { "epoch": 0.64, "learning_rate": 0.00020345947571290444, "loss": 0.0125, "step": 248290 }, { "epoch": 0.64, "learning_rate": 0.00020345558749653299, "loss": 0.0134, "step": 248300 }, { "epoch": 0.64, "learning_rate": 0.00020345169928016153, "loss": 0.018, "step": 248310 }, { "epoch": 0.64, "learning_rate": 0.00020344781106379007, "loss": 0.0136, "step": 248320 }, { "epoch": 0.64, "learning_rate": 0.00020344392284741858, "loss": 0.0167, "step": 248330 }, { "epoch": 0.64, "learning_rate": 0.00020344003463104712, "loss": 0.0136, "step": 248340 }, { "epoch": 0.64, "learning_rate": 0.0002034361464146757, "loss": 0.0199, "step": 248350 }, { "epoch": 0.64, "learning_rate": 0.0002034322581983042, "loss": 0.0166, "step": 248360 }, { "epoch": 0.64, "learning_rate": 0.00020342836998193275, "loss": 0.0154, "step": 248370 }, { "epoch": 0.64, "learning_rate": 0.00020342448176556126, "loss": 0.0154, "step": 248380 }, { "epoch": 0.64, "learning_rate": 0.00020342059354918978, "loss": 0.0139, "step": 248390 }, { "epoch": 0.64, "learning_rate": 0.00020341670533281835, "loss": 0.0142, "step": 248400 }, { "epoch": 0.64, "learning_rate": 0.0002034128171164469, "loss": 0.0135, "step": 248410 }, { "epoch": 0.64, "learning_rate": 0.0002034089289000754, "loss": 0.0147, "step": 248420 }, { "epoch": 0.64, "learning_rate": 0.00020340504068370395, "loss": 0.0143, "step": 248430 }, { "epoch": 0.64, "learning_rate": 0.0002034011524673325, "loss": 0.0157, "step": 248440 }, { "epoch": 0.64, "learning_rate": 0.00020339726425096103, "loss": 0.0125, "step": 248450 }, { "epoch": 0.64, "learning_rate": 0.00020339337603458954, "loss": 0.0149, "step": 248460 }, { "epoch": 0.64, "learning_rate": 0.00020338948781821808, "loss": 0.0154, "step": 248470 }, { "epoch": 0.64, "learning_rate": 0.00020338559960184663, "loss": 0.015, "step": 248480 }, { "epoch": 0.64, "learning_rate": 0.00020338171138547517, "loss": 0.016, "step": 248490 }, { "epoch": 0.64, "learning_rate": 0.00020337782316910368, "loss": 0.0148, "step": 248500 }, { "epoch": 0.64, "learning_rate": 0.00020337393495273222, "loss": 0.0199, "step": 248510 }, { "epoch": 0.64, "learning_rate": 0.0002033700467363608, "loss": 0.0181, "step": 248520 }, { "epoch": 0.64, "learning_rate": 0.0002033661585199893, "loss": 0.0116, "step": 248530 }, { "epoch": 0.64, "learning_rate": 0.00020336227030361785, "loss": 0.0127, "step": 248540 }, { "epoch": 0.64, "learning_rate": 0.00020335838208724636, "loss": 0.0151, "step": 248550 }, { "epoch": 0.64, "learning_rate": 0.00020335449387087493, "loss": 0.015, "step": 248560 }, { "epoch": 0.64, "learning_rate": 0.00020335060565450345, "loss": 0.0146, "step": 248570 }, { "epoch": 0.64, "learning_rate": 0.000203346717438132, "loss": 0.0136, "step": 248580 }, { "epoch": 0.64, "learning_rate": 0.0002033428292217605, "loss": 0.0141, "step": 248590 }, { "epoch": 0.64, "learning_rate": 0.00020333894100538907, "loss": 0.015, "step": 248600 }, { "epoch": 0.64, "learning_rate": 0.0002033350527890176, "loss": 0.0144, "step": 248610 }, { "epoch": 0.64, "learning_rate": 0.00020333116457264613, "loss": 0.0201, "step": 248620 }, { "epoch": 0.64, "learning_rate": 0.00020332727635627464, "loss": 0.0208, "step": 248630 }, { "epoch": 0.64, "learning_rate": 0.00020332338813990318, "loss": 0.0178, "step": 248640 }, { "epoch": 0.64, "learning_rate": 0.00020331949992353173, "loss": 0.0132, "step": 248650 }, { "epoch": 0.64, "learning_rate": 0.00020331561170716027, "loss": 0.0157, "step": 248660 }, { "epoch": 0.64, "learning_rate": 0.00020331172349078878, "loss": 0.0155, "step": 248670 }, { "epoch": 0.64, "learning_rate": 0.00020330783527441732, "loss": 0.0153, "step": 248680 }, { "epoch": 0.64, "learning_rate": 0.0002033039470580459, "loss": 0.0165, "step": 248690 }, { "epoch": 0.64, "learning_rate": 0.0002033000588416744, "loss": 0.0122, "step": 248700 }, { "epoch": 0.64, "learning_rate": 0.00020329617062530292, "loss": 0.0133, "step": 248710 }, { "epoch": 0.64, "learning_rate": 0.00020329228240893146, "loss": 0.0172, "step": 248720 }, { "epoch": 0.64, "learning_rate": 0.00020328839419256003, "loss": 0.0167, "step": 248730 }, { "epoch": 0.64, "learning_rate": 0.00020328450597618855, "loss": 0.0135, "step": 248740 }, { "epoch": 0.64, "learning_rate": 0.0002032806177598171, "loss": 0.0156, "step": 248750 }, { "epoch": 0.64, "learning_rate": 0.0002032767295434456, "loss": 0.0194, "step": 248760 }, { "epoch": 0.64, "learning_rate": 0.00020327284132707417, "loss": 0.0149, "step": 248770 }, { "epoch": 0.64, "learning_rate": 0.00020326895311070269, "loss": 0.0157, "step": 248780 }, { "epoch": 0.64, "learning_rate": 0.00020326506489433123, "loss": 0.0128, "step": 248790 }, { "epoch": 0.64, "learning_rate": 0.00020326117667795974, "loss": 0.0167, "step": 248800 }, { "epoch": 0.64, "learning_rate": 0.0002032572884615883, "loss": 0.0133, "step": 248810 }, { "epoch": 0.64, "learning_rate": 0.00020325340024521683, "loss": 0.0188, "step": 248820 }, { "epoch": 0.65, "learning_rate": 0.00020324951202884537, "loss": 0.0189, "step": 248830 }, { "epoch": 0.65, "learning_rate": 0.00020324562381247388, "loss": 0.0159, "step": 248840 }, { "epoch": 0.65, "learning_rate": 0.00020324173559610245, "loss": 0.0209, "step": 248850 }, { "epoch": 0.65, "learning_rate": 0.00020323784737973096, "loss": 0.0142, "step": 248860 }, { "epoch": 0.65, "learning_rate": 0.0002032339591633595, "loss": 0.0147, "step": 248870 }, { "epoch": 0.65, "learning_rate": 0.00020323007094698802, "loss": 0.015, "step": 248880 }, { "epoch": 0.65, "learning_rate": 0.00020322618273061656, "loss": 0.0135, "step": 248890 }, { "epoch": 0.65, "learning_rate": 0.00020322229451424513, "loss": 0.0187, "step": 248900 }, { "epoch": 0.65, "learning_rate": 0.00020321840629787365, "loss": 0.0146, "step": 248910 }, { "epoch": 0.65, "learning_rate": 0.0002032145180815022, "loss": 0.0153, "step": 248920 }, { "epoch": 0.65, "learning_rate": 0.0002032106298651307, "loss": 0.0173, "step": 248930 }, { "epoch": 0.65, "learning_rate": 0.00020320674164875927, "loss": 0.0142, "step": 248940 }, { "epoch": 0.65, "learning_rate": 0.00020320285343238779, "loss": 0.0195, "step": 248950 }, { "epoch": 0.65, "learning_rate": 0.00020319896521601633, "loss": 0.0166, "step": 248960 }, { "epoch": 0.65, "learning_rate": 0.00020319507699964484, "loss": 0.0148, "step": 248970 }, { "epoch": 0.65, "learning_rate": 0.0002031911887832734, "loss": 0.0167, "step": 248980 }, { "epoch": 0.65, "learning_rate": 0.00020318730056690192, "loss": 0.0188, "step": 248990 }, { "epoch": 0.65, "learning_rate": 0.00020318341235053047, "loss": 0.0168, "step": 249000 }, { "epoch": 0.65, "eval_cer": 0.8817922630869552, "eval_loss": 0.011258595623075962, "eval_runtime": 107.1544, "eval_samples_per_second": 18.665, "eval_steps_per_second": 4.666, "step": 249000 }, { "epoch": 0.65, "learning_rate": 0.00020317952413415898, "loss": 0.0149, "step": 249010 }, { "epoch": 0.65, "learning_rate": 0.00020317563591778755, "loss": 0.0117, "step": 249020 }, { "epoch": 0.65, "learning_rate": 0.00020317174770141606, "loss": 0.014, "step": 249030 }, { "epoch": 0.65, "learning_rate": 0.0002031678594850446, "loss": 0.0182, "step": 249040 }, { "epoch": 0.65, "learning_rate": 0.00020316397126867312, "loss": 0.0152, "step": 249050 }, { "epoch": 0.65, "learning_rate": 0.0002031600830523017, "loss": 0.0141, "step": 249060 }, { "epoch": 0.65, "learning_rate": 0.00020315619483593023, "loss": 0.0198, "step": 249070 }, { "epoch": 0.65, "learning_rate": 0.00020315230661955875, "loss": 0.0133, "step": 249080 }, { "epoch": 0.65, "learning_rate": 0.0002031484184031873, "loss": 0.0194, "step": 249090 }, { "epoch": 0.65, "learning_rate": 0.0002031445301868158, "loss": 0.023, "step": 249100 }, { "epoch": 0.65, "learning_rate": 0.00020314064197044437, "loss": 0.014, "step": 249110 }, { "epoch": 0.65, "learning_rate": 0.00020313675375407288, "loss": 0.0126, "step": 249120 }, { "epoch": 0.65, "learning_rate": 0.00020313286553770143, "loss": 0.019, "step": 249130 }, { "epoch": 0.65, "learning_rate": 0.00020312897732132994, "loss": 0.0196, "step": 249140 }, { "epoch": 0.65, "learning_rate": 0.0002031250891049585, "loss": 0.0186, "step": 249150 }, { "epoch": 0.65, "learning_rate": 0.00020312120088858702, "loss": 0.016, "step": 249160 }, { "epoch": 0.65, "learning_rate": 0.00020311731267221557, "loss": 0.0148, "step": 249170 }, { "epoch": 0.65, "learning_rate": 0.00020311342445584408, "loss": 0.0179, "step": 249180 }, { "epoch": 0.65, "learning_rate": 0.00020310953623947265, "loss": 0.0151, "step": 249190 }, { "epoch": 0.65, "learning_rate": 0.00020310564802310116, "loss": 0.0197, "step": 249200 }, { "epoch": 0.65, "learning_rate": 0.0002031017598067297, "loss": 0.0199, "step": 249210 }, { "epoch": 0.65, "learning_rate": 0.00020309787159035822, "loss": 0.0161, "step": 249220 }, { "epoch": 0.65, "learning_rate": 0.0002030939833739868, "loss": 0.0156, "step": 249230 }, { "epoch": 0.65, "learning_rate": 0.00020309009515761533, "loss": 0.0162, "step": 249240 }, { "epoch": 0.65, "learning_rate": 0.00020308620694124384, "loss": 0.0151, "step": 249250 }, { "epoch": 0.65, "learning_rate": 0.00020308231872487236, "loss": 0.0144, "step": 249260 }, { "epoch": 0.65, "learning_rate": 0.00020307843050850093, "loss": 0.0139, "step": 249270 }, { "epoch": 0.65, "learning_rate": 0.00020307454229212947, "loss": 0.0169, "step": 249280 }, { "epoch": 0.65, "learning_rate": 0.00020307065407575798, "loss": 0.0165, "step": 249290 }, { "epoch": 0.65, "learning_rate": 0.00020306676585938653, "loss": 0.0149, "step": 249300 }, { "epoch": 0.65, "learning_rate": 0.00020306287764301507, "loss": 0.012, "step": 249310 }, { "epoch": 0.65, "learning_rate": 0.0002030589894266436, "loss": 0.0136, "step": 249320 }, { "epoch": 0.65, "learning_rate": 0.00020305510121027212, "loss": 0.013, "step": 249330 }, { "epoch": 0.65, "learning_rate": 0.00020305121299390067, "loss": 0.0161, "step": 249340 }, { "epoch": 0.65, "learning_rate": 0.00020304732477752918, "loss": 0.0184, "step": 249350 }, { "epoch": 0.65, "learning_rate": 0.00020304343656115775, "loss": 0.0132, "step": 249360 }, { "epoch": 0.65, "learning_rate": 0.00020303954834478626, "loss": 0.0127, "step": 249370 }, { "epoch": 0.65, "learning_rate": 0.0002030356601284148, "loss": 0.0134, "step": 249380 }, { "epoch": 0.65, "learning_rate": 0.00020303177191204332, "loss": 0.0136, "step": 249390 }, { "epoch": 0.65, "learning_rate": 0.0002030278836956719, "loss": 0.0183, "step": 249400 }, { "epoch": 0.65, "learning_rate": 0.00020302399547930043, "loss": 0.0162, "step": 249410 }, { "epoch": 0.65, "learning_rate": 0.00020302010726292894, "loss": 0.0165, "step": 249420 }, { "epoch": 0.65, "learning_rate": 0.00020301621904655746, "loss": 0.0157, "step": 249430 }, { "epoch": 0.65, "learning_rate": 0.00020301233083018603, "loss": 0.0142, "step": 249440 }, { "epoch": 0.65, "learning_rate": 0.00020300844261381457, "loss": 0.0154, "step": 249450 }, { "epoch": 0.65, "learning_rate": 0.00020300455439744308, "loss": 0.0152, "step": 249460 }, { "epoch": 0.65, "learning_rate": 0.00020300066618107163, "loss": 0.014, "step": 249470 }, { "epoch": 0.65, "learning_rate": 0.00020299677796470017, "loss": 0.0173, "step": 249480 }, { "epoch": 0.65, "learning_rate": 0.0002029928897483287, "loss": 0.0129, "step": 249490 }, { "epoch": 0.65, "learning_rate": 0.00020298900153195722, "loss": 0.0151, "step": 249500 }, { "epoch": 0.65, "learning_rate": 0.00020298511331558576, "loss": 0.0185, "step": 249510 }, { "epoch": 0.65, "learning_rate": 0.0002029812250992143, "loss": 0.0177, "step": 249520 }, { "epoch": 0.65, "learning_rate": 0.00020297733688284285, "loss": 0.0148, "step": 249530 }, { "epoch": 0.65, "learning_rate": 0.00020297344866647136, "loss": 0.0146, "step": 249540 }, { "epoch": 0.65, "learning_rate": 0.0002029695604500999, "loss": 0.0162, "step": 249550 }, { "epoch": 0.65, "learning_rate": 0.00020296567223372847, "loss": 0.0148, "step": 249560 }, { "epoch": 0.65, "learning_rate": 0.000202961784017357, "loss": 0.021, "step": 249570 }, { "epoch": 0.65, "learning_rate": 0.0002029578958009855, "loss": 0.0175, "step": 249580 }, { "epoch": 0.65, "learning_rate": 0.00020295400758461404, "loss": 0.0154, "step": 249590 }, { "epoch": 0.65, "learning_rate": 0.00020295011936824256, "loss": 0.0128, "step": 249600 }, { "epoch": 0.65, "learning_rate": 0.00020294623115187113, "loss": 0.0129, "step": 249610 }, { "epoch": 0.65, "learning_rate": 0.00020294234293549967, "loss": 0.0145, "step": 249620 }, { "epoch": 0.65, "learning_rate": 0.00020293845471912818, "loss": 0.0129, "step": 249630 }, { "epoch": 0.65, "learning_rate": 0.00020293456650275672, "loss": 0.0134, "step": 249640 }, { "epoch": 0.65, "learning_rate": 0.00020293067828638527, "loss": 0.0146, "step": 249650 }, { "epoch": 0.65, "learning_rate": 0.0002029267900700138, "loss": 0.0158, "step": 249660 }, { "epoch": 0.65, "learning_rate": 0.00020292290185364232, "loss": 0.0183, "step": 249670 }, { "epoch": 0.65, "learning_rate": 0.00020291901363727086, "loss": 0.0163, "step": 249680 }, { "epoch": 0.65, "learning_rate": 0.0002029151254208994, "loss": 0.0152, "step": 249690 }, { "epoch": 0.65, "learning_rate": 0.00020291123720452795, "loss": 0.0224, "step": 249700 }, { "epoch": 0.65, "learning_rate": 0.00020290734898815646, "loss": 0.0212, "step": 249710 }, { "epoch": 0.65, "learning_rate": 0.000202903460771785, "loss": 0.0141, "step": 249720 }, { "epoch": 0.65, "learning_rate": 0.00020289957255541355, "loss": 0.0136, "step": 249730 }, { "epoch": 0.65, "learning_rate": 0.0002028956843390421, "loss": 0.0153, "step": 249740 }, { "epoch": 0.65, "learning_rate": 0.0002028917961226706, "loss": 0.0156, "step": 249750 }, { "epoch": 0.65, "learning_rate": 0.00020288790790629914, "loss": 0.0143, "step": 249760 }, { "epoch": 0.65, "learning_rate": 0.0002028840196899277, "loss": 0.0172, "step": 249770 }, { "epoch": 0.65, "learning_rate": 0.00020288013147355623, "loss": 0.021, "step": 249780 }, { "epoch": 0.65, "learning_rate": 0.00020287624325718477, "loss": 0.018, "step": 249790 }, { "epoch": 0.65, "learning_rate": 0.00020287235504081328, "loss": 0.0132, "step": 249800 }, { "epoch": 0.65, "learning_rate": 0.00020286846682444185, "loss": 0.0172, "step": 249810 }, { "epoch": 0.65, "learning_rate": 0.00020286457860807037, "loss": 0.0145, "step": 249820 }, { "epoch": 0.65, "learning_rate": 0.0002028606903916989, "loss": 0.0136, "step": 249830 }, { "epoch": 0.65, "learning_rate": 0.00020285680217532742, "loss": 0.0168, "step": 249840 }, { "epoch": 0.65, "learning_rate": 0.00020285291395895596, "loss": 0.0138, "step": 249850 }, { "epoch": 0.65, "learning_rate": 0.0002028490257425845, "loss": 0.0138, "step": 249860 }, { "epoch": 0.65, "learning_rate": 0.00020284513752621305, "loss": 0.0138, "step": 249870 }, { "epoch": 0.65, "learning_rate": 0.00020284124930984156, "loss": 0.0216, "step": 249880 }, { "epoch": 0.65, "learning_rate": 0.0002028373610934701, "loss": 0.0176, "step": 249890 }, { "epoch": 0.65, "learning_rate": 0.00020283347287709864, "loss": 0.0159, "step": 249900 }, { "epoch": 0.65, "learning_rate": 0.00020282958466072719, "loss": 0.0211, "step": 249910 }, { "epoch": 0.65, "learning_rate": 0.0002028256964443557, "loss": 0.0151, "step": 249920 }, { "epoch": 0.65, "learning_rate": 0.00020282180822798424, "loss": 0.017, "step": 249930 }, { "epoch": 0.65, "learning_rate": 0.0002028179200116128, "loss": 0.0147, "step": 249940 }, { "epoch": 0.65, "learning_rate": 0.00020281403179524133, "loss": 0.0153, "step": 249950 }, { "epoch": 0.65, "learning_rate": 0.00020281014357886987, "loss": 0.0131, "step": 249960 }, { "epoch": 0.65, "learning_rate": 0.00020280625536249838, "loss": 0.0158, "step": 249970 }, { "epoch": 0.65, "learning_rate": 0.00020280236714612695, "loss": 0.015, "step": 249980 }, { "epoch": 0.65, "learning_rate": 0.00020279847892975547, "loss": 0.0166, "step": 249990 }, { "epoch": 0.65, "learning_rate": 0.000202794590713384, "loss": 0.0181, "step": 250000 }, { "epoch": 0.65, "eval_cer": 0.8817684692590742, "eval_loss": 0.010947254486382008, "eval_runtime": 107.1468, "eval_samples_per_second": 18.666, "eval_steps_per_second": 4.666, "step": 250000 }, { "epoch": 0.65, "learning_rate": 0.00020279070249701252, "loss": 0.0161, "step": 250010 }, { "epoch": 0.65, "learning_rate": 0.0002027868142806411, "loss": 0.0162, "step": 250020 }, { "epoch": 0.65, "learning_rate": 0.0002027829260642696, "loss": 0.0143, "step": 250030 }, { "epoch": 0.65, "learning_rate": 0.00020277903784789815, "loss": 0.0144, "step": 250040 }, { "epoch": 0.65, "learning_rate": 0.00020277514963152666, "loss": 0.0159, "step": 250050 }, { "epoch": 0.65, "learning_rate": 0.00020277126141515523, "loss": 0.0135, "step": 250060 }, { "epoch": 0.65, "learning_rate": 0.00020276737319878374, "loss": 0.0132, "step": 250070 }, { "epoch": 0.65, "learning_rate": 0.00020276348498241229, "loss": 0.0167, "step": 250080 }, { "epoch": 0.65, "learning_rate": 0.0002027595967660408, "loss": 0.017, "step": 250090 }, { "epoch": 0.65, "learning_rate": 0.00020275570854966934, "loss": 0.0169, "step": 250100 }, { "epoch": 0.65, "learning_rate": 0.0002027518203332979, "loss": 0.0125, "step": 250110 }, { "epoch": 0.65, "learning_rate": 0.00020274793211692643, "loss": 0.0158, "step": 250120 }, { "epoch": 0.65, "learning_rate": 0.00020274404390055494, "loss": 0.018, "step": 250130 }, { "epoch": 0.65, "learning_rate": 0.00020274015568418348, "loss": 0.017, "step": 250140 }, { "epoch": 0.65, "learning_rate": 0.00020273626746781205, "loss": 0.0134, "step": 250150 }, { "epoch": 0.65, "learning_rate": 0.00020273237925144056, "loss": 0.0144, "step": 250160 }, { "epoch": 0.65, "learning_rate": 0.0002027284910350691, "loss": 0.0211, "step": 250170 }, { "epoch": 0.65, "learning_rate": 0.00020272460281869762, "loss": 0.0185, "step": 250180 }, { "epoch": 0.65, "learning_rate": 0.0002027207146023262, "loss": 0.0129, "step": 250190 }, { "epoch": 0.65, "learning_rate": 0.0002027168263859547, "loss": 0.0175, "step": 250200 }, { "epoch": 0.65, "learning_rate": 0.00020271293816958325, "loss": 0.0168, "step": 250210 }, { "epoch": 0.65, "learning_rate": 0.00020270904995321176, "loss": 0.0186, "step": 250220 }, { "epoch": 0.65, "learning_rate": 0.00020270516173684033, "loss": 0.0125, "step": 250230 }, { "epoch": 0.65, "learning_rate": 0.00020270127352046884, "loss": 0.0162, "step": 250240 }, { "epoch": 0.65, "learning_rate": 0.00020269738530409739, "loss": 0.0198, "step": 250250 }, { "epoch": 0.65, "learning_rate": 0.0002026934970877259, "loss": 0.0151, "step": 250260 }, { "epoch": 0.65, "learning_rate": 0.00020268960887135447, "loss": 0.0131, "step": 250270 }, { "epoch": 0.65, "learning_rate": 0.000202685720654983, "loss": 0.0163, "step": 250280 }, { "epoch": 0.65, "learning_rate": 0.00020268183243861152, "loss": 0.0157, "step": 250290 }, { "epoch": 0.65, "learning_rate": 0.00020267794422224004, "loss": 0.0146, "step": 250300 }, { "epoch": 0.65, "learning_rate": 0.0002026740560058686, "loss": 0.0157, "step": 250310 }, { "epoch": 0.65, "learning_rate": 0.00020267016778949715, "loss": 0.0148, "step": 250320 }, { "epoch": 0.65, "learning_rate": 0.00020266627957312566, "loss": 0.0152, "step": 250330 }, { "epoch": 0.65, "learning_rate": 0.0002026623913567542, "loss": 0.0212, "step": 250340 }, { "epoch": 0.65, "learning_rate": 0.00020265850314038272, "loss": 0.02, "step": 250350 }, { "epoch": 0.65, "learning_rate": 0.0002026546149240113, "loss": 0.0154, "step": 250360 }, { "epoch": 0.65, "learning_rate": 0.0002026507267076398, "loss": 0.0151, "step": 250370 }, { "epoch": 0.65, "learning_rate": 0.00020264683849126835, "loss": 0.0166, "step": 250380 }, { "epoch": 0.65, "learning_rate": 0.00020264295027489686, "loss": 0.0168, "step": 250390 }, { "epoch": 0.65, "learning_rate": 0.00020263906205852543, "loss": 0.0147, "step": 250400 }, { "epoch": 0.65, "learning_rate": 0.00020263517384215394, "loss": 0.0168, "step": 250410 }, { "epoch": 0.65, "learning_rate": 0.00020263128562578248, "loss": 0.0193, "step": 250420 }, { "epoch": 0.65, "learning_rate": 0.000202627397409411, "loss": 0.0148, "step": 250430 }, { "epoch": 0.65, "learning_rate": 0.00020262350919303957, "loss": 0.0148, "step": 250440 }, { "epoch": 0.65, "learning_rate": 0.00020261962097666808, "loss": 0.0155, "step": 250450 }, { "epoch": 0.65, "learning_rate": 0.00020261573276029662, "loss": 0.0147, "step": 250460 }, { "epoch": 0.65, "learning_rate": 0.00020261184454392514, "loss": 0.0155, "step": 250470 }, { "epoch": 0.65, "learning_rate": 0.0002026079563275537, "loss": 0.0171, "step": 250480 }, { "epoch": 0.65, "learning_rate": 0.00020260406811118225, "loss": 0.0163, "step": 250490 }, { "epoch": 0.65, "learning_rate": 0.00020260017989481076, "loss": 0.0161, "step": 250500 }, { "epoch": 0.65, "learning_rate": 0.0002025962916784393, "loss": 0.0134, "step": 250510 }, { "epoch": 0.65, "learning_rate": 0.00020259240346206785, "loss": 0.0155, "step": 250520 }, { "epoch": 0.65, "learning_rate": 0.0002025885152456964, "loss": 0.0146, "step": 250530 }, { "epoch": 0.65, "learning_rate": 0.0002025846270293249, "loss": 0.0179, "step": 250540 }, { "epoch": 0.65, "learning_rate": 0.00020258073881295344, "loss": 0.0181, "step": 250550 }, { "epoch": 0.65, "learning_rate": 0.00020257685059658199, "loss": 0.0163, "step": 250560 }, { "epoch": 0.65, "learning_rate": 0.00020257296238021053, "loss": 0.0155, "step": 250570 }, { "epoch": 0.65, "learning_rate": 0.00020256907416383904, "loss": 0.0196, "step": 250580 }, { "epoch": 0.65, "learning_rate": 0.00020256518594746758, "loss": 0.0168, "step": 250590 }, { "epoch": 0.65, "learning_rate": 0.0002025612977310961, "loss": 0.0177, "step": 250600 }, { "epoch": 0.65, "learning_rate": 0.00020255740951472467, "loss": 0.0141, "step": 250610 }, { "epoch": 0.65, "learning_rate": 0.00020255352129835318, "loss": 0.0142, "step": 250620 }, { "epoch": 0.65, "learning_rate": 0.00020254963308198172, "loss": 0.0207, "step": 250630 }, { "epoch": 0.65, "learning_rate": 0.00020254574486561024, "loss": 0.0161, "step": 250640 }, { "epoch": 0.65, "learning_rate": 0.0002025418566492388, "loss": 0.0169, "step": 250650 }, { "epoch": 0.65, "learning_rate": 0.00020253796843286735, "loss": 0.0154, "step": 250660 }, { "epoch": 0.65, "learning_rate": 0.00020253408021649586, "loss": 0.0167, "step": 250670 }, { "epoch": 0.65, "learning_rate": 0.0002025301920001244, "loss": 0.0163, "step": 250680 }, { "epoch": 0.65, "learning_rate": 0.00020252630378375295, "loss": 0.0116, "step": 250690 }, { "epoch": 0.65, "learning_rate": 0.0002025224155673815, "loss": 0.0154, "step": 250700 }, { "epoch": 0.65, "learning_rate": 0.00020251852735101, "loss": 0.0153, "step": 250710 }, { "epoch": 0.65, "learning_rate": 0.00020251463913463854, "loss": 0.0174, "step": 250720 }, { "epoch": 0.65, "learning_rate": 0.00020251075091826709, "loss": 0.0142, "step": 250730 }, { "epoch": 0.65, "learning_rate": 0.00020250686270189563, "loss": 0.0142, "step": 250740 }, { "epoch": 0.65, "learning_rate": 0.00020250297448552414, "loss": 0.0159, "step": 250750 }, { "epoch": 0.65, "learning_rate": 0.00020249908626915268, "loss": 0.0136, "step": 250760 }, { "epoch": 0.65, "learning_rate": 0.00020249519805278123, "loss": 0.0191, "step": 250770 }, { "epoch": 0.65, "learning_rate": 0.00020249130983640977, "loss": 0.0175, "step": 250780 }, { "epoch": 0.65, "learning_rate": 0.00020248742162003828, "loss": 0.0169, "step": 250790 }, { "epoch": 0.65, "learning_rate": 0.00020248353340366682, "loss": 0.014, "step": 250800 }, { "epoch": 0.65, "learning_rate": 0.0002024796451872954, "loss": 0.017, "step": 250810 }, { "epoch": 0.65, "learning_rate": 0.0002024757569709239, "loss": 0.0162, "step": 250820 }, { "epoch": 0.65, "learning_rate": 0.00020247186875455245, "loss": 0.0125, "step": 250830 }, { "epoch": 0.65, "learning_rate": 0.00020246798053818096, "loss": 0.0187, "step": 250840 }, { "epoch": 0.65, "learning_rate": 0.00020246409232180948, "loss": 0.0155, "step": 250850 }, { "epoch": 0.65, "learning_rate": 0.00020246020410543805, "loss": 0.0174, "step": 250860 }, { "epoch": 0.65, "learning_rate": 0.0002024563158890666, "loss": 0.0171, "step": 250870 }, { "epoch": 0.65, "learning_rate": 0.0002024524276726951, "loss": 0.0137, "step": 250880 }, { "epoch": 0.65, "learning_rate": 0.00020244853945632364, "loss": 0.014, "step": 250890 }, { "epoch": 0.65, "learning_rate": 0.00020244465123995219, "loss": 0.0142, "step": 250900 }, { "epoch": 0.65, "learning_rate": 0.00020244076302358073, "loss": 0.0141, "step": 250910 }, { "epoch": 0.65, "learning_rate": 0.00020243687480720924, "loss": 0.0141, "step": 250920 }, { "epoch": 0.65, "learning_rate": 0.00020243298659083778, "loss": 0.016, "step": 250930 }, { "epoch": 0.65, "learning_rate": 0.00020242909837446632, "loss": 0.0155, "step": 250940 }, { "epoch": 0.65, "learning_rate": 0.00020242521015809487, "loss": 0.0151, "step": 250950 }, { "epoch": 0.65, "learning_rate": 0.00020242132194172338, "loss": 0.0145, "step": 250960 }, { "epoch": 0.65, "learning_rate": 0.00020241743372535192, "loss": 0.0174, "step": 250970 }, { "epoch": 0.65, "learning_rate": 0.0002024135455089805, "loss": 0.018, "step": 250980 }, { "epoch": 0.65, "learning_rate": 0.000202409657292609, "loss": 0.0154, "step": 250990 }, { "epoch": 0.65, "learning_rate": 0.00020240576907623755, "loss": 0.0162, "step": 251000 }, { "epoch": 0.65, "eval_cer": 0.88176706962214, "eval_loss": 0.011115950532257557, "eval_runtime": 107.2723, "eval_samples_per_second": 18.644, "eval_steps_per_second": 4.661, "step": 251000 }, { "epoch": 0.65, "learning_rate": 0.00020240188085986606, "loss": 0.0158, "step": 251010 }, { "epoch": 0.65, "learning_rate": 0.00020239799264349463, "loss": 0.0157, "step": 251020 }, { "epoch": 0.65, "learning_rate": 0.00020239410442712315, "loss": 0.0159, "step": 251030 }, { "epoch": 0.65, "learning_rate": 0.0002023902162107517, "loss": 0.0153, "step": 251040 }, { "epoch": 0.65, "learning_rate": 0.0002023863279943802, "loss": 0.0164, "step": 251050 }, { "epoch": 0.65, "learning_rate": 0.00020238243977800877, "loss": 0.0188, "step": 251060 }, { "epoch": 0.65, "learning_rate": 0.00020237855156163728, "loss": 0.013, "step": 251070 }, { "epoch": 0.65, "learning_rate": 0.00020237466334526583, "loss": 0.018, "step": 251080 }, { "epoch": 0.65, "learning_rate": 0.00020237077512889434, "loss": 0.0146, "step": 251090 }, { "epoch": 0.65, "learning_rate": 0.00020236688691252288, "loss": 0.0174, "step": 251100 }, { "epoch": 0.65, "learning_rate": 0.00020236299869615142, "loss": 0.0171, "step": 251110 }, { "epoch": 0.65, "learning_rate": 0.00020235911047977997, "loss": 0.0173, "step": 251120 }, { "epoch": 0.65, "learning_rate": 0.00020235522226340848, "loss": 0.0121, "step": 251130 }, { "epoch": 0.65, "learning_rate": 0.00020235133404703702, "loss": 0.0147, "step": 251140 }, { "epoch": 0.65, "learning_rate": 0.0002023474458306656, "loss": 0.0241, "step": 251150 }, { "epoch": 0.65, "learning_rate": 0.0002023435576142941, "loss": 0.0138, "step": 251160 }, { "epoch": 0.65, "learning_rate": 0.00020233966939792262, "loss": 0.0151, "step": 251170 }, { "epoch": 0.65, "learning_rate": 0.00020233578118155116, "loss": 0.0168, "step": 251180 }, { "epoch": 0.65, "learning_rate": 0.00020233189296517973, "loss": 0.0165, "step": 251190 }, { "epoch": 0.65, "learning_rate": 0.00020232800474880824, "loss": 0.0144, "step": 251200 }, { "epoch": 0.65, "learning_rate": 0.00020232411653243679, "loss": 0.0178, "step": 251210 }, { "epoch": 0.65, "learning_rate": 0.0002023202283160653, "loss": 0.0134, "step": 251220 }, { "epoch": 0.65, "learning_rate": 0.00020231634009969387, "loss": 0.0159, "step": 251230 }, { "epoch": 0.65, "learning_rate": 0.00020231245188332238, "loss": 0.0154, "step": 251240 }, { "epoch": 0.65, "learning_rate": 0.00020230856366695093, "loss": 0.0142, "step": 251250 }, { "epoch": 0.65, "learning_rate": 0.00020230467545057944, "loss": 0.0166, "step": 251260 }, { "epoch": 0.65, "learning_rate": 0.000202300787234208, "loss": 0.0178, "step": 251270 }, { "epoch": 0.65, "learning_rate": 0.00020229689901783652, "loss": 0.0168, "step": 251280 }, { "epoch": 0.65, "learning_rate": 0.00020229301080146506, "loss": 0.0189, "step": 251290 }, { "epoch": 0.65, "learning_rate": 0.00020228912258509358, "loss": 0.0121, "step": 251300 }, { "epoch": 0.65, "learning_rate": 0.00020228523436872215, "loss": 0.0146, "step": 251310 }, { "epoch": 0.65, "learning_rate": 0.00020228134615235066, "loss": 0.0172, "step": 251320 }, { "epoch": 0.65, "learning_rate": 0.0002022774579359792, "loss": 0.0218, "step": 251330 }, { "epoch": 0.65, "learning_rate": 0.00020227356971960772, "loss": 0.0132, "step": 251340 }, { "epoch": 0.65, "learning_rate": 0.00020226968150323626, "loss": 0.0129, "step": 251350 }, { "epoch": 0.65, "learning_rate": 0.00020226579328686483, "loss": 0.0153, "step": 251360 }, { "epoch": 0.65, "learning_rate": 0.00020226190507049334, "loss": 0.0158, "step": 251370 }, { "epoch": 0.65, "learning_rate": 0.00020225801685412189, "loss": 0.0122, "step": 251380 }, { "epoch": 0.65, "learning_rate": 0.0002022541286377504, "loss": 0.0153, "step": 251390 }, { "epoch": 0.65, "learning_rate": 0.00020225024042137897, "loss": 0.0147, "step": 251400 }, { "epoch": 0.65, "learning_rate": 0.00020224635220500748, "loss": 0.0169, "step": 251410 }, { "epoch": 0.65, "learning_rate": 0.00020224246398863602, "loss": 0.0163, "step": 251420 }, { "epoch": 0.65, "learning_rate": 0.00020223857577226454, "loss": 0.0138, "step": 251430 }, { "epoch": 0.65, "learning_rate": 0.0002022346875558931, "loss": 0.0164, "step": 251440 }, { "epoch": 0.65, "learning_rate": 0.00020223079933952162, "loss": 0.0158, "step": 251450 }, { "epoch": 0.65, "learning_rate": 0.00020222691112315016, "loss": 0.0217, "step": 251460 }, { "epoch": 0.65, "learning_rate": 0.00020222302290677868, "loss": 0.0126, "step": 251470 }, { "epoch": 0.65, "learning_rate": 0.00020221913469040725, "loss": 0.0164, "step": 251480 }, { "epoch": 0.65, "learning_rate": 0.00020221524647403576, "loss": 0.0123, "step": 251490 }, { "epoch": 0.65, "learning_rate": 0.0002022113582576643, "loss": 0.0136, "step": 251500 }, { "epoch": 0.65, "learning_rate": 0.00020220747004129282, "loss": 0.0124, "step": 251510 }, { "epoch": 0.65, "learning_rate": 0.0002022035818249214, "loss": 0.017, "step": 251520 }, { "epoch": 0.65, "learning_rate": 0.00020219969360854993, "loss": 0.0174, "step": 251530 }, { "epoch": 0.65, "learning_rate": 0.00020219580539217844, "loss": 0.0149, "step": 251540 }, { "epoch": 0.65, "learning_rate": 0.00020219191717580698, "loss": 0.0168, "step": 251550 }, { "epoch": 0.65, "learning_rate": 0.00020218802895943553, "loss": 0.0174, "step": 251560 }, { "epoch": 0.65, "learning_rate": 0.00020218414074306407, "loss": 0.0153, "step": 251570 }, { "epoch": 0.65, "learning_rate": 0.00020218025252669258, "loss": 0.0159, "step": 251580 }, { "epoch": 0.65, "learning_rate": 0.00020217636431032112, "loss": 0.0152, "step": 251590 }, { "epoch": 0.65, "learning_rate": 0.00020217247609394964, "loss": 0.0124, "step": 251600 }, { "epoch": 0.65, "learning_rate": 0.0002021685878775782, "loss": 0.0185, "step": 251610 }, { "epoch": 0.65, "learning_rate": 0.00020216469966120672, "loss": 0.0147, "step": 251620 }, { "epoch": 0.65, "learning_rate": 0.00020216081144483526, "loss": 0.0177, "step": 251630 }, { "epoch": 0.65, "learning_rate": 0.00020215692322846378, "loss": 0.0171, "step": 251640 }, { "epoch": 0.65, "learning_rate": 0.00020215303501209235, "loss": 0.0139, "step": 251650 }, { "epoch": 0.65, "learning_rate": 0.00020214914679572086, "loss": 0.0121, "step": 251660 }, { "epoch": 0.65, "learning_rate": 0.0002021452585793494, "loss": 0.0154, "step": 251670 }, { "epoch": 0.65, "learning_rate": 0.00020214137036297792, "loss": 0.0141, "step": 251680 }, { "epoch": 0.65, "learning_rate": 0.0002021374821466065, "loss": 0.0132, "step": 251690 }, { "epoch": 0.65, "learning_rate": 0.00020213359393023503, "loss": 0.0143, "step": 251700 }, { "epoch": 0.65, "learning_rate": 0.00020212970571386354, "loss": 0.015, "step": 251710 }, { "epoch": 0.65, "learning_rate": 0.00020212581749749206, "loss": 0.016, "step": 251720 }, { "epoch": 0.65, "learning_rate": 0.00020212192928112063, "loss": 0.0135, "step": 251730 }, { "epoch": 0.65, "learning_rate": 0.00020211804106474917, "loss": 0.0131, "step": 251740 }, { "epoch": 0.65, "learning_rate": 0.00020211415284837768, "loss": 0.0175, "step": 251750 }, { "epoch": 0.65, "learning_rate": 0.00020211026463200622, "loss": 0.0128, "step": 251760 }, { "epoch": 0.65, "learning_rate": 0.00020210637641563477, "loss": 0.0163, "step": 251770 }, { "epoch": 0.65, "learning_rate": 0.0002021024881992633, "loss": 0.0168, "step": 251780 }, { "epoch": 0.65, "learning_rate": 0.00020209859998289182, "loss": 0.0191, "step": 251790 }, { "epoch": 0.65, "learning_rate": 0.00020209471176652036, "loss": 0.015, "step": 251800 }, { "epoch": 0.65, "learning_rate": 0.0002020908235501489, "loss": 0.0151, "step": 251810 }, { "epoch": 0.65, "learning_rate": 0.00020208693533377745, "loss": 0.0143, "step": 251820 }, { "epoch": 0.65, "learning_rate": 0.00020208304711740596, "loss": 0.0147, "step": 251830 }, { "epoch": 0.65, "learning_rate": 0.0002020791589010345, "loss": 0.0203, "step": 251840 }, { "epoch": 0.65, "learning_rate": 0.00020207527068466302, "loss": 0.0149, "step": 251850 }, { "epoch": 0.65, "learning_rate": 0.00020207138246829159, "loss": 0.0149, "step": 251860 }, { "epoch": 0.65, "learning_rate": 0.00020206749425192013, "loss": 0.0138, "step": 251870 }, { "epoch": 0.65, "learning_rate": 0.00020206360603554864, "loss": 0.0168, "step": 251880 }, { "epoch": 0.65, "learning_rate": 0.00020205971781917716, "loss": 0.0155, "step": 251890 }, { "epoch": 0.65, "learning_rate": 0.00020205582960280573, "loss": 0.0157, "step": 251900 }, { "epoch": 0.65, "learning_rate": 0.00020205194138643427, "loss": 0.0171, "step": 251910 }, { "epoch": 0.65, "learning_rate": 0.00020204805317006278, "loss": 0.0186, "step": 251920 }, { "epoch": 0.65, "learning_rate": 0.00020204416495369132, "loss": 0.0158, "step": 251930 }, { "epoch": 0.65, "learning_rate": 0.00020204027673731986, "loss": 0.014, "step": 251940 }, { "epoch": 0.65, "learning_rate": 0.0002020363885209484, "loss": 0.0145, "step": 251950 }, { "epoch": 0.65, "learning_rate": 0.00020203250030457692, "loss": 0.0137, "step": 251960 }, { "epoch": 0.65, "learning_rate": 0.00020202861208820546, "loss": 0.0216, "step": 251970 }, { "epoch": 0.65, "learning_rate": 0.000202024723871834, "loss": 0.0146, "step": 251980 }, { "epoch": 0.65, "learning_rate": 0.00020202083565546255, "loss": 0.0134, "step": 251990 }, { "epoch": 0.65, "learning_rate": 0.00020201694743909106, "loss": 0.0167, "step": 252000 }, { "epoch": 0.65, "eval_cer": 0.881797861634692, "eval_loss": 0.010695898905396461, "eval_runtime": 107.3781, "eval_samples_per_second": 18.626, "eval_steps_per_second": 4.656, "step": 252000 }, { "epoch": 0.65, "learning_rate": 0.0002020130592227196, "loss": 0.0152, "step": 252010 }, { "epoch": 0.65, "learning_rate": 0.00020200917100634817, "loss": 0.0138, "step": 252020 }, { "epoch": 0.65, "learning_rate": 0.00020200528278997669, "loss": 0.0141, "step": 252030 }, { "epoch": 0.65, "learning_rate": 0.0002020013945736052, "loss": 0.0153, "step": 252040 }, { "epoch": 0.65, "learning_rate": 0.00020199750635723374, "loss": 0.0171, "step": 252050 }, { "epoch": 0.65, "learning_rate": 0.0002019936181408623, "loss": 0.0128, "step": 252060 }, { "epoch": 0.65, "learning_rate": 0.00020198972992449082, "loss": 0.0171, "step": 252070 }, { "epoch": 0.65, "learning_rate": 0.00020198584170811937, "loss": 0.0131, "step": 252080 }, { "epoch": 0.65, "learning_rate": 0.00020198195349174788, "loss": 0.0157, "step": 252090 }, { "epoch": 0.65, "learning_rate": 0.00020197806527537642, "loss": 0.0201, "step": 252100 }, { "epoch": 0.65, "learning_rate": 0.00020197417705900496, "loss": 0.017, "step": 252110 }, { "epoch": 0.65, "learning_rate": 0.0002019702888426335, "loss": 0.0147, "step": 252120 }, { "epoch": 0.65, "learning_rate": 0.00020196640062626202, "loss": 0.0167, "step": 252130 }, { "epoch": 0.65, "learning_rate": 0.00020196251240989056, "loss": 0.0137, "step": 252140 }, { "epoch": 0.65, "learning_rate": 0.0002019586241935191, "loss": 0.0142, "step": 252150 }, { "epoch": 0.65, "learning_rate": 0.00020195473597714765, "loss": 0.0173, "step": 252160 }, { "epoch": 0.65, "learning_rate": 0.00020195084776077616, "loss": 0.0147, "step": 252170 }, { "epoch": 0.65, "learning_rate": 0.0002019469595444047, "loss": 0.018, "step": 252180 }, { "epoch": 0.65, "learning_rate": 0.00020194307132803327, "loss": 0.0114, "step": 252190 }, { "epoch": 0.65, "learning_rate": 0.00020193918311166178, "loss": 0.0153, "step": 252200 }, { "epoch": 0.65, "learning_rate": 0.0002019352948952903, "loss": 0.0143, "step": 252210 }, { "epoch": 0.65, "learning_rate": 0.00020193140667891884, "loss": 0.0164, "step": 252220 }, { "epoch": 0.65, "learning_rate": 0.0002019275184625474, "loss": 0.0155, "step": 252230 }, { "epoch": 0.65, "learning_rate": 0.00020192363024617592, "loss": 0.0141, "step": 252240 }, { "epoch": 0.65, "learning_rate": 0.00020191974202980447, "loss": 0.0124, "step": 252250 }, { "epoch": 0.65, "learning_rate": 0.00020191585381343298, "loss": 0.0148, "step": 252260 }, { "epoch": 0.65, "learning_rate": 0.00020191196559706155, "loss": 0.0162, "step": 252270 }, { "epoch": 0.65, "learning_rate": 0.00020190807738069006, "loss": 0.0168, "step": 252280 }, { "epoch": 0.65, "learning_rate": 0.0002019041891643186, "loss": 0.0141, "step": 252290 }, { "epoch": 0.65, "learning_rate": 0.00020190030094794712, "loss": 0.0154, "step": 252300 }, { "epoch": 0.65, "learning_rate": 0.0002018964127315757, "loss": 0.0172, "step": 252310 }, { "epoch": 0.65, "learning_rate": 0.0002018925245152042, "loss": 0.0142, "step": 252320 }, { "epoch": 0.65, "learning_rate": 0.00020188863629883274, "loss": 0.0139, "step": 252330 }, { "epoch": 0.65, "learning_rate": 0.00020188474808246126, "loss": 0.0184, "step": 252340 }, { "epoch": 0.65, "learning_rate": 0.0002018808598660898, "loss": 0.0117, "step": 252350 }, { "epoch": 0.65, "learning_rate": 0.00020187697164971834, "loss": 0.0139, "step": 252360 }, { "epoch": 0.65, "learning_rate": 0.00020187308343334688, "loss": 0.0208, "step": 252370 }, { "epoch": 0.65, "learning_rate": 0.0002018691952169754, "loss": 0.0202, "step": 252380 }, { "epoch": 0.65, "learning_rate": 0.00020186530700060394, "loss": 0.0137, "step": 252390 }, { "epoch": 0.65, "learning_rate": 0.0002018614187842325, "loss": 0.0208, "step": 252400 }, { "epoch": 0.65, "learning_rate": 0.00020185753056786102, "loss": 0.0165, "step": 252410 }, { "epoch": 0.65, "learning_rate": 0.00020185364235148957, "loss": 0.0181, "step": 252420 }, { "epoch": 0.65, "learning_rate": 0.00020184975413511808, "loss": 0.0232, "step": 252430 }, { "epoch": 0.65, "learning_rate": 0.00020184586591874665, "loss": 0.0147, "step": 252440 }, { "epoch": 0.65, "learning_rate": 0.00020184197770237516, "loss": 0.0136, "step": 252450 }, { "epoch": 0.65, "learning_rate": 0.0002018380894860037, "loss": 0.018, "step": 252460 }, { "epoch": 0.65, "learning_rate": 0.00020183420126963222, "loss": 0.017, "step": 252470 }, { "epoch": 0.65, "learning_rate": 0.0002018303130532608, "loss": 0.0147, "step": 252480 }, { "epoch": 0.65, "learning_rate": 0.0002018264248368893, "loss": 0.0145, "step": 252490 }, { "epoch": 0.65, "learning_rate": 0.00020182253662051784, "loss": 0.0141, "step": 252500 }, { "epoch": 0.65, "learning_rate": 0.00020181864840414636, "loss": 0.0148, "step": 252510 }, { "epoch": 0.65, "learning_rate": 0.00020181476018777493, "loss": 0.014, "step": 252520 }, { "epoch": 0.65, "learning_rate": 0.00020181087197140344, "loss": 0.0199, "step": 252530 }, { "epoch": 0.65, "learning_rate": 0.00020180698375503198, "loss": 0.015, "step": 252540 }, { "epoch": 0.65, "learning_rate": 0.0002018030955386605, "loss": 0.0132, "step": 252550 }, { "epoch": 0.65, "learning_rate": 0.00020179920732228907, "loss": 0.0159, "step": 252560 }, { "epoch": 0.65, "learning_rate": 0.0002017953191059176, "loss": 0.019, "step": 252570 }, { "epoch": 0.65, "learning_rate": 0.00020179143088954612, "loss": 0.0167, "step": 252580 }, { "epoch": 0.65, "learning_rate": 0.00020178754267317466, "loss": 0.015, "step": 252590 }, { "epoch": 0.65, "learning_rate": 0.00020178365445680318, "loss": 0.0162, "step": 252600 }, { "epoch": 0.65, "learning_rate": 0.00020177976624043175, "loss": 0.0164, "step": 252610 }, { "epoch": 0.65, "learning_rate": 0.00020177587802406026, "loss": 0.0169, "step": 252620 }, { "epoch": 0.65, "learning_rate": 0.0002017719898076888, "loss": 0.0159, "step": 252630 }, { "epoch": 0.65, "learning_rate": 0.00020176810159131732, "loss": 0.0186, "step": 252640 }, { "epoch": 0.65, "learning_rate": 0.0002017642133749459, "loss": 0.0138, "step": 252650 }, { "epoch": 0.65, "learning_rate": 0.0002017603251585744, "loss": 0.0142, "step": 252660 }, { "epoch": 0.65, "learning_rate": 0.00020175643694220294, "loss": 0.0109, "step": 252670 }, { "epoch": 0.65, "learning_rate": 0.00020175254872583146, "loss": 0.0126, "step": 252680 }, { "epoch": 0.66, "learning_rate": 0.00020174866050946003, "loss": 0.0127, "step": 252690 }, { "epoch": 0.66, "learning_rate": 0.00020174477229308854, "loss": 0.0174, "step": 252700 }, { "epoch": 0.66, "learning_rate": 0.00020174088407671708, "loss": 0.0149, "step": 252710 }, { "epoch": 0.66, "learning_rate": 0.0002017369958603456, "loss": 0.0142, "step": 252720 }, { "epoch": 0.66, "learning_rate": 0.00020173310764397417, "loss": 0.0177, "step": 252730 }, { "epoch": 0.66, "learning_rate": 0.0002017292194276027, "loss": 0.0151, "step": 252740 }, { "epoch": 0.66, "learning_rate": 0.00020172533121123122, "loss": 0.0162, "step": 252750 }, { "epoch": 0.66, "learning_rate": 0.00020172144299485974, "loss": 0.0148, "step": 252760 }, { "epoch": 0.66, "learning_rate": 0.0002017175547784883, "loss": 0.0182, "step": 252770 }, { "epoch": 0.66, "learning_rate": 0.00020171366656211685, "loss": 0.0155, "step": 252780 }, { "epoch": 0.66, "learning_rate": 0.00020170977834574536, "loss": 0.0157, "step": 252790 }, { "epoch": 0.66, "learning_rate": 0.0002017058901293739, "loss": 0.0197, "step": 252800 }, { "epoch": 0.66, "learning_rate": 0.00020170200191300245, "loss": 0.0174, "step": 252810 }, { "epoch": 0.66, "learning_rate": 0.000201698113696631, "loss": 0.0111, "step": 252820 }, { "epoch": 0.66, "learning_rate": 0.0002016942254802595, "loss": 0.0137, "step": 252830 }, { "epoch": 0.66, "learning_rate": 0.00020169033726388804, "loss": 0.0156, "step": 252840 }, { "epoch": 0.66, "learning_rate": 0.00020168644904751656, "loss": 0.0185, "step": 252850 }, { "epoch": 0.66, "learning_rate": 0.00020168256083114513, "loss": 0.0143, "step": 252860 }, { "epoch": 0.66, "learning_rate": 0.00020167867261477364, "loss": 0.0179, "step": 252870 }, { "epoch": 0.66, "learning_rate": 0.00020167478439840218, "loss": 0.0168, "step": 252880 }, { "epoch": 0.66, "learning_rate": 0.0002016708961820307, "loss": 0.0118, "step": 252890 }, { "epoch": 0.66, "learning_rate": 0.00020166700796565927, "loss": 0.0154, "step": 252900 }, { "epoch": 0.66, "learning_rate": 0.00020166311974928778, "loss": 0.0149, "step": 252910 }, { "epoch": 0.66, "learning_rate": 0.00020165923153291632, "loss": 0.0141, "step": 252920 }, { "epoch": 0.66, "learning_rate": 0.00020165534331654484, "loss": 0.0174, "step": 252930 }, { "epoch": 0.66, "learning_rate": 0.0002016514551001734, "loss": 0.0126, "step": 252940 }, { "epoch": 0.66, "learning_rate": 0.00020164756688380195, "loss": 0.0175, "step": 252950 }, { "epoch": 0.66, "learning_rate": 0.00020164367866743046, "loss": 0.0169, "step": 252960 }, { "epoch": 0.66, "learning_rate": 0.000201639790451059, "loss": 0.0137, "step": 252970 }, { "epoch": 0.66, "learning_rate": 0.00020163590223468754, "loss": 0.0145, "step": 252980 }, { "epoch": 0.66, "learning_rate": 0.00020163201401831609, "loss": 0.0146, "step": 252990 }, { "epoch": 0.66, "learning_rate": 0.0002016281258019446, "loss": 0.0166, "step": 253000 }, { "epoch": 0.66, "eval_cer": 0.8817474747050615, "eval_loss": 0.01099295075982809, "eval_runtime": 107.2229, "eval_samples_per_second": 18.653, "eval_steps_per_second": 4.663, "step": 253000 }, { "epoch": 0.66, "learning_rate": 0.00020162423758557314, "loss": 0.0204, "step": 253010 }, { "epoch": 0.66, "learning_rate": 0.00020162034936920168, "loss": 0.0127, "step": 253020 }, { "epoch": 0.66, "learning_rate": 0.00020161646115283023, "loss": 0.0175, "step": 253030 }, { "epoch": 0.66, "learning_rate": 0.00020161257293645874, "loss": 0.0173, "step": 253040 }, { "epoch": 0.66, "learning_rate": 0.00020160868472008728, "loss": 0.0143, "step": 253050 }, { "epoch": 0.66, "learning_rate": 0.00020160479650371585, "loss": 0.0155, "step": 253060 }, { "epoch": 0.66, "learning_rate": 0.00020160090828734437, "loss": 0.0144, "step": 253070 }, { "epoch": 0.66, "learning_rate": 0.00020159702007097288, "loss": 0.0206, "step": 253080 }, { "epoch": 0.66, "learning_rate": 0.00020159313185460142, "loss": 0.0134, "step": 253090 }, { "epoch": 0.66, "learning_rate": 0.00020158924363822994, "loss": 0.0153, "step": 253100 }, { "epoch": 0.66, "learning_rate": 0.0002015853554218585, "loss": 0.0128, "step": 253110 }, { "epoch": 0.66, "learning_rate": 0.00020158146720548705, "loss": 0.0214, "step": 253120 }, { "epoch": 0.66, "learning_rate": 0.00020157757898911556, "loss": 0.0137, "step": 253130 }, { "epoch": 0.66, "learning_rate": 0.0002015736907727441, "loss": 0.0133, "step": 253140 }, { "epoch": 0.66, "learning_rate": 0.00020156980255637264, "loss": 0.0142, "step": 253150 }, { "epoch": 0.66, "learning_rate": 0.00020156591434000119, "loss": 0.0191, "step": 253160 }, { "epoch": 0.66, "learning_rate": 0.0002015620261236297, "loss": 0.0197, "step": 253170 }, { "epoch": 0.66, "learning_rate": 0.00020155813790725824, "loss": 0.0167, "step": 253180 }, { "epoch": 0.66, "learning_rate": 0.00020155424969088678, "loss": 0.0157, "step": 253190 }, { "epoch": 0.66, "learning_rate": 0.00020155036147451533, "loss": 0.0145, "step": 253200 }, { "epoch": 0.66, "learning_rate": 0.00020154647325814384, "loss": 0.0135, "step": 253210 }, { "epoch": 0.66, "learning_rate": 0.00020154258504177238, "loss": 0.0172, "step": 253220 }, { "epoch": 0.66, "learning_rate": 0.00020153869682540092, "loss": 0.0174, "step": 253230 }, { "epoch": 0.66, "learning_rate": 0.00020153480860902946, "loss": 0.0173, "step": 253240 }, { "epoch": 0.66, "learning_rate": 0.00020153092039265798, "loss": 0.0148, "step": 253250 }, { "epoch": 0.66, "learning_rate": 0.00020152703217628652, "loss": 0.0129, "step": 253260 }, { "epoch": 0.66, "learning_rate": 0.0002015231439599151, "loss": 0.0198, "step": 253270 }, { "epoch": 0.66, "learning_rate": 0.0002015192557435436, "loss": 0.0142, "step": 253280 }, { "epoch": 0.66, "learning_rate": 0.00020151536752717215, "loss": 0.0155, "step": 253290 }, { "epoch": 0.66, "learning_rate": 0.00020151147931080066, "loss": 0.0198, "step": 253300 }, { "epoch": 0.66, "learning_rate": 0.00020150759109442923, "loss": 0.0132, "step": 253310 }, { "epoch": 0.66, "learning_rate": 0.00020150370287805774, "loss": 0.0206, "step": 253320 }, { "epoch": 0.66, "learning_rate": 0.00020149981466168629, "loss": 0.0175, "step": 253330 }, { "epoch": 0.66, "learning_rate": 0.0002014959264453148, "loss": 0.0177, "step": 253340 }, { "epoch": 0.66, "learning_rate": 0.00020149203822894334, "loss": 0.0158, "step": 253350 }, { "epoch": 0.66, "learning_rate": 0.00020148815001257188, "loss": 0.0167, "step": 253360 }, { "epoch": 0.66, "learning_rate": 0.00020148426179620042, "loss": 0.0233, "step": 253370 }, { "epoch": 0.66, "learning_rate": 0.00020148037357982894, "loss": 0.0155, "step": 253380 }, { "epoch": 0.66, "learning_rate": 0.00020147648536345748, "loss": 0.0182, "step": 253390 }, { "epoch": 0.66, "learning_rate": 0.00020147259714708602, "loss": 0.0216, "step": 253400 }, { "epoch": 0.66, "learning_rate": 0.00020146870893071456, "loss": 0.0154, "step": 253410 }, { "epoch": 0.66, "learning_rate": 0.00020146482071434308, "loss": 0.0154, "step": 253420 }, { "epoch": 0.66, "learning_rate": 0.00020146093249797162, "loss": 0.0133, "step": 253430 }, { "epoch": 0.66, "learning_rate": 0.0002014570442816002, "loss": 0.0173, "step": 253440 }, { "epoch": 0.66, "learning_rate": 0.0002014531560652287, "loss": 0.0117, "step": 253450 }, { "epoch": 0.66, "learning_rate": 0.00020144926784885725, "loss": 0.0172, "step": 253460 }, { "epoch": 0.66, "learning_rate": 0.00020144537963248576, "loss": 0.0137, "step": 253470 }, { "epoch": 0.66, "learning_rate": 0.00020144149141611433, "loss": 0.0156, "step": 253480 }, { "epoch": 0.66, "learning_rate": 0.00020143760319974284, "loss": 0.0168, "step": 253490 }, { "epoch": 0.66, "learning_rate": 0.00020143371498337138, "loss": 0.0166, "step": 253500 }, { "epoch": 0.66, "learning_rate": 0.0002014298267669999, "loss": 0.015, "step": 253510 }, { "epoch": 0.66, "learning_rate": 0.00020142593855062847, "loss": 0.0144, "step": 253520 }, { "epoch": 0.66, "learning_rate": 0.00020142205033425698, "loss": 0.0177, "step": 253530 }, { "epoch": 0.66, "learning_rate": 0.00020141816211788552, "loss": 0.014, "step": 253540 }, { "epoch": 0.66, "learning_rate": 0.00020141427390151404, "loss": 0.0185, "step": 253550 }, { "epoch": 0.66, "learning_rate": 0.0002014103856851426, "loss": 0.0158, "step": 253560 }, { "epoch": 0.66, "learning_rate": 0.00020140649746877112, "loss": 0.0159, "step": 253570 }, { "epoch": 0.66, "learning_rate": 0.00020140260925239966, "loss": 0.0155, "step": 253580 }, { "epoch": 0.66, "learning_rate": 0.00020139872103602818, "loss": 0.0209, "step": 253590 }, { "epoch": 0.66, "learning_rate": 0.00020139483281965672, "loss": 0.0128, "step": 253600 }, { "epoch": 0.66, "learning_rate": 0.0002013909446032853, "loss": 0.0163, "step": 253610 }, { "epoch": 0.66, "learning_rate": 0.0002013870563869138, "loss": 0.014, "step": 253620 }, { "epoch": 0.66, "learning_rate": 0.00020138316817054232, "loss": 0.0204, "step": 253630 }, { "epoch": 0.66, "learning_rate": 0.00020137927995417086, "loss": 0.0152, "step": 253640 }, { "epoch": 0.66, "learning_rate": 0.00020137539173779943, "loss": 0.0158, "step": 253650 }, { "epoch": 0.66, "learning_rate": 0.00020137150352142794, "loss": 0.0186, "step": 253660 }, { "epoch": 0.66, "learning_rate": 0.00020136761530505648, "loss": 0.0169, "step": 253670 }, { "epoch": 0.66, "learning_rate": 0.000201363727088685, "loss": 0.0172, "step": 253680 }, { "epoch": 0.66, "learning_rate": 0.00020135983887231357, "loss": 0.0151, "step": 253690 }, { "epoch": 0.66, "learning_rate": 0.00020135595065594208, "loss": 0.0153, "step": 253700 }, { "epoch": 0.66, "learning_rate": 0.00020135206243957062, "loss": 0.0139, "step": 253710 }, { "epoch": 0.66, "learning_rate": 0.00020134817422319914, "loss": 0.0178, "step": 253720 }, { "epoch": 0.66, "learning_rate": 0.0002013442860068277, "loss": 0.015, "step": 253730 }, { "epoch": 0.66, "learning_rate": 0.00020134039779045622, "loss": 0.018, "step": 253740 }, { "epoch": 0.66, "learning_rate": 0.00020133650957408476, "loss": 0.0172, "step": 253750 }, { "epoch": 0.66, "learning_rate": 0.00020133262135771328, "loss": 0.014, "step": 253760 }, { "epoch": 0.66, "learning_rate": 0.00020132873314134185, "loss": 0.0151, "step": 253770 }, { "epoch": 0.66, "learning_rate": 0.0002013248449249704, "loss": 0.0165, "step": 253780 }, { "epoch": 0.66, "learning_rate": 0.0002013209567085989, "loss": 0.0146, "step": 253790 }, { "epoch": 0.66, "learning_rate": 0.00020131706849222742, "loss": 0.0159, "step": 253800 }, { "epoch": 0.66, "learning_rate": 0.00020131318027585599, "loss": 0.0156, "step": 253810 }, { "epoch": 0.66, "learning_rate": 0.00020130929205948453, "loss": 0.0131, "step": 253820 }, { "epoch": 0.66, "learning_rate": 0.00020130540384311304, "loss": 0.0166, "step": 253830 }, { "epoch": 0.66, "learning_rate": 0.00020130151562674158, "loss": 0.013, "step": 253840 }, { "epoch": 0.66, "learning_rate": 0.0002012976274103701, "loss": 0.0133, "step": 253850 }, { "epoch": 0.66, "learning_rate": 0.00020129373919399867, "loss": 0.0143, "step": 253860 }, { "epoch": 0.66, "learning_rate": 0.00020128985097762718, "loss": 0.0162, "step": 253870 }, { "epoch": 0.66, "learning_rate": 0.00020128596276125572, "loss": 0.0159, "step": 253880 }, { "epoch": 0.66, "learning_rate": 0.00020128207454488424, "loss": 0.0179, "step": 253890 }, { "epoch": 0.66, "learning_rate": 0.0002012781863285128, "loss": 0.0172, "step": 253900 }, { "epoch": 0.66, "learning_rate": 0.00020127429811214132, "loss": 0.0172, "step": 253910 }, { "epoch": 0.66, "learning_rate": 0.00020127040989576986, "loss": 0.0153, "step": 253920 }, { "epoch": 0.66, "learning_rate": 0.00020126652167939838, "loss": 0.0216, "step": 253930 }, { "epoch": 0.66, "learning_rate": 0.00020126263346302695, "loss": 0.0136, "step": 253940 }, { "epoch": 0.66, "learning_rate": 0.00020125874524665546, "loss": 0.0157, "step": 253950 }, { "epoch": 0.66, "learning_rate": 0.000201254857030284, "loss": 0.0148, "step": 253960 }, { "epoch": 0.66, "learning_rate": 0.00020125096881391252, "loss": 0.0174, "step": 253970 }, { "epoch": 0.66, "learning_rate": 0.00020124708059754109, "loss": 0.0191, "step": 253980 }, { "epoch": 0.66, "learning_rate": 0.00020124319238116963, "loss": 0.013, "step": 253990 }, { "epoch": 0.66, "learning_rate": 0.00020123930416479814, "loss": 0.0141, "step": 254000 }, { "epoch": 0.66, "eval_cer": 0.8817110841447728, "eval_loss": 0.010805866681039333, "eval_runtime": 107.3516, "eval_samples_per_second": 18.63, "eval_steps_per_second": 4.658, "step": 254000 }, { "epoch": 0.66, "learning_rate": 0.00020123541594842668, "loss": 0.0205, "step": 254010 }, { "epoch": 0.66, "learning_rate": 0.00020123152773205522, "loss": 0.0176, "step": 254020 }, { "epoch": 0.66, "learning_rate": 0.00020122763951568377, "loss": 0.0166, "step": 254030 }, { "epoch": 0.66, "learning_rate": 0.00020122375129931228, "loss": 0.013, "step": 254040 }, { "epoch": 0.66, "learning_rate": 0.00020121986308294082, "loss": 0.0134, "step": 254050 }, { "epoch": 0.66, "learning_rate": 0.00020121597486656936, "loss": 0.0142, "step": 254060 }, { "epoch": 0.66, "learning_rate": 0.0002012120866501979, "loss": 0.0137, "step": 254070 }, { "epoch": 0.66, "learning_rate": 0.00020120819843382642, "loss": 0.0142, "step": 254080 }, { "epoch": 0.66, "learning_rate": 0.00020120431021745496, "loss": 0.0122, "step": 254090 }, { "epoch": 0.66, "learning_rate": 0.00020120042200108348, "loss": 0.0176, "step": 254100 }, { "epoch": 0.66, "learning_rate": 0.00020119653378471205, "loss": 0.0149, "step": 254110 }, { "epoch": 0.66, "learning_rate": 0.00020119264556834056, "loss": 0.0146, "step": 254120 }, { "epoch": 0.66, "learning_rate": 0.0002011887573519691, "loss": 0.0158, "step": 254130 }, { "epoch": 0.66, "learning_rate": 0.00020118486913559762, "loss": 0.0141, "step": 254140 }, { "epoch": 0.66, "learning_rate": 0.00020118098091922618, "loss": 0.012, "step": 254150 }, { "epoch": 0.66, "learning_rate": 0.00020117709270285473, "loss": 0.0135, "step": 254160 }, { "epoch": 0.66, "learning_rate": 0.00020117320448648324, "loss": 0.0151, "step": 254170 }, { "epoch": 0.66, "learning_rate": 0.00020116931627011178, "loss": 0.0219, "step": 254180 }, { "epoch": 0.66, "learning_rate": 0.00020116542805374032, "loss": 0.0167, "step": 254190 }, { "epoch": 0.66, "learning_rate": 0.00020116153983736887, "loss": 0.0172, "step": 254200 }, { "epoch": 0.66, "learning_rate": 0.00020115765162099738, "loss": 0.0163, "step": 254210 }, { "epoch": 0.66, "learning_rate": 0.00020115376340462592, "loss": 0.0141, "step": 254220 }, { "epoch": 0.66, "learning_rate": 0.00020114987518825446, "loss": 0.0168, "step": 254230 }, { "epoch": 0.66, "learning_rate": 0.000201145986971883, "loss": 0.0152, "step": 254240 }, { "epoch": 0.66, "learning_rate": 0.00020114209875551152, "loss": 0.013, "step": 254250 }, { "epoch": 0.66, "learning_rate": 0.00020113821053914006, "loss": 0.0168, "step": 254260 }, { "epoch": 0.66, "learning_rate": 0.0002011343223227686, "loss": 0.0165, "step": 254270 }, { "epoch": 0.66, "learning_rate": 0.00020113043410639714, "loss": 0.0132, "step": 254280 }, { "epoch": 0.66, "learning_rate": 0.00020112654589002566, "loss": 0.0134, "step": 254290 }, { "epoch": 0.66, "learning_rate": 0.0002011226576736542, "loss": 0.016, "step": 254300 }, { "epoch": 0.66, "learning_rate": 0.00020111876945728272, "loss": 0.0159, "step": 254310 }, { "epoch": 0.66, "learning_rate": 0.00020111488124091128, "loss": 0.0178, "step": 254320 }, { "epoch": 0.66, "learning_rate": 0.00020111099302453983, "loss": 0.0181, "step": 254330 }, { "epoch": 0.66, "learning_rate": 0.00020110710480816834, "loss": 0.0201, "step": 254340 }, { "epoch": 0.66, "learning_rate": 0.00020110321659179685, "loss": 0.0175, "step": 254350 }, { "epoch": 0.66, "learning_rate": 0.00020109932837542542, "loss": 0.0134, "step": 254360 }, { "epoch": 0.66, "learning_rate": 0.00020109544015905396, "loss": 0.0165, "step": 254370 }, { "epoch": 0.66, "learning_rate": 0.00020109155194268248, "loss": 0.0126, "step": 254380 }, { "epoch": 0.66, "learning_rate": 0.00020108766372631102, "loss": 0.0118, "step": 254390 }, { "epoch": 0.66, "learning_rate": 0.00020108377550993956, "loss": 0.0143, "step": 254400 }, { "epoch": 0.66, "learning_rate": 0.0002010798872935681, "loss": 0.0135, "step": 254410 }, { "epoch": 0.66, "learning_rate": 0.00020107599907719662, "loss": 0.0126, "step": 254420 }, { "epoch": 0.66, "learning_rate": 0.00020107211086082516, "loss": 0.0135, "step": 254430 }, { "epoch": 0.66, "learning_rate": 0.0002010682226444537, "loss": 0.0134, "step": 254440 }, { "epoch": 0.66, "learning_rate": 0.00020106433442808224, "loss": 0.0169, "step": 254450 }, { "epoch": 0.66, "learning_rate": 0.00020106044621171076, "loss": 0.0138, "step": 254460 }, { "epoch": 0.66, "learning_rate": 0.0002010565579953393, "loss": 0.0155, "step": 254470 }, { "epoch": 0.66, "learning_rate": 0.00020105266977896787, "loss": 0.0136, "step": 254480 }, { "epoch": 0.66, "learning_rate": 0.00020104878156259638, "loss": 0.0154, "step": 254490 }, { "epoch": 0.66, "learning_rate": 0.0002010448933462249, "loss": 0.0161, "step": 254500 }, { "epoch": 0.66, "learning_rate": 0.00020104100512985344, "loss": 0.0144, "step": 254510 }, { "epoch": 0.66, "learning_rate": 0.000201037116913482, "loss": 0.014, "step": 254520 }, { "epoch": 0.66, "learning_rate": 0.00020103322869711052, "loss": 0.0127, "step": 254530 }, { "epoch": 0.66, "learning_rate": 0.00020102934048073906, "loss": 0.0126, "step": 254540 }, { "epoch": 0.66, "learning_rate": 0.00020102545226436758, "loss": 0.0143, "step": 254550 }, { "epoch": 0.66, "learning_rate": 0.00020102156404799612, "loss": 0.0136, "step": 254560 }, { "epoch": 0.66, "learning_rate": 0.00020101767583162466, "loss": 0.0157, "step": 254570 }, { "epoch": 0.66, "learning_rate": 0.0002010137876152532, "loss": 0.0171, "step": 254580 }, { "epoch": 0.66, "learning_rate": 0.00020100989939888172, "loss": 0.0158, "step": 254590 }, { "epoch": 0.66, "learning_rate": 0.00020100601118251026, "loss": 0.0177, "step": 254600 }, { "epoch": 0.66, "learning_rate": 0.0002010021229661388, "loss": 0.0137, "step": 254610 }, { "epoch": 0.66, "learning_rate": 0.00020099823474976734, "loss": 0.0129, "step": 254620 }, { "epoch": 0.66, "learning_rate": 0.00020099434653339586, "loss": 0.013, "step": 254630 }, { "epoch": 0.66, "learning_rate": 0.0002009904583170244, "loss": 0.0169, "step": 254640 }, { "epoch": 0.66, "learning_rate": 0.00020098657010065297, "loss": 0.0113, "step": 254650 }, { "epoch": 0.66, "learning_rate": 0.00020098268188428148, "loss": 0.0133, "step": 254660 }, { "epoch": 0.66, "learning_rate": 0.00020097879366791, "loss": 0.0189, "step": 254670 }, { "epoch": 0.66, "learning_rate": 0.00020097490545153854, "loss": 0.0176, "step": 254680 }, { "epoch": 0.66, "learning_rate": 0.0002009710172351671, "loss": 0.0147, "step": 254690 }, { "epoch": 0.66, "learning_rate": 0.00020096712901879562, "loss": 0.0142, "step": 254700 }, { "epoch": 0.66, "learning_rate": 0.00020096324080242416, "loss": 0.016, "step": 254710 }, { "epoch": 0.66, "learning_rate": 0.00020095935258605268, "loss": 0.0205, "step": 254720 }, { "epoch": 0.66, "learning_rate": 0.00020095546436968125, "loss": 0.0131, "step": 254730 }, { "epoch": 0.66, "learning_rate": 0.00020095157615330976, "loss": 0.0159, "step": 254740 }, { "epoch": 0.66, "learning_rate": 0.0002009476879369383, "loss": 0.0127, "step": 254750 }, { "epoch": 0.66, "learning_rate": 0.00020094379972056682, "loss": 0.0165, "step": 254760 }, { "epoch": 0.66, "learning_rate": 0.0002009399115041954, "loss": 0.0133, "step": 254770 }, { "epoch": 0.66, "learning_rate": 0.0002009360232878239, "loss": 0.0169, "step": 254780 }, { "epoch": 0.66, "learning_rate": 0.00020093213507145244, "loss": 0.0171, "step": 254790 }, { "epoch": 0.66, "learning_rate": 0.00020092824685508096, "loss": 0.0157, "step": 254800 }, { "epoch": 0.66, "learning_rate": 0.0002009243586387095, "loss": 0.0175, "step": 254810 }, { "epoch": 0.66, "learning_rate": 0.00020092047042233804, "loss": 0.017, "step": 254820 }, { "epoch": 0.66, "learning_rate": 0.00020091658220596658, "loss": 0.0155, "step": 254830 }, { "epoch": 0.66, "learning_rate": 0.0002009126939895951, "loss": 0.013, "step": 254840 }, { "epoch": 0.66, "learning_rate": 0.00020090880577322364, "loss": 0.017, "step": 254850 }, { "epoch": 0.66, "learning_rate": 0.0002009049175568522, "loss": 0.0183, "step": 254860 }, { "epoch": 0.66, "learning_rate": 0.00020090102934048072, "loss": 0.016, "step": 254870 }, { "epoch": 0.66, "learning_rate": 0.00020089714112410926, "loss": 0.0139, "step": 254880 }, { "epoch": 0.66, "learning_rate": 0.00020089325290773778, "loss": 0.0163, "step": 254890 }, { "epoch": 0.66, "learning_rate": 0.00020088936469136635, "loss": 0.0139, "step": 254900 }, { "epoch": 0.66, "learning_rate": 0.00020088547647499486, "loss": 0.0155, "step": 254910 }, { "epoch": 0.66, "learning_rate": 0.0002008815882586234, "loss": 0.015, "step": 254920 }, { "epoch": 0.66, "learning_rate": 0.00020087770004225192, "loss": 0.014, "step": 254930 }, { "epoch": 0.66, "learning_rate": 0.00020087381182588049, "loss": 0.0157, "step": 254940 }, { "epoch": 0.66, "learning_rate": 0.000200869923609509, "loss": 0.0137, "step": 254950 }, { "epoch": 0.66, "learning_rate": 0.00020086603539313754, "loss": 0.0126, "step": 254960 }, { "epoch": 0.66, "learning_rate": 0.00020086214717676606, "loss": 0.0135, "step": 254970 }, { "epoch": 0.66, "learning_rate": 0.00020085825896039463, "loss": 0.0141, "step": 254980 }, { "epoch": 0.66, "learning_rate": 0.00020085437074402314, "loss": 0.014, "step": 254990 }, { "epoch": 0.66, "learning_rate": 0.00020085048252765168, "loss": 0.0139, "step": 255000 }, { "epoch": 0.66, "eval_cer": 0.8817488743419957, "eval_loss": 0.010790371336042881, "eval_runtime": 107.3987, "eval_samples_per_second": 18.622, "eval_steps_per_second": 4.656, "step": 255000 }, { "epoch": 0.66, "learning_rate": 0.0002008465943112802, "loss": 0.0133, "step": 255010 }, { "epoch": 0.66, "learning_rate": 0.00020084270609490876, "loss": 0.0159, "step": 255020 }, { "epoch": 0.66, "learning_rate": 0.0002008388178785373, "loss": 0.0153, "step": 255030 }, { "epoch": 0.66, "learning_rate": 0.00020083492966216582, "loss": 0.0155, "step": 255040 }, { "epoch": 0.66, "learning_rate": 0.00020083104144579436, "loss": 0.0147, "step": 255050 }, { "epoch": 0.66, "learning_rate": 0.00020082715322942288, "loss": 0.0162, "step": 255060 }, { "epoch": 0.66, "learning_rate": 0.00020082326501305145, "loss": 0.0118, "step": 255070 }, { "epoch": 0.66, "learning_rate": 0.00020081937679667996, "loss": 0.0139, "step": 255080 }, { "epoch": 0.66, "learning_rate": 0.0002008154885803085, "loss": 0.0164, "step": 255090 }, { "epoch": 0.66, "learning_rate": 0.00020081160036393702, "loss": 0.0166, "step": 255100 }, { "epoch": 0.66, "learning_rate": 0.00020080771214756559, "loss": 0.0156, "step": 255110 }, { "epoch": 0.66, "learning_rate": 0.0002008038239311941, "loss": 0.0123, "step": 255120 }, { "epoch": 0.66, "learning_rate": 0.00020079993571482264, "loss": 0.0141, "step": 255130 }, { "epoch": 0.66, "learning_rate": 0.00020079604749845116, "loss": 0.0141, "step": 255140 }, { "epoch": 0.66, "learning_rate": 0.00020079215928207972, "loss": 0.0199, "step": 255150 }, { "epoch": 0.66, "learning_rate": 0.00020078827106570824, "loss": 0.0165, "step": 255160 }, { "epoch": 0.66, "learning_rate": 0.00020078438284933678, "loss": 0.0152, "step": 255170 }, { "epoch": 0.66, "learning_rate": 0.0002007804946329653, "loss": 0.0135, "step": 255180 }, { "epoch": 0.66, "learning_rate": 0.00020077660641659386, "loss": 0.0189, "step": 255190 }, { "epoch": 0.66, "learning_rate": 0.0002007727182002224, "loss": 0.0189, "step": 255200 }, { "epoch": 0.66, "learning_rate": 0.00020076882998385092, "loss": 0.0133, "step": 255210 }, { "epoch": 0.66, "learning_rate": 0.00020076494176747943, "loss": 0.02, "step": 255220 }, { "epoch": 0.66, "learning_rate": 0.000200761053551108, "loss": 0.0167, "step": 255230 }, { "epoch": 0.66, "learning_rate": 0.00020075716533473655, "loss": 0.0172, "step": 255240 }, { "epoch": 0.66, "learning_rate": 0.00020075327711836506, "loss": 0.0183, "step": 255250 }, { "epoch": 0.66, "learning_rate": 0.0002007493889019936, "loss": 0.0128, "step": 255260 }, { "epoch": 0.66, "learning_rate": 0.00020074550068562214, "loss": 0.0139, "step": 255270 }, { "epoch": 0.66, "learning_rate": 0.00020074161246925068, "loss": 0.0164, "step": 255280 }, { "epoch": 0.66, "learning_rate": 0.0002007377242528792, "loss": 0.0126, "step": 255290 }, { "epoch": 0.66, "learning_rate": 0.00020073383603650774, "loss": 0.0184, "step": 255300 }, { "epoch": 0.66, "learning_rate": 0.00020072994782013626, "loss": 0.015, "step": 255310 }, { "epoch": 0.66, "learning_rate": 0.00020072605960376482, "loss": 0.014, "step": 255320 }, { "epoch": 0.66, "learning_rate": 0.00020072217138739334, "loss": 0.0172, "step": 255330 }, { "epoch": 0.66, "learning_rate": 0.00020071828317102188, "loss": 0.0137, "step": 255340 }, { "epoch": 0.66, "learning_rate": 0.0002007143949546504, "loss": 0.0147, "step": 255350 }, { "epoch": 0.66, "learning_rate": 0.00020071050673827896, "loss": 0.0142, "step": 255360 }, { "epoch": 0.66, "learning_rate": 0.0002007066185219075, "loss": 0.0157, "step": 255370 }, { "epoch": 0.66, "learning_rate": 0.00020070273030553602, "loss": 0.0167, "step": 255380 }, { "epoch": 0.66, "learning_rate": 0.00020069884208916453, "loss": 0.0157, "step": 255390 }, { "epoch": 0.66, "learning_rate": 0.0002006949538727931, "loss": 0.0157, "step": 255400 }, { "epoch": 0.66, "learning_rate": 0.00020069106565642164, "loss": 0.0133, "step": 255410 }, { "epoch": 0.66, "learning_rate": 0.00020068717744005016, "loss": 0.0178, "step": 255420 }, { "epoch": 0.66, "learning_rate": 0.0002006832892236787, "loss": 0.0161, "step": 255430 }, { "epoch": 0.66, "learning_rate": 0.00020067940100730724, "loss": 0.0141, "step": 255440 }, { "epoch": 0.66, "learning_rate": 0.00020067551279093578, "loss": 0.0139, "step": 255450 }, { "epoch": 0.66, "learning_rate": 0.0002006716245745643, "loss": 0.0165, "step": 255460 }, { "epoch": 0.66, "learning_rate": 0.00020066773635819284, "loss": 0.0136, "step": 255470 }, { "epoch": 0.66, "learning_rate": 0.00020066384814182138, "loss": 0.017, "step": 255480 }, { "epoch": 0.66, "learning_rate": 0.00020065995992544992, "loss": 0.0148, "step": 255490 }, { "epoch": 0.66, "learning_rate": 0.00020065607170907844, "loss": 0.0157, "step": 255500 }, { "epoch": 0.66, "learning_rate": 0.00020065218349270698, "loss": 0.0146, "step": 255510 }, { "epoch": 0.66, "learning_rate": 0.00020064829527633555, "loss": 0.0227, "step": 255520 }, { "epoch": 0.66, "learning_rate": 0.00020064440705996406, "loss": 0.0131, "step": 255530 }, { "epoch": 0.66, "learning_rate": 0.00020064051884359258, "loss": 0.0119, "step": 255540 }, { "epoch": 0.66, "learning_rate": 0.00020063663062722112, "loss": 0.0156, "step": 255550 }, { "epoch": 0.66, "learning_rate": 0.00020063274241084963, "loss": 0.0156, "step": 255560 }, { "epoch": 0.66, "learning_rate": 0.0002006288541944782, "loss": 0.0135, "step": 255570 }, { "epoch": 0.66, "learning_rate": 0.00020062496597810674, "loss": 0.0152, "step": 255580 }, { "epoch": 0.66, "learning_rate": 0.00020062107776173526, "loss": 0.0184, "step": 255590 }, { "epoch": 0.66, "learning_rate": 0.0002006171895453638, "loss": 0.0178, "step": 255600 }, { "epoch": 0.66, "learning_rate": 0.00020061330132899234, "loss": 0.0174, "step": 255610 }, { "epoch": 0.66, "learning_rate": 0.00020060941311262088, "loss": 0.0153, "step": 255620 }, { "epoch": 0.66, "learning_rate": 0.0002006055248962494, "loss": 0.0203, "step": 255630 }, { "epoch": 0.66, "learning_rate": 0.00020060163667987794, "loss": 0.0201, "step": 255640 }, { "epoch": 0.66, "learning_rate": 0.00020059774846350648, "loss": 0.0173, "step": 255650 }, { "epoch": 0.66, "learning_rate": 0.00020059386024713502, "loss": 0.0183, "step": 255660 }, { "epoch": 0.66, "learning_rate": 0.00020058997203076354, "loss": 0.0174, "step": 255670 }, { "epoch": 0.66, "learning_rate": 0.00020058608381439208, "loss": 0.0173, "step": 255680 }, { "epoch": 0.66, "learning_rate": 0.00020058219559802062, "loss": 0.0134, "step": 255690 }, { "epoch": 0.66, "learning_rate": 0.00020057830738164916, "loss": 0.0168, "step": 255700 }, { "epoch": 0.66, "learning_rate": 0.00020057441916527768, "loss": 0.0165, "step": 255710 }, { "epoch": 0.66, "learning_rate": 0.00020057053094890622, "loss": 0.0143, "step": 255720 }, { "epoch": 0.66, "learning_rate": 0.0002005666427325348, "loss": 0.0157, "step": 255730 }, { "epoch": 0.66, "learning_rate": 0.0002005627545161633, "loss": 0.0165, "step": 255740 }, { "epoch": 0.66, "learning_rate": 0.00020055886629979184, "loss": 0.0195, "step": 255750 }, { "epoch": 0.66, "learning_rate": 0.00020055497808342036, "loss": 0.0149, "step": 255760 }, { "epoch": 0.66, "learning_rate": 0.00020055108986704893, "loss": 0.0134, "step": 255770 }, { "epoch": 0.66, "learning_rate": 0.00020054720165067744, "loss": 0.0146, "step": 255780 }, { "epoch": 0.66, "learning_rate": 0.00020054331343430598, "loss": 0.016, "step": 255790 }, { "epoch": 0.66, "learning_rate": 0.0002005394252179345, "loss": 0.0121, "step": 255800 }, { "epoch": 0.66, "learning_rate": 0.00020053553700156304, "loss": 0.0164, "step": 255810 }, { "epoch": 0.66, "learning_rate": 0.00020053164878519158, "loss": 0.0148, "step": 255820 }, { "epoch": 0.66, "learning_rate": 0.00020052776056882012, "loss": 0.01, "step": 255830 }, { "epoch": 0.66, "learning_rate": 0.00020052387235244864, "loss": 0.0147, "step": 255840 }, { "epoch": 0.66, "learning_rate": 0.00020051998413607718, "loss": 0.0137, "step": 255850 }, { "epoch": 0.66, "learning_rate": 0.00020051609591970572, "loss": 0.0124, "step": 255860 }, { "epoch": 0.66, "learning_rate": 0.00020051220770333426, "loss": 0.0137, "step": 255870 }, { "epoch": 0.66, "learning_rate": 0.00020050831948696278, "loss": 0.0149, "step": 255880 }, { "epoch": 0.66, "learning_rate": 0.00020050443127059132, "loss": 0.016, "step": 255890 }, { "epoch": 0.66, "learning_rate": 0.0002005005430542199, "loss": 0.0157, "step": 255900 }, { "epoch": 0.66, "learning_rate": 0.0002004966548378484, "loss": 0.0159, "step": 255910 }, { "epoch": 0.66, "learning_rate": 0.00020049276662147694, "loss": 0.0137, "step": 255920 }, { "epoch": 0.66, "learning_rate": 0.00020048887840510546, "loss": 0.0196, "step": 255930 }, { "epoch": 0.66, "learning_rate": 0.00020048499018873403, "loss": 0.0144, "step": 255940 }, { "epoch": 0.66, "learning_rate": 0.00020048110197236254, "loss": 0.017, "step": 255950 }, { "epoch": 0.66, "learning_rate": 0.00020047721375599108, "loss": 0.0147, "step": 255960 }, { "epoch": 0.66, "learning_rate": 0.0002004733255396196, "loss": 0.0191, "step": 255970 }, { "epoch": 0.66, "learning_rate": 0.00020046943732324817, "loss": 0.015, "step": 255980 }, { "epoch": 0.66, "learning_rate": 0.00020046554910687668, "loss": 0.0153, "step": 255990 }, { "epoch": 0.66, "learning_rate": 0.00020046166089050522, "loss": 0.0166, "step": 256000 }, { "epoch": 0.66, "eval_cer": 0.8818048598193629, "eval_loss": 0.010679894126951694, "eval_runtime": 107.5034, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 256000 }, { "epoch": 0.66, "learning_rate": 0.00020045777267413374, "loss": 0.0164, "step": 256010 }, { "epoch": 0.66, "learning_rate": 0.0002004538844577623, "loss": 0.0223, "step": 256020 }, { "epoch": 0.66, "learning_rate": 0.00020044999624139082, "loss": 0.0213, "step": 256030 }, { "epoch": 0.66, "learning_rate": 0.00020044610802501936, "loss": 0.0197, "step": 256040 }, { "epoch": 0.66, "learning_rate": 0.00020044221980864788, "loss": 0.0167, "step": 256050 }, { "epoch": 0.66, "learning_rate": 0.00020043833159227642, "loss": 0.0148, "step": 256060 }, { "epoch": 0.66, "learning_rate": 0.00020043444337590499, "loss": 0.0175, "step": 256070 }, { "epoch": 0.66, "learning_rate": 0.0002004305551595335, "loss": 0.0215, "step": 256080 }, { "epoch": 0.66, "learning_rate": 0.00020042666694316202, "loss": 0.019, "step": 256090 }, { "epoch": 0.66, "learning_rate": 0.00020042277872679056, "loss": 0.0153, "step": 256100 }, { "epoch": 0.66, "learning_rate": 0.00020041889051041913, "loss": 0.0154, "step": 256110 }, { "epoch": 0.66, "learning_rate": 0.00020041500229404764, "loss": 0.0168, "step": 256120 }, { "epoch": 0.66, "learning_rate": 0.00020041111407767618, "loss": 0.017, "step": 256130 }, { "epoch": 0.66, "learning_rate": 0.0002004072258613047, "loss": 0.0181, "step": 256140 }, { "epoch": 0.66, "learning_rate": 0.00020040333764493327, "loss": 0.0143, "step": 256150 }, { "epoch": 0.66, "learning_rate": 0.00020039944942856178, "loss": 0.0171, "step": 256160 }, { "epoch": 0.66, "learning_rate": 0.00020039556121219032, "loss": 0.0115, "step": 256170 }, { "epoch": 0.66, "learning_rate": 0.00020039167299581884, "loss": 0.015, "step": 256180 }, { "epoch": 0.66, "learning_rate": 0.0002003877847794474, "loss": 0.0197, "step": 256190 }, { "epoch": 0.66, "learning_rate": 0.00020038389656307592, "loss": 0.0174, "step": 256200 }, { "epoch": 0.66, "learning_rate": 0.00020038000834670446, "loss": 0.0139, "step": 256210 }, { "epoch": 0.66, "learning_rate": 0.00020037612013033298, "loss": 0.0182, "step": 256220 }, { "epoch": 0.66, "learning_rate": 0.00020037223191396154, "loss": 0.0124, "step": 256230 }, { "epoch": 0.66, "learning_rate": 0.00020036834369759009, "loss": 0.0136, "step": 256240 }, { "epoch": 0.66, "learning_rate": 0.0002003644554812186, "loss": 0.0141, "step": 256250 }, { "epoch": 0.66, "learning_rate": 0.00020036056726484711, "loss": 0.0195, "step": 256260 }, { "epoch": 0.66, "learning_rate": 0.00020035667904847568, "loss": 0.0151, "step": 256270 }, { "epoch": 0.66, "learning_rate": 0.00020035279083210423, "loss": 0.0154, "step": 256280 }, { "epoch": 0.66, "learning_rate": 0.00020034890261573274, "loss": 0.0221, "step": 256290 }, { "epoch": 0.66, "learning_rate": 0.00020034501439936128, "loss": 0.0186, "step": 256300 }, { "epoch": 0.66, "learning_rate": 0.0002003411261829898, "loss": 0.0169, "step": 256310 }, { "epoch": 0.66, "learning_rate": 0.00020033723796661836, "loss": 0.0169, "step": 256320 }, { "epoch": 0.66, "learning_rate": 0.00020033334975024688, "loss": 0.0103, "step": 256330 }, { "epoch": 0.66, "learning_rate": 0.00020032946153387542, "loss": 0.015, "step": 256340 }, { "epoch": 0.66, "learning_rate": 0.00020032557331750394, "loss": 0.0231, "step": 256350 }, { "epoch": 0.66, "learning_rate": 0.0002003216851011325, "loss": 0.0178, "step": 256360 }, { "epoch": 0.66, "learning_rate": 0.00020031779688476102, "loss": 0.0185, "step": 256370 }, { "epoch": 0.66, "learning_rate": 0.00020031390866838956, "loss": 0.0166, "step": 256380 }, { "epoch": 0.66, "learning_rate": 0.00020031002045201807, "loss": 0.015, "step": 256390 }, { "epoch": 0.66, "learning_rate": 0.00020030613223564664, "loss": 0.0148, "step": 256400 }, { "epoch": 0.66, "learning_rate": 0.00020030224401927516, "loss": 0.0136, "step": 256410 }, { "epoch": 0.66, "learning_rate": 0.0002002983558029037, "loss": 0.0138, "step": 256420 }, { "epoch": 0.66, "learning_rate": 0.00020029446758653221, "loss": 0.013, "step": 256430 }, { "epoch": 0.66, "learning_rate": 0.00020029057937016078, "loss": 0.0135, "step": 256440 }, { "epoch": 0.66, "learning_rate": 0.00020028669115378932, "loss": 0.0181, "step": 256450 }, { "epoch": 0.66, "learning_rate": 0.00020028280293741784, "loss": 0.0132, "step": 256460 }, { "epoch": 0.66, "learning_rate": 0.00020027891472104638, "loss": 0.0154, "step": 256470 }, { "epoch": 0.66, "learning_rate": 0.00020027502650467492, "loss": 0.0141, "step": 256480 }, { "epoch": 0.66, "learning_rate": 0.00020027113828830346, "loss": 0.0126, "step": 256490 }, { "epoch": 0.66, "learning_rate": 0.00020026725007193198, "loss": 0.0138, "step": 256500 }, { "epoch": 0.66, "learning_rate": 0.00020026336185556052, "loss": 0.0156, "step": 256510 }, { "epoch": 0.66, "learning_rate": 0.00020025947363918906, "loss": 0.0133, "step": 256520 }, { "epoch": 0.66, "learning_rate": 0.0002002555854228176, "loss": 0.0135, "step": 256530 }, { "epoch": 0.66, "learning_rate": 0.00020025169720644612, "loss": 0.0143, "step": 256540 }, { "epoch": 0.67, "learning_rate": 0.00020024780899007466, "loss": 0.0168, "step": 256550 }, { "epoch": 0.67, "learning_rate": 0.00020024392077370317, "loss": 0.0142, "step": 256560 }, { "epoch": 0.67, "learning_rate": 0.00020024003255733174, "loss": 0.0172, "step": 256570 }, { "epoch": 0.67, "learning_rate": 0.00020023614434096026, "loss": 0.0186, "step": 256580 }, { "epoch": 0.67, "learning_rate": 0.0002002322561245888, "loss": 0.0171, "step": 256590 }, { "epoch": 0.67, "learning_rate": 0.00020022836790821731, "loss": 0.0136, "step": 256600 }, { "epoch": 0.67, "learning_rate": 0.00020022447969184588, "loss": 0.0167, "step": 256610 }, { "epoch": 0.67, "learning_rate": 0.00020022059147547442, "loss": 0.0135, "step": 256620 }, { "epoch": 0.67, "learning_rate": 0.00020021670325910294, "loss": 0.0133, "step": 256630 }, { "epoch": 0.67, "learning_rate": 0.00020021281504273148, "loss": 0.0139, "step": 256640 }, { "epoch": 0.67, "learning_rate": 0.00020020892682636002, "loss": 0.0203, "step": 256650 }, { "epoch": 0.67, "learning_rate": 0.00020020503860998856, "loss": 0.0154, "step": 256660 }, { "epoch": 0.67, "learning_rate": 0.00020020115039361708, "loss": 0.0141, "step": 256670 }, { "epoch": 0.67, "learning_rate": 0.00020019726217724562, "loss": 0.018, "step": 256680 }, { "epoch": 0.67, "learning_rate": 0.00020019337396087416, "loss": 0.0146, "step": 256690 }, { "epoch": 0.67, "learning_rate": 0.0002001894857445027, "loss": 0.0154, "step": 256700 }, { "epoch": 0.67, "learning_rate": 0.00020018559752813122, "loss": 0.0147, "step": 256710 }, { "epoch": 0.67, "learning_rate": 0.00020018170931175976, "loss": 0.0146, "step": 256720 }, { "epoch": 0.67, "learning_rate": 0.0002001778210953883, "loss": 0.016, "step": 256730 }, { "epoch": 0.67, "learning_rate": 0.00020017393287901684, "loss": 0.0139, "step": 256740 }, { "epoch": 0.67, "learning_rate": 0.00020017004466264536, "loss": 0.0147, "step": 256750 }, { "epoch": 0.67, "learning_rate": 0.0002001661564462739, "loss": 0.0121, "step": 256760 }, { "epoch": 0.67, "learning_rate": 0.00020016226822990247, "loss": 0.0178, "step": 256770 }, { "epoch": 0.67, "learning_rate": 0.00020015838001353098, "loss": 0.0151, "step": 256780 }, { "epoch": 0.67, "learning_rate": 0.00020015449179715952, "loss": 0.0153, "step": 256790 }, { "epoch": 0.67, "learning_rate": 0.00020015060358078804, "loss": 0.0151, "step": 256800 }, { "epoch": 0.67, "learning_rate": 0.00020014671536441655, "loss": 0.0165, "step": 256810 }, { "epoch": 0.67, "learning_rate": 0.00020014282714804512, "loss": 0.0156, "step": 256820 }, { "epoch": 0.67, "learning_rate": 0.00020013893893167366, "loss": 0.0146, "step": 256830 }, { "epoch": 0.67, "learning_rate": 0.00020013505071530218, "loss": 0.0173, "step": 256840 }, { "epoch": 0.67, "learning_rate": 0.00020013116249893072, "loss": 0.0149, "step": 256850 }, { "epoch": 0.67, "learning_rate": 0.00020012727428255926, "loss": 0.0179, "step": 256860 }, { "epoch": 0.67, "learning_rate": 0.0002001233860661878, "loss": 0.0232, "step": 256870 }, { "epoch": 0.67, "learning_rate": 0.00020011949784981632, "loss": 0.0157, "step": 256880 }, { "epoch": 0.67, "learning_rate": 0.00020011560963344486, "loss": 0.0216, "step": 256890 }, { "epoch": 0.67, "learning_rate": 0.0002001117214170734, "loss": 0.0155, "step": 256900 }, { "epoch": 0.67, "learning_rate": 0.00020010783320070194, "loss": 0.016, "step": 256910 }, { "epoch": 0.67, "learning_rate": 0.00020010394498433046, "loss": 0.0178, "step": 256920 }, { "epoch": 0.67, "learning_rate": 0.000200100056767959, "loss": 0.0148, "step": 256930 }, { "epoch": 0.67, "learning_rate": 0.00020009616855158757, "loss": 0.0175, "step": 256940 }, { "epoch": 0.67, "learning_rate": 0.00020009228033521608, "loss": 0.0149, "step": 256950 }, { "epoch": 0.67, "learning_rate": 0.00020008839211884462, "loss": 0.0161, "step": 256960 }, { "epoch": 0.67, "learning_rate": 0.00020008450390247314, "loss": 0.0136, "step": 256970 }, { "epoch": 0.67, "learning_rate": 0.0002000806156861017, "loss": 0.015, "step": 256980 }, { "epoch": 0.67, "learning_rate": 0.00020007672746973022, "loss": 0.0142, "step": 256990 }, { "epoch": 0.67, "learning_rate": 0.00020007283925335876, "loss": 0.0115, "step": 257000 }, { "epoch": 0.67, "eval_cer": 0.8817446754311932, "eval_loss": 0.010795309208333492, "eval_runtime": 107.4074, "eval_samples_per_second": 18.621, "eval_steps_per_second": 4.655, "step": 257000 }, { "epoch": 0.67, "learning_rate": 0.00020006895103698728, "loss": 0.0141, "step": 257010 }, { "epoch": 0.67, "learning_rate": 0.00020006506282061585, "loss": 0.0179, "step": 257020 }, { "epoch": 0.67, "learning_rate": 0.00020006117460424436, "loss": 0.0136, "step": 257030 }, { "epoch": 0.67, "learning_rate": 0.0002000572863878729, "loss": 0.0138, "step": 257040 }, { "epoch": 0.67, "learning_rate": 0.00020005339817150142, "loss": 0.0182, "step": 257050 }, { "epoch": 0.67, "learning_rate": 0.00020004950995512996, "loss": 0.0162, "step": 257060 }, { "epoch": 0.67, "learning_rate": 0.0002000456217387585, "loss": 0.0189, "step": 257070 }, { "epoch": 0.67, "learning_rate": 0.00020004173352238704, "loss": 0.0127, "step": 257080 }, { "epoch": 0.67, "learning_rate": 0.00020003784530601556, "loss": 0.0176, "step": 257090 }, { "epoch": 0.67, "learning_rate": 0.0002000339570896441, "loss": 0.0141, "step": 257100 }, { "epoch": 0.67, "learning_rate": 0.00020003006887327267, "loss": 0.0131, "step": 257110 }, { "epoch": 0.67, "learning_rate": 0.00020002618065690118, "loss": 0.0167, "step": 257120 }, { "epoch": 0.67, "learning_rate": 0.0002000222924405297, "loss": 0.016, "step": 257130 }, { "epoch": 0.67, "learning_rate": 0.00020001840422415824, "loss": 0.015, "step": 257140 }, { "epoch": 0.67, "learning_rate": 0.0002000145160077868, "loss": 0.013, "step": 257150 }, { "epoch": 0.67, "learning_rate": 0.00020001062779141532, "loss": 0.0134, "step": 257160 }, { "epoch": 0.67, "learning_rate": 0.00020000673957504386, "loss": 0.017, "step": 257170 }, { "epoch": 0.67, "learning_rate": 0.00020000285135867238, "loss": 0.0153, "step": 257180 }, { "epoch": 0.67, "learning_rate": 0.00019999896314230094, "loss": 0.0156, "step": 257190 }, { "epoch": 0.67, "learning_rate": 0.00019999507492592946, "loss": 0.0182, "step": 257200 }, { "epoch": 0.67, "learning_rate": 0.000199991186709558, "loss": 0.0163, "step": 257210 }, { "epoch": 0.67, "learning_rate": 0.00019998729849318652, "loss": 0.0157, "step": 257220 }, { "epoch": 0.67, "learning_rate": 0.00019998341027681508, "loss": 0.0136, "step": 257230 }, { "epoch": 0.67, "learning_rate": 0.0001999795220604436, "loss": 0.0143, "step": 257240 }, { "epoch": 0.67, "learning_rate": 0.00019997563384407214, "loss": 0.0184, "step": 257250 }, { "epoch": 0.67, "learning_rate": 0.00019997174562770066, "loss": 0.0158, "step": 257260 }, { "epoch": 0.67, "learning_rate": 0.00019996785741132922, "loss": 0.0208, "step": 257270 }, { "epoch": 0.67, "learning_rate": 0.00019996396919495774, "loss": 0.0141, "step": 257280 }, { "epoch": 0.67, "learning_rate": 0.00019996008097858628, "loss": 0.0177, "step": 257290 }, { "epoch": 0.67, "learning_rate": 0.0001999561927622148, "loss": 0.0182, "step": 257300 }, { "epoch": 0.67, "learning_rate": 0.00019995230454584334, "loss": 0.0152, "step": 257310 }, { "epoch": 0.67, "learning_rate": 0.0001999484163294719, "loss": 0.0162, "step": 257320 }, { "epoch": 0.67, "learning_rate": 0.00019994452811310042, "loss": 0.0178, "step": 257330 }, { "epoch": 0.67, "learning_rate": 0.00019994063989672896, "loss": 0.018, "step": 257340 }, { "epoch": 0.67, "learning_rate": 0.00019993675168035748, "loss": 0.0204, "step": 257350 }, { "epoch": 0.67, "learning_rate": 0.00019993286346398604, "loss": 0.0154, "step": 257360 }, { "epoch": 0.67, "learning_rate": 0.00019992897524761456, "loss": 0.0155, "step": 257370 }, { "epoch": 0.67, "learning_rate": 0.0001999250870312431, "loss": 0.0181, "step": 257380 }, { "epoch": 0.67, "learning_rate": 0.00019992119881487162, "loss": 0.016, "step": 257390 }, { "epoch": 0.67, "learning_rate": 0.00019991731059850018, "loss": 0.0145, "step": 257400 }, { "epoch": 0.67, "learning_rate": 0.0001999134223821287, "loss": 0.0233, "step": 257410 }, { "epoch": 0.67, "learning_rate": 0.00019990953416575724, "loss": 0.0139, "step": 257420 }, { "epoch": 0.67, "learning_rate": 0.00019990564594938575, "loss": 0.0171, "step": 257430 }, { "epoch": 0.67, "learning_rate": 0.00019990175773301432, "loss": 0.011, "step": 257440 }, { "epoch": 0.67, "learning_rate": 0.00019989786951664284, "loss": 0.0152, "step": 257450 }, { "epoch": 0.67, "learning_rate": 0.00019989398130027138, "loss": 0.0172, "step": 257460 }, { "epoch": 0.67, "learning_rate": 0.0001998900930838999, "loss": 0.0143, "step": 257470 }, { "epoch": 0.67, "learning_rate": 0.00019988620486752846, "loss": 0.0152, "step": 257480 }, { "epoch": 0.67, "learning_rate": 0.000199882316651157, "loss": 0.012, "step": 257490 }, { "epoch": 0.67, "learning_rate": 0.00019987842843478552, "loss": 0.0211, "step": 257500 }, { "epoch": 0.67, "learning_rate": 0.00019987454021841406, "loss": 0.015, "step": 257510 }, { "epoch": 0.67, "learning_rate": 0.0001998706520020426, "loss": 0.0212, "step": 257520 }, { "epoch": 0.67, "learning_rate": 0.00019986676378567114, "loss": 0.0164, "step": 257530 }, { "epoch": 0.67, "learning_rate": 0.00019986287556929966, "loss": 0.0171, "step": 257540 }, { "epoch": 0.67, "learning_rate": 0.0001998589873529282, "loss": 0.014, "step": 257550 }, { "epoch": 0.67, "learning_rate": 0.00019985509913655671, "loss": 0.0136, "step": 257560 }, { "epoch": 0.67, "learning_rate": 0.00019985121092018528, "loss": 0.0157, "step": 257570 }, { "epoch": 0.67, "learning_rate": 0.0001998473227038138, "loss": 0.0181, "step": 257580 }, { "epoch": 0.67, "learning_rate": 0.00019984343448744234, "loss": 0.0157, "step": 257590 }, { "epoch": 0.67, "learning_rate": 0.00019983954627107085, "loss": 0.0156, "step": 257600 }, { "epoch": 0.67, "learning_rate": 0.00019983565805469942, "loss": 0.0145, "step": 257610 }, { "epoch": 0.67, "learning_rate": 0.00019983176983832794, "loss": 0.0204, "step": 257620 }, { "epoch": 0.67, "learning_rate": 0.00019982788162195648, "loss": 0.0153, "step": 257630 }, { "epoch": 0.67, "learning_rate": 0.000199823993405585, "loss": 0.0151, "step": 257640 }, { "epoch": 0.67, "learning_rate": 0.00019982010518921356, "loss": 0.0159, "step": 257650 }, { "epoch": 0.67, "learning_rate": 0.0001998162169728421, "loss": 0.0136, "step": 257660 }, { "epoch": 0.67, "learning_rate": 0.00019981232875647062, "loss": 0.0188, "step": 257670 }, { "epoch": 0.67, "learning_rate": 0.00019980844054009913, "loss": 0.0133, "step": 257680 }, { "epoch": 0.67, "learning_rate": 0.0001998045523237277, "loss": 0.0146, "step": 257690 }, { "epoch": 0.67, "learning_rate": 0.00019980066410735624, "loss": 0.0156, "step": 257700 }, { "epoch": 0.67, "learning_rate": 0.00019979677589098476, "loss": 0.0152, "step": 257710 }, { "epoch": 0.67, "learning_rate": 0.0001997928876746133, "loss": 0.0143, "step": 257720 }, { "epoch": 0.67, "learning_rate": 0.00019978899945824184, "loss": 0.0137, "step": 257730 }, { "epoch": 0.67, "learning_rate": 0.00019978511124187038, "loss": 0.0129, "step": 257740 }, { "epoch": 0.67, "learning_rate": 0.0001997812230254989, "loss": 0.0184, "step": 257750 }, { "epoch": 0.67, "learning_rate": 0.00019977733480912744, "loss": 0.0108, "step": 257760 }, { "epoch": 0.67, "learning_rate": 0.00019977344659275598, "loss": 0.0173, "step": 257770 }, { "epoch": 0.67, "learning_rate": 0.00019976955837638452, "loss": 0.0127, "step": 257780 }, { "epoch": 0.67, "learning_rate": 0.00019976567016001304, "loss": 0.0145, "step": 257790 }, { "epoch": 0.67, "learning_rate": 0.00019976178194364158, "loss": 0.0158, "step": 257800 }, { "epoch": 0.67, "learning_rate": 0.0001997578937272701, "loss": 0.0159, "step": 257810 }, { "epoch": 0.67, "learning_rate": 0.00019975400551089866, "loss": 0.0158, "step": 257820 }, { "epoch": 0.67, "learning_rate": 0.0001997501172945272, "loss": 0.0186, "step": 257830 }, { "epoch": 0.67, "learning_rate": 0.00019974622907815572, "loss": 0.0135, "step": 257840 }, { "epoch": 0.67, "learning_rate": 0.00019974234086178423, "loss": 0.0118, "step": 257850 }, { "epoch": 0.67, "learning_rate": 0.0001997384526454128, "loss": 0.0134, "step": 257860 }, { "epoch": 0.67, "learning_rate": 0.00019973456442904134, "loss": 0.0141, "step": 257870 }, { "epoch": 0.67, "learning_rate": 0.00019973067621266986, "loss": 0.0123, "step": 257880 }, { "epoch": 0.67, "learning_rate": 0.0001997267879962984, "loss": 0.0139, "step": 257890 }, { "epoch": 0.67, "learning_rate": 0.00019972289977992694, "loss": 0.0207, "step": 257900 }, { "epoch": 0.67, "learning_rate": 0.00019971901156355548, "loss": 0.0141, "step": 257910 }, { "epoch": 0.67, "learning_rate": 0.000199715123347184, "loss": 0.019, "step": 257920 }, { "epoch": 0.67, "learning_rate": 0.00019971123513081254, "loss": 0.0106, "step": 257930 }, { "epoch": 0.67, "learning_rate": 0.00019970734691444108, "loss": 0.0147, "step": 257940 }, { "epoch": 0.67, "learning_rate": 0.00019970345869806962, "loss": 0.0135, "step": 257950 }, { "epoch": 0.67, "learning_rate": 0.00019969957048169814, "loss": 0.0168, "step": 257960 }, { "epoch": 0.67, "learning_rate": 0.00019969568226532668, "loss": 0.0145, "step": 257970 }, { "epoch": 0.67, "learning_rate": 0.00019969179404895525, "loss": 0.0151, "step": 257980 }, { "epoch": 0.67, "learning_rate": 0.00019968790583258376, "loss": 0.0156, "step": 257990 }, { "epoch": 0.67, "learning_rate": 0.00019968401761621228, "loss": 0.0182, "step": 258000 }, { "epoch": 0.67, "eval_cer": 0.8818202558256388, "eval_loss": 0.010769709013402462, "eval_runtime": 107.7755, "eval_samples_per_second": 18.557, "eval_steps_per_second": 4.639, "step": 258000 }, { "epoch": 0.67, "learning_rate": 0.00019968012939984082, "loss": 0.0188, "step": 258010 }, { "epoch": 0.67, "learning_rate": 0.00019967624118346939, "loss": 0.0165, "step": 258020 }, { "epoch": 0.67, "learning_rate": 0.0001996723529670979, "loss": 0.0138, "step": 258030 }, { "epoch": 0.67, "learning_rate": 0.00019966846475072644, "loss": 0.0175, "step": 258040 }, { "epoch": 0.67, "learning_rate": 0.00019966457653435496, "loss": 0.0143, "step": 258050 }, { "epoch": 0.67, "learning_rate": 0.0001996606883179835, "loss": 0.0129, "step": 258060 }, { "epoch": 0.67, "learning_rate": 0.00019965680010161204, "loss": 0.0146, "step": 258070 }, { "epoch": 0.67, "learning_rate": 0.00019965291188524058, "loss": 0.0186, "step": 258080 }, { "epoch": 0.67, "learning_rate": 0.0001996490236688691, "loss": 0.0141, "step": 258090 }, { "epoch": 0.67, "learning_rate": 0.00019964513545249764, "loss": 0.0153, "step": 258100 }, { "epoch": 0.67, "learning_rate": 0.00019964124723612618, "loss": 0.0152, "step": 258110 }, { "epoch": 0.67, "learning_rate": 0.00019963735901975472, "loss": 0.015, "step": 258120 }, { "epoch": 0.67, "learning_rate": 0.00019963347080338324, "loss": 0.0174, "step": 258130 }, { "epoch": 0.67, "learning_rate": 0.00019962958258701178, "loss": 0.0134, "step": 258140 }, { "epoch": 0.67, "learning_rate": 0.00019962569437064032, "loss": 0.0146, "step": 258150 }, { "epoch": 0.67, "learning_rate": 0.00019962180615426886, "loss": 0.0172, "step": 258160 }, { "epoch": 0.67, "learning_rate": 0.00019961791793789737, "loss": 0.0131, "step": 258170 }, { "epoch": 0.67, "learning_rate": 0.00019961402972152592, "loss": 0.0182, "step": 258180 }, { "epoch": 0.67, "learning_rate": 0.00019961014150515449, "loss": 0.0112, "step": 258190 }, { "epoch": 0.67, "learning_rate": 0.000199606253288783, "loss": 0.0161, "step": 258200 }, { "epoch": 0.67, "learning_rate": 0.00019960236507241154, "loss": 0.0146, "step": 258210 }, { "epoch": 0.67, "learning_rate": 0.00019959847685604006, "loss": 0.016, "step": 258220 }, { "epoch": 0.67, "learning_rate": 0.00019959458863966862, "loss": 0.0155, "step": 258230 }, { "epoch": 0.67, "learning_rate": 0.00019959070042329714, "loss": 0.0151, "step": 258240 }, { "epoch": 0.67, "learning_rate": 0.00019958681220692568, "loss": 0.0149, "step": 258250 }, { "epoch": 0.67, "learning_rate": 0.0001995829239905542, "loss": 0.0134, "step": 258260 }, { "epoch": 0.67, "learning_rate": 0.00019957903577418276, "loss": 0.0186, "step": 258270 }, { "epoch": 0.67, "learning_rate": 0.00019957514755781128, "loss": 0.0171, "step": 258280 }, { "epoch": 0.67, "learning_rate": 0.00019957125934143982, "loss": 0.0264, "step": 258290 }, { "epoch": 0.67, "learning_rate": 0.00019956737112506833, "loss": 0.0148, "step": 258300 }, { "epoch": 0.67, "learning_rate": 0.00019956348290869688, "loss": 0.0176, "step": 258310 }, { "epoch": 0.67, "learning_rate": 0.00019955959469232542, "loss": 0.0161, "step": 258320 }, { "epoch": 0.67, "learning_rate": 0.00019955570647595396, "loss": 0.0172, "step": 258330 }, { "epoch": 0.67, "learning_rate": 0.00019955181825958247, "loss": 0.0139, "step": 258340 }, { "epoch": 0.67, "learning_rate": 0.00019954793004321102, "loss": 0.0157, "step": 258350 }, { "epoch": 0.67, "learning_rate": 0.00019954404182683958, "loss": 0.0197, "step": 258360 }, { "epoch": 0.67, "learning_rate": 0.0001995401536104681, "loss": 0.014, "step": 258370 }, { "epoch": 0.67, "learning_rate": 0.00019953626539409664, "loss": 0.0144, "step": 258380 }, { "epoch": 0.67, "learning_rate": 0.00019953237717772516, "loss": 0.0172, "step": 258390 }, { "epoch": 0.67, "learning_rate": 0.00019952848896135372, "loss": 0.0199, "step": 258400 }, { "epoch": 0.67, "learning_rate": 0.00019952460074498224, "loss": 0.0164, "step": 258410 }, { "epoch": 0.67, "learning_rate": 0.00019952071252861078, "loss": 0.0161, "step": 258420 }, { "epoch": 0.67, "learning_rate": 0.0001995168243122393, "loss": 0.0137, "step": 258430 }, { "epoch": 0.67, "learning_rate": 0.00019951293609586786, "loss": 0.0152, "step": 258440 }, { "epoch": 0.67, "learning_rate": 0.00019950904787949638, "loss": 0.0146, "step": 258450 }, { "epoch": 0.67, "learning_rate": 0.00019950515966312492, "loss": 0.0142, "step": 258460 }, { "epoch": 0.67, "learning_rate": 0.00019950127144675343, "loss": 0.0177, "step": 258470 }, { "epoch": 0.67, "learning_rate": 0.000199497383230382, "loss": 0.0131, "step": 258480 }, { "epoch": 0.67, "learning_rate": 0.00019949349501401052, "loss": 0.0148, "step": 258490 }, { "epoch": 0.67, "learning_rate": 0.00019948960679763906, "loss": 0.0154, "step": 258500 }, { "epoch": 0.67, "learning_rate": 0.00019948571858126757, "loss": 0.0182, "step": 258510 }, { "epoch": 0.67, "learning_rate": 0.00019948183036489614, "loss": 0.0146, "step": 258520 }, { "epoch": 0.67, "learning_rate": 0.00019947794214852468, "loss": 0.0113, "step": 258530 }, { "epoch": 0.67, "learning_rate": 0.0001994740539321532, "loss": 0.0166, "step": 258540 }, { "epoch": 0.67, "learning_rate": 0.0001994701657157817, "loss": 0.0122, "step": 258550 }, { "epoch": 0.67, "learning_rate": 0.00019946627749941025, "loss": 0.0172, "step": 258560 }, { "epoch": 0.67, "learning_rate": 0.00019946238928303882, "loss": 0.0153, "step": 258570 }, { "epoch": 0.67, "learning_rate": 0.00019945850106666734, "loss": 0.0166, "step": 258580 }, { "epoch": 0.67, "learning_rate": 0.00019945461285029588, "loss": 0.0151, "step": 258590 }, { "epoch": 0.67, "learning_rate": 0.0001994507246339244, "loss": 0.0168, "step": 258600 }, { "epoch": 0.67, "learning_rate": 0.00019944683641755296, "loss": 0.0144, "step": 258610 }, { "epoch": 0.67, "learning_rate": 0.00019944294820118148, "loss": 0.0154, "step": 258620 }, { "epoch": 0.67, "learning_rate": 0.00019943905998481002, "loss": 0.0156, "step": 258630 }, { "epoch": 0.67, "learning_rate": 0.00019943517176843853, "loss": 0.0138, "step": 258640 }, { "epoch": 0.67, "learning_rate": 0.0001994312835520671, "loss": 0.0156, "step": 258650 }, { "epoch": 0.67, "learning_rate": 0.00019942739533569562, "loss": 0.0183, "step": 258660 }, { "epoch": 0.67, "learning_rate": 0.00019942350711932416, "loss": 0.0163, "step": 258670 }, { "epoch": 0.67, "learning_rate": 0.00019941961890295267, "loss": 0.0141, "step": 258680 }, { "epoch": 0.67, "learning_rate": 0.00019941573068658124, "loss": 0.0119, "step": 258690 }, { "epoch": 0.67, "learning_rate": 0.00019941184247020978, "loss": 0.0146, "step": 258700 }, { "epoch": 0.67, "learning_rate": 0.0001994079542538383, "loss": 0.0187, "step": 258710 }, { "epoch": 0.67, "learning_rate": 0.0001994040660374668, "loss": 0.0128, "step": 258720 }, { "epoch": 0.67, "learning_rate": 0.00019940017782109538, "loss": 0.0184, "step": 258730 }, { "epoch": 0.67, "learning_rate": 0.00019939628960472392, "loss": 0.0152, "step": 258740 }, { "epoch": 0.67, "learning_rate": 0.00019939240138835244, "loss": 0.0136, "step": 258750 }, { "epoch": 0.67, "learning_rate": 0.00019938851317198098, "loss": 0.0192, "step": 258760 }, { "epoch": 0.67, "learning_rate": 0.00019938462495560952, "loss": 0.0141, "step": 258770 }, { "epoch": 0.67, "learning_rate": 0.00019938073673923806, "loss": 0.0139, "step": 258780 }, { "epoch": 0.67, "learning_rate": 0.00019937684852286658, "loss": 0.0114, "step": 258790 }, { "epoch": 0.67, "learning_rate": 0.00019937296030649512, "loss": 0.013, "step": 258800 }, { "epoch": 0.67, "learning_rate": 0.00019936907209012363, "loss": 0.0129, "step": 258810 }, { "epoch": 0.67, "learning_rate": 0.0001993651838737522, "loss": 0.0136, "step": 258820 }, { "epoch": 0.67, "learning_rate": 0.00019936129565738072, "loss": 0.0187, "step": 258830 }, { "epoch": 0.67, "learning_rate": 0.00019935740744100926, "loss": 0.0154, "step": 258840 }, { "epoch": 0.67, "learning_rate": 0.00019935351922463777, "loss": 0.0189, "step": 258850 }, { "epoch": 0.67, "learning_rate": 0.00019934963100826634, "loss": 0.0146, "step": 258860 }, { "epoch": 0.67, "learning_rate": 0.00019934574279189486, "loss": 0.0171, "step": 258870 }, { "epoch": 0.67, "learning_rate": 0.0001993418545755234, "loss": 0.0182, "step": 258880 }, { "epoch": 0.67, "learning_rate": 0.0001993379663591519, "loss": 0.013, "step": 258890 }, { "epoch": 0.67, "learning_rate": 0.00019933407814278048, "loss": 0.016, "step": 258900 }, { "epoch": 0.67, "learning_rate": 0.00019933018992640902, "loss": 0.0154, "step": 258910 }, { "epoch": 0.67, "learning_rate": 0.00019932630171003754, "loss": 0.0177, "step": 258920 }, { "epoch": 0.67, "learning_rate": 0.00019932241349366608, "loss": 0.0152, "step": 258930 }, { "epoch": 0.67, "learning_rate": 0.00019931852527729462, "loss": 0.0145, "step": 258940 }, { "epoch": 0.67, "learning_rate": 0.00019931463706092316, "loss": 0.0131, "step": 258950 }, { "epoch": 0.67, "learning_rate": 0.00019931074884455168, "loss": 0.0147, "step": 258960 }, { "epoch": 0.67, "learning_rate": 0.00019930686062818022, "loss": 0.0173, "step": 258970 }, { "epoch": 0.67, "learning_rate": 0.00019930297241180876, "loss": 0.0226, "step": 258980 }, { "epoch": 0.67, "learning_rate": 0.0001992990841954373, "loss": 0.0124, "step": 258990 }, { "epoch": 0.67, "learning_rate": 0.00019929519597906582, "loss": 0.0149, "step": 259000 }, { "epoch": 0.67, "eval_cer": 0.8817740678068109, "eval_loss": 0.010703030042350292, "eval_runtime": 107.7387, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 259000 }, { "epoch": 0.67, "learning_rate": 0.00019929130776269436, "loss": 0.0154, "step": 259010 }, { "epoch": 0.67, "learning_rate": 0.00019928741954632293, "loss": 0.0142, "step": 259020 }, { "epoch": 0.67, "learning_rate": 0.00019928353132995144, "loss": 0.0151, "step": 259030 }, { "epoch": 0.67, "learning_rate": 0.00019927964311357996, "loss": 0.016, "step": 259040 }, { "epoch": 0.67, "learning_rate": 0.0001992757548972085, "loss": 0.0155, "step": 259050 }, { "epoch": 0.67, "learning_rate": 0.000199271866680837, "loss": 0.0151, "step": 259060 }, { "epoch": 0.67, "learning_rate": 0.00019926797846446558, "loss": 0.0196, "step": 259070 }, { "epoch": 0.67, "learning_rate": 0.00019926409024809412, "loss": 0.014, "step": 259080 }, { "epoch": 0.67, "learning_rate": 0.00019926020203172264, "loss": 0.0163, "step": 259090 }, { "epoch": 0.67, "learning_rate": 0.00019925631381535118, "loss": 0.0142, "step": 259100 }, { "epoch": 0.67, "learning_rate": 0.00019925242559897972, "loss": 0.0134, "step": 259110 }, { "epoch": 0.67, "learning_rate": 0.00019924853738260826, "loss": 0.0161, "step": 259120 }, { "epoch": 0.67, "learning_rate": 0.00019924464916623678, "loss": 0.0182, "step": 259130 }, { "epoch": 0.67, "learning_rate": 0.00019924076094986532, "loss": 0.0138, "step": 259140 }, { "epoch": 0.67, "learning_rate": 0.00019923687273349386, "loss": 0.0154, "step": 259150 }, { "epoch": 0.67, "learning_rate": 0.0001992329845171224, "loss": 0.0138, "step": 259160 }, { "epoch": 0.67, "learning_rate": 0.00019922909630075092, "loss": 0.0152, "step": 259170 }, { "epoch": 0.67, "learning_rate": 0.00019922520808437946, "loss": 0.0145, "step": 259180 }, { "epoch": 0.67, "learning_rate": 0.000199221319868008, "loss": 0.018, "step": 259190 }, { "epoch": 0.67, "learning_rate": 0.00019921743165163654, "loss": 0.0166, "step": 259200 }, { "epoch": 0.67, "learning_rate": 0.00019921354343526505, "loss": 0.0141, "step": 259210 }, { "epoch": 0.67, "learning_rate": 0.0001992096552188936, "loss": 0.0138, "step": 259220 }, { "epoch": 0.67, "learning_rate": 0.00019920576700252217, "loss": 0.0157, "step": 259230 }, { "epoch": 0.67, "learning_rate": 0.00019920187878615068, "loss": 0.0132, "step": 259240 }, { "epoch": 0.67, "learning_rate": 0.00019919799056977922, "loss": 0.0127, "step": 259250 }, { "epoch": 0.67, "learning_rate": 0.00019919410235340774, "loss": 0.0168, "step": 259260 }, { "epoch": 0.67, "learning_rate": 0.0001991902141370363, "loss": 0.0162, "step": 259270 }, { "epoch": 0.67, "learning_rate": 0.00019918632592066482, "loss": 0.016, "step": 259280 }, { "epoch": 0.67, "learning_rate": 0.00019918243770429336, "loss": 0.0158, "step": 259290 }, { "epoch": 0.67, "learning_rate": 0.00019917854948792188, "loss": 0.0197, "step": 259300 }, { "epoch": 0.67, "learning_rate": 0.00019917466127155042, "loss": 0.0195, "step": 259310 }, { "epoch": 0.67, "learning_rate": 0.00019917077305517896, "loss": 0.0238, "step": 259320 }, { "epoch": 0.67, "learning_rate": 0.0001991668848388075, "loss": 0.0174, "step": 259330 }, { "epoch": 0.67, "learning_rate": 0.00019916299662243601, "loss": 0.0105, "step": 259340 }, { "epoch": 0.67, "learning_rate": 0.00019915910840606456, "loss": 0.0166, "step": 259350 }, { "epoch": 0.67, "learning_rate": 0.0001991552201896931, "loss": 0.0154, "step": 259360 }, { "epoch": 0.67, "learning_rate": 0.00019915133197332164, "loss": 0.0151, "step": 259370 }, { "epoch": 0.67, "learning_rate": 0.00019914744375695015, "loss": 0.0183, "step": 259380 }, { "epoch": 0.67, "learning_rate": 0.0001991435555405787, "loss": 0.0191, "step": 259390 }, { "epoch": 0.67, "learning_rate": 0.00019913966732420726, "loss": 0.016, "step": 259400 }, { "epoch": 0.67, "learning_rate": 0.00019913577910783578, "loss": 0.0182, "step": 259410 }, { "epoch": 0.67, "learning_rate": 0.00019913189089146432, "loss": 0.0138, "step": 259420 }, { "epoch": 0.67, "learning_rate": 0.00019912800267509284, "loss": 0.0165, "step": 259430 }, { "epoch": 0.67, "learning_rate": 0.0001991241144587214, "loss": 0.0143, "step": 259440 }, { "epoch": 0.67, "learning_rate": 0.00019912022624234992, "loss": 0.0152, "step": 259450 }, { "epoch": 0.67, "learning_rate": 0.00019911633802597846, "loss": 0.0142, "step": 259460 }, { "epoch": 0.67, "learning_rate": 0.00019911244980960697, "loss": 0.0142, "step": 259470 }, { "epoch": 0.67, "learning_rate": 0.00019910856159323554, "loss": 0.0137, "step": 259480 }, { "epoch": 0.67, "learning_rate": 0.00019910467337686406, "loss": 0.019, "step": 259490 }, { "epoch": 0.67, "learning_rate": 0.0001991007851604926, "loss": 0.0136, "step": 259500 }, { "epoch": 0.67, "learning_rate": 0.00019909689694412111, "loss": 0.0145, "step": 259510 }, { "epoch": 0.67, "learning_rate": 0.00019909300872774966, "loss": 0.0163, "step": 259520 }, { "epoch": 0.67, "learning_rate": 0.0001990891205113782, "loss": 0.0152, "step": 259530 }, { "epoch": 0.67, "learning_rate": 0.00019908523229500674, "loss": 0.0113, "step": 259540 }, { "epoch": 0.67, "learning_rate": 0.00019908134407863525, "loss": 0.0173, "step": 259550 }, { "epoch": 0.67, "learning_rate": 0.0001990774558622638, "loss": 0.0157, "step": 259560 }, { "epoch": 0.67, "learning_rate": 0.00019907356764589236, "loss": 0.0152, "step": 259570 }, { "epoch": 0.67, "learning_rate": 0.00019906967942952088, "loss": 0.014, "step": 259580 }, { "epoch": 0.67, "learning_rate": 0.0001990657912131494, "loss": 0.0165, "step": 259590 }, { "epoch": 0.67, "learning_rate": 0.00019906190299677793, "loss": 0.0164, "step": 259600 }, { "epoch": 0.67, "learning_rate": 0.0001990580147804065, "loss": 0.0135, "step": 259610 }, { "epoch": 0.67, "learning_rate": 0.00019905412656403502, "loss": 0.0144, "step": 259620 }, { "epoch": 0.67, "learning_rate": 0.00019905023834766356, "loss": 0.0125, "step": 259630 }, { "epoch": 0.67, "learning_rate": 0.00019904635013129207, "loss": 0.0157, "step": 259640 }, { "epoch": 0.67, "learning_rate": 0.00019904246191492064, "loss": 0.0156, "step": 259650 }, { "epoch": 0.67, "learning_rate": 0.00019903857369854916, "loss": 0.016, "step": 259660 }, { "epoch": 0.67, "learning_rate": 0.0001990346854821777, "loss": 0.0135, "step": 259670 }, { "epoch": 0.67, "learning_rate": 0.00019903079726580621, "loss": 0.0135, "step": 259680 }, { "epoch": 0.67, "learning_rate": 0.00019902690904943478, "loss": 0.0151, "step": 259690 }, { "epoch": 0.67, "learning_rate": 0.0001990230208330633, "loss": 0.0143, "step": 259700 }, { "epoch": 0.67, "learning_rate": 0.00019901913261669184, "loss": 0.0122, "step": 259710 }, { "epoch": 0.67, "learning_rate": 0.00019901524440032035, "loss": 0.0161, "step": 259720 }, { "epoch": 0.67, "learning_rate": 0.00019901135618394892, "loss": 0.0196, "step": 259730 }, { "epoch": 0.67, "learning_rate": 0.00019900746796757744, "loss": 0.0131, "step": 259740 }, { "epoch": 0.67, "learning_rate": 0.00019900357975120598, "loss": 0.0155, "step": 259750 }, { "epoch": 0.67, "learning_rate": 0.0001989996915348345, "loss": 0.013, "step": 259760 }, { "epoch": 0.67, "learning_rate": 0.00019899580331846303, "loss": 0.0161, "step": 259770 }, { "epoch": 0.67, "learning_rate": 0.0001989919151020916, "loss": 0.0148, "step": 259780 }, { "epoch": 0.67, "learning_rate": 0.00019898802688572012, "loss": 0.0164, "step": 259790 }, { "epoch": 0.67, "learning_rate": 0.00019898413866934866, "loss": 0.0184, "step": 259800 }, { "epoch": 0.67, "learning_rate": 0.00019898025045297717, "loss": 0.0132, "step": 259810 }, { "epoch": 0.67, "learning_rate": 0.00019897636223660574, "loss": 0.02, "step": 259820 }, { "epoch": 0.67, "learning_rate": 0.00019897247402023426, "loss": 0.0138, "step": 259830 }, { "epoch": 0.67, "learning_rate": 0.0001989685858038628, "loss": 0.0132, "step": 259840 }, { "epoch": 0.67, "learning_rate": 0.0001989646975874913, "loss": 0.0152, "step": 259850 }, { "epoch": 0.67, "learning_rate": 0.00019896080937111988, "loss": 0.0132, "step": 259860 }, { "epoch": 0.67, "learning_rate": 0.0001989569211547484, "loss": 0.018, "step": 259870 }, { "epoch": 0.67, "learning_rate": 0.00019895303293837694, "loss": 0.0155, "step": 259880 }, { "epoch": 0.67, "learning_rate": 0.00019894914472200545, "loss": 0.0137, "step": 259890 }, { "epoch": 0.67, "learning_rate": 0.00019894525650563402, "loss": 0.018, "step": 259900 }, { "epoch": 0.67, "learning_rate": 0.00019894136828926254, "loss": 0.017, "step": 259910 }, { "epoch": 0.67, "learning_rate": 0.00019893748007289108, "loss": 0.0186, "step": 259920 }, { "epoch": 0.67, "learning_rate": 0.0001989335918565196, "loss": 0.014, "step": 259930 }, { "epoch": 0.67, "learning_rate": 0.00019892970364014816, "loss": 0.018, "step": 259940 }, { "epoch": 0.67, "learning_rate": 0.0001989258154237767, "loss": 0.0148, "step": 259950 }, { "epoch": 0.67, "learning_rate": 0.00019892192720740522, "loss": 0.016, "step": 259960 }, { "epoch": 0.67, "learning_rate": 0.00019891803899103376, "loss": 0.0147, "step": 259970 }, { "epoch": 0.67, "learning_rate": 0.0001989141507746623, "loss": 0.0142, "step": 259980 }, { "epoch": 0.67, "learning_rate": 0.00019891026255829084, "loss": 0.0168, "step": 259990 }, { "epoch": 0.67, "learning_rate": 0.00019890637434191936, "loss": 0.0179, "step": 260000 }, { "epoch": 0.67, "eval_cer": 0.881806259456297, "eval_loss": 0.010559357702732086, "eval_runtime": 107.5865, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.647, "step": 260000 }, { "epoch": 0.67, "learning_rate": 0.0001989024861255479, "loss": 0.0177, "step": 260010 }, { "epoch": 0.67, "learning_rate": 0.0001988985979091764, "loss": 0.0173, "step": 260020 }, { "epoch": 0.67, "learning_rate": 0.00019889470969280498, "loss": 0.0128, "step": 260030 }, { "epoch": 0.67, "learning_rate": 0.0001988908214764335, "loss": 0.0193, "step": 260040 }, { "epoch": 0.67, "learning_rate": 0.00019888693326006204, "loss": 0.0116, "step": 260050 }, { "epoch": 0.67, "learning_rate": 0.00019888304504369055, "loss": 0.0177, "step": 260060 }, { "epoch": 0.67, "learning_rate": 0.00019887915682731912, "loss": 0.0185, "step": 260070 }, { "epoch": 0.67, "learning_rate": 0.00019887526861094764, "loss": 0.0139, "step": 260080 }, { "epoch": 0.67, "learning_rate": 0.00019887138039457618, "loss": 0.0157, "step": 260090 }, { "epoch": 0.67, "learning_rate": 0.0001988674921782047, "loss": 0.0166, "step": 260100 }, { "epoch": 0.67, "learning_rate": 0.00019886360396183326, "loss": 0.0172, "step": 260110 }, { "epoch": 0.67, "learning_rate": 0.0001988597157454618, "loss": 0.0149, "step": 260120 }, { "epoch": 0.67, "learning_rate": 0.00019885582752909032, "loss": 0.0159, "step": 260130 }, { "epoch": 0.67, "learning_rate": 0.00019885193931271883, "loss": 0.0127, "step": 260140 }, { "epoch": 0.67, "learning_rate": 0.0001988480510963474, "loss": 0.0159, "step": 260150 }, { "epoch": 0.67, "learning_rate": 0.00019884416287997594, "loss": 0.0142, "step": 260160 }, { "epoch": 0.67, "learning_rate": 0.00019884027466360446, "loss": 0.015, "step": 260170 }, { "epoch": 0.67, "learning_rate": 0.000198836386447233, "loss": 0.0157, "step": 260180 }, { "epoch": 0.67, "learning_rate": 0.00019883249823086154, "loss": 0.017, "step": 260190 }, { "epoch": 0.67, "learning_rate": 0.00019882861001449008, "loss": 0.0125, "step": 260200 }, { "epoch": 0.67, "learning_rate": 0.0001988247217981186, "loss": 0.0161, "step": 260210 }, { "epoch": 0.67, "learning_rate": 0.00019882083358174714, "loss": 0.0142, "step": 260220 }, { "epoch": 0.67, "learning_rate": 0.00019881694536537568, "loss": 0.016, "step": 260230 }, { "epoch": 0.67, "learning_rate": 0.00019881305714900422, "loss": 0.0135, "step": 260240 }, { "epoch": 0.67, "learning_rate": 0.00019880916893263273, "loss": 0.0186, "step": 260250 }, { "epoch": 0.67, "learning_rate": 0.00019880528071626128, "loss": 0.0137, "step": 260260 }, { "epoch": 0.67, "learning_rate": 0.0001988013924998898, "loss": 0.0168, "step": 260270 }, { "epoch": 0.67, "learning_rate": 0.00019879750428351836, "loss": 0.0138, "step": 260280 }, { "epoch": 0.67, "learning_rate": 0.0001987936160671469, "loss": 0.0144, "step": 260290 }, { "epoch": 0.67, "learning_rate": 0.00019878972785077542, "loss": 0.013, "step": 260300 }, { "epoch": 0.67, "learning_rate": 0.00019878583963440393, "loss": 0.0121, "step": 260310 }, { "epoch": 0.67, "learning_rate": 0.0001987819514180325, "loss": 0.0163, "step": 260320 }, { "epoch": 0.67, "learning_rate": 0.00019877806320166104, "loss": 0.0151, "step": 260330 }, { "epoch": 0.67, "learning_rate": 0.00019877417498528956, "loss": 0.0145, "step": 260340 }, { "epoch": 0.67, "learning_rate": 0.0001987702867689181, "loss": 0.0132, "step": 260350 }, { "epoch": 0.67, "learning_rate": 0.00019876639855254664, "loss": 0.0138, "step": 260360 }, { "epoch": 0.67, "learning_rate": 0.00019876251033617518, "loss": 0.0136, "step": 260370 }, { "epoch": 0.67, "learning_rate": 0.0001987586221198037, "loss": 0.0117, "step": 260380 }, { "epoch": 0.67, "learning_rate": 0.00019875473390343224, "loss": 0.0121, "step": 260390 }, { "epoch": 0.67, "learning_rate": 0.00019875084568706078, "loss": 0.0183, "step": 260400 }, { "epoch": 0.68, "learning_rate": 0.00019874695747068932, "loss": 0.0173, "step": 260410 }, { "epoch": 0.68, "learning_rate": 0.00019874306925431783, "loss": 0.0169, "step": 260420 }, { "epoch": 0.68, "learning_rate": 0.00019873918103794638, "loss": 0.0153, "step": 260430 }, { "epoch": 0.68, "learning_rate": 0.00019873529282157494, "loss": 0.0171, "step": 260440 }, { "epoch": 0.68, "learning_rate": 0.00019873140460520346, "loss": 0.0166, "step": 260450 }, { "epoch": 0.68, "learning_rate": 0.00019872751638883197, "loss": 0.0183, "step": 260460 }, { "epoch": 0.68, "learning_rate": 0.00019872362817246052, "loss": 0.0172, "step": 260470 }, { "epoch": 0.68, "learning_rate": 0.00019871973995608908, "loss": 0.018, "step": 260480 }, { "epoch": 0.68, "learning_rate": 0.0001987158517397176, "loss": 0.0124, "step": 260490 }, { "epoch": 0.68, "learning_rate": 0.00019871196352334614, "loss": 0.0151, "step": 260500 }, { "epoch": 0.68, "learning_rate": 0.00019870807530697465, "loss": 0.0166, "step": 260510 }, { "epoch": 0.68, "learning_rate": 0.0001987041870906032, "loss": 0.0183, "step": 260520 }, { "epoch": 0.68, "learning_rate": 0.00019870029887423174, "loss": 0.0152, "step": 260530 }, { "epoch": 0.68, "learning_rate": 0.00019869641065786028, "loss": 0.013, "step": 260540 }, { "epoch": 0.68, "learning_rate": 0.0001986925224414888, "loss": 0.0186, "step": 260550 }, { "epoch": 0.68, "learning_rate": 0.00019868863422511734, "loss": 0.0175, "step": 260560 }, { "epoch": 0.68, "learning_rate": 0.00019868474600874588, "loss": 0.0136, "step": 260570 }, { "epoch": 0.68, "learning_rate": 0.00019868085779237442, "loss": 0.0145, "step": 260580 }, { "epoch": 0.68, "learning_rate": 0.00019867696957600293, "loss": 0.0157, "step": 260590 }, { "epoch": 0.68, "learning_rate": 0.00019867308135963148, "loss": 0.0178, "step": 260600 }, { "epoch": 0.68, "learning_rate": 0.00019866919314326004, "loss": 0.0181, "step": 260610 }, { "epoch": 0.68, "learning_rate": 0.00019866530492688856, "loss": 0.0139, "step": 260620 }, { "epoch": 0.68, "learning_rate": 0.00019866141671051707, "loss": 0.0132, "step": 260630 }, { "epoch": 0.68, "learning_rate": 0.00019865752849414561, "loss": 0.014, "step": 260640 }, { "epoch": 0.68, "learning_rate": 0.00019865364027777418, "loss": 0.0148, "step": 260650 }, { "epoch": 0.68, "learning_rate": 0.0001986497520614027, "loss": 0.0135, "step": 260660 }, { "epoch": 0.68, "learning_rate": 0.00019864586384503124, "loss": 0.0168, "step": 260670 }, { "epoch": 0.68, "learning_rate": 0.00019864197562865975, "loss": 0.0127, "step": 260680 }, { "epoch": 0.68, "learning_rate": 0.00019863808741228832, "loss": 0.0221, "step": 260690 }, { "epoch": 0.68, "learning_rate": 0.00019863419919591684, "loss": 0.0164, "step": 260700 }, { "epoch": 0.68, "learning_rate": 0.00019863031097954538, "loss": 0.0157, "step": 260710 }, { "epoch": 0.68, "learning_rate": 0.0001986264227631739, "loss": 0.0142, "step": 260720 }, { "epoch": 0.68, "learning_rate": 0.00019862253454680246, "loss": 0.0153, "step": 260730 }, { "epoch": 0.68, "learning_rate": 0.00019861864633043098, "loss": 0.0139, "step": 260740 }, { "epoch": 0.68, "learning_rate": 0.00019861475811405952, "loss": 0.0167, "step": 260750 }, { "epoch": 0.68, "learning_rate": 0.00019861086989768803, "loss": 0.0142, "step": 260760 }, { "epoch": 0.68, "learning_rate": 0.00019860698168131657, "loss": 0.0131, "step": 260770 }, { "epoch": 0.68, "learning_rate": 0.00019860309346494512, "loss": 0.0137, "step": 260780 }, { "epoch": 0.68, "learning_rate": 0.00019859920524857366, "loss": 0.0139, "step": 260790 }, { "epoch": 0.68, "learning_rate": 0.00019859531703220217, "loss": 0.0142, "step": 260800 }, { "epoch": 0.68, "learning_rate": 0.00019859142881583071, "loss": 0.0159, "step": 260810 }, { "epoch": 0.68, "learning_rate": 0.00019858754059945928, "loss": 0.0177, "step": 260820 }, { "epoch": 0.68, "learning_rate": 0.0001985836523830878, "loss": 0.0171, "step": 260830 }, { "epoch": 0.68, "learning_rate": 0.00019857976416671634, "loss": 0.0136, "step": 260840 }, { "epoch": 0.68, "learning_rate": 0.00019857587595034485, "loss": 0.0117, "step": 260850 }, { "epoch": 0.68, "learning_rate": 0.00019857198773397342, "loss": 0.0168, "step": 260860 }, { "epoch": 0.68, "learning_rate": 0.00019856809951760194, "loss": 0.017, "step": 260870 }, { "epoch": 0.68, "learning_rate": 0.00019856421130123048, "loss": 0.0135, "step": 260880 }, { "epoch": 0.68, "learning_rate": 0.000198560323084859, "loss": 0.0137, "step": 260890 }, { "epoch": 0.68, "learning_rate": 0.00019855643486848756, "loss": 0.0152, "step": 260900 }, { "epoch": 0.68, "learning_rate": 0.00019855254665211608, "loss": 0.0121, "step": 260910 }, { "epoch": 0.68, "learning_rate": 0.00019854865843574462, "loss": 0.0146, "step": 260920 }, { "epoch": 0.68, "learning_rate": 0.00019854477021937313, "loss": 0.0117, "step": 260930 }, { "epoch": 0.68, "learning_rate": 0.0001985408820030017, "loss": 0.0175, "step": 260940 }, { "epoch": 0.68, "learning_rate": 0.00019853699378663022, "loss": 0.0147, "step": 260950 }, { "epoch": 0.68, "learning_rate": 0.00019853310557025876, "loss": 0.018, "step": 260960 }, { "epoch": 0.68, "learning_rate": 0.00019852921735388727, "loss": 0.0143, "step": 260970 }, { "epoch": 0.68, "learning_rate": 0.00019852532913751584, "loss": 0.0128, "step": 260980 }, { "epoch": 0.68, "learning_rate": 0.00019852144092114438, "loss": 0.0135, "step": 260990 }, { "epoch": 0.68, "learning_rate": 0.0001985175527047729, "loss": 0.0119, "step": 261000 }, { "epoch": 0.68, "eval_cer": 0.8817236808771804, "eval_loss": 0.010634180158376694, "eval_runtime": 107.7642, "eval_samples_per_second": 18.559, "eval_steps_per_second": 4.64, "step": 261000 }, { "epoch": 0.68, "learning_rate": 0.00019851366448840144, "loss": 0.0155, "step": 261010 }, { "epoch": 0.68, "learning_rate": 0.00019850977627202995, "loss": 0.0115, "step": 261020 }, { "epoch": 0.68, "learning_rate": 0.00019850588805565852, "loss": 0.0165, "step": 261030 }, { "epoch": 0.68, "learning_rate": 0.00019850199983928704, "loss": 0.0171, "step": 261040 }, { "epoch": 0.68, "learning_rate": 0.00019849811162291558, "loss": 0.0189, "step": 261050 }, { "epoch": 0.68, "learning_rate": 0.0001984942234065441, "loss": 0.0181, "step": 261060 }, { "epoch": 0.68, "learning_rate": 0.00019849033519017266, "loss": 0.0197, "step": 261070 }, { "epoch": 0.68, "learning_rate": 0.00019848644697380118, "loss": 0.0146, "step": 261080 }, { "epoch": 0.68, "learning_rate": 0.00019848255875742972, "loss": 0.0128, "step": 261090 }, { "epoch": 0.68, "learning_rate": 0.00019847867054105823, "loss": 0.0161, "step": 261100 }, { "epoch": 0.68, "learning_rate": 0.0001984747823246868, "loss": 0.0173, "step": 261110 }, { "epoch": 0.68, "learning_rate": 0.00019847089410831531, "loss": 0.0153, "step": 261120 }, { "epoch": 0.68, "learning_rate": 0.00019846700589194386, "loss": 0.0111, "step": 261130 }, { "epoch": 0.68, "learning_rate": 0.00019846311767557237, "loss": 0.0183, "step": 261140 }, { "epoch": 0.68, "learning_rate": 0.00019845922945920094, "loss": 0.0137, "step": 261150 }, { "epoch": 0.68, "learning_rate": 0.00019845534124282948, "loss": 0.0196, "step": 261160 }, { "epoch": 0.68, "learning_rate": 0.000198451453026458, "loss": 0.0117, "step": 261170 }, { "epoch": 0.68, "learning_rate": 0.0001984475648100865, "loss": 0.0153, "step": 261180 }, { "epoch": 0.68, "learning_rate": 0.00019844367659371508, "loss": 0.0147, "step": 261190 }, { "epoch": 0.68, "learning_rate": 0.00019843978837734362, "loss": 0.0136, "step": 261200 }, { "epoch": 0.68, "learning_rate": 0.00019843590016097214, "loss": 0.0157, "step": 261210 }, { "epoch": 0.68, "learning_rate": 0.00019843201194460068, "loss": 0.0171, "step": 261220 }, { "epoch": 0.68, "learning_rate": 0.00019842812372822922, "loss": 0.0201, "step": 261230 }, { "epoch": 0.68, "learning_rate": 0.00019842423551185776, "loss": 0.0166, "step": 261240 }, { "epoch": 0.68, "learning_rate": 0.00019842034729548627, "loss": 0.0187, "step": 261250 }, { "epoch": 0.68, "learning_rate": 0.00019841645907911482, "loss": 0.0161, "step": 261260 }, { "epoch": 0.68, "learning_rate": 0.00019841257086274333, "loss": 0.0159, "step": 261270 }, { "epoch": 0.68, "learning_rate": 0.0001984086826463719, "loss": 0.0131, "step": 261280 }, { "epoch": 0.68, "learning_rate": 0.00019840479443000041, "loss": 0.0149, "step": 261290 }, { "epoch": 0.68, "learning_rate": 0.00019840090621362896, "loss": 0.0152, "step": 261300 }, { "epoch": 0.68, "learning_rate": 0.00019839701799725747, "loss": 0.0143, "step": 261310 }, { "epoch": 0.68, "learning_rate": 0.00019839312978088604, "loss": 0.0141, "step": 261320 }, { "epoch": 0.68, "learning_rate": 0.00019838924156451455, "loss": 0.0151, "step": 261330 }, { "epoch": 0.68, "learning_rate": 0.0001983853533481431, "loss": 0.0133, "step": 261340 }, { "epoch": 0.68, "learning_rate": 0.0001983814651317716, "loss": 0.0163, "step": 261350 }, { "epoch": 0.68, "learning_rate": 0.00019837757691540018, "loss": 0.0187, "step": 261360 }, { "epoch": 0.68, "learning_rate": 0.00019837368869902872, "loss": 0.016, "step": 261370 }, { "epoch": 0.68, "learning_rate": 0.00019836980048265723, "loss": 0.0143, "step": 261380 }, { "epoch": 0.68, "learning_rate": 0.00019836591226628578, "loss": 0.0135, "step": 261390 }, { "epoch": 0.68, "learning_rate": 0.00019836202404991432, "loss": 0.0137, "step": 261400 }, { "epoch": 0.68, "learning_rate": 0.00019835813583354286, "loss": 0.0271, "step": 261410 }, { "epoch": 0.68, "learning_rate": 0.00019835424761717137, "loss": 0.012, "step": 261420 }, { "epoch": 0.68, "learning_rate": 0.00019835035940079992, "loss": 0.0138, "step": 261430 }, { "epoch": 0.68, "learning_rate": 0.00019834647118442846, "loss": 0.0188, "step": 261440 }, { "epoch": 0.68, "learning_rate": 0.000198342582968057, "loss": 0.0144, "step": 261450 }, { "epoch": 0.68, "learning_rate": 0.00019833869475168551, "loss": 0.0163, "step": 261460 }, { "epoch": 0.68, "learning_rate": 0.00019833480653531406, "loss": 0.0151, "step": 261470 }, { "epoch": 0.68, "learning_rate": 0.00019833091831894262, "loss": 0.0123, "step": 261480 }, { "epoch": 0.68, "learning_rate": 0.00019832703010257114, "loss": 0.0144, "step": 261490 }, { "epoch": 0.68, "learning_rate": 0.00019832314188619965, "loss": 0.0183, "step": 261500 }, { "epoch": 0.68, "learning_rate": 0.0001983192536698282, "loss": 0.0197, "step": 261510 }, { "epoch": 0.68, "learning_rate": 0.0001983153654534567, "loss": 0.0135, "step": 261520 }, { "epoch": 0.68, "learning_rate": 0.00019831147723708528, "loss": 0.0159, "step": 261530 }, { "epoch": 0.68, "learning_rate": 0.00019830758902071382, "loss": 0.0137, "step": 261540 }, { "epoch": 0.68, "learning_rate": 0.00019830370080434233, "loss": 0.0143, "step": 261550 }, { "epoch": 0.68, "learning_rate": 0.00019829981258797088, "loss": 0.015, "step": 261560 }, { "epoch": 0.68, "learning_rate": 0.00019829592437159942, "loss": 0.019, "step": 261570 }, { "epoch": 0.68, "learning_rate": 0.00019829203615522796, "loss": 0.0168, "step": 261580 }, { "epoch": 0.68, "learning_rate": 0.00019828814793885647, "loss": 0.0189, "step": 261590 }, { "epoch": 0.68, "learning_rate": 0.00019828425972248502, "loss": 0.015, "step": 261600 }, { "epoch": 0.68, "learning_rate": 0.00019828037150611356, "loss": 0.0188, "step": 261610 }, { "epoch": 0.68, "learning_rate": 0.0001982764832897421, "loss": 0.0157, "step": 261620 }, { "epoch": 0.68, "learning_rate": 0.0001982725950733706, "loss": 0.0183, "step": 261630 }, { "epoch": 0.68, "learning_rate": 0.00019826870685699915, "loss": 0.0159, "step": 261640 }, { "epoch": 0.68, "learning_rate": 0.0001982648186406277, "loss": 0.0129, "step": 261650 }, { "epoch": 0.68, "learning_rate": 0.00019826093042425624, "loss": 0.018, "step": 261660 }, { "epoch": 0.68, "learning_rate": 0.00019825704220788475, "loss": 0.0158, "step": 261670 }, { "epoch": 0.68, "learning_rate": 0.0001982531539915133, "loss": 0.0183, "step": 261680 }, { "epoch": 0.68, "learning_rate": 0.00019824926577514186, "loss": 0.015, "step": 261690 }, { "epoch": 0.68, "learning_rate": 0.00019824537755877038, "loss": 0.0187, "step": 261700 }, { "epoch": 0.68, "learning_rate": 0.00019824148934239892, "loss": 0.0123, "step": 261710 }, { "epoch": 0.68, "learning_rate": 0.00019823760112602743, "loss": 0.0171, "step": 261720 }, { "epoch": 0.68, "learning_rate": 0.000198233712909656, "loss": 0.0137, "step": 261730 }, { "epoch": 0.68, "learning_rate": 0.00019822982469328452, "loss": 0.0116, "step": 261740 }, { "epoch": 0.68, "learning_rate": 0.00019822593647691306, "loss": 0.0149, "step": 261750 }, { "epoch": 0.68, "learning_rate": 0.00019822204826054157, "loss": 0.0119, "step": 261760 }, { "epoch": 0.68, "learning_rate": 0.00019821816004417011, "loss": 0.013, "step": 261770 }, { "epoch": 0.68, "learning_rate": 0.00019821427182779866, "loss": 0.0203, "step": 261780 }, { "epoch": 0.68, "learning_rate": 0.0001982103836114272, "loss": 0.0167, "step": 261790 }, { "epoch": 0.68, "learning_rate": 0.0001982064953950557, "loss": 0.0143, "step": 261800 }, { "epoch": 0.68, "learning_rate": 0.00019820260717868425, "loss": 0.0153, "step": 261810 }, { "epoch": 0.68, "learning_rate": 0.0001981987189623128, "loss": 0.0146, "step": 261820 }, { "epoch": 0.68, "learning_rate": 0.00019819483074594134, "loss": 0.0166, "step": 261830 }, { "epoch": 0.68, "learning_rate": 0.00019819094252956985, "loss": 0.0159, "step": 261840 }, { "epoch": 0.68, "learning_rate": 0.0001981870543131984, "loss": 0.0167, "step": 261850 }, { "epoch": 0.68, "learning_rate": 0.00019818316609682696, "loss": 0.0149, "step": 261860 }, { "epoch": 0.68, "learning_rate": 0.00019817927788045548, "loss": 0.0136, "step": 261870 }, { "epoch": 0.68, "learning_rate": 0.00019817538966408402, "loss": 0.015, "step": 261880 }, { "epoch": 0.68, "learning_rate": 0.00019817150144771253, "loss": 0.0141, "step": 261890 }, { "epoch": 0.68, "learning_rate": 0.0001981676132313411, "loss": 0.0116, "step": 261900 }, { "epoch": 0.68, "learning_rate": 0.00019816372501496962, "loss": 0.0143, "step": 261910 }, { "epoch": 0.68, "learning_rate": 0.00019815983679859816, "loss": 0.0188, "step": 261920 }, { "epoch": 0.68, "learning_rate": 0.00019815594858222667, "loss": 0.0167, "step": 261930 }, { "epoch": 0.68, "learning_rate": 0.00019815206036585524, "loss": 0.0198, "step": 261940 }, { "epoch": 0.68, "learning_rate": 0.00019814817214948376, "loss": 0.0126, "step": 261950 }, { "epoch": 0.68, "learning_rate": 0.0001981442839331123, "loss": 0.0159, "step": 261960 }, { "epoch": 0.68, "learning_rate": 0.0001981403957167408, "loss": 0.0173, "step": 261970 }, { "epoch": 0.68, "learning_rate": 0.00019813650750036938, "loss": 0.0144, "step": 261980 }, { "epoch": 0.68, "learning_rate": 0.0001981326192839979, "loss": 0.0188, "step": 261990 }, { "epoch": 0.68, "learning_rate": 0.00019812873106762644, "loss": 0.0156, "step": 262000 }, { "epoch": 0.68, "eval_cer": 0.8817460750681273, "eval_loss": 0.010492046363651752, "eval_runtime": 107.6887, "eval_samples_per_second": 18.572, "eval_steps_per_second": 4.643, "step": 262000 }, { "epoch": 0.68, "learning_rate": 0.00019812484285125495, "loss": 0.0173, "step": 262010 }, { "epoch": 0.68, "learning_rate": 0.0001981209546348835, "loss": 0.0152, "step": 262020 }, { "epoch": 0.68, "learning_rate": 0.00019811706641851206, "loss": 0.016, "step": 262030 }, { "epoch": 0.68, "learning_rate": 0.00019811317820214058, "loss": 0.0155, "step": 262040 }, { "epoch": 0.68, "learning_rate": 0.0001981092899857691, "loss": 0.0145, "step": 262050 }, { "epoch": 0.68, "learning_rate": 0.00019810540176939763, "loss": 0.0152, "step": 262060 }, { "epoch": 0.68, "learning_rate": 0.0001981015135530262, "loss": 0.0147, "step": 262070 }, { "epoch": 0.68, "learning_rate": 0.00019809762533665472, "loss": 0.0132, "step": 262080 }, { "epoch": 0.68, "learning_rate": 0.00019809373712028326, "loss": 0.0163, "step": 262090 }, { "epoch": 0.68, "learning_rate": 0.00019808984890391177, "loss": 0.0173, "step": 262100 }, { "epoch": 0.68, "learning_rate": 0.00019808596068754034, "loss": 0.0186, "step": 262110 }, { "epoch": 0.68, "learning_rate": 0.00019808207247116886, "loss": 0.0184, "step": 262120 }, { "epoch": 0.68, "learning_rate": 0.0001980781842547974, "loss": 0.0157, "step": 262130 }, { "epoch": 0.68, "learning_rate": 0.0001980742960384259, "loss": 0.0153, "step": 262140 }, { "epoch": 0.68, "learning_rate": 0.00019807040782205448, "loss": 0.0146, "step": 262150 }, { "epoch": 0.68, "learning_rate": 0.000198066519605683, "loss": 0.0162, "step": 262160 }, { "epoch": 0.68, "learning_rate": 0.00019806263138931154, "loss": 0.0156, "step": 262170 }, { "epoch": 0.68, "learning_rate": 0.00019805874317294005, "loss": 0.0133, "step": 262180 }, { "epoch": 0.68, "learning_rate": 0.00019805485495656862, "loss": 0.0137, "step": 262190 }, { "epoch": 0.68, "learning_rate": 0.00019805096674019716, "loss": 0.0128, "step": 262200 }, { "epoch": 0.68, "learning_rate": 0.00019804707852382568, "loss": 0.0128, "step": 262210 }, { "epoch": 0.68, "learning_rate": 0.0001980431903074542, "loss": 0.018, "step": 262220 }, { "epoch": 0.68, "learning_rate": 0.00019803930209108276, "loss": 0.0172, "step": 262230 }, { "epoch": 0.68, "learning_rate": 0.0001980354138747113, "loss": 0.0149, "step": 262240 }, { "epoch": 0.68, "learning_rate": 0.00019803152565833982, "loss": 0.0134, "step": 262250 }, { "epoch": 0.68, "learning_rate": 0.00019802763744196836, "loss": 0.0161, "step": 262260 }, { "epoch": 0.68, "learning_rate": 0.00019802374922559687, "loss": 0.0144, "step": 262270 }, { "epoch": 0.68, "learning_rate": 0.00019801986100922544, "loss": 0.0153, "step": 262280 }, { "epoch": 0.68, "learning_rate": 0.00019801597279285395, "loss": 0.0155, "step": 262290 }, { "epoch": 0.68, "learning_rate": 0.0001980120845764825, "loss": 0.0143, "step": 262300 }, { "epoch": 0.68, "learning_rate": 0.000198008196360111, "loss": 0.0146, "step": 262310 }, { "epoch": 0.68, "learning_rate": 0.00019800430814373958, "loss": 0.0192, "step": 262320 }, { "epoch": 0.68, "learning_rate": 0.0001980004199273681, "loss": 0.0144, "step": 262330 }, { "epoch": 0.68, "learning_rate": 0.00019799653171099664, "loss": 0.0127, "step": 262340 }, { "epoch": 0.68, "learning_rate": 0.00019799264349462515, "loss": 0.0164, "step": 262350 }, { "epoch": 0.68, "learning_rate": 0.00019798875527825372, "loss": 0.0146, "step": 262360 }, { "epoch": 0.68, "learning_rate": 0.00019798486706188223, "loss": 0.0146, "step": 262370 }, { "epoch": 0.68, "learning_rate": 0.00019798097884551078, "loss": 0.0108, "step": 262380 }, { "epoch": 0.68, "learning_rate": 0.0001979770906291393, "loss": 0.0159, "step": 262390 }, { "epoch": 0.68, "learning_rate": 0.00019797320241276786, "loss": 0.0134, "step": 262400 }, { "epoch": 0.68, "learning_rate": 0.0001979693141963964, "loss": 0.0145, "step": 262410 }, { "epoch": 0.68, "learning_rate": 0.00019796542598002491, "loss": 0.0153, "step": 262420 }, { "epoch": 0.68, "learning_rate": 0.00019796153776365346, "loss": 0.0156, "step": 262430 }, { "epoch": 0.68, "learning_rate": 0.000197957649547282, "loss": 0.0174, "step": 262440 }, { "epoch": 0.68, "learning_rate": 0.00019795376133091054, "loss": 0.0155, "step": 262450 }, { "epoch": 0.68, "learning_rate": 0.00019794987311453905, "loss": 0.0145, "step": 262460 }, { "epoch": 0.68, "learning_rate": 0.0001979459848981676, "loss": 0.0172, "step": 262470 }, { "epoch": 0.68, "learning_rate": 0.00019794209668179614, "loss": 0.0181, "step": 262480 }, { "epoch": 0.68, "learning_rate": 0.00019793820846542468, "loss": 0.0144, "step": 262490 }, { "epoch": 0.68, "learning_rate": 0.0001979343202490532, "loss": 0.0166, "step": 262500 }, { "epoch": 0.68, "learning_rate": 0.00019793043203268174, "loss": 0.0153, "step": 262510 }, { "epoch": 0.68, "learning_rate": 0.00019792654381631025, "loss": 0.0132, "step": 262520 }, { "epoch": 0.68, "learning_rate": 0.00019792265559993882, "loss": 0.0119, "step": 262530 }, { "epoch": 0.68, "learning_rate": 0.00019791876738356733, "loss": 0.018, "step": 262540 }, { "epoch": 0.68, "learning_rate": 0.00019791487916719587, "loss": 0.0106, "step": 262550 }, { "epoch": 0.68, "learning_rate": 0.0001979109909508244, "loss": 0.013, "step": 262560 }, { "epoch": 0.68, "learning_rate": 0.00019790710273445296, "loss": 0.0153, "step": 262570 }, { "epoch": 0.68, "learning_rate": 0.0001979032145180815, "loss": 0.0171, "step": 262580 }, { "epoch": 0.68, "learning_rate": 0.00019789932630171001, "loss": 0.0197, "step": 262590 }, { "epoch": 0.68, "learning_rate": 0.00019789543808533856, "loss": 0.0112, "step": 262600 }, { "epoch": 0.68, "learning_rate": 0.0001978915498689671, "loss": 0.0158, "step": 262610 }, { "epoch": 0.68, "learning_rate": 0.00019788766165259564, "loss": 0.0159, "step": 262620 }, { "epoch": 0.68, "learning_rate": 0.00019788377343622415, "loss": 0.015, "step": 262630 }, { "epoch": 0.68, "learning_rate": 0.0001978798852198527, "loss": 0.0154, "step": 262640 }, { "epoch": 0.68, "learning_rate": 0.00019787599700348124, "loss": 0.0154, "step": 262650 }, { "epoch": 0.68, "learning_rate": 0.00019787210878710978, "loss": 0.0174, "step": 262660 }, { "epoch": 0.68, "learning_rate": 0.0001978682205707383, "loss": 0.0165, "step": 262670 }, { "epoch": 0.68, "learning_rate": 0.00019786433235436683, "loss": 0.0127, "step": 262680 }, { "epoch": 0.68, "learning_rate": 0.00019786044413799538, "loss": 0.0143, "step": 262690 }, { "epoch": 0.68, "learning_rate": 0.00019785655592162392, "loss": 0.0133, "step": 262700 }, { "epoch": 0.68, "learning_rate": 0.00019785266770525243, "loss": 0.0138, "step": 262710 }, { "epoch": 0.68, "learning_rate": 0.00019784877948888097, "loss": 0.0165, "step": 262720 }, { "epoch": 0.68, "learning_rate": 0.00019784489127250954, "loss": 0.0181, "step": 262730 }, { "epoch": 0.68, "learning_rate": 0.00019784100305613806, "loss": 0.0156, "step": 262740 }, { "epoch": 0.68, "learning_rate": 0.0001978371148397666, "loss": 0.0128, "step": 262750 }, { "epoch": 0.68, "learning_rate": 0.00019783322662339511, "loss": 0.0171, "step": 262760 }, { "epoch": 0.68, "learning_rate": 0.00019782933840702363, "loss": 0.0158, "step": 262770 }, { "epoch": 0.68, "learning_rate": 0.0001978254501906522, "loss": 0.0179, "step": 262780 }, { "epoch": 0.68, "learning_rate": 0.00019782156197428074, "loss": 0.0154, "step": 262790 }, { "epoch": 0.68, "learning_rate": 0.00019781767375790925, "loss": 0.0136, "step": 262800 }, { "epoch": 0.68, "learning_rate": 0.0001978137855415378, "loss": 0.019, "step": 262810 }, { "epoch": 0.68, "learning_rate": 0.00019780989732516634, "loss": 0.0216, "step": 262820 }, { "epoch": 0.68, "learning_rate": 0.00019780600910879488, "loss": 0.0133, "step": 262830 }, { "epoch": 0.68, "learning_rate": 0.0001978021208924234, "loss": 0.0178, "step": 262840 }, { "epoch": 0.68, "learning_rate": 0.00019779823267605193, "loss": 0.0139, "step": 262850 }, { "epoch": 0.68, "learning_rate": 0.00019779434445968048, "loss": 0.0163, "step": 262860 }, { "epoch": 0.68, "learning_rate": 0.00019779045624330902, "loss": 0.0137, "step": 262870 }, { "epoch": 0.68, "learning_rate": 0.00019778656802693753, "loss": 0.015, "step": 262880 }, { "epoch": 0.68, "learning_rate": 0.00019778267981056607, "loss": 0.0169, "step": 262890 }, { "epoch": 0.68, "learning_rate": 0.00019777879159419464, "loss": 0.0215, "step": 262900 }, { "epoch": 0.68, "learning_rate": 0.00019777490337782316, "loss": 0.0157, "step": 262910 }, { "epoch": 0.68, "learning_rate": 0.00019777101516145167, "loss": 0.0177, "step": 262920 }, { "epoch": 0.68, "learning_rate": 0.0001977671269450802, "loss": 0.0105, "step": 262930 }, { "epoch": 0.68, "learning_rate": 0.00019776323872870878, "loss": 0.0122, "step": 262940 }, { "epoch": 0.68, "learning_rate": 0.0001977593505123373, "loss": 0.0144, "step": 262950 }, { "epoch": 0.68, "learning_rate": 0.00019775546229596584, "loss": 0.015, "step": 262960 }, { "epoch": 0.68, "learning_rate": 0.00019775157407959435, "loss": 0.0197, "step": 262970 }, { "epoch": 0.68, "learning_rate": 0.00019774768586322292, "loss": 0.0135, "step": 262980 }, { "epoch": 0.68, "learning_rate": 0.00019774379764685144, "loss": 0.0167, "step": 262990 }, { "epoch": 0.68, "learning_rate": 0.00019773990943047998, "loss": 0.0161, "step": 263000 }, { "epoch": 0.68, "eval_cer": 0.8817684692590742, "eval_loss": 0.010503942146897316, "eval_runtime": 107.871, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 263000 }, { "epoch": 0.68, "learning_rate": 0.0001977360212141085, "loss": 0.0146, "step": 263010 }, { "epoch": 0.68, "learning_rate": 0.00019773213299773703, "loss": 0.0173, "step": 263020 }, { "epoch": 0.68, "learning_rate": 0.00019772824478136558, "loss": 0.0168, "step": 263030 }, { "epoch": 0.68, "learning_rate": 0.00019772435656499412, "loss": 0.0169, "step": 263040 }, { "epoch": 0.68, "learning_rate": 0.00019772046834862263, "loss": 0.0164, "step": 263050 }, { "epoch": 0.68, "learning_rate": 0.00019771658013225117, "loss": 0.0177, "step": 263060 }, { "epoch": 0.68, "learning_rate": 0.00019771269191587974, "loss": 0.0146, "step": 263070 }, { "epoch": 0.68, "learning_rate": 0.00019770880369950826, "loss": 0.0218, "step": 263080 }, { "epoch": 0.68, "learning_rate": 0.00019770491548313677, "loss": 0.0142, "step": 263090 }, { "epoch": 0.68, "learning_rate": 0.0001977010272667653, "loss": 0.015, "step": 263100 }, { "epoch": 0.68, "learning_rate": 0.00019769713905039388, "loss": 0.0125, "step": 263110 }, { "epoch": 0.68, "learning_rate": 0.0001976932508340224, "loss": 0.02, "step": 263120 }, { "epoch": 0.68, "learning_rate": 0.00019768936261765094, "loss": 0.0167, "step": 263130 }, { "epoch": 0.68, "learning_rate": 0.00019768547440127945, "loss": 0.0172, "step": 263140 }, { "epoch": 0.68, "learning_rate": 0.00019768158618490802, "loss": 0.0145, "step": 263150 }, { "epoch": 0.68, "learning_rate": 0.00019767769796853654, "loss": 0.0158, "step": 263160 }, { "epoch": 0.68, "learning_rate": 0.00019767380975216508, "loss": 0.0152, "step": 263170 }, { "epoch": 0.68, "learning_rate": 0.0001976699215357936, "loss": 0.019, "step": 263180 }, { "epoch": 0.68, "learning_rate": 0.00019766603331942216, "loss": 0.0214, "step": 263190 }, { "epoch": 0.68, "learning_rate": 0.00019766214510305067, "loss": 0.0148, "step": 263200 }, { "epoch": 0.68, "learning_rate": 0.00019765825688667922, "loss": 0.0145, "step": 263210 }, { "epoch": 0.68, "learning_rate": 0.00019765436867030773, "loss": 0.0127, "step": 263220 }, { "epoch": 0.68, "learning_rate": 0.0001976504804539363, "loss": 0.016, "step": 263230 }, { "epoch": 0.68, "learning_rate": 0.00019764659223756481, "loss": 0.0179, "step": 263240 }, { "epoch": 0.68, "learning_rate": 0.00019764270402119336, "loss": 0.0144, "step": 263250 }, { "epoch": 0.68, "learning_rate": 0.00019763881580482187, "loss": 0.015, "step": 263260 }, { "epoch": 0.68, "learning_rate": 0.0001976349275884504, "loss": 0.0177, "step": 263270 }, { "epoch": 0.68, "learning_rate": 0.00019763103937207898, "loss": 0.0141, "step": 263280 }, { "epoch": 0.68, "learning_rate": 0.0001976271511557075, "loss": 0.0155, "step": 263290 }, { "epoch": 0.68, "learning_rate": 0.00019762326293933604, "loss": 0.0142, "step": 263300 }, { "epoch": 0.68, "learning_rate": 0.00019761937472296455, "loss": 0.011, "step": 263310 }, { "epoch": 0.68, "learning_rate": 0.00019761548650659312, "loss": 0.0158, "step": 263320 }, { "epoch": 0.68, "learning_rate": 0.00019761159829022163, "loss": 0.0144, "step": 263330 }, { "epoch": 0.68, "learning_rate": 0.00019760771007385018, "loss": 0.0158, "step": 263340 }, { "epoch": 0.68, "learning_rate": 0.0001976038218574787, "loss": 0.0144, "step": 263350 }, { "epoch": 0.68, "learning_rate": 0.00019759993364110726, "loss": 0.0166, "step": 263360 }, { "epoch": 0.68, "learning_rate": 0.00019759604542473577, "loss": 0.0167, "step": 263370 }, { "epoch": 0.68, "learning_rate": 0.00019759215720836432, "loss": 0.0137, "step": 263380 }, { "epoch": 0.68, "learning_rate": 0.00019758826899199283, "loss": 0.0139, "step": 263390 }, { "epoch": 0.68, "learning_rate": 0.0001975843807756214, "loss": 0.0141, "step": 263400 }, { "epoch": 0.68, "learning_rate": 0.0001975804925592499, "loss": 0.0129, "step": 263410 }, { "epoch": 0.68, "learning_rate": 0.00019757660434287846, "loss": 0.0136, "step": 263420 }, { "epoch": 0.68, "learning_rate": 0.00019757271612650697, "loss": 0.0167, "step": 263430 }, { "epoch": 0.68, "learning_rate": 0.00019756882791013554, "loss": 0.0142, "step": 263440 }, { "epoch": 0.68, "learning_rate": 0.00019756493969376408, "loss": 0.0125, "step": 263450 }, { "epoch": 0.68, "learning_rate": 0.0001975610514773926, "loss": 0.0146, "step": 263460 }, { "epoch": 0.68, "learning_rate": 0.00019755716326102114, "loss": 0.0145, "step": 263470 }, { "epoch": 0.68, "learning_rate": 0.00019755327504464968, "loss": 0.0139, "step": 263480 }, { "epoch": 0.68, "learning_rate": 0.00019754938682827822, "loss": 0.0173, "step": 263490 }, { "epoch": 0.68, "learning_rate": 0.00019754549861190673, "loss": 0.017, "step": 263500 }, { "epoch": 0.68, "learning_rate": 0.00019754161039553528, "loss": 0.0156, "step": 263510 }, { "epoch": 0.68, "learning_rate": 0.0001975377221791638, "loss": 0.0133, "step": 263520 }, { "epoch": 0.68, "learning_rate": 0.00019753383396279236, "loss": 0.0178, "step": 263530 }, { "epoch": 0.68, "learning_rate": 0.00019752994574642087, "loss": 0.0146, "step": 263540 }, { "epoch": 0.68, "learning_rate": 0.00019752605753004942, "loss": 0.0133, "step": 263550 }, { "epoch": 0.68, "learning_rate": 0.00019752216931367793, "loss": 0.0155, "step": 263560 }, { "epoch": 0.68, "learning_rate": 0.0001975182810973065, "loss": 0.017, "step": 263570 }, { "epoch": 0.68, "learning_rate": 0.000197514392880935, "loss": 0.0139, "step": 263580 }, { "epoch": 0.68, "learning_rate": 0.00019751050466456355, "loss": 0.0133, "step": 263590 }, { "epoch": 0.68, "learning_rate": 0.00019750661644819207, "loss": 0.0121, "step": 263600 }, { "epoch": 0.68, "learning_rate": 0.00019750272823182064, "loss": 0.0141, "step": 263610 }, { "epoch": 0.68, "learning_rate": 0.00019749884001544918, "loss": 0.0144, "step": 263620 }, { "epoch": 0.68, "learning_rate": 0.0001974949517990777, "loss": 0.0173, "step": 263630 }, { "epoch": 0.68, "learning_rate": 0.0001974910635827062, "loss": 0.0143, "step": 263640 }, { "epoch": 0.68, "learning_rate": 0.00019748717536633478, "loss": 0.016, "step": 263650 }, { "epoch": 0.68, "learning_rate": 0.00019748328714996332, "loss": 0.0154, "step": 263660 }, { "epoch": 0.68, "learning_rate": 0.00019747939893359183, "loss": 0.0131, "step": 263670 }, { "epoch": 0.68, "learning_rate": 0.00019747551071722038, "loss": 0.0143, "step": 263680 }, { "epoch": 0.68, "learning_rate": 0.00019747162250084892, "loss": 0.0154, "step": 263690 }, { "epoch": 0.68, "learning_rate": 0.00019746773428447746, "loss": 0.0149, "step": 263700 }, { "epoch": 0.68, "learning_rate": 0.00019746384606810597, "loss": 0.0119, "step": 263710 }, { "epoch": 0.68, "learning_rate": 0.00019745995785173451, "loss": 0.0142, "step": 263720 }, { "epoch": 0.68, "learning_rate": 0.00019745606963536306, "loss": 0.0142, "step": 263730 }, { "epoch": 0.68, "learning_rate": 0.0001974521814189916, "loss": 0.0133, "step": 263740 }, { "epoch": 0.68, "learning_rate": 0.0001974482932026201, "loss": 0.016, "step": 263750 }, { "epoch": 0.68, "learning_rate": 0.00019744440498624865, "loss": 0.0167, "step": 263760 }, { "epoch": 0.68, "learning_rate": 0.00019744051676987717, "loss": 0.0175, "step": 263770 }, { "epoch": 0.68, "learning_rate": 0.00019743662855350574, "loss": 0.0147, "step": 263780 }, { "epoch": 0.68, "learning_rate": 0.00019743274033713428, "loss": 0.0144, "step": 263790 }, { "epoch": 0.68, "learning_rate": 0.0001974288521207628, "loss": 0.0133, "step": 263800 }, { "epoch": 0.68, "learning_rate": 0.0001974249639043913, "loss": 0.0149, "step": 263810 }, { "epoch": 0.68, "learning_rate": 0.00019742107568801988, "loss": 0.013, "step": 263820 }, { "epoch": 0.68, "learning_rate": 0.00019741718747164842, "loss": 0.0147, "step": 263830 }, { "epoch": 0.68, "learning_rate": 0.00019741329925527693, "loss": 0.0128, "step": 263840 }, { "epoch": 0.68, "learning_rate": 0.00019740941103890547, "loss": 0.0168, "step": 263850 }, { "epoch": 0.68, "learning_rate": 0.00019740552282253402, "loss": 0.0183, "step": 263860 }, { "epoch": 0.68, "learning_rate": 0.00019740163460616256, "loss": 0.0152, "step": 263870 }, { "epoch": 0.68, "learning_rate": 0.00019739774638979107, "loss": 0.0146, "step": 263880 }, { "epoch": 0.68, "learning_rate": 0.00019739385817341961, "loss": 0.0217, "step": 263890 }, { "epoch": 0.68, "learning_rate": 0.00019738996995704816, "loss": 0.0118, "step": 263900 }, { "epoch": 0.68, "learning_rate": 0.0001973860817406767, "loss": 0.0133, "step": 263910 }, { "epoch": 0.68, "learning_rate": 0.0001973821935243052, "loss": 0.0122, "step": 263920 }, { "epoch": 0.68, "learning_rate": 0.00019737830530793375, "loss": 0.0169, "step": 263930 }, { "epoch": 0.68, "learning_rate": 0.00019737441709156232, "loss": 0.0162, "step": 263940 }, { "epoch": 0.68, "learning_rate": 0.00019737052887519084, "loss": 0.0188, "step": 263950 }, { "epoch": 0.68, "learning_rate": 0.00019736664065881935, "loss": 0.0159, "step": 263960 }, { "epoch": 0.68, "learning_rate": 0.0001973627524424479, "loss": 0.0135, "step": 263970 }, { "epoch": 0.68, "learning_rate": 0.00019735886422607646, "loss": 0.0151, "step": 263980 }, { "epoch": 0.68, "learning_rate": 0.00019735497600970498, "loss": 0.0144, "step": 263990 }, { "epoch": 0.68, "learning_rate": 0.00019735108779333352, "loss": 0.0157, "step": 264000 }, { "epoch": 0.68, "eval_cer": 0.881821655462573, "eval_loss": 0.010292991995811462, "eval_runtime": 107.7325, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 264000 }, { "epoch": 0.68, "learning_rate": 0.00019734719957696203, "loss": 0.0155, "step": 264010 }, { "epoch": 0.68, "learning_rate": 0.00019734331136059057, "loss": 0.0099, "step": 264020 }, { "epoch": 0.68, "learning_rate": 0.00019733942314421912, "loss": 0.0145, "step": 264030 }, { "epoch": 0.68, "learning_rate": 0.00019733553492784766, "loss": 0.0139, "step": 264040 }, { "epoch": 0.68, "learning_rate": 0.00019733164671147617, "loss": 0.0116, "step": 264050 }, { "epoch": 0.68, "learning_rate": 0.0001973277584951047, "loss": 0.017, "step": 264060 }, { "epoch": 0.68, "learning_rate": 0.00019732387027873325, "loss": 0.0142, "step": 264070 }, { "epoch": 0.68, "learning_rate": 0.0001973199820623618, "loss": 0.0161, "step": 264080 }, { "epoch": 0.68, "learning_rate": 0.0001973160938459903, "loss": 0.0163, "step": 264090 }, { "epoch": 0.68, "learning_rate": 0.00019731220562961885, "loss": 0.0137, "step": 264100 }, { "epoch": 0.68, "learning_rate": 0.0001973083174132474, "loss": 0.0095, "step": 264110 }, { "epoch": 0.68, "learning_rate": 0.00019730442919687594, "loss": 0.0168, "step": 264120 }, { "epoch": 0.68, "learning_rate": 0.00019730054098050445, "loss": 0.0172, "step": 264130 }, { "epoch": 0.68, "learning_rate": 0.000197296652764133, "loss": 0.0119, "step": 264140 }, { "epoch": 0.68, "learning_rate": 0.00019729276454776156, "loss": 0.0152, "step": 264150 }, { "epoch": 0.68, "learning_rate": 0.00019728887633139008, "loss": 0.0192, "step": 264160 }, { "epoch": 0.68, "learning_rate": 0.00019728498811501862, "loss": 0.0152, "step": 264170 }, { "epoch": 0.68, "learning_rate": 0.00019728109989864713, "loss": 0.0145, "step": 264180 }, { "epoch": 0.68, "learning_rate": 0.0001972772116822757, "loss": 0.0174, "step": 264190 }, { "epoch": 0.68, "learning_rate": 0.00019727332346590421, "loss": 0.0149, "step": 264200 }, { "epoch": 0.68, "learning_rate": 0.00019726943524953276, "loss": 0.0172, "step": 264210 }, { "epoch": 0.68, "learning_rate": 0.00019726554703316127, "loss": 0.0145, "step": 264220 }, { "epoch": 0.68, "learning_rate": 0.00019726165881678984, "loss": 0.019, "step": 264230 }, { "epoch": 0.68, "learning_rate": 0.00019725777060041835, "loss": 0.0156, "step": 264240 }, { "epoch": 0.68, "learning_rate": 0.0001972538823840469, "loss": 0.0138, "step": 264250 }, { "epoch": 0.68, "learning_rate": 0.0001972499941676754, "loss": 0.0159, "step": 264260 }, { "epoch": 0.69, "learning_rate": 0.00019724610595130395, "loss": 0.0132, "step": 264270 }, { "epoch": 0.69, "learning_rate": 0.0001972422177349325, "loss": 0.0172, "step": 264280 }, { "epoch": 0.69, "learning_rate": 0.00019723832951856104, "loss": 0.017, "step": 264290 }, { "epoch": 0.69, "learning_rate": 0.00019723444130218955, "loss": 0.0172, "step": 264300 }, { "epoch": 0.69, "learning_rate": 0.0001972305530858181, "loss": 0.0146, "step": 264310 }, { "epoch": 0.69, "learning_rate": 0.00019722666486944666, "loss": 0.0183, "step": 264320 }, { "epoch": 0.69, "learning_rate": 0.00019722277665307517, "loss": 0.0142, "step": 264330 }, { "epoch": 0.69, "learning_rate": 0.00019721888843670372, "loss": 0.0154, "step": 264340 }, { "epoch": 0.69, "learning_rate": 0.00019721500022033223, "loss": 0.0136, "step": 264350 }, { "epoch": 0.69, "learning_rate": 0.0001972111120039608, "loss": 0.02, "step": 264360 }, { "epoch": 0.69, "learning_rate": 0.00019720722378758931, "loss": 0.0153, "step": 264370 }, { "epoch": 0.69, "learning_rate": 0.00019720333557121786, "loss": 0.0166, "step": 264380 }, { "epoch": 0.69, "learning_rate": 0.00019719944735484637, "loss": 0.0155, "step": 264390 }, { "epoch": 0.69, "learning_rate": 0.00019719555913847494, "loss": 0.0153, "step": 264400 }, { "epoch": 0.69, "learning_rate": 0.00019719167092210345, "loss": 0.0129, "step": 264410 }, { "epoch": 0.69, "learning_rate": 0.000197187782705732, "loss": 0.0157, "step": 264420 }, { "epoch": 0.69, "learning_rate": 0.0001971838944893605, "loss": 0.0121, "step": 264430 }, { "epoch": 0.69, "learning_rate": 0.00019718000627298908, "loss": 0.0205, "step": 264440 }, { "epoch": 0.69, "learning_rate": 0.0001971761180566176, "loss": 0.0189, "step": 264450 }, { "epoch": 0.69, "learning_rate": 0.00019717222984024613, "loss": 0.0114, "step": 264460 }, { "epoch": 0.69, "learning_rate": 0.00019716834162387465, "loss": 0.0146, "step": 264470 }, { "epoch": 0.69, "learning_rate": 0.00019716445340750322, "loss": 0.0124, "step": 264480 }, { "epoch": 0.69, "learning_rate": 0.00019716056519113176, "loss": 0.0168, "step": 264490 }, { "epoch": 0.69, "learning_rate": 0.00019715667697476027, "loss": 0.0164, "step": 264500 }, { "epoch": 0.69, "learning_rate": 0.0001971527887583888, "loss": 0.0164, "step": 264510 }, { "epoch": 0.69, "learning_rate": 0.00019714890054201733, "loss": 0.0152, "step": 264520 }, { "epoch": 0.69, "learning_rate": 0.0001971450123256459, "loss": 0.0121, "step": 264530 }, { "epoch": 0.69, "learning_rate": 0.00019714112410927441, "loss": 0.0159, "step": 264540 }, { "epoch": 0.69, "learning_rate": 0.00019713723589290296, "loss": 0.0132, "step": 264550 }, { "epoch": 0.69, "learning_rate": 0.00019713334767653147, "loss": 0.0154, "step": 264560 }, { "epoch": 0.69, "learning_rate": 0.00019712945946016004, "loss": 0.014, "step": 264570 }, { "epoch": 0.69, "learning_rate": 0.00019712557124378855, "loss": 0.0215, "step": 264580 }, { "epoch": 0.69, "learning_rate": 0.0001971216830274171, "loss": 0.0162, "step": 264590 }, { "epoch": 0.69, "learning_rate": 0.0001971177948110456, "loss": 0.0151, "step": 264600 }, { "epoch": 0.69, "learning_rate": 0.00019711390659467418, "loss": 0.0153, "step": 264610 }, { "epoch": 0.69, "learning_rate": 0.0001971100183783027, "loss": 0.0136, "step": 264620 }, { "epoch": 0.69, "learning_rate": 0.00019710613016193123, "loss": 0.0141, "step": 264630 }, { "epoch": 0.69, "learning_rate": 0.00019710224194555975, "loss": 0.019, "step": 264640 }, { "epoch": 0.69, "learning_rate": 0.00019709835372918832, "loss": 0.0143, "step": 264650 }, { "epoch": 0.69, "learning_rate": 0.00019709446551281686, "loss": 0.0121, "step": 264660 }, { "epoch": 0.69, "learning_rate": 0.00019709057729644537, "loss": 0.0141, "step": 264670 }, { "epoch": 0.69, "learning_rate": 0.0001970866890800739, "loss": 0.0291, "step": 264680 }, { "epoch": 0.69, "learning_rate": 0.00019708280086370246, "loss": 0.0203, "step": 264690 }, { "epoch": 0.69, "learning_rate": 0.000197078912647331, "loss": 0.0177, "step": 264700 }, { "epoch": 0.69, "learning_rate": 0.0001970750244309595, "loss": 0.0127, "step": 264710 }, { "epoch": 0.69, "learning_rate": 0.00019707113621458805, "loss": 0.0134, "step": 264720 }, { "epoch": 0.69, "learning_rate": 0.00019706724799821657, "loss": 0.0128, "step": 264730 }, { "epoch": 0.69, "learning_rate": 0.00019706335978184514, "loss": 0.0139, "step": 264740 }, { "epoch": 0.69, "learning_rate": 0.00019705947156547365, "loss": 0.0137, "step": 264750 }, { "epoch": 0.69, "learning_rate": 0.0001970555833491022, "loss": 0.0179, "step": 264760 }, { "epoch": 0.69, "learning_rate": 0.0001970516951327307, "loss": 0.013, "step": 264770 }, { "epoch": 0.69, "learning_rate": 0.00019704780691635928, "loss": 0.0128, "step": 264780 }, { "epoch": 0.69, "learning_rate": 0.0001970439186999878, "loss": 0.013, "step": 264790 }, { "epoch": 0.69, "learning_rate": 0.00019704003048361633, "loss": 0.0151, "step": 264800 }, { "epoch": 0.69, "learning_rate": 0.00019703614226724485, "loss": 0.0141, "step": 264810 }, { "epoch": 0.69, "learning_rate": 0.00019703225405087342, "loss": 0.0131, "step": 264820 }, { "epoch": 0.69, "learning_rate": 0.00019702836583450193, "loss": 0.0133, "step": 264830 }, { "epoch": 0.69, "learning_rate": 0.00019702447761813047, "loss": 0.0127, "step": 264840 }, { "epoch": 0.69, "learning_rate": 0.000197020589401759, "loss": 0.0144, "step": 264850 }, { "epoch": 0.69, "learning_rate": 0.00019701670118538756, "loss": 0.0139, "step": 264860 }, { "epoch": 0.69, "learning_rate": 0.0001970128129690161, "loss": 0.0115, "step": 264870 }, { "epoch": 0.69, "learning_rate": 0.0001970089247526446, "loss": 0.0123, "step": 264880 }, { "epoch": 0.69, "learning_rate": 0.00019700503653627315, "loss": 0.014, "step": 264890 }, { "epoch": 0.69, "learning_rate": 0.0001970011483199017, "loss": 0.0148, "step": 264900 }, { "epoch": 0.69, "learning_rate": 0.00019699726010353024, "loss": 0.0246, "step": 264910 }, { "epoch": 0.69, "learning_rate": 0.00019699337188715875, "loss": 0.0159, "step": 264920 }, { "epoch": 0.69, "learning_rate": 0.0001969894836707873, "loss": 0.012, "step": 264930 }, { "epoch": 0.69, "learning_rate": 0.00019698559545441584, "loss": 0.0156, "step": 264940 }, { "epoch": 0.69, "learning_rate": 0.00019698170723804438, "loss": 0.0166, "step": 264950 }, { "epoch": 0.69, "learning_rate": 0.0001969778190216729, "loss": 0.0148, "step": 264960 }, { "epoch": 0.69, "learning_rate": 0.00019697393080530143, "loss": 0.0157, "step": 264970 }, { "epoch": 0.69, "learning_rate": 0.00019697004258892995, "loss": 0.0221, "step": 264980 }, { "epoch": 0.69, "learning_rate": 0.00019696615437255852, "loss": 0.0145, "step": 264990 }, { "epoch": 0.69, "learning_rate": 0.00019696226615618703, "loss": 0.0125, "step": 265000 }, { "epoch": 0.69, "eval_cer": 0.8817404765203906, "eval_loss": 0.010400773026049137, "eval_runtime": 107.7966, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 265000 }, { "epoch": 0.69, "learning_rate": 0.00019695837793981557, "loss": 0.0113, "step": 265010 }, { "epoch": 0.69, "learning_rate": 0.0001969544897234441, "loss": 0.0104, "step": 265020 }, { "epoch": 0.69, "learning_rate": 0.00019695060150707266, "loss": 0.0158, "step": 265030 }, { "epoch": 0.69, "learning_rate": 0.0001969467132907012, "loss": 0.02, "step": 265040 }, { "epoch": 0.69, "learning_rate": 0.0001969428250743297, "loss": 0.0157, "step": 265050 }, { "epoch": 0.69, "learning_rate": 0.00019693893685795825, "loss": 0.0143, "step": 265060 }, { "epoch": 0.69, "learning_rate": 0.0001969350486415868, "loss": 0.0168, "step": 265070 }, { "epoch": 0.69, "learning_rate": 0.00019693116042521534, "loss": 0.0158, "step": 265080 }, { "epoch": 0.69, "learning_rate": 0.00019692727220884385, "loss": 0.0125, "step": 265090 }, { "epoch": 0.69, "learning_rate": 0.0001969233839924724, "loss": 0.014, "step": 265100 }, { "epoch": 0.69, "learning_rate": 0.00019691949577610093, "loss": 0.0132, "step": 265110 }, { "epoch": 0.69, "learning_rate": 0.00019691560755972948, "loss": 0.0194, "step": 265120 }, { "epoch": 0.69, "learning_rate": 0.000196911719343358, "loss": 0.0164, "step": 265130 }, { "epoch": 0.69, "learning_rate": 0.00019690783112698653, "loss": 0.0169, "step": 265140 }, { "epoch": 0.69, "learning_rate": 0.00019690394291061507, "loss": 0.0158, "step": 265150 }, { "epoch": 0.69, "learning_rate": 0.00019690005469424362, "loss": 0.0156, "step": 265160 }, { "epoch": 0.69, "learning_rate": 0.00019689616647787213, "loss": 0.017, "step": 265170 }, { "epoch": 0.69, "learning_rate": 0.00019689227826150067, "loss": 0.0149, "step": 265180 }, { "epoch": 0.69, "learning_rate": 0.00019688839004512924, "loss": 0.0146, "step": 265190 }, { "epoch": 0.69, "learning_rate": 0.00019688450182875776, "loss": 0.0196, "step": 265200 }, { "epoch": 0.69, "learning_rate": 0.0001968806136123863, "loss": 0.0167, "step": 265210 }, { "epoch": 0.69, "learning_rate": 0.0001968767253960148, "loss": 0.0119, "step": 265220 }, { "epoch": 0.69, "learning_rate": 0.00019687283717964333, "loss": 0.0114, "step": 265230 }, { "epoch": 0.69, "learning_rate": 0.0001968689489632719, "loss": 0.0146, "step": 265240 }, { "epoch": 0.69, "learning_rate": 0.00019686506074690044, "loss": 0.0137, "step": 265250 }, { "epoch": 0.69, "learning_rate": 0.00019686117253052895, "loss": 0.0141, "step": 265260 }, { "epoch": 0.69, "learning_rate": 0.0001968572843141575, "loss": 0.0245, "step": 265270 }, { "epoch": 0.69, "learning_rate": 0.00019685339609778603, "loss": 0.0123, "step": 265280 }, { "epoch": 0.69, "learning_rate": 0.00019684950788141458, "loss": 0.0271, "step": 265290 }, { "epoch": 0.69, "learning_rate": 0.0001968456196650431, "loss": 0.0165, "step": 265300 }, { "epoch": 0.69, "learning_rate": 0.00019684173144867163, "loss": 0.0155, "step": 265310 }, { "epoch": 0.69, "learning_rate": 0.00019683784323230017, "loss": 0.0156, "step": 265320 }, { "epoch": 0.69, "learning_rate": 0.00019683395501592872, "loss": 0.0123, "step": 265330 }, { "epoch": 0.69, "learning_rate": 0.00019683006679955723, "loss": 0.0177, "step": 265340 }, { "epoch": 0.69, "learning_rate": 0.00019682617858318577, "loss": 0.0137, "step": 265350 }, { "epoch": 0.69, "learning_rate": 0.00019682229036681434, "loss": 0.0179, "step": 265360 }, { "epoch": 0.69, "learning_rate": 0.00019681840215044285, "loss": 0.0154, "step": 265370 }, { "epoch": 0.69, "learning_rate": 0.00019681451393407137, "loss": 0.0177, "step": 265380 }, { "epoch": 0.69, "learning_rate": 0.0001968106257176999, "loss": 0.0152, "step": 265390 }, { "epoch": 0.69, "learning_rate": 0.00019680673750132848, "loss": 0.0174, "step": 265400 }, { "epoch": 0.69, "learning_rate": 0.000196802849284957, "loss": 0.0173, "step": 265410 }, { "epoch": 0.69, "learning_rate": 0.00019679896106858554, "loss": 0.0133, "step": 265420 }, { "epoch": 0.69, "learning_rate": 0.00019679507285221405, "loss": 0.0162, "step": 265430 }, { "epoch": 0.69, "learning_rate": 0.00019679118463584262, "loss": 0.0159, "step": 265440 }, { "epoch": 0.69, "learning_rate": 0.00019678729641947113, "loss": 0.0182, "step": 265450 }, { "epoch": 0.69, "learning_rate": 0.00019678340820309968, "loss": 0.0171, "step": 265460 }, { "epoch": 0.69, "learning_rate": 0.0001967795199867282, "loss": 0.016, "step": 265470 }, { "epoch": 0.69, "learning_rate": 0.00019677563177035673, "loss": 0.0166, "step": 265480 }, { "epoch": 0.69, "learning_rate": 0.00019677174355398527, "loss": 0.0172, "step": 265490 }, { "epoch": 0.69, "learning_rate": 0.00019676785533761381, "loss": 0.0137, "step": 265500 }, { "epoch": 0.69, "learning_rate": 0.00019676396712124233, "loss": 0.0148, "step": 265510 }, { "epoch": 0.69, "learning_rate": 0.00019676007890487087, "loss": 0.0166, "step": 265520 }, { "epoch": 0.69, "learning_rate": 0.00019675619068849944, "loss": 0.0132, "step": 265530 }, { "epoch": 0.69, "learning_rate": 0.00019675230247212795, "loss": 0.0178, "step": 265540 }, { "epoch": 0.69, "learning_rate": 0.00019674841425575647, "loss": 0.0148, "step": 265550 }, { "epoch": 0.69, "learning_rate": 0.000196744526039385, "loss": 0.0177, "step": 265560 }, { "epoch": 0.69, "learning_rate": 0.00019674063782301358, "loss": 0.0141, "step": 265570 }, { "epoch": 0.69, "learning_rate": 0.0001967367496066421, "loss": 0.0153, "step": 265580 }, { "epoch": 0.69, "learning_rate": 0.00019673286139027064, "loss": 0.0127, "step": 265590 }, { "epoch": 0.69, "learning_rate": 0.00019672897317389915, "loss": 0.0185, "step": 265600 }, { "epoch": 0.69, "learning_rate": 0.00019672508495752772, "loss": 0.0159, "step": 265610 }, { "epoch": 0.69, "learning_rate": 0.00019672119674115623, "loss": 0.0125, "step": 265620 }, { "epoch": 0.69, "learning_rate": 0.00019671730852478477, "loss": 0.0185, "step": 265630 }, { "epoch": 0.69, "learning_rate": 0.0001967134203084133, "loss": 0.0193, "step": 265640 }, { "epoch": 0.69, "learning_rate": 0.00019670953209204186, "loss": 0.0142, "step": 265650 }, { "epoch": 0.69, "learning_rate": 0.00019670564387567037, "loss": 0.0166, "step": 265660 }, { "epoch": 0.69, "learning_rate": 0.00019670175565929891, "loss": 0.0135, "step": 265670 }, { "epoch": 0.69, "learning_rate": 0.00019669786744292743, "loss": 0.0133, "step": 265680 }, { "epoch": 0.69, "learning_rate": 0.000196693979226556, "loss": 0.0151, "step": 265690 }, { "epoch": 0.69, "learning_rate": 0.0001966900910101845, "loss": 0.0181, "step": 265700 }, { "epoch": 0.69, "learning_rate": 0.00019668620279381305, "loss": 0.0152, "step": 265710 }, { "epoch": 0.69, "learning_rate": 0.00019668231457744157, "loss": 0.0111, "step": 265720 }, { "epoch": 0.69, "learning_rate": 0.0001966784263610701, "loss": 0.0171, "step": 265730 }, { "epoch": 0.69, "learning_rate": 0.00019667453814469868, "loss": 0.0138, "step": 265740 }, { "epoch": 0.69, "learning_rate": 0.0001966706499283272, "loss": 0.0154, "step": 265750 }, { "epoch": 0.69, "learning_rate": 0.00019666676171195573, "loss": 0.0193, "step": 265760 }, { "epoch": 0.69, "learning_rate": 0.00019666287349558425, "loss": 0.0154, "step": 265770 }, { "epoch": 0.69, "learning_rate": 0.00019665898527921282, "loss": 0.0141, "step": 265780 }, { "epoch": 0.69, "learning_rate": 0.00019665509706284133, "loss": 0.0126, "step": 265790 }, { "epoch": 0.69, "learning_rate": 0.00019665120884646987, "loss": 0.0191, "step": 265800 }, { "epoch": 0.69, "learning_rate": 0.0001966473206300984, "loss": 0.0186, "step": 265810 }, { "epoch": 0.69, "learning_rate": 0.00019664343241372696, "loss": 0.0148, "step": 265820 }, { "epoch": 0.69, "learning_rate": 0.00019663954419735547, "loss": 0.0143, "step": 265830 }, { "epoch": 0.69, "learning_rate": 0.000196635655980984, "loss": 0.0148, "step": 265840 }, { "epoch": 0.69, "learning_rate": 0.00019663176776461253, "loss": 0.0107, "step": 265850 }, { "epoch": 0.69, "learning_rate": 0.0001966278795482411, "loss": 0.0165, "step": 265860 }, { "epoch": 0.69, "learning_rate": 0.0001966239913318696, "loss": 0.0142, "step": 265870 }, { "epoch": 0.69, "learning_rate": 0.00019662010311549815, "loss": 0.0142, "step": 265880 }, { "epoch": 0.69, "learning_rate": 0.00019661621489912667, "loss": 0.0159, "step": 265890 }, { "epoch": 0.69, "learning_rate": 0.00019661232668275524, "loss": 0.0175, "step": 265900 }, { "epoch": 0.69, "learning_rate": 0.00019660843846638378, "loss": 0.0129, "step": 265910 }, { "epoch": 0.69, "learning_rate": 0.0001966045502500123, "loss": 0.0148, "step": 265920 }, { "epoch": 0.69, "learning_rate": 0.00019660066203364083, "loss": 0.0148, "step": 265930 }, { "epoch": 0.69, "learning_rate": 0.00019659677381726938, "loss": 0.0141, "step": 265940 }, { "epoch": 0.69, "learning_rate": 0.00019659288560089792, "loss": 0.0137, "step": 265950 }, { "epoch": 0.69, "learning_rate": 0.00019658899738452643, "loss": 0.015, "step": 265960 }, { "epoch": 0.69, "learning_rate": 0.00019658510916815497, "loss": 0.0153, "step": 265970 }, { "epoch": 0.69, "learning_rate": 0.0001965812209517835, "loss": 0.0157, "step": 265980 }, { "epoch": 0.69, "learning_rate": 0.00019657733273541206, "loss": 0.0174, "step": 265990 }, { "epoch": 0.69, "learning_rate": 0.00019657344451904057, "loss": 0.0141, "step": 266000 }, { "epoch": 0.69, "eval_cer": 0.8817782667176135, "eval_loss": 0.01088875625282526, "eval_runtime": 107.9649, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 266000 }, { "epoch": 0.69, "learning_rate": 0.0001965695563026691, "loss": 0.0158, "step": 266010 }, { "epoch": 0.69, "learning_rate": 0.00019656566808629763, "loss": 0.014, "step": 266020 }, { "epoch": 0.69, "learning_rate": 0.0001965617798699262, "loss": 0.0155, "step": 266030 }, { "epoch": 0.69, "learning_rate": 0.0001965578916535547, "loss": 0.0136, "step": 266040 }, { "epoch": 0.69, "learning_rate": 0.00019655400343718325, "loss": 0.0157, "step": 266050 }, { "epoch": 0.69, "learning_rate": 0.00019655011522081177, "loss": 0.0154, "step": 266060 }, { "epoch": 0.69, "learning_rate": 0.00019654622700444034, "loss": 0.0129, "step": 266070 }, { "epoch": 0.69, "learning_rate": 0.00019654233878806888, "loss": 0.014, "step": 266080 }, { "epoch": 0.69, "learning_rate": 0.0001965384505716974, "loss": 0.0129, "step": 266090 }, { "epoch": 0.69, "learning_rate": 0.0001965345623553259, "loss": 0.0136, "step": 266100 }, { "epoch": 0.69, "learning_rate": 0.00019653067413895448, "loss": 0.0108, "step": 266110 }, { "epoch": 0.69, "learning_rate": 0.00019652678592258302, "loss": 0.0115, "step": 266120 }, { "epoch": 0.69, "learning_rate": 0.00019652289770621153, "loss": 0.0127, "step": 266130 }, { "epoch": 0.69, "learning_rate": 0.00019651900948984007, "loss": 0.0144, "step": 266140 }, { "epoch": 0.69, "learning_rate": 0.00019651512127346861, "loss": 0.0156, "step": 266150 }, { "epoch": 0.69, "learning_rate": 0.00019651123305709716, "loss": 0.017, "step": 266160 }, { "epoch": 0.69, "learning_rate": 0.00019650734484072567, "loss": 0.0154, "step": 266170 }, { "epoch": 0.69, "learning_rate": 0.0001965034566243542, "loss": 0.0172, "step": 266180 }, { "epoch": 0.69, "learning_rate": 0.00019649956840798275, "loss": 0.0142, "step": 266190 }, { "epoch": 0.69, "learning_rate": 0.0001964956801916113, "loss": 0.0133, "step": 266200 }, { "epoch": 0.69, "learning_rate": 0.0001964917919752398, "loss": 0.0132, "step": 266210 }, { "epoch": 0.69, "learning_rate": 0.00019648790375886835, "loss": 0.0195, "step": 266220 }, { "epoch": 0.69, "learning_rate": 0.00019648401554249687, "loss": 0.0165, "step": 266230 }, { "epoch": 0.69, "learning_rate": 0.00019648012732612544, "loss": 0.0247, "step": 266240 }, { "epoch": 0.69, "learning_rate": 0.00019647623910975398, "loss": 0.014, "step": 266250 }, { "epoch": 0.69, "learning_rate": 0.0001964723508933825, "loss": 0.0155, "step": 266260 }, { "epoch": 0.69, "learning_rate": 0.000196468462677011, "loss": 0.0155, "step": 266270 }, { "epoch": 0.69, "learning_rate": 0.00019646457446063957, "loss": 0.0147, "step": 266280 }, { "epoch": 0.69, "learning_rate": 0.00019646068624426812, "loss": 0.0152, "step": 266290 }, { "epoch": 0.69, "learning_rate": 0.00019645679802789663, "loss": 0.0112, "step": 266300 }, { "epoch": 0.69, "learning_rate": 0.00019645290981152517, "loss": 0.0178, "step": 266310 }, { "epoch": 0.69, "learning_rate": 0.00019644902159515371, "loss": 0.014, "step": 266320 }, { "epoch": 0.69, "learning_rate": 0.00019644513337878226, "loss": 0.0167, "step": 266330 }, { "epoch": 0.69, "learning_rate": 0.00019644124516241077, "loss": 0.0214, "step": 266340 }, { "epoch": 0.69, "learning_rate": 0.0001964373569460393, "loss": 0.0147, "step": 266350 }, { "epoch": 0.69, "learning_rate": 0.00019643346872966785, "loss": 0.0159, "step": 266360 }, { "epoch": 0.69, "learning_rate": 0.0001964295805132964, "loss": 0.0151, "step": 266370 }, { "epoch": 0.69, "learning_rate": 0.0001964256922969249, "loss": 0.0151, "step": 266380 }, { "epoch": 0.69, "learning_rate": 0.00019642180408055345, "loss": 0.0148, "step": 266390 }, { "epoch": 0.69, "learning_rate": 0.00019641791586418202, "loss": 0.0155, "step": 266400 }, { "epoch": 0.69, "learning_rate": 0.00019641402764781053, "loss": 0.0143, "step": 266410 }, { "epoch": 0.69, "learning_rate": 0.00019641013943143905, "loss": 0.0137, "step": 266420 }, { "epoch": 0.69, "learning_rate": 0.0001964062512150676, "loss": 0.0145, "step": 266430 }, { "epoch": 0.69, "learning_rate": 0.00019640236299869616, "loss": 0.0125, "step": 266440 }, { "epoch": 0.69, "learning_rate": 0.00019639847478232467, "loss": 0.0168, "step": 266450 }, { "epoch": 0.69, "learning_rate": 0.00019639458656595322, "loss": 0.0154, "step": 266460 }, { "epoch": 0.69, "learning_rate": 0.00019639069834958173, "loss": 0.018, "step": 266470 }, { "epoch": 0.69, "learning_rate": 0.00019638681013321027, "loss": 0.0168, "step": 266480 }, { "epoch": 0.69, "learning_rate": 0.0001963829219168388, "loss": 0.0141, "step": 266490 }, { "epoch": 0.69, "learning_rate": 0.00019637903370046736, "loss": 0.0166, "step": 266500 }, { "epoch": 0.69, "learning_rate": 0.00019637514548409587, "loss": 0.0208, "step": 266510 }, { "epoch": 0.69, "learning_rate": 0.0001963712572677244, "loss": 0.0137, "step": 266520 }, { "epoch": 0.69, "learning_rate": 0.00019636736905135295, "loss": 0.0171, "step": 266530 }, { "epoch": 0.69, "learning_rate": 0.0001963634808349815, "loss": 0.0169, "step": 266540 }, { "epoch": 0.69, "learning_rate": 0.00019635959261861, "loss": 0.0158, "step": 266550 }, { "epoch": 0.69, "learning_rate": 0.00019635570440223855, "loss": 0.0107, "step": 266560 }, { "epoch": 0.69, "learning_rate": 0.0001963518161858671, "loss": 0.0154, "step": 266570 }, { "epoch": 0.69, "learning_rate": 0.00019634792796949563, "loss": 0.0149, "step": 266580 }, { "epoch": 0.69, "learning_rate": 0.00019634403975312415, "loss": 0.0142, "step": 266590 }, { "epoch": 0.69, "learning_rate": 0.0001963401515367527, "loss": 0.012, "step": 266600 }, { "epoch": 0.69, "learning_rate": 0.00019633626332038126, "loss": 0.0176, "step": 266610 }, { "epoch": 0.69, "learning_rate": 0.00019633237510400977, "loss": 0.0152, "step": 266620 }, { "epoch": 0.69, "learning_rate": 0.00019632848688763832, "loss": 0.0145, "step": 266630 }, { "epoch": 0.69, "learning_rate": 0.00019632459867126683, "loss": 0.0141, "step": 266640 }, { "epoch": 0.69, "learning_rate": 0.0001963207104548954, "loss": 0.0167, "step": 266650 }, { "epoch": 0.69, "learning_rate": 0.0001963168222385239, "loss": 0.0147, "step": 266660 }, { "epoch": 0.69, "learning_rate": 0.00019631293402215245, "loss": 0.0121, "step": 266670 }, { "epoch": 0.69, "learning_rate": 0.00019630904580578097, "loss": 0.0185, "step": 266680 }, { "epoch": 0.69, "learning_rate": 0.00019630515758940954, "loss": 0.0151, "step": 266690 }, { "epoch": 0.69, "learning_rate": 0.00019630126937303805, "loss": 0.0148, "step": 266700 }, { "epoch": 0.69, "learning_rate": 0.0001962973811566666, "loss": 0.0176, "step": 266710 }, { "epoch": 0.69, "learning_rate": 0.0001962934929402951, "loss": 0.0122, "step": 266720 }, { "epoch": 0.69, "learning_rate": 0.00019628960472392365, "loss": 0.0176, "step": 266730 }, { "epoch": 0.69, "learning_rate": 0.0001962857165075522, "loss": 0.0145, "step": 266740 }, { "epoch": 0.69, "learning_rate": 0.00019628182829118073, "loss": 0.014, "step": 266750 }, { "epoch": 0.69, "learning_rate": 0.00019627794007480925, "loss": 0.0138, "step": 266760 }, { "epoch": 0.69, "learning_rate": 0.0001962740518584378, "loss": 0.0188, "step": 266770 }, { "epoch": 0.69, "learning_rate": 0.00019627016364206636, "loss": 0.0142, "step": 266780 }, { "epoch": 0.69, "learning_rate": 0.00019626627542569487, "loss": 0.0177, "step": 266790 }, { "epoch": 0.69, "learning_rate": 0.00019626238720932341, "loss": 0.0149, "step": 266800 }, { "epoch": 0.69, "learning_rate": 0.00019625849899295193, "loss": 0.015, "step": 266810 }, { "epoch": 0.69, "learning_rate": 0.0001962546107765805, "loss": 0.0154, "step": 266820 }, { "epoch": 0.69, "learning_rate": 0.000196250722560209, "loss": 0.0156, "step": 266830 }, { "epoch": 0.69, "learning_rate": 0.00019624683434383755, "loss": 0.0141, "step": 266840 }, { "epoch": 0.69, "learning_rate": 0.00019624294612746607, "loss": 0.0134, "step": 266850 }, { "epoch": 0.69, "learning_rate": 0.00019623905791109464, "loss": 0.0164, "step": 266860 }, { "epoch": 0.69, "learning_rate": 0.00019623516969472315, "loss": 0.0145, "step": 266870 }, { "epoch": 0.69, "learning_rate": 0.0001962312814783517, "loss": 0.0155, "step": 266880 }, { "epoch": 0.69, "learning_rate": 0.0001962273932619802, "loss": 0.019, "step": 266890 }, { "epoch": 0.69, "learning_rate": 0.00019622350504560878, "loss": 0.0174, "step": 266900 }, { "epoch": 0.69, "learning_rate": 0.0001962196168292373, "loss": 0.0176, "step": 266910 }, { "epoch": 0.69, "learning_rate": 0.00019621572861286583, "loss": 0.0149, "step": 266920 }, { "epoch": 0.69, "learning_rate": 0.00019621184039649435, "loss": 0.0125, "step": 266930 }, { "epoch": 0.69, "learning_rate": 0.00019620795218012292, "loss": 0.0136, "step": 266940 }, { "epoch": 0.69, "learning_rate": 0.00019620406396375146, "loss": 0.0147, "step": 266950 }, { "epoch": 0.69, "learning_rate": 0.00019620017574737997, "loss": 0.0145, "step": 266960 }, { "epoch": 0.69, "learning_rate": 0.0001961962875310085, "loss": 0.0163, "step": 266970 }, { "epoch": 0.69, "learning_rate": 0.00019619239931463703, "loss": 0.0136, "step": 266980 }, { "epoch": 0.69, "learning_rate": 0.0001961885110982656, "loss": 0.0139, "step": 266990 }, { "epoch": 0.69, "learning_rate": 0.0001961846228818941, "loss": 0.0137, "step": 267000 }, { "epoch": 0.69, "eval_cer": 0.8817306790618513, "eval_loss": 0.01065248902887106, "eval_runtime": 107.8983, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 267000 }, { "epoch": 0.69, "learning_rate": 0.00019618073466552265, "loss": 0.0155, "step": 267010 }, { "epoch": 0.69, "learning_rate": 0.00019617684644915117, "loss": 0.0146, "step": 267020 }, { "epoch": 0.69, "learning_rate": 0.00019617295823277974, "loss": 0.0185, "step": 267030 }, { "epoch": 0.69, "learning_rate": 0.00019616907001640825, "loss": 0.0161, "step": 267040 }, { "epoch": 0.69, "learning_rate": 0.0001961651818000368, "loss": 0.0159, "step": 267050 }, { "epoch": 0.69, "learning_rate": 0.0001961612935836653, "loss": 0.0138, "step": 267060 }, { "epoch": 0.69, "learning_rate": 0.00019615740536729388, "loss": 0.0127, "step": 267070 }, { "epoch": 0.69, "learning_rate": 0.0001961535171509224, "loss": 0.0167, "step": 267080 }, { "epoch": 0.69, "learning_rate": 0.00019614962893455093, "loss": 0.0161, "step": 267090 }, { "epoch": 0.69, "learning_rate": 0.00019614574071817945, "loss": 0.0146, "step": 267100 }, { "epoch": 0.69, "learning_rate": 0.00019614185250180802, "loss": 0.0179, "step": 267110 }, { "epoch": 0.69, "learning_rate": 0.00019613796428543656, "loss": 0.0139, "step": 267120 }, { "epoch": 0.69, "learning_rate": 0.00019613407606906507, "loss": 0.016, "step": 267130 }, { "epoch": 0.69, "learning_rate": 0.00019613018785269359, "loss": 0.0155, "step": 267140 }, { "epoch": 0.69, "learning_rate": 0.00019612629963632215, "loss": 0.0156, "step": 267150 }, { "epoch": 0.69, "learning_rate": 0.0001961224114199507, "loss": 0.0182, "step": 267160 }, { "epoch": 0.69, "learning_rate": 0.0001961185232035792, "loss": 0.0144, "step": 267170 }, { "epoch": 0.69, "learning_rate": 0.00019611463498720775, "loss": 0.0148, "step": 267180 }, { "epoch": 0.69, "learning_rate": 0.0001961107467708363, "loss": 0.0198, "step": 267190 }, { "epoch": 0.69, "learning_rate": 0.00019610685855446484, "loss": 0.0117, "step": 267200 }, { "epoch": 0.69, "learning_rate": 0.00019610297033809335, "loss": 0.0158, "step": 267210 }, { "epoch": 0.69, "learning_rate": 0.0001960990821217219, "loss": 0.0231, "step": 267220 }, { "epoch": 0.69, "learning_rate": 0.0001960951939053504, "loss": 0.016, "step": 267230 }, { "epoch": 0.69, "learning_rate": 0.00019609130568897898, "loss": 0.0136, "step": 267240 }, { "epoch": 0.69, "learning_rate": 0.0001960874174726075, "loss": 0.0162, "step": 267250 }, { "epoch": 0.69, "learning_rate": 0.00019608352925623603, "loss": 0.0135, "step": 267260 }, { "epoch": 0.69, "learning_rate": 0.00019607964103986455, "loss": 0.0182, "step": 267270 }, { "epoch": 0.69, "learning_rate": 0.00019607575282349311, "loss": 0.0149, "step": 267280 }, { "epoch": 0.69, "learning_rate": 0.00019607186460712163, "loss": 0.0122, "step": 267290 }, { "epoch": 0.69, "learning_rate": 0.00019606797639075017, "loss": 0.0141, "step": 267300 }, { "epoch": 0.69, "learning_rate": 0.00019606408817437869, "loss": 0.0206, "step": 267310 }, { "epoch": 0.69, "learning_rate": 0.00019606019995800725, "loss": 0.0128, "step": 267320 }, { "epoch": 0.69, "learning_rate": 0.0001960563117416358, "loss": 0.0159, "step": 267330 }, { "epoch": 0.69, "learning_rate": 0.0001960524235252643, "loss": 0.0153, "step": 267340 }, { "epoch": 0.69, "learning_rate": 0.00019604853530889285, "loss": 0.0194, "step": 267350 }, { "epoch": 0.69, "learning_rate": 0.0001960446470925214, "loss": 0.0124, "step": 267360 }, { "epoch": 0.69, "learning_rate": 0.00019604075887614994, "loss": 0.0156, "step": 267370 }, { "epoch": 0.69, "learning_rate": 0.00019603687065977845, "loss": 0.0157, "step": 267380 }, { "epoch": 0.69, "learning_rate": 0.000196032982443407, "loss": 0.0135, "step": 267390 }, { "epoch": 0.69, "learning_rate": 0.00019602909422703553, "loss": 0.017, "step": 267400 }, { "epoch": 0.69, "learning_rate": 0.00019602520601066407, "loss": 0.0129, "step": 267410 }, { "epoch": 0.69, "learning_rate": 0.0001960213177942926, "loss": 0.0188, "step": 267420 }, { "epoch": 0.69, "learning_rate": 0.00019601742957792113, "loss": 0.0139, "step": 267430 }, { "epoch": 0.69, "learning_rate": 0.0001960135413615497, "loss": 0.0121, "step": 267440 }, { "epoch": 0.69, "learning_rate": 0.00019600965314517821, "loss": 0.0131, "step": 267450 }, { "epoch": 0.69, "learning_rate": 0.00019600576492880673, "loss": 0.0132, "step": 267460 }, { "epoch": 0.69, "learning_rate": 0.00019600187671243527, "loss": 0.0173, "step": 267470 }, { "epoch": 0.69, "learning_rate": 0.00019599798849606379, "loss": 0.0158, "step": 267480 }, { "epoch": 0.69, "learning_rate": 0.00019599410027969235, "loss": 0.0135, "step": 267490 }, { "epoch": 0.69, "learning_rate": 0.0001959902120633209, "loss": 0.0201, "step": 267500 }, { "epoch": 0.69, "learning_rate": 0.0001959863238469494, "loss": 0.0169, "step": 267510 }, { "epoch": 0.69, "learning_rate": 0.00019598243563057795, "loss": 0.0207, "step": 267520 }, { "epoch": 0.69, "learning_rate": 0.0001959785474142065, "loss": 0.0169, "step": 267530 }, { "epoch": 0.69, "learning_rate": 0.00019597465919783503, "loss": 0.0141, "step": 267540 }, { "epoch": 0.69, "learning_rate": 0.00019597077098146355, "loss": 0.0164, "step": 267550 }, { "epoch": 0.69, "learning_rate": 0.0001959668827650921, "loss": 0.0168, "step": 267560 }, { "epoch": 0.69, "learning_rate": 0.00019596299454872063, "loss": 0.0137, "step": 267570 }, { "epoch": 0.69, "learning_rate": 0.00019595910633234917, "loss": 0.0142, "step": 267580 }, { "epoch": 0.69, "learning_rate": 0.0001959552181159777, "loss": 0.0205, "step": 267590 }, { "epoch": 0.69, "learning_rate": 0.00019595132989960623, "loss": 0.016, "step": 267600 }, { "epoch": 0.69, "learning_rate": 0.00019594744168323477, "loss": 0.012, "step": 267610 }, { "epoch": 0.69, "learning_rate": 0.00019594355346686331, "loss": 0.016, "step": 267620 }, { "epoch": 0.69, "learning_rate": 0.00019593966525049183, "loss": 0.0154, "step": 267630 }, { "epoch": 0.69, "learning_rate": 0.00019593577703412037, "loss": 0.0155, "step": 267640 }, { "epoch": 0.69, "learning_rate": 0.00019593188881774894, "loss": 0.0165, "step": 267650 }, { "epoch": 0.69, "learning_rate": 0.00019592800060137745, "loss": 0.0128, "step": 267660 }, { "epoch": 0.69, "learning_rate": 0.000195924112385006, "loss": 0.0133, "step": 267670 }, { "epoch": 0.69, "learning_rate": 0.0001959202241686345, "loss": 0.0186, "step": 267680 }, { "epoch": 0.69, "learning_rate": 0.00019591633595226308, "loss": 0.0133, "step": 267690 }, { "epoch": 0.69, "learning_rate": 0.0001959124477358916, "loss": 0.0186, "step": 267700 }, { "epoch": 0.69, "learning_rate": 0.00019590855951952013, "loss": 0.0146, "step": 267710 }, { "epoch": 0.69, "learning_rate": 0.00019590467130314865, "loss": 0.0145, "step": 267720 }, { "epoch": 0.69, "learning_rate": 0.0001959007830867772, "loss": 0.0158, "step": 267730 }, { "epoch": 0.69, "learning_rate": 0.00019589689487040573, "loss": 0.0148, "step": 267740 }, { "epoch": 0.69, "learning_rate": 0.00019589300665403427, "loss": 0.0159, "step": 267750 }, { "epoch": 0.69, "learning_rate": 0.0001958891184376628, "loss": 0.0163, "step": 267760 }, { "epoch": 0.69, "learning_rate": 0.00019588523022129133, "loss": 0.0132, "step": 267770 }, { "epoch": 0.69, "learning_rate": 0.00019588134200491987, "loss": 0.0137, "step": 267780 }, { "epoch": 0.69, "learning_rate": 0.0001958774537885484, "loss": 0.0172, "step": 267790 }, { "epoch": 0.69, "learning_rate": 0.00019587356557217693, "loss": 0.017, "step": 267800 }, { "epoch": 0.69, "learning_rate": 0.00019586967735580547, "loss": 0.0164, "step": 267810 }, { "epoch": 0.69, "learning_rate": 0.00019586578913943404, "loss": 0.014, "step": 267820 }, { "epoch": 0.69, "learning_rate": 0.00019586190092306255, "loss": 0.0191, "step": 267830 }, { "epoch": 0.69, "learning_rate": 0.0001958580127066911, "loss": 0.0169, "step": 267840 }, { "epoch": 0.69, "learning_rate": 0.0001958541244903196, "loss": 0.0137, "step": 267850 }, { "epoch": 0.69, "learning_rate": 0.00019585023627394818, "loss": 0.0165, "step": 267860 }, { "epoch": 0.69, "learning_rate": 0.0001958463480575767, "loss": 0.0137, "step": 267870 }, { "epoch": 0.69, "learning_rate": 0.00019584245984120523, "loss": 0.0103, "step": 267880 }, { "epoch": 0.69, "learning_rate": 0.00019583857162483375, "loss": 0.0133, "step": 267890 }, { "epoch": 0.69, "learning_rate": 0.00019583468340846232, "loss": 0.0161, "step": 267900 }, { "epoch": 0.69, "learning_rate": 0.00019583079519209083, "loss": 0.013, "step": 267910 }, { "epoch": 0.69, "learning_rate": 0.00019582690697571937, "loss": 0.0162, "step": 267920 }, { "epoch": 0.69, "learning_rate": 0.0001958230187593479, "loss": 0.0165, "step": 267930 }, { "epoch": 0.69, "learning_rate": 0.00019581913054297646, "loss": 0.0154, "step": 267940 }, { "epoch": 0.69, "learning_rate": 0.00019581524232660497, "loss": 0.0176, "step": 267950 }, { "epoch": 0.69, "learning_rate": 0.0001958113541102335, "loss": 0.0162, "step": 267960 }, { "epoch": 0.69, "learning_rate": 0.00019580746589386203, "loss": 0.0128, "step": 267970 }, { "epoch": 0.69, "learning_rate": 0.00019580357767749057, "loss": 0.0146, "step": 267980 }, { "epoch": 0.69, "learning_rate": 0.00019579968946111914, "loss": 0.0131, "step": 267990 }, { "epoch": 0.69, "learning_rate": 0.00019579580124474765, "loss": 0.0151, "step": 268000 }, { "epoch": 0.69, "eval_cer": 0.8817418761573248, "eval_loss": 0.010366639122366905, "eval_runtime": 108.2065, "eval_samples_per_second": 18.483, "eval_steps_per_second": 4.621, "step": 268000 }, { "epoch": 0.69, "learning_rate": 0.00019579191302837617, "loss": 0.0174, "step": 268010 }, { "epoch": 0.69, "learning_rate": 0.0001957880248120047, "loss": 0.0181, "step": 268020 }, { "epoch": 0.69, "learning_rate": 0.00019578413659563328, "loss": 0.0145, "step": 268030 }, { "epoch": 0.69, "learning_rate": 0.0001957802483792618, "loss": 0.014, "step": 268040 }, { "epoch": 0.69, "learning_rate": 0.00019577636016289033, "loss": 0.0144, "step": 268050 }, { "epoch": 0.69, "learning_rate": 0.00019577247194651885, "loss": 0.0139, "step": 268060 }, { "epoch": 0.69, "learning_rate": 0.00019576858373014742, "loss": 0.0176, "step": 268070 }, { "epoch": 0.69, "learning_rate": 0.00019576469551377593, "loss": 0.0154, "step": 268080 }, { "epoch": 0.69, "learning_rate": 0.00019576080729740447, "loss": 0.0175, "step": 268090 }, { "epoch": 0.69, "learning_rate": 0.000195756919081033, "loss": 0.0138, "step": 268100 }, { "epoch": 0.69, "learning_rate": 0.00019575303086466156, "loss": 0.0133, "step": 268110 }, { "epoch": 0.7, "learning_rate": 0.00019574914264829007, "loss": 0.0175, "step": 268120 }, { "epoch": 0.7, "learning_rate": 0.0001957452544319186, "loss": 0.0146, "step": 268130 }, { "epoch": 0.7, "learning_rate": 0.00019574136621554713, "loss": 0.0132, "step": 268140 }, { "epoch": 0.7, "learning_rate": 0.0001957374779991757, "loss": 0.0173, "step": 268150 }, { "epoch": 0.7, "learning_rate": 0.0001957335897828042, "loss": 0.0151, "step": 268160 }, { "epoch": 0.7, "learning_rate": 0.00019572970156643275, "loss": 0.0132, "step": 268170 }, { "epoch": 0.7, "learning_rate": 0.00019572581335006127, "loss": 0.0154, "step": 268180 }, { "epoch": 0.7, "learning_rate": 0.00019572192513368983, "loss": 0.0134, "step": 268190 }, { "epoch": 0.7, "learning_rate": 0.00019571803691731838, "loss": 0.0151, "step": 268200 }, { "epoch": 0.7, "learning_rate": 0.0001957141487009469, "loss": 0.0155, "step": 268210 }, { "epoch": 0.7, "learning_rate": 0.00019571026048457543, "loss": 0.016, "step": 268220 }, { "epoch": 0.7, "learning_rate": 0.00019570637226820395, "loss": 0.0128, "step": 268230 }, { "epoch": 0.7, "learning_rate": 0.00019570248405183252, "loss": 0.0103, "step": 268240 }, { "epoch": 0.7, "learning_rate": 0.00019569859583546103, "loss": 0.0144, "step": 268250 }, { "epoch": 0.7, "learning_rate": 0.00019569470761908957, "loss": 0.0193, "step": 268260 }, { "epoch": 0.7, "learning_rate": 0.0001956908194027181, "loss": 0.0183, "step": 268270 }, { "epoch": 0.7, "learning_rate": 0.00019568693118634666, "loss": 0.0139, "step": 268280 }, { "epoch": 0.7, "learning_rate": 0.00019568304296997517, "loss": 0.0102, "step": 268290 }, { "epoch": 0.7, "learning_rate": 0.0001956791547536037, "loss": 0.0141, "step": 268300 }, { "epoch": 0.7, "learning_rate": 0.00019567526653723223, "loss": 0.0133, "step": 268310 }, { "epoch": 0.7, "learning_rate": 0.0001956713783208608, "loss": 0.0138, "step": 268320 }, { "epoch": 0.7, "learning_rate": 0.0001956674901044893, "loss": 0.0157, "step": 268330 }, { "epoch": 0.7, "learning_rate": 0.00019566360188811785, "loss": 0.0136, "step": 268340 }, { "epoch": 0.7, "learning_rate": 0.00019565971367174637, "loss": 0.0157, "step": 268350 }, { "epoch": 0.7, "learning_rate": 0.00019565582545537493, "loss": 0.0142, "step": 268360 }, { "epoch": 0.7, "learning_rate": 0.00019565193723900348, "loss": 0.0146, "step": 268370 }, { "epoch": 0.7, "learning_rate": 0.000195648049022632, "loss": 0.0161, "step": 268380 }, { "epoch": 0.7, "learning_rate": 0.00019564416080626053, "loss": 0.0153, "step": 268390 }, { "epoch": 0.7, "learning_rate": 0.00019564027258988907, "loss": 0.0152, "step": 268400 }, { "epoch": 0.7, "learning_rate": 0.00019563638437351762, "loss": 0.0155, "step": 268410 }, { "epoch": 0.7, "learning_rate": 0.00019563249615714613, "loss": 0.0123, "step": 268420 }, { "epoch": 0.7, "learning_rate": 0.00019562860794077467, "loss": 0.0167, "step": 268430 }, { "epoch": 0.7, "learning_rate": 0.0001956247197244032, "loss": 0.0167, "step": 268440 }, { "epoch": 0.7, "learning_rate": 0.00019562083150803175, "loss": 0.0144, "step": 268450 }, { "epoch": 0.7, "learning_rate": 0.00019561694329166027, "loss": 0.0118, "step": 268460 }, { "epoch": 0.7, "learning_rate": 0.0001956130550752888, "loss": 0.0112, "step": 268470 }, { "epoch": 0.7, "learning_rate": 0.00019560916685891733, "loss": 0.0139, "step": 268480 }, { "epoch": 0.7, "learning_rate": 0.0001956052786425459, "loss": 0.0155, "step": 268490 }, { "epoch": 0.7, "learning_rate": 0.0001956013904261744, "loss": 0.0129, "step": 268500 }, { "epoch": 0.7, "learning_rate": 0.00019559750220980295, "loss": 0.0145, "step": 268510 }, { "epoch": 0.7, "learning_rate": 0.00019559361399343146, "loss": 0.0151, "step": 268520 }, { "epoch": 0.7, "learning_rate": 0.00019558972577706003, "loss": 0.0156, "step": 268530 }, { "epoch": 0.7, "learning_rate": 0.00019558583756068858, "loss": 0.0142, "step": 268540 }, { "epoch": 0.7, "learning_rate": 0.0001955819493443171, "loss": 0.0176, "step": 268550 }, { "epoch": 0.7, "learning_rate": 0.0001955780611279456, "loss": 0.0199, "step": 268560 }, { "epoch": 0.7, "learning_rate": 0.00019557417291157417, "loss": 0.0171, "step": 268570 }, { "epoch": 0.7, "learning_rate": 0.00019557028469520271, "loss": 0.0151, "step": 268580 }, { "epoch": 0.7, "learning_rate": 0.00019556639647883123, "loss": 0.0167, "step": 268590 }, { "epoch": 0.7, "learning_rate": 0.00019556250826245977, "loss": 0.0154, "step": 268600 }, { "epoch": 0.7, "learning_rate": 0.0001955586200460883, "loss": 0.0139, "step": 268610 }, { "epoch": 0.7, "learning_rate": 0.00019555473182971685, "loss": 0.0149, "step": 268620 }, { "epoch": 0.7, "learning_rate": 0.00019555084361334537, "loss": 0.016, "step": 268630 }, { "epoch": 0.7, "learning_rate": 0.0001955469553969739, "loss": 0.015, "step": 268640 }, { "epoch": 0.7, "learning_rate": 0.00019554306718060245, "loss": 0.0168, "step": 268650 }, { "epoch": 0.7, "learning_rate": 0.000195539178964231, "loss": 0.015, "step": 268660 }, { "epoch": 0.7, "learning_rate": 0.0001955352907478595, "loss": 0.0174, "step": 268670 }, { "epoch": 0.7, "learning_rate": 0.00019553140253148805, "loss": 0.0138, "step": 268680 }, { "epoch": 0.7, "learning_rate": 0.00019552751431511662, "loss": 0.0107, "step": 268690 }, { "epoch": 0.7, "learning_rate": 0.00019552362609874513, "loss": 0.0176, "step": 268700 }, { "epoch": 0.7, "learning_rate": 0.00019551973788237367, "loss": 0.0129, "step": 268710 }, { "epoch": 0.7, "learning_rate": 0.0001955158496660022, "loss": 0.0197, "step": 268720 }, { "epoch": 0.7, "learning_rate": 0.0001955119614496307, "loss": 0.0179, "step": 268730 }, { "epoch": 0.7, "learning_rate": 0.00019550807323325927, "loss": 0.0131, "step": 268740 }, { "epoch": 0.7, "learning_rate": 0.00019550418501688781, "loss": 0.0128, "step": 268750 }, { "epoch": 0.7, "learning_rate": 0.00019550029680051633, "loss": 0.0141, "step": 268760 }, { "epoch": 0.7, "learning_rate": 0.00019549640858414487, "loss": 0.0146, "step": 268770 }, { "epoch": 0.7, "learning_rate": 0.0001954925203677734, "loss": 0.0217, "step": 268780 }, { "epoch": 0.7, "learning_rate": 0.00019548863215140195, "loss": 0.0112, "step": 268790 }, { "epoch": 0.7, "learning_rate": 0.00019548474393503047, "loss": 0.0181, "step": 268800 }, { "epoch": 0.7, "learning_rate": 0.000195480855718659, "loss": 0.0163, "step": 268810 }, { "epoch": 0.7, "learning_rate": 0.00019547696750228755, "loss": 0.0158, "step": 268820 }, { "epoch": 0.7, "learning_rate": 0.0001954730792859161, "loss": 0.0157, "step": 268830 }, { "epoch": 0.7, "learning_rate": 0.0001954691910695446, "loss": 0.012, "step": 268840 }, { "epoch": 0.7, "learning_rate": 0.00019546530285317315, "loss": 0.0146, "step": 268850 }, { "epoch": 0.7, "learning_rate": 0.00019546141463680172, "loss": 0.0167, "step": 268860 }, { "epoch": 0.7, "learning_rate": 0.00019545752642043023, "loss": 0.017, "step": 268870 }, { "epoch": 0.7, "learning_rate": 0.00019545363820405875, "loss": 0.0158, "step": 268880 }, { "epoch": 0.7, "learning_rate": 0.0001954497499876873, "loss": 0.0139, "step": 268890 }, { "epoch": 0.7, "learning_rate": 0.00019544586177131586, "loss": 0.0159, "step": 268900 }, { "epoch": 0.7, "learning_rate": 0.00019544197355494437, "loss": 0.0148, "step": 268910 }, { "epoch": 0.7, "learning_rate": 0.0001954380853385729, "loss": 0.0157, "step": 268920 }, { "epoch": 0.7, "learning_rate": 0.00019543419712220143, "loss": 0.0162, "step": 268930 }, { "epoch": 0.7, "learning_rate": 0.00019543030890583, "loss": 0.0192, "step": 268940 }, { "epoch": 0.7, "learning_rate": 0.0001954264206894585, "loss": 0.0178, "step": 268950 }, { "epoch": 0.7, "learning_rate": 0.00019542253247308705, "loss": 0.0174, "step": 268960 }, { "epoch": 0.7, "learning_rate": 0.00019541864425671557, "loss": 0.0147, "step": 268970 }, { "epoch": 0.7, "learning_rate": 0.0001954147560403441, "loss": 0.0141, "step": 268980 }, { "epoch": 0.7, "learning_rate": 0.00019541086782397265, "loss": 0.0178, "step": 268990 }, { "epoch": 0.7, "learning_rate": 0.0001954069796076012, "loss": 0.0127, "step": 269000 }, { "epoch": 0.7, "eval_cer": 0.8817418761573248, "eval_loss": 0.010232596658170223, "eval_runtime": 108.1138, "eval_samples_per_second": 18.499, "eval_steps_per_second": 4.625, "step": 269000 }, { "epoch": 0.7, "learning_rate": 0.0001954030913912297, "loss": 0.0133, "step": 269010 }, { "epoch": 0.7, "learning_rate": 0.00019539920317485825, "loss": 0.0184, "step": 269020 }, { "epoch": 0.7, "learning_rate": 0.00019539531495848682, "loss": 0.016, "step": 269030 }, { "epoch": 0.7, "learning_rate": 0.00019539142674211533, "loss": 0.0139, "step": 269040 }, { "epoch": 0.7, "learning_rate": 0.00019538753852574385, "loss": 0.0158, "step": 269050 }, { "epoch": 0.7, "learning_rate": 0.0001953836503093724, "loss": 0.0153, "step": 269060 }, { "epoch": 0.7, "learning_rate": 0.00019537976209300096, "loss": 0.0145, "step": 269070 }, { "epoch": 0.7, "learning_rate": 0.00019537587387662947, "loss": 0.0131, "step": 269080 }, { "epoch": 0.7, "learning_rate": 0.000195371985660258, "loss": 0.0134, "step": 269090 }, { "epoch": 0.7, "learning_rate": 0.00019536809744388653, "loss": 0.0159, "step": 269100 }, { "epoch": 0.7, "learning_rate": 0.0001953642092275151, "loss": 0.0155, "step": 269110 }, { "epoch": 0.7, "learning_rate": 0.0001953603210111436, "loss": 0.0173, "step": 269120 }, { "epoch": 0.7, "learning_rate": 0.00019535643279477215, "loss": 0.0169, "step": 269130 }, { "epoch": 0.7, "learning_rate": 0.00019535254457840067, "loss": 0.0171, "step": 269140 }, { "epoch": 0.7, "learning_rate": 0.00019534865636202924, "loss": 0.0134, "step": 269150 }, { "epoch": 0.7, "learning_rate": 0.00019534476814565775, "loss": 0.0146, "step": 269160 }, { "epoch": 0.7, "learning_rate": 0.0001953408799292863, "loss": 0.014, "step": 269170 }, { "epoch": 0.7, "learning_rate": 0.0001953369917129148, "loss": 0.0152, "step": 269180 }, { "epoch": 0.7, "learning_rate": 0.00019533310349654338, "loss": 0.0154, "step": 269190 }, { "epoch": 0.7, "learning_rate": 0.0001953292152801719, "loss": 0.0151, "step": 269200 }, { "epoch": 0.7, "learning_rate": 0.00019532532706380043, "loss": 0.0173, "step": 269210 }, { "epoch": 0.7, "learning_rate": 0.00019532143884742895, "loss": 0.014, "step": 269220 }, { "epoch": 0.7, "learning_rate": 0.0001953175506310575, "loss": 0.014, "step": 269230 }, { "epoch": 0.7, "learning_rate": 0.00019531366241468606, "loss": 0.0124, "step": 269240 }, { "epoch": 0.7, "learning_rate": 0.00019530977419831457, "loss": 0.0126, "step": 269250 }, { "epoch": 0.7, "learning_rate": 0.0001953058859819431, "loss": 0.0174, "step": 269260 }, { "epoch": 0.7, "learning_rate": 0.00019530199776557163, "loss": 0.0176, "step": 269270 }, { "epoch": 0.7, "learning_rate": 0.0001952981095492002, "loss": 0.0158, "step": 269280 }, { "epoch": 0.7, "learning_rate": 0.0001952942213328287, "loss": 0.0127, "step": 269290 }, { "epoch": 0.7, "learning_rate": 0.00019529033311645725, "loss": 0.0211, "step": 269300 }, { "epoch": 0.7, "learning_rate": 0.00019528644490008577, "loss": 0.0151, "step": 269310 }, { "epoch": 0.7, "learning_rate": 0.00019528255668371434, "loss": 0.0141, "step": 269320 }, { "epoch": 0.7, "learning_rate": 0.00019527866846734285, "loss": 0.0159, "step": 269330 }, { "epoch": 0.7, "learning_rate": 0.0001952747802509714, "loss": 0.0138, "step": 269340 }, { "epoch": 0.7, "learning_rate": 0.0001952708920345999, "loss": 0.0126, "step": 269350 }, { "epoch": 0.7, "learning_rate": 0.00019526700381822847, "loss": 0.0158, "step": 269360 }, { "epoch": 0.7, "learning_rate": 0.000195263115601857, "loss": 0.0171, "step": 269370 }, { "epoch": 0.7, "learning_rate": 0.00019525922738548553, "loss": 0.0123, "step": 269380 }, { "epoch": 0.7, "learning_rate": 0.00019525533916911405, "loss": 0.0129, "step": 269390 }, { "epoch": 0.7, "learning_rate": 0.00019525145095274261, "loss": 0.0177, "step": 269400 }, { "epoch": 0.7, "learning_rate": 0.00019524756273637116, "loss": 0.0161, "step": 269410 }, { "epoch": 0.7, "learning_rate": 0.00019524367451999967, "loss": 0.0205, "step": 269420 }, { "epoch": 0.7, "learning_rate": 0.0001952397863036282, "loss": 0.0169, "step": 269430 }, { "epoch": 0.7, "learning_rate": 0.00019523589808725675, "loss": 0.0184, "step": 269440 }, { "epoch": 0.7, "learning_rate": 0.0001952320098708853, "loss": 0.0129, "step": 269450 }, { "epoch": 0.7, "learning_rate": 0.0001952281216545138, "loss": 0.0149, "step": 269460 }, { "epoch": 0.7, "learning_rate": 0.00019522423343814235, "loss": 0.0183, "step": 269470 }, { "epoch": 0.7, "learning_rate": 0.00019522034522177087, "loss": 0.0154, "step": 269480 }, { "epoch": 0.7, "learning_rate": 0.00019521645700539943, "loss": 0.0142, "step": 269490 }, { "epoch": 0.7, "learning_rate": 0.00019521256878902795, "loss": 0.0157, "step": 269500 }, { "epoch": 0.7, "learning_rate": 0.0001952086805726565, "loss": 0.0151, "step": 269510 }, { "epoch": 0.7, "learning_rate": 0.000195204792356285, "loss": 0.0124, "step": 269520 }, { "epoch": 0.7, "learning_rate": 0.00019520090413991357, "loss": 0.0154, "step": 269530 }, { "epoch": 0.7, "learning_rate": 0.0001951970159235421, "loss": 0.0152, "step": 269540 }, { "epoch": 0.7, "learning_rate": 0.00019519312770717063, "loss": 0.0163, "step": 269550 }, { "epoch": 0.7, "learning_rate": 0.00019518923949079914, "loss": 0.0193, "step": 269560 }, { "epoch": 0.7, "learning_rate": 0.0001951853512744277, "loss": 0.0143, "step": 269570 }, { "epoch": 0.7, "learning_rate": 0.00019518146305805626, "loss": 0.0138, "step": 269580 }, { "epoch": 0.7, "learning_rate": 0.00019517757484168477, "loss": 0.0186, "step": 269590 }, { "epoch": 0.7, "learning_rate": 0.00019517368662531328, "loss": 0.0105, "step": 269600 }, { "epoch": 0.7, "learning_rate": 0.00019516979840894185, "loss": 0.0141, "step": 269610 }, { "epoch": 0.7, "learning_rate": 0.0001951659101925704, "loss": 0.0155, "step": 269620 }, { "epoch": 0.7, "learning_rate": 0.0001951620219761989, "loss": 0.0161, "step": 269630 }, { "epoch": 0.7, "learning_rate": 0.00019515813375982745, "loss": 0.0126, "step": 269640 }, { "epoch": 0.7, "learning_rate": 0.000195154245543456, "loss": 0.0135, "step": 269650 }, { "epoch": 0.7, "learning_rate": 0.00019515035732708453, "loss": 0.0175, "step": 269660 }, { "epoch": 0.7, "learning_rate": 0.00019514646911071305, "loss": 0.0149, "step": 269670 }, { "epoch": 0.7, "learning_rate": 0.0001951425808943416, "loss": 0.0154, "step": 269680 }, { "epoch": 0.7, "learning_rate": 0.00019513869267797013, "loss": 0.016, "step": 269690 }, { "epoch": 0.7, "learning_rate": 0.00019513480446159867, "loss": 0.0176, "step": 269700 }, { "epoch": 0.7, "learning_rate": 0.0001951309162452272, "loss": 0.0147, "step": 269710 }, { "epoch": 0.7, "learning_rate": 0.00019512702802885573, "loss": 0.0155, "step": 269720 }, { "epoch": 0.7, "learning_rate": 0.00019512313981248424, "loss": 0.0141, "step": 269730 }, { "epoch": 0.7, "learning_rate": 0.0001951192515961128, "loss": 0.0167, "step": 269740 }, { "epoch": 0.7, "learning_rate": 0.00019511536337974133, "loss": 0.0209, "step": 269750 }, { "epoch": 0.7, "learning_rate": 0.00019511147516336987, "loss": 0.0154, "step": 269760 }, { "epoch": 0.7, "learning_rate": 0.00019510758694699838, "loss": 0.0157, "step": 269770 }, { "epoch": 0.7, "learning_rate": 0.00019510369873062695, "loss": 0.0163, "step": 269780 }, { "epoch": 0.7, "learning_rate": 0.0001950998105142555, "loss": 0.0158, "step": 269790 }, { "epoch": 0.7, "learning_rate": 0.000195095922297884, "loss": 0.0166, "step": 269800 }, { "epoch": 0.7, "learning_rate": 0.00019509203408151255, "loss": 0.0159, "step": 269810 }, { "epoch": 0.7, "learning_rate": 0.0001950881458651411, "loss": 0.0152, "step": 269820 }, { "epoch": 0.7, "learning_rate": 0.00019508425764876963, "loss": 0.0148, "step": 269830 }, { "epoch": 0.7, "learning_rate": 0.00019508036943239815, "loss": 0.0166, "step": 269840 }, { "epoch": 0.7, "learning_rate": 0.0001950764812160267, "loss": 0.015, "step": 269850 }, { "epoch": 0.7, "learning_rate": 0.00019507259299965523, "loss": 0.017, "step": 269860 }, { "epoch": 0.7, "learning_rate": 0.00019506870478328377, "loss": 0.017, "step": 269870 }, { "epoch": 0.7, "learning_rate": 0.0001950648165669123, "loss": 0.0126, "step": 269880 }, { "epoch": 0.7, "learning_rate": 0.00019506092835054083, "loss": 0.0188, "step": 269890 }, { "epoch": 0.7, "learning_rate": 0.0001950570401341694, "loss": 0.0189, "step": 269900 }, { "epoch": 0.7, "learning_rate": 0.0001950531519177979, "loss": 0.0135, "step": 269910 }, { "epoch": 0.7, "learning_rate": 0.00019504926370142643, "loss": 0.0147, "step": 269920 }, { "epoch": 0.7, "learning_rate": 0.00019504537548505497, "loss": 0.0176, "step": 269930 }, { "epoch": 0.7, "learning_rate": 0.00019504148726868354, "loss": 0.0187, "step": 269940 }, { "epoch": 0.7, "learning_rate": 0.00019503759905231205, "loss": 0.0167, "step": 269950 }, { "epoch": 0.7, "learning_rate": 0.0001950337108359406, "loss": 0.0158, "step": 269960 }, { "epoch": 0.7, "learning_rate": 0.0001950298226195691, "loss": 0.0152, "step": 269970 }, { "epoch": 0.7, "learning_rate": 0.00019502593440319765, "loss": 0.0167, "step": 269980 }, { "epoch": 0.7, "learning_rate": 0.0001950220461868262, "loss": 0.0138, "step": 269990 }, { "epoch": 0.7, "learning_rate": 0.00019501815797045473, "loss": 0.014, "step": 270000 }, { "epoch": 0.7, "eval_cer": 0.8817250805141147, "eval_loss": 0.00999659113585949, "eval_runtime": 107.9657, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 270000 }, { "epoch": 0.7, "learning_rate": 0.00019501426975408325, "loss": 0.0118, "step": 270010 }, { "epoch": 0.7, "learning_rate": 0.0001950103815377118, "loss": 0.0143, "step": 270020 }, { "epoch": 0.7, "learning_rate": 0.00019500649332134033, "loss": 0.0168, "step": 270030 }, { "epoch": 0.7, "learning_rate": 0.00019500260510496887, "loss": 0.0168, "step": 270040 }, { "epoch": 0.7, "learning_rate": 0.0001949987168885974, "loss": 0.0142, "step": 270050 }, { "epoch": 0.7, "learning_rate": 0.00019499482867222593, "loss": 0.0156, "step": 270060 }, { "epoch": 0.7, "learning_rate": 0.00019499094045585447, "loss": 0.02, "step": 270070 }, { "epoch": 0.7, "learning_rate": 0.000194987052239483, "loss": 0.0148, "step": 270080 }, { "epoch": 0.7, "learning_rate": 0.00019498316402311153, "loss": 0.0167, "step": 270090 }, { "epoch": 0.7, "learning_rate": 0.00019497927580674007, "loss": 0.0145, "step": 270100 }, { "epoch": 0.7, "learning_rate": 0.00019497538759036864, "loss": 0.0151, "step": 270110 }, { "epoch": 0.7, "learning_rate": 0.00019497149937399715, "loss": 0.0138, "step": 270120 }, { "epoch": 0.7, "learning_rate": 0.0001949676111576257, "loss": 0.0157, "step": 270130 }, { "epoch": 0.7, "learning_rate": 0.0001949637229412542, "loss": 0.0143, "step": 270140 }, { "epoch": 0.7, "learning_rate": 0.00019495983472488278, "loss": 0.0116, "step": 270150 }, { "epoch": 0.7, "learning_rate": 0.0001949559465085113, "loss": 0.015, "step": 270160 }, { "epoch": 0.7, "learning_rate": 0.00019495205829213983, "loss": 0.0156, "step": 270170 }, { "epoch": 0.7, "learning_rate": 0.00019494817007576835, "loss": 0.0124, "step": 270180 }, { "epoch": 0.7, "learning_rate": 0.0001949442818593969, "loss": 0.022, "step": 270190 }, { "epoch": 0.7, "learning_rate": 0.00019494039364302543, "loss": 0.015, "step": 270200 }, { "epoch": 0.7, "learning_rate": 0.00019493650542665397, "loss": 0.0175, "step": 270210 }, { "epoch": 0.7, "learning_rate": 0.00019493261721028249, "loss": 0.0257, "step": 270220 }, { "epoch": 0.7, "learning_rate": 0.00019492872899391103, "loss": 0.0165, "step": 270230 }, { "epoch": 0.7, "learning_rate": 0.00019492484077753957, "loss": 0.0175, "step": 270240 }, { "epoch": 0.7, "learning_rate": 0.0001949209525611681, "loss": 0.0141, "step": 270250 }, { "epoch": 0.7, "learning_rate": 0.00019491706434479663, "loss": 0.0137, "step": 270260 }, { "epoch": 0.7, "learning_rate": 0.00019491317612842517, "loss": 0.014, "step": 270270 }, { "epoch": 0.7, "learning_rate": 0.00019490928791205374, "loss": 0.0172, "step": 270280 }, { "epoch": 0.7, "learning_rate": 0.00019490539969568225, "loss": 0.0156, "step": 270290 }, { "epoch": 0.7, "learning_rate": 0.0001949015114793108, "loss": 0.0121, "step": 270300 }, { "epoch": 0.7, "learning_rate": 0.0001948976232629393, "loss": 0.0115, "step": 270310 }, { "epoch": 0.7, "learning_rate": 0.00019489373504656788, "loss": 0.0164, "step": 270320 }, { "epoch": 0.7, "learning_rate": 0.0001948898468301964, "loss": 0.0182, "step": 270330 }, { "epoch": 0.7, "learning_rate": 0.00019488595861382493, "loss": 0.0125, "step": 270340 }, { "epoch": 0.7, "learning_rate": 0.00019488207039745345, "loss": 0.0149, "step": 270350 }, { "epoch": 0.7, "learning_rate": 0.00019487818218108201, "loss": 0.0162, "step": 270360 }, { "epoch": 0.7, "learning_rate": 0.00019487429396471053, "loss": 0.0171, "step": 270370 }, { "epoch": 0.7, "learning_rate": 0.00019487040574833907, "loss": 0.0151, "step": 270380 }, { "epoch": 0.7, "learning_rate": 0.00019486651753196759, "loss": 0.016, "step": 270390 }, { "epoch": 0.7, "learning_rate": 0.00019486262931559615, "loss": 0.0143, "step": 270400 }, { "epoch": 0.7, "learning_rate": 0.00019485874109922467, "loss": 0.0139, "step": 270410 }, { "epoch": 0.7, "learning_rate": 0.0001948548528828532, "loss": 0.0167, "step": 270420 }, { "epoch": 0.7, "learning_rate": 0.00019485096466648173, "loss": 0.0112, "step": 270430 }, { "epoch": 0.7, "learning_rate": 0.00019484707645011027, "loss": 0.0151, "step": 270440 }, { "epoch": 0.7, "learning_rate": 0.00019484318823373884, "loss": 0.0316, "step": 270450 }, { "epoch": 0.7, "learning_rate": 0.00019483930001736735, "loss": 0.0137, "step": 270460 }, { "epoch": 0.7, "learning_rate": 0.00019483541180099586, "loss": 0.0122, "step": 270470 }, { "epoch": 0.7, "learning_rate": 0.0001948315235846244, "loss": 0.0198, "step": 270480 }, { "epoch": 0.7, "learning_rate": 0.00019482763536825297, "loss": 0.0141, "step": 270490 }, { "epoch": 0.7, "learning_rate": 0.0001948237471518815, "loss": 0.0144, "step": 270500 }, { "epoch": 0.7, "learning_rate": 0.00019481985893551003, "loss": 0.0176, "step": 270510 }, { "epoch": 0.7, "learning_rate": 0.00019481597071913855, "loss": 0.0158, "step": 270520 }, { "epoch": 0.7, "learning_rate": 0.00019481208250276711, "loss": 0.0159, "step": 270530 }, { "epoch": 0.7, "learning_rate": 0.00019480819428639563, "loss": 0.0167, "step": 270540 }, { "epoch": 0.7, "learning_rate": 0.00019480430607002417, "loss": 0.0136, "step": 270550 }, { "epoch": 0.7, "learning_rate": 0.00019480041785365269, "loss": 0.0141, "step": 270560 }, { "epoch": 0.7, "learning_rate": 0.00019479652963728125, "loss": 0.0159, "step": 270570 }, { "epoch": 0.7, "learning_rate": 0.00019479264142090977, "loss": 0.016, "step": 270580 }, { "epoch": 0.7, "learning_rate": 0.0001947887532045383, "loss": 0.0197, "step": 270590 }, { "epoch": 0.7, "learning_rate": 0.00019478486498816682, "loss": 0.0139, "step": 270600 }, { "epoch": 0.7, "learning_rate": 0.0001947809767717954, "loss": 0.0164, "step": 270610 }, { "epoch": 0.7, "learning_rate": 0.00019477708855542393, "loss": 0.0136, "step": 270620 }, { "epoch": 0.7, "learning_rate": 0.00019477320033905245, "loss": 0.0125, "step": 270630 }, { "epoch": 0.7, "learning_rate": 0.00019476931212268096, "loss": 0.0235, "step": 270640 }, { "epoch": 0.7, "learning_rate": 0.00019476542390630953, "loss": 0.0144, "step": 270650 }, { "epoch": 0.7, "learning_rate": 0.00019476153568993807, "loss": 0.0123, "step": 270660 }, { "epoch": 0.7, "learning_rate": 0.0001947576474735666, "loss": 0.0149, "step": 270670 }, { "epoch": 0.7, "learning_rate": 0.00019475375925719513, "loss": 0.0158, "step": 270680 }, { "epoch": 0.7, "learning_rate": 0.00019474987104082364, "loss": 0.0146, "step": 270690 }, { "epoch": 0.7, "learning_rate": 0.00019474598282445221, "loss": 0.0126, "step": 270700 }, { "epoch": 0.7, "learning_rate": 0.00019474209460808073, "loss": 0.0169, "step": 270710 }, { "epoch": 0.7, "learning_rate": 0.00019473820639170927, "loss": 0.0135, "step": 270720 }, { "epoch": 0.7, "learning_rate": 0.00019473431817533778, "loss": 0.0186, "step": 270730 }, { "epoch": 0.7, "learning_rate": 0.00019473042995896635, "loss": 0.0097, "step": 270740 }, { "epoch": 0.7, "learning_rate": 0.00019472654174259487, "loss": 0.0124, "step": 270750 }, { "epoch": 0.7, "learning_rate": 0.0001947226535262234, "loss": 0.0138, "step": 270760 }, { "epoch": 0.7, "learning_rate": 0.00019471876530985192, "loss": 0.0137, "step": 270770 }, { "epoch": 0.7, "learning_rate": 0.0001947148770934805, "loss": 0.0182, "step": 270780 }, { "epoch": 0.7, "learning_rate": 0.000194710988877109, "loss": 0.0132, "step": 270790 }, { "epoch": 0.7, "learning_rate": 0.00019470710066073755, "loss": 0.0208, "step": 270800 }, { "epoch": 0.7, "learning_rate": 0.00019470321244436606, "loss": 0.017, "step": 270810 }, { "epoch": 0.7, "learning_rate": 0.00019469932422799463, "loss": 0.0127, "step": 270820 }, { "epoch": 0.7, "learning_rate": 0.00019469543601162317, "loss": 0.0129, "step": 270830 }, { "epoch": 0.7, "learning_rate": 0.0001946915477952517, "loss": 0.0166, "step": 270840 }, { "epoch": 0.7, "learning_rate": 0.00019468765957888023, "loss": 0.0197, "step": 270850 }, { "epoch": 0.7, "learning_rate": 0.00019468377136250877, "loss": 0.0116, "step": 270860 }, { "epoch": 0.7, "learning_rate": 0.0001946798831461373, "loss": 0.0154, "step": 270870 }, { "epoch": 0.7, "learning_rate": 0.00019467599492976583, "loss": 0.0144, "step": 270880 }, { "epoch": 0.7, "learning_rate": 0.00019467210671339437, "loss": 0.0125, "step": 270890 }, { "epoch": 0.7, "learning_rate": 0.0001946682184970229, "loss": 0.013, "step": 270900 }, { "epoch": 0.7, "learning_rate": 0.00019466433028065145, "loss": 0.0157, "step": 270910 }, { "epoch": 0.7, "learning_rate": 0.00019466044206427997, "loss": 0.0148, "step": 270920 }, { "epoch": 0.7, "learning_rate": 0.0001946565538479085, "loss": 0.0108, "step": 270930 }, { "epoch": 0.7, "learning_rate": 0.00019465266563153702, "loss": 0.0124, "step": 270940 }, { "epoch": 0.7, "learning_rate": 0.0001946487774151656, "loss": 0.0162, "step": 270950 }, { "epoch": 0.7, "learning_rate": 0.0001946448891987941, "loss": 0.0159, "step": 270960 }, { "epoch": 0.7, "learning_rate": 0.00019464100098242265, "loss": 0.0123, "step": 270970 }, { "epoch": 0.7, "learning_rate": 0.00019463711276605116, "loss": 0.0187, "step": 270980 }, { "epoch": 0.7, "learning_rate": 0.00019463322454967973, "loss": 0.0122, "step": 270990 }, { "epoch": 0.7, "learning_rate": 0.00019462933633330827, "loss": 0.0186, "step": 271000 }, { "epoch": 0.7, "eval_cer": 0.8817404765203906, "eval_loss": 0.01013705413788557, "eval_runtime": 108.1485, "eval_samples_per_second": 18.493, "eval_steps_per_second": 4.623, "step": 271000 }, { "epoch": 0.7, "learning_rate": 0.0001946254481169368, "loss": 0.0155, "step": 271010 }, { "epoch": 0.7, "learning_rate": 0.00019462155990056533, "loss": 0.0114, "step": 271020 }, { "epoch": 0.7, "learning_rate": 0.00019461767168419387, "loss": 0.0149, "step": 271030 }, { "epoch": 0.7, "learning_rate": 0.0001946137834678224, "loss": 0.0167, "step": 271040 }, { "epoch": 0.7, "learning_rate": 0.00019460989525145093, "loss": 0.0126, "step": 271050 }, { "epoch": 0.7, "learning_rate": 0.00019460600703507947, "loss": 0.0154, "step": 271060 }, { "epoch": 0.7, "learning_rate": 0.000194602118818708, "loss": 0.0183, "step": 271070 }, { "epoch": 0.7, "learning_rate": 0.00019459823060233655, "loss": 0.0123, "step": 271080 }, { "epoch": 0.7, "learning_rate": 0.00019459434238596507, "loss": 0.0161, "step": 271090 }, { "epoch": 0.7, "learning_rate": 0.0001945904541695936, "loss": 0.0151, "step": 271100 }, { "epoch": 0.7, "learning_rate": 0.00019458656595322215, "loss": 0.0137, "step": 271110 }, { "epoch": 0.7, "learning_rate": 0.0001945826777368507, "loss": 0.0129, "step": 271120 }, { "epoch": 0.7, "learning_rate": 0.0001945787895204792, "loss": 0.0139, "step": 271130 }, { "epoch": 0.7, "learning_rate": 0.00019457490130410775, "loss": 0.0144, "step": 271140 }, { "epoch": 0.7, "learning_rate": 0.00019457101308773632, "loss": 0.016, "step": 271150 }, { "epoch": 0.7, "learning_rate": 0.00019456712487136483, "loss": 0.0116, "step": 271160 }, { "epoch": 0.7, "learning_rate": 0.00019456323665499337, "loss": 0.0156, "step": 271170 }, { "epoch": 0.7, "learning_rate": 0.0001945593484386219, "loss": 0.0155, "step": 271180 }, { "epoch": 0.7, "learning_rate": 0.0001945554602222504, "loss": 0.012, "step": 271190 }, { "epoch": 0.7, "learning_rate": 0.00019455157200587897, "loss": 0.0185, "step": 271200 }, { "epoch": 0.7, "learning_rate": 0.0001945476837895075, "loss": 0.0147, "step": 271210 }, { "epoch": 0.7, "learning_rate": 0.00019454379557313603, "loss": 0.0156, "step": 271220 }, { "epoch": 0.7, "learning_rate": 0.00019453990735676457, "loss": 0.0162, "step": 271230 }, { "epoch": 0.7, "learning_rate": 0.0001945360191403931, "loss": 0.0117, "step": 271240 }, { "epoch": 0.7, "learning_rate": 0.00019453213092402165, "loss": 0.0164, "step": 271250 }, { "epoch": 0.7, "learning_rate": 0.00019452824270765017, "loss": 0.0129, "step": 271260 }, { "epoch": 0.7, "learning_rate": 0.0001945243544912787, "loss": 0.0172, "step": 271270 }, { "epoch": 0.7, "learning_rate": 0.00019452046627490725, "loss": 0.0181, "step": 271280 }, { "epoch": 0.7, "learning_rate": 0.0001945165780585358, "loss": 0.0139, "step": 271290 }, { "epoch": 0.7, "learning_rate": 0.0001945126898421643, "loss": 0.0171, "step": 271300 }, { "epoch": 0.7, "learning_rate": 0.00019450880162579285, "loss": 0.0149, "step": 271310 }, { "epoch": 0.7, "learning_rate": 0.00019450491340942142, "loss": 0.0132, "step": 271320 }, { "epoch": 0.7, "learning_rate": 0.00019450102519304993, "loss": 0.0111, "step": 271330 }, { "epoch": 0.7, "learning_rate": 0.00019449713697667844, "loss": 0.0155, "step": 271340 }, { "epoch": 0.7, "learning_rate": 0.000194493248760307, "loss": 0.015, "step": 271350 }, { "epoch": 0.7, "learning_rate": 0.00019448936054393556, "loss": 0.012, "step": 271360 }, { "epoch": 0.7, "learning_rate": 0.00019448547232756407, "loss": 0.0198, "step": 271370 }, { "epoch": 0.7, "learning_rate": 0.0001944815841111926, "loss": 0.0171, "step": 271380 }, { "epoch": 0.7, "learning_rate": 0.00019447769589482113, "loss": 0.0149, "step": 271390 }, { "epoch": 0.7, "learning_rate": 0.0001944738076784497, "loss": 0.0131, "step": 271400 }, { "epoch": 0.7, "learning_rate": 0.0001944699194620782, "loss": 0.0144, "step": 271410 }, { "epoch": 0.7, "learning_rate": 0.00019446603124570675, "loss": 0.0135, "step": 271420 }, { "epoch": 0.7, "learning_rate": 0.00019446214302933527, "loss": 0.0155, "step": 271430 }, { "epoch": 0.7, "learning_rate": 0.0001944582548129638, "loss": 0.0128, "step": 271440 }, { "epoch": 0.7, "learning_rate": 0.00019445436659659235, "loss": 0.0136, "step": 271450 }, { "epoch": 0.7, "learning_rate": 0.0001944504783802209, "loss": 0.0239, "step": 271460 }, { "epoch": 0.7, "learning_rate": 0.0001944465901638494, "loss": 0.0127, "step": 271470 }, { "epoch": 0.7, "learning_rate": 0.00019444270194747795, "loss": 0.0109, "step": 271480 }, { "epoch": 0.7, "learning_rate": 0.00019443881373110652, "loss": 0.0152, "step": 271490 }, { "epoch": 0.7, "learning_rate": 0.00019443492551473503, "loss": 0.0149, "step": 271500 }, { "epoch": 0.7, "learning_rate": 0.00019443103729836354, "loss": 0.014, "step": 271510 }, { "epoch": 0.7, "learning_rate": 0.00019442714908199209, "loss": 0.0159, "step": 271520 }, { "epoch": 0.7, "learning_rate": 0.00019442326086562065, "loss": 0.0219, "step": 271530 }, { "epoch": 0.7, "learning_rate": 0.00019441937264924917, "loss": 0.0181, "step": 271540 }, { "epoch": 0.7, "learning_rate": 0.0001944154844328777, "loss": 0.0148, "step": 271550 }, { "epoch": 0.7, "learning_rate": 0.00019441159621650623, "loss": 0.0128, "step": 271560 }, { "epoch": 0.7, "learning_rate": 0.0001944077080001348, "loss": 0.0137, "step": 271570 }, { "epoch": 0.7, "learning_rate": 0.0001944038197837633, "loss": 0.0153, "step": 271580 }, { "epoch": 0.7, "learning_rate": 0.00019439993156739185, "loss": 0.0113, "step": 271590 }, { "epoch": 0.7, "learning_rate": 0.00019439604335102036, "loss": 0.0141, "step": 271600 }, { "epoch": 0.7, "learning_rate": 0.00019439215513464893, "loss": 0.0117, "step": 271610 }, { "epoch": 0.7, "learning_rate": 0.00019438826691827745, "loss": 0.0139, "step": 271620 }, { "epoch": 0.7, "learning_rate": 0.000194384378701906, "loss": 0.013, "step": 271630 }, { "epoch": 0.7, "learning_rate": 0.0001943804904855345, "loss": 0.0164, "step": 271640 }, { "epoch": 0.7, "learning_rate": 0.00019437660226916307, "loss": 0.0153, "step": 271650 }, { "epoch": 0.7, "learning_rate": 0.0001943727140527916, "loss": 0.0119, "step": 271660 }, { "epoch": 0.7, "learning_rate": 0.00019436882583642013, "loss": 0.014, "step": 271670 }, { "epoch": 0.7, "learning_rate": 0.00019436493762004864, "loss": 0.0134, "step": 271680 }, { "epoch": 0.7, "learning_rate": 0.00019436104940367719, "loss": 0.0127, "step": 271690 }, { "epoch": 0.7, "learning_rate": 0.00019435716118730575, "loss": 0.0166, "step": 271700 }, { "epoch": 0.7, "learning_rate": 0.00019435327297093427, "loss": 0.0151, "step": 271710 }, { "epoch": 0.7, "learning_rate": 0.0001943493847545628, "loss": 0.0138, "step": 271720 }, { "epoch": 0.7, "learning_rate": 0.00019434549653819132, "loss": 0.0171, "step": 271730 }, { "epoch": 0.7, "learning_rate": 0.0001943416083218199, "loss": 0.0176, "step": 271740 }, { "epoch": 0.7, "learning_rate": 0.0001943377201054484, "loss": 0.0178, "step": 271750 }, { "epoch": 0.7, "learning_rate": 0.00019433383188907695, "loss": 0.0174, "step": 271760 }, { "epoch": 0.7, "learning_rate": 0.00019432994367270546, "loss": 0.0195, "step": 271770 }, { "epoch": 0.7, "learning_rate": 0.00019432605545633403, "loss": 0.0141, "step": 271780 }, { "epoch": 0.7, "learning_rate": 0.00019432216723996255, "loss": 0.0157, "step": 271790 }, { "epoch": 0.7, "learning_rate": 0.0001943182790235911, "loss": 0.016, "step": 271800 }, { "epoch": 0.7, "learning_rate": 0.0001943143908072196, "loss": 0.015, "step": 271810 }, { "epoch": 0.7, "learning_rate": 0.00019431050259084817, "loss": 0.0146, "step": 271820 }, { "epoch": 0.7, "learning_rate": 0.0001943066143744767, "loss": 0.0139, "step": 271830 }, { "epoch": 0.7, "learning_rate": 0.00019430272615810523, "loss": 0.0159, "step": 271840 }, { "epoch": 0.7, "learning_rate": 0.00019429883794173374, "loss": 0.0175, "step": 271850 }, { "epoch": 0.7, "learning_rate": 0.0001942949497253623, "loss": 0.0139, "step": 271860 }, { "epoch": 0.7, "learning_rate": 0.00019429106150899085, "loss": 0.0171, "step": 271870 }, { "epoch": 0.7, "learning_rate": 0.00019428717329261937, "loss": 0.0141, "step": 271880 }, { "epoch": 0.7, "learning_rate": 0.0001942832850762479, "loss": 0.0177, "step": 271890 }, { "epoch": 0.7, "learning_rate": 0.00019427939685987645, "loss": 0.013, "step": 271900 }, { "epoch": 0.7, "learning_rate": 0.000194275508643505, "loss": 0.0165, "step": 271910 }, { "epoch": 0.7, "learning_rate": 0.0001942716204271335, "loss": 0.0169, "step": 271920 }, { "epoch": 0.7, "learning_rate": 0.00019426773221076205, "loss": 0.0159, "step": 271930 }, { "epoch": 0.7, "learning_rate": 0.00019426384399439056, "loss": 0.0179, "step": 271940 }, { "epoch": 0.7, "learning_rate": 0.00019425995577801913, "loss": 0.0154, "step": 271950 }, { "epoch": 0.7, "learning_rate": 0.00019425606756164765, "loss": 0.0197, "step": 271960 }, { "epoch": 0.7, "learning_rate": 0.0001942521793452762, "loss": 0.0156, "step": 271970 }, { "epoch": 0.71, "learning_rate": 0.0001942482911289047, "loss": 0.0162, "step": 271980 }, { "epoch": 0.71, "learning_rate": 0.00019424440291253327, "loss": 0.0129, "step": 271990 }, { "epoch": 0.71, "learning_rate": 0.00019424051469616179, "loss": 0.0181, "step": 272000 }, { "epoch": 0.71, "eval_cer": 0.8817656699852059, "eval_loss": 0.010548959486186504, "eval_runtime": 108.289, "eval_samples_per_second": 18.469, "eval_steps_per_second": 4.617, "step": 272000 }, { "epoch": 0.71, "learning_rate": 0.00019423662647979033, "loss": 0.0167, "step": 272010 }, { "epoch": 0.71, "learning_rate": 0.00019423273826341884, "loss": 0.0175, "step": 272020 }, { "epoch": 0.71, "learning_rate": 0.0001942288500470474, "loss": 0.0145, "step": 272030 }, { "epoch": 0.71, "learning_rate": 0.00019422496183067595, "loss": 0.0126, "step": 272040 }, { "epoch": 0.71, "learning_rate": 0.00019422107361430447, "loss": 0.0175, "step": 272050 }, { "epoch": 0.71, "learning_rate": 0.00019421718539793298, "loss": 0.0136, "step": 272060 }, { "epoch": 0.71, "learning_rate": 0.00019421329718156155, "loss": 0.0151, "step": 272070 }, { "epoch": 0.71, "learning_rate": 0.0001942094089651901, "loss": 0.0184, "step": 272080 }, { "epoch": 0.71, "learning_rate": 0.0001942055207488186, "loss": 0.0168, "step": 272090 }, { "epoch": 0.71, "learning_rate": 0.00019420163253244715, "loss": 0.0195, "step": 272100 }, { "epoch": 0.71, "learning_rate": 0.0001941977443160757, "loss": 0.0186, "step": 272110 }, { "epoch": 0.71, "learning_rate": 0.00019419385609970423, "loss": 0.0138, "step": 272120 }, { "epoch": 0.71, "learning_rate": 0.00019418996788333275, "loss": 0.0148, "step": 272130 }, { "epoch": 0.71, "learning_rate": 0.0001941860796669613, "loss": 0.0134, "step": 272140 }, { "epoch": 0.71, "learning_rate": 0.00019418219145058983, "loss": 0.0175, "step": 272150 }, { "epoch": 0.71, "learning_rate": 0.00019417830323421837, "loss": 0.0156, "step": 272160 }, { "epoch": 0.71, "learning_rate": 0.00019417441501784689, "loss": 0.0173, "step": 272170 }, { "epoch": 0.71, "learning_rate": 0.00019417052680147543, "loss": 0.0158, "step": 272180 }, { "epoch": 0.71, "learning_rate": 0.00019416663858510394, "loss": 0.0128, "step": 272190 }, { "epoch": 0.71, "learning_rate": 0.0001941627503687325, "loss": 0.0166, "step": 272200 }, { "epoch": 0.71, "learning_rate": 0.00019415886215236105, "loss": 0.0127, "step": 272210 }, { "epoch": 0.71, "learning_rate": 0.00019415497393598957, "loss": 0.0146, "step": 272220 }, { "epoch": 0.71, "learning_rate": 0.00019415108571961808, "loss": 0.0137, "step": 272230 }, { "epoch": 0.71, "learning_rate": 0.00019414719750324665, "loss": 0.0145, "step": 272240 }, { "epoch": 0.71, "learning_rate": 0.0001941433092868752, "loss": 0.012, "step": 272250 }, { "epoch": 0.71, "learning_rate": 0.0001941394210705037, "loss": 0.016, "step": 272260 }, { "epoch": 0.71, "learning_rate": 0.00019413553285413225, "loss": 0.0121, "step": 272270 }, { "epoch": 0.71, "learning_rate": 0.0001941316446377608, "loss": 0.0143, "step": 272280 }, { "epoch": 0.71, "learning_rate": 0.00019412775642138933, "loss": 0.0192, "step": 272290 }, { "epoch": 0.71, "learning_rate": 0.00019412386820501785, "loss": 0.014, "step": 272300 }, { "epoch": 0.71, "learning_rate": 0.0001941199799886464, "loss": 0.0136, "step": 272310 }, { "epoch": 0.71, "learning_rate": 0.00019411609177227493, "loss": 0.0165, "step": 272320 }, { "epoch": 0.71, "learning_rate": 0.00019411220355590347, "loss": 0.0127, "step": 272330 }, { "epoch": 0.71, "learning_rate": 0.00019410831533953199, "loss": 0.0167, "step": 272340 }, { "epoch": 0.71, "learning_rate": 0.00019410442712316053, "loss": 0.0126, "step": 272350 }, { "epoch": 0.71, "learning_rate": 0.0001941005389067891, "loss": 0.0177, "step": 272360 }, { "epoch": 0.71, "learning_rate": 0.0001940966506904176, "loss": 0.0127, "step": 272370 }, { "epoch": 0.71, "learning_rate": 0.00019409276247404612, "loss": 0.0242, "step": 272380 }, { "epoch": 0.71, "learning_rate": 0.00019408887425767467, "loss": 0.0161, "step": 272390 }, { "epoch": 0.71, "learning_rate": 0.00019408498604130324, "loss": 0.0163, "step": 272400 }, { "epoch": 0.71, "learning_rate": 0.00019408109782493175, "loss": 0.0157, "step": 272410 }, { "epoch": 0.71, "learning_rate": 0.0001940772096085603, "loss": 0.018, "step": 272420 }, { "epoch": 0.71, "learning_rate": 0.0001940733213921888, "loss": 0.0172, "step": 272430 }, { "epoch": 0.71, "learning_rate": 0.00019406943317581735, "loss": 0.0126, "step": 272440 }, { "epoch": 0.71, "learning_rate": 0.0001940655449594459, "loss": 0.0191, "step": 272450 }, { "epoch": 0.71, "learning_rate": 0.00019406165674307443, "loss": 0.0136, "step": 272460 }, { "epoch": 0.71, "learning_rate": 0.00019405776852670295, "loss": 0.0123, "step": 272470 }, { "epoch": 0.71, "learning_rate": 0.0001940538803103315, "loss": 0.0163, "step": 272480 }, { "epoch": 0.71, "learning_rate": 0.00019404999209396003, "loss": 0.013, "step": 272490 }, { "epoch": 0.71, "learning_rate": 0.00019404610387758857, "loss": 0.0137, "step": 272500 }, { "epoch": 0.71, "learning_rate": 0.00019404221566121708, "loss": 0.017, "step": 272510 }, { "epoch": 0.71, "learning_rate": 0.00019403832744484563, "loss": 0.0173, "step": 272520 }, { "epoch": 0.71, "learning_rate": 0.00019403443922847417, "loss": 0.0119, "step": 272530 }, { "epoch": 0.71, "learning_rate": 0.0001940305510121027, "loss": 0.0145, "step": 272540 }, { "epoch": 0.71, "learning_rate": 0.00019402666279573122, "loss": 0.0131, "step": 272550 }, { "epoch": 0.71, "learning_rate": 0.00019402277457935977, "loss": 0.0161, "step": 272560 }, { "epoch": 0.71, "learning_rate": 0.00019401888636298833, "loss": 0.0161, "step": 272570 }, { "epoch": 0.71, "learning_rate": 0.00019401499814661685, "loss": 0.0153, "step": 272580 }, { "epoch": 0.71, "learning_rate": 0.0001940111099302454, "loss": 0.0145, "step": 272590 }, { "epoch": 0.71, "learning_rate": 0.0001940072217138739, "loss": 0.0159, "step": 272600 }, { "epoch": 0.71, "learning_rate": 0.00019400333349750247, "loss": 0.0136, "step": 272610 }, { "epoch": 0.71, "learning_rate": 0.000193999445281131, "loss": 0.0152, "step": 272620 }, { "epoch": 0.71, "learning_rate": 0.00019399555706475953, "loss": 0.0151, "step": 272630 }, { "epoch": 0.71, "learning_rate": 0.00019399166884838804, "loss": 0.0193, "step": 272640 }, { "epoch": 0.71, "learning_rate": 0.0001939877806320166, "loss": 0.0143, "step": 272650 }, { "epoch": 0.71, "learning_rate": 0.00019398389241564513, "loss": 0.0126, "step": 272660 }, { "epoch": 0.71, "learning_rate": 0.00019398000419927367, "loss": 0.0223, "step": 272670 }, { "epoch": 0.71, "learning_rate": 0.00019397611598290218, "loss": 0.0141, "step": 272680 }, { "epoch": 0.71, "learning_rate": 0.00019397222776653073, "loss": 0.0141, "step": 272690 }, { "epoch": 0.71, "learning_rate": 0.00019396833955015927, "loss": 0.0162, "step": 272700 }, { "epoch": 0.71, "learning_rate": 0.0001939644513337878, "loss": 0.0173, "step": 272710 }, { "epoch": 0.71, "learning_rate": 0.00019396056311741632, "loss": 0.017, "step": 272720 }, { "epoch": 0.71, "learning_rate": 0.00019395667490104487, "loss": 0.0148, "step": 272730 }, { "epoch": 0.71, "learning_rate": 0.00019395278668467343, "loss": 0.0151, "step": 272740 }, { "epoch": 0.71, "learning_rate": 0.00019394889846830195, "loss": 0.0114, "step": 272750 }, { "epoch": 0.71, "learning_rate": 0.0001939450102519305, "loss": 0.0216, "step": 272760 }, { "epoch": 0.71, "learning_rate": 0.000193941122035559, "loss": 0.0142, "step": 272770 }, { "epoch": 0.71, "learning_rate": 0.00019393723381918757, "loss": 0.0153, "step": 272780 }, { "epoch": 0.71, "learning_rate": 0.0001939333456028161, "loss": 0.0131, "step": 272790 }, { "epoch": 0.71, "learning_rate": 0.00019392945738644463, "loss": 0.0175, "step": 272800 }, { "epoch": 0.71, "learning_rate": 0.00019392556917007314, "loss": 0.0136, "step": 272810 }, { "epoch": 0.71, "learning_rate": 0.0001939216809537017, "loss": 0.012, "step": 272820 }, { "epoch": 0.71, "learning_rate": 0.00019391779273733023, "loss": 0.0155, "step": 272830 }, { "epoch": 0.71, "learning_rate": 0.00019391390452095877, "loss": 0.0158, "step": 272840 }, { "epoch": 0.71, "learning_rate": 0.00019391001630458728, "loss": 0.0168, "step": 272850 }, { "epoch": 0.71, "learning_rate": 0.00019390612808821585, "loss": 0.0167, "step": 272860 }, { "epoch": 0.71, "learning_rate": 0.00019390223987184437, "loss": 0.0152, "step": 272870 }, { "epoch": 0.71, "learning_rate": 0.0001938983516554729, "loss": 0.0204, "step": 272880 }, { "epoch": 0.71, "learning_rate": 0.00019389446343910142, "loss": 0.0148, "step": 272890 }, { "epoch": 0.71, "learning_rate": 0.00019389057522273, "loss": 0.0151, "step": 272900 }, { "epoch": 0.71, "learning_rate": 0.00019388668700635853, "loss": 0.0142, "step": 272910 }, { "epoch": 0.71, "learning_rate": 0.00019388279878998705, "loss": 0.012, "step": 272920 }, { "epoch": 0.71, "learning_rate": 0.00019387891057361556, "loss": 0.0173, "step": 272930 }, { "epoch": 0.71, "learning_rate": 0.0001938750223572441, "loss": 0.018, "step": 272940 }, { "epoch": 0.71, "learning_rate": 0.00019387113414087267, "loss": 0.0127, "step": 272950 }, { "epoch": 0.71, "learning_rate": 0.0001938672459245012, "loss": 0.016, "step": 272960 }, { "epoch": 0.71, "learning_rate": 0.00019386335770812973, "loss": 0.014, "step": 272970 }, { "epoch": 0.71, "learning_rate": 0.00019385946949175824, "loss": 0.0172, "step": 272980 }, { "epoch": 0.71, "learning_rate": 0.0001938555812753868, "loss": 0.0159, "step": 272990 }, { "epoch": 0.71, "learning_rate": 0.00019385169305901533, "loss": 0.0182, "step": 273000 }, { "epoch": 0.71, "eval_cer": 0.8817376772465223, "eval_loss": 0.010078651830554008, "eval_runtime": 108.1362, "eval_samples_per_second": 18.495, "eval_steps_per_second": 4.624, "step": 273000 }, { "epoch": 0.71, "learning_rate": 0.00019384780484264387, "loss": 0.0187, "step": 273010 }, { "epoch": 0.71, "learning_rate": 0.00019384391662627238, "loss": 0.0127, "step": 273020 }, { "epoch": 0.71, "learning_rate": 0.00019384002840990095, "loss": 0.0135, "step": 273030 }, { "epoch": 0.71, "learning_rate": 0.00019383614019352947, "loss": 0.0144, "step": 273040 }, { "epoch": 0.71, "learning_rate": 0.000193832251977158, "loss": 0.016, "step": 273050 }, { "epoch": 0.71, "learning_rate": 0.00019382836376078652, "loss": 0.0188, "step": 273060 }, { "epoch": 0.71, "learning_rate": 0.0001938244755444151, "loss": 0.013, "step": 273070 }, { "epoch": 0.71, "learning_rate": 0.00019382058732804363, "loss": 0.0191, "step": 273080 }, { "epoch": 0.71, "learning_rate": 0.00019381669911167215, "loss": 0.0153, "step": 273090 }, { "epoch": 0.71, "learning_rate": 0.00019381281089530066, "loss": 0.0147, "step": 273100 }, { "epoch": 0.71, "learning_rate": 0.00019380892267892923, "loss": 0.016, "step": 273110 }, { "epoch": 0.71, "learning_rate": 0.00019380503446255777, "loss": 0.0163, "step": 273120 }, { "epoch": 0.71, "learning_rate": 0.0001938011462461863, "loss": 0.0162, "step": 273130 }, { "epoch": 0.71, "learning_rate": 0.00019379725802981483, "loss": 0.0182, "step": 273140 }, { "epoch": 0.71, "learning_rate": 0.00019379336981344337, "loss": 0.0166, "step": 273150 }, { "epoch": 0.71, "learning_rate": 0.0001937894815970719, "loss": 0.014, "step": 273160 }, { "epoch": 0.71, "learning_rate": 0.00019378559338070043, "loss": 0.0157, "step": 273170 }, { "epoch": 0.71, "learning_rate": 0.00019378170516432897, "loss": 0.0145, "step": 273180 }, { "epoch": 0.71, "learning_rate": 0.00019377781694795748, "loss": 0.0158, "step": 273190 }, { "epoch": 0.71, "learning_rate": 0.00019377392873158605, "loss": 0.02, "step": 273200 }, { "epoch": 0.71, "learning_rate": 0.00019377004051521457, "loss": 0.015, "step": 273210 }, { "epoch": 0.71, "learning_rate": 0.0001937661522988431, "loss": 0.0154, "step": 273220 }, { "epoch": 0.71, "learning_rate": 0.00019376226408247162, "loss": 0.0177, "step": 273230 }, { "epoch": 0.71, "learning_rate": 0.0001937583758661002, "loss": 0.0142, "step": 273240 }, { "epoch": 0.71, "learning_rate": 0.0001937544876497287, "loss": 0.0172, "step": 273250 }, { "epoch": 0.71, "learning_rate": 0.00019375059943335725, "loss": 0.0126, "step": 273260 }, { "epoch": 0.71, "learning_rate": 0.00019374671121698576, "loss": 0.0138, "step": 273270 }, { "epoch": 0.71, "learning_rate": 0.00019374282300061433, "loss": 0.014, "step": 273280 }, { "epoch": 0.71, "learning_rate": 0.00019373893478424287, "loss": 0.0148, "step": 273290 }, { "epoch": 0.71, "learning_rate": 0.00019373504656787139, "loss": 0.014, "step": 273300 }, { "epoch": 0.71, "learning_rate": 0.00019373115835149993, "loss": 0.0182, "step": 273310 }, { "epoch": 0.71, "learning_rate": 0.00019372727013512847, "loss": 0.0144, "step": 273320 }, { "epoch": 0.71, "learning_rate": 0.000193723381918757, "loss": 0.0154, "step": 273330 }, { "epoch": 0.71, "learning_rate": 0.00019371949370238553, "loss": 0.0182, "step": 273340 }, { "epoch": 0.71, "learning_rate": 0.00019371560548601407, "loss": 0.0173, "step": 273350 }, { "epoch": 0.71, "learning_rate": 0.0001937117172696426, "loss": 0.0175, "step": 273360 }, { "epoch": 0.71, "learning_rate": 0.00019370782905327115, "loss": 0.0208, "step": 273370 }, { "epoch": 0.71, "learning_rate": 0.00019370394083689967, "loss": 0.0151, "step": 273380 }, { "epoch": 0.71, "learning_rate": 0.0001937000526205282, "loss": 0.0147, "step": 273390 }, { "epoch": 0.71, "learning_rate": 0.00019369616440415675, "loss": 0.0142, "step": 273400 }, { "epoch": 0.71, "learning_rate": 0.0001936922761877853, "loss": 0.014, "step": 273410 }, { "epoch": 0.71, "learning_rate": 0.0001936883879714138, "loss": 0.0139, "step": 273420 }, { "epoch": 0.71, "learning_rate": 0.00019368449975504235, "loss": 0.0152, "step": 273430 }, { "epoch": 0.71, "learning_rate": 0.00019368061153867086, "loss": 0.0183, "step": 273440 }, { "epoch": 0.71, "learning_rate": 0.00019367672332229943, "loss": 0.0141, "step": 273450 }, { "epoch": 0.71, "learning_rate": 0.00019367283510592797, "loss": 0.0131, "step": 273460 }, { "epoch": 0.71, "learning_rate": 0.00019366894688955649, "loss": 0.0128, "step": 273470 }, { "epoch": 0.71, "learning_rate": 0.00019366505867318503, "loss": 0.0148, "step": 273480 }, { "epoch": 0.71, "learning_rate": 0.00019366117045681357, "loss": 0.0143, "step": 273490 }, { "epoch": 0.71, "learning_rate": 0.0001936572822404421, "loss": 0.0173, "step": 273500 }, { "epoch": 0.71, "learning_rate": 0.00019365339402407063, "loss": 0.0184, "step": 273510 }, { "epoch": 0.71, "learning_rate": 0.00019364950580769917, "loss": 0.0158, "step": 273520 }, { "epoch": 0.71, "learning_rate": 0.0001936456175913277, "loss": 0.018, "step": 273530 }, { "epoch": 0.71, "learning_rate": 0.00019364172937495625, "loss": 0.0137, "step": 273540 }, { "epoch": 0.71, "learning_rate": 0.00019363784115858476, "loss": 0.014, "step": 273550 }, { "epoch": 0.71, "learning_rate": 0.0001936339529422133, "loss": 0.0133, "step": 273560 }, { "epoch": 0.71, "learning_rate": 0.00019363006472584185, "loss": 0.018, "step": 273570 }, { "epoch": 0.71, "learning_rate": 0.0001936261765094704, "loss": 0.0163, "step": 273580 }, { "epoch": 0.71, "learning_rate": 0.0001936222882930989, "loss": 0.0159, "step": 273590 }, { "epoch": 0.71, "learning_rate": 0.00019361840007672745, "loss": 0.0156, "step": 273600 }, { "epoch": 0.71, "learning_rate": 0.00019361451186035601, "loss": 0.0155, "step": 273610 }, { "epoch": 0.71, "learning_rate": 0.00019361062364398453, "loss": 0.0124, "step": 273620 }, { "epoch": 0.71, "learning_rate": 0.00019360673542761307, "loss": 0.015, "step": 273630 }, { "epoch": 0.71, "learning_rate": 0.00019360284721124158, "loss": 0.014, "step": 273640 }, { "epoch": 0.71, "learning_rate": 0.00019359895899487015, "loss": 0.0127, "step": 273650 }, { "epoch": 0.71, "learning_rate": 0.00019359507077849867, "loss": 0.0163, "step": 273660 }, { "epoch": 0.71, "learning_rate": 0.0001935911825621272, "loss": 0.0132, "step": 273670 }, { "epoch": 0.71, "learning_rate": 0.00019358729434575572, "loss": 0.0141, "step": 273680 }, { "epoch": 0.71, "learning_rate": 0.00019358340612938427, "loss": 0.014, "step": 273690 }, { "epoch": 0.71, "learning_rate": 0.0001935795179130128, "loss": 0.0134, "step": 273700 }, { "epoch": 0.71, "learning_rate": 0.00019357562969664135, "loss": 0.0131, "step": 273710 }, { "epoch": 0.71, "learning_rate": 0.00019357174148026986, "loss": 0.0127, "step": 273720 }, { "epoch": 0.71, "learning_rate": 0.0001935678532638984, "loss": 0.0121, "step": 273730 }, { "epoch": 0.71, "learning_rate": 0.00019356396504752695, "loss": 0.0169, "step": 273740 }, { "epoch": 0.71, "learning_rate": 0.0001935600768311555, "loss": 0.0152, "step": 273750 }, { "epoch": 0.71, "learning_rate": 0.000193556188614784, "loss": 0.0191, "step": 273760 }, { "epoch": 0.71, "learning_rate": 0.00019355230039841254, "loss": 0.0187, "step": 273770 }, { "epoch": 0.71, "learning_rate": 0.00019354841218204111, "loss": 0.0146, "step": 273780 }, { "epoch": 0.71, "learning_rate": 0.00019354452396566963, "loss": 0.0126, "step": 273790 }, { "epoch": 0.71, "learning_rate": 0.00019354063574929814, "loss": 0.0115, "step": 273800 }, { "epoch": 0.71, "learning_rate": 0.00019353674753292668, "loss": 0.0153, "step": 273810 }, { "epoch": 0.71, "learning_rate": 0.00019353285931655525, "loss": 0.0149, "step": 273820 }, { "epoch": 0.71, "learning_rate": 0.00019352897110018377, "loss": 0.0149, "step": 273830 }, { "epoch": 0.71, "learning_rate": 0.0001935250828838123, "loss": 0.0197, "step": 273840 }, { "epoch": 0.71, "learning_rate": 0.00019352119466744082, "loss": 0.0147, "step": 273850 }, { "epoch": 0.71, "learning_rate": 0.0001935173064510694, "loss": 0.0146, "step": 273860 }, { "epoch": 0.71, "learning_rate": 0.0001935134182346979, "loss": 0.0153, "step": 273870 }, { "epoch": 0.71, "learning_rate": 0.00019350953001832645, "loss": 0.0176, "step": 273880 }, { "epoch": 0.71, "learning_rate": 0.00019350564180195496, "loss": 0.0145, "step": 273890 }, { "epoch": 0.71, "learning_rate": 0.00019350175358558353, "loss": 0.0156, "step": 273900 }, { "epoch": 0.71, "learning_rate": 0.00019349786536921205, "loss": 0.0146, "step": 273910 }, { "epoch": 0.71, "learning_rate": 0.0001934939771528406, "loss": 0.0158, "step": 273920 }, { "epoch": 0.71, "learning_rate": 0.0001934900889364691, "loss": 0.0165, "step": 273930 }, { "epoch": 0.71, "learning_rate": 0.00019348620072009764, "loss": 0.0153, "step": 273940 }, { "epoch": 0.71, "learning_rate": 0.0001934823125037262, "loss": 0.0152, "step": 273950 }, { "epoch": 0.71, "learning_rate": 0.00019347842428735473, "loss": 0.012, "step": 273960 }, { "epoch": 0.71, "learning_rate": 0.00019347453607098324, "loss": 0.0146, "step": 273970 }, { "epoch": 0.71, "learning_rate": 0.00019347064785461178, "loss": 0.0142, "step": 273980 }, { "epoch": 0.71, "learning_rate": 0.00019346675963824035, "loss": 0.0166, "step": 273990 }, { "epoch": 0.71, "learning_rate": 0.00019346287142186887, "loss": 0.0154, "step": 274000 }, { "epoch": 0.71, "eval_cer": 0.8817334783357197, "eval_loss": 0.01036932785063982, "eval_runtime": 107.9436, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 274000 }, { "epoch": 0.71, "learning_rate": 0.0001934589832054974, "loss": 0.0154, "step": 274010 }, { "epoch": 0.71, "learning_rate": 0.00019345509498912592, "loss": 0.0133, "step": 274020 }, { "epoch": 0.71, "learning_rate": 0.0001934512067727545, "loss": 0.0137, "step": 274030 }, { "epoch": 0.71, "learning_rate": 0.000193447318556383, "loss": 0.0134, "step": 274040 }, { "epoch": 0.71, "learning_rate": 0.00019344343034001155, "loss": 0.0189, "step": 274050 }, { "epoch": 0.71, "learning_rate": 0.00019343954212364006, "loss": 0.015, "step": 274060 }, { "epoch": 0.71, "learning_rate": 0.00019343565390726863, "loss": 0.0151, "step": 274070 }, { "epoch": 0.71, "learning_rate": 0.00019343176569089715, "loss": 0.0122, "step": 274080 }, { "epoch": 0.71, "learning_rate": 0.0001934278774745257, "loss": 0.0124, "step": 274090 }, { "epoch": 0.71, "learning_rate": 0.0001934239892581542, "loss": 0.0174, "step": 274100 }, { "epoch": 0.71, "learning_rate": 0.00019342010104178277, "loss": 0.0207, "step": 274110 }, { "epoch": 0.71, "learning_rate": 0.00019341621282541129, "loss": 0.0154, "step": 274120 }, { "epoch": 0.71, "learning_rate": 0.00019341232460903983, "loss": 0.0145, "step": 274130 }, { "epoch": 0.71, "learning_rate": 0.00019340843639266834, "loss": 0.012, "step": 274140 }, { "epoch": 0.71, "learning_rate": 0.0001934045481762969, "loss": 0.0139, "step": 274150 }, { "epoch": 0.71, "learning_rate": 0.00019340065995992545, "loss": 0.0144, "step": 274160 }, { "epoch": 0.71, "learning_rate": 0.00019339677174355397, "loss": 0.0143, "step": 274170 }, { "epoch": 0.71, "learning_rate": 0.0001933928835271825, "loss": 0.0157, "step": 274180 }, { "epoch": 0.71, "learning_rate": 0.00019338899531081102, "loss": 0.0167, "step": 274190 }, { "epoch": 0.71, "learning_rate": 0.0001933851070944396, "loss": 0.0115, "step": 274200 }, { "epoch": 0.71, "learning_rate": 0.0001933812188780681, "loss": 0.0149, "step": 274210 }, { "epoch": 0.71, "learning_rate": 0.00019337733066169665, "loss": 0.0145, "step": 274220 }, { "epoch": 0.71, "learning_rate": 0.00019337344244532516, "loss": 0.0144, "step": 274230 }, { "epoch": 0.71, "learning_rate": 0.00019336955422895373, "loss": 0.0159, "step": 274240 }, { "epoch": 0.71, "learning_rate": 0.00019336566601258225, "loss": 0.0121, "step": 274250 }, { "epoch": 0.71, "learning_rate": 0.0001933617777962108, "loss": 0.0176, "step": 274260 }, { "epoch": 0.71, "learning_rate": 0.0001933578895798393, "loss": 0.0141, "step": 274270 }, { "epoch": 0.71, "learning_rate": 0.00019335400136346787, "loss": 0.0204, "step": 274280 }, { "epoch": 0.71, "learning_rate": 0.00019335011314709638, "loss": 0.011, "step": 274290 }, { "epoch": 0.71, "learning_rate": 0.00019334622493072493, "loss": 0.0181, "step": 274300 }, { "epoch": 0.71, "learning_rate": 0.00019334233671435344, "loss": 0.0135, "step": 274310 }, { "epoch": 0.71, "learning_rate": 0.000193338448497982, "loss": 0.0202, "step": 274320 }, { "epoch": 0.71, "learning_rate": 0.00019333456028161055, "loss": 0.0159, "step": 274330 }, { "epoch": 0.71, "learning_rate": 0.00019333067206523907, "loss": 0.0115, "step": 274340 }, { "epoch": 0.71, "learning_rate": 0.0001933267838488676, "loss": 0.0143, "step": 274350 }, { "epoch": 0.71, "learning_rate": 0.00019332289563249615, "loss": 0.0153, "step": 274360 }, { "epoch": 0.71, "learning_rate": 0.0001933190074161247, "loss": 0.0131, "step": 274370 }, { "epoch": 0.71, "learning_rate": 0.0001933151191997532, "loss": 0.0159, "step": 274380 }, { "epoch": 0.71, "learning_rate": 0.00019331123098338175, "loss": 0.0124, "step": 274390 }, { "epoch": 0.71, "learning_rate": 0.0001933073427670103, "loss": 0.0156, "step": 274400 }, { "epoch": 0.71, "learning_rate": 0.00019330345455063883, "loss": 0.0146, "step": 274410 }, { "epoch": 0.71, "learning_rate": 0.00019329956633426734, "loss": 0.017, "step": 274420 }, { "epoch": 0.71, "learning_rate": 0.0001932956781178959, "loss": 0.0131, "step": 274430 }, { "epoch": 0.71, "learning_rate": 0.0001932917899015244, "loss": 0.0162, "step": 274440 }, { "epoch": 0.71, "learning_rate": 0.00019328790168515297, "loss": 0.0129, "step": 274450 }, { "epoch": 0.71, "learning_rate": 0.00019328401346878148, "loss": 0.0172, "step": 274460 }, { "epoch": 0.71, "learning_rate": 0.00019328012525241003, "loss": 0.0205, "step": 274470 }, { "epoch": 0.71, "learning_rate": 0.00019327623703603854, "loss": 0.0152, "step": 274480 }, { "epoch": 0.71, "learning_rate": 0.0001932723488196671, "loss": 0.0151, "step": 274490 }, { "epoch": 0.71, "learning_rate": 0.00019326846060329565, "loss": 0.0149, "step": 274500 }, { "epoch": 0.71, "learning_rate": 0.00019326457238692417, "loss": 0.0116, "step": 274510 }, { "epoch": 0.71, "learning_rate": 0.00019326068417055268, "loss": 0.0132, "step": 274520 }, { "epoch": 0.71, "learning_rate": 0.00019325679595418125, "loss": 0.0129, "step": 274530 }, { "epoch": 0.71, "learning_rate": 0.0001932529077378098, "loss": 0.0158, "step": 274540 }, { "epoch": 0.71, "learning_rate": 0.0001932490195214383, "loss": 0.0203, "step": 274550 }, { "epoch": 0.71, "learning_rate": 0.00019324513130506685, "loss": 0.0112, "step": 274560 }, { "epoch": 0.71, "learning_rate": 0.0001932412430886954, "loss": 0.0135, "step": 274570 }, { "epoch": 0.71, "learning_rate": 0.00019323735487232393, "loss": 0.0164, "step": 274580 }, { "epoch": 0.71, "learning_rate": 0.00019323346665595244, "loss": 0.0134, "step": 274590 }, { "epoch": 0.71, "learning_rate": 0.00019322957843958099, "loss": 0.015, "step": 274600 }, { "epoch": 0.71, "learning_rate": 0.00019322569022320953, "loss": 0.0125, "step": 274610 }, { "epoch": 0.71, "learning_rate": 0.00019322180200683807, "loss": 0.0154, "step": 274620 }, { "epoch": 0.71, "learning_rate": 0.00019321791379046658, "loss": 0.014, "step": 274630 }, { "epoch": 0.71, "learning_rate": 0.00019321402557409513, "loss": 0.015, "step": 274640 }, { "epoch": 0.71, "learning_rate": 0.0001932101373577237, "loss": 0.0114, "step": 274650 }, { "epoch": 0.71, "learning_rate": 0.0001932062491413522, "loss": 0.0134, "step": 274660 }, { "epoch": 0.71, "learning_rate": 0.00019320236092498075, "loss": 0.0204, "step": 274670 }, { "epoch": 0.71, "learning_rate": 0.00019319847270860926, "loss": 0.0156, "step": 274680 }, { "epoch": 0.71, "learning_rate": 0.00019319458449223778, "loss": 0.0181, "step": 274690 }, { "epoch": 0.71, "learning_rate": 0.00019319069627586635, "loss": 0.0157, "step": 274700 }, { "epoch": 0.71, "learning_rate": 0.0001931868080594949, "loss": 0.0112, "step": 274710 }, { "epoch": 0.71, "learning_rate": 0.0001931829198431234, "loss": 0.0162, "step": 274720 }, { "epoch": 0.71, "learning_rate": 0.00019317903162675195, "loss": 0.0156, "step": 274730 }, { "epoch": 0.71, "learning_rate": 0.0001931751434103805, "loss": 0.0152, "step": 274740 }, { "epoch": 0.71, "learning_rate": 0.00019317125519400903, "loss": 0.0109, "step": 274750 }, { "epoch": 0.71, "learning_rate": 0.00019316736697763754, "loss": 0.012, "step": 274760 }, { "epoch": 0.71, "learning_rate": 0.00019316347876126609, "loss": 0.0155, "step": 274770 }, { "epoch": 0.71, "learning_rate": 0.00019315959054489463, "loss": 0.0136, "step": 274780 }, { "epoch": 0.71, "learning_rate": 0.00019315570232852317, "loss": 0.0151, "step": 274790 }, { "epoch": 0.71, "learning_rate": 0.00019315181411215168, "loss": 0.0123, "step": 274800 }, { "epoch": 0.71, "learning_rate": 0.00019314792589578022, "loss": 0.0134, "step": 274810 }, { "epoch": 0.71, "learning_rate": 0.0001931440376794088, "loss": 0.0135, "step": 274820 }, { "epoch": 0.71, "learning_rate": 0.0001931401494630373, "loss": 0.0113, "step": 274830 }, { "epoch": 0.71, "learning_rate": 0.00019313626124666582, "loss": 0.0161, "step": 274840 }, { "epoch": 0.71, "learning_rate": 0.00019313237303029436, "loss": 0.0119, "step": 274850 }, { "epoch": 0.71, "learning_rate": 0.00019312848481392293, "loss": 0.0173, "step": 274860 }, { "epoch": 0.71, "learning_rate": 0.00019312459659755145, "loss": 0.0141, "step": 274870 }, { "epoch": 0.71, "learning_rate": 0.00019312070838118, "loss": 0.0147, "step": 274880 }, { "epoch": 0.71, "learning_rate": 0.0001931168201648085, "loss": 0.0136, "step": 274890 }, { "epoch": 0.71, "learning_rate": 0.00019311293194843707, "loss": 0.0179, "step": 274900 }, { "epoch": 0.71, "learning_rate": 0.0001931090437320656, "loss": 0.0158, "step": 274910 }, { "epoch": 0.71, "learning_rate": 0.00019310515551569413, "loss": 0.016, "step": 274920 }, { "epoch": 0.71, "learning_rate": 0.00019310126729932264, "loss": 0.0195, "step": 274930 }, { "epoch": 0.71, "learning_rate": 0.00019309737908295118, "loss": 0.0148, "step": 274940 }, { "epoch": 0.71, "learning_rate": 0.00019309349086657973, "loss": 0.0162, "step": 274950 }, { "epoch": 0.71, "learning_rate": 0.00019308960265020827, "loss": 0.0121, "step": 274960 }, { "epoch": 0.71, "learning_rate": 0.00019308571443383678, "loss": 0.0135, "step": 274970 }, { "epoch": 0.71, "learning_rate": 0.00019308182621746532, "loss": 0.0307, "step": 274980 }, { "epoch": 0.71, "learning_rate": 0.00019307793800109387, "loss": 0.0164, "step": 274990 }, { "epoch": 0.71, "learning_rate": 0.0001930740497847224, "loss": 0.0202, "step": 275000 }, { "epoch": 0.71, "eval_cer": 0.8818006609085604, "eval_loss": 0.010618000291287899, "eval_runtime": 108.0775, "eval_samples_per_second": 18.505, "eval_steps_per_second": 4.626, "step": 275000 }, { "epoch": 0.71, "learning_rate": 0.00019307016156835092, "loss": 0.0244, "step": 275010 }, { "epoch": 0.71, "learning_rate": 0.00019306627335197946, "loss": 0.0135, "step": 275020 }, { "epoch": 0.71, "learning_rate": 0.00019306238513560803, "loss": 0.0144, "step": 275030 }, { "epoch": 0.71, "learning_rate": 0.00019305849691923655, "loss": 0.0161, "step": 275040 }, { "epoch": 0.71, "learning_rate": 0.0001930546087028651, "loss": 0.0146, "step": 275050 }, { "epoch": 0.71, "learning_rate": 0.0001930507204864936, "loss": 0.0172, "step": 275060 }, { "epoch": 0.71, "learning_rate": 0.00019304683227012217, "loss": 0.0122, "step": 275070 }, { "epoch": 0.71, "learning_rate": 0.00019304294405375069, "loss": 0.0158, "step": 275080 }, { "epoch": 0.71, "learning_rate": 0.00019303905583737923, "loss": 0.0159, "step": 275090 }, { "epoch": 0.71, "learning_rate": 0.00019303516762100774, "loss": 0.017, "step": 275100 }, { "epoch": 0.71, "learning_rate": 0.0001930312794046363, "loss": 0.0155, "step": 275110 }, { "epoch": 0.71, "learning_rate": 0.00019302739118826483, "loss": 0.0143, "step": 275120 }, { "epoch": 0.71, "learning_rate": 0.00019302350297189337, "loss": 0.0152, "step": 275130 }, { "epoch": 0.71, "learning_rate": 0.00019301961475552188, "loss": 0.0164, "step": 275140 }, { "epoch": 0.71, "learning_rate": 0.00019301572653915045, "loss": 0.014, "step": 275150 }, { "epoch": 0.71, "learning_rate": 0.00019301183832277897, "loss": 0.0137, "step": 275160 }, { "epoch": 0.71, "learning_rate": 0.0001930079501064075, "loss": 0.014, "step": 275170 }, { "epoch": 0.71, "learning_rate": 0.00019300406189003602, "loss": 0.0117, "step": 275180 }, { "epoch": 0.71, "learning_rate": 0.00019300017367366456, "loss": 0.0204, "step": 275190 }, { "epoch": 0.71, "learning_rate": 0.00019299628545729313, "loss": 0.0158, "step": 275200 }, { "epoch": 0.71, "learning_rate": 0.00019299239724092165, "loss": 0.0152, "step": 275210 }, { "epoch": 0.71, "learning_rate": 0.0001929885090245502, "loss": 0.0157, "step": 275220 }, { "epoch": 0.71, "learning_rate": 0.0001929846208081787, "loss": 0.0147, "step": 275230 }, { "epoch": 0.71, "learning_rate": 0.00019298073259180727, "loss": 0.0118, "step": 275240 }, { "epoch": 0.71, "learning_rate": 0.00019297684437543579, "loss": 0.0152, "step": 275250 }, { "epoch": 0.71, "learning_rate": 0.00019297295615906433, "loss": 0.0129, "step": 275260 }, { "epoch": 0.71, "learning_rate": 0.00019296906794269284, "loss": 0.016, "step": 275270 }, { "epoch": 0.71, "learning_rate": 0.0001929651797263214, "loss": 0.018, "step": 275280 }, { "epoch": 0.71, "learning_rate": 0.00019296129150994993, "loss": 0.0134, "step": 275290 }, { "epoch": 0.71, "learning_rate": 0.00019295740329357847, "loss": 0.0156, "step": 275300 }, { "epoch": 0.71, "learning_rate": 0.00019295351507720698, "loss": 0.0179, "step": 275310 }, { "epoch": 0.71, "learning_rate": 0.00019294962686083555, "loss": 0.0143, "step": 275320 }, { "epoch": 0.71, "learning_rate": 0.00019294573864446406, "loss": 0.0112, "step": 275330 }, { "epoch": 0.71, "learning_rate": 0.0001929418504280926, "loss": 0.0134, "step": 275340 }, { "epoch": 0.71, "learning_rate": 0.00019293796221172112, "loss": 0.0138, "step": 275350 }, { "epoch": 0.71, "learning_rate": 0.0001929340739953497, "loss": 0.0151, "step": 275360 }, { "epoch": 0.71, "learning_rate": 0.00019293018577897823, "loss": 0.0135, "step": 275370 }, { "epoch": 0.71, "learning_rate": 0.00019292629756260675, "loss": 0.0175, "step": 275380 }, { "epoch": 0.71, "learning_rate": 0.00019292240934623526, "loss": 0.0138, "step": 275390 }, { "epoch": 0.71, "learning_rate": 0.0001929185211298638, "loss": 0.013, "step": 275400 }, { "epoch": 0.71, "learning_rate": 0.00019291463291349237, "loss": 0.0146, "step": 275410 }, { "epoch": 0.71, "learning_rate": 0.00019291074469712089, "loss": 0.0122, "step": 275420 }, { "epoch": 0.71, "learning_rate": 0.00019290685648074943, "loss": 0.0157, "step": 275430 }, { "epoch": 0.71, "learning_rate": 0.00019290296826437794, "loss": 0.0152, "step": 275440 }, { "epoch": 0.71, "learning_rate": 0.0001928990800480065, "loss": 0.0212, "step": 275450 }, { "epoch": 0.71, "learning_rate": 0.00019289519183163502, "loss": 0.0204, "step": 275460 }, { "epoch": 0.71, "learning_rate": 0.00019289130361526357, "loss": 0.0127, "step": 275470 }, { "epoch": 0.71, "learning_rate": 0.00019288741539889208, "loss": 0.0152, "step": 275480 }, { "epoch": 0.71, "learning_rate": 0.00019288352718252065, "loss": 0.0152, "step": 275490 }, { "epoch": 0.71, "learning_rate": 0.00019287963896614916, "loss": 0.0131, "step": 275500 }, { "epoch": 0.71, "learning_rate": 0.0001928757507497777, "loss": 0.0161, "step": 275510 }, { "epoch": 0.71, "learning_rate": 0.00019287186253340622, "loss": 0.0137, "step": 275520 }, { "epoch": 0.71, "learning_rate": 0.0001928679743170348, "loss": 0.0152, "step": 275530 }, { "epoch": 0.71, "learning_rate": 0.00019286408610066333, "loss": 0.0138, "step": 275540 }, { "epoch": 0.71, "learning_rate": 0.00019286019788429185, "loss": 0.0133, "step": 275550 }, { "epoch": 0.71, "learning_rate": 0.00019285630966792036, "loss": 0.0131, "step": 275560 }, { "epoch": 0.71, "learning_rate": 0.00019285242145154893, "loss": 0.0162, "step": 275570 }, { "epoch": 0.71, "learning_rate": 0.00019284853323517747, "loss": 0.0157, "step": 275580 }, { "epoch": 0.71, "learning_rate": 0.00019284464501880598, "loss": 0.0151, "step": 275590 }, { "epoch": 0.71, "learning_rate": 0.00019284075680243453, "loss": 0.0149, "step": 275600 }, { "epoch": 0.71, "learning_rate": 0.00019283686858606307, "loss": 0.0128, "step": 275610 }, { "epoch": 0.71, "learning_rate": 0.0001928329803696916, "loss": 0.0158, "step": 275620 }, { "epoch": 0.71, "learning_rate": 0.00019282909215332012, "loss": 0.0147, "step": 275630 }, { "epoch": 0.71, "learning_rate": 0.00019282520393694867, "loss": 0.0178, "step": 275640 }, { "epoch": 0.71, "learning_rate": 0.00019282131572057718, "loss": 0.0128, "step": 275650 }, { "epoch": 0.71, "learning_rate": 0.00019281742750420575, "loss": 0.0148, "step": 275660 }, { "epoch": 0.71, "learning_rate": 0.00019281353928783426, "loss": 0.013, "step": 275670 }, { "epoch": 0.71, "learning_rate": 0.0001928096510714628, "loss": 0.0146, "step": 275680 }, { "epoch": 0.71, "learning_rate": 0.00019280576285509132, "loss": 0.0145, "step": 275690 }, { "epoch": 0.71, "learning_rate": 0.0001928018746387199, "loss": 0.0121, "step": 275700 }, { "epoch": 0.71, "learning_rate": 0.0001927979864223484, "loss": 0.0124, "step": 275710 }, { "epoch": 0.71, "learning_rate": 0.00019279409820597694, "loss": 0.0169, "step": 275720 }, { "epoch": 0.71, "learning_rate": 0.00019279020998960546, "loss": 0.0141, "step": 275730 }, { "epoch": 0.71, "learning_rate": 0.00019278632177323403, "loss": 0.0167, "step": 275740 }, { "epoch": 0.71, "learning_rate": 0.00019278243355686257, "loss": 0.0135, "step": 275750 }, { "epoch": 0.71, "learning_rate": 0.00019277854534049108, "loss": 0.0145, "step": 275760 }, { "epoch": 0.71, "learning_rate": 0.00019277465712411963, "loss": 0.0147, "step": 275770 }, { "epoch": 0.71, "learning_rate": 0.00019277076890774817, "loss": 0.0132, "step": 275780 }, { "epoch": 0.71, "learning_rate": 0.0001927668806913767, "loss": 0.0141, "step": 275790 }, { "epoch": 0.71, "learning_rate": 0.00019276299247500522, "loss": 0.0181, "step": 275800 }, { "epoch": 0.71, "learning_rate": 0.00019275910425863377, "loss": 0.0141, "step": 275810 }, { "epoch": 0.71, "learning_rate": 0.0001927552160422623, "loss": 0.0164, "step": 275820 }, { "epoch": 0.71, "learning_rate": 0.00019275132782589085, "loss": 0.0157, "step": 275830 }, { "epoch": 0.72, "learning_rate": 0.00019274743960951936, "loss": 0.0142, "step": 275840 }, { "epoch": 0.72, "learning_rate": 0.0001927435513931479, "loss": 0.0161, "step": 275850 }, { "epoch": 0.72, "learning_rate": 0.00019273966317677647, "loss": 0.0143, "step": 275860 }, { "epoch": 0.72, "learning_rate": 0.000192735774960405, "loss": 0.0138, "step": 275870 }, { "epoch": 0.72, "learning_rate": 0.0001927318867440335, "loss": 0.0173, "step": 275880 }, { "epoch": 0.72, "learning_rate": 0.00019272799852766204, "loss": 0.0144, "step": 275890 }, { "epoch": 0.72, "learning_rate": 0.00019272411031129056, "loss": 0.02, "step": 275900 }, { "epoch": 0.72, "learning_rate": 0.00019272022209491913, "loss": 0.016, "step": 275910 }, { "epoch": 0.72, "learning_rate": 0.00019271633387854767, "loss": 0.0175, "step": 275920 }, { "epoch": 0.72, "learning_rate": 0.00019271244566217618, "loss": 0.0241, "step": 275930 }, { "epoch": 0.72, "learning_rate": 0.00019270855744580473, "loss": 0.017, "step": 275940 }, { "epoch": 0.72, "learning_rate": 0.00019270466922943327, "loss": 0.0132, "step": 275950 }, { "epoch": 0.72, "learning_rate": 0.0001927007810130618, "loss": 0.0133, "step": 275960 }, { "epoch": 0.72, "learning_rate": 0.00019269689279669032, "loss": 0.0119, "step": 275970 }, { "epoch": 0.72, "learning_rate": 0.00019269300458031886, "loss": 0.0181, "step": 275980 }, { "epoch": 0.72, "learning_rate": 0.0001926891163639474, "loss": 0.0148, "step": 275990 }, { "epoch": 0.72, "learning_rate": 0.00019268522814757595, "loss": 0.0139, "step": 276000 }, { "epoch": 0.72, "eval_cer": 0.8817124837817071, "eval_loss": 0.010350687429308891, "eval_runtime": 107.9687, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 276000 }, { "epoch": 0.72, "learning_rate": 0.00019268133993120446, "loss": 0.0166, "step": 276010 }, { "epoch": 0.72, "learning_rate": 0.000192677451714833, "loss": 0.0144, "step": 276020 }, { "epoch": 0.72, "learning_rate": 0.00019267356349846155, "loss": 0.0454, "step": 276030 }, { "epoch": 0.72, "learning_rate": 0.0001926696752820901, "loss": 0.0141, "step": 276040 }, { "epoch": 0.72, "learning_rate": 0.0001926657870657186, "loss": 0.0161, "step": 276050 }, { "epoch": 0.72, "learning_rate": 0.00019266189884934714, "loss": 0.0144, "step": 276060 }, { "epoch": 0.72, "learning_rate": 0.0001926580106329757, "loss": 0.0129, "step": 276070 }, { "epoch": 0.72, "learning_rate": 0.00019265412241660423, "loss": 0.0179, "step": 276080 }, { "epoch": 0.72, "learning_rate": 0.00019265023420023277, "loss": 0.0126, "step": 276090 }, { "epoch": 0.72, "learning_rate": 0.00019264634598386128, "loss": 0.0142, "step": 276100 }, { "epoch": 0.72, "learning_rate": 0.00019264245776748985, "loss": 0.0182, "step": 276110 }, { "epoch": 0.72, "learning_rate": 0.00019263856955111837, "loss": 0.0138, "step": 276120 }, { "epoch": 0.72, "learning_rate": 0.0001926346813347469, "loss": 0.0124, "step": 276130 }, { "epoch": 0.72, "learning_rate": 0.00019263079311837542, "loss": 0.0141, "step": 276140 }, { "epoch": 0.72, "learning_rate": 0.00019262690490200396, "loss": 0.0152, "step": 276150 }, { "epoch": 0.72, "learning_rate": 0.0001926230166856325, "loss": 0.0142, "step": 276160 }, { "epoch": 0.72, "learning_rate": 0.00019261912846926105, "loss": 0.0131, "step": 276170 }, { "epoch": 0.72, "learning_rate": 0.00019261524025288956, "loss": 0.012, "step": 276180 }, { "epoch": 0.72, "learning_rate": 0.0001926113520365181, "loss": 0.0171, "step": 276190 }, { "epoch": 0.72, "learning_rate": 0.00019260746382014665, "loss": 0.0175, "step": 276200 }, { "epoch": 0.72, "learning_rate": 0.0001926035756037752, "loss": 0.0211, "step": 276210 }, { "epoch": 0.72, "learning_rate": 0.0001925996873874037, "loss": 0.0157, "step": 276220 }, { "epoch": 0.72, "learning_rate": 0.00019259579917103224, "loss": 0.0177, "step": 276230 }, { "epoch": 0.72, "learning_rate": 0.0001925919109546608, "loss": 0.0137, "step": 276240 }, { "epoch": 0.72, "learning_rate": 0.00019258802273828933, "loss": 0.017, "step": 276250 }, { "epoch": 0.72, "learning_rate": 0.00019258413452191787, "loss": 0.0149, "step": 276260 }, { "epoch": 0.72, "learning_rate": 0.00019258024630554638, "loss": 0.0169, "step": 276270 }, { "epoch": 0.72, "learning_rate": 0.00019257635808917495, "loss": 0.0116, "step": 276280 }, { "epoch": 0.72, "learning_rate": 0.00019257246987280347, "loss": 0.014, "step": 276290 }, { "epoch": 0.72, "learning_rate": 0.000192568581656432, "loss": 0.0135, "step": 276300 }, { "epoch": 0.72, "learning_rate": 0.00019256469344006052, "loss": 0.0124, "step": 276310 }, { "epoch": 0.72, "learning_rate": 0.0001925608052236891, "loss": 0.0138, "step": 276320 }, { "epoch": 0.72, "learning_rate": 0.0001925569170073176, "loss": 0.0144, "step": 276330 }, { "epoch": 0.72, "learning_rate": 0.00019255302879094615, "loss": 0.0133, "step": 276340 }, { "epoch": 0.72, "learning_rate": 0.00019254914057457466, "loss": 0.0146, "step": 276350 }, { "epoch": 0.72, "learning_rate": 0.00019254525235820323, "loss": 0.0145, "step": 276360 }, { "epoch": 0.72, "learning_rate": 0.00019254136414183174, "loss": 0.0152, "step": 276370 }, { "epoch": 0.72, "learning_rate": 0.00019253747592546029, "loss": 0.0149, "step": 276380 }, { "epoch": 0.72, "learning_rate": 0.0001925335877090888, "loss": 0.0196, "step": 276390 }, { "epoch": 0.72, "learning_rate": 0.00019252969949271734, "loss": 0.0136, "step": 276400 }, { "epoch": 0.72, "learning_rate": 0.0001925258112763459, "loss": 0.0189, "step": 276410 }, { "epoch": 0.72, "learning_rate": 0.00019252192305997443, "loss": 0.0154, "step": 276420 }, { "epoch": 0.72, "learning_rate": 0.00019251803484360294, "loss": 0.0228, "step": 276430 }, { "epoch": 0.72, "learning_rate": 0.00019251414662723148, "loss": 0.0119, "step": 276440 }, { "epoch": 0.72, "learning_rate": 0.00019251025841086005, "loss": 0.0144, "step": 276450 }, { "epoch": 0.72, "learning_rate": 0.00019250637019448857, "loss": 0.0125, "step": 276460 }, { "epoch": 0.72, "learning_rate": 0.0001925024819781171, "loss": 0.0145, "step": 276470 }, { "epoch": 0.72, "learning_rate": 0.00019249859376174562, "loss": 0.018, "step": 276480 }, { "epoch": 0.72, "learning_rate": 0.0001924947055453742, "loss": 0.014, "step": 276490 }, { "epoch": 0.72, "learning_rate": 0.0001924908173290027, "loss": 0.018, "step": 276500 }, { "epoch": 0.72, "learning_rate": 0.00019248692911263125, "loss": 0.0116, "step": 276510 }, { "epoch": 0.72, "learning_rate": 0.00019248304089625976, "loss": 0.0145, "step": 276520 }, { "epoch": 0.72, "learning_rate": 0.00019247915267988833, "loss": 0.0154, "step": 276530 }, { "epoch": 0.72, "learning_rate": 0.00019247526446351684, "loss": 0.0147, "step": 276540 }, { "epoch": 0.72, "learning_rate": 0.00019247137624714539, "loss": 0.0138, "step": 276550 }, { "epoch": 0.72, "learning_rate": 0.0001924674880307739, "loss": 0.0149, "step": 276560 }, { "epoch": 0.72, "learning_rate": 0.00019246359981440247, "loss": 0.0179, "step": 276570 }, { "epoch": 0.72, "learning_rate": 0.00019245971159803098, "loss": 0.0139, "step": 276580 }, { "epoch": 0.72, "learning_rate": 0.00019245582338165952, "loss": 0.0196, "step": 276590 }, { "epoch": 0.72, "learning_rate": 0.00019245193516528804, "loss": 0.0175, "step": 276600 }, { "epoch": 0.72, "learning_rate": 0.0001924480469489166, "loss": 0.0119, "step": 276610 }, { "epoch": 0.72, "learning_rate": 0.00019244415873254515, "loss": 0.0145, "step": 276620 }, { "epoch": 0.72, "learning_rate": 0.00019244027051617366, "loss": 0.0107, "step": 276630 }, { "epoch": 0.72, "learning_rate": 0.0001924363822998022, "loss": 0.018, "step": 276640 }, { "epoch": 0.72, "learning_rate": 0.00019243249408343072, "loss": 0.0154, "step": 276650 }, { "epoch": 0.72, "learning_rate": 0.0001924286058670593, "loss": 0.0161, "step": 276660 }, { "epoch": 0.72, "learning_rate": 0.0001924247176506878, "loss": 0.0137, "step": 276670 }, { "epoch": 0.72, "learning_rate": 0.00019242082943431635, "loss": 0.0173, "step": 276680 }, { "epoch": 0.72, "learning_rate": 0.00019241694121794486, "loss": 0.0189, "step": 276690 }, { "epoch": 0.72, "learning_rate": 0.00019241305300157343, "loss": 0.0155, "step": 276700 }, { "epoch": 0.72, "learning_rate": 0.00019240916478520194, "loss": 0.0168, "step": 276710 }, { "epoch": 0.72, "learning_rate": 0.00019240527656883048, "loss": 0.0179, "step": 276720 }, { "epoch": 0.72, "learning_rate": 0.000192401388352459, "loss": 0.0175, "step": 276730 }, { "epoch": 0.72, "learning_rate": 0.00019239750013608757, "loss": 0.0159, "step": 276740 }, { "epoch": 0.72, "learning_rate": 0.00019239361191971608, "loss": 0.0133, "step": 276750 }, { "epoch": 0.72, "learning_rate": 0.00019238972370334462, "loss": 0.0148, "step": 276760 }, { "epoch": 0.72, "learning_rate": 0.00019238583548697314, "loss": 0.0149, "step": 276770 }, { "epoch": 0.72, "learning_rate": 0.0001923819472706017, "loss": 0.0186, "step": 276780 }, { "epoch": 0.72, "learning_rate": 0.00019237805905423025, "loss": 0.0132, "step": 276790 }, { "epoch": 0.72, "learning_rate": 0.00019237417083785876, "loss": 0.0137, "step": 276800 }, { "epoch": 0.72, "learning_rate": 0.0001923702826214873, "loss": 0.0162, "step": 276810 }, { "epoch": 0.72, "learning_rate": 0.00019236639440511585, "loss": 0.0143, "step": 276820 }, { "epoch": 0.72, "learning_rate": 0.0001923625061887444, "loss": 0.0169, "step": 276830 }, { "epoch": 0.72, "learning_rate": 0.0001923586179723729, "loss": 0.0201, "step": 276840 }, { "epoch": 0.72, "learning_rate": 0.00019235472975600144, "loss": 0.014, "step": 276850 }, { "epoch": 0.72, "learning_rate": 0.00019235084153963, "loss": 0.0176, "step": 276860 }, { "epoch": 0.72, "learning_rate": 0.00019234695332325853, "loss": 0.0142, "step": 276870 }, { "epoch": 0.72, "learning_rate": 0.00019234306510688704, "loss": 0.0142, "step": 276880 }, { "epoch": 0.72, "learning_rate": 0.00019233917689051558, "loss": 0.0135, "step": 276890 }, { "epoch": 0.72, "learning_rate": 0.0001923352886741441, "loss": 0.0165, "step": 276900 }, { "epoch": 0.72, "learning_rate": 0.00019233140045777267, "loss": 0.0167, "step": 276910 }, { "epoch": 0.72, "learning_rate": 0.00019232751224140118, "loss": 0.0155, "step": 276920 }, { "epoch": 0.72, "learning_rate": 0.00019232362402502972, "loss": 0.0172, "step": 276930 }, { "epoch": 0.72, "learning_rate": 0.00019231973580865824, "loss": 0.0227, "step": 276940 }, { "epoch": 0.72, "learning_rate": 0.0001923158475922868, "loss": 0.0176, "step": 276950 }, { "epoch": 0.72, "learning_rate": 0.00019231195937591535, "loss": 0.0158, "step": 276960 }, { "epoch": 0.72, "learning_rate": 0.00019230807115954386, "loss": 0.0134, "step": 276970 }, { "epoch": 0.72, "learning_rate": 0.00019230418294317238, "loss": 0.0152, "step": 276980 }, { "epoch": 0.72, "learning_rate": 0.00019230029472680095, "loss": 0.0171, "step": 276990 }, { "epoch": 0.72, "learning_rate": 0.0001922964065104295, "loss": 0.0138, "step": 277000 }, { "epoch": 0.72, "eval_cer": 0.8817138834186412, "eval_loss": 0.010107412934303284, "eval_runtime": 108.0568, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 277000 }, { "epoch": 0.72, "learning_rate": 0.000192292518294058, "loss": 0.012, "step": 277010 }, { "epoch": 0.72, "learning_rate": 0.00019228863007768654, "loss": 0.0118, "step": 277020 }, { "epoch": 0.72, "learning_rate": 0.00019228474186131509, "loss": 0.0182, "step": 277030 }, { "epoch": 0.72, "learning_rate": 0.00019228085364494363, "loss": 0.0176, "step": 277040 }, { "epoch": 0.72, "learning_rate": 0.00019227696542857214, "loss": 0.0138, "step": 277050 }, { "epoch": 0.72, "learning_rate": 0.00019227307721220068, "loss": 0.0124, "step": 277060 }, { "epoch": 0.72, "learning_rate": 0.00019226918899582923, "loss": 0.0124, "step": 277070 }, { "epoch": 0.72, "learning_rate": 0.00019226530077945777, "loss": 0.0164, "step": 277080 }, { "epoch": 0.72, "learning_rate": 0.00019226141256308628, "loss": 0.0137, "step": 277090 }, { "epoch": 0.72, "learning_rate": 0.00019225752434671482, "loss": 0.0167, "step": 277100 }, { "epoch": 0.72, "learning_rate": 0.0001922536361303434, "loss": 0.0157, "step": 277110 }, { "epoch": 0.72, "learning_rate": 0.0001922497479139719, "loss": 0.0148, "step": 277120 }, { "epoch": 0.72, "learning_rate": 0.00019224585969760045, "loss": 0.0154, "step": 277130 }, { "epoch": 0.72, "learning_rate": 0.00019224197148122896, "loss": 0.0166, "step": 277140 }, { "epoch": 0.72, "learning_rate": 0.00019223808326485748, "loss": 0.0136, "step": 277150 }, { "epoch": 0.72, "learning_rate": 0.00019223419504848605, "loss": 0.0142, "step": 277160 }, { "epoch": 0.72, "learning_rate": 0.0001922303068321146, "loss": 0.015, "step": 277170 }, { "epoch": 0.72, "learning_rate": 0.0001922264186157431, "loss": 0.0166, "step": 277180 }, { "epoch": 0.72, "learning_rate": 0.00019222253039937164, "loss": 0.0163, "step": 277190 }, { "epoch": 0.72, "learning_rate": 0.00019221864218300019, "loss": 0.0165, "step": 277200 }, { "epoch": 0.72, "learning_rate": 0.00019221475396662873, "loss": 0.0167, "step": 277210 }, { "epoch": 0.72, "learning_rate": 0.00019221086575025724, "loss": 0.0196, "step": 277220 }, { "epoch": 0.72, "learning_rate": 0.00019220697753388578, "loss": 0.015, "step": 277230 }, { "epoch": 0.72, "learning_rate": 0.00019220308931751432, "loss": 0.0203, "step": 277240 }, { "epoch": 0.72, "learning_rate": 0.00019219920110114287, "loss": 0.0171, "step": 277250 }, { "epoch": 0.72, "learning_rate": 0.00019219531288477138, "loss": 0.0163, "step": 277260 }, { "epoch": 0.72, "learning_rate": 0.00019219142466839992, "loss": 0.0175, "step": 277270 }, { "epoch": 0.72, "learning_rate": 0.0001921875364520285, "loss": 0.0186, "step": 277280 }, { "epoch": 0.72, "learning_rate": 0.000192183648235657, "loss": 0.011, "step": 277290 }, { "epoch": 0.72, "learning_rate": 0.00019217976001928552, "loss": 0.0144, "step": 277300 }, { "epoch": 0.72, "learning_rate": 0.00019217587180291406, "loss": 0.0161, "step": 277310 }, { "epoch": 0.72, "learning_rate": 0.00019217198358654263, "loss": 0.0131, "step": 277320 }, { "epoch": 0.72, "learning_rate": 0.00019216809537017115, "loss": 0.0124, "step": 277330 }, { "epoch": 0.72, "learning_rate": 0.0001921642071537997, "loss": 0.0137, "step": 277340 }, { "epoch": 0.72, "learning_rate": 0.0001921603189374282, "loss": 0.0142, "step": 277350 }, { "epoch": 0.72, "learning_rate": 0.00019215643072105677, "loss": 0.0115, "step": 277360 }, { "epoch": 0.72, "learning_rate": 0.00019215254250468528, "loss": 0.0148, "step": 277370 }, { "epoch": 0.72, "learning_rate": 0.00019214865428831383, "loss": 0.0119, "step": 277380 }, { "epoch": 0.72, "learning_rate": 0.00019214476607194234, "loss": 0.0178, "step": 277390 }, { "epoch": 0.72, "learning_rate": 0.00019214087785557088, "loss": 0.0169, "step": 277400 }, { "epoch": 0.72, "learning_rate": 0.00019213698963919942, "loss": 0.0159, "step": 277410 }, { "epoch": 0.72, "learning_rate": 0.00019213310142282797, "loss": 0.0169, "step": 277420 }, { "epoch": 0.72, "learning_rate": 0.00019212921320645648, "loss": 0.0174, "step": 277430 }, { "epoch": 0.72, "learning_rate": 0.00019212532499008502, "loss": 0.0124, "step": 277440 }, { "epoch": 0.72, "learning_rate": 0.0001921214367737136, "loss": 0.0172, "step": 277450 }, { "epoch": 0.72, "learning_rate": 0.0001921175485573421, "loss": 0.0123, "step": 277460 }, { "epoch": 0.72, "learning_rate": 0.00019211366034097062, "loss": 0.0134, "step": 277470 }, { "epoch": 0.72, "learning_rate": 0.00019210977212459916, "loss": 0.0139, "step": 277480 }, { "epoch": 0.72, "learning_rate": 0.00019210588390822773, "loss": 0.0184, "step": 277490 }, { "epoch": 0.72, "learning_rate": 0.00019210199569185624, "loss": 0.0141, "step": 277500 }, { "epoch": 0.72, "learning_rate": 0.0001920981074754848, "loss": 0.0144, "step": 277510 }, { "epoch": 0.72, "learning_rate": 0.0001920942192591133, "loss": 0.0127, "step": 277520 }, { "epoch": 0.72, "learning_rate": 0.00019209033104274187, "loss": 0.0123, "step": 277530 }, { "epoch": 0.72, "learning_rate": 0.00019208644282637038, "loss": 0.0163, "step": 277540 }, { "epoch": 0.72, "learning_rate": 0.00019208255460999893, "loss": 0.0171, "step": 277550 }, { "epoch": 0.72, "learning_rate": 0.00019207866639362744, "loss": 0.0145, "step": 277560 }, { "epoch": 0.72, "learning_rate": 0.000192074778177256, "loss": 0.012, "step": 277570 }, { "epoch": 0.72, "learning_rate": 0.00019207088996088452, "loss": 0.0165, "step": 277580 }, { "epoch": 0.72, "learning_rate": 0.00019206700174451307, "loss": 0.0164, "step": 277590 }, { "epoch": 0.72, "learning_rate": 0.00019206311352814158, "loss": 0.0165, "step": 277600 }, { "epoch": 0.72, "learning_rate": 0.00019205922531177015, "loss": 0.0204, "step": 277610 }, { "epoch": 0.72, "learning_rate": 0.00019205533709539866, "loss": 0.0124, "step": 277620 }, { "epoch": 0.72, "learning_rate": 0.0001920514488790272, "loss": 0.0147, "step": 277630 }, { "epoch": 0.72, "learning_rate": 0.00019204756066265572, "loss": 0.0125, "step": 277640 }, { "epoch": 0.72, "learning_rate": 0.00019204367244628426, "loss": 0.0127, "step": 277650 }, { "epoch": 0.72, "learning_rate": 0.00019203978422991283, "loss": 0.0158, "step": 277660 }, { "epoch": 0.72, "learning_rate": 0.00019203589601354134, "loss": 0.0138, "step": 277670 }, { "epoch": 0.72, "learning_rate": 0.00019203200779716989, "loss": 0.0154, "step": 277680 }, { "epoch": 0.72, "learning_rate": 0.0001920281195807984, "loss": 0.0184, "step": 277690 }, { "epoch": 0.72, "learning_rate": 0.00019202423136442697, "loss": 0.0141, "step": 277700 }, { "epoch": 0.72, "learning_rate": 0.00019202034314805548, "loss": 0.0165, "step": 277710 }, { "epoch": 0.72, "learning_rate": 0.00019201645493168403, "loss": 0.0154, "step": 277720 }, { "epoch": 0.72, "learning_rate": 0.00019201256671531254, "loss": 0.0163, "step": 277730 }, { "epoch": 0.72, "learning_rate": 0.0001920086784989411, "loss": 0.0162, "step": 277740 }, { "epoch": 0.72, "learning_rate": 0.00019200479028256962, "loss": 0.0169, "step": 277750 }, { "epoch": 0.72, "learning_rate": 0.00019200090206619816, "loss": 0.0128, "step": 277760 }, { "epoch": 0.72, "learning_rate": 0.00019199701384982668, "loss": 0.0167, "step": 277770 }, { "epoch": 0.72, "learning_rate": 0.00019199312563345525, "loss": 0.0165, "step": 277780 }, { "epoch": 0.72, "learning_rate": 0.00019198923741708376, "loss": 0.0121, "step": 277790 }, { "epoch": 0.72, "learning_rate": 0.0001919853492007123, "loss": 0.0131, "step": 277800 }, { "epoch": 0.72, "learning_rate": 0.00019198146098434082, "loss": 0.0132, "step": 277810 }, { "epoch": 0.72, "learning_rate": 0.0001919775727679694, "loss": 0.0108, "step": 277820 }, { "epoch": 0.72, "learning_rate": 0.00019197368455159793, "loss": 0.0165, "step": 277830 }, { "epoch": 0.72, "learning_rate": 0.00019196979633522644, "loss": 0.0148, "step": 277840 }, { "epoch": 0.72, "learning_rate": 0.00019196590811885499, "loss": 0.0133, "step": 277850 }, { "epoch": 0.72, "learning_rate": 0.00019196201990248353, "loss": 0.0137, "step": 277860 }, { "epoch": 0.72, "learning_rate": 0.00019195813168611207, "loss": 0.0128, "step": 277870 }, { "epoch": 0.72, "learning_rate": 0.00019195424346974058, "loss": 0.0159, "step": 277880 }, { "epoch": 0.72, "learning_rate": 0.00019195035525336912, "loss": 0.0165, "step": 277890 }, { "epoch": 0.72, "learning_rate": 0.00019194646703699764, "loss": 0.0209, "step": 277900 }, { "epoch": 0.72, "learning_rate": 0.0001919425788206262, "loss": 0.0189, "step": 277910 }, { "epoch": 0.72, "learning_rate": 0.00019193869060425472, "loss": 0.0159, "step": 277920 }, { "epoch": 0.72, "learning_rate": 0.00019193480238788326, "loss": 0.0148, "step": 277930 }, { "epoch": 0.72, "learning_rate": 0.00019193091417151178, "loss": 0.0143, "step": 277940 }, { "epoch": 0.72, "learning_rate": 0.00019192702595514035, "loss": 0.0146, "step": 277950 }, { "epoch": 0.72, "learning_rate": 0.00019192313773876886, "loss": 0.0161, "step": 277960 }, { "epoch": 0.72, "learning_rate": 0.0001919192495223974, "loss": 0.0136, "step": 277970 }, { "epoch": 0.72, "learning_rate": 0.00019191536130602592, "loss": 0.0156, "step": 277980 }, { "epoch": 0.72, "learning_rate": 0.0001919114730896545, "loss": 0.0179, "step": 277990 }, { "epoch": 0.72, "learning_rate": 0.00019190758487328303, "loss": 0.0139, "step": 278000 }, { "epoch": 0.72, "eval_cer": 0.8817334783357197, "eval_loss": 0.010161010548472404, "eval_runtime": 108.0178, "eval_samples_per_second": 18.515, "eval_steps_per_second": 4.629, "step": 278000 }, { "epoch": 0.72, "learning_rate": 0.00019190369665691154, "loss": 0.0165, "step": 278010 }, { "epoch": 0.72, "learning_rate": 0.00019189980844054006, "loss": 0.0169, "step": 278020 }, { "epoch": 0.72, "learning_rate": 0.00019189592022416863, "loss": 0.0142, "step": 278030 }, { "epoch": 0.72, "learning_rate": 0.00019189203200779717, "loss": 0.0107, "step": 278040 }, { "epoch": 0.72, "learning_rate": 0.00019188814379142568, "loss": 0.0135, "step": 278050 }, { "epoch": 0.72, "learning_rate": 0.00019188425557505422, "loss": 0.0125, "step": 278060 }, { "epoch": 0.72, "learning_rate": 0.00019188036735868277, "loss": 0.0164, "step": 278070 }, { "epoch": 0.72, "learning_rate": 0.0001918764791423113, "loss": 0.0132, "step": 278080 }, { "epoch": 0.72, "learning_rate": 0.00019187259092593982, "loss": 0.0191, "step": 278090 }, { "epoch": 0.72, "learning_rate": 0.00019186870270956836, "loss": 0.0155, "step": 278100 }, { "epoch": 0.72, "learning_rate": 0.0001918648144931969, "loss": 0.0146, "step": 278110 }, { "epoch": 0.72, "learning_rate": 0.00019186092627682545, "loss": 0.0122, "step": 278120 }, { "epoch": 0.72, "learning_rate": 0.00019185703806045396, "loss": 0.0182, "step": 278130 }, { "epoch": 0.72, "learning_rate": 0.0001918531498440825, "loss": 0.0146, "step": 278140 }, { "epoch": 0.72, "learning_rate": 0.00019184926162771102, "loss": 0.0137, "step": 278150 }, { "epoch": 0.72, "learning_rate": 0.00019184537341133959, "loss": 0.0163, "step": 278160 }, { "epoch": 0.72, "learning_rate": 0.0001918414851949681, "loss": 0.0163, "step": 278170 }, { "epoch": 0.72, "learning_rate": 0.00019183759697859664, "loss": 0.0123, "step": 278180 }, { "epoch": 0.72, "learning_rate": 0.00019183370876222516, "loss": 0.0177, "step": 278190 }, { "epoch": 0.72, "learning_rate": 0.00019182982054585373, "loss": 0.0125, "step": 278200 }, { "epoch": 0.72, "learning_rate": 0.00019182593232948227, "loss": 0.0119, "step": 278210 }, { "epoch": 0.72, "learning_rate": 0.00019182204411311078, "loss": 0.0114, "step": 278220 }, { "epoch": 0.72, "learning_rate": 0.00019181815589673932, "loss": 0.0117, "step": 278230 }, { "epoch": 0.72, "learning_rate": 0.00019181426768036787, "loss": 0.0173, "step": 278240 }, { "epoch": 0.72, "learning_rate": 0.0001918103794639964, "loss": 0.0125, "step": 278250 }, { "epoch": 0.72, "learning_rate": 0.00019180649124762492, "loss": 0.0133, "step": 278260 }, { "epoch": 0.72, "learning_rate": 0.00019180260303125346, "loss": 0.0144, "step": 278270 }, { "epoch": 0.72, "learning_rate": 0.000191798714814882, "loss": 0.0141, "step": 278280 }, { "epoch": 0.72, "learning_rate": 0.00019179482659851055, "loss": 0.0171, "step": 278290 }, { "epoch": 0.72, "learning_rate": 0.00019179093838213906, "loss": 0.0188, "step": 278300 }, { "epoch": 0.72, "learning_rate": 0.0001917870501657676, "loss": 0.0138, "step": 278310 }, { "epoch": 0.72, "learning_rate": 0.00019178316194939617, "loss": 0.0136, "step": 278320 }, { "epoch": 0.72, "learning_rate": 0.00019177927373302469, "loss": 0.015, "step": 278330 }, { "epoch": 0.72, "learning_rate": 0.0001917753855166532, "loss": 0.0151, "step": 278340 }, { "epoch": 0.72, "learning_rate": 0.00019177149730028174, "loss": 0.0126, "step": 278350 }, { "epoch": 0.72, "learning_rate": 0.0001917676090839103, "loss": 0.0107, "step": 278360 }, { "epoch": 0.72, "learning_rate": 0.00019176372086753883, "loss": 0.0143, "step": 278370 }, { "epoch": 0.72, "learning_rate": 0.00019175983265116737, "loss": 0.0163, "step": 278380 }, { "epoch": 0.72, "learning_rate": 0.00019175594443479588, "loss": 0.0155, "step": 278390 }, { "epoch": 0.72, "learning_rate": 0.00019175205621842442, "loss": 0.0142, "step": 278400 }, { "epoch": 0.72, "learning_rate": 0.00019174816800205296, "loss": 0.013, "step": 278410 }, { "epoch": 0.72, "learning_rate": 0.0001917442797856815, "loss": 0.0151, "step": 278420 }, { "epoch": 0.72, "learning_rate": 0.00019174039156931002, "loss": 0.0183, "step": 278430 }, { "epoch": 0.72, "learning_rate": 0.00019173650335293856, "loss": 0.015, "step": 278440 }, { "epoch": 0.72, "learning_rate": 0.0001917326151365671, "loss": 0.0162, "step": 278450 }, { "epoch": 0.72, "learning_rate": 0.00019172872692019565, "loss": 0.0141, "step": 278460 }, { "epoch": 0.72, "learning_rate": 0.00019172483870382416, "loss": 0.0145, "step": 278470 }, { "epoch": 0.72, "learning_rate": 0.0001917209504874527, "loss": 0.0138, "step": 278480 }, { "epoch": 0.72, "learning_rate": 0.00019171706227108124, "loss": 0.0133, "step": 278490 }, { "epoch": 0.72, "learning_rate": 0.00019171317405470979, "loss": 0.013, "step": 278500 }, { "epoch": 0.72, "learning_rate": 0.0001917092858383383, "loss": 0.0161, "step": 278510 }, { "epoch": 0.72, "learning_rate": 0.00019170539762196684, "loss": 0.0164, "step": 278520 }, { "epoch": 0.72, "learning_rate": 0.0001917015094055954, "loss": 0.0134, "step": 278530 }, { "epoch": 0.72, "learning_rate": 0.00019169762118922392, "loss": 0.0197, "step": 278540 }, { "epoch": 0.72, "learning_rate": 0.00019169373297285247, "loss": 0.0161, "step": 278550 }, { "epoch": 0.72, "learning_rate": 0.00019168984475648098, "loss": 0.0134, "step": 278560 }, { "epoch": 0.72, "learning_rate": 0.00019168595654010955, "loss": 0.016, "step": 278570 }, { "epoch": 0.72, "learning_rate": 0.00019168206832373806, "loss": 0.0154, "step": 278580 }, { "epoch": 0.72, "learning_rate": 0.0001916781801073666, "loss": 0.0162, "step": 278590 }, { "epoch": 0.72, "learning_rate": 0.00019167429189099512, "loss": 0.0133, "step": 278600 }, { "epoch": 0.72, "learning_rate": 0.0001916704036746237, "loss": 0.0143, "step": 278610 }, { "epoch": 0.72, "learning_rate": 0.0001916665154582522, "loss": 0.019, "step": 278620 }, { "epoch": 0.72, "learning_rate": 0.00019166262724188075, "loss": 0.0133, "step": 278630 }, { "epoch": 0.72, "learning_rate": 0.00019165873902550926, "loss": 0.0151, "step": 278640 }, { "epoch": 0.72, "learning_rate": 0.0001916548508091378, "loss": 0.0135, "step": 278650 }, { "epoch": 0.72, "learning_rate": 0.00019165096259276634, "loss": 0.0149, "step": 278660 }, { "epoch": 0.72, "learning_rate": 0.00019164707437639488, "loss": 0.0159, "step": 278670 }, { "epoch": 0.72, "learning_rate": 0.0001916431861600234, "loss": 0.0146, "step": 278680 }, { "epoch": 0.72, "learning_rate": 0.00019163929794365194, "loss": 0.0118, "step": 278690 }, { "epoch": 0.72, "learning_rate": 0.0001916354097272805, "loss": 0.0122, "step": 278700 }, { "epoch": 0.72, "learning_rate": 0.00019163152151090902, "loss": 0.0157, "step": 278710 }, { "epoch": 0.72, "learning_rate": 0.00019162763329453757, "loss": 0.0177, "step": 278720 }, { "epoch": 0.72, "learning_rate": 0.00019162374507816608, "loss": 0.0124, "step": 278730 }, { "epoch": 0.72, "learning_rate": 0.00019161985686179465, "loss": 0.0136, "step": 278740 }, { "epoch": 0.72, "learning_rate": 0.00019161596864542316, "loss": 0.0136, "step": 278750 }, { "epoch": 0.72, "learning_rate": 0.0001916120804290517, "loss": 0.0133, "step": 278760 }, { "epoch": 0.72, "learning_rate": 0.00019160819221268022, "loss": 0.0177, "step": 278770 }, { "epoch": 0.72, "learning_rate": 0.0001916043039963088, "loss": 0.0153, "step": 278780 }, { "epoch": 0.72, "learning_rate": 0.0001916004157799373, "loss": 0.0142, "step": 278790 }, { "epoch": 0.72, "learning_rate": 0.00019159652756356584, "loss": 0.0167, "step": 278800 }, { "epoch": 0.72, "learning_rate": 0.00019159263934719436, "loss": 0.0181, "step": 278810 }, { "epoch": 0.72, "learning_rate": 0.00019158875113082293, "loss": 0.0117, "step": 278820 }, { "epoch": 0.72, "learning_rate": 0.00019158486291445144, "loss": 0.0162, "step": 278830 }, { "epoch": 0.72, "learning_rate": 0.00019158097469807998, "loss": 0.0138, "step": 278840 }, { "epoch": 0.72, "learning_rate": 0.0001915770864817085, "loss": 0.0188, "step": 278850 }, { "epoch": 0.72, "learning_rate": 0.00019157319826533707, "loss": 0.0164, "step": 278860 }, { "epoch": 0.72, "learning_rate": 0.0001915693100489656, "loss": 0.0143, "step": 278870 }, { "epoch": 0.72, "learning_rate": 0.00019156542183259412, "loss": 0.0171, "step": 278880 }, { "epoch": 0.72, "learning_rate": 0.00019156153361622264, "loss": 0.0156, "step": 278890 }, { "epoch": 0.72, "learning_rate": 0.00019155764539985118, "loss": 0.0157, "step": 278900 }, { "epoch": 0.72, "learning_rate": 0.00019155375718347975, "loss": 0.0133, "step": 278910 }, { "epoch": 0.72, "learning_rate": 0.00019154986896710826, "loss": 0.0246, "step": 278920 }, { "epoch": 0.72, "learning_rate": 0.0001915459807507368, "loss": 0.0165, "step": 278930 }, { "epoch": 0.72, "learning_rate": 0.00019154209253436532, "loss": 0.0158, "step": 278940 }, { "epoch": 0.72, "learning_rate": 0.0001915382043179939, "loss": 0.0173, "step": 278950 }, { "epoch": 0.72, "learning_rate": 0.0001915343161016224, "loss": 0.0147, "step": 278960 }, { "epoch": 0.72, "learning_rate": 0.00019153042788525094, "loss": 0.0155, "step": 278970 }, { "epoch": 0.72, "learning_rate": 0.00019152653966887946, "loss": 0.0135, "step": 278980 }, { "epoch": 0.72, "learning_rate": 0.00019152265145250803, "loss": 0.0136, "step": 278990 }, { "epoch": 0.72, "learning_rate": 0.00019151876323613654, "loss": 0.0186, "step": 279000 }, { "epoch": 0.72, "eval_cer": 0.8817292794249172, "eval_loss": 0.010195926763117313, "eval_runtime": 107.8323, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 279000 }, { "epoch": 0.72, "learning_rate": 0.00019151487501976508, "loss": 0.0157, "step": 279010 }, { "epoch": 0.72, "learning_rate": 0.0001915109868033936, "loss": 0.0154, "step": 279020 }, { "epoch": 0.72, "learning_rate": 0.00019150709858702217, "loss": 0.0161, "step": 279030 }, { "epoch": 0.72, "learning_rate": 0.0001915032103706507, "loss": 0.0144, "step": 279040 }, { "epoch": 0.72, "learning_rate": 0.00019149932215427922, "loss": 0.0188, "step": 279050 }, { "epoch": 0.72, "learning_rate": 0.00019149543393790774, "loss": 0.0136, "step": 279060 }, { "epoch": 0.72, "learning_rate": 0.0001914915457215363, "loss": 0.0121, "step": 279070 }, { "epoch": 0.72, "learning_rate": 0.00019148765750516485, "loss": 0.0196, "step": 279080 }, { "epoch": 0.72, "learning_rate": 0.00019148376928879336, "loss": 0.015, "step": 279090 }, { "epoch": 0.72, "learning_rate": 0.0001914798810724219, "loss": 0.0128, "step": 279100 }, { "epoch": 0.72, "learning_rate": 0.00019147599285605045, "loss": 0.0124, "step": 279110 }, { "epoch": 0.72, "learning_rate": 0.000191472104639679, "loss": 0.0138, "step": 279120 }, { "epoch": 0.72, "learning_rate": 0.0001914682164233075, "loss": 0.0174, "step": 279130 }, { "epoch": 0.72, "learning_rate": 0.00019146432820693604, "loss": 0.0151, "step": 279140 }, { "epoch": 0.72, "learning_rate": 0.00019146043999056456, "loss": 0.0117, "step": 279150 }, { "epoch": 0.72, "learning_rate": 0.00019145655177419313, "loss": 0.0133, "step": 279160 }, { "epoch": 0.72, "learning_rate": 0.00019145266355782164, "loss": 0.0146, "step": 279170 }, { "epoch": 0.72, "learning_rate": 0.00019144877534145018, "loss": 0.0143, "step": 279180 }, { "epoch": 0.72, "learning_rate": 0.0001914448871250787, "loss": 0.0138, "step": 279190 }, { "epoch": 0.72, "learning_rate": 0.00019144099890870727, "loss": 0.0114, "step": 279200 }, { "epoch": 0.72, "learning_rate": 0.00019143711069233578, "loss": 0.0166, "step": 279210 }, { "epoch": 0.72, "learning_rate": 0.00019143322247596432, "loss": 0.0165, "step": 279220 }, { "epoch": 0.72, "learning_rate": 0.00019142933425959284, "loss": 0.0125, "step": 279230 }, { "epoch": 0.72, "learning_rate": 0.0001914254460432214, "loss": 0.015, "step": 279240 }, { "epoch": 0.72, "learning_rate": 0.00019142155782684995, "loss": 0.0129, "step": 279250 }, { "epoch": 0.72, "learning_rate": 0.00019141766961047846, "loss": 0.0146, "step": 279260 }, { "epoch": 0.72, "learning_rate": 0.000191413781394107, "loss": 0.0146, "step": 279270 }, { "epoch": 0.72, "learning_rate": 0.00019140989317773555, "loss": 0.0109, "step": 279280 }, { "epoch": 0.72, "learning_rate": 0.0001914060049613641, "loss": 0.0141, "step": 279290 }, { "epoch": 0.72, "learning_rate": 0.0001914021167449926, "loss": 0.0164, "step": 279300 }, { "epoch": 0.72, "learning_rate": 0.00019139822852862114, "loss": 0.0126, "step": 279310 }, { "epoch": 0.72, "learning_rate": 0.00019139434031224968, "loss": 0.0166, "step": 279320 }, { "epoch": 0.72, "learning_rate": 0.00019139045209587823, "loss": 0.0136, "step": 279330 }, { "epoch": 0.72, "learning_rate": 0.00019138656387950674, "loss": 0.0162, "step": 279340 }, { "epoch": 0.72, "learning_rate": 0.00019138267566313528, "loss": 0.0133, "step": 279350 }, { "epoch": 0.72, "learning_rate": 0.00019137878744676382, "loss": 0.0139, "step": 279360 }, { "epoch": 0.72, "learning_rate": 0.00019137489923039237, "loss": 0.0124, "step": 279370 }, { "epoch": 0.72, "learning_rate": 0.00019137101101402088, "loss": 0.0157, "step": 279380 }, { "epoch": 0.72, "learning_rate": 0.00019136712279764942, "loss": 0.0134, "step": 279390 }, { "epoch": 0.72, "learning_rate": 0.00019136323458127794, "loss": 0.0151, "step": 279400 }, { "epoch": 0.72, "learning_rate": 0.0001913593463649065, "loss": 0.016, "step": 279410 }, { "epoch": 0.72, "learning_rate": 0.00019135545814853505, "loss": 0.014, "step": 279420 }, { "epoch": 0.72, "learning_rate": 0.00019135156993216356, "loss": 0.0143, "step": 279430 }, { "epoch": 0.72, "learning_rate": 0.0001913476817157921, "loss": 0.0164, "step": 279440 }, { "epoch": 0.72, "learning_rate": 0.00019134379349942064, "loss": 0.0156, "step": 279450 }, { "epoch": 0.72, "learning_rate": 0.00019133990528304919, "loss": 0.0129, "step": 279460 }, { "epoch": 0.72, "learning_rate": 0.0001913360170666777, "loss": 0.0214, "step": 279470 }, { "epoch": 0.72, "learning_rate": 0.00019133212885030624, "loss": 0.0105, "step": 279480 }, { "epoch": 0.72, "learning_rate": 0.00019132824063393478, "loss": 0.0181, "step": 279490 }, { "epoch": 0.72, "learning_rate": 0.00019132435241756333, "loss": 0.0135, "step": 279500 }, { "epoch": 0.72, "learning_rate": 0.00019132046420119184, "loss": 0.0152, "step": 279510 }, { "epoch": 0.72, "learning_rate": 0.00019131657598482038, "loss": 0.012, "step": 279520 }, { "epoch": 0.72, "learning_rate": 0.00019131268776844892, "loss": 0.0153, "step": 279530 }, { "epoch": 0.72, "learning_rate": 0.00019130879955207746, "loss": 0.0132, "step": 279540 }, { "epoch": 0.72, "learning_rate": 0.00019130491133570598, "loss": 0.0155, "step": 279550 }, { "epoch": 0.72, "learning_rate": 0.00019130102311933452, "loss": 0.0135, "step": 279560 }, { "epoch": 0.72, "learning_rate": 0.0001912971349029631, "loss": 0.0147, "step": 279570 }, { "epoch": 0.72, "learning_rate": 0.0001912932466865916, "loss": 0.0135, "step": 279580 }, { "epoch": 0.72, "learning_rate": 0.00019128935847022015, "loss": 0.0171, "step": 279590 }, { "epoch": 0.72, "learning_rate": 0.00019128547025384866, "loss": 0.0159, "step": 279600 }, { "epoch": 0.72, "learning_rate": 0.00019128158203747723, "loss": 0.0124, "step": 279610 }, { "epoch": 0.72, "learning_rate": 0.00019127769382110574, "loss": 0.0162, "step": 279620 }, { "epoch": 0.72, "learning_rate": 0.00019127380560473429, "loss": 0.0142, "step": 279630 }, { "epoch": 0.72, "learning_rate": 0.0001912699173883628, "loss": 0.0142, "step": 279640 }, { "epoch": 0.72, "learning_rate": 0.00019126602917199134, "loss": 0.013, "step": 279650 }, { "epoch": 0.72, "learning_rate": 0.00019126214095561988, "loss": 0.0145, "step": 279660 }, { "epoch": 0.72, "learning_rate": 0.00019125825273924842, "loss": 0.0118, "step": 279670 }, { "epoch": 0.72, "learning_rate": 0.00019125436452287694, "loss": 0.0145, "step": 279680 }, { "epoch": 0.72, "learning_rate": 0.00019125047630650548, "loss": 0.0146, "step": 279690 }, { "epoch": 0.73, "learning_rate": 0.00019124658809013402, "loss": 0.0154, "step": 279700 }, { "epoch": 0.73, "learning_rate": 0.00019124269987376256, "loss": 0.0147, "step": 279710 }, { "epoch": 0.73, "learning_rate": 0.00019123881165739108, "loss": 0.0143, "step": 279720 }, { "epoch": 0.73, "learning_rate": 0.00019123492344101962, "loss": 0.0132, "step": 279730 }, { "epoch": 0.73, "learning_rate": 0.0001912310352246482, "loss": 0.014, "step": 279740 }, { "epoch": 0.73, "learning_rate": 0.0001912271470082767, "loss": 0.0153, "step": 279750 }, { "epoch": 0.73, "learning_rate": 0.00019122325879190522, "loss": 0.0146, "step": 279760 }, { "epoch": 0.73, "learning_rate": 0.00019121937057553376, "loss": 0.0138, "step": 279770 }, { "epoch": 0.73, "learning_rate": 0.00019121548235916233, "loss": 0.013, "step": 279780 }, { "epoch": 0.73, "learning_rate": 0.00019121159414279084, "loss": 0.0111, "step": 279790 }, { "epoch": 0.73, "learning_rate": 0.00019120770592641938, "loss": 0.0108, "step": 279800 }, { "epoch": 0.73, "learning_rate": 0.0001912038177100479, "loss": 0.0159, "step": 279810 }, { "epoch": 0.73, "learning_rate": 0.00019119992949367647, "loss": 0.0155, "step": 279820 }, { "epoch": 0.73, "learning_rate": 0.00019119604127730498, "loss": 0.0137, "step": 279830 }, { "epoch": 0.73, "learning_rate": 0.00019119215306093352, "loss": 0.0183, "step": 279840 }, { "epoch": 0.73, "learning_rate": 0.00019118826484456204, "loss": 0.0176, "step": 279850 }, { "epoch": 0.73, "learning_rate": 0.0001911843766281906, "loss": 0.0154, "step": 279860 }, { "epoch": 0.73, "learning_rate": 0.00019118048841181912, "loss": 0.0148, "step": 279870 }, { "epoch": 0.73, "learning_rate": 0.00019117660019544766, "loss": 0.0156, "step": 279880 }, { "epoch": 0.73, "learning_rate": 0.00019117271197907618, "loss": 0.0136, "step": 279890 }, { "epoch": 0.73, "learning_rate": 0.00019116882376270472, "loss": 0.0185, "step": 279900 }, { "epoch": 0.73, "learning_rate": 0.0001911649355463333, "loss": 0.0136, "step": 279910 }, { "epoch": 0.73, "learning_rate": 0.0001911610473299618, "loss": 0.0154, "step": 279920 }, { "epoch": 0.73, "learning_rate": 0.00019115715911359032, "loss": 0.0159, "step": 279930 }, { "epoch": 0.73, "learning_rate": 0.00019115327089721886, "loss": 0.0156, "step": 279940 }, { "epoch": 0.73, "learning_rate": 0.00019114938268084743, "loss": 0.0156, "step": 279950 }, { "epoch": 0.73, "learning_rate": 0.00019114549446447594, "loss": 0.0147, "step": 279960 }, { "epoch": 0.73, "learning_rate": 0.00019114160624810448, "loss": 0.018, "step": 279970 }, { "epoch": 0.73, "learning_rate": 0.000191137718031733, "loss": 0.0225, "step": 279980 }, { "epoch": 0.73, "learning_rate": 0.00019113382981536157, "loss": 0.0128, "step": 279990 }, { "epoch": 0.73, "learning_rate": 0.00019112994159899008, "loss": 0.0165, "step": 280000 }, { "epoch": 0.73, "eval_cer": 0.8817152830555753, "eval_loss": 0.010195476934313774, "eval_runtime": 108.0537, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 280000 }, { "epoch": 0.73, "learning_rate": 0.00019112605338261862, "loss": 0.0211, "step": 280010 }, { "epoch": 0.73, "learning_rate": 0.00019112216516624714, "loss": 0.0153, "step": 280020 }, { "epoch": 0.73, "learning_rate": 0.0001911182769498757, "loss": 0.0141, "step": 280030 }, { "epoch": 0.73, "learning_rate": 0.00019111438873350422, "loss": 0.015, "step": 280040 }, { "epoch": 0.73, "learning_rate": 0.00019111050051713276, "loss": 0.0182, "step": 280050 }, { "epoch": 0.73, "learning_rate": 0.00019110661230076128, "loss": 0.014, "step": 280060 }, { "epoch": 0.73, "learning_rate": 0.00019110272408438985, "loss": 0.0166, "step": 280070 }, { "epoch": 0.73, "learning_rate": 0.00019109883586801836, "loss": 0.0144, "step": 280080 }, { "epoch": 0.73, "learning_rate": 0.0001910949476516469, "loss": 0.0145, "step": 280090 }, { "epoch": 0.73, "learning_rate": 0.00019109105943527542, "loss": 0.0162, "step": 280100 }, { "epoch": 0.73, "learning_rate": 0.00019108717121890399, "loss": 0.0169, "step": 280110 }, { "epoch": 0.73, "learning_rate": 0.00019108328300253253, "loss": 0.016, "step": 280120 }, { "epoch": 0.73, "learning_rate": 0.00019107939478616104, "loss": 0.0235, "step": 280130 }, { "epoch": 0.73, "learning_rate": 0.00019107550656978958, "loss": 0.032, "step": 280140 }, { "epoch": 0.73, "learning_rate": 0.0001910716183534181, "loss": 0.0134, "step": 280150 }, { "epoch": 0.73, "learning_rate": 0.00019106773013704667, "loss": 0.0124, "step": 280160 }, { "epoch": 0.73, "learning_rate": 0.00019106384192067518, "loss": 0.0107, "step": 280170 }, { "epoch": 0.73, "learning_rate": 0.00019105995370430372, "loss": 0.0157, "step": 280180 }, { "epoch": 0.73, "learning_rate": 0.00019105606548793224, "loss": 0.0127, "step": 280190 }, { "epoch": 0.73, "learning_rate": 0.0001910521772715608, "loss": 0.0135, "step": 280200 }, { "epoch": 0.73, "learning_rate": 0.00019104828905518932, "loss": 0.0175, "step": 280210 }, { "epoch": 0.73, "learning_rate": 0.00019104440083881786, "loss": 0.0162, "step": 280220 }, { "epoch": 0.73, "learning_rate": 0.00019104051262244638, "loss": 0.0156, "step": 280230 }, { "epoch": 0.73, "learning_rate": 0.00019103662440607495, "loss": 0.0172, "step": 280240 }, { "epoch": 0.73, "learning_rate": 0.00019103273618970346, "loss": 0.0169, "step": 280250 }, { "epoch": 0.73, "learning_rate": 0.000191028847973332, "loss": 0.0134, "step": 280260 }, { "epoch": 0.73, "learning_rate": 0.00019102495975696052, "loss": 0.0184, "step": 280270 }, { "epoch": 0.73, "learning_rate": 0.00019102107154058909, "loss": 0.0172, "step": 280280 }, { "epoch": 0.73, "learning_rate": 0.00019101718332421763, "loss": 0.0126, "step": 280290 }, { "epoch": 0.73, "learning_rate": 0.00019101329510784614, "loss": 0.0117, "step": 280300 }, { "epoch": 0.73, "learning_rate": 0.00019100940689147468, "loss": 0.0147, "step": 280310 }, { "epoch": 0.73, "learning_rate": 0.00019100551867510322, "loss": 0.0138, "step": 280320 }, { "epoch": 0.73, "learning_rate": 0.00019100163045873177, "loss": 0.0158, "step": 280330 }, { "epoch": 0.73, "learning_rate": 0.00019099774224236028, "loss": 0.0142, "step": 280340 }, { "epoch": 0.73, "learning_rate": 0.00019099385402598882, "loss": 0.0195, "step": 280350 }, { "epoch": 0.73, "learning_rate": 0.00019098996580961736, "loss": 0.0155, "step": 280360 }, { "epoch": 0.73, "learning_rate": 0.0001909860775932459, "loss": 0.0134, "step": 280370 }, { "epoch": 0.73, "learning_rate": 0.00019098218937687442, "loss": 0.0128, "step": 280380 }, { "epoch": 0.73, "learning_rate": 0.00019097830116050296, "loss": 0.0174, "step": 280390 }, { "epoch": 0.73, "learning_rate": 0.00019097441294413148, "loss": 0.0157, "step": 280400 }, { "epoch": 0.73, "learning_rate": 0.00019097052472776005, "loss": 0.013, "step": 280410 }, { "epoch": 0.73, "learning_rate": 0.00019096663651138856, "loss": 0.0121, "step": 280420 }, { "epoch": 0.73, "learning_rate": 0.0001909627482950171, "loss": 0.0151, "step": 280430 }, { "epoch": 0.73, "learning_rate": 0.00019095886007864562, "loss": 0.0199, "step": 280440 }, { "epoch": 0.73, "learning_rate": 0.00019095497186227418, "loss": 0.0145, "step": 280450 }, { "epoch": 0.73, "learning_rate": 0.00019095108364590273, "loss": 0.0121, "step": 280460 }, { "epoch": 0.73, "learning_rate": 0.00019094719542953124, "loss": 0.0159, "step": 280470 }, { "epoch": 0.73, "learning_rate": 0.00019094330721315976, "loss": 0.0155, "step": 280480 }, { "epoch": 0.73, "learning_rate": 0.00019093941899678832, "loss": 0.0162, "step": 280490 }, { "epoch": 0.73, "learning_rate": 0.00019093553078041687, "loss": 0.0162, "step": 280500 }, { "epoch": 0.73, "learning_rate": 0.00019093164256404538, "loss": 0.0155, "step": 280510 }, { "epoch": 0.73, "learning_rate": 0.00019092775434767392, "loss": 0.0153, "step": 280520 }, { "epoch": 0.73, "learning_rate": 0.00019092386613130246, "loss": 0.0152, "step": 280530 }, { "epoch": 0.73, "learning_rate": 0.000190919977914931, "loss": 0.0137, "step": 280540 }, { "epoch": 0.73, "learning_rate": 0.00019091608969855952, "loss": 0.0123, "step": 280550 }, { "epoch": 0.73, "learning_rate": 0.00019091220148218806, "loss": 0.0149, "step": 280560 }, { "epoch": 0.73, "learning_rate": 0.0001909083132658166, "loss": 0.0118, "step": 280570 }, { "epoch": 0.73, "learning_rate": 0.00019090442504944514, "loss": 0.0129, "step": 280580 }, { "epoch": 0.73, "learning_rate": 0.00019090053683307366, "loss": 0.0132, "step": 280590 }, { "epoch": 0.73, "learning_rate": 0.0001908966486167022, "loss": 0.013, "step": 280600 }, { "epoch": 0.73, "learning_rate": 0.00019089276040033072, "loss": 0.0155, "step": 280610 }, { "epoch": 0.73, "learning_rate": 0.00019088887218395928, "loss": 0.0131, "step": 280620 }, { "epoch": 0.73, "learning_rate": 0.0001908849839675878, "loss": 0.0158, "step": 280630 }, { "epoch": 0.73, "learning_rate": 0.00019088109575121634, "loss": 0.0185, "step": 280640 }, { "epoch": 0.73, "learning_rate": 0.00019087720753484485, "loss": 0.0178, "step": 280650 }, { "epoch": 0.73, "learning_rate": 0.00019087331931847342, "loss": 0.0114, "step": 280660 }, { "epoch": 0.73, "learning_rate": 0.00019086943110210197, "loss": 0.0143, "step": 280670 }, { "epoch": 0.73, "learning_rate": 0.00019086554288573048, "loss": 0.0151, "step": 280680 }, { "epoch": 0.73, "learning_rate": 0.00019086165466935902, "loss": 0.0171, "step": 280690 }, { "epoch": 0.73, "learning_rate": 0.00019085776645298756, "loss": 0.0139, "step": 280700 }, { "epoch": 0.73, "learning_rate": 0.0001908538782366161, "loss": 0.0139, "step": 280710 }, { "epoch": 0.73, "learning_rate": 0.00019084999002024462, "loss": 0.0139, "step": 280720 }, { "epoch": 0.73, "learning_rate": 0.00019084610180387316, "loss": 0.0183, "step": 280730 }, { "epoch": 0.73, "learning_rate": 0.0001908422135875017, "loss": 0.0135, "step": 280740 }, { "epoch": 0.73, "learning_rate": 0.00019083832537113024, "loss": 0.0157, "step": 280750 }, { "epoch": 0.73, "learning_rate": 0.00019083443715475876, "loss": 0.0118, "step": 280760 }, { "epoch": 0.73, "learning_rate": 0.0001908305489383873, "loss": 0.0185, "step": 280770 }, { "epoch": 0.73, "learning_rate": 0.00019082666072201587, "loss": 0.0136, "step": 280780 }, { "epoch": 0.73, "learning_rate": 0.00019082277250564438, "loss": 0.0126, "step": 280790 }, { "epoch": 0.73, "learning_rate": 0.0001908188842892729, "loss": 0.0157, "step": 280800 }, { "epoch": 0.73, "learning_rate": 0.00019081499607290144, "loss": 0.0156, "step": 280810 }, { "epoch": 0.73, "learning_rate": 0.00019081110785653, "loss": 0.0117, "step": 280820 }, { "epoch": 0.73, "learning_rate": 0.00019080721964015852, "loss": 0.0145, "step": 280830 }, { "epoch": 0.73, "learning_rate": 0.00019080333142378706, "loss": 0.0137, "step": 280840 }, { "epoch": 0.73, "learning_rate": 0.00019079944320741558, "loss": 0.0166, "step": 280850 }, { "epoch": 0.73, "learning_rate": 0.00019079555499104412, "loss": 0.0142, "step": 280860 }, { "epoch": 0.73, "learning_rate": 0.00019079166677467266, "loss": 0.0161, "step": 280870 }, { "epoch": 0.73, "learning_rate": 0.0001907877785583012, "loss": 0.0152, "step": 280880 }, { "epoch": 0.73, "learning_rate": 0.00019078389034192972, "loss": 0.0178, "step": 280890 }, { "epoch": 0.73, "learning_rate": 0.00019078000212555826, "loss": 0.011, "step": 280900 }, { "epoch": 0.73, "learning_rate": 0.0001907761139091868, "loss": 0.0145, "step": 280910 }, { "epoch": 0.73, "learning_rate": 0.00019077222569281534, "loss": 0.0168, "step": 280920 }, { "epoch": 0.73, "learning_rate": 0.00019076833747644386, "loss": 0.0149, "step": 280930 }, { "epoch": 0.73, "learning_rate": 0.0001907644492600724, "loss": 0.0135, "step": 280940 }, { "epoch": 0.73, "learning_rate": 0.00019076056104370094, "loss": 0.019, "step": 280950 }, { "epoch": 0.73, "learning_rate": 0.00019075667282732948, "loss": 0.0133, "step": 280960 }, { "epoch": 0.73, "learning_rate": 0.000190752784610958, "loss": 0.0153, "step": 280970 }, { "epoch": 0.73, "learning_rate": 0.00019074889639458654, "loss": 0.0193, "step": 280980 }, { "epoch": 0.73, "learning_rate": 0.0001907450081782151, "loss": 0.013, "step": 280990 }, { "epoch": 0.73, "learning_rate": 0.00019074111996184362, "loss": 0.0145, "step": 281000 }, { "epoch": 0.73, "eval_cer": 0.8817334783357197, "eval_loss": 0.010047990828752518, "eval_runtime": 108.1788, "eval_samples_per_second": 18.488, "eval_steps_per_second": 4.622, "step": 281000 }, { "epoch": 0.73, "learning_rate": 0.00019073723174547216, "loss": 0.0189, "step": 281010 }, { "epoch": 0.73, "learning_rate": 0.00019073334352910068, "loss": 0.015, "step": 281020 }, { "epoch": 0.73, "learning_rate": 0.00019072945531272925, "loss": 0.0122, "step": 281030 }, { "epoch": 0.73, "learning_rate": 0.00019072556709635776, "loss": 0.0158, "step": 281040 }, { "epoch": 0.73, "learning_rate": 0.0001907216788799863, "loss": 0.0164, "step": 281050 }, { "epoch": 0.73, "learning_rate": 0.00019071779066361482, "loss": 0.0149, "step": 281060 }, { "epoch": 0.73, "learning_rate": 0.0001907139024472434, "loss": 0.0125, "step": 281070 }, { "epoch": 0.73, "learning_rate": 0.0001907100142308719, "loss": 0.0146, "step": 281080 }, { "epoch": 0.73, "learning_rate": 0.00019070612601450044, "loss": 0.0176, "step": 281090 }, { "epoch": 0.73, "learning_rate": 0.00019070223779812896, "loss": 0.0165, "step": 281100 }, { "epoch": 0.73, "learning_rate": 0.0001906983495817575, "loss": 0.0114, "step": 281110 }, { "epoch": 0.73, "learning_rate": 0.00019069446136538604, "loss": 0.0165, "step": 281120 }, { "epoch": 0.73, "learning_rate": 0.00019069057314901458, "loss": 0.0144, "step": 281130 }, { "epoch": 0.73, "learning_rate": 0.0001906866849326431, "loss": 0.0157, "step": 281140 }, { "epoch": 0.73, "learning_rate": 0.00019068279671627164, "loss": 0.0141, "step": 281150 }, { "epoch": 0.73, "learning_rate": 0.0001906789084999002, "loss": 0.0148, "step": 281160 }, { "epoch": 0.73, "learning_rate": 0.00019067502028352872, "loss": 0.0156, "step": 281170 }, { "epoch": 0.73, "learning_rate": 0.00019067113206715726, "loss": 0.014, "step": 281180 }, { "epoch": 0.73, "learning_rate": 0.00019066724385078578, "loss": 0.0116, "step": 281190 }, { "epoch": 0.73, "learning_rate": 0.00019066335563441435, "loss": 0.0144, "step": 281200 }, { "epoch": 0.73, "learning_rate": 0.00019065946741804286, "loss": 0.0135, "step": 281210 }, { "epoch": 0.73, "learning_rate": 0.0001906555792016714, "loss": 0.0153, "step": 281220 }, { "epoch": 0.73, "learning_rate": 0.00019065169098529992, "loss": 0.0201, "step": 281230 }, { "epoch": 0.73, "learning_rate": 0.00019064780276892849, "loss": 0.0114, "step": 281240 }, { "epoch": 0.73, "learning_rate": 0.000190643914552557, "loss": 0.0143, "step": 281250 }, { "epoch": 0.73, "learning_rate": 0.00019064002633618554, "loss": 0.0143, "step": 281260 }, { "epoch": 0.73, "learning_rate": 0.00019063613811981406, "loss": 0.0174, "step": 281270 }, { "epoch": 0.73, "learning_rate": 0.00019063224990344263, "loss": 0.018, "step": 281280 }, { "epoch": 0.73, "learning_rate": 0.00019062836168707114, "loss": 0.017, "step": 281290 }, { "epoch": 0.73, "learning_rate": 0.00019062447347069968, "loss": 0.0121, "step": 281300 }, { "epoch": 0.73, "learning_rate": 0.0001906205852543282, "loss": 0.0122, "step": 281310 }, { "epoch": 0.73, "learning_rate": 0.00019061669703795677, "loss": 0.0159, "step": 281320 }, { "epoch": 0.73, "learning_rate": 0.0001906128088215853, "loss": 0.0146, "step": 281330 }, { "epoch": 0.73, "learning_rate": 0.00019060892060521382, "loss": 0.0152, "step": 281340 }, { "epoch": 0.73, "learning_rate": 0.00019060503238884234, "loss": 0.0172, "step": 281350 }, { "epoch": 0.73, "learning_rate": 0.00019060114417247088, "loss": 0.0174, "step": 281360 }, { "epoch": 0.73, "learning_rate": 0.00019059725595609945, "loss": 0.0141, "step": 281370 }, { "epoch": 0.73, "learning_rate": 0.00019059336773972796, "loss": 0.0177, "step": 281380 }, { "epoch": 0.73, "learning_rate": 0.0001905894795233565, "loss": 0.0122, "step": 281390 }, { "epoch": 0.73, "learning_rate": 0.00019058559130698502, "loss": 0.0151, "step": 281400 }, { "epoch": 0.73, "learning_rate": 0.00019058170309061359, "loss": 0.0141, "step": 281410 }, { "epoch": 0.73, "learning_rate": 0.0001905778148742421, "loss": 0.0171, "step": 281420 }, { "epoch": 0.73, "learning_rate": 0.00019057392665787064, "loss": 0.0141, "step": 281430 }, { "epoch": 0.73, "learning_rate": 0.00019057003844149916, "loss": 0.013, "step": 281440 }, { "epoch": 0.73, "learning_rate": 0.00019056615022512773, "loss": 0.0134, "step": 281450 }, { "epoch": 0.73, "learning_rate": 0.00019056226200875624, "loss": 0.0148, "step": 281460 }, { "epoch": 0.73, "learning_rate": 0.00019055837379238478, "loss": 0.0134, "step": 281470 }, { "epoch": 0.73, "learning_rate": 0.0001905544855760133, "loss": 0.0179, "step": 281480 }, { "epoch": 0.73, "learning_rate": 0.00019055059735964186, "loss": 0.0156, "step": 281490 }, { "epoch": 0.73, "learning_rate": 0.0001905467091432704, "loss": 0.01, "step": 281500 }, { "epoch": 0.73, "learning_rate": 0.00019054282092689892, "loss": 0.0147, "step": 281510 }, { "epoch": 0.73, "learning_rate": 0.00019053893271052744, "loss": 0.0145, "step": 281520 }, { "epoch": 0.73, "learning_rate": 0.000190535044494156, "loss": 0.01, "step": 281530 }, { "epoch": 0.73, "learning_rate": 0.00019053115627778455, "loss": 0.0117, "step": 281540 }, { "epoch": 0.73, "learning_rate": 0.00019052726806141306, "loss": 0.0158, "step": 281550 }, { "epoch": 0.73, "learning_rate": 0.0001905233798450416, "loss": 0.0133, "step": 281560 }, { "epoch": 0.73, "learning_rate": 0.00019051949162867014, "loss": 0.0128, "step": 281570 }, { "epoch": 0.73, "learning_rate": 0.00019051560341229869, "loss": 0.0171, "step": 281580 }, { "epoch": 0.73, "learning_rate": 0.0001905117151959272, "loss": 0.0108, "step": 281590 }, { "epoch": 0.73, "learning_rate": 0.00019050782697955574, "loss": 0.018, "step": 281600 }, { "epoch": 0.73, "learning_rate": 0.00019050393876318426, "loss": 0.0165, "step": 281610 }, { "epoch": 0.73, "learning_rate": 0.00019050005054681282, "loss": 0.0144, "step": 281620 }, { "epoch": 0.73, "learning_rate": 0.00019049616233044134, "loss": 0.0168, "step": 281630 }, { "epoch": 0.73, "learning_rate": 0.00019049227411406988, "loss": 0.0178, "step": 281640 }, { "epoch": 0.73, "learning_rate": 0.0001904883858976984, "loss": 0.0169, "step": 281650 }, { "epoch": 0.73, "learning_rate": 0.00019048449768132696, "loss": 0.0129, "step": 281660 }, { "epoch": 0.73, "learning_rate": 0.00019048060946495548, "loss": 0.0169, "step": 281670 }, { "epoch": 0.73, "learning_rate": 0.00019047672124858402, "loss": 0.0171, "step": 281680 }, { "epoch": 0.73, "learning_rate": 0.00019047283303221253, "loss": 0.0126, "step": 281690 }, { "epoch": 0.73, "learning_rate": 0.0001904689448158411, "loss": 0.0137, "step": 281700 }, { "epoch": 0.73, "learning_rate": 0.00019046505659946965, "loss": 0.0178, "step": 281710 }, { "epoch": 0.73, "learning_rate": 0.00019046116838309816, "loss": 0.0145, "step": 281720 }, { "epoch": 0.73, "learning_rate": 0.0001904572801667267, "loss": 0.0157, "step": 281730 }, { "epoch": 0.73, "learning_rate": 0.00019045339195035524, "loss": 0.012, "step": 281740 }, { "epoch": 0.73, "learning_rate": 0.00019044950373398378, "loss": 0.0136, "step": 281750 }, { "epoch": 0.73, "learning_rate": 0.0001904456155176123, "loss": 0.0145, "step": 281760 }, { "epoch": 0.73, "learning_rate": 0.00019044172730124084, "loss": 0.0142, "step": 281770 }, { "epoch": 0.73, "learning_rate": 0.00019043783908486938, "loss": 0.0283, "step": 281780 }, { "epoch": 0.73, "learning_rate": 0.00019043395086849792, "loss": 0.0161, "step": 281790 }, { "epoch": 0.73, "learning_rate": 0.00019043006265212644, "loss": 0.0145, "step": 281800 }, { "epoch": 0.73, "learning_rate": 0.00019042617443575498, "loss": 0.0174, "step": 281810 }, { "epoch": 0.73, "learning_rate": 0.00019042228621938352, "loss": 0.0128, "step": 281820 }, { "epoch": 0.73, "learning_rate": 0.00019041839800301206, "loss": 0.0145, "step": 281830 }, { "epoch": 0.73, "learning_rate": 0.00019041450978664058, "loss": 0.0177, "step": 281840 }, { "epoch": 0.73, "learning_rate": 0.00019041062157026912, "loss": 0.0167, "step": 281850 }, { "epoch": 0.73, "learning_rate": 0.00019040673335389763, "loss": 0.0154, "step": 281860 }, { "epoch": 0.73, "learning_rate": 0.0001904028451375262, "loss": 0.0108, "step": 281870 }, { "epoch": 0.73, "learning_rate": 0.00019039895692115474, "loss": 0.0149, "step": 281880 }, { "epoch": 0.73, "learning_rate": 0.00019039506870478326, "loss": 0.0156, "step": 281890 }, { "epoch": 0.73, "learning_rate": 0.0001903911804884118, "loss": 0.0129, "step": 281900 }, { "epoch": 0.73, "learning_rate": 0.00019038729227204034, "loss": 0.0135, "step": 281910 }, { "epoch": 0.73, "learning_rate": 0.00019038340405566888, "loss": 0.0144, "step": 281920 }, { "epoch": 0.73, "learning_rate": 0.0001903795158392974, "loss": 0.0146, "step": 281930 }, { "epoch": 0.73, "learning_rate": 0.00019037562762292594, "loss": 0.0166, "step": 281940 }, { "epoch": 0.73, "learning_rate": 0.00019037173940655448, "loss": 0.0114, "step": 281950 }, { "epoch": 0.73, "learning_rate": 0.00019036785119018302, "loss": 0.013, "step": 281960 }, { "epoch": 0.73, "learning_rate": 0.00019036396297381154, "loss": 0.0163, "step": 281970 }, { "epoch": 0.73, "learning_rate": 0.00019036007475744008, "loss": 0.0141, "step": 281980 }, { "epoch": 0.73, "learning_rate": 0.00019035618654106862, "loss": 0.0136, "step": 281990 }, { "epoch": 0.73, "learning_rate": 0.00019035229832469716, "loss": 0.0137, "step": 282000 }, { "epoch": 0.73, "eval_cer": 0.8816914892276944, "eval_loss": 0.009928989224135876, "eval_runtime": 108.1846, "eval_samples_per_second": 18.487, "eval_steps_per_second": 4.622, "step": 282000 }, { "epoch": 0.73, "learning_rate": 0.00019034841010832568, "loss": 0.0146, "step": 282010 }, { "epoch": 0.73, "learning_rate": 0.00019034452189195422, "loss": 0.012, "step": 282020 }, { "epoch": 0.73, "learning_rate": 0.0001903406336755828, "loss": 0.0128, "step": 282030 }, { "epoch": 0.73, "learning_rate": 0.0001903367454592113, "loss": 0.0145, "step": 282040 }, { "epoch": 0.73, "learning_rate": 0.00019033285724283984, "loss": 0.0155, "step": 282050 }, { "epoch": 0.73, "learning_rate": 0.00019032896902646836, "loss": 0.0133, "step": 282060 }, { "epoch": 0.73, "learning_rate": 0.00019032508081009693, "loss": 0.0159, "step": 282070 }, { "epoch": 0.73, "learning_rate": 0.00019032119259372544, "loss": 0.0148, "step": 282080 }, { "epoch": 0.73, "learning_rate": 0.00019031730437735398, "loss": 0.0127, "step": 282090 }, { "epoch": 0.73, "learning_rate": 0.0001903134161609825, "loss": 0.0153, "step": 282100 }, { "epoch": 0.73, "learning_rate": 0.00019030952794461104, "loss": 0.0137, "step": 282110 }, { "epoch": 0.73, "learning_rate": 0.00019030563972823958, "loss": 0.0109, "step": 282120 }, { "epoch": 0.73, "learning_rate": 0.00019030175151186812, "loss": 0.018, "step": 282130 }, { "epoch": 0.73, "learning_rate": 0.00019029786329549664, "loss": 0.0142, "step": 282140 }, { "epoch": 0.73, "learning_rate": 0.00019029397507912518, "loss": 0.0119, "step": 282150 }, { "epoch": 0.73, "learning_rate": 0.00019029008686275372, "loss": 0.0152, "step": 282160 }, { "epoch": 0.73, "learning_rate": 0.00019028619864638226, "loss": 0.0132, "step": 282170 }, { "epoch": 0.73, "learning_rate": 0.00019028231043001078, "loss": 0.0144, "step": 282180 }, { "epoch": 0.73, "learning_rate": 0.00019027842221363932, "loss": 0.0173, "step": 282190 }, { "epoch": 0.73, "learning_rate": 0.0001902745339972679, "loss": 0.015, "step": 282200 }, { "epoch": 0.73, "learning_rate": 0.0001902706457808964, "loss": 0.0188, "step": 282210 }, { "epoch": 0.73, "learning_rate": 0.00019026675756452492, "loss": 0.0127, "step": 282220 }, { "epoch": 0.73, "learning_rate": 0.00019026286934815346, "loss": 0.0142, "step": 282230 }, { "epoch": 0.73, "learning_rate": 0.00019025898113178203, "loss": 0.0137, "step": 282240 }, { "epoch": 0.73, "learning_rate": 0.00019025509291541054, "loss": 0.018, "step": 282250 }, { "epoch": 0.73, "learning_rate": 0.00019025120469903908, "loss": 0.0155, "step": 282260 }, { "epoch": 0.73, "learning_rate": 0.0001902473164826676, "loss": 0.0125, "step": 282270 }, { "epoch": 0.73, "learning_rate": 0.00019024342826629617, "loss": 0.013, "step": 282280 }, { "epoch": 0.73, "learning_rate": 0.00019023954004992468, "loss": 0.017, "step": 282290 }, { "epoch": 0.73, "learning_rate": 0.00019023565183355322, "loss": 0.0139, "step": 282300 }, { "epoch": 0.73, "learning_rate": 0.00019023176361718174, "loss": 0.0181, "step": 282310 }, { "epoch": 0.73, "learning_rate": 0.0001902278754008103, "loss": 0.0136, "step": 282320 }, { "epoch": 0.73, "learning_rate": 0.00019022398718443882, "loss": 0.0188, "step": 282330 }, { "epoch": 0.73, "learning_rate": 0.00019022009896806736, "loss": 0.0142, "step": 282340 }, { "epoch": 0.73, "learning_rate": 0.00019021621075169588, "loss": 0.015, "step": 282350 }, { "epoch": 0.73, "learning_rate": 0.00019021232253532442, "loss": 0.0137, "step": 282360 }, { "epoch": 0.73, "learning_rate": 0.000190208434318953, "loss": 0.0141, "step": 282370 }, { "epoch": 0.73, "learning_rate": 0.0001902045461025815, "loss": 0.0126, "step": 282380 }, { "epoch": 0.73, "learning_rate": 0.00019020065788621002, "loss": 0.0144, "step": 282390 }, { "epoch": 0.73, "learning_rate": 0.00019019676966983856, "loss": 0.0126, "step": 282400 }, { "epoch": 0.73, "learning_rate": 0.00019019288145346713, "loss": 0.0168, "step": 282410 }, { "epoch": 0.73, "learning_rate": 0.00019018899323709564, "loss": 0.0207, "step": 282420 }, { "epoch": 0.73, "learning_rate": 0.00019018510502072418, "loss": 0.0141, "step": 282430 }, { "epoch": 0.73, "learning_rate": 0.0001901812168043527, "loss": 0.0115, "step": 282440 }, { "epoch": 0.73, "learning_rate": 0.00019017732858798127, "loss": 0.019, "step": 282450 }, { "epoch": 0.73, "learning_rate": 0.00019017344037160978, "loss": 0.0172, "step": 282460 }, { "epoch": 0.73, "learning_rate": 0.00019016955215523832, "loss": 0.0135, "step": 282470 }, { "epoch": 0.73, "learning_rate": 0.00019016566393886684, "loss": 0.0144, "step": 282480 }, { "epoch": 0.73, "learning_rate": 0.0001901617757224954, "loss": 0.0167, "step": 282490 }, { "epoch": 0.73, "learning_rate": 0.00019015788750612392, "loss": 0.0137, "step": 282500 }, { "epoch": 0.73, "learning_rate": 0.00019015399928975246, "loss": 0.0149, "step": 282510 }, { "epoch": 0.73, "learning_rate": 0.00019015011107338098, "loss": 0.0149, "step": 282520 }, { "epoch": 0.73, "learning_rate": 0.00019014622285700954, "loss": 0.0138, "step": 282530 }, { "epoch": 0.73, "learning_rate": 0.00019014233464063806, "loss": 0.0138, "step": 282540 }, { "epoch": 0.73, "learning_rate": 0.0001901384464242666, "loss": 0.0146, "step": 282550 }, { "epoch": 0.73, "learning_rate": 0.00019013455820789512, "loss": 0.0116, "step": 282560 }, { "epoch": 0.73, "learning_rate": 0.00019013066999152368, "loss": 0.0157, "step": 282570 }, { "epoch": 0.73, "learning_rate": 0.00019012678177515223, "loss": 0.015, "step": 282580 }, { "epoch": 0.73, "learning_rate": 0.00019012289355878074, "loss": 0.0146, "step": 282590 }, { "epoch": 0.73, "learning_rate": 0.00019011900534240928, "loss": 0.0172, "step": 282600 }, { "epoch": 0.73, "learning_rate": 0.0001901151171260378, "loss": 0.0105, "step": 282610 }, { "epoch": 0.73, "learning_rate": 0.00019011122890966636, "loss": 0.0162, "step": 282620 }, { "epoch": 0.73, "learning_rate": 0.00019010734069329488, "loss": 0.0174, "step": 282630 }, { "epoch": 0.73, "learning_rate": 0.00019010345247692342, "loss": 0.0159, "step": 282640 }, { "epoch": 0.73, "learning_rate": 0.00019009956426055194, "loss": 0.0173, "step": 282650 }, { "epoch": 0.73, "learning_rate": 0.0001900956760441805, "loss": 0.0162, "step": 282660 }, { "epoch": 0.73, "learning_rate": 0.00019009178782780902, "loss": 0.0158, "step": 282670 }, { "epoch": 0.73, "learning_rate": 0.00019008789961143756, "loss": 0.0133, "step": 282680 }, { "epoch": 0.73, "learning_rate": 0.00019008401139506608, "loss": 0.015, "step": 282690 }, { "epoch": 0.73, "learning_rate": 0.00019008012317869464, "loss": 0.0128, "step": 282700 }, { "epoch": 0.73, "learning_rate": 0.00019007623496232316, "loss": 0.0198, "step": 282710 }, { "epoch": 0.73, "learning_rate": 0.0001900723467459517, "loss": 0.0139, "step": 282720 }, { "epoch": 0.73, "learning_rate": 0.00019006845852958021, "loss": 0.0136, "step": 282730 }, { "epoch": 0.73, "learning_rate": 0.00019006457031320878, "loss": 0.0149, "step": 282740 }, { "epoch": 0.73, "learning_rate": 0.00019006068209683732, "loss": 0.0208, "step": 282750 }, { "epoch": 0.73, "learning_rate": 0.00019005679388046584, "loss": 0.0158, "step": 282760 }, { "epoch": 0.73, "learning_rate": 0.00019005290566409438, "loss": 0.0135, "step": 282770 }, { "epoch": 0.73, "learning_rate": 0.00019004901744772292, "loss": 0.0143, "step": 282780 }, { "epoch": 0.73, "learning_rate": 0.00019004512923135146, "loss": 0.0169, "step": 282790 }, { "epoch": 0.73, "learning_rate": 0.00019004124101497998, "loss": 0.0147, "step": 282800 }, { "epoch": 0.73, "learning_rate": 0.00019003735279860852, "loss": 0.0179, "step": 282810 }, { "epoch": 0.73, "learning_rate": 0.00019003346458223706, "loss": 0.0153, "step": 282820 }, { "epoch": 0.73, "learning_rate": 0.0001900295763658656, "loss": 0.0148, "step": 282830 }, { "epoch": 0.73, "learning_rate": 0.00019002568814949412, "loss": 0.0153, "step": 282840 }, { "epoch": 0.73, "learning_rate": 0.00019002179993312266, "loss": 0.0141, "step": 282850 }, { "epoch": 0.73, "learning_rate": 0.00019001791171675117, "loss": 0.0137, "step": 282860 }, { "epoch": 0.73, "learning_rate": 0.00019001402350037974, "loss": 0.0179, "step": 282870 }, { "epoch": 0.73, "learning_rate": 0.00019001013528400826, "loss": 0.0119, "step": 282880 }, { "epoch": 0.73, "learning_rate": 0.0001900062470676368, "loss": 0.0169, "step": 282890 }, { "epoch": 0.73, "learning_rate": 0.00019000235885126531, "loss": 0.0175, "step": 282900 }, { "epoch": 0.73, "learning_rate": 0.00018999847063489388, "loss": 0.0166, "step": 282910 }, { "epoch": 0.73, "learning_rate": 0.00018999458241852242, "loss": 0.0143, "step": 282920 }, { "epoch": 0.73, "learning_rate": 0.00018999069420215094, "loss": 0.0175, "step": 282930 }, { "epoch": 0.73, "learning_rate": 0.00018998680598577945, "loss": 0.0133, "step": 282940 }, { "epoch": 0.73, "learning_rate": 0.00018998291776940802, "loss": 0.0127, "step": 282950 }, { "epoch": 0.73, "learning_rate": 0.00018997902955303656, "loss": 0.0162, "step": 282960 }, { "epoch": 0.73, "learning_rate": 0.00018997514133666508, "loss": 0.0181, "step": 282970 }, { "epoch": 0.73, "learning_rate": 0.00018997125312029362, "loss": 0.0156, "step": 282980 }, { "epoch": 0.73, "learning_rate": 0.00018996736490392216, "loss": 0.0151, "step": 282990 }, { "epoch": 0.73, "learning_rate": 0.0001899634766875507, "loss": 0.0129, "step": 283000 }, { "epoch": 0.73, "eval_cer": 0.8817348779726539, "eval_loss": 0.010007109493017197, "eval_runtime": 108.1539, "eval_samples_per_second": 18.492, "eval_steps_per_second": 4.623, "step": 283000 }, { "epoch": 0.73, "learning_rate": 0.00018995958847117922, "loss": 0.0133, "step": 283010 }, { "epoch": 0.73, "learning_rate": 0.00018995570025480776, "loss": 0.0122, "step": 283020 }, { "epoch": 0.73, "learning_rate": 0.0001899518120384363, "loss": 0.0172, "step": 283030 }, { "epoch": 0.73, "learning_rate": 0.00018994792382206484, "loss": 0.014, "step": 283040 }, { "epoch": 0.73, "learning_rate": 0.00018994403560569336, "loss": 0.0189, "step": 283050 }, { "epoch": 0.73, "learning_rate": 0.0001899401473893219, "loss": 0.0127, "step": 283060 }, { "epoch": 0.73, "learning_rate": 0.00018993625917295047, "loss": 0.0132, "step": 283070 }, { "epoch": 0.73, "learning_rate": 0.00018993237095657898, "loss": 0.0149, "step": 283080 }, { "epoch": 0.73, "learning_rate": 0.00018992848274020752, "loss": 0.0166, "step": 283090 }, { "epoch": 0.73, "learning_rate": 0.00018992459452383604, "loss": 0.0141, "step": 283100 }, { "epoch": 0.73, "learning_rate": 0.00018992070630746455, "loss": 0.0146, "step": 283110 }, { "epoch": 0.73, "learning_rate": 0.00018991681809109312, "loss": 0.0183, "step": 283120 }, { "epoch": 0.73, "learning_rate": 0.00018991292987472166, "loss": 0.0169, "step": 283130 }, { "epoch": 0.73, "learning_rate": 0.00018990904165835018, "loss": 0.0137, "step": 283140 }, { "epoch": 0.73, "learning_rate": 0.00018990515344197872, "loss": 0.0177, "step": 283150 }, { "epoch": 0.73, "learning_rate": 0.00018990126522560726, "loss": 0.0156, "step": 283160 }, { "epoch": 0.73, "learning_rate": 0.0001898973770092358, "loss": 0.0139, "step": 283170 }, { "epoch": 0.73, "learning_rate": 0.00018989348879286432, "loss": 0.0159, "step": 283180 }, { "epoch": 0.73, "learning_rate": 0.00018988960057649286, "loss": 0.0104, "step": 283190 }, { "epoch": 0.73, "learning_rate": 0.0001898857123601214, "loss": 0.0133, "step": 283200 }, { "epoch": 0.73, "learning_rate": 0.00018988182414374994, "loss": 0.0115, "step": 283210 }, { "epoch": 0.73, "learning_rate": 0.00018987793592737846, "loss": 0.0191, "step": 283220 }, { "epoch": 0.73, "learning_rate": 0.000189874047711007, "loss": 0.0134, "step": 283230 }, { "epoch": 0.73, "learning_rate": 0.00018987015949463557, "loss": 0.012, "step": 283240 }, { "epoch": 0.73, "learning_rate": 0.00018986627127826408, "loss": 0.0124, "step": 283250 }, { "epoch": 0.73, "learning_rate": 0.0001898623830618926, "loss": 0.0152, "step": 283260 }, { "epoch": 0.73, "learning_rate": 0.00018985849484552114, "loss": 0.0151, "step": 283270 }, { "epoch": 0.73, "learning_rate": 0.0001898546066291497, "loss": 0.0162, "step": 283280 }, { "epoch": 0.73, "learning_rate": 0.00018985071841277822, "loss": 0.0147, "step": 283290 }, { "epoch": 0.73, "learning_rate": 0.00018984683019640676, "loss": 0.0144, "step": 283300 }, { "epoch": 0.73, "learning_rate": 0.00018984294198003528, "loss": 0.0128, "step": 283310 }, { "epoch": 0.73, "learning_rate": 0.00018983905376366385, "loss": 0.013, "step": 283320 }, { "epoch": 0.73, "learning_rate": 0.00018983516554729236, "loss": 0.0139, "step": 283330 }, { "epoch": 0.73, "learning_rate": 0.0001898312773309209, "loss": 0.0138, "step": 283340 }, { "epoch": 0.73, "learning_rate": 0.00018982738911454942, "loss": 0.0133, "step": 283350 }, { "epoch": 0.73, "learning_rate": 0.00018982350089817796, "loss": 0.0121, "step": 283360 }, { "epoch": 0.73, "learning_rate": 0.0001898196126818065, "loss": 0.0141, "step": 283370 }, { "epoch": 0.73, "learning_rate": 0.00018981572446543504, "loss": 0.0135, "step": 283380 }, { "epoch": 0.73, "learning_rate": 0.00018981183624906356, "loss": 0.0146, "step": 283390 }, { "epoch": 0.73, "learning_rate": 0.0001898079480326921, "loss": 0.0197, "step": 283400 }, { "epoch": 0.73, "learning_rate": 0.00018980405981632064, "loss": 0.019, "step": 283410 }, { "epoch": 0.73, "learning_rate": 0.00018980017159994918, "loss": 0.0171, "step": 283420 }, { "epoch": 0.73, "learning_rate": 0.0001897962833835777, "loss": 0.0189, "step": 283430 }, { "epoch": 0.73, "learning_rate": 0.00018979239516720624, "loss": 0.0136, "step": 283440 }, { "epoch": 0.73, "learning_rate": 0.0001897885069508348, "loss": 0.0114, "step": 283450 }, { "epoch": 0.73, "learning_rate": 0.00018978461873446332, "loss": 0.0123, "step": 283460 }, { "epoch": 0.73, "learning_rate": 0.00018978073051809186, "loss": 0.0112, "step": 283470 }, { "epoch": 0.73, "learning_rate": 0.00018977684230172038, "loss": 0.0156, "step": 283480 }, { "epoch": 0.73, "learning_rate": 0.00018977295408534895, "loss": 0.0176, "step": 283490 }, { "epoch": 0.73, "learning_rate": 0.00018976906586897746, "loss": 0.0131, "step": 283500 }, { "epoch": 0.73, "learning_rate": 0.000189765177652606, "loss": 0.0154, "step": 283510 }, { "epoch": 0.73, "learning_rate": 0.00018976128943623452, "loss": 0.0162, "step": 283520 }, { "epoch": 0.73, "learning_rate": 0.00018975740121986308, "loss": 0.0183, "step": 283530 }, { "epoch": 0.73, "learning_rate": 0.0001897535130034916, "loss": 0.0169, "step": 283540 }, { "epoch": 0.74, "learning_rate": 0.00018974962478712014, "loss": 0.0125, "step": 283550 }, { "epoch": 0.74, "learning_rate": 0.00018974573657074866, "loss": 0.0142, "step": 283560 }, { "epoch": 0.74, "learning_rate": 0.00018974184835437722, "loss": 0.0153, "step": 283570 }, { "epoch": 0.74, "learning_rate": 0.00018973796013800574, "loss": 0.0125, "step": 283580 }, { "epoch": 0.74, "learning_rate": 0.00018973407192163428, "loss": 0.0197, "step": 283590 }, { "epoch": 0.74, "learning_rate": 0.0001897301837052628, "loss": 0.0154, "step": 283600 }, { "epoch": 0.74, "learning_rate": 0.00018972629548889134, "loss": 0.0113, "step": 283610 }, { "epoch": 0.74, "learning_rate": 0.0001897224072725199, "loss": 0.0133, "step": 283620 }, { "epoch": 0.74, "learning_rate": 0.00018971851905614842, "loss": 0.0173, "step": 283630 }, { "epoch": 0.74, "learning_rate": 0.00018971463083977696, "loss": 0.0144, "step": 283640 }, { "epoch": 0.74, "learning_rate": 0.00018971074262340548, "loss": 0.0145, "step": 283650 }, { "epoch": 0.74, "learning_rate": 0.00018970685440703404, "loss": 0.0151, "step": 283660 }, { "epoch": 0.74, "learning_rate": 0.00018970296619066256, "loss": 0.0177, "step": 283670 }, { "epoch": 0.74, "learning_rate": 0.0001896990779742911, "loss": 0.0201, "step": 283680 }, { "epoch": 0.74, "learning_rate": 0.00018969518975791962, "loss": 0.0166, "step": 283690 }, { "epoch": 0.74, "learning_rate": 0.00018969130154154818, "loss": 0.0192, "step": 283700 }, { "epoch": 0.74, "learning_rate": 0.0001896874133251767, "loss": 0.0135, "step": 283710 }, { "epoch": 0.74, "learning_rate": 0.00018968352510880524, "loss": 0.0123, "step": 283720 }, { "epoch": 0.74, "learning_rate": 0.00018967963689243375, "loss": 0.0144, "step": 283730 }, { "epoch": 0.74, "learning_rate": 0.00018967574867606232, "loss": 0.0155, "step": 283740 }, { "epoch": 0.74, "learning_rate": 0.00018967186045969084, "loss": 0.0155, "step": 283750 }, { "epoch": 0.74, "learning_rate": 0.00018966797224331938, "loss": 0.0153, "step": 283760 }, { "epoch": 0.74, "learning_rate": 0.0001896640840269479, "loss": 0.0228, "step": 283770 }, { "epoch": 0.74, "learning_rate": 0.00018966019581057646, "loss": 0.0165, "step": 283780 }, { "epoch": 0.74, "learning_rate": 0.000189656307594205, "loss": 0.0113, "step": 283790 }, { "epoch": 0.74, "learning_rate": 0.00018965241937783352, "loss": 0.0148, "step": 283800 }, { "epoch": 0.74, "learning_rate": 0.00018964853116146203, "loss": 0.0123, "step": 283810 }, { "epoch": 0.74, "learning_rate": 0.0001896446429450906, "loss": 0.0161, "step": 283820 }, { "epoch": 0.74, "learning_rate": 0.00018964075472871914, "loss": 0.0175, "step": 283830 }, { "epoch": 0.74, "learning_rate": 0.00018963686651234766, "loss": 0.0148, "step": 283840 }, { "epoch": 0.74, "learning_rate": 0.0001896329782959762, "loss": 0.0123, "step": 283850 }, { "epoch": 0.74, "learning_rate": 0.00018962909007960471, "loss": 0.0199, "step": 283860 }, { "epoch": 0.74, "learning_rate": 0.00018962520186323328, "loss": 0.0151, "step": 283870 }, { "epoch": 0.74, "learning_rate": 0.0001896213136468618, "loss": 0.0154, "step": 283880 }, { "epoch": 0.74, "learning_rate": 0.00018961742543049034, "loss": 0.0162, "step": 283890 }, { "epoch": 0.74, "learning_rate": 0.00018961353721411885, "loss": 0.0185, "step": 283900 }, { "epoch": 0.74, "learning_rate": 0.00018960964899774742, "loss": 0.017, "step": 283910 }, { "epoch": 0.74, "learning_rate": 0.00018960576078137594, "loss": 0.015, "step": 283920 }, { "epoch": 0.74, "learning_rate": 0.00018960187256500448, "loss": 0.0139, "step": 283930 }, { "epoch": 0.74, "learning_rate": 0.000189597984348633, "loss": 0.0149, "step": 283940 }, { "epoch": 0.74, "learning_rate": 0.00018959409613226156, "loss": 0.0108, "step": 283950 }, { "epoch": 0.74, "learning_rate": 0.0001895902079158901, "loss": 0.0158, "step": 283960 }, { "epoch": 0.74, "learning_rate": 0.00018958631969951862, "loss": 0.0154, "step": 283970 }, { "epoch": 0.74, "learning_rate": 0.00018958243148314713, "loss": 0.0139, "step": 283980 }, { "epoch": 0.74, "learning_rate": 0.0001895785432667757, "loss": 0.016, "step": 283990 }, { "epoch": 0.74, "learning_rate": 0.00018957465505040424, "loss": 0.0152, "step": 284000 }, { "epoch": 0.74, "eval_cer": 0.8817432757942589, "eval_loss": 0.009913179092109203, "eval_runtime": 108.0964, "eval_samples_per_second": 18.502, "eval_steps_per_second": 4.626, "step": 284000 }, { "epoch": 0.74, "learning_rate": 0.00018957076683403276, "loss": 0.0116, "step": 284010 }, { "epoch": 0.74, "learning_rate": 0.0001895668786176613, "loss": 0.0192, "step": 284020 }, { "epoch": 0.74, "learning_rate": 0.00018956299040128984, "loss": 0.0149, "step": 284030 }, { "epoch": 0.74, "learning_rate": 0.00018955910218491838, "loss": 0.0188, "step": 284040 }, { "epoch": 0.74, "learning_rate": 0.0001895552139685469, "loss": 0.011, "step": 284050 }, { "epoch": 0.74, "learning_rate": 0.00018955132575217544, "loss": 0.0142, "step": 284060 }, { "epoch": 0.74, "learning_rate": 0.00018954743753580398, "loss": 0.0119, "step": 284070 }, { "epoch": 0.74, "learning_rate": 0.00018954354931943252, "loss": 0.0151, "step": 284080 }, { "epoch": 0.74, "learning_rate": 0.00018953966110306104, "loss": 0.0141, "step": 284090 }, { "epoch": 0.74, "learning_rate": 0.00018953577288668958, "loss": 0.0162, "step": 284100 }, { "epoch": 0.74, "learning_rate": 0.0001895318846703181, "loss": 0.0142, "step": 284110 }, { "epoch": 0.74, "learning_rate": 0.00018952799645394666, "loss": 0.016, "step": 284120 }, { "epoch": 0.74, "learning_rate": 0.00018952410823757518, "loss": 0.0132, "step": 284130 }, { "epoch": 0.74, "learning_rate": 0.00018952022002120372, "loss": 0.0192, "step": 284140 }, { "epoch": 0.74, "learning_rate": 0.00018951633180483223, "loss": 0.0134, "step": 284150 }, { "epoch": 0.74, "learning_rate": 0.0001895124435884608, "loss": 0.0196, "step": 284160 }, { "epoch": 0.74, "learning_rate": 0.00018950855537208934, "loss": 0.0107, "step": 284170 }, { "epoch": 0.74, "learning_rate": 0.00018950466715571786, "loss": 0.0164, "step": 284180 }, { "epoch": 0.74, "learning_rate": 0.0001895007789393464, "loss": 0.0209, "step": 284190 }, { "epoch": 0.74, "learning_rate": 0.00018949689072297494, "loss": 0.0194, "step": 284200 }, { "epoch": 0.74, "learning_rate": 0.00018949300250660348, "loss": 0.0171, "step": 284210 }, { "epoch": 0.74, "learning_rate": 0.000189489114290232, "loss": 0.0166, "step": 284220 }, { "epoch": 0.74, "learning_rate": 0.00018948522607386054, "loss": 0.0141, "step": 284230 }, { "epoch": 0.74, "learning_rate": 0.00018948133785748908, "loss": 0.0141, "step": 284240 }, { "epoch": 0.74, "learning_rate": 0.00018947744964111762, "loss": 0.014, "step": 284250 }, { "epoch": 0.74, "learning_rate": 0.00018947356142474614, "loss": 0.0133, "step": 284260 }, { "epoch": 0.74, "learning_rate": 0.00018946967320837468, "loss": 0.0119, "step": 284270 }, { "epoch": 0.74, "learning_rate": 0.00018946578499200325, "loss": 0.0171, "step": 284280 }, { "epoch": 0.74, "learning_rate": 0.00018946189677563176, "loss": 0.0159, "step": 284290 }, { "epoch": 0.74, "learning_rate": 0.00018945800855926028, "loss": 0.02, "step": 284300 }, { "epoch": 0.74, "learning_rate": 0.00018945412034288882, "loss": 0.0154, "step": 284310 }, { "epoch": 0.74, "learning_rate": 0.00018945023212651739, "loss": 0.0133, "step": 284320 }, { "epoch": 0.74, "learning_rate": 0.0001894463439101459, "loss": 0.017, "step": 284330 }, { "epoch": 0.74, "learning_rate": 0.00018944245569377444, "loss": 0.0149, "step": 284340 }, { "epoch": 0.74, "learning_rate": 0.00018943856747740296, "loss": 0.0153, "step": 284350 }, { "epoch": 0.74, "learning_rate": 0.0001894346792610315, "loss": 0.0118, "step": 284360 }, { "epoch": 0.74, "learning_rate": 0.00018943079104466004, "loss": 0.0158, "step": 284370 }, { "epoch": 0.74, "learning_rate": 0.00018942690282828858, "loss": 0.0148, "step": 284380 }, { "epoch": 0.74, "learning_rate": 0.0001894230146119171, "loss": 0.0133, "step": 284390 }, { "epoch": 0.74, "learning_rate": 0.00018941912639554564, "loss": 0.0149, "step": 284400 }, { "epoch": 0.74, "learning_rate": 0.00018941523817917418, "loss": 0.0163, "step": 284410 }, { "epoch": 0.74, "learning_rate": 0.00018941134996280272, "loss": 0.0124, "step": 284420 }, { "epoch": 0.74, "learning_rate": 0.00018940746174643124, "loss": 0.012, "step": 284430 }, { "epoch": 0.74, "learning_rate": 0.00018940357353005978, "loss": 0.0135, "step": 284440 }, { "epoch": 0.74, "learning_rate": 0.00018939968531368832, "loss": 0.0139, "step": 284450 }, { "epoch": 0.74, "learning_rate": 0.00018939579709731686, "loss": 0.0129, "step": 284460 }, { "epoch": 0.74, "learning_rate": 0.00018939190888094538, "loss": 0.0142, "step": 284470 }, { "epoch": 0.74, "learning_rate": 0.00018938802066457392, "loss": 0.0157, "step": 284480 }, { "epoch": 0.74, "learning_rate": 0.00018938413244820249, "loss": 0.0198, "step": 284490 }, { "epoch": 0.74, "learning_rate": 0.000189380244231831, "loss": 0.015, "step": 284500 }, { "epoch": 0.74, "learning_rate": 0.00018937635601545954, "loss": 0.0144, "step": 284510 }, { "epoch": 0.74, "learning_rate": 0.00018937246779908806, "loss": 0.0148, "step": 284520 }, { "epoch": 0.74, "learning_rate": 0.00018936857958271663, "loss": 0.0187, "step": 284530 }, { "epoch": 0.74, "learning_rate": 0.00018936469136634514, "loss": 0.0133, "step": 284540 }, { "epoch": 0.74, "learning_rate": 0.00018936080314997368, "loss": 0.0118, "step": 284550 }, { "epoch": 0.74, "learning_rate": 0.0001893569149336022, "loss": 0.0167, "step": 284560 }, { "epoch": 0.74, "learning_rate": 0.00018935302671723076, "loss": 0.0214, "step": 284570 }, { "epoch": 0.74, "learning_rate": 0.00018934913850085928, "loss": 0.0154, "step": 284580 }, { "epoch": 0.74, "learning_rate": 0.00018934525028448782, "loss": 0.0151, "step": 284590 }, { "epoch": 0.74, "learning_rate": 0.00018934136206811634, "loss": 0.0169, "step": 284600 }, { "epoch": 0.74, "learning_rate": 0.00018933747385174488, "loss": 0.0127, "step": 284610 }, { "epoch": 0.74, "learning_rate": 0.00018933358563537342, "loss": 0.0151, "step": 284620 }, { "epoch": 0.74, "learning_rate": 0.00018932969741900196, "loss": 0.0113, "step": 284630 }, { "epoch": 0.74, "learning_rate": 0.00018932580920263047, "loss": 0.0128, "step": 284640 }, { "epoch": 0.74, "learning_rate": 0.00018932192098625902, "loss": 0.0152, "step": 284650 }, { "epoch": 0.74, "learning_rate": 0.00018931803276988759, "loss": 0.0132, "step": 284660 }, { "epoch": 0.74, "learning_rate": 0.0001893141445535161, "loss": 0.0149, "step": 284670 }, { "epoch": 0.74, "learning_rate": 0.00018931025633714464, "loss": 0.0133, "step": 284680 }, { "epoch": 0.74, "learning_rate": 0.00018930636812077316, "loss": 0.0139, "step": 284690 }, { "epoch": 0.74, "learning_rate": 0.00018930247990440172, "loss": 0.0145, "step": 284700 }, { "epoch": 0.74, "learning_rate": 0.00018929859168803024, "loss": 0.0145, "step": 284710 }, { "epoch": 0.74, "learning_rate": 0.00018929470347165878, "loss": 0.0166, "step": 284720 }, { "epoch": 0.74, "learning_rate": 0.0001892908152552873, "loss": 0.0154, "step": 284730 }, { "epoch": 0.74, "learning_rate": 0.00018928692703891586, "loss": 0.0141, "step": 284740 }, { "epoch": 0.74, "learning_rate": 0.00018928303882254438, "loss": 0.0159, "step": 284750 }, { "epoch": 0.74, "learning_rate": 0.00018927915060617292, "loss": 0.0129, "step": 284760 }, { "epoch": 0.74, "learning_rate": 0.00018927526238980143, "loss": 0.0152, "step": 284770 }, { "epoch": 0.74, "learning_rate": 0.00018927137417343, "loss": 0.0151, "step": 284780 }, { "epoch": 0.74, "learning_rate": 0.00018926748595705852, "loss": 0.0131, "step": 284790 }, { "epoch": 0.74, "learning_rate": 0.00018926359774068706, "loss": 0.0158, "step": 284800 }, { "epoch": 0.74, "learning_rate": 0.00018925970952431557, "loss": 0.0123, "step": 284810 }, { "epoch": 0.74, "learning_rate": 0.00018925582130794414, "loss": 0.0136, "step": 284820 }, { "epoch": 0.74, "learning_rate": 0.00018925193309157268, "loss": 0.0143, "step": 284830 }, { "epoch": 0.74, "learning_rate": 0.0001892480448752012, "loss": 0.0164, "step": 284840 }, { "epoch": 0.74, "learning_rate": 0.00018924415665882971, "loss": 0.0176, "step": 284850 }, { "epoch": 0.74, "learning_rate": 0.00018924026844245826, "loss": 0.0154, "step": 284860 }, { "epoch": 0.74, "learning_rate": 0.00018923638022608682, "loss": 0.0147, "step": 284870 }, { "epoch": 0.74, "learning_rate": 0.00018923249200971534, "loss": 0.0141, "step": 284880 }, { "epoch": 0.74, "learning_rate": 0.00018922860379334388, "loss": 0.0113, "step": 284890 }, { "epoch": 0.74, "learning_rate": 0.0001892247155769724, "loss": 0.0183, "step": 284900 }, { "epoch": 0.74, "learning_rate": 0.00018922082736060096, "loss": 0.0157, "step": 284910 }, { "epoch": 0.74, "learning_rate": 0.00018921693914422948, "loss": 0.0129, "step": 284920 }, { "epoch": 0.74, "learning_rate": 0.00018921305092785802, "loss": 0.0134, "step": 284930 }, { "epoch": 0.74, "learning_rate": 0.00018920916271148653, "loss": 0.0157, "step": 284940 }, { "epoch": 0.74, "learning_rate": 0.0001892052744951151, "loss": 0.0172, "step": 284950 }, { "epoch": 0.74, "learning_rate": 0.00018920138627874362, "loss": 0.0147, "step": 284960 }, { "epoch": 0.74, "learning_rate": 0.00018919749806237216, "loss": 0.0133, "step": 284970 }, { "epoch": 0.74, "learning_rate": 0.00018919360984600067, "loss": 0.0137, "step": 284980 }, { "epoch": 0.74, "learning_rate": 0.00018918972162962924, "loss": 0.0158, "step": 284990 }, { "epoch": 0.74, "learning_rate": 0.00018918583341325776, "loss": 0.0123, "step": 285000 }, { "epoch": 0.74, "eval_cer": 0.881704085960102, "eval_loss": 0.010136989876627922, "eval_runtime": 108.2121, "eval_samples_per_second": 18.482, "eval_steps_per_second": 4.621, "step": 285000 }, { "epoch": 0.74, "learning_rate": 0.0001891819451968863, "loss": 0.0153, "step": 285010 }, { "epoch": 0.74, "learning_rate": 0.0001891780569805148, "loss": 0.0191, "step": 285020 }, { "epoch": 0.74, "learning_rate": 0.00018917416876414338, "loss": 0.0122, "step": 285030 }, { "epoch": 0.74, "learning_rate": 0.00018917028054777192, "loss": 0.0173, "step": 285040 }, { "epoch": 0.74, "learning_rate": 0.00018916639233140044, "loss": 0.0152, "step": 285050 }, { "epoch": 0.74, "learning_rate": 0.00018916250411502898, "loss": 0.013, "step": 285060 }, { "epoch": 0.74, "learning_rate": 0.00018915861589865752, "loss": 0.0147, "step": 285070 }, { "epoch": 0.74, "learning_rate": 0.00018915472768228606, "loss": 0.0144, "step": 285080 }, { "epoch": 0.74, "learning_rate": 0.00018915083946591458, "loss": 0.012, "step": 285090 }, { "epoch": 0.74, "learning_rate": 0.00018914695124954312, "loss": 0.0128, "step": 285100 }, { "epoch": 0.74, "learning_rate": 0.00018914306303317163, "loss": 0.0109, "step": 285110 }, { "epoch": 0.74, "learning_rate": 0.0001891391748168002, "loss": 0.0139, "step": 285120 }, { "epoch": 0.74, "learning_rate": 0.00018913528660042872, "loss": 0.0141, "step": 285130 }, { "epoch": 0.74, "learning_rate": 0.00018913139838405726, "loss": 0.0189, "step": 285140 }, { "epoch": 0.74, "learning_rate": 0.00018912751016768577, "loss": 0.0131, "step": 285150 }, { "epoch": 0.74, "learning_rate": 0.00018912362195131434, "loss": 0.0136, "step": 285160 }, { "epoch": 0.74, "learning_rate": 0.00018911973373494286, "loss": 0.0153, "step": 285170 }, { "epoch": 0.74, "learning_rate": 0.0001891158455185714, "loss": 0.0143, "step": 285180 }, { "epoch": 0.74, "learning_rate": 0.0001891119573021999, "loss": 0.0158, "step": 285190 }, { "epoch": 0.74, "learning_rate": 0.00018910806908582848, "loss": 0.0168, "step": 285200 }, { "epoch": 0.74, "learning_rate": 0.00018910418086945702, "loss": 0.0103, "step": 285210 }, { "epoch": 0.74, "learning_rate": 0.00018910029265308554, "loss": 0.0174, "step": 285220 }, { "epoch": 0.74, "learning_rate": 0.00018909640443671408, "loss": 0.0146, "step": 285230 }, { "epoch": 0.74, "learning_rate": 0.00018909251622034262, "loss": 0.0175, "step": 285240 }, { "epoch": 0.74, "learning_rate": 0.00018908862800397116, "loss": 0.0131, "step": 285250 }, { "epoch": 0.74, "learning_rate": 0.00018908473978759968, "loss": 0.0175, "step": 285260 }, { "epoch": 0.74, "learning_rate": 0.00018908085157122822, "loss": 0.0138, "step": 285270 }, { "epoch": 0.74, "learning_rate": 0.00018907696335485676, "loss": 0.018, "step": 285280 }, { "epoch": 0.74, "learning_rate": 0.0001890730751384853, "loss": 0.015, "step": 285290 }, { "epoch": 0.74, "learning_rate": 0.00018906918692211382, "loss": 0.0135, "step": 285300 }, { "epoch": 0.74, "learning_rate": 0.00018906529870574236, "loss": 0.0168, "step": 285310 }, { "epoch": 0.74, "learning_rate": 0.0001890614104893709, "loss": 0.0182, "step": 285320 }, { "epoch": 0.74, "learning_rate": 0.00018905752227299944, "loss": 0.0153, "step": 285330 }, { "epoch": 0.74, "learning_rate": 0.00018905363405662796, "loss": 0.0171, "step": 285340 }, { "epoch": 0.74, "learning_rate": 0.0001890497458402565, "loss": 0.0151, "step": 285350 }, { "epoch": 0.74, "learning_rate": 0.000189045857623885, "loss": 0.0128, "step": 285360 }, { "epoch": 0.74, "learning_rate": 0.00018904196940751358, "loss": 0.0147, "step": 285370 }, { "epoch": 0.74, "learning_rate": 0.00018903808119114212, "loss": 0.0181, "step": 285380 }, { "epoch": 0.74, "learning_rate": 0.00018903419297477064, "loss": 0.0175, "step": 285390 }, { "epoch": 0.74, "learning_rate": 0.00018903030475839915, "loss": 0.0164, "step": 285400 }, { "epoch": 0.74, "learning_rate": 0.00018902641654202772, "loss": 0.0125, "step": 285410 }, { "epoch": 0.74, "learning_rate": 0.00018902252832565626, "loss": 0.0097, "step": 285420 }, { "epoch": 0.74, "learning_rate": 0.00018901864010928478, "loss": 0.0152, "step": 285430 }, { "epoch": 0.74, "learning_rate": 0.00018901475189291332, "loss": 0.0143, "step": 285440 }, { "epoch": 0.74, "learning_rate": 0.00018901086367654186, "loss": 0.0169, "step": 285450 }, { "epoch": 0.74, "learning_rate": 0.0001890069754601704, "loss": 0.0169, "step": 285460 }, { "epoch": 0.74, "learning_rate": 0.00018900308724379892, "loss": 0.0158, "step": 285470 }, { "epoch": 0.74, "learning_rate": 0.00018899919902742746, "loss": 0.0127, "step": 285480 }, { "epoch": 0.74, "learning_rate": 0.000188995310811056, "loss": 0.0171, "step": 285490 }, { "epoch": 0.74, "learning_rate": 0.00018899142259468454, "loss": 0.018, "step": 285500 }, { "epoch": 0.74, "learning_rate": 0.00018898753437831306, "loss": 0.0117, "step": 285510 }, { "epoch": 0.74, "learning_rate": 0.0001889836461619416, "loss": 0.0164, "step": 285520 }, { "epoch": 0.74, "learning_rate": 0.00018897975794557017, "loss": 0.0163, "step": 285530 }, { "epoch": 0.74, "learning_rate": 0.00018897586972919868, "loss": 0.0153, "step": 285540 }, { "epoch": 0.74, "learning_rate": 0.00018897198151282722, "loss": 0.0167, "step": 285550 }, { "epoch": 0.74, "learning_rate": 0.00018896809329645574, "loss": 0.0168, "step": 285560 }, { "epoch": 0.74, "learning_rate": 0.0001889642050800843, "loss": 0.0145, "step": 285570 }, { "epoch": 0.74, "learning_rate": 0.00018896031686371282, "loss": 0.0142, "step": 285580 }, { "epoch": 0.74, "learning_rate": 0.00018895642864734136, "loss": 0.0149, "step": 285590 }, { "epoch": 0.74, "learning_rate": 0.00018895254043096988, "loss": 0.0136, "step": 285600 }, { "epoch": 0.74, "learning_rate": 0.00018894865221459842, "loss": 0.0144, "step": 285610 }, { "epoch": 0.74, "learning_rate": 0.00018894476399822696, "loss": 0.0118, "step": 285620 }, { "epoch": 0.74, "learning_rate": 0.0001889408757818555, "loss": 0.0169, "step": 285630 }, { "epoch": 0.74, "learning_rate": 0.00018893698756548402, "loss": 0.0126, "step": 285640 }, { "epoch": 0.74, "learning_rate": 0.00018893309934911256, "loss": 0.0146, "step": 285650 }, { "epoch": 0.74, "learning_rate": 0.0001889292111327411, "loss": 0.0155, "step": 285660 }, { "epoch": 0.74, "learning_rate": 0.00018892532291636964, "loss": 0.0177, "step": 285670 }, { "epoch": 0.74, "learning_rate": 0.00018892143469999815, "loss": 0.0151, "step": 285680 }, { "epoch": 0.74, "learning_rate": 0.0001889175464836267, "loss": 0.0129, "step": 285690 }, { "epoch": 0.74, "learning_rate": 0.00018891365826725526, "loss": 0.0173, "step": 285700 }, { "epoch": 0.74, "learning_rate": 0.00018890977005088378, "loss": 0.0145, "step": 285710 }, { "epoch": 0.74, "learning_rate": 0.0001889058818345123, "loss": 0.0135, "step": 285720 }, { "epoch": 0.74, "learning_rate": 0.00018890199361814084, "loss": 0.0154, "step": 285730 }, { "epoch": 0.74, "learning_rate": 0.0001888981054017694, "loss": 0.0122, "step": 285740 }, { "epoch": 0.74, "learning_rate": 0.00018889421718539792, "loss": 0.0136, "step": 285750 }, { "epoch": 0.74, "learning_rate": 0.00018889032896902646, "loss": 0.0147, "step": 285760 }, { "epoch": 0.74, "learning_rate": 0.00018888644075265498, "loss": 0.0113, "step": 285770 }, { "epoch": 0.74, "learning_rate": 0.00018888255253628354, "loss": 0.0143, "step": 285780 }, { "epoch": 0.74, "learning_rate": 0.00018887866431991206, "loss": 0.0132, "step": 285790 }, { "epoch": 0.74, "learning_rate": 0.0001888747761035406, "loss": 0.0179, "step": 285800 }, { "epoch": 0.74, "learning_rate": 0.00018887088788716911, "loss": 0.0159, "step": 285810 }, { "epoch": 0.74, "learning_rate": 0.00018886699967079766, "loss": 0.0157, "step": 285820 }, { "epoch": 0.74, "learning_rate": 0.0001888631114544262, "loss": 0.0216, "step": 285830 }, { "epoch": 0.74, "learning_rate": 0.00018885922323805474, "loss": 0.0137, "step": 285840 }, { "epoch": 0.74, "learning_rate": 0.00018885533502168325, "loss": 0.0187, "step": 285850 }, { "epoch": 0.74, "learning_rate": 0.0001888514468053118, "loss": 0.0165, "step": 285860 }, { "epoch": 0.74, "learning_rate": 0.00018884755858894036, "loss": 0.0125, "step": 285870 }, { "epoch": 0.74, "learning_rate": 0.00018884367037256888, "loss": 0.0096, "step": 285880 }, { "epoch": 0.74, "learning_rate": 0.0001888397821561974, "loss": 0.0175, "step": 285890 }, { "epoch": 0.74, "learning_rate": 0.00018883589393982594, "loss": 0.011, "step": 285900 }, { "epoch": 0.74, "learning_rate": 0.0001888320057234545, "loss": 0.0144, "step": 285910 }, { "epoch": 0.74, "learning_rate": 0.00018882811750708302, "loss": 0.0139, "step": 285920 }, { "epoch": 0.74, "learning_rate": 0.00018882422929071156, "loss": 0.0123, "step": 285930 }, { "epoch": 0.74, "learning_rate": 0.00018882034107434007, "loss": 0.0127, "step": 285940 }, { "epoch": 0.74, "learning_rate": 0.00018881645285796864, "loss": 0.0138, "step": 285950 }, { "epoch": 0.74, "learning_rate": 0.00018881256464159716, "loss": 0.012, "step": 285960 }, { "epoch": 0.74, "learning_rate": 0.0001888086764252257, "loss": 0.0152, "step": 285970 }, { "epoch": 0.74, "learning_rate": 0.00018880478820885421, "loss": 0.0156, "step": 285980 }, { "epoch": 0.74, "learning_rate": 0.00018880089999248278, "loss": 0.015, "step": 285990 }, { "epoch": 0.74, "learning_rate": 0.0001887970117761113, "loss": 0.0144, "step": 286000 }, { "epoch": 0.74, "eval_cer": 0.8816928888646285, "eval_loss": 0.00980143342167139, "eval_runtime": 107.852, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 286000 }, { "epoch": 0.74, "learning_rate": 0.00018879312355973984, "loss": 0.0133, "step": 286010 }, { "epoch": 0.74, "learning_rate": 0.00018878923534336835, "loss": 0.0156, "step": 286020 }, { "epoch": 0.74, "learning_rate": 0.00018878534712699692, "loss": 0.0124, "step": 286030 }, { "epoch": 0.74, "learning_rate": 0.00018878145891062544, "loss": 0.0172, "step": 286040 }, { "epoch": 0.74, "learning_rate": 0.00018877757069425398, "loss": 0.0163, "step": 286050 }, { "epoch": 0.74, "learning_rate": 0.0001887736824778825, "loss": 0.0118, "step": 286060 }, { "epoch": 0.74, "learning_rate": 0.00018876979426151103, "loss": 0.0091, "step": 286070 }, { "epoch": 0.74, "learning_rate": 0.0001887659060451396, "loss": 0.0165, "step": 286080 }, { "epoch": 0.74, "learning_rate": 0.00018876201782876812, "loss": 0.0164, "step": 286090 }, { "epoch": 0.74, "learning_rate": 0.00018875812961239666, "loss": 0.0143, "step": 286100 }, { "epoch": 0.74, "learning_rate": 0.00018875424139602517, "loss": 0.0163, "step": 286110 }, { "epoch": 0.74, "learning_rate": 0.00018875035317965374, "loss": 0.016, "step": 286120 }, { "epoch": 0.74, "learning_rate": 0.00018874646496328226, "loss": 0.0115, "step": 286130 }, { "epoch": 0.74, "learning_rate": 0.0001887425767469108, "loss": 0.0146, "step": 286140 }, { "epoch": 0.74, "learning_rate": 0.0001887386885305393, "loss": 0.0121, "step": 286150 }, { "epoch": 0.74, "learning_rate": 0.00018873480031416788, "loss": 0.018, "step": 286160 }, { "epoch": 0.74, "learning_rate": 0.0001887309120977964, "loss": 0.0166, "step": 286170 }, { "epoch": 0.74, "learning_rate": 0.00018872702388142494, "loss": 0.014, "step": 286180 }, { "epoch": 0.74, "learning_rate": 0.00018872313566505345, "loss": 0.0131, "step": 286190 }, { "epoch": 0.74, "learning_rate": 0.00018871924744868202, "loss": 0.0142, "step": 286200 }, { "epoch": 0.74, "learning_rate": 0.00018871535923231054, "loss": 0.0153, "step": 286210 }, { "epoch": 0.74, "learning_rate": 0.00018871147101593908, "loss": 0.016, "step": 286220 }, { "epoch": 0.74, "learning_rate": 0.0001887075827995676, "loss": 0.0158, "step": 286230 }, { "epoch": 0.74, "learning_rate": 0.00018870369458319616, "loss": 0.0134, "step": 286240 }, { "epoch": 0.74, "learning_rate": 0.0001886998063668247, "loss": 0.0157, "step": 286250 }, { "epoch": 0.74, "learning_rate": 0.00018869591815045322, "loss": 0.0108, "step": 286260 }, { "epoch": 0.74, "learning_rate": 0.00018869202993408176, "loss": 0.014, "step": 286270 }, { "epoch": 0.74, "learning_rate": 0.0001886881417177103, "loss": 0.015, "step": 286280 }, { "epoch": 0.74, "learning_rate": 0.00018868425350133884, "loss": 0.0153, "step": 286290 }, { "epoch": 0.74, "learning_rate": 0.00018868036528496736, "loss": 0.0164, "step": 286300 }, { "epoch": 0.74, "learning_rate": 0.0001886764770685959, "loss": 0.0164, "step": 286310 }, { "epoch": 0.74, "learning_rate": 0.0001886725888522244, "loss": 0.019, "step": 286320 }, { "epoch": 0.74, "learning_rate": 0.00018866870063585298, "loss": 0.0138, "step": 286330 }, { "epoch": 0.74, "learning_rate": 0.0001886648124194815, "loss": 0.0165, "step": 286340 }, { "epoch": 0.74, "learning_rate": 0.00018866092420311004, "loss": 0.0179, "step": 286350 }, { "epoch": 0.74, "learning_rate": 0.00018865703598673855, "loss": 0.0121, "step": 286360 }, { "epoch": 0.74, "learning_rate": 0.00018865314777036712, "loss": 0.016, "step": 286370 }, { "epoch": 0.74, "learning_rate": 0.00018864925955399564, "loss": 0.0133, "step": 286380 }, { "epoch": 0.74, "learning_rate": 0.00018864537133762418, "loss": 0.0143, "step": 286390 }, { "epoch": 0.74, "learning_rate": 0.0001886414831212527, "loss": 0.0151, "step": 286400 }, { "epoch": 0.74, "learning_rate": 0.00018863759490488126, "loss": 0.0155, "step": 286410 }, { "epoch": 0.74, "learning_rate": 0.0001886337066885098, "loss": 0.0175, "step": 286420 }, { "epoch": 0.74, "learning_rate": 0.00018862981847213832, "loss": 0.0164, "step": 286430 }, { "epoch": 0.74, "learning_rate": 0.00018862593025576683, "loss": 0.0146, "step": 286440 }, { "epoch": 0.74, "learning_rate": 0.0001886220420393954, "loss": 0.0134, "step": 286450 }, { "epoch": 0.74, "learning_rate": 0.00018861815382302394, "loss": 0.0138, "step": 286460 }, { "epoch": 0.74, "learning_rate": 0.00018861426560665246, "loss": 0.0147, "step": 286470 }, { "epoch": 0.74, "learning_rate": 0.000188610377390281, "loss": 0.0178, "step": 286480 }, { "epoch": 0.74, "learning_rate": 0.00018860648917390954, "loss": 0.0173, "step": 286490 }, { "epoch": 0.74, "learning_rate": 0.00018860260095753808, "loss": 0.0148, "step": 286500 }, { "epoch": 0.74, "learning_rate": 0.0001885987127411666, "loss": 0.0154, "step": 286510 }, { "epoch": 0.74, "learning_rate": 0.00018859482452479514, "loss": 0.015, "step": 286520 }, { "epoch": 0.74, "learning_rate": 0.00018859093630842368, "loss": 0.0143, "step": 286530 }, { "epoch": 0.74, "learning_rate": 0.00018858704809205222, "loss": 0.0168, "step": 286540 }, { "epoch": 0.74, "learning_rate": 0.00018858315987568073, "loss": 0.015, "step": 286550 }, { "epoch": 0.74, "learning_rate": 0.00018857927165930928, "loss": 0.0136, "step": 286560 }, { "epoch": 0.74, "learning_rate": 0.0001885753834429378, "loss": 0.0132, "step": 286570 }, { "epoch": 0.74, "learning_rate": 0.00018857149522656636, "loss": 0.0138, "step": 286580 }, { "epoch": 0.74, "learning_rate": 0.00018856760701019487, "loss": 0.0145, "step": 286590 }, { "epoch": 0.74, "learning_rate": 0.00018856371879382342, "loss": 0.0147, "step": 286600 }, { "epoch": 0.74, "learning_rate": 0.00018855983057745193, "loss": 0.0131, "step": 286610 }, { "epoch": 0.74, "learning_rate": 0.0001885559423610805, "loss": 0.0162, "step": 286620 }, { "epoch": 0.74, "learning_rate": 0.00018855205414470904, "loss": 0.0141, "step": 286630 }, { "epoch": 0.74, "learning_rate": 0.00018854816592833756, "loss": 0.0133, "step": 286640 }, { "epoch": 0.74, "learning_rate": 0.0001885442777119661, "loss": 0.0171, "step": 286650 }, { "epoch": 0.74, "learning_rate": 0.00018854038949559464, "loss": 0.0151, "step": 286660 }, { "epoch": 0.74, "learning_rate": 0.00018853650127922318, "loss": 0.0132, "step": 286670 }, { "epoch": 0.74, "learning_rate": 0.0001885326130628517, "loss": 0.0123, "step": 286680 }, { "epoch": 0.74, "learning_rate": 0.00018852872484648024, "loss": 0.0124, "step": 286690 }, { "epoch": 0.74, "learning_rate": 0.00018852483663010878, "loss": 0.018, "step": 286700 }, { "epoch": 0.74, "learning_rate": 0.00018852094841373732, "loss": 0.0154, "step": 286710 }, { "epoch": 0.74, "learning_rate": 0.00018851706019736583, "loss": 0.0164, "step": 286720 }, { "epoch": 0.74, "learning_rate": 0.00018851317198099438, "loss": 0.013, "step": 286730 }, { "epoch": 0.74, "learning_rate": 0.00018850928376462294, "loss": 0.0136, "step": 286740 }, { "epoch": 0.74, "learning_rate": 0.00018850539554825146, "loss": 0.0149, "step": 286750 }, { "epoch": 0.74, "learning_rate": 0.00018850150733187997, "loss": 0.0144, "step": 286760 }, { "epoch": 0.74, "learning_rate": 0.00018849761911550852, "loss": 0.0114, "step": 286770 }, { "epoch": 0.74, "learning_rate": 0.00018849373089913708, "loss": 0.0131, "step": 286780 }, { "epoch": 0.74, "learning_rate": 0.0001884898426827656, "loss": 0.0155, "step": 286790 }, { "epoch": 0.74, "learning_rate": 0.00018848595446639414, "loss": 0.0161, "step": 286800 }, { "epoch": 0.74, "learning_rate": 0.00018848206625002265, "loss": 0.0156, "step": 286810 }, { "epoch": 0.74, "learning_rate": 0.0001884781780336512, "loss": 0.0152, "step": 286820 }, { "epoch": 0.74, "learning_rate": 0.00018847428981727974, "loss": 0.0155, "step": 286830 }, { "epoch": 0.74, "learning_rate": 0.00018847040160090828, "loss": 0.0125, "step": 286840 }, { "epoch": 0.74, "learning_rate": 0.0001884665133845368, "loss": 0.021, "step": 286850 }, { "epoch": 0.74, "learning_rate": 0.00018846262516816534, "loss": 0.0215, "step": 286860 }, { "epoch": 0.74, "learning_rate": 0.00018845873695179388, "loss": 0.0153, "step": 286870 }, { "epoch": 0.74, "learning_rate": 0.00018845484873542242, "loss": 0.0209, "step": 286880 }, { "epoch": 0.74, "learning_rate": 0.00018845096051905093, "loss": 0.0141, "step": 286890 }, { "epoch": 0.74, "learning_rate": 0.00018844707230267948, "loss": 0.0115, "step": 286900 }, { "epoch": 0.74, "learning_rate": 0.00018844318408630802, "loss": 0.0106, "step": 286910 }, { "epoch": 0.74, "learning_rate": 0.00018843929586993656, "loss": 0.014, "step": 286920 }, { "epoch": 0.74, "learning_rate": 0.00018843540765356507, "loss": 0.0173, "step": 286930 }, { "epoch": 0.74, "learning_rate": 0.00018843151943719361, "loss": 0.0147, "step": 286940 }, { "epoch": 0.74, "learning_rate": 0.00018842763122082218, "loss": 0.0183, "step": 286950 }, { "epoch": 0.74, "learning_rate": 0.0001884237430044507, "loss": 0.0168, "step": 286960 }, { "epoch": 0.74, "learning_rate": 0.00018841985478807924, "loss": 0.0136, "step": 286970 }, { "epoch": 0.74, "learning_rate": 0.00018841596657170775, "loss": 0.0145, "step": 286980 }, { "epoch": 0.74, "learning_rate": 0.00018841207835533632, "loss": 0.0176, "step": 286990 }, { "epoch": 0.74, "learning_rate": 0.00018840819013896484, "loss": 0.0137, "step": 287000 }, { "epoch": 0.74, "eval_cer": 0.8817096845078387, "eval_loss": 0.010108675807714462, "eval_runtime": 107.8967, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 287000 }, { "epoch": 0.74, "learning_rate": 0.00018840430192259338, "loss": 0.0134, "step": 287010 }, { "epoch": 0.74, "learning_rate": 0.0001884004137062219, "loss": 0.0159, "step": 287020 }, { "epoch": 0.74, "learning_rate": 0.00018839652548985046, "loss": 0.016, "step": 287030 }, { "epoch": 0.74, "learning_rate": 0.00018839263727347898, "loss": 0.0153, "step": 287040 }, { "epoch": 0.74, "learning_rate": 0.00018838874905710752, "loss": 0.0172, "step": 287050 }, { "epoch": 0.74, "learning_rate": 0.00018838486084073603, "loss": 0.0168, "step": 287060 }, { "epoch": 0.74, "learning_rate": 0.00018838097262436457, "loss": 0.0155, "step": 287070 }, { "epoch": 0.74, "learning_rate": 0.00018837708440799312, "loss": 0.0167, "step": 287080 }, { "epoch": 0.74, "learning_rate": 0.00018837319619162166, "loss": 0.0141, "step": 287090 }, { "epoch": 0.74, "learning_rate": 0.00018836930797525017, "loss": 0.0173, "step": 287100 }, { "epoch": 0.74, "learning_rate": 0.00018836541975887871, "loss": 0.0125, "step": 287110 }, { "epoch": 0.74, "learning_rate": 0.00018836153154250728, "loss": 0.0162, "step": 287120 }, { "epoch": 0.74, "learning_rate": 0.0001883576433261358, "loss": 0.0167, "step": 287130 }, { "epoch": 0.74, "learning_rate": 0.00018835375510976434, "loss": 0.0153, "step": 287140 }, { "epoch": 0.74, "learning_rate": 0.00018834986689339285, "loss": 0.0182, "step": 287150 }, { "epoch": 0.74, "learning_rate": 0.00018834597867702142, "loss": 0.0127, "step": 287160 }, { "epoch": 0.74, "learning_rate": 0.00018834209046064994, "loss": 0.0139, "step": 287170 }, { "epoch": 0.74, "learning_rate": 0.00018833820224427848, "loss": 0.0168, "step": 287180 }, { "epoch": 0.74, "learning_rate": 0.000188334314027907, "loss": 0.0133, "step": 287190 }, { "epoch": 0.74, "learning_rate": 0.00018833042581153556, "loss": 0.0171, "step": 287200 }, { "epoch": 0.74, "learning_rate": 0.00018832653759516408, "loss": 0.0137, "step": 287210 }, { "epoch": 0.74, "learning_rate": 0.00018832264937879262, "loss": 0.0137, "step": 287220 }, { "epoch": 0.74, "learning_rate": 0.00018831876116242113, "loss": 0.0144, "step": 287230 }, { "epoch": 0.74, "learning_rate": 0.0001883148729460497, "loss": 0.0158, "step": 287240 }, { "epoch": 0.74, "learning_rate": 0.00018831098472967822, "loss": 0.0134, "step": 287250 }, { "epoch": 0.74, "learning_rate": 0.00018830709651330676, "loss": 0.0112, "step": 287260 }, { "epoch": 0.74, "learning_rate": 0.00018830320829693527, "loss": 0.0119, "step": 287270 }, { "epoch": 0.74, "learning_rate": 0.00018829932008056384, "loss": 0.0154, "step": 287280 }, { "epoch": 0.74, "learning_rate": 0.00018829543186419238, "loss": 0.0144, "step": 287290 }, { "epoch": 0.74, "learning_rate": 0.0001882915436478209, "loss": 0.0123, "step": 287300 }, { "epoch": 0.74, "learning_rate": 0.0001882876554314494, "loss": 0.012, "step": 287310 }, { "epoch": 0.74, "learning_rate": 0.00018828376721507795, "loss": 0.0187, "step": 287320 }, { "epoch": 0.74, "learning_rate": 0.00018827987899870652, "loss": 0.014, "step": 287330 }, { "epoch": 0.74, "learning_rate": 0.00018827599078233504, "loss": 0.0122, "step": 287340 }, { "epoch": 0.74, "learning_rate": 0.00018827210256596358, "loss": 0.0167, "step": 287350 }, { "epoch": 0.74, "learning_rate": 0.0001882682143495921, "loss": 0.0132, "step": 287360 }, { "epoch": 0.74, "learning_rate": 0.00018826432613322066, "loss": 0.0165, "step": 287370 }, { "epoch": 0.74, "learning_rate": 0.00018826043791684918, "loss": 0.0167, "step": 287380 }, { "epoch": 0.74, "learning_rate": 0.00018825654970047772, "loss": 0.0185, "step": 287390 }, { "epoch": 0.74, "learning_rate": 0.00018825266148410623, "loss": 0.0132, "step": 287400 }, { "epoch": 0.75, "learning_rate": 0.0001882487732677348, "loss": 0.0175, "step": 287410 }, { "epoch": 0.75, "learning_rate": 0.00018824488505136332, "loss": 0.0118, "step": 287420 }, { "epoch": 0.75, "learning_rate": 0.00018824099683499186, "loss": 0.0132, "step": 287430 }, { "epoch": 0.75, "learning_rate": 0.00018823710861862037, "loss": 0.0154, "step": 287440 }, { "epoch": 0.75, "learning_rate": 0.00018823322040224894, "loss": 0.0112, "step": 287450 }, { "epoch": 0.75, "learning_rate": 0.00018822933218587748, "loss": 0.0122, "step": 287460 }, { "epoch": 0.75, "learning_rate": 0.000188225443969506, "loss": 0.0128, "step": 287470 }, { "epoch": 0.75, "learning_rate": 0.0001882215557531345, "loss": 0.016, "step": 287480 }, { "epoch": 0.75, "learning_rate": 0.00018821766753676308, "loss": 0.0125, "step": 287490 }, { "epoch": 0.75, "learning_rate": 0.00018821377932039162, "loss": 0.0145, "step": 287500 }, { "epoch": 0.75, "learning_rate": 0.00018820989110402014, "loss": 0.0167, "step": 287510 }, { "epoch": 0.75, "learning_rate": 0.00018820600288764868, "loss": 0.0138, "step": 287520 }, { "epoch": 0.75, "learning_rate": 0.00018820211467127722, "loss": 0.0136, "step": 287530 }, { "epoch": 0.75, "learning_rate": 0.00018819822645490576, "loss": 0.0113, "step": 287540 }, { "epoch": 0.75, "learning_rate": 0.00018819433823853428, "loss": 0.0129, "step": 287550 }, { "epoch": 0.75, "learning_rate": 0.00018819045002216282, "loss": 0.0147, "step": 287560 }, { "epoch": 0.75, "learning_rate": 0.00018818656180579133, "loss": 0.0172, "step": 287570 }, { "epoch": 0.75, "learning_rate": 0.0001881826735894199, "loss": 0.0191, "step": 287580 }, { "epoch": 0.75, "learning_rate": 0.00018817878537304841, "loss": 0.0156, "step": 287590 }, { "epoch": 0.75, "learning_rate": 0.00018817489715667696, "loss": 0.0153, "step": 287600 }, { "epoch": 0.75, "learning_rate": 0.00018817100894030547, "loss": 0.0165, "step": 287610 }, { "epoch": 0.75, "learning_rate": 0.00018816712072393404, "loss": 0.0144, "step": 287620 }, { "epoch": 0.75, "learning_rate": 0.00018816323250756255, "loss": 0.0122, "step": 287630 }, { "epoch": 0.75, "learning_rate": 0.0001881593442911911, "loss": 0.0149, "step": 287640 }, { "epoch": 0.75, "learning_rate": 0.0001881554560748196, "loss": 0.0167, "step": 287650 }, { "epoch": 0.75, "learning_rate": 0.00018815156785844818, "loss": 0.0172, "step": 287660 }, { "epoch": 0.75, "learning_rate": 0.00018814767964207672, "loss": 0.0111, "step": 287670 }, { "epoch": 0.75, "learning_rate": 0.00018814379142570524, "loss": 0.0126, "step": 287680 }, { "epoch": 0.75, "learning_rate": 0.00018813990320933378, "loss": 0.0124, "step": 287690 }, { "epoch": 0.75, "learning_rate": 0.00018813601499296232, "loss": 0.0175, "step": 287700 }, { "epoch": 0.75, "learning_rate": 0.00018813212677659086, "loss": 0.0165, "step": 287710 }, { "epoch": 0.75, "learning_rate": 0.00018812823856021937, "loss": 0.0171, "step": 287720 }, { "epoch": 0.75, "learning_rate": 0.00018812435034384792, "loss": 0.0184, "step": 287730 }, { "epoch": 0.75, "learning_rate": 0.00018812046212747646, "loss": 0.0147, "step": 287740 }, { "epoch": 0.75, "learning_rate": 0.000188116573911105, "loss": 0.0153, "step": 287750 }, { "epoch": 0.75, "learning_rate": 0.00018811268569473351, "loss": 0.0147, "step": 287760 }, { "epoch": 0.75, "learning_rate": 0.00018810879747836206, "loss": 0.0133, "step": 287770 }, { "epoch": 0.75, "learning_rate": 0.0001881049092619906, "loss": 0.0158, "step": 287780 }, { "epoch": 0.75, "learning_rate": 0.00018810102104561914, "loss": 0.0156, "step": 287790 }, { "epoch": 0.75, "learning_rate": 0.00018809713282924765, "loss": 0.0139, "step": 287800 }, { "epoch": 0.75, "learning_rate": 0.0001880932446128762, "loss": 0.0117, "step": 287810 }, { "epoch": 0.75, "learning_rate": 0.0001880893563965047, "loss": 0.0139, "step": 287820 }, { "epoch": 0.75, "learning_rate": 0.00018808546818013328, "loss": 0.0116, "step": 287830 }, { "epoch": 0.75, "learning_rate": 0.00018808157996376182, "loss": 0.017, "step": 287840 }, { "epoch": 0.75, "learning_rate": 0.00018807769174739033, "loss": 0.0169, "step": 287850 }, { "epoch": 0.75, "learning_rate": 0.00018807380353101888, "loss": 0.0175, "step": 287860 }, { "epoch": 0.75, "learning_rate": 0.00018806991531464742, "loss": 0.0166, "step": 287870 }, { "epoch": 0.75, "learning_rate": 0.00018806602709827596, "loss": 0.0152, "step": 287880 }, { "epoch": 0.75, "learning_rate": 0.00018806213888190447, "loss": 0.0121, "step": 287890 }, { "epoch": 0.75, "learning_rate": 0.00018805825066553302, "loss": 0.0138, "step": 287900 }, { "epoch": 0.75, "learning_rate": 0.00018805436244916156, "loss": 0.0149, "step": 287910 }, { "epoch": 0.75, "learning_rate": 0.0001880504742327901, "loss": 0.0164, "step": 287920 }, { "epoch": 0.75, "learning_rate": 0.00018804658601641861, "loss": 0.0154, "step": 287930 }, { "epoch": 0.75, "learning_rate": 0.00018804269780004716, "loss": 0.0141, "step": 287940 }, { "epoch": 0.75, "learning_rate": 0.0001880388095836757, "loss": 0.0136, "step": 287950 }, { "epoch": 0.75, "learning_rate": 0.00018803492136730424, "loss": 0.0178, "step": 287960 }, { "epoch": 0.75, "learning_rate": 0.00018803103315093275, "loss": 0.0142, "step": 287970 }, { "epoch": 0.75, "learning_rate": 0.0001880271449345613, "loss": 0.0124, "step": 287980 }, { "epoch": 0.75, "learning_rate": 0.00018802325671818986, "loss": 0.0129, "step": 287990 }, { "epoch": 0.75, "learning_rate": 0.00018801936850181838, "loss": 0.016, "step": 288000 }, { "epoch": 0.75, "eval_cer": 0.8817138834186412, "eval_loss": 0.009974485263228416, "eval_runtime": 107.8815, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 288000 }, { "epoch": 0.75, "learning_rate": 0.00018801548028544692, "loss": 0.0131, "step": 288010 }, { "epoch": 0.75, "learning_rate": 0.00018801159206907543, "loss": 0.0137, "step": 288020 }, { "epoch": 0.75, "learning_rate": 0.000188007703852704, "loss": 0.0153, "step": 288030 }, { "epoch": 0.75, "learning_rate": 0.00018800381563633252, "loss": 0.0122, "step": 288040 }, { "epoch": 0.75, "learning_rate": 0.00018799992741996106, "loss": 0.0142, "step": 288050 }, { "epoch": 0.75, "learning_rate": 0.00018799603920358957, "loss": 0.0153, "step": 288060 }, { "epoch": 0.75, "learning_rate": 0.00018799215098721812, "loss": 0.0135, "step": 288070 }, { "epoch": 0.75, "learning_rate": 0.00018798826277084666, "loss": 0.0201, "step": 288080 }, { "epoch": 0.75, "learning_rate": 0.0001879843745544752, "loss": 0.0167, "step": 288090 }, { "epoch": 0.75, "learning_rate": 0.0001879804863381037, "loss": 0.0146, "step": 288100 }, { "epoch": 0.75, "learning_rate": 0.00018797659812173225, "loss": 0.0161, "step": 288110 }, { "epoch": 0.75, "learning_rate": 0.0001879727099053608, "loss": 0.0146, "step": 288120 }, { "epoch": 0.75, "learning_rate": 0.00018796882168898934, "loss": 0.0125, "step": 288130 }, { "epoch": 0.75, "learning_rate": 0.00018796493347261785, "loss": 0.0191, "step": 288140 }, { "epoch": 0.75, "learning_rate": 0.0001879610452562464, "loss": 0.0133, "step": 288150 }, { "epoch": 0.75, "learning_rate": 0.00018795715703987496, "loss": 0.0134, "step": 288160 }, { "epoch": 0.75, "learning_rate": 0.00018795326882350348, "loss": 0.0217, "step": 288170 }, { "epoch": 0.75, "learning_rate": 0.000187949380607132, "loss": 0.0117, "step": 288180 }, { "epoch": 0.75, "learning_rate": 0.00018794549239076053, "loss": 0.0186, "step": 288190 }, { "epoch": 0.75, "learning_rate": 0.0001879416041743891, "loss": 0.0206, "step": 288200 }, { "epoch": 0.75, "learning_rate": 0.00018793771595801762, "loss": 0.0158, "step": 288210 }, { "epoch": 0.75, "learning_rate": 0.00018793382774164616, "loss": 0.0103, "step": 288220 }, { "epoch": 0.75, "learning_rate": 0.00018792993952527467, "loss": 0.0146, "step": 288230 }, { "epoch": 0.75, "learning_rate": 0.00018792605130890324, "loss": 0.0206, "step": 288240 }, { "epoch": 0.75, "learning_rate": 0.00018792216309253176, "loss": 0.0166, "step": 288250 }, { "epoch": 0.75, "learning_rate": 0.0001879182748761603, "loss": 0.0151, "step": 288260 }, { "epoch": 0.75, "learning_rate": 0.0001879143866597888, "loss": 0.015, "step": 288270 }, { "epoch": 0.75, "learning_rate": 0.00018791049844341738, "loss": 0.014, "step": 288280 }, { "epoch": 0.75, "learning_rate": 0.0001879066102270459, "loss": 0.0134, "step": 288290 }, { "epoch": 0.75, "learning_rate": 0.00018790272201067444, "loss": 0.0216, "step": 288300 }, { "epoch": 0.75, "learning_rate": 0.00018789883379430295, "loss": 0.017, "step": 288310 }, { "epoch": 0.75, "learning_rate": 0.0001878949455779315, "loss": 0.0147, "step": 288320 }, { "epoch": 0.75, "learning_rate": 0.00018789105736156006, "loss": 0.0137, "step": 288330 }, { "epoch": 0.75, "learning_rate": 0.00018788716914518858, "loss": 0.0143, "step": 288340 }, { "epoch": 0.75, "learning_rate": 0.0001878832809288171, "loss": 0.0132, "step": 288350 }, { "epoch": 0.75, "learning_rate": 0.00018787939271244563, "loss": 0.0141, "step": 288360 }, { "epoch": 0.75, "learning_rate": 0.0001878755044960742, "loss": 0.0143, "step": 288370 }, { "epoch": 0.75, "learning_rate": 0.00018787161627970272, "loss": 0.02, "step": 288380 }, { "epoch": 0.75, "learning_rate": 0.00018786772806333126, "loss": 0.0139, "step": 288390 }, { "epoch": 0.75, "learning_rate": 0.00018786383984695977, "loss": 0.0134, "step": 288400 }, { "epoch": 0.75, "learning_rate": 0.00018785995163058834, "loss": 0.014, "step": 288410 }, { "epoch": 0.75, "learning_rate": 0.00018785606341421686, "loss": 0.0153, "step": 288420 }, { "epoch": 0.75, "learning_rate": 0.0001878521751978454, "loss": 0.0106, "step": 288430 }, { "epoch": 0.75, "learning_rate": 0.0001878482869814739, "loss": 0.0141, "step": 288440 }, { "epoch": 0.75, "learning_rate": 0.00018784439876510248, "loss": 0.0134, "step": 288450 }, { "epoch": 0.75, "learning_rate": 0.000187840510548731, "loss": 0.0137, "step": 288460 }, { "epoch": 0.75, "learning_rate": 0.00018783662233235954, "loss": 0.0141, "step": 288470 }, { "epoch": 0.75, "learning_rate": 0.00018783273411598805, "loss": 0.0162, "step": 288480 }, { "epoch": 0.75, "learning_rate": 0.00018782884589961662, "loss": 0.0115, "step": 288490 }, { "epoch": 0.75, "learning_rate": 0.00018782495768324513, "loss": 0.0142, "step": 288500 }, { "epoch": 0.75, "learning_rate": 0.00018782106946687368, "loss": 0.0128, "step": 288510 }, { "epoch": 0.75, "learning_rate": 0.0001878171812505022, "loss": 0.0123, "step": 288520 }, { "epoch": 0.75, "learning_rate": 0.00018781329303413076, "loss": 0.0137, "step": 288530 }, { "epoch": 0.75, "learning_rate": 0.0001878094048177593, "loss": 0.0123, "step": 288540 }, { "epoch": 0.75, "learning_rate": 0.00018780551660138782, "loss": 0.0142, "step": 288550 }, { "epoch": 0.75, "learning_rate": 0.00018780162838501636, "loss": 0.014, "step": 288560 }, { "epoch": 0.75, "learning_rate": 0.00018779774016864487, "loss": 0.0131, "step": 288570 }, { "epoch": 0.75, "learning_rate": 0.00018779385195227344, "loss": 0.02, "step": 288580 }, { "epoch": 0.75, "learning_rate": 0.00018778996373590196, "loss": 0.0145, "step": 288590 }, { "epoch": 0.75, "learning_rate": 0.0001877860755195305, "loss": 0.0157, "step": 288600 }, { "epoch": 0.75, "learning_rate": 0.000187782187303159, "loss": 0.013, "step": 288610 }, { "epoch": 0.75, "learning_rate": 0.00018777829908678758, "loss": 0.0134, "step": 288620 }, { "epoch": 0.75, "learning_rate": 0.0001877744108704161, "loss": 0.0124, "step": 288630 }, { "epoch": 0.75, "learning_rate": 0.00018777052265404464, "loss": 0.0179, "step": 288640 }, { "epoch": 0.75, "learning_rate": 0.00018776663443767315, "loss": 0.0156, "step": 288650 }, { "epoch": 0.75, "learning_rate": 0.00018776274622130172, "loss": 0.0202, "step": 288660 }, { "epoch": 0.75, "learning_rate": 0.00018775885800493023, "loss": 0.0133, "step": 288670 }, { "epoch": 0.75, "learning_rate": 0.00018775496978855878, "loss": 0.014, "step": 288680 }, { "epoch": 0.75, "learning_rate": 0.0001877510815721873, "loss": 0.0146, "step": 288690 }, { "epoch": 0.75, "learning_rate": 0.00018774719335581586, "loss": 0.0121, "step": 288700 }, { "epoch": 0.75, "learning_rate": 0.0001877433051394444, "loss": 0.0098, "step": 288710 }, { "epoch": 0.75, "learning_rate": 0.00018773941692307292, "loss": 0.0146, "step": 288720 }, { "epoch": 0.75, "learning_rate": 0.00018773552870670146, "loss": 0.0142, "step": 288730 }, { "epoch": 0.75, "learning_rate": 0.00018773164049033, "loss": 0.0111, "step": 288740 }, { "epoch": 0.75, "learning_rate": 0.00018772775227395854, "loss": 0.0174, "step": 288750 }, { "epoch": 0.75, "learning_rate": 0.00018772386405758705, "loss": 0.0151, "step": 288760 }, { "epoch": 0.75, "learning_rate": 0.0001877199758412156, "loss": 0.0149, "step": 288770 }, { "epoch": 0.75, "learning_rate": 0.00018771608762484414, "loss": 0.0173, "step": 288780 }, { "epoch": 0.75, "learning_rate": 0.00018771219940847268, "loss": 0.0156, "step": 288790 }, { "epoch": 0.75, "learning_rate": 0.0001877083111921012, "loss": 0.0151, "step": 288800 }, { "epoch": 0.75, "learning_rate": 0.00018770442297572974, "loss": 0.014, "step": 288810 }, { "epoch": 0.75, "learning_rate": 0.00018770053475935825, "loss": 0.0151, "step": 288820 }, { "epoch": 0.75, "learning_rate": 0.00018769664654298682, "loss": 0.0149, "step": 288830 }, { "epoch": 0.75, "learning_rate": 0.00018769275832661533, "loss": 0.0145, "step": 288840 }, { "epoch": 0.75, "learning_rate": 0.00018768887011024388, "loss": 0.0111, "step": 288850 }, { "epoch": 0.75, "learning_rate": 0.0001876849818938724, "loss": 0.0137, "step": 288860 }, { "epoch": 0.75, "learning_rate": 0.00018768109367750096, "loss": 0.014, "step": 288870 }, { "epoch": 0.75, "learning_rate": 0.0001876772054611295, "loss": 0.0143, "step": 288880 }, { "epoch": 0.75, "learning_rate": 0.00018767331724475801, "loss": 0.0127, "step": 288890 }, { "epoch": 0.75, "learning_rate": 0.00018766942902838653, "loss": 0.0125, "step": 288900 }, { "epoch": 0.75, "learning_rate": 0.0001876655408120151, "loss": 0.0123, "step": 288910 }, { "epoch": 0.75, "learning_rate": 0.00018766165259564364, "loss": 0.0168, "step": 288920 }, { "epoch": 0.75, "learning_rate": 0.00018765776437927215, "loss": 0.0143, "step": 288930 }, { "epoch": 0.75, "learning_rate": 0.0001876538761629007, "loss": 0.0124, "step": 288940 }, { "epoch": 0.75, "learning_rate": 0.00018764998794652924, "loss": 0.0154, "step": 288950 }, { "epoch": 0.75, "learning_rate": 0.00018764609973015778, "loss": 0.0125, "step": 288960 }, { "epoch": 0.75, "learning_rate": 0.0001876422115137863, "loss": 0.017, "step": 288970 }, { "epoch": 0.75, "learning_rate": 0.00018763832329741484, "loss": 0.0144, "step": 288980 }, { "epoch": 0.75, "learning_rate": 0.00018763443508104338, "loss": 0.0152, "step": 288990 }, { "epoch": 0.75, "learning_rate": 0.00018763054686467192, "loss": 0.0144, "step": 289000 }, { "epoch": 0.75, "eval_cer": 0.8816816917691551, "eval_loss": 0.0096070421859622, "eval_runtime": 107.8246, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 289000 }, { "epoch": 0.75, "learning_rate": 0.00018762665864830043, "loss": 0.0106, "step": 289010 }, { "epoch": 0.75, "learning_rate": 0.00018762277043192897, "loss": 0.0159, "step": 289020 }, { "epoch": 0.75, "learning_rate": 0.00018761888221555754, "loss": 0.0164, "step": 289030 }, { "epoch": 0.75, "learning_rate": 0.00018761499399918606, "loss": 0.0135, "step": 289040 }, { "epoch": 0.75, "learning_rate": 0.00018761110578281457, "loss": 0.0144, "step": 289050 }, { "epoch": 0.75, "learning_rate": 0.00018760721756644311, "loss": 0.0161, "step": 289060 }, { "epoch": 0.75, "learning_rate": 0.00018760332935007163, "loss": 0.0134, "step": 289070 }, { "epoch": 0.75, "learning_rate": 0.0001875994411337002, "loss": 0.0167, "step": 289080 }, { "epoch": 0.75, "learning_rate": 0.00018759555291732874, "loss": 0.0154, "step": 289090 }, { "epoch": 0.75, "learning_rate": 0.00018759166470095725, "loss": 0.0145, "step": 289100 }, { "epoch": 0.75, "learning_rate": 0.0001875877764845858, "loss": 0.0154, "step": 289110 }, { "epoch": 0.75, "learning_rate": 0.00018758388826821434, "loss": 0.0192, "step": 289120 }, { "epoch": 0.75, "learning_rate": 0.00018758000005184288, "loss": 0.0141, "step": 289130 }, { "epoch": 0.75, "learning_rate": 0.0001875761118354714, "loss": 0.0129, "step": 289140 }, { "epoch": 0.75, "learning_rate": 0.00018757222361909993, "loss": 0.0112, "step": 289150 }, { "epoch": 0.75, "learning_rate": 0.00018756833540272848, "loss": 0.0115, "step": 289160 }, { "epoch": 0.75, "learning_rate": 0.00018756444718635702, "loss": 0.0163, "step": 289170 }, { "epoch": 0.75, "learning_rate": 0.00018756055896998553, "loss": 0.0175, "step": 289180 }, { "epoch": 0.75, "learning_rate": 0.00018755667075361407, "loss": 0.0139, "step": 289190 }, { "epoch": 0.75, "learning_rate": 0.00018755278253724264, "loss": 0.0131, "step": 289200 }, { "epoch": 0.75, "learning_rate": 0.00018754889432087116, "loss": 0.0179, "step": 289210 }, { "epoch": 0.75, "learning_rate": 0.00018754500610449967, "loss": 0.0128, "step": 289220 }, { "epoch": 0.75, "learning_rate": 0.0001875411178881282, "loss": 0.0149, "step": 289230 }, { "epoch": 0.75, "learning_rate": 0.00018753722967175678, "loss": 0.0134, "step": 289240 }, { "epoch": 0.75, "learning_rate": 0.0001875333414553853, "loss": 0.0151, "step": 289250 }, { "epoch": 0.75, "learning_rate": 0.00018752945323901384, "loss": 0.0142, "step": 289260 }, { "epoch": 0.75, "learning_rate": 0.00018752556502264235, "loss": 0.0121, "step": 289270 }, { "epoch": 0.75, "learning_rate": 0.00018752167680627092, "loss": 0.0119, "step": 289280 }, { "epoch": 0.75, "learning_rate": 0.00018751778858989944, "loss": 0.0174, "step": 289290 }, { "epoch": 0.75, "learning_rate": 0.00018751390037352798, "loss": 0.0153, "step": 289300 }, { "epoch": 0.75, "learning_rate": 0.0001875100121571565, "loss": 0.0128, "step": 289310 }, { "epoch": 0.75, "learning_rate": 0.00018750612394078503, "loss": 0.0173, "step": 289320 }, { "epoch": 0.75, "learning_rate": 0.00018750223572441358, "loss": 0.0157, "step": 289330 }, { "epoch": 0.75, "learning_rate": 0.00018749834750804212, "loss": 0.0159, "step": 289340 }, { "epoch": 0.75, "learning_rate": 0.00018749445929167063, "loss": 0.0139, "step": 289350 }, { "epoch": 0.75, "learning_rate": 0.00018749057107529917, "loss": 0.0173, "step": 289360 }, { "epoch": 0.75, "learning_rate": 0.00018748668285892771, "loss": 0.0152, "step": 289370 }, { "epoch": 0.75, "learning_rate": 0.00018748279464255626, "loss": 0.0143, "step": 289380 }, { "epoch": 0.75, "learning_rate": 0.00018747890642618477, "loss": 0.0157, "step": 289390 }, { "epoch": 0.75, "learning_rate": 0.0001874750182098133, "loss": 0.0162, "step": 289400 }, { "epoch": 0.75, "learning_rate": 0.00018747112999344188, "loss": 0.014, "step": 289410 }, { "epoch": 0.75, "learning_rate": 0.0001874672417770704, "loss": 0.0178, "step": 289420 }, { "epoch": 0.75, "learning_rate": 0.00018746335356069894, "loss": 0.0141, "step": 289430 }, { "epoch": 0.75, "learning_rate": 0.00018745946534432745, "loss": 0.0119, "step": 289440 }, { "epoch": 0.75, "learning_rate": 0.00018745557712795602, "loss": 0.0239, "step": 289450 }, { "epoch": 0.75, "learning_rate": 0.00018745168891158454, "loss": 0.0167, "step": 289460 }, { "epoch": 0.75, "learning_rate": 0.00018744780069521308, "loss": 0.0142, "step": 289470 }, { "epoch": 0.75, "learning_rate": 0.0001874439124788416, "loss": 0.0164, "step": 289480 }, { "epoch": 0.75, "learning_rate": 0.00018744002426247016, "loss": 0.0138, "step": 289490 }, { "epoch": 0.75, "learning_rate": 0.00018743613604609867, "loss": 0.0133, "step": 289500 }, { "epoch": 0.75, "learning_rate": 0.00018743224782972722, "loss": 0.0151, "step": 289510 }, { "epoch": 0.75, "learning_rate": 0.00018742835961335573, "loss": 0.0133, "step": 289520 }, { "epoch": 0.75, "learning_rate": 0.0001874244713969843, "loss": 0.0147, "step": 289530 }, { "epoch": 0.75, "learning_rate": 0.00018742058318061281, "loss": 0.0123, "step": 289540 }, { "epoch": 0.75, "learning_rate": 0.00018741669496424136, "loss": 0.0136, "step": 289550 }, { "epoch": 0.75, "learning_rate": 0.00018741280674786987, "loss": 0.0173, "step": 289560 }, { "epoch": 0.75, "learning_rate": 0.0001874089185314984, "loss": 0.0164, "step": 289570 }, { "epoch": 0.75, "learning_rate": 0.00018740503031512698, "loss": 0.0165, "step": 289580 }, { "epoch": 0.75, "learning_rate": 0.0001874011420987555, "loss": 0.018, "step": 289590 }, { "epoch": 0.75, "learning_rate": 0.00018739725388238404, "loss": 0.0134, "step": 289600 }, { "epoch": 0.75, "learning_rate": 0.00018739336566601255, "loss": 0.0138, "step": 289610 }, { "epoch": 0.75, "learning_rate": 0.00018738947744964112, "loss": 0.0143, "step": 289620 }, { "epoch": 0.75, "learning_rate": 0.00018738558923326963, "loss": 0.0149, "step": 289630 }, { "epoch": 0.75, "learning_rate": 0.00018738170101689818, "loss": 0.0204, "step": 289640 }, { "epoch": 0.75, "learning_rate": 0.0001873778128005267, "loss": 0.0134, "step": 289650 }, { "epoch": 0.75, "learning_rate": 0.00018737392458415526, "loss": 0.0136, "step": 289660 }, { "epoch": 0.75, "learning_rate": 0.00018737003636778377, "loss": 0.014, "step": 289670 }, { "epoch": 0.75, "learning_rate": 0.00018736614815141232, "loss": 0.0156, "step": 289680 }, { "epoch": 0.75, "learning_rate": 0.00018736225993504083, "loss": 0.0136, "step": 289690 }, { "epoch": 0.75, "learning_rate": 0.0001873583717186694, "loss": 0.0142, "step": 289700 }, { "epoch": 0.75, "learning_rate": 0.00018735448350229791, "loss": 0.0129, "step": 289710 }, { "epoch": 0.75, "learning_rate": 0.00018735059528592646, "loss": 0.0128, "step": 289720 }, { "epoch": 0.75, "learning_rate": 0.00018734670706955497, "loss": 0.0134, "step": 289730 }, { "epoch": 0.75, "learning_rate": 0.00018734281885318354, "loss": 0.0135, "step": 289740 }, { "epoch": 0.75, "learning_rate": 0.00018733893063681208, "loss": 0.0192, "step": 289750 }, { "epoch": 0.75, "learning_rate": 0.0001873350424204406, "loss": 0.0142, "step": 289760 }, { "epoch": 0.75, "learning_rate": 0.0001873311542040691, "loss": 0.0132, "step": 289770 }, { "epoch": 0.75, "learning_rate": 0.00018732726598769768, "loss": 0.0128, "step": 289780 }, { "epoch": 0.75, "learning_rate": 0.00018732337777132622, "loss": 0.0135, "step": 289790 }, { "epoch": 0.75, "learning_rate": 0.00018731948955495473, "loss": 0.0129, "step": 289800 }, { "epoch": 0.75, "learning_rate": 0.00018731560133858328, "loss": 0.0135, "step": 289810 }, { "epoch": 0.75, "learning_rate": 0.0001873117131222118, "loss": 0.0129, "step": 289820 }, { "epoch": 0.75, "learning_rate": 0.00018730782490584036, "loss": 0.0165, "step": 289830 }, { "epoch": 0.75, "learning_rate": 0.00018730393668946887, "loss": 0.0134, "step": 289840 }, { "epoch": 0.75, "learning_rate": 0.00018730004847309742, "loss": 0.0123, "step": 289850 }, { "epoch": 0.75, "learning_rate": 0.00018729616025672593, "loss": 0.0153, "step": 289860 }, { "epoch": 0.75, "learning_rate": 0.0001872922720403545, "loss": 0.0126, "step": 289870 }, { "epoch": 0.75, "learning_rate": 0.000187288383823983, "loss": 0.0176, "step": 289880 }, { "epoch": 0.75, "learning_rate": 0.00018728449560761155, "loss": 0.0145, "step": 289890 }, { "epoch": 0.75, "learning_rate": 0.00018728060739124007, "loss": 0.0102, "step": 289900 }, { "epoch": 0.75, "learning_rate": 0.00018727671917486864, "loss": 0.0143, "step": 289910 }, { "epoch": 0.75, "learning_rate": 0.00018727283095849718, "loss": 0.0164, "step": 289920 }, { "epoch": 0.75, "learning_rate": 0.0001872689427421257, "loss": 0.0149, "step": 289930 }, { "epoch": 0.75, "learning_rate": 0.0001872650545257542, "loss": 0.0137, "step": 289940 }, { "epoch": 0.75, "learning_rate": 0.00018726116630938278, "loss": 0.0122, "step": 289950 }, { "epoch": 0.75, "learning_rate": 0.00018725727809301132, "loss": 0.0119, "step": 289960 }, { "epoch": 0.75, "learning_rate": 0.00018725338987663983, "loss": 0.0172, "step": 289970 }, { "epoch": 0.75, "learning_rate": 0.00018724950166026838, "loss": 0.0324, "step": 289980 }, { "epoch": 0.75, "learning_rate": 0.00018724561344389692, "loss": 0.0143, "step": 289990 }, { "epoch": 0.75, "learning_rate": 0.00018724172522752546, "loss": 0.0155, "step": 290000 }, { "epoch": 0.75, "eval_cer": 0.8816816917691551, "eval_loss": 0.00951974093914032, "eval_runtime": 107.8612, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.636, "step": 290000 }, { "epoch": 0.75, "learning_rate": 0.00018723783701115397, "loss": 0.0136, "step": 290010 }, { "epoch": 0.75, "learning_rate": 0.00018723394879478251, "loss": 0.0121, "step": 290020 }, { "epoch": 0.75, "learning_rate": 0.00018723006057841106, "loss": 0.0122, "step": 290030 }, { "epoch": 0.75, "learning_rate": 0.0001872261723620396, "loss": 0.0119, "step": 290040 }, { "epoch": 0.75, "learning_rate": 0.0001872222841456681, "loss": 0.0195, "step": 290050 }, { "epoch": 0.75, "learning_rate": 0.00018721839592929665, "loss": 0.0132, "step": 290060 }, { "epoch": 0.75, "learning_rate": 0.00018721450771292517, "loss": 0.0152, "step": 290070 }, { "epoch": 0.75, "learning_rate": 0.00018721061949655374, "loss": 0.0145, "step": 290080 }, { "epoch": 0.75, "learning_rate": 0.00018720673128018225, "loss": 0.0156, "step": 290090 }, { "epoch": 0.75, "learning_rate": 0.0001872028430638108, "loss": 0.0188, "step": 290100 }, { "epoch": 0.75, "learning_rate": 0.0001871989548474393, "loss": 0.0116, "step": 290110 }, { "epoch": 0.75, "learning_rate": 0.00018719506663106788, "loss": 0.0148, "step": 290120 }, { "epoch": 0.75, "learning_rate": 0.00018719117841469642, "loss": 0.011, "step": 290130 }, { "epoch": 0.75, "learning_rate": 0.00018718729019832493, "loss": 0.0148, "step": 290140 }, { "epoch": 0.75, "learning_rate": 0.00018718340198195347, "loss": 0.0148, "step": 290150 }, { "epoch": 0.75, "learning_rate": 0.00018717951376558202, "loss": 0.0141, "step": 290160 }, { "epoch": 0.75, "learning_rate": 0.00018717562554921056, "loss": 0.0142, "step": 290170 }, { "epoch": 0.75, "learning_rate": 0.00018717173733283907, "loss": 0.013, "step": 290180 }, { "epoch": 0.75, "learning_rate": 0.00018716784911646761, "loss": 0.0138, "step": 290190 }, { "epoch": 0.75, "learning_rate": 0.00018716396090009616, "loss": 0.0119, "step": 290200 }, { "epoch": 0.75, "learning_rate": 0.0001871600726837247, "loss": 0.0114, "step": 290210 }, { "epoch": 0.75, "learning_rate": 0.0001871561844673532, "loss": 0.0154, "step": 290220 }, { "epoch": 0.75, "learning_rate": 0.00018715229625098175, "loss": 0.0149, "step": 290230 }, { "epoch": 0.75, "learning_rate": 0.0001871484080346103, "loss": 0.0165, "step": 290240 }, { "epoch": 0.75, "learning_rate": 0.00018714451981823884, "loss": 0.0132, "step": 290250 }, { "epoch": 0.75, "learning_rate": 0.00018714063160186735, "loss": 0.0134, "step": 290260 }, { "epoch": 0.75, "learning_rate": 0.0001871367433854959, "loss": 0.0155, "step": 290270 }, { "epoch": 0.75, "learning_rate": 0.00018713285516912446, "loss": 0.0136, "step": 290280 }, { "epoch": 0.75, "learning_rate": 0.00018712896695275298, "loss": 0.0121, "step": 290290 }, { "epoch": 0.75, "learning_rate": 0.00018712507873638152, "loss": 0.0195, "step": 290300 }, { "epoch": 0.75, "learning_rate": 0.00018712119052001003, "loss": 0.0144, "step": 290310 }, { "epoch": 0.75, "learning_rate": 0.00018711730230363857, "loss": 0.0141, "step": 290320 }, { "epoch": 0.75, "learning_rate": 0.00018711341408726712, "loss": 0.0206, "step": 290330 }, { "epoch": 0.75, "learning_rate": 0.00018710952587089566, "loss": 0.0126, "step": 290340 }, { "epoch": 0.75, "learning_rate": 0.00018710563765452417, "loss": 0.0146, "step": 290350 }, { "epoch": 0.75, "learning_rate": 0.00018710174943815271, "loss": 0.011, "step": 290360 }, { "epoch": 0.75, "learning_rate": 0.00018709786122178126, "loss": 0.0106, "step": 290370 }, { "epoch": 0.75, "learning_rate": 0.0001870939730054098, "loss": 0.0139, "step": 290380 }, { "epoch": 0.75, "learning_rate": 0.0001870900847890383, "loss": 0.0119, "step": 290390 }, { "epoch": 0.75, "learning_rate": 0.00018708619657266685, "loss": 0.0134, "step": 290400 }, { "epoch": 0.75, "learning_rate": 0.0001870823083562954, "loss": 0.017, "step": 290410 }, { "epoch": 0.75, "learning_rate": 0.00018707842013992394, "loss": 0.0133, "step": 290420 }, { "epoch": 0.75, "learning_rate": 0.00018707453192355245, "loss": 0.0127, "step": 290430 }, { "epoch": 0.75, "learning_rate": 0.000187070643707181, "loss": 0.0147, "step": 290440 }, { "epoch": 0.75, "learning_rate": 0.00018706675549080956, "loss": 0.0132, "step": 290450 }, { "epoch": 0.75, "learning_rate": 0.00018706286727443808, "loss": 0.0168, "step": 290460 }, { "epoch": 0.75, "learning_rate": 0.00018705897905806662, "loss": 0.0193, "step": 290470 }, { "epoch": 0.75, "learning_rate": 0.00018705509084169513, "loss": 0.015, "step": 290480 }, { "epoch": 0.75, "learning_rate": 0.0001870512026253237, "loss": 0.0131, "step": 290490 }, { "epoch": 0.75, "learning_rate": 0.00018704731440895222, "loss": 0.0155, "step": 290500 }, { "epoch": 0.75, "learning_rate": 0.00018704342619258076, "loss": 0.0165, "step": 290510 }, { "epoch": 0.75, "learning_rate": 0.00018703953797620927, "loss": 0.0153, "step": 290520 }, { "epoch": 0.75, "learning_rate": 0.00018703564975983784, "loss": 0.015, "step": 290530 }, { "epoch": 0.75, "learning_rate": 0.00018703176154346635, "loss": 0.0125, "step": 290540 }, { "epoch": 0.75, "learning_rate": 0.0001870278733270949, "loss": 0.0165, "step": 290550 }, { "epoch": 0.75, "learning_rate": 0.0001870239851107234, "loss": 0.0153, "step": 290560 }, { "epoch": 0.75, "learning_rate": 0.00018702009689435195, "loss": 0.013, "step": 290570 }, { "epoch": 0.75, "learning_rate": 0.0001870162086779805, "loss": 0.0134, "step": 290580 }, { "epoch": 0.75, "learning_rate": 0.00018701232046160904, "loss": 0.0158, "step": 290590 }, { "epoch": 0.75, "learning_rate": 0.00018700843224523755, "loss": 0.0147, "step": 290600 }, { "epoch": 0.75, "learning_rate": 0.0001870045440288661, "loss": 0.0139, "step": 290610 }, { "epoch": 0.75, "learning_rate": 0.00018700065581249466, "loss": 0.017, "step": 290620 }, { "epoch": 0.75, "learning_rate": 0.00018699676759612318, "loss": 0.0147, "step": 290630 }, { "epoch": 0.75, "learning_rate": 0.0001869928793797517, "loss": 0.013, "step": 290640 }, { "epoch": 0.75, "learning_rate": 0.00018698899116338023, "loss": 0.0137, "step": 290650 }, { "epoch": 0.75, "learning_rate": 0.0001869851029470088, "loss": 0.0153, "step": 290660 }, { "epoch": 0.75, "learning_rate": 0.00018698121473063731, "loss": 0.019, "step": 290670 }, { "epoch": 0.75, "learning_rate": 0.00018697732651426586, "loss": 0.0174, "step": 290680 }, { "epoch": 0.75, "learning_rate": 0.00018697343829789437, "loss": 0.0126, "step": 290690 }, { "epoch": 0.75, "learning_rate": 0.00018696955008152294, "loss": 0.0136, "step": 290700 }, { "epoch": 0.75, "learning_rate": 0.00018696566186515145, "loss": 0.0115, "step": 290710 }, { "epoch": 0.75, "learning_rate": 0.00018696177364878, "loss": 0.0153, "step": 290720 }, { "epoch": 0.75, "learning_rate": 0.0001869578854324085, "loss": 0.0143, "step": 290730 }, { "epoch": 0.75, "learning_rate": 0.00018695399721603708, "loss": 0.0153, "step": 290740 }, { "epoch": 0.75, "learning_rate": 0.0001869501089996656, "loss": 0.0163, "step": 290750 }, { "epoch": 0.75, "learning_rate": 0.00018694622078329414, "loss": 0.0136, "step": 290760 }, { "epoch": 0.75, "learning_rate": 0.00018694233256692265, "loss": 0.0151, "step": 290770 }, { "epoch": 0.75, "learning_rate": 0.00018693844435055122, "loss": 0.0164, "step": 290780 }, { "epoch": 0.75, "learning_rate": 0.00018693455613417976, "loss": 0.0177, "step": 290790 }, { "epoch": 0.75, "learning_rate": 0.00018693066791780827, "loss": 0.0139, "step": 290800 }, { "epoch": 0.75, "learning_rate": 0.0001869267797014368, "loss": 0.0143, "step": 290810 }, { "epoch": 0.75, "learning_rate": 0.00018692289148506533, "loss": 0.0144, "step": 290820 }, { "epoch": 0.75, "learning_rate": 0.0001869190032686939, "loss": 0.016, "step": 290830 }, { "epoch": 0.75, "learning_rate": 0.00018691511505232241, "loss": 0.017, "step": 290840 }, { "epoch": 0.75, "learning_rate": 0.00018691122683595096, "loss": 0.0155, "step": 290850 }, { "epoch": 0.75, "learning_rate": 0.00018690733861957947, "loss": 0.0144, "step": 290860 }, { "epoch": 0.75, "learning_rate": 0.00018690345040320804, "loss": 0.0126, "step": 290870 }, { "epoch": 0.75, "learning_rate": 0.00018689956218683655, "loss": 0.0146, "step": 290880 }, { "epoch": 0.75, "learning_rate": 0.0001868956739704651, "loss": 0.0168, "step": 290890 }, { "epoch": 0.75, "learning_rate": 0.0001868917857540936, "loss": 0.0139, "step": 290900 }, { "epoch": 0.75, "learning_rate": 0.00018688789753772218, "loss": 0.0133, "step": 290910 }, { "epoch": 0.75, "learning_rate": 0.0001868840093213507, "loss": 0.0132, "step": 290920 }, { "epoch": 0.75, "learning_rate": 0.00018688012110497923, "loss": 0.0131, "step": 290930 }, { "epoch": 0.75, "learning_rate": 0.00018687623288860775, "loss": 0.0152, "step": 290940 }, { "epoch": 0.75, "learning_rate": 0.00018687234467223632, "loss": 0.0144, "step": 290950 }, { "epoch": 0.75, "learning_rate": 0.00018686845645586483, "loss": 0.0147, "step": 290960 }, { "epoch": 0.75, "learning_rate": 0.00018686456823949337, "loss": 0.0146, "step": 290970 }, { "epoch": 0.75, "learning_rate": 0.0001868606800231219, "loss": 0.0117, "step": 290980 }, { "epoch": 0.75, "learning_rate": 0.00018685679180675046, "loss": 0.0159, "step": 290990 }, { "epoch": 0.75, "learning_rate": 0.000186852903590379, "loss": 0.0129, "step": 291000 }, { "epoch": 0.75, "eval_cer": 0.8817096845078387, "eval_loss": 0.009270302951335907, "eval_runtime": 107.7514, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 291000 }, { "epoch": 0.75, "learning_rate": 0.00018684901537400751, "loss": 0.0247, "step": 291010 }, { "epoch": 0.75, "learning_rate": 0.00018684512715763606, "loss": 0.0235, "step": 291020 }, { "epoch": 0.75, "learning_rate": 0.00018684123894126457, "loss": 0.0144, "step": 291030 }, { "epoch": 0.75, "learning_rate": 0.00018683735072489314, "loss": 0.0151, "step": 291040 }, { "epoch": 0.75, "learning_rate": 0.00018683346250852165, "loss": 0.0149, "step": 291050 }, { "epoch": 0.75, "learning_rate": 0.0001868295742921502, "loss": 0.0155, "step": 291060 }, { "epoch": 0.75, "learning_rate": 0.0001868256860757787, "loss": 0.0135, "step": 291070 }, { "epoch": 0.75, "learning_rate": 0.00018682179785940728, "loss": 0.0153, "step": 291080 }, { "epoch": 0.75, "learning_rate": 0.0001868179096430358, "loss": 0.0165, "step": 291090 }, { "epoch": 0.75, "learning_rate": 0.00018681402142666433, "loss": 0.0131, "step": 291100 }, { "epoch": 0.75, "learning_rate": 0.00018681013321029285, "loss": 0.0151, "step": 291110 }, { "epoch": 0.75, "learning_rate": 0.00018680624499392142, "loss": 0.0183, "step": 291120 }, { "epoch": 0.75, "learning_rate": 0.00018680235677754993, "loss": 0.0157, "step": 291130 }, { "epoch": 0.75, "learning_rate": 0.00018679846856117847, "loss": 0.0175, "step": 291140 }, { "epoch": 0.75, "learning_rate": 0.000186794580344807, "loss": 0.0135, "step": 291150 }, { "epoch": 0.75, "learning_rate": 0.00018679069212843556, "loss": 0.0188, "step": 291160 }, { "epoch": 0.75, "learning_rate": 0.0001867868039120641, "loss": 0.0169, "step": 291170 }, { "epoch": 0.75, "learning_rate": 0.0001867829156956926, "loss": 0.0126, "step": 291180 }, { "epoch": 0.75, "learning_rate": 0.00018677902747932115, "loss": 0.0164, "step": 291190 }, { "epoch": 0.75, "learning_rate": 0.0001867751392629497, "loss": 0.0158, "step": 291200 }, { "epoch": 0.75, "learning_rate": 0.00018677125104657824, "loss": 0.0136, "step": 291210 }, { "epoch": 0.75, "learning_rate": 0.00018676736283020675, "loss": 0.0143, "step": 291220 }, { "epoch": 0.75, "learning_rate": 0.0001867634746138353, "loss": 0.0158, "step": 291230 }, { "epoch": 0.75, "learning_rate": 0.00018675958639746384, "loss": 0.0166, "step": 291240 }, { "epoch": 0.75, "learning_rate": 0.00018675569818109238, "loss": 0.0133, "step": 291250 }, { "epoch": 0.75, "learning_rate": 0.0001867518099647209, "loss": 0.0171, "step": 291260 }, { "epoch": 0.76, "learning_rate": 0.00018674792174834943, "loss": 0.0125, "step": 291270 }, { "epoch": 0.76, "learning_rate": 0.00018674403353197795, "loss": 0.0133, "step": 291280 }, { "epoch": 0.76, "learning_rate": 0.00018674014531560652, "loss": 0.0159, "step": 291290 }, { "epoch": 0.76, "learning_rate": 0.00018673625709923503, "loss": 0.0133, "step": 291300 }, { "epoch": 0.76, "learning_rate": 0.00018673236888286357, "loss": 0.0147, "step": 291310 }, { "epoch": 0.76, "learning_rate": 0.0001867284806664921, "loss": 0.0135, "step": 291320 }, { "epoch": 0.76, "learning_rate": 0.00018672459245012066, "loss": 0.0139, "step": 291330 }, { "epoch": 0.76, "learning_rate": 0.0001867207042337492, "loss": 0.0146, "step": 291340 }, { "epoch": 0.76, "learning_rate": 0.0001867168160173777, "loss": 0.0179, "step": 291350 }, { "epoch": 0.76, "learning_rate": 0.00018671292780100623, "loss": 0.0201, "step": 291360 }, { "epoch": 0.76, "learning_rate": 0.0001867090395846348, "loss": 0.0114, "step": 291370 }, { "epoch": 0.76, "learning_rate": 0.00018670515136826334, "loss": 0.0147, "step": 291380 }, { "epoch": 0.76, "learning_rate": 0.00018670126315189185, "loss": 0.0147, "step": 291390 }, { "epoch": 0.76, "learning_rate": 0.0001866973749355204, "loss": 0.0158, "step": 291400 }, { "epoch": 0.76, "learning_rate": 0.00018669348671914894, "loss": 0.0144, "step": 291410 }, { "epoch": 0.76, "learning_rate": 0.00018668959850277748, "loss": 0.0122, "step": 291420 }, { "epoch": 0.76, "learning_rate": 0.000186685710286406, "loss": 0.0127, "step": 291430 }, { "epoch": 0.76, "learning_rate": 0.00018668182207003453, "loss": 0.0145, "step": 291440 }, { "epoch": 0.76, "learning_rate": 0.00018667793385366307, "loss": 0.0139, "step": 291450 }, { "epoch": 0.76, "learning_rate": 0.00018667404563729162, "loss": 0.0188, "step": 291460 }, { "epoch": 0.76, "learning_rate": 0.00018667015742092013, "loss": 0.0147, "step": 291470 }, { "epoch": 0.76, "learning_rate": 0.00018666626920454867, "loss": 0.0145, "step": 291480 }, { "epoch": 0.76, "learning_rate": 0.00018666238098817724, "loss": 0.0118, "step": 291490 }, { "epoch": 0.76, "learning_rate": 0.00018665849277180576, "loss": 0.0159, "step": 291500 }, { "epoch": 0.76, "learning_rate": 0.0001866546045554343, "loss": 0.0131, "step": 291510 }, { "epoch": 0.76, "learning_rate": 0.0001866507163390628, "loss": 0.0183, "step": 291520 }, { "epoch": 0.76, "learning_rate": 0.00018664682812269133, "loss": 0.018, "step": 291530 }, { "epoch": 0.76, "learning_rate": 0.0001866429399063199, "loss": 0.0169, "step": 291540 }, { "epoch": 0.76, "learning_rate": 0.00018663905168994844, "loss": 0.0156, "step": 291550 }, { "epoch": 0.76, "learning_rate": 0.00018663516347357695, "loss": 0.0169, "step": 291560 }, { "epoch": 0.76, "learning_rate": 0.0001866312752572055, "loss": 0.0151, "step": 291570 }, { "epoch": 0.76, "learning_rate": 0.00018662738704083403, "loss": 0.0138, "step": 291580 }, { "epoch": 0.76, "learning_rate": 0.00018662349882446258, "loss": 0.0153, "step": 291590 }, { "epoch": 0.76, "learning_rate": 0.0001866196106080911, "loss": 0.0149, "step": 291600 }, { "epoch": 0.76, "learning_rate": 0.00018661572239171963, "loss": 0.0124, "step": 291610 }, { "epoch": 0.76, "learning_rate": 0.00018661183417534817, "loss": 0.0129, "step": 291620 }, { "epoch": 0.76, "learning_rate": 0.00018660794595897672, "loss": 0.0124, "step": 291630 }, { "epoch": 0.76, "learning_rate": 0.00018660405774260523, "loss": 0.0139, "step": 291640 }, { "epoch": 0.76, "learning_rate": 0.00018660016952623377, "loss": 0.0192, "step": 291650 }, { "epoch": 0.76, "learning_rate": 0.00018659628130986234, "loss": 0.0154, "step": 291660 }, { "epoch": 0.76, "learning_rate": 0.00018659239309349086, "loss": 0.015, "step": 291670 }, { "epoch": 0.76, "learning_rate": 0.00018658850487711937, "loss": 0.0143, "step": 291680 }, { "epoch": 0.76, "learning_rate": 0.0001865846166607479, "loss": 0.0195, "step": 291690 }, { "epoch": 0.76, "learning_rate": 0.00018658072844437648, "loss": 0.0112, "step": 291700 }, { "epoch": 0.76, "learning_rate": 0.000186576840228005, "loss": 0.0134, "step": 291710 }, { "epoch": 0.76, "learning_rate": 0.00018657295201163354, "loss": 0.0144, "step": 291720 }, { "epoch": 0.76, "learning_rate": 0.00018656906379526205, "loss": 0.0133, "step": 291730 }, { "epoch": 0.76, "learning_rate": 0.00018656517557889062, "loss": 0.0144, "step": 291740 }, { "epoch": 0.76, "learning_rate": 0.00018656128736251913, "loss": 0.0125, "step": 291750 }, { "epoch": 0.76, "learning_rate": 0.00018655739914614768, "loss": 0.0125, "step": 291760 }, { "epoch": 0.76, "learning_rate": 0.0001865535109297762, "loss": 0.0151, "step": 291770 }, { "epoch": 0.76, "learning_rate": 0.00018654962271340473, "loss": 0.0123, "step": 291780 }, { "epoch": 0.76, "learning_rate": 0.00018654573449703327, "loss": 0.0124, "step": 291790 }, { "epoch": 0.76, "learning_rate": 0.00018654184628066182, "loss": 0.0175, "step": 291800 }, { "epoch": 0.76, "learning_rate": 0.00018653795806429033, "loss": 0.0146, "step": 291810 }, { "epoch": 0.76, "learning_rate": 0.00018653406984791887, "loss": 0.049, "step": 291820 }, { "epoch": 0.76, "learning_rate": 0.0001865301816315474, "loss": 0.0281, "step": 291830 }, { "epoch": 0.76, "learning_rate": 0.00018652629341517595, "loss": 0.0168, "step": 291840 }, { "epoch": 0.76, "learning_rate": 0.00018652240519880447, "loss": 0.014, "step": 291850 }, { "epoch": 0.76, "learning_rate": 0.000186518516982433, "loss": 0.016, "step": 291860 }, { "epoch": 0.76, "learning_rate": 0.00018651462876606158, "loss": 0.0118, "step": 291870 }, { "epoch": 0.76, "learning_rate": 0.0001865107405496901, "loss": 0.0105, "step": 291880 }, { "epoch": 0.76, "learning_rate": 0.00018650685233331864, "loss": 0.0158, "step": 291890 }, { "epoch": 0.76, "learning_rate": 0.00018650296411694715, "loss": 0.0147, "step": 291900 }, { "epoch": 0.76, "learning_rate": 0.00018649907590057572, "loss": 0.0125, "step": 291910 }, { "epoch": 0.76, "learning_rate": 0.00018649518768420423, "loss": 0.0169, "step": 291920 }, { "epoch": 0.76, "learning_rate": 0.00018649129946783278, "loss": 0.0154, "step": 291930 }, { "epoch": 0.76, "learning_rate": 0.0001864874112514613, "loss": 0.0126, "step": 291940 }, { "epoch": 0.76, "learning_rate": 0.00018648352303508986, "loss": 0.0136, "step": 291950 }, { "epoch": 0.76, "learning_rate": 0.00018647963481871837, "loss": 0.0139, "step": 291960 }, { "epoch": 0.76, "learning_rate": 0.00018647574660234691, "loss": 0.0132, "step": 291970 }, { "epoch": 0.76, "learning_rate": 0.00018647185838597543, "loss": 0.0157, "step": 291980 }, { "epoch": 0.76, "learning_rate": 0.000186467970169604, "loss": 0.0148, "step": 291990 }, { "epoch": 0.76, "learning_rate": 0.0001864640819532325, "loss": 0.0138, "step": 292000 }, { "epoch": 0.76, "eval_cer": 0.8817208816033121, "eval_loss": 0.009960480034351349, "eval_runtime": 107.9451, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 292000 }, { "epoch": 0.76, "learning_rate": 0.00018646019373686105, "loss": 0.0124, "step": 292010 }, { "epoch": 0.76, "learning_rate": 0.00018645630552048957, "loss": 0.0127, "step": 292020 }, { "epoch": 0.76, "learning_rate": 0.0001864524173041181, "loss": 0.0188, "step": 292030 }, { "epoch": 0.76, "learning_rate": 0.00018644852908774668, "loss": 0.0161, "step": 292040 }, { "epoch": 0.76, "learning_rate": 0.0001864446408713752, "loss": 0.0164, "step": 292050 }, { "epoch": 0.76, "learning_rate": 0.00018644075265500374, "loss": 0.0177, "step": 292060 }, { "epoch": 0.76, "learning_rate": 0.00018643686443863225, "loss": 0.0172, "step": 292070 }, { "epoch": 0.76, "learning_rate": 0.00018643297622226082, "loss": 0.0166, "step": 292080 }, { "epoch": 0.76, "learning_rate": 0.00018642908800588933, "loss": 0.0154, "step": 292090 }, { "epoch": 0.76, "learning_rate": 0.00018642519978951787, "loss": 0.0128, "step": 292100 }, { "epoch": 0.76, "learning_rate": 0.0001864213115731464, "loss": 0.0172, "step": 292110 }, { "epoch": 0.76, "learning_rate": 0.00018641742335677496, "loss": 0.0125, "step": 292120 }, { "epoch": 0.76, "learning_rate": 0.00018641353514040347, "loss": 0.0159, "step": 292130 }, { "epoch": 0.76, "learning_rate": 0.00018640964692403201, "loss": 0.0145, "step": 292140 }, { "epoch": 0.76, "learning_rate": 0.00018640575870766053, "loss": 0.0143, "step": 292150 }, { "epoch": 0.76, "learning_rate": 0.0001864018704912891, "loss": 0.0114, "step": 292160 }, { "epoch": 0.76, "learning_rate": 0.0001863979822749176, "loss": 0.0139, "step": 292170 }, { "epoch": 0.76, "learning_rate": 0.00018639409405854615, "loss": 0.0128, "step": 292180 }, { "epoch": 0.76, "learning_rate": 0.00018639020584217467, "loss": 0.0121, "step": 292190 }, { "epoch": 0.76, "learning_rate": 0.00018638631762580324, "loss": 0.0137, "step": 292200 }, { "epoch": 0.76, "learning_rate": 0.00018638242940943178, "loss": 0.0181, "step": 292210 }, { "epoch": 0.76, "learning_rate": 0.0001863785411930603, "loss": 0.0152, "step": 292220 }, { "epoch": 0.76, "learning_rate": 0.0001863746529766888, "loss": 0.0157, "step": 292230 }, { "epoch": 0.76, "learning_rate": 0.00018637076476031738, "loss": 0.0147, "step": 292240 }, { "epoch": 0.76, "learning_rate": 0.00018636687654394592, "loss": 0.0174, "step": 292250 }, { "epoch": 0.76, "learning_rate": 0.00018636298832757443, "loss": 0.0156, "step": 292260 }, { "epoch": 0.76, "learning_rate": 0.00018635910011120297, "loss": 0.017, "step": 292270 }, { "epoch": 0.76, "learning_rate": 0.0001863552118948315, "loss": 0.0183, "step": 292280 }, { "epoch": 0.76, "learning_rate": 0.00018635132367846006, "loss": 0.0107, "step": 292290 }, { "epoch": 0.76, "learning_rate": 0.00018634743546208857, "loss": 0.0141, "step": 292300 }, { "epoch": 0.76, "learning_rate": 0.0001863435472457171, "loss": 0.0132, "step": 292310 }, { "epoch": 0.76, "learning_rate": 0.00018633965902934563, "loss": 0.0145, "step": 292320 }, { "epoch": 0.76, "learning_rate": 0.0001863357708129742, "loss": 0.0147, "step": 292330 }, { "epoch": 0.76, "learning_rate": 0.0001863318825966027, "loss": 0.012, "step": 292340 }, { "epoch": 0.76, "learning_rate": 0.00018632799438023125, "loss": 0.0154, "step": 292350 }, { "epoch": 0.76, "learning_rate": 0.00018632410616385977, "loss": 0.0133, "step": 292360 }, { "epoch": 0.76, "learning_rate": 0.00018632021794748834, "loss": 0.0145, "step": 292370 }, { "epoch": 0.76, "learning_rate": 0.00018631632973111688, "loss": 0.0145, "step": 292380 }, { "epoch": 0.76, "learning_rate": 0.0001863124415147454, "loss": 0.0131, "step": 292390 }, { "epoch": 0.76, "learning_rate": 0.0001863085532983739, "loss": 0.0178, "step": 292400 }, { "epoch": 0.76, "learning_rate": 0.00018630466508200248, "loss": 0.0129, "step": 292410 }, { "epoch": 0.76, "learning_rate": 0.00018630077686563102, "loss": 0.0147, "step": 292420 }, { "epoch": 0.76, "learning_rate": 0.00018629688864925953, "loss": 0.0135, "step": 292430 }, { "epoch": 0.76, "learning_rate": 0.00018629300043288807, "loss": 0.0155, "step": 292440 }, { "epoch": 0.76, "learning_rate": 0.00018628911221651661, "loss": 0.0128, "step": 292450 }, { "epoch": 0.76, "learning_rate": 0.00018628522400014516, "loss": 0.0144, "step": 292460 }, { "epoch": 0.76, "learning_rate": 0.00018628133578377367, "loss": 0.0149, "step": 292470 }, { "epoch": 0.76, "learning_rate": 0.0001862774475674022, "loss": 0.0118, "step": 292480 }, { "epoch": 0.76, "learning_rate": 0.00018627355935103075, "loss": 0.0121, "step": 292490 }, { "epoch": 0.76, "learning_rate": 0.0001862696711346593, "loss": 0.0175, "step": 292500 }, { "epoch": 0.76, "learning_rate": 0.0001862657829182878, "loss": 0.0146, "step": 292510 }, { "epoch": 0.76, "learning_rate": 0.00018626189470191635, "loss": 0.0119, "step": 292520 }, { "epoch": 0.76, "learning_rate": 0.00018625800648554487, "loss": 0.0136, "step": 292530 }, { "epoch": 0.76, "learning_rate": 0.00018625411826917344, "loss": 0.0114, "step": 292540 }, { "epoch": 0.76, "learning_rate": 0.00018625023005280195, "loss": 0.0149, "step": 292550 }, { "epoch": 0.76, "learning_rate": 0.0001862463418364305, "loss": 0.0133, "step": 292560 }, { "epoch": 0.76, "learning_rate": 0.000186242453620059, "loss": 0.0149, "step": 292570 }, { "epoch": 0.76, "learning_rate": 0.00018623856540368757, "loss": 0.0167, "step": 292580 }, { "epoch": 0.76, "learning_rate": 0.00018623467718731612, "loss": 0.0124, "step": 292590 }, { "epoch": 0.76, "learning_rate": 0.00018623078897094463, "loss": 0.0178, "step": 292600 }, { "epoch": 0.76, "learning_rate": 0.00018622690075457317, "loss": 0.0144, "step": 292610 }, { "epoch": 0.76, "learning_rate": 0.00018622301253820171, "loss": 0.015, "step": 292620 }, { "epoch": 0.76, "learning_rate": 0.00018621912432183026, "loss": 0.0162, "step": 292630 }, { "epoch": 0.76, "learning_rate": 0.00018621523610545877, "loss": 0.0146, "step": 292640 }, { "epoch": 0.76, "learning_rate": 0.0001862113478890873, "loss": 0.0202, "step": 292650 }, { "epoch": 0.76, "learning_rate": 0.00018620745967271585, "loss": 0.0155, "step": 292660 }, { "epoch": 0.76, "learning_rate": 0.0001862035714563444, "loss": 0.0138, "step": 292670 }, { "epoch": 0.76, "learning_rate": 0.0001861996832399729, "loss": 0.015, "step": 292680 }, { "epoch": 0.76, "learning_rate": 0.00018619579502360145, "loss": 0.0131, "step": 292690 }, { "epoch": 0.76, "learning_rate": 0.00018619190680723002, "loss": 0.0149, "step": 292700 }, { "epoch": 0.76, "learning_rate": 0.00018618801859085853, "loss": 0.0152, "step": 292710 }, { "epoch": 0.76, "learning_rate": 0.00018618413037448705, "loss": 0.0147, "step": 292720 }, { "epoch": 0.76, "learning_rate": 0.0001861802421581156, "loss": 0.0159, "step": 292730 }, { "epoch": 0.76, "learning_rate": 0.00018617635394174416, "loss": 0.0204, "step": 292740 }, { "epoch": 0.76, "learning_rate": 0.00018617246572537267, "loss": 0.0126, "step": 292750 }, { "epoch": 0.76, "learning_rate": 0.00018616857750900122, "loss": 0.0131, "step": 292760 }, { "epoch": 0.76, "learning_rate": 0.00018616468929262973, "loss": 0.0175, "step": 292770 }, { "epoch": 0.76, "learning_rate": 0.00018616080107625827, "loss": 0.0167, "step": 292780 }, { "epoch": 0.76, "learning_rate": 0.00018615691285988681, "loss": 0.0139, "step": 292790 }, { "epoch": 0.76, "learning_rate": 0.00018615302464351536, "loss": 0.0222, "step": 292800 }, { "epoch": 0.76, "learning_rate": 0.00018614913642714387, "loss": 0.0144, "step": 292810 }, { "epoch": 0.76, "learning_rate": 0.0001861452482107724, "loss": 0.0117, "step": 292820 }, { "epoch": 0.76, "learning_rate": 0.00018614135999440095, "loss": 0.0187, "step": 292830 }, { "epoch": 0.76, "learning_rate": 0.0001861374717780295, "loss": 0.0172, "step": 292840 }, { "epoch": 0.76, "learning_rate": 0.000186133583561658, "loss": 0.0192, "step": 292850 }, { "epoch": 0.76, "learning_rate": 0.00018612969534528655, "loss": 0.0145, "step": 292860 }, { "epoch": 0.76, "learning_rate": 0.0001861258071289151, "loss": 0.0114, "step": 292870 }, { "epoch": 0.76, "learning_rate": 0.00018612191891254363, "loss": 0.0147, "step": 292880 }, { "epoch": 0.76, "learning_rate": 0.00018611803069617215, "loss": 0.0149, "step": 292890 }, { "epoch": 0.76, "learning_rate": 0.0001861141424798007, "loss": 0.0127, "step": 292900 }, { "epoch": 0.76, "learning_rate": 0.00018611025426342926, "loss": 0.0219, "step": 292910 }, { "epoch": 0.76, "learning_rate": 0.00018610636604705777, "loss": 0.017, "step": 292920 }, { "epoch": 0.76, "learning_rate": 0.00018610247783068632, "loss": 0.0222, "step": 292930 }, { "epoch": 0.76, "learning_rate": 0.00018609858961431483, "loss": 0.0167, "step": 292940 }, { "epoch": 0.76, "learning_rate": 0.0001860947013979434, "loss": 0.0134, "step": 292950 }, { "epoch": 0.76, "learning_rate": 0.0001860908131815719, "loss": 0.012, "step": 292960 }, { "epoch": 0.76, "learning_rate": 0.00018608692496520045, "loss": 0.0142, "step": 292970 }, { "epoch": 0.76, "learning_rate": 0.00018608303674882897, "loss": 0.0138, "step": 292980 }, { "epoch": 0.76, "learning_rate": 0.00018607914853245754, "loss": 0.013, "step": 292990 }, { "epoch": 0.76, "learning_rate": 0.00018607526031608605, "loss": 0.0135, "step": 293000 }, { "epoch": 0.76, "eval_cer": 0.8817320786987856, "eval_loss": 0.009882713668048382, "eval_runtime": 108.0807, "eval_samples_per_second": 18.505, "eval_steps_per_second": 4.626, "step": 293000 }, { "epoch": 0.76, "learning_rate": 0.0001860713720997146, "loss": 0.0113, "step": 293010 }, { "epoch": 0.76, "learning_rate": 0.0001860674838833431, "loss": 0.0217, "step": 293020 }, { "epoch": 0.76, "learning_rate": 0.00018606359566697165, "loss": 0.0152, "step": 293030 }, { "epoch": 0.76, "learning_rate": 0.0001860597074506002, "loss": 0.0135, "step": 293040 }, { "epoch": 0.76, "learning_rate": 0.00018605581923422873, "loss": 0.0136, "step": 293050 }, { "epoch": 0.76, "learning_rate": 0.00018605193101785725, "loss": 0.0158, "step": 293060 }, { "epoch": 0.76, "learning_rate": 0.0001860480428014858, "loss": 0.0142, "step": 293070 }, { "epoch": 0.76, "learning_rate": 0.00018604415458511436, "loss": 0.0123, "step": 293080 }, { "epoch": 0.76, "learning_rate": 0.00018604026636874287, "loss": 0.0141, "step": 293090 }, { "epoch": 0.76, "learning_rate": 0.00018603637815237141, "loss": 0.0153, "step": 293100 }, { "epoch": 0.76, "learning_rate": 0.00018603248993599993, "loss": 0.0136, "step": 293110 }, { "epoch": 0.76, "learning_rate": 0.0001860286017196285, "loss": 0.018, "step": 293120 }, { "epoch": 0.76, "learning_rate": 0.000186024713503257, "loss": 0.0142, "step": 293130 }, { "epoch": 0.76, "learning_rate": 0.00018602082528688555, "loss": 0.0191, "step": 293140 }, { "epoch": 0.76, "learning_rate": 0.00018601693707051407, "loss": 0.0117, "step": 293150 }, { "epoch": 0.76, "learning_rate": 0.00018601304885414264, "loss": 0.0151, "step": 293160 }, { "epoch": 0.76, "learning_rate": 0.00018600916063777115, "loss": 0.0145, "step": 293170 }, { "epoch": 0.76, "learning_rate": 0.0001860052724213997, "loss": 0.0147, "step": 293180 }, { "epoch": 0.76, "learning_rate": 0.0001860013842050282, "loss": 0.014, "step": 293190 }, { "epoch": 0.76, "learning_rate": 0.00018599749598865678, "loss": 0.0148, "step": 293200 }, { "epoch": 0.76, "learning_rate": 0.0001859936077722853, "loss": 0.0128, "step": 293210 }, { "epoch": 0.76, "learning_rate": 0.00018598971955591383, "loss": 0.0148, "step": 293220 }, { "epoch": 0.76, "learning_rate": 0.00018598583133954235, "loss": 0.0158, "step": 293230 }, { "epoch": 0.76, "learning_rate": 0.00018598194312317092, "loss": 0.0143, "step": 293240 }, { "epoch": 0.76, "learning_rate": 0.00018597805490679946, "loss": 0.0147, "step": 293250 }, { "epoch": 0.76, "learning_rate": 0.00018597416669042797, "loss": 0.0137, "step": 293260 }, { "epoch": 0.76, "learning_rate": 0.0001859702784740565, "loss": 0.0127, "step": 293270 }, { "epoch": 0.76, "learning_rate": 0.00018596639025768503, "loss": 0.0163, "step": 293280 }, { "epoch": 0.76, "learning_rate": 0.0001859625020413136, "loss": 0.016, "step": 293290 }, { "epoch": 0.76, "learning_rate": 0.0001859586138249421, "loss": 0.0145, "step": 293300 }, { "epoch": 0.76, "learning_rate": 0.00018595472560857065, "loss": 0.0115, "step": 293310 }, { "epoch": 0.76, "learning_rate": 0.00018595083739219917, "loss": 0.0158, "step": 293320 }, { "epoch": 0.76, "learning_rate": 0.00018594694917582774, "loss": 0.0119, "step": 293330 }, { "epoch": 0.76, "learning_rate": 0.00018594306095945625, "loss": 0.0139, "step": 293340 }, { "epoch": 0.76, "learning_rate": 0.0001859391727430848, "loss": 0.0186, "step": 293350 }, { "epoch": 0.76, "learning_rate": 0.0001859352845267133, "loss": 0.0182, "step": 293360 }, { "epoch": 0.76, "learning_rate": 0.00018593139631034188, "loss": 0.0164, "step": 293370 }, { "epoch": 0.76, "learning_rate": 0.0001859275080939704, "loss": 0.0156, "step": 293380 }, { "epoch": 0.76, "learning_rate": 0.00018592361987759893, "loss": 0.0136, "step": 293390 }, { "epoch": 0.76, "learning_rate": 0.00018591973166122745, "loss": 0.0126, "step": 293400 }, { "epoch": 0.76, "learning_rate": 0.00018591584344485602, "loss": 0.0127, "step": 293410 }, { "epoch": 0.76, "learning_rate": 0.00018591195522848453, "loss": 0.0174, "step": 293420 }, { "epoch": 0.76, "learning_rate": 0.00018590806701211307, "loss": 0.0131, "step": 293430 }, { "epoch": 0.76, "learning_rate": 0.0001859041787957416, "loss": 0.0128, "step": 293440 }, { "epoch": 0.76, "learning_rate": 0.00018590029057937016, "loss": 0.0146, "step": 293450 }, { "epoch": 0.76, "learning_rate": 0.0001858964023629987, "loss": 0.0144, "step": 293460 }, { "epoch": 0.76, "learning_rate": 0.0001858925141466272, "loss": 0.0158, "step": 293470 }, { "epoch": 0.76, "learning_rate": 0.00018588862593025575, "loss": 0.0131, "step": 293480 }, { "epoch": 0.76, "learning_rate": 0.0001858847377138843, "loss": 0.0192, "step": 293490 }, { "epoch": 0.76, "learning_rate": 0.00018588084949751284, "loss": 0.0169, "step": 293500 }, { "epoch": 0.76, "learning_rate": 0.00018587696128114135, "loss": 0.0115, "step": 293510 }, { "epoch": 0.76, "learning_rate": 0.0001858730730647699, "loss": 0.0127, "step": 293520 }, { "epoch": 0.76, "learning_rate": 0.0001858691848483984, "loss": 0.0173, "step": 293530 }, { "epoch": 0.76, "learning_rate": 0.00018586529663202698, "loss": 0.0145, "step": 293540 }, { "epoch": 0.76, "learning_rate": 0.0001858614084156555, "loss": 0.0144, "step": 293550 }, { "epoch": 0.76, "learning_rate": 0.00018585752019928403, "loss": 0.0151, "step": 293560 }, { "epoch": 0.76, "learning_rate": 0.00018585363198291255, "loss": 0.0196, "step": 293570 }, { "epoch": 0.76, "learning_rate": 0.00018584974376654112, "loss": 0.0142, "step": 293580 }, { "epoch": 0.76, "learning_rate": 0.00018584585555016963, "loss": 0.0133, "step": 293590 }, { "epoch": 0.76, "learning_rate": 0.00018584196733379817, "loss": 0.0143, "step": 293600 }, { "epoch": 0.76, "learning_rate": 0.00018583807911742669, "loss": 0.0134, "step": 293610 }, { "epoch": 0.76, "learning_rate": 0.00018583419090105525, "loss": 0.0143, "step": 293620 }, { "epoch": 0.76, "learning_rate": 0.0001858303026846838, "loss": 0.0134, "step": 293630 }, { "epoch": 0.76, "learning_rate": 0.0001858264144683123, "loss": 0.0174, "step": 293640 }, { "epoch": 0.76, "learning_rate": 0.00018582252625194085, "loss": 0.0144, "step": 293650 }, { "epoch": 0.76, "learning_rate": 0.0001858186380355694, "loss": 0.0168, "step": 293660 }, { "epoch": 0.76, "learning_rate": 0.00018581474981919794, "loss": 0.011, "step": 293670 }, { "epoch": 0.76, "learning_rate": 0.00018581086160282645, "loss": 0.0136, "step": 293680 }, { "epoch": 0.76, "learning_rate": 0.000185806973386455, "loss": 0.0153, "step": 293690 }, { "epoch": 0.76, "learning_rate": 0.00018580308517008353, "loss": 0.0166, "step": 293700 }, { "epoch": 0.76, "learning_rate": 0.00018579919695371208, "loss": 0.0121, "step": 293710 }, { "epoch": 0.76, "learning_rate": 0.0001857953087373406, "loss": 0.018, "step": 293720 }, { "epoch": 0.76, "learning_rate": 0.00018579142052096913, "loss": 0.0138, "step": 293730 }, { "epoch": 0.76, "learning_rate": 0.00018578753230459767, "loss": 0.0188, "step": 293740 }, { "epoch": 0.76, "learning_rate": 0.00018578364408822621, "loss": 0.0167, "step": 293750 }, { "epoch": 0.76, "learning_rate": 0.00018577975587185473, "loss": 0.0106, "step": 293760 }, { "epoch": 0.76, "learning_rate": 0.00018577586765548327, "loss": 0.0151, "step": 293770 }, { "epoch": 0.76, "learning_rate": 0.00018577197943911179, "loss": 0.0173, "step": 293780 }, { "epoch": 0.76, "learning_rate": 0.00018576809122274035, "loss": 0.0142, "step": 293790 }, { "epoch": 0.76, "learning_rate": 0.0001857642030063689, "loss": 0.0187, "step": 293800 }, { "epoch": 0.76, "learning_rate": 0.0001857603147899974, "loss": 0.0155, "step": 293810 }, { "epoch": 0.76, "learning_rate": 0.00018575642657362592, "loss": 0.0148, "step": 293820 }, { "epoch": 0.76, "learning_rate": 0.0001857525383572545, "loss": 0.0183, "step": 293830 }, { "epoch": 0.76, "learning_rate": 0.00018574865014088304, "loss": 0.0163, "step": 293840 }, { "epoch": 0.76, "learning_rate": 0.00018574476192451155, "loss": 0.017, "step": 293850 }, { "epoch": 0.76, "learning_rate": 0.0001857408737081401, "loss": 0.0161, "step": 293860 }, { "epoch": 0.76, "learning_rate": 0.00018573698549176863, "loss": 0.0103, "step": 293870 }, { "epoch": 0.76, "learning_rate": 0.00018573309727539717, "loss": 0.0132, "step": 293880 }, { "epoch": 0.76, "learning_rate": 0.0001857292090590257, "loss": 0.0148, "step": 293890 }, { "epoch": 0.76, "learning_rate": 0.00018572532084265423, "loss": 0.0157, "step": 293900 }, { "epoch": 0.76, "learning_rate": 0.00018572143262628277, "loss": 0.0175, "step": 293910 }, { "epoch": 0.76, "learning_rate": 0.00018571754440991131, "loss": 0.0118, "step": 293920 }, { "epoch": 0.76, "learning_rate": 0.00018571365619353983, "loss": 0.0133, "step": 293930 }, { "epoch": 0.76, "learning_rate": 0.00018570976797716837, "loss": 0.0165, "step": 293940 }, { "epoch": 0.76, "learning_rate": 0.00018570587976079694, "loss": 0.0136, "step": 293950 }, { "epoch": 0.76, "learning_rate": 0.00018570199154442545, "loss": 0.0171, "step": 293960 }, { "epoch": 0.76, "learning_rate": 0.000185698103328054, "loss": 0.0164, "step": 293970 }, { "epoch": 0.76, "learning_rate": 0.0001856942151116825, "loss": 0.017, "step": 293980 }, { "epoch": 0.76, "learning_rate": 0.00018569032689531108, "loss": 0.0141, "step": 293990 }, { "epoch": 0.76, "learning_rate": 0.0001856864386789396, "loss": 0.0123, "step": 294000 }, { "epoch": 0.76, "eval_cer": 0.8817306790618513, "eval_loss": 0.010044018737971783, "eval_runtime": 108.1094, "eval_samples_per_second": 18.5, "eval_steps_per_second": 4.625, "step": 294000 }, { "epoch": 0.76, "learning_rate": 0.00018568255046256813, "loss": 0.0099, "step": 294010 }, { "epoch": 0.76, "learning_rate": 0.00018567866224619665, "loss": 0.0134, "step": 294020 }, { "epoch": 0.76, "learning_rate": 0.0001856747740298252, "loss": 0.0173, "step": 294030 }, { "epoch": 0.76, "learning_rate": 0.00018567088581345373, "loss": 0.0127, "step": 294040 }, { "epoch": 0.76, "learning_rate": 0.00018566699759708227, "loss": 0.0113, "step": 294050 }, { "epoch": 0.76, "learning_rate": 0.0001856631093807108, "loss": 0.0164, "step": 294060 }, { "epoch": 0.76, "learning_rate": 0.00018565922116433933, "loss": 0.0167, "step": 294070 }, { "epoch": 0.76, "learning_rate": 0.00018565533294796787, "loss": 0.014, "step": 294080 }, { "epoch": 0.76, "learning_rate": 0.0001856514447315964, "loss": 0.012, "step": 294090 }, { "epoch": 0.76, "learning_rate": 0.00018564755651522493, "loss": 0.0161, "step": 294100 }, { "epoch": 0.76, "learning_rate": 0.00018564366829885347, "loss": 0.0159, "step": 294110 }, { "epoch": 0.76, "learning_rate": 0.00018563978008248204, "loss": 0.0147, "step": 294120 }, { "epoch": 0.76, "learning_rate": 0.00018563589186611055, "loss": 0.0134, "step": 294130 }, { "epoch": 0.76, "learning_rate": 0.00018563200364973907, "loss": 0.0125, "step": 294140 }, { "epoch": 0.76, "learning_rate": 0.0001856281154333676, "loss": 0.0143, "step": 294150 }, { "epoch": 0.76, "learning_rate": 0.00018562422721699618, "loss": 0.0137, "step": 294160 }, { "epoch": 0.76, "learning_rate": 0.0001856203390006247, "loss": 0.0151, "step": 294170 }, { "epoch": 0.76, "learning_rate": 0.00018561645078425323, "loss": 0.0132, "step": 294180 }, { "epoch": 0.76, "learning_rate": 0.00018561256256788175, "loss": 0.0126, "step": 294190 }, { "epoch": 0.76, "learning_rate": 0.00018560867435151032, "loss": 0.0154, "step": 294200 }, { "epoch": 0.76, "learning_rate": 0.00018560478613513883, "loss": 0.0146, "step": 294210 }, { "epoch": 0.76, "learning_rate": 0.00018560089791876737, "loss": 0.015, "step": 294220 }, { "epoch": 0.76, "learning_rate": 0.0001855970097023959, "loss": 0.0184, "step": 294230 }, { "epoch": 0.76, "learning_rate": 0.00018559312148602446, "loss": 0.0123, "step": 294240 }, { "epoch": 0.76, "learning_rate": 0.00018558923326965297, "loss": 0.013, "step": 294250 }, { "epoch": 0.76, "learning_rate": 0.0001855853450532815, "loss": 0.0138, "step": 294260 }, { "epoch": 0.76, "learning_rate": 0.00018558145683691003, "loss": 0.0135, "step": 294270 }, { "epoch": 0.76, "learning_rate": 0.00018557756862053857, "loss": 0.0116, "step": 294280 }, { "epoch": 0.76, "learning_rate": 0.00018557368040416714, "loss": 0.0118, "step": 294290 }, { "epoch": 0.76, "learning_rate": 0.00018556979218779565, "loss": 0.0149, "step": 294300 }, { "epoch": 0.76, "learning_rate": 0.00018556590397142417, "loss": 0.015, "step": 294310 }, { "epoch": 0.76, "learning_rate": 0.0001855620157550527, "loss": 0.0163, "step": 294320 }, { "epoch": 0.76, "learning_rate": 0.00018555812753868128, "loss": 0.0172, "step": 294330 }, { "epoch": 0.76, "learning_rate": 0.0001855542393223098, "loss": 0.0166, "step": 294340 }, { "epoch": 0.76, "learning_rate": 0.00018555035110593833, "loss": 0.0144, "step": 294350 }, { "epoch": 0.76, "learning_rate": 0.00018554646288956685, "loss": 0.011, "step": 294360 }, { "epoch": 0.76, "learning_rate": 0.00018554257467319542, "loss": 0.0117, "step": 294370 }, { "epoch": 0.76, "learning_rate": 0.00018553868645682393, "loss": 0.0127, "step": 294380 }, { "epoch": 0.76, "learning_rate": 0.00018553479824045247, "loss": 0.0132, "step": 294390 }, { "epoch": 0.76, "learning_rate": 0.000185530910024081, "loss": 0.0159, "step": 294400 }, { "epoch": 0.76, "learning_rate": 0.00018552702180770956, "loss": 0.013, "step": 294410 }, { "epoch": 0.76, "learning_rate": 0.00018552313359133807, "loss": 0.0125, "step": 294420 }, { "epoch": 0.76, "learning_rate": 0.0001855192453749666, "loss": 0.0149, "step": 294430 }, { "epoch": 0.76, "learning_rate": 0.00018551535715859513, "loss": 0.015, "step": 294440 }, { "epoch": 0.76, "learning_rate": 0.0001855114689422237, "loss": 0.0165, "step": 294450 }, { "epoch": 0.76, "learning_rate": 0.0001855075807258522, "loss": 0.019, "step": 294460 }, { "epoch": 0.76, "learning_rate": 0.00018550369250948075, "loss": 0.0111, "step": 294470 }, { "epoch": 0.76, "learning_rate": 0.00018549980429310927, "loss": 0.016, "step": 294480 }, { "epoch": 0.76, "learning_rate": 0.00018549591607673784, "loss": 0.0166, "step": 294490 }, { "epoch": 0.76, "learning_rate": 0.00018549202786036638, "loss": 0.0166, "step": 294500 }, { "epoch": 0.76, "learning_rate": 0.0001854881396439949, "loss": 0.0144, "step": 294510 }, { "epoch": 0.76, "learning_rate": 0.00018548425142762343, "loss": 0.0163, "step": 294520 }, { "epoch": 0.76, "learning_rate": 0.00018548036321125195, "loss": 0.0159, "step": 294530 }, { "epoch": 0.76, "learning_rate": 0.00018547647499488052, "loss": 0.0129, "step": 294540 }, { "epoch": 0.76, "learning_rate": 0.00018547258677850903, "loss": 0.0146, "step": 294550 }, { "epoch": 0.76, "learning_rate": 0.00018546869856213757, "loss": 0.0123, "step": 294560 }, { "epoch": 0.76, "learning_rate": 0.0001854648103457661, "loss": 0.0142, "step": 294570 }, { "epoch": 0.76, "learning_rate": 0.00018546092212939466, "loss": 0.0145, "step": 294580 }, { "epoch": 0.76, "learning_rate": 0.00018545703391302317, "loss": 0.0145, "step": 294590 }, { "epoch": 0.76, "learning_rate": 0.0001854531456966517, "loss": 0.0121, "step": 294600 }, { "epoch": 0.76, "learning_rate": 0.00018544925748028023, "loss": 0.0134, "step": 294610 }, { "epoch": 0.76, "learning_rate": 0.0001854453692639088, "loss": 0.012, "step": 294620 }, { "epoch": 0.76, "learning_rate": 0.0001854414810475373, "loss": 0.0116, "step": 294630 }, { "epoch": 0.76, "learning_rate": 0.00018543759283116585, "loss": 0.0161, "step": 294640 }, { "epoch": 0.76, "learning_rate": 0.00018543370461479437, "loss": 0.0132, "step": 294650 }, { "epoch": 0.76, "learning_rate": 0.00018542981639842293, "loss": 0.0149, "step": 294660 }, { "epoch": 0.76, "learning_rate": 0.00018542592818205148, "loss": 0.0125, "step": 294670 }, { "epoch": 0.76, "learning_rate": 0.00018542203996568, "loss": 0.0114, "step": 294680 }, { "epoch": 0.76, "learning_rate": 0.00018541815174930853, "loss": 0.0163, "step": 294690 }, { "epoch": 0.76, "learning_rate": 0.00018541426353293707, "loss": 0.016, "step": 294700 }, { "epoch": 0.76, "learning_rate": 0.00018541037531656562, "loss": 0.0152, "step": 294710 }, { "epoch": 0.76, "learning_rate": 0.00018540648710019413, "loss": 0.0131, "step": 294720 }, { "epoch": 0.76, "learning_rate": 0.00018540259888382267, "loss": 0.017, "step": 294730 }, { "epoch": 0.76, "learning_rate": 0.0001853987106674512, "loss": 0.0151, "step": 294740 }, { "epoch": 0.76, "learning_rate": 0.00018539482245107976, "loss": 0.0133, "step": 294750 }, { "epoch": 0.76, "learning_rate": 0.00018539093423470827, "loss": 0.0133, "step": 294760 }, { "epoch": 0.76, "learning_rate": 0.0001853870460183368, "loss": 0.0136, "step": 294770 }, { "epoch": 0.76, "learning_rate": 0.00018538315780196533, "loss": 0.0129, "step": 294780 }, { "epoch": 0.76, "learning_rate": 0.0001853792695855939, "loss": 0.0129, "step": 294790 }, { "epoch": 0.76, "learning_rate": 0.0001853753813692224, "loss": 0.0195, "step": 294800 }, { "epoch": 0.76, "learning_rate": 0.00018537149315285095, "loss": 0.0135, "step": 294810 }, { "epoch": 0.76, "learning_rate": 0.00018536760493647947, "loss": 0.0152, "step": 294820 }, { "epoch": 0.76, "learning_rate": 0.00018536371672010803, "loss": 0.0141, "step": 294830 }, { "epoch": 0.76, "learning_rate": 0.00018535982850373658, "loss": 0.0137, "step": 294840 }, { "epoch": 0.76, "learning_rate": 0.0001853559402873651, "loss": 0.0138, "step": 294850 }, { "epoch": 0.76, "learning_rate": 0.0001853520520709936, "loss": 0.0137, "step": 294860 }, { "epoch": 0.76, "learning_rate": 0.00018534816385462217, "loss": 0.0128, "step": 294870 }, { "epoch": 0.76, "learning_rate": 0.00018534427563825072, "loss": 0.0133, "step": 294880 }, { "epoch": 0.76, "learning_rate": 0.00018534038742187923, "loss": 0.0154, "step": 294890 }, { "epoch": 0.76, "learning_rate": 0.00018533649920550777, "loss": 0.0142, "step": 294900 }, { "epoch": 0.76, "learning_rate": 0.0001853326109891363, "loss": 0.0101, "step": 294910 }, { "epoch": 0.76, "learning_rate": 0.00018532872277276485, "loss": 0.016, "step": 294920 }, { "epoch": 0.76, "learning_rate": 0.00018532483455639337, "loss": 0.0136, "step": 294930 }, { "epoch": 0.76, "learning_rate": 0.0001853209463400219, "loss": 0.0211, "step": 294940 }, { "epoch": 0.76, "learning_rate": 0.00018531705812365045, "loss": 0.014, "step": 294950 }, { "epoch": 0.76, "learning_rate": 0.000185313169907279, "loss": 0.0136, "step": 294960 }, { "epoch": 0.76, "learning_rate": 0.0001853092816909075, "loss": 0.0171, "step": 294970 }, { "epoch": 0.76, "learning_rate": 0.00018530539347453605, "loss": 0.0174, "step": 294980 }, { "epoch": 0.76, "learning_rate": 0.00018530150525816462, "loss": 0.0119, "step": 294990 }, { "epoch": 0.76, "learning_rate": 0.00018529761704179313, "loss": 0.0135, "step": 295000 }, { "epoch": 0.76, "eval_cer": 0.881688689953826, "eval_loss": 0.00990963727235794, "eval_runtime": 107.8953, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 295000 }, { "epoch": 0.76, "learning_rate": 0.00018529372882542165, "loss": 0.0182, "step": 295010 }, { "epoch": 0.76, "learning_rate": 0.0001852898406090502, "loss": 0.0148, "step": 295020 }, { "epoch": 0.76, "learning_rate": 0.0001852859523926787, "loss": 0.0116, "step": 295030 }, { "epoch": 0.76, "learning_rate": 0.00018528206417630727, "loss": 0.0166, "step": 295040 }, { "epoch": 0.76, "learning_rate": 0.00018527817595993581, "loss": 0.0164, "step": 295050 }, { "epoch": 0.76, "learning_rate": 0.00018527428774356433, "loss": 0.0121, "step": 295060 }, { "epoch": 0.76, "learning_rate": 0.00018527039952719287, "loss": 0.0115, "step": 295070 }, { "epoch": 0.76, "learning_rate": 0.0001852665113108214, "loss": 0.0162, "step": 295080 }, { "epoch": 0.76, "learning_rate": 0.00018526262309444995, "loss": 0.0168, "step": 295090 }, { "epoch": 0.76, "learning_rate": 0.00018525873487807847, "loss": 0.015, "step": 295100 }, { "epoch": 0.76, "learning_rate": 0.000185254846661707, "loss": 0.014, "step": 295110 }, { "epoch": 0.76, "learning_rate": 0.00018525095844533555, "loss": 0.0162, "step": 295120 }, { "epoch": 0.77, "learning_rate": 0.0001852470702289641, "loss": 0.0123, "step": 295130 }, { "epoch": 0.77, "learning_rate": 0.0001852431820125926, "loss": 0.019, "step": 295140 }, { "epoch": 0.77, "learning_rate": 0.00018523929379622115, "loss": 0.0133, "step": 295150 }, { "epoch": 0.77, "learning_rate": 0.00018523540557984972, "loss": 0.015, "step": 295160 }, { "epoch": 0.77, "learning_rate": 0.00018523151736347823, "loss": 0.0191, "step": 295170 }, { "epoch": 0.77, "learning_rate": 0.00018522762914710675, "loss": 0.0169, "step": 295180 }, { "epoch": 0.77, "learning_rate": 0.0001852237409307353, "loss": 0.0154, "step": 295190 }, { "epoch": 0.77, "learning_rate": 0.00018521985271436386, "loss": 0.0157, "step": 295200 }, { "epoch": 0.77, "learning_rate": 0.00018521596449799237, "loss": 0.0157, "step": 295210 }, { "epoch": 0.77, "learning_rate": 0.00018521207628162091, "loss": 0.0138, "step": 295220 }, { "epoch": 0.77, "learning_rate": 0.00018520818806524943, "loss": 0.0132, "step": 295230 }, { "epoch": 0.77, "learning_rate": 0.000185204299848878, "loss": 0.014, "step": 295240 }, { "epoch": 0.77, "learning_rate": 0.0001852004116325065, "loss": 0.0108, "step": 295250 }, { "epoch": 0.77, "learning_rate": 0.00018519652341613505, "loss": 0.0173, "step": 295260 }, { "epoch": 0.77, "learning_rate": 0.00018519263519976357, "loss": 0.0174, "step": 295270 }, { "epoch": 0.77, "learning_rate": 0.0001851887469833921, "loss": 0.0128, "step": 295280 }, { "epoch": 0.77, "learning_rate": 0.00018518485876702065, "loss": 0.015, "step": 295290 }, { "epoch": 0.77, "learning_rate": 0.0001851809705506492, "loss": 0.0117, "step": 295300 }, { "epoch": 0.77, "learning_rate": 0.0001851770823342777, "loss": 0.0134, "step": 295310 }, { "epoch": 0.77, "learning_rate": 0.00018517319411790625, "loss": 0.0125, "step": 295320 }, { "epoch": 0.77, "learning_rate": 0.0001851693059015348, "loss": 0.0132, "step": 295330 }, { "epoch": 0.77, "learning_rate": 0.00018516541768516333, "loss": 0.0134, "step": 295340 }, { "epoch": 0.77, "learning_rate": 0.00018516152946879185, "loss": 0.0143, "step": 295350 }, { "epoch": 0.77, "learning_rate": 0.0001851576412524204, "loss": 0.0209, "step": 295360 }, { "epoch": 0.77, "learning_rate": 0.00018515375303604896, "loss": 0.0184, "step": 295370 }, { "epoch": 0.77, "learning_rate": 0.00018514986481967747, "loss": 0.0122, "step": 295380 }, { "epoch": 0.77, "learning_rate": 0.000185145976603306, "loss": 0.0123, "step": 295390 }, { "epoch": 0.77, "learning_rate": 0.00018514208838693453, "loss": 0.0153, "step": 295400 }, { "epoch": 0.77, "learning_rate": 0.0001851382001705631, "loss": 0.0165, "step": 295410 }, { "epoch": 0.77, "learning_rate": 0.0001851343119541916, "loss": 0.0181, "step": 295420 }, { "epoch": 0.77, "learning_rate": 0.00018513042373782015, "loss": 0.015, "step": 295430 }, { "epoch": 0.77, "learning_rate": 0.00018512653552144867, "loss": 0.013, "step": 295440 }, { "epoch": 0.77, "learning_rate": 0.00018512264730507724, "loss": 0.0154, "step": 295450 }, { "epoch": 0.77, "learning_rate": 0.00018511875908870575, "loss": 0.0101, "step": 295460 }, { "epoch": 0.77, "learning_rate": 0.0001851148708723343, "loss": 0.0161, "step": 295470 }, { "epoch": 0.77, "learning_rate": 0.0001851109826559628, "loss": 0.0175, "step": 295480 }, { "epoch": 0.77, "learning_rate": 0.00018510709443959138, "loss": 0.0193, "step": 295490 }, { "epoch": 0.77, "learning_rate": 0.0001851032062232199, "loss": 0.0131, "step": 295500 }, { "epoch": 0.77, "learning_rate": 0.00018509931800684843, "loss": 0.0164, "step": 295510 }, { "epoch": 0.77, "learning_rate": 0.00018509542979047695, "loss": 0.0137, "step": 295520 }, { "epoch": 0.77, "learning_rate": 0.0001850915415741055, "loss": 0.0139, "step": 295530 }, { "epoch": 0.77, "learning_rate": 0.00018508765335773406, "loss": 0.0112, "step": 295540 }, { "epoch": 0.77, "learning_rate": 0.00018508376514136257, "loss": 0.0139, "step": 295550 }, { "epoch": 0.77, "learning_rate": 0.0001850798769249911, "loss": 0.014, "step": 295560 }, { "epoch": 0.77, "learning_rate": 0.00018507598870861963, "loss": 0.0141, "step": 295570 }, { "epoch": 0.77, "learning_rate": 0.0001850721004922482, "loss": 0.0162, "step": 295580 }, { "epoch": 0.77, "learning_rate": 0.0001850682122758767, "loss": 0.0153, "step": 295590 }, { "epoch": 0.77, "learning_rate": 0.00018506432405950525, "loss": 0.0167, "step": 295600 }, { "epoch": 0.77, "learning_rate": 0.00018506043584313377, "loss": 0.0254, "step": 295610 }, { "epoch": 0.77, "learning_rate": 0.00018505654762676234, "loss": 0.0158, "step": 295620 }, { "epoch": 0.77, "learning_rate": 0.00018505265941039085, "loss": 0.0132, "step": 295630 }, { "epoch": 0.77, "learning_rate": 0.0001850487711940194, "loss": 0.0185, "step": 295640 }, { "epoch": 0.77, "learning_rate": 0.0001850448829776479, "loss": 0.0179, "step": 295650 }, { "epoch": 0.77, "learning_rate": 0.00018504099476127647, "loss": 0.014, "step": 295660 }, { "epoch": 0.77, "learning_rate": 0.000185037106544905, "loss": 0.0156, "step": 295670 }, { "epoch": 0.77, "learning_rate": 0.00018503321832853353, "loss": 0.013, "step": 295680 }, { "epoch": 0.77, "learning_rate": 0.00018502933011216205, "loss": 0.0157, "step": 295690 }, { "epoch": 0.77, "learning_rate": 0.00018502544189579061, "loss": 0.0142, "step": 295700 }, { "epoch": 0.77, "learning_rate": 0.00018502155367941916, "loss": 0.0106, "step": 295710 }, { "epoch": 0.77, "learning_rate": 0.00018501766546304767, "loss": 0.012, "step": 295720 }, { "epoch": 0.77, "learning_rate": 0.00018501377724667619, "loss": 0.0152, "step": 295730 }, { "epoch": 0.77, "learning_rate": 0.00018500988903030475, "loss": 0.0161, "step": 295740 }, { "epoch": 0.77, "learning_rate": 0.0001850060008139333, "loss": 0.0133, "step": 295750 }, { "epoch": 0.77, "learning_rate": 0.0001850021125975618, "loss": 0.0138, "step": 295760 }, { "epoch": 0.77, "learning_rate": 0.00018499822438119035, "loss": 0.0131, "step": 295770 }, { "epoch": 0.77, "learning_rate": 0.00018499433616481887, "loss": 0.0143, "step": 295780 }, { "epoch": 0.77, "learning_rate": 0.00018499044794844743, "loss": 0.0151, "step": 295790 }, { "epoch": 0.77, "learning_rate": 0.00018498655973207595, "loss": 0.0126, "step": 295800 }, { "epoch": 0.77, "learning_rate": 0.0001849826715157045, "loss": 0.0122, "step": 295810 }, { "epoch": 0.77, "learning_rate": 0.000184978783299333, "loss": 0.0159, "step": 295820 }, { "epoch": 0.77, "learning_rate": 0.00018497489508296157, "loss": 0.0164, "step": 295830 }, { "epoch": 0.77, "learning_rate": 0.0001849710068665901, "loss": 0.0173, "step": 295840 }, { "epoch": 0.77, "learning_rate": 0.00018496711865021863, "loss": 0.0132, "step": 295850 }, { "epoch": 0.77, "learning_rate": 0.00018496323043384715, "loss": 0.0125, "step": 295860 }, { "epoch": 0.77, "learning_rate": 0.00018495934221747571, "loss": 0.0155, "step": 295870 }, { "epoch": 0.77, "learning_rate": 0.00018495545400110423, "loss": 0.0111, "step": 295880 }, { "epoch": 0.77, "learning_rate": 0.00018495156578473277, "loss": 0.0156, "step": 295890 }, { "epoch": 0.77, "learning_rate": 0.00018494767756836128, "loss": 0.0118, "step": 295900 }, { "epoch": 0.77, "learning_rate": 0.00018494378935198985, "loss": 0.0151, "step": 295910 }, { "epoch": 0.77, "learning_rate": 0.0001849399011356184, "loss": 0.0125, "step": 295920 }, { "epoch": 0.77, "learning_rate": 0.0001849360129192469, "loss": 0.0144, "step": 295930 }, { "epoch": 0.77, "learning_rate": 0.00018493212470287545, "loss": 0.0151, "step": 295940 }, { "epoch": 0.77, "learning_rate": 0.000184928236486504, "loss": 0.0136, "step": 295950 }, { "epoch": 0.77, "learning_rate": 0.00018492434827013253, "loss": 0.013, "step": 295960 }, { "epoch": 0.77, "learning_rate": 0.00018492046005376105, "loss": 0.0131, "step": 295970 }, { "epoch": 0.77, "learning_rate": 0.0001849165718373896, "loss": 0.0119, "step": 295980 }, { "epoch": 0.77, "learning_rate": 0.00018491268362101813, "loss": 0.0113, "step": 295990 }, { "epoch": 0.77, "learning_rate": 0.00018490879540464667, "loss": 0.0132, "step": 296000 }, { "epoch": 0.77, "eval_cer": 0.881727879787983, "eval_loss": 0.00943910051137209, "eval_runtime": 107.9554, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.632, "step": 296000 }, { "epoch": 0.77, "learning_rate": 0.0001849049071882752, "loss": 0.012, "step": 296010 }, { "epoch": 0.77, "learning_rate": 0.00018490101897190373, "loss": 0.0153, "step": 296020 }, { "epoch": 0.77, "learning_rate": 0.00018489713075553224, "loss": 0.0116, "step": 296030 }, { "epoch": 0.77, "learning_rate": 0.0001848932425391608, "loss": 0.0146, "step": 296040 }, { "epoch": 0.77, "learning_rate": 0.00018488935432278933, "loss": 0.0132, "step": 296050 }, { "epoch": 0.77, "learning_rate": 0.00018488546610641787, "loss": 0.0139, "step": 296060 }, { "epoch": 0.77, "learning_rate": 0.00018488157789004638, "loss": 0.0164, "step": 296070 }, { "epoch": 0.77, "learning_rate": 0.00018487768967367495, "loss": 0.0123, "step": 296080 }, { "epoch": 0.77, "learning_rate": 0.0001848738014573035, "loss": 0.0144, "step": 296090 }, { "epoch": 0.77, "learning_rate": 0.000184869913240932, "loss": 0.0167, "step": 296100 }, { "epoch": 0.77, "learning_rate": 0.00018486602502456055, "loss": 0.0174, "step": 296110 }, { "epoch": 0.77, "learning_rate": 0.0001848621368081891, "loss": 0.0149, "step": 296120 }, { "epoch": 0.77, "learning_rate": 0.00018485824859181763, "loss": 0.0193, "step": 296130 }, { "epoch": 0.77, "learning_rate": 0.00018485436037544615, "loss": 0.0133, "step": 296140 }, { "epoch": 0.77, "learning_rate": 0.0001848504721590747, "loss": 0.0143, "step": 296150 }, { "epoch": 0.77, "learning_rate": 0.00018484658394270323, "loss": 0.0139, "step": 296160 }, { "epoch": 0.77, "learning_rate": 0.00018484269572633177, "loss": 0.0163, "step": 296170 }, { "epoch": 0.77, "learning_rate": 0.0001848388075099603, "loss": 0.0142, "step": 296180 }, { "epoch": 0.77, "learning_rate": 0.00018483491929358883, "loss": 0.0134, "step": 296190 }, { "epoch": 0.77, "learning_rate": 0.00018483103107721737, "loss": 0.0151, "step": 296200 }, { "epoch": 0.77, "learning_rate": 0.0001848271428608459, "loss": 0.0162, "step": 296210 }, { "epoch": 0.77, "learning_rate": 0.00018482325464447443, "loss": 0.0181, "step": 296220 }, { "epoch": 0.77, "learning_rate": 0.00018481936642810297, "loss": 0.0171, "step": 296230 }, { "epoch": 0.77, "learning_rate": 0.00018481547821173148, "loss": 0.0143, "step": 296240 }, { "epoch": 0.77, "learning_rate": 0.00018481158999536005, "loss": 0.0142, "step": 296250 }, { "epoch": 0.77, "learning_rate": 0.0001848077017789886, "loss": 0.0146, "step": 296260 }, { "epoch": 0.77, "learning_rate": 0.0001848038135626171, "loss": 0.0149, "step": 296270 }, { "epoch": 0.77, "learning_rate": 0.00018479992534624565, "loss": 0.0126, "step": 296280 }, { "epoch": 0.77, "learning_rate": 0.0001847960371298742, "loss": 0.0146, "step": 296290 }, { "epoch": 0.77, "learning_rate": 0.00018479214891350273, "loss": 0.0165, "step": 296300 }, { "epoch": 0.77, "learning_rate": 0.00018478826069713125, "loss": 0.0147, "step": 296310 }, { "epoch": 0.77, "learning_rate": 0.0001847843724807598, "loss": 0.0128, "step": 296320 }, { "epoch": 0.77, "learning_rate": 0.00018478048426438833, "loss": 0.0128, "step": 296330 }, { "epoch": 0.77, "learning_rate": 0.00018477659604801687, "loss": 0.0131, "step": 296340 }, { "epoch": 0.77, "learning_rate": 0.0001847727078316454, "loss": 0.0126, "step": 296350 }, { "epoch": 0.77, "learning_rate": 0.00018476881961527393, "loss": 0.011, "step": 296360 }, { "epoch": 0.77, "learning_rate": 0.00018476493139890247, "loss": 0.015, "step": 296370 }, { "epoch": 0.77, "learning_rate": 0.000184761043182531, "loss": 0.0167, "step": 296380 }, { "epoch": 0.77, "learning_rate": 0.00018475715496615953, "loss": 0.0146, "step": 296390 }, { "epoch": 0.77, "learning_rate": 0.00018475326674978807, "loss": 0.0234, "step": 296400 }, { "epoch": 0.77, "learning_rate": 0.00018474937853341664, "loss": 0.0167, "step": 296410 }, { "epoch": 0.77, "learning_rate": 0.00018474549031704515, "loss": 0.012, "step": 296420 }, { "epoch": 0.77, "learning_rate": 0.0001847416021006737, "loss": 0.0161, "step": 296430 }, { "epoch": 0.77, "learning_rate": 0.0001847377138843022, "loss": 0.0139, "step": 296440 }, { "epoch": 0.77, "learning_rate": 0.00018473382566793078, "loss": 0.0135, "step": 296450 }, { "epoch": 0.77, "learning_rate": 0.0001847299374515593, "loss": 0.0125, "step": 296460 }, { "epoch": 0.77, "learning_rate": 0.00018472604923518783, "loss": 0.0173, "step": 296470 }, { "epoch": 0.77, "learning_rate": 0.00018472216101881635, "loss": 0.0153, "step": 296480 }, { "epoch": 0.77, "learning_rate": 0.0001847182728024449, "loss": 0.0133, "step": 296490 }, { "epoch": 0.77, "learning_rate": 0.00018471438458607343, "loss": 0.0156, "step": 296500 }, { "epoch": 0.77, "learning_rate": 0.00018471049636970197, "loss": 0.0136, "step": 296510 }, { "epoch": 0.77, "learning_rate": 0.0001847066081533305, "loss": 0.0193, "step": 296520 }, { "epoch": 0.77, "learning_rate": 0.00018470271993695903, "loss": 0.0152, "step": 296530 }, { "epoch": 0.77, "learning_rate": 0.00018469883172058757, "loss": 0.0119, "step": 296540 }, { "epoch": 0.77, "learning_rate": 0.0001846949435042161, "loss": 0.0161, "step": 296550 }, { "epoch": 0.77, "learning_rate": 0.00018469105528784463, "loss": 0.0176, "step": 296560 }, { "epoch": 0.77, "learning_rate": 0.00018468716707147317, "loss": 0.0182, "step": 296570 }, { "epoch": 0.77, "learning_rate": 0.00018468327885510174, "loss": 0.0121, "step": 296580 }, { "epoch": 0.77, "learning_rate": 0.00018467939063873025, "loss": 0.0158, "step": 296590 }, { "epoch": 0.77, "learning_rate": 0.00018467550242235877, "loss": 0.0139, "step": 296600 }, { "epoch": 0.77, "learning_rate": 0.0001846716142059873, "loss": 0.0134, "step": 296610 }, { "epoch": 0.77, "learning_rate": 0.00018466772598961588, "loss": 0.0175, "step": 296620 }, { "epoch": 0.77, "learning_rate": 0.0001846638377732444, "loss": 0.0124, "step": 296630 }, { "epoch": 0.77, "learning_rate": 0.00018465994955687293, "loss": 0.0115, "step": 296640 }, { "epoch": 0.77, "learning_rate": 0.00018465606134050145, "loss": 0.0173, "step": 296650 }, { "epoch": 0.77, "learning_rate": 0.00018465217312413002, "loss": 0.014, "step": 296660 }, { "epoch": 0.77, "learning_rate": 0.00018464828490775853, "loss": 0.0145, "step": 296670 }, { "epoch": 0.77, "learning_rate": 0.00018464439669138707, "loss": 0.0153, "step": 296680 }, { "epoch": 0.77, "learning_rate": 0.00018464050847501559, "loss": 0.0153, "step": 296690 }, { "epoch": 0.77, "learning_rate": 0.00018463662025864415, "loss": 0.0127, "step": 296700 }, { "epoch": 0.77, "learning_rate": 0.00018463273204227267, "loss": 0.0147, "step": 296710 }, { "epoch": 0.77, "learning_rate": 0.0001846288438259012, "loss": 0.0146, "step": 296720 }, { "epoch": 0.77, "learning_rate": 0.00018462495560952973, "loss": 0.0124, "step": 296730 }, { "epoch": 0.77, "learning_rate": 0.00018462106739315827, "loss": 0.0134, "step": 296740 }, { "epoch": 0.77, "learning_rate": 0.00018461717917678684, "loss": 0.0141, "step": 296750 }, { "epoch": 0.77, "learning_rate": 0.00018461329096041535, "loss": 0.0137, "step": 296760 }, { "epoch": 0.77, "learning_rate": 0.00018460940274404386, "loss": 0.016, "step": 296770 }, { "epoch": 0.77, "learning_rate": 0.0001846055145276724, "loss": 0.0157, "step": 296780 }, { "epoch": 0.77, "learning_rate": 0.00018460162631130098, "loss": 0.0134, "step": 296790 }, { "epoch": 0.77, "learning_rate": 0.0001845977380949295, "loss": 0.0104, "step": 296800 }, { "epoch": 0.77, "learning_rate": 0.00018459384987855803, "loss": 0.015, "step": 296810 }, { "epoch": 0.77, "learning_rate": 0.00018458996166218655, "loss": 0.0158, "step": 296820 }, { "epoch": 0.77, "learning_rate": 0.00018458607344581511, "loss": 0.0179, "step": 296830 }, { "epoch": 0.77, "learning_rate": 0.00018458218522944363, "loss": 0.015, "step": 296840 }, { "epoch": 0.77, "learning_rate": 0.00018457829701307217, "loss": 0.0152, "step": 296850 }, { "epoch": 0.77, "learning_rate": 0.00018457440879670069, "loss": 0.0128, "step": 296860 }, { "epoch": 0.77, "learning_rate": 0.00018457052058032925, "loss": 0.0183, "step": 296870 }, { "epoch": 0.77, "learning_rate": 0.00018456663236395777, "loss": 0.0131, "step": 296880 }, { "epoch": 0.77, "learning_rate": 0.0001845627441475863, "loss": 0.0154, "step": 296890 }, { "epoch": 0.77, "learning_rate": 0.00018455885593121482, "loss": 0.0163, "step": 296900 }, { "epoch": 0.77, "learning_rate": 0.0001845549677148434, "loss": 0.0159, "step": 296910 }, { "epoch": 0.77, "learning_rate": 0.0001845510794984719, "loss": 0.0148, "step": 296920 }, { "epoch": 0.77, "learning_rate": 0.00018454719128210045, "loss": 0.0179, "step": 296930 }, { "epoch": 0.77, "learning_rate": 0.00018454330306572896, "loss": 0.0171, "step": 296940 }, { "epoch": 0.77, "learning_rate": 0.00018453941484935753, "loss": 0.013, "step": 296950 }, { "epoch": 0.77, "learning_rate": 0.00018453552663298607, "loss": 0.0114, "step": 296960 }, { "epoch": 0.77, "learning_rate": 0.0001845316384166146, "loss": 0.0117, "step": 296970 }, { "epoch": 0.77, "learning_rate": 0.00018452775020024313, "loss": 0.0127, "step": 296980 }, { "epoch": 0.77, "learning_rate": 0.00018452386198387165, "loss": 0.0157, "step": 296990 }, { "epoch": 0.77, "learning_rate": 0.00018451997376750021, "loss": 0.0137, "step": 297000 }, { "epoch": 0.77, "eval_cer": 0.8817432757942589, "eval_loss": 0.010051160119473934, "eval_runtime": 108.1046, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 297000 }, { "epoch": 0.77, "learning_rate": 0.00018451608555112873, "loss": 0.0122, "step": 297010 }, { "epoch": 0.77, "learning_rate": 0.00018451219733475727, "loss": 0.0184, "step": 297020 }, { "epoch": 0.77, "learning_rate": 0.00018450830911838578, "loss": 0.0161, "step": 297030 }, { "epoch": 0.77, "learning_rate": 0.00018450442090201435, "loss": 0.0141, "step": 297040 }, { "epoch": 0.77, "learning_rate": 0.00018450053268564287, "loss": 0.0119, "step": 297050 }, { "epoch": 0.77, "learning_rate": 0.0001844966444692714, "loss": 0.0152, "step": 297060 }, { "epoch": 0.77, "learning_rate": 0.00018449275625289992, "loss": 0.0156, "step": 297070 }, { "epoch": 0.77, "learning_rate": 0.0001844888680365285, "loss": 0.0131, "step": 297080 }, { "epoch": 0.77, "learning_rate": 0.000184484979820157, "loss": 0.0135, "step": 297090 }, { "epoch": 0.77, "learning_rate": 0.00018448109160378555, "loss": 0.0134, "step": 297100 }, { "epoch": 0.77, "learning_rate": 0.00018447720338741406, "loss": 0.012, "step": 297110 }, { "epoch": 0.77, "learning_rate": 0.00018447331517104263, "loss": 0.014, "step": 297120 }, { "epoch": 0.77, "learning_rate": 0.00018446942695467117, "loss": 0.0163, "step": 297130 }, { "epoch": 0.77, "learning_rate": 0.0001844655387382997, "loss": 0.0184, "step": 297140 }, { "epoch": 0.77, "learning_rate": 0.00018446165052192823, "loss": 0.016, "step": 297150 }, { "epoch": 0.77, "learning_rate": 0.00018445776230555677, "loss": 0.0128, "step": 297160 }, { "epoch": 0.77, "learning_rate": 0.0001844538740891853, "loss": 0.0139, "step": 297170 }, { "epoch": 0.77, "learning_rate": 0.00018444998587281383, "loss": 0.0119, "step": 297180 }, { "epoch": 0.77, "learning_rate": 0.00018444609765644237, "loss": 0.0118, "step": 297190 }, { "epoch": 0.77, "learning_rate": 0.0001844422094400709, "loss": 0.0153, "step": 297200 }, { "epoch": 0.77, "learning_rate": 0.00018443832122369945, "loss": 0.0115, "step": 297210 }, { "epoch": 0.77, "learning_rate": 0.00018443443300732797, "loss": 0.0168, "step": 297220 }, { "epoch": 0.77, "learning_rate": 0.0001844305447909565, "loss": 0.0147, "step": 297230 }, { "epoch": 0.77, "learning_rate": 0.00018442665657458502, "loss": 0.0155, "step": 297240 }, { "epoch": 0.77, "learning_rate": 0.0001844227683582136, "loss": 0.015, "step": 297250 }, { "epoch": 0.77, "learning_rate": 0.0001844188801418421, "loss": 0.016, "step": 297260 }, { "epoch": 0.77, "learning_rate": 0.00018441499192547065, "loss": 0.0164, "step": 297270 }, { "epoch": 0.77, "learning_rate": 0.00018441110370909916, "loss": 0.0164, "step": 297280 }, { "epoch": 0.77, "learning_rate": 0.00018440721549272773, "loss": 0.0114, "step": 297290 }, { "epoch": 0.77, "learning_rate": 0.00018440332727635627, "loss": 0.0168, "step": 297300 }, { "epoch": 0.77, "learning_rate": 0.0001843994390599848, "loss": 0.0112, "step": 297310 }, { "epoch": 0.77, "learning_rate": 0.0001843955508436133, "loss": 0.015, "step": 297320 }, { "epoch": 0.77, "learning_rate": 0.00018439166262724187, "loss": 0.0153, "step": 297330 }, { "epoch": 0.77, "learning_rate": 0.0001843877744108704, "loss": 0.0117, "step": 297340 }, { "epoch": 0.77, "learning_rate": 0.00018438388619449893, "loss": 0.0176, "step": 297350 }, { "epoch": 0.77, "learning_rate": 0.00018437999797812747, "loss": 0.0167, "step": 297360 }, { "epoch": 0.77, "learning_rate": 0.000184376109761756, "loss": 0.0136, "step": 297370 }, { "epoch": 0.77, "learning_rate": 0.00018437222154538455, "loss": 0.0136, "step": 297380 }, { "epoch": 0.77, "learning_rate": 0.00018436833332901307, "loss": 0.0164, "step": 297390 }, { "epoch": 0.77, "learning_rate": 0.0001843644451126416, "loss": 0.0158, "step": 297400 }, { "epoch": 0.77, "learning_rate": 0.00018436055689627015, "loss": 0.014, "step": 297410 }, { "epoch": 0.77, "learning_rate": 0.0001843566686798987, "loss": 0.0142, "step": 297420 }, { "epoch": 0.77, "learning_rate": 0.0001843527804635272, "loss": 0.0146, "step": 297430 }, { "epoch": 0.77, "learning_rate": 0.00018434889224715575, "loss": 0.0143, "step": 297440 }, { "epoch": 0.77, "learning_rate": 0.00018434500403078432, "loss": 0.0154, "step": 297450 }, { "epoch": 0.77, "learning_rate": 0.00018434111581441283, "loss": 0.018, "step": 297460 }, { "epoch": 0.77, "learning_rate": 0.00018433722759804135, "loss": 0.0127, "step": 297470 }, { "epoch": 0.77, "learning_rate": 0.0001843333393816699, "loss": 0.0138, "step": 297480 }, { "epoch": 0.77, "learning_rate": 0.0001843294511652984, "loss": 0.0144, "step": 297490 }, { "epoch": 0.77, "learning_rate": 0.00018432556294892697, "loss": 0.0141, "step": 297500 }, { "epoch": 0.77, "learning_rate": 0.0001843216747325555, "loss": 0.0154, "step": 297510 }, { "epoch": 0.77, "learning_rate": 0.00018431778651618403, "loss": 0.0115, "step": 297520 }, { "epoch": 0.77, "learning_rate": 0.00018431389829981257, "loss": 0.0117, "step": 297530 }, { "epoch": 0.77, "learning_rate": 0.0001843100100834411, "loss": 0.0126, "step": 297540 }, { "epoch": 0.77, "learning_rate": 0.00018430612186706965, "loss": 0.0129, "step": 297550 }, { "epoch": 0.77, "learning_rate": 0.00018430223365069817, "loss": 0.0138, "step": 297560 }, { "epoch": 0.77, "learning_rate": 0.0001842983454343267, "loss": 0.0132, "step": 297570 }, { "epoch": 0.77, "learning_rate": 0.00018429445721795525, "loss": 0.018, "step": 297580 }, { "epoch": 0.77, "learning_rate": 0.0001842905690015838, "loss": 0.0142, "step": 297590 }, { "epoch": 0.77, "learning_rate": 0.0001842866807852123, "loss": 0.0145, "step": 297600 }, { "epoch": 0.77, "learning_rate": 0.00018428279256884085, "loss": 0.0155, "step": 297610 }, { "epoch": 0.77, "learning_rate": 0.00018427890435246942, "loss": 0.0147, "step": 297620 }, { "epoch": 0.77, "learning_rate": 0.00018427501613609793, "loss": 0.0156, "step": 297630 }, { "epoch": 0.77, "learning_rate": 0.00018427112791972645, "loss": 0.0126, "step": 297640 }, { "epoch": 0.77, "learning_rate": 0.000184267239703355, "loss": 0.0137, "step": 297650 }, { "epoch": 0.77, "learning_rate": 0.00018426335148698356, "loss": 0.0135, "step": 297660 }, { "epoch": 0.77, "learning_rate": 0.00018425946327061207, "loss": 0.0126, "step": 297670 }, { "epoch": 0.77, "learning_rate": 0.0001842555750542406, "loss": 0.0133, "step": 297680 }, { "epoch": 0.77, "learning_rate": 0.00018425168683786913, "loss": 0.0133, "step": 297690 }, { "epoch": 0.77, "learning_rate": 0.0001842477986214977, "loss": 0.017, "step": 297700 }, { "epoch": 0.77, "learning_rate": 0.0001842439104051262, "loss": 0.0128, "step": 297710 }, { "epoch": 0.77, "learning_rate": 0.00018424002218875475, "loss": 0.0124, "step": 297720 }, { "epoch": 0.77, "learning_rate": 0.00018423613397238327, "loss": 0.0138, "step": 297730 }, { "epoch": 0.77, "learning_rate": 0.0001842322457560118, "loss": 0.0161, "step": 297740 }, { "epoch": 0.77, "learning_rate": 0.00018422835753964035, "loss": 0.0128, "step": 297750 }, { "epoch": 0.77, "learning_rate": 0.0001842244693232689, "loss": 0.0205, "step": 297760 }, { "epoch": 0.77, "learning_rate": 0.0001842205811068974, "loss": 0.0132, "step": 297770 }, { "epoch": 0.77, "learning_rate": 0.00018421669289052595, "loss": 0.0121, "step": 297780 }, { "epoch": 0.77, "learning_rate": 0.0001842128046741545, "loss": 0.0142, "step": 297790 }, { "epoch": 0.77, "learning_rate": 0.00018420891645778303, "loss": 0.0136, "step": 297800 }, { "epoch": 0.77, "learning_rate": 0.00018420502824141154, "loss": 0.0162, "step": 297810 }, { "epoch": 0.77, "learning_rate": 0.00018420114002504009, "loss": 0.0148, "step": 297820 }, { "epoch": 0.77, "learning_rate": 0.00018419725180866866, "loss": 0.0139, "step": 297830 }, { "epoch": 0.77, "learning_rate": 0.00018419336359229717, "loss": 0.0138, "step": 297840 }, { "epoch": 0.77, "learning_rate": 0.0001841894753759257, "loss": 0.0129, "step": 297850 }, { "epoch": 0.77, "learning_rate": 0.00018418558715955423, "loss": 0.0205, "step": 297860 }, { "epoch": 0.77, "learning_rate": 0.0001841816989431828, "loss": 0.0159, "step": 297870 }, { "epoch": 0.77, "learning_rate": 0.0001841778107268113, "loss": 0.0129, "step": 297880 }, { "epoch": 0.77, "learning_rate": 0.00018417392251043985, "loss": 0.014, "step": 297890 }, { "epoch": 0.77, "learning_rate": 0.00018417003429406837, "loss": 0.0124, "step": 297900 }, { "epoch": 0.77, "learning_rate": 0.00018416614607769693, "loss": 0.013, "step": 297910 }, { "epoch": 0.77, "learning_rate": 0.00018416225786132545, "loss": 0.0186, "step": 297920 }, { "epoch": 0.77, "learning_rate": 0.000184158369644954, "loss": 0.0104, "step": 297930 }, { "epoch": 0.77, "learning_rate": 0.0001841544814285825, "loss": 0.0163, "step": 297940 }, { "epoch": 0.77, "learning_rate": 0.00018415059321221107, "loss": 0.0149, "step": 297950 }, { "epoch": 0.77, "learning_rate": 0.0001841467049958396, "loss": 0.0108, "step": 297960 }, { "epoch": 0.77, "learning_rate": 0.00018414281677946813, "loss": 0.0181, "step": 297970 }, { "epoch": 0.77, "learning_rate": 0.00018413892856309664, "loss": 0.011, "step": 297980 }, { "epoch": 0.77, "learning_rate": 0.00018413504034672519, "loss": 0.0185, "step": 297990 }, { "epoch": 0.77, "learning_rate": 0.00018413115213035375, "loss": 0.0159, "step": 298000 }, { "epoch": 0.77, "eval_cer": 0.8817348779726539, "eval_loss": 0.00948801077902317, "eval_runtime": 107.7174, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 298000 }, { "epoch": 0.77, "learning_rate": 0.00018412726391398227, "loss": 0.0123, "step": 298010 }, { "epoch": 0.77, "learning_rate": 0.0001841233756976108, "loss": 0.013, "step": 298020 }, { "epoch": 0.77, "learning_rate": 0.00018411948748123933, "loss": 0.0125, "step": 298030 }, { "epoch": 0.77, "learning_rate": 0.0001841155992648679, "loss": 0.0146, "step": 298040 }, { "epoch": 0.77, "learning_rate": 0.0001841117110484964, "loss": 0.0128, "step": 298050 }, { "epoch": 0.77, "learning_rate": 0.00018410782283212495, "loss": 0.0143, "step": 298060 }, { "epoch": 0.77, "learning_rate": 0.00018410393461575346, "loss": 0.0162, "step": 298070 }, { "epoch": 0.77, "learning_rate": 0.00018410004639938203, "loss": 0.018, "step": 298080 }, { "epoch": 0.77, "learning_rate": 0.00018409615818301055, "loss": 0.0158, "step": 298090 }, { "epoch": 0.77, "learning_rate": 0.0001840922699666391, "loss": 0.0127, "step": 298100 }, { "epoch": 0.77, "learning_rate": 0.0001840883817502676, "loss": 0.0159, "step": 298110 }, { "epoch": 0.77, "learning_rate": 0.00018408449353389617, "loss": 0.0159, "step": 298120 }, { "epoch": 0.77, "learning_rate": 0.0001840806053175247, "loss": 0.0144, "step": 298130 }, { "epoch": 0.77, "learning_rate": 0.00018407671710115323, "loss": 0.013, "step": 298140 }, { "epoch": 0.77, "learning_rate": 0.00018407282888478174, "loss": 0.0126, "step": 298150 }, { "epoch": 0.77, "learning_rate": 0.0001840689406684103, "loss": 0.0142, "step": 298160 }, { "epoch": 0.77, "learning_rate": 0.00018406505245203885, "loss": 0.0151, "step": 298170 }, { "epoch": 0.77, "learning_rate": 0.00018406116423566737, "loss": 0.0141, "step": 298180 }, { "epoch": 0.77, "learning_rate": 0.00018405727601929588, "loss": 0.0158, "step": 298190 }, { "epoch": 0.77, "learning_rate": 0.00018405338780292445, "loss": 0.0161, "step": 298200 }, { "epoch": 0.77, "learning_rate": 0.000184049499586553, "loss": 0.0113, "step": 298210 }, { "epoch": 0.77, "learning_rate": 0.0001840456113701815, "loss": 0.0099, "step": 298220 }, { "epoch": 0.77, "learning_rate": 0.00018404172315381005, "loss": 0.017, "step": 298230 }, { "epoch": 0.77, "learning_rate": 0.00018403783493743856, "loss": 0.0158, "step": 298240 }, { "epoch": 0.77, "learning_rate": 0.00018403394672106713, "loss": 0.0148, "step": 298250 }, { "epoch": 0.77, "learning_rate": 0.00018403005850469565, "loss": 0.0128, "step": 298260 }, { "epoch": 0.77, "learning_rate": 0.0001840261702883242, "loss": 0.0122, "step": 298270 }, { "epoch": 0.77, "learning_rate": 0.0001840222820719527, "loss": 0.0152, "step": 298280 }, { "epoch": 0.77, "learning_rate": 0.00018401839385558127, "loss": 0.0138, "step": 298290 }, { "epoch": 0.77, "learning_rate": 0.0001840145056392098, "loss": 0.0165, "step": 298300 }, { "epoch": 0.77, "learning_rate": 0.00018401061742283833, "loss": 0.0164, "step": 298310 }, { "epoch": 0.77, "learning_rate": 0.00018400672920646684, "loss": 0.0183, "step": 298320 }, { "epoch": 0.77, "learning_rate": 0.0001840028409900954, "loss": 0.0143, "step": 298330 }, { "epoch": 0.77, "learning_rate": 0.00018399895277372395, "loss": 0.0146, "step": 298340 }, { "epoch": 0.77, "learning_rate": 0.00018399506455735247, "loss": 0.0132, "step": 298350 }, { "epoch": 0.77, "learning_rate": 0.00018399117634098098, "loss": 0.0129, "step": 298360 }, { "epoch": 0.77, "learning_rate": 0.00018398728812460955, "loss": 0.0145, "step": 298370 }, { "epoch": 0.77, "learning_rate": 0.0001839833999082381, "loss": 0.0122, "step": 298380 }, { "epoch": 0.77, "learning_rate": 0.0001839795116918666, "loss": 0.0134, "step": 298390 }, { "epoch": 0.77, "learning_rate": 0.00018397562347549515, "loss": 0.0151, "step": 298400 }, { "epoch": 0.77, "learning_rate": 0.0001839717352591237, "loss": 0.0117, "step": 298410 }, { "epoch": 0.77, "learning_rate": 0.00018396784704275223, "loss": 0.0138, "step": 298420 }, { "epoch": 0.77, "learning_rate": 0.00018396395882638075, "loss": 0.0149, "step": 298430 }, { "epoch": 0.77, "learning_rate": 0.0001839600706100093, "loss": 0.0157, "step": 298440 }, { "epoch": 0.77, "learning_rate": 0.00018395618239363783, "loss": 0.0128, "step": 298450 }, { "epoch": 0.77, "learning_rate": 0.00018395229417726637, "loss": 0.017, "step": 298460 }, { "epoch": 0.77, "learning_rate": 0.00018394840596089489, "loss": 0.0174, "step": 298470 }, { "epoch": 0.77, "learning_rate": 0.00018394451774452343, "loss": 0.013, "step": 298480 }, { "epoch": 0.77, "learning_rate": 0.00018394062952815194, "loss": 0.0109, "step": 298490 }, { "epoch": 0.77, "learning_rate": 0.0001839367413117805, "loss": 0.0151, "step": 298500 }, { "epoch": 0.77, "learning_rate": 0.00018393285309540903, "loss": 0.0151, "step": 298510 }, { "epoch": 0.77, "learning_rate": 0.00018392896487903757, "loss": 0.0128, "step": 298520 }, { "epoch": 0.77, "learning_rate": 0.00018392507666266608, "loss": 0.0158, "step": 298530 }, { "epoch": 0.77, "learning_rate": 0.00018392118844629465, "loss": 0.0107, "step": 298540 }, { "epoch": 0.77, "learning_rate": 0.0001839173002299232, "loss": 0.0142, "step": 298550 }, { "epoch": 0.77, "learning_rate": 0.0001839134120135517, "loss": 0.0126, "step": 298560 }, { "epoch": 0.77, "learning_rate": 0.00018390952379718025, "loss": 0.0121, "step": 298570 }, { "epoch": 0.77, "learning_rate": 0.0001839056355808088, "loss": 0.0145, "step": 298580 }, { "epoch": 0.77, "learning_rate": 0.00018390174736443733, "loss": 0.0146, "step": 298590 }, { "epoch": 0.77, "learning_rate": 0.00018389785914806585, "loss": 0.0159, "step": 298600 }, { "epoch": 0.77, "learning_rate": 0.0001838939709316944, "loss": 0.016, "step": 298610 }, { "epoch": 0.77, "learning_rate": 0.00018389008271532293, "loss": 0.0115, "step": 298620 }, { "epoch": 0.77, "learning_rate": 0.00018388619449895147, "loss": 0.0128, "step": 298630 }, { "epoch": 0.77, "learning_rate": 0.00018388230628257999, "loss": 0.0136, "step": 298640 }, { "epoch": 0.77, "learning_rate": 0.00018387841806620853, "loss": 0.0158, "step": 298650 }, { "epoch": 0.77, "learning_rate": 0.00018387452984983707, "loss": 0.0145, "step": 298660 }, { "epoch": 0.77, "learning_rate": 0.0001838706416334656, "loss": 0.0146, "step": 298670 }, { "epoch": 0.77, "learning_rate": 0.00018386675341709413, "loss": 0.0153, "step": 298680 }, { "epoch": 0.77, "learning_rate": 0.00018386286520072267, "loss": 0.0141, "step": 298690 }, { "epoch": 0.77, "learning_rate": 0.00018385897698435124, "loss": 0.0134, "step": 298700 }, { "epoch": 0.77, "learning_rate": 0.00018385508876797975, "loss": 0.0141, "step": 298710 }, { "epoch": 0.77, "learning_rate": 0.0001838512005516083, "loss": 0.0114, "step": 298720 }, { "epoch": 0.77, "learning_rate": 0.0001838473123352368, "loss": 0.0153, "step": 298730 }, { "epoch": 0.77, "learning_rate": 0.00018384342411886535, "loss": 0.014, "step": 298740 }, { "epoch": 0.77, "learning_rate": 0.0001838395359024939, "loss": 0.0096, "step": 298750 }, { "epoch": 0.77, "learning_rate": 0.00018383564768612243, "loss": 0.0162, "step": 298760 }, { "epoch": 0.77, "learning_rate": 0.00018383175946975095, "loss": 0.0136, "step": 298770 }, { "epoch": 0.77, "learning_rate": 0.0001838278712533795, "loss": 0.0146, "step": 298780 }, { "epoch": 0.77, "learning_rate": 0.00018382398303700803, "loss": 0.0143, "step": 298790 }, { "epoch": 0.77, "learning_rate": 0.00018382009482063657, "loss": 0.0129, "step": 298800 }, { "epoch": 0.77, "learning_rate": 0.00018381620660426509, "loss": 0.0153, "step": 298810 }, { "epoch": 0.77, "learning_rate": 0.00018381231838789363, "loss": 0.0119, "step": 298820 }, { "epoch": 0.77, "learning_rate": 0.00018380843017152217, "loss": 0.0164, "step": 298830 }, { "epoch": 0.77, "learning_rate": 0.0001838045419551507, "loss": 0.0155, "step": 298840 }, { "epoch": 0.77, "learning_rate": 0.00018380065373877922, "loss": 0.0151, "step": 298850 }, { "epoch": 0.77, "learning_rate": 0.00018379676552240777, "loss": 0.0146, "step": 298860 }, { "epoch": 0.77, "learning_rate": 0.00018379287730603633, "loss": 0.0147, "step": 298870 }, { "epoch": 0.77, "learning_rate": 0.00018378898908966485, "loss": 0.0158, "step": 298880 }, { "epoch": 0.77, "learning_rate": 0.0001837851008732934, "loss": 0.0157, "step": 298890 }, { "epoch": 0.77, "learning_rate": 0.0001837812126569219, "loss": 0.0178, "step": 298900 }, { "epoch": 0.77, "learning_rate": 0.00018377732444055047, "loss": 0.0147, "step": 298910 }, { "epoch": 0.77, "learning_rate": 0.000183773436224179, "loss": 0.0132, "step": 298920 }, { "epoch": 0.77, "learning_rate": 0.00018376954800780753, "loss": 0.0132, "step": 298930 }, { "epoch": 0.77, "learning_rate": 0.00018376565979143604, "loss": 0.0153, "step": 298940 }, { "epoch": 0.77, "learning_rate": 0.00018376177157506461, "loss": 0.0132, "step": 298950 }, { "epoch": 0.77, "learning_rate": 0.00018375788335869313, "loss": 0.0186, "step": 298960 }, { "epoch": 0.77, "learning_rate": 0.00018375399514232167, "loss": 0.011, "step": 298970 }, { "epoch": 0.77, "learning_rate": 0.00018375010692595018, "loss": 0.0177, "step": 298980 }, { "epoch": 0.78, "learning_rate": 0.00018374621870957873, "loss": 0.0142, "step": 298990 }, { "epoch": 0.78, "learning_rate": 0.00018374233049320727, "loss": 0.0109, "step": 299000 }, { "epoch": 0.78, "eval_cer": 0.881657897941274, "eval_loss": 0.009355046786367893, "eval_runtime": 107.8593, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 299000 }, { "epoch": 0.78, "learning_rate": 0.0001837384422768358, "loss": 0.0178, "step": 299010 }, { "epoch": 0.78, "learning_rate": 0.00018373455406046432, "loss": 0.017, "step": 299020 }, { "epoch": 0.78, "learning_rate": 0.00018373066584409287, "loss": 0.0144, "step": 299030 }, { "epoch": 0.78, "learning_rate": 0.00018372677762772143, "loss": 0.0134, "step": 299040 }, { "epoch": 0.78, "learning_rate": 0.00018372288941134995, "loss": 0.0155, "step": 299050 }, { "epoch": 0.78, "learning_rate": 0.00018371900119497846, "loss": 0.0134, "step": 299060 }, { "epoch": 0.78, "learning_rate": 0.000183715112978607, "loss": 0.0108, "step": 299070 }, { "epoch": 0.78, "learning_rate": 0.00018371122476223557, "loss": 0.0145, "step": 299080 }, { "epoch": 0.78, "learning_rate": 0.0001837073365458641, "loss": 0.0139, "step": 299090 }, { "epoch": 0.78, "learning_rate": 0.00018370344832949263, "loss": 0.0143, "step": 299100 }, { "epoch": 0.78, "learning_rate": 0.00018369956011312114, "loss": 0.0124, "step": 299110 }, { "epoch": 0.78, "learning_rate": 0.0001836956718967497, "loss": 0.0218, "step": 299120 }, { "epoch": 0.78, "learning_rate": 0.00018369178368037823, "loss": 0.0157, "step": 299130 }, { "epoch": 0.78, "learning_rate": 0.00018368789546400677, "loss": 0.0127, "step": 299140 }, { "epoch": 0.78, "learning_rate": 0.00018368400724763528, "loss": 0.0161, "step": 299150 }, { "epoch": 0.78, "learning_rate": 0.00018368011903126385, "loss": 0.0168, "step": 299160 }, { "epoch": 0.78, "learning_rate": 0.00018367623081489237, "loss": 0.0125, "step": 299170 }, { "epoch": 0.78, "learning_rate": 0.0001836723425985209, "loss": 0.0122, "step": 299180 }, { "epoch": 0.78, "learning_rate": 0.00018366845438214942, "loss": 0.0142, "step": 299190 }, { "epoch": 0.78, "learning_rate": 0.000183664566165778, "loss": 0.0144, "step": 299200 }, { "epoch": 0.78, "learning_rate": 0.00018366067794940653, "loss": 0.0136, "step": 299210 }, { "epoch": 0.78, "learning_rate": 0.00018365678973303505, "loss": 0.0148, "step": 299220 }, { "epoch": 0.78, "learning_rate": 0.00018365290151666356, "loss": 0.0142, "step": 299230 }, { "epoch": 0.78, "learning_rate": 0.0001836490133002921, "loss": 0.0165, "step": 299240 }, { "epoch": 0.78, "learning_rate": 0.00018364512508392067, "loss": 0.0141, "step": 299250 }, { "epoch": 0.78, "learning_rate": 0.0001836412368675492, "loss": 0.0153, "step": 299260 }, { "epoch": 0.78, "learning_rate": 0.00018363734865117773, "loss": 0.0174, "step": 299270 }, { "epoch": 0.78, "learning_rate": 0.00018363346043480624, "loss": 0.0142, "step": 299280 }, { "epoch": 0.78, "learning_rate": 0.0001836295722184348, "loss": 0.0192, "step": 299290 }, { "epoch": 0.78, "learning_rate": 0.00018362568400206333, "loss": 0.0117, "step": 299300 }, { "epoch": 0.78, "learning_rate": 0.00018362179578569187, "loss": 0.0115, "step": 299310 }, { "epoch": 0.78, "learning_rate": 0.00018361790756932038, "loss": 0.0132, "step": 299320 }, { "epoch": 0.78, "learning_rate": 0.00018361401935294895, "loss": 0.0188, "step": 299330 }, { "epoch": 0.78, "learning_rate": 0.00018361013113657747, "loss": 0.0129, "step": 299340 }, { "epoch": 0.78, "learning_rate": 0.000183606242920206, "loss": 0.0161, "step": 299350 }, { "epoch": 0.78, "learning_rate": 0.00018360235470383452, "loss": 0.0128, "step": 299360 }, { "epoch": 0.78, "learning_rate": 0.0001835984664874631, "loss": 0.0182, "step": 299370 }, { "epoch": 0.78, "learning_rate": 0.0001835945782710916, "loss": 0.0145, "step": 299380 }, { "epoch": 0.78, "learning_rate": 0.00018359069005472015, "loss": 0.0137, "step": 299390 }, { "epoch": 0.78, "learning_rate": 0.00018358680183834866, "loss": 0.0131, "step": 299400 }, { "epoch": 0.78, "learning_rate": 0.00018358291362197723, "loss": 0.0151, "step": 299410 }, { "epoch": 0.78, "learning_rate": 0.00018357902540560577, "loss": 0.0126, "step": 299420 }, { "epoch": 0.78, "learning_rate": 0.0001835751371892343, "loss": 0.0105, "step": 299430 }, { "epoch": 0.78, "learning_rate": 0.00018357124897286283, "loss": 0.0146, "step": 299440 }, { "epoch": 0.78, "learning_rate": 0.00018356736075649137, "loss": 0.0155, "step": 299450 }, { "epoch": 0.78, "learning_rate": 0.0001835634725401199, "loss": 0.0116, "step": 299460 }, { "epoch": 0.78, "learning_rate": 0.00018355958432374843, "loss": 0.0149, "step": 299470 }, { "epoch": 0.78, "learning_rate": 0.00018355569610737697, "loss": 0.0179, "step": 299480 }, { "epoch": 0.78, "learning_rate": 0.00018355180789100548, "loss": 0.0153, "step": 299490 }, { "epoch": 0.78, "learning_rate": 0.00018354791967463405, "loss": 0.0108, "step": 299500 }, { "epoch": 0.78, "learning_rate": 0.00018354403145826257, "loss": 0.0163, "step": 299510 }, { "epoch": 0.78, "learning_rate": 0.0001835401432418911, "loss": 0.0164, "step": 299520 }, { "epoch": 0.78, "learning_rate": 0.00018353625502551962, "loss": 0.0172, "step": 299530 }, { "epoch": 0.78, "learning_rate": 0.0001835323668091482, "loss": 0.0145, "step": 299540 }, { "epoch": 0.78, "learning_rate": 0.0001835284785927767, "loss": 0.0117, "step": 299550 }, { "epoch": 0.78, "learning_rate": 0.00018352459037640525, "loss": 0.0129, "step": 299560 }, { "epoch": 0.78, "learning_rate": 0.00018352070216003376, "loss": 0.0145, "step": 299570 }, { "epoch": 0.78, "learning_rate": 0.00018351681394366233, "loss": 0.0151, "step": 299580 }, { "epoch": 0.78, "learning_rate": 0.00018351292572729087, "loss": 0.0112, "step": 299590 }, { "epoch": 0.78, "learning_rate": 0.0001835090375109194, "loss": 0.0144, "step": 299600 }, { "epoch": 0.78, "learning_rate": 0.00018350514929454793, "loss": 0.012, "step": 299610 }, { "epoch": 0.78, "learning_rate": 0.00018350126107817647, "loss": 0.0135, "step": 299620 }, { "epoch": 0.78, "learning_rate": 0.000183497372861805, "loss": 0.0158, "step": 299630 }, { "epoch": 0.78, "learning_rate": 0.00018349348464543353, "loss": 0.018, "step": 299640 }, { "epoch": 0.78, "learning_rate": 0.00018348959642906207, "loss": 0.0158, "step": 299650 }, { "epoch": 0.78, "learning_rate": 0.0001834857082126906, "loss": 0.014, "step": 299660 }, { "epoch": 0.78, "learning_rate": 0.00018348181999631915, "loss": 0.0159, "step": 299670 }, { "epoch": 0.78, "learning_rate": 0.00018347793177994767, "loss": 0.0106, "step": 299680 }, { "epoch": 0.78, "learning_rate": 0.0001834740435635762, "loss": 0.0166, "step": 299690 }, { "epoch": 0.78, "learning_rate": 0.00018347015534720475, "loss": 0.0147, "step": 299700 }, { "epoch": 0.78, "learning_rate": 0.0001834662671308333, "loss": 0.0149, "step": 299710 }, { "epoch": 0.78, "learning_rate": 0.0001834623789144618, "loss": 0.0137, "step": 299720 }, { "epoch": 0.78, "learning_rate": 0.00018345849069809035, "loss": 0.0124, "step": 299730 }, { "epoch": 0.78, "learning_rate": 0.00018345460248171886, "loss": 0.0136, "step": 299740 }, { "epoch": 0.78, "learning_rate": 0.00018345071426534743, "loss": 0.0094, "step": 299750 }, { "epoch": 0.78, "learning_rate": 0.00018344682604897597, "loss": 0.0159, "step": 299760 }, { "epoch": 0.78, "learning_rate": 0.00018344293783260449, "loss": 0.013, "step": 299770 }, { "epoch": 0.78, "learning_rate": 0.000183439049616233, "loss": 0.0149, "step": 299780 }, { "epoch": 0.78, "learning_rate": 0.00018343516139986157, "loss": 0.0126, "step": 299790 }, { "epoch": 0.78, "learning_rate": 0.0001834312731834901, "loss": 0.0181, "step": 299800 }, { "epoch": 0.78, "learning_rate": 0.00018342738496711863, "loss": 0.0138, "step": 299810 }, { "epoch": 0.78, "learning_rate": 0.00018342349675074717, "loss": 0.0138, "step": 299820 }, { "epoch": 0.78, "learning_rate": 0.0001834196085343757, "loss": 0.0135, "step": 299830 }, { "epoch": 0.78, "learning_rate": 0.00018341572031800425, "loss": 0.0153, "step": 299840 }, { "epoch": 0.78, "learning_rate": 0.00018341183210163276, "loss": 0.0107, "step": 299850 }, { "epoch": 0.78, "learning_rate": 0.0001834079438852613, "loss": 0.0152, "step": 299860 }, { "epoch": 0.78, "learning_rate": 0.00018340405566888985, "loss": 0.0162, "step": 299870 }, { "epoch": 0.78, "learning_rate": 0.0001834001674525184, "loss": 0.0114, "step": 299880 }, { "epoch": 0.78, "learning_rate": 0.0001833962792361469, "loss": 0.0147, "step": 299890 }, { "epoch": 0.78, "learning_rate": 0.00018339239101977545, "loss": 0.0143, "step": 299900 }, { "epoch": 0.78, "learning_rate": 0.00018338850280340401, "loss": 0.0176, "step": 299910 }, { "epoch": 0.78, "learning_rate": 0.00018338461458703253, "loss": 0.0151, "step": 299920 }, { "epoch": 0.78, "learning_rate": 0.00018338072637066107, "loss": 0.0125, "step": 299930 }, { "epoch": 0.78, "learning_rate": 0.00018337683815428959, "loss": 0.0187, "step": 299940 }, { "epoch": 0.78, "learning_rate": 0.00018337294993791815, "loss": 0.0145, "step": 299950 }, { "epoch": 0.78, "learning_rate": 0.00018336906172154667, "loss": 0.0156, "step": 299960 }, { "epoch": 0.78, "learning_rate": 0.0001833651735051752, "loss": 0.0169, "step": 299970 }, { "epoch": 0.78, "learning_rate": 0.00018336128528880372, "loss": 0.0149, "step": 299980 }, { "epoch": 0.78, "learning_rate": 0.00018335739707243227, "loss": 0.0106, "step": 299990 }, { "epoch": 0.78, "learning_rate": 0.0001833535088560608, "loss": 0.0111, "step": 300000 }, { "epoch": 0.78, "eval_cer": 0.881688689953826, "eval_loss": 0.009534839540719986, "eval_runtime": 107.6279, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 300000 }, { "epoch": 0.78, "learning_rate": 0.00018334962063968935, "loss": 0.0164, "step": 300010 }, { "epoch": 0.78, "learning_rate": 0.00018334573242331786, "loss": 0.0125, "step": 300020 }, { "epoch": 0.78, "learning_rate": 0.0001833418442069464, "loss": 0.0183, "step": 300030 }, { "epoch": 0.78, "learning_rate": 0.00018333795599057495, "loss": 0.0127, "step": 300040 }, { "epoch": 0.78, "learning_rate": 0.0001833340677742035, "loss": 0.0168, "step": 300050 }, { "epoch": 0.78, "learning_rate": 0.000183330179557832, "loss": 0.0135, "step": 300060 }, { "epoch": 0.78, "learning_rate": 0.00018332629134146055, "loss": 0.02, "step": 300070 }, { "epoch": 0.78, "learning_rate": 0.00018332240312508911, "loss": 0.0152, "step": 300080 }, { "epoch": 0.78, "learning_rate": 0.00018331851490871763, "loss": 0.0216, "step": 300090 }, { "epoch": 0.78, "learning_rate": 0.00018331462669234614, "loss": 0.015, "step": 300100 }, { "epoch": 0.78, "learning_rate": 0.00018331073847597468, "loss": 0.0151, "step": 300110 }, { "epoch": 0.78, "learning_rate": 0.00018330685025960325, "loss": 0.0157, "step": 300120 }, { "epoch": 0.78, "learning_rate": 0.00018330296204323177, "loss": 0.0107, "step": 300130 }, { "epoch": 0.78, "learning_rate": 0.0001832990738268603, "loss": 0.012, "step": 300140 }, { "epoch": 0.78, "learning_rate": 0.00018329518561048882, "loss": 0.0145, "step": 300150 }, { "epoch": 0.78, "learning_rate": 0.0001832912973941174, "loss": 0.0135, "step": 300160 }, { "epoch": 0.78, "learning_rate": 0.0001832874091777459, "loss": 0.0143, "step": 300170 }, { "epoch": 0.78, "learning_rate": 0.00018328352096137445, "loss": 0.0153, "step": 300180 }, { "epoch": 0.78, "learning_rate": 0.00018327963274500296, "loss": 0.0134, "step": 300190 }, { "epoch": 0.78, "learning_rate": 0.00018327574452863153, "loss": 0.0143, "step": 300200 }, { "epoch": 0.78, "learning_rate": 0.00018327185631226005, "loss": 0.0149, "step": 300210 }, { "epoch": 0.78, "learning_rate": 0.0001832679680958886, "loss": 0.0162, "step": 300220 }, { "epoch": 0.78, "learning_rate": 0.0001832640798795171, "loss": 0.0125, "step": 300230 }, { "epoch": 0.78, "learning_rate": 0.00018326019166314564, "loss": 0.0116, "step": 300240 }, { "epoch": 0.78, "learning_rate": 0.00018325630344677419, "loss": 0.0161, "step": 300250 }, { "epoch": 0.78, "learning_rate": 0.00018325241523040273, "loss": 0.0176, "step": 300260 }, { "epoch": 0.78, "learning_rate": 0.00018324852701403124, "loss": 0.0125, "step": 300270 }, { "epoch": 0.78, "learning_rate": 0.00018324463879765978, "loss": 0.0146, "step": 300280 }, { "epoch": 0.78, "learning_rate": 0.00018324075058128835, "loss": 0.0132, "step": 300290 }, { "epoch": 0.78, "learning_rate": 0.00018323686236491687, "loss": 0.0105, "step": 300300 }, { "epoch": 0.78, "learning_rate": 0.0001832329741485454, "loss": 0.021, "step": 300310 }, { "epoch": 0.78, "learning_rate": 0.00018322908593217392, "loss": 0.0197, "step": 300320 }, { "epoch": 0.78, "learning_rate": 0.0001832251977158025, "loss": 0.0161, "step": 300330 }, { "epoch": 0.78, "learning_rate": 0.000183221309499431, "loss": 0.015, "step": 300340 }, { "epoch": 0.78, "learning_rate": 0.00018321742128305955, "loss": 0.015, "step": 300350 }, { "epoch": 0.78, "learning_rate": 0.00018321353306668806, "loss": 0.0138, "step": 300360 }, { "epoch": 0.78, "learning_rate": 0.00018320964485031663, "loss": 0.014, "step": 300370 }, { "epoch": 0.78, "learning_rate": 0.00018320575663394515, "loss": 0.0191, "step": 300380 }, { "epoch": 0.78, "learning_rate": 0.0001832018684175737, "loss": 0.0115, "step": 300390 }, { "epoch": 0.78, "learning_rate": 0.0001831979802012022, "loss": 0.0129, "step": 300400 }, { "epoch": 0.78, "learning_rate": 0.00018319409198483077, "loss": 0.0136, "step": 300410 }, { "epoch": 0.78, "learning_rate": 0.00018319020376845929, "loss": 0.0133, "step": 300420 }, { "epoch": 0.78, "learning_rate": 0.00018318631555208783, "loss": 0.0132, "step": 300430 }, { "epoch": 0.78, "learning_rate": 0.00018318242733571634, "loss": 0.018, "step": 300440 }, { "epoch": 0.78, "learning_rate": 0.0001831785391193449, "loss": 0.0134, "step": 300450 }, { "epoch": 0.78, "learning_rate": 0.00018317465090297345, "loss": 0.0159, "step": 300460 }, { "epoch": 0.78, "learning_rate": 0.00018317076268660197, "loss": 0.0168, "step": 300470 }, { "epoch": 0.78, "learning_rate": 0.0001831668744702305, "loss": 0.0136, "step": 300480 }, { "epoch": 0.78, "learning_rate": 0.00018316298625385902, "loss": 0.0172, "step": 300490 }, { "epoch": 0.78, "learning_rate": 0.0001831590980374876, "loss": 0.0123, "step": 300500 }, { "epoch": 0.78, "learning_rate": 0.0001831552098211161, "loss": 0.0162, "step": 300510 }, { "epoch": 0.78, "learning_rate": 0.00018315132160474465, "loss": 0.0148, "step": 300520 }, { "epoch": 0.78, "learning_rate": 0.00018314743338837316, "loss": 0.0157, "step": 300530 }, { "epoch": 0.78, "learning_rate": 0.00018314354517200173, "loss": 0.0153, "step": 300540 }, { "epoch": 0.78, "learning_rate": 0.00018313965695563025, "loss": 0.0184, "step": 300550 }, { "epoch": 0.78, "learning_rate": 0.0001831357687392588, "loss": 0.0113, "step": 300560 }, { "epoch": 0.78, "learning_rate": 0.0001831318805228873, "loss": 0.0172, "step": 300570 }, { "epoch": 0.78, "learning_rate": 0.00018312799230651587, "loss": 0.0134, "step": 300580 }, { "epoch": 0.78, "learning_rate": 0.00018312410409014439, "loss": 0.0145, "step": 300590 }, { "epoch": 0.78, "learning_rate": 0.00018312021587377293, "loss": 0.0165, "step": 300600 }, { "epoch": 0.78, "learning_rate": 0.00018311632765740144, "loss": 0.0163, "step": 300610 }, { "epoch": 0.78, "learning_rate": 0.00018311243944103, "loss": 0.0149, "step": 300620 }, { "epoch": 0.78, "learning_rate": 0.00018310855122465855, "loss": 0.0127, "step": 300630 }, { "epoch": 0.78, "learning_rate": 0.00018310466300828707, "loss": 0.0148, "step": 300640 }, { "epoch": 0.78, "learning_rate": 0.00018310077479191558, "loss": 0.0198, "step": 300650 }, { "epoch": 0.78, "learning_rate": 0.00018309688657554415, "loss": 0.0156, "step": 300660 }, { "epoch": 0.78, "learning_rate": 0.0001830929983591727, "loss": 0.0148, "step": 300670 }, { "epoch": 0.78, "learning_rate": 0.0001830891101428012, "loss": 0.0172, "step": 300680 }, { "epoch": 0.78, "learning_rate": 0.00018308522192642975, "loss": 0.0125, "step": 300690 }, { "epoch": 0.78, "learning_rate": 0.0001830813337100583, "loss": 0.0153, "step": 300700 }, { "epoch": 0.78, "learning_rate": 0.00018307744549368683, "loss": 0.0132, "step": 300710 }, { "epoch": 0.78, "learning_rate": 0.00018307355727731535, "loss": 0.0112, "step": 300720 }, { "epoch": 0.78, "learning_rate": 0.0001830696690609439, "loss": 0.0126, "step": 300730 }, { "epoch": 0.78, "learning_rate": 0.0001830657808445724, "loss": 0.0125, "step": 300740 }, { "epoch": 0.78, "learning_rate": 0.00018306189262820097, "loss": 0.0185, "step": 300750 }, { "epoch": 0.78, "learning_rate": 0.00018305800441182948, "loss": 0.0126, "step": 300760 }, { "epoch": 0.78, "learning_rate": 0.00018305411619545803, "loss": 0.0122, "step": 300770 }, { "epoch": 0.78, "learning_rate": 0.00018305022797908654, "loss": 0.011, "step": 300780 }, { "epoch": 0.78, "learning_rate": 0.0001830463397627151, "loss": 0.0148, "step": 300790 }, { "epoch": 0.78, "learning_rate": 0.00018304245154634365, "loss": 0.0141, "step": 300800 }, { "epoch": 0.78, "learning_rate": 0.00018303856332997217, "loss": 0.0113, "step": 300810 }, { "epoch": 0.78, "learning_rate": 0.00018303467511360068, "loss": 0.0175, "step": 300820 }, { "epoch": 0.78, "learning_rate": 0.00018303078689722925, "loss": 0.0139, "step": 300830 }, { "epoch": 0.78, "learning_rate": 0.0001830268986808578, "loss": 0.0146, "step": 300840 }, { "epoch": 0.78, "learning_rate": 0.0001830230104644863, "loss": 0.0119, "step": 300850 }, { "epoch": 0.78, "learning_rate": 0.00018301912224811485, "loss": 0.0151, "step": 300860 }, { "epoch": 0.78, "learning_rate": 0.0001830152340317434, "loss": 0.0149, "step": 300870 }, { "epoch": 0.78, "learning_rate": 0.00018301134581537193, "loss": 0.0164, "step": 300880 }, { "epoch": 0.78, "learning_rate": 0.00018300745759900044, "loss": 0.0133, "step": 300890 }, { "epoch": 0.78, "learning_rate": 0.00018300356938262899, "loss": 0.0145, "step": 300900 }, { "epoch": 0.78, "learning_rate": 0.00018299968116625753, "loss": 0.0155, "step": 300910 }, { "epoch": 0.78, "learning_rate": 0.00018299579294988607, "loss": 0.0121, "step": 300920 }, { "epoch": 0.78, "learning_rate": 0.00018299190473351458, "loss": 0.0109, "step": 300930 }, { "epoch": 0.78, "learning_rate": 0.00018298801651714313, "loss": 0.0154, "step": 300940 }, { "epoch": 0.78, "learning_rate": 0.0001829841283007717, "loss": 0.0164, "step": 300950 }, { "epoch": 0.78, "learning_rate": 0.0001829802400844002, "loss": 0.0128, "step": 300960 }, { "epoch": 0.78, "learning_rate": 0.00018297635186802872, "loss": 0.015, "step": 300970 }, { "epoch": 0.78, "learning_rate": 0.00018297246365165727, "loss": 0.0087, "step": 300980 }, { "epoch": 0.78, "learning_rate": 0.00018296857543528578, "loss": 0.0132, "step": 300990 }, { "epoch": 0.78, "learning_rate": 0.00018296468721891435, "loss": 0.0151, "step": 301000 }, { "epoch": 0.78, "eval_cer": 0.8817250805141147, "eval_loss": 0.009607135318219662, "eval_runtime": 107.6603, "eval_samples_per_second": 18.577, "eval_steps_per_second": 4.644, "step": 301000 }, { "epoch": 0.78, "learning_rate": 0.0001829607990025429, "loss": 0.0145, "step": 301010 }, { "epoch": 0.78, "learning_rate": 0.0001829569107861714, "loss": 0.0154, "step": 301020 }, { "epoch": 0.78, "learning_rate": 0.00018295302256979995, "loss": 0.0118, "step": 301030 }, { "epoch": 0.78, "learning_rate": 0.0001829491343534285, "loss": 0.017, "step": 301040 }, { "epoch": 0.78, "learning_rate": 0.00018294524613705703, "loss": 0.0143, "step": 301050 }, { "epoch": 0.78, "learning_rate": 0.00018294135792068554, "loss": 0.0156, "step": 301060 }, { "epoch": 0.78, "learning_rate": 0.00018293746970431409, "loss": 0.0151, "step": 301070 }, { "epoch": 0.78, "learning_rate": 0.00018293358148794263, "loss": 0.0205, "step": 301080 }, { "epoch": 0.78, "learning_rate": 0.00018292969327157117, "loss": 0.0089, "step": 301090 }, { "epoch": 0.78, "learning_rate": 0.00018292580505519968, "loss": 0.0172, "step": 301100 }, { "epoch": 0.78, "learning_rate": 0.00018292191683882823, "loss": 0.0151, "step": 301110 }, { "epoch": 0.78, "learning_rate": 0.0001829180286224568, "loss": 0.0137, "step": 301120 }, { "epoch": 0.78, "learning_rate": 0.0001829141404060853, "loss": 0.0162, "step": 301130 }, { "epoch": 0.78, "learning_rate": 0.00018291025218971382, "loss": 0.0151, "step": 301140 }, { "epoch": 0.78, "learning_rate": 0.00018290636397334236, "loss": 0.0165, "step": 301150 }, { "epoch": 0.78, "learning_rate": 0.00018290247575697093, "loss": 0.0146, "step": 301160 }, { "epoch": 0.78, "learning_rate": 0.00018289858754059945, "loss": 0.0128, "step": 301170 }, { "epoch": 0.78, "learning_rate": 0.000182894699324228, "loss": 0.0138, "step": 301180 }, { "epoch": 0.78, "learning_rate": 0.0001828908111078565, "loss": 0.0147, "step": 301190 }, { "epoch": 0.78, "learning_rate": 0.00018288692289148507, "loss": 0.0123, "step": 301200 }, { "epoch": 0.78, "learning_rate": 0.0001828830346751136, "loss": 0.0192, "step": 301210 }, { "epoch": 0.78, "learning_rate": 0.00018287914645874213, "loss": 0.0131, "step": 301220 }, { "epoch": 0.78, "learning_rate": 0.00018287525824237064, "loss": 0.018, "step": 301230 }, { "epoch": 0.78, "learning_rate": 0.00018287137002599919, "loss": 0.0113, "step": 301240 }, { "epoch": 0.78, "learning_rate": 0.00018286748180962773, "loss": 0.012, "step": 301250 }, { "epoch": 0.78, "learning_rate": 0.00018286359359325627, "loss": 0.0143, "step": 301260 }, { "epoch": 0.78, "learning_rate": 0.00018285970537688478, "loss": 0.0158, "step": 301270 }, { "epoch": 0.78, "learning_rate": 0.00018285581716051332, "loss": 0.0156, "step": 301280 }, { "epoch": 0.78, "learning_rate": 0.00018285192894414187, "loss": 0.018, "step": 301290 }, { "epoch": 0.78, "learning_rate": 0.0001828480407277704, "loss": 0.0129, "step": 301300 }, { "epoch": 0.78, "learning_rate": 0.00018284415251139892, "loss": 0.017, "step": 301310 }, { "epoch": 0.78, "learning_rate": 0.00018284026429502746, "loss": 0.0133, "step": 301320 }, { "epoch": 0.78, "learning_rate": 0.00018283637607865603, "loss": 0.0168, "step": 301330 }, { "epoch": 0.78, "learning_rate": 0.00018283248786228455, "loss": 0.0146, "step": 301340 }, { "epoch": 0.78, "learning_rate": 0.0001828285996459131, "loss": 0.0137, "step": 301350 }, { "epoch": 0.78, "learning_rate": 0.0001828247114295416, "loss": 0.012, "step": 301360 }, { "epoch": 0.78, "learning_rate": 0.00018282082321317017, "loss": 0.0137, "step": 301370 }, { "epoch": 0.78, "learning_rate": 0.0001828169349967987, "loss": 0.0157, "step": 301380 }, { "epoch": 0.78, "learning_rate": 0.00018281304678042723, "loss": 0.0151, "step": 301390 }, { "epoch": 0.78, "learning_rate": 0.00018280915856405574, "loss": 0.0148, "step": 301400 }, { "epoch": 0.78, "learning_rate": 0.0001828052703476843, "loss": 0.0141, "step": 301410 }, { "epoch": 0.78, "learning_rate": 0.00018280138213131283, "loss": 0.016, "step": 301420 }, { "epoch": 0.78, "learning_rate": 0.00018279749391494137, "loss": 0.014, "step": 301430 }, { "epoch": 0.78, "learning_rate": 0.00018279360569856988, "loss": 0.0132, "step": 301440 }, { "epoch": 0.78, "learning_rate": 0.00018278971748219842, "loss": 0.0139, "step": 301450 }, { "epoch": 0.78, "learning_rate": 0.00018278582926582697, "loss": 0.0148, "step": 301460 }, { "epoch": 0.78, "learning_rate": 0.0001827819410494555, "loss": 0.0139, "step": 301470 }, { "epoch": 0.78, "learning_rate": 0.00018277805283308402, "loss": 0.0124, "step": 301480 }, { "epoch": 0.78, "learning_rate": 0.00018277416461671256, "loss": 0.0138, "step": 301490 }, { "epoch": 0.78, "learning_rate": 0.00018277027640034113, "loss": 0.0163, "step": 301500 }, { "epoch": 0.78, "learning_rate": 0.00018276638818396965, "loss": 0.0128, "step": 301510 }, { "epoch": 0.78, "learning_rate": 0.0001827624999675982, "loss": 0.0206, "step": 301520 }, { "epoch": 0.78, "learning_rate": 0.0001827586117512267, "loss": 0.0175, "step": 301530 }, { "epoch": 0.78, "learning_rate": 0.00018275472353485527, "loss": 0.0169, "step": 301540 }, { "epoch": 0.78, "learning_rate": 0.00018275083531848379, "loss": 0.0148, "step": 301550 }, { "epoch": 0.78, "learning_rate": 0.00018274694710211233, "loss": 0.0137, "step": 301560 }, { "epoch": 0.78, "learning_rate": 0.00018274305888574084, "loss": 0.0161, "step": 301570 }, { "epoch": 0.78, "learning_rate": 0.0001827391706693694, "loss": 0.0124, "step": 301580 }, { "epoch": 0.78, "learning_rate": 0.00018273528245299793, "loss": 0.0129, "step": 301590 }, { "epoch": 0.78, "learning_rate": 0.00018273139423662647, "loss": 0.0129, "step": 301600 }, { "epoch": 0.78, "learning_rate": 0.00018272750602025498, "loss": 0.0129, "step": 301610 }, { "epoch": 0.78, "learning_rate": 0.00018272361780388355, "loss": 0.0155, "step": 301620 }, { "epoch": 0.78, "learning_rate": 0.00018271972958751207, "loss": 0.0161, "step": 301630 }, { "epoch": 0.78, "learning_rate": 0.0001827158413711406, "loss": 0.0163, "step": 301640 }, { "epoch": 0.78, "learning_rate": 0.00018271195315476912, "loss": 0.0138, "step": 301650 }, { "epoch": 0.78, "learning_rate": 0.0001827080649383977, "loss": 0.0199, "step": 301660 }, { "epoch": 0.78, "learning_rate": 0.00018270417672202623, "loss": 0.0168, "step": 301670 }, { "epoch": 0.78, "learning_rate": 0.00018270028850565475, "loss": 0.0169, "step": 301680 }, { "epoch": 0.78, "learning_rate": 0.00018269640028928326, "loss": 0.011, "step": 301690 }, { "epoch": 0.78, "learning_rate": 0.0001826925120729118, "loss": 0.0166, "step": 301700 }, { "epoch": 0.78, "learning_rate": 0.00018268862385654037, "loss": 0.0133, "step": 301710 }, { "epoch": 0.78, "learning_rate": 0.00018268473564016889, "loss": 0.02, "step": 301720 }, { "epoch": 0.78, "learning_rate": 0.00018268084742379743, "loss": 0.0133, "step": 301730 }, { "epoch": 0.78, "learning_rate": 0.00018267695920742594, "loss": 0.0145, "step": 301740 }, { "epoch": 0.78, "learning_rate": 0.0001826730709910545, "loss": 0.0138, "step": 301750 }, { "epoch": 0.78, "learning_rate": 0.00018266918277468303, "loss": 0.0198, "step": 301760 }, { "epoch": 0.78, "learning_rate": 0.00018266529455831157, "loss": 0.0138, "step": 301770 }, { "epoch": 0.78, "learning_rate": 0.00018266140634194008, "loss": 0.0128, "step": 301780 }, { "epoch": 0.78, "learning_rate": 0.00018265751812556865, "loss": 0.0135, "step": 301790 }, { "epoch": 0.78, "learning_rate": 0.00018265362990919716, "loss": 0.0134, "step": 301800 }, { "epoch": 0.78, "learning_rate": 0.0001826497416928257, "loss": 0.0106, "step": 301810 }, { "epoch": 0.78, "learning_rate": 0.00018264585347645422, "loss": 0.0134, "step": 301820 }, { "epoch": 0.78, "learning_rate": 0.0001826419652600828, "loss": 0.013, "step": 301830 }, { "epoch": 0.78, "learning_rate": 0.0001826380770437113, "loss": 0.0162, "step": 301840 }, { "epoch": 0.78, "learning_rate": 0.00018263418882733985, "loss": 0.0133, "step": 301850 }, { "epoch": 0.78, "learning_rate": 0.00018263030061096836, "loss": 0.0106, "step": 301860 }, { "epoch": 0.78, "learning_rate": 0.00018262641239459693, "loss": 0.0152, "step": 301870 }, { "epoch": 0.78, "learning_rate": 0.00018262252417822547, "loss": 0.0175, "step": 301880 }, { "epoch": 0.78, "learning_rate": 0.00018261863596185398, "loss": 0.0144, "step": 301890 }, { "epoch": 0.78, "learning_rate": 0.00018261474774548253, "loss": 0.0158, "step": 301900 }, { "epoch": 0.78, "learning_rate": 0.00018261085952911107, "loss": 0.0177, "step": 301910 }, { "epoch": 0.78, "learning_rate": 0.0001826069713127396, "loss": 0.0155, "step": 301920 }, { "epoch": 0.78, "learning_rate": 0.00018260308309636812, "loss": 0.0136, "step": 301930 }, { "epoch": 0.78, "learning_rate": 0.00018259919487999667, "loss": 0.014, "step": 301940 }, { "epoch": 0.78, "learning_rate": 0.00018259530666362518, "loss": 0.0187, "step": 301950 }, { "epoch": 0.78, "learning_rate": 0.00018259141844725375, "loss": 0.018, "step": 301960 }, { "epoch": 0.78, "learning_rate": 0.00018258753023088226, "loss": 0.0118, "step": 301970 }, { "epoch": 0.78, "learning_rate": 0.0001825836420145108, "loss": 0.0137, "step": 301980 }, { "epoch": 0.78, "learning_rate": 0.00018257975379813932, "loss": 0.0131, "step": 301990 }, { "epoch": 0.78, "learning_rate": 0.0001825758655817679, "loss": 0.0156, "step": 302000 }, { "epoch": 0.78, "eval_cer": 0.8817026863231677, "eval_loss": 0.00945495255291462, "eval_runtime": 107.8912, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 302000 }, { "epoch": 0.78, "learning_rate": 0.0001825719773653964, "loss": 0.0123, "step": 302010 }, { "epoch": 0.78, "learning_rate": 0.00018256808914902494, "loss": 0.0183, "step": 302020 }, { "epoch": 0.78, "learning_rate": 0.00018256420093265346, "loss": 0.0139, "step": 302030 }, { "epoch": 0.78, "learning_rate": 0.00018256031271628203, "loss": 0.0136, "step": 302040 }, { "epoch": 0.78, "learning_rate": 0.00018255642449991057, "loss": 0.0134, "step": 302050 }, { "epoch": 0.78, "learning_rate": 0.00018255253628353908, "loss": 0.0158, "step": 302060 }, { "epoch": 0.78, "learning_rate": 0.00018254864806716763, "loss": 0.0107, "step": 302070 }, { "epoch": 0.78, "learning_rate": 0.00018254475985079617, "loss": 0.0156, "step": 302080 }, { "epoch": 0.78, "learning_rate": 0.0001825408716344247, "loss": 0.0134, "step": 302090 }, { "epoch": 0.78, "learning_rate": 0.00018253698341805322, "loss": 0.0156, "step": 302100 }, { "epoch": 0.78, "learning_rate": 0.00018253309520168177, "loss": 0.0145, "step": 302110 }, { "epoch": 0.78, "learning_rate": 0.0001825292069853103, "loss": 0.0114, "step": 302120 }, { "epoch": 0.78, "learning_rate": 0.00018252531876893885, "loss": 0.0144, "step": 302130 }, { "epoch": 0.78, "learning_rate": 0.00018252143055256736, "loss": 0.0152, "step": 302140 }, { "epoch": 0.78, "learning_rate": 0.0001825175423361959, "loss": 0.0168, "step": 302150 }, { "epoch": 0.78, "learning_rate": 0.00018251365411982445, "loss": 0.0185, "step": 302160 }, { "epoch": 0.78, "learning_rate": 0.000182509765903453, "loss": 0.0135, "step": 302170 }, { "epoch": 0.78, "learning_rate": 0.0001825058776870815, "loss": 0.0146, "step": 302180 }, { "epoch": 0.78, "learning_rate": 0.00018250198947071004, "loss": 0.0127, "step": 302190 }, { "epoch": 0.78, "learning_rate": 0.00018249810125433856, "loss": 0.0104, "step": 302200 }, { "epoch": 0.78, "learning_rate": 0.00018249421303796713, "loss": 0.0114, "step": 302210 }, { "epoch": 0.78, "learning_rate": 0.00018249032482159567, "loss": 0.0132, "step": 302220 }, { "epoch": 0.78, "learning_rate": 0.00018248643660522418, "loss": 0.0131, "step": 302230 }, { "epoch": 0.78, "learning_rate": 0.0001824825483888527, "loss": 0.009, "step": 302240 }, { "epoch": 0.78, "learning_rate": 0.00018247866017248127, "loss": 0.0142, "step": 302250 }, { "epoch": 0.78, "learning_rate": 0.0001824747719561098, "loss": 0.0137, "step": 302260 }, { "epoch": 0.78, "learning_rate": 0.00018247088373973832, "loss": 0.0124, "step": 302270 }, { "epoch": 0.78, "learning_rate": 0.00018246699552336686, "loss": 0.0204, "step": 302280 }, { "epoch": 0.78, "learning_rate": 0.0001824631073069954, "loss": 0.014, "step": 302290 }, { "epoch": 0.78, "learning_rate": 0.00018245921909062395, "loss": 0.0138, "step": 302300 }, { "epoch": 0.78, "learning_rate": 0.00018245533087425246, "loss": 0.0157, "step": 302310 }, { "epoch": 0.78, "learning_rate": 0.000182451442657881, "loss": 0.0184, "step": 302320 }, { "epoch": 0.78, "learning_rate": 0.00018244755444150955, "loss": 0.0154, "step": 302330 }, { "epoch": 0.78, "learning_rate": 0.0001824436662251381, "loss": 0.017, "step": 302340 }, { "epoch": 0.78, "learning_rate": 0.0001824397780087666, "loss": 0.015, "step": 302350 }, { "epoch": 0.78, "learning_rate": 0.00018243588979239514, "loss": 0.0126, "step": 302360 }, { "epoch": 0.78, "learning_rate": 0.0001824320015760237, "loss": 0.0153, "step": 302370 }, { "epoch": 0.78, "learning_rate": 0.00018242811335965223, "loss": 0.0099, "step": 302380 }, { "epoch": 0.78, "learning_rate": 0.00018242422514328077, "loss": 0.0143, "step": 302390 }, { "epoch": 0.78, "learning_rate": 0.00018242033692690928, "loss": 0.0139, "step": 302400 }, { "epoch": 0.78, "learning_rate": 0.00018241644871053785, "loss": 0.0127, "step": 302410 }, { "epoch": 0.78, "learning_rate": 0.00018241256049416637, "loss": 0.0146, "step": 302420 }, { "epoch": 0.78, "learning_rate": 0.0001824086722777949, "loss": 0.0158, "step": 302430 }, { "epoch": 0.78, "learning_rate": 0.00018240478406142342, "loss": 0.0138, "step": 302440 }, { "epoch": 0.78, "learning_rate": 0.00018240089584505196, "loss": 0.0153, "step": 302450 }, { "epoch": 0.78, "learning_rate": 0.0001823970076286805, "loss": 0.0134, "step": 302460 }, { "epoch": 0.78, "learning_rate": 0.00018239311941230905, "loss": 0.0145, "step": 302470 }, { "epoch": 0.78, "learning_rate": 0.00018238923119593756, "loss": 0.0147, "step": 302480 }, { "epoch": 0.78, "learning_rate": 0.0001823853429795661, "loss": 0.0209, "step": 302490 }, { "epoch": 0.78, "learning_rate": 0.00018238145476319465, "loss": 0.0152, "step": 302500 }, { "epoch": 0.78, "learning_rate": 0.0001823775665468232, "loss": 0.0126, "step": 302510 }, { "epoch": 0.78, "learning_rate": 0.0001823736783304517, "loss": 0.016, "step": 302520 }, { "epoch": 0.78, "learning_rate": 0.00018236979011408024, "loss": 0.0144, "step": 302530 }, { "epoch": 0.78, "learning_rate": 0.0001823659018977088, "loss": 0.0155, "step": 302540 }, { "epoch": 0.78, "learning_rate": 0.00018236201368133733, "loss": 0.0167, "step": 302550 }, { "epoch": 0.78, "learning_rate": 0.00018235812546496584, "loss": 0.0149, "step": 302560 }, { "epoch": 0.78, "learning_rate": 0.00018235423724859438, "loss": 0.0144, "step": 302570 }, { "epoch": 0.78, "learning_rate": 0.00018235034903222295, "loss": 0.0133, "step": 302580 }, { "epoch": 0.78, "learning_rate": 0.00018234646081585147, "loss": 0.017, "step": 302590 }, { "epoch": 0.78, "learning_rate": 0.00018234257259948, "loss": 0.0126, "step": 302600 }, { "epoch": 0.78, "learning_rate": 0.00018233868438310852, "loss": 0.0149, "step": 302610 }, { "epoch": 0.78, "learning_rate": 0.0001823347961667371, "loss": 0.0108, "step": 302620 }, { "epoch": 0.78, "learning_rate": 0.0001823309079503656, "loss": 0.0155, "step": 302630 }, { "epoch": 0.78, "learning_rate": 0.00018232701973399415, "loss": 0.0117, "step": 302640 }, { "epoch": 0.78, "learning_rate": 0.00018232313151762266, "loss": 0.0164, "step": 302650 }, { "epoch": 0.78, "learning_rate": 0.00018231924330125123, "loss": 0.0118, "step": 302660 }, { "epoch": 0.78, "learning_rate": 0.00018231535508487974, "loss": 0.0164, "step": 302670 }, { "epoch": 0.78, "learning_rate": 0.0001823114668685083, "loss": 0.0135, "step": 302680 }, { "epoch": 0.78, "learning_rate": 0.0001823075786521368, "loss": 0.0168, "step": 302690 }, { "epoch": 0.78, "learning_rate": 0.00018230369043576534, "loss": 0.0157, "step": 302700 }, { "epoch": 0.78, "learning_rate": 0.0001822998022193939, "loss": 0.0107, "step": 302710 }, { "epoch": 0.78, "learning_rate": 0.00018229591400302243, "loss": 0.0118, "step": 302720 }, { "epoch": 0.78, "learning_rate": 0.00018229202578665094, "loss": 0.0149, "step": 302730 }, { "epoch": 0.78, "learning_rate": 0.00018228813757027948, "loss": 0.0146, "step": 302740 }, { "epoch": 0.78, "learning_rate": 0.00018228424935390805, "loss": 0.0132, "step": 302750 }, { "epoch": 0.78, "learning_rate": 0.00018228036113753657, "loss": 0.0146, "step": 302760 }, { "epoch": 0.78, "learning_rate": 0.0001822764729211651, "loss": 0.0128, "step": 302770 }, { "epoch": 0.78, "learning_rate": 0.00018227258470479362, "loss": 0.0116, "step": 302780 }, { "epoch": 0.78, "learning_rate": 0.0001822686964884222, "loss": 0.0141, "step": 302790 }, { "epoch": 0.78, "learning_rate": 0.0001822648082720507, "loss": 0.0198, "step": 302800 }, { "epoch": 0.78, "learning_rate": 0.00018226092005567925, "loss": 0.0135, "step": 302810 }, { "epoch": 0.78, "learning_rate": 0.00018225703183930776, "loss": 0.015, "step": 302820 }, { "epoch": 0.78, "learning_rate": 0.00018225314362293633, "loss": 0.0163, "step": 302830 }, { "epoch": 0.79, "learning_rate": 0.00018224925540656484, "loss": 0.0138, "step": 302840 }, { "epoch": 0.79, "learning_rate": 0.00018224536719019339, "loss": 0.0137, "step": 302850 }, { "epoch": 0.79, "learning_rate": 0.0001822414789738219, "loss": 0.0146, "step": 302860 }, { "epoch": 0.79, "learning_rate": 0.00018223759075745047, "loss": 0.0145, "step": 302870 }, { "epoch": 0.79, "learning_rate": 0.00018223370254107898, "loss": 0.0165, "step": 302880 }, { "epoch": 0.79, "learning_rate": 0.00018222981432470753, "loss": 0.0151, "step": 302890 }, { "epoch": 0.79, "learning_rate": 0.00018222592610833604, "loss": 0.0132, "step": 302900 }, { "epoch": 0.79, "learning_rate": 0.0001822220378919646, "loss": 0.0166, "step": 302910 }, { "epoch": 0.79, "learning_rate": 0.00018221814967559315, "loss": 0.0157, "step": 302920 }, { "epoch": 0.79, "learning_rate": 0.00018221426145922166, "loss": 0.0162, "step": 302930 }, { "epoch": 0.79, "learning_rate": 0.0001822103732428502, "loss": 0.0134, "step": 302940 }, { "epoch": 0.79, "learning_rate": 0.00018220648502647872, "loss": 0.0169, "step": 302950 }, { "epoch": 0.79, "learning_rate": 0.0001822025968101073, "loss": 0.0146, "step": 302960 }, { "epoch": 0.79, "learning_rate": 0.0001821987085937358, "loss": 0.011, "step": 302970 }, { "epoch": 0.79, "learning_rate": 0.00018219482037736435, "loss": 0.0181, "step": 302980 }, { "epoch": 0.79, "learning_rate": 0.00018219093216099286, "loss": 0.0197, "step": 302990 }, { "epoch": 0.79, "learning_rate": 0.00018218704394462143, "loss": 0.0104, "step": 303000 }, { "epoch": 0.79, "eval_cer": 0.8817306790618513, "eval_loss": 0.009238921105861664, "eval_runtime": 107.8053, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 303000 }, { "epoch": 0.79, "learning_rate": 0.00018218315572824994, "loss": 0.0163, "step": 303010 }, { "epoch": 0.79, "learning_rate": 0.00018217926751187849, "loss": 0.0127, "step": 303020 }, { "epoch": 0.79, "learning_rate": 0.000182175379295507, "loss": 0.0149, "step": 303030 }, { "epoch": 0.79, "learning_rate": 0.00018217149107913557, "loss": 0.0146, "step": 303040 }, { "epoch": 0.79, "learning_rate": 0.00018216760286276408, "loss": 0.0164, "step": 303050 }, { "epoch": 0.79, "learning_rate": 0.00018216371464639262, "loss": 0.0179, "step": 303060 }, { "epoch": 0.79, "learning_rate": 0.00018215982643002114, "loss": 0.0168, "step": 303070 }, { "epoch": 0.79, "learning_rate": 0.0001821559382136497, "loss": 0.0148, "step": 303080 }, { "epoch": 0.79, "learning_rate": 0.00018215204999727825, "loss": 0.0124, "step": 303090 }, { "epoch": 0.79, "learning_rate": 0.00018214816178090676, "loss": 0.0131, "step": 303100 }, { "epoch": 0.79, "learning_rate": 0.0001821442735645353, "loss": 0.009, "step": 303110 }, { "epoch": 0.79, "learning_rate": 0.00018214038534816385, "loss": 0.0166, "step": 303120 }, { "epoch": 0.79, "learning_rate": 0.0001821364971317924, "loss": 0.0147, "step": 303130 }, { "epoch": 0.79, "learning_rate": 0.0001821326089154209, "loss": 0.0144, "step": 303140 }, { "epoch": 0.79, "learning_rate": 0.00018212872069904945, "loss": 0.012, "step": 303150 }, { "epoch": 0.79, "learning_rate": 0.000182124832482678, "loss": 0.013, "step": 303160 }, { "epoch": 0.79, "learning_rate": 0.00018212094426630653, "loss": 0.0139, "step": 303170 }, { "epoch": 0.79, "learning_rate": 0.00018211705604993504, "loss": 0.0144, "step": 303180 }, { "epoch": 0.79, "learning_rate": 0.00018211316783356358, "loss": 0.0157, "step": 303190 }, { "epoch": 0.79, "learning_rate": 0.0001821092796171921, "loss": 0.013, "step": 303200 }, { "epoch": 0.79, "learning_rate": 0.00018210539140082067, "loss": 0.0168, "step": 303210 }, { "epoch": 0.79, "learning_rate": 0.00018210150318444918, "loss": 0.0162, "step": 303220 }, { "epoch": 0.79, "learning_rate": 0.00018209761496807772, "loss": 0.0129, "step": 303230 }, { "epoch": 0.79, "learning_rate": 0.00018209372675170624, "loss": 0.0147, "step": 303240 }, { "epoch": 0.79, "learning_rate": 0.0001820898385353348, "loss": 0.013, "step": 303250 }, { "epoch": 0.79, "learning_rate": 0.00018208595031896335, "loss": 0.0123, "step": 303260 }, { "epoch": 0.79, "learning_rate": 0.00018208206210259186, "loss": 0.0137, "step": 303270 }, { "epoch": 0.79, "learning_rate": 0.00018207817388622038, "loss": 0.0142, "step": 303280 }, { "epoch": 0.79, "learning_rate": 0.00018207428566984895, "loss": 0.0126, "step": 303290 }, { "epoch": 0.79, "learning_rate": 0.0001820703974534775, "loss": 0.0144, "step": 303300 }, { "epoch": 0.79, "learning_rate": 0.000182066509237106, "loss": 0.0156, "step": 303310 }, { "epoch": 0.79, "learning_rate": 0.00018206262102073454, "loss": 0.0166, "step": 303320 }, { "epoch": 0.79, "learning_rate": 0.00018205873280436309, "loss": 0.0091, "step": 303330 }, { "epoch": 0.79, "learning_rate": 0.00018205484458799163, "loss": 0.0148, "step": 303340 }, { "epoch": 0.79, "learning_rate": 0.00018205095637162014, "loss": 0.0154, "step": 303350 }, { "epoch": 0.79, "learning_rate": 0.00018204706815524868, "loss": 0.0137, "step": 303360 }, { "epoch": 0.79, "learning_rate": 0.00018204317993887723, "loss": 0.0173, "step": 303370 }, { "epoch": 0.79, "learning_rate": 0.00018203929172250577, "loss": 0.0156, "step": 303380 }, { "epoch": 0.79, "learning_rate": 0.00018203540350613428, "loss": 0.0158, "step": 303390 }, { "epoch": 0.79, "learning_rate": 0.00018203151528976282, "loss": 0.0127, "step": 303400 }, { "epoch": 0.79, "learning_rate": 0.0001820276270733914, "loss": 0.0161, "step": 303410 }, { "epoch": 0.79, "learning_rate": 0.0001820237388570199, "loss": 0.0155, "step": 303420 }, { "epoch": 0.79, "learning_rate": 0.00018201985064064842, "loss": 0.0124, "step": 303430 }, { "epoch": 0.79, "learning_rate": 0.00018201596242427696, "loss": 0.0161, "step": 303440 }, { "epoch": 0.79, "learning_rate": 0.00018201207420790548, "loss": 0.013, "step": 303450 }, { "epoch": 0.79, "learning_rate": 0.00018200818599153405, "loss": 0.0147, "step": 303460 }, { "epoch": 0.79, "learning_rate": 0.0001820042977751626, "loss": 0.0179, "step": 303470 }, { "epoch": 0.79, "learning_rate": 0.0001820004095587911, "loss": 0.0127, "step": 303480 }, { "epoch": 0.79, "learning_rate": 0.00018199652134241964, "loss": 0.0156, "step": 303490 }, { "epoch": 0.79, "learning_rate": 0.00018199263312604819, "loss": 0.0137, "step": 303500 }, { "epoch": 0.79, "learning_rate": 0.00018198874490967673, "loss": 0.0166, "step": 303510 }, { "epoch": 0.79, "learning_rate": 0.00018198485669330524, "loss": 0.0127, "step": 303520 }, { "epoch": 0.79, "learning_rate": 0.00018198096847693378, "loss": 0.0123, "step": 303530 }, { "epoch": 0.79, "learning_rate": 0.00018197708026056233, "loss": 0.0183, "step": 303540 }, { "epoch": 0.79, "learning_rate": 0.00018197319204419087, "loss": 0.0148, "step": 303550 }, { "epoch": 0.79, "learning_rate": 0.00018196930382781938, "loss": 0.0137, "step": 303560 }, { "epoch": 0.79, "learning_rate": 0.00018196541561144792, "loss": 0.011, "step": 303570 }, { "epoch": 0.79, "learning_rate": 0.0001819615273950765, "loss": 0.0115, "step": 303580 }, { "epoch": 0.79, "learning_rate": 0.000181957639178705, "loss": 0.013, "step": 303590 }, { "epoch": 0.79, "learning_rate": 0.00018195375096233352, "loss": 0.015, "step": 303600 }, { "epoch": 0.79, "learning_rate": 0.00018194986274596206, "loss": 0.0121, "step": 303610 }, { "epoch": 0.79, "learning_rate": 0.00018194597452959063, "loss": 0.0155, "step": 303620 }, { "epoch": 0.79, "learning_rate": 0.00018194208631321915, "loss": 0.0119, "step": 303630 }, { "epoch": 0.79, "learning_rate": 0.0001819381980968477, "loss": 0.0142, "step": 303640 }, { "epoch": 0.79, "learning_rate": 0.0001819343098804762, "loss": 0.0122, "step": 303650 }, { "epoch": 0.79, "learning_rate": 0.00018193042166410477, "loss": 0.0167, "step": 303660 }, { "epoch": 0.79, "learning_rate": 0.00018192653344773329, "loss": 0.0146, "step": 303670 }, { "epoch": 0.79, "learning_rate": 0.00018192264523136183, "loss": 0.0133, "step": 303680 }, { "epoch": 0.79, "learning_rate": 0.00018191875701499034, "loss": 0.0117, "step": 303690 }, { "epoch": 0.79, "learning_rate": 0.00018191486879861888, "loss": 0.0121, "step": 303700 }, { "epoch": 0.79, "learning_rate": 0.00018191098058224742, "loss": 0.0132, "step": 303710 }, { "epoch": 0.79, "learning_rate": 0.00018190709236587597, "loss": 0.015, "step": 303720 }, { "epoch": 0.79, "learning_rate": 0.00018190320414950448, "loss": 0.0126, "step": 303730 }, { "epoch": 0.79, "learning_rate": 0.00018189931593313302, "loss": 0.0136, "step": 303740 }, { "epoch": 0.79, "learning_rate": 0.00018189542771676156, "loss": 0.0212, "step": 303750 }, { "epoch": 0.79, "learning_rate": 0.0001818915395003901, "loss": 0.0184, "step": 303760 }, { "epoch": 0.79, "learning_rate": 0.00018188765128401862, "loss": 0.014, "step": 303770 }, { "epoch": 0.79, "learning_rate": 0.00018188376306764716, "loss": 0.0168, "step": 303780 }, { "epoch": 0.79, "learning_rate": 0.00018187987485127573, "loss": 0.0132, "step": 303790 }, { "epoch": 0.79, "learning_rate": 0.00018187598663490425, "loss": 0.0159, "step": 303800 }, { "epoch": 0.79, "learning_rate": 0.0001818720984185328, "loss": 0.0135, "step": 303810 }, { "epoch": 0.79, "learning_rate": 0.0001818682102021613, "loss": 0.0163, "step": 303820 }, { "epoch": 0.79, "learning_rate": 0.00018186432198578987, "loss": 0.0184, "step": 303830 }, { "epoch": 0.79, "learning_rate": 0.00018186043376941838, "loss": 0.0174, "step": 303840 }, { "epoch": 0.79, "learning_rate": 0.00018185654555304693, "loss": 0.0163, "step": 303850 }, { "epoch": 0.79, "learning_rate": 0.00018185265733667544, "loss": 0.0153, "step": 303860 }, { "epoch": 0.79, "learning_rate": 0.000181848769120304, "loss": 0.0164, "step": 303870 }, { "epoch": 0.79, "learning_rate": 0.00018184488090393252, "loss": 0.0134, "step": 303880 }, { "epoch": 0.79, "learning_rate": 0.00018184099268756107, "loss": 0.013, "step": 303890 }, { "epoch": 0.79, "learning_rate": 0.00018183710447118958, "loss": 0.0128, "step": 303900 }, { "epoch": 0.79, "learning_rate": 0.00018183321625481815, "loss": 0.0167, "step": 303910 }, { "epoch": 0.79, "learning_rate": 0.00018182932803844666, "loss": 0.0149, "step": 303920 }, { "epoch": 0.79, "learning_rate": 0.0001818254398220752, "loss": 0.014, "step": 303930 }, { "epoch": 0.79, "learning_rate": 0.00018182155160570372, "loss": 0.0154, "step": 303940 }, { "epoch": 0.79, "learning_rate": 0.00018181766338933226, "loss": 0.012, "step": 303950 }, { "epoch": 0.79, "learning_rate": 0.00018181377517296083, "loss": 0.0172, "step": 303960 }, { "epoch": 0.79, "learning_rate": 0.00018180988695658934, "loss": 0.0165, "step": 303970 }, { "epoch": 0.79, "learning_rate": 0.00018180599874021789, "loss": 0.0175, "step": 303980 }, { "epoch": 0.79, "learning_rate": 0.0001818021105238464, "loss": 0.0159, "step": 303990 }, { "epoch": 0.79, "learning_rate": 0.00018179822230747497, "loss": 0.0132, "step": 304000 }, { "epoch": 0.79, "eval_cer": 0.8817474747050615, "eval_loss": 0.009092407301068306, "eval_runtime": 107.6272, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 304000 }, { "epoch": 0.79, "learning_rate": 0.00018179433409110348, "loss": 0.0175, "step": 304010 }, { "epoch": 0.79, "learning_rate": 0.00018179044587473203, "loss": 0.0127, "step": 304020 }, { "epoch": 0.79, "learning_rate": 0.00018178655765836054, "loss": 0.0161, "step": 304030 }, { "epoch": 0.79, "learning_rate": 0.0001817826694419891, "loss": 0.0113, "step": 304040 }, { "epoch": 0.79, "learning_rate": 0.00018177878122561762, "loss": 0.0164, "step": 304050 }, { "epoch": 0.79, "learning_rate": 0.00018177489300924617, "loss": 0.0152, "step": 304060 }, { "epoch": 0.79, "learning_rate": 0.00018177100479287468, "loss": 0.0178, "step": 304070 }, { "epoch": 0.79, "learning_rate": 0.00018176711657650325, "loss": 0.0094, "step": 304080 }, { "epoch": 0.79, "learning_rate": 0.00018176322836013176, "loss": 0.0136, "step": 304090 }, { "epoch": 0.79, "learning_rate": 0.0001817593401437603, "loss": 0.015, "step": 304100 }, { "epoch": 0.79, "learning_rate": 0.00018175545192738882, "loss": 0.0146, "step": 304110 }, { "epoch": 0.79, "learning_rate": 0.0001817515637110174, "loss": 0.0126, "step": 304120 }, { "epoch": 0.79, "learning_rate": 0.00018174767549464593, "loss": 0.0118, "step": 304130 }, { "epoch": 0.79, "learning_rate": 0.00018174378727827444, "loss": 0.0147, "step": 304140 }, { "epoch": 0.79, "learning_rate": 0.00018173989906190296, "loss": 0.0132, "step": 304150 }, { "epoch": 0.79, "learning_rate": 0.00018173601084553153, "loss": 0.0132, "step": 304160 }, { "epoch": 0.79, "learning_rate": 0.00018173212262916007, "loss": 0.0113, "step": 304170 }, { "epoch": 0.79, "learning_rate": 0.00018172823441278858, "loss": 0.0127, "step": 304180 }, { "epoch": 0.79, "learning_rate": 0.00018172434619641713, "loss": 0.0113, "step": 304190 }, { "epoch": 0.79, "learning_rate": 0.00018172045798004564, "loss": 0.0114, "step": 304200 }, { "epoch": 0.79, "learning_rate": 0.0001817165697636742, "loss": 0.0138, "step": 304210 }, { "epoch": 0.79, "learning_rate": 0.00018171268154730272, "loss": 0.0109, "step": 304220 }, { "epoch": 0.79, "learning_rate": 0.00018170879333093126, "loss": 0.0122, "step": 304230 }, { "epoch": 0.79, "learning_rate": 0.00018170490511455978, "loss": 0.0156, "step": 304240 }, { "epoch": 0.79, "learning_rate": 0.00018170101689818835, "loss": 0.0136, "step": 304250 }, { "epoch": 0.79, "learning_rate": 0.00018169712868181686, "loss": 0.0134, "step": 304260 }, { "epoch": 0.79, "learning_rate": 0.0001816932404654454, "loss": 0.0152, "step": 304270 }, { "epoch": 0.79, "learning_rate": 0.00018168935224907392, "loss": 0.0119, "step": 304280 }, { "epoch": 0.79, "learning_rate": 0.0001816854640327025, "loss": 0.0139, "step": 304290 }, { "epoch": 0.79, "learning_rate": 0.000181681575816331, "loss": 0.0116, "step": 304300 }, { "epoch": 0.79, "learning_rate": 0.00018167768759995954, "loss": 0.0112, "step": 304310 }, { "epoch": 0.79, "learning_rate": 0.00018167379938358806, "loss": 0.0134, "step": 304320 }, { "epoch": 0.79, "learning_rate": 0.00018166991116721663, "loss": 0.0179, "step": 304330 }, { "epoch": 0.79, "learning_rate": 0.00018166602295084517, "loss": 0.0168, "step": 304340 }, { "epoch": 0.79, "learning_rate": 0.00018166213473447368, "loss": 0.0135, "step": 304350 }, { "epoch": 0.79, "learning_rate": 0.00018165824651810222, "loss": 0.0128, "step": 304360 }, { "epoch": 0.79, "learning_rate": 0.00018165435830173077, "loss": 0.0168, "step": 304370 }, { "epoch": 0.79, "learning_rate": 0.0001816504700853593, "loss": 0.0106, "step": 304380 }, { "epoch": 0.79, "learning_rate": 0.00018164658186898782, "loss": 0.0132, "step": 304390 }, { "epoch": 0.79, "learning_rate": 0.00018164269365261636, "loss": 0.0141, "step": 304400 }, { "epoch": 0.79, "learning_rate": 0.0001816388054362449, "loss": 0.0161, "step": 304410 }, { "epoch": 0.79, "learning_rate": 0.00018163491721987345, "loss": 0.0125, "step": 304420 }, { "epoch": 0.79, "learning_rate": 0.00018163102900350196, "loss": 0.0134, "step": 304430 }, { "epoch": 0.79, "learning_rate": 0.0001816271407871305, "loss": 0.0141, "step": 304440 }, { "epoch": 0.79, "learning_rate": 0.00018162325257075902, "loss": 0.0151, "step": 304450 }, { "epoch": 0.79, "learning_rate": 0.0001816193643543876, "loss": 0.0127, "step": 304460 }, { "epoch": 0.79, "learning_rate": 0.0001816154761380161, "loss": 0.0148, "step": 304470 }, { "epoch": 0.79, "learning_rate": 0.00018161158792164464, "loss": 0.0139, "step": 304480 }, { "epoch": 0.79, "learning_rate": 0.00018160769970527316, "loss": 0.0147, "step": 304490 }, { "epoch": 0.79, "learning_rate": 0.00018160381148890173, "loss": 0.0144, "step": 304500 }, { "epoch": 0.79, "learning_rate": 0.00018159992327253027, "loss": 0.0183, "step": 304510 }, { "epoch": 0.79, "learning_rate": 0.00018159603505615878, "loss": 0.0144, "step": 304520 }, { "epoch": 0.79, "learning_rate": 0.00018159214683978732, "loss": 0.016, "step": 304530 }, { "epoch": 0.79, "learning_rate": 0.00018158825862341587, "loss": 0.0166, "step": 304540 }, { "epoch": 0.79, "learning_rate": 0.0001815843704070444, "loss": 0.0126, "step": 304550 }, { "epoch": 0.79, "learning_rate": 0.00018158048219067292, "loss": 0.0153, "step": 304560 }, { "epoch": 0.79, "learning_rate": 0.00018157659397430146, "loss": 0.0159, "step": 304570 }, { "epoch": 0.79, "learning_rate": 0.00018157270575793, "loss": 0.0158, "step": 304580 }, { "epoch": 0.79, "learning_rate": 0.00018156881754155855, "loss": 0.0122, "step": 304590 }, { "epoch": 0.79, "learning_rate": 0.00018156492932518706, "loss": 0.0185, "step": 304600 }, { "epoch": 0.79, "learning_rate": 0.0001815610411088156, "loss": 0.0152, "step": 304610 }, { "epoch": 0.79, "learning_rate": 0.00018155715289244414, "loss": 0.0125, "step": 304620 }, { "epoch": 0.79, "learning_rate": 0.00018155326467607269, "loss": 0.0146, "step": 304630 }, { "epoch": 0.79, "learning_rate": 0.0001815493764597012, "loss": 0.0139, "step": 304640 }, { "epoch": 0.79, "learning_rate": 0.00018154548824332974, "loss": 0.0148, "step": 304650 }, { "epoch": 0.79, "learning_rate": 0.0001815416000269583, "loss": 0.0215, "step": 304660 }, { "epoch": 0.79, "learning_rate": 0.00018153771181058683, "loss": 0.017, "step": 304670 }, { "epoch": 0.79, "learning_rate": 0.00018153382359421537, "loss": 0.0136, "step": 304680 }, { "epoch": 0.79, "learning_rate": 0.00018152993537784388, "loss": 0.0121, "step": 304690 }, { "epoch": 0.79, "learning_rate": 0.00018152604716147242, "loss": 0.0401, "step": 304700 }, { "epoch": 0.79, "learning_rate": 0.00018152215894510097, "loss": 0.0176, "step": 304710 }, { "epoch": 0.79, "learning_rate": 0.0001815182707287295, "loss": 0.0147, "step": 304720 }, { "epoch": 0.79, "learning_rate": 0.00018151438251235802, "loss": 0.0182, "step": 304730 }, { "epoch": 0.79, "learning_rate": 0.00018151049429598656, "loss": 0.0182, "step": 304740 }, { "epoch": 0.79, "learning_rate": 0.0001815066060796151, "loss": 0.0119, "step": 304750 }, { "epoch": 0.79, "learning_rate": 0.00018150271786324365, "loss": 0.015, "step": 304760 }, { "epoch": 0.79, "learning_rate": 0.00018149882964687216, "loss": 0.0157, "step": 304770 }, { "epoch": 0.79, "learning_rate": 0.0001814949414305007, "loss": 0.0137, "step": 304780 }, { "epoch": 0.79, "learning_rate": 0.00018149105321412924, "loss": 0.0156, "step": 304790 }, { "epoch": 0.79, "learning_rate": 0.00018148716499775779, "loss": 0.0143, "step": 304800 }, { "epoch": 0.79, "learning_rate": 0.0001814832767813863, "loss": 0.0152, "step": 304810 }, { "epoch": 0.79, "learning_rate": 0.00018147938856501484, "loss": 0.0166, "step": 304820 }, { "epoch": 0.79, "learning_rate": 0.0001814755003486434, "loss": 0.0155, "step": 304830 }, { "epoch": 0.79, "learning_rate": 0.00018147161213227192, "loss": 0.0166, "step": 304840 }, { "epoch": 0.79, "learning_rate": 0.00018146772391590047, "loss": 0.017, "step": 304850 }, { "epoch": 0.79, "learning_rate": 0.00018146383569952898, "loss": 0.0154, "step": 304860 }, { "epoch": 0.79, "learning_rate": 0.00018145994748315755, "loss": 0.012, "step": 304870 }, { "epoch": 0.79, "learning_rate": 0.00018145605926678606, "loss": 0.0131, "step": 304880 }, { "epoch": 0.79, "learning_rate": 0.0001814521710504146, "loss": 0.0215, "step": 304890 }, { "epoch": 0.79, "learning_rate": 0.00018144828283404312, "loss": 0.0155, "step": 304900 }, { "epoch": 0.79, "learning_rate": 0.0001814443946176717, "loss": 0.0147, "step": 304910 }, { "epoch": 0.79, "learning_rate": 0.0001814405064013002, "loss": 0.0151, "step": 304920 }, { "epoch": 0.79, "learning_rate": 0.00018143661818492875, "loss": 0.0134, "step": 304930 }, { "epoch": 0.79, "learning_rate": 0.00018143272996855726, "loss": 0.0161, "step": 304940 }, { "epoch": 0.79, "learning_rate": 0.0001814288417521858, "loss": 0.0133, "step": 304950 }, { "epoch": 0.79, "learning_rate": 0.00018142495353581434, "loss": 0.0202, "step": 304960 }, { "epoch": 0.79, "learning_rate": 0.00018142106531944288, "loss": 0.0178, "step": 304970 }, { "epoch": 0.79, "learning_rate": 0.0001814171771030714, "loss": 0.0125, "step": 304980 }, { "epoch": 0.79, "learning_rate": 0.00018141328888669994, "loss": 0.0128, "step": 304990 }, { "epoch": 0.79, "learning_rate": 0.0001814094006703285, "loss": 0.0116, "step": 305000 }, { "epoch": 0.79, "eval_cer": 0.8817292794249172, "eval_loss": 0.009619629941880703, "eval_runtime": 107.6086, "eval_samples_per_second": 18.586, "eval_steps_per_second": 4.646, "step": 305000 }, { "epoch": 0.79, "learning_rate": 0.00018140551245395702, "loss": 0.014, "step": 305010 }, { "epoch": 0.79, "learning_rate": 0.00018140162423758554, "loss": 0.0148, "step": 305020 }, { "epoch": 0.79, "learning_rate": 0.00018139773602121408, "loss": 0.0119, "step": 305030 }, { "epoch": 0.79, "learning_rate": 0.00018139384780484265, "loss": 0.0167, "step": 305040 }, { "epoch": 0.79, "learning_rate": 0.00018138995958847116, "loss": 0.0112, "step": 305050 }, { "epoch": 0.79, "learning_rate": 0.0001813860713720997, "loss": 0.0158, "step": 305060 }, { "epoch": 0.79, "learning_rate": 0.00018138218315572822, "loss": 0.0146, "step": 305070 }, { "epoch": 0.79, "learning_rate": 0.0001813782949393568, "loss": 0.0179, "step": 305080 }, { "epoch": 0.79, "learning_rate": 0.0001813744067229853, "loss": 0.0129, "step": 305090 }, { "epoch": 0.79, "learning_rate": 0.00018137051850661384, "loss": 0.0169, "step": 305100 }, { "epoch": 0.79, "learning_rate": 0.00018136663029024236, "loss": 0.0136, "step": 305110 }, { "epoch": 0.79, "learning_rate": 0.00018136274207387093, "loss": 0.0133, "step": 305120 }, { "epoch": 0.79, "learning_rate": 0.00018135885385749944, "loss": 0.0155, "step": 305130 }, { "epoch": 0.79, "learning_rate": 0.00018135496564112798, "loss": 0.0115, "step": 305140 }, { "epoch": 0.79, "learning_rate": 0.0001813510774247565, "loss": 0.0192, "step": 305150 }, { "epoch": 0.79, "learning_rate": 0.00018134718920838507, "loss": 0.0164, "step": 305160 }, { "epoch": 0.79, "learning_rate": 0.0001813433009920136, "loss": 0.0158, "step": 305170 }, { "epoch": 0.79, "learning_rate": 0.00018133941277564212, "loss": 0.0135, "step": 305180 }, { "epoch": 0.79, "learning_rate": 0.00018133552455927064, "loss": 0.0132, "step": 305190 }, { "epoch": 0.79, "learning_rate": 0.00018133163634289918, "loss": 0.014, "step": 305200 }, { "epoch": 0.79, "learning_rate": 0.00018132774812652775, "loss": 0.0156, "step": 305210 }, { "epoch": 0.79, "learning_rate": 0.00018132385991015626, "loss": 0.0158, "step": 305220 }, { "epoch": 0.79, "learning_rate": 0.0001813199716937848, "loss": 0.0135, "step": 305230 }, { "epoch": 0.79, "learning_rate": 0.00018131608347741332, "loss": 0.018, "step": 305240 }, { "epoch": 0.79, "learning_rate": 0.0001813121952610419, "loss": 0.016, "step": 305250 }, { "epoch": 0.79, "learning_rate": 0.0001813083070446704, "loss": 0.0138, "step": 305260 }, { "epoch": 0.79, "learning_rate": 0.00018130441882829894, "loss": 0.0097, "step": 305270 }, { "epoch": 0.79, "learning_rate": 0.00018130053061192746, "loss": 0.0142, "step": 305280 }, { "epoch": 0.79, "learning_rate": 0.00018129664239555603, "loss": 0.0148, "step": 305290 }, { "epoch": 0.79, "learning_rate": 0.00018129275417918454, "loss": 0.0124, "step": 305300 }, { "epoch": 0.79, "learning_rate": 0.00018128886596281308, "loss": 0.0153, "step": 305310 }, { "epoch": 0.79, "learning_rate": 0.0001812849777464416, "loss": 0.015, "step": 305320 }, { "epoch": 0.79, "learning_rate": 0.00018128108953007017, "loss": 0.0147, "step": 305330 }, { "epoch": 0.79, "learning_rate": 0.00018127720131369868, "loss": 0.0179, "step": 305340 }, { "epoch": 0.79, "learning_rate": 0.00018127331309732722, "loss": 0.0132, "step": 305350 }, { "epoch": 0.79, "learning_rate": 0.00018126942488095574, "loss": 0.0154, "step": 305360 }, { "epoch": 0.79, "learning_rate": 0.0001812655366645843, "loss": 0.015, "step": 305370 }, { "epoch": 0.79, "learning_rate": 0.00018126164844821285, "loss": 0.011, "step": 305380 }, { "epoch": 0.79, "learning_rate": 0.00018125776023184136, "loss": 0.0134, "step": 305390 }, { "epoch": 0.79, "learning_rate": 0.0001812538720154699, "loss": 0.013, "step": 305400 }, { "epoch": 0.79, "learning_rate": 0.00018124998379909845, "loss": 0.0139, "step": 305410 }, { "epoch": 0.79, "learning_rate": 0.000181246095582727, "loss": 0.0146, "step": 305420 }, { "epoch": 0.79, "learning_rate": 0.0001812422073663555, "loss": 0.0156, "step": 305430 }, { "epoch": 0.79, "learning_rate": 0.00018123831914998404, "loss": 0.0127, "step": 305440 }, { "epoch": 0.79, "learning_rate": 0.00018123443093361256, "loss": 0.0163, "step": 305450 }, { "epoch": 0.79, "learning_rate": 0.00018123054271724113, "loss": 0.0142, "step": 305460 }, { "epoch": 0.79, "learning_rate": 0.00018122665450086964, "loss": 0.0155, "step": 305470 }, { "epoch": 0.79, "learning_rate": 0.00018122276628449818, "loss": 0.0158, "step": 305480 }, { "epoch": 0.79, "learning_rate": 0.0001812188780681267, "loss": 0.0181, "step": 305490 }, { "epoch": 0.79, "learning_rate": 0.00018121498985175527, "loss": 0.0194, "step": 305500 }, { "epoch": 0.79, "learning_rate": 0.00018121110163538378, "loss": 0.0168, "step": 305510 }, { "epoch": 0.79, "learning_rate": 0.00018120721341901232, "loss": 0.0149, "step": 305520 }, { "epoch": 0.79, "learning_rate": 0.00018120332520264084, "loss": 0.0121, "step": 305530 }, { "epoch": 0.79, "learning_rate": 0.0001811994369862694, "loss": 0.0119, "step": 305540 }, { "epoch": 0.79, "learning_rate": 0.00018119554876989795, "loss": 0.0122, "step": 305550 }, { "epoch": 0.79, "learning_rate": 0.00018119166055352646, "loss": 0.0116, "step": 305560 }, { "epoch": 0.79, "learning_rate": 0.000181187772337155, "loss": 0.0108, "step": 305570 }, { "epoch": 0.79, "learning_rate": 0.00018118388412078355, "loss": 0.0154, "step": 305580 }, { "epoch": 0.79, "learning_rate": 0.0001811799959044121, "loss": 0.0129, "step": 305590 }, { "epoch": 0.79, "learning_rate": 0.0001811761076880406, "loss": 0.0128, "step": 305600 }, { "epoch": 0.79, "learning_rate": 0.00018117221947166914, "loss": 0.0109, "step": 305610 }, { "epoch": 0.79, "learning_rate": 0.00018116833125529768, "loss": 0.0117, "step": 305620 }, { "epoch": 0.79, "learning_rate": 0.00018116444303892623, "loss": 0.0127, "step": 305630 }, { "epoch": 0.79, "learning_rate": 0.00018116055482255474, "loss": 0.0129, "step": 305640 }, { "epoch": 0.79, "learning_rate": 0.00018115666660618328, "loss": 0.0127, "step": 305650 }, { "epoch": 0.79, "learning_rate": 0.00018115277838981182, "loss": 0.0118, "step": 305660 }, { "epoch": 0.79, "learning_rate": 0.00018114889017344037, "loss": 0.0144, "step": 305670 }, { "epoch": 0.79, "learning_rate": 0.00018114500195706888, "loss": 0.0179, "step": 305680 }, { "epoch": 0.79, "learning_rate": 0.00018114111374069742, "loss": 0.015, "step": 305690 }, { "epoch": 0.79, "learning_rate": 0.00018113722552432594, "loss": 0.0138, "step": 305700 }, { "epoch": 0.79, "learning_rate": 0.0001811333373079545, "loss": 0.0157, "step": 305710 }, { "epoch": 0.79, "learning_rate": 0.00018112944909158305, "loss": 0.0151, "step": 305720 }, { "epoch": 0.79, "learning_rate": 0.00018112556087521156, "loss": 0.0118, "step": 305730 }, { "epoch": 0.79, "learning_rate": 0.00018112167265884008, "loss": 0.0116, "step": 305740 }, { "epoch": 0.79, "learning_rate": 0.00018111778444246864, "loss": 0.0142, "step": 305750 }, { "epoch": 0.79, "learning_rate": 0.0001811138962260972, "loss": 0.0112, "step": 305760 }, { "epoch": 0.79, "learning_rate": 0.0001811100080097257, "loss": 0.0144, "step": 305770 }, { "epoch": 0.79, "learning_rate": 0.00018110611979335424, "loss": 0.013, "step": 305780 }, { "epoch": 0.79, "learning_rate": 0.00018110223157698278, "loss": 0.0138, "step": 305790 }, { "epoch": 0.79, "learning_rate": 0.00018109834336061133, "loss": 0.0137, "step": 305800 }, { "epoch": 0.79, "learning_rate": 0.00018109445514423984, "loss": 0.014, "step": 305810 }, { "epoch": 0.79, "learning_rate": 0.00018109056692786838, "loss": 0.015, "step": 305820 }, { "epoch": 0.79, "learning_rate": 0.00018108667871149692, "loss": 0.0133, "step": 305830 }, { "epoch": 0.79, "learning_rate": 0.00018108279049512547, "loss": 0.0109, "step": 305840 }, { "epoch": 0.79, "learning_rate": 0.00018107890227875398, "loss": 0.0149, "step": 305850 }, { "epoch": 0.79, "learning_rate": 0.00018107501406238252, "loss": 0.0155, "step": 305860 }, { "epoch": 0.79, "learning_rate": 0.0001810711258460111, "loss": 0.0155, "step": 305870 }, { "epoch": 0.79, "learning_rate": 0.0001810672376296396, "loss": 0.0139, "step": 305880 }, { "epoch": 0.79, "learning_rate": 0.00018106334941326812, "loss": 0.0142, "step": 305890 }, { "epoch": 0.79, "learning_rate": 0.00018105946119689666, "loss": 0.0122, "step": 305900 }, { "epoch": 0.79, "learning_rate": 0.00018105557298052523, "loss": 0.0179, "step": 305910 }, { "epoch": 0.79, "learning_rate": 0.00018105168476415374, "loss": 0.016, "step": 305920 }, { "epoch": 0.79, "learning_rate": 0.00018104779654778229, "loss": 0.0145, "step": 305930 }, { "epoch": 0.79, "learning_rate": 0.0001810439083314108, "loss": 0.0161, "step": 305940 }, { "epoch": 0.79, "learning_rate": 0.00018104002011503934, "loss": 0.0134, "step": 305950 }, { "epoch": 0.79, "learning_rate": 0.00018103613189866788, "loss": 0.0138, "step": 305960 }, { "epoch": 0.79, "learning_rate": 0.00018103224368229643, "loss": 0.0172, "step": 305970 }, { "epoch": 0.79, "learning_rate": 0.00018102835546592494, "loss": 0.0113, "step": 305980 }, { "epoch": 0.79, "learning_rate": 0.00018102446724955348, "loss": 0.0119, "step": 305990 }, { "epoch": 0.79, "learning_rate": 0.00018102057903318202, "loss": 0.0146, "step": 306000 }, { "epoch": 0.79, "eval_cer": 0.8817306790618513, "eval_loss": 0.009411798790097237, "eval_runtime": 107.6226, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 306000 }, { "epoch": 0.79, "learning_rate": 0.00018101669081681056, "loss": 0.0154, "step": 306010 }, { "epoch": 0.79, "learning_rate": 0.00018101280260043908, "loss": 0.0155, "step": 306020 }, { "epoch": 0.79, "learning_rate": 0.00018100891438406762, "loss": 0.018, "step": 306030 }, { "epoch": 0.79, "learning_rate": 0.0001810050261676962, "loss": 0.0166, "step": 306040 }, { "epoch": 0.79, "learning_rate": 0.0001810011379513247, "loss": 0.0132, "step": 306050 }, { "epoch": 0.79, "learning_rate": 0.00018099724973495322, "loss": 0.0116, "step": 306060 }, { "epoch": 0.79, "learning_rate": 0.00018099336151858176, "loss": 0.0157, "step": 306070 }, { "epoch": 0.79, "learning_rate": 0.00018098947330221033, "loss": 0.0142, "step": 306080 }, { "epoch": 0.79, "learning_rate": 0.00018098558508583884, "loss": 0.0175, "step": 306090 }, { "epoch": 0.79, "learning_rate": 0.00018098169686946739, "loss": 0.0121, "step": 306100 }, { "epoch": 0.79, "learning_rate": 0.0001809778086530959, "loss": 0.0126, "step": 306110 }, { "epoch": 0.79, "learning_rate": 0.00018097392043672447, "loss": 0.0154, "step": 306120 }, { "epoch": 0.79, "learning_rate": 0.00018097003222035298, "loss": 0.0162, "step": 306130 }, { "epoch": 0.79, "learning_rate": 0.00018096614400398152, "loss": 0.0141, "step": 306140 }, { "epoch": 0.79, "learning_rate": 0.00018096225578761004, "loss": 0.0143, "step": 306150 }, { "epoch": 0.79, "learning_rate": 0.0001809583675712386, "loss": 0.0182, "step": 306160 }, { "epoch": 0.79, "learning_rate": 0.00018095447935486712, "loss": 0.0172, "step": 306170 }, { "epoch": 0.79, "learning_rate": 0.00018095059113849566, "loss": 0.0142, "step": 306180 }, { "epoch": 0.79, "learning_rate": 0.00018094670292212418, "loss": 0.0125, "step": 306190 }, { "epoch": 0.79, "learning_rate": 0.00018094281470575272, "loss": 0.0149, "step": 306200 }, { "epoch": 0.79, "learning_rate": 0.00018093892648938126, "loss": 0.0155, "step": 306210 }, { "epoch": 0.79, "learning_rate": 0.0001809350382730098, "loss": 0.0144, "step": 306220 }, { "epoch": 0.79, "learning_rate": 0.00018093115005663832, "loss": 0.016, "step": 306230 }, { "epoch": 0.79, "learning_rate": 0.00018092726184026686, "loss": 0.0128, "step": 306240 }, { "epoch": 0.79, "learning_rate": 0.00018092337362389543, "loss": 0.0151, "step": 306250 }, { "epoch": 0.79, "learning_rate": 0.00018091948540752394, "loss": 0.0169, "step": 306260 }, { "epoch": 0.79, "learning_rate": 0.00018091559719115248, "loss": 0.0156, "step": 306270 }, { "epoch": 0.79, "learning_rate": 0.000180911708974781, "loss": 0.0123, "step": 306280 }, { "epoch": 0.79, "learning_rate": 0.00018090782075840957, "loss": 0.0172, "step": 306290 }, { "epoch": 0.79, "learning_rate": 0.00018090393254203808, "loss": 0.0144, "step": 306300 }, { "epoch": 0.79, "learning_rate": 0.00018090004432566662, "loss": 0.0149, "step": 306310 }, { "epoch": 0.79, "learning_rate": 0.00018089615610929514, "loss": 0.0157, "step": 306320 }, { "epoch": 0.79, "learning_rate": 0.0001808922678929237, "loss": 0.0142, "step": 306330 }, { "epoch": 0.79, "learning_rate": 0.00018088837967655222, "loss": 0.0118, "step": 306340 }, { "epoch": 0.79, "learning_rate": 0.00018088449146018076, "loss": 0.015, "step": 306350 }, { "epoch": 0.79, "learning_rate": 0.00018088060324380928, "loss": 0.01, "step": 306360 }, { "epoch": 0.79, "learning_rate": 0.00018087671502743785, "loss": 0.0163, "step": 306370 }, { "epoch": 0.79, "learning_rate": 0.00018087282681106636, "loss": 0.0151, "step": 306380 }, { "epoch": 0.79, "learning_rate": 0.0001808689385946949, "loss": 0.0156, "step": 306390 }, { "epoch": 0.79, "learning_rate": 0.00018086505037832342, "loss": 0.0153, "step": 306400 }, { "epoch": 0.79, "learning_rate": 0.00018086116216195199, "loss": 0.016, "step": 306410 }, { "epoch": 0.79, "learning_rate": 0.00018085727394558053, "loss": 0.0142, "step": 306420 }, { "epoch": 0.79, "learning_rate": 0.00018085338572920904, "loss": 0.0123, "step": 306430 }, { "epoch": 0.79, "learning_rate": 0.00018084949751283758, "loss": 0.0162, "step": 306440 }, { "epoch": 0.79, "learning_rate": 0.0001808456092964661, "loss": 0.0166, "step": 306450 }, { "epoch": 0.79, "learning_rate": 0.00018084172108009467, "loss": 0.0124, "step": 306460 }, { "epoch": 0.79, "learning_rate": 0.00018083783286372318, "loss": 0.0114, "step": 306470 }, { "epoch": 0.79, "learning_rate": 0.00018083394464735172, "loss": 0.0104, "step": 306480 }, { "epoch": 0.79, "learning_rate": 0.00018083005643098024, "loss": 0.0144, "step": 306490 }, { "epoch": 0.79, "learning_rate": 0.0001808261682146088, "loss": 0.014, "step": 306500 }, { "epoch": 0.79, "learning_rate": 0.00018082227999823732, "loss": 0.0126, "step": 306510 }, { "epoch": 0.79, "learning_rate": 0.00018081839178186586, "loss": 0.0127, "step": 306520 }, { "epoch": 0.79, "learning_rate": 0.00018081450356549438, "loss": 0.0146, "step": 306530 }, { "epoch": 0.79, "learning_rate": 0.00018081061534912295, "loss": 0.0146, "step": 306540 }, { "epoch": 0.79, "learning_rate": 0.00018080672713275146, "loss": 0.0148, "step": 306550 }, { "epoch": 0.79, "learning_rate": 0.00018080283891638, "loss": 0.0111, "step": 306560 }, { "epoch": 0.79, "learning_rate": 0.00018079895070000852, "loss": 0.0173, "step": 306570 }, { "epoch": 0.79, "learning_rate": 0.00018079506248363709, "loss": 0.0146, "step": 306580 }, { "epoch": 0.79, "learning_rate": 0.00018079117426726563, "loss": 0.0141, "step": 306590 }, { "epoch": 0.79, "learning_rate": 0.00018078728605089414, "loss": 0.0152, "step": 306600 }, { "epoch": 0.79, "learning_rate": 0.00018078339783452266, "loss": 0.0144, "step": 306610 }, { "epoch": 0.79, "learning_rate": 0.00018077950961815123, "loss": 0.0173, "step": 306620 }, { "epoch": 0.79, "learning_rate": 0.00018077562140177977, "loss": 0.0113, "step": 306630 }, { "epoch": 0.79, "learning_rate": 0.00018077173318540828, "loss": 0.0123, "step": 306640 }, { "epoch": 0.79, "learning_rate": 0.00018076784496903682, "loss": 0.016, "step": 306650 }, { "epoch": 0.79, "learning_rate": 0.00018076395675266534, "loss": 0.0145, "step": 306660 }, { "epoch": 0.79, "learning_rate": 0.0001807600685362939, "loss": 0.0116, "step": 306670 }, { "epoch": 0.79, "learning_rate": 0.00018075618031992242, "loss": 0.0141, "step": 306680 }, { "epoch": 0.79, "learning_rate": 0.00018075229210355096, "loss": 0.0168, "step": 306690 }, { "epoch": 0.8, "learning_rate": 0.00018074840388717948, "loss": 0.0148, "step": 306700 }, { "epoch": 0.8, "learning_rate": 0.00018074451567080805, "loss": 0.0135, "step": 306710 }, { "epoch": 0.8, "learning_rate": 0.00018074062745443656, "loss": 0.0132, "step": 306720 }, { "epoch": 0.8, "learning_rate": 0.0001807367392380651, "loss": 0.0145, "step": 306730 }, { "epoch": 0.8, "learning_rate": 0.00018073285102169362, "loss": 0.011, "step": 306740 }, { "epoch": 0.8, "learning_rate": 0.00018072896280532219, "loss": 0.0115, "step": 306750 }, { "epoch": 0.8, "learning_rate": 0.00018072507458895073, "loss": 0.0115, "step": 306760 }, { "epoch": 0.8, "learning_rate": 0.00018072118637257924, "loss": 0.0151, "step": 306770 }, { "epoch": 0.8, "learning_rate": 0.00018071729815620776, "loss": 0.013, "step": 306780 }, { "epoch": 0.8, "learning_rate": 0.00018071340993983632, "loss": 0.0144, "step": 306790 }, { "epoch": 0.8, "learning_rate": 0.00018070952172346487, "loss": 0.0129, "step": 306800 }, { "epoch": 0.8, "learning_rate": 0.00018070563350709338, "loss": 0.0166, "step": 306810 }, { "epoch": 0.8, "learning_rate": 0.00018070174529072192, "loss": 0.0138, "step": 306820 }, { "epoch": 0.8, "learning_rate": 0.00018069785707435046, "loss": 0.0137, "step": 306830 }, { "epoch": 0.8, "learning_rate": 0.000180693968857979, "loss": 0.0111, "step": 306840 }, { "epoch": 0.8, "learning_rate": 0.00018069008064160752, "loss": 0.0124, "step": 306850 }, { "epoch": 0.8, "learning_rate": 0.00018068619242523606, "loss": 0.0156, "step": 306860 }, { "epoch": 0.8, "learning_rate": 0.0001806823042088646, "loss": 0.0128, "step": 306870 }, { "epoch": 0.8, "learning_rate": 0.00018067841599249315, "loss": 0.0155, "step": 306880 }, { "epoch": 0.8, "learning_rate": 0.00018067452777612166, "loss": 0.0128, "step": 306890 }, { "epoch": 0.8, "learning_rate": 0.0001806706395597502, "loss": 0.0175, "step": 306900 }, { "epoch": 0.8, "learning_rate": 0.00018066675134337872, "loss": 0.0152, "step": 306910 }, { "epoch": 0.8, "learning_rate": 0.00018066286312700728, "loss": 0.0157, "step": 306920 }, { "epoch": 0.8, "learning_rate": 0.0001806589749106358, "loss": 0.0166, "step": 306930 }, { "epoch": 0.8, "learning_rate": 0.00018065508669426434, "loss": 0.0152, "step": 306940 }, { "epoch": 0.8, "learning_rate": 0.00018065119847789286, "loss": 0.0139, "step": 306950 }, { "epoch": 0.8, "learning_rate": 0.00018064731026152142, "loss": 0.0119, "step": 306960 }, { "epoch": 0.8, "learning_rate": 0.00018064342204514997, "loss": 0.0138, "step": 306970 }, { "epoch": 0.8, "learning_rate": 0.00018063953382877848, "loss": 0.0185, "step": 306980 }, { "epoch": 0.8, "learning_rate": 0.00018063564561240702, "loss": 0.0133, "step": 306990 }, { "epoch": 0.8, "learning_rate": 0.00018063175739603556, "loss": 0.0123, "step": 307000 }, { "epoch": 0.8, "eval_cer": 0.8817082848709045, "eval_loss": 0.00944979302585125, "eval_runtime": 107.8315, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 307000 }, { "epoch": 0.8, "learning_rate": 0.0001806278691796641, "loss": 0.0138, "step": 307010 }, { "epoch": 0.8, "learning_rate": 0.00018062398096329262, "loss": 0.0126, "step": 307020 }, { "epoch": 0.8, "learning_rate": 0.00018062009274692116, "loss": 0.0156, "step": 307030 }, { "epoch": 0.8, "learning_rate": 0.0001806162045305497, "loss": 0.0137, "step": 307040 }, { "epoch": 0.8, "learning_rate": 0.00018061231631417824, "loss": 0.0168, "step": 307050 }, { "epoch": 0.8, "learning_rate": 0.00018060842809780676, "loss": 0.0258, "step": 307060 }, { "epoch": 0.8, "learning_rate": 0.0001806045398814353, "loss": 0.0147, "step": 307070 }, { "epoch": 0.8, "learning_rate": 0.00018060065166506384, "loss": 0.0202, "step": 307080 }, { "epoch": 0.8, "learning_rate": 0.00018059676344869238, "loss": 0.0161, "step": 307090 }, { "epoch": 0.8, "learning_rate": 0.0001805928752323209, "loss": 0.0198, "step": 307100 }, { "epoch": 0.8, "learning_rate": 0.00018058898701594944, "loss": 0.0133, "step": 307110 }, { "epoch": 0.8, "learning_rate": 0.000180585098799578, "loss": 0.0128, "step": 307120 }, { "epoch": 0.8, "learning_rate": 0.00018058121058320652, "loss": 0.0154, "step": 307130 }, { "epoch": 0.8, "learning_rate": 0.00018057732236683507, "loss": 0.0152, "step": 307140 }, { "epoch": 0.8, "learning_rate": 0.00018057343415046358, "loss": 0.0107, "step": 307150 }, { "epoch": 0.8, "learning_rate": 0.00018056954593409212, "loss": 0.0215, "step": 307160 }, { "epoch": 0.8, "learning_rate": 0.00018056565771772066, "loss": 0.0168, "step": 307170 }, { "epoch": 0.8, "learning_rate": 0.0001805617695013492, "loss": 0.0147, "step": 307180 }, { "epoch": 0.8, "learning_rate": 0.00018055788128497772, "loss": 0.015, "step": 307190 }, { "epoch": 0.8, "learning_rate": 0.00018055399306860626, "loss": 0.0116, "step": 307200 }, { "epoch": 0.8, "learning_rate": 0.0001805501048522348, "loss": 0.0153, "step": 307210 }, { "epoch": 0.8, "learning_rate": 0.00018054621663586334, "loss": 0.0141, "step": 307220 }, { "epoch": 0.8, "learning_rate": 0.00018054232841949186, "loss": 0.0099, "step": 307230 }, { "epoch": 0.8, "learning_rate": 0.0001805384402031204, "loss": 0.0151, "step": 307240 }, { "epoch": 0.8, "learning_rate": 0.00018053455198674894, "loss": 0.0129, "step": 307250 }, { "epoch": 0.8, "learning_rate": 0.00018053066377037748, "loss": 0.0177, "step": 307260 }, { "epoch": 0.8, "learning_rate": 0.000180526775554006, "loss": 0.0146, "step": 307270 }, { "epoch": 0.8, "learning_rate": 0.00018052288733763454, "loss": 0.0175, "step": 307280 }, { "epoch": 0.8, "learning_rate": 0.0001805189991212631, "loss": 0.0169, "step": 307290 }, { "epoch": 0.8, "learning_rate": 0.00018051511090489162, "loss": 0.0156, "step": 307300 }, { "epoch": 0.8, "learning_rate": 0.00018051122268852016, "loss": 0.0166, "step": 307310 }, { "epoch": 0.8, "learning_rate": 0.00018050733447214868, "loss": 0.0188, "step": 307320 }, { "epoch": 0.8, "learning_rate": 0.00018050344625577725, "loss": 0.0149, "step": 307330 }, { "epoch": 0.8, "learning_rate": 0.00018049955803940576, "loss": 0.0133, "step": 307340 }, { "epoch": 0.8, "learning_rate": 0.0001804956698230343, "loss": 0.013, "step": 307350 }, { "epoch": 0.8, "learning_rate": 0.00018049178160666282, "loss": 0.0127, "step": 307360 }, { "epoch": 0.8, "learning_rate": 0.0001804878933902914, "loss": 0.0203, "step": 307370 }, { "epoch": 0.8, "learning_rate": 0.0001804840051739199, "loss": 0.0157, "step": 307380 }, { "epoch": 0.8, "learning_rate": 0.00018048011695754844, "loss": 0.0141, "step": 307390 }, { "epoch": 0.8, "learning_rate": 0.00018047622874117696, "loss": 0.0114, "step": 307400 }, { "epoch": 0.8, "learning_rate": 0.0001804723405248055, "loss": 0.0139, "step": 307410 }, { "epoch": 0.8, "learning_rate": 0.00018046845230843404, "loss": 0.0165, "step": 307420 }, { "epoch": 0.8, "learning_rate": 0.00018046456409206258, "loss": 0.0127, "step": 307430 }, { "epoch": 0.8, "learning_rate": 0.0001804606758756911, "loss": 0.0201, "step": 307440 }, { "epoch": 0.8, "learning_rate": 0.00018045678765931964, "loss": 0.0157, "step": 307450 }, { "epoch": 0.8, "learning_rate": 0.0001804528994429482, "loss": 0.0135, "step": 307460 }, { "epoch": 0.8, "learning_rate": 0.00018044901122657672, "loss": 0.0176, "step": 307470 }, { "epoch": 0.8, "learning_rate": 0.00018044512301020524, "loss": 0.0131, "step": 307480 }, { "epoch": 0.8, "learning_rate": 0.00018044123479383378, "loss": 0.0162, "step": 307490 }, { "epoch": 0.8, "learning_rate": 0.00018043734657746235, "loss": 0.0195, "step": 307500 }, { "epoch": 0.8, "learning_rate": 0.00018043345836109086, "loss": 0.0135, "step": 307510 }, { "epoch": 0.8, "learning_rate": 0.0001804295701447194, "loss": 0.0137, "step": 307520 }, { "epoch": 0.8, "learning_rate": 0.00018042568192834792, "loss": 0.015, "step": 307530 }, { "epoch": 0.8, "learning_rate": 0.0001804217937119765, "loss": 0.0129, "step": 307540 }, { "epoch": 0.8, "learning_rate": 0.000180417905495605, "loss": 0.0159, "step": 307550 }, { "epoch": 0.8, "learning_rate": 0.00018041401727923354, "loss": 0.0129, "step": 307560 }, { "epoch": 0.8, "learning_rate": 0.00018041012906286206, "loss": 0.0129, "step": 307570 }, { "epoch": 0.8, "learning_rate": 0.00018040624084649063, "loss": 0.0125, "step": 307580 }, { "epoch": 0.8, "learning_rate": 0.00018040235263011914, "loss": 0.0141, "step": 307590 }, { "epoch": 0.8, "learning_rate": 0.00018039846441374768, "loss": 0.0177, "step": 307600 }, { "epoch": 0.8, "learning_rate": 0.0001803945761973762, "loss": 0.0123, "step": 307610 }, { "epoch": 0.8, "learning_rate": 0.00018039068798100477, "loss": 0.0166, "step": 307620 }, { "epoch": 0.8, "learning_rate": 0.0001803867997646333, "loss": 0.0128, "step": 307630 }, { "epoch": 0.8, "learning_rate": 0.00018038291154826182, "loss": 0.0173, "step": 307640 }, { "epoch": 0.8, "learning_rate": 0.00018037902333189034, "loss": 0.0139, "step": 307650 }, { "epoch": 0.8, "learning_rate": 0.00018037513511551888, "loss": 0.0132, "step": 307660 }, { "epoch": 0.8, "learning_rate": 0.00018037124689914745, "loss": 0.0126, "step": 307670 }, { "epoch": 0.8, "learning_rate": 0.00018036735868277596, "loss": 0.0138, "step": 307680 }, { "epoch": 0.8, "learning_rate": 0.0001803634704664045, "loss": 0.0121, "step": 307690 }, { "epoch": 0.8, "learning_rate": 0.00018035958225003302, "loss": 0.0158, "step": 307700 }, { "epoch": 0.8, "learning_rate": 0.00018035569403366159, "loss": 0.0143, "step": 307710 }, { "epoch": 0.8, "learning_rate": 0.0001803518058172901, "loss": 0.0147, "step": 307720 }, { "epoch": 0.8, "learning_rate": 0.00018034791760091864, "loss": 0.0174, "step": 307730 }, { "epoch": 0.8, "learning_rate": 0.00018034402938454716, "loss": 0.0147, "step": 307740 }, { "epoch": 0.8, "learning_rate": 0.00018034014116817573, "loss": 0.0125, "step": 307750 }, { "epoch": 0.8, "learning_rate": 0.00018033625295180424, "loss": 0.0139, "step": 307760 }, { "epoch": 0.8, "learning_rate": 0.00018033236473543278, "loss": 0.0161, "step": 307770 }, { "epoch": 0.8, "learning_rate": 0.0001803284765190613, "loss": 0.0146, "step": 307780 }, { "epoch": 0.8, "learning_rate": 0.00018032458830268986, "loss": 0.0153, "step": 307790 }, { "epoch": 0.8, "learning_rate": 0.00018032070008631838, "loss": 0.0109, "step": 307800 }, { "epoch": 0.8, "learning_rate": 0.00018031681186994692, "loss": 0.0137, "step": 307810 }, { "epoch": 0.8, "learning_rate": 0.00018031292365357544, "loss": 0.0142, "step": 307820 }, { "epoch": 0.8, "learning_rate": 0.000180309035437204, "loss": 0.0157, "step": 307830 }, { "epoch": 0.8, "learning_rate": 0.00018030514722083255, "loss": 0.0095, "step": 307840 }, { "epoch": 0.8, "learning_rate": 0.00018030125900446106, "loss": 0.0138, "step": 307850 }, { "epoch": 0.8, "learning_rate": 0.0001802973707880896, "loss": 0.0112, "step": 307860 }, { "epoch": 0.8, "learning_rate": 0.00018029348257171814, "loss": 0.0153, "step": 307870 }, { "epoch": 0.8, "learning_rate": 0.00018028959435534669, "loss": 0.0121, "step": 307880 }, { "epoch": 0.8, "learning_rate": 0.0001802857061389752, "loss": 0.0118, "step": 307890 }, { "epoch": 0.8, "learning_rate": 0.00018028181792260374, "loss": 0.0135, "step": 307900 }, { "epoch": 0.8, "learning_rate": 0.00018027792970623226, "loss": 0.0109, "step": 307910 }, { "epoch": 0.8, "learning_rate": 0.00018027404148986082, "loss": 0.014, "step": 307920 }, { "epoch": 0.8, "learning_rate": 0.00018027015327348934, "loss": 0.0157, "step": 307930 }, { "epoch": 0.8, "learning_rate": 0.00018026626505711788, "loss": 0.0174, "step": 307940 }, { "epoch": 0.8, "learning_rate": 0.0001802623768407464, "loss": 0.0124, "step": 307950 }, { "epoch": 0.8, "learning_rate": 0.00018025848862437496, "loss": 0.0143, "step": 307960 }, { "epoch": 0.8, "learning_rate": 0.00018025460040800348, "loss": 0.0136, "step": 307970 }, { "epoch": 0.8, "learning_rate": 0.00018025071219163202, "loss": 0.0161, "step": 307980 }, { "epoch": 0.8, "learning_rate": 0.00018024682397526054, "loss": 0.0131, "step": 307990 }, { "epoch": 0.8, "learning_rate": 0.0001802429357588891, "loss": 0.0138, "step": 308000 }, { "epoch": 0.8, "eval_cer": 0.8817264801510488, "eval_loss": 0.00954010896384716, "eval_runtime": 107.7412, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 308000 }, { "epoch": 0.8, "learning_rate": 0.00018023904754251765, "loss": 0.014, "step": 308010 }, { "epoch": 0.8, "learning_rate": 0.00018023515932614616, "loss": 0.0127, "step": 308020 }, { "epoch": 0.8, "learning_rate": 0.0001802312711097747, "loss": 0.0163, "step": 308030 }, { "epoch": 0.8, "learning_rate": 0.00018022738289340324, "loss": 0.0429, "step": 308040 }, { "epoch": 0.8, "learning_rate": 0.00018022349467703178, "loss": 0.0144, "step": 308050 }, { "epoch": 0.8, "learning_rate": 0.0001802196064606603, "loss": 0.0119, "step": 308060 }, { "epoch": 0.8, "learning_rate": 0.00018021571824428884, "loss": 0.02, "step": 308070 }, { "epoch": 0.8, "learning_rate": 0.00018021183002791738, "loss": 0.0129, "step": 308080 }, { "epoch": 0.8, "learning_rate": 0.00018020794181154592, "loss": 0.0168, "step": 308090 }, { "epoch": 0.8, "learning_rate": 0.00018020405359517444, "loss": 0.0161, "step": 308100 }, { "epoch": 0.8, "learning_rate": 0.00018020016537880298, "loss": 0.0186, "step": 308110 }, { "epoch": 0.8, "learning_rate": 0.00018019627716243152, "loss": 0.0127, "step": 308120 }, { "epoch": 0.8, "learning_rate": 0.00018019238894606006, "loss": 0.0112, "step": 308130 }, { "epoch": 0.8, "learning_rate": 0.00018018850072968858, "loss": 0.0126, "step": 308140 }, { "epoch": 0.8, "learning_rate": 0.00018018461251331712, "loss": 0.014, "step": 308150 }, { "epoch": 0.8, "learning_rate": 0.00018018072429694563, "loss": 0.0102, "step": 308160 }, { "epoch": 0.8, "learning_rate": 0.0001801768360805742, "loss": 0.0149, "step": 308170 }, { "epoch": 0.8, "learning_rate": 0.00018017294786420274, "loss": 0.0143, "step": 308180 }, { "epoch": 0.8, "learning_rate": 0.00018016905964783126, "loss": 0.0147, "step": 308190 }, { "epoch": 0.8, "learning_rate": 0.00018016517143145977, "loss": 0.0155, "step": 308200 }, { "epoch": 0.8, "learning_rate": 0.00018016128321508834, "loss": 0.0156, "step": 308210 }, { "epoch": 0.8, "learning_rate": 0.00018015739499871688, "loss": 0.0155, "step": 308220 }, { "epoch": 0.8, "learning_rate": 0.0001801535067823454, "loss": 0.0121, "step": 308230 }, { "epoch": 0.8, "learning_rate": 0.00018014961856597394, "loss": 0.0157, "step": 308240 }, { "epoch": 0.8, "learning_rate": 0.00018014573034960248, "loss": 0.0165, "step": 308250 }, { "epoch": 0.8, "learning_rate": 0.00018014184213323102, "loss": 0.0136, "step": 308260 }, { "epoch": 0.8, "learning_rate": 0.00018013795391685954, "loss": 0.0152, "step": 308270 }, { "epoch": 0.8, "learning_rate": 0.00018013406570048808, "loss": 0.012, "step": 308280 }, { "epoch": 0.8, "learning_rate": 0.00018013017748411662, "loss": 0.0122, "step": 308290 }, { "epoch": 0.8, "learning_rate": 0.00018012628926774516, "loss": 0.0158, "step": 308300 }, { "epoch": 0.8, "learning_rate": 0.00018012240105137368, "loss": 0.0171, "step": 308310 }, { "epoch": 0.8, "learning_rate": 0.00018011851283500222, "loss": 0.015, "step": 308320 }, { "epoch": 0.8, "learning_rate": 0.0001801146246186308, "loss": 0.0156, "step": 308330 }, { "epoch": 0.8, "learning_rate": 0.0001801107364022593, "loss": 0.0137, "step": 308340 }, { "epoch": 0.8, "learning_rate": 0.00018010684818588784, "loss": 0.0169, "step": 308350 }, { "epoch": 0.8, "learning_rate": 0.00018010295996951636, "loss": 0.0121, "step": 308360 }, { "epoch": 0.8, "learning_rate": 0.00018009907175314493, "loss": 0.0202, "step": 308370 }, { "epoch": 0.8, "learning_rate": 0.00018009518353677344, "loss": 0.0159, "step": 308380 }, { "epoch": 0.8, "learning_rate": 0.00018009129532040198, "loss": 0.0141, "step": 308390 }, { "epoch": 0.8, "learning_rate": 0.0001800874071040305, "loss": 0.0113, "step": 308400 }, { "epoch": 0.8, "learning_rate": 0.00018008351888765904, "loss": 0.0119, "step": 308410 }, { "epoch": 0.8, "learning_rate": 0.00018007963067128758, "loss": 0.0158, "step": 308420 }, { "epoch": 0.8, "learning_rate": 0.00018007574245491612, "loss": 0.0177, "step": 308430 }, { "epoch": 0.8, "learning_rate": 0.00018007185423854464, "loss": 0.017, "step": 308440 }, { "epoch": 0.8, "learning_rate": 0.00018006796602217318, "loss": 0.0146, "step": 308450 }, { "epoch": 0.8, "learning_rate": 0.00018006407780580172, "loss": 0.013, "step": 308460 }, { "epoch": 0.8, "learning_rate": 0.00018006018958943026, "loss": 0.014, "step": 308470 }, { "epoch": 0.8, "learning_rate": 0.00018005630137305878, "loss": 0.012, "step": 308480 }, { "epoch": 0.8, "learning_rate": 0.00018005241315668732, "loss": 0.013, "step": 308490 }, { "epoch": 0.8, "learning_rate": 0.0001800485249403159, "loss": 0.0167, "step": 308500 }, { "epoch": 0.8, "learning_rate": 0.0001800446367239444, "loss": 0.0112, "step": 308510 }, { "epoch": 0.8, "learning_rate": 0.00018004074850757292, "loss": 0.0191, "step": 308520 }, { "epoch": 0.8, "learning_rate": 0.00018003686029120146, "loss": 0.0143, "step": 308530 }, { "epoch": 0.8, "learning_rate": 0.00018003297207483003, "loss": 0.0167, "step": 308540 }, { "epoch": 0.8, "learning_rate": 0.00018002908385845854, "loss": 0.0105, "step": 308550 }, { "epoch": 0.8, "learning_rate": 0.00018002519564208708, "loss": 0.0128, "step": 308560 }, { "epoch": 0.8, "learning_rate": 0.0001800213074257156, "loss": 0.0149, "step": 308570 }, { "epoch": 0.8, "learning_rate": 0.00018001741920934417, "loss": 0.015, "step": 308580 }, { "epoch": 0.8, "learning_rate": 0.00018001353099297268, "loss": 0.0141, "step": 308590 }, { "epoch": 0.8, "learning_rate": 0.00018000964277660122, "loss": 0.012, "step": 308600 }, { "epoch": 0.8, "learning_rate": 0.00018000575456022974, "loss": 0.0171, "step": 308610 }, { "epoch": 0.8, "learning_rate": 0.0001800018663438583, "loss": 0.013, "step": 308620 }, { "epoch": 0.8, "learning_rate": 0.00017999797812748682, "loss": 0.0135, "step": 308630 }, { "epoch": 0.8, "learning_rate": 0.00017999408991111536, "loss": 0.0126, "step": 308640 }, { "epoch": 0.8, "learning_rate": 0.00017999020169474388, "loss": 0.0163, "step": 308650 }, { "epoch": 0.8, "learning_rate": 0.00017998631347837242, "loss": 0.0138, "step": 308660 }, { "epoch": 0.8, "learning_rate": 0.00017998242526200096, "loss": 0.0151, "step": 308670 }, { "epoch": 0.8, "learning_rate": 0.0001799785370456295, "loss": 0.0137, "step": 308680 }, { "epoch": 0.8, "learning_rate": 0.00017997464882925802, "loss": 0.0149, "step": 308690 }, { "epoch": 0.8, "learning_rate": 0.00017997076061288656, "loss": 0.0153, "step": 308700 }, { "epoch": 0.8, "learning_rate": 0.00017996687239651513, "loss": 0.018, "step": 308710 }, { "epoch": 0.8, "learning_rate": 0.00017996298418014364, "loss": 0.0136, "step": 308720 }, { "epoch": 0.8, "learning_rate": 0.00017995909596377218, "loss": 0.0123, "step": 308730 }, { "epoch": 0.8, "learning_rate": 0.0001799552077474007, "loss": 0.0108, "step": 308740 }, { "epoch": 0.8, "learning_rate": 0.00017995131953102927, "loss": 0.0188, "step": 308750 }, { "epoch": 0.8, "learning_rate": 0.00017994743131465778, "loss": 0.0106, "step": 308760 }, { "epoch": 0.8, "learning_rate": 0.00017994354309828632, "loss": 0.0167, "step": 308770 }, { "epoch": 0.8, "learning_rate": 0.00017993965488191484, "loss": 0.0158, "step": 308780 }, { "epoch": 0.8, "learning_rate": 0.0001799357666655434, "loss": 0.0143, "step": 308790 }, { "epoch": 0.8, "learning_rate": 0.00017993187844917192, "loss": 0.014, "step": 308800 }, { "epoch": 0.8, "learning_rate": 0.00017992799023280046, "loss": 0.0156, "step": 308810 }, { "epoch": 0.8, "learning_rate": 0.00017992410201642898, "loss": 0.015, "step": 308820 }, { "epoch": 0.8, "learning_rate": 0.00017992021380005754, "loss": 0.0128, "step": 308830 }, { "epoch": 0.8, "learning_rate": 0.00017991632558368606, "loss": 0.0157, "step": 308840 }, { "epoch": 0.8, "learning_rate": 0.0001799124373673146, "loss": 0.0129, "step": 308850 }, { "epoch": 0.8, "learning_rate": 0.00017990854915094312, "loss": 0.0153, "step": 308860 }, { "epoch": 0.8, "learning_rate": 0.00017990466093457168, "loss": 0.0167, "step": 308870 }, { "epoch": 0.8, "learning_rate": 0.00017990077271820023, "loss": 0.0117, "step": 308880 }, { "epoch": 0.8, "learning_rate": 0.00017989688450182874, "loss": 0.0151, "step": 308890 }, { "epoch": 0.8, "learning_rate": 0.00017989299628545728, "loss": 0.0163, "step": 308900 }, { "epoch": 0.8, "learning_rate": 0.0001798891080690858, "loss": 0.0129, "step": 308910 }, { "epoch": 0.8, "learning_rate": 0.00017988521985271437, "loss": 0.0142, "step": 308920 }, { "epoch": 0.8, "learning_rate": 0.00017988133163634288, "loss": 0.0163, "step": 308930 }, { "epoch": 0.8, "learning_rate": 0.00017987744341997142, "loss": 0.0177, "step": 308940 }, { "epoch": 0.8, "learning_rate": 0.00017987355520359994, "loss": 0.0156, "step": 308950 }, { "epoch": 0.8, "learning_rate": 0.0001798696669872285, "loss": 0.0154, "step": 308960 }, { "epoch": 0.8, "learning_rate": 0.00017986577877085702, "loss": 0.0104, "step": 308970 }, { "epoch": 0.8, "learning_rate": 0.00017986189055448556, "loss": 0.0151, "step": 308980 }, { "epoch": 0.8, "learning_rate": 0.00017985800233811408, "loss": 0.0162, "step": 308990 }, { "epoch": 0.8, "learning_rate": 0.00017985411412174264, "loss": 0.0138, "step": 309000 }, { "epoch": 0.8, "eval_cer": 0.8817138834186412, "eval_loss": 0.009455575607717037, "eval_runtime": 107.8878, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.634, "step": 309000 }, { "epoch": 0.8, "learning_rate": 0.00017985022590537116, "loss": 0.0127, "step": 309010 }, { "epoch": 0.8, "learning_rate": 0.0001798463376889997, "loss": 0.0138, "step": 309020 }, { "epoch": 0.8, "learning_rate": 0.00017984244947262821, "loss": 0.0113, "step": 309030 }, { "epoch": 0.8, "learning_rate": 0.00017983856125625678, "loss": 0.0121, "step": 309040 }, { "epoch": 0.8, "learning_rate": 0.00017983467303988533, "loss": 0.0122, "step": 309050 }, { "epoch": 0.8, "learning_rate": 0.00017983078482351384, "loss": 0.0171, "step": 309060 }, { "epoch": 0.8, "learning_rate": 0.00017982689660714235, "loss": 0.0115, "step": 309070 }, { "epoch": 0.8, "learning_rate": 0.00017982300839077092, "loss": 0.0125, "step": 309080 }, { "epoch": 0.8, "learning_rate": 0.00017981912017439946, "loss": 0.015, "step": 309090 }, { "epoch": 0.8, "learning_rate": 0.00017981523195802798, "loss": 0.0178, "step": 309100 }, { "epoch": 0.8, "learning_rate": 0.00017981134374165652, "loss": 0.0131, "step": 309110 }, { "epoch": 0.8, "learning_rate": 0.00017980745552528506, "loss": 0.0124, "step": 309120 }, { "epoch": 0.8, "learning_rate": 0.0001798035673089136, "loss": 0.0106, "step": 309130 }, { "epoch": 0.8, "learning_rate": 0.00017979967909254212, "loss": 0.0177, "step": 309140 }, { "epoch": 0.8, "learning_rate": 0.00017979579087617066, "loss": 0.011, "step": 309150 }, { "epoch": 0.8, "learning_rate": 0.00017979190265979917, "loss": 0.0135, "step": 309160 }, { "epoch": 0.8, "learning_rate": 0.00017978801444342774, "loss": 0.0143, "step": 309170 }, { "epoch": 0.8, "learning_rate": 0.00017978412622705626, "loss": 0.0125, "step": 309180 }, { "epoch": 0.8, "learning_rate": 0.0001797802380106848, "loss": 0.0152, "step": 309190 }, { "epoch": 0.8, "learning_rate": 0.00017977634979431331, "loss": 0.0131, "step": 309200 }, { "epoch": 0.8, "learning_rate": 0.00017977246157794188, "loss": 0.0137, "step": 309210 }, { "epoch": 0.8, "learning_rate": 0.00017976857336157042, "loss": 0.0144, "step": 309220 }, { "epoch": 0.8, "learning_rate": 0.00017976468514519894, "loss": 0.0156, "step": 309230 }, { "epoch": 0.8, "learning_rate": 0.00017976079692882745, "loss": 0.012, "step": 309240 }, { "epoch": 0.8, "learning_rate": 0.00017975690871245602, "loss": 0.0143, "step": 309250 }, { "epoch": 0.8, "learning_rate": 0.00017975302049608456, "loss": 0.0133, "step": 309260 }, { "epoch": 0.8, "learning_rate": 0.00017974913227971308, "loss": 0.0163, "step": 309270 }, { "epoch": 0.8, "learning_rate": 0.00017974524406334162, "loss": 0.0144, "step": 309280 }, { "epoch": 0.8, "learning_rate": 0.00017974135584697016, "loss": 0.0172, "step": 309290 }, { "epoch": 0.8, "learning_rate": 0.0001797374676305987, "loss": 0.0145, "step": 309300 }, { "epoch": 0.8, "learning_rate": 0.00017973357941422722, "loss": 0.0139, "step": 309310 }, { "epoch": 0.8, "learning_rate": 0.00017972969119785576, "loss": 0.013, "step": 309320 }, { "epoch": 0.8, "learning_rate": 0.0001797258029814843, "loss": 0.0163, "step": 309330 }, { "epoch": 0.8, "learning_rate": 0.00017972191476511284, "loss": 0.0139, "step": 309340 }, { "epoch": 0.8, "learning_rate": 0.00017971802654874136, "loss": 0.0113, "step": 309350 }, { "epoch": 0.8, "learning_rate": 0.0001797141383323699, "loss": 0.013, "step": 309360 }, { "epoch": 0.8, "learning_rate": 0.00017971025011599847, "loss": 0.0142, "step": 309370 }, { "epoch": 0.8, "learning_rate": 0.00017970636189962698, "loss": 0.0158, "step": 309380 }, { "epoch": 0.8, "learning_rate": 0.0001797024736832555, "loss": 0.0128, "step": 309390 }, { "epoch": 0.8, "learning_rate": 0.00017969858546688404, "loss": 0.0163, "step": 309400 }, { "epoch": 0.8, "learning_rate": 0.00017969469725051255, "loss": 0.014, "step": 309410 }, { "epoch": 0.8, "learning_rate": 0.00017969080903414112, "loss": 0.0145, "step": 309420 }, { "epoch": 0.8, "learning_rate": 0.00017968692081776966, "loss": 0.0151, "step": 309430 }, { "epoch": 0.8, "learning_rate": 0.00017968303260139818, "loss": 0.0132, "step": 309440 }, { "epoch": 0.8, "learning_rate": 0.00017967914438502672, "loss": 0.0141, "step": 309450 }, { "epoch": 0.8, "learning_rate": 0.00017967525616865526, "loss": 0.0152, "step": 309460 }, { "epoch": 0.8, "learning_rate": 0.0001796713679522838, "loss": 0.015, "step": 309470 }, { "epoch": 0.8, "learning_rate": 0.00017966747973591232, "loss": 0.015, "step": 309480 }, { "epoch": 0.8, "learning_rate": 0.00017966359151954086, "loss": 0.0122, "step": 309490 }, { "epoch": 0.8, "learning_rate": 0.0001796597033031694, "loss": 0.0137, "step": 309500 }, { "epoch": 0.8, "learning_rate": 0.00017965581508679794, "loss": 0.0146, "step": 309510 }, { "epoch": 0.8, "learning_rate": 0.00017965192687042646, "loss": 0.0144, "step": 309520 }, { "epoch": 0.8, "learning_rate": 0.000179648038654055, "loss": 0.015, "step": 309530 }, { "epoch": 0.8, "learning_rate": 0.00017964415043768357, "loss": 0.0117, "step": 309540 }, { "epoch": 0.8, "learning_rate": 0.00017964026222131208, "loss": 0.0164, "step": 309550 }, { "epoch": 0.8, "learning_rate": 0.0001796363740049406, "loss": 0.0156, "step": 309560 }, { "epoch": 0.8, "learning_rate": 0.00017963248578856914, "loss": 0.01, "step": 309570 }, { "epoch": 0.8, "learning_rate": 0.0001796285975721977, "loss": 0.014, "step": 309580 }, { "epoch": 0.8, "learning_rate": 0.00017962470935582622, "loss": 0.0146, "step": 309590 }, { "epoch": 0.8, "learning_rate": 0.00017962082113945476, "loss": 0.0142, "step": 309600 }, { "epoch": 0.8, "learning_rate": 0.00017961693292308328, "loss": 0.0139, "step": 309610 }, { "epoch": 0.8, "learning_rate": 0.00017961304470671185, "loss": 0.0123, "step": 309620 }, { "epoch": 0.8, "learning_rate": 0.00017960915649034036, "loss": 0.0196, "step": 309630 }, { "epoch": 0.8, "learning_rate": 0.0001796052682739689, "loss": 0.0162, "step": 309640 }, { "epoch": 0.8, "learning_rate": 0.00017960138005759742, "loss": 0.0141, "step": 309650 }, { "epoch": 0.8, "learning_rate": 0.00017959749184122596, "loss": 0.0137, "step": 309660 }, { "epoch": 0.8, "learning_rate": 0.0001795936036248545, "loss": 0.0133, "step": 309670 }, { "epoch": 0.8, "learning_rate": 0.00017958971540848304, "loss": 0.0153, "step": 309680 }, { "epoch": 0.8, "learning_rate": 0.00017958582719211156, "loss": 0.0172, "step": 309690 }, { "epoch": 0.8, "learning_rate": 0.0001795819389757401, "loss": 0.015, "step": 309700 }, { "epoch": 0.8, "learning_rate": 0.00017957805075936864, "loss": 0.0166, "step": 309710 }, { "epoch": 0.8, "learning_rate": 0.00017957416254299718, "loss": 0.0139, "step": 309720 }, { "epoch": 0.8, "learning_rate": 0.0001795702743266257, "loss": 0.0136, "step": 309730 }, { "epoch": 0.8, "learning_rate": 0.00017956638611025424, "loss": 0.0153, "step": 309740 }, { "epoch": 0.8, "learning_rate": 0.0001795624978938828, "loss": 0.0158, "step": 309750 }, { "epoch": 0.8, "learning_rate": 0.00017955860967751132, "loss": 0.0131, "step": 309760 }, { "epoch": 0.8, "learning_rate": 0.00017955472146113986, "loss": 0.012, "step": 309770 }, { "epoch": 0.8, "learning_rate": 0.00017955083324476838, "loss": 0.0154, "step": 309780 }, { "epoch": 0.8, "learning_rate": 0.00017954694502839695, "loss": 0.0115, "step": 309790 }, { "epoch": 0.8, "learning_rate": 0.00017954305681202546, "loss": 0.0146, "step": 309800 }, { "epoch": 0.8, "learning_rate": 0.000179539168595654, "loss": 0.0155, "step": 309810 }, { "epoch": 0.8, "learning_rate": 0.00017953528037928252, "loss": 0.0202, "step": 309820 }, { "epoch": 0.8, "learning_rate": 0.00017953139216291109, "loss": 0.0125, "step": 309830 }, { "epoch": 0.8, "learning_rate": 0.0001795275039465396, "loss": 0.0182, "step": 309840 }, { "epoch": 0.8, "learning_rate": 0.00017952361573016814, "loss": 0.0162, "step": 309850 }, { "epoch": 0.8, "learning_rate": 0.00017951972751379666, "loss": 0.0166, "step": 309860 }, { "epoch": 0.8, "learning_rate": 0.00017951583929742522, "loss": 0.013, "step": 309870 }, { "epoch": 0.8, "learning_rate": 0.00017951195108105374, "loss": 0.0134, "step": 309880 }, { "epoch": 0.8, "learning_rate": 0.00017950806286468228, "loss": 0.0145, "step": 309890 }, { "epoch": 0.8, "learning_rate": 0.0001795041746483108, "loss": 0.0132, "step": 309900 }, { "epoch": 0.8, "learning_rate": 0.00017950028643193934, "loss": 0.0153, "step": 309910 }, { "epoch": 0.8, "learning_rate": 0.0001794963982155679, "loss": 0.0146, "step": 309920 }, { "epoch": 0.8, "learning_rate": 0.00017949250999919642, "loss": 0.0152, "step": 309930 }, { "epoch": 0.8, "learning_rate": 0.00017948862178282496, "loss": 0.0114, "step": 309940 }, { "epoch": 0.8, "learning_rate": 0.00017948473356645348, "loss": 0.0175, "step": 309950 }, { "epoch": 0.8, "learning_rate": 0.00017948084535008205, "loss": 0.0154, "step": 309960 }, { "epoch": 0.8, "learning_rate": 0.00017947695713371056, "loss": 0.0162, "step": 309970 }, { "epoch": 0.8, "learning_rate": 0.0001794730689173391, "loss": 0.012, "step": 309980 }, { "epoch": 0.8, "learning_rate": 0.00017946918070096762, "loss": 0.0156, "step": 309990 }, { "epoch": 0.8, "learning_rate": 0.00017946529248459618, "loss": 0.0144, "step": 310000 }, { "epoch": 0.8, "eval_cer": 0.8817222812402463, "eval_loss": 0.009546291083097458, "eval_runtime": 107.8383, "eval_samples_per_second": 18.546, "eval_steps_per_second": 4.637, "step": 310000 }, { "epoch": 0.8, "learning_rate": 0.0001794614042682247, "loss": 0.0172, "step": 310010 }, { "epoch": 0.8, "learning_rate": 0.00017945751605185324, "loss": 0.0134, "step": 310020 }, { "epoch": 0.8, "learning_rate": 0.00017945362783548176, "loss": 0.0173, "step": 310030 }, { "epoch": 0.8, "learning_rate": 0.00017944973961911032, "loss": 0.0127, "step": 310040 }, { "epoch": 0.8, "learning_rate": 0.00017944585140273884, "loss": 0.0145, "step": 310050 }, { "epoch": 0.8, "learning_rate": 0.00017944196318636738, "loss": 0.0168, "step": 310060 }, { "epoch": 0.8, "learning_rate": 0.0001794380749699959, "loss": 0.0138, "step": 310070 }, { "epoch": 0.8, "learning_rate": 0.00017943418675362446, "loss": 0.0147, "step": 310080 }, { "epoch": 0.8, "learning_rate": 0.000179430298537253, "loss": 0.0104, "step": 310090 }, { "epoch": 0.8, "learning_rate": 0.00017942641032088152, "loss": 0.0153, "step": 310100 }, { "epoch": 0.8, "learning_rate": 0.00017942252210451003, "loss": 0.0108, "step": 310110 }, { "epoch": 0.8, "learning_rate": 0.0001794186338881386, "loss": 0.0158, "step": 310120 }, { "epoch": 0.8, "learning_rate": 0.00017941474567176714, "loss": 0.0133, "step": 310130 }, { "epoch": 0.8, "learning_rate": 0.00017941085745539566, "loss": 0.0132, "step": 310140 }, { "epoch": 0.8, "learning_rate": 0.0001794069692390242, "loss": 0.0132, "step": 310150 }, { "epoch": 0.8, "learning_rate": 0.00017940308102265272, "loss": 0.0095, "step": 310160 }, { "epoch": 0.8, "learning_rate": 0.00017939919280628128, "loss": 0.0094, "step": 310170 }, { "epoch": 0.8, "learning_rate": 0.0001793953045899098, "loss": 0.0134, "step": 310180 }, { "epoch": 0.8, "learning_rate": 0.00017939141637353834, "loss": 0.0139, "step": 310190 }, { "epoch": 0.8, "learning_rate": 0.00017938752815716685, "loss": 0.0141, "step": 310200 }, { "epoch": 0.8, "learning_rate": 0.00017938363994079542, "loss": 0.0117, "step": 310210 }, { "epoch": 0.8, "learning_rate": 0.00017937975172442394, "loss": 0.0119, "step": 310220 }, { "epoch": 0.8, "learning_rate": 0.00017937586350805248, "loss": 0.0116, "step": 310230 }, { "epoch": 0.8, "learning_rate": 0.000179371975291681, "loss": 0.0126, "step": 310240 }, { "epoch": 0.8, "learning_rate": 0.00017936808707530956, "loss": 0.0155, "step": 310250 }, { "epoch": 0.8, "learning_rate": 0.00017936419885893808, "loss": 0.0156, "step": 310260 }, { "epoch": 0.8, "learning_rate": 0.00017936031064256662, "loss": 0.0145, "step": 310270 }, { "epoch": 0.8, "learning_rate": 0.00017935642242619513, "loss": 0.0129, "step": 310280 }, { "epoch": 0.8, "learning_rate": 0.0001793525342098237, "loss": 0.0136, "step": 310290 }, { "epoch": 0.8, "learning_rate": 0.00017934864599345224, "loss": 0.0168, "step": 310300 }, { "epoch": 0.8, "learning_rate": 0.00017934475777708076, "loss": 0.0134, "step": 310310 }, { "epoch": 0.8, "learning_rate": 0.0001793408695607093, "loss": 0.014, "step": 310320 }, { "epoch": 0.8, "learning_rate": 0.00017933698134433784, "loss": 0.0157, "step": 310330 }, { "epoch": 0.8, "learning_rate": 0.00017933309312796638, "loss": 0.0157, "step": 310340 }, { "epoch": 0.8, "learning_rate": 0.0001793292049115949, "loss": 0.0136, "step": 310350 }, { "epoch": 0.8, "learning_rate": 0.00017932531669522344, "loss": 0.0109, "step": 310360 }, { "epoch": 0.8, "learning_rate": 0.00017932142847885198, "loss": 0.0177, "step": 310370 }, { "epoch": 0.8, "learning_rate": 0.00017931754026248052, "loss": 0.0178, "step": 310380 }, { "epoch": 0.8, "learning_rate": 0.00017931365204610904, "loss": 0.0141, "step": 310390 }, { "epoch": 0.8, "learning_rate": 0.00017930976382973758, "loss": 0.0152, "step": 310400 }, { "epoch": 0.8, "learning_rate": 0.0001793058756133661, "loss": 0.0144, "step": 310410 }, { "epoch": 0.8, "learning_rate": 0.00017930198739699466, "loss": 0.0165, "step": 310420 }, { "epoch": 0.8, "learning_rate": 0.00017929809918062318, "loss": 0.014, "step": 310430 }, { "epoch": 0.8, "learning_rate": 0.00017929421096425172, "loss": 0.0127, "step": 310440 }, { "epoch": 0.8, "learning_rate": 0.00017929032274788023, "loss": 0.0163, "step": 310450 }, { "epoch": 0.8, "learning_rate": 0.0001792864345315088, "loss": 0.0138, "step": 310460 }, { "epoch": 0.8, "learning_rate": 0.00017928254631513734, "loss": 0.0141, "step": 310470 }, { "epoch": 0.8, "learning_rate": 0.00017927865809876586, "loss": 0.0146, "step": 310480 }, { "epoch": 0.8, "learning_rate": 0.0001792747698823944, "loss": 0.0122, "step": 310490 }, { "epoch": 0.8, "learning_rate": 0.00017927088166602294, "loss": 0.0152, "step": 310500 }, { "epoch": 0.8, "learning_rate": 0.00017926699344965148, "loss": 0.0138, "step": 310510 }, { "epoch": 0.8, "learning_rate": 0.00017926310523328, "loss": 0.0114, "step": 310520 }, { "epoch": 0.8, "learning_rate": 0.00017925921701690854, "loss": 0.0115, "step": 310530 }, { "epoch": 0.8, "learning_rate": 0.00017925532880053708, "loss": 0.0128, "step": 310540 }, { "epoch": 0.8, "learning_rate": 0.00017925144058416562, "loss": 0.0135, "step": 310550 }, { "epoch": 0.81, "learning_rate": 0.00017924755236779414, "loss": 0.013, "step": 310560 }, { "epoch": 0.81, "learning_rate": 0.00017924366415142268, "loss": 0.0142, "step": 310570 }, { "epoch": 0.81, "learning_rate": 0.00017923977593505122, "loss": 0.016, "step": 310580 }, { "epoch": 0.81, "learning_rate": 0.00017923588771867976, "loss": 0.0126, "step": 310590 }, { "epoch": 0.81, "learning_rate": 0.00017923199950230828, "loss": 0.0145, "step": 310600 }, { "epoch": 0.81, "learning_rate": 0.00017922811128593682, "loss": 0.0155, "step": 310610 }, { "epoch": 0.81, "learning_rate": 0.0001792242230695654, "loss": 0.0119, "step": 310620 }, { "epoch": 0.81, "learning_rate": 0.0001792203348531939, "loss": 0.0151, "step": 310630 }, { "epoch": 0.81, "learning_rate": 0.00017921644663682244, "loss": 0.0171, "step": 310640 }, { "epoch": 0.81, "learning_rate": 0.00017921255842045096, "loss": 0.0145, "step": 310650 }, { "epoch": 0.81, "learning_rate": 0.00017920867020407947, "loss": 0.0132, "step": 310660 }, { "epoch": 0.81, "learning_rate": 0.00017920478198770804, "loss": 0.0144, "step": 310670 }, { "epoch": 0.81, "learning_rate": 0.00017920089377133658, "loss": 0.0143, "step": 310680 }, { "epoch": 0.81, "learning_rate": 0.0001791970055549651, "loss": 0.0096, "step": 310690 }, { "epoch": 0.81, "learning_rate": 0.00017919311733859364, "loss": 0.0138, "step": 310700 }, { "epoch": 0.81, "learning_rate": 0.00017918922912222218, "loss": 0.0125, "step": 310710 }, { "epoch": 0.81, "learning_rate": 0.00017918534090585072, "loss": 0.0144, "step": 310720 }, { "epoch": 0.81, "learning_rate": 0.00017918145268947924, "loss": 0.0109, "step": 310730 }, { "epoch": 0.81, "learning_rate": 0.00017917756447310778, "loss": 0.0137, "step": 310740 }, { "epoch": 0.81, "learning_rate": 0.00017917367625673632, "loss": 0.0167, "step": 310750 }, { "epoch": 0.81, "learning_rate": 0.00017916978804036486, "loss": 0.0159, "step": 310760 }, { "epoch": 0.81, "learning_rate": 0.00017916589982399338, "loss": 0.0134, "step": 310770 }, { "epoch": 0.81, "learning_rate": 0.00017916201160762192, "loss": 0.0144, "step": 310780 }, { "epoch": 0.81, "learning_rate": 0.00017915812339125049, "loss": 0.0163, "step": 310790 }, { "epoch": 0.81, "learning_rate": 0.000179154235174879, "loss": 0.0112, "step": 310800 }, { "epoch": 0.81, "learning_rate": 0.00017915034695850754, "loss": 0.0153, "step": 310810 }, { "epoch": 0.81, "learning_rate": 0.00017914645874213606, "loss": 0.0124, "step": 310820 }, { "epoch": 0.81, "learning_rate": 0.00017914257052576463, "loss": 0.013, "step": 310830 }, { "epoch": 0.81, "learning_rate": 0.00017913868230939314, "loss": 0.0148, "step": 310840 }, { "epoch": 0.81, "learning_rate": 0.00017913479409302168, "loss": 0.0102, "step": 310850 }, { "epoch": 0.81, "learning_rate": 0.0001791309058766502, "loss": 0.0222, "step": 310860 }, { "epoch": 0.81, "learning_rate": 0.00017912701766027876, "loss": 0.0163, "step": 310870 }, { "epoch": 0.81, "learning_rate": 0.00017912312944390728, "loss": 0.0134, "step": 310880 }, { "epoch": 0.81, "learning_rate": 0.00017911924122753582, "loss": 0.0115, "step": 310890 }, { "epoch": 0.81, "learning_rate": 0.00017911535301116434, "loss": 0.0146, "step": 310900 }, { "epoch": 0.81, "learning_rate": 0.00017911146479479288, "loss": 0.0154, "step": 310910 }, { "epoch": 0.81, "learning_rate": 0.00017910757657842142, "loss": 0.012, "step": 310920 }, { "epoch": 0.81, "learning_rate": 0.00017910368836204996, "loss": 0.015, "step": 310930 }, { "epoch": 0.81, "learning_rate": 0.00017909980014567848, "loss": 0.0169, "step": 310940 }, { "epoch": 0.81, "learning_rate": 0.00017909591192930702, "loss": 0.0122, "step": 310950 }, { "epoch": 0.81, "learning_rate": 0.00017909202371293559, "loss": 0.013, "step": 310960 }, { "epoch": 0.81, "learning_rate": 0.0001790881354965641, "loss": 0.0115, "step": 310970 }, { "epoch": 0.81, "learning_rate": 0.00017908424728019261, "loss": 0.0124, "step": 310980 }, { "epoch": 0.81, "learning_rate": 0.00017908035906382116, "loss": 0.013, "step": 310990 }, { "epoch": 0.81, "learning_rate": 0.00017907647084744972, "loss": 0.0165, "step": 311000 }, { "epoch": 0.81, "eval_cer": 0.8817222812402463, "eval_loss": 0.009462043642997742, "eval_runtime": 107.7393, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 311000 }, { "epoch": 0.81, "learning_rate": 0.00017907258263107824, "loss": 0.0137, "step": 311010 }, { "epoch": 0.81, "learning_rate": 0.00017906869441470678, "loss": 0.0148, "step": 311020 }, { "epoch": 0.81, "learning_rate": 0.0001790648061983353, "loss": 0.0125, "step": 311030 }, { "epoch": 0.81, "learning_rate": 0.00017906091798196386, "loss": 0.0136, "step": 311040 }, { "epoch": 0.81, "learning_rate": 0.00017905702976559238, "loss": 0.016, "step": 311050 }, { "epoch": 0.81, "learning_rate": 0.00017905314154922092, "loss": 0.0151, "step": 311060 }, { "epoch": 0.81, "learning_rate": 0.00017904925333284944, "loss": 0.0115, "step": 311070 }, { "epoch": 0.81, "learning_rate": 0.000179045365116478, "loss": 0.0164, "step": 311080 }, { "epoch": 0.81, "learning_rate": 0.00017904147690010652, "loss": 0.0128, "step": 311090 }, { "epoch": 0.81, "learning_rate": 0.00017903758868373506, "loss": 0.0131, "step": 311100 }, { "epoch": 0.81, "learning_rate": 0.00017903370046736357, "loss": 0.0192, "step": 311110 }, { "epoch": 0.81, "learning_rate": 0.00017902981225099214, "loss": 0.0105, "step": 311120 }, { "epoch": 0.81, "learning_rate": 0.00017902592403462066, "loss": 0.0138, "step": 311130 }, { "epoch": 0.81, "learning_rate": 0.0001790220358182492, "loss": 0.0137, "step": 311140 }, { "epoch": 0.81, "learning_rate": 0.00017901814760187771, "loss": 0.0123, "step": 311150 }, { "epoch": 0.81, "learning_rate": 0.00017901425938550626, "loss": 0.0139, "step": 311160 }, { "epoch": 0.81, "learning_rate": 0.00017901037116913482, "loss": 0.0151, "step": 311170 }, { "epoch": 0.81, "learning_rate": 0.00017900648295276334, "loss": 0.0145, "step": 311180 }, { "epoch": 0.81, "learning_rate": 0.00017900259473639188, "loss": 0.0126, "step": 311190 }, { "epoch": 0.81, "learning_rate": 0.0001789987065200204, "loss": 0.0129, "step": 311200 }, { "epoch": 0.81, "learning_rate": 0.00017899481830364896, "loss": 0.0157, "step": 311210 }, { "epoch": 0.81, "learning_rate": 0.00017899093008727748, "loss": 0.0122, "step": 311220 }, { "epoch": 0.81, "learning_rate": 0.00017898704187090602, "loss": 0.0116, "step": 311230 }, { "epoch": 0.81, "learning_rate": 0.00017898315365453453, "loss": 0.0155, "step": 311240 }, { "epoch": 0.81, "learning_rate": 0.0001789792654381631, "loss": 0.0138, "step": 311250 }, { "epoch": 0.81, "learning_rate": 0.00017897537722179162, "loss": 0.0114, "step": 311260 }, { "epoch": 0.81, "learning_rate": 0.00017897148900542016, "loss": 0.0113, "step": 311270 }, { "epoch": 0.81, "learning_rate": 0.00017896760078904867, "loss": 0.0163, "step": 311280 }, { "epoch": 0.81, "learning_rate": 0.00017896371257267724, "loss": 0.011, "step": 311290 }, { "epoch": 0.81, "learning_rate": 0.00017895982435630576, "loss": 0.0136, "step": 311300 }, { "epoch": 0.81, "learning_rate": 0.0001789559361399343, "loss": 0.0129, "step": 311310 }, { "epoch": 0.81, "learning_rate": 0.0001789520479235628, "loss": 0.014, "step": 311320 }, { "epoch": 0.81, "learning_rate": 0.00017894815970719138, "loss": 0.0137, "step": 311330 }, { "epoch": 0.81, "learning_rate": 0.00017894427149081992, "loss": 0.0124, "step": 311340 }, { "epoch": 0.81, "learning_rate": 0.00017894038327444844, "loss": 0.0129, "step": 311350 }, { "epoch": 0.81, "learning_rate": 0.00017893649505807698, "loss": 0.0167, "step": 311360 }, { "epoch": 0.81, "learning_rate": 0.00017893260684170552, "loss": 0.0136, "step": 311370 }, { "epoch": 0.81, "learning_rate": 0.00017892871862533406, "loss": 0.0124, "step": 311380 }, { "epoch": 0.81, "learning_rate": 0.00017892483040896258, "loss": 0.0124, "step": 311390 }, { "epoch": 0.81, "learning_rate": 0.00017892094219259112, "loss": 0.0144, "step": 311400 }, { "epoch": 0.81, "learning_rate": 0.00017891705397621963, "loss": 0.0123, "step": 311410 }, { "epoch": 0.81, "learning_rate": 0.0001789131657598482, "loss": 0.0143, "step": 311420 }, { "epoch": 0.81, "learning_rate": 0.00017890927754347672, "loss": 0.0136, "step": 311430 }, { "epoch": 0.81, "learning_rate": 0.00017890538932710526, "loss": 0.017, "step": 311440 }, { "epoch": 0.81, "learning_rate": 0.00017890150111073377, "loss": 0.0131, "step": 311450 }, { "epoch": 0.81, "learning_rate": 0.00017889761289436234, "loss": 0.0148, "step": 311460 }, { "epoch": 0.81, "learning_rate": 0.00017889372467799086, "loss": 0.0102, "step": 311470 }, { "epoch": 0.81, "learning_rate": 0.0001788898364616194, "loss": 0.0168, "step": 311480 }, { "epoch": 0.81, "learning_rate": 0.0001788859482452479, "loss": 0.0206, "step": 311490 }, { "epoch": 0.81, "learning_rate": 0.00017888206002887648, "loss": 0.0153, "step": 311500 }, { "epoch": 0.81, "learning_rate": 0.00017887817181250502, "loss": 0.0148, "step": 311510 }, { "epoch": 0.81, "learning_rate": 0.00017887428359613354, "loss": 0.0141, "step": 311520 }, { "epoch": 0.81, "learning_rate": 0.00017887039537976208, "loss": 0.0141, "step": 311530 }, { "epoch": 0.81, "learning_rate": 0.00017886650716339062, "loss": 0.0143, "step": 311540 }, { "epoch": 0.81, "learning_rate": 0.00017886261894701916, "loss": 0.0149, "step": 311550 }, { "epoch": 0.81, "learning_rate": 0.00017885873073064768, "loss": 0.0122, "step": 311560 }, { "epoch": 0.81, "learning_rate": 0.00017885484251427622, "loss": 0.0142, "step": 311570 }, { "epoch": 0.81, "learning_rate": 0.00017885095429790476, "loss": 0.0128, "step": 311580 }, { "epoch": 0.81, "learning_rate": 0.0001788470660815333, "loss": 0.015, "step": 311590 }, { "epoch": 0.81, "learning_rate": 0.00017884317786516182, "loss": 0.0104, "step": 311600 }, { "epoch": 0.81, "learning_rate": 0.00017883928964879036, "loss": 0.0142, "step": 311610 }, { "epoch": 0.81, "learning_rate": 0.0001788354014324189, "loss": 0.0137, "step": 311620 }, { "epoch": 0.81, "learning_rate": 0.00017883151321604744, "loss": 0.0152, "step": 311630 }, { "epoch": 0.81, "learning_rate": 0.00017882762499967596, "loss": 0.0149, "step": 311640 }, { "epoch": 0.81, "learning_rate": 0.0001788237367833045, "loss": 0.0152, "step": 311650 }, { "epoch": 0.81, "learning_rate": 0.000178819848566933, "loss": 0.0115, "step": 311660 }, { "epoch": 0.81, "learning_rate": 0.00017881596035056158, "loss": 0.0145, "step": 311670 }, { "epoch": 0.81, "learning_rate": 0.00017881207213419012, "loss": 0.0156, "step": 311680 }, { "epoch": 0.81, "learning_rate": 0.00017880818391781864, "loss": 0.0141, "step": 311690 }, { "epoch": 0.81, "learning_rate": 0.00017880429570144715, "loss": 0.0081, "step": 311700 }, { "epoch": 0.81, "learning_rate": 0.00017880040748507572, "loss": 0.0117, "step": 311710 }, { "epoch": 0.81, "learning_rate": 0.00017879651926870426, "loss": 0.014, "step": 311720 }, { "epoch": 0.81, "learning_rate": 0.00017879263105233278, "loss": 0.0122, "step": 311730 }, { "epoch": 0.81, "learning_rate": 0.00017878874283596132, "loss": 0.0145, "step": 311740 }, { "epoch": 0.81, "learning_rate": 0.00017878485461958986, "loss": 0.0166, "step": 311750 }, { "epoch": 0.81, "learning_rate": 0.0001787809664032184, "loss": 0.0131, "step": 311760 }, { "epoch": 0.81, "learning_rate": 0.00017877707818684692, "loss": 0.0146, "step": 311770 }, { "epoch": 0.81, "learning_rate": 0.00017877318997047546, "loss": 0.0126, "step": 311780 }, { "epoch": 0.81, "learning_rate": 0.000178769301754104, "loss": 0.0168, "step": 311790 }, { "epoch": 0.81, "learning_rate": 0.00017876541353773254, "loss": 0.01, "step": 311800 }, { "epoch": 0.81, "learning_rate": 0.00017876152532136106, "loss": 0.013, "step": 311810 }, { "epoch": 0.81, "learning_rate": 0.0001787576371049896, "loss": 0.014, "step": 311820 }, { "epoch": 0.81, "learning_rate": 0.00017875374888861817, "loss": 0.013, "step": 311830 }, { "epoch": 0.81, "learning_rate": 0.00017874986067224668, "loss": 0.0154, "step": 311840 }, { "epoch": 0.81, "learning_rate": 0.0001787459724558752, "loss": 0.011, "step": 311850 }, { "epoch": 0.81, "learning_rate": 0.00017874208423950374, "loss": 0.0164, "step": 311860 }, { "epoch": 0.81, "learning_rate": 0.0001787381960231323, "loss": 0.014, "step": 311870 }, { "epoch": 0.81, "learning_rate": 0.00017873430780676082, "loss": 0.014, "step": 311880 }, { "epoch": 0.81, "learning_rate": 0.00017873041959038936, "loss": 0.0163, "step": 311890 }, { "epoch": 0.81, "learning_rate": 0.00017872653137401788, "loss": 0.0146, "step": 311900 }, { "epoch": 0.81, "learning_rate": 0.00017872264315764642, "loss": 0.016, "step": 311910 }, { "epoch": 0.81, "learning_rate": 0.00017871875494127496, "loss": 0.0168, "step": 311920 }, { "epoch": 0.81, "learning_rate": 0.0001787148667249035, "loss": 0.0166, "step": 311930 }, { "epoch": 0.81, "learning_rate": 0.00017871097850853202, "loss": 0.014, "step": 311940 }, { "epoch": 0.81, "learning_rate": 0.00017870709029216056, "loss": 0.014, "step": 311950 }, { "epoch": 0.81, "learning_rate": 0.0001787032020757891, "loss": 0.014, "step": 311960 }, { "epoch": 0.81, "learning_rate": 0.00017869931385941764, "loss": 0.0134, "step": 311970 }, { "epoch": 0.81, "learning_rate": 0.00017869542564304615, "loss": 0.0136, "step": 311980 }, { "epoch": 0.81, "learning_rate": 0.0001786915374266747, "loss": 0.0118, "step": 311990 }, { "epoch": 0.81, "learning_rate": 0.00017868764921030327, "loss": 0.0147, "step": 312000 }, { "epoch": 0.81, "eval_cer": 0.8817222812402463, "eval_loss": 0.009489587508141994, "eval_runtime": 107.733, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 312000 }, { "epoch": 0.81, "learning_rate": 0.00017868376099393178, "loss": 0.0161, "step": 312010 }, { "epoch": 0.81, "learning_rate": 0.0001786798727775603, "loss": 0.0142, "step": 312020 }, { "epoch": 0.81, "learning_rate": 0.00017867598456118884, "loss": 0.0109, "step": 312030 }, { "epoch": 0.81, "learning_rate": 0.0001786720963448174, "loss": 0.0124, "step": 312040 }, { "epoch": 0.81, "learning_rate": 0.00017866820812844592, "loss": 0.0108, "step": 312050 }, { "epoch": 0.81, "learning_rate": 0.00017866431991207446, "loss": 0.0146, "step": 312060 }, { "epoch": 0.81, "learning_rate": 0.00017866043169570298, "loss": 0.0143, "step": 312070 }, { "epoch": 0.81, "learning_rate": 0.00017865654347933154, "loss": 0.0172, "step": 312080 }, { "epoch": 0.81, "learning_rate": 0.00017865265526296006, "loss": 0.0092, "step": 312090 }, { "epoch": 0.81, "learning_rate": 0.0001786487670465886, "loss": 0.0143, "step": 312100 }, { "epoch": 0.81, "learning_rate": 0.00017864487883021711, "loss": 0.0136, "step": 312110 }, { "epoch": 0.81, "learning_rate": 0.00017864099061384566, "loss": 0.0165, "step": 312120 }, { "epoch": 0.81, "learning_rate": 0.0001786371023974742, "loss": 0.015, "step": 312130 }, { "epoch": 0.81, "learning_rate": 0.00017863321418110274, "loss": 0.0131, "step": 312140 }, { "epoch": 0.81, "learning_rate": 0.00017862932596473125, "loss": 0.0149, "step": 312150 }, { "epoch": 0.81, "learning_rate": 0.0001786254377483598, "loss": 0.0134, "step": 312160 }, { "epoch": 0.81, "learning_rate": 0.00017862154953198834, "loss": 0.0214, "step": 312170 }, { "epoch": 0.81, "learning_rate": 0.00017861766131561688, "loss": 0.0127, "step": 312180 }, { "epoch": 0.81, "learning_rate": 0.0001786137730992454, "loss": 0.0136, "step": 312190 }, { "epoch": 0.81, "learning_rate": 0.00017860988488287394, "loss": 0.013, "step": 312200 }, { "epoch": 0.81, "learning_rate": 0.0001786059966665025, "loss": 0.0133, "step": 312210 }, { "epoch": 0.81, "learning_rate": 0.00017860210845013102, "loss": 0.0132, "step": 312220 }, { "epoch": 0.81, "learning_rate": 0.00017859822023375956, "loss": 0.0112, "step": 312230 }, { "epoch": 0.81, "learning_rate": 0.00017859433201738807, "loss": 0.0108, "step": 312240 }, { "epoch": 0.81, "learning_rate": 0.00017859044380101664, "loss": 0.0121, "step": 312250 }, { "epoch": 0.81, "learning_rate": 0.00017858655558464516, "loss": 0.0154, "step": 312260 }, { "epoch": 0.81, "learning_rate": 0.0001785826673682737, "loss": 0.0129, "step": 312270 }, { "epoch": 0.81, "learning_rate": 0.00017857877915190221, "loss": 0.0159, "step": 312280 }, { "epoch": 0.81, "learning_rate": 0.00017857489093553078, "loss": 0.0139, "step": 312290 }, { "epoch": 0.81, "learning_rate": 0.0001785710027191593, "loss": 0.0109, "step": 312300 }, { "epoch": 0.81, "learning_rate": 0.00017856711450278784, "loss": 0.0139, "step": 312310 }, { "epoch": 0.81, "learning_rate": 0.00017856322628641635, "loss": 0.0115, "step": 312320 }, { "epoch": 0.81, "learning_rate": 0.00017855933807004492, "loss": 0.0146, "step": 312330 }, { "epoch": 0.81, "learning_rate": 0.00017855544985367344, "loss": 0.0151, "step": 312340 }, { "epoch": 0.81, "learning_rate": 0.00017855156163730198, "loss": 0.0143, "step": 312350 }, { "epoch": 0.81, "learning_rate": 0.0001785476734209305, "loss": 0.0158, "step": 312360 }, { "epoch": 0.81, "learning_rate": 0.00017854378520455903, "loss": 0.0114, "step": 312370 }, { "epoch": 0.81, "learning_rate": 0.0001785398969881876, "loss": 0.0125, "step": 312380 }, { "epoch": 0.81, "learning_rate": 0.00017853600877181612, "loss": 0.0136, "step": 312390 }, { "epoch": 0.81, "learning_rate": 0.00017853212055544466, "loss": 0.0143, "step": 312400 }, { "epoch": 0.81, "learning_rate": 0.00017852823233907317, "loss": 0.0119, "step": 312410 }, { "epoch": 0.81, "learning_rate": 0.00017852434412270174, "loss": 0.0155, "step": 312420 }, { "epoch": 0.81, "learning_rate": 0.00017852045590633026, "loss": 0.0131, "step": 312430 }, { "epoch": 0.81, "learning_rate": 0.0001785165676899588, "loss": 0.0112, "step": 312440 }, { "epoch": 0.81, "learning_rate": 0.00017851267947358731, "loss": 0.0167, "step": 312450 }, { "epoch": 0.81, "learning_rate": 0.00017850879125721588, "loss": 0.0172, "step": 312460 }, { "epoch": 0.81, "learning_rate": 0.0001785049030408444, "loss": 0.0144, "step": 312470 }, { "epoch": 0.81, "learning_rate": 0.00017850101482447294, "loss": 0.0129, "step": 312480 }, { "epoch": 0.81, "learning_rate": 0.00017849712660810145, "loss": 0.0127, "step": 312490 }, { "epoch": 0.81, "learning_rate": 0.00017849323839173002, "loss": 0.0128, "step": 312500 }, { "epoch": 0.81, "learning_rate": 0.00017848935017535854, "loss": 0.0162, "step": 312510 }, { "epoch": 0.81, "learning_rate": 0.00017848546195898708, "loss": 0.0174, "step": 312520 }, { "epoch": 0.81, "learning_rate": 0.0001784815737426156, "loss": 0.0145, "step": 312530 }, { "epoch": 0.81, "learning_rate": 0.00017847768552624416, "loss": 0.0143, "step": 312540 }, { "epoch": 0.81, "learning_rate": 0.0001784737973098727, "loss": 0.0135, "step": 312550 }, { "epoch": 0.81, "learning_rate": 0.00017846990909350122, "loss": 0.0176, "step": 312560 }, { "epoch": 0.81, "learning_rate": 0.00017846602087712973, "loss": 0.0144, "step": 312570 }, { "epoch": 0.81, "learning_rate": 0.0001784621326607583, "loss": 0.0121, "step": 312580 }, { "epoch": 0.81, "learning_rate": 0.00017845824444438684, "loss": 0.0129, "step": 312590 }, { "epoch": 0.81, "learning_rate": 0.00017845435622801536, "loss": 0.0146, "step": 312600 }, { "epoch": 0.81, "learning_rate": 0.0001784504680116439, "loss": 0.0148, "step": 312610 }, { "epoch": 0.81, "learning_rate": 0.0001784465797952724, "loss": 0.0111, "step": 312620 }, { "epoch": 0.81, "learning_rate": 0.00017844269157890098, "loss": 0.0106, "step": 312630 }, { "epoch": 0.81, "learning_rate": 0.0001784388033625295, "loss": 0.0143, "step": 312640 }, { "epoch": 0.81, "learning_rate": 0.00017843491514615804, "loss": 0.0189, "step": 312650 }, { "epoch": 0.81, "learning_rate": 0.00017843102692978655, "loss": 0.0149, "step": 312660 }, { "epoch": 0.81, "learning_rate": 0.00017842713871341512, "loss": 0.0147, "step": 312670 }, { "epoch": 0.81, "learning_rate": 0.00017842325049704364, "loss": 0.0133, "step": 312680 }, { "epoch": 0.81, "learning_rate": 0.00017841936228067218, "loss": 0.0134, "step": 312690 }, { "epoch": 0.81, "learning_rate": 0.0001784154740643007, "loss": 0.0131, "step": 312700 }, { "epoch": 0.81, "learning_rate": 0.00017841158584792926, "loss": 0.0162, "step": 312710 }, { "epoch": 0.81, "learning_rate": 0.00017840769763155778, "loss": 0.0159, "step": 312720 }, { "epoch": 0.81, "learning_rate": 0.00017840380941518632, "loss": 0.0135, "step": 312730 }, { "epoch": 0.81, "learning_rate": 0.00017839992119881483, "loss": 0.0172, "step": 312740 }, { "epoch": 0.81, "learning_rate": 0.0001783960329824434, "loss": 0.0145, "step": 312750 }, { "epoch": 0.81, "learning_rate": 0.00017839214476607194, "loss": 0.0158, "step": 312760 }, { "epoch": 0.81, "learning_rate": 0.00017838825654970046, "loss": 0.0118, "step": 312770 }, { "epoch": 0.81, "learning_rate": 0.000178384368333329, "loss": 0.0138, "step": 312780 }, { "epoch": 0.81, "learning_rate": 0.00017838048011695754, "loss": 0.0159, "step": 312790 }, { "epoch": 0.81, "learning_rate": 0.00017837659190058608, "loss": 0.0127, "step": 312800 }, { "epoch": 0.81, "learning_rate": 0.0001783727036842146, "loss": 0.0187, "step": 312810 }, { "epoch": 0.81, "learning_rate": 0.00017836881546784314, "loss": 0.013, "step": 312820 }, { "epoch": 0.81, "learning_rate": 0.00017836492725147168, "loss": 0.0146, "step": 312830 }, { "epoch": 0.81, "learning_rate": 0.00017836103903510022, "loss": 0.0147, "step": 312840 }, { "epoch": 0.81, "learning_rate": 0.00017835715081872874, "loss": 0.0114, "step": 312850 }, { "epoch": 0.81, "learning_rate": 0.00017835326260235728, "loss": 0.0157, "step": 312860 }, { "epoch": 0.81, "learning_rate": 0.0001783493743859858, "loss": 0.0126, "step": 312870 }, { "epoch": 0.81, "learning_rate": 0.00017834548616961436, "loss": 0.0136, "step": 312880 }, { "epoch": 0.81, "learning_rate": 0.00017834159795324287, "loss": 0.0135, "step": 312890 }, { "epoch": 0.81, "learning_rate": 0.00017833770973687142, "loss": 0.0138, "step": 312900 }, { "epoch": 0.81, "learning_rate": 0.00017833382152049993, "loss": 0.0168, "step": 312910 }, { "epoch": 0.81, "learning_rate": 0.0001783299333041285, "loss": 0.0139, "step": 312920 }, { "epoch": 0.81, "learning_rate": 0.00017832604508775704, "loss": 0.0132, "step": 312930 }, { "epoch": 0.81, "learning_rate": 0.00017832215687138556, "loss": 0.0131, "step": 312940 }, { "epoch": 0.81, "learning_rate": 0.0001783182686550141, "loss": 0.0148, "step": 312950 }, { "epoch": 0.81, "learning_rate": 0.00017831438043864264, "loss": 0.0151, "step": 312960 }, { "epoch": 0.81, "learning_rate": 0.00017831049222227118, "loss": 0.0138, "step": 312970 }, { "epoch": 0.81, "learning_rate": 0.0001783066040058997, "loss": 0.0103, "step": 312980 }, { "epoch": 0.81, "learning_rate": 0.00017830271578952824, "loss": 0.0135, "step": 312990 }, { "epoch": 0.81, "learning_rate": 0.00017829882757315678, "loss": 0.0127, "step": 313000 }, { "epoch": 0.81, "eval_cer": 0.8817208816033121, "eval_loss": 0.009489119984209538, "eval_runtime": 107.6322, "eval_samples_per_second": 18.582, "eval_steps_per_second": 4.645, "step": 313000 }, { "epoch": 0.81, "learning_rate": 0.00017829493935678532, "loss": 0.0174, "step": 313010 }, { "epoch": 0.81, "learning_rate": 0.00017829105114041383, "loss": 0.0113, "step": 313020 }, { "epoch": 0.81, "learning_rate": 0.00017828716292404238, "loss": 0.0159, "step": 313030 }, { "epoch": 0.81, "learning_rate": 0.00017828327470767092, "loss": 0.0129, "step": 313040 }, { "epoch": 0.81, "learning_rate": 0.00017827938649129946, "loss": 0.0109, "step": 313050 }, { "epoch": 0.81, "learning_rate": 0.00017827549827492797, "loss": 0.0133, "step": 313060 }, { "epoch": 0.81, "learning_rate": 0.00017827161005855652, "loss": 0.0138, "step": 313070 }, { "epoch": 0.81, "learning_rate": 0.00017826772184218508, "loss": 0.0117, "step": 313080 }, { "epoch": 0.81, "learning_rate": 0.0001782638336258136, "loss": 0.0126, "step": 313090 }, { "epoch": 0.81, "learning_rate": 0.00017825994540944214, "loss": 0.0115, "step": 313100 }, { "epoch": 0.81, "learning_rate": 0.00017825605719307066, "loss": 0.0152, "step": 313110 }, { "epoch": 0.81, "learning_rate": 0.0001782521689766992, "loss": 0.0107, "step": 313120 }, { "epoch": 0.81, "learning_rate": 0.00017824828076032774, "loss": 0.0191, "step": 313130 }, { "epoch": 0.81, "learning_rate": 0.00017824439254395628, "loss": 0.0161, "step": 313140 }, { "epoch": 0.81, "learning_rate": 0.0001782405043275848, "loss": 0.0103, "step": 313150 }, { "epoch": 0.81, "learning_rate": 0.00017823661611121334, "loss": 0.0144, "step": 313160 }, { "epoch": 0.81, "learning_rate": 0.00017823272789484188, "loss": 0.0161, "step": 313170 }, { "epoch": 0.81, "learning_rate": 0.00017822883967847042, "loss": 0.0126, "step": 313180 }, { "epoch": 0.81, "learning_rate": 0.00017822495146209893, "loss": 0.0112, "step": 313190 }, { "epoch": 0.81, "learning_rate": 0.00017822106324572748, "loss": 0.0139, "step": 313200 }, { "epoch": 0.81, "learning_rate": 0.00017821717502935602, "loss": 0.0139, "step": 313210 }, { "epoch": 0.81, "learning_rate": 0.00017821328681298456, "loss": 0.0117, "step": 313220 }, { "epoch": 0.81, "learning_rate": 0.00017820939859661307, "loss": 0.0154, "step": 313230 }, { "epoch": 0.81, "learning_rate": 0.00017820551038024162, "loss": 0.0154, "step": 313240 }, { "epoch": 0.81, "learning_rate": 0.00017820162216387018, "loss": 0.0117, "step": 313250 }, { "epoch": 0.81, "learning_rate": 0.0001781977339474987, "loss": 0.0138, "step": 313260 }, { "epoch": 0.81, "learning_rate": 0.00017819384573112724, "loss": 0.0189, "step": 313270 }, { "epoch": 0.81, "learning_rate": 0.00017818995751475575, "loss": 0.0158, "step": 313280 }, { "epoch": 0.81, "learning_rate": 0.00017818606929838432, "loss": 0.0177, "step": 313290 }, { "epoch": 0.81, "learning_rate": 0.00017818218108201284, "loss": 0.0127, "step": 313300 }, { "epoch": 0.81, "learning_rate": 0.00017817829286564138, "loss": 0.0145, "step": 313310 }, { "epoch": 0.81, "learning_rate": 0.0001781744046492699, "loss": 0.0184, "step": 313320 }, { "epoch": 0.81, "learning_rate": 0.00017817051643289846, "loss": 0.0142, "step": 313330 }, { "epoch": 0.81, "learning_rate": 0.00017816662821652698, "loss": 0.0136, "step": 313340 }, { "epoch": 0.81, "learning_rate": 0.00017816274000015552, "loss": 0.014, "step": 313350 }, { "epoch": 0.81, "learning_rate": 0.00017815885178378403, "loss": 0.0124, "step": 313360 }, { "epoch": 0.81, "learning_rate": 0.00017815496356741258, "loss": 0.0108, "step": 313370 }, { "epoch": 0.81, "learning_rate": 0.00017815107535104112, "loss": 0.0105, "step": 313380 }, { "epoch": 0.81, "learning_rate": 0.00017814718713466966, "loss": 0.015, "step": 313390 }, { "epoch": 0.81, "learning_rate": 0.00017814329891829817, "loss": 0.017, "step": 313400 }, { "epoch": 0.81, "learning_rate": 0.00017813941070192671, "loss": 0.0134, "step": 313410 }, { "epoch": 0.81, "learning_rate": 0.00017813552248555528, "loss": 0.0144, "step": 313420 }, { "epoch": 0.81, "learning_rate": 0.0001781316342691838, "loss": 0.0182, "step": 313430 }, { "epoch": 0.81, "learning_rate": 0.0001781277460528123, "loss": 0.0171, "step": 313440 }, { "epoch": 0.81, "learning_rate": 0.00017812385783644085, "loss": 0.0147, "step": 313450 }, { "epoch": 0.81, "learning_rate": 0.00017811996962006942, "loss": 0.0146, "step": 313460 }, { "epoch": 0.81, "learning_rate": 0.00017811608140369794, "loss": 0.0122, "step": 313470 }, { "epoch": 0.81, "learning_rate": 0.00017811219318732648, "loss": 0.0158, "step": 313480 }, { "epoch": 0.81, "learning_rate": 0.000178108304970955, "loss": 0.0169, "step": 313490 }, { "epoch": 0.81, "learning_rate": 0.00017810441675458356, "loss": 0.0125, "step": 313500 }, { "epoch": 0.81, "learning_rate": 0.00017810052853821208, "loss": 0.0133, "step": 313510 }, { "epoch": 0.81, "learning_rate": 0.00017809664032184062, "loss": 0.0178, "step": 313520 }, { "epoch": 0.81, "learning_rate": 0.00017809275210546913, "loss": 0.0139, "step": 313530 }, { "epoch": 0.81, "learning_rate": 0.0001780888638890977, "loss": 0.0141, "step": 313540 }, { "epoch": 0.81, "learning_rate": 0.00017808497567272622, "loss": 0.0156, "step": 313550 }, { "epoch": 0.81, "learning_rate": 0.00017808108745635476, "loss": 0.0113, "step": 313560 }, { "epoch": 0.81, "learning_rate": 0.00017807719923998327, "loss": 0.0129, "step": 313570 }, { "epoch": 0.81, "learning_rate": 0.00017807331102361184, "loss": 0.0129, "step": 313580 }, { "epoch": 0.81, "learning_rate": 0.00017806942280724038, "loss": 0.0131, "step": 313590 }, { "epoch": 0.81, "learning_rate": 0.0001780655345908689, "loss": 0.0132, "step": 313600 }, { "epoch": 0.81, "learning_rate": 0.0001780616463744974, "loss": 0.0166, "step": 313610 }, { "epoch": 0.81, "learning_rate": 0.00017805775815812595, "loss": 0.0147, "step": 313620 }, { "epoch": 0.81, "learning_rate": 0.00017805386994175452, "loss": 0.0172, "step": 313630 }, { "epoch": 0.81, "learning_rate": 0.00017804998172538304, "loss": 0.0171, "step": 313640 }, { "epoch": 0.81, "learning_rate": 0.00017804609350901158, "loss": 0.0148, "step": 313650 }, { "epoch": 0.81, "learning_rate": 0.0001780422052926401, "loss": 0.0194, "step": 313660 }, { "epoch": 0.81, "learning_rate": 0.00017803831707626866, "loss": 0.0142, "step": 313670 }, { "epoch": 0.81, "learning_rate": 0.00017803442885989718, "loss": 0.0141, "step": 313680 }, { "epoch": 0.81, "learning_rate": 0.00017803054064352572, "loss": 0.014, "step": 313690 }, { "epoch": 0.81, "learning_rate": 0.00017802665242715423, "loss": 0.0159, "step": 313700 }, { "epoch": 0.81, "learning_rate": 0.0001780227642107828, "loss": 0.0111, "step": 313710 }, { "epoch": 0.81, "learning_rate": 0.00017801887599441132, "loss": 0.0144, "step": 313720 }, { "epoch": 0.81, "learning_rate": 0.00017801498777803986, "loss": 0.0159, "step": 313730 }, { "epoch": 0.81, "learning_rate": 0.00017801109956166837, "loss": 0.0148, "step": 313740 }, { "epoch": 0.81, "learning_rate": 0.00017800721134529694, "loss": 0.0129, "step": 313750 }, { "epoch": 0.81, "learning_rate": 0.00017800332312892546, "loss": 0.0185, "step": 313760 }, { "epoch": 0.81, "learning_rate": 0.000177999434912554, "loss": 0.0144, "step": 313770 }, { "epoch": 0.81, "learning_rate": 0.0001779955466961825, "loss": 0.0131, "step": 313780 }, { "epoch": 0.81, "learning_rate": 0.00017799165847981108, "loss": 0.0141, "step": 313790 }, { "epoch": 0.81, "learning_rate": 0.00017798777026343962, "loss": 0.0131, "step": 313800 }, { "epoch": 0.81, "learning_rate": 0.00017798388204706814, "loss": 0.0173, "step": 313810 }, { "epoch": 0.81, "learning_rate": 0.00017797999383069668, "loss": 0.0157, "step": 313820 }, { "epoch": 0.81, "learning_rate": 0.00017797610561432522, "loss": 0.0142, "step": 313830 }, { "epoch": 0.81, "learning_rate": 0.00017797221739795376, "loss": 0.0146, "step": 313840 }, { "epoch": 0.81, "learning_rate": 0.00017796832918158228, "loss": 0.0188, "step": 313850 }, { "epoch": 0.81, "learning_rate": 0.00017796444096521082, "loss": 0.0187, "step": 313860 }, { "epoch": 0.81, "learning_rate": 0.00017796055274883933, "loss": 0.0122, "step": 313870 }, { "epoch": 0.81, "learning_rate": 0.0001779566645324679, "loss": 0.0124, "step": 313880 }, { "epoch": 0.81, "learning_rate": 0.00017795277631609642, "loss": 0.0155, "step": 313890 }, { "epoch": 0.81, "learning_rate": 0.00017794888809972496, "loss": 0.0122, "step": 313900 }, { "epoch": 0.81, "learning_rate": 0.00017794499988335347, "loss": 0.0112, "step": 313910 }, { "epoch": 0.81, "learning_rate": 0.00017794111166698204, "loss": 0.0132, "step": 313920 }, { "epoch": 0.81, "learning_rate": 0.00017793722345061055, "loss": 0.0159, "step": 313930 }, { "epoch": 0.81, "learning_rate": 0.0001779333352342391, "loss": 0.0109, "step": 313940 }, { "epoch": 0.81, "learning_rate": 0.0001779294470178676, "loss": 0.0126, "step": 313950 }, { "epoch": 0.81, "learning_rate": 0.00017792555880149618, "loss": 0.0143, "step": 313960 }, { "epoch": 0.81, "learning_rate": 0.00017792167058512472, "loss": 0.0152, "step": 313970 }, { "epoch": 0.81, "learning_rate": 0.00017791778236875324, "loss": 0.0124, "step": 313980 }, { "epoch": 0.81, "learning_rate": 0.00017791389415238178, "loss": 0.0134, "step": 313990 }, { "epoch": 0.81, "learning_rate": 0.00017791000593601032, "loss": 0.0175, "step": 314000 }, { "epoch": 0.81, "eval_cer": 0.8817376772465223, "eval_loss": 0.00921955332159996, "eval_runtime": 107.7056, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 314000 }, { "epoch": 0.81, "learning_rate": 0.00017790611771963886, "loss": 0.0127, "step": 314010 }, { "epoch": 0.81, "learning_rate": 0.00017790222950326738, "loss": 0.014, "step": 314020 }, { "epoch": 0.81, "learning_rate": 0.00017789834128689592, "loss": 0.0157, "step": 314030 }, { "epoch": 0.81, "learning_rate": 0.00017789445307052446, "loss": 0.0136, "step": 314040 }, { "epoch": 0.81, "learning_rate": 0.000177890564854153, "loss": 0.0132, "step": 314050 }, { "epoch": 0.81, "learning_rate": 0.00017788667663778151, "loss": 0.0131, "step": 314060 }, { "epoch": 0.81, "learning_rate": 0.00017788278842141006, "loss": 0.0135, "step": 314070 }, { "epoch": 0.81, "learning_rate": 0.0001778789002050386, "loss": 0.013, "step": 314080 }, { "epoch": 0.81, "learning_rate": 0.00017787501198866714, "loss": 0.0132, "step": 314090 }, { "epoch": 0.81, "learning_rate": 0.00017787112377229565, "loss": 0.0149, "step": 314100 }, { "epoch": 0.81, "learning_rate": 0.0001778672355559242, "loss": 0.0144, "step": 314110 }, { "epoch": 0.81, "learning_rate": 0.0001778633473395527, "loss": 0.018, "step": 314120 }, { "epoch": 0.81, "learning_rate": 0.00017785945912318128, "loss": 0.013, "step": 314130 }, { "epoch": 0.81, "learning_rate": 0.00017785557090680982, "loss": 0.0133, "step": 314140 }, { "epoch": 0.81, "learning_rate": 0.00017785168269043834, "loss": 0.012, "step": 314150 }, { "epoch": 0.81, "learning_rate": 0.00017784779447406685, "loss": 0.0148, "step": 314160 }, { "epoch": 0.81, "learning_rate": 0.00017784390625769542, "loss": 0.0142, "step": 314170 }, { "epoch": 0.81, "learning_rate": 0.00017784001804132396, "loss": 0.0119, "step": 314180 }, { "epoch": 0.81, "learning_rate": 0.00017783612982495247, "loss": 0.016, "step": 314190 }, { "epoch": 0.81, "learning_rate": 0.00017783224160858102, "loss": 0.0145, "step": 314200 }, { "epoch": 0.81, "learning_rate": 0.00017782835339220956, "loss": 0.0144, "step": 314210 }, { "epoch": 0.81, "learning_rate": 0.0001778244651758381, "loss": 0.0132, "step": 314220 }, { "epoch": 0.81, "learning_rate": 0.00017782057695946661, "loss": 0.0138, "step": 314230 }, { "epoch": 0.81, "learning_rate": 0.00017781668874309516, "loss": 0.0129, "step": 314240 }, { "epoch": 0.81, "learning_rate": 0.0001778128005267237, "loss": 0.025, "step": 314250 }, { "epoch": 0.81, "learning_rate": 0.00017780891231035224, "loss": 0.0131, "step": 314260 }, { "epoch": 0.81, "learning_rate": 0.00017780502409398075, "loss": 0.0158, "step": 314270 }, { "epoch": 0.81, "learning_rate": 0.0001778011358776093, "loss": 0.0108, "step": 314280 }, { "epoch": 0.81, "learning_rate": 0.00017779724766123786, "loss": 0.0142, "step": 314290 }, { "epoch": 0.81, "learning_rate": 0.00017779335944486638, "loss": 0.0108, "step": 314300 }, { "epoch": 0.81, "learning_rate": 0.0001777894712284949, "loss": 0.0107, "step": 314310 }, { "epoch": 0.81, "learning_rate": 0.00017778558301212343, "loss": 0.0153, "step": 314320 }, { "epoch": 0.81, "learning_rate": 0.000177781694795752, "loss": 0.0169, "step": 314330 }, { "epoch": 0.81, "learning_rate": 0.00017777780657938052, "loss": 0.0137, "step": 314340 }, { "epoch": 0.81, "learning_rate": 0.00017777391836300906, "loss": 0.0126, "step": 314350 }, { "epoch": 0.81, "learning_rate": 0.00017777003014663757, "loss": 0.013, "step": 314360 }, { "epoch": 0.81, "learning_rate": 0.00017776614193026612, "loss": 0.0134, "step": 314370 }, { "epoch": 0.81, "learning_rate": 0.00017776225371389466, "loss": 0.0124, "step": 314380 }, { "epoch": 0.81, "learning_rate": 0.0001777583654975232, "loss": 0.0141, "step": 314390 }, { "epoch": 0.81, "learning_rate": 0.0001777544772811517, "loss": 0.0139, "step": 314400 }, { "epoch": 0.81, "learning_rate": 0.00017775058906478026, "loss": 0.0116, "step": 314410 }, { "epoch": 0.82, "learning_rate": 0.0001777467008484088, "loss": 0.0148, "step": 314420 }, { "epoch": 0.82, "learning_rate": 0.00017774281263203734, "loss": 0.0115, "step": 314430 }, { "epoch": 0.82, "learning_rate": 0.00017773892441566585, "loss": 0.0142, "step": 314440 }, { "epoch": 0.82, "learning_rate": 0.0001777350361992944, "loss": 0.0146, "step": 314450 }, { "epoch": 0.82, "learning_rate": 0.00017773114798292296, "loss": 0.0131, "step": 314460 }, { "epoch": 0.82, "learning_rate": 0.00017772725976655148, "loss": 0.0124, "step": 314470 }, { "epoch": 0.82, "learning_rate": 0.00017772337155018, "loss": 0.0137, "step": 314480 }, { "epoch": 0.82, "learning_rate": 0.00017771948333380853, "loss": 0.0206, "step": 314490 }, { "epoch": 0.82, "learning_rate": 0.0001777155951174371, "loss": 0.0129, "step": 314500 }, { "epoch": 0.82, "learning_rate": 0.00017771170690106562, "loss": 0.0146, "step": 314510 }, { "epoch": 0.82, "learning_rate": 0.00017770781868469416, "loss": 0.0162, "step": 314520 }, { "epoch": 0.82, "learning_rate": 0.00017770393046832267, "loss": 0.0152, "step": 314530 }, { "epoch": 0.82, "learning_rate": 0.00017770004225195124, "loss": 0.0146, "step": 314540 }, { "epoch": 0.82, "learning_rate": 0.00017769615403557976, "loss": 0.0103, "step": 314550 }, { "epoch": 0.82, "learning_rate": 0.0001776922658192083, "loss": 0.0129, "step": 314560 }, { "epoch": 0.82, "learning_rate": 0.0001776883776028368, "loss": 0.0132, "step": 314570 }, { "epoch": 0.82, "learning_rate": 0.00017768448938646538, "loss": 0.0188, "step": 314580 }, { "epoch": 0.82, "learning_rate": 0.0001776806011700939, "loss": 0.0136, "step": 314590 }, { "epoch": 0.82, "learning_rate": 0.00017767671295372244, "loss": 0.0155, "step": 314600 }, { "epoch": 0.82, "learning_rate": 0.00017767282473735095, "loss": 0.0119, "step": 314610 }, { "epoch": 0.82, "learning_rate": 0.0001776689365209795, "loss": 0.0161, "step": 314620 }, { "epoch": 0.82, "learning_rate": 0.00017766504830460804, "loss": 0.0143, "step": 314630 }, { "epoch": 0.82, "learning_rate": 0.00017766116008823658, "loss": 0.0131, "step": 314640 }, { "epoch": 0.82, "learning_rate": 0.0001776572718718651, "loss": 0.0111, "step": 314650 }, { "epoch": 0.82, "learning_rate": 0.00017765338365549363, "loss": 0.0124, "step": 314660 }, { "epoch": 0.82, "learning_rate": 0.0001776494954391222, "loss": 0.0148, "step": 314670 }, { "epoch": 0.82, "learning_rate": 0.00017764560722275072, "loss": 0.0159, "step": 314680 }, { "epoch": 0.82, "learning_rate": 0.00017764171900637926, "loss": 0.0122, "step": 314690 }, { "epoch": 0.82, "learning_rate": 0.00017763783079000777, "loss": 0.0144, "step": 314700 }, { "epoch": 0.82, "learning_rate": 0.00017763394257363634, "loss": 0.0175, "step": 314710 }, { "epoch": 0.82, "learning_rate": 0.00017763005435726486, "loss": 0.012, "step": 314720 }, { "epoch": 0.82, "learning_rate": 0.0001776261661408934, "loss": 0.0138, "step": 314730 }, { "epoch": 0.82, "learning_rate": 0.0001776222779245219, "loss": 0.0128, "step": 314740 }, { "epoch": 0.82, "learning_rate": 0.00017761838970815048, "loss": 0.0121, "step": 314750 }, { "epoch": 0.82, "learning_rate": 0.000177614501491779, "loss": 0.0136, "step": 314760 }, { "epoch": 0.82, "learning_rate": 0.00017761061327540754, "loss": 0.0171, "step": 314770 }, { "epoch": 0.82, "learning_rate": 0.00017760672505903605, "loss": 0.0142, "step": 314780 }, { "epoch": 0.82, "learning_rate": 0.00017760283684266462, "loss": 0.0184, "step": 314790 }, { "epoch": 0.82, "learning_rate": 0.00017759894862629313, "loss": 0.0168, "step": 314800 }, { "epoch": 0.82, "learning_rate": 0.00017759506040992168, "loss": 0.0112, "step": 314810 }, { "epoch": 0.82, "learning_rate": 0.0001775911721935502, "loss": 0.0152, "step": 314820 }, { "epoch": 0.82, "learning_rate": 0.00017758728397717876, "loss": 0.0178, "step": 314830 }, { "epoch": 0.82, "learning_rate": 0.0001775833957608073, "loss": 0.0131, "step": 314840 }, { "epoch": 0.82, "learning_rate": 0.00017757950754443582, "loss": 0.0142, "step": 314850 }, { "epoch": 0.82, "learning_rate": 0.00017757561932806436, "loss": 0.0104, "step": 314860 }, { "epoch": 0.82, "learning_rate": 0.00017757173111169287, "loss": 0.0206, "step": 314870 }, { "epoch": 0.82, "learning_rate": 0.00017756784289532144, "loss": 0.0137, "step": 314880 }, { "epoch": 0.82, "learning_rate": 0.00017756395467894996, "loss": 0.0163, "step": 314890 }, { "epoch": 0.82, "learning_rate": 0.0001775600664625785, "loss": 0.021, "step": 314900 }, { "epoch": 0.82, "learning_rate": 0.000177556178246207, "loss": 0.0149, "step": 314910 }, { "epoch": 0.82, "learning_rate": 0.00017755229002983558, "loss": 0.0164, "step": 314920 }, { "epoch": 0.82, "learning_rate": 0.0001775484018134641, "loss": 0.0169, "step": 314930 }, { "epoch": 0.82, "learning_rate": 0.00017754451359709264, "loss": 0.0123, "step": 314940 }, { "epoch": 0.82, "learning_rate": 0.00017754062538072115, "loss": 0.0167, "step": 314950 }, { "epoch": 0.82, "learning_rate": 0.00017753673716434972, "loss": 0.0131, "step": 314960 }, { "epoch": 0.82, "learning_rate": 0.00017753284894797823, "loss": 0.0146, "step": 314970 }, { "epoch": 0.82, "learning_rate": 0.00017752896073160678, "loss": 0.0137, "step": 314980 }, { "epoch": 0.82, "learning_rate": 0.0001775250725152353, "loss": 0.013, "step": 314990 }, { "epoch": 0.82, "learning_rate": 0.00017752118429886386, "loss": 0.0138, "step": 315000 }, { "epoch": 0.82, "eval_cer": 0.8817446754311932, "eval_loss": 0.009523827582597733, "eval_runtime": 107.5021, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 315000 }, { "epoch": 0.82, "learning_rate": 0.0001775172960824924, "loss": 0.0146, "step": 315010 }, { "epoch": 0.82, "learning_rate": 0.00017751340786612092, "loss": 0.0146, "step": 315020 }, { "epoch": 0.82, "learning_rate": 0.00017750951964974943, "loss": 0.014, "step": 315030 }, { "epoch": 0.82, "learning_rate": 0.000177505631433378, "loss": 0.0107, "step": 315040 }, { "epoch": 0.82, "learning_rate": 0.00017750174321700654, "loss": 0.0157, "step": 315050 }, { "epoch": 0.82, "learning_rate": 0.00017749785500063505, "loss": 0.0109, "step": 315060 }, { "epoch": 0.82, "learning_rate": 0.0001774939667842636, "loss": 0.0139, "step": 315070 }, { "epoch": 0.82, "learning_rate": 0.00017749007856789214, "loss": 0.0187, "step": 315080 }, { "epoch": 0.82, "learning_rate": 0.00017748619035152068, "loss": 0.0137, "step": 315090 }, { "epoch": 0.82, "learning_rate": 0.0001774823021351492, "loss": 0.0141, "step": 315100 }, { "epoch": 0.82, "learning_rate": 0.00017747841391877774, "loss": 0.0158, "step": 315110 }, { "epoch": 0.82, "learning_rate": 0.00017747452570240625, "loss": 0.0122, "step": 315120 }, { "epoch": 0.82, "learning_rate": 0.00017747063748603482, "loss": 0.0124, "step": 315130 }, { "epoch": 0.82, "learning_rate": 0.00017746674926966333, "loss": 0.0145, "step": 315140 }, { "epoch": 0.82, "learning_rate": 0.00017746286105329188, "loss": 0.0146, "step": 315150 }, { "epoch": 0.82, "learning_rate": 0.0001774589728369204, "loss": 0.0146, "step": 315160 }, { "epoch": 0.82, "learning_rate": 0.00017745508462054896, "loss": 0.0124, "step": 315170 }, { "epoch": 0.82, "learning_rate": 0.0001774511964041775, "loss": 0.0186, "step": 315180 }, { "epoch": 0.82, "learning_rate": 0.00017744730818780601, "loss": 0.0166, "step": 315190 }, { "epoch": 0.82, "learning_rate": 0.00017744341997143453, "loss": 0.0156, "step": 315200 }, { "epoch": 0.82, "learning_rate": 0.0001774395317550631, "loss": 0.0143, "step": 315210 }, { "epoch": 0.82, "learning_rate": 0.00017743564353869164, "loss": 0.0141, "step": 315220 }, { "epoch": 0.82, "learning_rate": 0.00017743175532232015, "loss": 0.0122, "step": 315230 }, { "epoch": 0.82, "learning_rate": 0.0001774278671059487, "loss": 0.0118, "step": 315240 }, { "epoch": 0.82, "learning_rate": 0.00017742397888957724, "loss": 0.0119, "step": 315250 }, { "epoch": 0.82, "learning_rate": 0.00017742009067320578, "loss": 0.0169, "step": 315260 }, { "epoch": 0.82, "learning_rate": 0.0001774162024568343, "loss": 0.0136, "step": 315270 }, { "epoch": 0.82, "learning_rate": 0.00017741231424046284, "loss": 0.0134, "step": 315280 }, { "epoch": 0.82, "learning_rate": 0.00017740842602409138, "loss": 0.0146, "step": 315290 }, { "epoch": 0.82, "learning_rate": 0.00017740453780771992, "loss": 0.0131, "step": 315300 }, { "epoch": 0.82, "learning_rate": 0.00017740064959134843, "loss": 0.0158, "step": 315310 }, { "epoch": 0.82, "learning_rate": 0.00017739676137497697, "loss": 0.0402, "step": 315320 }, { "epoch": 0.82, "learning_rate": 0.00017739287315860554, "loss": 0.0161, "step": 315330 }, { "epoch": 0.82, "learning_rate": 0.00017738898494223406, "loss": 0.0141, "step": 315340 }, { "epoch": 0.82, "learning_rate": 0.00017738509672586257, "loss": 0.0138, "step": 315350 }, { "epoch": 0.82, "learning_rate": 0.00017738120850949111, "loss": 0.0114, "step": 315360 }, { "epoch": 0.82, "learning_rate": 0.00017737732029311963, "loss": 0.0159, "step": 315370 }, { "epoch": 0.82, "learning_rate": 0.0001773734320767482, "loss": 0.0168, "step": 315380 }, { "epoch": 0.82, "learning_rate": 0.00017736954386037674, "loss": 0.0099, "step": 315390 }, { "epoch": 0.82, "learning_rate": 0.00017736565564400525, "loss": 0.0132, "step": 315400 }, { "epoch": 0.82, "learning_rate": 0.0001773617674276338, "loss": 0.0151, "step": 315410 }, { "epoch": 0.82, "learning_rate": 0.00017735787921126234, "loss": 0.0133, "step": 315420 }, { "epoch": 0.82, "learning_rate": 0.00017735399099489088, "loss": 0.0198, "step": 315430 }, { "epoch": 0.82, "learning_rate": 0.0001773501027785194, "loss": 0.0172, "step": 315440 }, { "epoch": 0.82, "learning_rate": 0.00017734621456214793, "loss": 0.0158, "step": 315450 }, { "epoch": 0.82, "learning_rate": 0.00017734232634577648, "loss": 0.0158, "step": 315460 }, { "epoch": 0.82, "learning_rate": 0.00017733843812940502, "loss": 0.0146, "step": 315470 }, { "epoch": 0.82, "learning_rate": 0.00017733454991303353, "loss": 0.0151, "step": 315480 }, { "epoch": 0.82, "learning_rate": 0.00017733066169666207, "loss": 0.012, "step": 315490 }, { "epoch": 0.82, "learning_rate": 0.00017732677348029062, "loss": 0.0114, "step": 315500 }, { "epoch": 0.82, "learning_rate": 0.00017732288526391916, "loss": 0.0147, "step": 315510 }, { "epoch": 0.82, "learning_rate": 0.00017731899704754767, "loss": 0.0123, "step": 315520 }, { "epoch": 0.82, "learning_rate": 0.00017731510883117621, "loss": 0.0131, "step": 315530 }, { "epoch": 0.82, "learning_rate": 0.00017731122061480478, "loss": 0.0135, "step": 315540 }, { "epoch": 0.82, "learning_rate": 0.0001773073323984333, "loss": 0.015, "step": 315550 }, { "epoch": 0.82, "learning_rate": 0.00017730344418206184, "loss": 0.0126, "step": 315560 }, { "epoch": 0.82, "learning_rate": 0.00017729955596569035, "loss": 0.0169, "step": 315570 }, { "epoch": 0.82, "learning_rate": 0.00017729566774931892, "loss": 0.0127, "step": 315580 }, { "epoch": 0.82, "learning_rate": 0.00017729177953294744, "loss": 0.0125, "step": 315590 }, { "epoch": 0.82, "learning_rate": 0.00017728789131657598, "loss": 0.0164, "step": 315600 }, { "epoch": 0.82, "learning_rate": 0.0001772840031002045, "loss": 0.011, "step": 315610 }, { "epoch": 0.82, "learning_rate": 0.00017728011488383303, "loss": 0.0146, "step": 315620 }, { "epoch": 0.82, "learning_rate": 0.00017727622666746158, "loss": 0.0165, "step": 315630 }, { "epoch": 0.82, "learning_rate": 0.00017727233845109012, "loss": 0.015, "step": 315640 }, { "epoch": 0.82, "learning_rate": 0.00017726845023471863, "loss": 0.0125, "step": 315650 }, { "epoch": 0.82, "learning_rate": 0.00017726456201834717, "loss": 0.0127, "step": 315660 }, { "epoch": 0.82, "learning_rate": 0.00017726067380197572, "loss": 0.0113, "step": 315670 }, { "epoch": 0.82, "learning_rate": 0.00017725678558560426, "loss": 0.0183, "step": 315680 }, { "epoch": 0.82, "learning_rate": 0.00017725289736923277, "loss": 0.0128, "step": 315690 }, { "epoch": 0.82, "learning_rate": 0.0001772490091528613, "loss": 0.0158, "step": 315700 }, { "epoch": 0.82, "learning_rate": 0.00017724512093648988, "loss": 0.0151, "step": 315710 }, { "epoch": 0.82, "learning_rate": 0.0001772412327201184, "loss": 0.0124, "step": 315720 }, { "epoch": 0.82, "learning_rate": 0.00017723734450374694, "loss": 0.0124, "step": 315730 }, { "epoch": 0.82, "learning_rate": 0.00017723345628737545, "loss": 0.0137, "step": 315740 }, { "epoch": 0.82, "learning_rate": 0.00017722956807100402, "loss": 0.0114, "step": 315750 }, { "epoch": 0.82, "learning_rate": 0.00017722567985463254, "loss": 0.0131, "step": 315760 }, { "epoch": 0.82, "learning_rate": 0.00017722179163826108, "loss": 0.0138, "step": 315770 }, { "epoch": 0.82, "learning_rate": 0.0001772179034218896, "loss": 0.0129, "step": 315780 }, { "epoch": 0.82, "learning_rate": 0.00017721401520551816, "loss": 0.0123, "step": 315790 }, { "epoch": 0.82, "learning_rate": 0.00017721012698914668, "loss": 0.0128, "step": 315800 }, { "epoch": 0.82, "learning_rate": 0.00017720623877277522, "loss": 0.0152, "step": 315810 }, { "epoch": 0.82, "learning_rate": 0.00017720235055640373, "loss": 0.017, "step": 315820 }, { "epoch": 0.82, "learning_rate": 0.0001771984623400323, "loss": 0.0126, "step": 315830 }, { "epoch": 0.82, "learning_rate": 0.00017719457412366081, "loss": 0.0146, "step": 315840 }, { "epoch": 0.82, "learning_rate": 0.00017719068590728936, "loss": 0.012, "step": 315850 }, { "epoch": 0.82, "learning_rate": 0.00017718679769091787, "loss": 0.0142, "step": 315860 }, { "epoch": 0.82, "learning_rate": 0.0001771829094745464, "loss": 0.011, "step": 315870 }, { "epoch": 0.82, "learning_rate": 0.00017717902125817498, "loss": 0.0167, "step": 315880 }, { "epoch": 0.82, "learning_rate": 0.0001771751330418035, "loss": 0.0164, "step": 315890 }, { "epoch": 0.82, "learning_rate": 0.000177171244825432, "loss": 0.0121, "step": 315900 }, { "epoch": 0.82, "learning_rate": 0.00017716735660906055, "loss": 0.0134, "step": 315910 }, { "epoch": 0.82, "learning_rate": 0.00017716346839268912, "loss": 0.0137, "step": 315920 }, { "epoch": 0.82, "learning_rate": 0.00017715958017631764, "loss": 0.0136, "step": 315930 }, { "epoch": 0.82, "learning_rate": 0.00017715569195994618, "loss": 0.0118, "step": 315940 }, { "epoch": 0.82, "learning_rate": 0.0001771518037435747, "loss": 0.0123, "step": 315950 }, { "epoch": 0.82, "learning_rate": 0.00017714791552720326, "loss": 0.0117, "step": 315960 }, { "epoch": 0.82, "learning_rate": 0.00017714402731083177, "loss": 0.0118, "step": 315970 }, { "epoch": 0.82, "learning_rate": 0.00017714013909446032, "loss": 0.0132, "step": 315980 }, { "epoch": 0.82, "learning_rate": 0.00017713625087808883, "loss": 0.0145, "step": 315990 }, { "epoch": 0.82, "learning_rate": 0.0001771323626617174, "loss": 0.0163, "step": 316000 }, { "epoch": 0.82, "eval_cer": 0.8817068852339703, "eval_loss": 0.00930152740329504, "eval_runtime": 107.6124, "eval_samples_per_second": 18.585, "eval_steps_per_second": 4.646, "step": 316000 }, { "epoch": 0.82, "learning_rate": 0.00017712847444534591, "loss": 0.013, "step": 316010 }, { "epoch": 0.82, "learning_rate": 0.00017712458622897446, "loss": 0.0178, "step": 316020 }, { "epoch": 0.82, "learning_rate": 0.00017712069801260297, "loss": 0.0121, "step": 316030 }, { "epoch": 0.82, "learning_rate": 0.00017711680979623154, "loss": 0.0131, "step": 316040 }, { "epoch": 0.82, "learning_rate": 0.00017711292157986008, "loss": 0.0146, "step": 316050 }, { "epoch": 0.82, "learning_rate": 0.0001771090333634886, "loss": 0.0149, "step": 316060 }, { "epoch": 0.82, "learning_rate": 0.0001771051451471171, "loss": 0.0115, "step": 316070 }, { "epoch": 0.82, "learning_rate": 0.00017710125693074568, "loss": 0.015, "step": 316080 }, { "epoch": 0.82, "learning_rate": 0.00017709736871437422, "loss": 0.0108, "step": 316090 }, { "epoch": 0.82, "learning_rate": 0.00017709348049800273, "loss": 0.0124, "step": 316100 }, { "epoch": 0.82, "learning_rate": 0.00017708959228163128, "loss": 0.0129, "step": 316110 }, { "epoch": 0.82, "learning_rate": 0.0001770857040652598, "loss": 0.0163, "step": 316120 }, { "epoch": 0.82, "learning_rate": 0.00017708181584888836, "loss": 0.0168, "step": 316130 }, { "epoch": 0.82, "learning_rate": 0.00017707792763251687, "loss": 0.012, "step": 316140 }, { "epoch": 0.82, "learning_rate": 0.00017707403941614542, "loss": 0.0163, "step": 316150 }, { "epoch": 0.82, "learning_rate": 0.00017707015119977393, "loss": 0.0102, "step": 316160 }, { "epoch": 0.82, "learning_rate": 0.0001770662629834025, "loss": 0.0148, "step": 316170 }, { "epoch": 0.82, "learning_rate": 0.00017706237476703101, "loss": 0.0139, "step": 316180 }, { "epoch": 0.82, "learning_rate": 0.00017705848655065956, "loss": 0.0146, "step": 316190 }, { "epoch": 0.82, "learning_rate": 0.00017705459833428807, "loss": 0.0144, "step": 316200 }, { "epoch": 0.82, "learning_rate": 0.00017705071011791664, "loss": 0.0163, "step": 316210 }, { "epoch": 0.82, "learning_rate": 0.00017704682190154515, "loss": 0.0133, "step": 316220 }, { "epoch": 0.82, "learning_rate": 0.0001770429336851737, "loss": 0.0153, "step": 316230 }, { "epoch": 0.82, "learning_rate": 0.0001770390454688022, "loss": 0.0104, "step": 316240 }, { "epoch": 0.82, "learning_rate": 0.00017703515725243078, "loss": 0.0142, "step": 316250 }, { "epoch": 0.82, "learning_rate": 0.00017703126903605932, "loss": 0.0105, "step": 316260 }, { "epoch": 0.82, "learning_rate": 0.00017702738081968783, "loss": 0.0126, "step": 316270 }, { "epoch": 0.82, "learning_rate": 0.00017702349260331638, "loss": 0.0146, "step": 316280 }, { "epoch": 0.82, "learning_rate": 0.00017701960438694492, "loss": 0.0129, "step": 316290 }, { "epoch": 0.82, "learning_rate": 0.00017701571617057346, "loss": 0.0147, "step": 316300 }, { "epoch": 0.82, "learning_rate": 0.00017701182795420197, "loss": 0.0139, "step": 316310 }, { "epoch": 0.82, "learning_rate": 0.00017700793973783052, "loss": 0.012, "step": 316320 }, { "epoch": 0.82, "learning_rate": 0.00017700405152145906, "loss": 0.0151, "step": 316330 }, { "epoch": 0.82, "learning_rate": 0.0001770001633050876, "loss": 0.0109, "step": 316340 }, { "epoch": 0.82, "learning_rate": 0.0001769962750887161, "loss": 0.013, "step": 316350 }, { "epoch": 0.82, "learning_rate": 0.00017699238687234465, "loss": 0.0162, "step": 316360 }, { "epoch": 0.82, "learning_rate": 0.00017698849865597317, "loss": 0.0132, "step": 316370 }, { "epoch": 0.82, "learning_rate": 0.00017698461043960174, "loss": 0.014, "step": 316380 }, { "epoch": 0.82, "learning_rate": 0.00017698072222323025, "loss": 0.0139, "step": 316390 }, { "epoch": 0.82, "learning_rate": 0.0001769768340068588, "loss": 0.0173, "step": 316400 }, { "epoch": 0.82, "learning_rate": 0.0001769729457904873, "loss": 0.014, "step": 316410 }, { "epoch": 0.82, "learning_rate": 0.00017696905757411588, "loss": 0.0132, "step": 316420 }, { "epoch": 0.82, "learning_rate": 0.00017696516935774442, "loss": 0.0162, "step": 316430 }, { "epoch": 0.82, "learning_rate": 0.00017696128114137293, "loss": 0.0122, "step": 316440 }, { "epoch": 0.82, "learning_rate": 0.00017695739292500148, "loss": 0.0114, "step": 316450 }, { "epoch": 0.82, "learning_rate": 0.00017695350470863002, "loss": 0.0143, "step": 316460 }, { "epoch": 0.82, "learning_rate": 0.00017694961649225856, "loss": 0.0139, "step": 316470 }, { "epoch": 0.82, "learning_rate": 0.00017694572827588707, "loss": 0.0119, "step": 316480 }, { "epoch": 0.82, "learning_rate": 0.00017694184005951561, "loss": 0.0162, "step": 316490 }, { "epoch": 0.82, "learning_rate": 0.00017693795184314416, "loss": 0.0138, "step": 316500 }, { "epoch": 0.82, "learning_rate": 0.0001769340636267727, "loss": 0.0121, "step": 316510 }, { "epoch": 0.82, "learning_rate": 0.0001769301754104012, "loss": 0.0099, "step": 316520 }, { "epoch": 0.82, "learning_rate": 0.00017692628719402975, "loss": 0.0122, "step": 316530 }, { "epoch": 0.82, "learning_rate": 0.0001769223989776583, "loss": 0.0146, "step": 316540 }, { "epoch": 0.82, "learning_rate": 0.00017691851076128684, "loss": 0.0136, "step": 316550 }, { "epoch": 0.82, "learning_rate": 0.00017691462254491535, "loss": 0.0111, "step": 316560 }, { "epoch": 0.82, "learning_rate": 0.0001769107343285439, "loss": 0.0143, "step": 316570 }, { "epoch": 0.82, "learning_rate": 0.00017690684611217246, "loss": 0.0165, "step": 316580 }, { "epoch": 0.82, "learning_rate": 0.00017690295789580098, "loss": 0.0098, "step": 316590 }, { "epoch": 0.82, "learning_rate": 0.00017689906967942952, "loss": 0.011, "step": 316600 }, { "epoch": 0.82, "learning_rate": 0.00017689518146305803, "loss": 0.0134, "step": 316610 }, { "epoch": 0.82, "learning_rate": 0.00017689129324668655, "loss": 0.0126, "step": 316620 }, { "epoch": 0.82, "learning_rate": 0.00017688740503031512, "loss": 0.0166, "step": 316630 }, { "epoch": 0.82, "learning_rate": 0.00017688351681394366, "loss": 0.0123, "step": 316640 }, { "epoch": 0.82, "learning_rate": 0.00017687962859757217, "loss": 0.0129, "step": 316650 }, { "epoch": 0.82, "learning_rate": 0.00017687574038120071, "loss": 0.0119, "step": 316660 }, { "epoch": 0.82, "learning_rate": 0.00017687185216482926, "loss": 0.0126, "step": 316670 }, { "epoch": 0.82, "learning_rate": 0.0001768679639484578, "loss": 0.0168, "step": 316680 }, { "epoch": 0.82, "learning_rate": 0.0001768640757320863, "loss": 0.0142, "step": 316690 }, { "epoch": 0.82, "learning_rate": 0.00017686018751571485, "loss": 0.0145, "step": 316700 }, { "epoch": 0.82, "learning_rate": 0.0001768562992993434, "loss": 0.0143, "step": 316710 }, { "epoch": 0.82, "learning_rate": 0.00017685241108297194, "loss": 0.0117, "step": 316720 }, { "epoch": 0.82, "learning_rate": 0.00017684852286660045, "loss": 0.0137, "step": 316730 }, { "epoch": 0.82, "learning_rate": 0.000176844634650229, "loss": 0.0133, "step": 316740 }, { "epoch": 0.82, "learning_rate": 0.00017684074643385756, "loss": 0.0137, "step": 316750 }, { "epoch": 0.82, "learning_rate": 0.00017683685821748608, "loss": 0.0153, "step": 316760 }, { "epoch": 0.82, "learning_rate": 0.00017683297000111462, "loss": 0.0179, "step": 316770 }, { "epoch": 0.82, "learning_rate": 0.00017682908178474313, "loss": 0.017, "step": 316780 }, { "epoch": 0.82, "learning_rate": 0.0001768251935683717, "loss": 0.0151, "step": 316790 }, { "epoch": 0.82, "learning_rate": 0.00017682130535200022, "loss": 0.0135, "step": 316800 }, { "epoch": 0.82, "learning_rate": 0.00017681741713562876, "loss": 0.0126, "step": 316810 }, { "epoch": 0.82, "learning_rate": 0.00017681352891925727, "loss": 0.015, "step": 316820 }, { "epoch": 0.82, "learning_rate": 0.00017680964070288584, "loss": 0.0132, "step": 316830 }, { "epoch": 0.82, "learning_rate": 0.00017680575248651436, "loss": 0.0125, "step": 316840 }, { "epoch": 0.82, "learning_rate": 0.0001768018642701429, "loss": 0.0121, "step": 316850 }, { "epoch": 0.82, "learning_rate": 0.0001767979760537714, "loss": 0.0142, "step": 316860 }, { "epoch": 0.82, "learning_rate": 0.00017679408783739995, "loss": 0.0163, "step": 316870 }, { "epoch": 0.82, "learning_rate": 0.0001767901996210285, "loss": 0.0156, "step": 316880 }, { "epoch": 0.82, "learning_rate": 0.00017678631140465704, "loss": 0.0104, "step": 316890 }, { "epoch": 0.82, "learning_rate": 0.00017678242318828555, "loss": 0.0174, "step": 316900 }, { "epoch": 0.82, "learning_rate": 0.0001767785349719141, "loss": 0.0136, "step": 316910 }, { "epoch": 0.82, "learning_rate": 0.00017677464675554266, "loss": 0.0135, "step": 316920 }, { "epoch": 0.82, "learning_rate": 0.00017677075853917118, "loss": 0.0128, "step": 316930 }, { "epoch": 0.82, "learning_rate": 0.0001767668703227997, "loss": 0.0097, "step": 316940 }, { "epoch": 0.82, "learning_rate": 0.00017676298210642823, "loss": 0.0147, "step": 316950 }, { "epoch": 0.82, "learning_rate": 0.0001767590938900568, "loss": 0.0149, "step": 316960 }, { "epoch": 0.82, "learning_rate": 0.00017675520567368532, "loss": 0.0153, "step": 316970 }, { "epoch": 0.82, "learning_rate": 0.00017675131745731386, "loss": 0.0146, "step": 316980 }, { "epoch": 0.82, "learning_rate": 0.00017674742924094237, "loss": 0.0154, "step": 316990 }, { "epoch": 0.82, "learning_rate": 0.00017674354102457094, "loss": 0.0141, "step": 317000 }, { "epoch": 0.82, "eval_cer": 0.8817502739789299, "eval_loss": 0.01099375169724226, "eval_runtime": 107.5512, "eval_samples_per_second": 18.596, "eval_steps_per_second": 4.649, "step": 317000 }, { "epoch": 0.82, "learning_rate": 0.00017673965280819945, "loss": 0.0143, "step": 317010 }, { "epoch": 0.82, "learning_rate": 0.000176735764591828, "loss": 0.018, "step": 317020 }, { "epoch": 0.82, "learning_rate": 0.0001767318763754565, "loss": 0.0141, "step": 317030 }, { "epoch": 0.82, "learning_rate": 0.00017672798815908508, "loss": 0.0152, "step": 317040 }, { "epoch": 0.82, "learning_rate": 0.0001767240999427136, "loss": 0.0138, "step": 317050 }, { "epoch": 0.82, "learning_rate": 0.00017672021172634214, "loss": 0.0121, "step": 317060 }, { "epoch": 0.82, "learning_rate": 0.00017671632350997065, "loss": 0.0165, "step": 317070 }, { "epoch": 0.82, "learning_rate": 0.00017671243529359922, "loss": 0.012, "step": 317080 }, { "epoch": 0.82, "learning_rate": 0.00017670854707722773, "loss": 0.0127, "step": 317090 }, { "epoch": 0.82, "learning_rate": 0.00017670465886085628, "loss": 0.0193, "step": 317100 }, { "epoch": 0.82, "learning_rate": 0.0001767007706444848, "loss": 0.0172, "step": 317110 }, { "epoch": 0.82, "learning_rate": 0.00017669688242811333, "loss": 0.0152, "step": 317120 }, { "epoch": 0.82, "learning_rate": 0.0001766929942117419, "loss": 0.0121, "step": 317130 }, { "epoch": 0.82, "learning_rate": 0.00017668910599537041, "loss": 0.0119, "step": 317140 }, { "epoch": 0.82, "learning_rate": 0.00017668521777899896, "loss": 0.0105, "step": 317150 }, { "epoch": 0.82, "learning_rate": 0.00017668132956262747, "loss": 0.0123, "step": 317160 }, { "epoch": 0.82, "learning_rate": 0.00017667744134625604, "loss": 0.0144, "step": 317170 }, { "epoch": 0.82, "learning_rate": 0.00017667355312988455, "loss": 0.0126, "step": 317180 }, { "epoch": 0.82, "learning_rate": 0.0001766696649135131, "loss": 0.013, "step": 317190 }, { "epoch": 0.82, "learning_rate": 0.0001766657766971416, "loss": 0.0163, "step": 317200 }, { "epoch": 0.82, "learning_rate": 0.00017666188848077018, "loss": 0.0148, "step": 317210 }, { "epoch": 0.82, "learning_rate": 0.0001766580002643987, "loss": 0.0112, "step": 317220 }, { "epoch": 0.82, "learning_rate": 0.00017665411204802724, "loss": 0.0181, "step": 317230 }, { "epoch": 0.82, "learning_rate": 0.00017665022383165575, "loss": 0.0109, "step": 317240 }, { "epoch": 0.82, "learning_rate": 0.00017664633561528432, "loss": 0.014, "step": 317250 }, { "epoch": 0.82, "learning_rate": 0.00017664244739891283, "loss": 0.013, "step": 317260 }, { "epoch": 0.82, "learning_rate": 0.00017663855918254137, "loss": 0.0206, "step": 317270 }, { "epoch": 0.82, "learning_rate": 0.0001766346709661699, "loss": 0.0145, "step": 317280 }, { "epoch": 0.82, "learning_rate": 0.00017663078274979846, "loss": 0.0149, "step": 317290 }, { "epoch": 0.82, "learning_rate": 0.000176626894533427, "loss": 0.0112, "step": 317300 }, { "epoch": 0.82, "learning_rate": 0.00017662300631705551, "loss": 0.0133, "step": 317310 }, { "epoch": 0.82, "learning_rate": 0.00017661911810068406, "loss": 0.0176, "step": 317320 }, { "epoch": 0.82, "learning_rate": 0.00017661522988431257, "loss": 0.0102, "step": 317330 }, { "epoch": 0.82, "learning_rate": 0.00017661134166794114, "loss": 0.0123, "step": 317340 }, { "epoch": 0.82, "learning_rate": 0.00017660745345156965, "loss": 0.0146, "step": 317350 }, { "epoch": 0.82, "learning_rate": 0.0001766035652351982, "loss": 0.015, "step": 317360 }, { "epoch": 0.82, "learning_rate": 0.0001765996770188267, "loss": 0.0131, "step": 317370 }, { "epoch": 0.82, "learning_rate": 0.00017659578880245528, "loss": 0.0112, "step": 317380 }, { "epoch": 0.82, "learning_rate": 0.0001765919005860838, "loss": 0.0133, "step": 317390 }, { "epoch": 0.82, "learning_rate": 0.00017658801236971233, "loss": 0.0127, "step": 317400 }, { "epoch": 0.82, "learning_rate": 0.00017658412415334085, "loss": 0.014, "step": 317410 }, { "epoch": 0.82, "learning_rate": 0.00017658023593696942, "loss": 0.0114, "step": 317420 }, { "epoch": 0.82, "learning_rate": 0.00017657634772059793, "loss": 0.0117, "step": 317430 }, { "epoch": 0.82, "learning_rate": 0.00017657245950422647, "loss": 0.0116, "step": 317440 }, { "epoch": 0.82, "learning_rate": 0.000176568571287855, "loss": 0.0131, "step": 317450 }, { "epoch": 0.82, "learning_rate": 0.00017656468307148356, "loss": 0.014, "step": 317460 }, { "epoch": 0.82, "learning_rate": 0.0001765607948551121, "loss": 0.014, "step": 317470 }, { "epoch": 0.82, "learning_rate": 0.0001765569066387406, "loss": 0.0124, "step": 317480 }, { "epoch": 0.82, "learning_rate": 0.00017655301842236913, "loss": 0.0158, "step": 317490 }, { "epoch": 0.82, "learning_rate": 0.0001765491302059977, "loss": 0.0144, "step": 317500 }, { "epoch": 0.82, "learning_rate": 0.00017654524198962624, "loss": 0.0129, "step": 317510 }, { "epoch": 0.82, "learning_rate": 0.00017654135377325475, "loss": 0.0141, "step": 317520 }, { "epoch": 0.82, "learning_rate": 0.0001765374655568833, "loss": 0.0133, "step": 317530 }, { "epoch": 0.82, "learning_rate": 0.00017653357734051184, "loss": 0.0134, "step": 317540 }, { "epoch": 0.82, "learning_rate": 0.00017652968912414038, "loss": 0.0126, "step": 317550 }, { "epoch": 0.82, "learning_rate": 0.0001765258009077689, "loss": 0.0134, "step": 317560 }, { "epoch": 0.82, "learning_rate": 0.00017652191269139743, "loss": 0.0165, "step": 317570 }, { "epoch": 0.82, "learning_rate": 0.00017651802447502595, "loss": 0.0109, "step": 317580 }, { "epoch": 0.82, "learning_rate": 0.00017651413625865452, "loss": 0.0116, "step": 317590 }, { "epoch": 0.82, "learning_rate": 0.00017651024804228303, "loss": 0.0182, "step": 317600 }, { "epoch": 0.82, "learning_rate": 0.00017650635982591157, "loss": 0.0141, "step": 317610 }, { "epoch": 0.82, "learning_rate": 0.0001765024716095401, "loss": 0.0139, "step": 317620 }, { "epoch": 0.82, "learning_rate": 0.00017649858339316866, "loss": 0.0107, "step": 317630 }, { "epoch": 0.82, "learning_rate": 0.0001764946951767972, "loss": 0.01, "step": 317640 }, { "epoch": 0.82, "learning_rate": 0.0001764908069604257, "loss": 0.0103, "step": 317650 }, { "epoch": 0.82, "learning_rate": 0.00017648691874405423, "loss": 0.0131, "step": 317660 }, { "epoch": 0.82, "learning_rate": 0.0001764830305276828, "loss": 0.0152, "step": 317670 }, { "epoch": 0.82, "learning_rate": 0.00017647914231131134, "loss": 0.0111, "step": 317680 }, { "epoch": 0.82, "learning_rate": 0.00017647525409493985, "loss": 0.0143, "step": 317690 }, { "epoch": 0.82, "learning_rate": 0.0001764713658785684, "loss": 0.0127, "step": 317700 }, { "epoch": 0.82, "learning_rate": 0.00017646747766219694, "loss": 0.015, "step": 317710 }, { "epoch": 0.82, "learning_rate": 0.00017646358944582548, "loss": 0.0153, "step": 317720 }, { "epoch": 0.82, "learning_rate": 0.000176459701229454, "loss": 0.0129, "step": 317730 }, { "epoch": 0.82, "learning_rate": 0.00017645581301308253, "loss": 0.0121, "step": 317740 }, { "epoch": 0.82, "learning_rate": 0.00017645192479671107, "loss": 0.018, "step": 317750 }, { "epoch": 0.82, "learning_rate": 0.00017644803658033962, "loss": 0.014, "step": 317760 }, { "epoch": 0.82, "learning_rate": 0.00017644414836396813, "loss": 0.0106, "step": 317770 }, { "epoch": 0.82, "learning_rate": 0.00017644026014759667, "loss": 0.0113, "step": 317780 }, { "epoch": 0.82, "learning_rate": 0.00017643637193122524, "loss": 0.0113, "step": 317790 }, { "epoch": 0.82, "learning_rate": 0.00017643248371485376, "loss": 0.014, "step": 317800 }, { "epoch": 0.82, "learning_rate": 0.00017642859549848227, "loss": 0.014, "step": 317810 }, { "epoch": 0.82, "learning_rate": 0.0001764247072821108, "loss": 0.0108, "step": 317820 }, { "epoch": 0.82, "learning_rate": 0.00017642081906573933, "loss": 0.0164, "step": 317830 }, { "epoch": 0.82, "learning_rate": 0.0001764169308493679, "loss": 0.0122, "step": 317840 }, { "epoch": 0.82, "learning_rate": 0.00017641304263299644, "loss": 0.0134, "step": 317850 }, { "epoch": 0.82, "learning_rate": 0.00017640915441662495, "loss": 0.0125, "step": 317860 }, { "epoch": 0.82, "learning_rate": 0.0001764052662002535, "loss": 0.0133, "step": 317870 }, { "epoch": 0.82, "learning_rate": 0.00017640137798388203, "loss": 0.0123, "step": 317880 }, { "epoch": 0.82, "learning_rate": 0.00017639748976751058, "loss": 0.0142, "step": 317890 }, { "epoch": 0.82, "learning_rate": 0.0001763936015511391, "loss": 0.0137, "step": 317900 }, { "epoch": 0.82, "learning_rate": 0.00017638971333476763, "loss": 0.0142, "step": 317910 }, { "epoch": 0.82, "learning_rate": 0.00017638582511839617, "loss": 0.0102, "step": 317920 }, { "epoch": 0.82, "learning_rate": 0.00017638193690202472, "loss": 0.0125, "step": 317930 }, { "epoch": 0.82, "learning_rate": 0.00017637804868565323, "loss": 0.0113, "step": 317940 }, { "epoch": 0.82, "learning_rate": 0.00017637416046928177, "loss": 0.0129, "step": 317950 }, { "epoch": 0.82, "learning_rate": 0.00017637027225291034, "loss": 0.0126, "step": 317960 }, { "epoch": 0.82, "learning_rate": 0.00017636638403653886, "loss": 0.0128, "step": 317970 }, { "epoch": 0.82, "learning_rate": 0.00017636249582016737, "loss": 0.0114, "step": 317980 }, { "epoch": 0.82, "learning_rate": 0.0001763586076037959, "loss": 0.0232, "step": 317990 }, { "epoch": 0.82, "learning_rate": 0.00017635471938742448, "loss": 0.023, "step": 318000 }, { "epoch": 0.82, "eval_cer": 0.8816956881384969, "eval_loss": 0.009950380772352219, "eval_runtime": 107.6438, "eval_samples_per_second": 18.58, "eval_steps_per_second": 4.645, "step": 318000 }, { "epoch": 0.82, "learning_rate": 0.000176350831171053, "loss": 0.0163, "step": 318010 }, { "epoch": 0.82, "learning_rate": 0.00017634694295468154, "loss": 0.015, "step": 318020 }, { "epoch": 0.82, "learning_rate": 0.00017634305473831005, "loss": 0.015, "step": 318030 }, { "epoch": 0.82, "learning_rate": 0.00017633916652193862, "loss": 0.0161, "step": 318040 }, { "epoch": 0.82, "learning_rate": 0.00017633527830556713, "loss": 0.0122, "step": 318050 }, { "epoch": 0.82, "learning_rate": 0.00017633139008919568, "loss": 0.0197, "step": 318060 }, { "epoch": 0.82, "learning_rate": 0.0001763275018728242, "loss": 0.0125, "step": 318070 }, { "epoch": 0.82, "learning_rate": 0.00017632361365645273, "loss": 0.0186, "step": 318080 }, { "epoch": 0.82, "learning_rate": 0.00017631972544008127, "loss": 0.0187, "step": 318090 }, { "epoch": 0.82, "learning_rate": 0.00017631583722370982, "loss": 0.0159, "step": 318100 }, { "epoch": 0.82, "learning_rate": 0.00017631194900733833, "loss": 0.0142, "step": 318110 }, { "epoch": 0.82, "learning_rate": 0.00017630806079096687, "loss": 0.0187, "step": 318120 }, { "epoch": 0.82, "learning_rate": 0.0001763041725745954, "loss": 0.0112, "step": 318130 }, { "epoch": 0.82, "learning_rate": 0.00017630028435822395, "loss": 0.0127, "step": 318140 }, { "epoch": 0.82, "learning_rate": 0.00017629639614185247, "loss": 0.0134, "step": 318150 }, { "epoch": 0.82, "learning_rate": 0.000176292507925481, "loss": 0.01, "step": 318160 }, { "epoch": 0.82, "learning_rate": 0.00017628861970910958, "loss": 0.0115, "step": 318170 }, { "epoch": 0.82, "learning_rate": 0.0001762847314927381, "loss": 0.0131, "step": 318180 }, { "epoch": 0.82, "learning_rate": 0.00017628084327636664, "loss": 0.0139, "step": 318190 }, { "epoch": 0.82, "learning_rate": 0.00017627695505999515, "loss": 0.0145, "step": 318200 }, { "epoch": 0.82, "learning_rate": 0.00017627306684362372, "loss": 0.0122, "step": 318210 }, { "epoch": 0.82, "learning_rate": 0.00017626917862725223, "loss": 0.0124, "step": 318220 }, { "epoch": 0.82, "learning_rate": 0.00017626529041088078, "loss": 0.0101, "step": 318230 }, { "epoch": 0.82, "learning_rate": 0.0001762614021945093, "loss": 0.0112, "step": 318240 }, { "epoch": 0.82, "learning_rate": 0.00017625751397813786, "loss": 0.0157, "step": 318250 }, { "epoch": 0.82, "learning_rate": 0.00017625362576176637, "loss": 0.0183, "step": 318260 }, { "epoch": 0.83, "learning_rate": 0.00017624973754539491, "loss": 0.0134, "step": 318270 }, { "epoch": 0.83, "learning_rate": 0.00017624584932902343, "loss": 0.0103, "step": 318280 }, { "epoch": 0.83, "learning_rate": 0.000176241961112652, "loss": 0.0175, "step": 318290 }, { "epoch": 0.83, "learning_rate": 0.0001762380728962805, "loss": 0.0145, "step": 318300 }, { "epoch": 0.83, "learning_rate": 0.00017623418467990905, "loss": 0.0223, "step": 318310 }, { "epoch": 0.83, "learning_rate": 0.00017623029646353757, "loss": 0.0132, "step": 318320 }, { "epoch": 0.83, "learning_rate": 0.0001762264082471661, "loss": 0.0121, "step": 318330 }, { "epoch": 0.83, "learning_rate": 0.00017622252003079468, "loss": 0.0164, "step": 318340 }, { "epoch": 0.83, "learning_rate": 0.0001762186318144232, "loss": 0.0151, "step": 318350 }, { "epoch": 0.83, "learning_rate": 0.00017621474359805174, "loss": 0.0146, "step": 318360 }, { "epoch": 0.83, "learning_rate": 0.00017621085538168025, "loss": 0.0164, "step": 318370 }, { "epoch": 0.83, "learning_rate": 0.00017620696716530882, "loss": 0.0139, "step": 318380 }, { "epoch": 0.83, "learning_rate": 0.00017620307894893733, "loss": 0.0172, "step": 318390 }, { "epoch": 0.83, "learning_rate": 0.00017619919073256587, "loss": 0.0146, "step": 318400 }, { "epoch": 0.83, "learning_rate": 0.0001761953025161944, "loss": 0.0143, "step": 318410 }, { "epoch": 0.83, "learning_rate": 0.00017619141429982296, "loss": 0.0137, "step": 318420 }, { "epoch": 0.83, "learning_rate": 0.00017618752608345147, "loss": 0.0153, "step": 318430 }, { "epoch": 0.83, "learning_rate": 0.00017618363786708001, "loss": 0.0123, "step": 318440 }, { "epoch": 0.83, "learning_rate": 0.00017617974965070853, "loss": 0.0142, "step": 318450 }, { "epoch": 0.83, "learning_rate": 0.0001761758614343371, "loss": 0.0111, "step": 318460 }, { "epoch": 0.83, "learning_rate": 0.0001761719732179656, "loss": 0.0108, "step": 318470 }, { "epoch": 0.83, "learning_rate": 0.00017616808500159415, "loss": 0.0167, "step": 318480 }, { "epoch": 0.83, "learning_rate": 0.00017616419678522267, "loss": 0.0114, "step": 318490 }, { "epoch": 0.83, "learning_rate": 0.00017616030856885124, "loss": 0.0136, "step": 318500 }, { "epoch": 0.83, "learning_rate": 0.00017615642035247978, "loss": 0.0144, "step": 318510 }, { "epoch": 0.83, "learning_rate": 0.0001761525321361083, "loss": 0.0148, "step": 318520 }, { "epoch": 0.83, "learning_rate": 0.0001761486439197368, "loss": 0.0124, "step": 318530 }, { "epoch": 0.83, "learning_rate": 0.00017614475570336538, "loss": 0.0134, "step": 318540 }, { "epoch": 0.83, "learning_rate": 0.00017614086748699392, "loss": 0.0136, "step": 318550 }, { "epoch": 0.83, "learning_rate": 0.00017613697927062243, "loss": 0.0149, "step": 318560 }, { "epoch": 0.83, "learning_rate": 0.00017613309105425097, "loss": 0.015, "step": 318570 }, { "epoch": 0.83, "learning_rate": 0.0001761292028378795, "loss": 0.0127, "step": 318580 }, { "epoch": 0.83, "learning_rate": 0.00017612531462150806, "loss": 0.0163, "step": 318590 }, { "epoch": 0.83, "learning_rate": 0.00017612142640513657, "loss": 0.0135, "step": 318600 }, { "epoch": 0.83, "learning_rate": 0.00017611753818876511, "loss": 0.0157, "step": 318610 }, { "epoch": 0.83, "learning_rate": 0.00017611364997239363, "loss": 0.0131, "step": 318620 }, { "epoch": 0.83, "learning_rate": 0.0001761097617560222, "loss": 0.0132, "step": 318630 }, { "epoch": 0.83, "learning_rate": 0.0001761058735396507, "loss": 0.0159, "step": 318640 }, { "epoch": 0.83, "learning_rate": 0.00017610198532327925, "loss": 0.0137, "step": 318650 }, { "epoch": 0.83, "learning_rate": 0.00017609809710690777, "loss": 0.0133, "step": 318660 }, { "epoch": 0.83, "learning_rate": 0.00017609420889053634, "loss": 0.0124, "step": 318670 }, { "epoch": 0.83, "learning_rate": 0.00017609032067416485, "loss": 0.0139, "step": 318680 }, { "epoch": 0.83, "learning_rate": 0.0001760864324577934, "loss": 0.0115, "step": 318690 }, { "epoch": 0.83, "learning_rate": 0.0001760825442414219, "loss": 0.0119, "step": 318700 }, { "epoch": 0.83, "learning_rate": 0.00017607865602505048, "loss": 0.0116, "step": 318710 }, { "epoch": 0.83, "learning_rate": 0.00017607476780867902, "loss": 0.0159, "step": 318720 }, { "epoch": 0.83, "learning_rate": 0.00017607087959230753, "loss": 0.0117, "step": 318730 }, { "epoch": 0.83, "learning_rate": 0.00017606699137593607, "loss": 0.014, "step": 318740 }, { "epoch": 0.83, "learning_rate": 0.00017606310315956462, "loss": 0.0121, "step": 318750 }, { "epoch": 0.83, "learning_rate": 0.00017605921494319316, "loss": 0.0124, "step": 318760 }, { "epoch": 0.83, "learning_rate": 0.00017605532672682167, "loss": 0.0152, "step": 318770 }, { "epoch": 0.83, "learning_rate": 0.0001760514385104502, "loss": 0.0142, "step": 318780 }, { "epoch": 0.83, "learning_rate": 0.00017604755029407875, "loss": 0.0179, "step": 318790 }, { "epoch": 0.83, "learning_rate": 0.0001760436620777073, "loss": 0.0161, "step": 318800 }, { "epoch": 0.83, "learning_rate": 0.0001760397738613358, "loss": 0.0131, "step": 318810 }, { "epoch": 0.83, "learning_rate": 0.00017603588564496435, "loss": 0.0128, "step": 318820 }, { "epoch": 0.83, "learning_rate": 0.00017603199742859287, "loss": 0.0218, "step": 318830 }, { "epoch": 0.83, "learning_rate": 0.00017602810921222144, "loss": 0.0155, "step": 318840 }, { "epoch": 0.83, "learning_rate": 0.00017602422099584995, "loss": 0.0156, "step": 318850 }, { "epoch": 0.83, "learning_rate": 0.0001760203327794785, "loss": 0.0132, "step": 318860 }, { "epoch": 0.83, "learning_rate": 0.000176016444563107, "loss": 0.0166, "step": 318870 }, { "epoch": 0.83, "learning_rate": 0.00017601255634673558, "loss": 0.0144, "step": 318880 }, { "epoch": 0.83, "learning_rate": 0.00017600866813036412, "loss": 0.0134, "step": 318890 }, { "epoch": 0.83, "learning_rate": 0.00017600477991399263, "loss": 0.0152, "step": 318900 }, { "epoch": 0.83, "learning_rate": 0.00017600089169762117, "loss": 0.0142, "step": 318910 }, { "epoch": 0.83, "learning_rate": 0.00017599700348124971, "loss": 0.0139, "step": 318920 }, { "epoch": 0.83, "learning_rate": 0.00017599311526487826, "loss": 0.0161, "step": 318930 }, { "epoch": 0.83, "learning_rate": 0.00017598922704850677, "loss": 0.0141, "step": 318940 }, { "epoch": 0.83, "learning_rate": 0.0001759853388321353, "loss": 0.0158, "step": 318950 }, { "epoch": 0.83, "learning_rate": 0.00017598145061576385, "loss": 0.0117, "step": 318960 }, { "epoch": 0.83, "learning_rate": 0.0001759775623993924, "loss": 0.0119, "step": 318970 }, { "epoch": 0.83, "learning_rate": 0.0001759736741830209, "loss": 0.0127, "step": 318980 }, { "epoch": 0.83, "learning_rate": 0.00017596978596664945, "loss": 0.0135, "step": 318990 }, { "epoch": 0.83, "learning_rate": 0.000175965897750278, "loss": 0.0133, "step": 319000 }, { "epoch": 0.83, "eval_cer": 0.8817096845078387, "eval_loss": 0.00930393859744072, "eval_runtime": 107.7238, "eval_samples_per_second": 18.566, "eval_steps_per_second": 4.641, "step": 319000 }, { "epoch": 0.83, "learning_rate": 0.00017596200953390654, "loss": 0.0146, "step": 319010 }, { "epoch": 0.83, "learning_rate": 0.00017595812131753505, "loss": 0.0205, "step": 319020 }, { "epoch": 0.83, "learning_rate": 0.0001759542331011636, "loss": 0.0136, "step": 319030 }, { "epoch": 0.83, "learning_rate": 0.00017595034488479216, "loss": 0.0117, "step": 319040 }, { "epoch": 0.83, "learning_rate": 0.00017594645666842067, "loss": 0.0155, "step": 319050 }, { "epoch": 0.83, "learning_rate": 0.00017594256845204922, "loss": 0.0166, "step": 319060 }, { "epoch": 0.83, "learning_rate": 0.00017593868023567773, "loss": 0.0159, "step": 319070 }, { "epoch": 0.83, "learning_rate": 0.00017593479201930625, "loss": 0.0149, "step": 319080 }, { "epoch": 0.83, "learning_rate": 0.00017593090380293481, "loss": 0.0163, "step": 319090 }, { "epoch": 0.83, "learning_rate": 0.00017592701558656336, "loss": 0.0121, "step": 319100 }, { "epoch": 0.83, "learning_rate": 0.00017592312737019187, "loss": 0.0118, "step": 319110 }, { "epoch": 0.83, "learning_rate": 0.0001759192391538204, "loss": 0.0177, "step": 319120 }, { "epoch": 0.83, "learning_rate": 0.00017591535093744895, "loss": 0.015, "step": 319130 }, { "epoch": 0.83, "learning_rate": 0.0001759114627210775, "loss": 0.0112, "step": 319140 }, { "epoch": 0.83, "learning_rate": 0.000175907574504706, "loss": 0.0134, "step": 319150 }, { "epoch": 0.83, "learning_rate": 0.00017590368628833455, "loss": 0.0119, "step": 319160 }, { "epoch": 0.83, "learning_rate": 0.0001758997980719631, "loss": 0.0115, "step": 319170 }, { "epoch": 0.83, "learning_rate": 0.00017589590985559163, "loss": 0.0136, "step": 319180 }, { "epoch": 0.83, "learning_rate": 0.00017589202163922015, "loss": 0.0169, "step": 319190 }, { "epoch": 0.83, "learning_rate": 0.0001758881334228487, "loss": 0.0129, "step": 319200 }, { "epoch": 0.83, "learning_rate": 0.00017588424520647726, "loss": 0.0168, "step": 319210 }, { "epoch": 0.83, "learning_rate": 0.00017588035699010577, "loss": 0.0131, "step": 319220 }, { "epoch": 0.83, "learning_rate": 0.00017587646877373432, "loss": 0.0144, "step": 319230 }, { "epoch": 0.83, "learning_rate": 0.00017587258055736283, "loss": 0.0148, "step": 319240 }, { "epoch": 0.83, "learning_rate": 0.0001758686923409914, "loss": 0.0159, "step": 319250 }, { "epoch": 0.83, "learning_rate": 0.00017586480412461991, "loss": 0.0099, "step": 319260 }, { "epoch": 0.83, "learning_rate": 0.00017586091590824846, "loss": 0.0125, "step": 319270 }, { "epoch": 0.83, "learning_rate": 0.00017585702769187697, "loss": 0.0147, "step": 319280 }, { "epoch": 0.83, "learning_rate": 0.00017585313947550554, "loss": 0.0126, "step": 319290 }, { "epoch": 0.83, "learning_rate": 0.00017584925125913405, "loss": 0.0157, "step": 319300 }, { "epoch": 0.83, "learning_rate": 0.0001758453630427626, "loss": 0.0167, "step": 319310 }, { "epoch": 0.83, "learning_rate": 0.0001758414748263911, "loss": 0.0128, "step": 319320 }, { "epoch": 0.83, "learning_rate": 0.00017583758661001965, "loss": 0.0199, "step": 319330 }, { "epoch": 0.83, "learning_rate": 0.0001758336983936482, "loss": 0.0162, "step": 319340 }, { "epoch": 0.83, "learning_rate": 0.00017582981017727673, "loss": 0.0136, "step": 319350 }, { "epoch": 0.83, "learning_rate": 0.00017582592196090525, "loss": 0.0108, "step": 319360 }, { "epoch": 0.83, "learning_rate": 0.0001758220337445338, "loss": 0.0162, "step": 319370 }, { "epoch": 0.83, "learning_rate": 0.00017581814552816236, "loss": 0.0158, "step": 319380 }, { "epoch": 0.83, "learning_rate": 0.00017581425731179087, "loss": 0.0129, "step": 319390 }, { "epoch": 0.83, "learning_rate": 0.0001758103690954194, "loss": 0.0128, "step": 319400 }, { "epoch": 0.83, "learning_rate": 0.00017580648087904793, "loss": 0.0127, "step": 319410 }, { "epoch": 0.83, "learning_rate": 0.0001758025926626765, "loss": 0.011, "step": 319420 }, { "epoch": 0.83, "learning_rate": 0.000175798704446305, "loss": 0.0126, "step": 319430 }, { "epoch": 0.83, "learning_rate": 0.00017579481622993355, "loss": 0.0105, "step": 319440 }, { "epoch": 0.83, "learning_rate": 0.00017579092801356207, "loss": 0.0147, "step": 319450 }, { "epoch": 0.83, "learning_rate": 0.00017578703979719064, "loss": 0.0139, "step": 319460 }, { "epoch": 0.83, "learning_rate": 0.00017578315158081915, "loss": 0.0113, "step": 319470 }, { "epoch": 0.83, "learning_rate": 0.0001757792633644477, "loss": 0.0197, "step": 319480 }, { "epoch": 0.83, "learning_rate": 0.0001757753751480762, "loss": 0.014, "step": 319490 }, { "epoch": 0.83, "learning_rate": 0.00017577148693170478, "loss": 0.0108, "step": 319500 }, { "epoch": 0.83, "learning_rate": 0.0001757675987153333, "loss": 0.0131, "step": 319510 }, { "epoch": 0.83, "learning_rate": 0.00017576371049896183, "loss": 0.0108, "step": 319520 }, { "epoch": 0.83, "learning_rate": 0.00017575982228259035, "loss": 0.0146, "step": 319530 }, { "epoch": 0.83, "learning_rate": 0.00017575593406621892, "loss": 0.0147, "step": 319540 }, { "epoch": 0.83, "learning_rate": 0.00017575204584984743, "loss": 0.0151, "step": 319550 }, { "epoch": 0.83, "learning_rate": 0.00017574815763347597, "loss": 0.0132, "step": 319560 }, { "epoch": 0.83, "learning_rate": 0.0001757442694171045, "loss": 0.0137, "step": 319570 }, { "epoch": 0.83, "learning_rate": 0.00017574038120073303, "loss": 0.0116, "step": 319580 }, { "epoch": 0.83, "learning_rate": 0.0001757364929843616, "loss": 0.0148, "step": 319590 }, { "epoch": 0.83, "learning_rate": 0.0001757326047679901, "loss": 0.0193, "step": 319600 }, { "epoch": 0.83, "learning_rate": 0.00017572871655161865, "loss": 0.013, "step": 319610 }, { "epoch": 0.83, "learning_rate": 0.00017572482833524717, "loss": 0.0124, "step": 319620 }, { "epoch": 0.83, "learning_rate": 0.00017572094011887574, "loss": 0.0104, "step": 319630 }, { "epoch": 0.83, "learning_rate": 0.00017571705190250425, "loss": 0.0166, "step": 319640 }, { "epoch": 0.83, "learning_rate": 0.0001757131636861328, "loss": 0.0149, "step": 319650 }, { "epoch": 0.83, "learning_rate": 0.0001757092754697613, "loss": 0.0123, "step": 319660 }, { "epoch": 0.83, "learning_rate": 0.00017570538725338988, "loss": 0.0156, "step": 319670 }, { "epoch": 0.83, "learning_rate": 0.0001757014990370184, "loss": 0.0144, "step": 319680 }, { "epoch": 0.83, "learning_rate": 0.00017569761082064693, "loss": 0.0122, "step": 319690 }, { "epoch": 0.83, "learning_rate": 0.00017569372260427545, "loss": 0.011, "step": 319700 }, { "epoch": 0.83, "learning_rate": 0.00017568983438790402, "loss": 0.0139, "step": 319710 }, { "epoch": 0.83, "learning_rate": 0.00017568594617153253, "loss": 0.0105, "step": 319720 }, { "epoch": 0.83, "learning_rate": 0.00017568205795516107, "loss": 0.013, "step": 319730 }, { "epoch": 0.83, "learning_rate": 0.0001756781697387896, "loss": 0.016, "step": 319740 }, { "epoch": 0.83, "learning_rate": 0.00017567428152241816, "loss": 0.0131, "step": 319750 }, { "epoch": 0.83, "learning_rate": 0.0001756703933060467, "loss": 0.0144, "step": 319760 }, { "epoch": 0.83, "learning_rate": 0.0001756665050896752, "loss": 0.0129, "step": 319770 }, { "epoch": 0.83, "learning_rate": 0.00017566261687330375, "loss": 0.0207, "step": 319780 }, { "epoch": 0.83, "learning_rate": 0.0001756587286569323, "loss": 0.0124, "step": 319790 }, { "epoch": 0.83, "learning_rate": 0.00017565484044056084, "loss": 0.0164, "step": 319800 }, { "epoch": 0.83, "learning_rate": 0.00017565095222418935, "loss": 0.01, "step": 319810 }, { "epoch": 0.83, "learning_rate": 0.0001756470640078179, "loss": 0.0173, "step": 319820 }, { "epoch": 0.83, "learning_rate": 0.0001756431757914464, "loss": 0.0167, "step": 319830 }, { "epoch": 0.83, "learning_rate": 0.00017563928757507498, "loss": 0.0124, "step": 319840 }, { "epoch": 0.83, "learning_rate": 0.0001756353993587035, "loss": 0.0158, "step": 319850 }, { "epoch": 0.83, "learning_rate": 0.00017563151114233203, "loss": 0.0146, "step": 319860 }, { "epoch": 0.83, "learning_rate": 0.00017562762292596055, "loss": 0.014, "step": 319870 }, { "epoch": 0.83, "learning_rate": 0.00017562373470958912, "loss": 0.0206, "step": 319880 }, { "epoch": 0.83, "learning_rate": 0.00017561984649321763, "loss": 0.0133, "step": 319890 }, { "epoch": 0.83, "learning_rate": 0.00017561595827684617, "loss": 0.0119, "step": 319900 }, { "epoch": 0.83, "learning_rate": 0.00017561207006047469, "loss": 0.0111, "step": 319910 }, { "epoch": 0.83, "learning_rate": 0.00017560818184410326, "loss": 0.0141, "step": 319920 }, { "epoch": 0.83, "learning_rate": 0.0001756042936277318, "loss": 0.0159, "step": 319930 }, { "epoch": 0.83, "learning_rate": 0.0001756004054113603, "loss": 0.013, "step": 319940 }, { "epoch": 0.83, "learning_rate": 0.00017559651719498885, "loss": 0.0123, "step": 319950 }, { "epoch": 0.83, "learning_rate": 0.0001755926289786174, "loss": 0.0135, "step": 319960 }, { "epoch": 0.83, "learning_rate": 0.00017558874076224594, "loss": 0.0127, "step": 319970 }, { "epoch": 0.83, "learning_rate": 0.00017558485254587445, "loss": 0.0161, "step": 319980 }, { "epoch": 0.83, "learning_rate": 0.000175580964329503, "loss": 0.0119, "step": 319990 }, { "epoch": 0.83, "learning_rate": 0.00017557707611313153, "loss": 0.0151, "step": 320000 }, { "epoch": 0.83, "eval_cer": 0.8816998870492994, "eval_loss": 0.009145650081336498, "eval_runtime": 107.5595, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 320000 }, { "epoch": 0.83, "learning_rate": 0.00017557318789676008, "loss": 0.014, "step": 320010 }, { "epoch": 0.83, "learning_rate": 0.0001755692996803886, "loss": 0.0102, "step": 320020 }, { "epoch": 0.83, "learning_rate": 0.00017556541146401713, "loss": 0.0166, "step": 320030 }, { "epoch": 0.83, "learning_rate": 0.00017556152324764567, "loss": 0.0124, "step": 320040 }, { "epoch": 0.83, "learning_rate": 0.00017555763503127422, "loss": 0.012, "step": 320050 }, { "epoch": 0.83, "learning_rate": 0.00017555374681490273, "loss": 0.0132, "step": 320060 }, { "epoch": 0.83, "learning_rate": 0.00017554985859853127, "loss": 0.0173, "step": 320070 }, { "epoch": 0.83, "learning_rate": 0.00017554597038215979, "loss": 0.0112, "step": 320080 }, { "epoch": 0.83, "learning_rate": 0.00017554208216578835, "loss": 0.0141, "step": 320090 }, { "epoch": 0.83, "learning_rate": 0.0001755381939494169, "loss": 0.0148, "step": 320100 }, { "epoch": 0.83, "learning_rate": 0.0001755343057330454, "loss": 0.0146, "step": 320110 }, { "epoch": 0.83, "learning_rate": 0.00017553041751667393, "loss": 0.0164, "step": 320120 }, { "epoch": 0.83, "learning_rate": 0.0001755265293003025, "loss": 0.0116, "step": 320130 }, { "epoch": 0.83, "learning_rate": 0.00017552264108393104, "loss": 0.0162, "step": 320140 }, { "epoch": 0.83, "learning_rate": 0.00017551875286755955, "loss": 0.0125, "step": 320150 }, { "epoch": 0.83, "learning_rate": 0.0001755148646511881, "loss": 0.0128, "step": 320160 }, { "epoch": 0.83, "learning_rate": 0.00017551097643481663, "loss": 0.012, "step": 320170 }, { "epoch": 0.83, "learning_rate": 0.00017550708821844518, "loss": 0.0136, "step": 320180 }, { "epoch": 0.83, "learning_rate": 0.0001755032000020737, "loss": 0.013, "step": 320190 }, { "epoch": 0.83, "learning_rate": 0.00017549931178570223, "loss": 0.0134, "step": 320200 }, { "epoch": 0.83, "learning_rate": 0.00017549542356933077, "loss": 0.0124, "step": 320210 }, { "epoch": 0.83, "learning_rate": 0.00017549153535295931, "loss": 0.0173, "step": 320220 }, { "epoch": 0.83, "learning_rate": 0.00017548764713658783, "loss": 0.0169, "step": 320230 }, { "epoch": 0.83, "learning_rate": 0.00017548375892021637, "loss": 0.0116, "step": 320240 }, { "epoch": 0.83, "learning_rate": 0.00017547987070384494, "loss": 0.0156, "step": 320250 }, { "epoch": 0.83, "learning_rate": 0.00017547598248747345, "loss": 0.0121, "step": 320260 }, { "epoch": 0.83, "learning_rate": 0.00017547209427110197, "loss": 0.0104, "step": 320270 }, { "epoch": 0.83, "learning_rate": 0.0001754682060547305, "loss": 0.0146, "step": 320280 }, { "epoch": 0.83, "learning_rate": 0.00017546431783835908, "loss": 0.0134, "step": 320290 }, { "epoch": 0.83, "learning_rate": 0.0001754604296219876, "loss": 0.0134, "step": 320300 }, { "epoch": 0.83, "learning_rate": 0.00017545654140561614, "loss": 0.0121, "step": 320310 }, { "epoch": 0.83, "learning_rate": 0.00017545265318924465, "loss": 0.0171, "step": 320320 }, { "epoch": 0.83, "learning_rate": 0.0001754487649728732, "loss": 0.0172, "step": 320330 }, { "epoch": 0.83, "learning_rate": 0.00017544487675650173, "loss": 0.0131, "step": 320340 }, { "epoch": 0.83, "learning_rate": 0.00017544098854013027, "loss": 0.0133, "step": 320350 }, { "epoch": 0.83, "learning_rate": 0.0001754371003237588, "loss": 0.0138, "step": 320360 }, { "epoch": 0.83, "learning_rate": 0.00017543321210738733, "loss": 0.0122, "step": 320370 }, { "epoch": 0.83, "learning_rate": 0.00017542932389101587, "loss": 0.0143, "step": 320380 }, { "epoch": 0.83, "learning_rate": 0.00017542543567464441, "loss": 0.0183, "step": 320390 }, { "epoch": 0.83, "learning_rate": 0.00017542154745827293, "loss": 0.0126, "step": 320400 }, { "epoch": 0.83, "learning_rate": 0.00017541765924190147, "loss": 0.0166, "step": 320410 }, { "epoch": 0.83, "learning_rate": 0.00017541377102553004, "loss": 0.0156, "step": 320420 }, { "epoch": 0.83, "learning_rate": 0.00017540988280915855, "loss": 0.0106, "step": 320430 }, { "epoch": 0.83, "learning_rate": 0.00017540599459278707, "loss": 0.0136, "step": 320440 }, { "epoch": 0.83, "learning_rate": 0.0001754021063764156, "loss": 0.0122, "step": 320450 }, { "epoch": 0.83, "learning_rate": 0.00017539821816004418, "loss": 0.0106, "step": 320460 }, { "epoch": 0.83, "learning_rate": 0.0001753943299436727, "loss": 0.0145, "step": 320470 }, { "epoch": 0.83, "learning_rate": 0.00017539044172730123, "loss": 0.0152, "step": 320480 }, { "epoch": 0.83, "learning_rate": 0.00017538655351092975, "loss": 0.0129, "step": 320490 }, { "epoch": 0.83, "learning_rate": 0.00017538266529455832, "loss": 0.0118, "step": 320500 }, { "epoch": 0.83, "learning_rate": 0.00017537877707818683, "loss": 0.015, "step": 320510 }, { "epoch": 0.83, "learning_rate": 0.00017537488886181537, "loss": 0.0161, "step": 320520 }, { "epoch": 0.83, "learning_rate": 0.0001753710006454439, "loss": 0.0157, "step": 320530 }, { "epoch": 0.83, "learning_rate": 0.00017536711242907246, "loss": 0.0187, "step": 320540 }, { "epoch": 0.83, "learning_rate": 0.00017536322421270097, "loss": 0.0165, "step": 320550 }, { "epoch": 0.83, "learning_rate": 0.0001753593359963295, "loss": 0.0154, "step": 320560 }, { "epoch": 0.83, "learning_rate": 0.00017535544777995803, "loss": 0.0126, "step": 320570 }, { "epoch": 0.83, "learning_rate": 0.00017535155956358657, "loss": 0.0151, "step": 320580 }, { "epoch": 0.83, "learning_rate": 0.0001753476713472151, "loss": 0.0114, "step": 320590 }, { "epoch": 0.83, "learning_rate": 0.00017534378313084365, "loss": 0.0117, "step": 320600 }, { "epoch": 0.83, "learning_rate": 0.00017533989491447217, "loss": 0.019, "step": 320610 }, { "epoch": 0.83, "learning_rate": 0.0001753360066981007, "loss": 0.0184, "step": 320620 }, { "epoch": 0.83, "learning_rate": 0.00017533211848172928, "loss": 0.0134, "step": 320630 }, { "epoch": 0.83, "learning_rate": 0.0001753282302653578, "loss": 0.0127, "step": 320640 }, { "epoch": 0.83, "learning_rate": 0.00017532434204898633, "loss": 0.0115, "step": 320650 }, { "epoch": 0.83, "learning_rate": 0.00017532045383261485, "loss": 0.0096, "step": 320660 }, { "epoch": 0.83, "learning_rate": 0.00017531656561624342, "loss": 0.0135, "step": 320670 }, { "epoch": 0.83, "learning_rate": 0.00017531267739987193, "loss": 0.0112, "step": 320680 }, { "epoch": 0.83, "learning_rate": 0.00017530878918350047, "loss": 0.0159, "step": 320690 }, { "epoch": 0.83, "learning_rate": 0.000175304900967129, "loss": 0.013, "step": 320700 }, { "epoch": 0.83, "learning_rate": 0.00017530101275075756, "loss": 0.021, "step": 320710 }, { "epoch": 0.83, "learning_rate": 0.00017529712453438607, "loss": 0.0166, "step": 320720 }, { "epoch": 0.83, "learning_rate": 0.0001752932363180146, "loss": 0.0133, "step": 320730 }, { "epoch": 0.83, "learning_rate": 0.00017528934810164313, "loss": 0.0129, "step": 320740 }, { "epoch": 0.83, "learning_rate": 0.0001752854598852717, "loss": 0.0173, "step": 320750 }, { "epoch": 0.83, "learning_rate": 0.0001752815716689002, "loss": 0.0157, "step": 320760 }, { "epoch": 0.83, "learning_rate": 0.00017527768345252875, "loss": 0.0123, "step": 320770 }, { "epoch": 0.83, "learning_rate": 0.00017527379523615727, "loss": 0.0144, "step": 320780 }, { "epoch": 0.83, "learning_rate": 0.00017526990701978584, "loss": 0.0136, "step": 320790 }, { "epoch": 0.83, "learning_rate": 0.00017526601880341438, "loss": 0.015, "step": 320800 }, { "epoch": 0.83, "learning_rate": 0.0001752621305870429, "loss": 0.0145, "step": 320810 }, { "epoch": 0.83, "learning_rate": 0.00017525824237067143, "loss": 0.013, "step": 320820 }, { "epoch": 0.83, "learning_rate": 0.00017525435415429995, "loss": 0.0154, "step": 320830 }, { "epoch": 0.83, "learning_rate": 0.00017525046593792852, "loss": 0.0176, "step": 320840 }, { "epoch": 0.83, "learning_rate": 0.00017524657772155703, "loss": 0.0174, "step": 320850 }, { "epoch": 0.83, "learning_rate": 0.00017524268950518557, "loss": 0.0133, "step": 320860 }, { "epoch": 0.83, "learning_rate": 0.0001752388012888141, "loss": 0.0142, "step": 320870 }, { "epoch": 0.83, "learning_rate": 0.00017523491307244266, "loss": 0.0146, "step": 320880 }, { "epoch": 0.83, "learning_rate": 0.00017523102485607117, "loss": 0.0136, "step": 320890 }, { "epoch": 0.83, "learning_rate": 0.0001752271366396997, "loss": 0.0134, "step": 320900 }, { "epoch": 0.83, "learning_rate": 0.00017522324842332823, "loss": 0.0134, "step": 320910 }, { "epoch": 0.83, "learning_rate": 0.0001752193602069568, "loss": 0.0109, "step": 320920 }, { "epoch": 0.83, "learning_rate": 0.0001752154719905853, "loss": 0.0143, "step": 320930 }, { "epoch": 0.83, "learning_rate": 0.00017521158377421385, "loss": 0.0123, "step": 320940 }, { "epoch": 0.83, "learning_rate": 0.00017520769555784237, "loss": 0.0152, "step": 320950 }, { "epoch": 0.83, "learning_rate": 0.00017520380734147093, "loss": 0.0146, "step": 320960 }, { "epoch": 0.83, "learning_rate": 0.00017519991912509948, "loss": 0.0112, "step": 320970 }, { "epoch": 0.83, "learning_rate": 0.000175196030908728, "loss": 0.0145, "step": 320980 }, { "epoch": 0.83, "learning_rate": 0.0001751921426923565, "loss": 0.0135, "step": 320990 }, { "epoch": 0.83, "learning_rate": 0.00017518825447598507, "loss": 0.0112, "step": 321000 }, { "epoch": 0.83, "eval_cer": 0.8816914892276944, "eval_loss": 0.00950040016323328, "eval_runtime": 107.7703, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.639, "step": 321000 }, { "epoch": 0.83, "learning_rate": 0.00017518436625961362, "loss": 0.0165, "step": 321010 }, { "epoch": 0.83, "learning_rate": 0.00017518047804324213, "loss": 0.0115, "step": 321020 }, { "epoch": 0.83, "learning_rate": 0.00017517658982687067, "loss": 0.0124, "step": 321030 }, { "epoch": 0.83, "learning_rate": 0.00017517270161049921, "loss": 0.0176, "step": 321040 }, { "epoch": 0.83, "learning_rate": 0.00017516881339412776, "loss": 0.0146, "step": 321050 }, { "epoch": 0.83, "learning_rate": 0.00017516492517775627, "loss": 0.0112, "step": 321060 }, { "epoch": 0.83, "learning_rate": 0.0001751610369613848, "loss": 0.0129, "step": 321070 }, { "epoch": 0.83, "learning_rate": 0.00017515714874501333, "loss": 0.0111, "step": 321080 }, { "epoch": 0.83, "learning_rate": 0.0001751532605286419, "loss": 0.0121, "step": 321090 }, { "epoch": 0.83, "learning_rate": 0.0001751493723122704, "loss": 0.0152, "step": 321100 }, { "epoch": 0.83, "learning_rate": 0.00017514548409589895, "loss": 0.0129, "step": 321110 }, { "epoch": 0.83, "learning_rate": 0.00017514159587952747, "loss": 0.0136, "step": 321120 }, { "epoch": 0.83, "learning_rate": 0.00017513770766315603, "loss": 0.0129, "step": 321130 }, { "epoch": 0.83, "learning_rate": 0.00017513381944678455, "loss": 0.0133, "step": 321140 }, { "epoch": 0.83, "learning_rate": 0.0001751299312304131, "loss": 0.0117, "step": 321150 }, { "epoch": 0.83, "learning_rate": 0.0001751260430140416, "loss": 0.0164, "step": 321160 }, { "epoch": 0.83, "learning_rate": 0.00017512215479767017, "loss": 0.0122, "step": 321170 }, { "epoch": 0.83, "learning_rate": 0.00017511826658129872, "loss": 0.0097, "step": 321180 }, { "epoch": 0.83, "learning_rate": 0.00017511437836492723, "loss": 0.0243, "step": 321190 }, { "epoch": 0.83, "learning_rate": 0.00017511049014855577, "loss": 0.015, "step": 321200 }, { "epoch": 0.83, "learning_rate": 0.0001751066019321843, "loss": 0.0127, "step": 321210 }, { "epoch": 0.83, "learning_rate": 0.00017510271371581285, "loss": 0.0108, "step": 321220 }, { "epoch": 0.83, "learning_rate": 0.00017509882549944137, "loss": 0.0119, "step": 321230 }, { "epoch": 0.83, "learning_rate": 0.0001750949372830699, "loss": 0.014, "step": 321240 }, { "epoch": 0.83, "learning_rate": 0.00017509104906669845, "loss": 0.0114, "step": 321250 }, { "epoch": 0.83, "learning_rate": 0.000175087160850327, "loss": 0.0123, "step": 321260 }, { "epoch": 0.83, "learning_rate": 0.0001750832726339555, "loss": 0.0142, "step": 321270 }, { "epoch": 0.83, "learning_rate": 0.00017507938441758405, "loss": 0.0121, "step": 321280 }, { "epoch": 0.83, "learning_rate": 0.00017507549620121262, "loss": 0.0134, "step": 321290 }, { "epoch": 0.83, "learning_rate": 0.00017507160798484113, "loss": 0.0142, "step": 321300 }, { "epoch": 0.83, "learning_rate": 0.00017506771976846965, "loss": 0.0114, "step": 321310 }, { "epoch": 0.83, "learning_rate": 0.0001750638315520982, "loss": 0.0124, "step": 321320 }, { "epoch": 0.83, "learning_rate": 0.0001750599433357267, "loss": 0.0113, "step": 321330 }, { "epoch": 0.83, "learning_rate": 0.00017505605511935527, "loss": 0.0143, "step": 321340 }, { "epoch": 0.83, "learning_rate": 0.00017505216690298381, "loss": 0.0131, "step": 321350 }, { "epoch": 0.83, "learning_rate": 0.00017504827868661233, "loss": 0.0127, "step": 321360 }, { "epoch": 0.83, "learning_rate": 0.00017504439047024087, "loss": 0.0171, "step": 321370 }, { "epoch": 0.83, "learning_rate": 0.0001750405022538694, "loss": 0.0136, "step": 321380 }, { "epoch": 0.83, "learning_rate": 0.00017503661403749795, "loss": 0.0179, "step": 321390 }, { "epoch": 0.83, "learning_rate": 0.00017503272582112647, "loss": 0.0112, "step": 321400 }, { "epoch": 0.83, "learning_rate": 0.000175028837604755, "loss": 0.0152, "step": 321410 }, { "epoch": 0.83, "learning_rate": 0.00017502494938838355, "loss": 0.0098, "step": 321420 }, { "epoch": 0.83, "learning_rate": 0.0001750210611720121, "loss": 0.0146, "step": 321430 }, { "epoch": 0.83, "learning_rate": 0.0001750171729556406, "loss": 0.0137, "step": 321440 }, { "epoch": 0.83, "learning_rate": 0.00017501328473926915, "loss": 0.0159, "step": 321450 }, { "epoch": 0.83, "learning_rate": 0.0001750093965228977, "loss": 0.0121, "step": 321460 }, { "epoch": 0.83, "learning_rate": 0.00017500550830652623, "loss": 0.0169, "step": 321470 }, { "epoch": 0.83, "learning_rate": 0.00017500162009015475, "loss": 0.0121, "step": 321480 }, { "epoch": 0.83, "learning_rate": 0.0001749977318737833, "loss": 0.0133, "step": 321490 }, { "epoch": 0.83, "learning_rate": 0.00017499384365741186, "loss": 0.0158, "step": 321500 }, { "epoch": 0.83, "learning_rate": 0.00017498995544104037, "loss": 0.0143, "step": 321510 }, { "epoch": 0.83, "learning_rate": 0.00017498606722466891, "loss": 0.0132, "step": 321520 }, { "epoch": 0.83, "learning_rate": 0.00017498217900829743, "loss": 0.0145, "step": 321530 }, { "epoch": 0.83, "learning_rate": 0.000174978290791926, "loss": 0.0147, "step": 321540 }, { "epoch": 0.83, "learning_rate": 0.0001749744025755545, "loss": 0.0144, "step": 321550 }, { "epoch": 0.83, "learning_rate": 0.00017497051435918305, "loss": 0.0168, "step": 321560 }, { "epoch": 0.83, "learning_rate": 0.00017496662614281157, "loss": 0.017, "step": 321570 }, { "epoch": 0.83, "learning_rate": 0.0001749627379264401, "loss": 0.012, "step": 321580 }, { "epoch": 0.83, "learning_rate": 0.00017495884971006865, "loss": 0.0112, "step": 321590 }, { "epoch": 0.83, "learning_rate": 0.0001749549614936972, "loss": 0.0193, "step": 321600 }, { "epoch": 0.83, "learning_rate": 0.0001749510732773257, "loss": 0.012, "step": 321610 }, { "epoch": 0.83, "learning_rate": 0.00017494718506095425, "loss": 0.0178, "step": 321620 }, { "epoch": 0.83, "learning_rate": 0.0001749432968445828, "loss": 0.0129, "step": 321630 }, { "epoch": 0.83, "learning_rate": 0.00017493940862821133, "loss": 0.0131, "step": 321640 }, { "epoch": 0.83, "learning_rate": 0.00017493552041183985, "loss": 0.0186, "step": 321650 }, { "epoch": 0.83, "learning_rate": 0.0001749316321954684, "loss": 0.0121, "step": 321660 }, { "epoch": 0.83, "learning_rate": 0.00017492774397909696, "loss": 0.0153, "step": 321670 }, { "epoch": 0.83, "learning_rate": 0.00017492385576272547, "loss": 0.0136, "step": 321680 }, { "epoch": 0.83, "learning_rate": 0.00017491996754635401, "loss": 0.0129, "step": 321690 }, { "epoch": 0.83, "learning_rate": 0.00017491607932998253, "loss": 0.0138, "step": 321700 }, { "epoch": 0.83, "learning_rate": 0.0001749121911136111, "loss": 0.016, "step": 321710 }, { "epoch": 0.83, "learning_rate": 0.0001749083028972396, "loss": 0.0115, "step": 321720 }, { "epoch": 0.83, "learning_rate": 0.00017490441468086815, "loss": 0.0144, "step": 321730 }, { "epoch": 0.83, "learning_rate": 0.00017490052646449667, "loss": 0.0156, "step": 321740 }, { "epoch": 0.83, "learning_rate": 0.00017489663824812524, "loss": 0.0135, "step": 321750 }, { "epoch": 0.83, "learning_rate": 0.00017489275003175375, "loss": 0.0136, "step": 321760 }, { "epoch": 0.83, "learning_rate": 0.0001748888618153823, "loss": 0.0125, "step": 321770 }, { "epoch": 0.83, "learning_rate": 0.0001748849735990108, "loss": 0.0133, "step": 321780 }, { "epoch": 0.83, "learning_rate": 0.00017488108538263938, "loss": 0.0137, "step": 321790 }, { "epoch": 0.83, "learning_rate": 0.0001748771971662679, "loss": 0.0116, "step": 321800 }, { "epoch": 0.83, "learning_rate": 0.00017487330894989643, "loss": 0.0137, "step": 321810 }, { "epoch": 0.83, "learning_rate": 0.00017486942073352495, "loss": 0.0121, "step": 321820 }, { "epoch": 0.83, "learning_rate": 0.0001748655325171535, "loss": 0.0122, "step": 321830 }, { "epoch": 0.83, "learning_rate": 0.00017486164430078206, "loss": 0.0094, "step": 321840 }, { "epoch": 0.83, "learning_rate": 0.00017485775608441057, "loss": 0.0167, "step": 321850 }, { "epoch": 0.83, "learning_rate": 0.00017485386786803909, "loss": 0.0129, "step": 321860 }, { "epoch": 0.83, "learning_rate": 0.00017484997965166763, "loss": 0.0129, "step": 321870 }, { "epoch": 0.83, "learning_rate": 0.0001748460914352962, "loss": 0.0107, "step": 321880 }, { "epoch": 0.83, "learning_rate": 0.0001748422032189247, "loss": 0.0138, "step": 321890 }, { "epoch": 0.83, "learning_rate": 0.00017483831500255325, "loss": 0.0174, "step": 321900 }, { "epoch": 0.83, "learning_rate": 0.00017483442678618177, "loss": 0.013, "step": 321910 }, { "epoch": 0.83, "learning_rate": 0.00017483053856981034, "loss": 0.0128, "step": 321920 }, { "epoch": 0.83, "learning_rate": 0.00017482665035343885, "loss": 0.0138, "step": 321930 }, { "epoch": 0.83, "learning_rate": 0.0001748227621370674, "loss": 0.0163, "step": 321940 }, { "epoch": 0.83, "learning_rate": 0.0001748188739206959, "loss": 0.0124, "step": 321950 }, { "epoch": 0.83, "learning_rate": 0.00017481498570432448, "loss": 0.015, "step": 321960 }, { "epoch": 0.83, "learning_rate": 0.000174811097487953, "loss": 0.0147, "step": 321970 }, { "epoch": 0.83, "learning_rate": 0.00017480720927158153, "loss": 0.0116, "step": 321980 }, { "epoch": 0.83, "learning_rate": 0.00017480332105521005, "loss": 0.0123, "step": 321990 }, { "epoch": 0.83, "learning_rate": 0.00017479943283883861, "loss": 0.0118, "step": 322000 }, { "epoch": 0.83, "eval_cer": 0.8817208816033121, "eval_loss": 0.00928072165697813, "eval_runtime": 107.7164, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 322000 }, { "epoch": 0.83, "learning_rate": 0.00017479554462246716, "loss": 0.0122, "step": 322010 }, { "epoch": 0.83, "learning_rate": 0.00017479165640609567, "loss": 0.0135, "step": 322020 }, { "epoch": 0.83, "learning_rate": 0.00017478776818972419, "loss": 0.0153, "step": 322030 }, { "epoch": 0.83, "learning_rate": 0.00017478387997335275, "loss": 0.0143, "step": 322040 }, { "epoch": 0.83, "learning_rate": 0.0001747799917569813, "loss": 0.0099, "step": 322050 }, { "epoch": 0.83, "learning_rate": 0.0001747761035406098, "loss": 0.0157, "step": 322060 }, { "epoch": 0.83, "learning_rate": 0.00017477221532423835, "loss": 0.0159, "step": 322070 }, { "epoch": 0.83, "learning_rate": 0.00017476832710786687, "loss": 0.0146, "step": 322080 }, { "epoch": 0.83, "learning_rate": 0.00017476443889149544, "loss": 0.0118, "step": 322090 }, { "epoch": 0.83, "learning_rate": 0.00017476055067512395, "loss": 0.0115, "step": 322100 }, { "epoch": 0.83, "learning_rate": 0.0001747566624587525, "loss": 0.0104, "step": 322110 }, { "epoch": 0.83, "learning_rate": 0.000174752774242381, "loss": 0.0151, "step": 322120 }, { "epoch": 0.84, "learning_rate": 0.00017474888602600957, "loss": 0.015, "step": 322130 }, { "epoch": 0.84, "learning_rate": 0.0001747449978096381, "loss": 0.0112, "step": 322140 }, { "epoch": 0.84, "learning_rate": 0.00017474110959326663, "loss": 0.0136, "step": 322150 }, { "epoch": 0.84, "learning_rate": 0.00017473722137689515, "loss": 0.0151, "step": 322160 }, { "epoch": 0.84, "learning_rate": 0.00017473333316052371, "loss": 0.0115, "step": 322170 }, { "epoch": 0.84, "learning_rate": 0.00017472944494415223, "loss": 0.0194, "step": 322180 }, { "epoch": 0.84, "learning_rate": 0.00017472555672778077, "loss": 0.0121, "step": 322190 }, { "epoch": 0.84, "learning_rate": 0.00017472166851140928, "loss": 0.016, "step": 322200 }, { "epoch": 0.84, "learning_rate": 0.00017471778029503785, "loss": 0.0105, "step": 322210 }, { "epoch": 0.84, "learning_rate": 0.0001747138920786664, "loss": 0.0182, "step": 322220 }, { "epoch": 0.84, "learning_rate": 0.0001747100038622949, "loss": 0.0121, "step": 322230 }, { "epoch": 0.84, "learning_rate": 0.00017470611564592345, "loss": 0.0111, "step": 322240 }, { "epoch": 0.84, "learning_rate": 0.000174702227429552, "loss": 0.0132, "step": 322250 }, { "epoch": 0.84, "learning_rate": 0.00017469833921318053, "loss": 0.0149, "step": 322260 }, { "epoch": 0.84, "learning_rate": 0.00017469445099680905, "loss": 0.0144, "step": 322270 }, { "epoch": 0.84, "learning_rate": 0.0001746905627804376, "loss": 0.0158, "step": 322280 }, { "epoch": 0.84, "learning_rate": 0.00017468667456406613, "loss": 0.0147, "step": 322290 }, { "epoch": 0.84, "learning_rate": 0.00017468278634769467, "loss": 0.0138, "step": 322300 }, { "epoch": 0.84, "learning_rate": 0.0001746788981313232, "loss": 0.0159, "step": 322310 }, { "epoch": 0.84, "learning_rate": 0.00017467500991495173, "loss": 0.0129, "step": 322320 }, { "epoch": 0.84, "learning_rate": 0.00017467112169858024, "loss": 0.015, "step": 322330 }, { "epoch": 0.84, "learning_rate": 0.0001746672334822088, "loss": 0.0162, "step": 322340 }, { "epoch": 0.84, "learning_rate": 0.00017466334526583733, "loss": 0.0154, "step": 322350 }, { "epoch": 0.84, "learning_rate": 0.00017465945704946587, "loss": 0.0136, "step": 322360 }, { "epoch": 0.84, "learning_rate": 0.00017465556883309438, "loss": 0.0136, "step": 322370 }, { "epoch": 0.84, "learning_rate": 0.00017465168061672295, "loss": 0.012, "step": 322380 }, { "epoch": 0.84, "learning_rate": 0.0001746477924003515, "loss": 0.0147, "step": 322390 }, { "epoch": 0.84, "learning_rate": 0.00017464390418398, "loss": 0.0113, "step": 322400 }, { "epoch": 0.84, "learning_rate": 0.00017464001596760855, "loss": 0.0125, "step": 322410 }, { "epoch": 0.84, "learning_rate": 0.0001746361277512371, "loss": 0.0144, "step": 322420 }, { "epoch": 0.84, "learning_rate": 0.00017463223953486563, "loss": 0.0132, "step": 322430 }, { "epoch": 0.84, "learning_rate": 0.00017462835131849415, "loss": 0.011, "step": 322440 }, { "epoch": 0.84, "learning_rate": 0.0001746244631021227, "loss": 0.0139, "step": 322450 }, { "epoch": 0.84, "learning_rate": 0.00017462057488575123, "loss": 0.016, "step": 322460 }, { "epoch": 0.84, "learning_rate": 0.00017461668666937977, "loss": 0.0107, "step": 322470 }, { "epoch": 0.84, "learning_rate": 0.0001746127984530083, "loss": 0.0147, "step": 322480 }, { "epoch": 0.84, "learning_rate": 0.00017460891023663683, "loss": 0.0152, "step": 322490 }, { "epoch": 0.84, "learning_rate": 0.00017460502202026537, "loss": 0.0144, "step": 322500 }, { "epoch": 0.84, "learning_rate": 0.0001746011338038939, "loss": 0.0164, "step": 322510 }, { "epoch": 0.84, "learning_rate": 0.00017459724558752243, "loss": 0.0129, "step": 322520 }, { "epoch": 0.84, "learning_rate": 0.00017459335737115097, "loss": 0.0168, "step": 322530 }, { "epoch": 0.84, "learning_rate": 0.00017458946915477948, "loss": 0.0122, "step": 322540 }, { "epoch": 0.84, "learning_rate": 0.00017458558093840805, "loss": 0.0138, "step": 322550 }, { "epoch": 0.84, "learning_rate": 0.0001745816927220366, "loss": 0.0201, "step": 322560 }, { "epoch": 0.84, "learning_rate": 0.0001745778045056651, "loss": 0.0128, "step": 322570 }, { "epoch": 0.84, "learning_rate": 0.00017457391628929362, "loss": 0.0134, "step": 322580 }, { "epoch": 0.84, "learning_rate": 0.0001745700280729222, "loss": 0.0211, "step": 322590 }, { "epoch": 0.84, "learning_rate": 0.00017456613985655073, "loss": 0.0128, "step": 322600 }, { "epoch": 0.84, "learning_rate": 0.00017456225164017925, "loss": 0.0128, "step": 322610 }, { "epoch": 0.84, "learning_rate": 0.0001745583634238078, "loss": 0.013, "step": 322620 }, { "epoch": 0.84, "learning_rate": 0.00017455447520743633, "loss": 0.0135, "step": 322630 }, { "epoch": 0.84, "learning_rate": 0.00017455058699106487, "loss": 0.0131, "step": 322640 }, { "epoch": 0.84, "learning_rate": 0.0001745466987746934, "loss": 0.0127, "step": 322650 }, { "epoch": 0.84, "learning_rate": 0.00017454281055832193, "loss": 0.014, "step": 322660 }, { "epoch": 0.84, "learning_rate": 0.00017453892234195047, "loss": 0.0122, "step": 322670 }, { "epoch": 0.84, "learning_rate": 0.000174535034125579, "loss": 0.0131, "step": 322680 }, { "epoch": 0.84, "learning_rate": 0.00017453114590920753, "loss": 0.0123, "step": 322690 }, { "epoch": 0.84, "learning_rate": 0.00017452725769283607, "loss": 0.0127, "step": 322700 }, { "epoch": 0.84, "learning_rate": 0.00017452336947646464, "loss": 0.0169, "step": 322710 }, { "epoch": 0.84, "learning_rate": 0.00017451948126009315, "loss": 0.0102, "step": 322720 }, { "epoch": 0.84, "learning_rate": 0.00017451559304372167, "loss": 0.0158, "step": 322730 }, { "epoch": 0.84, "learning_rate": 0.0001745117048273502, "loss": 0.0125, "step": 322740 }, { "epoch": 0.84, "learning_rate": 0.00017450781661097878, "loss": 0.0141, "step": 322750 }, { "epoch": 0.84, "learning_rate": 0.0001745039283946073, "loss": 0.0144, "step": 322760 }, { "epoch": 0.84, "learning_rate": 0.00017450004017823583, "loss": 0.0123, "step": 322770 }, { "epoch": 0.84, "learning_rate": 0.00017449615196186435, "loss": 0.0148, "step": 322780 }, { "epoch": 0.84, "learning_rate": 0.0001744922637454929, "loss": 0.0154, "step": 322790 }, { "epoch": 0.84, "learning_rate": 0.00017448837552912143, "loss": 0.02, "step": 322800 }, { "epoch": 0.84, "learning_rate": 0.00017448448731274997, "loss": 0.0128, "step": 322810 }, { "epoch": 0.84, "learning_rate": 0.0001744805990963785, "loss": 0.0153, "step": 322820 }, { "epoch": 0.84, "learning_rate": 0.00017447671088000703, "loss": 0.0132, "step": 322830 }, { "epoch": 0.84, "learning_rate": 0.00017447282266363557, "loss": 0.0171, "step": 322840 }, { "epoch": 0.84, "learning_rate": 0.0001744689344472641, "loss": 0.0138, "step": 322850 }, { "epoch": 0.84, "learning_rate": 0.00017446504623089263, "loss": 0.0185, "step": 322860 }, { "epoch": 0.84, "learning_rate": 0.00017446115801452117, "loss": 0.0149, "step": 322870 }, { "epoch": 0.84, "learning_rate": 0.00017445726979814974, "loss": 0.0169, "step": 322880 }, { "epoch": 0.84, "learning_rate": 0.00017445338158177825, "loss": 0.0187, "step": 322890 }, { "epoch": 0.84, "learning_rate": 0.00017444949336540677, "loss": 0.0146, "step": 322900 }, { "epoch": 0.84, "learning_rate": 0.0001744456051490353, "loss": 0.0148, "step": 322910 }, { "epoch": 0.84, "learning_rate": 0.00017444171693266388, "loss": 0.0144, "step": 322920 }, { "epoch": 0.84, "learning_rate": 0.0001744378287162924, "loss": 0.0133, "step": 322930 }, { "epoch": 0.84, "learning_rate": 0.00017443394049992093, "loss": 0.0114, "step": 322940 }, { "epoch": 0.84, "learning_rate": 0.00017443005228354945, "loss": 0.0131, "step": 322950 }, { "epoch": 0.84, "learning_rate": 0.00017442616406717802, "loss": 0.0155, "step": 322960 }, { "epoch": 0.84, "learning_rate": 0.00017442227585080653, "loss": 0.0125, "step": 322970 }, { "epoch": 0.84, "learning_rate": 0.00017441838763443507, "loss": 0.0104, "step": 322980 }, { "epoch": 0.84, "learning_rate": 0.00017441449941806359, "loss": 0.0131, "step": 322990 }, { "epoch": 0.84, "learning_rate": 0.00017441061120169216, "loss": 0.0112, "step": 323000 }, { "epoch": 0.84, "eval_cer": 0.881688689953826, "eval_loss": 0.009281335398554802, "eval_runtime": 107.738, "eval_samples_per_second": 18.564, "eval_steps_per_second": 4.641, "step": 323000 }, { "epoch": 0.84, "learning_rate": 0.00017440672298532067, "loss": 0.0108, "step": 323010 }, { "epoch": 0.84, "learning_rate": 0.0001744028347689492, "loss": 0.0152, "step": 323020 }, { "epoch": 0.84, "learning_rate": 0.00017439894655257773, "loss": 0.0139, "step": 323030 }, { "epoch": 0.84, "learning_rate": 0.00017439505833620627, "loss": 0.0107, "step": 323040 }, { "epoch": 0.84, "learning_rate": 0.0001743911701198348, "loss": 0.013, "step": 323050 }, { "epoch": 0.84, "learning_rate": 0.00017438728190346335, "loss": 0.0131, "step": 323060 }, { "epoch": 0.84, "learning_rate": 0.00017438339368709187, "loss": 0.0175, "step": 323070 }, { "epoch": 0.84, "learning_rate": 0.0001743795054707204, "loss": 0.0148, "step": 323080 }, { "epoch": 0.84, "learning_rate": 0.00017437561725434898, "loss": 0.0148, "step": 323090 }, { "epoch": 0.84, "learning_rate": 0.0001743717290379775, "loss": 0.0161, "step": 323100 }, { "epoch": 0.84, "learning_rate": 0.00017436784082160603, "loss": 0.0117, "step": 323110 }, { "epoch": 0.84, "learning_rate": 0.00017436395260523455, "loss": 0.0179, "step": 323120 }, { "epoch": 0.84, "learning_rate": 0.00017436006438886312, "loss": 0.0121, "step": 323130 }, { "epoch": 0.84, "learning_rate": 0.00017435617617249163, "loss": 0.0142, "step": 323140 }, { "epoch": 0.84, "learning_rate": 0.00017435228795612017, "loss": 0.0124, "step": 323150 }, { "epoch": 0.84, "learning_rate": 0.00017434839973974869, "loss": 0.017, "step": 323160 }, { "epoch": 0.84, "learning_rate": 0.00017434451152337725, "loss": 0.0124, "step": 323170 }, { "epoch": 0.84, "learning_rate": 0.00017434062330700577, "loss": 0.0122, "step": 323180 }, { "epoch": 0.84, "learning_rate": 0.0001743367350906343, "loss": 0.0147, "step": 323190 }, { "epoch": 0.84, "learning_rate": 0.00017433284687426283, "loss": 0.0142, "step": 323200 }, { "epoch": 0.84, "learning_rate": 0.0001743289586578914, "loss": 0.0125, "step": 323210 }, { "epoch": 0.84, "learning_rate": 0.0001743250704415199, "loss": 0.0248, "step": 323220 }, { "epoch": 0.84, "learning_rate": 0.00017432118222514845, "loss": 0.0136, "step": 323230 }, { "epoch": 0.84, "learning_rate": 0.00017431729400877696, "loss": 0.0155, "step": 323240 }, { "epoch": 0.84, "learning_rate": 0.00017431340579240553, "loss": 0.0127, "step": 323250 }, { "epoch": 0.84, "learning_rate": 0.00017430951757603408, "loss": 0.0136, "step": 323260 }, { "epoch": 0.84, "learning_rate": 0.0001743056293596626, "loss": 0.0149, "step": 323270 }, { "epoch": 0.84, "learning_rate": 0.00017430174114329113, "loss": 0.0153, "step": 323280 }, { "epoch": 0.84, "learning_rate": 0.00017429785292691965, "loss": 0.0137, "step": 323290 }, { "epoch": 0.84, "learning_rate": 0.00017429396471054821, "loss": 0.0155, "step": 323300 }, { "epoch": 0.84, "learning_rate": 0.00017429007649417673, "loss": 0.0127, "step": 323310 }, { "epoch": 0.84, "learning_rate": 0.00017428618827780527, "loss": 0.0141, "step": 323320 }, { "epoch": 0.84, "learning_rate": 0.00017428230006143379, "loss": 0.0111, "step": 323330 }, { "epoch": 0.84, "learning_rate": 0.00017427841184506235, "loss": 0.0144, "step": 323340 }, { "epoch": 0.84, "learning_rate": 0.00017427452362869087, "loss": 0.011, "step": 323350 }, { "epoch": 0.84, "learning_rate": 0.0001742706354123194, "loss": 0.0191, "step": 323360 }, { "epoch": 0.84, "learning_rate": 0.00017426674719594792, "loss": 0.0117, "step": 323370 }, { "epoch": 0.84, "learning_rate": 0.0001742628589795765, "loss": 0.0133, "step": 323380 }, { "epoch": 0.84, "learning_rate": 0.000174258970763205, "loss": 0.0136, "step": 323390 }, { "epoch": 0.84, "learning_rate": 0.00017425508254683355, "loss": 0.0099, "step": 323400 }, { "epoch": 0.84, "learning_rate": 0.00017425119433046206, "loss": 0.0153, "step": 323410 }, { "epoch": 0.84, "learning_rate": 0.00017424730611409063, "loss": 0.0151, "step": 323420 }, { "epoch": 0.84, "learning_rate": 0.00017424341789771917, "loss": 0.0109, "step": 323430 }, { "epoch": 0.84, "learning_rate": 0.0001742395296813477, "loss": 0.0155, "step": 323440 }, { "epoch": 0.84, "learning_rate": 0.0001742356414649762, "loss": 0.0162, "step": 323450 }, { "epoch": 0.84, "learning_rate": 0.00017423175324860477, "loss": 0.0121, "step": 323460 }, { "epoch": 0.84, "learning_rate": 0.00017422786503223331, "loss": 0.017, "step": 323470 }, { "epoch": 0.84, "learning_rate": 0.00017422397681586183, "loss": 0.0114, "step": 323480 }, { "epoch": 0.84, "learning_rate": 0.00017422008859949037, "loss": 0.012, "step": 323490 }, { "epoch": 0.84, "learning_rate": 0.0001742162003831189, "loss": 0.0138, "step": 323500 }, { "epoch": 0.84, "learning_rate": 0.00017421231216674745, "loss": 0.0147, "step": 323510 }, { "epoch": 0.84, "learning_rate": 0.00017420842395037597, "loss": 0.0158, "step": 323520 }, { "epoch": 0.84, "learning_rate": 0.0001742045357340045, "loss": 0.012, "step": 323530 }, { "epoch": 0.84, "learning_rate": 0.00017420064751763302, "loss": 0.0135, "step": 323540 }, { "epoch": 0.84, "learning_rate": 0.0001741967593012616, "loss": 0.0135, "step": 323550 }, { "epoch": 0.84, "learning_rate": 0.0001741928710848901, "loss": 0.0149, "step": 323560 }, { "epoch": 0.84, "learning_rate": 0.00017418898286851865, "loss": 0.0098, "step": 323570 }, { "epoch": 0.84, "learning_rate": 0.00017418509465214716, "loss": 0.0197, "step": 323580 }, { "epoch": 0.84, "learning_rate": 0.00017418120643577573, "loss": 0.0168, "step": 323590 }, { "epoch": 0.84, "learning_rate": 0.00017417731821940427, "loss": 0.0136, "step": 323600 }, { "epoch": 0.84, "learning_rate": 0.0001741734300030328, "loss": 0.016, "step": 323610 }, { "epoch": 0.84, "learning_rate": 0.0001741695417866613, "loss": 0.0125, "step": 323620 }, { "epoch": 0.84, "learning_rate": 0.00017416565357028987, "loss": 0.0137, "step": 323630 }, { "epoch": 0.84, "learning_rate": 0.0001741617653539184, "loss": 0.0139, "step": 323640 }, { "epoch": 0.84, "learning_rate": 0.00017415787713754693, "loss": 0.0121, "step": 323650 }, { "epoch": 0.84, "learning_rate": 0.00017415398892117547, "loss": 0.0143, "step": 323660 }, { "epoch": 0.84, "learning_rate": 0.000174150100704804, "loss": 0.0117, "step": 323670 }, { "epoch": 0.84, "learning_rate": 0.00017414621248843255, "loss": 0.0148, "step": 323680 }, { "epoch": 0.84, "learning_rate": 0.00017414232427206107, "loss": 0.0107, "step": 323690 }, { "epoch": 0.84, "learning_rate": 0.0001741384360556896, "loss": 0.0157, "step": 323700 }, { "epoch": 0.84, "learning_rate": 0.00017413454783931815, "loss": 0.014, "step": 323710 }, { "epoch": 0.84, "learning_rate": 0.0001741306596229467, "loss": 0.0163, "step": 323720 }, { "epoch": 0.84, "learning_rate": 0.0001741267714065752, "loss": 0.0177, "step": 323730 }, { "epoch": 0.84, "learning_rate": 0.00017412288319020375, "loss": 0.0145, "step": 323740 }, { "epoch": 0.84, "learning_rate": 0.00017411899497383232, "loss": 0.0175, "step": 323750 }, { "epoch": 0.84, "learning_rate": 0.00017411510675746083, "loss": 0.0151, "step": 323760 }, { "epoch": 0.84, "learning_rate": 0.00017411121854108935, "loss": 0.012, "step": 323770 }, { "epoch": 0.84, "learning_rate": 0.0001741073303247179, "loss": 0.0118, "step": 323780 }, { "epoch": 0.84, "learning_rate": 0.0001741034421083464, "loss": 0.0178, "step": 323790 }, { "epoch": 0.84, "learning_rate": 0.00017409955389197497, "loss": 0.0127, "step": 323800 }, { "epoch": 0.84, "learning_rate": 0.0001740956656756035, "loss": 0.0134, "step": 323810 }, { "epoch": 0.84, "learning_rate": 0.00017409177745923203, "loss": 0.0158, "step": 323820 }, { "epoch": 0.84, "learning_rate": 0.00017408788924286057, "loss": 0.0136, "step": 323830 }, { "epoch": 0.84, "learning_rate": 0.0001740840010264891, "loss": 0.0125, "step": 323840 }, { "epoch": 0.84, "learning_rate": 0.00017408011281011765, "loss": 0.0152, "step": 323850 }, { "epoch": 0.84, "learning_rate": 0.00017407622459374617, "loss": 0.017, "step": 323860 }, { "epoch": 0.84, "learning_rate": 0.0001740723363773747, "loss": 0.0127, "step": 323870 }, { "epoch": 0.84, "learning_rate": 0.00017406844816100325, "loss": 0.0123, "step": 323880 }, { "epoch": 0.84, "learning_rate": 0.0001740645599446318, "loss": 0.013, "step": 323890 }, { "epoch": 0.84, "learning_rate": 0.0001740606717282603, "loss": 0.0126, "step": 323900 }, { "epoch": 0.84, "learning_rate": 0.00017405678351188885, "loss": 0.0176, "step": 323910 }, { "epoch": 0.84, "learning_rate": 0.0001740528952955174, "loss": 0.0167, "step": 323920 }, { "epoch": 0.84, "learning_rate": 0.00017404900707914593, "loss": 0.0138, "step": 323930 }, { "epoch": 0.84, "learning_rate": 0.00017404511886277445, "loss": 0.0145, "step": 323940 }, { "epoch": 0.84, "learning_rate": 0.000174041230646403, "loss": 0.012, "step": 323950 }, { "epoch": 0.84, "learning_rate": 0.00017403734243003156, "loss": 0.012, "step": 323960 }, { "epoch": 0.84, "learning_rate": 0.00017403345421366007, "loss": 0.0143, "step": 323970 }, { "epoch": 0.84, "learning_rate": 0.0001740295659972886, "loss": 0.0126, "step": 323980 }, { "epoch": 0.84, "learning_rate": 0.00017402567778091713, "loss": 0.0123, "step": 323990 }, { "epoch": 0.84, "learning_rate": 0.0001740217895645457, "loss": 0.0106, "step": 324000 }, { "epoch": 0.84, "eval_cer": 0.8816970877754311, "eval_loss": 0.009332822635769844, "eval_runtime": 107.8709, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 324000 }, { "epoch": 0.84, "learning_rate": 0.0001740179013481742, "loss": 0.0139, "step": 324010 }, { "epoch": 0.84, "learning_rate": 0.00017401401313180275, "loss": 0.0142, "step": 324020 }, { "epoch": 0.84, "learning_rate": 0.00017401012491543127, "loss": 0.0136, "step": 324030 }, { "epoch": 0.84, "learning_rate": 0.0001740062366990598, "loss": 0.0186, "step": 324040 }, { "epoch": 0.84, "learning_rate": 0.00017400234848268835, "loss": 0.016, "step": 324050 }, { "epoch": 0.84, "learning_rate": 0.0001739984602663169, "loss": 0.0139, "step": 324060 }, { "epoch": 0.84, "learning_rate": 0.0001739945720499454, "loss": 0.0123, "step": 324070 }, { "epoch": 0.84, "learning_rate": 0.00017399068383357395, "loss": 0.0155, "step": 324080 }, { "epoch": 0.84, "learning_rate": 0.0001739867956172025, "loss": 0.0169, "step": 324090 }, { "epoch": 0.84, "learning_rate": 0.00017398290740083103, "loss": 0.0153, "step": 324100 }, { "epoch": 0.84, "learning_rate": 0.00017397901918445955, "loss": 0.0137, "step": 324110 }, { "epoch": 0.84, "learning_rate": 0.0001739751309680881, "loss": 0.0138, "step": 324120 }, { "epoch": 0.84, "learning_rate": 0.00017397124275171666, "loss": 0.0137, "step": 324130 }, { "epoch": 0.84, "learning_rate": 0.00017396735453534517, "loss": 0.0138, "step": 324140 }, { "epoch": 0.84, "learning_rate": 0.0001739634663189737, "loss": 0.024, "step": 324150 }, { "epoch": 0.84, "learning_rate": 0.00017395957810260223, "loss": 0.0175, "step": 324160 }, { "epoch": 0.84, "learning_rate": 0.0001739556898862308, "loss": 0.0154, "step": 324170 }, { "epoch": 0.84, "learning_rate": 0.0001739518016698593, "loss": 0.015, "step": 324180 }, { "epoch": 0.84, "learning_rate": 0.00017394791345348785, "loss": 0.0152, "step": 324190 }, { "epoch": 0.84, "learning_rate": 0.00017394402523711637, "loss": 0.0136, "step": 324200 }, { "epoch": 0.84, "learning_rate": 0.00017394013702074493, "loss": 0.0199, "step": 324210 }, { "epoch": 0.84, "learning_rate": 0.00017393624880437345, "loss": 0.0115, "step": 324220 }, { "epoch": 0.84, "learning_rate": 0.000173932360588002, "loss": 0.0119, "step": 324230 }, { "epoch": 0.84, "learning_rate": 0.0001739284723716305, "loss": 0.0162, "step": 324240 }, { "epoch": 0.84, "learning_rate": 0.00017392458415525907, "loss": 0.0118, "step": 324250 }, { "epoch": 0.84, "learning_rate": 0.0001739206959388876, "loss": 0.0137, "step": 324260 }, { "epoch": 0.84, "learning_rate": 0.00017391680772251613, "loss": 0.0122, "step": 324270 }, { "epoch": 0.84, "learning_rate": 0.00017391291950614464, "loss": 0.0193, "step": 324280 }, { "epoch": 0.84, "learning_rate": 0.00017390903128977319, "loss": 0.0135, "step": 324290 }, { "epoch": 0.84, "learning_rate": 0.00017390514307340175, "loss": 0.015, "step": 324300 }, { "epoch": 0.84, "learning_rate": 0.00017390125485703027, "loss": 0.0144, "step": 324310 }, { "epoch": 0.84, "learning_rate": 0.00017389736664065878, "loss": 0.016, "step": 324320 }, { "epoch": 0.84, "learning_rate": 0.00017389347842428733, "loss": 0.0142, "step": 324330 }, { "epoch": 0.84, "learning_rate": 0.0001738895902079159, "loss": 0.0149, "step": 324340 }, { "epoch": 0.84, "learning_rate": 0.0001738857019915444, "loss": 0.0142, "step": 324350 }, { "epoch": 0.84, "learning_rate": 0.00017388181377517295, "loss": 0.0169, "step": 324360 }, { "epoch": 0.84, "learning_rate": 0.00017387792555880146, "loss": 0.0154, "step": 324370 }, { "epoch": 0.84, "learning_rate": 0.00017387403734243003, "loss": 0.0159, "step": 324380 }, { "epoch": 0.84, "learning_rate": 0.00017387014912605855, "loss": 0.012, "step": 324390 }, { "epoch": 0.84, "learning_rate": 0.0001738662609096871, "loss": 0.0116, "step": 324400 }, { "epoch": 0.84, "learning_rate": 0.0001738623726933156, "loss": 0.0121, "step": 324410 }, { "epoch": 0.84, "learning_rate": 0.00017385848447694417, "loss": 0.0126, "step": 324420 }, { "epoch": 0.84, "learning_rate": 0.0001738545962605727, "loss": 0.0138, "step": 324430 }, { "epoch": 0.84, "learning_rate": 0.00017385070804420123, "loss": 0.0112, "step": 324440 }, { "epoch": 0.84, "learning_rate": 0.00017384681982782974, "loss": 0.0159, "step": 324450 }, { "epoch": 0.84, "learning_rate": 0.0001738429316114583, "loss": 0.0106, "step": 324460 }, { "epoch": 0.84, "learning_rate": 0.00017383904339508685, "loss": 0.0132, "step": 324470 }, { "epoch": 0.84, "learning_rate": 0.00017383515517871537, "loss": 0.0139, "step": 324480 }, { "epoch": 0.84, "learning_rate": 0.00017383126696234388, "loss": 0.0132, "step": 324490 }, { "epoch": 0.84, "learning_rate": 0.00017382737874597245, "loss": 0.0147, "step": 324500 }, { "epoch": 0.84, "learning_rate": 0.000173823490529601, "loss": 0.0164, "step": 324510 }, { "epoch": 0.84, "learning_rate": 0.0001738196023132295, "loss": 0.0212, "step": 324520 }, { "epoch": 0.84, "learning_rate": 0.00017381571409685805, "loss": 0.012, "step": 324530 }, { "epoch": 0.84, "learning_rate": 0.00017381182588048656, "loss": 0.012, "step": 324540 }, { "epoch": 0.84, "learning_rate": 0.00017380793766411513, "loss": 0.0154, "step": 324550 }, { "epoch": 0.84, "learning_rate": 0.00017380404944774365, "loss": 0.0155, "step": 324560 }, { "epoch": 0.84, "learning_rate": 0.0001738001612313722, "loss": 0.014, "step": 324570 }, { "epoch": 0.84, "learning_rate": 0.0001737962730150007, "loss": 0.0163, "step": 324580 }, { "epoch": 0.84, "learning_rate": 0.00017379238479862927, "loss": 0.0153, "step": 324590 }, { "epoch": 0.84, "learning_rate": 0.0001737884965822578, "loss": 0.0173, "step": 324600 }, { "epoch": 0.84, "learning_rate": 0.00017378460836588633, "loss": 0.0149, "step": 324610 }, { "epoch": 0.84, "learning_rate": 0.00017378072014951484, "loss": 0.0135, "step": 324620 }, { "epoch": 0.84, "learning_rate": 0.0001737768319331434, "loss": 0.0151, "step": 324630 }, { "epoch": 0.84, "learning_rate": 0.00017377294371677193, "loss": 0.0136, "step": 324640 }, { "epoch": 0.84, "learning_rate": 0.00017376905550040047, "loss": 0.0132, "step": 324650 }, { "epoch": 0.84, "learning_rate": 0.00017376516728402898, "loss": 0.0134, "step": 324660 }, { "epoch": 0.84, "learning_rate": 0.00017376127906765755, "loss": 0.0158, "step": 324670 }, { "epoch": 0.84, "learning_rate": 0.0001737573908512861, "loss": 0.0165, "step": 324680 }, { "epoch": 0.84, "learning_rate": 0.0001737535026349146, "loss": 0.0124, "step": 324690 }, { "epoch": 0.84, "learning_rate": 0.00017374961441854315, "loss": 0.0153, "step": 324700 }, { "epoch": 0.84, "learning_rate": 0.0001737457262021717, "loss": 0.0127, "step": 324710 }, { "epoch": 0.84, "learning_rate": 0.00017374183798580023, "loss": 0.0131, "step": 324720 }, { "epoch": 0.84, "learning_rate": 0.00017373794976942875, "loss": 0.0122, "step": 324730 }, { "epoch": 0.84, "learning_rate": 0.0001737340615530573, "loss": 0.0122, "step": 324740 }, { "epoch": 0.84, "learning_rate": 0.00017373017333668583, "loss": 0.0119, "step": 324750 }, { "epoch": 0.84, "learning_rate": 0.00017372628512031437, "loss": 0.0162, "step": 324760 }, { "epoch": 0.84, "learning_rate": 0.0001737223969039429, "loss": 0.0172, "step": 324770 }, { "epoch": 0.84, "learning_rate": 0.00017371850868757143, "loss": 0.0125, "step": 324780 }, { "epoch": 0.84, "learning_rate": 0.00017371462047119994, "loss": 0.0112, "step": 324790 }, { "epoch": 0.84, "learning_rate": 0.0001737107322548285, "loss": 0.0153, "step": 324800 }, { "epoch": 0.84, "learning_rate": 0.00017370684403845703, "loss": 0.0123, "step": 324810 }, { "epoch": 0.84, "learning_rate": 0.00017370295582208557, "loss": 0.0131, "step": 324820 }, { "epoch": 0.84, "learning_rate": 0.00017369906760571408, "loss": 0.0126, "step": 324830 }, { "epoch": 0.84, "learning_rate": 0.00017369517938934265, "loss": 0.0129, "step": 324840 }, { "epoch": 0.84, "learning_rate": 0.0001736912911729712, "loss": 0.0111, "step": 324850 }, { "epoch": 0.84, "learning_rate": 0.0001736874029565997, "loss": 0.0116, "step": 324860 }, { "epoch": 0.84, "learning_rate": 0.00017368351474022825, "loss": 0.0139, "step": 324870 }, { "epoch": 0.84, "learning_rate": 0.0001736796265238568, "loss": 0.0158, "step": 324880 }, { "epoch": 0.84, "learning_rate": 0.00017367573830748533, "loss": 0.0141, "step": 324890 }, { "epoch": 0.84, "learning_rate": 0.00017367185009111385, "loss": 0.0137, "step": 324900 }, { "epoch": 0.84, "learning_rate": 0.0001736679618747424, "loss": 0.0133, "step": 324910 }, { "epoch": 0.84, "learning_rate": 0.00017366407365837093, "loss": 0.0132, "step": 324920 }, { "epoch": 0.84, "learning_rate": 0.00017366018544199947, "loss": 0.0145, "step": 324930 }, { "epoch": 0.84, "learning_rate": 0.00017365629722562799, "loss": 0.012, "step": 324940 }, { "epoch": 0.84, "learning_rate": 0.00017365240900925653, "loss": 0.0119, "step": 324950 }, { "epoch": 0.84, "learning_rate": 0.00017364852079288507, "loss": 0.0148, "step": 324960 }, { "epoch": 0.84, "learning_rate": 0.0001736446325765136, "loss": 0.0167, "step": 324970 }, { "epoch": 0.84, "learning_rate": 0.00017364074436014213, "loss": 0.0147, "step": 324980 }, { "epoch": 0.84, "learning_rate": 0.00017363685614377067, "loss": 0.0174, "step": 324990 }, { "epoch": 0.84, "learning_rate": 0.00017363296792739924, "loss": 0.011, "step": 325000 }, { "epoch": 0.84, "eval_cer": 0.8817362776095881, "eval_loss": 0.009082542732357979, "eval_runtime": 107.6825, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 325000 }, { "epoch": 0.84, "learning_rate": 0.00017362907971102775, "loss": 0.0131, "step": 325010 }, { "epoch": 0.84, "learning_rate": 0.0001736251914946563, "loss": 0.0125, "step": 325020 }, { "epoch": 0.84, "learning_rate": 0.0001736213032782848, "loss": 0.0129, "step": 325030 }, { "epoch": 0.84, "learning_rate": 0.00017361741506191332, "loss": 0.0109, "step": 325040 }, { "epoch": 0.84, "learning_rate": 0.0001736135268455419, "loss": 0.0112, "step": 325050 }, { "epoch": 0.84, "learning_rate": 0.00017360963862917043, "loss": 0.0129, "step": 325060 }, { "epoch": 0.84, "learning_rate": 0.00017360575041279895, "loss": 0.0146, "step": 325070 }, { "epoch": 0.84, "learning_rate": 0.0001736018621964275, "loss": 0.0128, "step": 325080 }, { "epoch": 0.84, "learning_rate": 0.00017359797398005603, "loss": 0.0146, "step": 325090 }, { "epoch": 0.84, "learning_rate": 0.00017359408576368457, "loss": 0.0161, "step": 325100 }, { "epoch": 0.84, "learning_rate": 0.00017359019754731309, "loss": 0.0147, "step": 325110 }, { "epoch": 0.84, "learning_rate": 0.00017358630933094163, "loss": 0.0126, "step": 325120 }, { "epoch": 0.84, "learning_rate": 0.00017358242111457017, "loss": 0.0136, "step": 325130 }, { "epoch": 0.84, "learning_rate": 0.0001735785328981987, "loss": 0.0147, "step": 325140 }, { "epoch": 0.84, "learning_rate": 0.00017357464468182722, "loss": 0.0122, "step": 325150 }, { "epoch": 0.84, "learning_rate": 0.00017357075646545577, "loss": 0.0103, "step": 325160 }, { "epoch": 0.84, "learning_rate": 0.00017356686824908434, "loss": 0.0122, "step": 325170 }, { "epoch": 0.84, "learning_rate": 0.00017356298003271285, "loss": 0.0138, "step": 325180 }, { "epoch": 0.84, "learning_rate": 0.0001735590918163414, "loss": 0.0163, "step": 325190 }, { "epoch": 0.84, "learning_rate": 0.0001735552035999699, "loss": 0.0128, "step": 325200 }, { "epoch": 0.84, "learning_rate": 0.00017355131538359847, "loss": 0.0135, "step": 325210 }, { "epoch": 0.84, "learning_rate": 0.000173547427167227, "loss": 0.0137, "step": 325220 }, { "epoch": 0.84, "learning_rate": 0.00017354353895085553, "loss": 0.0132, "step": 325230 }, { "epoch": 0.84, "learning_rate": 0.00017353965073448405, "loss": 0.0106, "step": 325240 }, { "epoch": 0.84, "learning_rate": 0.00017353576251811261, "loss": 0.013, "step": 325250 }, { "epoch": 0.84, "learning_rate": 0.00017353187430174113, "loss": 0.0167, "step": 325260 }, { "epoch": 0.84, "learning_rate": 0.00017352798608536967, "loss": 0.0109, "step": 325270 }, { "epoch": 0.84, "learning_rate": 0.00017352409786899818, "loss": 0.0143, "step": 325280 }, { "epoch": 0.84, "learning_rate": 0.00017352020965262673, "loss": 0.0113, "step": 325290 }, { "epoch": 0.84, "learning_rate": 0.00017351632143625527, "loss": 0.0185, "step": 325300 }, { "epoch": 0.84, "learning_rate": 0.0001735124332198838, "loss": 0.0126, "step": 325310 }, { "epoch": 0.84, "learning_rate": 0.00017350854500351232, "loss": 0.0144, "step": 325320 }, { "epoch": 0.84, "learning_rate": 0.00017350465678714087, "loss": 0.0136, "step": 325330 }, { "epoch": 0.84, "learning_rate": 0.00017350076857076943, "loss": 0.0138, "step": 325340 }, { "epoch": 0.84, "learning_rate": 0.00017349688035439795, "loss": 0.0147, "step": 325350 }, { "epoch": 0.84, "learning_rate": 0.00017349299213802646, "loss": 0.0146, "step": 325360 }, { "epoch": 0.84, "learning_rate": 0.000173489103921655, "loss": 0.0116, "step": 325370 }, { "epoch": 0.84, "learning_rate": 0.00017348521570528357, "loss": 0.015, "step": 325380 }, { "epoch": 0.84, "learning_rate": 0.0001734813274889121, "loss": 0.0153, "step": 325390 }, { "epoch": 0.84, "learning_rate": 0.00017347743927254063, "loss": 0.0116, "step": 325400 }, { "epoch": 0.84, "learning_rate": 0.00017347355105616914, "loss": 0.0119, "step": 325410 }, { "epoch": 0.84, "learning_rate": 0.0001734696628397977, "loss": 0.0135, "step": 325420 }, { "epoch": 0.84, "learning_rate": 0.00017346577462342623, "loss": 0.0143, "step": 325430 }, { "epoch": 0.84, "learning_rate": 0.00017346188640705477, "loss": 0.0158, "step": 325440 }, { "epoch": 0.84, "learning_rate": 0.00017345799819068328, "loss": 0.0107, "step": 325450 }, { "epoch": 0.84, "learning_rate": 0.00017345410997431185, "loss": 0.0127, "step": 325460 }, { "epoch": 0.84, "learning_rate": 0.00017345022175794037, "loss": 0.0125, "step": 325470 }, { "epoch": 0.84, "learning_rate": 0.0001734463335415689, "loss": 0.0132, "step": 325480 }, { "epoch": 0.84, "learning_rate": 0.00017344244532519742, "loss": 0.0108, "step": 325490 }, { "epoch": 0.84, "learning_rate": 0.000173438557108826, "loss": 0.0166, "step": 325500 }, { "epoch": 0.84, "learning_rate": 0.0001734346688924545, "loss": 0.012, "step": 325510 }, { "epoch": 0.84, "learning_rate": 0.00017343078067608305, "loss": 0.012, "step": 325520 }, { "epoch": 0.84, "learning_rate": 0.00017342689245971156, "loss": 0.0189, "step": 325530 }, { "epoch": 0.84, "learning_rate": 0.0001734230042433401, "loss": 0.0139, "step": 325540 }, { "epoch": 0.84, "learning_rate": 0.00017341911602696867, "loss": 0.0157, "step": 325550 }, { "epoch": 0.84, "learning_rate": 0.0001734152278105972, "loss": 0.0164, "step": 325560 }, { "epoch": 0.84, "learning_rate": 0.00017341133959422573, "loss": 0.0141, "step": 325570 }, { "epoch": 0.84, "learning_rate": 0.00017340745137785424, "loss": 0.0189, "step": 325580 }, { "epoch": 0.84, "learning_rate": 0.0001734035631614828, "loss": 0.0135, "step": 325590 }, { "epoch": 0.84, "learning_rate": 0.00017339967494511133, "loss": 0.0135, "step": 325600 }, { "epoch": 0.84, "learning_rate": 0.00017339578672873987, "loss": 0.0127, "step": 325610 }, { "epoch": 0.84, "learning_rate": 0.00017339189851236838, "loss": 0.0144, "step": 325620 }, { "epoch": 0.84, "learning_rate": 0.00017338801029599695, "loss": 0.0152, "step": 325630 }, { "epoch": 0.84, "learning_rate": 0.00017338412207962547, "loss": 0.0132, "step": 325640 }, { "epoch": 0.84, "learning_rate": 0.000173380233863254, "loss": 0.0124, "step": 325650 }, { "epoch": 0.84, "learning_rate": 0.00017337634564688252, "loss": 0.0134, "step": 325660 }, { "epoch": 0.84, "learning_rate": 0.0001733724574305111, "loss": 0.0105, "step": 325670 }, { "epoch": 0.84, "learning_rate": 0.0001733685692141396, "loss": 0.0144, "step": 325680 }, { "epoch": 0.84, "learning_rate": 0.00017336468099776815, "loss": 0.0121, "step": 325690 }, { "epoch": 0.84, "learning_rate": 0.00017336079278139666, "loss": 0.0144, "step": 325700 }, { "epoch": 0.84, "learning_rate": 0.00017335690456502523, "loss": 0.0139, "step": 325710 }, { "epoch": 0.84, "learning_rate": 0.00017335301634865377, "loss": 0.0112, "step": 325720 }, { "epoch": 0.84, "learning_rate": 0.0001733491281322823, "loss": 0.0128, "step": 325730 }, { "epoch": 0.84, "learning_rate": 0.00017334523991591083, "loss": 0.0137, "step": 325740 }, { "epoch": 0.84, "learning_rate": 0.00017334135169953937, "loss": 0.013, "step": 325750 }, { "epoch": 0.84, "learning_rate": 0.0001733374634831679, "loss": 0.0137, "step": 325760 }, { "epoch": 0.84, "learning_rate": 0.00017333357526679643, "loss": 0.0154, "step": 325770 }, { "epoch": 0.84, "learning_rate": 0.00017332968705042497, "loss": 0.0176, "step": 325780 }, { "epoch": 0.84, "learning_rate": 0.00017332579883405348, "loss": 0.0152, "step": 325790 }, { "epoch": 0.84, "learning_rate": 0.00017332191061768205, "loss": 0.011, "step": 325800 }, { "epoch": 0.84, "learning_rate": 0.00017331802240131057, "loss": 0.0107, "step": 325810 }, { "epoch": 0.84, "learning_rate": 0.0001733141341849391, "loss": 0.0131, "step": 325820 }, { "epoch": 0.84, "learning_rate": 0.00017331024596856762, "loss": 0.0123, "step": 325830 }, { "epoch": 0.84, "learning_rate": 0.0001733063577521962, "loss": 0.0123, "step": 325840 }, { "epoch": 0.84, "learning_rate": 0.0001733024695358247, "loss": 0.0185, "step": 325850 }, { "epoch": 0.84, "learning_rate": 0.00017329858131945325, "loss": 0.0146, "step": 325860 }, { "epoch": 0.84, "learning_rate": 0.00017329469310308176, "loss": 0.0094, "step": 325870 }, { "epoch": 0.84, "learning_rate": 0.00017329080488671033, "loss": 0.0111, "step": 325880 }, { "epoch": 0.84, "learning_rate": 0.00017328691667033887, "loss": 0.0133, "step": 325890 }, { "epoch": 0.84, "learning_rate": 0.0001732830284539674, "loss": 0.0155, "step": 325900 }, { "epoch": 0.84, "learning_rate": 0.0001732791402375959, "loss": 0.0174, "step": 325910 }, { "epoch": 0.84, "learning_rate": 0.00017327525202122447, "loss": 0.0104, "step": 325920 }, { "epoch": 0.84, "learning_rate": 0.000173271363804853, "loss": 0.0121, "step": 325930 }, { "epoch": 0.84, "learning_rate": 0.00017326747558848153, "loss": 0.0103, "step": 325940 }, { "epoch": 0.84, "learning_rate": 0.00017326358737211007, "loss": 0.0096, "step": 325950 }, { "epoch": 0.84, "learning_rate": 0.0001732596991557386, "loss": 0.0149, "step": 325960 }, { "epoch": 0.84, "learning_rate": 0.00017325581093936715, "loss": 0.0124, "step": 325970 }, { "epoch": 0.84, "learning_rate": 0.00017325192272299567, "loss": 0.0149, "step": 325980 }, { "epoch": 0.85, "learning_rate": 0.0001732480345066242, "loss": 0.0139, "step": 325990 }, { "epoch": 0.85, "learning_rate": 0.00017324414629025275, "loss": 0.0144, "step": 326000 }, { "epoch": 0.85, "eval_cer": 0.8817180823294437, "eval_loss": 0.008809900842607021, "eval_runtime": 107.5599, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 326000 }, { "epoch": 0.85, "learning_rate": 0.0001732402580738813, "loss": 0.0124, "step": 326010 }, { "epoch": 0.85, "learning_rate": 0.0001732363698575098, "loss": 0.013, "step": 326020 }, { "epoch": 0.85, "learning_rate": 0.00017323248164113835, "loss": 0.0132, "step": 326030 }, { "epoch": 0.85, "learning_rate": 0.00017322859342476686, "loss": 0.0117, "step": 326040 }, { "epoch": 0.85, "learning_rate": 0.00017322470520839543, "loss": 0.0145, "step": 326050 }, { "epoch": 0.85, "learning_rate": 0.00017322081699202397, "loss": 0.0137, "step": 326060 }, { "epoch": 0.85, "learning_rate": 0.00017321692877565249, "loss": 0.0132, "step": 326070 }, { "epoch": 0.85, "learning_rate": 0.000173213040559281, "loss": 0.0152, "step": 326080 }, { "epoch": 0.85, "learning_rate": 0.00017320915234290957, "loss": 0.0176, "step": 326090 }, { "epoch": 0.85, "learning_rate": 0.0001732052641265381, "loss": 0.0135, "step": 326100 }, { "epoch": 0.85, "learning_rate": 0.00017320137591016663, "loss": 0.0144, "step": 326110 }, { "epoch": 0.85, "learning_rate": 0.00017319748769379517, "loss": 0.0169, "step": 326120 }, { "epoch": 0.85, "learning_rate": 0.0001731935994774237, "loss": 0.0103, "step": 326130 }, { "epoch": 0.85, "learning_rate": 0.00017318971126105225, "loss": 0.0097, "step": 326140 }, { "epoch": 0.85, "learning_rate": 0.00017318582304468077, "loss": 0.0134, "step": 326150 }, { "epoch": 0.85, "learning_rate": 0.0001731819348283093, "loss": 0.0115, "step": 326160 }, { "epoch": 0.85, "learning_rate": 0.00017317804661193785, "loss": 0.0163, "step": 326170 }, { "epoch": 0.85, "learning_rate": 0.0001731741583955664, "loss": 0.0173, "step": 326180 }, { "epoch": 0.85, "learning_rate": 0.0001731702701791949, "loss": 0.0125, "step": 326190 }, { "epoch": 0.85, "learning_rate": 0.00017316638196282345, "loss": 0.0127, "step": 326200 }, { "epoch": 0.85, "learning_rate": 0.00017316249374645202, "loss": 0.0123, "step": 326210 }, { "epoch": 0.85, "learning_rate": 0.00017315860553008053, "loss": 0.0154, "step": 326220 }, { "epoch": 0.85, "learning_rate": 0.00017315471731370904, "loss": 0.0119, "step": 326230 }, { "epoch": 0.85, "learning_rate": 0.00017315082909733759, "loss": 0.0107, "step": 326240 }, { "epoch": 0.85, "learning_rate": 0.00017314694088096615, "loss": 0.0122, "step": 326250 }, { "epoch": 0.85, "learning_rate": 0.00017314305266459467, "loss": 0.0174, "step": 326260 }, { "epoch": 0.85, "learning_rate": 0.0001731391644482232, "loss": 0.0159, "step": 326270 }, { "epoch": 0.85, "learning_rate": 0.00017313527623185173, "loss": 0.012, "step": 326280 }, { "epoch": 0.85, "learning_rate": 0.00017313138801548027, "loss": 0.0142, "step": 326290 }, { "epoch": 0.85, "learning_rate": 0.0001731274997991088, "loss": 0.018, "step": 326300 }, { "epoch": 0.85, "learning_rate": 0.00017312361158273735, "loss": 0.0135, "step": 326310 }, { "epoch": 0.85, "learning_rate": 0.00017311972336636586, "loss": 0.0134, "step": 326320 }, { "epoch": 0.85, "learning_rate": 0.0001731158351499944, "loss": 0.0156, "step": 326330 }, { "epoch": 0.85, "learning_rate": 0.00017311194693362295, "loss": 0.012, "step": 326340 }, { "epoch": 0.85, "learning_rate": 0.0001731080587172515, "loss": 0.0164, "step": 326350 }, { "epoch": 0.85, "learning_rate": 0.00017310417050088, "loss": 0.0152, "step": 326360 }, { "epoch": 0.85, "learning_rate": 0.00017310028228450855, "loss": 0.0173, "step": 326370 }, { "epoch": 0.85, "learning_rate": 0.0001730963940681371, "loss": 0.0126, "step": 326380 }, { "epoch": 0.85, "learning_rate": 0.00017309250585176563, "loss": 0.0111, "step": 326390 }, { "epoch": 0.85, "learning_rate": 0.00017308861763539414, "loss": 0.016, "step": 326400 }, { "epoch": 0.85, "learning_rate": 0.00017308472941902269, "loss": 0.0137, "step": 326410 }, { "epoch": 0.85, "learning_rate": 0.00017308084120265125, "loss": 0.0141, "step": 326420 }, { "epoch": 0.85, "learning_rate": 0.00017307695298627977, "loss": 0.0136, "step": 326430 }, { "epoch": 0.85, "learning_rate": 0.0001730730647699083, "loss": 0.0127, "step": 326440 }, { "epoch": 0.85, "learning_rate": 0.00017306917655353682, "loss": 0.0123, "step": 326450 }, { "epoch": 0.85, "learning_rate": 0.0001730652883371654, "loss": 0.0133, "step": 326460 }, { "epoch": 0.85, "learning_rate": 0.0001730614001207939, "loss": 0.0158, "step": 326470 }, { "epoch": 0.85, "learning_rate": 0.00017305751190442245, "loss": 0.0134, "step": 326480 }, { "epoch": 0.85, "learning_rate": 0.00017305362368805096, "loss": 0.0128, "step": 326490 }, { "epoch": 0.85, "learning_rate": 0.00017304973547167953, "loss": 0.0147, "step": 326500 }, { "epoch": 0.85, "learning_rate": 0.00017304584725530805, "loss": 0.0161, "step": 326510 }, { "epoch": 0.85, "learning_rate": 0.0001730419590389366, "loss": 0.0126, "step": 326520 }, { "epoch": 0.85, "learning_rate": 0.0001730380708225651, "loss": 0.013, "step": 326530 }, { "epoch": 0.85, "learning_rate": 0.00017303418260619365, "loss": 0.017, "step": 326540 }, { "epoch": 0.85, "learning_rate": 0.0001730302943898222, "loss": 0.0116, "step": 326550 }, { "epoch": 0.85, "learning_rate": 0.00017302640617345073, "loss": 0.0158, "step": 326560 }, { "epoch": 0.85, "learning_rate": 0.00017302251795707924, "loss": 0.0151, "step": 326570 }, { "epoch": 0.85, "learning_rate": 0.00017301862974070778, "loss": 0.0255, "step": 326580 }, { "epoch": 0.85, "learning_rate": 0.00017301474152433635, "loss": 0.0153, "step": 326590 }, { "epoch": 0.85, "learning_rate": 0.00017301085330796487, "loss": 0.0241, "step": 326600 }, { "epoch": 0.85, "learning_rate": 0.0001730069650915934, "loss": 0.0177, "step": 326610 }, { "epoch": 0.85, "learning_rate": 0.00017300307687522192, "loss": 0.0149, "step": 326620 }, { "epoch": 0.85, "learning_rate": 0.0001729991886588505, "loss": 0.0123, "step": 326630 }, { "epoch": 0.85, "learning_rate": 0.000172995300442479, "loss": 0.0143, "step": 326640 }, { "epoch": 0.85, "learning_rate": 0.00017299141222610755, "loss": 0.0112, "step": 326650 }, { "epoch": 0.85, "learning_rate": 0.00017298752400973606, "loss": 0.0106, "step": 326660 }, { "epoch": 0.85, "learning_rate": 0.00017298363579336463, "loss": 0.0153, "step": 326670 }, { "epoch": 0.85, "learning_rate": 0.00017297974757699315, "loss": 0.0154, "step": 326680 }, { "epoch": 0.85, "learning_rate": 0.0001729758593606217, "loss": 0.013, "step": 326690 }, { "epoch": 0.85, "learning_rate": 0.0001729719711442502, "loss": 0.0172, "step": 326700 }, { "epoch": 0.85, "learning_rate": 0.00017296808292787877, "loss": 0.0094, "step": 326710 }, { "epoch": 0.85, "learning_rate": 0.00017296419471150729, "loss": 0.0126, "step": 326720 }, { "epoch": 0.85, "learning_rate": 0.00017296030649513583, "loss": 0.0175, "step": 326730 }, { "epoch": 0.85, "learning_rate": 0.00017295641827876434, "loss": 0.0164, "step": 326740 }, { "epoch": 0.85, "learning_rate": 0.0001729525300623929, "loss": 0.0105, "step": 326750 }, { "epoch": 0.85, "learning_rate": 0.00017294864184602145, "loss": 0.0177, "step": 326760 }, { "epoch": 0.85, "learning_rate": 0.00017294475362964997, "loss": 0.0155, "step": 326770 }, { "epoch": 0.85, "learning_rate": 0.0001729408654132785, "loss": 0.0135, "step": 326780 }, { "epoch": 0.85, "learning_rate": 0.00017293697719690702, "loss": 0.0146, "step": 326790 }, { "epoch": 0.85, "learning_rate": 0.0001729330889805356, "loss": 0.0142, "step": 326800 }, { "epoch": 0.85, "learning_rate": 0.0001729292007641641, "loss": 0.0153, "step": 326810 }, { "epoch": 0.85, "learning_rate": 0.00017292531254779265, "loss": 0.0134, "step": 326820 }, { "epoch": 0.85, "learning_rate": 0.00017292142433142116, "loss": 0.0146, "step": 326830 }, { "epoch": 0.85, "learning_rate": 0.00017291753611504973, "loss": 0.011, "step": 326840 }, { "epoch": 0.85, "learning_rate": 0.00017291364789867825, "loss": 0.0136, "step": 326850 }, { "epoch": 0.85, "learning_rate": 0.0001729097596823068, "loss": 0.0146, "step": 326860 }, { "epoch": 0.85, "learning_rate": 0.0001729058714659353, "loss": 0.0143, "step": 326870 }, { "epoch": 0.85, "learning_rate": 0.00017290198324956387, "loss": 0.013, "step": 326880 }, { "epoch": 0.85, "learning_rate": 0.00017289809503319239, "loss": 0.0153, "step": 326890 }, { "epoch": 0.85, "learning_rate": 0.00017289420681682093, "loss": 0.012, "step": 326900 }, { "epoch": 0.85, "learning_rate": 0.00017289031860044944, "loss": 0.0105, "step": 326910 }, { "epoch": 0.85, "learning_rate": 0.000172886430384078, "loss": 0.0152, "step": 326920 }, { "epoch": 0.85, "learning_rate": 0.00017288254216770655, "loss": 0.0158, "step": 326930 }, { "epoch": 0.85, "learning_rate": 0.00017287865395133507, "loss": 0.0092, "step": 326940 }, { "epoch": 0.85, "learning_rate": 0.00017287476573496358, "loss": 0.015, "step": 326950 }, { "epoch": 0.85, "learning_rate": 0.00017287087751859215, "loss": 0.0156, "step": 326960 }, { "epoch": 0.85, "learning_rate": 0.0001728669893022207, "loss": 0.0132, "step": 326970 }, { "epoch": 0.85, "learning_rate": 0.0001728631010858492, "loss": 0.01, "step": 326980 }, { "epoch": 0.85, "learning_rate": 0.00017285921286947775, "loss": 0.0143, "step": 326990 }, { "epoch": 0.85, "learning_rate": 0.0001728553246531063, "loss": 0.0128, "step": 327000 }, { "epoch": 0.85, "eval_cer": 0.8817334783357197, "eval_loss": 0.009260199032723904, "eval_runtime": 107.8033, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 327000 }, { "epoch": 0.85, "learning_rate": 0.00017285143643673483, "loss": 0.0156, "step": 327010 }, { "epoch": 0.85, "learning_rate": 0.00017284754822036335, "loss": 0.0143, "step": 327020 }, { "epoch": 0.85, "learning_rate": 0.0001728436600039919, "loss": 0.0125, "step": 327030 }, { "epoch": 0.85, "learning_rate": 0.0001728397717876204, "loss": 0.013, "step": 327040 }, { "epoch": 0.85, "learning_rate": 0.00017283588357124897, "loss": 0.0144, "step": 327050 }, { "epoch": 0.85, "learning_rate": 0.00017283199535487749, "loss": 0.0126, "step": 327060 }, { "epoch": 0.85, "learning_rate": 0.00017282810713850603, "loss": 0.012, "step": 327070 }, { "epoch": 0.85, "learning_rate": 0.00017282421892213454, "loss": 0.0119, "step": 327080 }, { "epoch": 0.85, "learning_rate": 0.0001728203307057631, "loss": 0.0119, "step": 327090 }, { "epoch": 0.85, "learning_rate": 0.00017281644248939162, "loss": 0.0142, "step": 327100 }, { "epoch": 0.85, "learning_rate": 0.00017281255427302017, "loss": 0.014, "step": 327110 }, { "epoch": 0.85, "learning_rate": 0.00017280866605664868, "loss": 0.0134, "step": 327120 }, { "epoch": 0.85, "learning_rate": 0.00017280477784027725, "loss": 0.0143, "step": 327130 }, { "epoch": 0.85, "learning_rate": 0.0001728008896239058, "loss": 0.0145, "step": 327140 }, { "epoch": 0.85, "learning_rate": 0.0001727970014075343, "loss": 0.0165, "step": 327150 }, { "epoch": 0.85, "learning_rate": 0.00017279311319116285, "loss": 0.0146, "step": 327160 }, { "epoch": 0.85, "learning_rate": 0.0001727892249747914, "loss": 0.0154, "step": 327170 }, { "epoch": 0.85, "learning_rate": 0.00017278533675841993, "loss": 0.0145, "step": 327180 }, { "epoch": 0.85, "learning_rate": 0.00017278144854204844, "loss": 0.012, "step": 327190 }, { "epoch": 0.85, "learning_rate": 0.000172777560325677, "loss": 0.0127, "step": 327200 }, { "epoch": 0.85, "learning_rate": 0.00017277367210930553, "loss": 0.0164, "step": 327210 }, { "epoch": 0.85, "learning_rate": 0.00017276978389293407, "loss": 0.0122, "step": 327220 }, { "epoch": 0.85, "learning_rate": 0.00017276589567656258, "loss": 0.0095, "step": 327230 }, { "epoch": 0.85, "learning_rate": 0.00017276200746019113, "loss": 0.0136, "step": 327240 }, { "epoch": 0.85, "learning_rate": 0.0001727581192438197, "loss": 0.0163, "step": 327250 }, { "epoch": 0.85, "learning_rate": 0.0001727542310274482, "loss": 0.0161, "step": 327260 }, { "epoch": 0.85, "learning_rate": 0.00017275034281107672, "loss": 0.0143, "step": 327270 }, { "epoch": 0.85, "learning_rate": 0.00017274645459470527, "loss": 0.0131, "step": 327280 }, { "epoch": 0.85, "learning_rate": 0.00017274256637833378, "loss": 0.0152, "step": 327290 }, { "epoch": 0.85, "learning_rate": 0.00017273867816196235, "loss": 0.0116, "step": 327300 }, { "epoch": 0.85, "learning_rate": 0.0001727347899455909, "loss": 0.0112, "step": 327310 }, { "epoch": 0.85, "learning_rate": 0.0001727309017292194, "loss": 0.0134, "step": 327320 }, { "epoch": 0.85, "learning_rate": 0.00017272701351284795, "loss": 0.0095, "step": 327330 }, { "epoch": 0.85, "learning_rate": 0.0001727231252964765, "loss": 0.0125, "step": 327340 }, { "epoch": 0.85, "learning_rate": 0.00017271923708010503, "loss": 0.0136, "step": 327350 }, { "epoch": 0.85, "learning_rate": 0.00017271534886373354, "loss": 0.0156, "step": 327360 }, { "epoch": 0.85, "learning_rate": 0.00017271146064736209, "loss": 0.0133, "step": 327370 }, { "epoch": 0.85, "learning_rate": 0.00017270757243099063, "loss": 0.0124, "step": 327380 }, { "epoch": 0.85, "learning_rate": 0.00017270368421461917, "loss": 0.0127, "step": 327390 }, { "epoch": 0.85, "learning_rate": 0.00017269979599824768, "loss": 0.0136, "step": 327400 }, { "epoch": 0.85, "learning_rate": 0.00017269590778187623, "loss": 0.0113, "step": 327410 }, { "epoch": 0.85, "learning_rate": 0.00017269201956550477, "loss": 0.0122, "step": 327420 }, { "epoch": 0.85, "learning_rate": 0.0001726881313491333, "loss": 0.021, "step": 327430 }, { "epoch": 0.85, "learning_rate": 0.00017268424313276182, "loss": 0.013, "step": 327440 }, { "epoch": 0.85, "learning_rate": 0.00017268035491639036, "loss": 0.0138, "step": 327450 }, { "epoch": 0.85, "learning_rate": 0.00017267646670001893, "loss": 0.0163, "step": 327460 }, { "epoch": 0.85, "learning_rate": 0.00017267257848364745, "loss": 0.0135, "step": 327470 }, { "epoch": 0.85, "learning_rate": 0.000172668690267276, "loss": 0.0129, "step": 327480 }, { "epoch": 0.85, "learning_rate": 0.0001726648020509045, "loss": 0.0132, "step": 327490 }, { "epoch": 0.85, "learning_rate": 0.00017266091383453307, "loss": 0.0116, "step": 327500 }, { "epoch": 0.85, "learning_rate": 0.0001726570256181616, "loss": 0.0148, "step": 327510 }, { "epoch": 0.85, "learning_rate": 0.00017265313740179013, "loss": 0.0173, "step": 327520 }, { "epoch": 0.85, "learning_rate": 0.00017264924918541864, "loss": 0.015, "step": 327530 }, { "epoch": 0.85, "learning_rate": 0.00017264536096904719, "loss": 0.014, "step": 327540 }, { "epoch": 0.85, "learning_rate": 0.00017264147275267573, "loss": 0.0128, "step": 327550 }, { "epoch": 0.85, "learning_rate": 0.00017263758453630427, "loss": 0.0129, "step": 327560 }, { "epoch": 0.85, "learning_rate": 0.00017263369631993278, "loss": 0.0136, "step": 327570 }, { "epoch": 0.85, "learning_rate": 0.00017262980810356132, "loss": 0.011, "step": 327580 }, { "epoch": 0.85, "learning_rate": 0.00017262591988718987, "loss": 0.0154, "step": 327590 }, { "epoch": 0.85, "learning_rate": 0.0001726220316708184, "loss": 0.0112, "step": 327600 }, { "epoch": 0.85, "learning_rate": 0.00017261814345444692, "loss": 0.0116, "step": 327610 }, { "epoch": 0.85, "learning_rate": 0.00017261425523807546, "loss": 0.0167, "step": 327620 }, { "epoch": 0.85, "learning_rate": 0.00017261036702170403, "loss": 0.0145, "step": 327630 }, { "epoch": 0.85, "learning_rate": 0.00017260647880533255, "loss": 0.0113, "step": 327640 }, { "epoch": 0.85, "learning_rate": 0.0001726025905889611, "loss": 0.0141, "step": 327650 }, { "epoch": 0.85, "learning_rate": 0.0001725987023725896, "loss": 0.0116, "step": 327660 }, { "epoch": 0.85, "learning_rate": 0.00017259481415621817, "loss": 0.0152, "step": 327670 }, { "epoch": 0.85, "learning_rate": 0.0001725909259398467, "loss": 0.0147, "step": 327680 }, { "epoch": 0.85, "learning_rate": 0.00017258703772347523, "loss": 0.0197, "step": 327690 }, { "epoch": 0.85, "learning_rate": 0.00017258314950710374, "loss": 0.0149, "step": 327700 }, { "epoch": 0.85, "learning_rate": 0.0001725792612907323, "loss": 0.012, "step": 327710 }, { "epoch": 0.85, "learning_rate": 0.00017257537307436083, "loss": 0.0142, "step": 327720 }, { "epoch": 0.85, "learning_rate": 0.00017257148485798937, "loss": 0.0154, "step": 327730 }, { "epoch": 0.85, "learning_rate": 0.00017256759664161788, "loss": 0.0113, "step": 327740 }, { "epoch": 0.85, "learning_rate": 0.00017256370842524642, "loss": 0.0161, "step": 327750 }, { "epoch": 0.85, "learning_rate": 0.00017255982020887497, "loss": 0.0141, "step": 327760 }, { "epoch": 0.85, "learning_rate": 0.0001725559319925035, "loss": 0.0132, "step": 327770 }, { "epoch": 0.85, "learning_rate": 0.00017255204377613202, "loss": 0.0115, "step": 327780 }, { "epoch": 0.85, "learning_rate": 0.00017254815555976056, "loss": 0.0173, "step": 327790 }, { "epoch": 0.85, "learning_rate": 0.00017254426734338913, "loss": 0.0208, "step": 327800 }, { "epoch": 0.85, "learning_rate": 0.00017254037912701765, "loss": 0.0145, "step": 327810 }, { "epoch": 0.85, "learning_rate": 0.00017253649091064616, "loss": 0.0137, "step": 327820 }, { "epoch": 0.85, "learning_rate": 0.0001725326026942747, "loss": 0.0146, "step": 327830 }, { "epoch": 0.85, "learning_rate": 0.00017252871447790327, "loss": 0.0122, "step": 327840 }, { "epoch": 0.85, "learning_rate": 0.0001725248262615318, "loss": 0.0123, "step": 327850 }, { "epoch": 0.85, "learning_rate": 0.00017252093804516033, "loss": 0.015, "step": 327860 }, { "epoch": 0.85, "learning_rate": 0.00017251704982878884, "loss": 0.0129, "step": 327870 }, { "epoch": 0.85, "learning_rate": 0.0001725131616124174, "loss": 0.0125, "step": 327880 }, { "epoch": 0.85, "learning_rate": 0.00017250927339604593, "loss": 0.0143, "step": 327890 }, { "epoch": 0.85, "learning_rate": 0.00017250538517967447, "loss": 0.0116, "step": 327900 }, { "epoch": 0.85, "learning_rate": 0.00017250149696330298, "loss": 0.0186, "step": 327910 }, { "epoch": 0.85, "learning_rate": 0.00017249760874693155, "loss": 0.015, "step": 327920 }, { "epoch": 0.85, "learning_rate": 0.00017249372053056007, "loss": 0.016, "step": 327930 }, { "epoch": 0.85, "learning_rate": 0.0001724898323141886, "loss": 0.0113, "step": 327940 }, { "epoch": 0.85, "learning_rate": 0.00017248594409781712, "loss": 0.0156, "step": 327950 }, { "epoch": 0.85, "learning_rate": 0.0001724820558814457, "loss": 0.0145, "step": 327960 }, { "epoch": 0.85, "learning_rate": 0.0001724781676650742, "loss": 0.0138, "step": 327970 }, { "epoch": 0.85, "learning_rate": 0.00017247427944870275, "loss": 0.013, "step": 327980 }, { "epoch": 0.85, "learning_rate": 0.00017247039123233126, "loss": 0.0133, "step": 327990 }, { "epoch": 0.85, "learning_rate": 0.0001724665030159598, "loss": 0.0127, "step": 328000 }, { "epoch": 0.85, "eval_cer": 0.8817222812402463, "eval_loss": 0.009132904931902885, "eval_runtime": 107.5638, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.648, "step": 328000 }, { "epoch": 0.85, "learning_rate": 0.00017246261479958837, "loss": 0.0146, "step": 328010 }, { "epoch": 0.85, "learning_rate": 0.00017245872658321689, "loss": 0.0105, "step": 328020 }, { "epoch": 0.85, "learning_rate": 0.00017245483836684543, "loss": 0.0131, "step": 328030 }, { "epoch": 0.85, "learning_rate": 0.00017245095015047394, "loss": 0.0128, "step": 328040 }, { "epoch": 0.85, "learning_rate": 0.0001724470619341025, "loss": 0.0125, "step": 328050 }, { "epoch": 0.85, "learning_rate": 0.00017244317371773103, "loss": 0.0126, "step": 328060 }, { "epoch": 0.85, "learning_rate": 0.00017243928550135957, "loss": 0.014, "step": 328070 }, { "epoch": 0.85, "learning_rate": 0.00017243539728498808, "loss": 0.0143, "step": 328080 }, { "epoch": 0.85, "learning_rate": 0.00017243150906861665, "loss": 0.0197, "step": 328090 }, { "epoch": 0.85, "learning_rate": 0.00017242762085224516, "loss": 0.0125, "step": 328100 }, { "epoch": 0.85, "learning_rate": 0.0001724237326358737, "loss": 0.0164, "step": 328110 }, { "epoch": 0.85, "learning_rate": 0.00017241984441950222, "loss": 0.0135, "step": 328120 }, { "epoch": 0.85, "learning_rate": 0.0001724159562031308, "loss": 0.0141, "step": 328130 }, { "epoch": 0.85, "learning_rate": 0.0001724120679867593, "loss": 0.0173, "step": 328140 }, { "epoch": 0.85, "learning_rate": 0.00017240817977038785, "loss": 0.014, "step": 328150 }, { "epoch": 0.85, "learning_rate": 0.00017240429155401636, "loss": 0.0158, "step": 328160 }, { "epoch": 0.85, "learning_rate": 0.00017240040333764493, "loss": 0.0153, "step": 328170 }, { "epoch": 0.85, "learning_rate": 0.00017239651512127347, "loss": 0.0166, "step": 328180 }, { "epoch": 0.85, "learning_rate": 0.00017239262690490199, "loss": 0.0129, "step": 328190 }, { "epoch": 0.85, "learning_rate": 0.00017238873868853053, "loss": 0.0146, "step": 328200 }, { "epoch": 0.85, "learning_rate": 0.00017238485047215907, "loss": 0.0145, "step": 328210 }, { "epoch": 0.85, "learning_rate": 0.0001723809622557876, "loss": 0.0157, "step": 328220 }, { "epoch": 0.85, "learning_rate": 0.00017237707403941612, "loss": 0.013, "step": 328230 }, { "epoch": 0.85, "learning_rate": 0.00017237318582304467, "loss": 0.0132, "step": 328240 }, { "epoch": 0.85, "learning_rate": 0.00017236929760667318, "loss": 0.0153, "step": 328250 }, { "epoch": 0.85, "learning_rate": 0.00017236540939030175, "loss": 0.013, "step": 328260 }, { "epoch": 0.85, "learning_rate": 0.00017236152117393026, "loss": 0.0165, "step": 328270 }, { "epoch": 0.85, "learning_rate": 0.0001723576329575588, "loss": 0.0118, "step": 328280 }, { "epoch": 0.85, "learning_rate": 0.00017235374474118732, "loss": 0.0171, "step": 328290 }, { "epoch": 0.85, "learning_rate": 0.0001723498565248159, "loss": 0.0106, "step": 328300 }, { "epoch": 0.85, "learning_rate": 0.0001723459683084444, "loss": 0.0137, "step": 328310 }, { "epoch": 0.85, "learning_rate": 0.00017234208009207295, "loss": 0.0141, "step": 328320 }, { "epoch": 0.85, "learning_rate": 0.00017233819187570146, "loss": 0.0147, "step": 328330 }, { "epoch": 0.85, "learning_rate": 0.00017233430365933003, "loss": 0.0175, "step": 328340 }, { "epoch": 0.85, "learning_rate": 0.00017233041544295857, "loss": 0.014, "step": 328350 }, { "epoch": 0.85, "learning_rate": 0.00017232652722658708, "loss": 0.0171, "step": 328360 }, { "epoch": 0.85, "learning_rate": 0.00017232263901021563, "loss": 0.0157, "step": 328370 }, { "epoch": 0.85, "learning_rate": 0.00017231875079384417, "loss": 0.0172, "step": 328380 }, { "epoch": 0.85, "learning_rate": 0.0001723148625774727, "loss": 0.013, "step": 328390 }, { "epoch": 0.85, "learning_rate": 0.00017231097436110122, "loss": 0.0124, "step": 328400 }, { "epoch": 0.85, "learning_rate": 0.00017230708614472977, "loss": 0.0129, "step": 328410 }, { "epoch": 0.85, "learning_rate": 0.0001723031979283583, "loss": 0.0138, "step": 328420 }, { "epoch": 0.85, "learning_rate": 0.00017229930971198685, "loss": 0.0142, "step": 328430 }, { "epoch": 0.85, "learning_rate": 0.00017229542149561536, "loss": 0.0128, "step": 328440 }, { "epoch": 0.85, "learning_rate": 0.0001722915332792439, "loss": 0.014, "step": 328450 }, { "epoch": 0.85, "learning_rate": 0.00017228764506287245, "loss": 0.0135, "step": 328460 }, { "epoch": 0.85, "learning_rate": 0.000172283756846501, "loss": 0.0111, "step": 328470 }, { "epoch": 0.85, "learning_rate": 0.0001722798686301295, "loss": 0.0349, "step": 328480 }, { "epoch": 0.85, "learning_rate": 0.00017227598041375804, "loss": 0.0137, "step": 328490 }, { "epoch": 0.85, "learning_rate": 0.00017227209219738656, "loss": 0.0122, "step": 328500 }, { "epoch": 0.85, "learning_rate": 0.00017226820398101513, "loss": 0.0211, "step": 328510 }, { "epoch": 0.85, "learning_rate": 0.00017226431576464367, "loss": 0.011, "step": 328520 }, { "epoch": 0.85, "learning_rate": 0.00017226042754827218, "loss": 0.011, "step": 328530 }, { "epoch": 0.85, "learning_rate": 0.0001722565393319007, "loss": 0.0129, "step": 328540 }, { "epoch": 0.85, "learning_rate": 0.00017225265111552927, "loss": 0.0204, "step": 328550 }, { "epoch": 0.85, "learning_rate": 0.0001722487628991578, "loss": 0.0129, "step": 328560 }, { "epoch": 0.85, "learning_rate": 0.00017224487468278632, "loss": 0.0115, "step": 328570 }, { "epoch": 0.85, "learning_rate": 0.00017224098646641487, "loss": 0.0104, "step": 328580 }, { "epoch": 0.85, "learning_rate": 0.0001722370982500434, "loss": 0.0133, "step": 328590 }, { "epoch": 0.85, "learning_rate": 0.00017223321003367195, "loss": 0.0137, "step": 328600 }, { "epoch": 0.85, "learning_rate": 0.00017222932181730046, "loss": 0.0165, "step": 328610 }, { "epoch": 0.85, "learning_rate": 0.000172225433600929, "loss": 0.0169, "step": 328620 }, { "epoch": 0.85, "learning_rate": 0.00017222154538455755, "loss": 0.0118, "step": 328630 }, { "epoch": 0.85, "learning_rate": 0.0001722176571681861, "loss": 0.0143, "step": 328640 }, { "epoch": 0.85, "learning_rate": 0.0001722137689518146, "loss": 0.0121, "step": 328650 }, { "epoch": 0.85, "learning_rate": 0.00017220988073544314, "loss": 0.0165, "step": 328660 }, { "epoch": 0.85, "learning_rate": 0.0001722059925190717, "loss": 0.012, "step": 328670 }, { "epoch": 0.85, "learning_rate": 0.00017220210430270023, "loss": 0.0139, "step": 328680 }, { "epoch": 0.85, "learning_rate": 0.00017219821608632874, "loss": 0.0109, "step": 328690 }, { "epoch": 0.85, "learning_rate": 0.00017219432786995728, "loss": 0.0138, "step": 328700 }, { "epoch": 0.85, "learning_rate": 0.00017219043965358585, "loss": 0.0128, "step": 328710 }, { "epoch": 0.85, "learning_rate": 0.00017218655143721437, "loss": 0.0142, "step": 328720 }, { "epoch": 0.85, "learning_rate": 0.0001721826632208429, "loss": 0.0129, "step": 328730 }, { "epoch": 0.85, "learning_rate": 0.00017217877500447142, "loss": 0.0131, "step": 328740 }, { "epoch": 0.85, "learning_rate": 0.00017217488678809996, "loss": 0.011, "step": 328750 }, { "epoch": 0.85, "learning_rate": 0.0001721709985717285, "loss": 0.013, "step": 328760 }, { "epoch": 0.85, "learning_rate": 0.00017216711035535705, "loss": 0.0145, "step": 328770 }, { "epoch": 0.85, "learning_rate": 0.00017216322213898556, "loss": 0.0171, "step": 328780 }, { "epoch": 0.85, "learning_rate": 0.0001721593339226141, "loss": 0.0098, "step": 328790 }, { "epoch": 0.85, "learning_rate": 0.00017215544570624265, "loss": 0.0114, "step": 328800 }, { "epoch": 0.85, "learning_rate": 0.0001721515574898712, "loss": 0.0123, "step": 328810 }, { "epoch": 0.85, "learning_rate": 0.0001721476692734997, "loss": 0.0252, "step": 328820 }, { "epoch": 0.85, "learning_rate": 0.00017214378105712824, "loss": 0.0145, "step": 328830 }, { "epoch": 0.85, "learning_rate": 0.0001721398928407568, "loss": 0.0156, "step": 328840 }, { "epoch": 0.85, "learning_rate": 0.00017213600462438533, "loss": 0.015, "step": 328850 }, { "epoch": 0.85, "learning_rate": 0.00017213211640801384, "loss": 0.0142, "step": 328860 }, { "epoch": 0.85, "learning_rate": 0.00017212822819164238, "loss": 0.0127, "step": 328870 }, { "epoch": 0.85, "learning_rate": 0.00017212433997527095, "loss": 0.0112, "step": 328880 }, { "epoch": 0.85, "learning_rate": 0.00017212045175889947, "loss": 0.0196, "step": 328890 }, { "epoch": 0.85, "learning_rate": 0.000172116563542528, "loss": 0.015, "step": 328900 }, { "epoch": 0.85, "learning_rate": 0.00017211267532615652, "loss": 0.0139, "step": 328910 }, { "epoch": 0.85, "learning_rate": 0.0001721087871097851, "loss": 0.0185, "step": 328920 }, { "epoch": 0.85, "learning_rate": 0.0001721048988934136, "loss": 0.0116, "step": 328930 }, { "epoch": 0.85, "learning_rate": 0.00017210101067704215, "loss": 0.0124, "step": 328940 }, { "epoch": 0.85, "learning_rate": 0.00017209712246067066, "loss": 0.0144, "step": 328950 }, { "epoch": 0.85, "learning_rate": 0.00017209323424429923, "loss": 0.0115, "step": 328960 }, { "epoch": 0.85, "learning_rate": 0.00017208934602792775, "loss": 0.0127, "step": 328970 }, { "epoch": 0.85, "learning_rate": 0.0001720854578115563, "loss": 0.0117, "step": 328980 }, { "epoch": 0.85, "learning_rate": 0.0001720815695951848, "loss": 0.0105, "step": 328990 }, { "epoch": 0.85, "learning_rate": 0.00017207768137881334, "loss": 0.013, "step": 329000 }, { "epoch": 0.85, "eval_cer": 0.8817348779726539, "eval_loss": 0.009153938852250576, "eval_runtime": 107.5607, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 329000 }, { "epoch": 0.85, "learning_rate": 0.00017207379316244188, "loss": 0.0126, "step": 329010 }, { "epoch": 0.85, "learning_rate": 0.00017206990494607043, "loss": 0.0101, "step": 329020 }, { "epoch": 0.85, "learning_rate": 0.00017206601672969894, "loss": 0.0113, "step": 329030 }, { "epoch": 0.85, "learning_rate": 0.00017206212851332748, "loss": 0.0129, "step": 329040 }, { "epoch": 0.85, "learning_rate": 0.00017205824029695605, "loss": 0.0165, "step": 329050 }, { "epoch": 0.85, "learning_rate": 0.00017205435208058457, "loss": 0.0136, "step": 329060 }, { "epoch": 0.85, "learning_rate": 0.0001720504638642131, "loss": 0.015, "step": 329070 }, { "epoch": 0.85, "learning_rate": 0.00017204657564784162, "loss": 0.0145, "step": 329080 }, { "epoch": 0.85, "learning_rate": 0.0001720426874314702, "loss": 0.0143, "step": 329090 }, { "epoch": 0.85, "learning_rate": 0.0001720387992150987, "loss": 0.013, "step": 329100 }, { "epoch": 0.85, "learning_rate": 0.00017203491099872725, "loss": 0.0144, "step": 329110 }, { "epoch": 0.85, "learning_rate": 0.00017203102278235576, "loss": 0.0118, "step": 329120 }, { "epoch": 0.85, "learning_rate": 0.00017202713456598433, "loss": 0.0129, "step": 329130 }, { "epoch": 0.85, "learning_rate": 0.00017202324634961284, "loss": 0.0175, "step": 329140 }, { "epoch": 0.85, "learning_rate": 0.00017201935813324139, "loss": 0.0116, "step": 329150 }, { "epoch": 0.85, "learning_rate": 0.0001720154699168699, "loss": 0.0123, "step": 329160 }, { "epoch": 0.85, "learning_rate": 0.00017201158170049847, "loss": 0.0142, "step": 329170 }, { "epoch": 0.85, "learning_rate": 0.00017200769348412698, "loss": 0.015, "step": 329180 }, { "epoch": 0.85, "learning_rate": 0.00017200380526775553, "loss": 0.0116, "step": 329190 }, { "epoch": 0.85, "learning_rate": 0.00017199991705138404, "loss": 0.0145, "step": 329200 }, { "epoch": 0.85, "learning_rate": 0.0001719960288350126, "loss": 0.0157, "step": 329210 }, { "epoch": 0.85, "learning_rate": 0.00017199214061864115, "loss": 0.0109, "step": 329220 }, { "epoch": 0.85, "learning_rate": 0.00017198825240226967, "loss": 0.0126, "step": 329230 }, { "epoch": 0.85, "learning_rate": 0.0001719843641858982, "loss": 0.0102, "step": 329240 }, { "epoch": 0.85, "learning_rate": 0.00017198047596952672, "loss": 0.0148, "step": 329250 }, { "epoch": 0.85, "learning_rate": 0.0001719765877531553, "loss": 0.0178, "step": 329260 }, { "epoch": 0.85, "learning_rate": 0.0001719726995367838, "loss": 0.0133, "step": 329270 }, { "epoch": 0.85, "learning_rate": 0.00017196881132041235, "loss": 0.012, "step": 329280 }, { "epoch": 0.85, "learning_rate": 0.00017196492310404086, "loss": 0.013, "step": 329290 }, { "epoch": 0.85, "learning_rate": 0.00017196103488766943, "loss": 0.0154, "step": 329300 }, { "epoch": 0.85, "learning_rate": 0.00017195714667129794, "loss": 0.0109, "step": 329310 }, { "epoch": 0.85, "learning_rate": 0.00017195325845492649, "loss": 0.0142, "step": 329320 }, { "epoch": 0.85, "learning_rate": 0.000171949370238555, "loss": 0.0132, "step": 329330 }, { "epoch": 0.85, "learning_rate": 0.00017194548202218357, "loss": 0.0151, "step": 329340 }, { "epoch": 0.85, "learning_rate": 0.00017194159380581208, "loss": 0.0124, "step": 329350 }, { "epoch": 0.85, "learning_rate": 0.00017193770558944063, "loss": 0.0231, "step": 329360 }, { "epoch": 0.85, "learning_rate": 0.00017193381737306914, "loss": 0.0133, "step": 329370 }, { "epoch": 0.85, "learning_rate": 0.0001719299291566977, "loss": 0.0112, "step": 329380 }, { "epoch": 0.85, "learning_rate": 0.00017192604094032625, "loss": 0.0149, "step": 329390 }, { "epoch": 0.85, "learning_rate": 0.00017192215272395476, "loss": 0.0142, "step": 329400 }, { "epoch": 0.85, "learning_rate": 0.00017191826450758328, "loss": 0.0253, "step": 329410 }, { "epoch": 0.85, "learning_rate": 0.00017191437629121185, "loss": 0.0118, "step": 329420 }, { "epoch": 0.85, "learning_rate": 0.0001719104880748404, "loss": 0.0094, "step": 329430 }, { "epoch": 0.85, "learning_rate": 0.0001719065998584689, "loss": 0.016, "step": 329440 }, { "epoch": 0.85, "learning_rate": 0.00017190271164209745, "loss": 0.0149, "step": 329450 }, { "epoch": 0.85, "learning_rate": 0.000171898823425726, "loss": 0.0165, "step": 329460 }, { "epoch": 0.85, "learning_rate": 0.00017189493520935453, "loss": 0.0103, "step": 329470 }, { "epoch": 0.85, "learning_rate": 0.00017189104699298304, "loss": 0.0106, "step": 329480 }, { "epoch": 0.85, "learning_rate": 0.00017188715877661159, "loss": 0.013, "step": 329490 }, { "epoch": 0.85, "learning_rate": 0.0001718832705602401, "loss": 0.0111, "step": 329500 }, { "epoch": 0.85, "learning_rate": 0.00017187938234386867, "loss": 0.0145, "step": 329510 }, { "epoch": 0.85, "learning_rate": 0.00017187549412749718, "loss": 0.0162, "step": 329520 }, { "epoch": 0.85, "learning_rate": 0.00017187160591112572, "loss": 0.0129, "step": 329530 }, { "epoch": 0.85, "learning_rate": 0.00017186771769475424, "loss": 0.0222, "step": 329540 }, { "epoch": 0.85, "learning_rate": 0.0001718638294783828, "loss": 0.0121, "step": 329550 }, { "epoch": 0.85, "learning_rate": 0.00017185994126201132, "loss": 0.0138, "step": 329560 }, { "epoch": 0.85, "learning_rate": 0.00017185605304563986, "loss": 0.0118, "step": 329570 }, { "epoch": 0.85, "learning_rate": 0.00017185216482926838, "loss": 0.0111, "step": 329580 }, { "epoch": 0.85, "learning_rate": 0.00017184827661289695, "loss": 0.0156, "step": 329590 }, { "epoch": 0.85, "learning_rate": 0.0001718443883965255, "loss": 0.0132, "step": 329600 }, { "epoch": 0.85, "learning_rate": 0.000171840500180154, "loss": 0.0138, "step": 329610 }, { "epoch": 0.85, "learning_rate": 0.00017183661196378255, "loss": 0.0125, "step": 329620 }, { "epoch": 0.85, "learning_rate": 0.0001718327237474111, "loss": 0.0167, "step": 329630 }, { "epoch": 0.85, "learning_rate": 0.00017182883553103963, "loss": 0.0159, "step": 329640 }, { "epoch": 0.85, "learning_rate": 0.00017182494731466814, "loss": 0.0127, "step": 329650 }, { "epoch": 0.85, "learning_rate": 0.00017182105909829668, "loss": 0.0129, "step": 329660 }, { "epoch": 0.85, "learning_rate": 0.00017181717088192523, "loss": 0.0138, "step": 329670 }, { "epoch": 0.85, "learning_rate": 0.00017181328266555377, "loss": 0.0125, "step": 329680 }, { "epoch": 0.85, "learning_rate": 0.00017180939444918228, "loss": 0.0113, "step": 329690 }, { "epoch": 0.85, "learning_rate": 0.00017180550623281082, "loss": 0.0139, "step": 329700 }, { "epoch": 0.85, "learning_rate": 0.0001718016180164394, "loss": 0.0163, "step": 329710 }, { "epoch": 0.85, "learning_rate": 0.0001717977298000679, "loss": 0.0123, "step": 329720 }, { "epoch": 0.85, "learning_rate": 0.00017179384158369642, "loss": 0.0134, "step": 329730 }, { "epoch": 0.85, "learning_rate": 0.00017178995336732496, "loss": 0.0121, "step": 329740 }, { "epoch": 0.85, "learning_rate": 0.00017178606515095348, "loss": 0.0131, "step": 329750 }, { "epoch": 0.85, "learning_rate": 0.00017178217693458205, "loss": 0.016, "step": 329760 }, { "epoch": 0.85, "learning_rate": 0.0001717782887182106, "loss": 0.0152, "step": 329770 }, { "epoch": 0.85, "learning_rate": 0.0001717744005018391, "loss": 0.0106, "step": 329780 }, { "epoch": 0.85, "learning_rate": 0.00017177051228546764, "loss": 0.0146, "step": 329790 }, { "epoch": 0.85, "learning_rate": 0.00017176662406909619, "loss": 0.015, "step": 329800 }, { "epoch": 0.85, "learning_rate": 0.00017176273585272473, "loss": 0.0155, "step": 329810 }, { "epoch": 0.85, "learning_rate": 0.00017175884763635324, "loss": 0.0131, "step": 329820 }, { "epoch": 0.85, "learning_rate": 0.00017175495941998178, "loss": 0.0152, "step": 329830 }, { "epoch": 0.85, "learning_rate": 0.00017175107120361033, "loss": 0.0122, "step": 329840 }, { "epoch": 0.86, "learning_rate": 0.00017174718298723887, "loss": 0.0153, "step": 329850 }, { "epoch": 0.86, "learning_rate": 0.00017174329477086738, "loss": 0.0179, "step": 329860 }, { "epoch": 0.86, "learning_rate": 0.00017173940655449592, "loss": 0.013, "step": 329870 }, { "epoch": 0.86, "learning_rate": 0.00017173551833812447, "loss": 0.0115, "step": 329880 }, { "epoch": 0.86, "learning_rate": 0.000171731630121753, "loss": 0.0168, "step": 329890 }, { "epoch": 0.86, "learning_rate": 0.00017172774190538152, "loss": 0.0148, "step": 329900 }, { "epoch": 0.86, "learning_rate": 0.00017172385368901006, "loss": 0.0208, "step": 329910 }, { "epoch": 0.86, "learning_rate": 0.00017171996547263863, "loss": 0.0132, "step": 329920 }, { "epoch": 0.86, "learning_rate": 0.00017171607725626715, "loss": 0.0151, "step": 329930 }, { "epoch": 0.86, "learning_rate": 0.0001717121890398957, "loss": 0.0174, "step": 329940 }, { "epoch": 0.86, "learning_rate": 0.0001717083008235242, "loss": 0.0138, "step": 329950 }, { "epoch": 0.86, "learning_rate": 0.00017170441260715277, "loss": 0.0126, "step": 329960 }, { "epoch": 0.86, "learning_rate": 0.00017170052439078129, "loss": 0.0125, "step": 329970 }, { "epoch": 0.86, "learning_rate": 0.00017169663617440983, "loss": 0.0162, "step": 329980 }, { "epoch": 0.86, "learning_rate": 0.00017169274795803834, "loss": 0.0123, "step": 329990 }, { "epoch": 0.86, "learning_rate": 0.00017168885974166688, "loss": 0.0171, "step": 330000 }, { "epoch": 0.86, "eval_cer": 0.881719481966378, "eval_loss": 0.008729472756385803, "eval_runtime": 107.757, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 330000 }, { "epoch": 0.86, "learning_rate": 0.00017168497152529543, "loss": 0.0129, "step": 330010 }, { "epoch": 0.86, "learning_rate": 0.00017168108330892397, "loss": 0.0154, "step": 330020 }, { "epoch": 0.86, "learning_rate": 0.00017167719509255248, "loss": 0.0135, "step": 330030 }, { "epoch": 0.86, "learning_rate": 0.00017167330687618102, "loss": 0.0169, "step": 330040 }, { "epoch": 0.86, "learning_rate": 0.00017166941865980956, "loss": 0.0126, "step": 330050 }, { "epoch": 0.86, "learning_rate": 0.0001716655304434381, "loss": 0.0143, "step": 330060 }, { "epoch": 0.86, "learning_rate": 0.00017166164222706662, "loss": 0.0127, "step": 330070 }, { "epoch": 0.86, "learning_rate": 0.00017165775401069516, "loss": 0.011, "step": 330080 }, { "epoch": 0.86, "learning_rate": 0.00017165386579432373, "loss": 0.0126, "step": 330090 }, { "epoch": 0.86, "learning_rate": 0.00017164997757795225, "loss": 0.0132, "step": 330100 }, { "epoch": 0.86, "learning_rate": 0.0001716460893615808, "loss": 0.0159, "step": 330110 }, { "epoch": 0.86, "learning_rate": 0.0001716422011452093, "loss": 0.0141, "step": 330120 }, { "epoch": 0.86, "learning_rate": 0.00017163831292883787, "loss": 0.0119, "step": 330130 }, { "epoch": 0.86, "learning_rate": 0.00017163442471246638, "loss": 0.0111, "step": 330140 }, { "epoch": 0.86, "learning_rate": 0.00017163053649609493, "loss": 0.0141, "step": 330150 }, { "epoch": 0.86, "learning_rate": 0.00017162664827972344, "loss": 0.0101, "step": 330160 }, { "epoch": 0.86, "learning_rate": 0.000171622760063352, "loss": 0.0165, "step": 330170 }, { "epoch": 0.86, "learning_rate": 0.00017161887184698052, "loss": 0.0127, "step": 330180 }, { "epoch": 0.86, "learning_rate": 0.00017161498363060907, "loss": 0.0128, "step": 330190 }, { "epoch": 0.86, "learning_rate": 0.00017161109541423758, "loss": 0.0119, "step": 330200 }, { "epoch": 0.86, "learning_rate": 0.00017160720719786615, "loss": 0.0122, "step": 330210 }, { "epoch": 0.86, "learning_rate": 0.00017160331898149466, "loss": 0.0122, "step": 330220 }, { "epoch": 0.86, "learning_rate": 0.0001715994307651232, "loss": 0.0159, "step": 330230 }, { "epoch": 0.86, "learning_rate": 0.00017159554254875172, "loss": 0.0131, "step": 330240 }, { "epoch": 0.86, "learning_rate": 0.00017159165433238026, "loss": 0.0141, "step": 330250 }, { "epoch": 0.86, "learning_rate": 0.00017158776611600883, "loss": 0.0148, "step": 330260 }, { "epoch": 0.86, "learning_rate": 0.00017158387789963734, "loss": 0.0136, "step": 330270 }, { "epoch": 0.86, "learning_rate": 0.00017157998968326586, "loss": 0.016, "step": 330280 }, { "epoch": 0.86, "learning_rate": 0.0001715761014668944, "loss": 0.0119, "step": 330290 }, { "epoch": 0.86, "learning_rate": 0.00017157221325052297, "loss": 0.0149, "step": 330300 }, { "epoch": 0.86, "learning_rate": 0.00017156832503415148, "loss": 0.012, "step": 330310 }, { "epoch": 0.86, "learning_rate": 0.00017156443681778003, "loss": 0.0102, "step": 330320 }, { "epoch": 0.86, "learning_rate": 0.00017156054860140854, "loss": 0.0113, "step": 330330 }, { "epoch": 0.86, "learning_rate": 0.0001715566603850371, "loss": 0.0127, "step": 330340 }, { "epoch": 0.86, "learning_rate": 0.00017155277216866562, "loss": 0.0156, "step": 330350 }, { "epoch": 0.86, "learning_rate": 0.00017154888395229417, "loss": 0.0149, "step": 330360 }, { "epoch": 0.86, "learning_rate": 0.00017154499573592268, "loss": 0.0176, "step": 330370 }, { "epoch": 0.86, "learning_rate": 0.00017154110751955125, "loss": 0.0153, "step": 330380 }, { "epoch": 0.86, "learning_rate": 0.00017153721930317976, "loss": 0.0135, "step": 330390 }, { "epoch": 0.86, "learning_rate": 0.0001715333310868083, "loss": 0.0135, "step": 330400 }, { "epoch": 0.86, "learning_rate": 0.00017152944287043682, "loss": 0.0138, "step": 330410 }, { "epoch": 0.86, "learning_rate": 0.0001715255546540654, "loss": 0.0133, "step": 330420 }, { "epoch": 0.86, "learning_rate": 0.00017152166643769393, "loss": 0.014, "step": 330430 }, { "epoch": 0.86, "learning_rate": 0.00017151777822132244, "loss": 0.0143, "step": 330440 }, { "epoch": 0.86, "learning_rate": 0.00017151389000495096, "loss": 0.0118, "step": 330450 }, { "epoch": 0.86, "learning_rate": 0.00017151000178857953, "loss": 0.0109, "step": 330460 }, { "epoch": 0.86, "learning_rate": 0.00017150611357220807, "loss": 0.0138, "step": 330470 }, { "epoch": 0.86, "learning_rate": 0.00017150222535583658, "loss": 0.0124, "step": 330480 }, { "epoch": 0.86, "learning_rate": 0.00017149833713946513, "loss": 0.0115, "step": 330490 }, { "epoch": 0.86, "learning_rate": 0.00017149444892309364, "loss": 0.018, "step": 330500 }, { "epoch": 0.86, "learning_rate": 0.0001714905607067222, "loss": 0.0112, "step": 330510 }, { "epoch": 0.86, "learning_rate": 0.00017148667249035072, "loss": 0.0116, "step": 330520 }, { "epoch": 0.86, "learning_rate": 0.00017148278427397926, "loss": 0.0113, "step": 330530 }, { "epoch": 0.86, "learning_rate": 0.00017147889605760778, "loss": 0.0144, "step": 330540 }, { "epoch": 0.86, "learning_rate": 0.00017147500784123635, "loss": 0.0136, "step": 330550 }, { "epoch": 0.86, "learning_rate": 0.00017147111962486486, "loss": 0.0137, "step": 330560 }, { "epoch": 0.86, "learning_rate": 0.0001714672314084934, "loss": 0.0128, "step": 330570 }, { "epoch": 0.86, "learning_rate": 0.00017146334319212192, "loss": 0.0134, "step": 330580 }, { "epoch": 0.86, "learning_rate": 0.0001714594549757505, "loss": 0.0225, "step": 330590 }, { "epoch": 0.86, "learning_rate": 0.000171455566759379, "loss": 0.0123, "step": 330600 }, { "epoch": 0.86, "learning_rate": 0.00017145167854300754, "loss": 0.017, "step": 330610 }, { "epoch": 0.86, "learning_rate": 0.00017144779032663606, "loss": 0.0155, "step": 330620 }, { "epoch": 0.86, "learning_rate": 0.00017144390211026463, "loss": 0.0159, "step": 330630 }, { "epoch": 0.86, "learning_rate": 0.00017144001389389317, "loss": 0.013, "step": 330640 }, { "epoch": 0.86, "learning_rate": 0.00017143612567752168, "loss": 0.0136, "step": 330650 }, { "epoch": 0.86, "learning_rate": 0.00017143223746115022, "loss": 0.0144, "step": 330660 }, { "epoch": 0.86, "learning_rate": 0.00017142834924477877, "loss": 0.0139, "step": 330670 }, { "epoch": 0.86, "learning_rate": 0.0001714244610284073, "loss": 0.0201, "step": 330680 }, { "epoch": 0.86, "learning_rate": 0.00017142057281203582, "loss": 0.0151, "step": 330690 }, { "epoch": 0.86, "learning_rate": 0.00017141668459566436, "loss": 0.0164, "step": 330700 }, { "epoch": 0.86, "learning_rate": 0.0001714127963792929, "loss": 0.0154, "step": 330710 }, { "epoch": 0.86, "learning_rate": 0.00017140890816292145, "loss": 0.0152, "step": 330720 }, { "epoch": 0.86, "learning_rate": 0.00017140501994654996, "loss": 0.0147, "step": 330730 }, { "epoch": 0.86, "learning_rate": 0.0001714011317301785, "loss": 0.0122, "step": 330740 }, { "epoch": 0.86, "learning_rate": 0.00017139724351380702, "loss": 0.0146, "step": 330750 }, { "epoch": 0.86, "learning_rate": 0.0001713933552974356, "loss": 0.0129, "step": 330760 }, { "epoch": 0.86, "learning_rate": 0.0001713894670810641, "loss": 0.0182, "step": 330770 }, { "epoch": 0.86, "learning_rate": 0.00017138557886469264, "loss": 0.019, "step": 330780 }, { "epoch": 0.86, "learning_rate": 0.00017138169064832116, "loss": 0.0162, "step": 330790 }, { "epoch": 0.86, "learning_rate": 0.00017137780243194973, "loss": 0.0137, "step": 330800 }, { "epoch": 0.86, "learning_rate": 0.00017137391421557827, "loss": 0.0141, "step": 330810 }, { "epoch": 0.86, "learning_rate": 0.00017137002599920678, "loss": 0.0165, "step": 330820 }, { "epoch": 0.86, "learning_rate": 0.00017136613778283532, "loss": 0.0161, "step": 330830 }, { "epoch": 0.86, "learning_rate": 0.00017136224956646387, "loss": 0.0141, "step": 330840 }, { "epoch": 0.86, "learning_rate": 0.0001713583613500924, "loss": 0.0126, "step": 330850 }, { "epoch": 0.86, "learning_rate": 0.00017135447313372092, "loss": 0.0146, "step": 330860 }, { "epoch": 0.86, "learning_rate": 0.00017135058491734946, "loss": 0.0105, "step": 330870 }, { "epoch": 0.86, "learning_rate": 0.000171346696700978, "loss": 0.014, "step": 330880 }, { "epoch": 0.86, "learning_rate": 0.00017134280848460655, "loss": 0.0153, "step": 330890 }, { "epoch": 0.86, "learning_rate": 0.00017133892026823506, "loss": 0.013, "step": 330900 }, { "epoch": 0.86, "learning_rate": 0.0001713350320518636, "loss": 0.0146, "step": 330910 }, { "epoch": 0.86, "learning_rate": 0.00017133114383549214, "loss": 0.0178, "step": 330920 }, { "epoch": 0.86, "learning_rate": 0.0001713272556191207, "loss": 0.0146, "step": 330930 }, { "epoch": 0.86, "learning_rate": 0.0001713233674027492, "loss": 0.0125, "step": 330940 }, { "epoch": 0.86, "learning_rate": 0.00017131947918637774, "loss": 0.0151, "step": 330950 }, { "epoch": 0.86, "learning_rate": 0.0001713155909700063, "loss": 0.0131, "step": 330960 }, { "epoch": 0.86, "learning_rate": 0.00017131170275363483, "loss": 0.0151, "step": 330970 }, { "epoch": 0.86, "learning_rate": 0.00017130781453726337, "loss": 0.0112, "step": 330980 }, { "epoch": 0.86, "learning_rate": 0.00017130392632089188, "loss": 0.0154, "step": 330990 }, { "epoch": 0.86, "learning_rate": 0.0001713000381045204, "loss": 0.0131, "step": 331000 }, { "epoch": 0.86, "eval_cer": 0.881751673615864, "eval_loss": 0.008923850953578949, "eval_runtime": 107.6261, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 331000 }, { "epoch": 0.86, "learning_rate": 0.00017129614988814897, "loss": 0.0114, "step": 331010 }, { "epoch": 0.86, "learning_rate": 0.0001712922616717775, "loss": 0.0155, "step": 331020 }, { "epoch": 0.86, "learning_rate": 0.00017128837345540602, "loss": 0.0134, "step": 331030 }, { "epoch": 0.86, "learning_rate": 0.00017128448523903456, "loss": 0.0115, "step": 331040 }, { "epoch": 0.86, "learning_rate": 0.0001712805970226631, "loss": 0.012, "step": 331050 }, { "epoch": 0.86, "learning_rate": 0.00017127670880629165, "loss": 0.0119, "step": 331060 }, { "epoch": 0.86, "learning_rate": 0.00017127282058992016, "loss": 0.0099, "step": 331070 }, { "epoch": 0.86, "learning_rate": 0.0001712689323735487, "loss": 0.0112, "step": 331080 }, { "epoch": 0.86, "learning_rate": 0.00017126504415717724, "loss": 0.0124, "step": 331090 }, { "epoch": 0.86, "learning_rate": 0.00017126115594080579, "loss": 0.0145, "step": 331100 }, { "epoch": 0.86, "learning_rate": 0.0001712572677244343, "loss": 0.0109, "step": 331110 }, { "epoch": 0.86, "learning_rate": 0.00017125337950806284, "loss": 0.0146, "step": 331120 }, { "epoch": 0.86, "learning_rate": 0.0001712494912916914, "loss": 0.0133, "step": 331130 }, { "epoch": 0.86, "learning_rate": 0.00017124560307531993, "loss": 0.0123, "step": 331140 }, { "epoch": 0.86, "learning_rate": 0.00017124171485894844, "loss": 0.0105, "step": 331150 }, { "epoch": 0.86, "learning_rate": 0.00017123782664257698, "loss": 0.0137, "step": 331160 }, { "epoch": 0.86, "learning_rate": 0.00017123393842620555, "loss": 0.0087, "step": 331170 }, { "epoch": 0.86, "learning_rate": 0.00017123005020983406, "loss": 0.014, "step": 331180 }, { "epoch": 0.86, "learning_rate": 0.0001712261619934626, "loss": 0.0133, "step": 331190 }, { "epoch": 0.86, "learning_rate": 0.00017122227377709112, "loss": 0.0117, "step": 331200 }, { "epoch": 0.86, "learning_rate": 0.0001712183855607197, "loss": 0.0222, "step": 331210 }, { "epoch": 0.86, "learning_rate": 0.0001712144973443482, "loss": 0.0128, "step": 331220 }, { "epoch": 0.86, "learning_rate": 0.00017121060912797675, "loss": 0.0151, "step": 331230 }, { "epoch": 0.86, "learning_rate": 0.00017120672091160526, "loss": 0.0166, "step": 331240 }, { "epoch": 0.86, "learning_rate": 0.0001712028326952338, "loss": 0.0176, "step": 331250 }, { "epoch": 0.86, "learning_rate": 0.00017119894447886234, "loss": 0.0131, "step": 331260 }, { "epoch": 0.86, "learning_rate": 0.00017119505626249089, "loss": 0.0138, "step": 331270 }, { "epoch": 0.86, "learning_rate": 0.0001711911680461194, "loss": 0.0142, "step": 331280 }, { "epoch": 0.86, "learning_rate": 0.00017118727982974794, "loss": 0.0138, "step": 331290 }, { "epoch": 0.86, "learning_rate": 0.0001711833916133765, "loss": 0.0156, "step": 331300 }, { "epoch": 0.86, "learning_rate": 0.00017117950339700502, "loss": 0.0109, "step": 331310 }, { "epoch": 0.86, "learning_rate": 0.00017117561518063354, "loss": 0.0128, "step": 331320 }, { "epoch": 0.86, "learning_rate": 0.00017117172696426208, "loss": 0.0102, "step": 331330 }, { "epoch": 0.86, "learning_rate": 0.00017116783874789065, "loss": 0.0139, "step": 331340 }, { "epoch": 0.86, "learning_rate": 0.00017116395053151916, "loss": 0.0145, "step": 331350 }, { "epoch": 0.86, "learning_rate": 0.0001711600623151477, "loss": 0.017, "step": 331360 }, { "epoch": 0.86, "learning_rate": 0.00017115617409877622, "loss": 0.0148, "step": 331370 }, { "epoch": 0.86, "learning_rate": 0.0001711522858824048, "loss": 0.0167, "step": 331380 }, { "epoch": 0.86, "learning_rate": 0.0001711483976660333, "loss": 0.0107, "step": 331390 }, { "epoch": 0.86, "learning_rate": 0.00017114450944966185, "loss": 0.0157, "step": 331400 }, { "epoch": 0.86, "learning_rate": 0.00017114062123329036, "loss": 0.0146, "step": 331410 }, { "epoch": 0.86, "learning_rate": 0.00017113673301691893, "loss": 0.0148, "step": 331420 }, { "epoch": 0.86, "learning_rate": 0.00017113284480054744, "loss": 0.0122, "step": 331430 }, { "epoch": 0.86, "learning_rate": 0.00017112895658417598, "loss": 0.0095, "step": 331440 }, { "epoch": 0.86, "learning_rate": 0.0001711250683678045, "loss": 0.0139, "step": 331450 }, { "epoch": 0.86, "learning_rate": 0.00017112118015143307, "loss": 0.0113, "step": 331460 }, { "epoch": 0.86, "learning_rate": 0.00017111729193506158, "loss": 0.0146, "step": 331470 }, { "epoch": 0.86, "learning_rate": 0.00017111340371869012, "loss": 0.0152, "step": 331480 }, { "epoch": 0.86, "learning_rate": 0.00017110951550231864, "loss": 0.0145, "step": 331490 }, { "epoch": 0.86, "learning_rate": 0.00017110562728594718, "loss": 0.0123, "step": 331500 }, { "epoch": 0.86, "learning_rate": 0.00017110173906957575, "loss": 0.0177, "step": 331510 }, { "epoch": 0.86, "learning_rate": 0.00017109785085320426, "loss": 0.0129, "step": 331520 }, { "epoch": 0.86, "learning_rate": 0.0001710939626368328, "loss": 0.0123, "step": 331530 }, { "epoch": 0.86, "learning_rate": 0.00017109007442046132, "loss": 0.0134, "step": 331540 }, { "epoch": 0.86, "learning_rate": 0.0001710861862040899, "loss": 0.0136, "step": 331550 }, { "epoch": 0.86, "learning_rate": 0.0001710822979877184, "loss": 0.015, "step": 331560 }, { "epoch": 0.86, "learning_rate": 0.00017107840977134694, "loss": 0.0148, "step": 331570 }, { "epoch": 0.86, "learning_rate": 0.00017107452155497546, "loss": 0.013, "step": 331580 }, { "epoch": 0.86, "learning_rate": 0.00017107063333860403, "loss": 0.0106, "step": 331590 }, { "epoch": 0.86, "learning_rate": 0.00017106674512223254, "loss": 0.0158, "step": 331600 }, { "epoch": 0.86, "learning_rate": 0.00017106285690586108, "loss": 0.0109, "step": 331610 }, { "epoch": 0.86, "learning_rate": 0.0001710589686894896, "loss": 0.0098, "step": 331620 }, { "epoch": 0.86, "learning_rate": 0.00017105508047311817, "loss": 0.0135, "step": 331630 }, { "epoch": 0.86, "learning_rate": 0.00017105119225674668, "loss": 0.0149, "step": 331640 }, { "epoch": 0.86, "learning_rate": 0.00017104730404037522, "loss": 0.014, "step": 331650 }, { "epoch": 0.86, "learning_rate": 0.00017104341582400374, "loss": 0.0132, "step": 331660 }, { "epoch": 0.86, "learning_rate": 0.0001710395276076323, "loss": 0.0137, "step": 331670 }, { "epoch": 0.86, "learning_rate": 0.00017103563939126085, "loss": 0.0146, "step": 331680 }, { "epoch": 0.86, "learning_rate": 0.00017103175117488936, "loss": 0.0137, "step": 331690 }, { "epoch": 0.86, "learning_rate": 0.0001710278629585179, "loss": 0.0107, "step": 331700 }, { "epoch": 0.86, "learning_rate": 0.00017102397474214645, "loss": 0.0133, "step": 331710 }, { "epoch": 0.86, "learning_rate": 0.000171020086525775, "loss": 0.0117, "step": 331720 }, { "epoch": 0.86, "learning_rate": 0.0001710161983094035, "loss": 0.0121, "step": 331730 }, { "epoch": 0.86, "learning_rate": 0.00017101231009303204, "loss": 0.0108, "step": 331740 }, { "epoch": 0.86, "learning_rate": 0.00017100842187666056, "loss": 0.0139, "step": 331750 }, { "epoch": 0.86, "learning_rate": 0.00017100453366028913, "loss": 0.0117, "step": 331760 }, { "epoch": 0.86, "learning_rate": 0.00017100064544391764, "loss": 0.0131, "step": 331770 }, { "epoch": 0.86, "learning_rate": 0.00017099675722754618, "loss": 0.013, "step": 331780 }, { "epoch": 0.86, "learning_rate": 0.0001709928690111747, "loss": 0.0102, "step": 331790 }, { "epoch": 0.86, "learning_rate": 0.00017098898079480327, "loss": 0.0127, "step": 331800 }, { "epoch": 0.86, "learning_rate": 0.00017098509257843178, "loss": 0.0174, "step": 331810 }, { "epoch": 0.86, "learning_rate": 0.00017098120436206032, "loss": 0.0113, "step": 331820 }, { "epoch": 0.86, "learning_rate": 0.00017097731614568884, "loss": 0.0113, "step": 331830 }, { "epoch": 0.86, "learning_rate": 0.0001709734279293174, "loss": 0.0131, "step": 331840 }, { "epoch": 0.86, "learning_rate": 0.00017096953971294595, "loss": 0.0127, "step": 331850 }, { "epoch": 0.86, "learning_rate": 0.00017096565149657446, "loss": 0.0098, "step": 331860 }, { "epoch": 0.86, "learning_rate": 0.00017096176328020298, "loss": 0.0137, "step": 331870 }, { "epoch": 0.86, "learning_rate": 0.00017095787506383155, "loss": 0.0098, "step": 331880 }, { "epoch": 0.86, "learning_rate": 0.0001709539868474601, "loss": 0.0137, "step": 331890 }, { "epoch": 0.86, "learning_rate": 0.0001709500986310886, "loss": 0.0197, "step": 331900 }, { "epoch": 0.86, "learning_rate": 0.00017094621041471714, "loss": 0.0109, "step": 331910 }, { "epoch": 0.86, "learning_rate": 0.00017094232219834569, "loss": 0.0142, "step": 331920 }, { "epoch": 0.86, "learning_rate": 0.00017093843398197423, "loss": 0.0144, "step": 331930 }, { "epoch": 0.86, "learning_rate": 0.00017093454576560274, "loss": 0.0135, "step": 331940 }, { "epoch": 0.86, "learning_rate": 0.00017093065754923128, "loss": 0.0132, "step": 331950 }, { "epoch": 0.86, "learning_rate": 0.00017092676933285982, "loss": 0.0142, "step": 331960 }, { "epoch": 0.86, "learning_rate": 0.00017092288111648837, "loss": 0.0137, "step": 331970 }, { "epoch": 0.86, "learning_rate": 0.00017091899290011688, "loss": 0.0121, "step": 331980 }, { "epoch": 0.86, "learning_rate": 0.00017091510468374542, "loss": 0.015, "step": 331990 }, { "epoch": 0.86, "learning_rate": 0.00017091121646737394, "loss": 0.0125, "step": 332000 }, { "epoch": 0.86, "eval_cer": 0.8816900895907601, "eval_loss": 0.008775945752859116, "eval_runtime": 107.8889, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.634, "step": 332000 }, { "epoch": 0.86, "learning_rate": 0.0001709073282510025, "loss": 0.015, "step": 332010 }, { "epoch": 0.86, "learning_rate": 0.00017090344003463105, "loss": 0.0138, "step": 332020 }, { "epoch": 0.86, "learning_rate": 0.00017089955181825956, "loss": 0.017, "step": 332030 }, { "epoch": 0.86, "learning_rate": 0.00017089566360188808, "loss": 0.0146, "step": 332040 }, { "epoch": 0.86, "learning_rate": 0.00017089177538551665, "loss": 0.0199, "step": 332050 }, { "epoch": 0.86, "learning_rate": 0.0001708878871691452, "loss": 0.0132, "step": 332060 }, { "epoch": 0.86, "learning_rate": 0.0001708839989527737, "loss": 0.0123, "step": 332070 }, { "epoch": 0.86, "learning_rate": 0.00017088011073640224, "loss": 0.0106, "step": 332080 }, { "epoch": 0.86, "learning_rate": 0.00017087622252003078, "loss": 0.0132, "step": 332090 }, { "epoch": 0.86, "learning_rate": 0.00017087233430365933, "loss": 0.0136, "step": 332100 }, { "epoch": 0.86, "learning_rate": 0.00017086844608728784, "loss": 0.0139, "step": 332110 }, { "epoch": 0.86, "learning_rate": 0.00017086455787091638, "loss": 0.0131, "step": 332120 }, { "epoch": 0.86, "learning_rate": 0.00017086066965454492, "loss": 0.0116, "step": 332130 }, { "epoch": 0.86, "learning_rate": 0.00017085678143817347, "loss": 0.0118, "step": 332140 }, { "epoch": 0.86, "learning_rate": 0.00017085289322180198, "loss": 0.0178, "step": 332150 }, { "epoch": 0.86, "learning_rate": 0.00017084900500543052, "loss": 0.0125, "step": 332160 }, { "epoch": 0.86, "learning_rate": 0.0001708451167890591, "loss": 0.0115, "step": 332170 }, { "epoch": 0.86, "learning_rate": 0.0001708412285726876, "loss": 0.0173, "step": 332180 }, { "epoch": 0.86, "learning_rate": 0.00017083734035631612, "loss": 0.01, "step": 332190 }, { "epoch": 0.86, "learning_rate": 0.00017083345213994466, "loss": 0.0127, "step": 332200 }, { "epoch": 0.86, "learning_rate": 0.00017082956392357323, "loss": 0.0217, "step": 332210 }, { "epoch": 0.86, "learning_rate": 0.00017082567570720174, "loss": 0.0123, "step": 332220 }, { "epoch": 0.86, "learning_rate": 0.00017082178749083029, "loss": 0.024, "step": 332230 }, { "epoch": 0.86, "learning_rate": 0.0001708178992744588, "loss": 0.0116, "step": 332240 }, { "epoch": 0.86, "learning_rate": 0.00017081401105808734, "loss": 0.0123, "step": 332250 }, { "epoch": 0.86, "learning_rate": 0.00017081012284171588, "loss": 0.0166, "step": 332260 }, { "epoch": 0.86, "learning_rate": 0.00017080623462534443, "loss": 0.0113, "step": 332270 }, { "epoch": 0.86, "learning_rate": 0.00017080234640897294, "loss": 0.0109, "step": 332280 }, { "epoch": 0.86, "learning_rate": 0.00017079845819260148, "loss": 0.0148, "step": 332290 }, { "epoch": 0.86, "learning_rate": 0.00017079456997623002, "loss": 0.0157, "step": 332300 }, { "epoch": 0.86, "learning_rate": 0.00017079068175985857, "loss": 0.012, "step": 332310 }, { "epoch": 0.86, "learning_rate": 0.00017078679354348708, "loss": 0.0125, "step": 332320 }, { "epoch": 0.86, "learning_rate": 0.00017078290532711562, "loss": 0.0242, "step": 332330 }, { "epoch": 0.86, "learning_rate": 0.00017077901711074416, "loss": 0.0101, "step": 332340 }, { "epoch": 0.86, "learning_rate": 0.0001707751288943727, "loss": 0.017, "step": 332350 }, { "epoch": 0.86, "learning_rate": 0.00017077124067800122, "loss": 0.0117, "step": 332360 }, { "epoch": 0.86, "learning_rate": 0.00017076735246162976, "loss": 0.0156, "step": 332370 }, { "epoch": 0.86, "learning_rate": 0.00017076346424525833, "loss": 0.0124, "step": 332380 }, { "epoch": 0.86, "learning_rate": 0.00017075957602888684, "loss": 0.0128, "step": 332390 }, { "epoch": 0.86, "learning_rate": 0.00017075568781251539, "loss": 0.0131, "step": 332400 }, { "epoch": 0.86, "learning_rate": 0.0001707517995961439, "loss": 0.0149, "step": 332410 }, { "epoch": 0.86, "learning_rate": 0.00017074791137977247, "loss": 0.011, "step": 332420 }, { "epoch": 0.86, "learning_rate": 0.00017074402316340098, "loss": 0.0156, "step": 332430 }, { "epoch": 0.86, "learning_rate": 0.00017074013494702953, "loss": 0.0137, "step": 332440 }, { "epoch": 0.86, "learning_rate": 0.00017073624673065804, "loss": 0.0189, "step": 332450 }, { "epoch": 0.86, "learning_rate": 0.0001707323585142866, "loss": 0.016, "step": 332460 }, { "epoch": 0.86, "learning_rate": 0.00017072847029791512, "loss": 0.016, "step": 332470 }, { "epoch": 0.86, "learning_rate": 0.00017072458208154366, "loss": 0.0127, "step": 332480 }, { "epoch": 0.86, "learning_rate": 0.00017072069386517218, "loss": 0.0099, "step": 332490 }, { "epoch": 0.86, "learning_rate": 0.00017071680564880072, "loss": 0.0143, "step": 332500 }, { "epoch": 0.86, "learning_rate": 0.00017071291743242926, "loss": 0.0144, "step": 332510 }, { "epoch": 0.86, "learning_rate": 0.0001707090292160578, "loss": 0.0136, "step": 332520 }, { "epoch": 0.86, "learning_rate": 0.00017070514099968632, "loss": 0.0109, "step": 332530 }, { "epoch": 0.86, "learning_rate": 0.00017070125278331486, "loss": 0.0157, "step": 332540 }, { "epoch": 0.86, "learning_rate": 0.00017069736456694343, "loss": 0.0183, "step": 332550 }, { "epoch": 0.86, "learning_rate": 0.00017069347635057194, "loss": 0.0135, "step": 332560 }, { "epoch": 0.86, "learning_rate": 0.00017068958813420049, "loss": 0.0117, "step": 332570 }, { "epoch": 0.86, "learning_rate": 0.000170685699917829, "loss": 0.0142, "step": 332580 }, { "epoch": 0.86, "learning_rate": 0.00017068181170145757, "loss": 0.014, "step": 332590 }, { "epoch": 0.86, "learning_rate": 0.00017067792348508608, "loss": 0.0137, "step": 332600 }, { "epoch": 0.86, "learning_rate": 0.00017067403526871462, "loss": 0.0156, "step": 332610 }, { "epoch": 0.86, "learning_rate": 0.00017067014705234314, "loss": 0.0187, "step": 332620 }, { "epoch": 0.86, "learning_rate": 0.0001706662588359717, "loss": 0.016, "step": 332630 }, { "epoch": 0.86, "learning_rate": 0.00017066237061960022, "loss": 0.0123, "step": 332640 }, { "epoch": 0.86, "learning_rate": 0.00017065848240322876, "loss": 0.0118, "step": 332650 }, { "epoch": 0.86, "learning_rate": 0.00017065459418685728, "loss": 0.0126, "step": 332660 }, { "epoch": 0.86, "learning_rate": 0.00017065070597048585, "loss": 0.011, "step": 332670 }, { "epoch": 0.86, "learning_rate": 0.00017064681775411436, "loss": 0.0171, "step": 332680 }, { "epoch": 0.86, "learning_rate": 0.0001706429295377429, "loss": 0.0108, "step": 332690 }, { "epoch": 0.86, "learning_rate": 0.00017063904132137142, "loss": 0.0155, "step": 332700 }, { "epoch": 0.86, "learning_rate": 0.000170635153105, "loss": 0.0129, "step": 332710 }, { "epoch": 0.86, "learning_rate": 0.00017063126488862853, "loss": 0.0119, "step": 332720 }, { "epoch": 0.86, "learning_rate": 0.00017062737667225704, "loss": 0.0148, "step": 332730 }, { "epoch": 0.86, "learning_rate": 0.00017062348845588556, "loss": 0.0152, "step": 332740 }, { "epoch": 0.86, "learning_rate": 0.0001706196002395141, "loss": 0.0131, "step": 332750 }, { "epoch": 0.86, "learning_rate": 0.00017061571202314267, "loss": 0.0103, "step": 332760 }, { "epoch": 0.86, "learning_rate": 0.00017061182380677118, "loss": 0.013, "step": 332770 }, { "epoch": 0.86, "learning_rate": 0.00017060793559039972, "loss": 0.0127, "step": 332780 }, { "epoch": 0.86, "learning_rate": 0.00017060404737402824, "loss": 0.0133, "step": 332790 }, { "epoch": 0.86, "learning_rate": 0.0001706001591576568, "loss": 0.0165, "step": 332800 }, { "epoch": 0.86, "learning_rate": 0.00017059627094128532, "loss": 0.0134, "step": 332810 }, { "epoch": 0.86, "learning_rate": 0.00017059238272491386, "loss": 0.016, "step": 332820 }, { "epoch": 0.86, "learning_rate": 0.00017058849450854238, "loss": 0.0113, "step": 332830 }, { "epoch": 0.86, "learning_rate": 0.00017058460629217095, "loss": 0.0147, "step": 332840 }, { "epoch": 0.86, "learning_rate": 0.00017058071807579946, "loss": 0.0153, "step": 332850 }, { "epoch": 0.86, "learning_rate": 0.000170576829859428, "loss": 0.0107, "step": 332860 }, { "epoch": 0.86, "learning_rate": 0.00017057294164305652, "loss": 0.0156, "step": 332870 }, { "epoch": 0.86, "learning_rate": 0.00017056905342668509, "loss": 0.0128, "step": 332880 }, { "epoch": 0.86, "learning_rate": 0.00017056516521031363, "loss": 0.0112, "step": 332890 }, { "epoch": 0.86, "learning_rate": 0.00017056127699394214, "loss": 0.0139, "step": 332900 }, { "epoch": 0.86, "learning_rate": 0.00017055738877757066, "loss": 0.0098, "step": 332910 }, { "epoch": 0.86, "learning_rate": 0.00017055350056119923, "loss": 0.0166, "step": 332920 }, { "epoch": 0.86, "learning_rate": 0.00017054961234482777, "loss": 0.0125, "step": 332930 }, { "epoch": 0.86, "learning_rate": 0.00017054572412845628, "loss": 0.017, "step": 332940 }, { "epoch": 0.86, "learning_rate": 0.00017054183591208482, "loss": 0.0117, "step": 332950 }, { "epoch": 0.86, "learning_rate": 0.00017053794769571334, "loss": 0.0127, "step": 332960 }, { "epoch": 0.86, "learning_rate": 0.0001705340594793419, "loss": 0.0141, "step": 332970 }, { "epoch": 0.86, "learning_rate": 0.00017053017126297042, "loss": 0.0121, "step": 332980 }, { "epoch": 0.86, "learning_rate": 0.00017052628304659896, "loss": 0.0117, "step": 332990 }, { "epoch": 0.86, "learning_rate": 0.00017052239483022748, "loss": 0.0094, "step": 333000 }, { "epoch": 0.86, "eval_cer": 0.8817502739789299, "eval_loss": 0.009038124233484268, "eval_runtime": 107.8356, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 333000 }, { "epoch": 0.86, "learning_rate": 0.00017051850661385605, "loss": 0.0133, "step": 333010 }, { "epoch": 0.86, "learning_rate": 0.00017051461839748456, "loss": 0.0106, "step": 333020 }, { "epoch": 0.86, "learning_rate": 0.0001705107301811131, "loss": 0.0144, "step": 333030 }, { "epoch": 0.86, "learning_rate": 0.00017050684196474162, "loss": 0.018, "step": 333040 }, { "epoch": 0.86, "learning_rate": 0.00017050295374837019, "loss": 0.0132, "step": 333050 }, { "epoch": 0.86, "learning_rate": 0.0001704990655319987, "loss": 0.0163, "step": 333060 }, { "epoch": 0.86, "learning_rate": 0.00017049517731562724, "loss": 0.0099, "step": 333070 }, { "epoch": 0.86, "learning_rate": 0.00017049128909925576, "loss": 0.0146, "step": 333080 }, { "epoch": 0.86, "learning_rate": 0.00017048740088288432, "loss": 0.0134, "step": 333090 }, { "epoch": 0.86, "learning_rate": 0.00017048351266651287, "loss": 0.0133, "step": 333100 }, { "epoch": 0.86, "learning_rate": 0.00017047962445014138, "loss": 0.0141, "step": 333110 }, { "epoch": 0.86, "learning_rate": 0.00017047573623376992, "loss": 0.0133, "step": 333120 }, { "epoch": 0.86, "learning_rate": 0.00017047184801739846, "loss": 0.0126, "step": 333130 }, { "epoch": 0.86, "learning_rate": 0.000170467959801027, "loss": 0.0124, "step": 333140 }, { "epoch": 0.86, "learning_rate": 0.00017046407158465552, "loss": 0.0158, "step": 333150 }, { "epoch": 0.86, "learning_rate": 0.00017046018336828406, "loss": 0.0114, "step": 333160 }, { "epoch": 0.86, "learning_rate": 0.0001704562951519126, "loss": 0.013, "step": 333170 }, { "epoch": 0.86, "learning_rate": 0.00017045240693554115, "loss": 0.0127, "step": 333180 }, { "epoch": 0.86, "learning_rate": 0.00017044851871916966, "loss": 0.0138, "step": 333190 }, { "epoch": 0.86, "learning_rate": 0.0001704446305027982, "loss": 0.0122, "step": 333200 }, { "epoch": 0.86, "learning_rate": 0.00017044074228642672, "loss": 0.0177, "step": 333210 }, { "epoch": 0.86, "learning_rate": 0.00017043685407005528, "loss": 0.0155, "step": 333220 }, { "epoch": 0.86, "learning_rate": 0.0001704329658536838, "loss": 0.0159, "step": 333230 }, { "epoch": 0.86, "learning_rate": 0.00017042907763731234, "loss": 0.0158, "step": 333240 }, { "epoch": 0.86, "learning_rate": 0.00017042518942094086, "loss": 0.0141, "step": 333250 }, { "epoch": 0.86, "learning_rate": 0.00017042130120456942, "loss": 0.0108, "step": 333260 }, { "epoch": 0.86, "learning_rate": 0.00017041741298819797, "loss": 0.0146, "step": 333270 }, { "epoch": 0.86, "learning_rate": 0.00017041352477182648, "loss": 0.0165, "step": 333280 }, { "epoch": 0.86, "learning_rate": 0.00017040963655545502, "loss": 0.0111, "step": 333290 }, { "epoch": 0.86, "learning_rate": 0.00017040574833908356, "loss": 0.0141, "step": 333300 }, { "epoch": 0.86, "learning_rate": 0.0001704018601227121, "loss": 0.0136, "step": 333310 }, { "epoch": 0.86, "learning_rate": 0.00017039797190634062, "loss": 0.0144, "step": 333320 }, { "epoch": 0.86, "learning_rate": 0.00017039408368996916, "loss": 0.013, "step": 333330 }, { "epoch": 0.86, "learning_rate": 0.0001703901954735977, "loss": 0.0131, "step": 333340 }, { "epoch": 0.86, "learning_rate": 0.00017038630725722624, "loss": 0.0133, "step": 333350 }, { "epoch": 0.86, "learning_rate": 0.00017038241904085476, "loss": 0.0116, "step": 333360 }, { "epoch": 0.86, "learning_rate": 0.0001703785308244833, "loss": 0.0102, "step": 333370 }, { "epoch": 0.86, "learning_rate": 0.00017037464260811184, "loss": 0.0123, "step": 333380 }, { "epoch": 0.86, "learning_rate": 0.00017037075439174038, "loss": 0.0139, "step": 333390 }, { "epoch": 0.86, "learning_rate": 0.0001703668661753689, "loss": 0.0153, "step": 333400 }, { "epoch": 0.86, "learning_rate": 0.00017036297795899744, "loss": 0.0127, "step": 333410 }, { "epoch": 0.86, "learning_rate": 0.000170359089742626, "loss": 0.0135, "step": 333420 }, { "epoch": 0.86, "learning_rate": 0.00017035520152625452, "loss": 0.0097, "step": 333430 }, { "epoch": 0.86, "learning_rate": 0.00017035131330988307, "loss": 0.0096, "step": 333440 }, { "epoch": 0.86, "learning_rate": 0.00017034742509351158, "loss": 0.0144, "step": 333450 }, { "epoch": 0.86, "learning_rate": 0.0001703435368771401, "loss": 0.0133, "step": 333460 }, { "epoch": 0.86, "learning_rate": 0.00017033964866076866, "loss": 0.014, "step": 333470 }, { "epoch": 0.86, "learning_rate": 0.0001703357604443972, "loss": 0.015, "step": 333480 }, { "epoch": 0.86, "learning_rate": 0.00017033187222802572, "loss": 0.0113, "step": 333490 }, { "epoch": 0.86, "learning_rate": 0.00017032798401165426, "loss": 0.0123, "step": 333500 }, { "epoch": 0.86, "learning_rate": 0.0001703240957952828, "loss": 0.0098, "step": 333510 }, { "epoch": 0.86, "learning_rate": 0.00017032020757891134, "loss": 0.0142, "step": 333520 }, { "epoch": 0.86, "learning_rate": 0.00017031631936253986, "loss": 0.0116, "step": 333530 }, { "epoch": 0.86, "learning_rate": 0.0001703124311461684, "loss": 0.0156, "step": 333540 }, { "epoch": 0.86, "learning_rate": 0.00017030854292979694, "loss": 0.0153, "step": 333550 }, { "epoch": 0.86, "learning_rate": 0.00017030465471342548, "loss": 0.0145, "step": 333560 }, { "epoch": 0.86, "learning_rate": 0.000170300766497054, "loss": 0.0108, "step": 333570 }, { "epoch": 0.86, "learning_rate": 0.00017029687828068254, "loss": 0.017, "step": 333580 }, { "epoch": 0.86, "learning_rate": 0.0001702929900643111, "loss": 0.0138, "step": 333590 }, { "epoch": 0.86, "learning_rate": 0.00017028910184793962, "loss": 0.0129, "step": 333600 }, { "epoch": 0.86, "learning_rate": 0.00017028521363156816, "loss": 0.0126, "step": 333610 }, { "epoch": 0.86, "learning_rate": 0.00017028132541519668, "loss": 0.0093, "step": 333620 }, { "epoch": 0.86, "learning_rate": 0.00017027743719882525, "loss": 0.0149, "step": 333630 }, { "epoch": 0.86, "learning_rate": 0.00017027354898245376, "loss": 0.0108, "step": 333640 }, { "epoch": 0.86, "learning_rate": 0.0001702696607660823, "loss": 0.0145, "step": 333650 }, { "epoch": 0.86, "learning_rate": 0.00017026577254971082, "loss": 0.0123, "step": 333660 }, { "epoch": 0.86, "learning_rate": 0.0001702618843333394, "loss": 0.0113, "step": 333670 }, { "epoch": 0.86, "learning_rate": 0.0001702579961169679, "loss": 0.0119, "step": 333680 }, { "epoch": 0.86, "learning_rate": 0.00017025410790059644, "loss": 0.0107, "step": 333690 }, { "epoch": 0.86, "learning_rate": 0.00017025021968422496, "loss": 0.0176, "step": 333700 }, { "epoch": 0.87, "learning_rate": 0.0001702463314678535, "loss": 0.0151, "step": 333710 }, { "epoch": 0.87, "learning_rate": 0.00017024244325148204, "loss": 0.0241, "step": 333720 }, { "epoch": 0.87, "learning_rate": 0.00017023855503511058, "loss": 0.0129, "step": 333730 }, { "epoch": 0.87, "learning_rate": 0.0001702346668187391, "loss": 0.0136, "step": 333740 }, { "epoch": 0.87, "learning_rate": 0.00017023077860236764, "loss": 0.0139, "step": 333750 }, { "epoch": 0.87, "learning_rate": 0.0001702268903859962, "loss": 0.0134, "step": 333760 }, { "epoch": 0.87, "learning_rate": 0.00017022300216962472, "loss": 0.0107, "step": 333770 }, { "epoch": 0.87, "learning_rate": 0.00017021911395325324, "loss": 0.0168, "step": 333780 }, { "epoch": 0.87, "learning_rate": 0.00017021522573688178, "loss": 0.0126, "step": 333790 }, { "epoch": 0.87, "learning_rate": 0.00017021133752051035, "loss": 0.013, "step": 333800 }, { "epoch": 0.87, "learning_rate": 0.00017020744930413886, "loss": 0.0137, "step": 333810 }, { "epoch": 0.87, "learning_rate": 0.0001702035610877674, "loss": 0.0125, "step": 333820 }, { "epoch": 0.87, "learning_rate": 0.00017019967287139592, "loss": 0.0251, "step": 333830 }, { "epoch": 0.87, "learning_rate": 0.0001701957846550245, "loss": 0.0148, "step": 333840 }, { "epoch": 0.87, "learning_rate": 0.000170191896438653, "loss": 0.0147, "step": 333850 }, { "epoch": 0.87, "learning_rate": 0.00017018800822228154, "loss": 0.0138, "step": 333860 }, { "epoch": 0.87, "learning_rate": 0.00017018412000591006, "loss": 0.0183, "step": 333870 }, { "epoch": 0.87, "learning_rate": 0.00017018023178953863, "loss": 0.0129, "step": 333880 }, { "epoch": 0.87, "learning_rate": 0.00017017634357316714, "loss": 0.0138, "step": 333890 }, { "epoch": 0.87, "learning_rate": 0.00017017245535679568, "loss": 0.0117, "step": 333900 }, { "epoch": 0.87, "learning_rate": 0.0001701685671404242, "loss": 0.012, "step": 333910 }, { "epoch": 0.87, "learning_rate": 0.00017016467892405277, "loss": 0.0099, "step": 333920 }, { "epoch": 0.87, "learning_rate": 0.00017016079070768128, "loss": 0.0159, "step": 333930 }, { "epoch": 0.87, "learning_rate": 0.00017015690249130982, "loss": 0.0135, "step": 333940 }, { "epoch": 0.87, "learning_rate": 0.00017015301427493834, "loss": 0.0145, "step": 333950 }, { "epoch": 0.87, "learning_rate": 0.00017014912605856688, "loss": 0.0103, "step": 333960 }, { "epoch": 0.87, "learning_rate": 0.00017014523784219545, "loss": 0.0151, "step": 333970 }, { "epoch": 0.87, "learning_rate": 0.00017014134962582396, "loss": 0.013, "step": 333980 }, { "epoch": 0.87, "learning_rate": 0.0001701374614094525, "loss": 0.0148, "step": 333990 }, { "epoch": 0.87, "learning_rate": 0.00017013357319308102, "loss": 0.0121, "step": 334000 }, { "epoch": 0.87, "eval_cer": 0.8817306790618513, "eval_loss": 0.009081809781491756, "eval_runtime": 107.8501, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 334000 }, { "epoch": 0.87, "learning_rate": 0.0001701296849767096, "loss": 0.0123, "step": 334010 }, { "epoch": 0.87, "learning_rate": 0.0001701257967603381, "loss": 0.0134, "step": 334020 }, { "epoch": 0.87, "learning_rate": 0.00017012190854396664, "loss": 0.0162, "step": 334030 }, { "epoch": 0.87, "learning_rate": 0.00017011802032759516, "loss": 0.0145, "step": 334040 }, { "epoch": 0.87, "learning_rate": 0.00017011413211122373, "loss": 0.0147, "step": 334050 }, { "epoch": 0.87, "learning_rate": 0.00017011024389485224, "loss": 0.0129, "step": 334060 }, { "epoch": 0.87, "learning_rate": 0.00017010635567848078, "loss": 0.0114, "step": 334070 }, { "epoch": 0.87, "learning_rate": 0.0001701024674621093, "loss": 0.0134, "step": 334080 }, { "epoch": 0.87, "learning_rate": 0.00017009857924573787, "loss": 0.0109, "step": 334090 }, { "epoch": 0.87, "learning_rate": 0.00017009469102936638, "loss": 0.0136, "step": 334100 }, { "epoch": 0.87, "learning_rate": 0.00017009080281299492, "loss": 0.0125, "step": 334110 }, { "epoch": 0.87, "learning_rate": 0.00017008691459662344, "loss": 0.0112, "step": 334120 }, { "epoch": 0.87, "learning_rate": 0.000170083026380252, "loss": 0.015, "step": 334130 }, { "epoch": 0.87, "learning_rate": 0.00017007913816388055, "loss": 0.0137, "step": 334140 }, { "epoch": 0.87, "learning_rate": 0.00017007524994750906, "loss": 0.0119, "step": 334150 }, { "epoch": 0.87, "learning_rate": 0.0001700713617311376, "loss": 0.0108, "step": 334160 }, { "epoch": 0.87, "learning_rate": 0.00017006747351476614, "loss": 0.012, "step": 334170 }, { "epoch": 0.87, "learning_rate": 0.00017006358529839469, "loss": 0.015, "step": 334180 }, { "epoch": 0.87, "learning_rate": 0.0001700596970820232, "loss": 0.0124, "step": 334190 }, { "epoch": 0.87, "learning_rate": 0.00017005580886565174, "loss": 0.0119, "step": 334200 }, { "epoch": 0.87, "learning_rate": 0.00017005192064928026, "loss": 0.0177, "step": 334210 }, { "epoch": 0.87, "learning_rate": 0.00017004803243290883, "loss": 0.0119, "step": 334220 }, { "epoch": 0.87, "learning_rate": 0.00017004414421653734, "loss": 0.0169, "step": 334230 }, { "epoch": 0.87, "learning_rate": 0.00017004025600016588, "loss": 0.0137, "step": 334240 }, { "epoch": 0.87, "learning_rate": 0.0001700363677837944, "loss": 0.0145, "step": 334250 }, { "epoch": 0.87, "learning_rate": 0.00017003247956742296, "loss": 0.0116, "step": 334260 }, { "epoch": 0.87, "learning_rate": 0.00017002859135105148, "loss": 0.013, "step": 334270 }, { "epoch": 0.87, "learning_rate": 0.00017002470313468002, "loss": 0.0133, "step": 334280 }, { "epoch": 0.87, "learning_rate": 0.00017002081491830854, "loss": 0.0153, "step": 334290 }, { "epoch": 0.87, "learning_rate": 0.0001700169267019371, "loss": 0.0138, "step": 334300 }, { "epoch": 0.87, "learning_rate": 0.00017001303848556565, "loss": 0.0154, "step": 334310 }, { "epoch": 0.87, "learning_rate": 0.00017000915026919416, "loss": 0.0131, "step": 334320 }, { "epoch": 0.87, "learning_rate": 0.00017000526205282267, "loss": 0.0167, "step": 334330 }, { "epoch": 0.87, "learning_rate": 0.00017000137383645124, "loss": 0.0142, "step": 334340 }, { "epoch": 0.87, "learning_rate": 0.00016999748562007979, "loss": 0.0128, "step": 334350 }, { "epoch": 0.87, "learning_rate": 0.0001699935974037083, "loss": 0.0144, "step": 334360 }, { "epoch": 0.87, "learning_rate": 0.00016998970918733684, "loss": 0.0137, "step": 334370 }, { "epoch": 0.87, "learning_rate": 0.00016998582097096538, "loss": 0.0127, "step": 334380 }, { "epoch": 0.87, "learning_rate": 0.00016998193275459392, "loss": 0.013, "step": 334390 }, { "epoch": 0.87, "learning_rate": 0.00016997804453822244, "loss": 0.0138, "step": 334400 }, { "epoch": 0.87, "learning_rate": 0.00016997415632185098, "loss": 0.0111, "step": 334410 }, { "epoch": 0.87, "learning_rate": 0.00016997026810547952, "loss": 0.0158, "step": 334420 }, { "epoch": 0.87, "learning_rate": 0.00016996637988910806, "loss": 0.017, "step": 334430 }, { "epoch": 0.87, "learning_rate": 0.00016996249167273658, "loss": 0.0131, "step": 334440 }, { "epoch": 0.87, "learning_rate": 0.00016995860345636512, "loss": 0.0144, "step": 334450 }, { "epoch": 0.87, "learning_rate": 0.00016995471523999363, "loss": 0.0169, "step": 334460 }, { "epoch": 0.87, "learning_rate": 0.0001699508270236222, "loss": 0.0133, "step": 334470 }, { "epoch": 0.87, "learning_rate": 0.00016994693880725075, "loss": 0.0108, "step": 334480 }, { "epoch": 0.87, "learning_rate": 0.00016994305059087926, "loss": 0.0106, "step": 334490 }, { "epoch": 0.87, "learning_rate": 0.00016993916237450777, "loss": 0.0195, "step": 334500 }, { "epoch": 0.87, "learning_rate": 0.00016993527415813634, "loss": 0.0179, "step": 334510 }, { "epoch": 0.87, "learning_rate": 0.00016993138594176488, "loss": 0.0149, "step": 334520 }, { "epoch": 0.87, "learning_rate": 0.0001699274977253934, "loss": 0.0128, "step": 334530 }, { "epoch": 0.87, "learning_rate": 0.00016992360950902194, "loss": 0.0127, "step": 334540 }, { "epoch": 0.87, "learning_rate": 0.00016991972129265048, "loss": 0.0146, "step": 334550 }, { "epoch": 0.87, "learning_rate": 0.00016991583307627902, "loss": 0.014, "step": 334560 }, { "epoch": 0.87, "learning_rate": 0.00016991194485990754, "loss": 0.016, "step": 334570 }, { "epoch": 0.87, "learning_rate": 0.00016990805664353608, "loss": 0.0115, "step": 334580 }, { "epoch": 0.87, "learning_rate": 0.00016990416842716462, "loss": 0.0148, "step": 334590 }, { "epoch": 0.87, "learning_rate": 0.00016990028021079316, "loss": 0.0139, "step": 334600 }, { "epoch": 0.87, "learning_rate": 0.00016989639199442168, "loss": 0.0129, "step": 334610 }, { "epoch": 0.87, "learning_rate": 0.00016989250377805022, "loss": 0.0167, "step": 334620 }, { "epoch": 0.87, "learning_rate": 0.0001698886155616788, "loss": 0.0154, "step": 334630 }, { "epoch": 0.87, "learning_rate": 0.0001698847273453073, "loss": 0.0113, "step": 334640 }, { "epoch": 0.87, "learning_rate": 0.00016988083912893582, "loss": 0.0175, "step": 334650 }, { "epoch": 0.87, "learning_rate": 0.00016987695091256436, "loss": 0.0112, "step": 334660 }, { "epoch": 0.87, "learning_rate": 0.00016987306269619293, "loss": 0.0154, "step": 334670 }, { "epoch": 0.87, "learning_rate": 0.00016986917447982144, "loss": 0.0136, "step": 334680 }, { "epoch": 0.87, "learning_rate": 0.00016986528626344998, "loss": 0.0128, "step": 334690 }, { "epoch": 0.87, "learning_rate": 0.0001698613980470785, "loss": 0.0126, "step": 334700 }, { "epoch": 0.87, "learning_rate": 0.00016985750983070704, "loss": 0.0154, "step": 334710 }, { "epoch": 0.87, "learning_rate": 0.00016985362161433558, "loss": 0.019, "step": 334720 }, { "epoch": 0.87, "learning_rate": 0.00016984973339796412, "loss": 0.0125, "step": 334730 }, { "epoch": 0.87, "learning_rate": 0.00016984584518159264, "loss": 0.0103, "step": 334740 }, { "epoch": 0.87, "learning_rate": 0.00016984195696522118, "loss": 0.0126, "step": 334750 }, { "epoch": 0.87, "learning_rate": 0.00016983806874884972, "loss": 0.014, "step": 334760 }, { "epoch": 0.87, "learning_rate": 0.00016983418053247826, "loss": 0.0183, "step": 334770 }, { "epoch": 0.87, "learning_rate": 0.00016983029231610678, "loss": 0.0165, "step": 334780 }, { "epoch": 0.87, "learning_rate": 0.00016982640409973532, "loss": 0.0127, "step": 334790 }, { "epoch": 0.87, "learning_rate": 0.00016982251588336386, "loss": 0.0123, "step": 334800 }, { "epoch": 0.87, "learning_rate": 0.0001698186276669924, "loss": 0.0142, "step": 334810 }, { "epoch": 0.87, "learning_rate": 0.00016981473945062092, "loss": 0.0123, "step": 334820 }, { "epoch": 0.87, "learning_rate": 0.00016981085123424946, "loss": 0.0141, "step": 334830 }, { "epoch": 0.87, "learning_rate": 0.00016980696301787803, "loss": 0.0122, "step": 334840 }, { "epoch": 0.87, "learning_rate": 0.00016980307480150654, "loss": 0.0134, "step": 334850 }, { "epoch": 0.87, "learning_rate": 0.00016979918658513508, "loss": 0.0135, "step": 334860 }, { "epoch": 0.87, "learning_rate": 0.0001697952983687636, "loss": 0.0117, "step": 334870 }, { "epoch": 0.87, "learning_rate": 0.00016979141015239217, "loss": 0.0146, "step": 334880 }, { "epoch": 0.87, "learning_rate": 0.00016978752193602068, "loss": 0.0121, "step": 334890 }, { "epoch": 0.87, "learning_rate": 0.00016978363371964922, "loss": 0.0152, "step": 334900 }, { "epoch": 0.87, "learning_rate": 0.00016977974550327774, "loss": 0.0138, "step": 334910 }, { "epoch": 0.87, "learning_rate": 0.0001697758572869063, "loss": 0.0119, "step": 334920 }, { "epoch": 0.87, "learning_rate": 0.00016977196907053482, "loss": 0.0113, "step": 334930 }, { "epoch": 0.87, "learning_rate": 0.00016976808085416336, "loss": 0.0137, "step": 334940 }, { "epoch": 0.87, "learning_rate": 0.00016976419263779188, "loss": 0.0122, "step": 334950 }, { "epoch": 0.87, "learning_rate": 0.00016976030442142042, "loss": 0.01, "step": 334960 }, { "epoch": 0.87, "learning_rate": 0.00016975641620504896, "loss": 0.0201, "step": 334970 }, { "epoch": 0.87, "learning_rate": 0.0001697525279886775, "loss": 0.0162, "step": 334980 }, { "epoch": 0.87, "learning_rate": 0.00016974863977230602, "loss": 0.0127, "step": 334990 }, { "epoch": 0.87, "learning_rate": 0.00016974475155593456, "loss": 0.0106, "step": 335000 }, { "epoch": 0.87, "eval_cer": 0.8817180823294437, "eval_loss": 0.009029078297317028, "eval_runtime": 107.7187, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 335000 }, { "epoch": 0.87, "learning_rate": 0.00016974086333956313, "loss": 0.0122, "step": 335010 }, { "epoch": 0.87, "learning_rate": 0.00016973697512319164, "loss": 0.0172, "step": 335020 }, { "epoch": 0.87, "learning_rate": 0.00016973308690682018, "loss": 0.0143, "step": 335030 }, { "epoch": 0.87, "learning_rate": 0.0001697291986904487, "loss": 0.014, "step": 335040 }, { "epoch": 0.87, "learning_rate": 0.00016972531047407727, "loss": 0.0146, "step": 335050 }, { "epoch": 0.87, "learning_rate": 0.00016972142225770578, "loss": 0.0117, "step": 335060 }, { "epoch": 0.87, "learning_rate": 0.00016971753404133432, "loss": 0.0148, "step": 335070 }, { "epoch": 0.87, "learning_rate": 0.00016971364582496284, "loss": 0.0178, "step": 335080 }, { "epoch": 0.87, "learning_rate": 0.0001697097576085914, "loss": 0.0139, "step": 335090 }, { "epoch": 0.87, "learning_rate": 0.00016970586939221992, "loss": 0.0149, "step": 335100 }, { "epoch": 0.87, "learning_rate": 0.00016970198117584846, "loss": 0.0109, "step": 335110 }, { "epoch": 0.87, "learning_rate": 0.00016969809295947698, "loss": 0.0137, "step": 335120 }, { "epoch": 0.87, "learning_rate": 0.00016969420474310555, "loss": 0.0112, "step": 335130 }, { "epoch": 0.87, "learning_rate": 0.00016969031652673406, "loss": 0.0111, "step": 335140 }, { "epoch": 0.87, "learning_rate": 0.0001696864283103626, "loss": 0.018, "step": 335150 }, { "epoch": 0.87, "learning_rate": 0.00016968254009399112, "loss": 0.0171, "step": 335160 }, { "epoch": 0.87, "learning_rate": 0.00016967865187761968, "loss": 0.0136, "step": 335170 }, { "epoch": 0.87, "learning_rate": 0.00016967476366124823, "loss": 0.0133, "step": 335180 }, { "epoch": 0.87, "learning_rate": 0.00016967087544487674, "loss": 0.0116, "step": 335190 }, { "epoch": 0.87, "learning_rate": 0.00016966698722850528, "loss": 0.0151, "step": 335200 }, { "epoch": 0.87, "learning_rate": 0.0001696630990121338, "loss": 0.0116, "step": 335210 }, { "epoch": 0.87, "learning_rate": 0.00016965921079576237, "loss": 0.0176, "step": 335220 }, { "epoch": 0.87, "learning_rate": 0.00016965532257939088, "loss": 0.016, "step": 335230 }, { "epoch": 0.87, "learning_rate": 0.00016965143436301942, "loss": 0.0141, "step": 335240 }, { "epoch": 0.87, "learning_rate": 0.00016964754614664794, "loss": 0.0115, "step": 335250 }, { "epoch": 0.87, "learning_rate": 0.0001696436579302765, "loss": 0.0154, "step": 335260 }, { "epoch": 0.87, "learning_rate": 0.00016963976971390502, "loss": 0.0137, "step": 335270 }, { "epoch": 0.87, "learning_rate": 0.00016963588149753356, "loss": 0.0129, "step": 335280 }, { "epoch": 0.87, "learning_rate": 0.00016963199328116208, "loss": 0.0148, "step": 335290 }, { "epoch": 0.87, "learning_rate": 0.00016962810506479064, "loss": 0.0131, "step": 335300 }, { "epoch": 0.87, "learning_rate": 0.00016962421684841916, "loss": 0.0106, "step": 335310 }, { "epoch": 0.87, "learning_rate": 0.0001696203286320477, "loss": 0.0152, "step": 335320 }, { "epoch": 0.87, "learning_rate": 0.00016961644041567622, "loss": 0.0147, "step": 335330 }, { "epoch": 0.87, "learning_rate": 0.00016961255219930478, "loss": 0.0137, "step": 335340 }, { "epoch": 0.87, "learning_rate": 0.00016960866398293333, "loss": 0.0093, "step": 335350 }, { "epoch": 0.87, "learning_rate": 0.00016960477576656184, "loss": 0.0126, "step": 335360 }, { "epoch": 0.87, "learning_rate": 0.00016960088755019035, "loss": 0.014, "step": 335370 }, { "epoch": 0.87, "learning_rate": 0.00016959699933381892, "loss": 0.0115, "step": 335380 }, { "epoch": 0.87, "learning_rate": 0.00016959311111744747, "loss": 0.0151, "step": 335390 }, { "epoch": 0.87, "learning_rate": 0.00016958922290107598, "loss": 0.0114, "step": 335400 }, { "epoch": 0.87, "learning_rate": 0.00016958533468470452, "loss": 0.0173, "step": 335410 }, { "epoch": 0.87, "learning_rate": 0.00016958144646833306, "loss": 0.0158, "step": 335420 }, { "epoch": 0.87, "learning_rate": 0.0001695775582519616, "loss": 0.0136, "step": 335430 }, { "epoch": 0.87, "learning_rate": 0.00016957367003559012, "loss": 0.014, "step": 335440 }, { "epoch": 0.87, "learning_rate": 0.00016956978181921866, "loss": 0.0158, "step": 335450 }, { "epoch": 0.87, "learning_rate": 0.00016956589360284718, "loss": 0.0112, "step": 335460 }, { "epoch": 0.87, "learning_rate": 0.00016956200538647574, "loss": 0.0131, "step": 335470 }, { "epoch": 0.87, "learning_rate": 0.00016955811717010426, "loss": 0.017, "step": 335480 }, { "epoch": 0.87, "learning_rate": 0.0001695542289537328, "loss": 0.0126, "step": 335490 }, { "epoch": 0.87, "learning_rate": 0.00016955034073736131, "loss": 0.013, "step": 335500 }, { "epoch": 0.87, "learning_rate": 0.00016954645252098988, "loss": 0.016, "step": 335510 }, { "epoch": 0.87, "learning_rate": 0.0001695425643046184, "loss": 0.0175, "step": 335520 }, { "epoch": 0.87, "learning_rate": 0.00016953867608824694, "loss": 0.0118, "step": 335530 }, { "epoch": 0.87, "learning_rate": 0.00016953478787187545, "loss": 0.0119, "step": 335540 }, { "epoch": 0.87, "learning_rate": 0.00016953089965550402, "loss": 0.0171, "step": 335550 }, { "epoch": 0.87, "learning_rate": 0.00016952701143913256, "loss": 0.0142, "step": 335560 }, { "epoch": 0.87, "learning_rate": 0.00016952312322276108, "loss": 0.0125, "step": 335570 }, { "epoch": 0.87, "learning_rate": 0.00016951923500638962, "loss": 0.0184, "step": 335580 }, { "epoch": 0.87, "learning_rate": 0.00016951534679001816, "loss": 0.0169, "step": 335590 }, { "epoch": 0.87, "learning_rate": 0.0001695114585736467, "loss": 0.0125, "step": 335600 }, { "epoch": 0.87, "learning_rate": 0.00016950757035727522, "loss": 0.0271, "step": 335610 }, { "epoch": 0.87, "learning_rate": 0.00016950368214090376, "loss": 0.0148, "step": 335620 }, { "epoch": 0.87, "learning_rate": 0.0001694997939245323, "loss": 0.0122, "step": 335630 }, { "epoch": 0.87, "learning_rate": 0.00016949590570816084, "loss": 0.0142, "step": 335640 }, { "epoch": 0.87, "learning_rate": 0.00016949201749178936, "loss": 0.0114, "step": 335650 }, { "epoch": 0.87, "learning_rate": 0.0001694881292754179, "loss": 0.0167, "step": 335660 }, { "epoch": 0.87, "learning_rate": 0.00016948424105904647, "loss": 0.0159, "step": 335670 }, { "epoch": 0.87, "learning_rate": 0.00016948035284267498, "loss": 0.0157, "step": 335680 }, { "epoch": 0.87, "learning_rate": 0.0001694764646263035, "loss": 0.0142, "step": 335690 }, { "epoch": 0.87, "learning_rate": 0.00016947257640993204, "loss": 0.0134, "step": 335700 }, { "epoch": 0.87, "learning_rate": 0.00016946868819356055, "loss": 0.0126, "step": 335710 }, { "epoch": 0.87, "learning_rate": 0.00016946479997718912, "loss": 0.0118, "step": 335720 }, { "epoch": 0.87, "learning_rate": 0.00016946091176081766, "loss": 0.0133, "step": 335730 }, { "epoch": 0.87, "learning_rate": 0.00016945702354444618, "loss": 0.0116, "step": 335740 }, { "epoch": 0.87, "learning_rate": 0.00016945313532807472, "loss": 0.0204, "step": 335750 }, { "epoch": 0.87, "learning_rate": 0.00016944924711170326, "loss": 0.0156, "step": 335760 }, { "epoch": 0.87, "learning_rate": 0.0001694453588953318, "loss": 0.0134, "step": 335770 }, { "epoch": 0.87, "learning_rate": 0.00016944147067896032, "loss": 0.0114, "step": 335780 }, { "epoch": 0.87, "learning_rate": 0.00016943758246258886, "loss": 0.0142, "step": 335790 }, { "epoch": 0.87, "learning_rate": 0.0001694336942462174, "loss": 0.0139, "step": 335800 }, { "epoch": 0.87, "learning_rate": 0.00016942980602984594, "loss": 0.0269, "step": 335810 }, { "epoch": 0.87, "learning_rate": 0.00016942591781347446, "loss": 0.0674, "step": 335820 }, { "epoch": 0.87, "learning_rate": 0.000169422029597103, "loss": 0.03, "step": 335830 }, { "epoch": 0.87, "learning_rate": 0.00016941814138073154, "loss": 0.0132, "step": 335840 }, { "epoch": 0.87, "learning_rate": 0.00016941425316436008, "loss": 0.0179, "step": 335850 }, { "epoch": 0.87, "learning_rate": 0.0001694103649479886, "loss": 0.0124, "step": 335860 }, { "epoch": 0.87, "learning_rate": 0.00016940647673161714, "loss": 0.015, "step": 335870 }, { "epoch": 0.87, "learning_rate": 0.0001694025885152457, "loss": 0.0158, "step": 335880 }, { "epoch": 0.87, "learning_rate": 0.00016939870029887422, "loss": 0.0123, "step": 335890 }, { "epoch": 0.87, "learning_rate": 0.00016939481208250276, "loss": 0.0197, "step": 335900 }, { "epoch": 0.87, "learning_rate": 0.00016939092386613128, "loss": 0.0125, "step": 335910 }, { "epoch": 0.87, "learning_rate": 0.00016938703564975985, "loss": 0.0161, "step": 335920 }, { "epoch": 0.87, "learning_rate": 0.00016938314743338836, "loss": 0.0158, "step": 335930 }, { "epoch": 0.87, "learning_rate": 0.0001693792592170169, "loss": 0.0125, "step": 335940 }, { "epoch": 0.87, "learning_rate": 0.00016937537100064542, "loss": 0.0094, "step": 335950 }, { "epoch": 0.87, "learning_rate": 0.00016937148278427396, "loss": 0.0152, "step": 335960 }, { "epoch": 0.87, "learning_rate": 0.0001693675945679025, "loss": 0.0121, "step": 335970 }, { "epoch": 0.87, "learning_rate": 0.00016936370635153104, "loss": 0.0127, "step": 335980 }, { "epoch": 0.87, "learning_rate": 0.00016935981813515956, "loss": 0.0159, "step": 335990 }, { "epoch": 0.87, "learning_rate": 0.0001693559299187881, "loss": 0.0134, "step": 336000 }, { "epoch": 0.87, "eval_cer": 0.8817334783357197, "eval_loss": 0.009199898689985275, "eval_runtime": 107.6047, "eval_samples_per_second": 18.587, "eval_steps_per_second": 4.647, "step": 336000 }, { "epoch": 0.87, "learning_rate": 0.00016935204170241664, "loss": 0.0142, "step": 336010 }, { "epoch": 0.87, "learning_rate": 0.00016934815348604518, "loss": 0.0123, "step": 336020 }, { "epoch": 0.87, "learning_rate": 0.0001693442652696737, "loss": 0.018, "step": 336030 }, { "epoch": 0.87, "learning_rate": 0.00016934037705330224, "loss": 0.0124, "step": 336040 }, { "epoch": 0.87, "learning_rate": 0.0001693364888369308, "loss": 0.0155, "step": 336050 }, { "epoch": 0.87, "learning_rate": 0.00016933260062055932, "loss": 0.0152, "step": 336060 }, { "epoch": 0.87, "learning_rate": 0.00016932871240418786, "loss": 0.0168, "step": 336070 }, { "epoch": 0.87, "learning_rate": 0.00016932482418781638, "loss": 0.0123, "step": 336080 }, { "epoch": 0.87, "learning_rate": 0.00016932093597144495, "loss": 0.0152, "step": 336090 }, { "epoch": 0.87, "learning_rate": 0.00016931704775507346, "loss": 0.0143, "step": 336100 }, { "epoch": 0.87, "learning_rate": 0.000169313159538702, "loss": 0.014, "step": 336110 }, { "epoch": 0.87, "learning_rate": 0.00016930927132233052, "loss": 0.0166, "step": 336120 }, { "epoch": 0.87, "learning_rate": 0.00016930538310595909, "loss": 0.0142, "step": 336130 }, { "epoch": 0.87, "learning_rate": 0.0001693014948895876, "loss": 0.0114, "step": 336140 }, { "epoch": 0.87, "learning_rate": 0.00016929760667321614, "loss": 0.0127, "step": 336150 }, { "epoch": 0.87, "learning_rate": 0.00016929371845684466, "loss": 0.0106, "step": 336160 }, { "epoch": 0.87, "learning_rate": 0.00016928983024047322, "loss": 0.0186, "step": 336170 }, { "epoch": 0.87, "learning_rate": 0.00016928594202410174, "loss": 0.0118, "step": 336180 }, { "epoch": 0.87, "learning_rate": 0.00016928205380773028, "loss": 0.0139, "step": 336190 }, { "epoch": 0.87, "learning_rate": 0.0001692781655913588, "loss": 0.0175, "step": 336200 }, { "epoch": 0.87, "learning_rate": 0.00016927427737498734, "loss": 0.0109, "step": 336210 }, { "epoch": 0.87, "learning_rate": 0.0001692703891586159, "loss": 0.014, "step": 336220 }, { "epoch": 0.87, "learning_rate": 0.00016926650094224442, "loss": 0.0124, "step": 336230 }, { "epoch": 0.87, "learning_rate": 0.00016926261272587294, "loss": 0.0119, "step": 336240 }, { "epoch": 0.87, "learning_rate": 0.00016925872450950148, "loss": 0.014, "step": 336250 }, { "epoch": 0.87, "learning_rate": 0.00016925483629313005, "loss": 0.0122, "step": 336260 }, { "epoch": 0.87, "learning_rate": 0.00016925094807675856, "loss": 0.0126, "step": 336270 }, { "epoch": 0.87, "learning_rate": 0.0001692470598603871, "loss": 0.0124, "step": 336280 }, { "epoch": 0.87, "learning_rate": 0.00016924317164401562, "loss": 0.015, "step": 336290 }, { "epoch": 0.87, "learning_rate": 0.00016923928342764418, "loss": 0.0099, "step": 336300 }, { "epoch": 0.87, "learning_rate": 0.0001692353952112727, "loss": 0.0144, "step": 336310 }, { "epoch": 0.87, "learning_rate": 0.00016923150699490124, "loss": 0.0116, "step": 336320 }, { "epoch": 0.87, "learning_rate": 0.00016922761877852976, "loss": 0.0138, "step": 336330 }, { "epoch": 0.87, "learning_rate": 0.00016922373056215832, "loss": 0.0175, "step": 336340 }, { "epoch": 0.87, "learning_rate": 0.00016921984234578684, "loss": 0.0147, "step": 336350 }, { "epoch": 0.87, "learning_rate": 0.00016921595412941538, "loss": 0.0128, "step": 336360 }, { "epoch": 0.87, "learning_rate": 0.0001692120659130439, "loss": 0.0141, "step": 336370 }, { "epoch": 0.87, "learning_rate": 0.00016920817769667246, "loss": 0.0129, "step": 336380 }, { "epoch": 0.87, "learning_rate": 0.00016920428948030098, "loss": 0.0127, "step": 336390 }, { "epoch": 0.87, "learning_rate": 0.00016920040126392952, "loss": 0.0126, "step": 336400 }, { "epoch": 0.87, "learning_rate": 0.00016919651304755803, "loss": 0.0174, "step": 336410 }, { "epoch": 0.87, "learning_rate": 0.0001691926248311866, "loss": 0.0125, "step": 336420 }, { "epoch": 0.87, "learning_rate": 0.00016918873661481514, "loss": 0.0125, "step": 336430 }, { "epoch": 0.87, "learning_rate": 0.00016918484839844366, "loss": 0.0119, "step": 336440 }, { "epoch": 0.87, "learning_rate": 0.0001691809601820722, "loss": 0.0158, "step": 336450 }, { "epoch": 0.87, "learning_rate": 0.00016917707196570072, "loss": 0.0149, "step": 336460 }, { "epoch": 0.87, "learning_rate": 0.00016917318374932928, "loss": 0.0139, "step": 336470 }, { "epoch": 0.87, "learning_rate": 0.0001691692955329578, "loss": 0.0187, "step": 336480 }, { "epoch": 0.87, "learning_rate": 0.00016916540731658634, "loss": 0.014, "step": 336490 }, { "epoch": 0.87, "learning_rate": 0.00016916151910021486, "loss": 0.0126, "step": 336500 }, { "epoch": 0.87, "learning_rate": 0.00016915763088384342, "loss": 0.0191, "step": 336510 }, { "epoch": 0.87, "learning_rate": 0.00016915374266747194, "loss": 0.0118, "step": 336520 }, { "epoch": 0.87, "learning_rate": 0.00016914985445110048, "loss": 0.0095, "step": 336530 }, { "epoch": 0.87, "learning_rate": 0.000169145966234729, "loss": 0.015, "step": 336540 }, { "epoch": 0.87, "learning_rate": 0.00016914207801835756, "loss": 0.0162, "step": 336550 }, { "epoch": 0.87, "learning_rate": 0.00016913818980198608, "loss": 0.0183, "step": 336560 }, { "epoch": 0.87, "learning_rate": 0.00016913430158561462, "loss": 0.0146, "step": 336570 }, { "epoch": 0.87, "learning_rate": 0.00016913041336924313, "loss": 0.0143, "step": 336580 }, { "epoch": 0.87, "learning_rate": 0.0001691265251528717, "loss": 0.0137, "step": 336590 }, { "epoch": 0.87, "learning_rate": 0.00016912263693650024, "loss": 0.0157, "step": 336600 }, { "epoch": 0.87, "learning_rate": 0.00016911874872012876, "loss": 0.0289, "step": 336610 }, { "epoch": 0.87, "learning_rate": 0.0001691148605037573, "loss": 0.0142, "step": 336620 }, { "epoch": 0.87, "learning_rate": 0.00016911097228738584, "loss": 0.0146, "step": 336630 }, { "epoch": 0.87, "learning_rate": 0.00016910708407101438, "loss": 0.0155, "step": 336640 }, { "epoch": 0.87, "learning_rate": 0.0001691031958546429, "loss": 0.0117, "step": 336650 }, { "epoch": 0.87, "learning_rate": 0.00016909930763827144, "loss": 0.0148, "step": 336660 }, { "epoch": 0.87, "learning_rate": 0.00016909541942189998, "loss": 0.0117, "step": 336670 }, { "epoch": 0.87, "learning_rate": 0.00016909153120552852, "loss": 0.0151, "step": 336680 }, { "epoch": 0.87, "learning_rate": 0.00016908764298915704, "loss": 0.0113, "step": 336690 }, { "epoch": 0.87, "learning_rate": 0.00016908375477278558, "loss": 0.0104, "step": 336700 }, { "epoch": 0.87, "learning_rate": 0.0001690798665564141, "loss": 0.0133, "step": 336710 }, { "epoch": 0.87, "learning_rate": 0.00016907597834004266, "loss": 0.0142, "step": 336720 }, { "epoch": 0.87, "learning_rate": 0.00016907209012367118, "loss": 0.0124, "step": 336730 }, { "epoch": 0.87, "learning_rate": 0.00016906820190729972, "loss": 0.0141, "step": 336740 }, { "epoch": 0.87, "learning_rate": 0.00016906431369092823, "loss": 0.0134, "step": 336750 }, { "epoch": 0.87, "learning_rate": 0.0001690604254745568, "loss": 0.0144, "step": 336760 }, { "epoch": 0.87, "learning_rate": 0.00016905653725818534, "loss": 0.0156, "step": 336770 }, { "epoch": 0.87, "learning_rate": 0.00016905264904181386, "loss": 0.0123, "step": 336780 }, { "epoch": 0.87, "learning_rate": 0.0001690487608254424, "loss": 0.0115, "step": 336790 }, { "epoch": 0.87, "learning_rate": 0.00016904487260907094, "loss": 0.0143, "step": 336800 }, { "epoch": 0.87, "learning_rate": 0.00016904098439269948, "loss": 0.0121, "step": 336810 }, { "epoch": 0.87, "learning_rate": 0.000169037096176328, "loss": 0.017, "step": 336820 }, { "epoch": 0.87, "learning_rate": 0.00016903320795995654, "loss": 0.0148, "step": 336830 }, { "epoch": 0.87, "learning_rate": 0.00016902931974358508, "loss": 0.0157, "step": 336840 }, { "epoch": 0.87, "learning_rate": 0.00016902543152721362, "loss": 0.0113, "step": 336850 }, { "epoch": 0.87, "learning_rate": 0.00016902154331084214, "loss": 0.0103, "step": 336860 }, { "epoch": 0.87, "learning_rate": 0.00016901765509447068, "loss": 0.0145, "step": 336870 }, { "epoch": 0.87, "learning_rate": 0.00016901376687809922, "loss": 0.0136, "step": 336880 }, { "epoch": 0.87, "learning_rate": 0.00016900987866172776, "loss": 0.0149, "step": 336890 }, { "epoch": 0.87, "learning_rate": 0.00016900599044535628, "loss": 0.0147, "step": 336900 }, { "epoch": 0.87, "learning_rate": 0.00016900210222898482, "loss": 0.0129, "step": 336910 }, { "epoch": 0.87, "learning_rate": 0.0001689982140126134, "loss": 0.0135, "step": 336920 }, { "epoch": 0.87, "learning_rate": 0.0001689943257962419, "loss": 0.013, "step": 336930 }, { "epoch": 0.87, "learning_rate": 0.00016899043757987044, "loss": 0.0145, "step": 336940 }, { "epoch": 0.87, "learning_rate": 0.00016898654936349896, "loss": 0.013, "step": 336950 }, { "epoch": 0.87, "learning_rate": 0.00016898266114712747, "loss": 0.0149, "step": 336960 }, { "epoch": 0.87, "learning_rate": 0.00016897877293075604, "loss": 0.0118, "step": 336970 }, { "epoch": 0.87, "learning_rate": 0.00016897488471438458, "loss": 0.0139, "step": 336980 }, { "epoch": 0.87, "learning_rate": 0.0001689709964980131, "loss": 0.0136, "step": 336990 }, { "epoch": 0.87, "learning_rate": 0.00016896710828164164, "loss": 0.0113, "step": 337000 }, { "epoch": 0.87, "eval_cer": 0.8817166826925096, "eval_loss": 0.008749060332775116, "eval_runtime": 107.716, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 337000 }, { "epoch": 0.87, "learning_rate": 0.00016896322006527018, "loss": 0.0128, "step": 337010 }, { "epoch": 0.87, "learning_rate": 0.00016895933184889872, "loss": 0.0141, "step": 337020 }, { "epoch": 0.87, "learning_rate": 0.00016895544363252724, "loss": 0.0114, "step": 337030 }, { "epoch": 0.87, "learning_rate": 0.00016895155541615578, "loss": 0.0135, "step": 337040 }, { "epoch": 0.87, "learning_rate": 0.00016894766719978432, "loss": 0.0151, "step": 337050 }, { "epoch": 0.87, "learning_rate": 0.00016894377898341286, "loss": 0.0122, "step": 337060 }, { "epoch": 0.87, "learning_rate": 0.00016893989076704138, "loss": 0.014, "step": 337070 }, { "epoch": 0.87, "learning_rate": 0.00016893600255066992, "loss": 0.0106, "step": 337080 }, { "epoch": 0.87, "learning_rate": 0.00016893211433429849, "loss": 0.0099, "step": 337090 }, { "epoch": 0.87, "learning_rate": 0.000168928226117927, "loss": 0.0103, "step": 337100 }, { "epoch": 0.87, "learning_rate": 0.00016892433790155552, "loss": 0.0129, "step": 337110 }, { "epoch": 0.87, "learning_rate": 0.00016892044968518406, "loss": 0.0112, "step": 337120 }, { "epoch": 0.87, "learning_rate": 0.00016891656146881263, "loss": 0.0147, "step": 337130 }, { "epoch": 0.87, "learning_rate": 0.00016891267325244114, "loss": 0.0141, "step": 337140 }, { "epoch": 0.87, "learning_rate": 0.00016890878503606968, "loss": 0.0125, "step": 337150 }, { "epoch": 0.87, "learning_rate": 0.0001689048968196982, "loss": 0.0137, "step": 337160 }, { "epoch": 0.87, "learning_rate": 0.00016890100860332677, "loss": 0.0105, "step": 337170 }, { "epoch": 0.87, "learning_rate": 0.00016889712038695528, "loss": 0.0139, "step": 337180 }, { "epoch": 0.87, "learning_rate": 0.00016889323217058382, "loss": 0.0141, "step": 337190 }, { "epoch": 0.87, "learning_rate": 0.00016888934395421234, "loss": 0.0123, "step": 337200 }, { "epoch": 0.87, "learning_rate": 0.00016888545573784088, "loss": 0.0134, "step": 337210 }, { "epoch": 0.87, "learning_rate": 0.00016888156752146942, "loss": 0.0149, "step": 337220 }, { "epoch": 0.87, "learning_rate": 0.00016887767930509796, "loss": 0.0142, "step": 337230 }, { "epoch": 0.87, "learning_rate": 0.00016887379108872648, "loss": 0.0121, "step": 337240 }, { "epoch": 0.87, "learning_rate": 0.00016886990287235502, "loss": 0.0133, "step": 337250 }, { "epoch": 0.87, "learning_rate": 0.00016886601465598359, "loss": 0.0126, "step": 337260 }, { "epoch": 0.87, "learning_rate": 0.0001688621264396121, "loss": 0.0168, "step": 337270 }, { "epoch": 0.87, "learning_rate": 0.00016885823822324061, "loss": 0.0154, "step": 337280 }, { "epoch": 0.87, "learning_rate": 0.00016885435000686916, "loss": 0.0134, "step": 337290 }, { "epoch": 0.87, "learning_rate": 0.00016885046179049773, "loss": 0.0104, "step": 337300 }, { "epoch": 0.87, "learning_rate": 0.00016884657357412624, "loss": 0.0119, "step": 337310 }, { "epoch": 0.87, "learning_rate": 0.00016884268535775478, "loss": 0.0167, "step": 337320 }, { "epoch": 0.87, "learning_rate": 0.0001688387971413833, "loss": 0.0156, "step": 337330 }, { "epoch": 0.87, "learning_rate": 0.00016883490892501186, "loss": 0.0113, "step": 337340 }, { "epoch": 0.87, "learning_rate": 0.00016883102070864038, "loss": 0.0109, "step": 337350 }, { "epoch": 0.87, "learning_rate": 0.00016882713249226892, "loss": 0.0122, "step": 337360 }, { "epoch": 0.87, "learning_rate": 0.00016882324427589744, "loss": 0.0105, "step": 337370 }, { "epoch": 0.87, "learning_rate": 0.000168819356059526, "loss": 0.0139, "step": 337380 }, { "epoch": 0.87, "learning_rate": 0.00016881546784315452, "loss": 0.0128, "step": 337390 }, { "epoch": 0.87, "learning_rate": 0.00016881157962678306, "loss": 0.0147, "step": 337400 }, { "epoch": 0.87, "learning_rate": 0.00016880769141041157, "loss": 0.0135, "step": 337410 }, { "epoch": 0.87, "learning_rate": 0.00016880380319404014, "loss": 0.012, "step": 337420 }, { "epoch": 0.87, "learning_rate": 0.00016879991497766866, "loss": 0.0123, "step": 337430 }, { "epoch": 0.87, "learning_rate": 0.0001687960267612972, "loss": 0.0123, "step": 337440 }, { "epoch": 0.87, "learning_rate": 0.00016879213854492571, "loss": 0.0133, "step": 337450 }, { "epoch": 0.87, "learning_rate": 0.00016878825032855426, "loss": 0.0127, "step": 337460 }, { "epoch": 0.87, "learning_rate": 0.00016878436211218282, "loss": 0.0116, "step": 337470 }, { "epoch": 0.87, "learning_rate": 0.00016878047389581134, "loss": 0.0157, "step": 337480 }, { "epoch": 0.87, "learning_rate": 0.00016877658567943988, "loss": 0.0121, "step": 337490 }, { "epoch": 0.87, "learning_rate": 0.0001687726974630684, "loss": 0.0178, "step": 337500 }, { "epoch": 0.87, "learning_rate": 0.00016876880924669696, "loss": 0.0099, "step": 337510 }, { "epoch": 0.87, "learning_rate": 0.00016876492103032548, "loss": 0.012, "step": 337520 }, { "epoch": 0.87, "learning_rate": 0.00016876103281395402, "loss": 0.0188, "step": 337530 }, { "epoch": 0.87, "learning_rate": 0.00016875714459758253, "loss": 0.0174, "step": 337540 }, { "epoch": 0.87, "learning_rate": 0.0001687532563812111, "loss": 0.0129, "step": 337550 }, { "epoch": 0.88, "learning_rate": 0.00016874936816483962, "loss": 0.0254, "step": 337560 }, { "epoch": 0.88, "learning_rate": 0.00016874547994846816, "loss": 0.0116, "step": 337570 }, { "epoch": 0.88, "learning_rate": 0.00016874159173209667, "loss": 0.0124, "step": 337580 }, { "epoch": 0.88, "learning_rate": 0.00016873770351572524, "loss": 0.0121, "step": 337590 }, { "epoch": 0.88, "learning_rate": 0.00016873381529935376, "loss": 0.0141, "step": 337600 }, { "epoch": 0.88, "learning_rate": 0.0001687299270829823, "loss": 0.0132, "step": 337610 }, { "epoch": 0.88, "learning_rate": 0.00016872603886661081, "loss": 0.0148, "step": 337620 }, { "epoch": 0.88, "learning_rate": 0.00016872215065023938, "loss": 0.0093, "step": 337630 }, { "epoch": 0.88, "learning_rate": 0.00016871826243386792, "loss": 0.0147, "step": 337640 }, { "epoch": 0.88, "learning_rate": 0.00016871437421749644, "loss": 0.0124, "step": 337650 }, { "epoch": 0.88, "learning_rate": 0.00016871048600112498, "loss": 0.0108, "step": 337660 }, { "epoch": 0.88, "learning_rate": 0.00016870659778475352, "loss": 0.0128, "step": 337670 }, { "epoch": 0.88, "learning_rate": 0.00016870270956838206, "loss": 0.0128, "step": 337680 }, { "epoch": 0.88, "learning_rate": 0.00016869882135201058, "loss": 0.0141, "step": 337690 }, { "epoch": 0.88, "learning_rate": 0.00016869493313563912, "loss": 0.0128, "step": 337700 }, { "epoch": 0.88, "learning_rate": 0.00016869104491926763, "loss": 0.0115, "step": 337710 }, { "epoch": 0.88, "learning_rate": 0.0001686871567028962, "loss": 0.0115, "step": 337720 }, { "epoch": 0.88, "learning_rate": 0.00016868326848652472, "loss": 0.012, "step": 337730 }, { "epoch": 0.88, "learning_rate": 0.00016867938027015326, "loss": 0.0118, "step": 337740 }, { "epoch": 0.88, "learning_rate": 0.00016867549205378177, "loss": 0.0113, "step": 337750 }, { "epoch": 0.88, "learning_rate": 0.00016867160383741034, "loss": 0.0128, "step": 337760 }, { "epoch": 0.88, "learning_rate": 0.00016866771562103886, "loss": 0.0105, "step": 337770 }, { "epoch": 0.88, "learning_rate": 0.0001686638274046674, "loss": 0.015, "step": 337780 }, { "epoch": 0.88, "learning_rate": 0.0001686599391882959, "loss": 0.0137, "step": 337790 }, { "epoch": 0.88, "learning_rate": 0.00016865605097192448, "loss": 0.0147, "step": 337800 }, { "epoch": 0.88, "learning_rate": 0.00016865216275555302, "loss": 0.0119, "step": 337810 }, { "epoch": 0.88, "learning_rate": 0.00016864827453918154, "loss": 0.0132, "step": 337820 }, { "epoch": 0.88, "learning_rate": 0.00016864438632281005, "loss": 0.0195, "step": 337830 }, { "epoch": 0.88, "learning_rate": 0.00016864049810643862, "loss": 0.0134, "step": 337840 }, { "epoch": 0.88, "learning_rate": 0.00016863660989006716, "loss": 0.0162, "step": 337850 }, { "epoch": 0.88, "learning_rate": 0.00016863272167369568, "loss": 0.0128, "step": 337860 }, { "epoch": 0.88, "learning_rate": 0.00016862883345732422, "loss": 0.0129, "step": 337870 }, { "epoch": 0.88, "learning_rate": 0.00016862494524095276, "loss": 0.0143, "step": 337880 }, { "epoch": 0.88, "learning_rate": 0.0001686210570245813, "loss": 0.0091, "step": 337890 }, { "epoch": 0.88, "learning_rate": 0.00016861716880820982, "loss": 0.0391, "step": 337900 }, { "epoch": 0.88, "learning_rate": 0.00016861328059183836, "loss": 0.0178, "step": 337910 }, { "epoch": 0.88, "learning_rate": 0.0001686093923754669, "loss": 0.0135, "step": 337920 }, { "epoch": 0.88, "learning_rate": 0.00016860550415909544, "loss": 0.0155, "step": 337930 }, { "epoch": 0.88, "learning_rate": 0.00016860161594272396, "loss": 0.0129, "step": 337940 }, { "epoch": 0.88, "learning_rate": 0.0001685977277263525, "loss": 0.013, "step": 337950 }, { "epoch": 0.88, "learning_rate": 0.000168593839509981, "loss": 0.0118, "step": 337960 }, { "epoch": 0.88, "learning_rate": 0.00016858995129360958, "loss": 0.0176, "step": 337970 }, { "epoch": 0.88, "learning_rate": 0.0001685860630772381, "loss": 0.0116, "step": 337980 }, { "epoch": 0.88, "learning_rate": 0.00016858217486086664, "loss": 0.0145, "step": 337990 }, { "epoch": 0.88, "learning_rate": 0.00016857828664449515, "loss": 0.0145, "step": 338000 }, { "epoch": 0.88, "eval_cer": 0.8817600714374692, "eval_loss": 0.00871712900698185, "eval_runtime": 107.6623, "eval_samples_per_second": 18.577, "eval_steps_per_second": 4.644, "step": 338000 }, { "epoch": 0.88, "learning_rate": 0.00016857439842812372, "loss": 0.0126, "step": 338010 }, { "epoch": 0.88, "learning_rate": 0.00016857051021175226, "loss": 0.0117, "step": 338020 }, { "epoch": 0.88, "learning_rate": 0.00016856662199538078, "loss": 0.0143, "step": 338030 }, { "epoch": 0.88, "learning_rate": 0.00016856273377900932, "loss": 0.0136, "step": 338040 }, { "epoch": 0.88, "learning_rate": 0.00016855884556263786, "loss": 0.0121, "step": 338050 }, { "epoch": 0.88, "learning_rate": 0.0001685549573462664, "loss": 0.0123, "step": 338060 }, { "epoch": 0.88, "learning_rate": 0.00016855106912989492, "loss": 0.0137, "step": 338070 }, { "epoch": 0.88, "learning_rate": 0.00016854718091352346, "loss": 0.0165, "step": 338080 }, { "epoch": 0.88, "learning_rate": 0.000168543292697152, "loss": 0.0132, "step": 338090 }, { "epoch": 0.88, "learning_rate": 0.00016853940448078054, "loss": 0.0137, "step": 338100 }, { "epoch": 0.88, "learning_rate": 0.00016853551626440906, "loss": 0.0127, "step": 338110 }, { "epoch": 0.88, "learning_rate": 0.0001685316280480376, "loss": 0.0104, "step": 338120 }, { "epoch": 0.88, "learning_rate": 0.00016852773983166617, "loss": 0.0123, "step": 338130 }, { "epoch": 0.88, "learning_rate": 0.00016852385161529468, "loss": 0.0105, "step": 338140 }, { "epoch": 0.88, "learning_rate": 0.0001685199633989232, "loss": 0.0148, "step": 338150 }, { "epoch": 0.88, "learning_rate": 0.00016851607518255174, "loss": 0.0122, "step": 338160 }, { "epoch": 0.88, "learning_rate": 0.00016851218696618025, "loss": 0.0113, "step": 338170 }, { "epoch": 0.88, "learning_rate": 0.00016850829874980882, "loss": 0.0119, "step": 338180 }, { "epoch": 0.88, "learning_rate": 0.00016850441053343736, "loss": 0.0136, "step": 338190 }, { "epoch": 0.88, "learning_rate": 0.00016850052231706588, "loss": 0.0108, "step": 338200 }, { "epoch": 0.88, "learning_rate": 0.00016849663410069442, "loss": 0.0174, "step": 338210 }, { "epoch": 0.88, "learning_rate": 0.00016849274588432296, "loss": 0.0125, "step": 338220 }, { "epoch": 0.88, "learning_rate": 0.0001684888576679515, "loss": 0.0109, "step": 338230 }, { "epoch": 0.88, "learning_rate": 0.00016848496945158002, "loss": 0.0103, "step": 338240 }, { "epoch": 0.88, "learning_rate": 0.00016848108123520856, "loss": 0.0116, "step": 338250 }, { "epoch": 0.88, "learning_rate": 0.0001684771930188371, "loss": 0.0112, "step": 338260 }, { "epoch": 0.88, "learning_rate": 0.00016847330480246564, "loss": 0.0156, "step": 338270 }, { "epoch": 0.88, "learning_rate": 0.00016846941658609416, "loss": 0.0199, "step": 338280 }, { "epoch": 0.88, "learning_rate": 0.0001684655283697227, "loss": 0.0133, "step": 338290 }, { "epoch": 0.88, "learning_rate": 0.00016846164015335124, "loss": 0.0134, "step": 338300 }, { "epoch": 0.88, "learning_rate": 0.00016845775193697978, "loss": 0.0154, "step": 338310 }, { "epoch": 0.88, "learning_rate": 0.0001684538637206083, "loss": 0.0149, "step": 338320 }, { "epoch": 0.88, "learning_rate": 0.00016844997550423684, "loss": 0.0161, "step": 338330 }, { "epoch": 0.88, "learning_rate": 0.0001684460872878654, "loss": 0.0123, "step": 338340 }, { "epoch": 0.88, "learning_rate": 0.00016844219907149392, "loss": 0.0175, "step": 338350 }, { "epoch": 0.88, "learning_rate": 0.00016843831085512246, "loss": 0.0191, "step": 338360 }, { "epoch": 0.88, "learning_rate": 0.00016843442263875098, "loss": 0.0143, "step": 338370 }, { "epoch": 0.88, "learning_rate": 0.00016843053442237954, "loss": 0.0113, "step": 338380 }, { "epoch": 0.88, "learning_rate": 0.00016842664620600806, "loss": 0.0159, "step": 338390 }, { "epoch": 0.88, "learning_rate": 0.0001684227579896366, "loss": 0.0132, "step": 338400 }, { "epoch": 0.88, "learning_rate": 0.00016841886977326512, "loss": 0.0114, "step": 338410 }, { "epoch": 0.88, "learning_rate": 0.00016841498155689366, "loss": 0.0134, "step": 338420 }, { "epoch": 0.88, "learning_rate": 0.0001684110933405222, "loss": 0.0244, "step": 338430 }, { "epoch": 0.88, "learning_rate": 0.00016840720512415074, "loss": 0.0144, "step": 338440 }, { "epoch": 0.88, "learning_rate": 0.00016840331690777925, "loss": 0.0116, "step": 338450 }, { "epoch": 0.88, "learning_rate": 0.0001683994286914078, "loss": 0.0403, "step": 338460 }, { "epoch": 0.88, "learning_rate": 0.00016839554047503634, "loss": 0.0135, "step": 338470 }, { "epoch": 0.88, "learning_rate": 0.00016839165225866488, "loss": 0.0094, "step": 338480 }, { "epoch": 0.88, "learning_rate": 0.0001683877640422934, "loss": 0.0159, "step": 338490 }, { "epoch": 0.88, "learning_rate": 0.00016838387582592194, "loss": 0.0123, "step": 338500 }, { "epoch": 0.88, "learning_rate": 0.0001683799876095505, "loss": 0.0136, "step": 338510 }, { "epoch": 0.88, "learning_rate": 0.00016837609939317902, "loss": 0.0154, "step": 338520 }, { "epoch": 0.88, "learning_rate": 0.00016837221117680756, "loss": 0.0108, "step": 338530 }, { "epoch": 0.88, "learning_rate": 0.00016836832296043608, "loss": 0.0128, "step": 338540 }, { "epoch": 0.88, "learning_rate": 0.00016836443474406464, "loss": 0.0156, "step": 338550 }, { "epoch": 0.88, "learning_rate": 0.00016836054652769316, "loss": 0.0102, "step": 338560 }, { "epoch": 0.88, "learning_rate": 0.0001683566583113217, "loss": 0.0188, "step": 338570 }, { "epoch": 0.88, "learning_rate": 0.00016835277009495021, "loss": 0.0097, "step": 338580 }, { "epoch": 0.88, "learning_rate": 0.00016834888187857878, "loss": 0.0168, "step": 338590 }, { "epoch": 0.88, "learning_rate": 0.0001683449936622073, "loss": 0.0142, "step": 338600 }, { "epoch": 0.88, "learning_rate": 0.00016834110544583584, "loss": 0.01, "step": 338610 }, { "epoch": 0.88, "learning_rate": 0.00016833721722946435, "loss": 0.0145, "step": 338620 }, { "epoch": 0.88, "learning_rate": 0.00016833332901309292, "loss": 0.0147, "step": 338630 }, { "epoch": 0.88, "learning_rate": 0.00016832944079672144, "loss": 0.014, "step": 338640 }, { "epoch": 0.88, "learning_rate": 0.00016832555258034998, "loss": 0.015, "step": 338650 }, { "epoch": 0.88, "learning_rate": 0.0001683216643639785, "loss": 0.0115, "step": 338660 }, { "epoch": 0.88, "learning_rate": 0.00016831777614760704, "loss": 0.0112, "step": 338670 }, { "epoch": 0.88, "learning_rate": 0.0001683138879312356, "loss": 0.0134, "step": 338680 }, { "epoch": 0.88, "learning_rate": 0.00016830999971486412, "loss": 0.0139, "step": 338690 }, { "epoch": 0.88, "learning_rate": 0.00016830611149849263, "loss": 0.0137, "step": 338700 }, { "epoch": 0.88, "learning_rate": 0.00016830222328212117, "loss": 0.0137, "step": 338710 }, { "epoch": 0.88, "learning_rate": 0.00016829833506574974, "loss": 0.0138, "step": 338720 }, { "epoch": 0.88, "learning_rate": 0.00016829444684937826, "loss": 0.0158, "step": 338730 }, { "epoch": 0.88, "learning_rate": 0.0001682905586330068, "loss": 0.0127, "step": 338740 }, { "epoch": 0.88, "learning_rate": 0.00016828667041663531, "loss": 0.0173, "step": 338750 }, { "epoch": 0.88, "learning_rate": 0.00016828278220026388, "loss": 0.0105, "step": 338760 }, { "epoch": 0.88, "learning_rate": 0.0001682788939838924, "loss": 0.0141, "step": 338770 }, { "epoch": 0.88, "learning_rate": 0.00016827500576752094, "loss": 0.013, "step": 338780 }, { "epoch": 0.88, "learning_rate": 0.00016827111755114945, "loss": 0.0128, "step": 338790 }, { "epoch": 0.88, "learning_rate": 0.00016826722933477802, "loss": 0.0158, "step": 338800 }, { "epoch": 0.88, "learning_rate": 0.00016826334111840654, "loss": 0.0131, "step": 338810 }, { "epoch": 0.88, "learning_rate": 0.00016825945290203508, "loss": 0.0111, "step": 338820 }, { "epoch": 0.88, "learning_rate": 0.0001682555646856636, "loss": 0.0155, "step": 338830 }, { "epoch": 0.88, "learning_rate": 0.00016825167646929216, "loss": 0.0162, "step": 338840 }, { "epoch": 0.88, "learning_rate": 0.0001682477882529207, "loss": 0.0136, "step": 338850 }, { "epoch": 0.88, "learning_rate": 0.00016824390003654922, "loss": 0.0141, "step": 338860 }, { "epoch": 0.88, "learning_rate": 0.00016824001182017773, "loss": 0.0158, "step": 338870 }, { "epoch": 0.88, "learning_rate": 0.0001682361236038063, "loss": 0.0141, "step": 338880 }, { "epoch": 0.88, "learning_rate": 0.00016823223538743484, "loss": 0.0138, "step": 338890 }, { "epoch": 0.88, "learning_rate": 0.00016822834717106336, "loss": 0.0143, "step": 338900 }, { "epoch": 0.88, "learning_rate": 0.0001682244589546919, "loss": 0.0147, "step": 338910 }, { "epoch": 0.88, "learning_rate": 0.0001682205707383204, "loss": 0.0146, "step": 338920 }, { "epoch": 0.88, "learning_rate": 0.00016821668252194898, "loss": 0.0159, "step": 338930 }, { "epoch": 0.88, "learning_rate": 0.0001682127943055775, "loss": 0.0146, "step": 338940 }, { "epoch": 0.88, "learning_rate": 0.00016820890608920604, "loss": 0.0192, "step": 338950 }, { "epoch": 0.88, "learning_rate": 0.00016820501787283455, "loss": 0.0107, "step": 338960 }, { "epoch": 0.88, "learning_rate": 0.00016820112965646312, "loss": 0.0151, "step": 338970 }, { "epoch": 0.88, "learning_rate": 0.00016819724144009164, "loss": 0.0132, "step": 338980 }, { "epoch": 0.88, "learning_rate": 0.00016819335322372018, "loss": 0.0148, "step": 338990 }, { "epoch": 0.88, "learning_rate": 0.0001681894650073487, "loss": 0.0153, "step": 339000 }, { "epoch": 0.88, "eval_cer": 0.8817222812402463, "eval_loss": 0.008869285695254803, "eval_runtime": 107.8634, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 339000 }, { "epoch": 0.88, "learning_rate": 0.00016818557679097726, "loss": 0.0173, "step": 339010 }, { "epoch": 0.88, "learning_rate": 0.00016818168857460578, "loss": 0.0122, "step": 339020 }, { "epoch": 0.88, "learning_rate": 0.00016817780035823432, "loss": 0.0158, "step": 339030 }, { "epoch": 0.88, "learning_rate": 0.00016817391214186283, "loss": 0.0123, "step": 339040 }, { "epoch": 0.88, "learning_rate": 0.0001681700239254914, "loss": 0.015, "step": 339050 }, { "epoch": 0.88, "learning_rate": 0.00016816613570911994, "loss": 0.0122, "step": 339060 }, { "epoch": 0.88, "learning_rate": 0.00016816224749274846, "loss": 0.0133, "step": 339070 }, { "epoch": 0.88, "learning_rate": 0.000168158359276377, "loss": 0.012, "step": 339080 }, { "epoch": 0.88, "learning_rate": 0.00016815447106000554, "loss": 0.0116, "step": 339090 }, { "epoch": 0.88, "learning_rate": 0.00016815058284363408, "loss": 0.0104, "step": 339100 }, { "epoch": 0.88, "learning_rate": 0.0001681466946272626, "loss": 0.0137, "step": 339110 }, { "epoch": 0.88, "learning_rate": 0.00016814280641089114, "loss": 0.0111, "step": 339120 }, { "epoch": 0.88, "learning_rate": 0.00016813891819451968, "loss": 0.0151, "step": 339130 }, { "epoch": 0.88, "learning_rate": 0.00016813502997814822, "loss": 0.0188, "step": 339140 }, { "epoch": 0.88, "learning_rate": 0.00016813114176177674, "loss": 0.0175, "step": 339150 }, { "epoch": 0.88, "learning_rate": 0.00016812725354540528, "loss": 0.011, "step": 339160 }, { "epoch": 0.88, "learning_rate": 0.0001681233653290338, "loss": 0.0112, "step": 339170 }, { "epoch": 0.88, "learning_rate": 0.00016811947711266236, "loss": 0.0142, "step": 339180 }, { "epoch": 0.88, "learning_rate": 0.00016811558889629088, "loss": 0.0147, "step": 339190 }, { "epoch": 0.88, "learning_rate": 0.00016811170067991942, "loss": 0.0174, "step": 339200 }, { "epoch": 0.88, "learning_rate": 0.00016810781246354793, "loss": 0.0137, "step": 339210 }, { "epoch": 0.88, "learning_rate": 0.0001681039242471765, "loss": 0.013, "step": 339220 }, { "epoch": 0.88, "learning_rate": 0.00016810003603080504, "loss": 0.0112, "step": 339230 }, { "epoch": 0.88, "learning_rate": 0.00016809614781443356, "loss": 0.0129, "step": 339240 }, { "epoch": 0.88, "learning_rate": 0.0001680922595980621, "loss": 0.0143, "step": 339250 }, { "epoch": 0.88, "learning_rate": 0.00016808837138169064, "loss": 0.0131, "step": 339260 }, { "epoch": 0.88, "learning_rate": 0.00016808448316531918, "loss": 0.0147, "step": 339270 }, { "epoch": 0.88, "learning_rate": 0.0001680805949489477, "loss": 0.0148, "step": 339280 }, { "epoch": 0.88, "learning_rate": 0.00016807670673257624, "loss": 0.0166, "step": 339290 }, { "epoch": 0.88, "learning_rate": 0.00016807281851620478, "loss": 0.0118, "step": 339300 }, { "epoch": 0.88, "learning_rate": 0.00016806893029983332, "loss": 0.0125, "step": 339310 }, { "epoch": 0.88, "learning_rate": 0.00016806504208346184, "loss": 0.0122, "step": 339320 }, { "epoch": 0.88, "learning_rate": 0.00016806115386709038, "loss": 0.0158, "step": 339330 }, { "epoch": 0.88, "learning_rate": 0.00016805726565071892, "loss": 0.0173, "step": 339340 }, { "epoch": 0.88, "learning_rate": 0.00016805337743434746, "loss": 0.012, "step": 339350 }, { "epoch": 0.88, "learning_rate": 0.00016804948921797597, "loss": 0.0126, "step": 339360 }, { "epoch": 0.88, "learning_rate": 0.00016804560100160452, "loss": 0.0156, "step": 339370 }, { "epoch": 0.88, "learning_rate": 0.00016804171278523308, "loss": 0.0125, "step": 339380 }, { "epoch": 0.88, "learning_rate": 0.0001680378245688616, "loss": 0.0121, "step": 339390 }, { "epoch": 0.88, "learning_rate": 0.00016803393635249014, "loss": 0.0102, "step": 339400 }, { "epoch": 0.88, "learning_rate": 0.00016803004813611866, "loss": 0.0105, "step": 339410 }, { "epoch": 0.88, "learning_rate": 0.00016802615991974717, "loss": 0.011, "step": 339420 }, { "epoch": 0.88, "learning_rate": 0.00016802227170337574, "loss": 0.012, "step": 339430 }, { "epoch": 0.88, "learning_rate": 0.00016801838348700428, "loss": 0.0117, "step": 339440 }, { "epoch": 0.88, "learning_rate": 0.0001680144952706328, "loss": 0.014, "step": 339450 }, { "epoch": 0.88, "learning_rate": 0.00016801060705426134, "loss": 0.0115, "step": 339460 }, { "epoch": 0.88, "learning_rate": 0.00016800671883788988, "loss": 0.0125, "step": 339470 }, { "epoch": 0.88, "learning_rate": 0.00016800283062151842, "loss": 0.0148, "step": 339480 }, { "epoch": 0.88, "learning_rate": 0.00016799894240514693, "loss": 0.014, "step": 339490 }, { "epoch": 0.88, "learning_rate": 0.00016799505418877548, "loss": 0.0135, "step": 339500 }, { "epoch": 0.88, "learning_rate": 0.00016799116597240402, "loss": 0.0175, "step": 339510 }, { "epoch": 0.88, "learning_rate": 0.00016798727775603256, "loss": 0.0127, "step": 339520 }, { "epoch": 0.88, "learning_rate": 0.00016798338953966107, "loss": 0.0119, "step": 339530 }, { "epoch": 0.88, "learning_rate": 0.00016797950132328962, "loss": 0.0182, "step": 339540 }, { "epoch": 0.88, "learning_rate": 0.00016797561310691818, "loss": 0.0123, "step": 339550 }, { "epoch": 0.88, "learning_rate": 0.0001679717248905467, "loss": 0.0097, "step": 339560 }, { "epoch": 0.88, "learning_rate": 0.0001679678366741752, "loss": 0.0162, "step": 339570 }, { "epoch": 0.88, "learning_rate": 0.00016796394845780376, "loss": 0.015, "step": 339580 }, { "epoch": 0.88, "learning_rate": 0.00016796006024143232, "loss": 0.0108, "step": 339590 }, { "epoch": 0.88, "learning_rate": 0.00016795617202506084, "loss": 0.0134, "step": 339600 }, { "epoch": 0.88, "learning_rate": 0.00016795228380868938, "loss": 0.018, "step": 339610 }, { "epoch": 0.88, "learning_rate": 0.0001679483955923179, "loss": 0.0109, "step": 339620 }, { "epoch": 0.88, "learning_rate": 0.00016794450737594646, "loss": 0.0114, "step": 339630 }, { "epoch": 0.88, "learning_rate": 0.00016794061915957498, "loss": 0.0148, "step": 339640 }, { "epoch": 0.88, "learning_rate": 0.00016793673094320352, "loss": 0.0118, "step": 339650 }, { "epoch": 0.88, "learning_rate": 0.00016793284272683203, "loss": 0.014, "step": 339660 }, { "epoch": 0.88, "learning_rate": 0.00016792895451046058, "loss": 0.0155, "step": 339670 }, { "epoch": 0.88, "learning_rate": 0.00016792506629408912, "loss": 0.0146, "step": 339680 }, { "epoch": 0.88, "learning_rate": 0.00016792117807771766, "loss": 0.0127, "step": 339690 }, { "epoch": 0.88, "learning_rate": 0.00016791728986134617, "loss": 0.0124, "step": 339700 }, { "epoch": 0.88, "learning_rate": 0.00016791340164497472, "loss": 0.0116, "step": 339710 }, { "epoch": 0.88, "learning_rate": 0.00016790951342860328, "loss": 0.0137, "step": 339720 }, { "epoch": 0.88, "learning_rate": 0.0001679056252122318, "loss": 0.015, "step": 339730 }, { "epoch": 0.88, "learning_rate": 0.0001679017369958603, "loss": 0.0117, "step": 339740 }, { "epoch": 0.88, "learning_rate": 0.00016789784877948885, "loss": 0.013, "step": 339750 }, { "epoch": 0.88, "learning_rate": 0.00016789396056311742, "loss": 0.0139, "step": 339760 }, { "epoch": 0.88, "learning_rate": 0.00016789007234674594, "loss": 0.0106, "step": 339770 }, { "epoch": 0.88, "learning_rate": 0.00016788618413037448, "loss": 0.0144, "step": 339780 }, { "epoch": 0.88, "learning_rate": 0.000167882295914003, "loss": 0.0125, "step": 339790 }, { "epoch": 0.88, "learning_rate": 0.00016787840769763156, "loss": 0.0155, "step": 339800 }, { "epoch": 0.88, "learning_rate": 0.00016787451948126008, "loss": 0.0164, "step": 339810 }, { "epoch": 0.88, "learning_rate": 0.00016787063126488862, "loss": 0.0131, "step": 339820 }, { "epoch": 0.88, "learning_rate": 0.00016786674304851713, "loss": 0.0143, "step": 339830 }, { "epoch": 0.88, "learning_rate": 0.0001678628548321457, "loss": 0.0135, "step": 339840 }, { "epoch": 0.88, "learning_rate": 0.00016785896661577422, "loss": 0.0142, "step": 339850 }, { "epoch": 0.88, "learning_rate": 0.00016785507839940276, "loss": 0.0104, "step": 339860 }, { "epoch": 0.88, "learning_rate": 0.00016785119018303127, "loss": 0.0136, "step": 339870 }, { "epoch": 0.88, "learning_rate": 0.00016784730196665984, "loss": 0.0192, "step": 339880 }, { "epoch": 0.88, "learning_rate": 0.00016784341375028836, "loss": 0.0146, "step": 339890 }, { "epoch": 0.88, "learning_rate": 0.0001678395255339169, "loss": 0.0134, "step": 339900 }, { "epoch": 0.88, "learning_rate": 0.0001678356373175454, "loss": 0.0129, "step": 339910 }, { "epoch": 0.88, "learning_rate": 0.00016783174910117395, "loss": 0.0176, "step": 339920 }, { "epoch": 0.88, "learning_rate": 0.00016782786088480252, "loss": 0.0114, "step": 339930 }, { "epoch": 0.88, "learning_rate": 0.00016782397266843104, "loss": 0.0148, "step": 339940 }, { "epoch": 0.88, "learning_rate": 0.00016782008445205958, "loss": 0.0123, "step": 339950 }, { "epoch": 0.88, "learning_rate": 0.0001678161962356881, "loss": 0.0111, "step": 339960 }, { "epoch": 0.88, "learning_rate": 0.00016781230801931666, "loss": 0.0134, "step": 339970 }, { "epoch": 0.88, "learning_rate": 0.00016780841980294518, "loss": 0.0164, "step": 339980 }, { "epoch": 0.88, "learning_rate": 0.00016780453158657372, "loss": 0.0138, "step": 339990 }, { "epoch": 0.88, "learning_rate": 0.00016780064337020223, "loss": 0.0115, "step": 340000 }, { "epoch": 0.88, "eval_cer": 0.881751673615864, "eval_loss": 0.008945505134761333, "eval_runtime": 107.8028, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 340000 }, { "epoch": 0.88, "learning_rate": 0.0001677967551538308, "loss": 0.0123, "step": 340010 }, { "epoch": 0.88, "learning_rate": 0.00016779286693745932, "loss": 0.0096, "step": 340020 }, { "epoch": 0.88, "learning_rate": 0.00016778897872108786, "loss": 0.0126, "step": 340030 }, { "epoch": 0.88, "learning_rate": 0.00016778509050471637, "loss": 0.0152, "step": 340040 }, { "epoch": 0.88, "learning_rate": 0.00016778120228834494, "loss": 0.0208, "step": 340050 }, { "epoch": 0.88, "learning_rate": 0.00016777731407197346, "loss": 0.0112, "step": 340060 }, { "epoch": 0.88, "learning_rate": 0.000167773425855602, "loss": 0.0157, "step": 340070 }, { "epoch": 0.88, "learning_rate": 0.0001677695376392305, "loss": 0.0103, "step": 340080 }, { "epoch": 0.88, "learning_rate": 0.00016776564942285908, "loss": 0.0134, "step": 340090 }, { "epoch": 0.88, "learning_rate": 0.00016776176120648762, "loss": 0.0144, "step": 340100 }, { "epoch": 0.88, "learning_rate": 0.00016775787299011614, "loss": 0.01, "step": 340110 }, { "epoch": 0.88, "learning_rate": 0.00016775398477374468, "loss": 0.0135, "step": 340120 }, { "epoch": 0.88, "learning_rate": 0.00016775009655737322, "loss": 0.0104, "step": 340130 }, { "epoch": 0.88, "learning_rate": 0.00016774620834100176, "loss": 0.0187, "step": 340140 }, { "epoch": 0.88, "learning_rate": 0.00016774232012463028, "loss": 0.0113, "step": 340150 }, { "epoch": 0.88, "learning_rate": 0.00016773843190825882, "loss": 0.0129, "step": 340160 }, { "epoch": 0.88, "learning_rate": 0.00016773454369188733, "loss": 0.0095, "step": 340170 }, { "epoch": 0.88, "learning_rate": 0.0001677306554755159, "loss": 0.0221, "step": 340180 }, { "epoch": 0.88, "learning_rate": 0.00016772676725914442, "loss": 0.0124, "step": 340190 }, { "epoch": 0.88, "learning_rate": 0.00016772287904277296, "loss": 0.0126, "step": 340200 }, { "epoch": 0.88, "learning_rate": 0.00016771899082640147, "loss": 0.0146, "step": 340210 }, { "epoch": 0.88, "learning_rate": 0.00016771510261003004, "loss": 0.0145, "step": 340220 }, { "epoch": 0.88, "learning_rate": 0.00016771121439365855, "loss": 0.0169, "step": 340230 }, { "epoch": 0.88, "learning_rate": 0.0001677073261772871, "loss": 0.0127, "step": 340240 }, { "epoch": 0.88, "learning_rate": 0.0001677034379609156, "loss": 0.0161, "step": 340250 }, { "epoch": 0.88, "learning_rate": 0.00016769954974454418, "loss": 0.0192, "step": 340260 }, { "epoch": 0.88, "learning_rate": 0.00016769566152817272, "loss": 0.0125, "step": 340270 }, { "epoch": 0.88, "learning_rate": 0.00016769177331180124, "loss": 0.0142, "step": 340280 }, { "epoch": 0.88, "learning_rate": 0.00016768788509542975, "loss": 0.0125, "step": 340290 }, { "epoch": 0.88, "learning_rate": 0.00016768399687905832, "loss": 0.0126, "step": 340300 }, { "epoch": 0.88, "learning_rate": 0.00016768010866268686, "loss": 0.0102, "step": 340310 }, { "epoch": 0.88, "learning_rate": 0.00016767622044631538, "loss": 0.0128, "step": 340320 }, { "epoch": 0.88, "learning_rate": 0.00016767233222994392, "loss": 0.0194, "step": 340330 }, { "epoch": 0.88, "learning_rate": 0.00016766844401357246, "loss": 0.0162, "step": 340340 }, { "epoch": 0.88, "learning_rate": 0.000167664555797201, "loss": 0.0135, "step": 340350 }, { "epoch": 0.88, "learning_rate": 0.00016766066758082951, "loss": 0.016, "step": 340360 }, { "epoch": 0.88, "learning_rate": 0.00016765677936445806, "loss": 0.0121, "step": 340370 }, { "epoch": 0.88, "learning_rate": 0.0001676528911480866, "loss": 0.0127, "step": 340380 }, { "epoch": 0.88, "learning_rate": 0.00016764900293171514, "loss": 0.0129, "step": 340390 }, { "epoch": 0.88, "learning_rate": 0.00016764511471534365, "loss": 0.0128, "step": 340400 }, { "epoch": 0.88, "learning_rate": 0.0001676412264989722, "loss": 0.0102, "step": 340410 }, { "epoch": 0.88, "learning_rate": 0.0001676373382826007, "loss": 0.0095, "step": 340420 }, { "epoch": 0.88, "learning_rate": 0.00016763345006622928, "loss": 0.0123, "step": 340430 }, { "epoch": 0.88, "learning_rate": 0.00016762956184985782, "loss": 0.0109, "step": 340440 }, { "epoch": 0.88, "learning_rate": 0.00016762567363348634, "loss": 0.0127, "step": 340450 }, { "epoch": 0.88, "learning_rate": 0.00016762178541711485, "loss": 0.0108, "step": 340460 }, { "epoch": 0.88, "learning_rate": 0.00016761789720074342, "loss": 0.0093, "step": 340470 }, { "epoch": 0.88, "learning_rate": 0.00016761400898437196, "loss": 0.0131, "step": 340480 }, { "epoch": 0.88, "learning_rate": 0.00016761012076800047, "loss": 0.0119, "step": 340490 }, { "epoch": 0.88, "learning_rate": 0.00016760623255162902, "loss": 0.0135, "step": 340500 }, { "epoch": 0.88, "learning_rate": 0.00016760234433525756, "loss": 0.0154, "step": 340510 }, { "epoch": 0.88, "learning_rate": 0.0001675984561188861, "loss": 0.0131, "step": 340520 }, { "epoch": 0.88, "learning_rate": 0.00016759456790251461, "loss": 0.0174, "step": 340530 }, { "epoch": 0.88, "learning_rate": 0.00016759067968614316, "loss": 0.0139, "step": 340540 }, { "epoch": 0.88, "learning_rate": 0.0001675867914697717, "loss": 0.0132, "step": 340550 }, { "epoch": 0.88, "learning_rate": 0.00016758290325340024, "loss": 0.0132, "step": 340560 }, { "epoch": 0.88, "learning_rate": 0.00016757901503702875, "loss": 0.0117, "step": 340570 }, { "epoch": 0.88, "learning_rate": 0.0001675751268206573, "loss": 0.0138, "step": 340580 }, { "epoch": 0.88, "learning_rate": 0.00016757123860428586, "loss": 0.0165, "step": 340590 }, { "epoch": 0.88, "learning_rate": 0.00016756735038791438, "loss": 0.0148, "step": 340600 }, { "epoch": 0.88, "learning_rate": 0.0001675634621715429, "loss": 0.0164, "step": 340610 }, { "epoch": 0.88, "learning_rate": 0.00016755957395517143, "loss": 0.014, "step": 340620 }, { "epoch": 0.88, "learning_rate": 0.0001675556857388, "loss": 0.0123, "step": 340630 }, { "epoch": 0.88, "learning_rate": 0.00016755179752242852, "loss": 0.014, "step": 340640 }, { "epoch": 0.88, "learning_rate": 0.00016754790930605706, "loss": 0.0105, "step": 340650 }, { "epoch": 0.88, "learning_rate": 0.00016754402108968557, "loss": 0.0137, "step": 340660 }, { "epoch": 0.88, "learning_rate": 0.00016754013287331412, "loss": 0.0141, "step": 340670 }, { "epoch": 0.88, "learning_rate": 0.00016753624465694266, "loss": 0.011, "step": 340680 }, { "epoch": 0.88, "learning_rate": 0.0001675323564405712, "loss": 0.011, "step": 340690 }, { "epoch": 0.88, "learning_rate": 0.00016752846822419971, "loss": 0.0161, "step": 340700 }, { "epoch": 0.88, "learning_rate": 0.00016752458000782826, "loss": 0.013, "step": 340710 }, { "epoch": 0.88, "learning_rate": 0.0001675206917914568, "loss": 0.0136, "step": 340720 }, { "epoch": 0.88, "learning_rate": 0.00016751680357508534, "loss": 0.0128, "step": 340730 }, { "epoch": 0.88, "learning_rate": 0.00016751291535871385, "loss": 0.0148, "step": 340740 }, { "epoch": 0.88, "learning_rate": 0.0001675090271423424, "loss": 0.0117, "step": 340750 }, { "epoch": 0.88, "learning_rate": 0.00016750513892597094, "loss": 0.016, "step": 340760 }, { "epoch": 0.88, "learning_rate": 0.00016750125070959948, "loss": 0.0173, "step": 340770 }, { "epoch": 0.88, "learning_rate": 0.000167497362493228, "loss": 0.0119, "step": 340780 }, { "epoch": 0.88, "learning_rate": 0.00016749347427685653, "loss": 0.0142, "step": 340790 }, { "epoch": 0.88, "learning_rate": 0.0001674895860604851, "loss": 0.0191, "step": 340800 }, { "epoch": 0.88, "learning_rate": 0.00016748569784411362, "loss": 0.0115, "step": 340810 }, { "epoch": 0.88, "learning_rate": 0.00016748180962774216, "loss": 0.0136, "step": 340820 }, { "epoch": 0.88, "learning_rate": 0.00016747792141137067, "loss": 0.0126, "step": 340830 }, { "epoch": 0.88, "learning_rate": 0.00016747403319499924, "loss": 0.0148, "step": 340840 }, { "epoch": 0.88, "learning_rate": 0.00016747014497862776, "loss": 0.0132, "step": 340850 }, { "epoch": 0.88, "learning_rate": 0.0001674662567622563, "loss": 0.0107, "step": 340860 }, { "epoch": 0.88, "learning_rate": 0.0001674623685458848, "loss": 0.0155, "step": 340870 }, { "epoch": 0.88, "learning_rate": 0.00016745848032951338, "loss": 0.0147, "step": 340880 }, { "epoch": 0.88, "learning_rate": 0.0001674545921131419, "loss": 0.0156, "step": 340890 }, { "epoch": 0.88, "learning_rate": 0.00016745070389677044, "loss": 0.0136, "step": 340900 }, { "epoch": 0.88, "learning_rate": 0.00016744681568039895, "loss": 0.011, "step": 340910 }, { "epoch": 0.88, "learning_rate": 0.0001674429274640275, "loss": 0.0162, "step": 340920 }, { "epoch": 0.88, "learning_rate": 0.00016743903924765604, "loss": 0.012, "step": 340930 }, { "epoch": 0.88, "learning_rate": 0.00016743515103128458, "loss": 0.0107, "step": 340940 }, { "epoch": 0.88, "learning_rate": 0.0001674312628149131, "loss": 0.014, "step": 340950 }, { "epoch": 0.88, "learning_rate": 0.00016742737459854163, "loss": 0.0131, "step": 340960 }, { "epoch": 0.88, "learning_rate": 0.0001674234863821702, "loss": 0.0127, "step": 340970 }, { "epoch": 0.88, "learning_rate": 0.00016741959816579872, "loss": 0.0146, "step": 340980 }, { "epoch": 0.88, "learning_rate": 0.00016741570994942726, "loss": 0.0129, "step": 340990 }, { "epoch": 0.88, "learning_rate": 0.00016741182173305577, "loss": 0.0123, "step": 341000 }, { "epoch": 0.88, "eval_cer": 0.8817390768834564, "eval_loss": 0.008974668569862843, "eval_runtime": 107.5548, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 341000 }, { "epoch": 0.88, "learning_rate": 0.00016740793351668434, "loss": 0.0118, "step": 341010 }, { "epoch": 0.88, "learning_rate": 0.00016740404530031286, "loss": 0.0127, "step": 341020 }, { "epoch": 0.88, "learning_rate": 0.0001674001570839414, "loss": 0.016, "step": 341030 }, { "epoch": 0.88, "learning_rate": 0.0001673962688675699, "loss": 0.0158, "step": 341040 }, { "epoch": 0.88, "learning_rate": 0.00016739238065119848, "loss": 0.0118, "step": 341050 }, { "epoch": 0.88, "learning_rate": 0.000167388492434827, "loss": 0.0117, "step": 341060 }, { "epoch": 0.88, "learning_rate": 0.00016738460421845554, "loss": 0.0131, "step": 341070 }, { "epoch": 0.88, "learning_rate": 0.00016738071600208405, "loss": 0.0138, "step": 341080 }, { "epoch": 0.88, "learning_rate": 0.00016737682778571262, "loss": 0.0142, "step": 341090 }, { "epoch": 0.88, "learning_rate": 0.00016737293956934114, "loss": 0.0137, "step": 341100 }, { "epoch": 0.88, "learning_rate": 0.00016736905135296968, "loss": 0.0156, "step": 341110 }, { "epoch": 0.88, "learning_rate": 0.0001673651631365982, "loss": 0.014, "step": 341120 }, { "epoch": 0.88, "learning_rate": 0.00016736127492022676, "loss": 0.0131, "step": 341130 }, { "epoch": 0.88, "learning_rate": 0.0001673573867038553, "loss": 0.0148, "step": 341140 }, { "epoch": 0.88, "learning_rate": 0.00016735349848748382, "loss": 0.0136, "step": 341150 }, { "epoch": 0.88, "learning_rate": 0.00016734961027111233, "loss": 0.0134, "step": 341160 }, { "epoch": 0.88, "learning_rate": 0.00016734572205474087, "loss": 0.0115, "step": 341170 }, { "epoch": 0.88, "learning_rate": 0.00016734183383836944, "loss": 0.0128, "step": 341180 }, { "epoch": 0.88, "learning_rate": 0.00016733794562199796, "loss": 0.0136, "step": 341190 }, { "epoch": 0.88, "learning_rate": 0.0001673340574056265, "loss": 0.0127, "step": 341200 }, { "epoch": 0.88, "learning_rate": 0.000167330169189255, "loss": 0.0115, "step": 341210 }, { "epoch": 0.88, "learning_rate": 0.00016732628097288358, "loss": 0.0161, "step": 341220 }, { "epoch": 0.88, "learning_rate": 0.0001673223927565121, "loss": 0.0141, "step": 341230 }, { "epoch": 0.88, "learning_rate": 0.00016731850454014064, "loss": 0.0151, "step": 341240 }, { "epoch": 0.88, "learning_rate": 0.00016731461632376915, "loss": 0.0119, "step": 341250 }, { "epoch": 0.88, "learning_rate": 0.00016731072810739772, "loss": 0.0166, "step": 341260 }, { "epoch": 0.88, "learning_rate": 0.00016730683989102623, "loss": 0.0127, "step": 341270 }, { "epoch": 0.88, "learning_rate": 0.00016730295167465478, "loss": 0.0129, "step": 341280 }, { "epoch": 0.88, "learning_rate": 0.0001672990634582833, "loss": 0.0142, "step": 341290 }, { "epoch": 0.88, "learning_rate": 0.00016729517524191186, "loss": 0.0127, "step": 341300 }, { "epoch": 0.88, "learning_rate": 0.0001672912870255404, "loss": 0.0134, "step": 341310 }, { "epoch": 0.88, "learning_rate": 0.00016728739880916892, "loss": 0.0099, "step": 341320 }, { "epoch": 0.88, "learning_rate": 0.00016728351059279743, "loss": 0.0123, "step": 341330 }, { "epoch": 0.88, "learning_rate": 0.000167279622376426, "loss": 0.0138, "step": 341340 }, { "epoch": 0.88, "learning_rate": 0.00016727573416005454, "loss": 0.0128, "step": 341350 }, { "epoch": 0.88, "learning_rate": 0.00016727184594368306, "loss": 0.0115, "step": 341360 }, { "epoch": 0.88, "learning_rate": 0.0001672679577273116, "loss": 0.0126, "step": 341370 }, { "epoch": 0.88, "learning_rate": 0.00016726406951094014, "loss": 0.0136, "step": 341380 }, { "epoch": 0.88, "learning_rate": 0.00016726018129456868, "loss": 0.0136, "step": 341390 }, { "epoch": 0.88, "learning_rate": 0.0001672562930781972, "loss": 0.0134, "step": 341400 }, { "epoch": 0.88, "learning_rate": 0.00016725240486182574, "loss": 0.0121, "step": 341410 }, { "epoch": 0.89, "learning_rate": 0.00016724851664545425, "loss": 0.0161, "step": 341420 }, { "epoch": 0.89, "learning_rate": 0.00016724462842908282, "loss": 0.013, "step": 341430 }, { "epoch": 0.89, "learning_rate": 0.00016724074021271133, "loss": 0.0121, "step": 341440 }, { "epoch": 0.89, "learning_rate": 0.00016723685199633988, "loss": 0.0156, "step": 341450 }, { "epoch": 0.89, "learning_rate": 0.0001672329637799684, "loss": 0.0139, "step": 341460 }, { "epoch": 0.89, "learning_rate": 0.00016722907556359696, "loss": 0.0136, "step": 341470 }, { "epoch": 0.89, "learning_rate": 0.00016722518734722547, "loss": 0.0151, "step": 341480 }, { "epoch": 0.89, "learning_rate": 0.00016722129913085402, "loss": 0.0135, "step": 341490 }, { "epoch": 0.89, "learning_rate": 0.00016721741091448253, "loss": 0.0112, "step": 341500 }, { "epoch": 0.89, "learning_rate": 0.0001672135226981111, "loss": 0.0129, "step": 341510 }, { "epoch": 0.89, "learning_rate": 0.00016720963448173964, "loss": 0.0108, "step": 341520 }, { "epoch": 0.89, "learning_rate": 0.00016720574626536815, "loss": 0.0137, "step": 341530 }, { "epoch": 0.89, "learning_rate": 0.0001672018580489967, "loss": 0.0122, "step": 341540 }, { "epoch": 0.89, "learning_rate": 0.00016719796983262524, "loss": 0.0138, "step": 341550 }, { "epoch": 0.89, "learning_rate": 0.00016719408161625378, "loss": 0.0118, "step": 341560 }, { "epoch": 0.89, "learning_rate": 0.0001671901933998823, "loss": 0.013, "step": 341570 }, { "epoch": 0.89, "learning_rate": 0.00016718630518351084, "loss": 0.0131, "step": 341580 }, { "epoch": 0.89, "learning_rate": 0.00016718241696713938, "loss": 0.0127, "step": 341590 }, { "epoch": 0.89, "learning_rate": 0.00016717852875076792, "loss": 0.013, "step": 341600 }, { "epoch": 0.89, "learning_rate": 0.00016717464053439643, "loss": 0.0122, "step": 341610 }, { "epoch": 0.89, "learning_rate": 0.00016717075231802498, "loss": 0.0115, "step": 341620 }, { "epoch": 0.89, "learning_rate": 0.00016716686410165352, "loss": 0.0112, "step": 341630 }, { "epoch": 0.89, "learning_rate": 0.00016716297588528206, "loss": 0.0114, "step": 341640 }, { "epoch": 0.89, "learning_rate": 0.00016715908766891057, "loss": 0.0142, "step": 341650 }, { "epoch": 0.89, "learning_rate": 0.00016715519945253911, "loss": 0.0132, "step": 341660 }, { "epoch": 0.89, "learning_rate": 0.00016715131123616763, "loss": 0.0159, "step": 341670 }, { "epoch": 0.89, "learning_rate": 0.0001671474230197962, "loss": 0.0133, "step": 341680 }, { "epoch": 0.89, "learning_rate": 0.00016714353480342474, "loss": 0.0125, "step": 341690 }, { "epoch": 0.89, "learning_rate": 0.00016713964658705325, "loss": 0.0172, "step": 341700 }, { "epoch": 0.89, "learning_rate": 0.0001671357583706818, "loss": 0.0124, "step": 341710 }, { "epoch": 0.89, "learning_rate": 0.00016713187015431034, "loss": 0.0143, "step": 341720 }, { "epoch": 0.89, "learning_rate": 0.00016712798193793888, "loss": 0.0119, "step": 341730 }, { "epoch": 0.89, "learning_rate": 0.0001671240937215674, "loss": 0.0107, "step": 341740 }, { "epoch": 0.89, "learning_rate": 0.00016712020550519594, "loss": 0.0126, "step": 341750 }, { "epoch": 0.89, "learning_rate": 0.00016711631728882448, "loss": 0.0111, "step": 341760 }, { "epoch": 0.89, "learning_rate": 0.00016711242907245302, "loss": 0.0113, "step": 341770 }, { "epoch": 0.89, "learning_rate": 0.00016710854085608153, "loss": 0.0136, "step": 341780 }, { "epoch": 0.89, "learning_rate": 0.00016710465263971007, "loss": 0.0163, "step": 341790 }, { "epoch": 0.89, "learning_rate": 0.00016710076442333862, "loss": 0.0141, "step": 341800 }, { "epoch": 0.89, "learning_rate": 0.00016709687620696716, "loss": 0.016, "step": 341810 }, { "epoch": 0.89, "learning_rate": 0.00016709298799059567, "loss": 0.012, "step": 341820 }, { "epoch": 0.89, "learning_rate": 0.00016708909977422421, "loss": 0.0155, "step": 341830 }, { "epoch": 0.89, "learning_rate": 0.00016708521155785278, "loss": 0.013, "step": 341840 }, { "epoch": 0.89, "learning_rate": 0.0001670813233414813, "loss": 0.0161, "step": 341850 }, { "epoch": 0.89, "learning_rate": 0.00016707743512510984, "loss": 0.0122, "step": 341860 }, { "epoch": 0.89, "learning_rate": 0.00016707354690873835, "loss": 0.0152, "step": 341870 }, { "epoch": 0.89, "learning_rate": 0.00016706965869236692, "loss": 0.012, "step": 341880 }, { "epoch": 0.89, "learning_rate": 0.00016706577047599544, "loss": 0.014, "step": 341890 }, { "epoch": 0.89, "learning_rate": 0.00016706188225962398, "loss": 0.0113, "step": 341900 }, { "epoch": 0.89, "learning_rate": 0.0001670579940432525, "loss": 0.0122, "step": 341910 }, { "epoch": 0.89, "learning_rate": 0.00016705410582688103, "loss": 0.0114, "step": 341920 }, { "epoch": 0.89, "learning_rate": 0.00016705021761050958, "loss": 0.0144, "step": 341930 }, { "epoch": 0.89, "learning_rate": 0.00016704632939413812, "loss": 0.0178, "step": 341940 }, { "epoch": 0.89, "learning_rate": 0.00016704244117776663, "loss": 0.0128, "step": 341950 }, { "epoch": 0.89, "learning_rate": 0.00016703855296139517, "loss": 0.0138, "step": 341960 }, { "epoch": 0.89, "learning_rate": 0.00016703466474502372, "loss": 0.0122, "step": 341970 }, { "epoch": 0.89, "learning_rate": 0.00016703077652865226, "loss": 0.0133, "step": 341980 }, { "epoch": 0.89, "learning_rate": 0.00016702688831228077, "loss": 0.0149, "step": 341990 }, { "epoch": 0.89, "learning_rate": 0.0001670230000959093, "loss": 0.0081, "step": 342000 }, { "epoch": 0.89, "eval_cer": 0.8817460750681273, "eval_loss": 0.009189891628921032, "eval_runtime": 107.711, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 342000 }, { "epoch": 0.89, "learning_rate": 0.00016701911187953788, "loss": 0.0144, "step": 342010 }, { "epoch": 0.89, "learning_rate": 0.0001670152236631664, "loss": 0.0166, "step": 342020 }, { "epoch": 0.89, "learning_rate": 0.00016701133544679494, "loss": 0.0131, "step": 342030 }, { "epoch": 0.89, "learning_rate": 0.00016700744723042345, "loss": 0.011, "step": 342040 }, { "epoch": 0.89, "learning_rate": 0.00016700355901405202, "loss": 0.0102, "step": 342050 }, { "epoch": 0.89, "learning_rate": 0.00016699967079768054, "loss": 0.0101, "step": 342060 }, { "epoch": 0.89, "learning_rate": 0.00016699578258130908, "loss": 0.0155, "step": 342070 }, { "epoch": 0.89, "learning_rate": 0.0001669918943649376, "loss": 0.0123, "step": 342080 }, { "epoch": 0.89, "learning_rate": 0.00016698800614856616, "loss": 0.0113, "step": 342090 }, { "epoch": 0.89, "learning_rate": 0.00016698411793219468, "loss": 0.0123, "step": 342100 }, { "epoch": 0.89, "learning_rate": 0.00016698022971582322, "loss": 0.0125, "step": 342110 }, { "epoch": 0.89, "learning_rate": 0.00016697634149945173, "loss": 0.0108, "step": 342120 }, { "epoch": 0.89, "learning_rate": 0.0001669724532830803, "loss": 0.0156, "step": 342130 }, { "epoch": 0.89, "learning_rate": 0.00016696856506670882, "loss": 0.0122, "step": 342140 }, { "epoch": 0.89, "learning_rate": 0.00016696467685033736, "loss": 0.0146, "step": 342150 }, { "epoch": 0.89, "learning_rate": 0.00016696078863396587, "loss": 0.0134, "step": 342160 }, { "epoch": 0.89, "learning_rate": 0.0001669569004175944, "loss": 0.0173, "step": 342170 }, { "epoch": 0.89, "learning_rate": 0.00016695301220122298, "loss": 0.0162, "step": 342180 }, { "epoch": 0.89, "learning_rate": 0.0001669491239848515, "loss": 0.0183, "step": 342190 }, { "epoch": 0.89, "learning_rate": 0.00016694523576848, "loss": 0.0132, "step": 342200 }, { "epoch": 0.89, "learning_rate": 0.00016694134755210855, "loss": 0.0133, "step": 342210 }, { "epoch": 0.89, "learning_rate": 0.00016693745933573712, "loss": 0.0129, "step": 342220 }, { "epoch": 0.89, "learning_rate": 0.00016693357111936564, "loss": 0.0158, "step": 342230 }, { "epoch": 0.89, "learning_rate": 0.00016692968290299418, "loss": 0.0148, "step": 342240 }, { "epoch": 0.89, "learning_rate": 0.0001669257946866227, "loss": 0.0172, "step": 342250 }, { "epoch": 0.89, "learning_rate": 0.00016692190647025126, "loss": 0.0175, "step": 342260 }, { "epoch": 0.89, "learning_rate": 0.00016691801825387978, "loss": 0.0118, "step": 342270 }, { "epoch": 0.89, "learning_rate": 0.00016691413003750832, "loss": 0.0102, "step": 342280 }, { "epoch": 0.89, "learning_rate": 0.00016691024182113683, "loss": 0.0136, "step": 342290 }, { "epoch": 0.89, "learning_rate": 0.0001669063536047654, "loss": 0.0132, "step": 342300 }, { "epoch": 0.89, "learning_rate": 0.00016690246538839391, "loss": 0.0131, "step": 342310 }, { "epoch": 0.89, "learning_rate": 0.00016689857717202246, "loss": 0.0132, "step": 342320 }, { "epoch": 0.89, "learning_rate": 0.00016689468895565097, "loss": 0.0139, "step": 342330 }, { "epoch": 0.89, "learning_rate": 0.00016689080073927954, "loss": 0.0142, "step": 342340 }, { "epoch": 0.89, "learning_rate": 0.00016688691252290805, "loss": 0.015, "step": 342350 }, { "epoch": 0.89, "learning_rate": 0.0001668830243065366, "loss": 0.0122, "step": 342360 }, { "epoch": 0.89, "learning_rate": 0.0001668791360901651, "loss": 0.0131, "step": 342370 }, { "epoch": 0.89, "learning_rate": 0.00016687524787379368, "loss": 0.0146, "step": 342380 }, { "epoch": 0.89, "learning_rate": 0.00016687135965742222, "loss": 0.0142, "step": 342390 }, { "epoch": 0.89, "learning_rate": 0.00016686747144105074, "loss": 0.0123, "step": 342400 }, { "epoch": 0.89, "learning_rate": 0.00016686358322467928, "loss": 0.0158, "step": 342410 }, { "epoch": 0.89, "learning_rate": 0.0001668596950083078, "loss": 0.0197, "step": 342420 }, { "epoch": 0.89, "learning_rate": 0.00016685580679193636, "loss": 0.0134, "step": 342430 }, { "epoch": 0.89, "learning_rate": 0.00016685191857556487, "loss": 0.0137, "step": 342440 }, { "epoch": 0.89, "learning_rate": 0.00016684803035919342, "loss": 0.0164, "step": 342450 }, { "epoch": 0.89, "learning_rate": 0.00016684414214282193, "loss": 0.0123, "step": 342460 }, { "epoch": 0.89, "learning_rate": 0.0001668402539264505, "loss": 0.0144, "step": 342470 }, { "epoch": 0.89, "learning_rate": 0.00016683636571007901, "loss": 0.0118, "step": 342480 }, { "epoch": 0.89, "learning_rate": 0.00016683247749370756, "loss": 0.0159, "step": 342490 }, { "epoch": 0.89, "learning_rate": 0.00016682858927733607, "loss": 0.0127, "step": 342500 }, { "epoch": 0.89, "learning_rate": 0.00016682470106096464, "loss": 0.0129, "step": 342510 }, { "epoch": 0.89, "learning_rate": 0.00016682081284459315, "loss": 0.0152, "step": 342520 }, { "epoch": 0.89, "learning_rate": 0.0001668169246282217, "loss": 0.0128, "step": 342530 }, { "epoch": 0.89, "learning_rate": 0.0001668130364118502, "loss": 0.0092, "step": 342540 }, { "epoch": 0.89, "learning_rate": 0.00016680914819547878, "loss": 0.0122, "step": 342550 }, { "epoch": 0.89, "learning_rate": 0.00016680525997910732, "loss": 0.0145, "step": 342560 }, { "epoch": 0.89, "learning_rate": 0.00016680137176273583, "loss": 0.0172, "step": 342570 }, { "epoch": 0.89, "learning_rate": 0.00016679748354636438, "loss": 0.0217, "step": 342580 }, { "epoch": 0.89, "learning_rate": 0.00016679359532999292, "loss": 0.0114, "step": 342590 }, { "epoch": 0.89, "learning_rate": 0.00016678970711362146, "loss": 0.0138, "step": 342600 }, { "epoch": 0.89, "learning_rate": 0.00016678581889724997, "loss": 0.0136, "step": 342610 }, { "epoch": 0.89, "learning_rate": 0.00016678193068087852, "loss": 0.0118, "step": 342620 }, { "epoch": 0.89, "learning_rate": 0.00016677804246450706, "loss": 0.0156, "step": 342630 }, { "epoch": 0.89, "learning_rate": 0.0001667741542481356, "loss": 0.0119, "step": 342640 }, { "epoch": 0.89, "learning_rate": 0.0001667702660317641, "loss": 0.0152, "step": 342650 }, { "epoch": 0.89, "learning_rate": 0.00016676637781539266, "loss": 0.0161, "step": 342660 }, { "epoch": 0.89, "learning_rate": 0.00016676248959902117, "loss": 0.0119, "step": 342670 }, { "epoch": 0.89, "learning_rate": 0.00016675860138264974, "loss": 0.0187, "step": 342680 }, { "epoch": 0.89, "learning_rate": 0.00016675471316627825, "loss": 0.0139, "step": 342690 }, { "epoch": 0.89, "learning_rate": 0.0001667508249499068, "loss": 0.0142, "step": 342700 }, { "epoch": 0.89, "learning_rate": 0.0001667469367335353, "loss": 0.0162, "step": 342710 }, { "epoch": 0.89, "learning_rate": 0.00016674304851716388, "loss": 0.0103, "step": 342720 }, { "epoch": 0.89, "learning_rate": 0.00016673916030079242, "loss": 0.0113, "step": 342730 }, { "epoch": 0.89, "learning_rate": 0.00016673527208442093, "loss": 0.014, "step": 342740 }, { "epoch": 0.89, "learning_rate": 0.00016673138386804945, "loss": 0.0127, "step": 342750 }, { "epoch": 0.89, "learning_rate": 0.00016672749565167802, "loss": 0.0125, "step": 342760 }, { "epoch": 0.89, "learning_rate": 0.00016672360743530656, "loss": 0.015, "step": 342770 }, { "epoch": 0.89, "learning_rate": 0.00016671971921893507, "loss": 0.0122, "step": 342780 }, { "epoch": 0.89, "learning_rate": 0.00016671583100256361, "loss": 0.0184, "step": 342790 }, { "epoch": 0.89, "learning_rate": 0.00016671194278619216, "loss": 0.0146, "step": 342800 }, { "epoch": 0.89, "learning_rate": 0.0001667080545698207, "loss": 0.0142, "step": 342810 }, { "epoch": 0.89, "learning_rate": 0.0001667041663534492, "loss": 0.0133, "step": 342820 }, { "epoch": 0.89, "learning_rate": 0.00016670027813707775, "loss": 0.0117, "step": 342830 }, { "epoch": 0.89, "learning_rate": 0.0001666963899207063, "loss": 0.015, "step": 342840 }, { "epoch": 0.89, "learning_rate": 0.00016669250170433484, "loss": 0.0124, "step": 342850 }, { "epoch": 0.89, "learning_rate": 0.00016668861348796335, "loss": 0.0143, "step": 342860 }, { "epoch": 0.89, "learning_rate": 0.0001666847252715919, "loss": 0.0116, "step": 342870 }, { "epoch": 0.89, "learning_rate": 0.00016668083705522046, "loss": 0.0129, "step": 342880 }, { "epoch": 0.89, "learning_rate": 0.00016667694883884898, "loss": 0.0119, "step": 342890 }, { "epoch": 0.89, "learning_rate": 0.00016667306062247752, "loss": 0.0146, "step": 342900 }, { "epoch": 0.89, "learning_rate": 0.00016666917240610603, "loss": 0.0182, "step": 342910 }, { "epoch": 0.89, "learning_rate": 0.00016666528418973455, "loss": 0.0131, "step": 342920 }, { "epoch": 0.89, "learning_rate": 0.00016666139597336312, "loss": 0.0143, "step": 342930 }, { "epoch": 0.89, "learning_rate": 0.00016665750775699166, "loss": 0.0136, "step": 342940 }, { "epoch": 0.89, "learning_rate": 0.00016665361954062017, "loss": 0.0146, "step": 342950 }, { "epoch": 0.89, "learning_rate": 0.00016664973132424871, "loss": 0.0244, "step": 342960 }, { "epoch": 0.89, "learning_rate": 0.00016664584310787726, "loss": 0.0123, "step": 342970 }, { "epoch": 0.89, "learning_rate": 0.0001666419548915058, "loss": 0.0138, "step": 342980 }, { "epoch": 0.89, "learning_rate": 0.0001666380666751343, "loss": 0.0117, "step": 342990 }, { "epoch": 0.89, "learning_rate": 0.00016663417845876285, "loss": 0.0133, "step": 343000 }, { "epoch": 0.89, "eval_cer": 0.8817236808771804, "eval_loss": 0.008914493024349213, "eval_runtime": 107.4576, "eval_samples_per_second": 18.612, "eval_steps_per_second": 4.653, "step": 343000 }, { "epoch": 0.89, "learning_rate": 0.0001666302902423914, "loss": 0.0131, "step": 343010 }, { "epoch": 0.89, "learning_rate": 0.00016662640202601994, "loss": 0.0119, "step": 343020 }, { "epoch": 0.89, "learning_rate": 0.00016662251380964845, "loss": 0.0125, "step": 343030 }, { "epoch": 0.89, "learning_rate": 0.000166618625593277, "loss": 0.0132, "step": 343040 }, { "epoch": 0.89, "learning_rate": 0.00016661473737690556, "loss": 0.0138, "step": 343050 }, { "epoch": 0.89, "learning_rate": 0.00016661084916053408, "loss": 0.0157, "step": 343060 }, { "epoch": 0.89, "learning_rate": 0.0001666069609441626, "loss": 0.0111, "step": 343070 }, { "epoch": 0.89, "learning_rate": 0.00016660307272779113, "loss": 0.0123, "step": 343080 }, { "epoch": 0.89, "learning_rate": 0.0001665991845114197, "loss": 0.0132, "step": 343090 }, { "epoch": 0.89, "learning_rate": 0.00016659529629504822, "loss": 0.0129, "step": 343100 }, { "epoch": 0.89, "learning_rate": 0.00016659140807867676, "loss": 0.0158, "step": 343110 }, { "epoch": 0.89, "learning_rate": 0.00016658751986230527, "loss": 0.0149, "step": 343120 }, { "epoch": 0.89, "learning_rate": 0.00016658363164593384, "loss": 0.0138, "step": 343130 }, { "epoch": 0.89, "learning_rate": 0.00016657974342956236, "loss": 0.0142, "step": 343140 }, { "epoch": 0.89, "learning_rate": 0.0001665758552131909, "loss": 0.0115, "step": 343150 }, { "epoch": 0.89, "learning_rate": 0.0001665719669968194, "loss": 0.0123, "step": 343160 }, { "epoch": 0.89, "learning_rate": 0.00016656807878044795, "loss": 0.0126, "step": 343170 }, { "epoch": 0.89, "learning_rate": 0.0001665641905640765, "loss": 0.0125, "step": 343180 }, { "epoch": 0.89, "learning_rate": 0.00016656030234770504, "loss": 0.0137, "step": 343190 }, { "epoch": 0.89, "learning_rate": 0.00016655641413133355, "loss": 0.0146, "step": 343200 }, { "epoch": 0.89, "learning_rate": 0.0001665525259149621, "loss": 0.0119, "step": 343210 }, { "epoch": 0.89, "learning_rate": 0.00016654863769859063, "loss": 0.0141, "step": 343220 }, { "epoch": 0.89, "learning_rate": 0.00016654474948221918, "loss": 0.0134, "step": 343230 }, { "epoch": 0.89, "learning_rate": 0.0001665408612658477, "loss": 0.0162, "step": 343240 }, { "epoch": 0.89, "learning_rate": 0.00016653697304947623, "loss": 0.0165, "step": 343250 }, { "epoch": 0.89, "learning_rate": 0.0001665330848331048, "loss": 0.013, "step": 343260 }, { "epoch": 0.89, "learning_rate": 0.00016652919661673332, "loss": 0.0117, "step": 343270 }, { "epoch": 0.89, "learning_rate": 0.00016652530840036186, "loss": 0.0138, "step": 343280 }, { "epoch": 0.89, "learning_rate": 0.00016652142018399037, "loss": 0.011, "step": 343290 }, { "epoch": 0.89, "learning_rate": 0.00016651753196761894, "loss": 0.0132, "step": 343300 }, { "epoch": 0.89, "learning_rate": 0.00016651364375124745, "loss": 0.0144, "step": 343310 }, { "epoch": 0.89, "learning_rate": 0.000166509755534876, "loss": 0.0126, "step": 343320 }, { "epoch": 0.89, "learning_rate": 0.0001665058673185045, "loss": 0.0141, "step": 343330 }, { "epoch": 0.89, "learning_rate": 0.00016650197910213308, "loss": 0.0154, "step": 343340 }, { "epoch": 0.89, "learning_rate": 0.0001664980908857616, "loss": 0.0129, "step": 343350 }, { "epoch": 0.89, "learning_rate": 0.00016649420266939014, "loss": 0.0155, "step": 343360 }, { "epoch": 0.89, "learning_rate": 0.00016649031445301865, "loss": 0.0124, "step": 343370 }, { "epoch": 0.89, "learning_rate": 0.0001664864262366472, "loss": 0.0192, "step": 343380 }, { "epoch": 0.89, "learning_rate": 0.00016648253802027573, "loss": 0.0142, "step": 343390 }, { "epoch": 0.89, "learning_rate": 0.00016647864980390428, "loss": 0.0151, "step": 343400 }, { "epoch": 0.89, "learning_rate": 0.0001664747615875328, "loss": 0.0146, "step": 343410 }, { "epoch": 0.89, "learning_rate": 0.00016647087337116133, "loss": 0.0139, "step": 343420 }, { "epoch": 0.89, "learning_rate": 0.0001664669851547899, "loss": 0.0144, "step": 343430 }, { "epoch": 0.89, "learning_rate": 0.00016646309693841841, "loss": 0.0155, "step": 343440 }, { "epoch": 0.89, "learning_rate": 0.00016645920872204696, "loss": 0.0141, "step": 343450 }, { "epoch": 0.89, "learning_rate": 0.00016645532050567547, "loss": 0.0107, "step": 343460 }, { "epoch": 0.89, "learning_rate": 0.00016645143228930404, "loss": 0.0141, "step": 343470 }, { "epoch": 0.89, "learning_rate": 0.00016644754407293255, "loss": 0.011, "step": 343480 }, { "epoch": 0.89, "learning_rate": 0.0001664436558565611, "loss": 0.0375, "step": 343490 }, { "epoch": 0.89, "learning_rate": 0.0001664397676401896, "loss": 0.0137, "step": 343500 }, { "epoch": 0.89, "learning_rate": 0.00016643587942381818, "loss": 0.015, "step": 343510 }, { "epoch": 0.89, "learning_rate": 0.0001664319912074467, "loss": 0.0165, "step": 343520 }, { "epoch": 0.89, "learning_rate": 0.00016642810299107524, "loss": 0.014, "step": 343530 }, { "epoch": 0.89, "learning_rate": 0.00016642421477470375, "loss": 0.0119, "step": 343540 }, { "epoch": 0.89, "learning_rate": 0.00016642032655833232, "loss": 0.0126, "step": 343550 }, { "epoch": 0.89, "learning_rate": 0.00016641643834196083, "loss": 0.0126, "step": 343560 }, { "epoch": 0.89, "learning_rate": 0.00016641255012558937, "loss": 0.0119, "step": 343570 }, { "epoch": 0.89, "learning_rate": 0.0001664086619092179, "loss": 0.0123, "step": 343580 }, { "epoch": 0.89, "learning_rate": 0.00016640477369284646, "loss": 0.0155, "step": 343590 }, { "epoch": 0.89, "learning_rate": 0.000166400885476475, "loss": 0.0156, "step": 343600 }, { "epoch": 0.89, "learning_rate": 0.00016639699726010351, "loss": 0.014, "step": 343610 }, { "epoch": 0.89, "learning_rate": 0.00016639310904373206, "loss": 0.0166, "step": 343620 }, { "epoch": 0.89, "learning_rate": 0.00016638922082736057, "loss": 0.0133, "step": 343630 }, { "epoch": 0.89, "learning_rate": 0.00016638533261098914, "loss": 0.0157, "step": 343640 }, { "epoch": 0.89, "learning_rate": 0.00016638144439461765, "loss": 0.0121, "step": 343650 }, { "epoch": 0.89, "learning_rate": 0.0001663775561782462, "loss": 0.0144, "step": 343660 }, { "epoch": 0.89, "learning_rate": 0.0001663736679618747, "loss": 0.0157, "step": 343670 }, { "epoch": 0.89, "learning_rate": 0.00016636977974550328, "loss": 0.0139, "step": 343680 }, { "epoch": 0.89, "learning_rate": 0.0001663658915291318, "loss": 0.015, "step": 343690 }, { "epoch": 0.89, "learning_rate": 0.00016636200331276033, "loss": 0.0123, "step": 343700 }, { "epoch": 0.89, "learning_rate": 0.00016635811509638885, "loss": 0.0126, "step": 343710 }, { "epoch": 0.89, "learning_rate": 0.00016635422688001742, "loss": 0.0148, "step": 343720 }, { "epoch": 0.89, "learning_rate": 0.00016635033866364593, "loss": 0.0116, "step": 343730 }, { "epoch": 0.89, "learning_rate": 0.00016634645044727447, "loss": 0.0122, "step": 343740 }, { "epoch": 0.89, "learning_rate": 0.000166342562230903, "loss": 0.0156, "step": 343750 }, { "epoch": 0.89, "learning_rate": 0.00016633867401453156, "loss": 0.0145, "step": 343760 }, { "epoch": 0.89, "learning_rate": 0.0001663347857981601, "loss": 0.0122, "step": 343770 }, { "epoch": 0.89, "learning_rate": 0.00016633089758178861, "loss": 0.0135, "step": 343780 }, { "epoch": 0.89, "learning_rate": 0.00016632700936541713, "loss": 0.0128, "step": 343790 }, { "epoch": 0.89, "learning_rate": 0.0001663231211490457, "loss": 0.0111, "step": 343800 }, { "epoch": 0.89, "learning_rate": 0.00016631923293267424, "loss": 0.013, "step": 343810 }, { "epoch": 0.89, "learning_rate": 0.00016631534471630275, "loss": 0.0147, "step": 343820 }, { "epoch": 0.89, "learning_rate": 0.0001663114564999313, "loss": 0.0145, "step": 343830 }, { "epoch": 0.89, "learning_rate": 0.00016630756828355984, "loss": 0.021, "step": 343840 }, { "epoch": 0.89, "learning_rate": 0.00016630368006718838, "loss": 0.0127, "step": 343850 }, { "epoch": 0.89, "learning_rate": 0.0001662997918508169, "loss": 0.0138, "step": 343860 }, { "epoch": 0.89, "learning_rate": 0.00016629590363444543, "loss": 0.0135, "step": 343870 }, { "epoch": 0.89, "learning_rate": 0.00016629201541807395, "loss": 0.0134, "step": 343880 }, { "epoch": 0.89, "learning_rate": 0.00016628812720170252, "loss": 0.0136, "step": 343890 }, { "epoch": 0.89, "learning_rate": 0.00016628423898533103, "loss": 0.0112, "step": 343900 }, { "epoch": 0.89, "learning_rate": 0.00016628035076895957, "loss": 0.0129, "step": 343910 }, { "epoch": 0.89, "learning_rate": 0.0001662764625525881, "loss": 0.0139, "step": 343920 }, { "epoch": 0.89, "learning_rate": 0.00016627257433621666, "loss": 0.0159, "step": 343930 }, { "epoch": 0.89, "learning_rate": 0.00016626868611984517, "loss": 0.0127, "step": 343940 }, { "epoch": 0.89, "learning_rate": 0.0001662647979034737, "loss": 0.0126, "step": 343950 }, { "epoch": 0.89, "learning_rate": 0.00016626090968710223, "loss": 0.0138, "step": 343960 }, { "epoch": 0.89, "learning_rate": 0.0001662570214707308, "loss": 0.0129, "step": 343970 }, { "epoch": 0.89, "learning_rate": 0.00016625313325435934, "loss": 0.0105, "step": 343980 }, { "epoch": 0.89, "learning_rate": 0.00016624924503798785, "loss": 0.0122, "step": 343990 }, { "epoch": 0.89, "learning_rate": 0.0001662453568216164, "loss": 0.0123, "step": 344000 }, { "epoch": 0.89, "eval_cer": 0.8817558725266665, "eval_loss": 0.008971183560788631, "eval_runtime": 107.4319, "eval_samples_per_second": 18.616, "eval_steps_per_second": 4.654, "step": 344000 }, { "epoch": 0.89, "learning_rate": 0.00016624146860524494, "loss": 0.0164, "step": 344010 }, { "epoch": 0.89, "learning_rate": 0.00016623758038887348, "loss": 0.0116, "step": 344020 }, { "epoch": 0.89, "learning_rate": 0.000166233692172502, "loss": 0.0129, "step": 344030 }, { "epoch": 0.89, "learning_rate": 0.00016622980395613053, "loss": 0.0159, "step": 344040 }, { "epoch": 0.89, "learning_rate": 0.00016622591573975908, "loss": 0.0154, "step": 344050 }, { "epoch": 0.89, "learning_rate": 0.00016622202752338762, "loss": 0.0135, "step": 344060 }, { "epoch": 0.89, "learning_rate": 0.00016621813930701613, "loss": 0.0168, "step": 344070 }, { "epoch": 0.89, "learning_rate": 0.00016621425109064467, "loss": 0.0153, "step": 344080 }, { "epoch": 0.89, "learning_rate": 0.00016621036287427324, "loss": 0.0157, "step": 344090 }, { "epoch": 0.89, "learning_rate": 0.00016620647465790176, "loss": 0.0122, "step": 344100 }, { "epoch": 0.89, "learning_rate": 0.00016620258644153027, "loss": 0.0131, "step": 344110 }, { "epoch": 0.89, "learning_rate": 0.0001661986982251588, "loss": 0.0125, "step": 344120 }, { "epoch": 0.89, "learning_rate": 0.00016619481000878733, "loss": 0.0126, "step": 344130 }, { "epoch": 0.89, "learning_rate": 0.0001661909217924159, "loss": 0.0161, "step": 344140 }, { "epoch": 0.89, "learning_rate": 0.00016618703357604444, "loss": 0.0122, "step": 344150 }, { "epoch": 0.89, "learning_rate": 0.00016618314535967295, "loss": 0.0129, "step": 344160 }, { "epoch": 0.89, "learning_rate": 0.0001661792571433015, "loss": 0.014, "step": 344170 }, { "epoch": 0.89, "learning_rate": 0.00016617536892693004, "loss": 0.0111, "step": 344180 }, { "epoch": 0.89, "learning_rate": 0.00016617148071055858, "loss": 0.0113, "step": 344190 }, { "epoch": 0.89, "learning_rate": 0.0001661675924941871, "loss": 0.0129, "step": 344200 }, { "epoch": 0.89, "learning_rate": 0.00016616370427781563, "loss": 0.015, "step": 344210 }, { "epoch": 0.89, "learning_rate": 0.00016615981606144417, "loss": 0.0127, "step": 344220 }, { "epoch": 0.89, "learning_rate": 0.00016615592784507272, "loss": 0.0164, "step": 344230 }, { "epoch": 0.89, "learning_rate": 0.00016615203962870123, "loss": 0.0125, "step": 344240 }, { "epoch": 0.89, "learning_rate": 0.00016614815141232977, "loss": 0.0152, "step": 344250 }, { "epoch": 0.89, "learning_rate": 0.00016614426319595831, "loss": 0.0128, "step": 344260 }, { "epoch": 0.89, "learning_rate": 0.00016614037497958686, "loss": 0.0135, "step": 344270 }, { "epoch": 0.89, "learning_rate": 0.00016613648676321537, "loss": 0.0165, "step": 344280 }, { "epoch": 0.89, "learning_rate": 0.0001661325985468439, "loss": 0.0133, "step": 344290 }, { "epoch": 0.89, "learning_rate": 0.00016612871033047248, "loss": 0.0114, "step": 344300 }, { "epoch": 0.89, "learning_rate": 0.000166124822114101, "loss": 0.0117, "step": 344310 }, { "epoch": 0.89, "learning_rate": 0.00016612093389772954, "loss": 0.0177, "step": 344320 }, { "epoch": 0.89, "learning_rate": 0.00016611704568135805, "loss": 0.0098, "step": 344330 }, { "epoch": 0.89, "learning_rate": 0.00016611315746498662, "loss": 0.0145, "step": 344340 }, { "epoch": 0.89, "learning_rate": 0.00016610926924861513, "loss": 0.0118, "step": 344350 }, { "epoch": 0.89, "learning_rate": 0.00016610538103224368, "loss": 0.0138, "step": 344360 }, { "epoch": 0.89, "learning_rate": 0.0001661014928158722, "loss": 0.0106, "step": 344370 }, { "epoch": 0.89, "learning_rate": 0.00016609760459950073, "loss": 0.0166, "step": 344380 }, { "epoch": 0.89, "learning_rate": 0.00016609371638312927, "loss": 0.0107, "step": 344390 }, { "epoch": 0.89, "learning_rate": 0.00016608982816675782, "loss": 0.0129, "step": 344400 }, { "epoch": 0.89, "learning_rate": 0.00016608593995038633, "loss": 0.0181, "step": 344410 }, { "epoch": 0.89, "learning_rate": 0.00016608205173401487, "loss": 0.0173, "step": 344420 }, { "epoch": 0.89, "learning_rate": 0.00016607816351764341, "loss": 0.013, "step": 344430 }, { "epoch": 0.89, "learning_rate": 0.00016607427530127196, "loss": 0.0113, "step": 344440 }, { "epoch": 0.89, "learning_rate": 0.00016607038708490047, "loss": 0.0113, "step": 344450 }, { "epoch": 0.89, "learning_rate": 0.000166066498868529, "loss": 0.0146, "step": 344460 }, { "epoch": 0.89, "learning_rate": 0.00016606261065215758, "loss": 0.0147, "step": 344470 }, { "epoch": 0.89, "learning_rate": 0.0001660587224357861, "loss": 0.009, "step": 344480 }, { "epoch": 0.89, "learning_rate": 0.00016605483421941464, "loss": 0.0136, "step": 344490 }, { "epoch": 0.89, "learning_rate": 0.00016605094600304315, "loss": 0.0106, "step": 344500 }, { "epoch": 0.89, "learning_rate": 0.00016604705778667172, "loss": 0.0121, "step": 344510 }, { "epoch": 0.89, "learning_rate": 0.00016604316957030023, "loss": 0.0122, "step": 344520 }, { "epoch": 0.89, "learning_rate": 0.00016603928135392878, "loss": 0.012, "step": 344530 }, { "epoch": 0.89, "learning_rate": 0.0001660353931375573, "loss": 0.015, "step": 344540 }, { "epoch": 0.89, "learning_rate": 0.00016603150492118586, "loss": 0.0116, "step": 344550 }, { "epoch": 0.89, "learning_rate": 0.00016602761670481437, "loss": 0.0134, "step": 344560 }, { "epoch": 0.89, "learning_rate": 0.00016602372848844292, "loss": 0.0169, "step": 344570 }, { "epoch": 0.89, "learning_rate": 0.00016601984027207143, "loss": 0.0136, "step": 344580 }, { "epoch": 0.89, "learning_rate": 0.0001660159520557, "loss": 0.0126, "step": 344590 }, { "epoch": 0.89, "learning_rate": 0.0001660120638393285, "loss": 0.0116, "step": 344600 }, { "epoch": 0.89, "learning_rate": 0.00016600817562295705, "loss": 0.0099, "step": 344610 }, { "epoch": 0.89, "learning_rate": 0.00016600428740658557, "loss": 0.016, "step": 344620 }, { "epoch": 0.89, "learning_rate": 0.0001660003991902141, "loss": 0.0132, "step": 344630 }, { "epoch": 0.89, "learning_rate": 0.00016599651097384268, "loss": 0.0176, "step": 344640 }, { "epoch": 0.89, "learning_rate": 0.0001659926227574712, "loss": 0.0157, "step": 344650 }, { "epoch": 0.89, "learning_rate": 0.0001659887345410997, "loss": 0.0119, "step": 344660 }, { "epoch": 0.89, "learning_rate": 0.00016598484632472825, "loss": 0.0138, "step": 344670 }, { "epoch": 0.89, "learning_rate": 0.00016598095810835682, "loss": 0.0123, "step": 344680 }, { "epoch": 0.89, "learning_rate": 0.00016597706989198533, "loss": 0.0128, "step": 344690 }, { "epoch": 0.89, "learning_rate": 0.00016597318167561388, "loss": 0.0151, "step": 344700 }, { "epoch": 0.89, "learning_rate": 0.0001659692934592424, "loss": 0.0135, "step": 344710 }, { "epoch": 0.89, "learning_rate": 0.00016596540524287096, "loss": 0.0134, "step": 344720 }, { "epoch": 0.89, "learning_rate": 0.00016596151702649947, "loss": 0.0149, "step": 344730 }, { "epoch": 0.89, "learning_rate": 0.00016595762881012801, "loss": 0.0135, "step": 344740 }, { "epoch": 0.89, "learning_rate": 0.00016595374059375653, "loss": 0.0131, "step": 344750 }, { "epoch": 0.89, "learning_rate": 0.0001659498523773851, "loss": 0.016, "step": 344760 }, { "epoch": 0.89, "learning_rate": 0.0001659459641610136, "loss": 0.0144, "step": 344770 }, { "epoch": 0.89, "learning_rate": 0.00016594207594464215, "loss": 0.0156, "step": 344780 }, { "epoch": 0.89, "learning_rate": 0.00016593818772827067, "loss": 0.0146, "step": 344790 }, { "epoch": 0.89, "learning_rate": 0.00016593429951189924, "loss": 0.0115, "step": 344800 }, { "epoch": 0.89, "learning_rate": 0.00016593041129552775, "loss": 0.0121, "step": 344810 }, { "epoch": 0.89, "learning_rate": 0.0001659265230791563, "loss": 0.0147, "step": 344820 }, { "epoch": 0.89, "learning_rate": 0.0001659226348627848, "loss": 0.0099, "step": 344830 }, { "epoch": 0.89, "learning_rate": 0.00016591874664641338, "loss": 0.0123, "step": 344840 }, { "epoch": 0.89, "learning_rate": 0.00016591485843004192, "loss": 0.0141, "step": 344850 }, { "epoch": 0.89, "learning_rate": 0.00016591097021367043, "loss": 0.014, "step": 344860 }, { "epoch": 0.89, "learning_rate": 0.00016590708199729897, "loss": 0.0118, "step": 344870 }, { "epoch": 0.89, "learning_rate": 0.0001659031937809275, "loss": 0.0122, "step": 344880 }, { "epoch": 0.89, "learning_rate": 0.00016589930556455606, "loss": 0.0132, "step": 344890 }, { "epoch": 0.89, "learning_rate": 0.00016589541734818457, "loss": 0.0173, "step": 344900 }, { "epoch": 0.89, "learning_rate": 0.00016589152913181311, "loss": 0.0134, "step": 344910 }, { "epoch": 0.89, "learning_rate": 0.00016588764091544163, "loss": 0.0098, "step": 344920 }, { "epoch": 0.89, "learning_rate": 0.0001658837526990702, "loss": 0.0164, "step": 344930 }, { "epoch": 0.89, "learning_rate": 0.0001658798644826987, "loss": 0.0148, "step": 344940 }, { "epoch": 0.89, "learning_rate": 0.00016587597626632725, "loss": 0.0154, "step": 344950 }, { "epoch": 0.89, "learning_rate": 0.00016587208804995577, "loss": 0.0124, "step": 344960 }, { "epoch": 0.89, "learning_rate": 0.00016586819983358434, "loss": 0.0142, "step": 344970 }, { "epoch": 0.89, "learning_rate": 0.00016586431161721285, "loss": 0.0119, "step": 344980 }, { "epoch": 0.89, "learning_rate": 0.0001658604234008414, "loss": 0.0159, "step": 344990 }, { "epoch": 0.89, "learning_rate": 0.0001658565351844699, "loss": 0.0155, "step": 345000 }, { "epoch": 0.89, "eval_cer": 0.8817334783357197, "eval_loss": 0.008910181932151318, "eval_runtime": 107.3178, "eval_samples_per_second": 18.636, "eval_steps_per_second": 4.659, "step": 345000 }, { "epoch": 0.89, "learning_rate": 0.00016585264696809848, "loss": 0.0124, "step": 345010 }, { "epoch": 0.89, "learning_rate": 0.00016584875875172702, "loss": 0.0131, "step": 345020 }, { "epoch": 0.89, "learning_rate": 0.00016584487053535553, "loss": 0.0139, "step": 345030 }, { "epoch": 0.89, "learning_rate": 0.00016584098231898407, "loss": 0.0161, "step": 345040 }, { "epoch": 0.89, "learning_rate": 0.00016583709410261262, "loss": 0.0104, "step": 345050 }, { "epoch": 0.89, "learning_rate": 0.00016583320588624116, "loss": 0.0153, "step": 345060 }, { "epoch": 0.89, "learning_rate": 0.00016582931766986967, "loss": 0.014, "step": 345070 }, { "epoch": 0.89, "learning_rate": 0.0001658254294534982, "loss": 0.0122, "step": 345080 }, { "epoch": 0.89, "learning_rate": 0.00016582154123712676, "loss": 0.0118, "step": 345090 }, { "epoch": 0.89, "learning_rate": 0.0001658176530207553, "loss": 0.0125, "step": 345100 }, { "epoch": 0.89, "learning_rate": 0.0001658137648043838, "loss": 0.0127, "step": 345110 }, { "epoch": 0.89, "learning_rate": 0.00016580987658801235, "loss": 0.0117, "step": 345120 }, { "epoch": 0.89, "learning_rate": 0.00016580598837164087, "loss": 0.0117, "step": 345130 }, { "epoch": 0.89, "learning_rate": 0.00016580210015526944, "loss": 0.0131, "step": 345140 }, { "epoch": 0.89, "learning_rate": 0.00016579821193889795, "loss": 0.0098, "step": 345150 }, { "epoch": 0.89, "learning_rate": 0.0001657943237225265, "loss": 0.0097, "step": 345160 }, { "epoch": 0.89, "learning_rate": 0.000165790435506155, "loss": 0.0099, "step": 345170 }, { "epoch": 0.89, "learning_rate": 0.00016578654728978358, "loss": 0.0137, "step": 345180 }, { "epoch": 0.89, "learning_rate": 0.00016578265907341212, "loss": 0.014, "step": 345190 }, { "epoch": 0.89, "learning_rate": 0.00016577877085704063, "loss": 0.0123, "step": 345200 }, { "epoch": 0.89, "learning_rate": 0.00016577488264066917, "loss": 0.0132, "step": 345210 }, { "epoch": 0.89, "learning_rate": 0.00016577099442429772, "loss": 0.0149, "step": 345220 }, { "epoch": 0.89, "learning_rate": 0.00016576710620792626, "loss": 0.0116, "step": 345230 }, { "epoch": 0.89, "learning_rate": 0.00016576321799155477, "loss": 0.0116, "step": 345240 }, { "epoch": 0.89, "learning_rate": 0.0001657593297751833, "loss": 0.0151, "step": 345250 }, { "epoch": 0.89, "learning_rate": 0.00016575544155881185, "loss": 0.0142, "step": 345260 }, { "epoch": 0.89, "learning_rate": 0.0001657515533424404, "loss": 0.0114, "step": 345270 }, { "epoch": 0.9, "learning_rate": 0.0001657476651260689, "loss": 0.0158, "step": 345280 }, { "epoch": 0.9, "learning_rate": 0.00016574377690969745, "loss": 0.0112, "step": 345290 }, { "epoch": 0.9, "learning_rate": 0.000165739888693326, "loss": 0.0123, "step": 345300 }, { "epoch": 0.9, "learning_rate": 0.00016573600047695454, "loss": 0.0125, "step": 345310 }, { "epoch": 0.9, "learning_rate": 0.00016573211226058305, "loss": 0.0151, "step": 345320 }, { "epoch": 0.9, "learning_rate": 0.0001657282240442116, "loss": 0.009, "step": 345330 }, { "epoch": 0.9, "learning_rate": 0.00016572433582784016, "loss": 0.0111, "step": 345340 }, { "epoch": 0.9, "learning_rate": 0.00016572044761146868, "loss": 0.014, "step": 345350 }, { "epoch": 0.9, "learning_rate": 0.00016571655939509722, "loss": 0.0127, "step": 345360 }, { "epoch": 0.9, "learning_rate": 0.00016571267117872573, "loss": 0.0132, "step": 345370 }, { "epoch": 0.9, "learning_rate": 0.00016570878296235425, "loss": 0.0117, "step": 345380 }, { "epoch": 0.9, "learning_rate": 0.00016570489474598281, "loss": 0.017, "step": 345390 }, { "epoch": 0.9, "learning_rate": 0.00016570100652961136, "loss": 0.011, "step": 345400 }, { "epoch": 0.9, "learning_rate": 0.00016569711831323987, "loss": 0.0146, "step": 345410 }, { "epoch": 0.9, "learning_rate": 0.0001656932300968684, "loss": 0.0144, "step": 345420 }, { "epoch": 0.9, "learning_rate": 0.00016568934188049695, "loss": 0.0122, "step": 345430 }, { "epoch": 0.9, "learning_rate": 0.0001656854536641255, "loss": 0.0127, "step": 345440 }, { "epoch": 0.9, "learning_rate": 0.000165681565447754, "loss": 0.0153, "step": 345450 }, { "epoch": 0.9, "learning_rate": 0.00016567767723138255, "loss": 0.0102, "step": 345460 }, { "epoch": 0.9, "learning_rate": 0.0001656737890150111, "loss": 0.0142, "step": 345470 }, { "epoch": 0.9, "learning_rate": 0.00016566990079863964, "loss": 0.0122, "step": 345480 }, { "epoch": 0.9, "learning_rate": 0.00016566601258226815, "loss": 0.0124, "step": 345490 }, { "epoch": 0.9, "learning_rate": 0.0001656621243658967, "loss": 0.0133, "step": 345500 }, { "epoch": 0.9, "learning_rate": 0.00016565823614952526, "loss": 0.0144, "step": 345510 }, { "epoch": 0.9, "learning_rate": 0.00016565434793315377, "loss": 0.012, "step": 345520 }, { "epoch": 0.9, "learning_rate": 0.0001656504597167823, "loss": 0.016, "step": 345530 }, { "epoch": 0.9, "learning_rate": 0.00016564657150041083, "loss": 0.0095, "step": 345540 }, { "epoch": 0.9, "learning_rate": 0.0001656426832840394, "loss": 0.016, "step": 345550 }, { "epoch": 0.9, "learning_rate": 0.00016563879506766791, "loss": 0.0109, "step": 345560 }, { "epoch": 0.9, "learning_rate": 0.00016563490685129646, "loss": 0.012, "step": 345570 }, { "epoch": 0.9, "learning_rate": 0.00016563101863492497, "loss": 0.0143, "step": 345580 }, { "epoch": 0.9, "learning_rate": 0.00016562713041855354, "loss": 0.0126, "step": 345590 }, { "epoch": 0.9, "learning_rate": 0.00016562324220218205, "loss": 0.0127, "step": 345600 }, { "epoch": 0.9, "learning_rate": 0.0001656193539858106, "loss": 0.0127, "step": 345610 }, { "epoch": 0.9, "learning_rate": 0.0001656154657694391, "loss": 0.0147, "step": 345620 }, { "epoch": 0.9, "learning_rate": 0.00016561157755306765, "loss": 0.0119, "step": 345630 }, { "epoch": 0.9, "learning_rate": 0.0001656076893366962, "loss": 0.0141, "step": 345640 }, { "epoch": 0.9, "learning_rate": 0.00016560380112032473, "loss": 0.0111, "step": 345650 }, { "epoch": 0.9, "learning_rate": 0.00016559991290395325, "loss": 0.0155, "step": 345660 }, { "epoch": 0.9, "learning_rate": 0.0001655960246875818, "loss": 0.0118, "step": 345670 }, { "epoch": 0.9, "learning_rate": 0.00016559213647121036, "loss": 0.0127, "step": 345680 }, { "epoch": 0.9, "learning_rate": 0.00016558824825483887, "loss": 0.015, "step": 345690 }, { "epoch": 0.9, "learning_rate": 0.0001655843600384674, "loss": 0.02, "step": 345700 }, { "epoch": 0.9, "learning_rate": 0.00016558047182209593, "loss": 0.0156, "step": 345710 }, { "epoch": 0.9, "learning_rate": 0.0001655765836057245, "loss": 0.0143, "step": 345720 }, { "epoch": 0.9, "learning_rate": 0.000165572695389353, "loss": 0.0139, "step": 345730 }, { "epoch": 0.9, "learning_rate": 0.00016556880717298155, "loss": 0.0159, "step": 345740 }, { "epoch": 0.9, "learning_rate": 0.00016556491895661007, "loss": 0.0102, "step": 345750 }, { "epoch": 0.9, "learning_rate": 0.00016556103074023864, "loss": 0.016, "step": 345760 }, { "epoch": 0.9, "learning_rate": 0.00016555714252386715, "loss": 0.0115, "step": 345770 }, { "epoch": 0.9, "learning_rate": 0.0001655532543074957, "loss": 0.0118, "step": 345780 }, { "epoch": 0.9, "learning_rate": 0.0001655493660911242, "loss": 0.0145, "step": 345790 }, { "epoch": 0.9, "learning_rate": 0.00016554547787475278, "loss": 0.0114, "step": 345800 }, { "epoch": 0.9, "learning_rate": 0.0001655415896583813, "loss": 0.0136, "step": 345810 }, { "epoch": 0.9, "learning_rate": 0.00016553770144200983, "loss": 0.0104, "step": 345820 }, { "epoch": 0.9, "learning_rate": 0.00016553381322563835, "loss": 0.0095, "step": 345830 }, { "epoch": 0.9, "learning_rate": 0.00016552992500926692, "loss": 0.0136, "step": 345840 }, { "epoch": 0.9, "learning_rate": 0.00016552603679289543, "loss": 0.012, "step": 345850 }, { "epoch": 0.9, "learning_rate": 0.00016552214857652397, "loss": 0.014, "step": 345860 }, { "epoch": 0.9, "learning_rate": 0.0001655182603601525, "loss": 0.0181, "step": 345870 }, { "epoch": 0.9, "learning_rate": 0.00016551437214378103, "loss": 0.0154, "step": 345880 }, { "epoch": 0.9, "learning_rate": 0.0001655104839274096, "loss": 0.0124, "step": 345890 }, { "epoch": 0.9, "learning_rate": 0.0001655065957110381, "loss": 0.0139, "step": 345900 }, { "epoch": 0.9, "learning_rate": 0.00016550270749466665, "loss": 0.0173, "step": 345910 }, { "epoch": 0.9, "learning_rate": 0.00016549881927829517, "loss": 0.0129, "step": 345920 }, { "epoch": 0.9, "learning_rate": 0.00016549493106192374, "loss": 0.0116, "step": 345930 }, { "epoch": 0.9, "learning_rate": 0.00016549104284555225, "loss": 0.012, "step": 345940 }, { "epoch": 0.9, "learning_rate": 0.0001654871546291808, "loss": 0.0157, "step": 345950 }, { "epoch": 0.9, "learning_rate": 0.0001654832664128093, "loss": 0.0132, "step": 345960 }, { "epoch": 0.9, "learning_rate": 0.00016547937819643788, "loss": 0.0107, "step": 345970 }, { "epoch": 0.9, "learning_rate": 0.0001654754899800664, "loss": 0.0149, "step": 345980 }, { "epoch": 0.9, "learning_rate": 0.00016547160176369493, "loss": 0.016, "step": 345990 }, { "epoch": 0.9, "learning_rate": 0.00016546771354732345, "loss": 0.0109, "step": 346000 }, { "epoch": 0.9, "eval_cer": 0.8817082848709045, "eval_loss": 0.009006353095173836, "eval_runtime": 107.5267, "eval_samples_per_second": 18.6, "eval_steps_per_second": 4.65, "step": 346000 }, { "epoch": 0.9, "learning_rate": 0.00016546382533095202, "loss": 0.0119, "step": 346010 }, { "epoch": 0.9, "learning_rate": 0.00016545993711458053, "loss": 0.0151, "step": 346020 }, { "epoch": 0.9, "learning_rate": 0.00016545604889820907, "loss": 0.0149, "step": 346030 }, { "epoch": 0.9, "learning_rate": 0.0001654521606818376, "loss": 0.0154, "step": 346040 }, { "epoch": 0.9, "learning_rate": 0.00016544827246546616, "loss": 0.0135, "step": 346050 }, { "epoch": 0.9, "learning_rate": 0.0001654443842490947, "loss": 0.0141, "step": 346060 }, { "epoch": 0.9, "learning_rate": 0.0001654404960327232, "loss": 0.0135, "step": 346070 }, { "epoch": 0.9, "learning_rate": 0.00016543660781635175, "loss": 0.0131, "step": 346080 }, { "epoch": 0.9, "learning_rate": 0.0001654327195999803, "loss": 0.0121, "step": 346090 }, { "epoch": 0.9, "learning_rate": 0.00016542883138360884, "loss": 0.0105, "step": 346100 }, { "epoch": 0.9, "learning_rate": 0.00016542494316723735, "loss": 0.0104, "step": 346110 }, { "epoch": 0.9, "learning_rate": 0.0001654210549508659, "loss": 0.0111, "step": 346120 }, { "epoch": 0.9, "learning_rate": 0.0001654171667344944, "loss": 0.0129, "step": 346130 }, { "epoch": 0.9, "learning_rate": 0.00016541327851812298, "loss": 0.0113, "step": 346140 }, { "epoch": 0.9, "learning_rate": 0.0001654093903017515, "loss": 0.0124, "step": 346150 }, { "epoch": 0.9, "learning_rate": 0.00016540550208538003, "loss": 0.0128, "step": 346160 }, { "epoch": 0.9, "learning_rate": 0.00016540161386900855, "loss": 0.0161, "step": 346170 }, { "epoch": 0.9, "learning_rate": 0.00016539772565263712, "loss": 0.0098, "step": 346180 }, { "epoch": 0.9, "learning_rate": 0.00016539383743626563, "loss": 0.0117, "step": 346190 }, { "epoch": 0.9, "learning_rate": 0.00016538994921989417, "loss": 0.0131, "step": 346200 }, { "epoch": 0.9, "learning_rate": 0.0001653860610035227, "loss": 0.0142, "step": 346210 }, { "epoch": 0.9, "learning_rate": 0.00016538217278715126, "loss": 0.0135, "step": 346220 }, { "epoch": 0.9, "learning_rate": 0.0001653782845707798, "loss": 0.0116, "step": 346230 }, { "epoch": 0.9, "learning_rate": 0.0001653743963544083, "loss": 0.0122, "step": 346240 }, { "epoch": 0.9, "learning_rate": 0.00016537050813803683, "loss": 0.0144, "step": 346250 }, { "epoch": 0.9, "learning_rate": 0.0001653666199216654, "loss": 0.0105, "step": 346260 }, { "epoch": 0.9, "learning_rate": 0.00016536273170529394, "loss": 0.0156, "step": 346270 }, { "epoch": 0.9, "learning_rate": 0.00016535884348892245, "loss": 0.0114, "step": 346280 }, { "epoch": 0.9, "learning_rate": 0.000165354955272551, "loss": 0.0158, "step": 346290 }, { "epoch": 0.9, "learning_rate": 0.00016535106705617953, "loss": 0.0121, "step": 346300 }, { "epoch": 0.9, "learning_rate": 0.00016534717883980808, "loss": 0.0112, "step": 346310 }, { "epoch": 0.9, "learning_rate": 0.0001653432906234366, "loss": 0.011, "step": 346320 }, { "epoch": 0.9, "learning_rate": 0.00016533940240706513, "loss": 0.0126, "step": 346330 }, { "epoch": 0.9, "learning_rate": 0.00016533551419069367, "loss": 0.0154, "step": 346340 }, { "epoch": 0.9, "learning_rate": 0.00016533162597432222, "loss": 0.0129, "step": 346350 }, { "epoch": 0.9, "learning_rate": 0.00016532773775795073, "loss": 0.0111, "step": 346360 }, { "epoch": 0.9, "learning_rate": 0.00016532384954157927, "loss": 0.0144, "step": 346370 }, { "epoch": 0.9, "learning_rate": 0.00016531996132520779, "loss": 0.0199, "step": 346380 }, { "epoch": 0.9, "learning_rate": 0.00016531607310883635, "loss": 0.012, "step": 346390 }, { "epoch": 0.9, "learning_rate": 0.00016531218489246487, "loss": 0.0123, "step": 346400 }, { "epoch": 0.9, "learning_rate": 0.0001653082966760934, "loss": 0.012, "step": 346410 }, { "epoch": 0.9, "learning_rate": 0.00016530440845972193, "loss": 0.0117, "step": 346420 }, { "epoch": 0.9, "learning_rate": 0.0001653005202433505, "loss": 0.0122, "step": 346430 }, { "epoch": 0.9, "learning_rate": 0.00016529663202697904, "loss": 0.0123, "step": 346440 }, { "epoch": 0.9, "learning_rate": 0.00016529274381060755, "loss": 0.0131, "step": 346450 }, { "epoch": 0.9, "learning_rate": 0.0001652888555942361, "loss": 0.0104, "step": 346460 }, { "epoch": 0.9, "learning_rate": 0.00016528496737786463, "loss": 0.0162, "step": 346470 }, { "epoch": 0.9, "learning_rate": 0.00016528107916149318, "loss": 0.0115, "step": 346480 }, { "epoch": 0.9, "learning_rate": 0.0001652771909451217, "loss": 0.0155, "step": 346490 }, { "epoch": 0.9, "learning_rate": 0.00016527330272875023, "loss": 0.023, "step": 346500 }, { "epoch": 0.9, "learning_rate": 0.00016526941451237877, "loss": 0.0155, "step": 346510 }, { "epoch": 0.9, "learning_rate": 0.00016526552629600731, "loss": 0.0136, "step": 346520 }, { "epoch": 0.9, "learning_rate": 0.00016526163807963583, "loss": 0.0166, "step": 346530 }, { "epoch": 0.9, "learning_rate": 0.00016525774986326437, "loss": 0.0118, "step": 346540 }, { "epoch": 0.9, "learning_rate": 0.00016525386164689294, "loss": 0.0147, "step": 346550 }, { "epoch": 0.9, "learning_rate": 0.00016524997343052145, "loss": 0.0153, "step": 346560 }, { "epoch": 0.9, "learning_rate": 0.00016524608521414997, "loss": 0.0144, "step": 346570 }, { "epoch": 0.9, "learning_rate": 0.0001652421969977785, "loss": 0.011, "step": 346580 }, { "epoch": 0.9, "learning_rate": 0.00016523830878140708, "loss": 0.0158, "step": 346590 }, { "epoch": 0.9, "learning_rate": 0.0001652344205650356, "loss": 0.0137, "step": 346600 }, { "epoch": 0.9, "learning_rate": 0.00016523053234866414, "loss": 0.0112, "step": 346610 }, { "epoch": 0.9, "learning_rate": 0.00016522664413229265, "loss": 0.0162, "step": 346620 }, { "epoch": 0.9, "learning_rate": 0.0001652227559159212, "loss": 0.0116, "step": 346630 }, { "epoch": 0.9, "learning_rate": 0.00016521886769954973, "loss": 0.0121, "step": 346640 }, { "epoch": 0.9, "learning_rate": 0.00016521497948317827, "loss": 0.0181, "step": 346650 }, { "epoch": 0.9, "learning_rate": 0.0001652110912668068, "loss": 0.0168, "step": 346660 }, { "epoch": 0.9, "learning_rate": 0.00016520720305043533, "loss": 0.0132, "step": 346670 }, { "epoch": 0.9, "learning_rate": 0.00016520331483406387, "loss": 0.019, "step": 346680 }, { "epoch": 0.9, "learning_rate": 0.00016519942661769241, "loss": 0.0142, "step": 346690 }, { "epoch": 0.9, "learning_rate": 0.00016519553840132093, "loss": 0.0146, "step": 346700 }, { "epoch": 0.9, "learning_rate": 0.00016519165018494947, "loss": 0.0148, "step": 346710 }, { "epoch": 0.9, "learning_rate": 0.000165187761968578, "loss": 0.0113, "step": 346720 }, { "epoch": 0.9, "learning_rate": 0.00016518387375220655, "loss": 0.0116, "step": 346730 }, { "epoch": 0.9, "learning_rate": 0.00016517998553583507, "loss": 0.0152, "step": 346740 }, { "epoch": 0.9, "learning_rate": 0.0001651760973194636, "loss": 0.0121, "step": 346750 }, { "epoch": 0.9, "learning_rate": 0.00016517220910309218, "loss": 0.0128, "step": 346760 }, { "epoch": 0.9, "learning_rate": 0.0001651683208867207, "loss": 0.0149, "step": 346770 }, { "epoch": 0.9, "learning_rate": 0.00016516443267034923, "loss": 0.0122, "step": 346780 }, { "epoch": 0.9, "learning_rate": 0.00016516054445397775, "loss": 0.0138, "step": 346790 }, { "epoch": 0.9, "learning_rate": 0.00016515665623760632, "loss": 0.0097, "step": 346800 }, { "epoch": 0.9, "learning_rate": 0.00016515276802123483, "loss": 0.0112, "step": 346810 }, { "epoch": 0.9, "learning_rate": 0.00016514887980486337, "loss": 0.0131, "step": 346820 }, { "epoch": 0.9, "learning_rate": 0.0001651449915884919, "loss": 0.0143, "step": 346830 }, { "epoch": 0.9, "learning_rate": 0.00016514110337212046, "loss": 0.0144, "step": 346840 }, { "epoch": 0.9, "learning_rate": 0.00016513721515574897, "loss": 0.011, "step": 346850 }, { "epoch": 0.9, "learning_rate": 0.00016513332693937751, "loss": 0.0136, "step": 346860 }, { "epoch": 0.9, "learning_rate": 0.00016512943872300603, "loss": 0.0106, "step": 346870 }, { "epoch": 0.9, "learning_rate": 0.00016512555050663457, "loss": 0.0141, "step": 346880 }, { "epoch": 0.9, "learning_rate": 0.0001651216622902631, "loss": 0.0177, "step": 346890 }, { "epoch": 0.9, "learning_rate": 0.00016511777407389165, "loss": 0.0099, "step": 346900 }, { "epoch": 0.9, "learning_rate": 0.00016511388585752017, "loss": 0.0143, "step": 346910 }, { "epoch": 0.9, "learning_rate": 0.0001651099976411487, "loss": 0.0098, "step": 346920 }, { "epoch": 0.9, "learning_rate": 0.00016510610942477728, "loss": 0.0123, "step": 346930 }, { "epoch": 0.9, "learning_rate": 0.0001651022212084058, "loss": 0.0121, "step": 346940 }, { "epoch": 0.9, "learning_rate": 0.00016509833299203433, "loss": 0.0139, "step": 346950 }, { "epoch": 0.9, "learning_rate": 0.00016509444477566285, "loss": 0.0119, "step": 346960 }, { "epoch": 0.9, "learning_rate": 0.00016509055655929142, "loss": 0.012, "step": 346970 }, { "epoch": 0.9, "learning_rate": 0.00016508666834291993, "loss": 0.0124, "step": 346980 }, { "epoch": 0.9, "learning_rate": 0.00016508278012654847, "loss": 0.0125, "step": 346990 }, { "epoch": 0.9, "learning_rate": 0.000165078891910177, "loss": 0.0137, "step": 347000 }, { "epoch": 0.9, "eval_cer": 0.8817502739789299, "eval_loss": 0.008850464597344398, "eval_runtime": 107.5314, "eval_samples_per_second": 18.599, "eval_steps_per_second": 4.65, "step": 347000 }, { "epoch": 0.9, "learning_rate": 0.00016507500369380556, "loss": 0.0101, "step": 347010 }, { "epoch": 0.9, "learning_rate": 0.00016507111547743407, "loss": 0.0126, "step": 347020 }, { "epoch": 0.9, "learning_rate": 0.0001650672272610626, "loss": 0.0119, "step": 347030 }, { "epoch": 0.9, "learning_rate": 0.00016506333904469113, "loss": 0.0134, "step": 347040 }, { "epoch": 0.9, "learning_rate": 0.0001650594508283197, "loss": 0.0122, "step": 347050 }, { "epoch": 0.9, "learning_rate": 0.0001650555626119482, "loss": 0.0151, "step": 347060 }, { "epoch": 0.9, "learning_rate": 0.00016505167439557675, "loss": 0.0135, "step": 347070 }, { "epoch": 0.9, "learning_rate": 0.00016504778617920527, "loss": 0.0137, "step": 347080 }, { "epoch": 0.9, "learning_rate": 0.00016504389796283384, "loss": 0.0135, "step": 347090 }, { "epoch": 0.9, "learning_rate": 0.00016504000974646238, "loss": 0.0152, "step": 347100 }, { "epoch": 0.9, "learning_rate": 0.0001650361215300909, "loss": 0.0132, "step": 347110 }, { "epoch": 0.9, "learning_rate": 0.0001650322333137194, "loss": 0.0164, "step": 347120 }, { "epoch": 0.9, "learning_rate": 0.00016502834509734795, "loss": 0.0106, "step": 347130 }, { "epoch": 0.9, "learning_rate": 0.00016502445688097652, "loss": 0.0113, "step": 347140 }, { "epoch": 0.9, "learning_rate": 0.00016502056866460503, "loss": 0.0131, "step": 347150 }, { "epoch": 0.9, "learning_rate": 0.00016501668044823357, "loss": 0.014, "step": 347160 }, { "epoch": 0.9, "learning_rate": 0.0001650127922318621, "loss": 0.0119, "step": 347170 }, { "epoch": 0.9, "learning_rate": 0.00016500890401549066, "loss": 0.012, "step": 347180 }, { "epoch": 0.9, "learning_rate": 0.00016500501579911917, "loss": 0.013, "step": 347190 }, { "epoch": 0.9, "learning_rate": 0.0001650011275827477, "loss": 0.0139, "step": 347200 }, { "epoch": 0.9, "learning_rate": 0.00016499723936637623, "loss": 0.0121, "step": 347210 }, { "epoch": 0.9, "learning_rate": 0.0001649933511500048, "loss": 0.0149, "step": 347220 }, { "epoch": 0.9, "learning_rate": 0.0001649894629336333, "loss": 0.0143, "step": 347230 }, { "epoch": 0.9, "learning_rate": 0.00016498557471726185, "loss": 0.0126, "step": 347240 }, { "epoch": 0.9, "learning_rate": 0.00016498168650089037, "loss": 0.0132, "step": 347250 }, { "epoch": 0.9, "learning_rate": 0.00016497779828451894, "loss": 0.0135, "step": 347260 }, { "epoch": 0.9, "learning_rate": 0.00016497391006814748, "loss": 0.0116, "step": 347270 }, { "epoch": 0.9, "learning_rate": 0.000164970021851776, "loss": 0.0151, "step": 347280 }, { "epoch": 0.9, "learning_rate": 0.0001649661336354045, "loss": 0.0146, "step": 347290 }, { "epoch": 0.9, "learning_rate": 0.00016496224541903307, "loss": 0.0148, "step": 347300 }, { "epoch": 0.9, "learning_rate": 0.00016495835720266162, "loss": 0.0118, "step": 347310 }, { "epoch": 0.9, "learning_rate": 0.00016495446898629013, "loss": 0.0141, "step": 347320 }, { "epoch": 0.9, "learning_rate": 0.00016495058076991867, "loss": 0.013, "step": 347330 }, { "epoch": 0.9, "learning_rate": 0.00016494669255354721, "loss": 0.0125, "step": 347340 }, { "epoch": 0.9, "learning_rate": 0.00016494280433717576, "loss": 0.0125, "step": 347350 }, { "epoch": 0.9, "learning_rate": 0.00016493891612080427, "loss": 0.0131, "step": 347360 }, { "epoch": 0.9, "learning_rate": 0.0001649350279044328, "loss": 0.013, "step": 347370 }, { "epoch": 0.9, "learning_rate": 0.00016493113968806133, "loss": 0.0102, "step": 347380 }, { "epoch": 0.9, "learning_rate": 0.0001649272514716899, "loss": 0.013, "step": 347390 }, { "epoch": 0.9, "learning_rate": 0.0001649233632553184, "loss": 0.0156, "step": 347400 }, { "epoch": 0.9, "learning_rate": 0.00016491947503894695, "loss": 0.0186, "step": 347410 }, { "epoch": 0.9, "learning_rate": 0.00016491558682257547, "loss": 0.0128, "step": 347420 }, { "epoch": 0.9, "learning_rate": 0.00016491169860620403, "loss": 0.0155, "step": 347430 }, { "epoch": 0.9, "learning_rate": 0.00016490781038983255, "loss": 0.0093, "step": 347440 }, { "epoch": 0.9, "learning_rate": 0.0001649039221734611, "loss": 0.0131, "step": 347450 }, { "epoch": 0.9, "learning_rate": 0.0001649000339570896, "loss": 0.0137, "step": 347460 }, { "epoch": 0.9, "learning_rate": 0.00016489614574071817, "loss": 0.0133, "step": 347470 }, { "epoch": 0.9, "learning_rate": 0.00016489225752434672, "loss": 0.0124, "step": 347480 }, { "epoch": 0.9, "learning_rate": 0.00016488836930797523, "loss": 0.0121, "step": 347490 }, { "epoch": 0.9, "learning_rate": 0.00016488448109160377, "loss": 0.0096, "step": 347500 }, { "epoch": 0.9, "learning_rate": 0.00016488059287523231, "loss": 0.0109, "step": 347510 }, { "epoch": 0.9, "learning_rate": 0.00016487670465886086, "loss": 0.0146, "step": 347520 }, { "epoch": 0.9, "learning_rate": 0.00016487281644248937, "loss": 0.0161, "step": 347530 }, { "epoch": 0.9, "learning_rate": 0.0001648689282261179, "loss": 0.0157, "step": 347540 }, { "epoch": 0.9, "learning_rate": 0.00016486504000974645, "loss": 0.0142, "step": 347550 }, { "epoch": 0.9, "learning_rate": 0.000164861151793375, "loss": 0.0145, "step": 347560 }, { "epoch": 0.9, "learning_rate": 0.0001648572635770035, "loss": 0.0129, "step": 347570 }, { "epoch": 0.9, "learning_rate": 0.00016485337536063205, "loss": 0.0098, "step": 347580 }, { "epoch": 0.9, "learning_rate": 0.0001648494871442606, "loss": 0.0123, "step": 347590 }, { "epoch": 0.9, "learning_rate": 0.00016484559892788913, "loss": 0.0122, "step": 347600 }, { "epoch": 0.9, "learning_rate": 0.00016484171071151765, "loss": 0.0137, "step": 347610 }, { "epoch": 0.9, "learning_rate": 0.0001648378224951462, "loss": 0.0152, "step": 347620 }, { "epoch": 0.9, "learning_rate": 0.0001648339342787747, "loss": 0.0113, "step": 347630 }, { "epoch": 0.9, "learning_rate": 0.00016483004606240327, "loss": 0.013, "step": 347640 }, { "epoch": 0.9, "learning_rate": 0.00016482615784603182, "loss": 0.0173, "step": 347650 }, { "epoch": 0.9, "learning_rate": 0.00016482226962966033, "loss": 0.0154, "step": 347660 }, { "epoch": 0.9, "learning_rate": 0.00016481838141328887, "loss": 0.0139, "step": 347670 }, { "epoch": 0.9, "learning_rate": 0.0001648144931969174, "loss": 0.0116, "step": 347680 }, { "epoch": 0.9, "learning_rate": 0.00016481060498054595, "loss": 0.0119, "step": 347690 }, { "epoch": 0.9, "learning_rate": 0.00016480671676417447, "loss": 0.0114, "step": 347700 }, { "epoch": 0.9, "learning_rate": 0.000164802828547803, "loss": 0.0106, "step": 347710 }, { "epoch": 0.9, "learning_rate": 0.00016479894033143155, "loss": 0.0145, "step": 347720 }, { "epoch": 0.9, "learning_rate": 0.0001647950521150601, "loss": 0.0117, "step": 347730 }, { "epoch": 0.9, "learning_rate": 0.0001647911638986886, "loss": 0.0116, "step": 347740 }, { "epoch": 0.9, "learning_rate": 0.00016478727568231715, "loss": 0.0158, "step": 347750 }, { "epoch": 0.9, "learning_rate": 0.0001647833874659457, "loss": 0.0101, "step": 347760 }, { "epoch": 0.9, "learning_rate": 0.00016477949924957423, "loss": 0.0162, "step": 347770 }, { "epoch": 0.9, "learning_rate": 0.00016477561103320275, "loss": 0.0146, "step": 347780 }, { "epoch": 0.9, "learning_rate": 0.0001647717228168313, "loss": 0.0114, "step": 347790 }, { "epoch": 0.9, "learning_rate": 0.00016476783460045986, "loss": 0.0159, "step": 347800 }, { "epoch": 0.9, "learning_rate": 0.00016476394638408837, "loss": 0.0127, "step": 347810 }, { "epoch": 0.9, "learning_rate": 0.00016476005816771691, "loss": 0.0135, "step": 347820 }, { "epoch": 0.9, "learning_rate": 0.00016475616995134543, "loss": 0.0143, "step": 347830 }, { "epoch": 0.9, "learning_rate": 0.000164752281734974, "loss": 0.0113, "step": 347840 }, { "epoch": 0.9, "learning_rate": 0.0001647483935186025, "loss": 0.0147, "step": 347850 }, { "epoch": 0.9, "learning_rate": 0.00016474450530223105, "loss": 0.0156, "step": 347860 }, { "epoch": 0.9, "learning_rate": 0.00016474061708585957, "loss": 0.014, "step": 347870 }, { "epoch": 0.9, "learning_rate": 0.0001647367288694881, "loss": 0.0128, "step": 347880 }, { "epoch": 0.9, "learning_rate": 0.00016473284065311665, "loss": 0.0129, "step": 347890 }, { "epoch": 0.9, "learning_rate": 0.0001647289524367452, "loss": 0.0142, "step": 347900 }, { "epoch": 0.9, "learning_rate": 0.0001647250642203737, "loss": 0.0138, "step": 347910 }, { "epoch": 0.9, "learning_rate": 0.00016472117600400225, "loss": 0.0132, "step": 347920 }, { "epoch": 0.9, "learning_rate": 0.0001647172877876308, "loss": 0.0129, "step": 347930 }, { "epoch": 0.9, "learning_rate": 0.00016471339957125933, "loss": 0.0103, "step": 347940 }, { "epoch": 0.9, "learning_rate": 0.00016470951135488785, "loss": 0.0137, "step": 347950 }, { "epoch": 0.9, "learning_rate": 0.0001647056231385164, "loss": 0.012, "step": 347960 }, { "epoch": 0.9, "learning_rate": 0.00016470173492214496, "loss": 0.0122, "step": 347970 }, { "epoch": 0.9, "learning_rate": 0.00016469784670577347, "loss": 0.0124, "step": 347980 }, { "epoch": 0.9, "learning_rate": 0.000164693958489402, "loss": 0.0188, "step": 347990 }, { "epoch": 0.9, "learning_rate": 0.00016469007027303053, "loss": 0.0143, "step": 348000 }, { "epoch": 0.9, "eval_cer": 0.8817348779726539, "eval_loss": 0.008867635391652584, "eval_runtime": 107.6298, "eval_samples_per_second": 18.582, "eval_steps_per_second": 4.646, "step": 348000 }, { "epoch": 0.9, "learning_rate": 0.0001646861820566591, "loss": 0.0167, "step": 348010 }, { "epoch": 0.9, "learning_rate": 0.0001646822938402876, "loss": 0.0128, "step": 348020 }, { "epoch": 0.9, "learning_rate": 0.00016467840562391615, "loss": 0.0151, "step": 348030 }, { "epoch": 0.9, "learning_rate": 0.00016467451740754467, "loss": 0.0115, "step": 348040 }, { "epoch": 0.9, "learning_rate": 0.00016467062919117324, "loss": 0.0119, "step": 348050 }, { "epoch": 0.9, "learning_rate": 0.00016466674097480175, "loss": 0.0138, "step": 348060 }, { "epoch": 0.9, "learning_rate": 0.0001646628527584303, "loss": 0.0143, "step": 348070 }, { "epoch": 0.9, "learning_rate": 0.0001646589645420588, "loss": 0.0135, "step": 348080 }, { "epoch": 0.9, "learning_rate": 0.00016465507632568738, "loss": 0.011, "step": 348090 }, { "epoch": 0.9, "learning_rate": 0.0001646511881093159, "loss": 0.0147, "step": 348100 }, { "epoch": 0.9, "learning_rate": 0.00016464729989294443, "loss": 0.0108, "step": 348110 }, { "epoch": 0.9, "learning_rate": 0.00016464341167657295, "loss": 0.0142, "step": 348120 }, { "epoch": 0.9, "learning_rate": 0.0001646395234602015, "loss": 0.0134, "step": 348130 }, { "epoch": 0.9, "learning_rate": 0.00016463563524383006, "loss": 0.0122, "step": 348140 }, { "epoch": 0.9, "learning_rate": 0.00016463174702745857, "loss": 0.0142, "step": 348150 }, { "epoch": 0.9, "learning_rate": 0.00016462785881108709, "loss": 0.0129, "step": 348160 }, { "epoch": 0.9, "learning_rate": 0.00016462397059471563, "loss": 0.012, "step": 348170 }, { "epoch": 0.9, "learning_rate": 0.0001646200823783442, "loss": 0.0122, "step": 348180 }, { "epoch": 0.9, "learning_rate": 0.0001646161941619727, "loss": 0.0145, "step": 348190 }, { "epoch": 0.9, "learning_rate": 0.00016461230594560125, "loss": 0.0142, "step": 348200 }, { "epoch": 0.9, "learning_rate": 0.00016460841772922977, "loss": 0.0154, "step": 348210 }, { "epoch": 0.9, "learning_rate": 0.00016460452951285834, "loss": 0.0123, "step": 348220 }, { "epoch": 0.9, "learning_rate": 0.00016460064129648685, "loss": 0.0141, "step": 348230 }, { "epoch": 0.9, "learning_rate": 0.0001645967530801154, "loss": 0.0105, "step": 348240 }, { "epoch": 0.9, "learning_rate": 0.0001645928648637439, "loss": 0.0125, "step": 348250 }, { "epoch": 0.9, "learning_rate": 0.00016458897664737248, "loss": 0.0108, "step": 348260 }, { "epoch": 0.9, "learning_rate": 0.000164585088431001, "loss": 0.0129, "step": 348270 }, { "epoch": 0.9, "learning_rate": 0.00016458120021462953, "loss": 0.0101, "step": 348280 }, { "epoch": 0.9, "learning_rate": 0.00016457731199825805, "loss": 0.0114, "step": 348290 }, { "epoch": 0.9, "learning_rate": 0.00016457342378188662, "loss": 0.0116, "step": 348300 }, { "epoch": 0.9, "learning_rate": 0.00016456953556551513, "loss": 0.012, "step": 348310 }, { "epoch": 0.9, "learning_rate": 0.00016456564734914367, "loss": 0.0145, "step": 348320 }, { "epoch": 0.9, "learning_rate": 0.00016456175913277219, "loss": 0.0148, "step": 348330 }, { "epoch": 0.9, "learning_rate": 0.00016455787091640075, "loss": 0.0147, "step": 348340 }, { "epoch": 0.9, "learning_rate": 0.0001645539827000293, "loss": 0.0128, "step": 348350 }, { "epoch": 0.9, "learning_rate": 0.0001645500944836578, "loss": 0.0114, "step": 348360 }, { "epoch": 0.9, "learning_rate": 0.00016454620626728635, "loss": 0.0243, "step": 348370 }, { "epoch": 0.9, "learning_rate": 0.00016454231805091487, "loss": 0.0173, "step": 348380 }, { "epoch": 0.9, "learning_rate": 0.00016453842983454344, "loss": 0.0131, "step": 348390 }, { "epoch": 0.9, "learning_rate": 0.00016453454161817195, "loss": 0.0115, "step": 348400 }, { "epoch": 0.9, "learning_rate": 0.0001645306534018005, "loss": 0.0152, "step": 348410 }, { "epoch": 0.9, "learning_rate": 0.000164526765185429, "loss": 0.0168, "step": 348420 }, { "epoch": 0.9, "learning_rate": 0.00016452287696905758, "loss": 0.0132, "step": 348430 }, { "epoch": 0.9, "learning_rate": 0.0001645189887526861, "loss": 0.0112, "step": 348440 }, { "epoch": 0.9, "learning_rate": 0.00016451510053631463, "loss": 0.015, "step": 348450 }, { "epoch": 0.9, "learning_rate": 0.00016451121231994315, "loss": 0.0117, "step": 348460 }, { "epoch": 0.9, "learning_rate": 0.00016450732410357171, "loss": 0.0195, "step": 348470 }, { "epoch": 0.9, "learning_rate": 0.00016450343588720023, "loss": 0.0145, "step": 348480 }, { "epoch": 0.9, "learning_rate": 0.00016449954767082877, "loss": 0.0144, "step": 348490 }, { "epoch": 0.9, "learning_rate": 0.00016449565945445729, "loss": 0.0135, "step": 348500 }, { "epoch": 0.9, "learning_rate": 0.00016449177123808585, "loss": 0.0146, "step": 348510 }, { "epoch": 0.9, "learning_rate": 0.0001644878830217144, "loss": 0.0157, "step": 348520 }, { "epoch": 0.9, "learning_rate": 0.0001644839948053429, "loss": 0.0113, "step": 348530 }, { "epoch": 0.9, "learning_rate": 0.00016448010658897145, "loss": 0.0135, "step": 348540 }, { "epoch": 0.9, "learning_rate": 0.0001644762183726, "loss": 0.0125, "step": 348550 }, { "epoch": 0.9, "learning_rate": 0.00016447233015622854, "loss": 0.0158, "step": 348560 }, { "epoch": 0.9, "learning_rate": 0.00016446844193985705, "loss": 0.0123, "step": 348570 }, { "epoch": 0.9, "learning_rate": 0.0001644645537234856, "loss": 0.0139, "step": 348580 }, { "epoch": 0.9, "learning_rate": 0.0001644606655071141, "loss": 0.0158, "step": 348590 }, { "epoch": 0.9, "learning_rate": 0.00016445677729074267, "loss": 0.0097, "step": 348600 }, { "epoch": 0.9, "learning_rate": 0.0001644528890743712, "loss": 0.0121, "step": 348610 }, { "epoch": 0.9, "learning_rate": 0.00016444900085799973, "loss": 0.0161, "step": 348620 }, { "epoch": 0.9, "learning_rate": 0.00016444511264162825, "loss": 0.012, "step": 348630 }, { "epoch": 0.9, "learning_rate": 0.00016444122442525681, "loss": 0.0139, "step": 348640 }, { "epoch": 0.9, "learning_rate": 0.00016443733620888533, "loss": 0.0119, "step": 348650 }, { "epoch": 0.9, "learning_rate": 0.00016443344799251387, "loss": 0.0154, "step": 348660 }, { "epoch": 0.9, "learning_rate": 0.00016442955977614238, "loss": 0.0119, "step": 348670 }, { "epoch": 0.9, "learning_rate": 0.00016442567155977095, "loss": 0.0135, "step": 348680 }, { "epoch": 0.9, "learning_rate": 0.0001644217833433995, "loss": 0.0134, "step": 348690 }, { "epoch": 0.9, "learning_rate": 0.000164417895127028, "loss": 0.0123, "step": 348700 }, { "epoch": 0.9, "learning_rate": 0.00016441400691065652, "loss": 0.0174, "step": 348710 }, { "epoch": 0.9, "learning_rate": 0.0001644101186942851, "loss": 0.0152, "step": 348720 }, { "epoch": 0.9, "learning_rate": 0.00016440623047791363, "loss": 0.0117, "step": 348730 }, { "epoch": 0.9, "learning_rate": 0.00016440234226154215, "loss": 0.0113, "step": 348740 }, { "epoch": 0.9, "learning_rate": 0.0001643984540451707, "loss": 0.0118, "step": 348750 }, { "epoch": 0.9, "learning_rate": 0.00016439456582879923, "loss": 0.0146, "step": 348760 }, { "epoch": 0.9, "learning_rate": 0.00016439067761242777, "loss": 0.0108, "step": 348770 }, { "epoch": 0.9, "learning_rate": 0.0001643867893960563, "loss": 0.0125, "step": 348780 }, { "epoch": 0.9, "learning_rate": 0.00016438290117968483, "loss": 0.0132, "step": 348790 }, { "epoch": 0.9, "learning_rate": 0.00016437901296331337, "loss": 0.011, "step": 348800 }, { "epoch": 0.9, "learning_rate": 0.0001643751247469419, "loss": 0.0157, "step": 348810 }, { "epoch": 0.9, "learning_rate": 0.00016437123653057043, "loss": 0.0137, "step": 348820 }, { "epoch": 0.9, "learning_rate": 0.00016436734831419897, "loss": 0.016, "step": 348830 }, { "epoch": 0.9, "learning_rate": 0.00016436346009782748, "loss": 0.0116, "step": 348840 }, { "epoch": 0.9, "learning_rate": 0.00016435957188145605, "loss": 0.0136, "step": 348850 }, { "epoch": 0.9, "learning_rate": 0.0001643556836650846, "loss": 0.0117, "step": 348860 }, { "epoch": 0.9, "learning_rate": 0.0001643517954487131, "loss": 0.0156, "step": 348870 }, { "epoch": 0.9, "learning_rate": 0.00016434790723234162, "loss": 0.0107, "step": 348880 }, { "epoch": 0.9, "learning_rate": 0.0001643440190159702, "loss": 0.0119, "step": 348890 }, { "epoch": 0.9, "learning_rate": 0.00016434013079959873, "loss": 0.0107, "step": 348900 }, { "epoch": 0.9, "learning_rate": 0.00016433624258322725, "loss": 0.011, "step": 348910 }, { "epoch": 0.9, "learning_rate": 0.0001643323543668558, "loss": 0.0144, "step": 348920 }, { "epoch": 0.9, "learning_rate": 0.00016432846615048433, "loss": 0.0112, "step": 348930 }, { "epoch": 0.9, "learning_rate": 0.00016432457793411287, "loss": 0.0128, "step": 348940 }, { "epoch": 0.9, "learning_rate": 0.0001643206897177414, "loss": 0.0113, "step": 348950 }, { "epoch": 0.9, "learning_rate": 0.00016431680150136993, "loss": 0.0149, "step": 348960 }, { "epoch": 0.9, "learning_rate": 0.00016431291328499847, "loss": 0.0147, "step": 348970 }, { "epoch": 0.9, "learning_rate": 0.000164309025068627, "loss": 0.0102, "step": 348980 }, { "epoch": 0.9, "learning_rate": 0.00016430513685225553, "loss": 0.0127, "step": 348990 }, { "epoch": 0.9, "learning_rate": 0.00016430124863588407, "loss": 0.0116, "step": 349000 }, { "epoch": 0.9, "eval_cer": 0.8817376772465223, "eval_loss": 0.008726708590984344, "eval_runtime": 107.6491, "eval_samples_per_second": 18.579, "eval_steps_per_second": 4.645, "step": 349000 }, { "epoch": 0.9, "learning_rate": 0.00016429736041951264, "loss": 0.0118, "step": 349010 }, { "epoch": 0.9, "learning_rate": 0.00016429347220314115, "loss": 0.0138, "step": 349020 }, { "epoch": 0.9, "learning_rate": 0.00016428958398676967, "loss": 0.0177, "step": 349030 }, { "epoch": 0.9, "learning_rate": 0.0001642856957703982, "loss": 0.0132, "step": 349040 }, { "epoch": 0.9, "learning_rate": 0.00016428180755402678, "loss": 0.0132, "step": 349050 }, { "epoch": 0.9, "learning_rate": 0.0001642779193376553, "loss": 0.0135, "step": 349060 }, { "epoch": 0.9, "learning_rate": 0.00016427403112128383, "loss": 0.0124, "step": 349070 }, { "epoch": 0.9, "learning_rate": 0.00016427014290491235, "loss": 0.0185, "step": 349080 }, { "epoch": 0.9, "learning_rate": 0.0001642662546885409, "loss": 0.01, "step": 349090 }, { "epoch": 0.9, "learning_rate": 0.00016426236647216943, "loss": 0.0203, "step": 349100 }, { "epoch": 0.9, "learning_rate": 0.00016425847825579797, "loss": 0.0124, "step": 349110 }, { "epoch": 0.9, "learning_rate": 0.0001642545900394265, "loss": 0.011, "step": 349120 }, { "epoch": 0.9, "learning_rate": 0.00016425070182305503, "loss": 0.0103, "step": 349130 }, { "epoch": 0.91, "learning_rate": 0.00016424681360668357, "loss": 0.0121, "step": 349140 }, { "epoch": 0.91, "learning_rate": 0.0001642429253903121, "loss": 0.0131, "step": 349150 }, { "epoch": 0.91, "learning_rate": 0.00016423903717394063, "loss": 0.0139, "step": 349160 }, { "epoch": 0.91, "learning_rate": 0.00016423514895756917, "loss": 0.0152, "step": 349170 }, { "epoch": 0.91, "learning_rate": 0.0001642312607411977, "loss": 0.0168, "step": 349180 }, { "epoch": 0.91, "learning_rate": 0.00016422737252482625, "loss": 0.014, "step": 349190 }, { "epoch": 0.91, "learning_rate": 0.00016422348430845477, "loss": 0.0147, "step": 349200 }, { "epoch": 0.91, "learning_rate": 0.0001642195960920833, "loss": 0.0113, "step": 349210 }, { "epoch": 0.91, "learning_rate": 0.00016421570787571188, "loss": 0.0148, "step": 349220 }, { "epoch": 0.91, "learning_rate": 0.0001642118196593404, "loss": 0.0131, "step": 349230 }, { "epoch": 0.91, "learning_rate": 0.00016420793144296893, "loss": 0.014, "step": 349240 }, { "epoch": 0.91, "learning_rate": 0.00016420404322659745, "loss": 0.0117, "step": 349250 }, { "epoch": 0.91, "learning_rate": 0.00016420015501022602, "loss": 0.0406, "step": 349260 }, { "epoch": 0.91, "learning_rate": 0.00016419626679385453, "loss": 0.0141, "step": 349270 }, { "epoch": 0.91, "learning_rate": 0.00016419237857748307, "loss": 0.0128, "step": 349280 }, { "epoch": 0.91, "learning_rate": 0.0001641884903611116, "loss": 0.0136, "step": 349290 }, { "epoch": 0.91, "learning_rate": 0.00016418460214474016, "loss": 0.0176, "step": 349300 }, { "epoch": 0.91, "learning_rate": 0.00016418071392836867, "loss": 0.0188, "step": 349310 }, { "epoch": 0.91, "learning_rate": 0.0001641768257119972, "loss": 0.0127, "step": 349320 }, { "epoch": 0.91, "learning_rate": 0.00016417293749562573, "loss": 0.011, "step": 349330 }, { "epoch": 0.91, "learning_rate": 0.00016416904927925427, "loss": 0.0132, "step": 349340 }, { "epoch": 0.91, "learning_rate": 0.0001641651610628828, "loss": 0.0142, "step": 349350 }, { "epoch": 0.91, "learning_rate": 0.00016416127284651135, "loss": 0.0126, "step": 349360 }, { "epoch": 0.91, "learning_rate": 0.00016415738463013987, "loss": 0.0136, "step": 349370 }, { "epoch": 0.91, "learning_rate": 0.0001641534964137684, "loss": 0.0141, "step": 349380 }, { "epoch": 0.91, "learning_rate": 0.00016414960819739698, "loss": 0.0141, "step": 349390 }, { "epoch": 0.91, "learning_rate": 0.0001641457199810255, "loss": 0.0135, "step": 349400 }, { "epoch": 0.91, "learning_rate": 0.00016414183176465403, "loss": 0.0153, "step": 349410 }, { "epoch": 0.91, "learning_rate": 0.00016413794354828255, "loss": 0.0134, "step": 349420 }, { "epoch": 0.91, "learning_rate": 0.00016413405533191112, "loss": 0.0113, "step": 349430 }, { "epoch": 0.91, "learning_rate": 0.00016413016711553963, "loss": 0.0134, "step": 349440 }, { "epoch": 0.91, "learning_rate": 0.00016412627889916817, "loss": 0.0139, "step": 349450 }, { "epoch": 0.91, "learning_rate": 0.00016412239068279669, "loss": 0.0123, "step": 349460 }, { "epoch": 0.91, "learning_rate": 0.00016411850246642525, "loss": 0.0134, "step": 349470 }, { "epoch": 0.91, "learning_rate": 0.00016411461425005377, "loss": 0.0162, "step": 349480 }, { "epoch": 0.91, "learning_rate": 0.0001641107260336823, "loss": 0.0122, "step": 349490 }, { "epoch": 0.91, "learning_rate": 0.00016410683781731083, "loss": 0.0105, "step": 349500 }, { "epoch": 0.91, "learning_rate": 0.0001641029496009394, "loss": 0.0136, "step": 349510 }, { "epoch": 0.91, "learning_rate": 0.0001640990613845679, "loss": 0.0118, "step": 349520 }, { "epoch": 0.91, "learning_rate": 0.00016409517316819645, "loss": 0.0144, "step": 349530 }, { "epoch": 0.91, "learning_rate": 0.00016409128495182496, "loss": 0.0138, "step": 349540 }, { "epoch": 0.91, "learning_rate": 0.00016408739673545353, "loss": 0.0134, "step": 349550 }, { "epoch": 0.91, "learning_rate": 0.00016408350851908208, "loss": 0.0185, "step": 349560 }, { "epoch": 0.91, "learning_rate": 0.0001640796203027106, "loss": 0.0143, "step": 349570 }, { "epoch": 0.91, "learning_rate": 0.0001640757320863391, "loss": 0.0143, "step": 349580 }, { "epoch": 0.91, "learning_rate": 0.00016407184386996765, "loss": 0.0133, "step": 349590 }, { "epoch": 0.91, "learning_rate": 0.00016406795565359621, "loss": 0.0158, "step": 349600 }, { "epoch": 0.91, "learning_rate": 0.00016406406743722473, "loss": 0.0138, "step": 349610 }, { "epoch": 0.91, "learning_rate": 0.00016406017922085327, "loss": 0.0126, "step": 349620 }, { "epoch": 0.91, "learning_rate": 0.00016405629100448179, "loss": 0.0125, "step": 349630 }, { "epoch": 0.91, "learning_rate": 0.00016405240278811035, "loss": 0.0145, "step": 349640 }, { "epoch": 0.91, "learning_rate": 0.00016404851457173887, "loss": 0.0154, "step": 349650 }, { "epoch": 0.91, "learning_rate": 0.0001640446263553674, "loss": 0.0104, "step": 349660 }, { "epoch": 0.91, "learning_rate": 0.00016404073813899592, "loss": 0.0117, "step": 349670 }, { "epoch": 0.91, "learning_rate": 0.0001640368499226245, "loss": 0.0122, "step": 349680 }, { "epoch": 0.91, "learning_rate": 0.000164032961706253, "loss": 0.0208, "step": 349690 }, { "epoch": 0.91, "learning_rate": 0.00016402907348988155, "loss": 0.0155, "step": 349700 }, { "epoch": 0.91, "learning_rate": 0.00016402518527351006, "loss": 0.0122, "step": 349710 }, { "epoch": 0.91, "learning_rate": 0.00016402129705713863, "loss": 0.0125, "step": 349720 }, { "epoch": 0.91, "learning_rate": 0.00016401740884076717, "loss": 0.0133, "step": 349730 }, { "epoch": 0.91, "learning_rate": 0.0001640135206243957, "loss": 0.0129, "step": 349740 }, { "epoch": 0.91, "learning_rate": 0.0001640096324080242, "loss": 0.0144, "step": 349750 }, { "epoch": 0.91, "learning_rate": 0.00016400574419165277, "loss": 0.0139, "step": 349760 }, { "epoch": 0.91, "learning_rate": 0.00016400185597528131, "loss": 0.0143, "step": 349770 }, { "epoch": 0.91, "learning_rate": 0.00016399796775890983, "loss": 0.013, "step": 349780 }, { "epoch": 0.91, "learning_rate": 0.00016399407954253837, "loss": 0.0119, "step": 349790 }, { "epoch": 0.91, "learning_rate": 0.0001639901913261669, "loss": 0.0149, "step": 349800 }, { "epoch": 0.91, "learning_rate": 0.00016398630310979545, "loss": 0.014, "step": 349810 }, { "epoch": 0.91, "learning_rate": 0.00016398241489342397, "loss": 0.0124, "step": 349820 }, { "epoch": 0.91, "learning_rate": 0.0001639785266770525, "loss": 0.0146, "step": 349830 }, { "epoch": 0.91, "learning_rate": 0.00016397463846068102, "loss": 0.015, "step": 349840 }, { "epoch": 0.91, "learning_rate": 0.0001639707502443096, "loss": 0.0127, "step": 349850 }, { "epoch": 0.91, "learning_rate": 0.0001639668620279381, "loss": 0.0147, "step": 349860 }, { "epoch": 0.91, "learning_rate": 0.00016396297381156665, "loss": 0.0128, "step": 349870 }, { "epoch": 0.91, "learning_rate": 0.00016395908559519516, "loss": 0.0131, "step": 349880 }, { "epoch": 0.91, "learning_rate": 0.00016395519737882373, "loss": 0.0131, "step": 349890 }, { "epoch": 0.91, "learning_rate": 0.00016395130916245225, "loss": 0.0104, "step": 349900 }, { "epoch": 0.91, "learning_rate": 0.0001639474209460808, "loss": 0.0133, "step": 349910 }, { "epoch": 0.91, "learning_rate": 0.0001639435327297093, "loss": 0.0108, "step": 349920 }, { "epoch": 0.91, "learning_rate": 0.00016393964451333787, "loss": 0.0117, "step": 349930 }, { "epoch": 0.91, "learning_rate": 0.00016393575629696641, "loss": 0.0096, "step": 349940 }, { "epoch": 0.91, "learning_rate": 0.00016393186808059493, "loss": 0.0107, "step": 349950 }, { "epoch": 0.91, "learning_rate": 0.00016392797986422347, "loss": 0.0125, "step": 349960 }, { "epoch": 0.91, "learning_rate": 0.000163924091647852, "loss": 0.0206, "step": 349970 }, { "epoch": 0.91, "learning_rate": 0.00016392020343148055, "loss": 0.0126, "step": 349980 }, { "epoch": 0.91, "learning_rate": 0.00016391631521510907, "loss": 0.0113, "step": 349990 }, { "epoch": 0.91, "learning_rate": 0.0001639124269987376, "loss": 0.0143, "step": 350000 }, { "epoch": 0.91, "eval_cer": 0.8817964619977577, "eval_loss": 0.009117286652326584, "eval_runtime": 107.4916, "eval_samples_per_second": 18.606, "eval_steps_per_second": 4.652, "step": 350000 }, { "epoch": 0.91, "learning_rate": 0.00016390853878236615, "loss": 0.0109, "step": 350010 }, { "epoch": 0.91, "learning_rate": 0.0001639046505659947, "loss": 0.0111, "step": 350020 }, { "epoch": 0.91, "learning_rate": 0.0001639007623496232, "loss": 0.0124, "step": 350030 }, { "epoch": 0.91, "learning_rate": 0.00016389687413325175, "loss": 0.0134, "step": 350040 }, { "epoch": 0.91, "learning_rate": 0.0001638929859168803, "loss": 0.0132, "step": 350050 }, { "epoch": 0.91, "learning_rate": 0.00016388909770050883, "loss": 0.0153, "step": 350060 }, { "epoch": 0.91, "learning_rate": 0.00016388520948413735, "loss": 0.0119, "step": 350070 }, { "epoch": 0.91, "learning_rate": 0.0001638813212677659, "loss": 0.0129, "step": 350080 }, { "epoch": 0.91, "learning_rate": 0.0001638774330513944, "loss": 0.0117, "step": 350090 }, { "epoch": 0.91, "learning_rate": 0.00016387354483502297, "loss": 0.0161, "step": 350100 }, { "epoch": 0.91, "learning_rate": 0.0001638696566186515, "loss": 0.0127, "step": 350110 }, { "epoch": 0.91, "learning_rate": 0.00016386576840228003, "loss": 0.0149, "step": 350120 }, { "epoch": 0.91, "learning_rate": 0.00016386188018590857, "loss": 0.0114, "step": 350130 }, { "epoch": 0.91, "learning_rate": 0.0001638579919695371, "loss": 0.0116, "step": 350140 }, { "epoch": 0.91, "learning_rate": 0.00016385410375316565, "loss": 0.0122, "step": 350150 }, { "epoch": 0.91, "learning_rate": 0.00016385021553679417, "loss": 0.012, "step": 350160 }, { "epoch": 0.91, "learning_rate": 0.0001638463273204227, "loss": 0.0095, "step": 350170 }, { "epoch": 0.91, "learning_rate": 0.00016384243910405125, "loss": 0.0144, "step": 350180 }, { "epoch": 0.91, "learning_rate": 0.0001638385508876798, "loss": 0.0141, "step": 350190 }, { "epoch": 0.91, "learning_rate": 0.0001638346626713083, "loss": 0.0125, "step": 350200 }, { "epoch": 0.91, "learning_rate": 0.00016383077445493685, "loss": 0.0124, "step": 350210 }, { "epoch": 0.91, "learning_rate": 0.0001638268862385654, "loss": 0.0157, "step": 350220 }, { "epoch": 0.91, "learning_rate": 0.00016382299802219393, "loss": 0.0155, "step": 350230 }, { "epoch": 0.91, "learning_rate": 0.00016381910980582245, "loss": 0.0142, "step": 350240 }, { "epoch": 0.91, "learning_rate": 0.000163815221589451, "loss": 0.0116, "step": 350250 }, { "epoch": 0.91, "learning_rate": 0.00016381133337307956, "loss": 0.0128, "step": 350260 }, { "epoch": 0.91, "learning_rate": 0.00016380744515670807, "loss": 0.0124, "step": 350270 }, { "epoch": 0.91, "learning_rate": 0.0001638035569403366, "loss": 0.0143, "step": 350280 }, { "epoch": 0.91, "learning_rate": 0.00016379966872396513, "loss": 0.0124, "step": 350290 }, { "epoch": 0.91, "learning_rate": 0.0001637957805075937, "loss": 0.0131, "step": 350300 }, { "epoch": 0.91, "learning_rate": 0.0001637918922912222, "loss": 0.0128, "step": 350310 }, { "epoch": 0.91, "learning_rate": 0.00016378800407485075, "loss": 0.0096, "step": 350320 }, { "epoch": 0.91, "learning_rate": 0.00016378411585847927, "loss": 0.016, "step": 350330 }, { "epoch": 0.91, "learning_rate": 0.0001637802276421078, "loss": 0.013, "step": 350340 }, { "epoch": 0.91, "learning_rate": 0.00016377633942573635, "loss": 0.0111, "step": 350350 }, { "epoch": 0.91, "learning_rate": 0.0001637724512093649, "loss": 0.018, "step": 350360 }, { "epoch": 0.91, "learning_rate": 0.0001637685629929934, "loss": 0.0113, "step": 350370 }, { "epoch": 0.91, "learning_rate": 0.00016376467477662195, "loss": 0.0139, "step": 350380 }, { "epoch": 0.91, "learning_rate": 0.0001637607865602505, "loss": 0.0108, "step": 350390 }, { "epoch": 0.91, "learning_rate": 0.00016375689834387903, "loss": 0.0117, "step": 350400 }, { "epoch": 0.91, "learning_rate": 0.00016375301012750755, "loss": 0.0103, "step": 350410 }, { "epoch": 0.91, "learning_rate": 0.0001637491219111361, "loss": 0.0115, "step": 350420 }, { "epoch": 0.91, "learning_rate": 0.00016374523369476466, "loss": 0.0116, "step": 350430 }, { "epoch": 0.91, "learning_rate": 0.00016374134547839317, "loss": 0.0126, "step": 350440 }, { "epoch": 0.91, "learning_rate": 0.0001637374572620217, "loss": 0.0092, "step": 350450 }, { "epoch": 0.91, "learning_rate": 0.00016373356904565023, "loss": 0.0099, "step": 350460 }, { "epoch": 0.91, "learning_rate": 0.0001637296808292788, "loss": 0.0144, "step": 350470 }, { "epoch": 0.91, "learning_rate": 0.0001637257926129073, "loss": 0.0123, "step": 350480 }, { "epoch": 0.91, "learning_rate": 0.00016372190439653585, "loss": 0.0134, "step": 350490 }, { "epoch": 0.91, "learning_rate": 0.00016371801618016437, "loss": 0.0135, "step": 350500 }, { "epoch": 0.91, "learning_rate": 0.00016371412796379293, "loss": 0.0138, "step": 350510 }, { "epoch": 0.91, "learning_rate": 0.00016371023974742145, "loss": 0.0128, "step": 350520 }, { "epoch": 0.91, "learning_rate": 0.00016370635153105, "loss": 0.013, "step": 350530 }, { "epoch": 0.91, "learning_rate": 0.0001637024633146785, "loss": 0.0111, "step": 350540 }, { "epoch": 0.91, "learning_rate": 0.00016369857509830707, "loss": 0.0141, "step": 350550 }, { "epoch": 0.91, "learning_rate": 0.0001636946868819356, "loss": 0.0136, "step": 350560 }, { "epoch": 0.91, "learning_rate": 0.00016369079866556413, "loss": 0.0135, "step": 350570 }, { "epoch": 0.91, "learning_rate": 0.00016368691044919264, "loss": 0.012, "step": 350580 }, { "epoch": 0.91, "learning_rate": 0.00016368302223282119, "loss": 0.0107, "step": 350590 }, { "epoch": 0.91, "learning_rate": 0.00016367913401644976, "loss": 0.0114, "step": 350600 }, { "epoch": 0.91, "learning_rate": 0.00016367524580007827, "loss": 0.0119, "step": 350610 }, { "epoch": 0.91, "learning_rate": 0.00016367135758370678, "loss": 0.0121, "step": 350620 }, { "epoch": 0.91, "learning_rate": 0.00016366746936733533, "loss": 0.0125, "step": 350630 }, { "epoch": 0.91, "learning_rate": 0.0001636635811509639, "loss": 0.0106, "step": 350640 }, { "epoch": 0.91, "learning_rate": 0.0001636596929345924, "loss": 0.0132, "step": 350650 }, { "epoch": 0.91, "learning_rate": 0.00016365580471822095, "loss": 0.0125, "step": 350660 }, { "epoch": 0.91, "learning_rate": 0.00016365191650184947, "loss": 0.0118, "step": 350670 }, { "epoch": 0.91, "learning_rate": 0.00016364802828547803, "loss": 0.017, "step": 350680 }, { "epoch": 0.91, "learning_rate": 0.00016364414006910655, "loss": 0.0116, "step": 350690 }, { "epoch": 0.91, "learning_rate": 0.0001636402518527351, "loss": 0.014, "step": 350700 }, { "epoch": 0.91, "learning_rate": 0.0001636363636363636, "loss": 0.0146, "step": 350710 }, { "epoch": 0.91, "learning_rate": 0.00016363247541999217, "loss": 0.0113, "step": 350720 }, { "epoch": 0.91, "learning_rate": 0.0001636285872036207, "loss": 0.0128, "step": 350730 }, { "epoch": 0.91, "learning_rate": 0.00016362469898724923, "loss": 0.0098, "step": 350740 }, { "epoch": 0.91, "learning_rate": 0.00016362081077087774, "loss": 0.0096, "step": 350750 }, { "epoch": 0.91, "learning_rate": 0.0001636169225545063, "loss": 0.0134, "step": 350760 }, { "epoch": 0.91, "learning_rate": 0.00016361303433813483, "loss": 0.0125, "step": 350770 }, { "epoch": 0.91, "learning_rate": 0.00016360914612176337, "loss": 0.0131, "step": 350780 }, { "epoch": 0.91, "learning_rate": 0.00016360525790539188, "loss": 0.0128, "step": 350790 }, { "epoch": 0.91, "learning_rate": 0.00016360136968902045, "loss": 0.011, "step": 350800 }, { "epoch": 0.91, "learning_rate": 0.000163597481472649, "loss": 0.0118, "step": 350810 }, { "epoch": 0.91, "learning_rate": 0.0001635935932562775, "loss": 0.0099, "step": 350820 }, { "epoch": 0.91, "learning_rate": 0.00016358970503990605, "loss": 0.0111, "step": 350830 }, { "epoch": 0.91, "learning_rate": 0.00016358581682353456, "loss": 0.0152, "step": 350840 }, { "epoch": 0.91, "learning_rate": 0.00016358192860716313, "loss": 0.0135, "step": 350850 }, { "epoch": 0.91, "learning_rate": 0.00016357804039079165, "loss": 0.0089, "step": 350860 }, { "epoch": 0.91, "learning_rate": 0.0001635741521744202, "loss": 0.0091, "step": 350870 }, { "epoch": 0.91, "learning_rate": 0.0001635702639580487, "loss": 0.0184, "step": 350880 }, { "epoch": 0.91, "learning_rate": 0.00016356637574167727, "loss": 0.0126, "step": 350890 }, { "epoch": 0.91, "learning_rate": 0.0001635624875253058, "loss": 0.0121, "step": 350900 }, { "epoch": 0.91, "learning_rate": 0.00016355859930893433, "loss": 0.0116, "step": 350910 }, { "epoch": 0.91, "learning_rate": 0.00016355471109256284, "loss": 0.0189, "step": 350920 }, { "epoch": 0.91, "learning_rate": 0.0001635508228761914, "loss": 0.0141, "step": 350930 }, { "epoch": 0.91, "learning_rate": 0.00016354693465981993, "loss": 0.0128, "step": 350940 }, { "epoch": 0.91, "learning_rate": 0.00016354304644344847, "loss": 0.0159, "step": 350950 }, { "epoch": 0.91, "learning_rate": 0.00016353915822707698, "loss": 0.0128, "step": 350960 }, { "epoch": 0.91, "learning_rate": 0.00016353527001070555, "loss": 0.0105, "step": 350970 }, { "epoch": 0.91, "learning_rate": 0.0001635313817943341, "loss": 0.0127, "step": 350980 }, { "epoch": 0.91, "learning_rate": 0.0001635274935779626, "loss": 0.0146, "step": 350990 }, { "epoch": 0.91, "learning_rate": 0.00016352360536159115, "loss": 0.0124, "step": 351000 }, { "epoch": 0.91, "eval_cer": 0.8817642703482717, "eval_loss": 0.008518124930560589, "eval_runtime": 107.3251, "eval_samples_per_second": 18.635, "eval_steps_per_second": 4.659, "step": 351000 }, { "epoch": 0.91, "learning_rate": 0.0001635197171452197, "loss": 0.0127, "step": 351010 }, { "epoch": 0.91, "learning_rate": 0.00016351582892884823, "loss": 0.0115, "step": 351020 }, { "epoch": 0.91, "learning_rate": 0.00016351194071247675, "loss": 0.0132, "step": 351030 }, { "epoch": 0.91, "learning_rate": 0.0001635080524961053, "loss": 0.0143, "step": 351040 }, { "epoch": 0.91, "learning_rate": 0.00016350416427973383, "loss": 0.0125, "step": 351050 }, { "epoch": 0.91, "learning_rate": 0.00016350027606336237, "loss": 0.0161, "step": 351060 }, { "epoch": 0.91, "learning_rate": 0.0001634963878469909, "loss": 0.0105, "step": 351070 }, { "epoch": 0.91, "learning_rate": 0.00016349249963061943, "loss": 0.0174, "step": 351080 }, { "epoch": 0.91, "learning_rate": 0.00016348861141424794, "loss": 0.0135, "step": 351090 }, { "epoch": 0.91, "learning_rate": 0.0001634847231978765, "loss": 0.0136, "step": 351100 }, { "epoch": 0.91, "learning_rate": 0.00016348083498150503, "loss": 0.0092, "step": 351110 }, { "epoch": 0.91, "learning_rate": 0.00016347694676513357, "loss": 0.0122, "step": 351120 }, { "epoch": 0.91, "learning_rate": 0.00016347305854876208, "loss": 0.0107, "step": 351130 }, { "epoch": 0.91, "learning_rate": 0.00016346917033239065, "loss": 0.0139, "step": 351140 }, { "epoch": 0.91, "learning_rate": 0.0001634652821160192, "loss": 0.0136, "step": 351150 }, { "epoch": 0.91, "learning_rate": 0.0001634613938996477, "loss": 0.0133, "step": 351160 }, { "epoch": 0.91, "learning_rate": 0.00016345750568327622, "loss": 0.0122, "step": 351170 }, { "epoch": 0.91, "learning_rate": 0.0001634536174669048, "loss": 0.0113, "step": 351180 }, { "epoch": 0.91, "learning_rate": 0.00016344972925053333, "loss": 0.009, "step": 351190 }, { "epoch": 0.91, "learning_rate": 0.00016344584103416185, "loss": 0.0126, "step": 351200 }, { "epoch": 0.91, "learning_rate": 0.0001634419528177904, "loss": 0.0131, "step": 351210 }, { "epoch": 0.91, "learning_rate": 0.00016343806460141893, "loss": 0.0143, "step": 351220 }, { "epoch": 0.91, "learning_rate": 0.00016343417638504747, "loss": 0.0113, "step": 351230 }, { "epoch": 0.91, "learning_rate": 0.00016343028816867599, "loss": 0.014, "step": 351240 }, { "epoch": 0.91, "learning_rate": 0.00016342639995230453, "loss": 0.015, "step": 351250 }, { "epoch": 0.91, "learning_rate": 0.00016342251173593307, "loss": 0.0125, "step": 351260 }, { "epoch": 0.91, "learning_rate": 0.0001634186235195616, "loss": 0.014, "step": 351270 }, { "epoch": 0.91, "learning_rate": 0.00016341473530319013, "loss": 0.0112, "step": 351280 }, { "epoch": 0.91, "learning_rate": 0.00016341084708681867, "loss": 0.0118, "step": 351290 }, { "epoch": 0.91, "learning_rate": 0.00016340695887044724, "loss": 0.0156, "step": 351300 }, { "epoch": 0.91, "learning_rate": 0.00016340307065407575, "loss": 0.0121, "step": 351310 }, { "epoch": 0.91, "learning_rate": 0.0001633991824377043, "loss": 0.0134, "step": 351320 }, { "epoch": 0.91, "learning_rate": 0.0001633952942213328, "loss": 0.0112, "step": 351330 }, { "epoch": 0.91, "learning_rate": 0.00016339140600496132, "loss": 0.0121, "step": 351340 }, { "epoch": 0.91, "learning_rate": 0.0001633875177885899, "loss": 0.0149, "step": 351350 }, { "epoch": 0.91, "learning_rate": 0.00016338362957221843, "loss": 0.0119, "step": 351360 }, { "epoch": 0.91, "learning_rate": 0.00016337974135584695, "loss": 0.0145, "step": 351370 }, { "epoch": 0.91, "learning_rate": 0.0001633758531394755, "loss": 0.015, "step": 351380 }, { "epoch": 0.91, "learning_rate": 0.00016337196492310403, "loss": 0.0144, "step": 351390 }, { "epoch": 0.91, "learning_rate": 0.00016336807670673257, "loss": 0.0185, "step": 351400 }, { "epoch": 0.91, "learning_rate": 0.00016336418849036109, "loss": 0.0153, "step": 351410 }, { "epoch": 0.91, "learning_rate": 0.00016336030027398963, "loss": 0.0142, "step": 351420 }, { "epoch": 0.91, "learning_rate": 0.00016335641205761817, "loss": 0.0121, "step": 351430 }, { "epoch": 0.91, "learning_rate": 0.0001633525238412467, "loss": 0.0119, "step": 351440 }, { "epoch": 0.91, "learning_rate": 0.00016334863562487523, "loss": 0.0145, "step": 351450 }, { "epoch": 0.91, "learning_rate": 0.00016334474740850377, "loss": 0.0116, "step": 351460 }, { "epoch": 0.91, "learning_rate": 0.00016334085919213234, "loss": 0.0109, "step": 351470 }, { "epoch": 0.91, "learning_rate": 0.00016333697097576085, "loss": 0.0127, "step": 351480 }, { "epoch": 0.91, "learning_rate": 0.00016333308275938936, "loss": 0.0134, "step": 351490 }, { "epoch": 0.91, "learning_rate": 0.0001633291945430179, "loss": 0.017, "step": 351500 }, { "epoch": 0.91, "learning_rate": 0.00016332530632664648, "loss": 0.0179, "step": 351510 }, { "epoch": 0.91, "learning_rate": 0.000163321418110275, "loss": 0.0139, "step": 351520 }, { "epoch": 0.91, "learning_rate": 0.00016331752989390353, "loss": 0.0122, "step": 351530 }, { "epoch": 0.91, "learning_rate": 0.00016331364167753205, "loss": 0.0161, "step": 351540 }, { "epoch": 0.91, "learning_rate": 0.00016330975346116061, "loss": 0.0144, "step": 351550 }, { "epoch": 0.91, "learning_rate": 0.00016330586524478913, "loss": 0.0132, "step": 351560 }, { "epoch": 0.91, "learning_rate": 0.00016330197702841767, "loss": 0.0205, "step": 351570 }, { "epoch": 0.91, "learning_rate": 0.00016329808881204619, "loss": 0.0097, "step": 351580 }, { "epoch": 0.91, "learning_rate": 0.00016329420059567473, "loss": 0.0136, "step": 351590 }, { "epoch": 0.91, "learning_rate": 0.00016329031237930327, "loss": 0.0124, "step": 351600 }, { "epoch": 0.91, "learning_rate": 0.0001632864241629318, "loss": 0.0119, "step": 351610 }, { "epoch": 0.91, "learning_rate": 0.00016328253594656032, "loss": 0.0121, "step": 351620 }, { "epoch": 0.91, "learning_rate": 0.00016327864773018887, "loss": 0.0168, "step": 351630 }, { "epoch": 0.91, "learning_rate": 0.0001632747595138174, "loss": 0.0091, "step": 351640 }, { "epoch": 0.91, "learning_rate": 0.00016327087129744595, "loss": 0.0129, "step": 351650 }, { "epoch": 0.91, "learning_rate": 0.00016326698308107446, "loss": 0.0132, "step": 351660 }, { "epoch": 0.91, "learning_rate": 0.000163263094864703, "loss": 0.0146, "step": 351670 }, { "epoch": 0.91, "learning_rate": 0.00016325920664833157, "loss": 0.0091, "step": 351680 }, { "epoch": 0.91, "learning_rate": 0.0001632553184319601, "loss": 0.0137, "step": 351690 }, { "epoch": 0.91, "learning_rate": 0.00016325143021558863, "loss": 0.0103, "step": 351700 }, { "epoch": 0.91, "learning_rate": 0.00016324754199921715, "loss": 0.0163, "step": 351710 }, { "epoch": 0.91, "learning_rate": 0.00016324365378284571, "loss": 0.0184, "step": 351720 }, { "epoch": 0.91, "learning_rate": 0.00016323976556647423, "loss": 0.0109, "step": 351730 }, { "epoch": 0.91, "learning_rate": 0.00016323587735010277, "loss": 0.0109, "step": 351740 }, { "epoch": 0.91, "learning_rate": 0.00016323198913373128, "loss": 0.0147, "step": 351750 }, { "epoch": 0.91, "learning_rate": 0.00016322810091735985, "loss": 0.0119, "step": 351760 }, { "epoch": 0.91, "learning_rate": 0.00016322421270098837, "loss": 0.0124, "step": 351770 }, { "epoch": 0.91, "learning_rate": 0.0001632203244846169, "loss": 0.0114, "step": 351780 }, { "epoch": 0.91, "learning_rate": 0.00016321643626824542, "loss": 0.013, "step": 351790 }, { "epoch": 0.91, "learning_rate": 0.000163212548051874, "loss": 0.012, "step": 351800 }, { "epoch": 0.91, "learning_rate": 0.0001632086598355025, "loss": 0.0169, "step": 351810 }, { "epoch": 0.91, "learning_rate": 0.00016320477161913105, "loss": 0.0133, "step": 351820 }, { "epoch": 0.91, "learning_rate": 0.00016320088340275956, "loss": 0.0118, "step": 351830 }, { "epoch": 0.91, "learning_rate": 0.0001631969951863881, "loss": 0.0153, "step": 351840 }, { "epoch": 0.91, "learning_rate": 0.00016319310697001667, "loss": 0.0149, "step": 351850 }, { "epoch": 0.91, "learning_rate": 0.0001631892187536452, "loss": 0.0129, "step": 351860 }, { "epoch": 0.91, "learning_rate": 0.00016318533053727373, "loss": 0.0214, "step": 351870 }, { "epoch": 0.91, "learning_rate": 0.00016318144232090224, "loss": 0.0118, "step": 351880 }, { "epoch": 0.91, "learning_rate": 0.0001631775541045308, "loss": 0.0176, "step": 351890 }, { "epoch": 0.91, "learning_rate": 0.00016317366588815933, "loss": 0.0122, "step": 351900 }, { "epoch": 0.91, "learning_rate": 0.00016316977767178787, "loss": 0.0121, "step": 351910 }, { "epoch": 0.91, "learning_rate": 0.00016316588945541638, "loss": 0.0122, "step": 351920 }, { "epoch": 0.91, "learning_rate": 0.00016316200123904495, "loss": 0.0124, "step": 351930 }, { "epoch": 0.91, "learning_rate": 0.00016315811302267347, "loss": 0.0119, "step": 351940 }, { "epoch": 0.91, "learning_rate": 0.000163154224806302, "loss": 0.0143, "step": 351950 }, { "epoch": 0.91, "learning_rate": 0.00016315033658993052, "loss": 0.0129, "step": 351960 }, { "epoch": 0.91, "learning_rate": 0.0001631464483735591, "loss": 0.0099, "step": 351970 }, { "epoch": 0.91, "learning_rate": 0.0001631425601571876, "loss": 0.0154, "step": 351980 }, { "epoch": 0.91, "learning_rate": 0.00016313867194081615, "loss": 0.0148, "step": 351990 }, { "epoch": 0.91, "learning_rate": 0.00016313478372444466, "loss": 0.0144, "step": 352000 }, { "epoch": 0.91, "eval_cer": 0.8817558725266665, "eval_loss": 0.00876292772591114, "eval_runtime": 107.5104, "eval_samples_per_second": 18.603, "eval_steps_per_second": 4.651, "step": 352000 }, { "epoch": 0.91, "learning_rate": 0.00016313089550807323, "loss": 0.0124, "step": 352010 }, { "epoch": 0.91, "learning_rate": 0.00016312700729170177, "loss": 0.0125, "step": 352020 }, { "epoch": 0.91, "learning_rate": 0.0001631231190753303, "loss": 0.0131, "step": 352030 }, { "epoch": 0.91, "learning_rate": 0.00016311923085895883, "loss": 0.0111, "step": 352040 }, { "epoch": 0.91, "learning_rate": 0.00016311534264258737, "loss": 0.0144, "step": 352050 }, { "epoch": 0.91, "learning_rate": 0.0001631114544262159, "loss": 0.0144, "step": 352060 }, { "epoch": 0.91, "learning_rate": 0.00016310756620984443, "loss": 0.0121, "step": 352070 }, { "epoch": 0.91, "learning_rate": 0.00016310367799347297, "loss": 0.0152, "step": 352080 }, { "epoch": 0.91, "learning_rate": 0.00016309978977710148, "loss": 0.0124, "step": 352090 }, { "epoch": 0.91, "learning_rate": 0.00016309590156073005, "loss": 0.0125, "step": 352100 }, { "epoch": 0.91, "learning_rate": 0.00016309201334435857, "loss": 0.0114, "step": 352110 }, { "epoch": 0.91, "learning_rate": 0.0001630881251279871, "loss": 0.0166, "step": 352120 }, { "epoch": 0.91, "learning_rate": 0.00016308423691161562, "loss": 0.0121, "step": 352130 }, { "epoch": 0.91, "learning_rate": 0.0001630803486952442, "loss": 0.0124, "step": 352140 }, { "epoch": 0.91, "learning_rate": 0.0001630764604788727, "loss": 0.0103, "step": 352150 }, { "epoch": 0.91, "learning_rate": 0.00016307257226250125, "loss": 0.0108, "step": 352160 }, { "epoch": 0.91, "learning_rate": 0.00016306868404612976, "loss": 0.0117, "step": 352170 }, { "epoch": 0.91, "learning_rate": 0.00016306479582975833, "loss": 0.0162, "step": 352180 }, { "epoch": 0.91, "learning_rate": 0.00016306090761338687, "loss": 0.0114, "step": 352190 }, { "epoch": 0.91, "learning_rate": 0.0001630570193970154, "loss": 0.0122, "step": 352200 }, { "epoch": 0.91, "learning_rate": 0.0001630531311806439, "loss": 0.0139, "step": 352210 }, { "epoch": 0.91, "learning_rate": 0.00016304924296427247, "loss": 0.0115, "step": 352220 }, { "epoch": 0.91, "learning_rate": 0.000163045354747901, "loss": 0.0121, "step": 352230 }, { "epoch": 0.91, "learning_rate": 0.00016304146653152953, "loss": 0.0167, "step": 352240 }, { "epoch": 0.91, "learning_rate": 0.00016303757831515807, "loss": 0.0131, "step": 352250 }, { "epoch": 0.91, "learning_rate": 0.0001630336900987866, "loss": 0.0127, "step": 352260 }, { "epoch": 0.91, "learning_rate": 0.00016302980188241515, "loss": 0.0141, "step": 352270 }, { "epoch": 0.91, "learning_rate": 0.00016302591366604367, "loss": 0.0156, "step": 352280 }, { "epoch": 0.91, "learning_rate": 0.0001630220254496722, "loss": 0.0114, "step": 352290 }, { "epoch": 0.91, "learning_rate": 0.00016301813723330075, "loss": 0.0125, "step": 352300 }, { "epoch": 0.91, "learning_rate": 0.0001630142490169293, "loss": 0.0097, "step": 352310 }, { "epoch": 0.91, "learning_rate": 0.0001630103608005578, "loss": 0.0132, "step": 352320 }, { "epoch": 0.91, "learning_rate": 0.00016300647258418635, "loss": 0.0143, "step": 352330 }, { "epoch": 0.91, "learning_rate": 0.00016300258436781486, "loss": 0.0107, "step": 352340 }, { "epoch": 0.91, "learning_rate": 0.00016299869615144343, "loss": 0.0151, "step": 352350 }, { "epoch": 0.91, "learning_rate": 0.00016299480793507195, "loss": 0.0128, "step": 352360 }, { "epoch": 0.91, "learning_rate": 0.0001629909197187005, "loss": 0.0159, "step": 352370 }, { "epoch": 0.91, "learning_rate": 0.000162987031502329, "loss": 0.0097, "step": 352380 }, { "epoch": 0.91, "learning_rate": 0.00016298314328595757, "loss": 0.0144, "step": 352390 }, { "epoch": 0.91, "learning_rate": 0.0001629792550695861, "loss": 0.0133, "step": 352400 }, { "epoch": 0.91, "learning_rate": 0.00016297536685321463, "loss": 0.0147, "step": 352410 }, { "epoch": 0.91, "learning_rate": 0.00016297147863684317, "loss": 0.0148, "step": 352420 }, { "epoch": 0.91, "learning_rate": 0.0001629675904204717, "loss": 0.0107, "step": 352430 }, { "epoch": 0.91, "learning_rate": 0.00016296370220410025, "loss": 0.0123, "step": 352440 }, { "epoch": 0.91, "learning_rate": 0.00016295981398772877, "loss": 0.0131, "step": 352450 }, { "epoch": 0.91, "learning_rate": 0.0001629559257713573, "loss": 0.0133, "step": 352460 }, { "epoch": 0.91, "learning_rate": 0.00016295203755498585, "loss": 0.0141, "step": 352470 }, { "epoch": 0.91, "learning_rate": 0.0001629481493386144, "loss": 0.0149, "step": 352480 }, { "epoch": 0.91, "learning_rate": 0.0001629442611222429, "loss": 0.0158, "step": 352490 }, { "epoch": 0.91, "learning_rate": 0.00016294037290587145, "loss": 0.0139, "step": 352500 }, { "epoch": 0.91, "learning_rate": 0.00016293648468950002, "loss": 0.0128, "step": 352510 }, { "epoch": 0.91, "learning_rate": 0.00016293259647312853, "loss": 0.0172, "step": 352520 }, { "epoch": 0.91, "learning_rate": 0.00016292870825675704, "loss": 0.0123, "step": 352530 }, { "epoch": 0.91, "learning_rate": 0.00016292482004038559, "loss": 0.0138, "step": 352540 }, { "epoch": 0.91, "learning_rate": 0.00016292093182401415, "loss": 0.0185, "step": 352550 }, { "epoch": 0.91, "learning_rate": 0.00016291704360764267, "loss": 0.0181, "step": 352560 }, { "epoch": 0.91, "learning_rate": 0.0001629131553912712, "loss": 0.0125, "step": 352570 }, { "epoch": 0.91, "learning_rate": 0.00016290926717489973, "loss": 0.017, "step": 352580 }, { "epoch": 0.91, "learning_rate": 0.00016290537895852827, "loss": 0.0189, "step": 352590 }, { "epoch": 0.91, "learning_rate": 0.0001629014907421568, "loss": 0.015, "step": 352600 }, { "epoch": 0.91, "learning_rate": 0.00016289760252578535, "loss": 0.016, "step": 352610 }, { "epoch": 0.91, "learning_rate": 0.00016289371430941386, "loss": 0.011, "step": 352620 }, { "epoch": 0.91, "learning_rate": 0.0001628898260930424, "loss": 0.0144, "step": 352630 }, { "epoch": 0.91, "learning_rate": 0.00016288593787667095, "loss": 0.0095, "step": 352640 }, { "epoch": 0.91, "learning_rate": 0.0001628820496602995, "loss": 0.0119, "step": 352650 }, { "epoch": 0.91, "learning_rate": 0.000162878161443928, "loss": 0.0111, "step": 352660 }, { "epoch": 0.91, "learning_rate": 0.00016287427322755655, "loss": 0.0159, "step": 352670 }, { "epoch": 0.91, "learning_rate": 0.0001628703850111851, "loss": 0.0138, "step": 352680 }, { "epoch": 0.91, "learning_rate": 0.00016286649679481363, "loss": 0.0142, "step": 352690 }, { "epoch": 0.91, "learning_rate": 0.00016286260857844214, "loss": 0.0124, "step": 352700 }, { "epoch": 0.91, "learning_rate": 0.00016285872036207069, "loss": 0.0107, "step": 352710 }, { "epoch": 0.91, "learning_rate": 0.00016285483214569925, "loss": 0.0121, "step": 352720 }, { "epoch": 0.91, "learning_rate": 0.00016285094392932777, "loss": 0.0152, "step": 352730 }, { "epoch": 0.91, "learning_rate": 0.0001628470557129563, "loss": 0.0126, "step": 352740 }, { "epoch": 0.91, "learning_rate": 0.00016284316749658482, "loss": 0.0114, "step": 352750 }, { "epoch": 0.91, "learning_rate": 0.0001628392792802134, "loss": 0.0123, "step": 352760 }, { "epoch": 0.91, "learning_rate": 0.0001628353910638419, "loss": 0.0154, "step": 352770 }, { "epoch": 0.91, "learning_rate": 0.00016283150284747045, "loss": 0.0162, "step": 352780 }, { "epoch": 0.91, "learning_rate": 0.00016282761463109896, "loss": 0.0139, "step": 352790 }, { "epoch": 0.91, "learning_rate": 0.00016282372641472753, "loss": 0.0112, "step": 352800 }, { "epoch": 0.91, "learning_rate": 0.00016281983819835605, "loss": 0.014, "step": 352810 }, { "epoch": 0.91, "learning_rate": 0.0001628159499819846, "loss": 0.0126, "step": 352820 }, { "epoch": 0.91, "learning_rate": 0.0001628120617656131, "loss": 0.0196, "step": 352830 }, { "epoch": 0.91, "learning_rate": 0.00016280817354924165, "loss": 0.0138, "step": 352840 }, { "epoch": 0.91, "learning_rate": 0.0001628042853328702, "loss": 0.0122, "step": 352850 }, { "epoch": 0.91, "learning_rate": 0.00016280039711649873, "loss": 0.015, "step": 352860 }, { "epoch": 0.91, "learning_rate": 0.00016279650890012724, "loss": 0.0129, "step": 352870 }, { "epoch": 0.91, "learning_rate": 0.00016279262068375578, "loss": 0.0111, "step": 352880 }, { "epoch": 0.91, "learning_rate": 0.00016278873246738435, "loss": 0.0173, "step": 352890 }, { "epoch": 0.91, "learning_rate": 0.00016278484425101287, "loss": 0.014, "step": 352900 }, { "epoch": 0.91, "learning_rate": 0.0001627809560346414, "loss": 0.0137, "step": 352910 }, { "epoch": 0.91, "learning_rate": 0.00016277706781826992, "loss": 0.0107, "step": 352920 }, { "epoch": 0.91, "learning_rate": 0.0001627731796018985, "loss": 0.0155, "step": 352930 }, { "epoch": 0.91, "learning_rate": 0.000162769291385527, "loss": 0.0101, "step": 352940 }, { "epoch": 0.91, "learning_rate": 0.00016276540316915555, "loss": 0.0157, "step": 352950 }, { "epoch": 0.91, "learning_rate": 0.00016276151495278406, "loss": 0.0117, "step": 352960 }, { "epoch": 0.91, "learning_rate": 0.00016275762673641263, "loss": 0.0151, "step": 352970 }, { "epoch": 0.91, "learning_rate": 0.00016275373852004115, "loss": 0.0148, "step": 352980 }, { "epoch": 0.92, "learning_rate": 0.0001627498503036697, "loss": 0.0178, "step": 352990 }, { "epoch": 0.92, "learning_rate": 0.0001627459620872982, "loss": 0.0131, "step": 353000 }, { "epoch": 0.92, "eval_cer": 0.8817110841447728, "eval_loss": 0.008378801867365837, "eval_runtime": 107.4189, "eval_samples_per_second": 18.619, "eval_steps_per_second": 4.655, "step": 353000 }, { "epoch": 0.92, "learning_rate": 0.00016274207387092677, "loss": 0.013, "step": 353010 }, { "epoch": 0.92, "learning_rate": 0.0001627381856545553, "loss": 0.0122, "step": 353020 }, { "epoch": 0.92, "learning_rate": 0.00016273429743818383, "loss": 0.0135, "step": 353030 }, { "epoch": 0.92, "learning_rate": 0.00016273040922181234, "loss": 0.0148, "step": 353040 }, { "epoch": 0.92, "learning_rate": 0.0001627265210054409, "loss": 0.0135, "step": 353050 }, { "epoch": 0.92, "learning_rate": 0.00016272263278906945, "loss": 0.0146, "step": 353060 }, { "epoch": 0.92, "learning_rate": 0.00016271874457269797, "loss": 0.0148, "step": 353070 }, { "epoch": 0.92, "learning_rate": 0.00016271485635632648, "loss": 0.0171, "step": 353080 }, { "epoch": 0.92, "learning_rate": 0.00016271096813995502, "loss": 0.0113, "step": 353090 }, { "epoch": 0.92, "learning_rate": 0.0001627070799235836, "loss": 0.0168, "step": 353100 }, { "epoch": 0.92, "learning_rate": 0.0001627031917072121, "loss": 0.0115, "step": 353110 }, { "epoch": 0.92, "learning_rate": 0.00016269930349084065, "loss": 0.0141, "step": 353120 }, { "epoch": 0.92, "learning_rate": 0.00016269541527446916, "loss": 0.0156, "step": 353130 }, { "epoch": 0.92, "learning_rate": 0.00016269152705809773, "loss": 0.0131, "step": 353140 }, { "epoch": 0.92, "learning_rate": 0.00016268763884172625, "loss": 0.0107, "step": 353150 }, { "epoch": 0.92, "learning_rate": 0.0001626837506253548, "loss": 0.0136, "step": 353160 }, { "epoch": 0.92, "learning_rate": 0.0001626798624089833, "loss": 0.0134, "step": 353170 }, { "epoch": 0.92, "learning_rate": 0.00016267597419261187, "loss": 0.009, "step": 353180 }, { "epoch": 0.92, "learning_rate": 0.00016267208597624039, "loss": 0.0111, "step": 353190 }, { "epoch": 0.92, "learning_rate": 0.00016266819775986893, "loss": 0.0157, "step": 353200 }, { "epoch": 0.92, "learning_rate": 0.00016266430954349744, "loss": 0.0124, "step": 353210 }, { "epoch": 0.92, "learning_rate": 0.000162660421327126, "loss": 0.0112, "step": 353220 }, { "epoch": 0.92, "learning_rate": 0.00016265653311075453, "loss": 0.0127, "step": 353230 }, { "epoch": 0.92, "learning_rate": 0.00016265264489438307, "loss": 0.0172, "step": 353240 }, { "epoch": 0.92, "learning_rate": 0.00016264875667801158, "loss": 0.0131, "step": 353250 }, { "epoch": 0.92, "learning_rate": 0.00016264486846164015, "loss": 0.011, "step": 353260 }, { "epoch": 0.92, "learning_rate": 0.0001626409802452687, "loss": 0.0141, "step": 353270 }, { "epoch": 0.92, "learning_rate": 0.0001626370920288972, "loss": 0.014, "step": 353280 }, { "epoch": 0.92, "learning_rate": 0.00016263320381252575, "loss": 0.0171, "step": 353290 }, { "epoch": 0.92, "learning_rate": 0.0001626293155961543, "loss": 0.0115, "step": 353300 }, { "epoch": 0.92, "learning_rate": 0.00016262542737978283, "loss": 0.0106, "step": 353310 }, { "epoch": 0.92, "learning_rate": 0.00016262153916341135, "loss": 0.0134, "step": 353320 }, { "epoch": 0.92, "learning_rate": 0.0001626176509470399, "loss": 0.0164, "step": 353330 }, { "epoch": 0.92, "learning_rate": 0.0001626137627306684, "loss": 0.0148, "step": 353340 }, { "epoch": 0.92, "learning_rate": 0.00016260987451429697, "loss": 0.0106, "step": 353350 }, { "epoch": 0.92, "learning_rate": 0.00016260598629792549, "loss": 0.014, "step": 353360 }, { "epoch": 0.92, "learning_rate": 0.00016260209808155403, "loss": 0.0132, "step": 353370 }, { "epoch": 0.92, "learning_rate": 0.00016259820986518254, "loss": 0.0107, "step": 353380 }, { "epoch": 0.92, "learning_rate": 0.0001625943216488111, "loss": 0.017, "step": 353390 }, { "epoch": 0.92, "learning_rate": 0.00016259043343243962, "loss": 0.0173, "step": 353400 }, { "epoch": 0.92, "learning_rate": 0.00016258654521606817, "loss": 0.0128, "step": 353410 }, { "epoch": 0.92, "learning_rate": 0.00016258265699969668, "loss": 0.0138, "step": 353420 }, { "epoch": 0.92, "learning_rate": 0.00016257876878332525, "loss": 0.0146, "step": 353430 }, { "epoch": 0.92, "learning_rate": 0.0001625748805669538, "loss": 0.016, "step": 353440 }, { "epoch": 0.92, "learning_rate": 0.0001625709923505823, "loss": 0.0113, "step": 353450 }, { "epoch": 0.92, "learning_rate": 0.00016256710413421085, "loss": 0.0134, "step": 353460 }, { "epoch": 0.92, "learning_rate": 0.0001625632159178394, "loss": 0.0123, "step": 353470 }, { "epoch": 0.92, "learning_rate": 0.00016255932770146793, "loss": 0.0156, "step": 353480 }, { "epoch": 0.92, "learning_rate": 0.00016255543948509645, "loss": 0.0127, "step": 353490 }, { "epoch": 0.92, "learning_rate": 0.000162551551268725, "loss": 0.0143, "step": 353500 }, { "epoch": 0.92, "learning_rate": 0.00016254766305235353, "loss": 0.0148, "step": 353510 }, { "epoch": 0.92, "learning_rate": 0.00016254377483598207, "loss": 0.0143, "step": 353520 }, { "epoch": 0.92, "learning_rate": 0.00016253988661961058, "loss": 0.0136, "step": 353530 }, { "epoch": 0.92, "learning_rate": 0.00016253599840323913, "loss": 0.0148, "step": 353540 }, { "epoch": 0.92, "learning_rate": 0.00016253211018686767, "loss": 0.0122, "step": 353550 }, { "epoch": 0.92, "learning_rate": 0.0001625282219704962, "loss": 0.0133, "step": 353560 }, { "epoch": 0.92, "learning_rate": 0.00016252433375412472, "loss": 0.0122, "step": 353570 }, { "epoch": 0.92, "learning_rate": 0.00016252044553775327, "loss": 0.0129, "step": 353580 }, { "epoch": 0.92, "learning_rate": 0.00016251655732138178, "loss": 0.014, "step": 353590 }, { "epoch": 0.92, "learning_rate": 0.00016251266910501035, "loss": 0.0157, "step": 353600 }, { "epoch": 0.92, "learning_rate": 0.0001625087808886389, "loss": 0.0113, "step": 353610 }, { "epoch": 0.92, "learning_rate": 0.0001625048926722674, "loss": 0.0153, "step": 353620 }, { "epoch": 0.92, "learning_rate": 0.00016250100445589595, "loss": 0.0147, "step": 353630 }, { "epoch": 0.92, "learning_rate": 0.0001624971162395245, "loss": 0.0154, "step": 353640 }, { "epoch": 0.92, "learning_rate": 0.00016249322802315303, "loss": 0.0154, "step": 353650 }, { "epoch": 0.92, "learning_rate": 0.00016248933980678154, "loss": 0.0105, "step": 353660 }, { "epoch": 0.92, "learning_rate": 0.00016248545159041009, "loss": 0.012, "step": 353670 }, { "epoch": 0.92, "learning_rate": 0.00016248156337403863, "loss": 0.0156, "step": 353680 }, { "epoch": 0.92, "learning_rate": 0.00016247767515766717, "loss": 0.0128, "step": 353690 }, { "epoch": 0.92, "learning_rate": 0.00016247378694129568, "loss": 0.0139, "step": 353700 }, { "epoch": 0.92, "learning_rate": 0.00016246989872492423, "loss": 0.0119, "step": 353710 }, { "epoch": 0.92, "learning_rate": 0.00016246601050855277, "loss": 0.0174, "step": 353720 }, { "epoch": 0.92, "learning_rate": 0.0001624621222921813, "loss": 0.0117, "step": 353730 }, { "epoch": 0.92, "learning_rate": 0.00016245823407580982, "loss": 0.012, "step": 353740 }, { "epoch": 0.92, "learning_rate": 0.00016245434585943837, "loss": 0.0131, "step": 353750 }, { "epoch": 0.92, "learning_rate": 0.00016245045764306693, "loss": 0.0145, "step": 353760 }, { "epoch": 0.92, "learning_rate": 0.00016244656942669545, "loss": 0.01, "step": 353770 }, { "epoch": 0.92, "learning_rate": 0.000162442681210324, "loss": 0.0111, "step": 353780 }, { "epoch": 0.92, "learning_rate": 0.0001624387929939525, "loss": 0.0151, "step": 353790 }, { "epoch": 0.92, "learning_rate": 0.00016243490477758107, "loss": 0.0142, "step": 353800 }, { "epoch": 0.92, "learning_rate": 0.0001624310165612096, "loss": 0.0167, "step": 353810 }, { "epoch": 0.92, "learning_rate": 0.00016242712834483813, "loss": 0.0112, "step": 353820 }, { "epoch": 0.92, "learning_rate": 0.00016242324012846664, "loss": 0.0156, "step": 353830 }, { "epoch": 0.92, "learning_rate": 0.00016241935191209519, "loss": 0.013, "step": 353840 }, { "epoch": 0.92, "learning_rate": 0.00016241546369572373, "loss": 0.0118, "step": 353850 }, { "epoch": 0.92, "learning_rate": 0.00016241157547935227, "loss": 0.0149, "step": 353860 }, { "epoch": 0.92, "learning_rate": 0.00016240768726298078, "loss": 0.0106, "step": 353870 }, { "epoch": 0.92, "learning_rate": 0.00016240379904660933, "loss": 0.0146, "step": 353880 }, { "epoch": 0.92, "learning_rate": 0.00016239991083023787, "loss": 0.0116, "step": 353890 }, { "epoch": 0.92, "learning_rate": 0.0001623960226138664, "loss": 0.0115, "step": 353900 }, { "epoch": 0.92, "learning_rate": 0.00016239213439749492, "loss": 0.0154, "step": 353910 }, { "epoch": 0.92, "learning_rate": 0.00016238824618112346, "loss": 0.0144, "step": 353920 }, { "epoch": 0.92, "learning_rate": 0.00016238435796475203, "loss": 0.0148, "step": 353930 }, { "epoch": 0.92, "learning_rate": 0.00016238046974838055, "loss": 0.0112, "step": 353940 }, { "epoch": 0.92, "learning_rate": 0.00016237658153200906, "loss": 0.0122, "step": 353950 }, { "epoch": 0.92, "learning_rate": 0.0001623726933156376, "loss": 0.0114, "step": 353960 }, { "epoch": 0.92, "learning_rate": 0.00016236880509926617, "loss": 0.0136, "step": 353970 }, { "epoch": 0.92, "learning_rate": 0.0001623649168828947, "loss": 0.0154, "step": 353980 }, { "epoch": 0.92, "learning_rate": 0.00016236102866652323, "loss": 0.0127, "step": 353990 }, { "epoch": 0.92, "learning_rate": 0.00016235714045015174, "loss": 0.0125, "step": 354000 }, { "epoch": 0.92, "eval_cer": 0.8817684692590742, "eval_loss": 0.008665827102959156, "eval_runtime": 107.3976, "eval_samples_per_second": 18.622, "eval_steps_per_second": 4.656, "step": 354000 }, { "epoch": 0.92, "learning_rate": 0.0001623532522337803, "loss": 0.0149, "step": 354010 }, { "epoch": 0.92, "learning_rate": 0.00016234936401740883, "loss": 0.0122, "step": 354020 }, { "epoch": 0.92, "learning_rate": 0.00016234547580103737, "loss": 0.0127, "step": 354030 }, { "epoch": 0.92, "learning_rate": 0.00016234158758466588, "loss": 0.014, "step": 354040 }, { "epoch": 0.92, "learning_rate": 0.00016233769936829442, "loss": 0.0109, "step": 354050 }, { "epoch": 0.92, "learning_rate": 0.00016233381115192297, "loss": 0.016, "step": 354060 }, { "epoch": 0.92, "learning_rate": 0.0001623299229355515, "loss": 0.011, "step": 354070 }, { "epoch": 0.92, "learning_rate": 0.00016232603471918002, "loss": 0.0137, "step": 354080 }, { "epoch": 0.92, "learning_rate": 0.00016232214650280856, "loss": 0.0117, "step": 354090 }, { "epoch": 0.92, "learning_rate": 0.00016231825828643713, "loss": 0.0103, "step": 354100 }, { "epoch": 0.92, "learning_rate": 0.00016231437007006565, "loss": 0.0125, "step": 354110 }, { "epoch": 0.92, "learning_rate": 0.00016231048185369416, "loss": 0.0132, "step": 354120 }, { "epoch": 0.92, "learning_rate": 0.0001623065936373227, "loss": 0.0113, "step": 354130 }, { "epoch": 0.92, "learning_rate": 0.00016230270542095127, "loss": 0.014, "step": 354140 }, { "epoch": 0.92, "learning_rate": 0.0001622988172045798, "loss": 0.0105, "step": 354150 }, { "epoch": 0.92, "learning_rate": 0.00016229492898820833, "loss": 0.0103, "step": 354160 }, { "epoch": 0.92, "learning_rate": 0.00016229104077183684, "loss": 0.0125, "step": 354170 }, { "epoch": 0.92, "learning_rate": 0.0001622871525554654, "loss": 0.011, "step": 354180 }, { "epoch": 0.92, "learning_rate": 0.00016228326433909393, "loss": 0.0128, "step": 354190 }, { "epoch": 0.92, "learning_rate": 0.00016227937612272247, "loss": 0.014, "step": 354200 }, { "epoch": 0.92, "learning_rate": 0.00016227548790635098, "loss": 0.0125, "step": 354210 }, { "epoch": 0.92, "learning_rate": 0.00016227159968997955, "loss": 0.0143, "step": 354220 }, { "epoch": 0.92, "learning_rate": 0.00016226771147360807, "loss": 0.0128, "step": 354230 }, { "epoch": 0.92, "learning_rate": 0.0001622638232572366, "loss": 0.0104, "step": 354240 }, { "epoch": 0.92, "learning_rate": 0.00016225993504086512, "loss": 0.011, "step": 354250 }, { "epoch": 0.92, "learning_rate": 0.0001622560468244937, "loss": 0.0111, "step": 354260 }, { "epoch": 0.92, "learning_rate": 0.0001622521586081222, "loss": 0.0128, "step": 354270 }, { "epoch": 0.92, "learning_rate": 0.00016224827039175075, "loss": 0.013, "step": 354280 }, { "epoch": 0.92, "learning_rate": 0.00016224438217537926, "loss": 0.0156, "step": 354290 }, { "epoch": 0.92, "learning_rate": 0.0001622404939590078, "loss": 0.0145, "step": 354300 }, { "epoch": 0.92, "learning_rate": 0.00016223660574263637, "loss": 0.0128, "step": 354310 }, { "epoch": 0.92, "learning_rate": 0.00016223271752626489, "loss": 0.0131, "step": 354320 }, { "epoch": 0.92, "learning_rate": 0.00016222882930989343, "loss": 0.0111, "step": 354330 }, { "epoch": 0.92, "learning_rate": 0.00016222494109352194, "loss": 0.0137, "step": 354340 }, { "epoch": 0.92, "learning_rate": 0.0001622210528771505, "loss": 0.016, "step": 354350 }, { "epoch": 0.92, "learning_rate": 0.00016221716466077903, "loss": 0.012, "step": 354360 }, { "epoch": 0.92, "learning_rate": 0.00016221327644440757, "loss": 0.012, "step": 354370 }, { "epoch": 0.92, "learning_rate": 0.00016220938822803608, "loss": 0.0124, "step": 354380 }, { "epoch": 0.92, "learning_rate": 0.00016220550001166465, "loss": 0.0101, "step": 354390 }, { "epoch": 0.92, "learning_rate": 0.00016220161179529317, "loss": 0.012, "step": 354400 }, { "epoch": 0.92, "learning_rate": 0.0001621977235789217, "loss": 0.0133, "step": 354410 }, { "epoch": 0.92, "learning_rate": 0.00016219383536255022, "loss": 0.0108, "step": 354420 }, { "epoch": 0.92, "learning_rate": 0.0001621899471461788, "loss": 0.0124, "step": 354430 }, { "epoch": 0.92, "learning_rate": 0.0001621860589298073, "loss": 0.0134, "step": 354440 }, { "epoch": 0.92, "learning_rate": 0.00016218217071343585, "loss": 0.0121, "step": 354450 }, { "epoch": 0.92, "learning_rate": 0.00016217828249706436, "loss": 0.0106, "step": 354460 }, { "epoch": 0.92, "learning_rate": 0.00016217439428069293, "loss": 0.0139, "step": 354470 }, { "epoch": 0.92, "learning_rate": 0.00016217050606432147, "loss": 0.0178, "step": 354480 }, { "epoch": 0.92, "learning_rate": 0.00016216661784794999, "loss": 0.0159, "step": 354490 }, { "epoch": 0.92, "learning_rate": 0.00016216272963157853, "loss": 0.0123, "step": 354500 }, { "epoch": 0.92, "learning_rate": 0.00016215884141520707, "loss": 0.0156, "step": 354510 }, { "epoch": 0.92, "learning_rate": 0.0001621549531988356, "loss": 0.0145, "step": 354520 }, { "epoch": 0.92, "learning_rate": 0.00016215106498246413, "loss": 0.0115, "step": 354530 }, { "epoch": 0.92, "learning_rate": 0.00016214717676609267, "loss": 0.0113, "step": 354540 }, { "epoch": 0.92, "learning_rate": 0.00016214328854972118, "loss": 0.0106, "step": 354550 }, { "epoch": 0.92, "learning_rate": 0.00016213940033334975, "loss": 0.0155, "step": 354560 }, { "epoch": 0.92, "learning_rate": 0.00016213551211697826, "loss": 0.0129, "step": 354570 }, { "epoch": 0.92, "learning_rate": 0.0001621316239006068, "loss": 0.014, "step": 354580 }, { "epoch": 0.92, "learning_rate": 0.00016212773568423532, "loss": 0.0099, "step": 354590 }, { "epoch": 0.92, "learning_rate": 0.0001621238474678639, "loss": 0.018, "step": 354600 }, { "epoch": 0.92, "learning_rate": 0.0001621199592514924, "loss": 0.0125, "step": 354610 }, { "epoch": 0.92, "learning_rate": 0.00016211607103512095, "loss": 0.0151, "step": 354620 }, { "epoch": 0.92, "learning_rate": 0.00016211218281874946, "loss": 0.0129, "step": 354630 }, { "epoch": 0.92, "learning_rate": 0.00016210829460237803, "loss": 0.0156, "step": 354640 }, { "epoch": 0.92, "learning_rate": 0.00016210440638600657, "loss": 0.0119, "step": 354650 }, { "epoch": 0.92, "learning_rate": 0.00016210051816963509, "loss": 0.014, "step": 354660 }, { "epoch": 0.92, "learning_rate": 0.0001620966299532636, "loss": 0.0199, "step": 354670 }, { "epoch": 0.92, "learning_rate": 0.00016209274173689217, "loss": 0.0124, "step": 354680 }, { "epoch": 0.92, "learning_rate": 0.0001620888535205207, "loss": 0.0132, "step": 354690 }, { "epoch": 0.92, "learning_rate": 0.00016208496530414922, "loss": 0.0135, "step": 354700 }, { "epoch": 0.92, "learning_rate": 0.00016208107708777777, "loss": 0.0136, "step": 354710 }, { "epoch": 0.92, "learning_rate": 0.0001620771888714063, "loss": 0.0111, "step": 354720 }, { "epoch": 0.92, "learning_rate": 0.00016207330065503485, "loss": 0.0119, "step": 354730 }, { "epoch": 0.92, "learning_rate": 0.00016206941243866336, "loss": 0.0146, "step": 354740 }, { "epoch": 0.92, "learning_rate": 0.0001620655242222919, "loss": 0.0138, "step": 354750 }, { "epoch": 0.92, "learning_rate": 0.00016206163600592045, "loss": 0.0143, "step": 354760 }, { "epoch": 0.92, "learning_rate": 0.000162057747789549, "loss": 0.0127, "step": 354770 }, { "epoch": 0.92, "learning_rate": 0.0001620538595731775, "loss": 0.0126, "step": 354780 }, { "epoch": 0.92, "learning_rate": 0.00016204997135680605, "loss": 0.0139, "step": 354790 }, { "epoch": 0.92, "learning_rate": 0.00016204608314043456, "loss": 0.0114, "step": 354800 }, { "epoch": 0.92, "learning_rate": 0.00016204219492406313, "loss": 0.0151, "step": 354810 }, { "epoch": 0.92, "learning_rate": 0.00016203830670769164, "loss": 0.0123, "step": 354820 }, { "epoch": 0.92, "learning_rate": 0.00016203441849132018, "loss": 0.0137, "step": 354830 }, { "epoch": 0.92, "learning_rate": 0.0001620305302749487, "loss": 0.0121, "step": 354840 }, { "epoch": 0.92, "learning_rate": 0.00016202664205857727, "loss": 0.0167, "step": 354850 }, { "epoch": 0.92, "learning_rate": 0.0001620227538422058, "loss": 0.0114, "step": 354860 }, { "epoch": 0.92, "learning_rate": 0.00016201886562583432, "loss": 0.0126, "step": 354870 }, { "epoch": 0.92, "learning_rate": 0.00016201497740946287, "loss": 0.0157, "step": 354880 }, { "epoch": 0.92, "learning_rate": 0.0001620110891930914, "loss": 0.0117, "step": 354890 }, { "epoch": 0.92, "learning_rate": 0.00016200720097671995, "loss": 0.0128, "step": 354900 }, { "epoch": 0.92, "learning_rate": 0.00016200331276034846, "loss": 0.0117, "step": 354910 }, { "epoch": 0.92, "learning_rate": 0.000161999424543977, "loss": 0.0104, "step": 354920 }, { "epoch": 0.92, "learning_rate": 0.00016199553632760555, "loss": 0.0147, "step": 354930 }, { "epoch": 0.92, "learning_rate": 0.0001619916481112341, "loss": 0.0124, "step": 354940 }, { "epoch": 0.92, "learning_rate": 0.0001619877598948626, "loss": 0.0166, "step": 354950 }, { "epoch": 0.92, "learning_rate": 0.00016198387167849114, "loss": 0.009, "step": 354960 }, { "epoch": 0.92, "learning_rate": 0.0001619799834621197, "loss": 0.0144, "step": 354970 }, { "epoch": 0.92, "learning_rate": 0.00016197609524574823, "loss": 0.0111, "step": 354980 }, { "epoch": 0.92, "learning_rate": 0.00016197220702937674, "loss": 0.0142, "step": 354990 }, { "epoch": 0.92, "learning_rate": 0.00016196831881300528, "loss": 0.009, "step": 355000 }, { "epoch": 0.92, "eval_cer": 0.8817362776095881, "eval_loss": 0.008503294549882412, "eval_runtime": 107.342, "eval_samples_per_second": 18.632, "eval_steps_per_second": 4.658, "step": 355000 }, { "epoch": 0.92, "learning_rate": 0.00016196443059663385, "loss": 0.0141, "step": 355010 }, { "epoch": 0.92, "learning_rate": 0.00016196054238026237, "loss": 0.0128, "step": 355020 }, { "epoch": 0.92, "learning_rate": 0.0001619566541638909, "loss": 0.0149, "step": 355030 }, { "epoch": 0.92, "learning_rate": 0.00016195276594751942, "loss": 0.0188, "step": 355040 }, { "epoch": 0.92, "learning_rate": 0.00016194887773114797, "loss": 0.016, "step": 355050 }, { "epoch": 0.92, "learning_rate": 0.0001619449895147765, "loss": 0.0166, "step": 355060 }, { "epoch": 0.92, "learning_rate": 0.00016194110129840505, "loss": 0.0111, "step": 355070 }, { "epoch": 0.92, "learning_rate": 0.00016193721308203356, "loss": 0.0151, "step": 355080 }, { "epoch": 0.92, "learning_rate": 0.0001619333248656621, "loss": 0.0161, "step": 355090 }, { "epoch": 0.92, "learning_rate": 0.00016192943664929065, "loss": 0.0102, "step": 355100 }, { "epoch": 0.92, "learning_rate": 0.0001619255484329192, "loss": 0.0149, "step": 355110 }, { "epoch": 0.92, "learning_rate": 0.0001619216602165477, "loss": 0.0139, "step": 355120 }, { "epoch": 0.92, "learning_rate": 0.00016191777200017624, "loss": 0.0128, "step": 355130 }, { "epoch": 0.92, "learning_rate": 0.00016191388378380479, "loss": 0.0138, "step": 355140 }, { "epoch": 0.92, "learning_rate": 0.00016190999556743333, "loss": 0.0144, "step": 355150 }, { "epoch": 0.92, "learning_rate": 0.00016190610735106184, "loss": 0.0154, "step": 355160 }, { "epoch": 0.92, "learning_rate": 0.00016190221913469038, "loss": 0.0107, "step": 355170 }, { "epoch": 0.92, "learning_rate": 0.00016189833091831895, "loss": 0.0125, "step": 355180 }, { "epoch": 0.92, "learning_rate": 0.00016189444270194747, "loss": 0.0169, "step": 355190 }, { "epoch": 0.92, "learning_rate": 0.000161890554485576, "loss": 0.017, "step": 355200 }, { "epoch": 0.92, "learning_rate": 0.00016188666626920452, "loss": 0.012, "step": 355210 }, { "epoch": 0.92, "learning_rate": 0.0001618827780528331, "loss": 0.0109, "step": 355220 }, { "epoch": 0.92, "learning_rate": 0.0001618788898364616, "loss": 0.0107, "step": 355230 }, { "epoch": 0.92, "learning_rate": 0.00016187500162009015, "loss": 0.0145, "step": 355240 }, { "epoch": 0.92, "learning_rate": 0.00016187111340371866, "loss": 0.0137, "step": 355250 }, { "epoch": 0.92, "learning_rate": 0.00016186722518734723, "loss": 0.0119, "step": 355260 }, { "epoch": 0.92, "learning_rate": 0.00016186333697097575, "loss": 0.0117, "step": 355270 }, { "epoch": 0.92, "learning_rate": 0.0001618594487546043, "loss": 0.0153, "step": 355280 }, { "epoch": 0.92, "learning_rate": 0.0001618555605382328, "loss": 0.0158, "step": 355290 }, { "epoch": 0.92, "learning_rate": 0.00016185167232186134, "loss": 0.0111, "step": 355300 }, { "epoch": 0.92, "learning_rate": 0.00016184778410548989, "loss": 0.0133, "step": 355310 }, { "epoch": 0.92, "learning_rate": 0.00016184389588911843, "loss": 0.0114, "step": 355320 }, { "epoch": 0.92, "learning_rate": 0.00016184000767274694, "loss": 0.0124, "step": 355330 }, { "epoch": 0.92, "learning_rate": 0.00016183611945637548, "loss": 0.0182, "step": 355340 }, { "epoch": 0.92, "learning_rate": 0.00016183223124000405, "loss": 0.0121, "step": 355350 }, { "epoch": 0.92, "learning_rate": 0.00016182834302363257, "loss": 0.0144, "step": 355360 }, { "epoch": 0.92, "learning_rate": 0.0001618244548072611, "loss": 0.0114, "step": 355370 }, { "epoch": 0.92, "learning_rate": 0.00016182056659088962, "loss": 0.0119, "step": 355380 }, { "epoch": 0.92, "learning_rate": 0.0001618166783745182, "loss": 0.0098, "step": 355390 }, { "epoch": 0.92, "learning_rate": 0.0001618127901581467, "loss": 0.0154, "step": 355400 }, { "epoch": 0.92, "learning_rate": 0.00016180890194177525, "loss": 0.0128, "step": 355410 }, { "epoch": 0.92, "learning_rate": 0.00016180501372540376, "loss": 0.0148, "step": 355420 }, { "epoch": 0.92, "learning_rate": 0.00016180112550903233, "loss": 0.0137, "step": 355430 }, { "epoch": 0.92, "learning_rate": 0.00016179723729266084, "loss": 0.0139, "step": 355440 }, { "epoch": 0.92, "learning_rate": 0.0001617933490762894, "loss": 0.0124, "step": 355450 }, { "epoch": 0.92, "learning_rate": 0.0001617894608599179, "loss": 0.0155, "step": 355460 }, { "epoch": 0.92, "learning_rate": 0.00016178557264354647, "loss": 0.0142, "step": 355470 }, { "epoch": 0.92, "learning_rate": 0.00016178168442717498, "loss": 0.015, "step": 355480 }, { "epoch": 0.92, "learning_rate": 0.00016177779621080353, "loss": 0.0158, "step": 355490 }, { "epoch": 0.92, "learning_rate": 0.00016177390799443204, "loss": 0.0152, "step": 355500 }, { "epoch": 0.92, "learning_rate": 0.0001617700197780606, "loss": 0.0135, "step": 355510 }, { "epoch": 0.92, "learning_rate": 0.00016176613156168915, "loss": 0.0104, "step": 355520 }, { "epoch": 0.92, "learning_rate": 0.00016176224334531767, "loss": 0.0118, "step": 355530 }, { "epoch": 0.92, "learning_rate": 0.00016175835512894618, "loss": 0.0156, "step": 355540 }, { "epoch": 0.92, "learning_rate": 0.00016175446691257472, "loss": 0.0143, "step": 355550 }, { "epoch": 0.92, "learning_rate": 0.0001617505786962033, "loss": 0.0153, "step": 355560 }, { "epoch": 0.92, "learning_rate": 0.0001617466904798318, "loss": 0.0164, "step": 355570 }, { "epoch": 0.92, "learning_rate": 0.00016174280226346035, "loss": 0.0132, "step": 355580 }, { "epoch": 0.92, "learning_rate": 0.00016173891404708886, "loss": 0.0148, "step": 355590 }, { "epoch": 0.92, "learning_rate": 0.00016173502583071743, "loss": 0.0115, "step": 355600 }, { "epoch": 0.92, "learning_rate": 0.00016173113761434594, "loss": 0.0105, "step": 355610 }, { "epoch": 0.92, "learning_rate": 0.00016172724939797449, "loss": 0.0128, "step": 355620 }, { "epoch": 0.92, "learning_rate": 0.000161723361181603, "loss": 0.0136, "step": 355630 }, { "epoch": 0.92, "learning_rate": 0.00016171947296523157, "loss": 0.013, "step": 355640 }, { "epoch": 0.92, "learning_rate": 0.00016171558474886008, "loss": 0.0126, "step": 355650 }, { "epoch": 0.92, "learning_rate": 0.00016171169653248863, "loss": 0.0146, "step": 355660 }, { "epoch": 0.92, "learning_rate": 0.00016170780831611714, "loss": 0.0101, "step": 355670 }, { "epoch": 0.92, "learning_rate": 0.0001617039200997457, "loss": 0.0146, "step": 355680 }, { "epoch": 0.92, "learning_rate": 0.00016170003188337425, "loss": 0.0143, "step": 355690 }, { "epoch": 0.92, "learning_rate": 0.00016169614366700276, "loss": 0.014, "step": 355700 }, { "epoch": 0.92, "learning_rate": 0.00016169225545063128, "loss": 0.0133, "step": 355710 }, { "epoch": 0.92, "learning_rate": 0.00016168836723425985, "loss": 0.0122, "step": 355720 }, { "epoch": 0.92, "learning_rate": 0.0001616844790178884, "loss": 0.0131, "step": 355730 }, { "epoch": 0.92, "learning_rate": 0.0001616805908015169, "loss": 0.0109, "step": 355740 }, { "epoch": 0.92, "learning_rate": 0.00016167670258514545, "loss": 0.0131, "step": 355750 }, { "epoch": 0.92, "learning_rate": 0.000161672814368774, "loss": 0.0121, "step": 355760 }, { "epoch": 0.92, "learning_rate": 0.00016166892615240253, "loss": 0.0123, "step": 355770 }, { "epoch": 0.92, "learning_rate": 0.00016166503793603104, "loss": 0.0149, "step": 355780 }, { "epoch": 0.92, "learning_rate": 0.00016166114971965959, "loss": 0.0147, "step": 355790 }, { "epoch": 0.92, "learning_rate": 0.0001616572615032881, "loss": 0.0123, "step": 355800 }, { "epoch": 0.92, "learning_rate": 0.00016165337328691667, "loss": 0.0111, "step": 355810 }, { "epoch": 0.92, "learning_rate": 0.00016164948507054518, "loss": 0.012, "step": 355820 }, { "epoch": 0.92, "learning_rate": 0.00016164559685417372, "loss": 0.0122, "step": 355830 }, { "epoch": 0.92, "learning_rate": 0.00016164170863780224, "loss": 0.0148, "step": 355840 }, { "epoch": 0.92, "learning_rate": 0.0001616378204214308, "loss": 0.0149, "step": 355850 }, { "epoch": 0.92, "learning_rate": 0.00016163393220505932, "loss": 0.011, "step": 355860 }, { "epoch": 0.92, "learning_rate": 0.00016163004398868786, "loss": 0.0142, "step": 355870 }, { "epoch": 0.92, "learning_rate": 0.00016162615577231638, "loss": 0.0138, "step": 355880 }, { "epoch": 0.92, "learning_rate": 0.00016162226755594495, "loss": 0.0164, "step": 355890 }, { "epoch": 0.92, "learning_rate": 0.0001616183793395735, "loss": 0.0146, "step": 355900 }, { "epoch": 0.92, "learning_rate": 0.000161614491123202, "loss": 0.0126, "step": 355910 }, { "epoch": 0.92, "learning_rate": 0.00016161060290683055, "loss": 0.0131, "step": 355920 }, { "epoch": 0.92, "learning_rate": 0.0001616067146904591, "loss": 0.0144, "step": 355930 }, { "epoch": 0.92, "learning_rate": 0.00016160282647408763, "loss": 0.0118, "step": 355940 }, { "epoch": 0.92, "learning_rate": 0.00016159893825771614, "loss": 0.0135, "step": 355950 }, { "epoch": 0.92, "learning_rate": 0.00016159505004134468, "loss": 0.0165, "step": 355960 }, { "epoch": 0.92, "learning_rate": 0.00016159116182497323, "loss": 0.0143, "step": 355970 }, { "epoch": 0.92, "learning_rate": 0.00016158727360860177, "loss": 0.0174, "step": 355980 }, { "epoch": 0.92, "learning_rate": 0.00016158338539223028, "loss": 0.0144, "step": 355990 }, { "epoch": 0.92, "learning_rate": 0.00016157949717585882, "loss": 0.0134, "step": 356000 }, { "epoch": 0.92, "eval_cer": 0.8817866645392185, "eval_loss": 0.008485401049256325, "eval_runtime": 107.1956, "eval_samples_per_second": 18.657, "eval_steps_per_second": 4.664, "step": 356000 }, { "epoch": 0.92, "learning_rate": 0.00016157560895948737, "loss": 0.0088, "step": 356010 }, { "epoch": 0.92, "learning_rate": 0.0001615717207431159, "loss": 0.0102, "step": 356020 }, { "epoch": 0.92, "learning_rate": 0.00016156783252674442, "loss": 0.0121, "step": 356030 }, { "epoch": 0.92, "learning_rate": 0.00016156394431037296, "loss": 0.0107, "step": 356040 }, { "epoch": 0.92, "learning_rate": 0.00016156005609400148, "loss": 0.014, "step": 356050 }, { "epoch": 0.92, "learning_rate": 0.00016155616787763005, "loss": 0.0128, "step": 356060 }, { "epoch": 0.92, "learning_rate": 0.0001615522796612586, "loss": 0.0145, "step": 356070 }, { "epoch": 0.92, "learning_rate": 0.0001615483914448871, "loss": 0.0113, "step": 356080 }, { "epoch": 0.92, "learning_rate": 0.00016154450322851564, "loss": 0.0111, "step": 356090 }, { "epoch": 0.92, "learning_rate": 0.0001615406150121442, "loss": 0.0108, "step": 356100 }, { "epoch": 0.92, "learning_rate": 0.00016153672679577273, "loss": 0.0139, "step": 356110 }, { "epoch": 0.92, "learning_rate": 0.00016153283857940124, "loss": 0.013, "step": 356120 }, { "epoch": 0.92, "learning_rate": 0.00016152895036302978, "loss": 0.0129, "step": 356130 }, { "epoch": 0.92, "learning_rate": 0.00016152506214665833, "loss": 0.014, "step": 356140 }, { "epoch": 0.92, "learning_rate": 0.00016152117393028687, "loss": 0.0145, "step": 356150 }, { "epoch": 0.92, "learning_rate": 0.00016151728571391538, "loss": 0.0112, "step": 356160 }, { "epoch": 0.92, "learning_rate": 0.00016151339749754392, "loss": 0.0135, "step": 356170 }, { "epoch": 0.92, "learning_rate": 0.00016150950928117247, "loss": 0.0147, "step": 356180 }, { "epoch": 0.92, "learning_rate": 0.000161505621064801, "loss": 0.0162, "step": 356190 }, { "epoch": 0.92, "learning_rate": 0.00016150173284842952, "loss": 0.0141, "step": 356200 }, { "epoch": 0.92, "learning_rate": 0.00016149784463205806, "loss": 0.0155, "step": 356210 }, { "epoch": 0.92, "learning_rate": 0.00016149395641568663, "loss": 0.0152, "step": 356220 }, { "epoch": 0.92, "learning_rate": 0.00016149006819931515, "loss": 0.0137, "step": 356230 }, { "epoch": 0.92, "learning_rate": 0.0001614861799829437, "loss": 0.0111, "step": 356240 }, { "epoch": 0.92, "learning_rate": 0.0001614822917665722, "loss": 0.0192, "step": 356250 }, { "epoch": 0.92, "learning_rate": 0.00016147840355020077, "loss": 0.0119, "step": 356260 }, { "epoch": 0.92, "learning_rate": 0.00016147451533382929, "loss": 0.0128, "step": 356270 }, { "epoch": 0.92, "learning_rate": 0.00016147062711745783, "loss": 0.0092, "step": 356280 }, { "epoch": 0.92, "learning_rate": 0.00016146673890108634, "loss": 0.0122, "step": 356290 }, { "epoch": 0.92, "learning_rate": 0.00016146285068471488, "loss": 0.0162, "step": 356300 }, { "epoch": 0.92, "learning_rate": 0.00016145896246834343, "loss": 0.0155, "step": 356310 }, { "epoch": 0.92, "learning_rate": 0.00016145507425197197, "loss": 0.0152, "step": 356320 }, { "epoch": 0.92, "learning_rate": 0.00016145118603560048, "loss": 0.011, "step": 356330 }, { "epoch": 0.92, "learning_rate": 0.00016144729781922902, "loss": 0.0124, "step": 356340 }, { "epoch": 0.92, "learning_rate": 0.00016144340960285756, "loss": 0.0136, "step": 356350 }, { "epoch": 0.92, "learning_rate": 0.0001614395213864861, "loss": 0.0117, "step": 356360 }, { "epoch": 0.92, "learning_rate": 0.00016143563317011462, "loss": 0.0131, "step": 356370 }, { "epoch": 0.92, "learning_rate": 0.00016143174495374316, "loss": 0.0122, "step": 356380 }, { "epoch": 0.92, "learning_rate": 0.00016142785673737173, "loss": 0.0122, "step": 356390 }, { "epoch": 0.92, "learning_rate": 0.00016142396852100025, "loss": 0.0112, "step": 356400 }, { "epoch": 0.92, "learning_rate": 0.00016142008030462876, "loss": 0.0181, "step": 356410 }, { "epoch": 0.92, "learning_rate": 0.0001614161920882573, "loss": 0.011, "step": 356420 }, { "epoch": 0.92, "learning_rate": 0.00016141230387188587, "loss": 0.0125, "step": 356430 }, { "epoch": 0.92, "learning_rate": 0.00016140841565551439, "loss": 0.0095, "step": 356440 }, { "epoch": 0.92, "learning_rate": 0.00016140452743914293, "loss": 0.014, "step": 356450 }, { "epoch": 0.92, "learning_rate": 0.00016140063922277144, "loss": 0.0138, "step": 356460 }, { "epoch": 0.92, "learning_rate": 0.0001613967510064, "loss": 0.0123, "step": 356470 }, { "epoch": 0.92, "learning_rate": 0.00016139286279002852, "loss": 0.0144, "step": 356480 }, { "epoch": 0.92, "learning_rate": 0.00016138897457365707, "loss": 0.013, "step": 356490 }, { "epoch": 0.92, "learning_rate": 0.00016138508635728558, "loss": 0.0127, "step": 356500 }, { "epoch": 0.92, "learning_rate": 0.00016138119814091415, "loss": 0.0125, "step": 356510 }, { "epoch": 0.92, "learning_rate": 0.00016137730992454266, "loss": 0.0116, "step": 356520 }, { "epoch": 0.92, "learning_rate": 0.0001613734217081712, "loss": 0.014, "step": 356530 }, { "epoch": 0.92, "learning_rate": 0.00016136953349179972, "loss": 0.0114, "step": 356540 }, { "epoch": 0.92, "learning_rate": 0.00016136564527542826, "loss": 0.0116, "step": 356550 }, { "epoch": 0.92, "learning_rate": 0.00016136175705905683, "loss": 0.0134, "step": 356560 }, { "epoch": 0.92, "learning_rate": 0.00016135786884268535, "loss": 0.0133, "step": 356570 }, { "epoch": 0.92, "learning_rate": 0.00016135398062631386, "loss": 0.0159, "step": 356580 }, { "epoch": 0.92, "learning_rate": 0.0001613500924099424, "loss": 0.0167, "step": 356590 }, { "epoch": 0.92, "learning_rate": 0.00016134620419357097, "loss": 0.011, "step": 356600 }, { "epoch": 0.92, "learning_rate": 0.00016134231597719948, "loss": 0.0139, "step": 356610 }, { "epoch": 0.92, "learning_rate": 0.00016133842776082803, "loss": 0.0125, "step": 356620 }, { "epoch": 0.92, "learning_rate": 0.00016133453954445654, "loss": 0.0137, "step": 356630 }, { "epoch": 0.92, "learning_rate": 0.0001613306513280851, "loss": 0.0111, "step": 356640 }, { "epoch": 0.92, "learning_rate": 0.00016132676311171362, "loss": 0.0158, "step": 356650 }, { "epoch": 0.92, "learning_rate": 0.00016132287489534217, "loss": 0.0134, "step": 356660 }, { "epoch": 0.92, "learning_rate": 0.00016131898667897068, "loss": 0.0137, "step": 356670 }, { "epoch": 0.92, "learning_rate": 0.00016131509846259925, "loss": 0.0145, "step": 356680 }, { "epoch": 0.92, "learning_rate": 0.00016131121024622776, "loss": 0.0143, "step": 356690 }, { "epoch": 0.92, "learning_rate": 0.0001613073220298563, "loss": 0.0128, "step": 356700 }, { "epoch": 0.92, "learning_rate": 0.00016130343381348482, "loss": 0.0098, "step": 356710 }, { "epoch": 0.92, "learning_rate": 0.0001612995455971134, "loss": 0.01, "step": 356720 }, { "epoch": 0.92, "learning_rate": 0.0001612956573807419, "loss": 0.014, "step": 356730 }, { "epoch": 0.92, "learning_rate": 0.00016129176916437044, "loss": 0.0142, "step": 356740 }, { "epoch": 0.92, "learning_rate": 0.00016128788094799896, "loss": 0.0126, "step": 356750 }, { "epoch": 0.92, "learning_rate": 0.00016128399273162753, "loss": 0.0134, "step": 356760 }, { "epoch": 0.92, "learning_rate": 0.00016128010451525607, "loss": 0.0101, "step": 356770 }, { "epoch": 0.92, "learning_rate": 0.00016127621629888458, "loss": 0.0123, "step": 356780 }, { "epoch": 0.92, "learning_rate": 0.00016127232808251313, "loss": 0.0186, "step": 356790 }, { "epoch": 0.92, "learning_rate": 0.00016126843986614164, "loss": 0.0096, "step": 356800 }, { "epoch": 0.92, "learning_rate": 0.0001612645516497702, "loss": 0.0115, "step": 356810 }, { "epoch": 0.92, "learning_rate": 0.00016126066343339872, "loss": 0.0134, "step": 356820 }, { "epoch": 0.92, "learning_rate": 0.00016125677521702727, "loss": 0.0126, "step": 356830 }, { "epoch": 0.92, "learning_rate": 0.00016125288700065578, "loss": 0.0112, "step": 356840 }, { "epoch": 0.93, "learning_rate": 0.00016124899878428435, "loss": 0.0135, "step": 356850 }, { "epoch": 0.93, "learning_rate": 0.00016124511056791286, "loss": 0.013, "step": 356860 }, { "epoch": 0.93, "learning_rate": 0.0001612412223515414, "loss": 0.0126, "step": 356870 }, { "epoch": 0.93, "learning_rate": 0.00016123733413516992, "loss": 0.0109, "step": 356880 }, { "epoch": 0.93, "learning_rate": 0.0001612334459187985, "loss": 0.0139, "step": 356890 }, { "epoch": 0.93, "learning_rate": 0.000161229557702427, "loss": 0.0138, "step": 356900 }, { "epoch": 0.93, "learning_rate": 0.00016122566948605554, "loss": 0.0122, "step": 356910 }, { "epoch": 0.93, "learning_rate": 0.00016122178126968406, "loss": 0.0124, "step": 356920 }, { "epoch": 0.93, "learning_rate": 0.00016121789305331263, "loss": 0.0132, "step": 356930 }, { "epoch": 0.93, "learning_rate": 0.00016121400483694117, "loss": 0.0147, "step": 356940 }, { "epoch": 0.93, "learning_rate": 0.00016121011662056968, "loss": 0.0121, "step": 356950 }, { "epoch": 0.93, "learning_rate": 0.00016120622840419823, "loss": 0.0113, "step": 356960 }, { "epoch": 0.93, "learning_rate": 0.00016120234018782677, "loss": 0.0105, "step": 356970 }, { "epoch": 0.93, "learning_rate": 0.0001611984519714553, "loss": 0.0153, "step": 356980 }, { "epoch": 0.93, "learning_rate": 0.00016119456375508382, "loss": 0.0111, "step": 356990 }, { "epoch": 0.93, "learning_rate": 0.00016119067553871236, "loss": 0.0144, "step": 357000 }, { "epoch": 0.93, "eval_cer": 0.8817502739789299, "eval_loss": 0.00885064247995615, "eval_runtime": 107.1821, "eval_samples_per_second": 18.66, "eval_steps_per_second": 4.665, "step": 357000 }, { "epoch": 0.93, "learning_rate": 0.0001611867873223409, "loss": 0.015, "step": 357010 }, { "epoch": 0.93, "learning_rate": 0.00016118289910596945, "loss": 0.0115, "step": 357020 }, { "epoch": 0.93, "learning_rate": 0.00016117901088959796, "loss": 0.0103, "step": 357030 }, { "epoch": 0.93, "learning_rate": 0.0001611751226732265, "loss": 0.0141, "step": 357040 }, { "epoch": 0.93, "learning_rate": 0.00016117123445685502, "loss": 0.0122, "step": 357050 }, { "epoch": 0.93, "learning_rate": 0.0001611673462404836, "loss": 0.0134, "step": 357060 }, { "epoch": 0.93, "learning_rate": 0.0001611634580241121, "loss": 0.0108, "step": 357070 }, { "epoch": 0.93, "learning_rate": 0.00016115956980774064, "loss": 0.0118, "step": 357080 }, { "epoch": 0.93, "learning_rate": 0.00016115568159136916, "loss": 0.015, "step": 357090 }, { "epoch": 0.93, "learning_rate": 0.00016115179337499773, "loss": 0.0163, "step": 357100 }, { "epoch": 0.93, "learning_rate": 0.00016114790515862627, "loss": 0.0101, "step": 357110 }, { "epoch": 0.93, "learning_rate": 0.00016114401694225478, "loss": 0.0138, "step": 357120 }, { "epoch": 0.93, "learning_rate": 0.0001611401287258833, "loss": 0.0149, "step": 357130 }, { "epoch": 0.93, "learning_rate": 0.00016113624050951187, "loss": 0.013, "step": 357140 }, { "epoch": 0.93, "learning_rate": 0.0001611323522931404, "loss": 0.0141, "step": 357150 }, { "epoch": 0.93, "learning_rate": 0.00016112846407676892, "loss": 0.0136, "step": 357160 }, { "epoch": 0.93, "learning_rate": 0.00016112457586039746, "loss": 0.0116, "step": 357170 }, { "epoch": 0.93, "learning_rate": 0.000161120687644026, "loss": 0.0158, "step": 357180 }, { "epoch": 0.93, "learning_rate": 0.00016111679942765455, "loss": 0.0154, "step": 357190 }, { "epoch": 0.93, "learning_rate": 0.00016111291121128306, "loss": 0.012, "step": 357200 }, { "epoch": 0.93, "learning_rate": 0.0001611090229949116, "loss": 0.0133, "step": 357210 }, { "epoch": 0.93, "learning_rate": 0.00016110513477854015, "loss": 0.0161, "step": 357220 }, { "epoch": 0.93, "learning_rate": 0.0001611012465621687, "loss": 0.0135, "step": 357230 }, { "epoch": 0.93, "learning_rate": 0.0001610973583457972, "loss": 0.0123, "step": 357240 }, { "epoch": 0.93, "learning_rate": 0.00016109347012942574, "loss": 0.0135, "step": 357250 }, { "epoch": 0.93, "learning_rate": 0.0001610895819130543, "loss": 0.0166, "step": 357260 }, { "epoch": 0.93, "learning_rate": 0.00016108569369668283, "loss": 0.0126, "step": 357270 }, { "epoch": 0.93, "learning_rate": 0.00016108180548031137, "loss": 0.0111, "step": 357280 }, { "epoch": 0.93, "learning_rate": 0.00016107791726393988, "loss": 0.0132, "step": 357290 }, { "epoch": 0.93, "learning_rate": 0.0001610740290475684, "loss": 0.0121, "step": 357300 }, { "epoch": 0.93, "learning_rate": 0.00016107014083119697, "loss": 0.0116, "step": 357310 }, { "epoch": 0.93, "learning_rate": 0.0001610662526148255, "loss": 0.0136, "step": 357320 }, { "epoch": 0.93, "learning_rate": 0.00016106236439845402, "loss": 0.0142, "step": 357330 }, { "epoch": 0.93, "learning_rate": 0.00016105847618208256, "loss": 0.0142, "step": 357340 }, { "epoch": 0.93, "learning_rate": 0.0001610545879657111, "loss": 0.0157, "step": 357350 }, { "epoch": 0.93, "learning_rate": 0.00016105069974933965, "loss": 0.0148, "step": 357360 }, { "epoch": 0.93, "learning_rate": 0.00016104681153296816, "loss": 0.0173, "step": 357370 }, { "epoch": 0.93, "learning_rate": 0.0001610429233165967, "loss": 0.0139, "step": 357380 }, { "epoch": 0.93, "learning_rate": 0.00016103903510022524, "loss": 0.0114, "step": 357390 }, { "epoch": 0.93, "learning_rate": 0.00016103514688385379, "loss": 0.014, "step": 357400 }, { "epoch": 0.93, "learning_rate": 0.0001610312586674823, "loss": 0.0187, "step": 357410 }, { "epoch": 0.93, "learning_rate": 0.00016102737045111084, "loss": 0.015, "step": 357420 }, { "epoch": 0.93, "learning_rate": 0.0001610234822347394, "loss": 0.0138, "step": 357430 }, { "epoch": 0.93, "learning_rate": 0.00016101959401836793, "loss": 0.0131, "step": 357440 }, { "epoch": 0.93, "learning_rate": 0.00016101570580199644, "loss": 0.0116, "step": 357450 }, { "epoch": 0.93, "learning_rate": 0.00016101181758562498, "loss": 0.0134, "step": 357460 }, { "epoch": 0.93, "learning_rate": 0.00016100792936925355, "loss": 0.0096, "step": 357470 }, { "epoch": 0.93, "learning_rate": 0.00016100404115288207, "loss": 0.0132, "step": 357480 }, { "epoch": 0.93, "learning_rate": 0.0001610001529365106, "loss": 0.0159, "step": 357490 }, { "epoch": 0.93, "learning_rate": 0.00016099626472013912, "loss": 0.0127, "step": 357500 }, { "epoch": 0.93, "learning_rate": 0.0001609923765037677, "loss": 0.0107, "step": 357510 }, { "epoch": 0.93, "learning_rate": 0.0001609884882873962, "loss": 0.0101, "step": 357520 }, { "epoch": 0.93, "learning_rate": 0.00016098460007102475, "loss": 0.0113, "step": 357530 }, { "epoch": 0.93, "learning_rate": 0.00016098071185465326, "loss": 0.0164, "step": 357540 }, { "epoch": 0.93, "learning_rate": 0.0001609768236382818, "loss": 0.0089, "step": 357550 }, { "epoch": 0.93, "learning_rate": 0.00016097293542191034, "loss": 0.012, "step": 357560 }, { "epoch": 0.93, "learning_rate": 0.00016096904720553889, "loss": 0.0131, "step": 357570 }, { "epoch": 0.93, "learning_rate": 0.0001609651589891674, "loss": 0.0111, "step": 357580 }, { "epoch": 0.93, "learning_rate": 0.00016096127077279594, "loss": 0.0162, "step": 357590 }, { "epoch": 0.93, "learning_rate": 0.00016095738255642448, "loss": 0.0109, "step": 357600 }, { "epoch": 0.93, "learning_rate": 0.00016095349434005303, "loss": 0.0124, "step": 357610 }, { "epoch": 0.93, "learning_rate": 0.00016094960612368154, "loss": 0.0131, "step": 357620 }, { "epoch": 0.93, "learning_rate": 0.00016094571790731008, "loss": 0.0114, "step": 357630 }, { "epoch": 0.93, "learning_rate": 0.00016094182969093865, "loss": 0.0118, "step": 357640 }, { "epoch": 0.93, "learning_rate": 0.00016093794147456716, "loss": 0.0127, "step": 357650 }, { "epoch": 0.93, "learning_rate": 0.0001609340532581957, "loss": 0.0105, "step": 357660 }, { "epoch": 0.93, "learning_rate": 0.00016093016504182422, "loss": 0.0109, "step": 357670 }, { "epoch": 0.93, "learning_rate": 0.0001609262768254528, "loss": 0.0103, "step": 357680 }, { "epoch": 0.93, "learning_rate": 0.0001609223886090813, "loss": 0.0132, "step": 357690 }, { "epoch": 0.93, "learning_rate": 0.00016091850039270985, "loss": 0.0135, "step": 357700 }, { "epoch": 0.93, "learning_rate": 0.00016091461217633836, "loss": 0.0124, "step": 357710 }, { "epoch": 0.93, "learning_rate": 0.00016091072395996693, "loss": 0.0121, "step": 357720 }, { "epoch": 0.93, "learning_rate": 0.00016090683574359544, "loss": 0.0166, "step": 357730 }, { "epoch": 0.93, "learning_rate": 0.00016090294752722399, "loss": 0.0168, "step": 357740 }, { "epoch": 0.93, "learning_rate": 0.0001608990593108525, "loss": 0.0114, "step": 357750 }, { "epoch": 0.93, "learning_rate": 0.00016089517109448107, "loss": 0.014, "step": 357760 }, { "epoch": 0.93, "learning_rate": 0.00016089128287810958, "loss": 0.0179, "step": 357770 }, { "epoch": 0.93, "learning_rate": 0.00016088739466173812, "loss": 0.0119, "step": 357780 }, { "epoch": 0.93, "learning_rate": 0.00016088350644536664, "loss": 0.013, "step": 357790 }, { "epoch": 0.93, "learning_rate": 0.00016087961822899518, "loss": 0.0103, "step": 357800 }, { "epoch": 0.93, "learning_rate": 0.00016087573001262375, "loss": 0.0162, "step": 357810 }, { "epoch": 0.93, "learning_rate": 0.00016087184179625226, "loss": 0.0127, "step": 357820 }, { "epoch": 0.93, "learning_rate": 0.0001608679535798808, "loss": 0.0128, "step": 357830 }, { "epoch": 0.93, "learning_rate": 0.00016086406536350932, "loss": 0.0129, "step": 357840 }, { "epoch": 0.93, "learning_rate": 0.0001608601771471379, "loss": 0.0133, "step": 357850 }, { "epoch": 0.93, "learning_rate": 0.0001608562889307664, "loss": 0.0147, "step": 357860 }, { "epoch": 0.93, "learning_rate": 0.00016085240071439495, "loss": 0.0126, "step": 357870 }, { "epoch": 0.93, "learning_rate": 0.00016084851249802346, "loss": 0.0151, "step": 357880 }, { "epoch": 0.93, "learning_rate": 0.00016084462428165203, "loss": 0.0101, "step": 357890 }, { "epoch": 0.93, "learning_rate": 0.00016084073606528054, "loss": 0.0136, "step": 357900 }, { "epoch": 0.93, "learning_rate": 0.00016083684784890908, "loss": 0.0187, "step": 357910 }, { "epoch": 0.93, "learning_rate": 0.0001608329596325376, "loss": 0.0147, "step": 357920 }, { "epoch": 0.93, "learning_rate": 0.00016082907141616617, "loss": 0.0147, "step": 357930 }, { "epoch": 0.93, "learning_rate": 0.00016082518319979468, "loss": 0.0133, "step": 357940 }, { "epoch": 0.93, "learning_rate": 0.00016082129498342322, "loss": 0.0143, "step": 357950 }, { "epoch": 0.93, "learning_rate": 0.00016081740676705174, "loss": 0.0129, "step": 357960 }, { "epoch": 0.93, "learning_rate": 0.0001608135185506803, "loss": 0.0101, "step": 357970 }, { "epoch": 0.93, "learning_rate": 0.00016080963033430885, "loss": 0.0133, "step": 357980 }, { "epoch": 0.93, "learning_rate": 0.00016080574211793736, "loss": 0.012, "step": 357990 }, { "epoch": 0.93, "learning_rate": 0.00016080185390156588, "loss": 0.0095, "step": 358000 }, { "epoch": 0.93, "eval_cer": 0.8817642703482717, "eval_loss": 0.008927177637815475, "eval_runtime": 107.5563, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 358000 }, { "epoch": 0.93, "learning_rate": 0.00016079796568519445, "loss": 0.0095, "step": 358010 }, { "epoch": 0.93, "learning_rate": 0.000160794077468823, "loss": 0.0112, "step": 358020 }, { "epoch": 0.93, "learning_rate": 0.0001607901892524515, "loss": 0.01, "step": 358030 }, { "epoch": 0.93, "learning_rate": 0.00016078630103608004, "loss": 0.0125, "step": 358040 }, { "epoch": 0.93, "learning_rate": 0.00016078241281970856, "loss": 0.0134, "step": 358050 }, { "epoch": 0.93, "learning_rate": 0.00016077852460333713, "loss": 0.015, "step": 358060 }, { "epoch": 0.93, "learning_rate": 0.00016077463638696564, "loss": 0.0113, "step": 358070 }, { "epoch": 0.93, "learning_rate": 0.00016077074817059418, "loss": 0.013, "step": 358080 }, { "epoch": 0.93, "learning_rate": 0.0001607668599542227, "loss": 0.0105, "step": 358090 }, { "epoch": 0.93, "learning_rate": 0.00016076297173785127, "loss": 0.012, "step": 358100 }, { "epoch": 0.93, "learning_rate": 0.00016075908352147978, "loss": 0.0129, "step": 358110 }, { "epoch": 0.93, "learning_rate": 0.00016075519530510832, "loss": 0.0113, "step": 358120 }, { "epoch": 0.93, "learning_rate": 0.00016075130708873684, "loss": 0.0114, "step": 358130 }, { "epoch": 0.93, "learning_rate": 0.0001607474188723654, "loss": 0.0146, "step": 358140 }, { "epoch": 0.93, "learning_rate": 0.00016074353065599395, "loss": 0.0135, "step": 358150 }, { "epoch": 0.93, "learning_rate": 0.00016073964243962246, "loss": 0.0132, "step": 358160 }, { "epoch": 0.93, "learning_rate": 0.00016073575422325098, "loss": 0.0162, "step": 358170 }, { "epoch": 0.93, "learning_rate": 0.00016073186600687955, "loss": 0.0136, "step": 358180 }, { "epoch": 0.93, "learning_rate": 0.0001607279777905081, "loss": 0.0139, "step": 358190 }, { "epoch": 0.93, "learning_rate": 0.0001607240895741366, "loss": 0.0115, "step": 358200 }, { "epoch": 0.93, "learning_rate": 0.00016072020135776514, "loss": 0.0126, "step": 358210 }, { "epoch": 0.93, "learning_rate": 0.00016071631314139369, "loss": 0.0143, "step": 358220 }, { "epoch": 0.93, "learning_rate": 0.00016071242492502223, "loss": 0.0112, "step": 358230 }, { "epoch": 0.93, "learning_rate": 0.00016070853670865074, "loss": 0.0115, "step": 358240 }, { "epoch": 0.93, "learning_rate": 0.00016070464849227928, "loss": 0.0125, "step": 358250 }, { "epoch": 0.93, "learning_rate": 0.00016070076027590783, "loss": 0.0158, "step": 358260 }, { "epoch": 0.93, "learning_rate": 0.00016069687205953637, "loss": 0.0132, "step": 358270 }, { "epoch": 0.93, "learning_rate": 0.00016069298384316488, "loss": 0.0114, "step": 358280 }, { "epoch": 0.93, "learning_rate": 0.00016068909562679342, "loss": 0.0124, "step": 358290 }, { "epoch": 0.93, "learning_rate": 0.00016068520741042194, "loss": 0.0133, "step": 358300 }, { "epoch": 0.93, "learning_rate": 0.0001606813191940505, "loss": 0.0114, "step": 358310 }, { "epoch": 0.93, "learning_rate": 0.00016067743097767902, "loss": 0.0123, "step": 358320 }, { "epoch": 0.93, "learning_rate": 0.00016067354276130756, "loss": 0.0141, "step": 358330 }, { "epoch": 0.93, "learning_rate": 0.00016066965454493608, "loss": 0.0102, "step": 358340 }, { "epoch": 0.93, "learning_rate": 0.00016066576632856465, "loss": 0.0156, "step": 358350 }, { "epoch": 0.93, "learning_rate": 0.0001606618781121932, "loss": 0.013, "step": 358360 }, { "epoch": 0.93, "learning_rate": 0.0001606579898958217, "loss": 0.0217, "step": 358370 }, { "epoch": 0.93, "learning_rate": 0.00016065410167945024, "loss": 0.0167, "step": 358380 }, { "epoch": 0.93, "learning_rate": 0.00016065021346307878, "loss": 0.0123, "step": 358390 }, { "epoch": 0.93, "learning_rate": 0.00016064632524670733, "loss": 0.0099, "step": 358400 }, { "epoch": 0.93, "learning_rate": 0.00016064243703033584, "loss": 0.0133, "step": 358410 }, { "epoch": 0.93, "learning_rate": 0.00016063854881396438, "loss": 0.0134, "step": 358420 }, { "epoch": 0.93, "learning_rate": 0.00016063466059759292, "loss": 0.0125, "step": 358430 }, { "epoch": 0.93, "learning_rate": 0.00016063077238122147, "loss": 0.0113, "step": 358440 }, { "epoch": 0.93, "learning_rate": 0.00016062688416484998, "loss": 0.0135, "step": 358450 }, { "epoch": 0.93, "learning_rate": 0.00016062299594847852, "loss": 0.0128, "step": 358460 }, { "epoch": 0.93, "learning_rate": 0.00016061910773210706, "loss": 0.0109, "step": 358470 }, { "epoch": 0.93, "learning_rate": 0.0001606152195157356, "loss": 0.0161, "step": 358480 }, { "epoch": 0.93, "learning_rate": 0.00016061133129936412, "loss": 0.0134, "step": 358490 }, { "epoch": 0.93, "learning_rate": 0.00016060744308299266, "loss": 0.0147, "step": 358500 }, { "epoch": 0.93, "learning_rate": 0.00016060355486662123, "loss": 0.0138, "step": 358510 }, { "epoch": 0.93, "learning_rate": 0.00016059966665024974, "loss": 0.0176, "step": 358520 }, { "epoch": 0.93, "learning_rate": 0.0001605957784338783, "loss": 0.0138, "step": 358530 }, { "epoch": 0.93, "learning_rate": 0.0001605918902175068, "loss": 0.0121, "step": 358540 }, { "epoch": 0.93, "learning_rate": 0.00016058800200113534, "loss": 0.0113, "step": 358550 }, { "epoch": 0.93, "learning_rate": 0.00016058411378476388, "loss": 0.0141, "step": 358560 }, { "epoch": 0.93, "learning_rate": 0.00016058022556839243, "loss": 0.011, "step": 358570 }, { "epoch": 0.93, "learning_rate": 0.00016057633735202094, "loss": 0.0112, "step": 358580 }, { "epoch": 0.93, "learning_rate": 0.00016057244913564948, "loss": 0.0109, "step": 358590 }, { "epoch": 0.93, "learning_rate": 0.00016056856091927802, "loss": 0.0105, "step": 358600 }, { "epoch": 0.93, "learning_rate": 0.00016056467270290657, "loss": 0.0111, "step": 358610 }, { "epoch": 0.93, "learning_rate": 0.00016056078448653508, "loss": 0.0109, "step": 358620 }, { "epoch": 0.93, "learning_rate": 0.00016055689627016362, "loss": 0.0127, "step": 358630 }, { "epoch": 0.93, "learning_rate": 0.00016055300805379216, "loss": 0.0119, "step": 358640 }, { "epoch": 0.93, "learning_rate": 0.0001605491198374207, "loss": 0.0124, "step": 358650 }, { "epoch": 0.93, "learning_rate": 0.00016054523162104922, "loss": 0.0147, "step": 358660 }, { "epoch": 0.93, "learning_rate": 0.00016054134340467776, "loss": 0.0149, "step": 358670 }, { "epoch": 0.93, "learning_rate": 0.00016053745518830633, "loss": 0.0146, "step": 358680 }, { "epoch": 0.93, "learning_rate": 0.00016053356697193484, "loss": 0.0145, "step": 358690 }, { "epoch": 0.93, "learning_rate": 0.00016052967875556339, "loss": 0.0137, "step": 358700 }, { "epoch": 0.93, "learning_rate": 0.0001605257905391919, "loss": 0.0142, "step": 358710 }, { "epoch": 0.93, "learning_rate": 0.00016052190232282047, "loss": 0.0129, "step": 358720 }, { "epoch": 0.93, "learning_rate": 0.00016051801410644898, "loss": 0.0149, "step": 358730 }, { "epoch": 0.93, "learning_rate": 0.00016051412589007753, "loss": 0.0145, "step": 358740 }, { "epoch": 0.93, "learning_rate": 0.00016051023767370604, "loss": 0.0132, "step": 358750 }, { "epoch": 0.93, "learning_rate": 0.0001605063494573346, "loss": 0.0153, "step": 358760 }, { "epoch": 0.93, "learning_rate": 0.00016050246124096312, "loss": 0.0158, "step": 358770 }, { "epoch": 0.93, "learning_rate": 0.00016049857302459166, "loss": 0.0142, "step": 358780 }, { "epoch": 0.93, "learning_rate": 0.00016049468480822018, "loss": 0.0132, "step": 358790 }, { "epoch": 0.93, "learning_rate": 0.00016049079659184872, "loss": 0.0148, "step": 358800 }, { "epoch": 0.93, "learning_rate": 0.00016048690837547726, "loss": 0.0127, "step": 358810 }, { "epoch": 0.93, "learning_rate": 0.0001604830201591058, "loss": 0.0158, "step": 358820 }, { "epoch": 0.93, "learning_rate": 0.00016047913194273432, "loss": 0.0189, "step": 358830 }, { "epoch": 0.93, "learning_rate": 0.00016047524372636286, "loss": 0.013, "step": 358840 }, { "epoch": 0.93, "learning_rate": 0.00016047135550999143, "loss": 0.0151, "step": 358850 }, { "epoch": 0.93, "learning_rate": 0.00016046746729361994, "loss": 0.0143, "step": 358860 }, { "epoch": 0.93, "learning_rate": 0.00016046357907724849, "loss": 0.0141, "step": 358870 }, { "epoch": 0.93, "learning_rate": 0.000160459690860877, "loss": 0.0097, "step": 358880 }, { "epoch": 0.93, "learning_rate": 0.00016045580264450557, "loss": 0.0156, "step": 358890 }, { "epoch": 0.93, "learning_rate": 0.00016045191442813408, "loss": 0.0127, "step": 358900 }, { "epoch": 0.93, "learning_rate": 0.00016044802621176262, "loss": 0.0123, "step": 358910 }, { "epoch": 0.93, "learning_rate": 0.00016044413799539114, "loss": 0.0147, "step": 358920 }, { "epoch": 0.93, "learning_rate": 0.0001604402497790197, "loss": 0.0091, "step": 358930 }, { "epoch": 0.93, "learning_rate": 0.00016043636156264822, "loss": 0.0116, "step": 358940 }, { "epoch": 0.93, "learning_rate": 0.00016043247334627676, "loss": 0.013, "step": 358950 }, { "epoch": 0.93, "learning_rate": 0.00016042858512990528, "loss": 0.0114, "step": 358960 }, { "epoch": 0.93, "learning_rate": 0.00016042469691353385, "loss": 0.0163, "step": 358970 }, { "epoch": 0.93, "learning_rate": 0.00016042080869716236, "loss": 0.0154, "step": 358980 }, { "epoch": 0.93, "learning_rate": 0.0001604169204807909, "loss": 0.0131, "step": 358990 }, { "epoch": 0.93, "learning_rate": 0.00016041303226441942, "loss": 0.0134, "step": 359000 }, { "epoch": 0.93, "eval_cer": 0.8817712685329425, "eval_loss": 0.008768617175519466, "eval_runtime": 107.5531, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 359000 }, { "epoch": 0.93, "learning_rate": 0.000160409144048048, "loss": 0.0086, "step": 359010 }, { "epoch": 0.93, "learning_rate": 0.00016040525583167653, "loss": 0.0117, "step": 359020 }, { "epoch": 0.93, "learning_rate": 0.00016040136761530504, "loss": 0.0163, "step": 359030 }, { "epoch": 0.93, "learning_rate": 0.00016039747939893356, "loss": 0.0169, "step": 359040 }, { "epoch": 0.93, "learning_rate": 0.0001603935911825621, "loss": 0.0128, "step": 359050 }, { "epoch": 0.93, "learning_rate": 0.00016038970296619067, "loss": 0.0112, "step": 359060 }, { "epoch": 0.93, "learning_rate": 0.00016038581474981918, "loss": 0.0138, "step": 359070 }, { "epoch": 0.93, "learning_rate": 0.00016038192653344772, "loss": 0.0135, "step": 359080 }, { "epoch": 0.93, "learning_rate": 0.00016037803831707624, "loss": 0.0168, "step": 359090 }, { "epoch": 0.93, "learning_rate": 0.0001603741501007048, "loss": 0.0115, "step": 359100 }, { "epoch": 0.93, "learning_rate": 0.00016037026188433332, "loss": 0.0121, "step": 359110 }, { "epoch": 0.93, "learning_rate": 0.00016036637366796186, "loss": 0.0126, "step": 359120 }, { "epoch": 0.93, "learning_rate": 0.00016036248545159038, "loss": 0.0159, "step": 359130 }, { "epoch": 0.93, "learning_rate": 0.00016035859723521895, "loss": 0.0105, "step": 359140 }, { "epoch": 0.93, "learning_rate": 0.00016035470901884746, "loss": 0.0132, "step": 359150 }, { "epoch": 0.93, "learning_rate": 0.000160350820802476, "loss": 0.0112, "step": 359160 }, { "epoch": 0.93, "learning_rate": 0.00016034693258610452, "loss": 0.0152, "step": 359170 }, { "epoch": 0.93, "learning_rate": 0.0001603430443697331, "loss": 0.0108, "step": 359180 }, { "epoch": 0.93, "learning_rate": 0.0001603391561533616, "loss": 0.0147, "step": 359190 }, { "epoch": 0.93, "learning_rate": 0.00016033526793699014, "loss": 0.0144, "step": 359200 }, { "epoch": 0.93, "learning_rate": 0.00016033137972061866, "loss": 0.0138, "step": 359210 }, { "epoch": 0.93, "learning_rate": 0.00016032749150424723, "loss": 0.0132, "step": 359220 }, { "epoch": 0.93, "learning_rate": 0.00016032360328787577, "loss": 0.0143, "step": 359230 }, { "epoch": 0.93, "learning_rate": 0.00016031971507150428, "loss": 0.0111, "step": 359240 }, { "epoch": 0.93, "learning_rate": 0.00016031582685513282, "loss": 0.0115, "step": 359250 }, { "epoch": 0.93, "learning_rate": 0.00016031193863876134, "loss": 0.0138, "step": 359260 }, { "epoch": 0.93, "learning_rate": 0.0001603080504223899, "loss": 0.0098, "step": 359270 }, { "epoch": 0.93, "learning_rate": 0.00016030416220601842, "loss": 0.016, "step": 359280 }, { "epoch": 0.93, "learning_rate": 0.00016030027398964696, "loss": 0.0127, "step": 359290 }, { "epoch": 0.93, "learning_rate": 0.00016029638577327548, "loss": 0.0146, "step": 359300 }, { "epoch": 0.93, "learning_rate": 0.00016029249755690405, "loss": 0.012, "step": 359310 }, { "epoch": 0.93, "learning_rate": 0.00016028860934053256, "loss": 0.0138, "step": 359320 }, { "epoch": 0.93, "learning_rate": 0.0001602847211241611, "loss": 0.0133, "step": 359330 }, { "epoch": 0.93, "learning_rate": 0.00016028083290778962, "loss": 0.0113, "step": 359340 }, { "epoch": 0.93, "learning_rate": 0.00016027694469141819, "loss": 0.0126, "step": 359350 }, { "epoch": 0.93, "learning_rate": 0.0001602730564750467, "loss": 0.0162, "step": 359360 }, { "epoch": 0.93, "learning_rate": 0.00016026916825867524, "loss": 0.0111, "step": 359370 }, { "epoch": 0.93, "learning_rate": 0.00016026528004230376, "loss": 0.0103, "step": 359380 }, { "epoch": 0.93, "learning_rate": 0.00016026139182593233, "loss": 0.0122, "step": 359390 }, { "epoch": 0.93, "learning_rate": 0.00016025750360956087, "loss": 0.0135, "step": 359400 }, { "epoch": 0.93, "learning_rate": 0.00016025361539318938, "loss": 0.0085, "step": 359410 }, { "epoch": 0.93, "learning_rate": 0.00016024972717681792, "loss": 0.0125, "step": 359420 }, { "epoch": 0.93, "learning_rate": 0.00016024583896044646, "loss": 0.0138, "step": 359430 }, { "epoch": 0.93, "learning_rate": 0.000160241950744075, "loss": 0.0145, "step": 359440 }, { "epoch": 0.93, "learning_rate": 0.00016023806252770352, "loss": 0.0144, "step": 359450 }, { "epoch": 0.93, "learning_rate": 0.00016023417431133206, "loss": 0.0141, "step": 359460 }, { "epoch": 0.93, "learning_rate": 0.0001602302860949606, "loss": 0.0143, "step": 359470 }, { "epoch": 0.93, "learning_rate": 0.00016022639787858915, "loss": 0.0118, "step": 359480 }, { "epoch": 0.93, "learning_rate": 0.00016022250966221766, "loss": 0.0134, "step": 359490 }, { "epoch": 0.93, "learning_rate": 0.0001602186214458462, "loss": 0.0191, "step": 359500 }, { "epoch": 0.93, "learning_rate": 0.00016021473322947472, "loss": 0.0104, "step": 359510 }, { "epoch": 0.93, "learning_rate": 0.00016021084501310329, "loss": 0.0169, "step": 359520 }, { "epoch": 0.93, "learning_rate": 0.0001602069567967318, "loss": 0.0113, "step": 359530 }, { "epoch": 0.93, "learning_rate": 0.00016020306858036034, "loss": 0.016, "step": 359540 }, { "epoch": 0.93, "learning_rate": 0.00016019918036398886, "loss": 0.0147, "step": 359550 }, { "epoch": 0.93, "learning_rate": 0.00016019529214761742, "loss": 0.0137, "step": 359560 }, { "epoch": 0.93, "learning_rate": 0.00016019140393124597, "loss": 0.0127, "step": 359570 }, { "epoch": 0.93, "learning_rate": 0.00016018751571487448, "loss": 0.0131, "step": 359580 }, { "epoch": 0.93, "learning_rate": 0.000160183627498503, "loss": 0.0141, "step": 359590 }, { "epoch": 0.93, "learning_rate": 0.00016017973928213156, "loss": 0.0126, "step": 359600 }, { "epoch": 0.93, "learning_rate": 0.0001601758510657601, "loss": 0.0126, "step": 359610 }, { "epoch": 0.93, "learning_rate": 0.00016017196284938862, "loss": 0.0131, "step": 359620 }, { "epoch": 0.93, "learning_rate": 0.00016016807463301716, "loss": 0.0117, "step": 359630 }, { "epoch": 0.93, "learning_rate": 0.0001601641864166457, "loss": 0.0142, "step": 359640 }, { "epoch": 0.93, "learning_rate": 0.00016016029820027425, "loss": 0.0129, "step": 359650 }, { "epoch": 0.93, "learning_rate": 0.00016015640998390276, "loss": 0.015, "step": 359660 }, { "epoch": 0.93, "learning_rate": 0.0001601525217675313, "loss": 0.0111, "step": 359670 }, { "epoch": 0.93, "learning_rate": 0.00016014863355115984, "loss": 0.0137, "step": 359680 }, { "epoch": 0.93, "learning_rate": 0.00016014474533478838, "loss": 0.0121, "step": 359690 }, { "epoch": 0.93, "learning_rate": 0.0001601408571184169, "loss": 0.0129, "step": 359700 }, { "epoch": 0.93, "learning_rate": 0.00016013696890204544, "loss": 0.0158, "step": 359710 }, { "epoch": 0.93, "learning_rate": 0.000160133080685674, "loss": 0.011, "step": 359720 }, { "epoch": 0.93, "learning_rate": 0.00016012919246930252, "loss": 0.0132, "step": 359730 }, { "epoch": 0.93, "learning_rate": 0.00016012530425293107, "loss": 0.0177, "step": 359740 }, { "epoch": 0.93, "learning_rate": 0.00016012141603655958, "loss": 0.0135, "step": 359750 }, { "epoch": 0.93, "learning_rate": 0.0001601175278201881, "loss": 0.0094, "step": 359760 }, { "epoch": 0.93, "learning_rate": 0.00016011363960381666, "loss": 0.0127, "step": 359770 }, { "epoch": 0.93, "learning_rate": 0.0001601097513874452, "loss": 0.0162, "step": 359780 }, { "epoch": 0.93, "learning_rate": 0.00016010586317107372, "loss": 0.0127, "step": 359790 }, { "epoch": 0.93, "learning_rate": 0.00016010197495470226, "loss": 0.0151, "step": 359800 }, { "epoch": 0.93, "learning_rate": 0.0001600980867383308, "loss": 0.0119, "step": 359810 }, { "epoch": 0.93, "learning_rate": 0.00016009419852195934, "loss": 0.0114, "step": 359820 }, { "epoch": 0.93, "learning_rate": 0.00016009031030558786, "loss": 0.013, "step": 359830 }, { "epoch": 0.93, "learning_rate": 0.0001600864220892164, "loss": 0.013, "step": 359840 }, { "epoch": 0.93, "learning_rate": 0.00016008253387284494, "loss": 0.0156, "step": 359850 }, { "epoch": 0.93, "learning_rate": 0.00016007864565647348, "loss": 0.0135, "step": 359860 }, { "epoch": 0.93, "learning_rate": 0.000160074757440102, "loss": 0.0142, "step": 359870 }, { "epoch": 0.93, "learning_rate": 0.00016007086922373054, "loss": 0.0114, "step": 359880 }, { "epoch": 0.93, "learning_rate": 0.0001600669810073591, "loss": 0.0125, "step": 359890 }, { "epoch": 0.93, "learning_rate": 0.00016006309279098762, "loss": 0.0099, "step": 359900 }, { "epoch": 0.93, "learning_rate": 0.00016005920457461614, "loss": 0.0142, "step": 359910 }, { "epoch": 0.93, "learning_rate": 0.00016005531635824468, "loss": 0.0102, "step": 359920 }, { "epoch": 0.93, "learning_rate": 0.00016005142814187325, "loss": 0.0121, "step": 359930 }, { "epoch": 0.93, "learning_rate": 0.00016004753992550176, "loss": 0.0126, "step": 359940 }, { "epoch": 0.93, "learning_rate": 0.0001600436517091303, "loss": 0.0094, "step": 359950 }, { "epoch": 0.93, "learning_rate": 0.00016003976349275882, "loss": 0.0125, "step": 359960 }, { "epoch": 0.93, "learning_rate": 0.0001600358752763874, "loss": 0.0146, "step": 359970 }, { "epoch": 0.93, "learning_rate": 0.0001600319870600159, "loss": 0.0106, "step": 359980 }, { "epoch": 0.93, "learning_rate": 0.00016002809884364444, "loss": 0.0128, "step": 359990 }, { "epoch": 0.93, "learning_rate": 0.00016002421062727296, "loss": 0.0148, "step": 360000 }, { "epoch": 0.93, "eval_cer": 0.8817110841447728, "eval_loss": 0.008698065765202045, "eval_runtime": 107.5328, "eval_samples_per_second": 18.599, "eval_steps_per_second": 4.65, "step": 360000 }, { "epoch": 0.93, "learning_rate": 0.0001600203224109015, "loss": 0.0115, "step": 360010 }, { "epoch": 0.93, "learning_rate": 0.00016001643419453004, "loss": 0.0101, "step": 360020 }, { "epoch": 0.93, "learning_rate": 0.00016001254597815858, "loss": 0.0103, "step": 360030 }, { "epoch": 0.93, "learning_rate": 0.0001600086577617871, "loss": 0.0123, "step": 360040 }, { "epoch": 0.93, "learning_rate": 0.00016000476954541564, "loss": 0.0157, "step": 360050 }, { "epoch": 0.93, "learning_rate": 0.00016000088132904418, "loss": 0.0127, "step": 360060 }, { "epoch": 0.93, "learning_rate": 0.00015999699311267272, "loss": 0.0107, "step": 360070 }, { "epoch": 0.93, "learning_rate": 0.00015999310489630124, "loss": 0.0111, "step": 360080 }, { "epoch": 0.93, "learning_rate": 0.00015998921667992978, "loss": 0.0135, "step": 360090 }, { "epoch": 0.93, "learning_rate": 0.00015998532846355835, "loss": 0.0136, "step": 360100 }, { "epoch": 0.93, "learning_rate": 0.00015998144024718686, "loss": 0.0134, "step": 360110 }, { "epoch": 0.93, "learning_rate": 0.0001599775520308154, "loss": 0.0121, "step": 360120 }, { "epoch": 0.93, "learning_rate": 0.00015997366381444392, "loss": 0.012, "step": 360130 }, { "epoch": 0.93, "learning_rate": 0.0001599697755980725, "loss": 0.0121, "step": 360140 }, { "epoch": 0.93, "learning_rate": 0.000159965887381701, "loss": 0.013, "step": 360150 }, { "epoch": 0.93, "learning_rate": 0.00015996199916532954, "loss": 0.0121, "step": 360160 }, { "epoch": 0.93, "learning_rate": 0.00015995811094895806, "loss": 0.0156, "step": 360170 }, { "epoch": 0.93, "learning_rate": 0.00015995422273258663, "loss": 0.0136, "step": 360180 }, { "epoch": 0.93, "learning_rate": 0.00015995033451621514, "loss": 0.0121, "step": 360190 }, { "epoch": 0.93, "learning_rate": 0.00015994644629984368, "loss": 0.0149, "step": 360200 }, { "epoch": 0.93, "learning_rate": 0.0001599425580834722, "loss": 0.012, "step": 360210 }, { "epoch": 0.93, "learning_rate": 0.00015993866986710077, "loss": 0.013, "step": 360220 }, { "epoch": 0.93, "learning_rate": 0.00015993478165072928, "loss": 0.0138, "step": 360230 }, { "epoch": 0.93, "learning_rate": 0.00015993089343435782, "loss": 0.0113, "step": 360240 }, { "epoch": 0.93, "learning_rate": 0.00015992700521798634, "loss": 0.0152, "step": 360250 }, { "epoch": 0.93, "learning_rate": 0.00015992311700161488, "loss": 0.0129, "step": 360260 }, { "epoch": 0.93, "learning_rate": 0.00015991922878524345, "loss": 0.0111, "step": 360270 }, { "epoch": 0.93, "learning_rate": 0.00015991534056887196, "loss": 0.0115, "step": 360280 }, { "epoch": 0.93, "learning_rate": 0.0001599114523525005, "loss": 0.0126, "step": 360290 }, { "epoch": 0.93, "learning_rate": 0.00015990756413612902, "loss": 0.0202, "step": 360300 }, { "epoch": 0.93, "learning_rate": 0.0001599036759197576, "loss": 0.0111, "step": 360310 }, { "epoch": 0.93, "learning_rate": 0.0001598997877033861, "loss": 0.011, "step": 360320 }, { "epoch": 0.93, "learning_rate": 0.00015989589948701464, "loss": 0.0114, "step": 360330 }, { "epoch": 0.93, "learning_rate": 0.00015989201127064316, "loss": 0.0138, "step": 360340 }, { "epoch": 0.93, "learning_rate": 0.00015988812305427173, "loss": 0.0149, "step": 360350 }, { "epoch": 0.93, "learning_rate": 0.00015988423483790024, "loss": 0.0124, "step": 360360 }, { "epoch": 0.93, "learning_rate": 0.00015988034662152878, "loss": 0.0113, "step": 360370 }, { "epoch": 0.93, "learning_rate": 0.0001598764584051573, "loss": 0.0105, "step": 360380 }, { "epoch": 0.93, "learning_rate": 0.00015987257018878587, "loss": 0.0119, "step": 360390 }, { "epoch": 0.93, "learning_rate": 0.00015986868197241438, "loss": 0.0131, "step": 360400 }, { "epoch": 0.93, "learning_rate": 0.00015986479375604292, "loss": 0.0105, "step": 360410 }, { "epoch": 0.93, "learning_rate": 0.00015986090553967144, "loss": 0.0129, "step": 360420 }, { "epoch": 0.93, "learning_rate": 0.0001598570173233, "loss": 0.0139, "step": 360430 }, { "epoch": 0.93, "learning_rate": 0.00015985312910692855, "loss": 0.0125, "step": 360440 }, { "epoch": 0.93, "learning_rate": 0.00015984924089055706, "loss": 0.0118, "step": 360450 }, { "epoch": 0.93, "learning_rate": 0.0001598453526741856, "loss": 0.0135, "step": 360460 }, { "epoch": 0.93, "learning_rate": 0.00015984146445781414, "loss": 0.0103, "step": 360470 }, { "epoch": 0.93, "learning_rate": 0.00015983757624144269, "loss": 0.0165, "step": 360480 }, { "epoch": 0.93, "learning_rate": 0.0001598336880250712, "loss": 0.0146, "step": 360490 }, { "epoch": 0.93, "learning_rate": 0.00015982979980869974, "loss": 0.0145, "step": 360500 }, { "epoch": 0.93, "learning_rate": 0.00015982591159232826, "loss": 0.0116, "step": 360510 }, { "epoch": 0.93, "learning_rate": 0.00015982202337595683, "loss": 0.0124, "step": 360520 }, { "epoch": 0.93, "learning_rate": 0.00015981813515958534, "loss": 0.0104, "step": 360530 }, { "epoch": 0.93, "learning_rate": 0.00015981424694321388, "loss": 0.0133, "step": 360540 }, { "epoch": 0.93, "learning_rate": 0.0001598103587268424, "loss": 0.0116, "step": 360550 }, { "epoch": 0.93, "learning_rate": 0.00015980647051047097, "loss": 0.0145, "step": 360560 }, { "epoch": 0.93, "learning_rate": 0.00015980258229409948, "loss": 0.0152, "step": 360570 }, { "epoch": 0.93, "learning_rate": 0.00015979869407772802, "loss": 0.0123, "step": 360580 }, { "epoch": 0.93, "learning_rate": 0.00015979480586135654, "loss": 0.0109, "step": 360590 }, { "epoch": 0.93, "learning_rate": 0.0001597909176449851, "loss": 0.0169, "step": 360600 }, { "epoch": 0.93, "learning_rate": 0.00015978702942861365, "loss": 0.0157, "step": 360610 }, { "epoch": 0.93, "learning_rate": 0.00015978314121224216, "loss": 0.0116, "step": 360620 }, { "epoch": 0.93, "learning_rate": 0.00015977925299587068, "loss": 0.015, "step": 360630 }, { "epoch": 0.93, "learning_rate": 0.00015977536477949924, "loss": 0.0118, "step": 360640 }, { "epoch": 0.93, "learning_rate": 0.00015977147656312779, "loss": 0.0117, "step": 360650 }, { "epoch": 0.93, "learning_rate": 0.0001597675883467563, "loss": 0.0111, "step": 360660 }, { "epoch": 0.93, "learning_rate": 0.00015976370013038484, "loss": 0.0145, "step": 360670 }, { "epoch": 0.93, "learning_rate": 0.00015975981191401338, "loss": 0.0114, "step": 360680 }, { "epoch": 0.93, "learning_rate": 0.00015975592369764193, "loss": 0.0132, "step": 360690 }, { "epoch": 0.93, "learning_rate": 0.00015975203548127044, "loss": 0.0154, "step": 360700 }, { "epoch": 0.94, "learning_rate": 0.00015974814726489898, "loss": 0.0133, "step": 360710 }, { "epoch": 0.94, "learning_rate": 0.00015974425904852752, "loss": 0.0099, "step": 360720 }, { "epoch": 0.94, "learning_rate": 0.00015974037083215606, "loss": 0.0105, "step": 360730 }, { "epoch": 0.94, "learning_rate": 0.00015973648261578458, "loss": 0.0126, "step": 360740 }, { "epoch": 0.94, "learning_rate": 0.00015973259439941312, "loss": 0.0118, "step": 360750 }, { "epoch": 0.94, "learning_rate": 0.00015972870618304164, "loss": 0.0133, "step": 360760 }, { "epoch": 0.94, "learning_rate": 0.0001597248179666702, "loss": 0.0124, "step": 360770 }, { "epoch": 0.94, "learning_rate": 0.00015972092975029872, "loss": 0.0143, "step": 360780 }, { "epoch": 0.94, "learning_rate": 0.00015971704153392726, "loss": 0.0123, "step": 360790 }, { "epoch": 0.94, "learning_rate": 0.00015971315331755577, "loss": 0.0141, "step": 360800 }, { "epoch": 0.94, "learning_rate": 0.00015970926510118434, "loss": 0.0123, "step": 360810 }, { "epoch": 0.94, "learning_rate": 0.00015970537688481289, "loss": 0.0116, "step": 360820 }, { "epoch": 0.94, "learning_rate": 0.0001597014886684414, "loss": 0.0172, "step": 360830 }, { "epoch": 0.94, "learning_rate": 0.00015969760045206994, "loss": 0.0137, "step": 360840 }, { "epoch": 0.94, "learning_rate": 0.00015969371223569848, "loss": 0.011, "step": 360850 }, { "epoch": 0.94, "learning_rate": 0.00015968982401932702, "loss": 0.011, "step": 360860 }, { "epoch": 0.94, "learning_rate": 0.00015968593580295554, "loss": 0.0122, "step": 360870 }, { "epoch": 0.94, "learning_rate": 0.00015968204758658408, "loss": 0.0148, "step": 360880 }, { "epoch": 0.94, "learning_rate": 0.00015967815937021262, "loss": 0.0117, "step": 360890 }, { "epoch": 0.94, "learning_rate": 0.00015967427115384116, "loss": 0.0145, "step": 360900 }, { "epoch": 0.94, "learning_rate": 0.00015967038293746968, "loss": 0.0107, "step": 360910 }, { "epoch": 0.94, "learning_rate": 0.00015966649472109822, "loss": 0.0125, "step": 360920 }, { "epoch": 0.94, "learning_rate": 0.0001596626065047268, "loss": 0.0224, "step": 360930 }, { "epoch": 0.94, "learning_rate": 0.0001596587182883553, "loss": 0.0142, "step": 360940 }, { "epoch": 0.94, "learning_rate": 0.00015965483007198382, "loss": 0.011, "step": 360950 }, { "epoch": 0.94, "learning_rate": 0.00015965094185561236, "loss": 0.0114, "step": 360960 }, { "epoch": 0.94, "learning_rate": 0.00015964705363924093, "loss": 0.013, "step": 360970 }, { "epoch": 0.94, "learning_rate": 0.00015964316542286944, "loss": 0.0128, "step": 360980 }, { "epoch": 0.94, "learning_rate": 0.00015963927720649798, "loss": 0.0114, "step": 360990 }, { "epoch": 0.94, "learning_rate": 0.0001596353889901265, "loss": 0.0139, "step": 361000 }, { "epoch": 0.94, "eval_cer": 0.8817684692590742, "eval_loss": 0.008725974708795547, "eval_runtime": 107.3705, "eval_samples_per_second": 18.627, "eval_steps_per_second": 4.657, "step": 361000 }, { "epoch": 0.94, "learning_rate": 0.00015963150077375504, "loss": 0.0134, "step": 361010 }, { "epoch": 0.94, "learning_rate": 0.00015962761255738358, "loss": 0.0112, "step": 361020 }, { "epoch": 0.94, "learning_rate": 0.00015962372434101212, "loss": 0.0154, "step": 361030 }, { "epoch": 0.94, "learning_rate": 0.00015961983612464064, "loss": 0.0118, "step": 361040 }, { "epoch": 0.94, "learning_rate": 0.00015961594790826918, "loss": 0.0129, "step": 361050 }, { "epoch": 0.94, "learning_rate": 0.00015961205969189772, "loss": 0.0142, "step": 361060 }, { "epoch": 0.94, "learning_rate": 0.00015960817147552626, "loss": 0.0106, "step": 361070 }, { "epoch": 0.94, "learning_rate": 0.00015960428325915478, "loss": 0.0147, "step": 361080 }, { "epoch": 0.94, "learning_rate": 0.00015960039504278332, "loss": 0.0121, "step": 361090 }, { "epoch": 0.94, "learning_rate": 0.00015959650682641186, "loss": 0.0117, "step": 361100 }, { "epoch": 0.94, "learning_rate": 0.0001595926186100404, "loss": 0.0121, "step": 361110 }, { "epoch": 0.94, "learning_rate": 0.00015958873039366892, "loss": 0.0118, "step": 361120 }, { "epoch": 0.94, "learning_rate": 0.00015958484217729746, "loss": 0.0151, "step": 361130 }, { "epoch": 0.94, "learning_rate": 0.00015958095396092603, "loss": 0.0166, "step": 361140 }, { "epoch": 0.94, "learning_rate": 0.00015957706574455454, "loss": 0.0121, "step": 361150 }, { "epoch": 0.94, "learning_rate": 0.00015957317752818308, "loss": 0.0113, "step": 361160 }, { "epoch": 0.94, "learning_rate": 0.0001595692893118116, "loss": 0.0127, "step": 361170 }, { "epoch": 0.94, "learning_rate": 0.00015956540109544017, "loss": 0.0136, "step": 361180 }, { "epoch": 0.94, "learning_rate": 0.00015956151287906868, "loss": 0.0157, "step": 361190 }, { "epoch": 0.94, "learning_rate": 0.00015955762466269722, "loss": 0.0115, "step": 361200 }, { "epoch": 0.94, "learning_rate": 0.00015955373644632574, "loss": 0.0131, "step": 361210 }, { "epoch": 0.94, "learning_rate": 0.0001595498482299543, "loss": 0.0122, "step": 361220 }, { "epoch": 0.94, "learning_rate": 0.00015954596001358282, "loss": 0.0102, "step": 361230 }, { "epoch": 0.94, "learning_rate": 0.00015954207179721136, "loss": 0.0125, "step": 361240 }, { "epoch": 0.94, "learning_rate": 0.00015953818358083988, "loss": 0.0111, "step": 361250 }, { "epoch": 0.94, "learning_rate": 0.00015953429536446842, "loss": 0.0135, "step": 361260 }, { "epoch": 0.94, "learning_rate": 0.00015953040714809696, "loss": 0.014, "step": 361270 }, { "epoch": 0.94, "learning_rate": 0.0001595265189317255, "loss": 0.0144, "step": 361280 }, { "epoch": 0.94, "learning_rate": 0.00015952263071535402, "loss": 0.0116, "step": 361290 }, { "epoch": 0.94, "learning_rate": 0.00015951874249898256, "loss": 0.0103, "step": 361300 }, { "epoch": 0.94, "learning_rate": 0.00015951485428261113, "loss": 0.0137, "step": 361310 }, { "epoch": 0.94, "learning_rate": 0.00015951096606623964, "loss": 0.0135, "step": 361320 }, { "epoch": 0.94, "learning_rate": 0.00015950707784986818, "loss": 0.015, "step": 361330 }, { "epoch": 0.94, "learning_rate": 0.0001595031896334967, "loss": 0.0127, "step": 361340 }, { "epoch": 0.94, "learning_rate": 0.00015949930141712527, "loss": 0.0122, "step": 361350 }, { "epoch": 0.94, "learning_rate": 0.00015949541320075378, "loss": 0.0117, "step": 361360 }, { "epoch": 0.94, "learning_rate": 0.00015949152498438232, "loss": 0.0123, "step": 361370 }, { "epoch": 0.94, "learning_rate": 0.00015948763676801084, "loss": 0.0145, "step": 361380 }, { "epoch": 0.94, "learning_rate": 0.0001594837485516394, "loss": 0.0131, "step": 361390 }, { "epoch": 0.94, "learning_rate": 0.00015947986033526792, "loss": 0.0143, "step": 361400 }, { "epoch": 0.94, "learning_rate": 0.00015947597211889646, "loss": 0.013, "step": 361410 }, { "epoch": 0.94, "learning_rate": 0.00015947208390252498, "loss": 0.0134, "step": 361420 }, { "epoch": 0.94, "learning_rate": 0.00015946819568615355, "loss": 0.0121, "step": 361430 }, { "epoch": 0.94, "learning_rate": 0.00015946430746978206, "loss": 0.0126, "step": 361440 }, { "epoch": 0.94, "learning_rate": 0.0001594604192534106, "loss": 0.0109, "step": 361450 }, { "epoch": 0.94, "learning_rate": 0.00015945653103703912, "loss": 0.0178, "step": 361460 }, { "epoch": 0.94, "learning_rate": 0.00015945264282066768, "loss": 0.0153, "step": 361470 }, { "epoch": 0.94, "learning_rate": 0.00015944875460429623, "loss": 0.0141, "step": 361480 }, { "epoch": 0.94, "learning_rate": 0.00015944486638792474, "loss": 0.0117, "step": 361490 }, { "epoch": 0.94, "learning_rate": 0.00015944097817155326, "loss": 0.0167, "step": 361500 }, { "epoch": 0.94, "learning_rate": 0.0001594370899551818, "loss": 0.0142, "step": 361510 }, { "epoch": 0.94, "learning_rate": 0.00015943320173881037, "loss": 0.0175, "step": 361520 }, { "epoch": 0.94, "learning_rate": 0.00015942931352243888, "loss": 0.0173, "step": 361530 }, { "epoch": 0.94, "learning_rate": 0.00015942542530606742, "loss": 0.0142, "step": 361540 }, { "epoch": 0.94, "learning_rate": 0.00015942153708969594, "loss": 0.0167, "step": 361550 }, { "epoch": 0.94, "learning_rate": 0.0001594176488733245, "loss": 0.0093, "step": 361560 }, { "epoch": 0.94, "learning_rate": 0.00015941376065695302, "loss": 0.0129, "step": 361570 }, { "epoch": 0.94, "learning_rate": 0.00015940987244058156, "loss": 0.0193, "step": 361580 }, { "epoch": 0.94, "learning_rate": 0.00015940598422421008, "loss": 0.0115, "step": 361590 }, { "epoch": 0.94, "learning_rate": 0.00015940209600783864, "loss": 0.0109, "step": 361600 }, { "epoch": 0.94, "learning_rate": 0.00015939820779146716, "loss": 0.0133, "step": 361610 }, { "epoch": 0.94, "learning_rate": 0.0001593943195750957, "loss": 0.012, "step": 361620 }, { "epoch": 0.94, "learning_rate": 0.00015939043135872422, "loss": 0.0143, "step": 361630 }, { "epoch": 0.94, "learning_rate": 0.00015938654314235278, "loss": 0.0141, "step": 361640 }, { "epoch": 0.94, "learning_rate": 0.0001593826549259813, "loss": 0.0119, "step": 361650 }, { "epoch": 0.94, "learning_rate": 0.00015937876670960984, "loss": 0.0106, "step": 361660 }, { "epoch": 0.94, "learning_rate": 0.00015937487849323836, "loss": 0.0124, "step": 361670 }, { "epoch": 0.94, "learning_rate": 0.00015937099027686692, "loss": 0.0144, "step": 361680 }, { "epoch": 0.94, "learning_rate": 0.00015936710206049547, "loss": 0.0135, "step": 361690 }, { "epoch": 0.94, "learning_rate": 0.00015936321384412398, "loss": 0.0105, "step": 361700 }, { "epoch": 0.94, "learning_rate": 0.00015935932562775252, "loss": 0.0117, "step": 361710 }, { "epoch": 0.94, "learning_rate": 0.00015935543741138106, "loss": 0.0122, "step": 361720 }, { "epoch": 0.94, "learning_rate": 0.0001593515491950096, "loss": 0.0123, "step": 361730 }, { "epoch": 0.94, "learning_rate": 0.00015934766097863812, "loss": 0.0149, "step": 361740 }, { "epoch": 0.94, "learning_rate": 0.00015934377276226666, "loss": 0.0173, "step": 361750 }, { "epoch": 0.94, "learning_rate": 0.00015933988454589518, "loss": 0.0126, "step": 361760 }, { "epoch": 0.94, "learning_rate": 0.00015933599632952374, "loss": 0.0141, "step": 361770 }, { "epoch": 0.94, "learning_rate": 0.00015933210811315226, "loss": 0.0154, "step": 361780 }, { "epoch": 0.94, "learning_rate": 0.0001593282198967808, "loss": 0.0133, "step": 361790 }, { "epoch": 0.94, "learning_rate": 0.00015932433168040932, "loss": 0.0185, "step": 361800 }, { "epoch": 0.94, "learning_rate": 0.00015932044346403788, "loss": 0.0112, "step": 361810 }, { "epoch": 0.94, "learning_rate": 0.0001593165552476664, "loss": 0.014, "step": 361820 }, { "epoch": 0.94, "learning_rate": 0.00015931266703129494, "loss": 0.0165, "step": 361830 }, { "epoch": 0.94, "learning_rate": 0.00015930877881492345, "loss": 0.0127, "step": 361840 }, { "epoch": 0.94, "learning_rate": 0.00015930489059855202, "loss": 0.0131, "step": 361850 }, { "epoch": 0.94, "learning_rate": 0.00015930100238218056, "loss": 0.0122, "step": 361860 }, { "epoch": 0.94, "learning_rate": 0.00015929711416580908, "loss": 0.0119, "step": 361870 }, { "epoch": 0.94, "learning_rate": 0.00015929322594943762, "loss": 0.0131, "step": 361880 }, { "epoch": 0.94, "learning_rate": 0.00015928933773306616, "loss": 0.0136, "step": 361890 }, { "epoch": 0.94, "learning_rate": 0.0001592854495166947, "loss": 0.0116, "step": 361900 }, { "epoch": 0.94, "learning_rate": 0.00015928156130032322, "loss": 0.0135, "step": 361910 }, { "epoch": 0.94, "learning_rate": 0.00015927767308395176, "loss": 0.0118, "step": 361920 }, { "epoch": 0.94, "learning_rate": 0.0001592737848675803, "loss": 0.0112, "step": 361930 }, { "epoch": 0.94, "learning_rate": 0.00015926989665120884, "loss": 0.0126, "step": 361940 }, { "epoch": 0.94, "learning_rate": 0.00015926600843483736, "loss": 0.0137, "step": 361950 }, { "epoch": 0.94, "learning_rate": 0.0001592621202184659, "loss": 0.0148, "step": 361960 }, { "epoch": 0.94, "learning_rate": 0.00015925823200209444, "loss": 0.0137, "step": 361970 }, { "epoch": 0.94, "learning_rate": 0.00015925434378572298, "loss": 0.0119, "step": 361980 }, { "epoch": 0.94, "learning_rate": 0.0001592504555693515, "loss": 0.014, "step": 361990 }, { "epoch": 0.94, "learning_rate": 0.00015924656735298004, "loss": 0.0136, "step": 362000 }, { "epoch": 0.94, "eval_cer": 0.8817222812402463, "eval_loss": 0.008736135438084602, "eval_runtime": 107.4655, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 362000 }, { "epoch": 0.94, "learning_rate": 0.00015924267913660855, "loss": 0.015, "step": 362010 }, { "epoch": 0.94, "learning_rate": 0.00015923879092023712, "loss": 0.0129, "step": 362020 }, { "epoch": 0.94, "learning_rate": 0.00015923490270386566, "loss": 0.0126, "step": 362030 }, { "epoch": 0.94, "learning_rate": 0.00015923101448749418, "loss": 0.0117, "step": 362040 }, { "epoch": 0.94, "learning_rate": 0.0001592271262711227, "loss": 0.0145, "step": 362050 }, { "epoch": 0.94, "learning_rate": 0.00015922323805475126, "loss": 0.0107, "step": 362060 }, { "epoch": 0.94, "learning_rate": 0.0001592193498383798, "loss": 0.0174, "step": 362070 }, { "epoch": 0.94, "learning_rate": 0.00015921546162200832, "loss": 0.0141, "step": 362080 }, { "epoch": 0.94, "learning_rate": 0.00015921157340563686, "loss": 0.0119, "step": 362090 }, { "epoch": 0.94, "learning_rate": 0.0001592076851892654, "loss": 0.0133, "step": 362100 }, { "epoch": 0.94, "learning_rate": 0.00015920379697289394, "loss": 0.0136, "step": 362110 }, { "epoch": 0.94, "learning_rate": 0.00015919990875652246, "loss": 0.0127, "step": 362120 }, { "epoch": 0.94, "learning_rate": 0.000159196020540151, "loss": 0.0144, "step": 362130 }, { "epoch": 0.94, "learning_rate": 0.00015919213232377954, "loss": 0.0098, "step": 362140 }, { "epoch": 0.94, "learning_rate": 0.00015918824410740808, "loss": 0.0125, "step": 362150 }, { "epoch": 0.94, "learning_rate": 0.0001591843558910366, "loss": 0.0099, "step": 362160 }, { "epoch": 0.94, "learning_rate": 0.00015918046767466514, "loss": 0.0137, "step": 362170 }, { "epoch": 0.94, "learning_rate": 0.0001591765794582937, "loss": 0.0127, "step": 362180 }, { "epoch": 0.94, "learning_rate": 0.00015917269124192222, "loss": 0.0126, "step": 362190 }, { "epoch": 0.94, "learning_rate": 0.00015916880302555076, "loss": 0.0145, "step": 362200 }, { "epoch": 0.94, "learning_rate": 0.00015916491480917928, "loss": 0.0122, "step": 362210 }, { "epoch": 0.94, "learning_rate": 0.00015916102659280785, "loss": 0.0114, "step": 362220 }, { "epoch": 0.94, "learning_rate": 0.00015915713837643636, "loss": 0.0109, "step": 362230 }, { "epoch": 0.94, "learning_rate": 0.0001591532501600649, "loss": 0.0094, "step": 362240 }, { "epoch": 0.94, "learning_rate": 0.00015914936194369342, "loss": 0.0146, "step": 362250 }, { "epoch": 0.94, "learning_rate": 0.00015914547372732196, "loss": 0.0128, "step": 362260 }, { "epoch": 0.94, "learning_rate": 0.0001591415855109505, "loss": 0.0148, "step": 362270 }, { "epoch": 0.94, "learning_rate": 0.00015913769729457904, "loss": 0.0115, "step": 362280 }, { "epoch": 0.94, "learning_rate": 0.00015913380907820756, "loss": 0.0114, "step": 362290 }, { "epoch": 0.94, "learning_rate": 0.0001591299208618361, "loss": 0.0135, "step": 362300 }, { "epoch": 0.94, "learning_rate": 0.00015912603264546464, "loss": 0.0094, "step": 362310 }, { "epoch": 0.94, "learning_rate": 0.00015912214442909318, "loss": 0.0096, "step": 362320 }, { "epoch": 0.94, "learning_rate": 0.0001591182562127217, "loss": 0.0124, "step": 362330 }, { "epoch": 0.94, "learning_rate": 0.00015911436799635024, "loss": 0.0118, "step": 362340 }, { "epoch": 0.94, "learning_rate": 0.0001591104797799788, "loss": 0.0109, "step": 362350 }, { "epoch": 0.94, "learning_rate": 0.00015910659156360732, "loss": 0.0144, "step": 362360 }, { "epoch": 0.94, "learning_rate": 0.00015910270334723584, "loss": 0.0117, "step": 362370 }, { "epoch": 0.94, "learning_rate": 0.00015909881513086438, "loss": 0.0111, "step": 362380 }, { "epoch": 0.94, "learning_rate": 0.00015909492691449295, "loss": 0.0111, "step": 362390 }, { "epoch": 0.94, "learning_rate": 0.00015909103869812146, "loss": 0.0148, "step": 362400 }, { "epoch": 0.94, "learning_rate": 0.00015908715048175, "loss": 0.0124, "step": 362410 }, { "epoch": 0.94, "learning_rate": 0.00015908326226537852, "loss": 0.0111, "step": 362420 }, { "epoch": 0.94, "learning_rate": 0.00015907937404900709, "loss": 0.0138, "step": 362430 }, { "epoch": 0.94, "learning_rate": 0.0001590754858326356, "loss": 0.0138, "step": 362440 }, { "epoch": 0.94, "learning_rate": 0.00015907159761626414, "loss": 0.0155, "step": 362450 }, { "epoch": 0.94, "learning_rate": 0.00015906770939989266, "loss": 0.0118, "step": 362460 }, { "epoch": 0.94, "learning_rate": 0.00015906382118352123, "loss": 0.0146, "step": 362470 }, { "epoch": 0.94, "learning_rate": 0.00015905993296714974, "loss": 0.0118, "step": 362480 }, { "epoch": 0.94, "learning_rate": 0.00015905604475077828, "loss": 0.0132, "step": 362490 }, { "epoch": 0.94, "learning_rate": 0.0001590521565344068, "loss": 0.0119, "step": 362500 }, { "epoch": 0.94, "learning_rate": 0.00015904826831803534, "loss": 0.0091, "step": 362510 }, { "epoch": 0.94, "learning_rate": 0.0001590443801016639, "loss": 0.0134, "step": 362520 }, { "epoch": 0.94, "learning_rate": 0.00015904049188529242, "loss": 0.0164, "step": 362530 }, { "epoch": 0.94, "learning_rate": 0.00015903660366892094, "loss": 0.0147, "step": 362540 }, { "epoch": 0.94, "learning_rate": 0.00015903271545254948, "loss": 0.0124, "step": 362550 }, { "epoch": 0.94, "learning_rate": 0.00015902882723617805, "loss": 0.0105, "step": 362560 }, { "epoch": 0.94, "learning_rate": 0.00015902493901980656, "loss": 0.0139, "step": 362570 }, { "epoch": 0.94, "learning_rate": 0.0001590210508034351, "loss": 0.0118, "step": 362580 }, { "epoch": 0.94, "learning_rate": 0.00015901716258706362, "loss": 0.0175, "step": 362590 }, { "epoch": 0.94, "learning_rate": 0.00015901327437069219, "loss": 0.0129, "step": 362600 }, { "epoch": 0.94, "learning_rate": 0.0001590093861543207, "loss": 0.0138, "step": 362610 }, { "epoch": 0.94, "learning_rate": 0.00015900549793794924, "loss": 0.0156, "step": 362620 }, { "epoch": 0.94, "learning_rate": 0.00015900160972157776, "loss": 0.0151, "step": 362630 }, { "epoch": 0.94, "learning_rate": 0.00015899772150520632, "loss": 0.0137, "step": 362640 }, { "epoch": 0.94, "learning_rate": 0.00015899383328883484, "loss": 0.0149, "step": 362650 }, { "epoch": 0.94, "learning_rate": 0.00015898994507246338, "loss": 0.0114, "step": 362660 }, { "epoch": 0.94, "learning_rate": 0.0001589860568560919, "loss": 0.0122, "step": 362670 }, { "epoch": 0.94, "learning_rate": 0.00015898216863972046, "loss": 0.0152, "step": 362680 }, { "epoch": 0.94, "learning_rate": 0.00015897828042334898, "loss": 0.0124, "step": 362690 }, { "epoch": 0.94, "learning_rate": 0.00015897439220697752, "loss": 0.0154, "step": 362700 }, { "epoch": 0.94, "learning_rate": 0.00015897050399060603, "loss": 0.0145, "step": 362710 }, { "epoch": 0.94, "learning_rate": 0.0001589666157742346, "loss": 0.0117, "step": 362720 }, { "epoch": 0.94, "learning_rate": 0.00015896272755786315, "loss": 0.0139, "step": 362730 }, { "epoch": 0.94, "learning_rate": 0.00015895883934149166, "loss": 0.0116, "step": 362740 }, { "epoch": 0.94, "learning_rate": 0.0001589549511251202, "loss": 0.0123, "step": 362750 }, { "epoch": 0.94, "learning_rate": 0.00015895106290874872, "loss": 0.0117, "step": 362760 }, { "epoch": 0.94, "learning_rate": 0.00015894717469237728, "loss": 0.012, "step": 362770 }, { "epoch": 0.94, "learning_rate": 0.0001589432864760058, "loss": 0.011, "step": 362780 }, { "epoch": 0.94, "learning_rate": 0.00015893939825963434, "loss": 0.0121, "step": 362790 }, { "epoch": 0.94, "learning_rate": 0.00015893551004326286, "loss": 0.0111, "step": 362800 }, { "epoch": 0.94, "learning_rate": 0.00015893162182689142, "loss": 0.0098, "step": 362810 }, { "epoch": 0.94, "learning_rate": 0.00015892773361051994, "loss": 0.012, "step": 362820 }, { "epoch": 0.94, "learning_rate": 0.00015892384539414848, "loss": 0.0155, "step": 362830 }, { "epoch": 0.94, "learning_rate": 0.000158919957177777, "loss": 0.0104, "step": 362840 }, { "epoch": 0.94, "learning_rate": 0.00015891606896140556, "loss": 0.0116, "step": 362850 }, { "epoch": 0.94, "learning_rate": 0.00015891218074503408, "loss": 0.0104, "step": 362860 }, { "epoch": 0.94, "learning_rate": 0.00015890829252866262, "loss": 0.0124, "step": 362870 }, { "epoch": 0.94, "learning_rate": 0.00015890440431229113, "loss": 0.015, "step": 362880 }, { "epoch": 0.94, "learning_rate": 0.0001589005160959197, "loss": 0.0136, "step": 362890 }, { "epoch": 0.94, "learning_rate": 0.00015889662787954824, "loss": 0.0132, "step": 362900 }, { "epoch": 0.94, "learning_rate": 0.00015889273966317676, "loss": 0.0133, "step": 362910 }, { "epoch": 0.94, "learning_rate": 0.0001588888514468053, "loss": 0.0101, "step": 362920 }, { "epoch": 0.94, "learning_rate": 0.00015888496323043384, "loss": 0.0116, "step": 362930 }, { "epoch": 0.94, "learning_rate": 0.00015888107501406238, "loss": 0.0119, "step": 362940 }, { "epoch": 0.94, "learning_rate": 0.0001588771867976909, "loss": 0.0133, "step": 362950 }, { "epoch": 0.94, "learning_rate": 0.00015887329858131944, "loss": 0.0133, "step": 362960 }, { "epoch": 0.94, "learning_rate": 0.00015886941036494798, "loss": 0.0127, "step": 362970 }, { "epoch": 0.94, "learning_rate": 0.00015886552214857652, "loss": 0.011, "step": 362980 }, { "epoch": 0.94, "learning_rate": 0.00015886163393220504, "loss": 0.013, "step": 362990 }, { "epoch": 0.94, "learning_rate": 0.00015885774571583358, "loss": 0.0122, "step": 363000 }, { "epoch": 0.94, "eval_cer": 0.8817474747050615, "eval_loss": 0.0086388373747468, "eval_runtime": 107.5493, "eval_samples_per_second": 18.596, "eval_steps_per_second": 4.649, "step": 363000 }, { "epoch": 0.94, "learning_rate": 0.0001588538574994621, "loss": 0.0145, "step": 363010 }, { "epoch": 0.94, "learning_rate": 0.00015884996928309066, "loss": 0.0131, "step": 363020 }, { "epoch": 0.94, "learning_rate": 0.00015884608106671918, "loss": 0.0121, "step": 363030 }, { "epoch": 0.94, "learning_rate": 0.00015884219285034772, "loss": 0.0131, "step": 363040 }, { "epoch": 0.94, "learning_rate": 0.00015883830463397623, "loss": 0.0086, "step": 363050 }, { "epoch": 0.94, "learning_rate": 0.0001588344164176048, "loss": 0.0095, "step": 363060 }, { "epoch": 0.94, "learning_rate": 0.00015883052820123334, "loss": 0.0112, "step": 363070 }, { "epoch": 0.94, "learning_rate": 0.00015882663998486186, "loss": 0.0121, "step": 363080 }, { "epoch": 0.94, "learning_rate": 0.00015882275176849037, "loss": 0.0126, "step": 363090 }, { "epoch": 0.94, "learning_rate": 0.00015881886355211894, "loss": 0.0112, "step": 363100 }, { "epoch": 0.94, "learning_rate": 0.00015881497533574748, "loss": 0.0168, "step": 363110 }, { "epoch": 0.94, "learning_rate": 0.000158811087119376, "loss": 0.0109, "step": 363120 }, { "epoch": 0.94, "learning_rate": 0.00015880719890300454, "loss": 0.013, "step": 363130 }, { "epoch": 0.94, "learning_rate": 0.00015880331068663308, "loss": 0.0115, "step": 363140 }, { "epoch": 0.94, "learning_rate": 0.00015879942247026162, "loss": 0.0121, "step": 363150 }, { "epoch": 0.94, "learning_rate": 0.00015879553425389014, "loss": 0.0118, "step": 363160 }, { "epoch": 0.94, "learning_rate": 0.00015879164603751868, "loss": 0.0141, "step": 363170 }, { "epoch": 0.94, "learning_rate": 0.00015878775782114722, "loss": 0.012, "step": 363180 }, { "epoch": 0.94, "learning_rate": 0.00015878386960477576, "loss": 0.0159, "step": 363190 }, { "epoch": 0.94, "learning_rate": 0.00015877998138840428, "loss": 0.0123, "step": 363200 }, { "epoch": 0.94, "learning_rate": 0.00015877609317203282, "loss": 0.0135, "step": 363210 }, { "epoch": 0.94, "learning_rate": 0.0001587722049556614, "loss": 0.0132, "step": 363220 }, { "epoch": 0.94, "learning_rate": 0.0001587683167392899, "loss": 0.0097, "step": 363230 }, { "epoch": 0.94, "learning_rate": 0.00015876442852291842, "loss": 0.015, "step": 363240 }, { "epoch": 0.94, "learning_rate": 0.00015876054030654696, "loss": 0.012, "step": 363250 }, { "epoch": 0.94, "learning_rate": 0.00015875665209017547, "loss": 0.0118, "step": 363260 }, { "epoch": 0.94, "learning_rate": 0.00015875276387380404, "loss": 0.0115, "step": 363270 }, { "epoch": 0.94, "learning_rate": 0.00015874887565743258, "loss": 0.0138, "step": 363280 }, { "epoch": 0.94, "learning_rate": 0.0001587449874410611, "loss": 0.0133, "step": 363290 }, { "epoch": 0.94, "learning_rate": 0.00015874109922468964, "loss": 0.0108, "step": 363300 }, { "epoch": 0.94, "learning_rate": 0.00015873721100831818, "loss": 0.0124, "step": 363310 }, { "epoch": 0.94, "learning_rate": 0.00015873332279194672, "loss": 0.0097, "step": 363320 }, { "epoch": 0.94, "learning_rate": 0.00015872943457557524, "loss": 0.0149, "step": 363330 }, { "epoch": 0.94, "learning_rate": 0.00015872554635920378, "loss": 0.0127, "step": 363340 }, { "epoch": 0.94, "learning_rate": 0.00015872165814283232, "loss": 0.0113, "step": 363350 }, { "epoch": 0.94, "learning_rate": 0.00015871776992646086, "loss": 0.0136, "step": 363360 }, { "epoch": 0.94, "learning_rate": 0.00015871388171008938, "loss": 0.0136, "step": 363370 }, { "epoch": 0.94, "learning_rate": 0.00015870999349371792, "loss": 0.0182, "step": 363380 }, { "epoch": 0.94, "learning_rate": 0.0001587061052773465, "loss": 0.0109, "step": 363390 }, { "epoch": 0.94, "learning_rate": 0.000158702217060975, "loss": 0.0159, "step": 363400 }, { "epoch": 0.94, "learning_rate": 0.00015869832884460352, "loss": 0.0135, "step": 363410 }, { "epoch": 0.94, "learning_rate": 0.00015869444062823206, "loss": 0.0141, "step": 363420 }, { "epoch": 0.94, "learning_rate": 0.00015869055241186063, "loss": 0.0139, "step": 363430 }, { "epoch": 0.94, "learning_rate": 0.00015868666419548914, "loss": 0.0145, "step": 363440 }, { "epoch": 0.94, "learning_rate": 0.00015868277597911768, "loss": 0.0106, "step": 363450 }, { "epoch": 0.94, "learning_rate": 0.0001586788877627462, "loss": 0.0131, "step": 363460 }, { "epoch": 0.94, "learning_rate": 0.00015867499954637477, "loss": 0.0146, "step": 363470 }, { "epoch": 0.94, "learning_rate": 0.00015867111133000328, "loss": 0.0118, "step": 363480 }, { "epoch": 0.94, "learning_rate": 0.00015866722311363182, "loss": 0.0123, "step": 363490 }, { "epoch": 0.94, "learning_rate": 0.00015866333489726034, "loss": 0.0122, "step": 363500 }, { "epoch": 0.94, "learning_rate": 0.00015865944668088888, "loss": 0.0149, "step": 363510 }, { "epoch": 0.94, "learning_rate": 0.00015865555846451742, "loss": 0.0134, "step": 363520 }, { "epoch": 0.94, "learning_rate": 0.00015865167024814596, "loss": 0.0111, "step": 363530 }, { "epoch": 0.94, "learning_rate": 0.00015864778203177448, "loss": 0.0146, "step": 363540 }, { "epoch": 0.94, "learning_rate": 0.00015864389381540302, "loss": 0.0123, "step": 363550 }, { "epoch": 0.94, "learning_rate": 0.00015864000559903156, "loss": 0.0135, "step": 363560 }, { "epoch": 0.94, "learning_rate": 0.0001586361173826601, "loss": 0.0136, "step": 363570 }, { "epoch": 0.94, "learning_rate": 0.00015863222916628862, "loss": 0.0161, "step": 363580 }, { "epoch": 0.94, "learning_rate": 0.00015862834094991716, "loss": 0.0128, "step": 363590 }, { "epoch": 0.94, "learning_rate": 0.00015862445273354573, "loss": 0.0127, "step": 363600 }, { "epoch": 0.94, "learning_rate": 0.00015862056451717424, "loss": 0.0133, "step": 363610 }, { "epoch": 0.94, "learning_rate": 0.00015861667630080278, "loss": 0.0115, "step": 363620 }, { "epoch": 0.94, "learning_rate": 0.0001586127880844313, "loss": 0.0114, "step": 363630 }, { "epoch": 0.94, "learning_rate": 0.00015860889986805987, "loss": 0.013, "step": 363640 }, { "epoch": 0.94, "learning_rate": 0.00015860501165168838, "loss": 0.0132, "step": 363650 }, { "epoch": 0.94, "learning_rate": 0.00015860112343531692, "loss": 0.0145, "step": 363660 }, { "epoch": 0.94, "learning_rate": 0.00015859723521894544, "loss": 0.0127, "step": 363670 }, { "epoch": 0.94, "learning_rate": 0.000158593347002574, "loss": 0.0114, "step": 363680 }, { "epoch": 0.94, "learning_rate": 0.00015858945878620252, "loss": 0.0111, "step": 363690 }, { "epoch": 0.94, "learning_rate": 0.00015858557056983106, "loss": 0.0115, "step": 363700 }, { "epoch": 0.94, "learning_rate": 0.00015858168235345958, "loss": 0.0125, "step": 363710 }, { "epoch": 0.94, "learning_rate": 0.00015857779413708814, "loss": 0.011, "step": 363720 }, { "epoch": 0.94, "learning_rate": 0.00015857390592071666, "loss": 0.0123, "step": 363730 }, { "epoch": 0.94, "learning_rate": 0.0001585700177043452, "loss": 0.0121, "step": 363740 }, { "epoch": 0.94, "learning_rate": 0.00015856612948797371, "loss": 0.0125, "step": 363750 }, { "epoch": 0.94, "learning_rate": 0.00015856224127160226, "loss": 0.0112, "step": 363760 }, { "epoch": 0.94, "learning_rate": 0.00015855835305523083, "loss": 0.0126, "step": 363770 }, { "epoch": 0.94, "learning_rate": 0.00015855446483885934, "loss": 0.0143, "step": 363780 }, { "epoch": 0.94, "learning_rate": 0.00015855057662248788, "loss": 0.0117, "step": 363790 }, { "epoch": 0.94, "learning_rate": 0.0001585466884061164, "loss": 0.0087, "step": 363800 }, { "epoch": 0.94, "learning_rate": 0.00015854280018974496, "loss": 0.0133, "step": 363810 }, { "epoch": 0.94, "learning_rate": 0.00015853891197337348, "loss": 0.0143, "step": 363820 }, { "epoch": 0.94, "learning_rate": 0.00015853502375700202, "loss": 0.0123, "step": 363830 }, { "epoch": 0.94, "learning_rate": 0.00015853113554063054, "loss": 0.0116, "step": 363840 }, { "epoch": 0.94, "learning_rate": 0.0001585272473242591, "loss": 0.0192, "step": 363850 }, { "epoch": 0.94, "learning_rate": 0.00015852335910788762, "loss": 0.0112, "step": 363860 }, { "epoch": 0.94, "learning_rate": 0.00015851947089151616, "loss": 0.0122, "step": 363870 }, { "epoch": 0.94, "learning_rate": 0.00015851558267514467, "loss": 0.0163, "step": 363880 }, { "epoch": 0.94, "learning_rate": 0.00015851169445877324, "loss": 0.0123, "step": 363890 }, { "epoch": 0.94, "learning_rate": 0.00015850780624240176, "loss": 0.0123, "step": 363900 }, { "epoch": 0.94, "learning_rate": 0.0001585039180260303, "loss": 0.0201, "step": 363910 }, { "epoch": 0.94, "learning_rate": 0.00015850002980965881, "loss": 0.0125, "step": 363920 }, { "epoch": 0.94, "learning_rate": 0.00015849614159328738, "loss": 0.0125, "step": 363930 }, { "epoch": 0.94, "learning_rate": 0.00015849225337691592, "loss": 0.0118, "step": 363940 }, { "epoch": 0.94, "learning_rate": 0.00015848836516054444, "loss": 0.0157, "step": 363950 }, { "epoch": 0.94, "learning_rate": 0.00015848447694417295, "loss": 0.0152, "step": 363960 }, { "epoch": 0.94, "learning_rate": 0.00015848058872780152, "loss": 0.012, "step": 363970 }, { "epoch": 0.94, "learning_rate": 0.00015847670051143006, "loss": 0.0112, "step": 363980 }, { "epoch": 0.94, "learning_rate": 0.00015847281229505858, "loss": 0.0134, "step": 363990 }, { "epoch": 0.94, "learning_rate": 0.00015846892407868712, "loss": 0.0142, "step": 364000 }, { "epoch": 0.94, "eval_cer": 0.8817432757942589, "eval_loss": 0.008785239420831203, "eval_runtime": 107.5582, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 364000 }, { "epoch": 0.94, "learning_rate": 0.00015846503586231563, "loss": 0.0128, "step": 364010 }, { "epoch": 0.94, "learning_rate": 0.0001584611476459442, "loss": 0.0163, "step": 364020 }, { "epoch": 0.94, "learning_rate": 0.00015845725942957272, "loss": 0.0146, "step": 364030 }, { "epoch": 0.94, "learning_rate": 0.00015845337121320126, "loss": 0.0107, "step": 364040 }, { "epoch": 0.94, "learning_rate": 0.00015844948299682977, "loss": 0.0112, "step": 364050 }, { "epoch": 0.94, "learning_rate": 0.00015844559478045834, "loss": 0.011, "step": 364060 }, { "epoch": 0.94, "learning_rate": 0.00015844170656408686, "loss": 0.0107, "step": 364070 }, { "epoch": 0.94, "learning_rate": 0.0001584378183477154, "loss": 0.011, "step": 364080 }, { "epoch": 0.94, "learning_rate": 0.0001584339301313439, "loss": 0.0123, "step": 364090 }, { "epoch": 0.94, "learning_rate": 0.00015843004191497248, "loss": 0.0117, "step": 364100 }, { "epoch": 0.94, "learning_rate": 0.00015842615369860102, "loss": 0.0155, "step": 364110 }, { "epoch": 0.94, "learning_rate": 0.00015842226548222954, "loss": 0.0136, "step": 364120 }, { "epoch": 0.94, "learning_rate": 0.00015841837726585805, "loss": 0.0153, "step": 364130 }, { "epoch": 0.94, "learning_rate": 0.00015841448904948662, "loss": 0.0112, "step": 364140 }, { "epoch": 0.94, "learning_rate": 0.00015841060083311516, "loss": 0.0133, "step": 364150 }, { "epoch": 0.94, "learning_rate": 0.00015840671261674368, "loss": 0.0132, "step": 364160 }, { "epoch": 0.94, "learning_rate": 0.00015840282440037222, "loss": 0.0103, "step": 364170 }, { "epoch": 0.94, "learning_rate": 0.00015839893618400076, "loss": 0.011, "step": 364180 }, { "epoch": 0.94, "learning_rate": 0.0001583950479676293, "loss": 0.0128, "step": 364190 }, { "epoch": 0.94, "learning_rate": 0.00015839115975125782, "loss": 0.011, "step": 364200 }, { "epoch": 0.94, "learning_rate": 0.00015838727153488636, "loss": 0.0096, "step": 364210 }, { "epoch": 0.94, "learning_rate": 0.0001583833833185149, "loss": 0.011, "step": 364220 }, { "epoch": 0.94, "learning_rate": 0.00015837949510214344, "loss": 0.0136, "step": 364230 }, { "epoch": 0.94, "learning_rate": 0.00015837560688577196, "loss": 0.0127, "step": 364240 }, { "epoch": 0.94, "learning_rate": 0.0001583717186694005, "loss": 0.0155, "step": 364250 }, { "epoch": 0.94, "learning_rate": 0.000158367830453029, "loss": 0.0122, "step": 364260 }, { "epoch": 0.94, "learning_rate": 0.00015836394223665758, "loss": 0.0134, "step": 364270 }, { "epoch": 0.94, "learning_rate": 0.0001583600540202861, "loss": 0.0135, "step": 364280 }, { "epoch": 0.94, "learning_rate": 0.00015835616580391464, "loss": 0.0128, "step": 364290 }, { "epoch": 0.94, "learning_rate": 0.00015835227758754315, "loss": 0.0161, "step": 364300 }, { "epoch": 0.94, "learning_rate": 0.00015834838937117172, "loss": 0.0138, "step": 364310 }, { "epoch": 0.94, "learning_rate": 0.00015834450115480026, "loss": 0.0131, "step": 364320 }, { "epoch": 0.94, "learning_rate": 0.00015834061293842878, "loss": 0.0127, "step": 364330 }, { "epoch": 0.94, "learning_rate": 0.00015833672472205732, "loss": 0.0155, "step": 364340 }, { "epoch": 0.94, "learning_rate": 0.00015833283650568586, "loss": 0.0108, "step": 364350 }, { "epoch": 0.94, "learning_rate": 0.0001583289482893144, "loss": 0.0105, "step": 364360 }, { "epoch": 0.94, "learning_rate": 0.00015832506007294292, "loss": 0.0121, "step": 364370 }, { "epoch": 0.94, "learning_rate": 0.00015832117185657146, "loss": 0.0128, "step": 364380 }, { "epoch": 0.94, "learning_rate": 0.0001583172836402, "loss": 0.0109, "step": 364390 }, { "epoch": 0.94, "learning_rate": 0.00015831339542382854, "loss": 0.0108, "step": 364400 }, { "epoch": 0.94, "learning_rate": 0.00015830950720745706, "loss": 0.0111, "step": 364410 }, { "epoch": 0.94, "learning_rate": 0.0001583056189910856, "loss": 0.0138, "step": 364420 }, { "epoch": 0.94, "learning_rate": 0.00015830173077471414, "loss": 0.0124, "step": 364430 }, { "epoch": 0.94, "learning_rate": 0.00015829784255834268, "loss": 0.0118, "step": 364440 }, { "epoch": 0.94, "learning_rate": 0.0001582939543419712, "loss": 0.0134, "step": 364450 }, { "epoch": 0.94, "learning_rate": 0.00015829006612559974, "loss": 0.0124, "step": 364460 }, { "epoch": 0.94, "learning_rate": 0.00015828617790922825, "loss": 0.0131, "step": 364470 }, { "epoch": 0.94, "learning_rate": 0.00015828228969285682, "loss": 0.0201, "step": 364480 }, { "epoch": 0.94, "learning_rate": 0.00015827840147648536, "loss": 0.0129, "step": 364490 }, { "epoch": 0.94, "learning_rate": 0.00015827451326011388, "loss": 0.0136, "step": 364500 }, { "epoch": 0.94, "learning_rate": 0.00015827062504374242, "loss": 0.0112, "step": 364510 }, { "epoch": 0.94, "learning_rate": 0.00015826673682737096, "loss": 0.0121, "step": 364520 }, { "epoch": 0.94, "learning_rate": 0.0001582628486109995, "loss": 0.0131, "step": 364530 }, { "epoch": 0.94, "learning_rate": 0.00015825896039462802, "loss": 0.0122, "step": 364540 }, { "epoch": 0.94, "learning_rate": 0.00015825507217825656, "loss": 0.013, "step": 364550 }, { "epoch": 0.94, "learning_rate": 0.0001582511839618851, "loss": 0.01, "step": 364560 }, { "epoch": 0.95, "learning_rate": 0.00015824729574551364, "loss": 0.0108, "step": 364570 }, { "epoch": 0.95, "learning_rate": 0.00015824340752914216, "loss": 0.0126, "step": 364580 }, { "epoch": 0.95, "learning_rate": 0.0001582395193127707, "loss": 0.0126, "step": 364590 }, { "epoch": 0.95, "learning_rate": 0.00015823563109639924, "loss": 0.0131, "step": 364600 }, { "epoch": 0.95, "learning_rate": 0.00015823174288002778, "loss": 0.0113, "step": 364610 }, { "epoch": 0.95, "learning_rate": 0.0001582278546636563, "loss": 0.012, "step": 364620 }, { "epoch": 0.95, "learning_rate": 0.00015822396644728484, "loss": 0.0121, "step": 364630 }, { "epoch": 0.95, "learning_rate": 0.0001582200782309134, "loss": 0.0156, "step": 364640 }, { "epoch": 0.95, "learning_rate": 0.00015821619001454192, "loss": 0.0114, "step": 364650 }, { "epoch": 0.95, "learning_rate": 0.00015821230179817046, "loss": 0.0119, "step": 364660 }, { "epoch": 0.95, "learning_rate": 0.00015820841358179898, "loss": 0.0111, "step": 364670 }, { "epoch": 0.95, "learning_rate": 0.00015820452536542754, "loss": 0.0137, "step": 364680 }, { "epoch": 0.95, "learning_rate": 0.00015820063714905606, "loss": 0.0117, "step": 364690 }, { "epoch": 0.95, "learning_rate": 0.0001581967489326846, "loss": 0.0169, "step": 364700 }, { "epoch": 0.95, "learning_rate": 0.00015819286071631312, "loss": 0.0123, "step": 364710 }, { "epoch": 0.95, "learning_rate": 0.00015818897249994166, "loss": 0.011, "step": 364720 }, { "epoch": 0.95, "learning_rate": 0.0001581850842835702, "loss": 0.0152, "step": 364730 }, { "epoch": 0.95, "learning_rate": 0.00015818119606719874, "loss": 0.0102, "step": 364740 }, { "epoch": 0.95, "learning_rate": 0.00015817730785082726, "loss": 0.0143, "step": 364750 }, { "epoch": 0.95, "learning_rate": 0.0001581734196344558, "loss": 0.0115, "step": 364760 }, { "epoch": 0.95, "learning_rate": 0.00015816953141808434, "loss": 0.0142, "step": 364770 }, { "epoch": 0.95, "learning_rate": 0.00015816564320171288, "loss": 0.0155, "step": 364780 }, { "epoch": 0.95, "learning_rate": 0.0001581617549853414, "loss": 0.0096, "step": 364790 }, { "epoch": 0.95, "learning_rate": 0.00015815786676896994, "loss": 0.0182, "step": 364800 }, { "epoch": 0.95, "learning_rate": 0.0001581539785525985, "loss": 0.0151, "step": 364810 }, { "epoch": 0.95, "learning_rate": 0.00015815009033622702, "loss": 0.0138, "step": 364820 }, { "epoch": 0.95, "learning_rate": 0.00015814620211985553, "loss": 0.011, "step": 364830 }, { "epoch": 0.95, "learning_rate": 0.00015814231390348408, "loss": 0.0131, "step": 364840 }, { "epoch": 0.95, "learning_rate": 0.00015813842568711264, "loss": 0.0166, "step": 364850 }, { "epoch": 0.95, "learning_rate": 0.00015813453747074116, "loss": 0.0128, "step": 364860 }, { "epoch": 0.95, "learning_rate": 0.0001581306492543697, "loss": 0.0161, "step": 364870 }, { "epoch": 0.95, "learning_rate": 0.00015812676103799822, "loss": 0.0142, "step": 364880 }, { "epoch": 0.95, "learning_rate": 0.00015812287282162678, "loss": 0.0135, "step": 364890 }, { "epoch": 0.95, "learning_rate": 0.0001581189846052553, "loss": 0.0122, "step": 364900 }, { "epoch": 0.95, "learning_rate": 0.00015811509638888384, "loss": 0.0134, "step": 364910 }, { "epoch": 0.95, "learning_rate": 0.00015811120817251235, "loss": 0.0122, "step": 364920 }, { "epoch": 0.95, "learning_rate": 0.00015810731995614092, "loss": 0.0122, "step": 364930 }, { "epoch": 0.95, "learning_rate": 0.00015810343173976944, "loss": 0.0146, "step": 364940 }, { "epoch": 0.95, "learning_rate": 0.00015809954352339798, "loss": 0.0108, "step": 364950 }, { "epoch": 0.95, "learning_rate": 0.0001580956553070265, "loss": 0.0119, "step": 364960 }, { "epoch": 0.95, "learning_rate": 0.00015809176709065504, "loss": 0.0125, "step": 364970 }, { "epoch": 0.95, "learning_rate": 0.0001580878788742836, "loss": 0.0171, "step": 364980 }, { "epoch": 0.95, "learning_rate": 0.00015808399065791212, "loss": 0.0142, "step": 364990 }, { "epoch": 0.95, "learning_rate": 0.00015808010244154063, "loss": 0.0161, "step": 365000 }, { "epoch": 0.95, "eval_cer": 0.8817390768834564, "eval_loss": 0.00836771447211504, "eval_runtime": 107.6249, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 365000 }, { "epoch": 0.95, "learning_rate": 0.00015807621422516918, "loss": 0.0127, "step": 365010 }, { "epoch": 0.95, "learning_rate": 0.00015807232600879774, "loss": 0.0161, "step": 365020 }, { "epoch": 0.95, "learning_rate": 0.00015806843779242626, "loss": 0.0155, "step": 365030 }, { "epoch": 0.95, "learning_rate": 0.0001580645495760548, "loss": 0.0113, "step": 365040 }, { "epoch": 0.95, "learning_rate": 0.00015806066135968331, "loss": 0.0109, "step": 365050 }, { "epoch": 0.95, "learning_rate": 0.00015805677314331188, "loss": 0.0157, "step": 365060 }, { "epoch": 0.95, "learning_rate": 0.0001580528849269404, "loss": 0.0126, "step": 365070 }, { "epoch": 0.95, "learning_rate": 0.00015804899671056894, "loss": 0.0158, "step": 365080 }, { "epoch": 0.95, "learning_rate": 0.00015804510849419745, "loss": 0.0119, "step": 365090 }, { "epoch": 0.95, "learning_rate": 0.00015804122027782602, "loss": 0.0125, "step": 365100 }, { "epoch": 0.95, "learning_rate": 0.00015803733206145454, "loss": 0.0133, "step": 365110 }, { "epoch": 0.95, "learning_rate": 0.00015803344384508308, "loss": 0.0173, "step": 365120 }, { "epoch": 0.95, "learning_rate": 0.0001580295556287116, "loss": 0.0111, "step": 365130 }, { "epoch": 0.95, "learning_rate": 0.00015802566741234016, "loss": 0.0141, "step": 365140 }, { "epoch": 0.95, "learning_rate": 0.00015802177919596868, "loss": 0.0127, "step": 365150 }, { "epoch": 0.95, "learning_rate": 0.00015801789097959722, "loss": 0.0134, "step": 365160 }, { "epoch": 0.95, "learning_rate": 0.00015801400276322573, "loss": 0.014, "step": 365170 }, { "epoch": 0.95, "learning_rate": 0.0001580101145468543, "loss": 0.0137, "step": 365180 }, { "epoch": 0.95, "learning_rate": 0.00015800622633048284, "loss": 0.0131, "step": 365190 }, { "epoch": 0.95, "learning_rate": 0.00015800233811411136, "loss": 0.013, "step": 365200 }, { "epoch": 0.95, "learning_rate": 0.0001579984498977399, "loss": 0.0183, "step": 365210 }, { "epoch": 0.95, "learning_rate": 0.00015799456168136841, "loss": 0.0131, "step": 365220 }, { "epoch": 0.95, "learning_rate": 0.00015799067346499698, "loss": 0.0136, "step": 365230 }, { "epoch": 0.95, "learning_rate": 0.0001579867852486255, "loss": 0.0105, "step": 365240 }, { "epoch": 0.95, "learning_rate": 0.00015798289703225404, "loss": 0.0113, "step": 365250 }, { "epoch": 0.95, "learning_rate": 0.00015797900881588255, "loss": 0.0132, "step": 365260 }, { "epoch": 0.95, "learning_rate": 0.00015797512059951112, "loss": 0.0137, "step": 365270 }, { "epoch": 0.95, "learning_rate": 0.00015797123238313964, "loss": 0.0128, "step": 365280 }, { "epoch": 0.95, "learning_rate": 0.00015796734416676818, "loss": 0.0167, "step": 365290 }, { "epoch": 0.95, "learning_rate": 0.0001579634559503967, "loss": 0.0105, "step": 365300 }, { "epoch": 0.95, "learning_rate": 0.00015795956773402526, "loss": 0.0169, "step": 365310 }, { "epoch": 0.95, "learning_rate": 0.00015795567951765378, "loss": 0.0115, "step": 365320 }, { "epoch": 0.95, "learning_rate": 0.00015795179130128232, "loss": 0.0142, "step": 365330 }, { "epoch": 0.95, "learning_rate": 0.00015794790308491083, "loss": 0.0102, "step": 365340 }, { "epoch": 0.95, "learning_rate": 0.0001579440148685394, "loss": 0.014, "step": 365350 }, { "epoch": 0.95, "learning_rate": 0.00015794012665216794, "loss": 0.0111, "step": 365360 }, { "epoch": 0.95, "learning_rate": 0.00015793623843579646, "loss": 0.0121, "step": 365370 }, { "epoch": 0.95, "learning_rate": 0.000157932350219425, "loss": 0.0131, "step": 365380 }, { "epoch": 0.95, "learning_rate": 0.00015792846200305354, "loss": 0.0132, "step": 365390 }, { "epoch": 0.95, "learning_rate": 0.00015792457378668208, "loss": 0.0149, "step": 365400 }, { "epoch": 0.95, "learning_rate": 0.0001579206855703106, "loss": 0.0112, "step": 365410 }, { "epoch": 0.95, "learning_rate": 0.00015791679735393914, "loss": 0.01, "step": 365420 }, { "epoch": 0.95, "learning_rate": 0.00015791290913756768, "loss": 0.0138, "step": 365430 }, { "epoch": 0.95, "learning_rate": 0.00015790902092119622, "loss": 0.0119, "step": 365440 }, { "epoch": 0.95, "learning_rate": 0.00015790513270482474, "loss": 0.0145, "step": 365450 }, { "epoch": 0.95, "learning_rate": 0.00015790124448845328, "loss": 0.0131, "step": 365460 }, { "epoch": 0.95, "learning_rate": 0.0001578973562720818, "loss": 0.0139, "step": 365470 }, { "epoch": 0.95, "learning_rate": 0.00015789346805571036, "loss": 0.0166, "step": 365480 }, { "epoch": 0.95, "learning_rate": 0.00015788957983933888, "loss": 0.0136, "step": 365490 }, { "epoch": 0.95, "learning_rate": 0.00015788569162296742, "loss": 0.0165, "step": 365500 }, { "epoch": 0.95, "learning_rate": 0.00015788180340659593, "loss": 0.01, "step": 365510 }, { "epoch": 0.95, "learning_rate": 0.0001578779151902245, "loss": 0.016, "step": 365520 }, { "epoch": 0.95, "learning_rate": 0.00015787402697385304, "loss": 0.0177, "step": 365530 }, { "epoch": 0.95, "learning_rate": 0.00015787013875748156, "loss": 0.0111, "step": 365540 }, { "epoch": 0.95, "learning_rate": 0.00015786625054111007, "loss": 0.0104, "step": 365550 }, { "epoch": 0.95, "learning_rate": 0.00015786236232473864, "loss": 0.0152, "step": 365560 }, { "epoch": 0.95, "learning_rate": 0.00015785847410836718, "loss": 0.0144, "step": 365570 }, { "epoch": 0.95, "learning_rate": 0.0001578545858919957, "loss": 0.0123, "step": 365580 }, { "epoch": 0.95, "learning_rate": 0.00015785069767562424, "loss": 0.0124, "step": 365590 }, { "epoch": 0.95, "learning_rate": 0.00015784680945925278, "loss": 0.0153, "step": 365600 }, { "epoch": 0.95, "learning_rate": 0.00015784292124288132, "loss": 0.0093, "step": 365610 }, { "epoch": 0.95, "learning_rate": 0.00015783903302650984, "loss": 0.0114, "step": 365620 }, { "epoch": 0.95, "learning_rate": 0.00015783514481013838, "loss": 0.0128, "step": 365630 }, { "epoch": 0.95, "learning_rate": 0.00015783125659376692, "loss": 0.0145, "step": 365640 }, { "epoch": 0.95, "learning_rate": 0.00015782736837739546, "loss": 0.0123, "step": 365650 }, { "epoch": 0.95, "learning_rate": 0.00015782348016102397, "loss": 0.011, "step": 365660 }, { "epoch": 0.95, "learning_rate": 0.00015781959194465252, "loss": 0.0114, "step": 365670 }, { "epoch": 0.95, "learning_rate": 0.00015781570372828109, "loss": 0.0123, "step": 365680 }, { "epoch": 0.95, "learning_rate": 0.0001578118155119096, "loss": 0.0111, "step": 365690 }, { "epoch": 0.95, "learning_rate": 0.00015780792729553814, "loss": 0.0125, "step": 365700 }, { "epoch": 0.95, "learning_rate": 0.00015780403907916666, "loss": 0.0148, "step": 365710 }, { "epoch": 0.95, "learning_rate": 0.00015780015086279517, "loss": 0.0125, "step": 365720 }, { "epoch": 0.95, "learning_rate": 0.00015779626264642374, "loss": 0.0103, "step": 365730 }, { "epoch": 0.95, "learning_rate": 0.00015779237443005228, "loss": 0.0139, "step": 365740 }, { "epoch": 0.95, "learning_rate": 0.0001577884862136808, "loss": 0.0128, "step": 365750 }, { "epoch": 0.95, "learning_rate": 0.00015778459799730934, "loss": 0.0125, "step": 365760 }, { "epoch": 0.95, "learning_rate": 0.00015778070978093788, "loss": 0.0134, "step": 365770 }, { "epoch": 0.95, "learning_rate": 0.00015777682156456642, "loss": 0.013, "step": 365780 }, { "epoch": 0.95, "learning_rate": 0.00015777293334819493, "loss": 0.0161, "step": 365790 }, { "epoch": 0.95, "learning_rate": 0.00015776904513182348, "loss": 0.0126, "step": 365800 }, { "epoch": 0.95, "learning_rate": 0.00015776515691545202, "loss": 0.0132, "step": 365810 }, { "epoch": 0.95, "learning_rate": 0.00015776126869908056, "loss": 0.0151, "step": 365820 }, { "epoch": 0.95, "learning_rate": 0.00015775738048270907, "loss": 0.0133, "step": 365830 }, { "epoch": 0.95, "learning_rate": 0.00015775349226633762, "loss": 0.0109, "step": 365840 }, { "epoch": 0.95, "learning_rate": 0.00015774960404996618, "loss": 0.0122, "step": 365850 }, { "epoch": 0.95, "learning_rate": 0.0001577457158335947, "loss": 0.0146, "step": 365860 }, { "epoch": 0.95, "learning_rate": 0.00015774182761722321, "loss": 0.0159, "step": 365870 }, { "epoch": 0.95, "learning_rate": 0.00015773793940085176, "loss": 0.016, "step": 365880 }, { "epoch": 0.95, "learning_rate": 0.00015773405118448032, "loss": 0.0157, "step": 365890 }, { "epoch": 0.95, "learning_rate": 0.00015773016296810884, "loss": 0.0116, "step": 365900 }, { "epoch": 0.95, "learning_rate": 0.00015772627475173738, "loss": 0.0125, "step": 365910 }, { "epoch": 0.95, "learning_rate": 0.0001577223865353659, "loss": 0.0119, "step": 365920 }, { "epoch": 0.95, "learning_rate": 0.00015771849831899446, "loss": 0.0105, "step": 365930 }, { "epoch": 0.95, "learning_rate": 0.00015771461010262298, "loss": 0.0115, "step": 365940 }, { "epoch": 0.95, "learning_rate": 0.00015771072188625152, "loss": 0.0116, "step": 365950 }, { "epoch": 0.95, "learning_rate": 0.00015770683366988003, "loss": 0.0128, "step": 365960 }, { "epoch": 0.95, "learning_rate": 0.00015770294545350858, "loss": 0.0179, "step": 365970 }, { "epoch": 0.95, "learning_rate": 0.00015769905723713712, "loss": 0.0106, "step": 365980 }, { "epoch": 0.95, "learning_rate": 0.00015769516902076566, "loss": 0.0158, "step": 365990 }, { "epoch": 0.95, "learning_rate": 0.00015769128080439417, "loss": 0.0128, "step": 366000 }, { "epoch": 0.95, "eval_cer": 0.8817306790618513, "eval_loss": 0.008484454825520515, "eval_runtime": 107.5251, "eval_samples_per_second": 18.6, "eval_steps_per_second": 4.65, "step": 366000 }, { "epoch": 0.95, "learning_rate": 0.00015768739258802272, "loss": 0.0139, "step": 366010 }, { "epoch": 0.95, "learning_rate": 0.00015768350437165126, "loss": 0.0125, "step": 366020 }, { "epoch": 0.95, "learning_rate": 0.0001576796161552798, "loss": 0.011, "step": 366030 }, { "epoch": 0.95, "learning_rate": 0.0001576757279389083, "loss": 0.0134, "step": 366040 }, { "epoch": 0.95, "learning_rate": 0.00015767183972253685, "loss": 0.0152, "step": 366050 }, { "epoch": 0.95, "learning_rate": 0.00015766795150616542, "loss": 0.0149, "step": 366060 }, { "epoch": 0.95, "learning_rate": 0.00015766406328979394, "loss": 0.017, "step": 366070 }, { "epoch": 0.95, "learning_rate": 0.00015766017507342248, "loss": 0.0127, "step": 366080 }, { "epoch": 0.95, "learning_rate": 0.000157656286857051, "loss": 0.0116, "step": 366090 }, { "epoch": 0.95, "learning_rate": 0.00015765239864067956, "loss": 0.019, "step": 366100 }, { "epoch": 0.95, "learning_rate": 0.00015764851042430808, "loss": 0.0129, "step": 366110 }, { "epoch": 0.95, "learning_rate": 0.00015764462220793662, "loss": 0.01, "step": 366120 }, { "epoch": 0.95, "learning_rate": 0.00015764073399156513, "loss": 0.0132, "step": 366130 }, { "epoch": 0.95, "learning_rate": 0.0001576368457751937, "loss": 0.0142, "step": 366140 }, { "epoch": 0.95, "learning_rate": 0.00015763295755882222, "loss": 0.0114, "step": 366150 }, { "epoch": 0.95, "learning_rate": 0.00015762906934245076, "loss": 0.0135, "step": 366160 }, { "epoch": 0.95, "learning_rate": 0.00015762518112607927, "loss": 0.0112, "step": 366170 }, { "epoch": 0.95, "learning_rate": 0.00015762129290970784, "loss": 0.0103, "step": 366180 }, { "epoch": 0.95, "learning_rate": 0.00015761740469333636, "loss": 0.0116, "step": 366190 }, { "epoch": 0.95, "learning_rate": 0.0001576135164769649, "loss": 0.0112, "step": 366200 }, { "epoch": 0.95, "learning_rate": 0.0001576096282605934, "loss": 0.011, "step": 366210 }, { "epoch": 0.95, "learning_rate": 0.00015760574004422195, "loss": 0.0129, "step": 366220 }, { "epoch": 0.95, "learning_rate": 0.00015760185182785052, "loss": 0.014, "step": 366230 }, { "epoch": 0.95, "learning_rate": 0.00015759796361147904, "loss": 0.0135, "step": 366240 }, { "epoch": 0.95, "learning_rate": 0.00015759407539510758, "loss": 0.0151, "step": 366250 }, { "epoch": 0.95, "learning_rate": 0.0001575901871787361, "loss": 0.0119, "step": 366260 }, { "epoch": 0.95, "learning_rate": 0.00015758629896236466, "loss": 0.0202, "step": 366270 }, { "epoch": 0.95, "learning_rate": 0.00015758241074599318, "loss": 0.0128, "step": 366280 }, { "epoch": 0.95, "learning_rate": 0.00015757852252962172, "loss": 0.0131, "step": 366290 }, { "epoch": 0.95, "learning_rate": 0.00015757463431325023, "loss": 0.0136, "step": 366300 }, { "epoch": 0.95, "learning_rate": 0.0001575707460968788, "loss": 0.0124, "step": 366310 }, { "epoch": 0.95, "learning_rate": 0.00015756685788050732, "loss": 0.0111, "step": 366320 }, { "epoch": 0.95, "learning_rate": 0.00015756296966413586, "loss": 0.0154, "step": 366330 }, { "epoch": 0.95, "learning_rate": 0.00015755908144776437, "loss": 0.0136, "step": 366340 }, { "epoch": 0.95, "learning_rate": 0.00015755519323139294, "loss": 0.0142, "step": 366350 }, { "epoch": 0.95, "learning_rate": 0.00015755130501502146, "loss": 0.0153, "step": 366360 }, { "epoch": 0.95, "learning_rate": 0.00015754741679865, "loss": 0.0134, "step": 366370 }, { "epoch": 0.95, "learning_rate": 0.0001575435285822785, "loss": 0.013, "step": 366380 }, { "epoch": 0.95, "learning_rate": 0.00015753964036590708, "loss": 0.0105, "step": 366390 }, { "epoch": 0.95, "learning_rate": 0.00015753575214953562, "loss": 0.0109, "step": 366400 }, { "epoch": 0.95, "learning_rate": 0.00015753186393316414, "loss": 0.0125, "step": 366410 }, { "epoch": 0.95, "learning_rate": 0.00015752797571679265, "loss": 0.0101, "step": 366420 }, { "epoch": 0.95, "learning_rate": 0.00015752408750042122, "loss": 0.0145, "step": 366430 }, { "epoch": 0.95, "learning_rate": 0.00015752019928404976, "loss": 0.0132, "step": 366440 }, { "epoch": 0.95, "learning_rate": 0.00015751631106767828, "loss": 0.0136, "step": 366450 }, { "epoch": 0.95, "learning_rate": 0.00015751242285130682, "loss": 0.0129, "step": 366460 }, { "epoch": 0.95, "learning_rate": 0.00015750853463493533, "loss": 0.0144, "step": 366470 }, { "epoch": 0.95, "learning_rate": 0.0001575046464185639, "loss": 0.0127, "step": 366480 }, { "epoch": 0.95, "learning_rate": 0.00015750075820219242, "loss": 0.0125, "step": 366490 }, { "epoch": 0.95, "learning_rate": 0.00015749686998582096, "loss": 0.0094, "step": 366500 }, { "epoch": 0.95, "learning_rate": 0.00015749298176944947, "loss": 0.0148, "step": 366510 }, { "epoch": 0.95, "learning_rate": 0.00015748909355307804, "loss": 0.0128, "step": 366520 }, { "epoch": 0.95, "learning_rate": 0.00015748520533670656, "loss": 0.014, "step": 366530 }, { "epoch": 0.95, "learning_rate": 0.0001574813171203351, "loss": 0.0129, "step": 366540 }, { "epoch": 0.95, "learning_rate": 0.0001574774289039636, "loss": 0.0174, "step": 366550 }, { "epoch": 0.95, "learning_rate": 0.00015747354068759218, "loss": 0.0118, "step": 366560 }, { "epoch": 0.95, "learning_rate": 0.00015746965247122072, "loss": 0.0158, "step": 366570 }, { "epoch": 0.95, "learning_rate": 0.00015746576425484924, "loss": 0.0168, "step": 366580 }, { "epoch": 0.95, "learning_rate": 0.00015746187603847775, "loss": 0.011, "step": 366590 }, { "epoch": 0.95, "learning_rate": 0.00015745798782210632, "loss": 0.0124, "step": 366600 }, { "epoch": 0.95, "learning_rate": 0.00015745409960573486, "loss": 0.0135, "step": 366610 }, { "epoch": 0.95, "learning_rate": 0.00015745021138936338, "loss": 0.0133, "step": 366620 }, { "epoch": 0.95, "learning_rate": 0.00015744632317299192, "loss": 0.0131, "step": 366630 }, { "epoch": 0.95, "learning_rate": 0.00015744243495662046, "loss": 0.0125, "step": 366640 }, { "epoch": 0.95, "learning_rate": 0.000157438546740249, "loss": 0.012, "step": 366650 }, { "epoch": 0.95, "learning_rate": 0.00015743465852387752, "loss": 0.0133, "step": 366660 }, { "epoch": 0.95, "learning_rate": 0.00015743077030750606, "loss": 0.0106, "step": 366670 }, { "epoch": 0.95, "learning_rate": 0.0001574268820911346, "loss": 0.0126, "step": 366680 }, { "epoch": 0.95, "learning_rate": 0.00015742299387476314, "loss": 0.0142, "step": 366690 }, { "epoch": 0.95, "learning_rate": 0.00015741910565839165, "loss": 0.0125, "step": 366700 }, { "epoch": 0.95, "learning_rate": 0.0001574152174420202, "loss": 0.0118, "step": 366710 }, { "epoch": 0.95, "learning_rate": 0.0001574113292256487, "loss": 0.0141, "step": 366720 }, { "epoch": 0.95, "learning_rate": 0.00015740744100927728, "loss": 0.016, "step": 366730 }, { "epoch": 0.95, "learning_rate": 0.0001574035527929058, "loss": 0.0133, "step": 366740 }, { "epoch": 0.95, "learning_rate": 0.00015739966457653434, "loss": 0.0115, "step": 366750 }, { "epoch": 0.95, "learning_rate": 0.00015739577636016285, "loss": 0.0119, "step": 366760 }, { "epoch": 0.95, "learning_rate": 0.00015739188814379142, "loss": 0.0122, "step": 366770 }, { "epoch": 0.95, "learning_rate": 0.00015738799992741996, "loss": 0.011, "step": 366780 }, { "epoch": 0.95, "learning_rate": 0.00015738411171104848, "loss": 0.0119, "step": 366790 }, { "epoch": 0.95, "learning_rate": 0.00015738022349467702, "loss": 0.0129, "step": 366800 }, { "epoch": 0.95, "learning_rate": 0.00015737633527830556, "loss": 0.0121, "step": 366810 }, { "epoch": 0.95, "learning_rate": 0.0001573724470619341, "loss": 0.0124, "step": 366820 }, { "epoch": 0.95, "learning_rate": 0.00015736855884556261, "loss": 0.0108, "step": 366830 }, { "epoch": 0.95, "learning_rate": 0.00015736467062919116, "loss": 0.0199, "step": 366840 }, { "epoch": 0.95, "learning_rate": 0.0001573607824128197, "loss": 0.0222, "step": 366850 }, { "epoch": 0.95, "learning_rate": 0.00015735689419644824, "loss": 0.0108, "step": 366860 }, { "epoch": 0.95, "learning_rate": 0.00015735300598007675, "loss": 0.0178, "step": 366870 }, { "epoch": 0.95, "learning_rate": 0.0001573491177637053, "loss": 0.011, "step": 366880 }, { "epoch": 0.95, "learning_rate": 0.00015734522954733384, "loss": 0.0134, "step": 366890 }, { "epoch": 0.95, "learning_rate": 0.00015734134133096238, "loss": 0.0227, "step": 366900 }, { "epoch": 0.95, "learning_rate": 0.0001573374531145909, "loss": 0.0129, "step": 366910 }, { "epoch": 0.95, "learning_rate": 0.00015733356489821944, "loss": 0.012, "step": 366920 }, { "epoch": 0.95, "learning_rate": 0.000157329676681848, "loss": 0.0125, "step": 366930 }, { "epoch": 0.95, "learning_rate": 0.00015732578846547652, "loss": 0.0112, "step": 366940 }, { "epoch": 0.95, "learning_rate": 0.00015732190024910506, "loss": 0.0134, "step": 366950 }, { "epoch": 0.95, "learning_rate": 0.00015731801203273357, "loss": 0.0135, "step": 366960 }, { "epoch": 0.95, "learning_rate": 0.00015731412381636212, "loss": 0.013, "step": 366970 }, { "epoch": 0.95, "learning_rate": 0.00015731023559999066, "loss": 0.012, "step": 366980 }, { "epoch": 0.95, "learning_rate": 0.0001573063473836192, "loss": 0.0154, "step": 366990 }, { "epoch": 0.95, "learning_rate": 0.00015730245916724771, "loss": 0.0138, "step": 367000 }, { "epoch": 0.95, "eval_cer": 0.8817208816033121, "eval_loss": 0.008482192642986774, "eval_runtime": 107.6733, "eval_samples_per_second": 18.575, "eval_steps_per_second": 4.644, "step": 367000 }, { "epoch": 0.95, "learning_rate": 0.00015729857095087626, "loss": 0.0093, "step": 367010 }, { "epoch": 0.95, "learning_rate": 0.0001572946827345048, "loss": 0.012, "step": 367020 }, { "epoch": 0.95, "learning_rate": 0.00015729079451813334, "loss": 0.0121, "step": 367030 }, { "epoch": 0.95, "learning_rate": 0.00015728690630176185, "loss": 0.0134, "step": 367040 }, { "epoch": 0.95, "learning_rate": 0.0001572830180853904, "loss": 0.0134, "step": 367050 }, { "epoch": 0.95, "learning_rate": 0.00015727912986901894, "loss": 0.0115, "step": 367060 }, { "epoch": 0.95, "learning_rate": 0.00015727524165264748, "loss": 0.0131, "step": 367070 }, { "epoch": 0.95, "learning_rate": 0.000157271353436276, "loss": 0.0137, "step": 367080 }, { "epoch": 0.95, "learning_rate": 0.00015726746521990453, "loss": 0.0131, "step": 367090 }, { "epoch": 0.95, "learning_rate": 0.0001572635770035331, "loss": 0.0096, "step": 367100 }, { "epoch": 0.95, "learning_rate": 0.00015725968878716162, "loss": 0.0143, "step": 367110 }, { "epoch": 0.95, "learning_rate": 0.00015725580057079016, "loss": 0.017, "step": 367120 }, { "epoch": 0.95, "learning_rate": 0.00015725191235441867, "loss": 0.0112, "step": 367130 }, { "epoch": 0.95, "learning_rate": 0.00015724802413804724, "loss": 0.0099, "step": 367140 }, { "epoch": 0.95, "learning_rate": 0.00015724413592167576, "loss": 0.0125, "step": 367150 }, { "epoch": 0.95, "learning_rate": 0.0001572402477053043, "loss": 0.0136, "step": 367160 }, { "epoch": 0.95, "learning_rate": 0.0001572363594889328, "loss": 0.0151, "step": 367170 }, { "epoch": 0.95, "learning_rate": 0.00015723247127256138, "loss": 0.0136, "step": 367180 }, { "epoch": 0.95, "learning_rate": 0.0001572285830561899, "loss": 0.0114, "step": 367190 }, { "epoch": 0.95, "learning_rate": 0.00015722469483981844, "loss": 0.0123, "step": 367200 }, { "epoch": 0.95, "learning_rate": 0.00015722080662344695, "loss": 0.0154, "step": 367210 }, { "epoch": 0.95, "learning_rate": 0.0001572169184070755, "loss": 0.013, "step": 367220 }, { "epoch": 0.95, "learning_rate": 0.00015721303019070404, "loss": 0.011, "step": 367230 }, { "epoch": 0.95, "learning_rate": 0.00015720914197433258, "loss": 0.0125, "step": 367240 }, { "epoch": 0.95, "learning_rate": 0.0001572052537579611, "loss": 0.013, "step": 367250 }, { "epoch": 0.95, "learning_rate": 0.00015720136554158963, "loss": 0.0112, "step": 367260 }, { "epoch": 0.95, "learning_rate": 0.0001571974773252182, "loss": 0.0085, "step": 367270 }, { "epoch": 0.95, "learning_rate": 0.00015719358910884672, "loss": 0.0173, "step": 367280 }, { "epoch": 0.95, "learning_rate": 0.00015718970089247526, "loss": 0.009, "step": 367290 }, { "epoch": 0.95, "learning_rate": 0.00015718581267610377, "loss": 0.014, "step": 367300 }, { "epoch": 0.95, "learning_rate": 0.00015718192445973234, "loss": 0.0123, "step": 367310 }, { "epoch": 0.95, "learning_rate": 0.00015717803624336086, "loss": 0.0125, "step": 367320 }, { "epoch": 0.95, "learning_rate": 0.0001571741480269894, "loss": 0.0147, "step": 367330 }, { "epoch": 0.95, "learning_rate": 0.0001571702598106179, "loss": 0.0163, "step": 367340 }, { "epoch": 0.95, "learning_rate": 0.00015716637159424648, "loss": 0.0136, "step": 367350 }, { "epoch": 0.95, "learning_rate": 0.000157162483377875, "loss": 0.0101, "step": 367360 }, { "epoch": 0.95, "learning_rate": 0.00015715859516150354, "loss": 0.0123, "step": 367370 }, { "epoch": 0.95, "learning_rate": 0.00015715470694513205, "loss": 0.0134, "step": 367380 }, { "epoch": 0.95, "learning_rate": 0.00015715081872876062, "loss": 0.0124, "step": 367390 }, { "epoch": 0.95, "learning_rate": 0.00015714693051238914, "loss": 0.013, "step": 367400 }, { "epoch": 0.95, "learning_rate": 0.00015714304229601768, "loss": 0.0145, "step": 367410 }, { "epoch": 0.95, "learning_rate": 0.0001571391540796462, "loss": 0.0131, "step": 367420 }, { "epoch": 0.95, "learning_rate": 0.00015713526586327476, "loss": 0.0172, "step": 367430 }, { "epoch": 0.95, "learning_rate": 0.0001571313776469033, "loss": 0.0144, "step": 367440 }, { "epoch": 0.95, "learning_rate": 0.00015712748943053182, "loss": 0.0124, "step": 367450 }, { "epoch": 0.95, "learning_rate": 0.00015712360121416033, "loss": 0.0143, "step": 367460 }, { "epoch": 0.95, "learning_rate": 0.00015711971299778887, "loss": 0.0163, "step": 367470 }, { "epoch": 0.95, "learning_rate": 0.00015711582478141744, "loss": 0.0144, "step": 367480 }, { "epoch": 0.95, "learning_rate": 0.00015711193656504596, "loss": 0.0106, "step": 367490 }, { "epoch": 0.95, "learning_rate": 0.0001571080483486745, "loss": 0.0113, "step": 367500 }, { "epoch": 0.95, "learning_rate": 0.000157104160132303, "loss": 0.0105, "step": 367510 }, { "epoch": 0.95, "learning_rate": 0.00015710027191593158, "loss": 0.0121, "step": 367520 }, { "epoch": 0.95, "learning_rate": 0.0001570963836995601, "loss": 0.0117, "step": 367530 }, { "epoch": 0.95, "learning_rate": 0.00015709249548318864, "loss": 0.0142, "step": 367540 }, { "epoch": 0.95, "learning_rate": 0.00015708860726681715, "loss": 0.0126, "step": 367550 }, { "epoch": 0.95, "learning_rate": 0.00015708471905044572, "loss": 0.011, "step": 367560 }, { "epoch": 0.95, "learning_rate": 0.00015708083083407424, "loss": 0.012, "step": 367570 }, { "epoch": 0.95, "learning_rate": 0.00015707694261770278, "loss": 0.0122, "step": 367580 }, { "epoch": 0.95, "learning_rate": 0.0001570730544013313, "loss": 0.0106, "step": 367590 }, { "epoch": 0.95, "learning_rate": 0.00015706916618495986, "loss": 0.0146, "step": 367600 }, { "epoch": 0.95, "learning_rate": 0.00015706527796858837, "loss": 0.0173, "step": 367610 }, { "epoch": 0.95, "learning_rate": 0.00015706138975221692, "loss": 0.013, "step": 367620 }, { "epoch": 0.95, "learning_rate": 0.00015705750153584543, "loss": 0.0131, "step": 367630 }, { "epoch": 0.95, "learning_rate": 0.000157053613319474, "loss": 0.013, "step": 367640 }, { "epoch": 0.95, "learning_rate": 0.00015704972510310254, "loss": 0.0131, "step": 367650 }, { "epoch": 0.95, "learning_rate": 0.00015704583688673106, "loss": 0.0126, "step": 367660 }, { "epoch": 0.95, "learning_rate": 0.0001570419486703596, "loss": 0.0123, "step": 367670 }, { "epoch": 0.95, "learning_rate": 0.00015703806045398814, "loss": 0.0141, "step": 367680 }, { "epoch": 0.95, "learning_rate": 0.00015703417223761668, "loss": 0.0133, "step": 367690 }, { "epoch": 0.95, "learning_rate": 0.0001570302840212452, "loss": 0.015, "step": 367700 }, { "epoch": 0.95, "learning_rate": 0.00015702639580487374, "loss": 0.0155, "step": 367710 }, { "epoch": 0.95, "learning_rate": 0.00015702250758850225, "loss": 0.0132, "step": 367720 }, { "epoch": 0.95, "learning_rate": 0.00015701861937213082, "loss": 0.0108, "step": 367730 }, { "epoch": 0.95, "learning_rate": 0.00015701473115575933, "loss": 0.0116, "step": 367740 }, { "epoch": 0.95, "learning_rate": 0.00015701084293938788, "loss": 0.0166, "step": 367750 }, { "epoch": 0.95, "learning_rate": 0.0001570069547230164, "loss": 0.0116, "step": 367760 }, { "epoch": 0.95, "learning_rate": 0.00015700306650664496, "loss": 0.0138, "step": 367770 }, { "epoch": 0.95, "learning_rate": 0.00015699917829027347, "loss": 0.0117, "step": 367780 }, { "epoch": 0.95, "learning_rate": 0.00015699529007390202, "loss": 0.012, "step": 367790 }, { "epoch": 0.95, "learning_rate": 0.00015699140185753053, "loss": 0.011, "step": 367800 }, { "epoch": 0.95, "learning_rate": 0.0001569875136411591, "loss": 0.0166, "step": 367810 }, { "epoch": 0.95, "learning_rate": 0.00015698362542478764, "loss": 0.0114, "step": 367820 }, { "epoch": 0.95, "learning_rate": 0.00015697973720841616, "loss": 0.0138, "step": 367830 }, { "epoch": 0.95, "learning_rate": 0.0001569758489920447, "loss": 0.013, "step": 367840 }, { "epoch": 0.95, "learning_rate": 0.00015697196077567324, "loss": 0.018, "step": 367850 }, { "epoch": 0.95, "learning_rate": 0.00015696807255930178, "loss": 0.0122, "step": 367860 }, { "epoch": 0.95, "learning_rate": 0.0001569641843429303, "loss": 0.0115, "step": 367870 }, { "epoch": 0.95, "learning_rate": 0.00015696029612655884, "loss": 0.0108, "step": 367880 }, { "epoch": 0.95, "learning_rate": 0.00015695640791018738, "loss": 0.0157, "step": 367890 }, { "epoch": 0.95, "learning_rate": 0.00015695251969381592, "loss": 0.0152, "step": 367900 }, { "epoch": 0.95, "learning_rate": 0.00015694863147744443, "loss": 0.0105, "step": 367910 }, { "epoch": 0.95, "learning_rate": 0.00015694474326107298, "loss": 0.009, "step": 367920 }, { "epoch": 0.95, "learning_rate": 0.00015694085504470152, "loss": 0.0132, "step": 367930 }, { "epoch": 0.95, "learning_rate": 0.00015693696682833006, "loss": 0.0121, "step": 367940 }, { "epoch": 0.95, "learning_rate": 0.00015693307861195857, "loss": 0.013, "step": 367950 }, { "epoch": 0.95, "learning_rate": 0.00015692919039558712, "loss": 0.0131, "step": 367960 }, { "epoch": 0.95, "learning_rate": 0.00015692530217921563, "loss": 0.013, "step": 367970 }, { "epoch": 0.95, "learning_rate": 0.0001569214139628442, "loss": 0.0135, "step": 367980 }, { "epoch": 0.95, "learning_rate": 0.00015691752574647274, "loss": 0.0118, "step": 367990 }, { "epoch": 0.95, "learning_rate": 0.00015691363753010125, "loss": 0.0121, "step": 368000 }, { "epoch": 0.95, "eval_cer": 0.8817138834186412, "eval_loss": 0.008444735780358315, "eval_runtime": 107.6844, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 368000 }, { "epoch": 0.95, "learning_rate": 0.00015690974931372977, "loss": 0.0152, "step": 368010 }, { "epoch": 0.95, "learning_rate": 0.00015690586109735834, "loss": 0.011, "step": 368020 }, { "epoch": 0.95, "learning_rate": 0.00015690197288098688, "loss": 0.0137, "step": 368030 }, { "epoch": 0.95, "learning_rate": 0.0001568980846646154, "loss": 0.0153, "step": 368040 }, { "epoch": 0.95, "learning_rate": 0.00015689419644824394, "loss": 0.0169, "step": 368050 }, { "epoch": 0.95, "learning_rate": 0.00015689030823187248, "loss": 0.0136, "step": 368060 }, { "epoch": 0.95, "learning_rate": 0.00015688642001550102, "loss": 0.0134, "step": 368070 }, { "epoch": 0.95, "learning_rate": 0.00015688253179912953, "loss": 0.0142, "step": 368080 }, { "epoch": 0.95, "learning_rate": 0.00015687864358275807, "loss": 0.017, "step": 368090 }, { "epoch": 0.95, "learning_rate": 0.00015687475536638662, "loss": 0.0106, "step": 368100 }, { "epoch": 0.95, "learning_rate": 0.00015687086715001516, "loss": 0.0112, "step": 368110 }, { "epoch": 0.95, "learning_rate": 0.00015686697893364367, "loss": 0.0127, "step": 368120 }, { "epoch": 0.95, "learning_rate": 0.00015686309071727221, "loss": 0.014, "step": 368130 }, { "epoch": 0.95, "learning_rate": 0.00015685920250090078, "loss": 0.016, "step": 368140 }, { "epoch": 0.95, "learning_rate": 0.0001568553142845293, "loss": 0.0114, "step": 368150 }, { "epoch": 0.95, "learning_rate": 0.00015685142606815784, "loss": 0.0104, "step": 368160 }, { "epoch": 0.95, "learning_rate": 0.00015684753785178635, "loss": 0.0134, "step": 368170 }, { "epoch": 0.95, "learning_rate": 0.00015684364963541492, "loss": 0.0114, "step": 368180 }, { "epoch": 0.95, "learning_rate": 0.00015683976141904344, "loss": 0.0121, "step": 368190 }, { "epoch": 0.95, "learning_rate": 0.00015683587320267198, "loss": 0.0184, "step": 368200 }, { "epoch": 0.95, "learning_rate": 0.0001568319849863005, "loss": 0.0149, "step": 368210 }, { "epoch": 0.95, "learning_rate": 0.00015682809676992903, "loss": 0.0108, "step": 368220 }, { "epoch": 0.95, "learning_rate": 0.00015682420855355758, "loss": 0.01, "step": 368230 }, { "epoch": 0.95, "learning_rate": 0.00015682032033718612, "loss": 0.0112, "step": 368240 }, { "epoch": 0.95, "learning_rate": 0.00015681643212081463, "loss": 0.0127, "step": 368250 }, { "epoch": 0.95, "learning_rate": 0.00015681254390444317, "loss": 0.0112, "step": 368260 }, { "epoch": 0.95, "learning_rate": 0.00015680865568807172, "loss": 0.0113, "step": 368270 }, { "epoch": 0.95, "learning_rate": 0.00015680476747170026, "loss": 0.0116, "step": 368280 }, { "epoch": 0.95, "learning_rate": 0.00015680087925532877, "loss": 0.0133, "step": 368290 }, { "epoch": 0.95, "learning_rate": 0.00015679699103895731, "loss": 0.0142, "step": 368300 }, { "epoch": 0.95, "learning_rate": 0.00015679310282258588, "loss": 0.0137, "step": 368310 }, { "epoch": 0.95, "learning_rate": 0.0001567892146062144, "loss": 0.0129, "step": 368320 }, { "epoch": 0.95, "learning_rate": 0.0001567853263898429, "loss": 0.0109, "step": 368330 }, { "epoch": 0.95, "learning_rate": 0.00015678143817347145, "loss": 0.0151, "step": 368340 }, { "epoch": 0.95, "learning_rate": 0.00015677754995710002, "loss": 0.0118, "step": 368350 }, { "epoch": 0.95, "learning_rate": 0.00015677366174072854, "loss": 0.0125, "step": 368360 }, { "epoch": 0.95, "learning_rate": 0.00015676977352435708, "loss": 0.0179, "step": 368370 }, { "epoch": 0.95, "learning_rate": 0.0001567658853079856, "loss": 0.0137, "step": 368380 }, { "epoch": 0.95, "learning_rate": 0.00015676199709161416, "loss": 0.0139, "step": 368390 }, { "epoch": 0.95, "learning_rate": 0.00015675810887524268, "loss": 0.0139, "step": 368400 }, { "epoch": 0.95, "learning_rate": 0.00015675422065887122, "loss": 0.0119, "step": 368410 }, { "epoch": 0.95, "learning_rate": 0.00015675033244249973, "loss": 0.0145, "step": 368420 }, { "epoch": 0.96, "learning_rate": 0.0001567464442261283, "loss": 0.0121, "step": 368430 }, { "epoch": 0.96, "learning_rate": 0.00015674255600975682, "loss": 0.0121, "step": 368440 }, { "epoch": 0.96, "learning_rate": 0.00015673866779338536, "loss": 0.0116, "step": 368450 }, { "epoch": 0.96, "learning_rate": 0.00015673477957701387, "loss": 0.0111, "step": 368460 }, { "epoch": 0.96, "learning_rate": 0.0001567308913606424, "loss": 0.0148, "step": 368470 }, { "epoch": 0.96, "learning_rate": 0.00015672700314427095, "loss": 0.0102, "step": 368480 }, { "epoch": 0.96, "learning_rate": 0.0001567231149278995, "loss": 0.012, "step": 368490 }, { "epoch": 0.96, "learning_rate": 0.000156719226711528, "loss": 0.0133, "step": 368500 }, { "epoch": 0.96, "learning_rate": 0.00015671533849515655, "loss": 0.0098, "step": 368510 }, { "epoch": 0.96, "learning_rate": 0.00015671145027878512, "loss": 0.0144, "step": 368520 }, { "epoch": 0.96, "learning_rate": 0.00015670756206241364, "loss": 0.0192, "step": 368530 }, { "epoch": 0.96, "learning_rate": 0.00015670367384604218, "loss": 0.0124, "step": 368540 }, { "epoch": 0.96, "learning_rate": 0.0001566997856296707, "loss": 0.0115, "step": 368550 }, { "epoch": 0.96, "learning_rate": 0.00015669589741329926, "loss": 0.0131, "step": 368560 }, { "epoch": 0.96, "learning_rate": 0.00015669200919692778, "loss": 0.0135, "step": 368570 }, { "epoch": 0.96, "learning_rate": 0.00015668812098055632, "loss": 0.0136, "step": 368580 }, { "epoch": 0.96, "learning_rate": 0.00015668423276418483, "loss": 0.0131, "step": 368590 }, { "epoch": 0.96, "learning_rate": 0.0001566803445478134, "loss": 0.0147, "step": 368600 }, { "epoch": 0.96, "learning_rate": 0.00015667645633144191, "loss": 0.0126, "step": 368610 }, { "epoch": 0.96, "learning_rate": 0.00015667256811507046, "loss": 0.0145, "step": 368620 }, { "epoch": 0.96, "learning_rate": 0.00015666867989869897, "loss": 0.0136, "step": 368630 }, { "epoch": 0.96, "learning_rate": 0.00015666479168232754, "loss": 0.0144, "step": 368640 }, { "epoch": 0.96, "learning_rate": 0.00015666090346595605, "loss": 0.0126, "step": 368650 }, { "epoch": 0.96, "learning_rate": 0.0001566570152495846, "loss": 0.0132, "step": 368660 }, { "epoch": 0.96, "learning_rate": 0.0001566531270332131, "loss": 0.0153, "step": 368670 }, { "epoch": 0.96, "learning_rate": 0.00015664923881684168, "loss": 0.0128, "step": 368680 }, { "epoch": 0.96, "learning_rate": 0.00015664535060047022, "loss": 0.0126, "step": 368690 }, { "epoch": 0.96, "learning_rate": 0.00015664146238409874, "loss": 0.0157, "step": 368700 }, { "epoch": 0.96, "learning_rate": 0.00015663757416772728, "loss": 0.0208, "step": 368710 }, { "epoch": 0.96, "learning_rate": 0.0001566336859513558, "loss": 0.0129, "step": 368720 }, { "epoch": 0.96, "learning_rate": 0.00015662979773498436, "loss": 0.0136, "step": 368730 }, { "epoch": 0.96, "learning_rate": 0.00015662590951861287, "loss": 0.0147, "step": 368740 }, { "epoch": 0.96, "learning_rate": 0.00015662202130224142, "loss": 0.0129, "step": 368750 }, { "epoch": 0.96, "learning_rate": 0.00015661813308586993, "loss": 0.0131, "step": 368760 }, { "epoch": 0.96, "learning_rate": 0.0001566142448694985, "loss": 0.0126, "step": 368770 }, { "epoch": 0.96, "learning_rate": 0.00015661035665312701, "loss": 0.0162, "step": 368780 }, { "epoch": 0.96, "learning_rate": 0.00015660646843675556, "loss": 0.0142, "step": 368790 }, { "epoch": 0.96, "learning_rate": 0.00015660258022038407, "loss": 0.0139, "step": 368800 }, { "epoch": 0.96, "learning_rate": 0.00015659869200401264, "loss": 0.012, "step": 368810 }, { "epoch": 0.96, "learning_rate": 0.00015659480378764115, "loss": 0.0116, "step": 368820 }, { "epoch": 0.96, "learning_rate": 0.0001565909155712697, "loss": 0.0114, "step": 368830 }, { "epoch": 0.96, "learning_rate": 0.0001565870273548982, "loss": 0.0126, "step": 368840 }, { "epoch": 0.96, "learning_rate": 0.00015658313913852678, "loss": 0.0115, "step": 368850 }, { "epoch": 0.96, "learning_rate": 0.00015657925092215532, "loss": 0.0101, "step": 368860 }, { "epoch": 0.96, "learning_rate": 0.00015657536270578383, "loss": 0.0121, "step": 368870 }, { "epoch": 0.96, "learning_rate": 0.00015657147448941238, "loss": 0.0133, "step": 368880 }, { "epoch": 0.96, "learning_rate": 0.00015656758627304092, "loss": 0.0158, "step": 368890 }, { "epoch": 0.96, "learning_rate": 0.00015656369805666946, "loss": 0.0166, "step": 368900 }, { "epoch": 0.96, "learning_rate": 0.00015655980984029797, "loss": 0.0139, "step": 368910 }, { "epoch": 0.96, "learning_rate": 0.00015655592162392652, "loss": 0.0141, "step": 368920 }, { "epoch": 0.96, "learning_rate": 0.00015655203340755506, "loss": 0.0123, "step": 368930 }, { "epoch": 0.96, "learning_rate": 0.0001565481451911836, "loss": 0.0167, "step": 368940 }, { "epoch": 0.96, "learning_rate": 0.00015654425697481211, "loss": 0.0147, "step": 368950 }, { "epoch": 0.96, "learning_rate": 0.00015654036875844066, "loss": 0.009, "step": 368960 }, { "epoch": 0.96, "learning_rate": 0.00015653648054206917, "loss": 0.0138, "step": 368970 }, { "epoch": 0.96, "learning_rate": 0.00015653259232569774, "loss": 0.0155, "step": 368980 }, { "epoch": 0.96, "learning_rate": 0.00015652870410932625, "loss": 0.0165, "step": 368990 }, { "epoch": 0.96, "learning_rate": 0.0001565248158929548, "loss": 0.0112, "step": 369000 }, { "epoch": 0.96, "eval_cer": 0.8817586718005349, "eval_loss": 0.008379627019166946, "eval_runtime": 107.6158, "eval_samples_per_second": 18.585, "eval_steps_per_second": 4.646, "step": 369000 }, { "epoch": 0.96, "learning_rate": 0.0001565209276765833, "loss": 0.0113, "step": 369010 }, { "epoch": 0.96, "learning_rate": 0.00015651703946021188, "loss": 0.0141, "step": 369020 }, { "epoch": 0.96, "learning_rate": 0.00015651315124384042, "loss": 0.0177, "step": 369030 }, { "epoch": 0.96, "learning_rate": 0.00015650926302746893, "loss": 0.0142, "step": 369040 }, { "epoch": 0.96, "learning_rate": 0.00015650537481109745, "loss": 0.0106, "step": 369050 }, { "epoch": 0.96, "learning_rate": 0.00015650148659472602, "loss": 0.0175, "step": 369060 }, { "epoch": 0.96, "learning_rate": 0.00015649759837835456, "loss": 0.0104, "step": 369070 }, { "epoch": 0.96, "learning_rate": 0.00015649371016198307, "loss": 0.0124, "step": 369080 }, { "epoch": 0.96, "learning_rate": 0.00015648982194561162, "loss": 0.0149, "step": 369090 }, { "epoch": 0.96, "learning_rate": 0.00015648593372924016, "loss": 0.0161, "step": 369100 }, { "epoch": 0.96, "learning_rate": 0.0001564820455128687, "loss": 0.0134, "step": 369110 }, { "epoch": 0.96, "learning_rate": 0.0001564781572964972, "loss": 0.014, "step": 369120 }, { "epoch": 0.96, "learning_rate": 0.00015647426908012575, "loss": 0.0105, "step": 369130 }, { "epoch": 0.96, "learning_rate": 0.0001564703808637543, "loss": 0.0171, "step": 369140 }, { "epoch": 0.96, "learning_rate": 0.00015646649264738284, "loss": 0.0131, "step": 369150 }, { "epoch": 0.96, "learning_rate": 0.00015646260443101135, "loss": 0.0129, "step": 369160 }, { "epoch": 0.96, "learning_rate": 0.0001564587162146399, "loss": 0.0159, "step": 369170 }, { "epoch": 0.96, "learning_rate": 0.00015645482799826846, "loss": 0.0107, "step": 369180 }, { "epoch": 0.96, "learning_rate": 0.00015645093978189698, "loss": 0.0132, "step": 369190 }, { "epoch": 0.96, "learning_rate": 0.0001564470515655255, "loss": 0.0127, "step": 369200 }, { "epoch": 0.96, "learning_rate": 0.00015644316334915403, "loss": 0.0127, "step": 369210 }, { "epoch": 0.96, "learning_rate": 0.00015643927513278255, "loss": 0.0115, "step": 369220 }, { "epoch": 0.96, "learning_rate": 0.00015643538691641112, "loss": 0.0172, "step": 369230 }, { "epoch": 0.96, "learning_rate": 0.00015643149870003966, "loss": 0.0142, "step": 369240 }, { "epoch": 0.96, "learning_rate": 0.00015642761048366817, "loss": 0.0169, "step": 369250 }, { "epoch": 0.96, "learning_rate": 0.00015642372226729671, "loss": 0.0149, "step": 369260 }, { "epoch": 0.96, "learning_rate": 0.00015641983405092526, "loss": 0.0144, "step": 369270 }, { "epoch": 0.96, "learning_rate": 0.0001564159458345538, "loss": 0.0125, "step": 369280 }, { "epoch": 0.96, "learning_rate": 0.0001564120576181823, "loss": 0.0122, "step": 369290 }, { "epoch": 0.96, "learning_rate": 0.00015640816940181085, "loss": 0.0103, "step": 369300 }, { "epoch": 0.96, "learning_rate": 0.0001564042811854394, "loss": 0.0167, "step": 369310 }, { "epoch": 0.96, "learning_rate": 0.00015640039296906794, "loss": 0.0126, "step": 369320 }, { "epoch": 0.96, "learning_rate": 0.00015639650475269645, "loss": 0.0131, "step": 369330 }, { "epoch": 0.96, "learning_rate": 0.000156392616536325, "loss": 0.0123, "step": 369340 }, { "epoch": 0.96, "learning_rate": 0.00015638872831995356, "loss": 0.0124, "step": 369350 }, { "epoch": 0.96, "learning_rate": 0.00015638484010358208, "loss": 0.0148, "step": 369360 }, { "epoch": 0.96, "learning_rate": 0.0001563809518872106, "loss": 0.0124, "step": 369370 }, { "epoch": 0.96, "learning_rate": 0.00015637706367083913, "loss": 0.0095, "step": 369380 }, { "epoch": 0.96, "learning_rate": 0.0001563731754544677, "loss": 0.0108, "step": 369390 }, { "epoch": 0.96, "learning_rate": 0.00015636928723809622, "loss": 0.0135, "step": 369400 }, { "epoch": 0.96, "learning_rate": 0.00015636539902172476, "loss": 0.0179, "step": 369410 }, { "epoch": 0.96, "learning_rate": 0.00015636151080535327, "loss": 0.0124, "step": 369420 }, { "epoch": 0.96, "learning_rate": 0.00015635762258898184, "loss": 0.0136, "step": 369430 }, { "epoch": 0.96, "learning_rate": 0.00015635373437261036, "loss": 0.0146, "step": 369440 }, { "epoch": 0.96, "learning_rate": 0.0001563498461562389, "loss": 0.0118, "step": 369450 }, { "epoch": 0.96, "learning_rate": 0.0001563459579398674, "loss": 0.0148, "step": 369460 }, { "epoch": 0.96, "learning_rate": 0.00015634206972349595, "loss": 0.0166, "step": 369470 }, { "epoch": 0.96, "learning_rate": 0.0001563381815071245, "loss": 0.011, "step": 369480 }, { "epoch": 0.96, "learning_rate": 0.00015633429329075304, "loss": 0.0158, "step": 369490 }, { "epoch": 0.96, "learning_rate": 0.00015633040507438155, "loss": 0.0097, "step": 369500 }, { "epoch": 0.96, "learning_rate": 0.0001563265168580101, "loss": 0.0144, "step": 369510 }, { "epoch": 0.96, "learning_rate": 0.00015632262864163863, "loss": 0.0107, "step": 369520 }, { "epoch": 0.96, "learning_rate": 0.00015631874042526718, "loss": 0.0185, "step": 369530 }, { "epoch": 0.96, "learning_rate": 0.0001563148522088957, "loss": 0.0116, "step": 369540 }, { "epoch": 0.96, "learning_rate": 0.00015631096399252423, "loss": 0.0129, "step": 369550 }, { "epoch": 0.96, "learning_rate": 0.0001563070757761528, "loss": 0.0141, "step": 369560 }, { "epoch": 0.96, "learning_rate": 0.00015630318755978132, "loss": 0.0103, "step": 369570 }, { "epoch": 0.96, "learning_rate": 0.00015629929934340986, "loss": 0.0135, "step": 369580 }, { "epoch": 0.96, "learning_rate": 0.00015629541112703837, "loss": 0.0105, "step": 369590 }, { "epoch": 0.96, "learning_rate": 0.00015629152291066694, "loss": 0.0168, "step": 369600 }, { "epoch": 0.96, "learning_rate": 0.00015628763469429546, "loss": 0.0118, "step": 369610 }, { "epoch": 0.96, "learning_rate": 0.000156283746477924, "loss": 0.0108, "step": 369620 }, { "epoch": 0.96, "learning_rate": 0.0001562798582615525, "loss": 0.0119, "step": 369630 }, { "epoch": 0.96, "learning_rate": 0.00015627597004518108, "loss": 0.0121, "step": 369640 }, { "epoch": 0.96, "learning_rate": 0.0001562720818288096, "loss": 0.0124, "step": 369650 }, { "epoch": 0.96, "learning_rate": 0.00015626819361243814, "loss": 0.0108, "step": 369660 }, { "epoch": 0.96, "learning_rate": 0.00015626430539606665, "loss": 0.0112, "step": 369670 }, { "epoch": 0.96, "learning_rate": 0.0001562604171796952, "loss": 0.0137, "step": 369680 }, { "epoch": 0.96, "learning_rate": 0.00015625652896332373, "loss": 0.0107, "step": 369690 }, { "epoch": 0.96, "learning_rate": 0.00015625264074695228, "loss": 0.0126, "step": 369700 }, { "epoch": 0.96, "learning_rate": 0.0001562487525305808, "loss": 0.014, "step": 369710 }, { "epoch": 0.96, "learning_rate": 0.00015624486431420933, "loss": 0.0146, "step": 369720 }, { "epoch": 0.96, "learning_rate": 0.0001562409760978379, "loss": 0.0136, "step": 369730 }, { "epoch": 0.96, "learning_rate": 0.00015623708788146642, "loss": 0.0146, "step": 369740 }, { "epoch": 0.96, "learning_rate": 0.00015623319966509496, "loss": 0.016, "step": 369750 }, { "epoch": 0.96, "learning_rate": 0.00015622931144872347, "loss": 0.0135, "step": 369760 }, { "epoch": 0.96, "learning_rate": 0.00015622542323235204, "loss": 0.0119, "step": 369770 }, { "epoch": 0.96, "learning_rate": 0.00015622153501598055, "loss": 0.0137, "step": 369780 }, { "epoch": 0.96, "learning_rate": 0.0001562176467996091, "loss": 0.0165, "step": 369790 }, { "epoch": 0.96, "learning_rate": 0.0001562137585832376, "loss": 0.0159, "step": 369800 }, { "epoch": 0.96, "learning_rate": 0.00015620987036686618, "loss": 0.0116, "step": 369810 }, { "epoch": 0.96, "learning_rate": 0.0001562059821504947, "loss": 0.012, "step": 369820 }, { "epoch": 0.96, "learning_rate": 0.00015620209393412324, "loss": 0.0105, "step": 369830 }, { "epoch": 0.96, "learning_rate": 0.00015619820571775175, "loss": 0.0132, "step": 369840 }, { "epoch": 0.96, "learning_rate": 0.00015619431750138032, "loss": 0.0099, "step": 369850 }, { "epoch": 0.96, "learning_rate": 0.00015619042928500883, "loss": 0.0116, "step": 369860 }, { "epoch": 0.96, "learning_rate": 0.00015618654106863738, "loss": 0.0221, "step": 369870 }, { "epoch": 0.96, "learning_rate": 0.0001561826528522659, "loss": 0.0167, "step": 369880 }, { "epoch": 0.96, "learning_rate": 0.00015617876463589446, "loss": 0.011, "step": 369890 }, { "epoch": 0.96, "learning_rate": 0.000156174876419523, "loss": 0.0134, "step": 369900 }, { "epoch": 0.96, "learning_rate": 0.00015617098820315151, "loss": 0.011, "step": 369910 }, { "epoch": 0.96, "learning_rate": 0.00015616709998678003, "loss": 0.012, "step": 369920 }, { "epoch": 0.96, "learning_rate": 0.00015616321177040857, "loss": 0.0131, "step": 369930 }, { "epoch": 0.96, "learning_rate": 0.00015615932355403714, "loss": 0.0112, "step": 369940 }, { "epoch": 0.96, "learning_rate": 0.00015615543533766565, "loss": 0.0145, "step": 369950 }, { "epoch": 0.96, "learning_rate": 0.0001561515471212942, "loss": 0.0178, "step": 369960 }, { "epoch": 0.96, "learning_rate": 0.0001561476589049227, "loss": 0.016, "step": 369970 }, { "epoch": 0.96, "learning_rate": 0.00015614377068855128, "loss": 0.0095, "step": 369980 }, { "epoch": 0.96, "learning_rate": 0.0001561398824721798, "loss": 0.0164, "step": 369990 }, { "epoch": 0.96, "learning_rate": 0.00015613599425580834, "loss": 0.0116, "step": 370000 }, { "epoch": 0.96, "eval_cer": 0.8817068852339703, "eval_loss": 0.008635921403765678, "eval_runtime": 107.4637, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 370000 }, { "epoch": 0.96, "learning_rate": 0.00015613210603943685, "loss": 0.0141, "step": 370010 }, { "epoch": 0.96, "learning_rate": 0.00015612821782306542, "loss": 0.0127, "step": 370020 }, { "epoch": 0.96, "learning_rate": 0.00015612432960669393, "loss": 0.0136, "step": 370030 }, { "epoch": 0.96, "learning_rate": 0.00015612044139032247, "loss": 0.022, "step": 370040 }, { "epoch": 0.96, "learning_rate": 0.000156116553173951, "loss": 0.0175, "step": 370050 }, { "epoch": 0.96, "learning_rate": 0.00015611266495757956, "loss": 0.0168, "step": 370060 }, { "epoch": 0.96, "learning_rate": 0.00015610877674120807, "loss": 0.0143, "step": 370070 }, { "epoch": 0.96, "learning_rate": 0.00015610488852483661, "loss": 0.0107, "step": 370080 }, { "epoch": 0.96, "learning_rate": 0.00015610100030846513, "loss": 0.0133, "step": 370090 }, { "epoch": 0.96, "learning_rate": 0.0001560971120920937, "loss": 0.0125, "step": 370100 }, { "epoch": 0.96, "learning_rate": 0.00015609322387572224, "loss": 0.0106, "step": 370110 }, { "epoch": 0.96, "learning_rate": 0.00015608933565935075, "loss": 0.0127, "step": 370120 }, { "epoch": 0.96, "learning_rate": 0.0001560854474429793, "loss": 0.0148, "step": 370130 }, { "epoch": 0.96, "learning_rate": 0.00015608155922660784, "loss": 0.016, "step": 370140 }, { "epoch": 0.96, "learning_rate": 0.00015607767101023638, "loss": 0.0108, "step": 370150 }, { "epoch": 0.96, "learning_rate": 0.0001560737827938649, "loss": 0.0151, "step": 370160 }, { "epoch": 0.96, "learning_rate": 0.00015606989457749343, "loss": 0.0139, "step": 370170 }, { "epoch": 0.96, "learning_rate": 0.00015606600636112195, "loss": 0.0118, "step": 370180 }, { "epoch": 0.96, "learning_rate": 0.00015606211814475052, "loss": 0.01, "step": 370190 }, { "epoch": 0.96, "learning_rate": 0.00015605822992837903, "loss": 0.0124, "step": 370200 }, { "epoch": 0.96, "learning_rate": 0.00015605434171200757, "loss": 0.0147, "step": 370210 }, { "epoch": 0.96, "learning_rate": 0.0001560504534956361, "loss": 0.0128, "step": 370220 }, { "epoch": 0.96, "learning_rate": 0.00015604656527926466, "loss": 0.014, "step": 370230 }, { "epoch": 0.96, "learning_rate": 0.00015604267706289317, "loss": 0.0142, "step": 370240 }, { "epoch": 0.96, "learning_rate": 0.0001560387888465217, "loss": 0.0151, "step": 370250 }, { "epoch": 0.96, "learning_rate": 0.00015603490063015023, "loss": 0.013, "step": 370260 }, { "epoch": 0.96, "learning_rate": 0.0001560310124137788, "loss": 0.0136, "step": 370270 }, { "epoch": 0.96, "learning_rate": 0.00015602712419740734, "loss": 0.0138, "step": 370280 }, { "epoch": 0.96, "learning_rate": 0.00015602323598103585, "loss": 0.0122, "step": 370290 }, { "epoch": 0.96, "learning_rate": 0.0001560193477646644, "loss": 0.0121, "step": 370300 }, { "epoch": 0.96, "learning_rate": 0.00015601545954829294, "loss": 0.0105, "step": 370310 }, { "epoch": 0.96, "learning_rate": 0.00015601157133192148, "loss": 0.0118, "step": 370320 }, { "epoch": 0.96, "learning_rate": 0.00015600768311555, "loss": 0.01, "step": 370330 }, { "epoch": 0.96, "learning_rate": 0.00015600379489917853, "loss": 0.0125, "step": 370340 }, { "epoch": 0.96, "learning_rate": 0.00015599990668280708, "loss": 0.0124, "step": 370350 }, { "epoch": 0.96, "learning_rate": 0.00015599601846643562, "loss": 0.0186, "step": 370360 }, { "epoch": 0.96, "learning_rate": 0.00015599213025006413, "loss": 0.0143, "step": 370370 }, { "epoch": 0.96, "learning_rate": 0.00015598824203369267, "loss": 0.0147, "step": 370380 }, { "epoch": 0.96, "learning_rate": 0.00015598435381732122, "loss": 0.0132, "step": 370390 }, { "epoch": 0.96, "learning_rate": 0.00015598046560094976, "loss": 0.0121, "step": 370400 }, { "epoch": 0.96, "learning_rate": 0.00015597657738457827, "loss": 0.0148, "step": 370410 }, { "epoch": 0.96, "learning_rate": 0.0001559726891682068, "loss": 0.0118, "step": 370420 }, { "epoch": 0.96, "learning_rate": 0.00015596880095183533, "loss": 0.0116, "step": 370430 }, { "epoch": 0.96, "learning_rate": 0.0001559649127354639, "loss": 0.0141, "step": 370440 }, { "epoch": 0.96, "learning_rate": 0.00015596102451909244, "loss": 0.0126, "step": 370450 }, { "epoch": 0.96, "learning_rate": 0.00015595713630272095, "loss": 0.0165, "step": 370460 }, { "epoch": 0.96, "learning_rate": 0.00015595324808634947, "loss": 0.0137, "step": 370470 }, { "epoch": 0.96, "learning_rate": 0.00015594935986997804, "loss": 0.0163, "step": 370480 }, { "epoch": 0.96, "learning_rate": 0.00015594547165360658, "loss": 0.0136, "step": 370490 }, { "epoch": 0.96, "learning_rate": 0.0001559415834372351, "loss": 0.0137, "step": 370500 }, { "epoch": 0.96, "learning_rate": 0.00015593769522086363, "loss": 0.0135, "step": 370510 }, { "epoch": 0.96, "learning_rate": 0.00015593380700449218, "loss": 0.0157, "step": 370520 }, { "epoch": 0.96, "learning_rate": 0.00015592991878812072, "loss": 0.0127, "step": 370530 }, { "epoch": 0.96, "learning_rate": 0.00015592603057174923, "loss": 0.0112, "step": 370540 }, { "epoch": 0.96, "learning_rate": 0.00015592214235537777, "loss": 0.0131, "step": 370550 }, { "epoch": 0.96, "learning_rate": 0.00015591825413900631, "loss": 0.0109, "step": 370560 }, { "epoch": 0.96, "learning_rate": 0.00015591436592263486, "loss": 0.0155, "step": 370570 }, { "epoch": 0.96, "learning_rate": 0.00015591047770626337, "loss": 0.0222, "step": 370580 }, { "epoch": 0.96, "learning_rate": 0.0001559065894898919, "loss": 0.0089, "step": 370590 }, { "epoch": 0.96, "learning_rate": 0.00015590270127352048, "loss": 0.0125, "step": 370600 }, { "epoch": 0.96, "learning_rate": 0.000155898813057149, "loss": 0.0112, "step": 370610 }, { "epoch": 0.96, "learning_rate": 0.00015589492484077754, "loss": 0.019, "step": 370620 }, { "epoch": 0.96, "learning_rate": 0.00015589103662440605, "loss": 0.0109, "step": 370630 }, { "epoch": 0.96, "learning_rate": 0.00015588714840803462, "loss": 0.0174, "step": 370640 }, { "epoch": 0.96, "learning_rate": 0.00015588326019166314, "loss": 0.0131, "step": 370650 }, { "epoch": 0.96, "learning_rate": 0.00015587937197529168, "loss": 0.0113, "step": 370660 }, { "epoch": 0.96, "learning_rate": 0.0001558754837589202, "loss": 0.0103, "step": 370670 }, { "epoch": 0.96, "learning_rate": 0.00015587159554254873, "loss": 0.0134, "step": 370680 }, { "epoch": 0.96, "learning_rate": 0.00015586770732617727, "loss": 0.0128, "step": 370690 }, { "epoch": 0.96, "learning_rate": 0.00015586381910980582, "loss": 0.0109, "step": 370700 }, { "epoch": 0.96, "learning_rate": 0.00015585993089343433, "loss": 0.0124, "step": 370710 }, { "epoch": 0.96, "learning_rate": 0.00015585604267706287, "loss": 0.0112, "step": 370720 }, { "epoch": 0.96, "learning_rate": 0.00015585215446069141, "loss": 0.015, "step": 370730 }, { "epoch": 0.96, "learning_rate": 0.00015584826624431996, "loss": 0.0136, "step": 370740 }, { "epoch": 0.96, "learning_rate": 0.00015584437802794847, "loss": 0.012, "step": 370750 }, { "epoch": 0.96, "learning_rate": 0.000155840489811577, "loss": 0.0135, "step": 370760 }, { "epoch": 0.96, "learning_rate": 0.00015583660159520558, "loss": 0.0088, "step": 370770 }, { "epoch": 0.96, "learning_rate": 0.0001558327133788341, "loss": 0.0152, "step": 370780 }, { "epoch": 0.96, "learning_rate": 0.0001558288251624626, "loss": 0.0113, "step": 370790 }, { "epoch": 0.96, "learning_rate": 0.00015582493694609115, "loss": 0.0159, "step": 370800 }, { "epoch": 0.96, "learning_rate": 0.00015582104872971972, "loss": 0.012, "step": 370810 }, { "epoch": 0.96, "learning_rate": 0.00015581716051334823, "loss": 0.0088, "step": 370820 }, { "epoch": 0.96, "learning_rate": 0.00015581327229697678, "loss": 0.015, "step": 370830 }, { "epoch": 0.96, "learning_rate": 0.0001558093840806053, "loss": 0.0109, "step": 370840 }, { "epoch": 0.96, "learning_rate": 0.00015580549586423386, "loss": 0.0105, "step": 370850 }, { "epoch": 0.96, "learning_rate": 0.00015580160764786237, "loss": 0.0121, "step": 370860 }, { "epoch": 0.96, "learning_rate": 0.00015579771943149092, "loss": 0.0137, "step": 370870 }, { "epoch": 0.96, "learning_rate": 0.00015579383121511943, "loss": 0.0118, "step": 370880 }, { "epoch": 0.96, "learning_rate": 0.000155789942998748, "loss": 0.0135, "step": 370890 }, { "epoch": 0.96, "learning_rate": 0.0001557860547823765, "loss": 0.0135, "step": 370900 }, { "epoch": 0.96, "learning_rate": 0.00015578216656600506, "loss": 0.0163, "step": 370910 }, { "epoch": 0.96, "learning_rate": 0.00015577827834963357, "loss": 0.0118, "step": 370920 }, { "epoch": 0.96, "learning_rate": 0.0001557743901332621, "loss": 0.0141, "step": 370930 }, { "epoch": 0.96, "learning_rate": 0.00015577050191689068, "loss": 0.01, "step": 370940 }, { "epoch": 0.96, "learning_rate": 0.0001557666137005192, "loss": 0.0098, "step": 370950 }, { "epoch": 0.96, "learning_rate": 0.0001557627254841477, "loss": 0.0195, "step": 370960 }, { "epoch": 0.96, "learning_rate": 0.00015575883726777625, "loss": 0.0135, "step": 370970 }, { "epoch": 0.96, "learning_rate": 0.00015575494905140482, "loss": 0.0137, "step": 370980 }, { "epoch": 0.96, "learning_rate": 0.00015575106083503333, "loss": 0.0114, "step": 370990 }, { "epoch": 0.96, "learning_rate": 0.00015574717261866188, "loss": 0.0123, "step": 371000 }, { "epoch": 0.96, "eval_cer": 0.8817334783357197, "eval_loss": 0.008374325931072235, "eval_runtime": 107.4524, "eval_samples_per_second": 18.613, "eval_steps_per_second": 4.653, "step": 371000 }, { "epoch": 0.96, "learning_rate": 0.0001557432844022904, "loss": 0.0131, "step": 371010 }, { "epoch": 0.96, "learning_rate": 0.00015573939618591896, "loss": 0.0143, "step": 371020 }, { "epoch": 0.96, "learning_rate": 0.00015573550796954747, "loss": 0.0111, "step": 371030 }, { "epoch": 0.96, "learning_rate": 0.00015573161975317601, "loss": 0.0133, "step": 371040 }, { "epoch": 0.96, "learning_rate": 0.00015572773153680453, "loss": 0.0104, "step": 371050 }, { "epoch": 0.96, "learning_rate": 0.0001557238433204331, "loss": 0.0139, "step": 371060 }, { "epoch": 0.96, "learning_rate": 0.0001557199551040616, "loss": 0.0118, "step": 371070 }, { "epoch": 0.96, "learning_rate": 0.00015571606688769015, "loss": 0.009, "step": 371080 }, { "epoch": 0.96, "learning_rate": 0.00015571217867131867, "loss": 0.0123, "step": 371090 }, { "epoch": 0.96, "learning_rate": 0.00015570829045494724, "loss": 0.0111, "step": 371100 }, { "epoch": 0.96, "learning_rate": 0.00015570440223857575, "loss": 0.0137, "step": 371110 }, { "epoch": 0.96, "learning_rate": 0.0001557005140222043, "loss": 0.0112, "step": 371120 }, { "epoch": 0.96, "learning_rate": 0.0001556966258058328, "loss": 0.0116, "step": 371130 }, { "epoch": 0.96, "learning_rate": 0.00015569273758946138, "loss": 0.0115, "step": 371140 }, { "epoch": 0.96, "learning_rate": 0.00015568884937308992, "loss": 0.012, "step": 371150 }, { "epoch": 0.96, "learning_rate": 0.00015568496115671843, "loss": 0.011, "step": 371160 }, { "epoch": 0.96, "learning_rate": 0.00015568107294034697, "loss": 0.0147, "step": 371170 }, { "epoch": 0.96, "learning_rate": 0.0001556771847239755, "loss": 0.0117, "step": 371180 }, { "epoch": 0.96, "learning_rate": 0.00015567329650760406, "loss": 0.0126, "step": 371190 }, { "epoch": 0.96, "learning_rate": 0.00015566940829123257, "loss": 0.0131, "step": 371200 }, { "epoch": 0.96, "learning_rate": 0.00015566552007486111, "loss": 0.0119, "step": 371210 }, { "epoch": 0.96, "learning_rate": 0.00015566163185848963, "loss": 0.014, "step": 371220 }, { "epoch": 0.96, "learning_rate": 0.0001556577436421182, "loss": 0.013, "step": 371230 }, { "epoch": 0.96, "learning_rate": 0.0001556538554257467, "loss": 0.0109, "step": 371240 }, { "epoch": 0.96, "learning_rate": 0.00015564996720937525, "loss": 0.0112, "step": 371250 }, { "epoch": 0.96, "learning_rate": 0.00015564607899300377, "loss": 0.0114, "step": 371260 }, { "epoch": 0.96, "learning_rate": 0.00015564219077663234, "loss": 0.0133, "step": 371270 }, { "epoch": 0.96, "learning_rate": 0.00015563830256026085, "loss": 0.0137, "step": 371280 }, { "epoch": 0.96, "learning_rate": 0.0001556344143438894, "loss": 0.0126, "step": 371290 }, { "epoch": 0.96, "learning_rate": 0.0001556305261275179, "loss": 0.0149, "step": 371300 }, { "epoch": 0.96, "learning_rate": 0.00015562663791114648, "loss": 0.012, "step": 371310 }, { "epoch": 0.96, "learning_rate": 0.00015562274969477502, "loss": 0.0111, "step": 371320 }, { "epoch": 0.96, "learning_rate": 0.00015561886147840353, "loss": 0.0093, "step": 371330 }, { "epoch": 0.96, "learning_rate": 0.00015561497326203207, "loss": 0.0108, "step": 371340 }, { "epoch": 0.96, "learning_rate": 0.00015561108504566062, "loss": 0.0114, "step": 371350 }, { "epoch": 0.96, "learning_rate": 0.00015560719682928916, "loss": 0.0153, "step": 371360 }, { "epoch": 0.96, "learning_rate": 0.00015560330861291767, "loss": 0.0117, "step": 371370 }, { "epoch": 0.96, "learning_rate": 0.00015559942039654621, "loss": 0.0105, "step": 371380 }, { "epoch": 0.96, "learning_rate": 0.00015559553218017476, "loss": 0.0112, "step": 371390 }, { "epoch": 0.96, "learning_rate": 0.0001555916439638033, "loss": 0.0185, "step": 371400 }, { "epoch": 0.96, "learning_rate": 0.0001555877557474318, "loss": 0.0159, "step": 371410 }, { "epoch": 0.96, "learning_rate": 0.00015558386753106035, "loss": 0.0163, "step": 371420 }, { "epoch": 0.96, "learning_rate": 0.00015557997931468887, "loss": 0.0114, "step": 371430 }, { "epoch": 0.96, "learning_rate": 0.00015557609109831744, "loss": 0.0111, "step": 371440 }, { "epoch": 0.96, "learning_rate": 0.00015557220288194595, "loss": 0.0092, "step": 371450 }, { "epoch": 0.96, "learning_rate": 0.0001555683146655745, "loss": 0.0092, "step": 371460 }, { "epoch": 0.96, "learning_rate": 0.000155564426449203, "loss": 0.0127, "step": 371470 }, { "epoch": 0.96, "learning_rate": 0.00015556053823283158, "loss": 0.0191, "step": 371480 }, { "epoch": 0.96, "learning_rate": 0.00015555665001646012, "loss": 0.0147, "step": 371490 }, { "epoch": 0.96, "learning_rate": 0.00015555276180008863, "loss": 0.0108, "step": 371500 }, { "epoch": 0.96, "learning_rate": 0.00015554887358371715, "loss": 0.0105, "step": 371510 }, { "epoch": 0.96, "learning_rate": 0.00015554498536734572, "loss": 0.0124, "step": 371520 }, { "epoch": 0.96, "learning_rate": 0.00015554109715097426, "loss": 0.0117, "step": 371530 }, { "epoch": 0.96, "learning_rate": 0.00015553720893460277, "loss": 0.0121, "step": 371540 }, { "epoch": 0.96, "learning_rate": 0.0001555333207182313, "loss": 0.0124, "step": 371550 }, { "epoch": 0.96, "learning_rate": 0.00015552943250185985, "loss": 0.0102, "step": 371560 }, { "epoch": 0.96, "learning_rate": 0.0001555255442854884, "loss": 0.0099, "step": 371570 }, { "epoch": 0.96, "learning_rate": 0.0001555216560691169, "loss": 0.0121, "step": 371580 }, { "epoch": 0.96, "learning_rate": 0.00015551776785274545, "loss": 0.017, "step": 371590 }, { "epoch": 0.96, "learning_rate": 0.000155513879636374, "loss": 0.0101, "step": 371600 }, { "epoch": 0.96, "learning_rate": 0.00015550999142000254, "loss": 0.013, "step": 371610 }, { "epoch": 0.96, "learning_rate": 0.00015550610320363105, "loss": 0.0121, "step": 371620 }, { "epoch": 0.96, "learning_rate": 0.0001555022149872596, "loss": 0.0134, "step": 371630 }, { "epoch": 0.96, "learning_rate": 0.00015549832677088816, "loss": 0.0094, "step": 371640 }, { "epoch": 0.96, "learning_rate": 0.00015549443855451668, "loss": 0.0104, "step": 371650 }, { "epoch": 0.96, "learning_rate": 0.0001554905503381452, "loss": 0.0133, "step": 371660 }, { "epoch": 0.96, "learning_rate": 0.00015548666212177373, "loss": 0.0118, "step": 371670 }, { "epoch": 0.96, "learning_rate": 0.00015548277390540225, "loss": 0.0117, "step": 371680 }, { "epoch": 0.96, "learning_rate": 0.00015547888568903081, "loss": 0.009, "step": 371690 }, { "epoch": 0.96, "learning_rate": 0.00015547499747265936, "loss": 0.0106, "step": 371700 }, { "epoch": 0.96, "learning_rate": 0.00015547110925628787, "loss": 0.0104, "step": 371710 }, { "epoch": 0.96, "learning_rate": 0.0001554672210399164, "loss": 0.0135, "step": 371720 }, { "epoch": 0.96, "learning_rate": 0.00015546333282354495, "loss": 0.0126, "step": 371730 }, { "epoch": 0.96, "learning_rate": 0.0001554594446071735, "loss": 0.0108, "step": 371740 }, { "epoch": 0.96, "learning_rate": 0.000155455556390802, "loss": 0.0111, "step": 371750 }, { "epoch": 0.96, "learning_rate": 0.00015545166817443055, "loss": 0.0108, "step": 371760 }, { "epoch": 0.96, "learning_rate": 0.0001554477799580591, "loss": 0.0169, "step": 371770 }, { "epoch": 0.96, "learning_rate": 0.00015544389174168764, "loss": 0.0128, "step": 371780 }, { "epoch": 0.96, "learning_rate": 0.00015544000352531615, "loss": 0.0123, "step": 371790 }, { "epoch": 0.96, "learning_rate": 0.0001554361153089447, "loss": 0.0141, "step": 371800 }, { "epoch": 0.96, "learning_rate": 0.00015543222709257326, "loss": 0.0115, "step": 371810 }, { "epoch": 0.96, "learning_rate": 0.00015542833887620177, "loss": 0.0115, "step": 371820 }, { "epoch": 0.96, "learning_rate": 0.0001554244506598303, "loss": 0.0102, "step": 371830 }, { "epoch": 0.96, "learning_rate": 0.00015542056244345883, "loss": 0.0122, "step": 371840 }, { "epoch": 0.96, "learning_rate": 0.0001554166742270874, "loss": 0.0125, "step": 371850 }, { "epoch": 0.96, "learning_rate": 0.00015541278601071591, "loss": 0.0121, "step": 371860 }, { "epoch": 0.96, "learning_rate": 0.00015540889779434446, "loss": 0.0137, "step": 371870 }, { "epoch": 0.96, "learning_rate": 0.00015540500957797297, "loss": 0.0142, "step": 371880 }, { "epoch": 0.96, "learning_rate": 0.00015540112136160154, "loss": 0.0121, "step": 371890 }, { "epoch": 0.96, "learning_rate": 0.00015539723314523005, "loss": 0.0119, "step": 371900 }, { "epoch": 0.96, "learning_rate": 0.0001553933449288586, "loss": 0.0118, "step": 371910 }, { "epoch": 0.96, "learning_rate": 0.0001553894567124871, "loss": 0.0097, "step": 371920 }, { "epoch": 0.96, "learning_rate": 0.00015538556849611565, "loss": 0.0102, "step": 371930 }, { "epoch": 0.96, "learning_rate": 0.0001553816802797442, "loss": 0.0122, "step": 371940 }, { "epoch": 0.96, "learning_rate": 0.00015537779206337273, "loss": 0.0124, "step": 371950 }, { "epoch": 0.96, "learning_rate": 0.00015537390384700125, "loss": 0.0101, "step": 371960 }, { "epoch": 0.96, "learning_rate": 0.0001553700156306298, "loss": 0.0119, "step": 371970 }, { "epoch": 0.96, "learning_rate": 0.00015536612741425833, "loss": 0.0113, "step": 371980 }, { "epoch": 0.96, "learning_rate": 0.00015536223919788687, "loss": 0.0101, "step": 371990 }, { "epoch": 0.96, "learning_rate": 0.0001553583509815154, "loss": 0.0149, "step": 372000 }, { "epoch": 0.96, "eval_cer": 0.8816872903168917, "eval_loss": 0.008426784537732601, "eval_runtime": 107.8013, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 372000 }, { "epoch": 0.96, "learning_rate": 0.00015535446276514393, "loss": 0.0121, "step": 372010 }, { "epoch": 0.96, "learning_rate": 0.0001553505745487725, "loss": 0.013, "step": 372020 }, { "epoch": 0.96, "learning_rate": 0.00015534668633240101, "loss": 0.0123, "step": 372030 }, { "epoch": 0.96, "learning_rate": 0.00015534279811602956, "loss": 0.0123, "step": 372040 }, { "epoch": 0.96, "learning_rate": 0.00015533890989965807, "loss": 0.0132, "step": 372050 }, { "epoch": 0.96, "learning_rate": 0.00015533502168328664, "loss": 0.0104, "step": 372060 }, { "epoch": 0.96, "learning_rate": 0.00015533113346691515, "loss": 0.0121, "step": 372070 }, { "epoch": 0.96, "learning_rate": 0.0001553272452505437, "loss": 0.0129, "step": 372080 }, { "epoch": 0.96, "learning_rate": 0.0001553233570341722, "loss": 0.0188, "step": 372090 }, { "epoch": 0.96, "learning_rate": 0.00015531946881780078, "loss": 0.0122, "step": 372100 }, { "epoch": 0.96, "learning_rate": 0.0001553155806014293, "loss": 0.0147, "step": 372110 }, { "epoch": 0.96, "learning_rate": 0.00015531169238505783, "loss": 0.0094, "step": 372120 }, { "epoch": 0.96, "learning_rate": 0.00015530780416868635, "loss": 0.0135, "step": 372130 }, { "epoch": 0.96, "learning_rate": 0.00015530391595231492, "loss": 0.015, "step": 372140 }, { "epoch": 0.96, "learning_rate": 0.00015530002773594343, "loss": 0.0149, "step": 372150 }, { "epoch": 0.96, "learning_rate": 0.00015529613951957197, "loss": 0.0103, "step": 372160 }, { "epoch": 0.96, "learning_rate": 0.0001552922513032005, "loss": 0.0164, "step": 372170 }, { "epoch": 0.96, "learning_rate": 0.00015528836308682903, "loss": 0.0117, "step": 372180 }, { "epoch": 0.96, "learning_rate": 0.0001552844748704576, "loss": 0.0114, "step": 372190 }, { "epoch": 0.96, "learning_rate": 0.0001552805866540861, "loss": 0.0126, "step": 372200 }, { "epoch": 0.96, "learning_rate": 0.00015527669843771465, "loss": 0.0109, "step": 372210 }, { "epoch": 0.96, "learning_rate": 0.00015527281022134317, "loss": 0.0091, "step": 372220 }, { "epoch": 0.96, "learning_rate": 0.00015526892200497174, "loss": 0.0144, "step": 372230 }, { "epoch": 0.96, "learning_rate": 0.00015526503378860025, "loss": 0.0109, "step": 372240 }, { "epoch": 0.96, "learning_rate": 0.0001552611455722288, "loss": 0.0176, "step": 372250 }, { "epoch": 0.96, "learning_rate": 0.0001552572573558573, "loss": 0.0149, "step": 372260 }, { "epoch": 0.96, "learning_rate": 0.00015525336913948588, "loss": 0.0098, "step": 372270 }, { "epoch": 0.97, "learning_rate": 0.0001552494809231144, "loss": 0.0143, "step": 372280 }, { "epoch": 0.97, "learning_rate": 0.00015524559270674293, "loss": 0.0132, "step": 372290 }, { "epoch": 0.97, "learning_rate": 0.00015524170449037145, "loss": 0.0114, "step": 372300 }, { "epoch": 0.97, "learning_rate": 0.00015523781627400002, "loss": 0.0099, "step": 372310 }, { "epoch": 0.97, "learning_rate": 0.00015523392805762853, "loss": 0.0128, "step": 372320 }, { "epoch": 0.97, "learning_rate": 0.00015523003984125707, "loss": 0.0148, "step": 372330 }, { "epoch": 0.97, "learning_rate": 0.0001552261516248856, "loss": 0.0115, "step": 372340 }, { "epoch": 0.97, "learning_rate": 0.00015522226340851416, "loss": 0.0149, "step": 372350 }, { "epoch": 0.97, "learning_rate": 0.0001552183751921427, "loss": 0.0117, "step": 372360 }, { "epoch": 0.97, "learning_rate": 0.0001552144869757712, "loss": 0.0106, "step": 372370 }, { "epoch": 0.97, "learning_rate": 0.00015521059875939973, "loss": 0.0119, "step": 372380 }, { "epoch": 0.97, "learning_rate": 0.0001552067105430283, "loss": 0.0129, "step": 372390 }, { "epoch": 0.97, "learning_rate": 0.00015520282232665684, "loss": 0.0125, "step": 372400 }, { "epoch": 0.97, "learning_rate": 0.00015519893411028535, "loss": 0.013, "step": 372410 }, { "epoch": 0.97, "learning_rate": 0.0001551950458939139, "loss": 0.0112, "step": 372420 }, { "epoch": 0.97, "learning_rate": 0.0001551911576775424, "loss": 0.0143, "step": 372430 }, { "epoch": 0.97, "learning_rate": 0.00015518726946117098, "loss": 0.0122, "step": 372440 }, { "epoch": 0.97, "learning_rate": 0.0001551833812447995, "loss": 0.0163, "step": 372450 }, { "epoch": 0.97, "learning_rate": 0.00015517949302842803, "loss": 0.0164, "step": 372460 }, { "epoch": 0.97, "learning_rate": 0.00015517560481205655, "loss": 0.0123, "step": 372470 }, { "epoch": 0.97, "learning_rate": 0.00015517171659568512, "loss": 0.0201, "step": 372480 }, { "epoch": 0.97, "learning_rate": 0.00015516782837931363, "loss": 0.0112, "step": 372490 }, { "epoch": 0.97, "learning_rate": 0.00015516394016294217, "loss": 0.0115, "step": 372500 }, { "epoch": 0.97, "learning_rate": 0.0001551600519465707, "loss": 0.0132, "step": 372510 }, { "epoch": 0.97, "learning_rate": 0.00015515616373019926, "loss": 0.0164, "step": 372520 }, { "epoch": 0.97, "learning_rate": 0.0001551522755138278, "loss": 0.0155, "step": 372530 }, { "epoch": 0.97, "learning_rate": 0.0001551483872974563, "loss": 0.0113, "step": 372540 }, { "epoch": 0.97, "learning_rate": 0.00015514449908108483, "loss": 0.0156, "step": 372550 }, { "epoch": 0.97, "learning_rate": 0.0001551406108647134, "loss": 0.0124, "step": 372560 }, { "epoch": 0.97, "learning_rate": 0.00015513672264834194, "loss": 0.0134, "step": 372570 }, { "epoch": 0.97, "learning_rate": 0.00015513283443197045, "loss": 0.011, "step": 372580 }, { "epoch": 0.97, "learning_rate": 0.000155128946215599, "loss": 0.0116, "step": 372590 }, { "epoch": 0.97, "learning_rate": 0.00015512505799922753, "loss": 0.0124, "step": 372600 }, { "epoch": 0.97, "learning_rate": 0.00015512116978285608, "loss": 0.0139, "step": 372610 }, { "epoch": 0.97, "learning_rate": 0.0001551172815664846, "loss": 0.0144, "step": 372620 }, { "epoch": 0.97, "learning_rate": 0.00015511339335011313, "loss": 0.0111, "step": 372630 }, { "epoch": 0.97, "learning_rate": 0.00015510950513374167, "loss": 0.0107, "step": 372640 }, { "epoch": 0.97, "learning_rate": 0.00015510561691737022, "loss": 0.013, "step": 372650 }, { "epoch": 0.97, "learning_rate": 0.00015510172870099873, "loss": 0.01, "step": 372660 }, { "epoch": 0.97, "learning_rate": 0.00015509784048462727, "loss": 0.0097, "step": 372670 }, { "epoch": 0.97, "learning_rate": 0.0001550939522682558, "loss": 0.0112, "step": 372680 }, { "epoch": 0.97, "learning_rate": 0.00015509006405188436, "loss": 0.0158, "step": 372690 }, { "epoch": 0.97, "learning_rate": 0.00015508617583551287, "loss": 0.0109, "step": 372700 }, { "epoch": 0.97, "learning_rate": 0.0001550822876191414, "loss": 0.0121, "step": 372710 }, { "epoch": 0.97, "learning_rate": 0.00015507839940276993, "loss": 0.011, "step": 372720 }, { "epoch": 0.97, "learning_rate": 0.0001550745111863985, "loss": 0.0135, "step": 372730 }, { "epoch": 0.97, "learning_rate": 0.00015507062297002704, "loss": 0.012, "step": 372740 }, { "epoch": 0.97, "learning_rate": 0.00015506673475365555, "loss": 0.0118, "step": 372750 }, { "epoch": 0.97, "learning_rate": 0.0001550628465372841, "loss": 0.0151, "step": 372760 }, { "epoch": 0.97, "learning_rate": 0.00015505895832091263, "loss": 0.0128, "step": 372770 }, { "epoch": 0.97, "learning_rate": 0.00015505507010454118, "loss": 0.0126, "step": 372780 }, { "epoch": 0.97, "learning_rate": 0.0001550511818881697, "loss": 0.013, "step": 372790 }, { "epoch": 0.97, "learning_rate": 0.00015504729367179823, "loss": 0.0117, "step": 372800 }, { "epoch": 0.97, "learning_rate": 0.00015504340545542677, "loss": 0.0136, "step": 372810 }, { "epoch": 0.97, "learning_rate": 0.00015503951723905532, "loss": 0.0126, "step": 372820 }, { "epoch": 0.97, "learning_rate": 0.00015503562902268383, "loss": 0.0097, "step": 372830 }, { "epoch": 0.97, "learning_rate": 0.00015503174080631237, "loss": 0.0134, "step": 372840 }, { "epoch": 0.97, "learning_rate": 0.0001550278525899409, "loss": 0.0243, "step": 372850 }, { "epoch": 0.97, "learning_rate": 0.00015502396437356945, "loss": 0.0162, "step": 372860 }, { "epoch": 0.97, "learning_rate": 0.00015502007615719797, "loss": 0.0105, "step": 372870 }, { "epoch": 0.97, "learning_rate": 0.0001550161879408265, "loss": 0.012, "step": 372880 }, { "epoch": 0.97, "learning_rate": 0.00015501229972445508, "loss": 0.0103, "step": 372890 }, { "epoch": 0.97, "learning_rate": 0.0001550084115080836, "loss": 0.0131, "step": 372900 }, { "epoch": 0.97, "learning_rate": 0.00015500452329171214, "loss": 0.0152, "step": 372910 }, { "epoch": 0.97, "learning_rate": 0.00015500063507534065, "loss": 0.0154, "step": 372920 }, { "epoch": 0.97, "learning_rate": 0.0001549967468589692, "loss": 0.012, "step": 372930 }, { "epoch": 0.97, "learning_rate": 0.00015499285864259773, "loss": 0.0127, "step": 372940 }, { "epoch": 0.97, "learning_rate": 0.00015498897042622628, "loss": 0.0118, "step": 372950 }, { "epoch": 0.97, "learning_rate": 0.0001549850822098548, "loss": 0.0107, "step": 372960 }, { "epoch": 0.97, "learning_rate": 0.00015498119399348333, "loss": 0.0119, "step": 372970 }, { "epoch": 0.97, "learning_rate": 0.00015497730577711187, "loss": 0.0118, "step": 372980 }, { "epoch": 0.97, "learning_rate": 0.00015497341756074041, "loss": 0.0132, "step": 372990 }, { "epoch": 0.97, "learning_rate": 0.00015496952934436893, "loss": 0.0096, "step": 373000 }, { "epoch": 0.97, "eval_cer": 0.8817138834186412, "eval_loss": 0.00843864493072033, "eval_runtime": 107.4926, "eval_samples_per_second": 18.606, "eval_steps_per_second": 4.651, "step": 373000 }, { "epoch": 0.97, "learning_rate": 0.00015496564112799747, "loss": 0.0131, "step": 373010 }, { "epoch": 0.97, "learning_rate": 0.000154961752911626, "loss": 0.0161, "step": 373020 }, { "epoch": 0.97, "learning_rate": 0.00015495786469525455, "loss": 0.0118, "step": 373030 }, { "epoch": 0.97, "learning_rate": 0.00015495397647888307, "loss": 0.0147, "step": 373040 }, { "epoch": 0.97, "learning_rate": 0.0001549500882625116, "loss": 0.0164, "step": 373050 }, { "epoch": 0.97, "learning_rate": 0.00015494620004614018, "loss": 0.0155, "step": 373060 }, { "epoch": 0.97, "learning_rate": 0.0001549423118297687, "loss": 0.0131, "step": 373070 }, { "epoch": 0.97, "learning_rate": 0.00015493842361339724, "loss": 0.0121, "step": 373080 }, { "epoch": 0.97, "learning_rate": 0.00015493453539702575, "loss": 0.0155, "step": 373090 }, { "epoch": 0.97, "learning_rate": 0.00015493064718065432, "loss": 0.0112, "step": 373100 }, { "epoch": 0.97, "learning_rate": 0.00015492675896428283, "loss": 0.0123, "step": 373110 }, { "epoch": 0.97, "learning_rate": 0.00015492287074791137, "loss": 0.0128, "step": 373120 }, { "epoch": 0.97, "learning_rate": 0.0001549189825315399, "loss": 0.0091, "step": 373130 }, { "epoch": 0.97, "learning_rate": 0.00015491509431516846, "loss": 0.0115, "step": 373140 }, { "epoch": 0.97, "learning_rate": 0.00015491120609879697, "loss": 0.0123, "step": 373150 }, { "epoch": 0.97, "learning_rate": 0.00015490731788242551, "loss": 0.0099, "step": 373160 }, { "epoch": 0.97, "learning_rate": 0.00015490342966605403, "loss": 0.012, "step": 373170 }, { "epoch": 0.97, "learning_rate": 0.00015489954144968257, "loss": 0.0122, "step": 373180 }, { "epoch": 0.97, "learning_rate": 0.0001548956532333111, "loss": 0.0122, "step": 373190 }, { "epoch": 0.97, "learning_rate": 0.00015489176501693965, "loss": 0.0132, "step": 373200 }, { "epoch": 0.97, "learning_rate": 0.00015488787680056817, "loss": 0.0137, "step": 373210 }, { "epoch": 0.97, "learning_rate": 0.0001548839885841967, "loss": 0.0127, "step": 373220 }, { "epoch": 0.97, "learning_rate": 0.00015488010036782528, "loss": 0.0118, "step": 373230 }, { "epoch": 0.97, "learning_rate": 0.0001548762121514538, "loss": 0.0123, "step": 373240 }, { "epoch": 0.97, "learning_rate": 0.0001548723239350823, "loss": 0.0101, "step": 373250 }, { "epoch": 0.97, "learning_rate": 0.00015486843571871085, "loss": 0.0136, "step": 373260 }, { "epoch": 0.97, "learning_rate": 0.00015486454750233942, "loss": 0.0115, "step": 373270 }, { "epoch": 0.97, "learning_rate": 0.00015486065928596793, "loss": 0.0128, "step": 373280 }, { "epoch": 0.97, "learning_rate": 0.00015485677106959647, "loss": 0.0151, "step": 373290 }, { "epoch": 0.97, "learning_rate": 0.000154852882853225, "loss": 0.0104, "step": 373300 }, { "epoch": 0.97, "learning_rate": 0.00015484899463685356, "loss": 0.0116, "step": 373310 }, { "epoch": 0.97, "learning_rate": 0.00015484510642048207, "loss": 0.0115, "step": 373320 }, { "epoch": 0.97, "learning_rate": 0.0001548412182041106, "loss": 0.0153, "step": 373330 }, { "epoch": 0.97, "learning_rate": 0.00015483732998773913, "loss": 0.0112, "step": 373340 }, { "epoch": 0.97, "learning_rate": 0.0001548334417713677, "loss": 0.0146, "step": 373350 }, { "epoch": 0.97, "learning_rate": 0.0001548295535549962, "loss": 0.0123, "step": 373360 }, { "epoch": 0.97, "learning_rate": 0.00015482566533862475, "loss": 0.0098, "step": 373370 }, { "epoch": 0.97, "learning_rate": 0.00015482177712225327, "loss": 0.0102, "step": 373380 }, { "epoch": 0.97, "learning_rate": 0.00015481788890588184, "loss": 0.0136, "step": 373390 }, { "epoch": 0.97, "learning_rate": 0.00015481400068951038, "loss": 0.0119, "step": 373400 }, { "epoch": 0.97, "learning_rate": 0.0001548101124731389, "loss": 0.009, "step": 373410 }, { "epoch": 0.97, "learning_rate": 0.0001548062242567674, "loss": 0.0105, "step": 373420 }, { "epoch": 0.97, "learning_rate": 0.00015480233604039595, "loss": 0.0096, "step": 373430 }, { "epoch": 0.97, "learning_rate": 0.00015479844782402452, "loss": 0.0152, "step": 373440 }, { "epoch": 0.97, "learning_rate": 0.00015479455960765303, "loss": 0.0124, "step": 373450 }, { "epoch": 0.97, "learning_rate": 0.00015479067139128157, "loss": 0.0105, "step": 373460 }, { "epoch": 0.97, "learning_rate": 0.0001547867831749101, "loss": 0.01, "step": 373470 }, { "epoch": 0.97, "learning_rate": 0.00015478289495853866, "loss": 0.0129, "step": 373480 }, { "epoch": 0.97, "learning_rate": 0.00015477900674216717, "loss": 0.0141, "step": 373490 }, { "epoch": 0.97, "learning_rate": 0.0001547751185257957, "loss": 0.0122, "step": 373500 }, { "epoch": 0.97, "learning_rate": 0.00015477123030942423, "loss": 0.0144, "step": 373510 }, { "epoch": 0.97, "learning_rate": 0.0001547673420930528, "loss": 0.0136, "step": 373520 }, { "epoch": 0.97, "learning_rate": 0.0001547634538766813, "loss": 0.0121, "step": 373530 }, { "epoch": 0.97, "learning_rate": 0.00015475956566030985, "loss": 0.0209, "step": 373540 }, { "epoch": 0.97, "learning_rate": 0.00015475567744393837, "loss": 0.0131, "step": 373550 }, { "epoch": 0.97, "learning_rate": 0.00015475178922756694, "loss": 0.014, "step": 373560 }, { "epoch": 0.97, "learning_rate": 0.00015474790101119545, "loss": 0.011, "step": 373570 }, { "epoch": 0.97, "learning_rate": 0.000154744012794824, "loss": 0.0137, "step": 373580 }, { "epoch": 0.97, "learning_rate": 0.0001547401245784525, "loss": 0.0133, "step": 373590 }, { "epoch": 0.97, "learning_rate": 0.00015473623636208108, "loss": 0.0128, "step": 373600 }, { "epoch": 0.97, "learning_rate": 0.00015473234814570962, "loss": 0.0141, "step": 373610 }, { "epoch": 0.97, "learning_rate": 0.00015472845992933813, "loss": 0.0121, "step": 373620 }, { "epoch": 0.97, "learning_rate": 0.00015472457171296667, "loss": 0.0111, "step": 373630 }, { "epoch": 0.97, "learning_rate": 0.00015472068349659521, "loss": 0.0136, "step": 373640 }, { "epoch": 0.97, "learning_rate": 0.00015471679528022376, "loss": 0.012, "step": 373650 }, { "epoch": 0.97, "learning_rate": 0.00015471290706385227, "loss": 0.0145, "step": 373660 }, { "epoch": 0.97, "learning_rate": 0.0001547090188474808, "loss": 0.0117, "step": 373670 }, { "epoch": 0.97, "learning_rate": 0.00015470513063110933, "loss": 0.0133, "step": 373680 }, { "epoch": 0.97, "learning_rate": 0.0001547012424147379, "loss": 0.0121, "step": 373690 }, { "epoch": 0.97, "learning_rate": 0.0001546973541983664, "loss": 0.0139, "step": 373700 }, { "epoch": 0.97, "learning_rate": 0.00015469346598199495, "loss": 0.0119, "step": 373710 }, { "epoch": 0.97, "learning_rate": 0.00015468957776562347, "loss": 0.0119, "step": 373720 }, { "epoch": 0.97, "learning_rate": 0.00015468568954925204, "loss": 0.0095, "step": 373730 }, { "epoch": 0.97, "learning_rate": 0.00015468180133288055, "loss": 0.0121, "step": 373740 }, { "epoch": 0.97, "learning_rate": 0.0001546779131165091, "loss": 0.0375, "step": 373750 }, { "epoch": 0.97, "learning_rate": 0.0001546740249001376, "loss": 0.0106, "step": 373760 }, { "epoch": 0.97, "learning_rate": 0.00015467013668376617, "loss": 0.0124, "step": 373770 }, { "epoch": 0.97, "learning_rate": 0.00015466624846739472, "loss": 0.0335, "step": 373780 }, { "epoch": 0.97, "learning_rate": 0.00015466236025102323, "loss": 0.0131, "step": 373790 }, { "epoch": 0.97, "learning_rate": 0.00015465847203465177, "loss": 0.0119, "step": 373800 }, { "epoch": 0.97, "learning_rate": 0.00015465458381828031, "loss": 0.0126, "step": 373810 }, { "epoch": 0.97, "learning_rate": 0.00015465069560190886, "loss": 0.0152, "step": 373820 }, { "epoch": 0.97, "learning_rate": 0.00015464680738553737, "loss": 0.0144, "step": 373830 }, { "epoch": 0.97, "learning_rate": 0.0001546429191691659, "loss": 0.0127, "step": 373840 }, { "epoch": 0.97, "learning_rate": 0.00015463903095279445, "loss": 0.0101, "step": 373850 }, { "epoch": 0.97, "learning_rate": 0.000154635142736423, "loss": 0.0117, "step": 373860 }, { "epoch": 0.97, "learning_rate": 0.0001546312545200515, "loss": 0.015, "step": 373870 }, { "epoch": 0.97, "learning_rate": 0.00015462736630368005, "loss": 0.0143, "step": 373880 }, { "epoch": 0.97, "learning_rate": 0.0001546234780873086, "loss": 0.0178, "step": 373890 }, { "epoch": 0.97, "learning_rate": 0.00015461958987093713, "loss": 0.0122, "step": 373900 }, { "epoch": 0.97, "learning_rate": 0.00015461570165456565, "loss": 0.012, "step": 373910 }, { "epoch": 0.97, "learning_rate": 0.0001546118134381942, "loss": 0.0124, "step": 373920 }, { "epoch": 0.97, "learning_rate": 0.0001546079252218227, "loss": 0.0177, "step": 373930 }, { "epoch": 0.97, "learning_rate": 0.00015460403700545127, "loss": 0.0123, "step": 373940 }, { "epoch": 0.97, "learning_rate": 0.00015460014878907982, "loss": 0.0124, "step": 373950 }, { "epoch": 0.97, "learning_rate": 0.00015459626057270833, "loss": 0.0116, "step": 373960 }, { "epoch": 0.97, "learning_rate": 0.00015459237235633684, "loss": 0.0106, "step": 373970 }, { "epoch": 0.97, "learning_rate": 0.0001545884841399654, "loss": 0.0225, "step": 373980 }, { "epoch": 0.97, "learning_rate": 0.00015458459592359395, "loss": 0.0136, "step": 373990 }, { "epoch": 0.97, "learning_rate": 0.00015458070770722247, "loss": 0.0093, "step": 374000 }, { "epoch": 0.97, "eval_cer": 0.8817306790618513, "eval_loss": 0.00830517616122961, "eval_runtime": 107.6382, "eval_samples_per_second": 18.581, "eval_steps_per_second": 4.645, "step": 374000 }, { "epoch": 0.97, "learning_rate": 0.000154576819490851, "loss": 0.0149, "step": 374010 }, { "epoch": 0.97, "learning_rate": 0.00015457293127447955, "loss": 0.0112, "step": 374020 }, { "epoch": 0.97, "learning_rate": 0.0001545690430581081, "loss": 0.0113, "step": 374030 }, { "epoch": 0.97, "learning_rate": 0.0001545651548417366, "loss": 0.011, "step": 374040 }, { "epoch": 0.97, "learning_rate": 0.00015456126662536515, "loss": 0.0121, "step": 374050 }, { "epoch": 0.97, "learning_rate": 0.0001545573784089937, "loss": 0.0136, "step": 374060 }, { "epoch": 0.97, "learning_rate": 0.00015455349019262223, "loss": 0.0113, "step": 374070 }, { "epoch": 0.97, "learning_rate": 0.00015454960197625075, "loss": 0.0106, "step": 374080 }, { "epoch": 0.97, "learning_rate": 0.0001545457137598793, "loss": 0.0127, "step": 374090 }, { "epoch": 0.97, "learning_rate": 0.00015454182554350786, "loss": 0.0128, "step": 374100 }, { "epoch": 0.97, "learning_rate": 0.00015453793732713637, "loss": 0.0105, "step": 374110 }, { "epoch": 0.97, "learning_rate": 0.00015453404911076491, "loss": 0.0117, "step": 374120 }, { "epoch": 0.97, "learning_rate": 0.00015453016089439343, "loss": 0.0128, "step": 374130 }, { "epoch": 0.97, "learning_rate": 0.000154526272678022, "loss": 0.0095, "step": 374140 }, { "epoch": 0.97, "learning_rate": 0.0001545223844616505, "loss": 0.0117, "step": 374150 }, { "epoch": 0.97, "learning_rate": 0.00015451849624527905, "loss": 0.0129, "step": 374160 }, { "epoch": 0.97, "learning_rate": 0.00015451460802890757, "loss": 0.0164, "step": 374170 }, { "epoch": 0.97, "learning_rate": 0.0001545107198125361, "loss": 0.0122, "step": 374180 }, { "epoch": 0.97, "learning_rate": 0.00015450683159616465, "loss": 0.0124, "step": 374190 }, { "epoch": 0.97, "learning_rate": 0.0001545029433797932, "loss": 0.0113, "step": 374200 }, { "epoch": 0.97, "learning_rate": 0.0001544990551634217, "loss": 0.0121, "step": 374210 }, { "epoch": 0.97, "learning_rate": 0.00015449516694705025, "loss": 0.0144, "step": 374220 }, { "epoch": 0.97, "learning_rate": 0.0001544912787306788, "loss": 0.0105, "step": 374230 }, { "epoch": 0.97, "learning_rate": 0.00015448739051430733, "loss": 0.012, "step": 374240 }, { "epoch": 0.97, "learning_rate": 0.00015448350229793585, "loss": 0.0113, "step": 374250 }, { "epoch": 0.97, "learning_rate": 0.0001544796140815644, "loss": 0.0101, "step": 374260 }, { "epoch": 0.97, "learning_rate": 0.00015447572586519296, "loss": 0.0124, "step": 374270 }, { "epoch": 0.97, "learning_rate": 0.00015447183764882147, "loss": 0.0119, "step": 374280 }, { "epoch": 0.97, "learning_rate": 0.00015446794943245, "loss": 0.0113, "step": 374290 }, { "epoch": 0.97, "learning_rate": 0.00015446406121607853, "loss": 0.0136, "step": 374300 }, { "epoch": 0.97, "learning_rate": 0.0001544601729997071, "loss": 0.0129, "step": 374310 }, { "epoch": 0.97, "learning_rate": 0.0001544562847833356, "loss": 0.0132, "step": 374320 }, { "epoch": 0.97, "learning_rate": 0.00015445239656696415, "loss": 0.0102, "step": 374330 }, { "epoch": 0.97, "learning_rate": 0.00015444850835059267, "loss": 0.0136, "step": 374340 }, { "epoch": 0.97, "learning_rate": 0.00015444462013422124, "loss": 0.0133, "step": 374350 }, { "epoch": 0.97, "learning_rate": 0.00015444073191784975, "loss": 0.0124, "step": 374360 }, { "epoch": 0.97, "learning_rate": 0.0001544368437014783, "loss": 0.0125, "step": 374370 }, { "epoch": 0.97, "learning_rate": 0.0001544329554851068, "loss": 0.0131, "step": 374380 }, { "epoch": 0.97, "learning_rate": 0.00015442906726873538, "loss": 0.0148, "step": 374390 }, { "epoch": 0.97, "learning_rate": 0.0001544251790523639, "loss": 0.0112, "step": 374400 }, { "epoch": 0.97, "learning_rate": 0.00015442129083599243, "loss": 0.0128, "step": 374410 }, { "epoch": 0.97, "learning_rate": 0.00015441740261962095, "loss": 0.0117, "step": 374420 }, { "epoch": 0.97, "learning_rate": 0.0001544135144032495, "loss": 0.0117, "step": 374430 }, { "epoch": 0.97, "learning_rate": 0.00015440962618687803, "loss": 0.0116, "step": 374440 }, { "epoch": 0.97, "learning_rate": 0.00015440573797050657, "loss": 0.0103, "step": 374450 }, { "epoch": 0.97, "learning_rate": 0.0001544018497541351, "loss": 0.0122, "step": 374460 }, { "epoch": 0.97, "learning_rate": 0.00015439796153776363, "loss": 0.0107, "step": 374470 }, { "epoch": 0.97, "learning_rate": 0.0001543940733213922, "loss": 0.0156, "step": 374480 }, { "epoch": 0.97, "learning_rate": 0.0001543901851050207, "loss": 0.0129, "step": 374490 }, { "epoch": 0.97, "learning_rate": 0.00015438629688864925, "loss": 0.0138, "step": 374500 }, { "epoch": 0.97, "learning_rate": 0.00015438240867227777, "loss": 0.0105, "step": 374510 }, { "epoch": 0.97, "learning_rate": 0.00015437852045590634, "loss": 0.018, "step": 374520 }, { "epoch": 0.97, "learning_rate": 0.00015437463223953485, "loss": 0.011, "step": 374530 }, { "epoch": 0.97, "learning_rate": 0.0001543707440231634, "loss": 0.0123, "step": 374540 }, { "epoch": 0.97, "learning_rate": 0.0001543668558067919, "loss": 0.0084, "step": 374550 }, { "epoch": 0.97, "learning_rate": 0.00015436296759042048, "loss": 0.0109, "step": 374560 }, { "epoch": 0.97, "learning_rate": 0.000154359079374049, "loss": 0.0099, "step": 374570 }, { "epoch": 0.97, "learning_rate": 0.00015435519115767753, "loss": 0.01, "step": 374580 }, { "epoch": 0.97, "learning_rate": 0.00015435130294130605, "loss": 0.0104, "step": 374590 }, { "epoch": 0.97, "learning_rate": 0.00015434741472493462, "loss": 0.0114, "step": 374600 }, { "epoch": 0.97, "learning_rate": 0.00015434352650856313, "loss": 0.0107, "step": 374610 }, { "epoch": 0.97, "learning_rate": 0.00015433963829219167, "loss": 0.0104, "step": 374620 }, { "epoch": 0.97, "learning_rate": 0.00015433575007582019, "loss": 0.0132, "step": 374630 }, { "epoch": 0.97, "learning_rate": 0.00015433186185944875, "loss": 0.0109, "step": 374640 }, { "epoch": 0.97, "learning_rate": 0.0001543279736430773, "loss": 0.0116, "step": 374650 }, { "epoch": 0.97, "learning_rate": 0.0001543240854267058, "loss": 0.0136, "step": 374660 }, { "epoch": 0.97, "learning_rate": 0.00015432019721033435, "loss": 0.0124, "step": 374670 }, { "epoch": 0.97, "learning_rate": 0.00015431630899396287, "loss": 0.0108, "step": 374680 }, { "epoch": 0.97, "learning_rate": 0.00015431242077759144, "loss": 0.0153, "step": 374690 }, { "epoch": 0.97, "learning_rate": 0.00015430853256121995, "loss": 0.0108, "step": 374700 }, { "epoch": 0.97, "learning_rate": 0.0001543046443448485, "loss": 0.0102, "step": 374710 }, { "epoch": 0.97, "learning_rate": 0.000154300756128477, "loss": 0.0133, "step": 374720 }, { "epoch": 0.97, "learning_rate": 0.00015429686791210558, "loss": 0.0158, "step": 374730 }, { "epoch": 0.97, "learning_rate": 0.0001542929796957341, "loss": 0.0147, "step": 374740 }, { "epoch": 0.97, "learning_rate": 0.00015428909147936263, "loss": 0.0155, "step": 374750 }, { "epoch": 0.97, "learning_rate": 0.00015428520326299115, "loss": 0.0162, "step": 374760 }, { "epoch": 0.97, "learning_rate": 0.00015428131504661971, "loss": 0.0135, "step": 374770 }, { "epoch": 0.97, "learning_rate": 0.00015427742683024823, "loss": 0.0142, "step": 374780 }, { "epoch": 0.97, "learning_rate": 0.00015427353861387677, "loss": 0.0167, "step": 374790 }, { "epoch": 0.97, "learning_rate": 0.00015426965039750529, "loss": 0.0111, "step": 374800 }, { "epoch": 0.97, "learning_rate": 0.00015426576218113385, "loss": 0.0144, "step": 374810 }, { "epoch": 0.97, "learning_rate": 0.0001542618739647624, "loss": 0.0119, "step": 374820 }, { "epoch": 0.97, "learning_rate": 0.0001542579857483909, "loss": 0.0121, "step": 374830 }, { "epoch": 0.97, "learning_rate": 0.00015425409753201942, "loss": 0.0109, "step": 374840 }, { "epoch": 0.97, "learning_rate": 0.000154250209315648, "loss": 0.0141, "step": 374850 }, { "epoch": 0.97, "learning_rate": 0.00015424632109927654, "loss": 0.0165, "step": 374860 }, { "epoch": 0.97, "learning_rate": 0.00015424243288290505, "loss": 0.0116, "step": 374870 }, { "epoch": 0.97, "learning_rate": 0.0001542385446665336, "loss": 0.0142, "step": 374880 }, { "epoch": 0.97, "learning_rate": 0.0001542346564501621, "loss": 0.0122, "step": 374890 }, { "epoch": 0.97, "learning_rate": 0.00015423076823379067, "loss": 0.0128, "step": 374900 }, { "epoch": 0.97, "learning_rate": 0.0001542268800174192, "loss": 0.0132, "step": 374910 }, { "epoch": 0.97, "learning_rate": 0.00015422299180104773, "loss": 0.012, "step": 374920 }, { "epoch": 0.97, "learning_rate": 0.00015421910358467625, "loss": 0.0115, "step": 374930 }, { "epoch": 0.97, "learning_rate": 0.00015421521536830481, "loss": 0.0129, "step": 374940 }, { "epoch": 0.97, "learning_rate": 0.00015421132715193333, "loss": 0.0138, "step": 374950 }, { "epoch": 0.97, "learning_rate": 0.00015420743893556187, "loss": 0.0132, "step": 374960 }, { "epoch": 0.97, "learning_rate": 0.00015420355071919038, "loss": 0.0121, "step": 374970 }, { "epoch": 0.97, "learning_rate": 0.00015419966250281895, "loss": 0.01, "step": 374980 }, { "epoch": 0.97, "learning_rate": 0.0001541957742864475, "loss": 0.0172, "step": 374990 }, { "epoch": 0.97, "learning_rate": 0.000154191886070076, "loss": 0.0126, "step": 375000 }, { "epoch": 0.97, "eval_cer": 0.8817390768834564, "eval_loss": 0.008427051827311516, "eval_runtime": 107.5685, "eval_samples_per_second": 18.593, "eval_steps_per_second": 4.648, "step": 375000 }, { "epoch": 0.97, "learning_rate": 0.00015418799785370452, "loss": 0.012, "step": 375010 }, { "epoch": 0.97, "learning_rate": 0.0001541841096373331, "loss": 0.0136, "step": 375020 }, { "epoch": 0.97, "learning_rate": 0.00015418022142096163, "loss": 0.0121, "step": 375030 }, { "epoch": 0.97, "learning_rate": 0.00015417633320459015, "loss": 0.0115, "step": 375040 }, { "epoch": 0.97, "learning_rate": 0.0001541724449882187, "loss": 0.0122, "step": 375050 }, { "epoch": 0.97, "learning_rate": 0.00015416855677184723, "loss": 0.0134, "step": 375060 }, { "epoch": 0.97, "learning_rate": 0.00015416466855547577, "loss": 0.0157, "step": 375070 }, { "epoch": 0.97, "learning_rate": 0.0001541607803391043, "loss": 0.0129, "step": 375080 }, { "epoch": 0.97, "learning_rate": 0.00015415689212273283, "loss": 0.0113, "step": 375090 }, { "epoch": 0.97, "learning_rate": 0.00015415300390636137, "loss": 0.0138, "step": 375100 }, { "epoch": 0.97, "learning_rate": 0.00015414911568998991, "loss": 0.0128, "step": 375110 }, { "epoch": 0.97, "learning_rate": 0.00015414522747361843, "loss": 0.0138, "step": 375120 }, { "epoch": 0.97, "learning_rate": 0.00015414133925724697, "loss": 0.0142, "step": 375130 }, { "epoch": 0.97, "learning_rate": 0.00015413745104087548, "loss": 0.0141, "step": 375140 }, { "epoch": 0.97, "learning_rate": 0.00015413356282450405, "loss": 0.0139, "step": 375150 }, { "epoch": 0.97, "learning_rate": 0.00015412967460813257, "loss": 0.0134, "step": 375160 }, { "epoch": 0.97, "learning_rate": 0.0001541257863917611, "loss": 0.0132, "step": 375170 }, { "epoch": 0.97, "learning_rate": 0.00015412189817538962, "loss": 0.0132, "step": 375180 }, { "epoch": 0.97, "learning_rate": 0.0001541180099590182, "loss": 0.0134, "step": 375190 }, { "epoch": 0.97, "learning_rate": 0.00015411412174264673, "loss": 0.0126, "step": 375200 }, { "epoch": 0.97, "learning_rate": 0.00015411023352627525, "loss": 0.0144, "step": 375210 }, { "epoch": 0.97, "learning_rate": 0.0001541063453099038, "loss": 0.0116, "step": 375220 }, { "epoch": 0.97, "learning_rate": 0.00015410245709353233, "loss": 0.0129, "step": 375230 }, { "epoch": 0.97, "learning_rate": 0.00015409856887716087, "loss": 0.0108, "step": 375240 }, { "epoch": 0.97, "learning_rate": 0.0001540946806607894, "loss": 0.0103, "step": 375250 }, { "epoch": 0.97, "learning_rate": 0.00015409079244441793, "loss": 0.012, "step": 375260 }, { "epoch": 0.97, "learning_rate": 0.00015408690422804647, "loss": 0.012, "step": 375270 }, { "epoch": 0.97, "learning_rate": 0.000154083016011675, "loss": 0.0162, "step": 375280 }, { "epoch": 0.97, "learning_rate": 0.00015407912779530353, "loss": 0.0113, "step": 375290 }, { "epoch": 0.97, "learning_rate": 0.00015407523957893207, "loss": 0.012, "step": 375300 }, { "epoch": 0.97, "learning_rate": 0.0001540713513625606, "loss": 0.0138, "step": 375310 }, { "epoch": 0.97, "learning_rate": 0.00015406746314618915, "loss": 0.0123, "step": 375320 }, { "epoch": 0.97, "learning_rate": 0.00015406357492981767, "loss": 0.0154, "step": 375330 }, { "epoch": 0.97, "learning_rate": 0.0001540596867134462, "loss": 0.0112, "step": 375340 }, { "epoch": 0.97, "learning_rate": 0.00015405579849707478, "loss": 0.0159, "step": 375350 }, { "epoch": 0.97, "learning_rate": 0.0001540519102807033, "loss": 0.0166, "step": 375360 }, { "epoch": 0.97, "learning_rate": 0.00015404802206433183, "loss": 0.013, "step": 375370 }, { "epoch": 0.97, "learning_rate": 0.00015404413384796035, "loss": 0.0176, "step": 375380 }, { "epoch": 0.97, "learning_rate": 0.0001540402456315889, "loss": 0.012, "step": 375390 }, { "epoch": 0.97, "learning_rate": 0.00015403635741521743, "loss": 0.0134, "step": 375400 }, { "epoch": 0.97, "learning_rate": 0.00015403246919884597, "loss": 0.0095, "step": 375410 }, { "epoch": 0.97, "learning_rate": 0.0001540285809824745, "loss": 0.0134, "step": 375420 }, { "epoch": 0.97, "learning_rate": 0.00015402469276610303, "loss": 0.0123, "step": 375430 }, { "epoch": 0.97, "learning_rate": 0.00015402080454973157, "loss": 0.0093, "step": 375440 }, { "epoch": 0.97, "learning_rate": 0.0001540169163333601, "loss": 0.0111, "step": 375450 }, { "epoch": 0.97, "learning_rate": 0.00015401302811698863, "loss": 0.0144, "step": 375460 }, { "epoch": 0.97, "learning_rate": 0.00015400913990061717, "loss": 0.0089, "step": 375470 }, { "epoch": 0.97, "learning_rate": 0.0001540052516842457, "loss": 0.0119, "step": 375480 }, { "epoch": 0.97, "learning_rate": 0.00015400136346787425, "loss": 0.0127, "step": 375490 }, { "epoch": 0.97, "learning_rate": 0.00015399747525150277, "loss": 0.0097, "step": 375500 }, { "epoch": 0.97, "learning_rate": 0.0001539935870351313, "loss": 0.0121, "step": 375510 }, { "epoch": 0.97, "learning_rate": 0.00015398969881875988, "loss": 0.0147, "step": 375520 }, { "epoch": 0.97, "learning_rate": 0.0001539858106023884, "loss": 0.0114, "step": 375530 }, { "epoch": 0.97, "learning_rate": 0.00015398192238601693, "loss": 0.0141, "step": 375540 }, { "epoch": 0.97, "learning_rate": 0.00015397803416964545, "loss": 0.013, "step": 375550 }, { "epoch": 0.97, "learning_rate": 0.00015397414595327402, "loss": 0.0153, "step": 375560 }, { "epoch": 0.97, "learning_rate": 0.00015397025773690253, "loss": 0.016, "step": 375570 }, { "epoch": 0.97, "learning_rate": 0.00015396636952053107, "loss": 0.0156, "step": 375580 }, { "epoch": 0.97, "learning_rate": 0.0001539624813041596, "loss": 0.0181, "step": 375590 }, { "epoch": 0.97, "learning_rate": 0.00015395859308778816, "loss": 0.0137, "step": 375600 }, { "epoch": 0.97, "learning_rate": 0.00015395470487141667, "loss": 0.019, "step": 375610 }, { "epoch": 0.97, "learning_rate": 0.0001539508166550452, "loss": 0.0165, "step": 375620 }, { "epoch": 0.97, "learning_rate": 0.00015394692843867373, "loss": 0.0128, "step": 375630 }, { "epoch": 0.97, "learning_rate": 0.00015394304022230227, "loss": 0.0121, "step": 375640 }, { "epoch": 0.97, "learning_rate": 0.0001539391520059308, "loss": 0.0133, "step": 375650 }, { "epoch": 0.97, "learning_rate": 0.00015393526378955935, "loss": 0.0156, "step": 375660 }, { "epoch": 0.97, "learning_rate": 0.00015393137557318787, "loss": 0.0127, "step": 375670 }, { "epoch": 0.97, "learning_rate": 0.0001539274873568164, "loss": 0.0118, "step": 375680 }, { "epoch": 0.97, "learning_rate": 0.00015392359914044498, "loss": 0.022, "step": 375690 }, { "epoch": 0.97, "learning_rate": 0.0001539197109240735, "loss": 0.0113, "step": 375700 }, { "epoch": 0.97, "learning_rate": 0.00015391582270770203, "loss": 0.0122, "step": 375710 }, { "epoch": 0.97, "learning_rate": 0.00015391193449133055, "loss": 0.0158, "step": 375720 }, { "epoch": 0.97, "learning_rate": 0.00015390804627495912, "loss": 0.0138, "step": 375730 }, { "epoch": 0.97, "learning_rate": 0.00015390415805858763, "loss": 0.0114, "step": 375740 }, { "epoch": 0.97, "learning_rate": 0.00015390026984221617, "loss": 0.014, "step": 375750 }, { "epoch": 0.97, "learning_rate": 0.0001538963816258447, "loss": 0.0115, "step": 375760 }, { "epoch": 0.97, "learning_rate": 0.00015389249340947326, "loss": 0.009, "step": 375770 }, { "epoch": 0.97, "learning_rate": 0.00015388860519310177, "loss": 0.0104, "step": 375780 }, { "epoch": 0.97, "learning_rate": 0.0001538847169767303, "loss": 0.0113, "step": 375790 }, { "epoch": 0.97, "learning_rate": 0.00015388082876035883, "loss": 0.0145, "step": 375800 }, { "epoch": 0.97, "learning_rate": 0.0001538769405439874, "loss": 0.012, "step": 375810 }, { "epoch": 0.97, "learning_rate": 0.0001538730523276159, "loss": 0.0172, "step": 375820 }, { "epoch": 0.97, "learning_rate": 0.00015386916411124445, "loss": 0.011, "step": 375830 }, { "epoch": 0.97, "learning_rate": 0.00015386527589487297, "loss": 0.015, "step": 375840 }, { "epoch": 0.97, "learning_rate": 0.00015386138767850153, "loss": 0.0109, "step": 375850 }, { "epoch": 0.97, "learning_rate": 0.00015385749946213008, "loss": 0.013, "step": 375860 }, { "epoch": 0.97, "learning_rate": 0.0001538536112457586, "loss": 0.0108, "step": 375870 }, { "epoch": 0.97, "learning_rate": 0.0001538497230293871, "loss": 0.0117, "step": 375880 }, { "epoch": 0.97, "learning_rate": 0.00015384583481301565, "loss": 0.0118, "step": 375890 }, { "epoch": 0.97, "learning_rate": 0.00015384194659664422, "loss": 0.0131, "step": 375900 }, { "epoch": 0.97, "learning_rate": 0.00015383805838027273, "loss": 0.0132, "step": 375910 }, { "epoch": 0.97, "learning_rate": 0.00015383417016390127, "loss": 0.0114, "step": 375920 }, { "epoch": 0.97, "learning_rate": 0.00015383028194752979, "loss": 0.0118, "step": 375930 }, { "epoch": 0.97, "learning_rate": 0.00015382639373115835, "loss": 0.0125, "step": 375940 }, { "epoch": 0.97, "learning_rate": 0.00015382250551478687, "loss": 0.0095, "step": 375950 }, { "epoch": 0.97, "learning_rate": 0.0001538186172984154, "loss": 0.0148, "step": 375960 }, { "epoch": 0.97, "learning_rate": 0.00015381472908204393, "loss": 0.0193, "step": 375970 }, { "epoch": 0.97, "learning_rate": 0.0001538108408656725, "loss": 0.0105, "step": 375980 }, { "epoch": 0.97, "learning_rate": 0.000153806952649301, "loss": 0.0117, "step": 375990 }, { "epoch": 0.97, "learning_rate": 0.00015380306443292955, "loss": 0.0167, "step": 376000 }, { "epoch": 0.97, "eval_cer": 0.8817334783357197, "eval_loss": 0.008328206837177277, "eval_runtime": 107.5837, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.648, "step": 376000 }, { "epoch": 0.97, "learning_rate": 0.00015379917621655806, "loss": 0.0117, "step": 376010 }, { "epoch": 0.97, "learning_rate": 0.00015379528800018663, "loss": 0.0131, "step": 376020 }, { "epoch": 0.97, "learning_rate": 0.00015379139978381515, "loss": 0.0111, "step": 376030 }, { "epoch": 0.97, "learning_rate": 0.0001537875115674437, "loss": 0.0131, "step": 376040 }, { "epoch": 0.97, "learning_rate": 0.0001537836233510722, "loss": 0.0131, "step": 376050 }, { "epoch": 0.97, "learning_rate": 0.00015377973513470077, "loss": 0.0114, "step": 376060 }, { "epoch": 0.97, "learning_rate": 0.00015377584691832931, "loss": 0.0101, "step": 376070 }, { "epoch": 0.97, "learning_rate": 0.00015377195870195783, "loss": 0.0125, "step": 376080 }, { "epoch": 0.97, "learning_rate": 0.00015376807048558637, "loss": 0.0163, "step": 376090 }, { "epoch": 0.97, "learning_rate": 0.0001537641822692149, "loss": 0.0117, "step": 376100 }, { "epoch": 0.97, "learning_rate": 0.00015376029405284345, "loss": 0.0099, "step": 376110 }, { "epoch": 0.97, "learning_rate": 0.00015375640583647197, "loss": 0.0119, "step": 376120 }, { "epoch": 0.97, "learning_rate": 0.0001537525176201005, "loss": 0.0125, "step": 376130 }, { "epoch": 0.98, "learning_rate": 0.00015374862940372902, "loss": 0.0134, "step": 376140 }, { "epoch": 0.98, "learning_rate": 0.0001537447411873576, "loss": 0.0094, "step": 376150 }, { "epoch": 0.98, "learning_rate": 0.0001537408529709861, "loss": 0.0121, "step": 376160 }, { "epoch": 0.98, "learning_rate": 0.00015373696475461465, "loss": 0.0121, "step": 376170 }, { "epoch": 0.98, "learning_rate": 0.00015373307653824316, "loss": 0.0144, "step": 376180 }, { "epoch": 0.98, "learning_rate": 0.00015372918832187173, "loss": 0.0118, "step": 376190 }, { "epoch": 0.98, "learning_rate": 0.00015372530010550025, "loss": 0.0126, "step": 376200 }, { "epoch": 0.98, "learning_rate": 0.0001537214118891288, "loss": 0.0116, "step": 376210 }, { "epoch": 0.98, "learning_rate": 0.0001537175236727573, "loss": 0.0099, "step": 376220 }, { "epoch": 0.98, "learning_rate": 0.00015371363545638587, "loss": 0.0126, "step": 376230 }, { "epoch": 0.98, "learning_rate": 0.00015370974724001441, "loss": 0.0149, "step": 376240 }, { "epoch": 0.98, "learning_rate": 0.00015370585902364293, "loss": 0.0143, "step": 376250 }, { "epoch": 0.98, "learning_rate": 0.00015370197080727147, "loss": 0.0122, "step": 376260 }, { "epoch": 0.98, "learning_rate": 0.0001536980825909, "loss": 0.0151, "step": 376270 }, { "epoch": 0.98, "learning_rate": 0.00015369419437452855, "loss": 0.0107, "step": 376280 }, { "epoch": 0.98, "learning_rate": 0.00015369030615815707, "loss": 0.0111, "step": 376290 }, { "epoch": 0.98, "learning_rate": 0.0001536864179417856, "loss": 0.0106, "step": 376300 }, { "epoch": 0.98, "learning_rate": 0.00015368252972541415, "loss": 0.0125, "step": 376310 }, { "epoch": 0.98, "learning_rate": 0.0001536786415090427, "loss": 0.0105, "step": 376320 }, { "epoch": 0.98, "learning_rate": 0.0001536747532926712, "loss": 0.0126, "step": 376330 }, { "epoch": 0.98, "learning_rate": 0.00015367086507629975, "loss": 0.012, "step": 376340 }, { "epoch": 0.98, "learning_rate": 0.0001536669768599283, "loss": 0.0126, "step": 376350 }, { "epoch": 0.98, "learning_rate": 0.00015366308864355683, "loss": 0.0164, "step": 376360 }, { "epoch": 0.98, "learning_rate": 0.00015365920042718535, "loss": 0.0115, "step": 376370 }, { "epoch": 0.98, "learning_rate": 0.0001536553122108139, "loss": 0.0146, "step": 376380 }, { "epoch": 0.98, "learning_rate": 0.0001536514239944424, "loss": 0.0122, "step": 376390 }, { "epoch": 0.98, "learning_rate": 0.00015364753577807097, "loss": 0.0119, "step": 376400 }, { "epoch": 0.98, "learning_rate": 0.0001536436475616995, "loss": 0.0133, "step": 376410 }, { "epoch": 0.98, "learning_rate": 0.00015363975934532803, "loss": 0.0097, "step": 376420 }, { "epoch": 0.98, "learning_rate": 0.00015363587112895654, "loss": 0.0119, "step": 376430 }, { "epoch": 0.98, "learning_rate": 0.0001536319829125851, "loss": 0.011, "step": 376440 }, { "epoch": 0.98, "learning_rate": 0.00015362809469621365, "loss": 0.0143, "step": 376450 }, { "epoch": 0.98, "learning_rate": 0.00015362420647984217, "loss": 0.0145, "step": 376460 }, { "epoch": 0.98, "learning_rate": 0.0001536203182634707, "loss": 0.0138, "step": 376470 }, { "epoch": 0.98, "learning_rate": 0.00015361643004709925, "loss": 0.0131, "step": 376480 }, { "epoch": 0.98, "learning_rate": 0.0001536125418307278, "loss": 0.0128, "step": 376490 }, { "epoch": 0.98, "learning_rate": 0.0001536086536143563, "loss": 0.0168, "step": 376500 }, { "epoch": 0.98, "learning_rate": 0.00015360476539798485, "loss": 0.0113, "step": 376510 }, { "epoch": 0.98, "learning_rate": 0.0001536008771816134, "loss": 0.0134, "step": 376520 }, { "epoch": 0.98, "learning_rate": 0.00015359698896524193, "loss": 0.0103, "step": 376530 }, { "epoch": 0.98, "learning_rate": 0.00015359310074887045, "loss": 0.0116, "step": 376540 }, { "epoch": 0.98, "learning_rate": 0.000153589212532499, "loss": 0.0098, "step": 376550 }, { "epoch": 0.98, "learning_rate": 0.00015358532431612756, "loss": 0.0138, "step": 376560 }, { "epoch": 0.98, "learning_rate": 0.00015358143609975607, "loss": 0.015, "step": 376570 }, { "epoch": 0.98, "learning_rate": 0.0001535775478833846, "loss": 0.02, "step": 376580 }, { "epoch": 0.98, "learning_rate": 0.00015357365966701313, "loss": 0.0111, "step": 376590 }, { "epoch": 0.98, "learning_rate": 0.0001535697714506417, "loss": 0.0141, "step": 376600 }, { "epoch": 0.98, "learning_rate": 0.0001535658832342702, "loss": 0.0106, "step": 376610 }, { "epoch": 0.98, "learning_rate": 0.00015356199501789875, "loss": 0.0111, "step": 376620 }, { "epoch": 0.98, "learning_rate": 0.00015355810680152727, "loss": 0.0108, "step": 376630 }, { "epoch": 0.98, "learning_rate": 0.0001535542185851558, "loss": 0.0119, "step": 376640 }, { "epoch": 0.98, "learning_rate": 0.00015355033036878435, "loss": 0.0127, "step": 376650 }, { "epoch": 0.98, "learning_rate": 0.0001535464421524129, "loss": 0.012, "step": 376660 }, { "epoch": 0.98, "learning_rate": 0.0001535425539360414, "loss": 0.0129, "step": 376670 }, { "epoch": 0.98, "learning_rate": 0.00015353866571966995, "loss": 0.0101, "step": 376680 }, { "epoch": 0.98, "learning_rate": 0.0001535347775032985, "loss": 0.0116, "step": 376690 }, { "epoch": 0.98, "learning_rate": 0.00015353088928692703, "loss": 0.0155, "step": 376700 }, { "epoch": 0.98, "learning_rate": 0.00015352700107055555, "loss": 0.0125, "step": 376710 }, { "epoch": 0.98, "learning_rate": 0.0001535231128541841, "loss": 0.0108, "step": 376720 }, { "epoch": 0.98, "learning_rate": 0.00015351922463781266, "loss": 0.0146, "step": 376730 }, { "epoch": 0.98, "learning_rate": 0.00015351533642144117, "loss": 0.0108, "step": 376740 }, { "epoch": 0.98, "learning_rate": 0.00015351144820506969, "loss": 0.011, "step": 376750 }, { "epoch": 0.98, "learning_rate": 0.00015350755998869823, "loss": 0.0123, "step": 376760 }, { "epoch": 0.98, "learning_rate": 0.0001535036717723268, "loss": 0.0093, "step": 376770 }, { "epoch": 0.98, "learning_rate": 0.0001534997835559553, "loss": 0.0158, "step": 376780 }, { "epoch": 0.98, "learning_rate": 0.00015349589533958385, "loss": 0.0162, "step": 376790 }, { "epoch": 0.98, "learning_rate": 0.00015349200712321237, "loss": 0.0099, "step": 376800 }, { "epoch": 0.98, "learning_rate": 0.00015348811890684094, "loss": 0.0122, "step": 376810 }, { "epoch": 0.98, "learning_rate": 0.00015348423069046945, "loss": 0.0103, "step": 376820 }, { "epoch": 0.98, "learning_rate": 0.000153480342474098, "loss": 0.0084, "step": 376830 }, { "epoch": 0.98, "learning_rate": 0.0001534764542577265, "loss": 0.0109, "step": 376840 }, { "epoch": 0.98, "learning_rate": 0.00015347256604135507, "loss": 0.0149, "step": 376850 }, { "epoch": 0.98, "learning_rate": 0.0001534686778249836, "loss": 0.0115, "step": 376860 }, { "epoch": 0.98, "learning_rate": 0.00015346478960861213, "loss": 0.0099, "step": 376870 }, { "epoch": 0.98, "learning_rate": 0.00015346090139224065, "loss": 0.0134, "step": 376880 }, { "epoch": 0.98, "learning_rate": 0.0001534570131758692, "loss": 0.0121, "step": 376890 }, { "epoch": 0.98, "learning_rate": 0.00015345312495949773, "loss": 0.0126, "step": 376900 }, { "epoch": 0.98, "learning_rate": 0.00015344923674312627, "loss": 0.0098, "step": 376910 }, { "epoch": 0.98, "learning_rate": 0.00015344534852675478, "loss": 0.01, "step": 376920 }, { "epoch": 0.98, "learning_rate": 0.00015344146031038333, "loss": 0.0118, "step": 376930 }, { "epoch": 0.98, "learning_rate": 0.0001534375720940119, "loss": 0.0104, "step": 376940 }, { "epoch": 0.98, "learning_rate": 0.0001534336838776404, "loss": 0.0127, "step": 376950 }, { "epoch": 0.98, "learning_rate": 0.00015342979566126895, "loss": 0.0136, "step": 376960 }, { "epoch": 0.98, "learning_rate": 0.00015342590744489747, "loss": 0.0106, "step": 376970 }, { "epoch": 0.98, "learning_rate": 0.00015342201922852603, "loss": 0.0127, "step": 376980 }, { "epoch": 0.98, "learning_rate": 0.00015341813101215455, "loss": 0.012, "step": 376990 }, { "epoch": 0.98, "learning_rate": 0.0001534142427957831, "loss": 0.0122, "step": 377000 }, { "epoch": 0.98, "eval_cer": 0.8817376772465223, "eval_loss": 0.008020076900720596, "eval_runtime": 107.5591, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 377000 }, { "epoch": 0.98, "learning_rate": 0.0001534103545794116, "loss": 0.0136, "step": 377010 }, { "epoch": 0.98, "learning_rate": 0.00015340646636304017, "loss": 0.013, "step": 377020 }, { "epoch": 0.98, "learning_rate": 0.0001534025781466687, "loss": 0.0139, "step": 377030 }, { "epoch": 0.98, "learning_rate": 0.00015339868993029723, "loss": 0.0122, "step": 377040 }, { "epoch": 0.98, "learning_rate": 0.00015339480171392574, "loss": 0.0121, "step": 377050 }, { "epoch": 0.98, "learning_rate": 0.0001533909134975543, "loss": 0.0132, "step": 377060 }, { "epoch": 0.98, "learning_rate": 0.00015338702528118283, "loss": 0.0164, "step": 377070 }, { "epoch": 0.98, "learning_rate": 0.00015338313706481137, "loss": 0.0148, "step": 377080 }, { "epoch": 0.98, "learning_rate": 0.00015337924884843988, "loss": 0.0108, "step": 377090 }, { "epoch": 0.98, "learning_rate": 0.00015337536063206845, "loss": 0.0115, "step": 377100 }, { "epoch": 0.98, "learning_rate": 0.000153371472415697, "loss": 0.0153, "step": 377110 }, { "epoch": 0.98, "learning_rate": 0.0001533675841993255, "loss": 0.0136, "step": 377120 }, { "epoch": 0.98, "learning_rate": 0.00015336369598295405, "loss": 0.0125, "step": 377130 }, { "epoch": 0.98, "learning_rate": 0.00015335980776658257, "loss": 0.0153, "step": 377140 }, { "epoch": 0.98, "learning_rate": 0.00015335591955021113, "loss": 0.0119, "step": 377150 }, { "epoch": 0.98, "learning_rate": 0.00015335203133383965, "loss": 0.0117, "step": 377160 }, { "epoch": 0.98, "learning_rate": 0.0001533481431174682, "loss": 0.0142, "step": 377170 }, { "epoch": 0.98, "learning_rate": 0.0001533442549010967, "loss": 0.0155, "step": 377180 }, { "epoch": 0.98, "learning_rate": 0.00015334036668472527, "loss": 0.013, "step": 377190 }, { "epoch": 0.98, "learning_rate": 0.0001533364784683538, "loss": 0.014, "step": 377200 }, { "epoch": 0.98, "learning_rate": 0.00015333259025198233, "loss": 0.0097, "step": 377210 }, { "epoch": 0.98, "learning_rate": 0.00015332870203561084, "loss": 0.0111, "step": 377220 }, { "epoch": 0.98, "learning_rate": 0.0001533248138192394, "loss": 0.0103, "step": 377230 }, { "epoch": 0.98, "learning_rate": 0.00015332092560286793, "loss": 0.0173, "step": 377240 }, { "epoch": 0.98, "learning_rate": 0.00015331703738649647, "loss": 0.0107, "step": 377250 }, { "epoch": 0.98, "learning_rate": 0.00015331314917012498, "loss": 0.0136, "step": 377260 }, { "epoch": 0.98, "learning_rate": 0.00015330926095375355, "loss": 0.0142, "step": 377270 }, { "epoch": 0.98, "learning_rate": 0.0001533053727373821, "loss": 0.0126, "step": 377280 }, { "epoch": 0.98, "learning_rate": 0.0001533014845210106, "loss": 0.0124, "step": 377290 }, { "epoch": 0.98, "learning_rate": 0.00015329759630463912, "loss": 0.0116, "step": 377300 }, { "epoch": 0.98, "learning_rate": 0.0001532937080882677, "loss": 0.0132, "step": 377310 }, { "epoch": 0.98, "learning_rate": 0.00015328981987189623, "loss": 0.0159, "step": 377320 }, { "epoch": 0.98, "learning_rate": 0.00015328593165552475, "loss": 0.0113, "step": 377330 }, { "epoch": 0.98, "learning_rate": 0.0001532820434391533, "loss": 0.0164, "step": 377340 }, { "epoch": 0.98, "learning_rate": 0.00015327815522278183, "loss": 0.0129, "step": 377350 }, { "epoch": 0.98, "learning_rate": 0.00015327426700641037, "loss": 0.0112, "step": 377360 }, { "epoch": 0.98, "learning_rate": 0.0001532703787900389, "loss": 0.0139, "step": 377370 }, { "epoch": 0.98, "learning_rate": 0.00015326649057366743, "loss": 0.0149, "step": 377380 }, { "epoch": 0.98, "learning_rate": 0.00015326260235729594, "loss": 0.0128, "step": 377390 }, { "epoch": 0.98, "learning_rate": 0.0001532587141409245, "loss": 0.0113, "step": 377400 }, { "epoch": 0.98, "learning_rate": 0.00015325482592455303, "loss": 0.0165, "step": 377410 }, { "epoch": 0.98, "learning_rate": 0.00015325093770818157, "loss": 0.014, "step": 377420 }, { "epoch": 0.98, "learning_rate": 0.00015324704949181008, "loss": 0.0112, "step": 377430 }, { "epoch": 0.98, "learning_rate": 0.00015324316127543865, "loss": 0.011, "step": 377440 }, { "epoch": 0.98, "learning_rate": 0.0001532392730590672, "loss": 0.0126, "step": 377450 }, { "epoch": 0.98, "learning_rate": 0.0001532353848426957, "loss": 0.0112, "step": 377460 }, { "epoch": 0.98, "learning_rate": 0.00015323149662632422, "loss": 0.0141, "step": 377470 }, { "epoch": 0.98, "learning_rate": 0.0001532276084099528, "loss": 0.0146, "step": 377480 }, { "epoch": 0.98, "learning_rate": 0.00015322372019358133, "loss": 0.0167, "step": 377490 }, { "epoch": 0.98, "learning_rate": 0.00015321983197720985, "loss": 0.0122, "step": 377500 }, { "epoch": 0.98, "learning_rate": 0.0001532159437608384, "loss": 0.0103, "step": 377510 }, { "epoch": 0.98, "learning_rate": 0.00015321205554446693, "loss": 0.0164, "step": 377520 }, { "epoch": 0.98, "learning_rate": 0.00015320816732809547, "loss": 0.0119, "step": 377530 }, { "epoch": 0.98, "learning_rate": 0.000153204279111724, "loss": 0.0133, "step": 377540 }, { "epoch": 0.98, "learning_rate": 0.00015320039089535253, "loss": 0.0155, "step": 377550 }, { "epoch": 0.98, "learning_rate": 0.00015319650267898107, "loss": 0.0158, "step": 377560 }, { "epoch": 0.98, "learning_rate": 0.0001531926144626096, "loss": 0.0127, "step": 377570 }, { "epoch": 0.98, "learning_rate": 0.00015318872624623813, "loss": 0.0121, "step": 377580 }, { "epoch": 0.98, "learning_rate": 0.00015318483802986667, "loss": 0.0123, "step": 377590 }, { "epoch": 0.98, "learning_rate": 0.00015318094981349524, "loss": 0.0129, "step": 377600 }, { "epoch": 0.98, "learning_rate": 0.00015317706159712375, "loss": 0.0137, "step": 377610 }, { "epoch": 0.98, "learning_rate": 0.00015317317338075227, "loss": 0.0115, "step": 377620 }, { "epoch": 0.98, "learning_rate": 0.0001531692851643808, "loss": 0.0162, "step": 377630 }, { "epoch": 0.98, "learning_rate": 0.00015316539694800932, "loss": 0.012, "step": 377640 }, { "epoch": 0.98, "learning_rate": 0.0001531615087316379, "loss": 0.016, "step": 377650 }, { "epoch": 0.98, "learning_rate": 0.00015315762051526643, "loss": 0.0138, "step": 377660 }, { "epoch": 0.98, "learning_rate": 0.00015315373229889495, "loss": 0.0119, "step": 377670 }, { "epoch": 0.98, "learning_rate": 0.0001531498440825235, "loss": 0.0092, "step": 377680 }, { "epoch": 0.98, "learning_rate": 0.00015314595586615203, "loss": 0.0142, "step": 377690 }, { "epoch": 0.98, "learning_rate": 0.00015314206764978057, "loss": 0.0119, "step": 377700 }, { "epoch": 0.98, "learning_rate": 0.00015313817943340909, "loss": 0.0115, "step": 377710 }, { "epoch": 0.98, "learning_rate": 0.00015313429121703763, "loss": 0.0131, "step": 377720 }, { "epoch": 0.98, "learning_rate": 0.00015313040300066617, "loss": 0.0123, "step": 377730 }, { "epoch": 0.98, "learning_rate": 0.0001531265147842947, "loss": 0.015, "step": 377740 }, { "epoch": 0.98, "learning_rate": 0.00015312262656792323, "loss": 0.0177, "step": 377750 }, { "epoch": 0.98, "learning_rate": 0.00015311873835155177, "loss": 0.0122, "step": 377760 }, { "epoch": 0.98, "learning_rate": 0.00015311485013518034, "loss": 0.0168, "step": 377770 }, { "epoch": 0.98, "learning_rate": 0.00015311096191880885, "loss": 0.0161, "step": 377780 }, { "epoch": 0.98, "learning_rate": 0.00015310707370243736, "loss": 0.0113, "step": 377790 }, { "epoch": 0.98, "learning_rate": 0.0001531031854860659, "loss": 0.0118, "step": 377800 }, { "epoch": 0.98, "learning_rate": 0.00015309929726969448, "loss": 0.0152, "step": 377810 }, { "epoch": 0.98, "learning_rate": 0.000153095409053323, "loss": 0.0119, "step": 377820 }, { "epoch": 0.98, "learning_rate": 0.00015309152083695153, "loss": 0.0119, "step": 377830 }, { "epoch": 0.98, "learning_rate": 0.00015308763262058005, "loss": 0.0152, "step": 377840 }, { "epoch": 0.98, "learning_rate": 0.00015308374440420861, "loss": 0.0141, "step": 377850 }, { "epoch": 0.98, "learning_rate": 0.00015307985618783713, "loss": 0.0201, "step": 377860 }, { "epoch": 0.98, "learning_rate": 0.00015307596797146567, "loss": 0.0134, "step": 377870 }, { "epoch": 0.98, "learning_rate": 0.00015307207975509419, "loss": 0.0149, "step": 377880 }, { "epoch": 0.98, "learning_rate": 0.00015306819153872273, "loss": 0.0148, "step": 377890 }, { "epoch": 0.98, "learning_rate": 0.00015306430332235127, "loss": 0.0097, "step": 377900 }, { "epoch": 0.98, "learning_rate": 0.0001530604151059798, "loss": 0.017, "step": 377910 }, { "epoch": 0.98, "learning_rate": 0.00015305652688960832, "loss": 0.0128, "step": 377920 }, { "epoch": 0.98, "learning_rate": 0.00015305263867323687, "loss": 0.0106, "step": 377930 }, { "epoch": 0.98, "learning_rate": 0.0001530487504568654, "loss": 0.015, "step": 377940 }, { "epoch": 0.98, "learning_rate": 0.00015304486224049395, "loss": 0.0151, "step": 377950 }, { "epoch": 0.98, "learning_rate": 0.00015304097402412246, "loss": 0.0135, "step": 377960 }, { "epoch": 0.98, "learning_rate": 0.000153037085807751, "loss": 0.0145, "step": 377970 }, { "epoch": 0.98, "learning_rate": 0.00015303319759137957, "loss": 0.0121, "step": 377980 }, { "epoch": 0.98, "learning_rate": 0.0001530293093750081, "loss": 0.0123, "step": 377990 }, { "epoch": 0.98, "learning_rate": 0.00015302542115863663, "loss": 0.0192, "step": 378000 }, { "epoch": 0.98, "eval_cer": 0.8817712685329425, "eval_loss": 0.008189625106751919, "eval_runtime": 107.5946, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 378000 }, { "epoch": 0.98, "learning_rate": 0.00015302153294226515, "loss": 0.0133, "step": 378010 }, { "epoch": 0.98, "learning_rate": 0.00015301764472589371, "loss": 0.0129, "step": 378020 }, { "epoch": 0.98, "learning_rate": 0.00015301375650952223, "loss": 0.0125, "step": 378030 }, { "epoch": 0.98, "learning_rate": 0.00015300986829315077, "loss": 0.0116, "step": 378040 }, { "epoch": 0.98, "learning_rate": 0.00015300598007677928, "loss": 0.0158, "step": 378050 }, { "epoch": 0.98, "learning_rate": 0.00015300209186040785, "loss": 0.0118, "step": 378060 }, { "epoch": 0.98, "learning_rate": 0.00015299820364403637, "loss": 0.011, "step": 378070 }, { "epoch": 0.98, "learning_rate": 0.0001529943154276649, "loss": 0.0133, "step": 378080 }, { "epoch": 0.98, "learning_rate": 0.00015299042721129342, "loss": 0.0109, "step": 378090 }, { "epoch": 0.98, "learning_rate": 0.000152986538994922, "loss": 0.0133, "step": 378100 }, { "epoch": 0.98, "learning_rate": 0.0001529826507785505, "loss": 0.0132, "step": 378110 }, { "epoch": 0.98, "learning_rate": 0.00015297876256217905, "loss": 0.009, "step": 378120 }, { "epoch": 0.98, "learning_rate": 0.00015297487434580756, "loss": 0.0114, "step": 378130 }, { "epoch": 0.98, "learning_rate": 0.0001529709861294361, "loss": 0.0119, "step": 378140 }, { "epoch": 0.98, "learning_rate": 0.00015296709791306467, "loss": 0.0121, "step": 378150 }, { "epoch": 0.98, "learning_rate": 0.0001529632096966932, "loss": 0.0115, "step": 378160 }, { "epoch": 0.98, "learning_rate": 0.00015295932148032173, "loss": 0.0106, "step": 378170 }, { "epoch": 0.98, "learning_rate": 0.00015295543326395024, "loss": 0.0128, "step": 378180 }, { "epoch": 0.98, "learning_rate": 0.00015295154504757881, "loss": 0.013, "step": 378190 }, { "epoch": 0.98, "learning_rate": 0.00015294765683120733, "loss": 0.0101, "step": 378200 }, { "epoch": 0.98, "learning_rate": 0.00015294376861483587, "loss": 0.0101, "step": 378210 }, { "epoch": 0.98, "learning_rate": 0.00015293988039846438, "loss": 0.0133, "step": 378220 }, { "epoch": 0.98, "learning_rate": 0.00015293599218209295, "loss": 0.0182, "step": 378230 }, { "epoch": 0.98, "learning_rate": 0.00015293210396572147, "loss": 0.0135, "step": 378240 }, { "epoch": 0.98, "learning_rate": 0.00015292821574935, "loss": 0.0099, "step": 378250 }, { "epoch": 0.98, "learning_rate": 0.00015292432753297852, "loss": 0.0126, "step": 378260 }, { "epoch": 0.98, "learning_rate": 0.0001529204393166071, "loss": 0.0152, "step": 378270 }, { "epoch": 0.98, "learning_rate": 0.0001529165511002356, "loss": 0.0152, "step": 378280 }, { "epoch": 0.98, "learning_rate": 0.00015291266288386415, "loss": 0.0116, "step": 378290 }, { "epoch": 0.98, "learning_rate": 0.00015290877466749266, "loss": 0.0096, "step": 378300 }, { "epoch": 0.98, "learning_rate": 0.00015290488645112123, "loss": 0.0143, "step": 378310 }, { "epoch": 0.98, "learning_rate": 0.00015290099823474977, "loss": 0.0135, "step": 378320 }, { "epoch": 0.98, "learning_rate": 0.0001528971100183783, "loss": 0.0113, "step": 378330 }, { "epoch": 0.98, "learning_rate": 0.0001528932218020068, "loss": 0.0145, "step": 378340 }, { "epoch": 0.98, "learning_rate": 0.00015288933358563537, "loss": 0.0112, "step": 378350 }, { "epoch": 0.98, "learning_rate": 0.0001528854453692639, "loss": 0.0123, "step": 378360 }, { "epoch": 0.98, "learning_rate": 0.00015288155715289243, "loss": 0.0118, "step": 378370 }, { "epoch": 0.98, "learning_rate": 0.00015287766893652097, "loss": 0.0152, "step": 378380 }, { "epoch": 0.98, "learning_rate": 0.00015287378072014948, "loss": 0.0138, "step": 378390 }, { "epoch": 0.98, "learning_rate": 0.00015286989250377805, "loss": 0.0114, "step": 378400 }, { "epoch": 0.98, "learning_rate": 0.00015286600428740657, "loss": 0.0131, "step": 378410 }, { "epoch": 0.98, "learning_rate": 0.0001528621160710351, "loss": 0.014, "step": 378420 }, { "epoch": 0.98, "learning_rate": 0.00015285822785466362, "loss": 0.0155, "step": 378430 }, { "epoch": 0.98, "learning_rate": 0.0001528543396382922, "loss": 0.0135, "step": 378440 }, { "epoch": 0.98, "learning_rate": 0.0001528504514219207, "loss": 0.0117, "step": 378450 }, { "epoch": 0.98, "learning_rate": 0.00015284656320554925, "loss": 0.0115, "step": 378460 }, { "epoch": 0.98, "learning_rate": 0.00015284267498917776, "loss": 0.0112, "step": 378470 }, { "epoch": 0.98, "learning_rate": 0.00015283878677280633, "loss": 0.014, "step": 378480 }, { "epoch": 0.98, "learning_rate": 0.00015283489855643485, "loss": 0.0117, "step": 378490 }, { "epoch": 0.98, "learning_rate": 0.0001528310103400634, "loss": 0.0149, "step": 378500 }, { "epoch": 0.98, "learning_rate": 0.0001528271221236919, "loss": 0.0124, "step": 378510 }, { "epoch": 0.98, "learning_rate": 0.00015282323390732047, "loss": 0.0122, "step": 378520 }, { "epoch": 0.98, "learning_rate": 0.000152819345690949, "loss": 0.0106, "step": 378530 }, { "epoch": 0.98, "learning_rate": 0.00015281545747457753, "loss": 0.0119, "step": 378540 }, { "epoch": 0.98, "learning_rate": 0.00015281156925820607, "loss": 0.0136, "step": 378550 }, { "epoch": 0.98, "learning_rate": 0.0001528076810418346, "loss": 0.0128, "step": 378560 }, { "epoch": 0.98, "learning_rate": 0.00015280379282546315, "loss": 0.0156, "step": 378570 }, { "epoch": 0.98, "learning_rate": 0.00015279990460909167, "loss": 0.0131, "step": 378580 }, { "epoch": 0.98, "learning_rate": 0.0001527960163927202, "loss": 0.0132, "step": 378590 }, { "epoch": 0.98, "learning_rate": 0.00015279212817634875, "loss": 0.0234, "step": 378600 }, { "epoch": 0.98, "learning_rate": 0.0001527882399599773, "loss": 0.0157, "step": 378610 }, { "epoch": 0.98, "learning_rate": 0.0001527843517436058, "loss": 0.0112, "step": 378620 }, { "epoch": 0.98, "learning_rate": 0.00015278046352723435, "loss": 0.0135, "step": 378630 }, { "epoch": 0.98, "learning_rate": 0.00015277657531086286, "loss": 0.0121, "step": 378640 }, { "epoch": 0.98, "learning_rate": 0.00015277268709449143, "loss": 0.0107, "step": 378650 }, { "epoch": 0.98, "learning_rate": 0.00015276879887811995, "loss": 0.0113, "step": 378660 }, { "epoch": 0.98, "learning_rate": 0.0001527649106617485, "loss": 0.0127, "step": 378670 }, { "epoch": 0.98, "learning_rate": 0.000152761022445377, "loss": 0.01, "step": 378680 }, { "epoch": 0.98, "learning_rate": 0.00015275713422900557, "loss": 0.0106, "step": 378690 }, { "epoch": 0.98, "learning_rate": 0.0001527532460126341, "loss": 0.0124, "step": 378700 }, { "epoch": 0.98, "learning_rate": 0.00015274935779626263, "loss": 0.009, "step": 378710 }, { "epoch": 0.98, "learning_rate": 0.00015274546957989117, "loss": 0.0128, "step": 378720 }, { "epoch": 0.98, "learning_rate": 0.0001527415813635197, "loss": 0.012, "step": 378730 }, { "epoch": 0.98, "learning_rate": 0.00015273769314714825, "loss": 0.0131, "step": 378740 }, { "epoch": 0.98, "learning_rate": 0.00015273380493077677, "loss": 0.0093, "step": 378750 }, { "epoch": 0.98, "learning_rate": 0.0001527299167144053, "loss": 0.0124, "step": 378760 }, { "epoch": 0.98, "learning_rate": 0.00015272602849803385, "loss": 0.0117, "step": 378770 }, { "epoch": 0.98, "learning_rate": 0.0001527221402816624, "loss": 0.012, "step": 378780 }, { "epoch": 0.98, "learning_rate": 0.0001527182520652909, "loss": 0.0092, "step": 378790 }, { "epoch": 0.98, "learning_rate": 0.00015271436384891945, "loss": 0.0117, "step": 378800 }, { "epoch": 0.98, "learning_rate": 0.000152710475632548, "loss": 0.0111, "step": 378810 }, { "epoch": 0.98, "learning_rate": 0.00015270658741617653, "loss": 0.0131, "step": 378820 }, { "epoch": 0.98, "learning_rate": 0.00015270269919980504, "loss": 0.0147, "step": 378830 }, { "epoch": 0.98, "learning_rate": 0.00015269881098343359, "loss": 0.0123, "step": 378840 }, { "epoch": 0.98, "learning_rate": 0.00015269492276706216, "loss": 0.0133, "step": 378850 }, { "epoch": 0.98, "learning_rate": 0.00015269103455069067, "loss": 0.0118, "step": 378860 }, { "epoch": 0.98, "learning_rate": 0.0001526871463343192, "loss": 0.0107, "step": 378870 }, { "epoch": 0.98, "learning_rate": 0.00015268325811794773, "loss": 0.0139, "step": 378880 }, { "epoch": 0.98, "learning_rate": 0.00015267936990157624, "loss": 0.0118, "step": 378890 }, { "epoch": 0.98, "learning_rate": 0.0001526754816852048, "loss": 0.0159, "step": 378900 }, { "epoch": 0.98, "learning_rate": 0.00015267159346883335, "loss": 0.0155, "step": 378910 }, { "epoch": 0.98, "learning_rate": 0.00015266770525246187, "loss": 0.0126, "step": 378920 }, { "epoch": 0.98, "learning_rate": 0.0001526638170360904, "loss": 0.0132, "step": 378930 }, { "epoch": 0.98, "learning_rate": 0.00015265992881971895, "loss": 0.0153, "step": 378940 }, { "epoch": 0.98, "learning_rate": 0.0001526560406033475, "loss": 0.0165, "step": 378950 }, { "epoch": 0.98, "learning_rate": 0.000152652152386976, "loss": 0.0099, "step": 378960 }, { "epoch": 0.98, "learning_rate": 0.00015264826417060455, "loss": 0.0103, "step": 378970 }, { "epoch": 0.98, "learning_rate": 0.0001526443759542331, "loss": 0.0103, "step": 378980 }, { "epoch": 0.98, "learning_rate": 0.00015264048773786163, "loss": 0.0134, "step": 378990 }, { "epoch": 0.98, "learning_rate": 0.00015263659952149014, "loss": 0.0152, "step": 379000 }, { "epoch": 0.98, "eval_cer": 0.8817432757942589, "eval_loss": 0.008436217904090881, "eval_runtime": 107.5614, "eval_samples_per_second": 18.594, "eval_steps_per_second": 4.649, "step": 379000 }, { "epoch": 0.98, "learning_rate": 0.00015263271130511869, "loss": 0.0142, "step": 379010 }, { "epoch": 0.98, "learning_rate": 0.00015262882308874725, "loss": 0.0159, "step": 379020 }, { "epoch": 0.98, "learning_rate": 0.00015262493487237577, "loss": 0.0169, "step": 379030 }, { "epoch": 0.98, "learning_rate": 0.0001526210466560043, "loss": 0.0121, "step": 379040 }, { "epoch": 0.98, "learning_rate": 0.00015261715843963283, "loss": 0.0127, "step": 379050 }, { "epoch": 0.98, "learning_rate": 0.0001526132702232614, "loss": 0.0139, "step": 379060 }, { "epoch": 0.98, "learning_rate": 0.0001526093820068899, "loss": 0.0124, "step": 379070 }, { "epoch": 0.98, "learning_rate": 0.00015260549379051845, "loss": 0.0136, "step": 379080 }, { "epoch": 0.98, "learning_rate": 0.00015260160557414696, "loss": 0.0137, "step": 379090 }, { "epoch": 0.98, "learning_rate": 0.00015259771735777553, "loss": 0.013, "step": 379100 }, { "epoch": 0.98, "learning_rate": 0.00015259382914140405, "loss": 0.0141, "step": 379110 }, { "epoch": 0.98, "learning_rate": 0.0001525899409250326, "loss": 0.011, "step": 379120 }, { "epoch": 0.98, "learning_rate": 0.0001525860527086611, "loss": 0.0134, "step": 379130 }, { "epoch": 0.98, "learning_rate": 0.00015258216449228965, "loss": 0.0133, "step": 379140 }, { "epoch": 0.98, "learning_rate": 0.0001525782762759182, "loss": 0.0157, "step": 379150 }, { "epoch": 0.98, "learning_rate": 0.00015257438805954673, "loss": 0.0118, "step": 379160 }, { "epoch": 0.98, "learning_rate": 0.00015257049984317524, "loss": 0.0135, "step": 379170 }, { "epoch": 0.98, "learning_rate": 0.00015256661162680379, "loss": 0.0144, "step": 379180 }, { "epoch": 0.98, "learning_rate": 0.00015256272341043235, "loss": 0.0123, "step": 379190 }, { "epoch": 0.98, "learning_rate": 0.00015255883519406087, "loss": 0.0118, "step": 379200 }, { "epoch": 0.98, "learning_rate": 0.00015255494697768938, "loss": 0.0103, "step": 379210 }, { "epoch": 0.98, "learning_rate": 0.00015255105876131792, "loss": 0.0136, "step": 379220 }, { "epoch": 0.98, "learning_rate": 0.0001525471705449465, "loss": 0.0159, "step": 379230 }, { "epoch": 0.98, "learning_rate": 0.000152543282328575, "loss": 0.0114, "step": 379240 }, { "epoch": 0.98, "learning_rate": 0.00015253939411220355, "loss": 0.0131, "step": 379250 }, { "epoch": 0.98, "learning_rate": 0.00015253550589583206, "loss": 0.0119, "step": 379260 }, { "epoch": 0.98, "learning_rate": 0.00015253161767946063, "loss": 0.0119, "step": 379270 }, { "epoch": 0.98, "learning_rate": 0.00015252772946308915, "loss": 0.012, "step": 379280 }, { "epoch": 0.98, "learning_rate": 0.0001525238412467177, "loss": 0.0116, "step": 379290 }, { "epoch": 0.98, "learning_rate": 0.0001525199530303462, "loss": 0.0136, "step": 379300 }, { "epoch": 0.98, "learning_rate": 0.00015251606481397477, "loss": 0.0107, "step": 379310 }, { "epoch": 0.98, "learning_rate": 0.0001525121765976033, "loss": 0.0143, "step": 379320 }, { "epoch": 0.98, "learning_rate": 0.00015250828838123183, "loss": 0.0122, "step": 379330 }, { "epoch": 0.98, "learning_rate": 0.00015250440016486034, "loss": 0.0172, "step": 379340 }, { "epoch": 0.98, "learning_rate": 0.0001525005119484889, "loss": 0.0158, "step": 379350 }, { "epoch": 0.98, "learning_rate": 0.00015249662373211745, "loss": 0.0136, "step": 379360 }, { "epoch": 0.98, "learning_rate": 0.00015249273551574597, "loss": 0.0141, "step": 379370 }, { "epoch": 0.98, "learning_rate": 0.00015248884729937448, "loss": 0.0129, "step": 379380 }, { "epoch": 0.98, "learning_rate": 0.00015248495908300302, "loss": 0.0153, "step": 379390 }, { "epoch": 0.98, "learning_rate": 0.0001524810708666316, "loss": 0.012, "step": 379400 }, { "epoch": 0.98, "learning_rate": 0.0001524771826502601, "loss": 0.0138, "step": 379410 }, { "epoch": 0.98, "learning_rate": 0.00015247329443388865, "loss": 0.0127, "step": 379420 }, { "epoch": 0.98, "learning_rate": 0.00015246940621751716, "loss": 0.0124, "step": 379430 }, { "epoch": 0.98, "learning_rate": 0.00015246551800114573, "loss": 0.0133, "step": 379440 }, { "epoch": 0.98, "learning_rate": 0.00015246162978477425, "loss": 0.0141, "step": 379450 }, { "epoch": 0.98, "learning_rate": 0.0001524577415684028, "loss": 0.0106, "step": 379460 }, { "epoch": 0.98, "learning_rate": 0.0001524538533520313, "loss": 0.0176, "step": 379470 }, { "epoch": 0.98, "learning_rate": 0.00015244996513565987, "loss": 0.0124, "step": 379480 }, { "epoch": 0.98, "learning_rate": 0.00015244607691928839, "loss": 0.0117, "step": 379490 }, { "epoch": 0.98, "learning_rate": 0.00015244218870291693, "loss": 0.0177, "step": 379500 }, { "epoch": 0.98, "learning_rate": 0.00015243830048654544, "loss": 0.0122, "step": 379510 }, { "epoch": 0.98, "learning_rate": 0.000152434412270174, "loss": 0.0128, "step": 379520 }, { "epoch": 0.98, "learning_rate": 0.00015243052405380253, "loss": 0.0124, "step": 379530 }, { "epoch": 0.98, "learning_rate": 0.00015242663583743107, "loss": 0.0531, "step": 379540 }, { "epoch": 0.98, "learning_rate": 0.00015242274762105958, "loss": 0.011, "step": 379550 }, { "epoch": 0.98, "learning_rate": 0.00015241885940468815, "loss": 0.0169, "step": 379560 }, { "epoch": 0.98, "learning_rate": 0.0001524149711883167, "loss": 0.0119, "step": 379570 }, { "epoch": 0.98, "learning_rate": 0.0001524110829719452, "loss": 0.0111, "step": 379580 }, { "epoch": 0.98, "learning_rate": 0.00015240719475557375, "loss": 0.0139, "step": 379590 }, { "epoch": 0.98, "learning_rate": 0.0001524033065392023, "loss": 0.0128, "step": 379600 }, { "epoch": 0.98, "learning_rate": 0.00015239941832283083, "loss": 0.0119, "step": 379610 }, { "epoch": 0.98, "learning_rate": 0.00015239553010645935, "loss": 0.012, "step": 379620 }, { "epoch": 0.98, "learning_rate": 0.0001523916418900879, "loss": 0.0178, "step": 379630 }, { "epoch": 0.98, "learning_rate": 0.0001523877536737164, "loss": 0.0135, "step": 379640 }, { "epoch": 0.98, "learning_rate": 0.00015238386545734497, "loss": 0.0147, "step": 379650 }, { "epoch": 0.98, "learning_rate": 0.00015237997724097349, "loss": 0.0127, "step": 379660 }, { "epoch": 0.98, "learning_rate": 0.00015237608902460203, "loss": 0.0166, "step": 379670 }, { "epoch": 0.98, "learning_rate": 0.00015237220080823054, "loss": 0.0101, "step": 379680 }, { "epoch": 0.98, "learning_rate": 0.0001523683125918591, "loss": 0.0114, "step": 379690 }, { "epoch": 0.98, "learning_rate": 0.00015236442437548763, "loss": 0.018, "step": 379700 }, { "epoch": 0.98, "learning_rate": 0.00015236053615911617, "loss": 0.0195, "step": 379710 }, { "epoch": 0.98, "learning_rate": 0.00015235664794274468, "loss": 0.0137, "step": 379720 }, { "epoch": 0.98, "learning_rate": 0.00015235275972637325, "loss": 0.0106, "step": 379730 }, { "epoch": 0.98, "learning_rate": 0.0001523488715100018, "loss": 0.0117, "step": 379740 }, { "epoch": 0.98, "learning_rate": 0.0001523449832936303, "loss": 0.0154, "step": 379750 }, { "epoch": 0.98, "learning_rate": 0.00015234109507725885, "loss": 0.0145, "step": 379760 }, { "epoch": 0.98, "learning_rate": 0.0001523372068608874, "loss": 0.0129, "step": 379770 }, { "epoch": 0.98, "learning_rate": 0.00015233331864451593, "loss": 0.0152, "step": 379780 }, { "epoch": 0.98, "learning_rate": 0.00015232943042814445, "loss": 0.015, "step": 379790 }, { "epoch": 0.98, "learning_rate": 0.000152325542211773, "loss": 0.0106, "step": 379800 }, { "epoch": 0.98, "learning_rate": 0.00015232165399540153, "loss": 0.0131, "step": 379810 }, { "epoch": 0.98, "learning_rate": 0.00015231776577903007, "loss": 0.0174, "step": 379820 }, { "epoch": 0.98, "learning_rate": 0.00015231387756265859, "loss": 0.0095, "step": 379830 }, { "epoch": 0.98, "learning_rate": 0.00015230998934628713, "loss": 0.012, "step": 379840 }, { "epoch": 0.98, "learning_rate": 0.00015230610112991567, "loss": 0.0114, "step": 379850 }, { "epoch": 0.98, "learning_rate": 0.0001523022129135442, "loss": 0.012, "step": 379860 }, { "epoch": 0.98, "learning_rate": 0.00015229832469717272, "loss": 0.0139, "step": 379870 }, { "epoch": 0.98, "learning_rate": 0.00015229443648080127, "loss": 0.0125, "step": 379880 }, { "epoch": 0.98, "learning_rate": 0.00015229054826442978, "loss": 0.0141, "step": 379890 }, { "epoch": 0.98, "learning_rate": 0.00015228666004805835, "loss": 0.0105, "step": 379900 }, { "epoch": 0.98, "learning_rate": 0.0001522827718316869, "loss": 0.013, "step": 379910 }, { "epoch": 0.98, "learning_rate": 0.0001522788836153154, "loss": 0.0107, "step": 379920 }, { "epoch": 0.98, "learning_rate": 0.00015227499539894392, "loss": 0.0138, "step": 379930 }, { "epoch": 0.98, "learning_rate": 0.0001522711071825725, "loss": 0.0159, "step": 379940 }, { "epoch": 0.98, "learning_rate": 0.00015226721896620103, "loss": 0.0123, "step": 379950 }, { "epoch": 0.98, "learning_rate": 0.00015226333074982955, "loss": 0.0093, "step": 379960 }, { "epoch": 0.98, "learning_rate": 0.0001522594425334581, "loss": 0.0145, "step": 379970 }, { "epoch": 0.98, "learning_rate": 0.00015225555431708663, "loss": 0.0125, "step": 379980 }, { "epoch": 0.98, "learning_rate": 0.00015225166610071517, "loss": 0.01, "step": 379990 }, { "epoch": 0.99, "learning_rate": 0.00015224777788434368, "loss": 0.0122, "step": 380000 }, { "epoch": 0.99, "eval_cer": 0.8816942885015627, "eval_loss": 0.008343157358467579, "eval_runtime": 107.6029, "eval_samples_per_second": 18.587, "eval_steps_per_second": 4.647, "step": 380000 }, { "epoch": 0.99, "learning_rate": 0.00015224388966797223, "loss": 0.0107, "step": 380010 }, { "epoch": 0.99, "learning_rate": 0.00015224000145160077, "loss": 0.0127, "step": 380020 }, { "epoch": 0.99, "learning_rate": 0.0001522361132352293, "loss": 0.0132, "step": 380030 }, { "epoch": 0.99, "learning_rate": 0.00015223222501885782, "loss": 0.0113, "step": 380040 }, { "epoch": 0.99, "learning_rate": 0.00015222833680248637, "loss": 0.0179, "step": 380050 }, { "epoch": 0.99, "learning_rate": 0.00015222444858611493, "loss": 0.0115, "step": 380060 }, { "epoch": 0.99, "learning_rate": 0.00015222056036974345, "loss": 0.0135, "step": 380070 }, { "epoch": 0.99, "learning_rate": 0.00015221667215337196, "loss": 0.0119, "step": 380080 }, { "epoch": 0.99, "learning_rate": 0.0001522127839370005, "loss": 0.0118, "step": 380090 }, { "epoch": 0.99, "learning_rate": 0.00015220889572062902, "loss": 0.0354, "step": 380100 }, { "epoch": 0.99, "learning_rate": 0.0001522050075042576, "loss": 0.0109, "step": 380110 }, { "epoch": 0.99, "learning_rate": 0.00015220111928788613, "loss": 0.0158, "step": 380120 }, { "epoch": 0.99, "learning_rate": 0.00015219723107151464, "loss": 0.0141, "step": 380130 }, { "epoch": 0.99, "learning_rate": 0.00015219334285514319, "loss": 0.0127, "step": 380140 }, { "epoch": 0.99, "learning_rate": 0.00015218945463877173, "loss": 0.0107, "step": 380150 }, { "epoch": 0.99, "learning_rate": 0.00015218556642240027, "loss": 0.0131, "step": 380160 }, { "epoch": 0.99, "learning_rate": 0.00015218167820602878, "loss": 0.0113, "step": 380170 }, { "epoch": 0.99, "learning_rate": 0.00015217778998965733, "loss": 0.0141, "step": 380180 }, { "epoch": 0.99, "learning_rate": 0.00015217390177328587, "loss": 0.0135, "step": 380190 }, { "epoch": 0.99, "learning_rate": 0.0001521700135569144, "loss": 0.014, "step": 380200 }, { "epoch": 0.99, "learning_rate": 0.00015216612534054292, "loss": 0.0153, "step": 380210 }, { "epoch": 0.99, "learning_rate": 0.00015216223712417147, "loss": 0.0172, "step": 380220 }, { "epoch": 0.99, "learning_rate": 0.00015215834890780003, "loss": 0.0097, "step": 380230 }, { "epoch": 0.99, "learning_rate": 0.00015215446069142855, "loss": 0.0116, "step": 380240 }, { "epoch": 0.99, "learning_rate": 0.00015215057247505706, "loss": 0.0098, "step": 380250 }, { "epoch": 0.99, "learning_rate": 0.0001521466842586856, "loss": 0.0101, "step": 380260 }, { "epoch": 0.99, "learning_rate": 0.00015214279604231417, "loss": 0.0151, "step": 380270 }, { "epoch": 0.99, "learning_rate": 0.0001521389078259427, "loss": 0.0119, "step": 380280 }, { "epoch": 0.99, "learning_rate": 0.00015213501960957123, "loss": 0.0105, "step": 380290 }, { "epoch": 0.99, "learning_rate": 0.00015213113139319974, "loss": 0.0116, "step": 380300 }, { "epoch": 0.99, "learning_rate": 0.0001521272431768283, "loss": 0.0124, "step": 380310 }, { "epoch": 0.99, "learning_rate": 0.00015212335496045683, "loss": 0.012, "step": 380320 }, { "epoch": 0.99, "learning_rate": 0.00015211946674408537, "loss": 0.0147, "step": 380330 }, { "epoch": 0.99, "learning_rate": 0.00015211557852771388, "loss": 0.0135, "step": 380340 }, { "epoch": 0.99, "learning_rate": 0.00015211169031134243, "loss": 0.0107, "step": 380350 }, { "epoch": 0.99, "learning_rate": 0.00015210780209497097, "loss": 0.0114, "step": 380360 }, { "epoch": 0.99, "learning_rate": 0.0001521039138785995, "loss": 0.012, "step": 380370 }, { "epoch": 0.99, "learning_rate": 0.00015210002566222802, "loss": 0.0156, "step": 380380 }, { "epoch": 0.99, "learning_rate": 0.00015209613744585656, "loss": 0.0202, "step": 380390 }, { "epoch": 0.99, "learning_rate": 0.0001520922492294851, "loss": 0.0149, "step": 380400 }, { "epoch": 0.99, "learning_rate": 0.00015208836101311365, "loss": 0.0109, "step": 380410 }, { "epoch": 0.99, "learning_rate": 0.00015208447279674216, "loss": 0.0132, "step": 380420 }, { "epoch": 0.99, "learning_rate": 0.0001520805845803707, "loss": 0.0109, "step": 380430 }, { "epoch": 0.99, "learning_rate": 0.00015207669636399927, "loss": 0.0134, "step": 380440 }, { "epoch": 0.99, "learning_rate": 0.0001520728081476278, "loss": 0.0116, "step": 380450 }, { "epoch": 0.99, "learning_rate": 0.00015206891993125633, "loss": 0.0168, "step": 380460 }, { "epoch": 0.99, "learning_rate": 0.00015206503171488484, "loss": 0.0127, "step": 380470 }, { "epoch": 0.99, "learning_rate": 0.0001520611434985134, "loss": 0.0132, "step": 380480 }, { "epoch": 0.99, "learning_rate": 0.00015205725528214193, "loss": 0.0201, "step": 380490 }, { "epoch": 0.99, "learning_rate": 0.00015205336706577047, "loss": 0.0149, "step": 380500 }, { "epoch": 0.99, "learning_rate": 0.00015204947884939898, "loss": 0.0108, "step": 380510 }, { "epoch": 0.99, "learning_rate": 0.00015204559063302755, "loss": 0.0124, "step": 380520 }, { "epoch": 0.99, "learning_rate": 0.00015204170241665607, "loss": 0.0134, "step": 380530 }, { "epoch": 0.99, "learning_rate": 0.0001520378142002846, "loss": 0.0103, "step": 380540 }, { "epoch": 0.99, "learning_rate": 0.00015203392598391312, "loss": 0.0113, "step": 380550 }, { "epoch": 0.99, "learning_rate": 0.0001520300377675417, "loss": 0.0163, "step": 380560 }, { "epoch": 0.99, "learning_rate": 0.0001520261495511702, "loss": 0.0144, "step": 380570 }, { "epoch": 0.99, "learning_rate": 0.00015202226133479875, "loss": 0.0203, "step": 380580 }, { "epoch": 0.99, "learning_rate": 0.00015201837311842726, "loss": 0.0163, "step": 380590 }, { "epoch": 0.99, "learning_rate": 0.0001520144849020558, "loss": 0.0153, "step": 380600 }, { "epoch": 0.99, "learning_rate": 0.00015201059668568437, "loss": 0.0158, "step": 380610 }, { "epoch": 0.99, "learning_rate": 0.0001520067084693129, "loss": 0.0106, "step": 380620 }, { "epoch": 0.99, "learning_rate": 0.00015200282025294143, "loss": 0.0145, "step": 380630 }, { "epoch": 0.99, "learning_rate": 0.00015199893203656994, "loss": 0.0122, "step": 380640 }, { "epoch": 0.99, "learning_rate": 0.0001519950438201985, "loss": 0.0108, "step": 380650 }, { "epoch": 0.99, "learning_rate": 0.00015199115560382703, "loss": 0.011, "step": 380660 }, { "epoch": 0.99, "learning_rate": 0.00015198726738745557, "loss": 0.0112, "step": 380670 }, { "epoch": 0.99, "learning_rate": 0.00015198337917108408, "loss": 0.0137, "step": 380680 }, { "epoch": 0.99, "learning_rate": 0.00015197949095471265, "loss": 0.0129, "step": 380690 }, { "epoch": 0.99, "learning_rate": 0.00015197560273834117, "loss": 0.0111, "step": 380700 }, { "epoch": 0.99, "learning_rate": 0.0001519717145219697, "loss": 0.0136, "step": 380710 }, { "epoch": 0.99, "learning_rate": 0.00015196782630559822, "loss": 0.0135, "step": 380720 }, { "epoch": 0.99, "learning_rate": 0.0001519639380892268, "loss": 0.01, "step": 380730 }, { "epoch": 0.99, "learning_rate": 0.0001519600498728553, "loss": 0.0142, "step": 380740 }, { "epoch": 0.99, "learning_rate": 0.00015195616165648385, "loss": 0.0107, "step": 380750 }, { "epoch": 0.99, "learning_rate": 0.00015195227344011236, "loss": 0.0132, "step": 380760 }, { "epoch": 0.99, "learning_rate": 0.00015194838522374093, "loss": 0.0103, "step": 380770 }, { "epoch": 0.99, "learning_rate": 0.00015194449700736947, "loss": 0.0116, "step": 380780 }, { "epoch": 0.99, "learning_rate": 0.00015194060879099799, "loss": 0.0109, "step": 380790 }, { "epoch": 0.99, "learning_rate": 0.0001519367205746265, "loss": 0.0139, "step": 380800 }, { "epoch": 0.99, "learning_rate": 0.00015193283235825507, "loss": 0.0137, "step": 380810 }, { "epoch": 0.99, "learning_rate": 0.0001519289441418836, "loss": 0.0128, "step": 380820 }, { "epoch": 0.99, "learning_rate": 0.00015192505592551213, "loss": 0.0114, "step": 380830 }, { "epoch": 0.99, "learning_rate": 0.00015192116770914067, "loss": 0.0118, "step": 380840 }, { "epoch": 0.99, "learning_rate": 0.00015191727949276918, "loss": 0.0211, "step": 380850 }, { "epoch": 0.99, "learning_rate": 0.00015191339127639775, "loss": 0.0106, "step": 380860 }, { "epoch": 0.99, "learning_rate": 0.00015190950306002626, "loss": 0.0115, "step": 380870 }, { "epoch": 0.99, "learning_rate": 0.0001519056148436548, "loss": 0.0112, "step": 380880 }, { "epoch": 0.99, "learning_rate": 0.00015190172662728332, "loss": 0.0152, "step": 380890 }, { "epoch": 0.99, "learning_rate": 0.0001518978384109119, "loss": 0.0142, "step": 380900 }, { "epoch": 0.99, "learning_rate": 0.0001518939501945404, "loss": 0.015, "step": 380910 }, { "epoch": 0.99, "learning_rate": 0.00015189006197816895, "loss": 0.0113, "step": 380920 }, { "epoch": 0.99, "learning_rate": 0.00015188617376179746, "loss": 0.0137, "step": 380930 }, { "epoch": 0.99, "learning_rate": 0.00015188228554542603, "loss": 0.0128, "step": 380940 }, { "epoch": 0.99, "learning_rate": 0.00015187839732905457, "loss": 0.0112, "step": 380950 }, { "epoch": 0.99, "learning_rate": 0.00015187450911268309, "loss": 0.0132, "step": 380960 }, { "epoch": 0.99, "learning_rate": 0.0001518706208963116, "loss": 0.0118, "step": 380970 }, { "epoch": 0.99, "learning_rate": 0.00015186673267994017, "loss": 0.0097, "step": 380980 }, { "epoch": 0.99, "learning_rate": 0.0001518628444635687, "loss": 0.0103, "step": 380990 }, { "epoch": 0.99, "learning_rate": 0.00015185895624719722, "loss": 0.0135, "step": 381000 }, { "epoch": 0.99, "eval_cer": 0.8817096845078387, "eval_loss": 0.008428123779594898, "eval_runtime": 107.512, "eval_samples_per_second": 18.603, "eval_steps_per_second": 4.651, "step": 381000 }, { "epoch": 0.99, "learning_rate": 0.00015185506803082577, "loss": 0.0122, "step": 381010 }, { "epoch": 0.99, "learning_rate": 0.0001518511798144543, "loss": 0.0099, "step": 381020 }, { "epoch": 0.99, "learning_rate": 0.00015184729159808285, "loss": 0.0101, "step": 381030 }, { "epoch": 0.99, "learning_rate": 0.00015184340338171136, "loss": 0.0148, "step": 381040 }, { "epoch": 0.99, "learning_rate": 0.0001518395151653399, "loss": 0.014, "step": 381050 }, { "epoch": 0.99, "learning_rate": 0.00015183562694896845, "loss": 0.0107, "step": 381060 }, { "epoch": 0.99, "learning_rate": 0.000151831738732597, "loss": 0.0107, "step": 381070 }, { "epoch": 0.99, "learning_rate": 0.0001518278505162255, "loss": 0.0106, "step": 381080 }, { "epoch": 0.99, "learning_rate": 0.00015182396229985405, "loss": 0.0124, "step": 381090 }, { "epoch": 0.99, "learning_rate": 0.00015182007408348256, "loss": 0.014, "step": 381100 }, { "epoch": 0.99, "learning_rate": 0.00015181618586711113, "loss": 0.0136, "step": 381110 }, { "epoch": 0.99, "learning_rate": 0.00015181229765073964, "loss": 0.0117, "step": 381120 }, { "epoch": 0.99, "learning_rate": 0.00015180840943436818, "loss": 0.0137, "step": 381130 }, { "epoch": 0.99, "learning_rate": 0.0001518045212179967, "loss": 0.0155, "step": 381140 }, { "epoch": 0.99, "learning_rate": 0.00015180063300162527, "loss": 0.0138, "step": 381150 }, { "epoch": 0.99, "learning_rate": 0.0001517967447852538, "loss": 0.0118, "step": 381160 }, { "epoch": 0.99, "learning_rate": 0.00015179285656888232, "loss": 0.0119, "step": 381170 }, { "epoch": 0.99, "learning_rate": 0.00015178896835251087, "loss": 0.0118, "step": 381180 }, { "epoch": 0.99, "learning_rate": 0.0001517850801361394, "loss": 0.0117, "step": 381190 }, { "epoch": 0.99, "learning_rate": 0.00015178119191976795, "loss": 0.0182, "step": 381200 }, { "epoch": 0.99, "learning_rate": 0.00015177730370339646, "loss": 0.0133, "step": 381210 }, { "epoch": 0.99, "learning_rate": 0.000151773415487025, "loss": 0.0117, "step": 381220 }, { "epoch": 0.99, "learning_rate": 0.00015176952727065355, "loss": 0.0121, "step": 381230 }, { "epoch": 0.99, "learning_rate": 0.0001517656390542821, "loss": 0.015, "step": 381240 }, { "epoch": 0.99, "learning_rate": 0.0001517617508379106, "loss": 0.0132, "step": 381250 }, { "epoch": 0.99, "learning_rate": 0.00015175786262153914, "loss": 0.0129, "step": 381260 }, { "epoch": 0.99, "learning_rate": 0.0001517539744051677, "loss": 0.0094, "step": 381270 }, { "epoch": 0.99, "learning_rate": 0.00015175008618879623, "loss": 0.0117, "step": 381280 }, { "epoch": 0.99, "learning_rate": 0.00015174619797242474, "loss": 0.0126, "step": 381290 }, { "epoch": 0.99, "learning_rate": 0.00015174230975605328, "loss": 0.018, "step": 381300 }, { "epoch": 0.99, "learning_rate": 0.00015173842153968185, "loss": 0.015, "step": 381310 }, { "epoch": 0.99, "learning_rate": 0.00015173453332331037, "loss": 0.0124, "step": 381320 }, { "epoch": 0.99, "learning_rate": 0.0001517306451069389, "loss": 0.011, "step": 381330 }, { "epoch": 0.99, "learning_rate": 0.00015172675689056742, "loss": 0.0156, "step": 381340 }, { "epoch": 0.99, "learning_rate": 0.00015172286867419597, "loss": 0.0114, "step": 381350 }, { "epoch": 0.99, "learning_rate": 0.0001517189804578245, "loss": 0.0096, "step": 381360 }, { "epoch": 0.99, "learning_rate": 0.00015171509224145305, "loss": 0.0113, "step": 381370 }, { "epoch": 0.99, "learning_rate": 0.00015171120402508156, "loss": 0.0154, "step": 381380 }, { "epoch": 0.99, "learning_rate": 0.0001517073158087101, "loss": 0.0107, "step": 381390 }, { "epoch": 0.99, "learning_rate": 0.00015170342759233865, "loss": 0.0149, "step": 381400 }, { "epoch": 0.99, "learning_rate": 0.0001516995393759672, "loss": 0.0132, "step": 381410 }, { "epoch": 0.99, "learning_rate": 0.0001516956511595957, "loss": 0.0119, "step": 381420 }, { "epoch": 0.99, "learning_rate": 0.00015169176294322424, "loss": 0.0112, "step": 381430 }, { "epoch": 0.99, "learning_rate": 0.00015168787472685279, "loss": 0.0109, "step": 381440 }, { "epoch": 0.99, "learning_rate": 0.00015168398651048133, "loss": 0.0154, "step": 381450 }, { "epoch": 0.99, "learning_rate": 0.00015168009829410984, "loss": 0.0125, "step": 381460 }, { "epoch": 0.99, "learning_rate": 0.00015167621007773838, "loss": 0.0131, "step": 381470 }, { "epoch": 0.99, "learning_rate": 0.00015167232186136695, "loss": 0.0155, "step": 381480 }, { "epoch": 0.99, "learning_rate": 0.00015166843364499547, "loss": 0.0145, "step": 381490 }, { "epoch": 0.99, "learning_rate": 0.000151664545428624, "loss": 0.0147, "step": 381500 }, { "epoch": 0.99, "learning_rate": 0.00015166065721225252, "loss": 0.0137, "step": 381510 }, { "epoch": 0.99, "learning_rate": 0.0001516567689958811, "loss": 0.0105, "step": 381520 }, { "epoch": 0.99, "learning_rate": 0.0001516528807795096, "loss": 0.0133, "step": 381530 }, { "epoch": 0.99, "learning_rate": 0.00015164899256313815, "loss": 0.0159, "step": 381540 }, { "epoch": 0.99, "learning_rate": 0.00015164510434676666, "loss": 0.0101, "step": 381550 }, { "epoch": 0.99, "learning_rate": 0.00015164121613039523, "loss": 0.0163, "step": 381560 }, { "epoch": 0.99, "learning_rate": 0.00015163732791402375, "loss": 0.0135, "step": 381570 }, { "epoch": 0.99, "learning_rate": 0.0001516334396976523, "loss": 0.0112, "step": 381580 }, { "epoch": 0.99, "learning_rate": 0.0001516295514812808, "loss": 0.0139, "step": 381590 }, { "epoch": 0.99, "learning_rate": 0.00015162566326490934, "loss": 0.0126, "step": 381600 }, { "epoch": 0.99, "learning_rate": 0.00015162177504853789, "loss": 0.0123, "step": 381610 }, { "epoch": 0.99, "learning_rate": 0.00015161788683216643, "loss": 0.0105, "step": 381620 }, { "epoch": 0.99, "learning_rate": 0.00015161399861579494, "loss": 0.0114, "step": 381630 }, { "epoch": 0.99, "learning_rate": 0.00015161011039942348, "loss": 0.011, "step": 381640 }, { "epoch": 0.99, "learning_rate": 0.00015160622218305205, "loss": 0.01, "step": 381650 }, { "epoch": 0.99, "learning_rate": 0.00015160233396668057, "loss": 0.0154, "step": 381660 }, { "epoch": 0.99, "learning_rate": 0.00015159844575030908, "loss": 0.0119, "step": 381670 }, { "epoch": 0.99, "learning_rate": 0.00015159455753393762, "loss": 0.0108, "step": 381680 }, { "epoch": 0.99, "learning_rate": 0.0001515906693175662, "loss": 0.0121, "step": 381690 }, { "epoch": 0.99, "learning_rate": 0.0001515867811011947, "loss": 0.013, "step": 381700 }, { "epoch": 0.99, "learning_rate": 0.00015158289288482325, "loss": 0.012, "step": 381710 }, { "epoch": 0.99, "learning_rate": 0.00015157900466845176, "loss": 0.014, "step": 381720 }, { "epoch": 0.99, "learning_rate": 0.00015157511645208033, "loss": 0.0117, "step": 381730 }, { "epoch": 0.99, "learning_rate": 0.00015157122823570885, "loss": 0.0113, "step": 381740 }, { "epoch": 0.99, "learning_rate": 0.0001515673400193374, "loss": 0.0156, "step": 381750 }, { "epoch": 0.99, "learning_rate": 0.0001515634518029659, "loss": 0.0116, "step": 381760 }, { "epoch": 0.99, "learning_rate": 0.00015155956358659447, "loss": 0.0136, "step": 381770 }, { "epoch": 0.99, "learning_rate": 0.00015155567537022298, "loss": 0.0135, "step": 381780 }, { "epoch": 0.99, "learning_rate": 0.00015155178715385153, "loss": 0.0127, "step": 381790 }, { "epoch": 0.99, "learning_rate": 0.00015154789893748004, "loss": 0.0098, "step": 381800 }, { "epoch": 0.99, "learning_rate": 0.0001515440107211086, "loss": 0.014, "step": 381810 }, { "epoch": 0.99, "learning_rate": 0.00015154012250473715, "loss": 0.0108, "step": 381820 }, { "epoch": 0.99, "learning_rate": 0.00015153623428836567, "loss": 0.0135, "step": 381830 }, { "epoch": 0.99, "learning_rate": 0.00015153234607199418, "loss": 0.0129, "step": 381840 }, { "epoch": 0.99, "learning_rate": 0.00015152845785562272, "loss": 0.0138, "step": 381850 }, { "epoch": 0.99, "learning_rate": 0.0001515245696392513, "loss": 0.0115, "step": 381860 }, { "epoch": 0.99, "learning_rate": 0.0001515206814228798, "loss": 0.0108, "step": 381870 }, { "epoch": 0.99, "learning_rate": 0.00015151679320650835, "loss": 0.0127, "step": 381880 }, { "epoch": 0.99, "learning_rate": 0.00015151290499013686, "loss": 0.0096, "step": 381890 }, { "epoch": 0.99, "learning_rate": 0.00015150901677376543, "loss": 0.013, "step": 381900 }, { "epoch": 0.99, "learning_rate": 0.00015150512855739394, "loss": 0.0121, "step": 381910 }, { "epoch": 0.99, "learning_rate": 0.00015150124034102249, "loss": 0.0158, "step": 381920 }, { "epoch": 0.99, "learning_rate": 0.000151497352124651, "loss": 0.0129, "step": 381930 }, { "epoch": 0.99, "learning_rate": 0.00015149346390827957, "loss": 0.0119, "step": 381940 }, { "epoch": 0.99, "learning_rate": 0.00015148957569190808, "loss": 0.0108, "step": 381950 }, { "epoch": 0.99, "learning_rate": 0.00015148568747553663, "loss": 0.0136, "step": 381960 }, { "epoch": 0.99, "learning_rate": 0.00015148179925916514, "loss": 0.0141, "step": 381970 }, { "epoch": 0.99, "learning_rate": 0.0001514779110427937, "loss": 0.0107, "step": 381980 }, { "epoch": 0.99, "learning_rate": 0.00015147402282642222, "loss": 0.0168, "step": 381990 }, { "epoch": 0.99, "learning_rate": 0.00015147013461005077, "loss": 0.0126, "step": 382000 }, { "epoch": 0.99, "eval_cer": 0.8817096845078387, "eval_loss": 0.007775302045047283, "eval_runtime": 107.5939, "eval_samples_per_second": 18.588, "eval_steps_per_second": 4.647, "step": 382000 }, { "epoch": 0.99, "learning_rate": 0.00015146624639367928, "loss": 0.0112, "step": 382010 }, { "epoch": 0.99, "learning_rate": 0.00015146235817730785, "loss": 0.0113, "step": 382020 }, { "epoch": 0.99, "learning_rate": 0.0001514584699609364, "loss": 0.0106, "step": 382030 }, { "epoch": 0.99, "learning_rate": 0.0001514545817445649, "loss": 0.0124, "step": 382040 }, { "epoch": 0.99, "learning_rate": 0.00015145069352819345, "loss": 0.013, "step": 382050 }, { "epoch": 0.99, "learning_rate": 0.000151446805311822, "loss": 0.0092, "step": 382060 }, { "epoch": 0.99, "learning_rate": 0.00015144291709545053, "loss": 0.0116, "step": 382070 }, { "epoch": 0.99, "learning_rate": 0.00015143902887907904, "loss": 0.0183, "step": 382080 }, { "epoch": 0.99, "learning_rate": 0.00015143514066270759, "loss": 0.0138, "step": 382090 }, { "epoch": 0.99, "learning_rate": 0.0001514312524463361, "loss": 0.0116, "step": 382100 }, { "epoch": 0.99, "learning_rate": 0.00015142736422996467, "loss": 0.011, "step": 382110 }, { "epoch": 0.99, "learning_rate": 0.00015142347601359318, "loss": 0.0172, "step": 382120 }, { "epoch": 0.99, "learning_rate": 0.00015141958779722173, "loss": 0.0115, "step": 382130 }, { "epoch": 0.99, "learning_rate": 0.00015141569958085024, "loss": 0.0123, "step": 382140 }, { "epoch": 0.99, "learning_rate": 0.0001514118113644788, "loss": 0.0118, "step": 382150 }, { "epoch": 0.99, "learning_rate": 0.00015140792314810732, "loss": 0.0119, "step": 382160 }, { "epoch": 0.99, "learning_rate": 0.00015140403493173586, "loss": 0.0161, "step": 382170 }, { "epoch": 0.99, "learning_rate": 0.00015140014671536438, "loss": 0.0135, "step": 382180 }, { "epoch": 0.99, "learning_rate": 0.00015139625849899295, "loss": 0.0136, "step": 382190 }, { "epoch": 0.99, "learning_rate": 0.0001513923702826215, "loss": 0.0135, "step": 382200 }, { "epoch": 0.99, "learning_rate": 0.00015138848206625, "loss": 0.0123, "step": 382210 }, { "epoch": 0.99, "learning_rate": 0.00015138459384987855, "loss": 0.0135, "step": 382220 }, { "epoch": 0.99, "learning_rate": 0.0001513807056335071, "loss": 0.0103, "step": 382230 }, { "epoch": 0.99, "learning_rate": 0.00015137681741713563, "loss": 0.0134, "step": 382240 }, { "epoch": 0.99, "learning_rate": 0.00015137292920076414, "loss": 0.0134, "step": 382250 }, { "epoch": 0.99, "learning_rate": 0.00015136904098439269, "loss": 0.0129, "step": 382260 }, { "epoch": 0.99, "learning_rate": 0.00015136515276802123, "loss": 0.0148, "step": 382270 }, { "epoch": 0.99, "learning_rate": 0.00015136126455164977, "loss": 0.0167, "step": 382280 }, { "epoch": 0.99, "learning_rate": 0.00015135737633527828, "loss": 0.0138, "step": 382290 }, { "epoch": 0.99, "learning_rate": 0.00015135348811890682, "loss": 0.0125, "step": 382300 }, { "epoch": 0.99, "learning_rate": 0.00015134959990253537, "loss": 0.0104, "step": 382310 }, { "epoch": 0.99, "learning_rate": 0.0001513457116861639, "loss": 0.0109, "step": 382320 }, { "epoch": 0.99, "learning_rate": 0.00015134182346979242, "loss": 0.0138, "step": 382330 }, { "epoch": 0.99, "learning_rate": 0.00015133793525342096, "loss": 0.0171, "step": 382340 }, { "epoch": 0.99, "learning_rate": 0.00015133404703704948, "loss": 0.0103, "step": 382350 }, { "epoch": 0.99, "learning_rate": 0.00015133015882067805, "loss": 0.0125, "step": 382360 }, { "epoch": 0.99, "learning_rate": 0.0001513262706043066, "loss": 0.0146, "step": 382370 }, { "epoch": 0.99, "learning_rate": 0.0001513223823879351, "loss": 0.0116, "step": 382380 }, { "epoch": 0.99, "learning_rate": 0.00015131849417156362, "loss": 0.0127, "step": 382390 }, { "epoch": 0.99, "learning_rate": 0.0001513146059551922, "loss": 0.0118, "step": 382400 }, { "epoch": 0.99, "learning_rate": 0.00015131071773882073, "loss": 0.0138, "step": 382410 }, { "epoch": 0.99, "learning_rate": 0.00015130682952244924, "loss": 0.0132, "step": 382420 }, { "epoch": 0.99, "learning_rate": 0.00015130294130607778, "loss": 0.014, "step": 382430 }, { "epoch": 0.99, "learning_rate": 0.00015129905308970633, "loss": 0.0127, "step": 382440 }, { "epoch": 0.99, "learning_rate": 0.00015129516487333487, "loss": 0.01, "step": 382450 }, { "epoch": 0.99, "learning_rate": 0.00015129127665696338, "loss": 0.015, "step": 382460 }, { "epoch": 0.99, "learning_rate": 0.00015128738844059192, "loss": 0.0118, "step": 382470 }, { "epoch": 0.99, "learning_rate": 0.00015128350022422047, "loss": 0.0185, "step": 382480 }, { "epoch": 0.99, "learning_rate": 0.000151279612007849, "loss": 0.0154, "step": 382490 }, { "epoch": 0.99, "learning_rate": 0.00015127572379147752, "loss": 0.0121, "step": 382500 }, { "epoch": 0.99, "learning_rate": 0.00015127183557510606, "loss": 0.0139, "step": 382510 }, { "epoch": 0.99, "learning_rate": 0.00015126794735873463, "loss": 0.0131, "step": 382520 }, { "epoch": 0.99, "learning_rate": 0.00015126405914236315, "loss": 0.0136, "step": 382530 }, { "epoch": 0.99, "learning_rate": 0.0001512601709259917, "loss": 0.0116, "step": 382540 }, { "epoch": 0.99, "learning_rate": 0.0001512562827096202, "loss": 0.017, "step": 382550 }, { "epoch": 0.99, "learning_rate": 0.00015125239449324877, "loss": 0.014, "step": 382560 }, { "epoch": 0.99, "learning_rate": 0.00015124850627687729, "loss": 0.0135, "step": 382570 }, { "epoch": 0.99, "learning_rate": 0.00015124461806050583, "loss": 0.0113, "step": 382580 }, { "epoch": 0.99, "learning_rate": 0.00015124072984413434, "loss": 0.01, "step": 382590 }, { "epoch": 0.99, "learning_rate": 0.00015123684162776288, "loss": 0.013, "step": 382600 }, { "epoch": 0.99, "learning_rate": 0.00015123295341139143, "loss": 0.0124, "step": 382610 }, { "epoch": 0.99, "learning_rate": 0.00015122906519501997, "loss": 0.0131, "step": 382620 }, { "epoch": 0.99, "learning_rate": 0.00015122517697864848, "loss": 0.01, "step": 382630 }, { "epoch": 0.99, "learning_rate": 0.00015122128876227702, "loss": 0.0113, "step": 382640 }, { "epoch": 0.99, "learning_rate": 0.00015121740054590557, "loss": 0.0106, "step": 382650 }, { "epoch": 0.99, "learning_rate": 0.0001512135123295341, "loss": 0.0105, "step": 382660 }, { "epoch": 0.99, "learning_rate": 0.00015120962411316262, "loss": 0.0126, "step": 382670 }, { "epoch": 0.99, "learning_rate": 0.00015120573589679116, "loss": 0.0108, "step": 382680 }, { "epoch": 0.99, "learning_rate": 0.00015120184768041973, "loss": 0.0115, "step": 382690 }, { "epoch": 0.99, "learning_rate": 0.00015119795946404825, "loss": 0.0132, "step": 382700 }, { "epoch": 0.99, "learning_rate": 0.00015119407124767676, "loss": 0.0128, "step": 382710 }, { "epoch": 0.99, "learning_rate": 0.0001511901830313053, "loss": 0.0108, "step": 382720 }, { "epoch": 0.99, "learning_rate": 0.00015118629481493387, "loss": 0.0126, "step": 382730 }, { "epoch": 0.99, "learning_rate": 0.00015118240659856239, "loss": 0.0094, "step": 382740 }, { "epoch": 0.99, "learning_rate": 0.00015117851838219093, "loss": 0.0116, "step": 382750 }, { "epoch": 0.99, "learning_rate": 0.00015117463016581944, "loss": 0.0106, "step": 382760 }, { "epoch": 0.99, "learning_rate": 0.000151170741949448, "loss": 0.0123, "step": 382770 }, { "epoch": 0.99, "learning_rate": 0.00015116685373307653, "loss": 0.0114, "step": 382780 }, { "epoch": 0.99, "learning_rate": 0.00015116296551670507, "loss": 0.0107, "step": 382790 }, { "epoch": 0.99, "learning_rate": 0.00015115907730033358, "loss": 0.014, "step": 382800 }, { "epoch": 0.99, "learning_rate": 0.00015115518908396215, "loss": 0.0137, "step": 382810 }, { "epoch": 0.99, "learning_rate": 0.00015115130086759066, "loss": 0.0116, "step": 382820 }, { "epoch": 0.99, "learning_rate": 0.0001511474126512192, "loss": 0.0133, "step": 382830 }, { "epoch": 0.99, "learning_rate": 0.00015114352443484772, "loss": 0.0133, "step": 382840 }, { "epoch": 0.99, "learning_rate": 0.00015113963621847626, "loss": 0.0109, "step": 382850 }, { "epoch": 0.99, "learning_rate": 0.0001511357480021048, "loss": 0.0122, "step": 382860 }, { "epoch": 0.99, "learning_rate": 0.00015113185978573335, "loss": 0.0142, "step": 382870 }, { "epoch": 0.99, "learning_rate": 0.00015112797156936186, "loss": 0.0115, "step": 382880 }, { "epoch": 0.99, "learning_rate": 0.0001511240833529904, "loss": 0.0164, "step": 382890 }, { "epoch": 0.99, "learning_rate": 0.00015112019513661897, "loss": 0.012, "step": 382900 }, { "epoch": 0.99, "learning_rate": 0.00015111630692024749, "loss": 0.0116, "step": 382910 }, { "epoch": 0.99, "learning_rate": 0.00015111241870387603, "loss": 0.0138, "step": 382920 }, { "epoch": 0.99, "learning_rate": 0.00015110853048750454, "loss": 0.0124, "step": 382930 }, { "epoch": 0.99, "learning_rate": 0.0001511046422711331, "loss": 0.0149, "step": 382940 }, { "epoch": 0.99, "learning_rate": 0.00015110075405476162, "loss": 0.0135, "step": 382950 }, { "epoch": 0.99, "learning_rate": 0.00015109686583839017, "loss": 0.0111, "step": 382960 }, { "epoch": 0.99, "learning_rate": 0.00015109297762201868, "loss": 0.0147, "step": 382970 }, { "epoch": 0.99, "learning_rate": 0.00015108908940564725, "loss": 0.0155, "step": 382980 }, { "epoch": 0.99, "learning_rate": 0.00015108520118927576, "loss": 0.0117, "step": 382990 }, { "epoch": 0.99, "learning_rate": 0.0001510813129729043, "loss": 0.0117, "step": 383000 }, { "epoch": 0.99, "eval_cer": 0.8817096845078387, "eval_loss": 0.007927495054900646, "eval_runtime": 107.7064, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 383000 }, { "epoch": 0.99, "learning_rate": 0.00015107742475653282, "loss": 0.0139, "step": 383010 }, { "epoch": 0.99, "learning_rate": 0.0001510735365401614, "loss": 0.0155, "step": 383020 }, { "epoch": 0.99, "learning_rate": 0.0001510696483237899, "loss": 0.0108, "step": 383030 }, { "epoch": 0.99, "learning_rate": 0.00015106576010741845, "loss": 0.0092, "step": 383040 }, { "epoch": 0.99, "learning_rate": 0.00015106187189104696, "loss": 0.0114, "step": 383050 }, { "epoch": 0.99, "learning_rate": 0.00015105798367467553, "loss": 0.0119, "step": 383060 }, { "epoch": 0.99, "learning_rate": 0.00015105409545830407, "loss": 0.0147, "step": 383070 }, { "epoch": 0.99, "learning_rate": 0.00015105020724193258, "loss": 0.0122, "step": 383080 }, { "epoch": 0.99, "learning_rate": 0.00015104631902556113, "loss": 0.0143, "step": 383090 }, { "epoch": 0.99, "learning_rate": 0.00015104243080918964, "loss": 0.0155, "step": 383100 }, { "epoch": 0.99, "learning_rate": 0.0001510385425928182, "loss": 0.0108, "step": 383110 }, { "epoch": 0.99, "learning_rate": 0.00015103465437644672, "loss": 0.0242, "step": 383120 }, { "epoch": 0.99, "learning_rate": 0.00015103076616007527, "loss": 0.0108, "step": 383130 }, { "epoch": 0.99, "learning_rate": 0.00015102687794370378, "loss": 0.0117, "step": 383140 }, { "epoch": 0.99, "learning_rate": 0.00015102298972733235, "loss": 0.0103, "step": 383150 }, { "epoch": 0.99, "learning_rate": 0.00015101910151096086, "loss": 0.0116, "step": 383160 }, { "epoch": 0.99, "learning_rate": 0.0001510152132945894, "loss": 0.0157, "step": 383170 }, { "epoch": 0.99, "learning_rate": 0.00015101132507821792, "loss": 0.0145, "step": 383180 }, { "epoch": 0.99, "learning_rate": 0.0001510074368618465, "loss": 0.0142, "step": 383190 }, { "epoch": 0.99, "learning_rate": 0.000151003548645475, "loss": 0.0126, "step": 383200 }, { "epoch": 0.99, "learning_rate": 0.00015099966042910354, "loss": 0.0128, "step": 383210 }, { "epoch": 0.99, "learning_rate": 0.00015099577221273206, "loss": 0.0142, "step": 383220 }, { "epoch": 0.99, "learning_rate": 0.00015099188399636063, "loss": 0.0126, "step": 383230 }, { "epoch": 0.99, "learning_rate": 0.00015098799577998917, "loss": 0.0134, "step": 383240 }, { "epoch": 0.99, "learning_rate": 0.00015098410756361768, "loss": 0.0111, "step": 383250 }, { "epoch": 0.99, "learning_rate": 0.0001509802193472462, "loss": 0.0126, "step": 383260 }, { "epoch": 0.99, "learning_rate": 0.00015097633113087477, "loss": 0.0134, "step": 383270 }, { "epoch": 0.99, "learning_rate": 0.0001509724429145033, "loss": 0.0146, "step": 383280 }, { "epoch": 0.99, "learning_rate": 0.00015096855469813182, "loss": 0.0133, "step": 383290 }, { "epoch": 0.99, "learning_rate": 0.00015096466648176037, "loss": 0.009, "step": 383300 }, { "epoch": 0.99, "learning_rate": 0.0001509607782653889, "loss": 0.0138, "step": 383310 }, { "epoch": 0.99, "learning_rate": 0.00015095689004901745, "loss": 0.0114, "step": 383320 }, { "epoch": 0.99, "learning_rate": 0.00015095300183264596, "loss": 0.0128, "step": 383330 }, { "epoch": 0.99, "learning_rate": 0.0001509491136162745, "loss": 0.0102, "step": 383340 }, { "epoch": 0.99, "learning_rate": 0.00015094522539990302, "loss": 0.0133, "step": 383350 }, { "epoch": 0.99, "learning_rate": 0.0001509413371835316, "loss": 0.014, "step": 383360 }, { "epoch": 0.99, "learning_rate": 0.0001509374489671601, "loss": 0.0157, "step": 383370 }, { "epoch": 0.99, "learning_rate": 0.00015093356075078864, "loss": 0.0139, "step": 383380 }, { "epoch": 0.99, "learning_rate": 0.00015092967253441716, "loss": 0.0178, "step": 383390 }, { "epoch": 0.99, "learning_rate": 0.00015092578431804573, "loss": 0.0184, "step": 383400 }, { "epoch": 0.99, "learning_rate": 0.00015092189610167427, "loss": 0.0112, "step": 383410 }, { "epoch": 0.99, "learning_rate": 0.00015091800788530278, "loss": 0.0135, "step": 383420 }, { "epoch": 0.99, "learning_rate": 0.0001509141196689313, "loss": 0.0116, "step": 383430 }, { "epoch": 0.99, "learning_rate": 0.00015091023145255987, "loss": 0.0149, "step": 383440 }, { "epoch": 0.99, "learning_rate": 0.0001509063432361884, "loss": 0.0173, "step": 383450 }, { "epoch": 0.99, "learning_rate": 0.00015090245501981692, "loss": 0.0138, "step": 383460 }, { "epoch": 0.99, "learning_rate": 0.00015089856680344546, "loss": 0.0106, "step": 383470 }, { "epoch": 0.99, "learning_rate": 0.000150894678587074, "loss": 0.0126, "step": 383480 }, { "epoch": 0.99, "learning_rate": 0.00015089079037070255, "loss": 0.0106, "step": 383490 }, { "epoch": 0.99, "learning_rate": 0.00015088690215433106, "loss": 0.0113, "step": 383500 }, { "epoch": 0.99, "learning_rate": 0.0001508830139379596, "loss": 0.0112, "step": 383510 }, { "epoch": 0.99, "learning_rate": 0.00015087912572158815, "loss": 0.0123, "step": 383520 }, { "epoch": 0.99, "learning_rate": 0.0001508752375052167, "loss": 0.0125, "step": 383530 }, { "epoch": 0.99, "learning_rate": 0.0001508713492888452, "loss": 0.0095, "step": 383540 }, { "epoch": 0.99, "learning_rate": 0.00015086746107247374, "loss": 0.0099, "step": 383550 }, { "epoch": 0.99, "learning_rate": 0.0001508635728561023, "loss": 0.0119, "step": 383560 }, { "epoch": 0.99, "learning_rate": 0.00015085968463973083, "loss": 0.0121, "step": 383570 }, { "epoch": 0.99, "learning_rate": 0.00015085579642335934, "loss": 0.013, "step": 383580 }, { "epoch": 0.99, "learning_rate": 0.00015085190820698788, "loss": 0.0144, "step": 383590 }, { "epoch": 0.99, "learning_rate": 0.0001508480199906164, "loss": 0.0091, "step": 383600 }, { "epoch": 0.99, "learning_rate": 0.00015084413177424497, "loss": 0.0111, "step": 383610 }, { "epoch": 0.99, "learning_rate": 0.0001508402435578735, "loss": 0.0099, "step": 383620 }, { "epoch": 0.99, "learning_rate": 0.00015083635534150202, "loss": 0.0111, "step": 383630 }, { "epoch": 0.99, "learning_rate": 0.00015083246712513056, "loss": 0.0098, "step": 383640 }, { "epoch": 0.99, "learning_rate": 0.0001508285789087591, "loss": 0.0119, "step": 383650 }, { "epoch": 0.99, "learning_rate": 0.00015082469069238765, "loss": 0.01, "step": 383660 }, { "epoch": 0.99, "learning_rate": 0.00015082080247601616, "loss": 0.0126, "step": 383670 }, { "epoch": 0.99, "learning_rate": 0.0001508169142596447, "loss": 0.015, "step": 383680 }, { "epoch": 0.99, "learning_rate": 0.00015081302604327324, "loss": 0.0209, "step": 383690 }, { "epoch": 0.99, "learning_rate": 0.0001508091378269018, "loss": 0.0127, "step": 383700 }, { "epoch": 0.99, "learning_rate": 0.0001508052496105303, "loss": 0.0144, "step": 383710 }, { "epoch": 0.99, "learning_rate": 0.00015080136139415884, "loss": 0.0173, "step": 383720 }, { "epoch": 0.99, "learning_rate": 0.00015079747317778738, "loss": 0.0117, "step": 383730 }, { "epoch": 0.99, "learning_rate": 0.00015079358496141593, "loss": 0.0108, "step": 383740 }, { "epoch": 0.99, "learning_rate": 0.00015078969674504444, "loss": 0.0114, "step": 383750 }, { "epoch": 0.99, "learning_rate": 0.00015078580852867298, "loss": 0.0105, "step": 383760 }, { "epoch": 0.99, "learning_rate": 0.00015078192031230155, "loss": 0.0156, "step": 383770 }, { "epoch": 0.99, "learning_rate": 0.00015077803209593007, "loss": 0.0161, "step": 383780 }, { "epoch": 0.99, "learning_rate": 0.0001507741438795586, "loss": 0.0138, "step": 383790 }, { "epoch": 0.99, "learning_rate": 0.00015077025566318712, "loss": 0.0151, "step": 383800 }, { "epoch": 0.99, "learning_rate": 0.0001507663674468157, "loss": 0.0129, "step": 383810 }, { "epoch": 0.99, "learning_rate": 0.0001507624792304442, "loss": 0.0121, "step": 383820 }, { "epoch": 0.99, "learning_rate": 0.00015075859101407275, "loss": 0.0115, "step": 383830 }, { "epoch": 0.99, "learning_rate": 0.00015075470279770126, "loss": 0.0112, "step": 383840 }, { "epoch": 0.99, "learning_rate": 0.0001507508145813298, "loss": 0.0095, "step": 383850 }, { "epoch": 1.0, "learning_rate": 0.00015074692636495834, "loss": 0.0146, "step": 383860 }, { "epoch": 1.0, "learning_rate": 0.00015074303814858689, "loss": 0.012, "step": 383870 }, { "epoch": 1.0, "learning_rate": 0.0001507391499322154, "loss": 0.0118, "step": 383880 }, { "epoch": 1.0, "learning_rate": 0.00015073526171584394, "loss": 0.0104, "step": 383890 }, { "epoch": 1.0, "learning_rate": 0.00015073137349947248, "loss": 0.0106, "step": 383900 }, { "epoch": 1.0, "learning_rate": 0.00015072748528310103, "loss": 0.0099, "step": 383910 }, { "epoch": 1.0, "learning_rate": 0.00015072359706672954, "loss": 0.0112, "step": 383920 }, { "epoch": 1.0, "learning_rate": 0.00015071970885035808, "loss": 0.0108, "step": 383930 }, { "epoch": 1.0, "learning_rate": 0.00015071582063398665, "loss": 0.0096, "step": 383940 }, { "epoch": 1.0, "learning_rate": 0.00015071193241761516, "loss": 0.0128, "step": 383950 }, { "epoch": 1.0, "learning_rate": 0.0001507080442012437, "loss": 0.0121, "step": 383960 }, { "epoch": 1.0, "learning_rate": 0.00015070415598487222, "loss": 0.0115, "step": 383970 }, { "epoch": 1.0, "learning_rate": 0.0001507002677685008, "loss": 0.0121, "step": 383980 }, { "epoch": 1.0, "learning_rate": 0.0001506963795521293, "loss": 0.0113, "step": 383990 }, { "epoch": 1.0, "learning_rate": 0.00015069249133575785, "loss": 0.0105, "step": 384000 }, { "epoch": 1.0, "eval_cer": 0.8817054855970361, "eval_loss": 0.007804430089890957, "eval_runtime": 107.5434, "eval_samples_per_second": 18.597, "eval_steps_per_second": 4.649, "step": 384000 }, { "epoch": 1.0, "learning_rate": 0.00015068860311938636, "loss": 0.0113, "step": 384010 }, { "epoch": 1.0, "learning_rate": 0.00015068471490301493, "loss": 0.0136, "step": 384020 }, { "epoch": 1.0, "learning_rate": 0.00015068082668664344, "loss": 0.0141, "step": 384030 }, { "epoch": 1.0, "learning_rate": 0.00015067693847027199, "loss": 0.0123, "step": 384040 }, { "epoch": 1.0, "learning_rate": 0.0001506730502539005, "loss": 0.0147, "step": 384050 }, { "epoch": 1.0, "learning_rate": 0.00015066916203752907, "loss": 0.0108, "step": 384060 }, { "epoch": 1.0, "learning_rate": 0.00015066527382115758, "loss": 0.0143, "step": 384070 }, { "epoch": 1.0, "learning_rate": 0.00015066138560478612, "loss": 0.0113, "step": 384080 }, { "epoch": 1.0, "learning_rate": 0.00015065749738841464, "loss": 0.0119, "step": 384090 }, { "epoch": 1.0, "learning_rate": 0.00015065360917204318, "loss": 0.0123, "step": 384100 }, { "epoch": 1.0, "learning_rate": 0.00015064972095567175, "loss": 0.0116, "step": 384110 }, { "epoch": 1.0, "learning_rate": 0.00015064583273930026, "loss": 0.01, "step": 384120 }, { "epoch": 1.0, "learning_rate": 0.0001506419445229288, "loss": 0.0107, "step": 384130 }, { "epoch": 1.0, "learning_rate": 0.00015063805630655732, "loss": 0.0083, "step": 384140 }, { "epoch": 1.0, "learning_rate": 0.0001506341680901859, "loss": 0.0102, "step": 384150 }, { "epoch": 1.0, "learning_rate": 0.0001506302798738144, "loss": 0.0103, "step": 384160 }, { "epoch": 1.0, "learning_rate": 0.00015062639165744295, "loss": 0.0144, "step": 384170 }, { "epoch": 1.0, "learning_rate": 0.00015062250344107146, "loss": 0.0112, "step": 384180 }, { "epoch": 1.0, "learning_rate": 0.00015061861522470003, "loss": 0.0129, "step": 384190 }, { "epoch": 1.0, "learning_rate": 0.00015061472700832854, "loss": 0.0132, "step": 384200 }, { "epoch": 1.0, "learning_rate": 0.00015061083879195708, "loss": 0.01, "step": 384210 }, { "epoch": 1.0, "learning_rate": 0.0001506069505755856, "loss": 0.0116, "step": 384220 }, { "epoch": 1.0, "learning_rate": 0.00015060306235921417, "loss": 0.0119, "step": 384230 }, { "epoch": 1.0, "learning_rate": 0.00015059917414284268, "loss": 0.0107, "step": 384240 }, { "epoch": 1.0, "learning_rate": 0.00015059528592647122, "loss": 0.0119, "step": 384250 }, { "epoch": 1.0, "learning_rate": 0.00015059139771009974, "loss": 0.0129, "step": 384260 }, { "epoch": 1.0, "learning_rate": 0.0001505875094937283, "loss": 0.014, "step": 384270 }, { "epoch": 1.0, "learning_rate": 0.00015058362127735685, "loss": 0.011, "step": 384280 }, { "epoch": 1.0, "learning_rate": 0.00015057973306098536, "loss": 0.0124, "step": 384290 }, { "epoch": 1.0, "learning_rate": 0.00015057584484461388, "loss": 0.0145, "step": 384300 }, { "epoch": 1.0, "learning_rate": 0.00015057195662824245, "loss": 0.0105, "step": 384310 }, { "epoch": 1.0, "learning_rate": 0.000150568068411871, "loss": 0.0187, "step": 384320 }, { "epoch": 1.0, "learning_rate": 0.0001505641801954995, "loss": 0.0113, "step": 384330 }, { "epoch": 1.0, "learning_rate": 0.00015056029197912804, "loss": 0.0134, "step": 384340 }, { "epoch": 1.0, "learning_rate": 0.00015055640376275656, "loss": 0.012, "step": 384350 }, { "epoch": 1.0, "learning_rate": 0.00015055251554638513, "loss": 0.0111, "step": 384360 }, { "epoch": 1.0, "learning_rate": 0.00015054862733001364, "loss": 0.0099, "step": 384370 }, { "epoch": 1.0, "learning_rate": 0.00015054473911364218, "loss": 0.0109, "step": 384380 }, { "epoch": 1.0, "learning_rate": 0.0001505408508972707, "loss": 0.0145, "step": 384390 }, { "epoch": 1.0, "learning_rate": 0.00015053696268089927, "loss": 0.0145, "step": 384400 }, { "epoch": 1.0, "learning_rate": 0.00015053307446452778, "loss": 0.0165, "step": 384410 }, { "epoch": 1.0, "learning_rate": 0.00015052918624815632, "loss": 0.0141, "step": 384420 }, { "epoch": 1.0, "learning_rate": 0.00015052529803178484, "loss": 0.013, "step": 384430 }, { "epoch": 1.0, "learning_rate": 0.0001505214098154134, "loss": 0.0132, "step": 384440 }, { "epoch": 1.0, "learning_rate": 0.00015051752159904192, "loss": 0.0123, "step": 384450 }, { "epoch": 1.0, "learning_rate": 0.00015051363338267046, "loss": 0.0123, "step": 384460 }, { "epoch": 1.0, "learning_rate": 0.00015050974516629898, "loss": 0.0157, "step": 384470 }, { "epoch": 1.0, "learning_rate": 0.00015050585694992755, "loss": 0.014, "step": 384480 }, { "epoch": 1.0, "learning_rate": 0.0001505019687335561, "loss": 0.0114, "step": 384490 }, { "epoch": 1.0, "learning_rate": 0.0001504980805171846, "loss": 0.0138, "step": 384500 }, { "epoch": 1.0, "learning_rate": 0.00015049419230081314, "loss": 0.0127, "step": 384510 }, { "epoch": 1.0, "learning_rate": 0.00015049030408444169, "loss": 0.0106, "step": 384520 }, { "epoch": 1.0, "learning_rate": 0.00015048641586807023, "loss": 0.0103, "step": 384530 }, { "epoch": 1.0, "learning_rate": 0.00015048252765169874, "loss": 0.0133, "step": 384540 }, { "epoch": 1.0, "learning_rate": 0.00015047863943532728, "loss": 0.0101, "step": 384550 }, { "epoch": 1.0, "learning_rate": 0.00015047475121895583, "loss": 0.0129, "step": 384560 }, { "epoch": 1.0, "learning_rate": 0.00015047086300258437, "loss": 0.011, "step": 384570 }, { "epoch": 1.0, "learning_rate": 0.00015046697478621288, "loss": 0.0148, "step": 384580 }, { "epoch": 1.0, "learning_rate": 0.00015046308656984142, "loss": 0.014, "step": 384590 }, { "epoch": 1.0, "learning_rate": 0.00015045919835346994, "loss": 0.0102, "step": 384600 }, { "epoch": 1.0, "learning_rate": 0.0001504553101370985, "loss": 0.0137, "step": 384610 }, { "epoch": 1.0, "learning_rate": 0.00015045142192072702, "loss": 0.0123, "step": 384620 }, { "epoch": 1.0, "learning_rate": 0.00015044753370435556, "loss": 0.0105, "step": 384630 }, { "epoch": 1.0, "learning_rate": 0.00015044364548798408, "loss": 0.0161, "step": 384640 }, { "epoch": 1.0, "learning_rate": 0.00015043975727161265, "loss": 0.0134, "step": 384650 }, { "epoch": 1.0, "learning_rate": 0.0001504358690552412, "loss": 0.0097, "step": 384660 }, { "epoch": 1.0, "learning_rate": 0.0001504319808388697, "loss": 0.0136, "step": 384670 }, { "epoch": 1.0, "learning_rate": 0.00015042809262249824, "loss": 0.013, "step": 384680 }, { "epoch": 1.0, "learning_rate": 0.00015042420440612679, "loss": 0.0129, "step": 384690 }, { "epoch": 1.0, "learning_rate": 0.00015042031618975533, "loss": 0.0158, "step": 384700 }, { "epoch": 1.0, "learning_rate": 0.00015041642797338384, "loss": 0.0154, "step": 384710 }, { "epoch": 1.0, "learning_rate": 0.00015041253975701238, "loss": 0.0128, "step": 384720 }, { "epoch": 1.0, "learning_rate": 0.00015040865154064092, "loss": 0.0132, "step": 384730 }, { "epoch": 1.0, "learning_rate": 0.00015040476332426947, "loss": 0.0127, "step": 384740 }, { "epoch": 1.0, "learning_rate": 0.00015040087510789798, "loss": 0.0137, "step": 384750 }, { "epoch": 1.0, "learning_rate": 0.00015039698689152652, "loss": 0.011, "step": 384760 }, { "epoch": 1.0, "learning_rate": 0.00015039309867515506, "loss": 0.013, "step": 384770 }, { "epoch": 1.0, "learning_rate": 0.0001503892104587836, "loss": 0.0136, "step": 384780 }, { "epoch": 1.0, "learning_rate": 0.00015038532224241212, "loss": 0.013, "step": 384790 }, { "epoch": 1.0, "learning_rate": 0.00015038143402604066, "loss": 0.0152, "step": 384800 }, { "epoch": 1.0, "learning_rate": 0.00015037754580966923, "loss": 0.0136, "step": 384810 }, { "epoch": 1.0, "learning_rate": 0.00015037365759329775, "loss": 0.0135, "step": 384820 }, { "epoch": 1.0, "learning_rate": 0.0001503697693769263, "loss": 0.0113, "step": 384830 }, { "epoch": 1.0, "learning_rate": 0.0001503658811605548, "loss": 0.0111, "step": 384840 }, { "epoch": 1.0, "learning_rate": 0.00015036199294418332, "loss": 0.0124, "step": 384850 }, { "epoch": 1.0, "learning_rate": 0.00015035810472781188, "loss": 0.0149, "step": 384860 }, { "epoch": 1.0, "learning_rate": 0.00015035421651144043, "loss": 0.0117, "step": 384870 }, { "epoch": 1.0, "learning_rate": 0.00015035032829506894, "loss": 0.0097, "step": 384880 }, { "epoch": 1.0, "learning_rate": 0.00015034644007869748, "loss": 0.0115, "step": 384890 }, { "epoch": 1.0, "learning_rate": 0.00015034255186232602, "loss": 0.0122, "step": 384900 }, { "epoch": 1.0, "learning_rate": 0.00015033866364595457, "loss": 0.0114, "step": 384910 }, { "epoch": 1.0, "learning_rate": 0.00015033477542958308, "loss": 0.0139, "step": 384920 }, { "epoch": 1.0, "learning_rate": 0.00015033088721321162, "loss": 0.0123, "step": 384930 }, { "epoch": 1.0, "learning_rate": 0.00015032699899684016, "loss": 0.0112, "step": 384940 }, { "epoch": 1.0, "learning_rate": 0.0001503231107804687, "loss": 0.0172, "step": 384950 }, { "epoch": 1.0, "learning_rate": 0.00015031922256409722, "loss": 0.0141, "step": 384960 }, { "epoch": 1.0, "learning_rate": 0.00015031533434772576, "loss": 0.0112, "step": 384970 }, { "epoch": 1.0, "learning_rate": 0.00015031144613135433, "loss": 0.0193, "step": 384980 }, { "epoch": 1.0, "learning_rate": 0.00015030755791498284, "loss": 0.0177, "step": 384990 }, { "epoch": 1.0, "learning_rate": 0.00015030366969861139, "loss": 0.0152, "step": 385000 }, { "epoch": 1.0, "eval_cer": 0.8817684692590742, "eval_loss": 0.00825272686779499, "eval_runtime": 107.6549, "eval_samples_per_second": 18.578, "eval_steps_per_second": 4.644, "step": 385000 }, { "epoch": 1.0, "learning_rate": 0.0001502997814822399, "loss": 0.0123, "step": 385010 }, { "epoch": 1.0, "learning_rate": 0.00015029589326586847, "loss": 0.0152, "step": 385020 }, { "epoch": 1.0, "learning_rate": 0.00015029200504949698, "loss": 0.0131, "step": 385030 }, { "epoch": 1.0, "learning_rate": 0.00015028811683312553, "loss": 0.0146, "step": 385040 }, { "epoch": 1.0, "learning_rate": 0.00015028422861675404, "loss": 0.0111, "step": 385050 }, { "epoch": 1.0, "learning_rate": 0.0001502803404003826, "loss": 0.0283, "step": 385060 }, { "epoch": 1.0, "learning_rate": 0.00015027645218401112, "loss": 0.0101, "step": 385070 }, { "epoch": 1.0, "learning_rate": 0.00015027256396763967, "loss": 0.0164, "step": 385080 }, { "epoch": 1.0, "learning_rate": 0.00015026867575126818, "loss": 0.0117, "step": 385090 }, { "epoch": 1.0, "learning_rate": 0.00015026478753489672, "loss": 0.0097, "step": 385100 }, { "epoch": 1.0, "learning_rate": 0.00015026089931852526, "loss": 0.0122, "step": 385110 }, { "epoch": 1.0, "learning_rate": 0.0001502570111021538, "loss": 0.0146, "step": 385120 }, { "epoch": 1.0, "learning_rate": 0.00015025312288578232, "loss": 0.0125, "step": 385130 }, { "epoch": 1.0, "learning_rate": 0.00015024923466941086, "loss": 0.0106, "step": 385140 }, { "epoch": 1.0, "learning_rate": 0.00015024534645303943, "loss": 0.0127, "step": 385150 }, { "epoch": 1.0, "learning_rate": 0.00015024145823666794, "loss": 0.0134, "step": 385160 }, { "epoch": 1.0, "learning_rate": 0.00015023757002029646, "loss": 0.0124, "step": 385170 }, { "epoch": 1.0, "learning_rate": 0.000150233681803925, "loss": 0.01, "step": 385180 }, { "epoch": 1.0, "learning_rate": 0.00015022979358755357, "loss": 0.0133, "step": 385190 }, { "epoch": 1.0, "learning_rate": 0.00015022590537118208, "loss": 0.0118, "step": 385200 }, { "epoch": 1.0, "learning_rate": 0.00015022201715481063, "loss": 0.0146, "step": 385210 }, { "epoch": 1.0, "learning_rate": 0.00015021812893843914, "loss": 0.0123, "step": 385220 }, { "epoch": 1.0, "learning_rate": 0.0001502142407220677, "loss": 0.0109, "step": 385230 }, { "epoch": 1.0, "learning_rate": 0.00015021035250569622, "loss": 0.0147, "step": 385240 }, { "epoch": 1.0, "learning_rate": 0.00015020646428932476, "loss": 0.0116, "step": 385250 }, { "epoch": 1.0, "learning_rate": 0.00015020257607295328, "loss": 0.0148, "step": 385260 }, { "epoch": 1.0, "learning_rate": 0.00015019868785658185, "loss": 0.0129, "step": 385270 }, { "epoch": 1.0, "learning_rate": 0.00015019479964021036, "loss": 0.0109, "step": 385280 }, { "epoch": 1.0, "learning_rate": 0.0001501909114238389, "loss": 0.0143, "step": 385290 }, { "epoch": 1.0, "learning_rate": 0.00015018702320746742, "loss": 0.0145, "step": 385300 }, { "epoch": 1.0, "learning_rate": 0.00015018313499109596, "loss": 0.0175, "step": 385310 }, { "epoch": 1.0, "learning_rate": 0.0001501792467747245, "loss": 0.0132, "step": 385320 }, { "epoch": 1.0, "learning_rate": 0.00015017535855835304, "loss": 0.0113, "step": 385330 }, { "epoch": 1.0, "learning_rate": 0.00015017147034198156, "loss": 0.0115, "step": 385340 }, { "epoch": 1.0, "learning_rate": 0.0001501675821256101, "loss": 0.0132, "step": 385350 }, { "epoch": 1.0, "learning_rate": 0.00015016369390923867, "loss": 0.0101, "step": 385360 }, { "epoch": 1.0, "learning_rate": 0.00015015980569286718, "loss": 0.0134, "step": 385370 }, { "epoch": 1.0, "learning_rate": 0.00015015591747649572, "loss": 0.0125, "step": 385380 }, { "epoch": 1.0, "learning_rate": 0.00015015202926012424, "loss": 0.0112, "step": 385390 }, { "epoch": 1.0, "learning_rate": 0.0001501481410437528, "loss": 0.0132, "step": 385400 }, { "epoch": 1.0, "learning_rate": 0.00015014425282738132, "loss": 0.0116, "step": 385410 }, { "epoch": 1.0, "learning_rate": 0.00015014036461100986, "loss": 0.013, "step": 385420 }, { "epoch": 1.0, "learning_rate": 0.00015013647639463838, "loss": 0.0124, "step": 385430 }, { "epoch": 1.0, "learning_rate": 0.00015013258817826695, "loss": 0.0119, "step": 385440 }, { "epoch": 1.0, "learning_rate": 0.00015012869996189546, "loss": 0.0138, "step": 385450 }, { "epoch": 1.0, "learning_rate": 0.000150124811745524, "loss": 0.0112, "step": 385460 }, { "epoch": 1.0, "learning_rate": 0.00015012092352915252, "loss": 0.0169, "step": 385470 }, { "epoch": 1.0, "learning_rate": 0.0001501170353127811, "loss": 0.0123, "step": 385480 }, { "epoch": 1.0, "learning_rate": 0.0001501131470964096, "loss": 0.0102, "step": 385490 }, { "epoch": 1.0, "learning_rate": 0.00015010925888003814, "loss": 0.014, "step": 385500 }, { "epoch": 1.0, "learning_rate": 0.00015010537066366666, "loss": 0.0085, "step": 385510 }, { "epoch": 1.0, "learning_rate": 0.00015010148244729523, "loss": 0.0164, "step": 385520 }, { "epoch": 1.0, "learning_rate": 0.00015009759423092377, "loss": 0.0149, "step": 385530 }, { "epoch": 1.0, "learning_rate": 0.00015009370601455228, "loss": 0.0147, "step": 385540 }, { "epoch": 1.0, "learning_rate": 0.00015008981779818082, "loss": 0.0134, "step": 385550 }, { "epoch": 1.0, "learning_rate": 0.00015008592958180934, "loss": 0.0155, "step": 385560 }, { "epoch": 1.0, "learning_rate": 0.0001500820413654379, "loss": 0.0123, "step": 385570 }, { "epoch": 1.0, "learning_rate": 0.00015007815314906642, "loss": 0.0111, "step": 385580 }, { "epoch": 1.0, "learning_rate": 0.00015007426493269496, "loss": 0.01, "step": 385590 }, { "epoch": 1.0, "learning_rate": 0.00015007037671632348, "loss": 0.0141, "step": 385600 }, { "epoch": 1.0, "learning_rate": 0.00015006648849995205, "loss": 0.0108, "step": 385610 }, { "epoch": 1.0, "learning_rate": 0.00015006260028358056, "loss": 0.0098, "step": 385620 }, { "epoch": 1.0, "learning_rate": 0.0001500587120672091, "loss": 0.014, "step": 385630 }, { "epoch": 1.0, "learning_rate": 0.00015005482385083762, "loss": 0.0129, "step": 385640 }, { "epoch": 1.0, "learning_rate": 0.00015005093563446619, "loss": 0.0148, "step": 385650 }, { "epoch": 1.0, "learning_rate": 0.0001500470474180947, "loss": 0.014, "step": 385660 }, { "epoch": 1.0, "learning_rate": 0.00015004315920172324, "loss": 0.0143, "step": 385670 }, { "epoch": 1.0, "learning_rate": 0.00015003927098535176, "loss": 0.0189, "step": 385680 }, { "epoch": 1.0, "learning_rate": 0.00015003538276898033, "loss": 0.0143, "step": 385690 }, { "epoch": 1.0, "learning_rate": 0.00015003149455260887, "loss": 0.0148, "step": 385700 }, { "epoch": 1.0, "learning_rate": 0.00015002760633623738, "loss": 0.0109, "step": 385710 }, { "epoch": 1.0, "learning_rate": 0.0001500237181198659, "loss": 0.0114, "step": 385720 }, { "epoch": 1.0, "learning_rate": 0.00015001982990349447, "loss": 0.0103, "step": 385730 }, { "epoch": 1.0, "learning_rate": 0.000150015941687123, "loss": 0.0139, "step": 385740 }, { "epoch": 1.0, "learning_rate": 0.00015001205347075152, "loss": 0.0154, "step": 385750 }, { "epoch": 1.0, "learning_rate": 0.00015000816525438006, "loss": 0.0091, "step": 385760 }, { "epoch": 1.0, "learning_rate": 0.0001500042770380086, "loss": 0.0138, "step": 385770 }, { "epoch": 1.0, "learning_rate": 0.00015000038882163715, "loss": 0.0131, "step": 385780 }, { "epoch": 1.0, "learning_rate": 0.00014999650060526566, "loss": 0.0111, "step": 385790 }, { "epoch": 1.0, "learning_rate": 0.0001499926123888942, "loss": 0.0114, "step": 385800 }, { "epoch": 1.0, "learning_rate": 0.00014998872417252274, "loss": 0.0098, "step": 385810 }, { "epoch": 1.0, "learning_rate": 0.00014998483595615126, "loss": 0.0126, "step": 385820 }, { "epoch": 1.0, "learning_rate": 0.0001499809477397798, "loss": 0.0163, "step": 385830 }, { "epoch": 1.0, "learning_rate": 0.00014997705952340834, "loss": 0.0095, "step": 385840 }, { "epoch": 1.0, "learning_rate": 0.00014997317130703688, "loss": 0.0119, "step": 385850 }, { "epoch": 1.0, "learning_rate": 0.0001499692830906654, "loss": 0.0107, "step": 385860 }, { "epoch": 1.0, "learning_rate": 0.00014996539487429397, "loss": 0.0109, "step": 385870 }, { "epoch": 1.0, "learning_rate": 0.00014996150665792248, "loss": 0.0148, "step": 385880 }, { "epoch": 1.0, "learning_rate": 0.00014995761844155102, "loss": 0.0087, "step": 385890 }, { "epoch": 1.0, "learning_rate": 0.00014995373022517956, "loss": 0.0119, "step": 385900 }, { "epoch": 1.0, "learning_rate": 0.0001499498420088081, "loss": 0.0113, "step": 385910 }, { "epoch": 1.0, "learning_rate": 0.00014994595379243662, "loss": 0.0124, "step": 385920 }, { "epoch": 1.0, "learning_rate": 0.00014994206557606516, "loss": 0.0123, "step": 385930 }, { "epoch": 1.0, "learning_rate": 0.0001499381773596937, "loss": 0.0094, "step": 385940 }, { "epoch": 1.0, "learning_rate": 0.00014993428914332225, "loss": 0.0124, "step": 385950 }, { "epoch": 1.0, "learning_rate": 0.00014993040092695076, "loss": 0.0124, "step": 385960 }, { "epoch": 1.0, "learning_rate": 0.0001499265127105793, "loss": 0.0127, "step": 385970 }, { "epoch": 1.0, "learning_rate": 0.00014992262449420784, "loss": 0.0145, "step": 385980 }, { "epoch": 1.0, "learning_rate": 0.00014991873627783639, "loss": 0.0126, "step": 385990 }, { "epoch": 1.0, "learning_rate": 0.0001499148480614649, "loss": 0.0114, "step": 386000 }, { "epoch": 1.0, "eval_cer": 0.8817152830555753, "eval_loss": 0.008142529986798763, "eval_runtime": 108.5328, "eval_samples_per_second": 18.428, "eval_steps_per_second": 4.607, "step": 386000 }, { "epoch": 1.0, "learning_rate": 0.00014991095984509344, "loss": 0.0097, "step": 386010 }, { "epoch": 1.0, "learning_rate": 0.00014990707162872198, "loss": 0.0101, "step": 386020 }, { "epoch": 1.0, "learning_rate": 0.00014990318341235052, "loss": 0.0224, "step": 386030 }, { "epoch": 1.0, "learning_rate": 0.00014989929519597904, "loss": 0.011, "step": 386040 }, { "epoch": 1.0, "learning_rate": 0.0001498954069796076, "loss": 0.009, "step": 386050 }, { "epoch": 1.0, "learning_rate": 0.00014989151876323612, "loss": 0.0136, "step": 386060 }, { "epoch": 1.0, "learning_rate": 0.00014988763054686466, "loss": 0.0163, "step": 386070 }, { "epoch": 1.0, "learning_rate": 0.0001498837423304932, "loss": 0.0121, "step": 386080 }, { "epoch": 1.0, "learning_rate": 0.00014987985411412172, "loss": 0.0124, "step": 386090 }, { "epoch": 1.0, "learning_rate": 0.00014987596589775026, "loss": 0.0129, "step": 386100 }, { "epoch": 1.0, "learning_rate": 0.0001498720776813788, "loss": 0.01, "step": 386110 }, { "epoch": 1.0, "learning_rate": 0.00014986818946500735, "loss": 0.0123, "step": 386120 }, { "epoch": 1.0, "learning_rate": 0.00014986430124863586, "loss": 0.0117, "step": 386130 }, { "epoch": 1.0, "learning_rate": 0.0001498604130322644, "loss": 0.0137, "step": 386140 }, { "epoch": 1.0, "learning_rate": 0.00014985652481589294, "loss": 0.0128, "step": 386150 }, { "epoch": 1.0, "learning_rate": 0.00014985263659952148, "loss": 0.0109, "step": 386160 }, { "epoch": 1.0, "learning_rate": 0.00014984874838315, "loss": 0.0151, "step": 386170 }, { "epoch": 1.0, "learning_rate": 0.00014984486016677854, "loss": 0.0159, "step": 386180 }, { "epoch": 1.0, "learning_rate": 0.00014984097195040708, "loss": 0.0119, "step": 386190 }, { "epoch": 1.0, "learning_rate": 0.00014983708373403562, "loss": 0.0076, "step": 386200 }, { "epoch": 1.0, "learning_rate": 0.00014983319551766414, "loss": 0.0124, "step": 386210 }, { "epoch": 1.0, "learning_rate": 0.0001498293073012927, "loss": 0.0112, "step": 386220 }, { "epoch": 1.0, "learning_rate": 0.00014982541908492122, "loss": 0.0115, "step": 386230 }, { "epoch": 1.0, "learning_rate": 0.00014982153086854976, "loss": 0.0139, "step": 386240 }, { "epoch": 1.0, "learning_rate": 0.0001498176426521783, "loss": 0.0147, "step": 386250 }, { "epoch": 1.0, "learning_rate": 0.00014981375443580685, "loss": 0.0116, "step": 386260 }, { "epoch": 1.0, "learning_rate": 0.00014980986621943536, "loss": 0.0134, "step": 386270 }, { "epoch": 1.0, "learning_rate": 0.0001498059780030639, "loss": 0.0308, "step": 386280 }, { "epoch": 1.0, "learning_rate": 0.00014980208978669244, "loss": 0.0141, "step": 386290 }, { "epoch": 1.0, "learning_rate": 0.00014979820157032099, "loss": 0.104, "step": 386300 }, { "epoch": 1.0, "learning_rate": 0.0001497943133539495, "loss": 0.5434, "step": 386310 }, { "epoch": 1.0, "learning_rate": 0.00014979042513757804, "loss": 1.8435, "step": 386320 }, { "epoch": 1.0, "learning_rate": 0.00014978653692120658, "loss": 2.0344, "step": 386330 }, { "epoch": 1.0, "learning_rate": 0.0001497826487048351, "loss": 0.1523, "step": 386340 }, { "epoch": 1.0, "learning_rate": 0.00014977876048846364, "loss": 0.0122, "step": 386350 }, { "epoch": 1.0, "learning_rate": 0.00014977487227209218, "loss": 0.014, "step": 386360 }, { "epoch": 1.0, "learning_rate": 0.00014977098405572072, "loss": 0.0085, "step": 386370 }, { "epoch": 1.0, "learning_rate": 0.00014976709583934924, "loss": 0.0128, "step": 386380 }, { "epoch": 1.0, "learning_rate": 0.0001497632076229778, "loss": 0.0133, "step": 386390 }, { "epoch": 1.0, "learning_rate": 0.00014975931940660632, "loss": 0.0289, "step": 386400 }, { "epoch": 1.0, "learning_rate": 0.00014975543119023486, "loss": 0.0107, "step": 386410 }, { "epoch": 1.0, "learning_rate": 0.0001497515429738634, "loss": 0.0279, "step": 386420 }, { "epoch": 1.0, "learning_rate": 0.00014974765475749195, "loss": 0.0266, "step": 386430 }, { "epoch": 1.0, "learning_rate": 0.00014974376654112046, "loss": 0.0116, "step": 386440 }, { "epoch": 1.0, "learning_rate": 0.000149739878324749, "loss": 0.0258, "step": 386450 }, { "epoch": 1.0, "learning_rate": 0.00014973599010837754, "loss": 0.0115, "step": 386460 }, { "epoch": 1.0, "learning_rate": 0.00014973210189200609, "loss": 0.0249, "step": 386470 }, { "epoch": 1.0, "learning_rate": 0.0001497282136756346, "loss": 0.0266, "step": 386480 }, { "epoch": 1.0, "learning_rate": 0.00014972432545926314, "loss": 0.0361, "step": 386490 }, { "epoch": 1.0, "learning_rate": 0.00014972043724289168, "loss": 0.0119, "step": 386500 }, { "epoch": 1.0, "learning_rate": 0.00014971654902652023, "loss": 0.0286, "step": 386510 }, { "epoch": 1.0, "learning_rate": 0.00014971266081014874, "loss": 0.0329, "step": 386520 }, { "epoch": 1.0, "learning_rate": 0.00014970877259377728, "loss": 0.0098, "step": 386530 }, { "epoch": 1.0, "learning_rate": 0.00014970488437740582, "loss": 0.0288, "step": 386540 }, { "epoch": 1.0, "learning_rate": 0.00014970099616103436, "loss": 0.013, "step": 386550 }, { "epoch": 1.0, "learning_rate": 0.00014969710794466288, "loss": 0.0258, "step": 386560 }, { "epoch": 1.0, "learning_rate": 0.00014969321972829142, "loss": 0.0126, "step": 386570 }, { "epoch": 1.0, "learning_rate": 0.00014968933151191996, "loss": 0.0116, "step": 386580 }, { "epoch": 1.0, "learning_rate": 0.0001496854432955485, "loss": 0.012, "step": 386590 }, { "epoch": 1.0, "learning_rate": 0.00014968155507917705, "loss": 0.0145, "step": 386600 }, { "epoch": 1.0, "learning_rate": 0.00014967766686280556, "loss": 0.0123, "step": 386610 }, { "epoch": 1.0, "learning_rate": 0.0001496737786464341, "loss": 0.01, "step": 386620 }, { "epoch": 1.0, "learning_rate": 0.00014966989043006264, "loss": 0.0102, "step": 386630 }, { "epoch": 1.0, "learning_rate": 0.00014966600221369118, "loss": 0.0129, "step": 386640 }, { "epoch": 1.0, "learning_rate": 0.0001496621139973197, "loss": 0.0136, "step": 386650 }, { "epoch": 1.0, "learning_rate": 0.00014965822578094824, "loss": 0.01, "step": 386660 }, { "epoch": 1.0, "learning_rate": 0.00014965433756457678, "loss": 0.0135, "step": 386670 }, { "epoch": 1.0, "learning_rate": 0.00014965044934820532, "loss": 0.012, "step": 386680 }, { "epoch": 1.0, "learning_rate": 0.00014964656113183384, "loss": 0.0095, "step": 386690 }, { "epoch": 1.0, "learning_rate": 0.00014964267291546238, "loss": 0.0127, "step": 386700 }, { "epoch": 1.0, "learning_rate": 0.00014963878469909092, "loss": 0.012, "step": 386710 }, { "epoch": 1.0, "learning_rate": 0.00014963489648271946, "loss": 0.0108, "step": 386720 }, { "epoch": 1.0, "learning_rate": 0.00014963100826634798, "loss": 0.01, "step": 386730 }, { "epoch": 1.0, "learning_rate": 0.00014962712004997655, "loss": 0.0122, "step": 386740 }, { "epoch": 1.0, "learning_rate": 0.00014962323183360506, "loss": 0.0106, "step": 386750 }, { "epoch": 1.0, "learning_rate": 0.0001496193436172336, "loss": 0.0119, "step": 386760 }, { "epoch": 1.0, "learning_rate": 0.00014961545540086214, "loss": 0.0141, "step": 386770 }, { "epoch": 1.0, "learning_rate": 0.0001496115671844907, "loss": 0.0131, "step": 386780 }, { "epoch": 1.0, "learning_rate": 0.0001496076789681192, "loss": 0.0109, "step": 386790 }, { "epoch": 1.0, "learning_rate": 0.00014960379075174774, "loss": 0.0148, "step": 386800 }, { "epoch": 1.0, "learning_rate": 0.00014959990253537628, "loss": 0.0126, "step": 386810 }, { "epoch": 1.0, "learning_rate": 0.0001495960143190048, "loss": 0.0102, "step": 386820 }, { "epoch": 1.0, "learning_rate": 0.00014959212610263334, "loss": 0.0091, "step": 386830 }, { "epoch": 1.0, "learning_rate": 0.00014958823788626188, "loss": 0.0117, "step": 386840 }, { "epoch": 1.0, "learning_rate": 0.00014958434966989042, "loss": 0.0137, "step": 386850 }, { "epoch": 1.0, "learning_rate": 0.00014958046145351894, "loss": 0.0133, "step": 386860 }, { "epoch": 1.0, "learning_rate": 0.00014957657323714748, "loss": 0.01, "step": 386870 }, { "epoch": 1.0, "learning_rate": 0.00014957268502077602, "loss": 0.0159, "step": 386880 }, { "epoch": 1.0, "learning_rate": 0.00014956879680440456, "loss": 0.0113, "step": 386890 }, { "epoch": 1.0, "learning_rate": 0.00014956490858803308, "loss": 0.0119, "step": 386900 }, { "epoch": 1.0, "learning_rate": 0.00014956102037166162, "loss": 0.0114, "step": 386910 }, { "epoch": 1.0, "learning_rate": 0.00014955713215529016, "loss": 0.0117, "step": 386920 }, { "epoch": 1.0, "learning_rate": 0.0001495532439389187, "loss": 0.0106, "step": 386930 }, { "epoch": 1.0, "learning_rate": 0.00014954935572254724, "loss": 0.0142, "step": 386940 }, { "epoch": 1.0, "learning_rate": 0.00014954546750617579, "loss": 0.0123, "step": 386950 }, { "epoch": 1.0, "learning_rate": 0.0001495415792898043, "loss": 0.0103, "step": 386960 }, { "epoch": 1.0, "learning_rate": 0.00014953769107343284, "loss": 0.0124, "step": 386970 }, { "epoch": 1.0, "learning_rate": 0.00014953380285706138, "loss": 0.0139, "step": 386980 }, { "epoch": 1.0, "learning_rate": 0.00014952991464068993, "loss": 0.0107, "step": 386990 }, { "epoch": 1.0, "learning_rate": 0.00014952602642431844, "loss": 0.0135, "step": 387000 }, { "epoch": 1.0, "eval_cer": 0.8817306790618513, "eval_loss": 0.014083863236010075, "eval_runtime": 108.3195, "eval_samples_per_second": 18.464, "eval_steps_per_second": 4.616, "step": 387000 }, { "epoch": 1.0, "learning_rate": 0.00014952213820794698, "loss": 0.013, "step": 387010 }, { "epoch": 1.0, "learning_rate": 0.00014951824999157552, "loss": 0.0124, "step": 387020 }, { "epoch": 1.0, "learning_rate": 0.00014951436177520406, "loss": 0.0104, "step": 387030 }, { "epoch": 1.0, "learning_rate": 0.00014951047355883258, "loss": 0.0103, "step": 387040 }, { "epoch": 1.0, "learning_rate": 0.00014950658534246112, "loss": 0.0104, "step": 387050 }, { "epoch": 1.0, "learning_rate": 0.00014950269712608966, "loss": 0.0115, "step": 387060 }, { "epoch": 1.0, "learning_rate": 0.00014949880890971818, "loss": 0.0115, "step": 387070 }, { "epoch": 1.0, "learning_rate": 0.00014949492069334672, "loss": 0.015, "step": 387080 }, { "epoch": 1.0, "learning_rate": 0.00014949103247697526, "loss": 0.0103, "step": 387090 }, { "epoch": 1.0, "learning_rate": 0.0001494871442606038, "loss": 0.0179, "step": 387100 }, { "epoch": 1.0, "learning_rate": 0.00014948325604423232, "loss": 0.0102, "step": 387110 }, { "epoch": 1.0, "learning_rate": 0.00014947936782786089, "loss": 0.0106, "step": 387120 }, { "epoch": 1.0, "learning_rate": 0.0001494754796114894, "loss": 0.0114, "step": 387130 }, { "epoch": 1.0, "learning_rate": 0.00014947159139511794, "loss": 0.0096, "step": 387140 }, { "epoch": 1.0, "learning_rate": 0.00014946770317874648, "loss": 0.0101, "step": 387150 }, { "epoch": 1.0, "learning_rate": 0.00014946381496237502, "loss": 0.0119, "step": 387160 }, { "epoch": 1.0, "learning_rate": 0.00014945992674600354, "loss": 0.0115, "step": 387170 }, { "epoch": 1.0, "learning_rate": 0.00014945603852963208, "loss": 0.0091, "step": 387180 }, { "epoch": 1.0, "learning_rate": 0.00014945215031326062, "loss": 0.0087, "step": 387190 }, { "epoch": 1.0, "learning_rate": 0.00014944826209688916, "loss": 0.0128, "step": 387200 }, { "epoch": 1.0, "learning_rate": 0.00014944437388051768, "loss": 0.0106, "step": 387210 }, { "epoch": 1.0, "learning_rate": 0.00014944048566414622, "loss": 0.0131, "step": 387220 }, { "epoch": 1.0, "learning_rate": 0.00014943659744777476, "loss": 0.0108, "step": 387230 }, { "epoch": 1.0, "learning_rate": 0.0001494327092314033, "loss": 0.012, "step": 387240 }, { "epoch": 1.0, "learning_rate": 0.00014942882101503182, "loss": 0.0115, "step": 387250 }, { "epoch": 1.0, "learning_rate": 0.0001494249327986604, "loss": 0.011, "step": 387260 }, { "epoch": 1.0, "learning_rate": 0.0001494210445822889, "loss": 0.0116, "step": 387270 }, { "epoch": 1.0, "learning_rate": 0.00014941715636591744, "loss": 0.0101, "step": 387280 }, { "epoch": 1.0, "learning_rate": 0.00014941326814954598, "loss": 0.014, "step": 387290 }, { "epoch": 1.0, "learning_rate": 0.0001494093799331745, "loss": 0.0124, "step": 387300 }, { "epoch": 1.0, "learning_rate": 0.00014940549171680304, "loss": 0.009, "step": 387310 }, { "epoch": 1.0, "learning_rate": 0.00014940160350043158, "loss": 0.0124, "step": 387320 }, { "epoch": 1.0, "learning_rate": 0.00014939771528406012, "loss": 0.0157, "step": 387330 }, { "epoch": 1.0, "learning_rate": 0.00014939382706768864, "loss": 0.0123, "step": 387340 }, { "epoch": 1.0, "learning_rate": 0.00014938993885131718, "loss": 0.0132, "step": 387350 }, { "epoch": 1.0, "learning_rate": 0.00014938605063494572, "loss": 0.0107, "step": 387360 }, { "epoch": 1.0, "learning_rate": 0.00014938216241857426, "loss": 0.0137, "step": 387370 }, { "epoch": 1.0, "learning_rate": 0.00014937827420220278, "loss": 0.011, "step": 387380 }, { "epoch": 1.0, "learning_rate": 0.00014937438598583132, "loss": 0.0107, "step": 387390 }, { "epoch": 1.0, "learning_rate": 0.00014937049776945986, "loss": 0.0099, "step": 387400 }, { "epoch": 1.0, "learning_rate": 0.0001493666095530884, "loss": 0.0099, "step": 387410 }, { "epoch": 1.0, "learning_rate": 0.00014936272133671692, "loss": 0.0086, "step": 387420 }, { "epoch": 1.0, "learning_rate": 0.00014935883312034546, "loss": 0.0257, "step": 387430 }, { "epoch": 1.0, "learning_rate": 0.000149354944903974, "loss": 0.0138, "step": 387440 }, { "epoch": 1.0, "learning_rate": 0.00014935105668760254, "loss": 0.0133, "step": 387450 }, { "epoch": 1.0, "learning_rate": 0.00014934716847123108, "loss": 0.0129, "step": 387460 }, { "epoch": 1.0, "learning_rate": 0.00014934328025485963, "loss": 0.0101, "step": 387470 }, { "epoch": 1.0, "learning_rate": 0.00014933939203848814, "loss": 0.0114, "step": 387480 }, { "epoch": 1.0, "learning_rate": 0.00014933550382211668, "loss": 0.0112, "step": 387490 }, { "epoch": 1.0, "learning_rate": 0.00014933161560574522, "loss": 0.0142, "step": 387500 }, { "epoch": 1.0, "learning_rate": 0.00014932772738937377, "loss": 0.0098, "step": 387510 }, { "epoch": 1.0, "learning_rate": 0.00014932383917300228, "loss": 0.0132, "step": 387520 }, { "epoch": 1.0, "learning_rate": 0.00014931995095663082, "loss": 0.0101, "step": 387530 }, { "epoch": 1.0, "learning_rate": 0.00014931606274025936, "loss": 0.0148, "step": 387540 }, { "epoch": 1.0, "learning_rate": 0.00014931217452388788, "loss": 0.0112, "step": 387550 }, { "epoch": 1.0, "learning_rate": 0.00014930828630751642, "loss": 0.0127, "step": 387560 }, { "epoch": 1.0, "learning_rate": 0.00014930439809114496, "loss": 0.0124, "step": 387570 }, { "epoch": 1.0, "learning_rate": 0.0001493005098747735, "loss": 0.0127, "step": 387580 }, { "epoch": 1.0, "learning_rate": 0.00014929662165840202, "loss": 0.0103, "step": 387590 }, { "epoch": 1.0, "learning_rate": 0.00014929273344203056, "loss": 0.0132, "step": 387600 }, { "epoch": 1.0, "learning_rate": 0.0001492888452256591, "loss": 0.0127, "step": 387610 }, { "epoch": 1.0, "learning_rate": 0.00014928495700928764, "loss": 0.0114, "step": 387620 }, { "epoch": 1.0, "learning_rate": 0.00014928106879291616, "loss": 0.011, "step": 387630 }, { "epoch": 1.0, "learning_rate": 0.00014927718057654473, "loss": 0.0114, "step": 387640 }, { "epoch": 1.0, "learning_rate": 0.00014927329236017324, "loss": 0.013, "step": 387650 }, { "epoch": 1.0, "learning_rate": 0.00014926940414380178, "loss": 0.0103, "step": 387660 }, { "epoch": 1.0, "learning_rate": 0.00014926551592743032, "loss": 0.0124, "step": 387670 }, { "epoch": 1.0, "learning_rate": 0.00014926162771105886, "loss": 0.0225, "step": 387680 }, { "epoch": 1.0, "learning_rate": 0.00014925773949468738, "loss": 0.0105, "step": 387690 }, { "epoch": 1.0, "learning_rate": 0.00014925385127831592, "loss": 0.0121, "step": 387700 }, { "epoch": 1.0, "learning_rate": 0.00014924996306194446, "loss": 0.0313, "step": 387710 }, { "epoch": 1.01, "learning_rate": 0.000149246074845573, "loss": 0.0196, "step": 387720 }, { "epoch": 1.01, "learning_rate": 0.00014924218662920152, "loss": 0.0139, "step": 387730 }, { "epoch": 1.01, "learning_rate": 0.00014923829841283006, "loss": 0.0138, "step": 387740 }, { "epoch": 1.01, "learning_rate": 0.0001492344101964586, "loss": 0.0087, "step": 387750 }, { "epoch": 1.01, "learning_rate": 0.00014923052198008714, "loss": 0.0147, "step": 387760 }, { "epoch": 1.01, "learning_rate": 0.00014922663376371566, "loss": 0.0103, "step": 387770 }, { "epoch": 1.01, "learning_rate": 0.00014922274554734423, "loss": 0.0121, "step": 387780 }, { "epoch": 1.01, "learning_rate": 0.00014921885733097274, "loss": 0.01, "step": 387790 }, { "epoch": 1.01, "learning_rate": 0.00014921496911460126, "loss": 0.01, "step": 387800 }, { "epoch": 1.01, "learning_rate": 0.00014921108089822982, "loss": 0.0122, "step": 387810 }, { "epoch": 1.01, "learning_rate": 0.00014920719268185834, "loss": 0.0101, "step": 387820 }, { "epoch": 1.01, "learning_rate": 0.00014920330446548688, "loss": 0.0162, "step": 387830 }, { "epoch": 1.01, "learning_rate": 0.00014919941624911542, "loss": 0.011, "step": 387840 }, { "epoch": 1.01, "learning_rate": 0.00014919552803274396, "loss": 0.0137, "step": 387850 }, { "epoch": 1.01, "learning_rate": 0.00014919163981637248, "loss": 0.0105, "step": 387860 }, { "epoch": 1.01, "learning_rate": 0.00014918775160000102, "loss": 0.0105, "step": 387870 }, { "epoch": 1.01, "learning_rate": 0.00014918386338362956, "loss": 0.0127, "step": 387880 }, { "epoch": 1.01, "learning_rate": 0.0001491799751672581, "loss": 0.0102, "step": 387890 }, { "epoch": 1.01, "learning_rate": 0.00014917608695088662, "loss": 0.0103, "step": 387900 }, { "epoch": 1.01, "learning_rate": 0.00014917219873451516, "loss": 0.009, "step": 387910 }, { "epoch": 1.01, "learning_rate": 0.0001491683105181437, "loss": 0.0108, "step": 387920 }, { "epoch": 1.01, "learning_rate": 0.00014916442230177224, "loss": 0.0123, "step": 387930 }, { "epoch": 1.01, "learning_rate": 0.00014916053408540076, "loss": 0.0152, "step": 387940 }, { "epoch": 1.01, "learning_rate": 0.0001491566458690293, "loss": 0.0122, "step": 387950 }, { "epoch": 1.01, "learning_rate": 0.00014915275765265784, "loss": 0.0121, "step": 387960 }, { "epoch": 1.01, "learning_rate": 0.00014914886943628638, "loss": 0.0137, "step": 387970 }, { "epoch": 1.01, "learning_rate": 0.00014914498121991492, "loss": 0.0114, "step": 387980 }, { "epoch": 1.01, "learning_rate": 0.00014914109300354347, "loss": 0.0109, "step": 387990 }, { "epoch": 1.01, "learning_rate": 0.00014913720478717198, "loss": 0.0137, "step": 388000 }, { "epoch": 1.01, "eval_cer": 0.8817124837817071, "eval_loss": 0.007554326672106981, "eval_runtime": 108.2118, "eval_samples_per_second": 18.482, "eval_steps_per_second": 4.621, "step": 388000 }, { "epoch": 1.01, "learning_rate": 0.00014913331657080052, "loss": 0.0097, "step": 388010 }, { "epoch": 1.01, "learning_rate": 0.00014912942835442906, "loss": 0.0101, "step": 388020 }, { "epoch": 1.01, "learning_rate": 0.0001491255401380576, "loss": 0.0137, "step": 388030 }, { "epoch": 1.01, "learning_rate": 0.00014912165192168612, "loss": 0.0115, "step": 388040 }, { "epoch": 1.01, "learning_rate": 0.00014911776370531466, "loss": 0.011, "step": 388050 }, { "epoch": 1.01, "learning_rate": 0.0001491138754889432, "loss": 0.0092, "step": 388060 }, { "epoch": 1.01, "learning_rate": 0.00014910998727257172, "loss": 0.012, "step": 388070 }, { "epoch": 1.01, "learning_rate": 0.00014910609905620026, "loss": 0.0107, "step": 388080 }, { "epoch": 1.01, "learning_rate": 0.0001491022108398288, "loss": 0.0106, "step": 388090 }, { "epoch": 1.01, "learning_rate": 0.00014909832262345734, "loss": 0.0107, "step": 388100 }, { "epoch": 1.01, "learning_rate": 0.00014909443440708586, "loss": 0.0155, "step": 388110 }, { "epoch": 1.01, "learning_rate": 0.0001490905461907144, "loss": 0.0098, "step": 388120 }, { "epoch": 1.01, "learning_rate": 0.00014908665797434294, "loss": 0.0119, "step": 388130 }, { "epoch": 1.01, "learning_rate": 0.00014908276975797148, "loss": 0.0136, "step": 388140 }, { "epoch": 1.01, "learning_rate": 0.0001490788815416, "loss": 0.0097, "step": 388150 }, { "epoch": 1.01, "learning_rate": 0.00014907499332522857, "loss": 0.0116, "step": 388160 }, { "epoch": 1.01, "learning_rate": 0.00014907110510885708, "loss": 0.014, "step": 388170 }, { "epoch": 1.01, "learning_rate": 0.00014906721689248562, "loss": 0.0131, "step": 388180 }, { "epoch": 1.01, "learning_rate": 0.00014906332867611416, "loss": 0.0127, "step": 388190 }, { "epoch": 1.01, "learning_rate": 0.0001490594404597427, "loss": 0.0127, "step": 388200 }, { "epoch": 1.01, "learning_rate": 0.00014905555224337122, "loss": 0.0119, "step": 388210 }, { "epoch": 1.01, "learning_rate": 0.00014905166402699976, "loss": 0.0108, "step": 388220 }, { "epoch": 1.01, "learning_rate": 0.0001490477758106283, "loss": 0.0102, "step": 388230 }, { "epoch": 1.01, "learning_rate": 0.00014904388759425684, "loss": 0.0095, "step": 388240 }, { "epoch": 1.01, "learning_rate": 0.00014903999937788536, "loss": 0.0106, "step": 388250 }, { "epoch": 1.01, "learning_rate": 0.0001490361111615139, "loss": 0.0107, "step": 388260 }, { "epoch": 1.01, "learning_rate": 0.00014903222294514244, "loss": 0.0113, "step": 388270 }, { "epoch": 1.01, "learning_rate": 0.00014902833472877098, "loss": 0.0101, "step": 388280 }, { "epoch": 1.01, "learning_rate": 0.0001490244465123995, "loss": 0.0142, "step": 388290 }, { "epoch": 1.01, "learning_rate": 0.00014902055829602804, "loss": 0.0094, "step": 388300 }, { "epoch": 1.01, "learning_rate": 0.00014901667007965658, "loss": 0.0149, "step": 388310 }, { "epoch": 1.01, "learning_rate": 0.0001490127818632851, "loss": 0.0128, "step": 388320 }, { "epoch": 1.01, "learning_rate": 0.00014900889364691366, "loss": 0.0113, "step": 388330 }, { "epoch": 1.01, "learning_rate": 0.00014900500543054218, "loss": 0.0132, "step": 388340 }, { "epoch": 1.01, "learning_rate": 0.00014900111721417072, "loss": 0.0152, "step": 388350 }, { "epoch": 1.01, "learning_rate": 0.00014899722899779926, "loss": 0.0104, "step": 388360 }, { "epoch": 1.01, "learning_rate": 0.0001489933407814278, "loss": 0.0152, "step": 388370 }, { "epoch": 1.01, "learning_rate": 0.00014898945256505632, "loss": 0.0119, "step": 388380 }, { "epoch": 1.01, "learning_rate": 0.00014898556434868486, "loss": 0.009, "step": 388390 }, { "epoch": 1.01, "learning_rate": 0.0001489816761323134, "loss": 0.0109, "step": 388400 }, { "epoch": 1.01, "learning_rate": 0.00014897778791594194, "loss": 0.0134, "step": 388410 }, { "epoch": 1.01, "learning_rate": 0.00014897389969957046, "loss": 0.0115, "step": 388420 }, { "epoch": 1.01, "learning_rate": 0.000148970011483199, "loss": 0.0106, "step": 388430 }, { "epoch": 1.01, "learning_rate": 0.00014896612326682754, "loss": 0.0144, "step": 388440 }, { "epoch": 1.01, "learning_rate": 0.00014896223505045608, "loss": 0.0134, "step": 388450 }, { "epoch": 1.01, "learning_rate": 0.0001489583468340846, "loss": 0.0132, "step": 388460 }, { "epoch": 1.01, "learning_rate": 0.00014895445861771314, "loss": 0.014, "step": 388470 }, { "epoch": 1.01, "learning_rate": 0.00014895057040134168, "loss": 0.0119, "step": 388480 }, { "epoch": 1.01, "learning_rate": 0.00014894668218497022, "loss": 0.0128, "step": 388490 }, { "epoch": 1.01, "learning_rate": 0.00014894279396859874, "loss": 0.0178, "step": 388500 }, { "epoch": 1.01, "learning_rate": 0.0001489389057522273, "loss": 0.0116, "step": 388510 }, { "epoch": 1.01, "learning_rate": 0.00014893501753585582, "loss": 0.01, "step": 388520 }, { "epoch": 1.01, "learning_rate": 0.00014893112931948436, "loss": 0.0124, "step": 388530 }, { "epoch": 1.01, "learning_rate": 0.0001489272411031129, "loss": 0.0109, "step": 388540 }, { "epoch": 1.01, "learning_rate": 0.00014892335288674142, "loss": 0.0137, "step": 388550 }, { "epoch": 1.01, "learning_rate": 0.00014891946467036996, "loss": 0.0104, "step": 388560 }, { "epoch": 1.01, "learning_rate": 0.0001489155764539985, "loss": 0.0116, "step": 388570 }, { "epoch": 1.01, "learning_rate": 0.00014891168823762704, "loss": 0.015, "step": 388580 }, { "epoch": 1.01, "learning_rate": 0.00014890780002125556, "loss": 0.0117, "step": 388590 }, { "epoch": 1.01, "learning_rate": 0.0001489039118048841, "loss": 0.0105, "step": 388600 }, { "epoch": 1.01, "learning_rate": 0.00014890002358851264, "loss": 0.0126, "step": 388610 }, { "epoch": 1.01, "learning_rate": 0.00014889613537214118, "loss": 0.013, "step": 388620 }, { "epoch": 1.01, "learning_rate": 0.0001488922471557697, "loss": 0.0116, "step": 388630 }, { "epoch": 1.01, "learning_rate": 0.00014888835893939824, "loss": 0.0127, "step": 388640 }, { "epoch": 1.01, "learning_rate": 0.00014888447072302678, "loss": 0.0129, "step": 388650 }, { "epoch": 1.01, "learning_rate": 0.00014888058250665532, "loss": 0.0146, "step": 388660 }, { "epoch": 1.01, "learning_rate": 0.00014887669429028384, "loss": 0.009, "step": 388670 }, { "epoch": 1.01, "learning_rate": 0.0001488728060739124, "loss": 0.0081, "step": 388680 }, { "epoch": 1.01, "learning_rate": 0.00014886891785754092, "loss": 0.0132, "step": 388690 }, { "epoch": 1.01, "learning_rate": 0.00014886502964116946, "loss": 0.0134, "step": 388700 }, { "epoch": 1.01, "learning_rate": 0.000148861141424798, "loss": 0.0104, "step": 388710 }, { "epoch": 1.01, "learning_rate": 0.00014885725320842654, "loss": 0.0098, "step": 388720 }, { "epoch": 1.01, "learning_rate": 0.00014885336499205506, "loss": 0.0113, "step": 388730 }, { "epoch": 1.01, "learning_rate": 0.0001488494767756836, "loss": 0.0135, "step": 388740 }, { "epoch": 1.01, "learning_rate": 0.00014884558855931214, "loss": 0.0136, "step": 388750 }, { "epoch": 1.01, "learning_rate": 0.00014884170034294068, "loss": 0.0081, "step": 388760 }, { "epoch": 1.01, "learning_rate": 0.0001488378121265692, "loss": 0.0119, "step": 388770 }, { "epoch": 1.01, "learning_rate": 0.00014883392391019774, "loss": 0.0111, "step": 388780 }, { "epoch": 1.01, "learning_rate": 0.00014883003569382628, "loss": 0.0094, "step": 388790 }, { "epoch": 1.01, "learning_rate": 0.0001488261474774548, "loss": 0.0135, "step": 388800 }, { "epoch": 1.01, "learning_rate": 0.00014882225926108334, "loss": 0.0102, "step": 388810 }, { "epoch": 1.01, "learning_rate": 0.00014881837104471188, "loss": 0.0171, "step": 388820 }, { "epoch": 1.01, "learning_rate": 0.00014881448282834042, "loss": 0.012, "step": 388830 }, { "epoch": 1.01, "learning_rate": 0.00014881059461196894, "loss": 0.0164, "step": 388840 }, { "epoch": 1.01, "learning_rate": 0.0001488067063955975, "loss": 0.0118, "step": 388850 }, { "epoch": 1.01, "learning_rate": 0.00014880281817922602, "loss": 0.0116, "step": 388860 }, { "epoch": 1.01, "learning_rate": 0.00014879892996285456, "loss": 0.0102, "step": 388870 }, { "epoch": 1.01, "learning_rate": 0.0001487950417464831, "loss": 0.013, "step": 388880 }, { "epoch": 1.01, "learning_rate": 0.00014879115353011164, "loss": 0.0085, "step": 388890 }, { "epoch": 1.01, "learning_rate": 0.00014878726531374016, "loss": 0.0115, "step": 388900 }, { "epoch": 1.01, "learning_rate": 0.0001487833770973687, "loss": 0.011, "step": 388910 }, { "epoch": 1.01, "learning_rate": 0.00014877948888099724, "loss": 0.011, "step": 388920 }, { "epoch": 1.01, "learning_rate": 0.00014877560066462578, "loss": 0.0099, "step": 388930 }, { "epoch": 1.01, "learning_rate": 0.0001487717124482543, "loss": 0.0103, "step": 388940 }, { "epoch": 1.01, "learning_rate": 0.00014876782423188284, "loss": 0.012, "step": 388950 }, { "epoch": 1.01, "learning_rate": 0.00014876393601551138, "loss": 0.0124, "step": 388960 }, { "epoch": 1.01, "learning_rate": 0.00014876004779913992, "loss": 0.0081, "step": 388970 }, { "epoch": 1.01, "learning_rate": 0.00014875615958276844, "loss": 0.0137, "step": 388980 }, { "epoch": 1.01, "learning_rate": 0.00014875227136639698, "loss": 0.0123, "step": 388990 }, { "epoch": 1.01, "learning_rate": 0.00014874838315002552, "loss": 0.0107, "step": 389000 }, { "epoch": 1.01, "eval_cer": 0.881704085960102, "eval_loss": 0.007840441539883614, "eval_runtime": 107.9934, "eval_samples_per_second": 18.52, "eval_steps_per_second": 4.63, "step": 389000 }, { "epoch": 1.01, "learning_rate": 0.00014874449493365406, "loss": 0.0104, "step": 389010 }, { "epoch": 1.01, "learning_rate": 0.00014874060671728258, "loss": 0.0126, "step": 389020 }, { "epoch": 1.01, "learning_rate": 0.00014873671850091115, "loss": 0.0098, "step": 389030 }, { "epoch": 1.01, "learning_rate": 0.00014873283028453966, "loss": 0.0095, "step": 389040 }, { "epoch": 1.01, "learning_rate": 0.0001487289420681682, "loss": 0.0121, "step": 389050 }, { "epoch": 1.01, "learning_rate": 0.00014872505385179674, "loss": 0.0113, "step": 389060 }, { "epoch": 1.01, "learning_rate": 0.00014872116563542526, "loss": 0.0087, "step": 389070 }, { "epoch": 1.01, "learning_rate": 0.0001487172774190538, "loss": 0.0094, "step": 389080 }, { "epoch": 1.01, "learning_rate": 0.00014871338920268234, "loss": 0.0111, "step": 389090 }, { "epoch": 1.01, "learning_rate": 0.00014870950098631088, "loss": 0.0113, "step": 389100 }, { "epoch": 1.01, "learning_rate": 0.0001487056127699394, "loss": 0.0121, "step": 389110 }, { "epoch": 1.01, "learning_rate": 0.00014870172455356794, "loss": 0.0146, "step": 389120 }, { "epoch": 1.01, "learning_rate": 0.00014869783633719648, "loss": 0.0106, "step": 389130 }, { "epoch": 1.01, "learning_rate": 0.00014869394812082502, "loss": 0.0091, "step": 389140 }, { "epoch": 1.01, "learning_rate": 0.00014869005990445354, "loss": 0.011, "step": 389150 }, { "epoch": 1.01, "learning_rate": 0.00014868617168808208, "loss": 0.0174, "step": 389160 }, { "epoch": 1.01, "learning_rate": 0.00014868228347171062, "loss": 0.0187, "step": 389170 }, { "epoch": 1.01, "learning_rate": 0.00014867839525533916, "loss": 0.0113, "step": 389180 }, { "epoch": 1.01, "learning_rate": 0.00014867450703896768, "loss": 0.0106, "step": 389190 }, { "epoch": 1.01, "learning_rate": 0.00014867061882259625, "loss": 0.0121, "step": 389200 }, { "epoch": 1.01, "learning_rate": 0.00014866673060622476, "loss": 0.011, "step": 389210 }, { "epoch": 1.01, "learning_rate": 0.0001486628423898533, "loss": 0.0111, "step": 389220 }, { "epoch": 1.01, "learning_rate": 0.00014865895417348184, "loss": 0.01, "step": 389230 }, { "epoch": 1.01, "learning_rate": 0.00014865506595711038, "loss": 0.0126, "step": 389240 }, { "epoch": 1.01, "learning_rate": 0.0001486511777407389, "loss": 0.0152, "step": 389250 }, { "epoch": 1.01, "learning_rate": 0.00014864728952436744, "loss": 0.0134, "step": 389260 }, { "epoch": 1.01, "learning_rate": 0.00014864340130799598, "loss": 0.0141, "step": 389270 }, { "epoch": 1.01, "learning_rate": 0.0001486395130916245, "loss": 0.0128, "step": 389280 }, { "epoch": 1.01, "learning_rate": 0.00014863562487525304, "loss": 0.0124, "step": 389290 }, { "epoch": 1.01, "learning_rate": 0.00014863173665888158, "loss": 0.0092, "step": 389300 }, { "epoch": 1.01, "learning_rate": 0.00014862784844251012, "loss": 0.0097, "step": 389310 }, { "epoch": 1.01, "learning_rate": 0.00014862396022613864, "loss": 0.0109, "step": 389320 }, { "epoch": 1.01, "learning_rate": 0.00014862007200976718, "loss": 0.0117, "step": 389330 }, { "epoch": 1.01, "learning_rate": 0.00014861618379339572, "loss": 0.0109, "step": 389340 }, { "epoch": 1.01, "learning_rate": 0.00014861229557702426, "loss": 0.0118, "step": 389350 }, { "epoch": 1.01, "learning_rate": 0.00014860840736065278, "loss": 0.0107, "step": 389360 }, { "epoch": 1.01, "learning_rate": 0.00014860451914428134, "loss": 0.0113, "step": 389370 }, { "epoch": 1.01, "learning_rate": 0.00014860063092790986, "loss": 0.0111, "step": 389380 }, { "epoch": 1.01, "learning_rate": 0.0001485967427115384, "loss": 0.0149, "step": 389390 }, { "epoch": 1.01, "learning_rate": 0.00014859285449516694, "loss": 0.0123, "step": 389400 }, { "epoch": 1.01, "learning_rate": 0.00014858896627879548, "loss": 0.0097, "step": 389410 }, { "epoch": 1.01, "learning_rate": 0.000148585078062424, "loss": 0.0129, "step": 389420 }, { "epoch": 1.01, "learning_rate": 0.00014858118984605254, "loss": 0.0109, "step": 389430 }, { "epoch": 1.01, "learning_rate": 0.00014857730162968108, "loss": 0.0096, "step": 389440 }, { "epoch": 1.01, "learning_rate": 0.00014857341341330962, "loss": 0.0105, "step": 389450 }, { "epoch": 1.01, "learning_rate": 0.00014856952519693814, "loss": 0.0145, "step": 389460 }, { "epoch": 1.01, "learning_rate": 0.00014856563698056668, "loss": 0.0097, "step": 389470 }, { "epoch": 1.01, "learning_rate": 0.00014856174876419522, "loss": 0.0118, "step": 389480 }, { "epoch": 1.01, "learning_rate": 0.00014855786054782376, "loss": 0.0118, "step": 389490 }, { "epoch": 1.01, "learning_rate": 0.00014855397233145228, "loss": 0.0103, "step": 389500 }, { "epoch": 1.01, "learning_rate": 0.00014855008411508082, "loss": 0.0093, "step": 389510 }, { "epoch": 1.01, "learning_rate": 0.00014854619589870936, "loss": 0.0096, "step": 389520 }, { "epoch": 1.01, "learning_rate": 0.00014854230768233788, "loss": 0.009, "step": 389530 }, { "epoch": 1.01, "learning_rate": 0.00014853841946596642, "loss": 0.0148, "step": 389540 }, { "epoch": 1.01, "learning_rate": 0.00014853453124959496, "loss": 0.0245, "step": 389550 }, { "epoch": 1.01, "learning_rate": 0.0001485306430332235, "loss": 0.0094, "step": 389560 }, { "epoch": 1.01, "learning_rate": 0.00014852675481685204, "loss": 0.0091, "step": 389570 }, { "epoch": 1.01, "learning_rate": 0.00014852286660048058, "loss": 0.014, "step": 389580 }, { "epoch": 1.01, "learning_rate": 0.0001485189783841091, "loss": 0.0085, "step": 389590 }, { "epoch": 1.01, "learning_rate": 0.00014851509016773764, "loss": 0.0123, "step": 389600 }, { "epoch": 1.01, "learning_rate": 0.00014851120195136618, "loss": 0.011, "step": 389610 }, { "epoch": 1.01, "learning_rate": 0.00014850731373499472, "loss": 0.0122, "step": 389620 }, { "epoch": 1.01, "learning_rate": 0.00014850342551862324, "loss": 0.0122, "step": 389630 }, { "epoch": 1.01, "learning_rate": 0.00014849953730225178, "loss": 0.0093, "step": 389640 }, { "epoch": 1.01, "learning_rate": 0.00014849564908588032, "loss": 0.0111, "step": 389650 }, { "epoch": 1.01, "learning_rate": 0.00014849176086950886, "loss": 0.0107, "step": 389660 }, { "epoch": 1.01, "learning_rate": 0.00014848787265313738, "loss": 0.0123, "step": 389670 }, { "epoch": 1.01, "learning_rate": 0.00014848398443676592, "loss": 0.0135, "step": 389680 }, { "epoch": 1.01, "learning_rate": 0.00014848009622039446, "loss": 0.013, "step": 389690 }, { "epoch": 1.01, "learning_rate": 0.000148476208004023, "loss": 0.0095, "step": 389700 }, { "epoch": 1.01, "learning_rate": 0.00014847231978765152, "loss": 0.0109, "step": 389710 }, { "epoch": 1.01, "learning_rate": 0.00014846843157128008, "loss": 0.0103, "step": 389720 }, { "epoch": 1.01, "learning_rate": 0.0001484645433549086, "loss": 0.0114, "step": 389730 }, { "epoch": 1.01, "learning_rate": 0.00014846065513853714, "loss": 0.0145, "step": 389740 }, { "epoch": 1.01, "learning_rate": 0.00014845676692216568, "loss": 0.01, "step": 389750 }, { "epoch": 1.01, "learning_rate": 0.00014845287870579422, "loss": 0.0105, "step": 389760 }, { "epoch": 1.01, "learning_rate": 0.00014844899048942274, "loss": 0.0113, "step": 389770 }, { "epoch": 1.01, "learning_rate": 0.00014844510227305128, "loss": 0.0142, "step": 389780 }, { "epoch": 1.01, "learning_rate": 0.00014844121405667982, "loss": 0.0134, "step": 389790 }, { "epoch": 1.01, "learning_rate": 0.00014843732584030834, "loss": 0.0134, "step": 389800 }, { "epoch": 1.01, "learning_rate": 0.00014843343762393688, "loss": 0.0116, "step": 389810 }, { "epoch": 1.01, "learning_rate": 0.00014842954940756542, "loss": 0.0123, "step": 389820 }, { "epoch": 1.01, "learning_rate": 0.00014842566119119396, "loss": 0.0091, "step": 389830 }, { "epoch": 1.01, "learning_rate": 0.00014842177297482248, "loss": 0.0104, "step": 389840 }, { "epoch": 1.01, "learning_rate": 0.00014841788475845102, "loss": 0.0129, "step": 389850 }, { "epoch": 1.01, "learning_rate": 0.00014841399654207956, "loss": 0.0098, "step": 389860 }, { "epoch": 1.01, "learning_rate": 0.0001484101083257081, "loss": 0.0104, "step": 389870 }, { "epoch": 1.01, "learning_rate": 0.00014840622010933662, "loss": 0.0115, "step": 389880 }, { "epoch": 1.01, "learning_rate": 0.00014840233189296516, "loss": 0.0106, "step": 389890 }, { "epoch": 1.01, "learning_rate": 0.0001483984436765937, "loss": 0.0156, "step": 389900 }, { "epoch": 1.01, "learning_rate": 0.00014839455546022224, "loss": 0.0115, "step": 389910 }, { "epoch": 1.01, "learning_rate": 0.00014839066724385078, "loss": 0.0123, "step": 389920 }, { "epoch": 1.01, "learning_rate": 0.00014838677902747932, "loss": 0.0114, "step": 389930 }, { "epoch": 1.01, "learning_rate": 0.00014838289081110784, "loss": 0.0116, "step": 389940 }, { "epoch": 1.01, "learning_rate": 0.00014837900259473638, "loss": 0.0085, "step": 389950 }, { "epoch": 1.01, "learning_rate": 0.00014837511437836492, "loss": 0.0116, "step": 389960 }, { "epoch": 1.01, "learning_rate": 0.00014837122616199346, "loss": 0.0108, "step": 389970 }, { "epoch": 1.01, "learning_rate": 0.00014836733794562198, "loss": 0.0116, "step": 389980 }, { "epoch": 1.01, "learning_rate": 0.00014836344972925052, "loss": 0.0161, "step": 389990 }, { "epoch": 1.01, "learning_rate": 0.00014835956151287906, "loss": 0.0119, "step": 390000 }, { "epoch": 1.01, "eval_cer": 0.881719481966378, "eval_loss": 0.007798693608492613, "eval_runtime": 108.0106, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 390000 }, { "epoch": 1.01, "learning_rate": 0.0001483556732965076, "loss": 0.0131, "step": 390010 }, { "epoch": 1.01, "learning_rate": 0.00014835178508013612, "loss": 0.0174, "step": 390020 }, { "epoch": 1.01, "learning_rate": 0.00014834789686376466, "loss": 0.0146, "step": 390030 }, { "epoch": 1.01, "learning_rate": 0.0001483440086473932, "loss": 0.0092, "step": 390040 }, { "epoch": 1.01, "learning_rate": 0.00014834012043102172, "loss": 0.0126, "step": 390050 }, { "epoch": 1.01, "learning_rate": 0.00014833623221465026, "loss": 0.0122, "step": 390060 }, { "epoch": 1.01, "learning_rate": 0.0001483323439982788, "loss": 0.0126, "step": 390070 }, { "epoch": 1.01, "learning_rate": 0.00014832845578190734, "loss": 0.0113, "step": 390080 }, { "epoch": 1.01, "learning_rate": 0.00014832456756553585, "loss": 0.0101, "step": 390090 }, { "epoch": 1.01, "learning_rate": 0.00014832067934916442, "loss": 0.0135, "step": 390100 }, { "epoch": 1.01, "learning_rate": 0.00014831679113279294, "loss": 0.0095, "step": 390110 }, { "epoch": 1.01, "learning_rate": 0.00014831290291642148, "loss": 0.0114, "step": 390120 }, { "epoch": 1.01, "learning_rate": 0.00014830901470005002, "loss": 0.0109, "step": 390130 }, { "epoch": 1.01, "learning_rate": 0.00014830512648367856, "loss": 0.0191, "step": 390140 }, { "epoch": 1.01, "learning_rate": 0.00014830123826730708, "loss": 0.0103, "step": 390150 }, { "epoch": 1.01, "learning_rate": 0.00014829735005093562, "loss": 0.014, "step": 390160 }, { "epoch": 1.01, "learning_rate": 0.00014829346183456416, "loss": 0.0111, "step": 390170 }, { "epoch": 1.01, "learning_rate": 0.0001482895736181927, "loss": 0.0127, "step": 390180 }, { "epoch": 1.01, "learning_rate": 0.00014828568540182122, "loss": 0.013, "step": 390190 }, { "epoch": 1.01, "learning_rate": 0.00014828179718544976, "loss": 0.01, "step": 390200 }, { "epoch": 1.01, "learning_rate": 0.0001482779089690783, "loss": 0.0118, "step": 390210 }, { "epoch": 1.01, "learning_rate": 0.00014827402075270684, "loss": 0.0097, "step": 390220 }, { "epoch": 1.01, "learning_rate": 0.00014827013253633536, "loss": 0.0139, "step": 390230 }, { "epoch": 1.01, "learning_rate": 0.00014826624431996392, "loss": 0.016, "step": 390240 }, { "epoch": 1.01, "learning_rate": 0.00014826235610359244, "loss": 0.0108, "step": 390250 }, { "epoch": 1.01, "learning_rate": 0.00014825846788722098, "loss": 0.0102, "step": 390260 }, { "epoch": 1.01, "learning_rate": 0.00014825457967084952, "loss": 0.0128, "step": 390270 }, { "epoch": 1.01, "learning_rate": 0.00014825069145447804, "loss": 0.0108, "step": 390280 }, { "epoch": 1.01, "learning_rate": 0.00014824680323810658, "loss": 0.0084, "step": 390290 }, { "epoch": 1.01, "learning_rate": 0.00014824291502173512, "loss": 0.0126, "step": 390300 }, { "epoch": 1.01, "learning_rate": 0.00014823902680536366, "loss": 0.013, "step": 390310 }, { "epoch": 1.01, "learning_rate": 0.00014823513858899218, "loss": 0.0167, "step": 390320 }, { "epoch": 1.01, "learning_rate": 0.00014823125037262072, "loss": 0.0093, "step": 390330 }, { "epoch": 1.01, "learning_rate": 0.00014822736215624926, "loss": 0.0114, "step": 390340 }, { "epoch": 1.01, "learning_rate": 0.0001482234739398778, "loss": 0.0099, "step": 390350 }, { "epoch": 1.01, "learning_rate": 0.00014821958572350632, "loss": 0.0126, "step": 390360 }, { "epoch": 1.01, "learning_rate": 0.00014821569750713486, "loss": 0.0093, "step": 390370 }, { "epoch": 1.01, "learning_rate": 0.0001482118092907634, "loss": 0.0137, "step": 390380 }, { "epoch": 1.01, "learning_rate": 0.00014820792107439194, "loss": 0.0093, "step": 390390 }, { "epoch": 1.01, "learning_rate": 0.00014820403285802046, "loss": 0.0138, "step": 390400 }, { "epoch": 1.01, "learning_rate": 0.000148200144641649, "loss": 0.0111, "step": 390410 }, { "epoch": 1.01, "learning_rate": 0.00014819625642527754, "loss": 0.0102, "step": 390420 }, { "epoch": 1.01, "learning_rate": 0.00014819236820890608, "loss": 0.0131, "step": 390430 }, { "epoch": 1.01, "learning_rate": 0.00014818847999253462, "loss": 0.0123, "step": 390440 }, { "epoch": 1.01, "learning_rate": 0.00014818459177616316, "loss": 0.009, "step": 390450 }, { "epoch": 1.01, "learning_rate": 0.00014818070355979168, "loss": 0.0148, "step": 390460 }, { "epoch": 1.01, "learning_rate": 0.00014817681534342022, "loss": 0.0096, "step": 390470 }, { "epoch": 1.01, "learning_rate": 0.00014817292712704876, "loss": 0.0123, "step": 390480 }, { "epoch": 1.01, "learning_rate": 0.0001481690389106773, "loss": 0.0099, "step": 390490 }, { "epoch": 1.01, "learning_rate": 0.00014816515069430582, "loss": 0.0109, "step": 390500 }, { "epoch": 1.01, "learning_rate": 0.00014816126247793436, "loss": 0.0145, "step": 390510 }, { "epoch": 1.01, "learning_rate": 0.0001481573742615629, "loss": 0.0112, "step": 390520 }, { "epoch": 1.01, "learning_rate": 0.00014815348604519142, "loss": 0.0111, "step": 390530 }, { "epoch": 1.01, "learning_rate": 0.00014814959782881996, "loss": 0.0128, "step": 390540 }, { "epoch": 1.01, "learning_rate": 0.0001481457096124485, "loss": 0.0111, "step": 390550 }, { "epoch": 1.01, "learning_rate": 0.00014814182139607704, "loss": 0.0118, "step": 390560 }, { "epoch": 1.01, "learning_rate": 0.00014813793317970555, "loss": 0.0096, "step": 390570 }, { "epoch": 1.01, "learning_rate": 0.0001481340449633341, "loss": 0.0112, "step": 390580 }, { "epoch": 1.01, "learning_rate": 0.00014813015674696264, "loss": 0.01, "step": 390590 }, { "epoch": 1.01, "learning_rate": 0.00014812626853059118, "loss": 0.0121, "step": 390600 }, { "epoch": 1.01, "learning_rate": 0.0001481223803142197, "loss": 0.0123, "step": 390610 }, { "epoch": 1.01, "learning_rate": 0.00014811849209784826, "loss": 0.0135, "step": 390620 }, { "epoch": 1.01, "learning_rate": 0.00014811460388147678, "loss": 0.0098, "step": 390630 }, { "epoch": 1.01, "learning_rate": 0.00014811071566510532, "loss": 0.0134, "step": 390640 }, { "epoch": 1.01, "learning_rate": 0.00014810682744873386, "loss": 0.0132, "step": 390650 }, { "epoch": 1.01, "learning_rate": 0.0001481029392323624, "loss": 0.0094, "step": 390660 }, { "epoch": 1.01, "learning_rate": 0.00014809905101599092, "loss": 0.0112, "step": 390670 }, { "epoch": 1.01, "learning_rate": 0.00014809516279961946, "loss": 0.0132, "step": 390680 }, { "epoch": 1.01, "learning_rate": 0.000148091274583248, "loss": 0.0109, "step": 390690 }, { "epoch": 1.01, "learning_rate": 0.00014808738636687654, "loss": 0.012, "step": 390700 }, { "epoch": 1.01, "learning_rate": 0.00014808349815050506, "loss": 0.0114, "step": 390710 }, { "epoch": 1.01, "learning_rate": 0.0001480796099341336, "loss": 0.0126, "step": 390720 }, { "epoch": 1.01, "learning_rate": 0.00014807572171776214, "loss": 0.01, "step": 390730 }, { "epoch": 1.01, "learning_rate": 0.00014807183350139068, "loss": 0.0121, "step": 390740 }, { "epoch": 1.01, "learning_rate": 0.0001480679452850192, "loss": 0.0122, "step": 390750 }, { "epoch": 1.01, "learning_rate": 0.00014806405706864774, "loss": 0.0088, "step": 390760 }, { "epoch": 1.01, "learning_rate": 0.00014806016885227628, "loss": 0.023, "step": 390770 }, { "epoch": 1.01, "learning_rate": 0.0001480562806359048, "loss": 0.0168, "step": 390780 }, { "epoch": 1.01, "learning_rate": 0.00014805239241953336, "loss": 0.0145, "step": 390790 }, { "epoch": 1.01, "learning_rate": 0.00014804850420316188, "loss": 0.0112, "step": 390800 }, { "epoch": 1.01, "learning_rate": 0.00014804461598679042, "loss": 0.0115, "step": 390810 }, { "epoch": 1.01, "learning_rate": 0.00014804072777041896, "loss": 0.0087, "step": 390820 }, { "epoch": 1.01, "learning_rate": 0.0001480368395540475, "loss": 0.0147, "step": 390830 }, { "epoch": 1.01, "learning_rate": 0.00014803295133767602, "loss": 0.0113, "step": 390840 }, { "epoch": 1.01, "learning_rate": 0.00014802906312130456, "loss": 0.0101, "step": 390850 }, { "epoch": 1.01, "learning_rate": 0.0001480251749049331, "loss": 0.0158, "step": 390860 }, { "epoch": 1.01, "learning_rate": 0.00014802128668856164, "loss": 0.0167, "step": 390870 }, { "epoch": 1.01, "learning_rate": 0.00014801739847219016, "loss": 0.0087, "step": 390880 }, { "epoch": 1.01, "learning_rate": 0.0001480135102558187, "loss": 0.0177, "step": 390890 }, { "epoch": 1.01, "learning_rate": 0.00014800962203944724, "loss": 0.0098, "step": 390900 }, { "epoch": 1.01, "learning_rate": 0.00014800573382307578, "loss": 0.0129, "step": 390910 }, { "epoch": 1.01, "learning_rate": 0.0001480018456067043, "loss": 0.0116, "step": 390920 }, { "epoch": 1.01, "learning_rate": 0.00014799795739033284, "loss": 0.0112, "step": 390930 }, { "epoch": 1.01, "learning_rate": 0.00014799406917396138, "loss": 0.013, "step": 390940 }, { "epoch": 1.01, "learning_rate": 0.00014799018095758992, "loss": 0.0128, "step": 390950 }, { "epoch": 1.01, "learning_rate": 0.00014798629274121846, "loss": 0.0115, "step": 390960 }, { "epoch": 1.01, "learning_rate": 0.000147982404524847, "loss": 0.0106, "step": 390970 }, { "epoch": 1.01, "learning_rate": 0.00014797851630847552, "loss": 0.0117, "step": 390980 }, { "epoch": 1.01, "learning_rate": 0.00014797462809210406, "loss": 0.0098, "step": 390990 }, { "epoch": 1.01, "learning_rate": 0.0001479707398757326, "loss": 0.0121, "step": 391000 }, { "epoch": 1.01, "eval_cer": 0.8817124837817071, "eval_loss": 0.007885308936238289, "eval_runtime": 107.5773, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 391000 }, { "epoch": 1.01, "learning_rate": 0.00014796685165936114, "loss": 0.011, "step": 391010 }, { "epoch": 1.01, "learning_rate": 0.00014796296344298966, "loss": 0.0124, "step": 391020 }, { "epoch": 1.01, "learning_rate": 0.0001479590752266182, "loss": 0.0118, "step": 391030 }, { "epoch": 1.01, "learning_rate": 0.00014795518701024674, "loss": 0.0129, "step": 391040 }, { "epoch": 1.01, "learning_rate": 0.00014795129879387526, "loss": 0.0124, "step": 391050 }, { "epoch": 1.01, "learning_rate": 0.0001479474105775038, "loss": 0.0151, "step": 391060 }, { "epoch": 1.01, "learning_rate": 0.00014794352236113234, "loss": 0.0108, "step": 391070 }, { "epoch": 1.01, "learning_rate": 0.00014793963414476088, "loss": 0.0123, "step": 391080 }, { "epoch": 1.01, "learning_rate": 0.0001479357459283894, "loss": 0.0134, "step": 391090 }, { "epoch": 1.01, "learning_rate": 0.00014793185771201794, "loss": 0.0142, "step": 391100 }, { "epoch": 1.01, "learning_rate": 0.00014792796949564648, "loss": 0.0101, "step": 391110 }, { "epoch": 1.01, "learning_rate": 0.00014792408127927502, "loss": 0.016, "step": 391120 }, { "epoch": 1.01, "learning_rate": 0.00014792019306290353, "loss": 0.0117, "step": 391130 }, { "epoch": 1.01, "learning_rate": 0.0001479163048465321, "loss": 0.0134, "step": 391140 }, { "epoch": 1.01, "learning_rate": 0.00014791241663016062, "loss": 0.0094, "step": 391150 }, { "epoch": 1.01, "learning_rate": 0.00014790852841378916, "loss": 0.0106, "step": 391160 }, { "epoch": 1.01, "learning_rate": 0.0001479046401974177, "loss": 0.0107, "step": 391170 }, { "epoch": 1.01, "learning_rate": 0.00014790075198104624, "loss": 0.0124, "step": 391180 }, { "epoch": 1.01, "learning_rate": 0.00014789686376467476, "loss": 0.0083, "step": 391190 }, { "epoch": 1.01, "learning_rate": 0.0001478929755483033, "loss": 0.0165, "step": 391200 }, { "epoch": 1.01, "learning_rate": 0.00014788908733193184, "loss": 0.012, "step": 391210 }, { "epoch": 1.01, "learning_rate": 0.00014788519911556038, "loss": 0.0098, "step": 391220 }, { "epoch": 1.01, "learning_rate": 0.0001478813108991889, "loss": 0.0117, "step": 391230 }, { "epoch": 1.01, "learning_rate": 0.00014787742268281744, "loss": 0.0145, "step": 391240 }, { "epoch": 1.01, "learning_rate": 0.00014787353446644598, "loss": 0.0108, "step": 391250 }, { "epoch": 1.01, "learning_rate": 0.00014786964625007452, "loss": 0.0124, "step": 391260 }, { "epoch": 1.01, "learning_rate": 0.00014786575803370304, "loss": 0.0125, "step": 391270 }, { "epoch": 1.01, "learning_rate": 0.00014786186981733158, "loss": 0.0099, "step": 391280 }, { "epoch": 1.01, "learning_rate": 0.00014785798160096012, "loss": 0.0118, "step": 391290 }, { "epoch": 1.01, "learning_rate": 0.00014785409338458863, "loss": 0.0132, "step": 391300 }, { "epoch": 1.01, "learning_rate": 0.0001478502051682172, "loss": 0.0123, "step": 391310 }, { "epoch": 1.01, "learning_rate": 0.00014784631695184572, "loss": 0.0108, "step": 391320 }, { "epoch": 1.01, "learning_rate": 0.00014784242873547426, "loss": 0.0111, "step": 391330 }, { "epoch": 1.01, "learning_rate": 0.0001478385405191028, "loss": 0.0126, "step": 391340 }, { "epoch": 1.01, "learning_rate": 0.00014783465230273134, "loss": 0.0136, "step": 391350 }, { "epoch": 1.01, "learning_rate": 0.00014783076408635986, "loss": 0.0108, "step": 391360 }, { "epoch": 1.01, "learning_rate": 0.0001478268758699884, "loss": 0.0107, "step": 391370 }, { "epoch": 1.01, "learning_rate": 0.00014782298765361694, "loss": 0.0102, "step": 391380 }, { "epoch": 1.01, "learning_rate": 0.00014781909943724548, "loss": 0.0107, "step": 391390 }, { "epoch": 1.01, "learning_rate": 0.000147815211220874, "loss": 0.0116, "step": 391400 }, { "epoch": 1.01, "learning_rate": 0.00014781132300450254, "loss": 0.0127, "step": 391410 }, { "epoch": 1.01, "learning_rate": 0.00014780743478813108, "loss": 0.0109, "step": 391420 }, { "epoch": 1.01, "learning_rate": 0.00014780354657175962, "loss": 0.0104, "step": 391430 }, { "epoch": 1.01, "learning_rate": 0.00014779965835538814, "loss": 0.0099, "step": 391440 }, { "epoch": 1.01, "learning_rate": 0.00014779577013901668, "loss": 0.0128, "step": 391450 }, { "epoch": 1.01, "learning_rate": 0.00014779188192264522, "loss": 0.0097, "step": 391460 }, { "epoch": 1.01, "learning_rate": 0.00014778799370627376, "loss": 0.0142, "step": 391470 }, { "epoch": 1.01, "learning_rate": 0.00014778410548990227, "loss": 0.0167, "step": 391480 }, { "epoch": 1.01, "learning_rate": 0.00014778021727353084, "loss": 0.0122, "step": 391490 }, { "epoch": 1.01, "learning_rate": 0.00014777632905715936, "loss": 0.0122, "step": 391500 }, { "epoch": 1.01, "learning_rate": 0.0001477724408407879, "loss": 0.0119, "step": 391510 }, { "epoch": 1.01, "learning_rate": 0.00014776855262441644, "loss": 0.0105, "step": 391520 }, { "epoch": 1.01, "learning_rate": 0.00014776466440804496, "loss": 0.0085, "step": 391530 }, { "epoch": 1.01, "learning_rate": 0.0001477607761916735, "loss": 0.0134, "step": 391540 }, { "epoch": 1.01, "learning_rate": 0.00014775688797530204, "loss": 0.0097, "step": 391550 }, { "epoch": 1.01, "learning_rate": 0.00014775299975893058, "loss": 0.0121, "step": 391560 }, { "epoch": 1.02, "learning_rate": 0.0001477491115425591, "loss": 0.0114, "step": 391570 }, { "epoch": 1.02, "learning_rate": 0.00014774522332618764, "loss": 0.0107, "step": 391580 }, { "epoch": 1.02, "learning_rate": 0.00014774133510981618, "loss": 0.016, "step": 391590 }, { "epoch": 1.02, "learning_rate": 0.00014773744689344472, "loss": 0.0125, "step": 391600 }, { "epoch": 1.02, "learning_rate": 0.00014773355867707323, "loss": 0.0119, "step": 391610 }, { "epoch": 1.02, "learning_rate": 0.00014772967046070178, "loss": 0.0136, "step": 391620 }, { "epoch": 1.02, "learning_rate": 0.00014772578224433032, "loss": 0.0109, "step": 391630 }, { "epoch": 1.02, "learning_rate": 0.00014772189402795886, "loss": 0.0139, "step": 391640 }, { "epoch": 1.02, "learning_rate": 0.00014771800581158737, "loss": 0.0143, "step": 391650 }, { "epoch": 1.02, "learning_rate": 0.00014771411759521594, "loss": 0.0122, "step": 391660 }, { "epoch": 1.02, "learning_rate": 0.00014771022937884446, "loss": 0.0134, "step": 391670 }, { "epoch": 1.02, "learning_rate": 0.000147706341162473, "loss": 0.0126, "step": 391680 }, { "epoch": 1.02, "learning_rate": 0.00014770245294610154, "loss": 0.0095, "step": 391690 }, { "epoch": 1.02, "learning_rate": 0.00014769856472973008, "loss": 0.0105, "step": 391700 }, { "epoch": 1.02, "learning_rate": 0.0001476946765133586, "loss": 0.0084, "step": 391710 }, { "epoch": 1.02, "learning_rate": 0.00014769078829698714, "loss": 0.0118, "step": 391720 }, { "epoch": 1.02, "learning_rate": 0.00014768690008061568, "loss": 0.0141, "step": 391730 }, { "epoch": 1.02, "learning_rate": 0.00014768301186424422, "loss": 0.0119, "step": 391740 }, { "epoch": 1.02, "learning_rate": 0.00014767912364787274, "loss": 0.0118, "step": 391750 }, { "epoch": 1.02, "learning_rate": 0.00014767523543150128, "loss": 0.0129, "step": 391760 }, { "epoch": 1.02, "learning_rate": 0.00014767134721512982, "loss": 0.0114, "step": 391770 }, { "epoch": 1.02, "learning_rate": 0.00014766745899875833, "loss": 0.0101, "step": 391780 }, { "epoch": 1.02, "learning_rate": 0.00014766357078238688, "loss": 0.0112, "step": 391790 }, { "epoch": 1.02, "learning_rate": 0.00014765968256601542, "loss": 0.0113, "step": 391800 }, { "epoch": 1.02, "learning_rate": 0.00014765579434964396, "loss": 0.0097, "step": 391810 }, { "epoch": 1.02, "learning_rate": 0.00014765190613327247, "loss": 0.01, "step": 391820 }, { "epoch": 1.02, "learning_rate": 0.00014764801791690104, "loss": 0.0126, "step": 391830 }, { "epoch": 1.02, "learning_rate": 0.00014764412970052956, "loss": 0.0099, "step": 391840 }, { "epoch": 1.02, "learning_rate": 0.0001476402414841581, "loss": 0.0135, "step": 391850 }, { "epoch": 1.02, "learning_rate": 0.00014763635326778664, "loss": 0.0128, "step": 391860 }, { "epoch": 1.02, "learning_rate": 0.00014763246505141518, "loss": 0.0091, "step": 391870 }, { "epoch": 1.02, "learning_rate": 0.0001476285768350437, "loss": 0.0118, "step": 391880 }, { "epoch": 1.02, "learning_rate": 0.00014762468861867224, "loss": 0.0156, "step": 391890 }, { "epoch": 1.02, "learning_rate": 0.00014762080040230078, "loss": 0.0141, "step": 391900 }, { "epoch": 1.02, "learning_rate": 0.00014761691218592932, "loss": 0.0196, "step": 391910 }, { "epoch": 1.02, "learning_rate": 0.00014761302396955784, "loss": 0.0109, "step": 391920 }, { "epoch": 1.02, "learning_rate": 0.00014760913575318638, "loss": 0.0143, "step": 391930 }, { "epoch": 1.02, "learning_rate": 0.00014760524753681492, "loss": 0.013, "step": 391940 }, { "epoch": 1.02, "learning_rate": 0.00014760135932044346, "loss": 0.0103, "step": 391950 }, { "epoch": 1.02, "learning_rate": 0.00014759747110407198, "loss": 0.0097, "step": 391960 }, { "epoch": 1.02, "learning_rate": 0.00014759358288770052, "loss": 0.0104, "step": 391970 }, { "epoch": 1.02, "learning_rate": 0.00014758969467132906, "loss": 0.0109, "step": 391980 }, { "epoch": 1.02, "learning_rate": 0.0001475858064549576, "loss": 0.0133, "step": 391990 }, { "epoch": 1.02, "learning_rate": 0.00014758191823858611, "loss": 0.0114, "step": 392000 }, { "epoch": 1.02, "eval_cer": 0.8817488743419957, "eval_loss": 0.007738828659057617, "eval_runtime": 107.489, "eval_samples_per_second": 18.607, "eval_steps_per_second": 4.652, "step": 392000 }, { "epoch": 1.02, "learning_rate": 0.00014757803002221466, "loss": 0.0153, "step": 392010 }, { "epoch": 1.02, "learning_rate": 0.0001475741418058432, "loss": 0.0097, "step": 392020 }, { "epoch": 1.02, "learning_rate": 0.00014757025358947174, "loss": 0.0129, "step": 392030 }, { "epoch": 1.02, "learning_rate": 0.00014756636537310028, "loss": 0.0159, "step": 392040 }, { "epoch": 1.02, "learning_rate": 0.0001475624771567288, "loss": 0.0127, "step": 392050 }, { "epoch": 1.02, "learning_rate": 0.00014755858894035734, "loss": 0.0104, "step": 392060 }, { "epoch": 1.02, "learning_rate": 0.00014755470072398588, "loss": 0.0096, "step": 392070 }, { "epoch": 1.02, "learning_rate": 0.00014755081250761442, "loss": 0.0109, "step": 392080 }, { "epoch": 1.02, "learning_rate": 0.00014754692429124294, "loss": 0.0106, "step": 392090 }, { "epoch": 1.02, "learning_rate": 0.00014754303607487148, "loss": 0.0174, "step": 392100 }, { "epoch": 1.02, "learning_rate": 0.00014753914785850002, "loss": 0.0128, "step": 392110 }, { "epoch": 1.02, "learning_rate": 0.00014753525964212856, "loss": 0.0129, "step": 392120 }, { "epoch": 1.02, "learning_rate": 0.00014753137142575707, "loss": 0.0126, "step": 392130 }, { "epoch": 1.02, "learning_rate": 0.00014752748320938562, "loss": 0.0092, "step": 392140 }, { "epoch": 1.02, "learning_rate": 0.00014752359499301416, "loss": 0.0159, "step": 392150 }, { "epoch": 1.02, "learning_rate": 0.0001475197067766427, "loss": 0.0128, "step": 392160 }, { "epoch": 1.02, "learning_rate": 0.00014751581856027121, "loss": 0.0118, "step": 392170 }, { "epoch": 1.02, "learning_rate": 0.00014751193034389978, "loss": 0.0111, "step": 392180 }, { "epoch": 1.02, "learning_rate": 0.0001475080421275283, "loss": 0.0136, "step": 392190 }, { "epoch": 1.02, "learning_rate": 0.00014750415391115684, "loss": 0.0122, "step": 392200 }, { "epoch": 1.02, "learning_rate": 0.00014750026569478538, "loss": 0.0119, "step": 392210 }, { "epoch": 1.02, "learning_rate": 0.00014749637747841392, "loss": 0.0125, "step": 392220 }, { "epoch": 1.02, "learning_rate": 0.00014749248926204244, "loss": 0.0132, "step": 392230 }, { "epoch": 1.02, "learning_rate": 0.00014748860104567098, "loss": 0.012, "step": 392240 }, { "epoch": 1.02, "learning_rate": 0.00014748471282929952, "loss": 0.0092, "step": 392250 }, { "epoch": 1.02, "learning_rate": 0.00014748082461292803, "loss": 0.0115, "step": 392260 }, { "epoch": 1.02, "learning_rate": 0.00014747693639655658, "loss": 0.0116, "step": 392270 }, { "epoch": 1.02, "learning_rate": 0.00014747304818018512, "loss": 0.0092, "step": 392280 }, { "epoch": 1.02, "learning_rate": 0.00014746915996381366, "loss": 0.0167, "step": 392290 }, { "epoch": 1.02, "learning_rate": 0.00014746527174744217, "loss": 0.0119, "step": 392300 }, { "epoch": 1.02, "learning_rate": 0.00014746138353107072, "loss": 0.0125, "step": 392310 }, { "epoch": 1.02, "learning_rate": 0.00014745749531469926, "loss": 0.0107, "step": 392320 }, { "epoch": 1.02, "learning_rate": 0.0001474536070983278, "loss": 0.0151, "step": 392330 }, { "epoch": 1.02, "learning_rate": 0.00014744971888195631, "loss": 0.0124, "step": 392340 }, { "epoch": 1.02, "learning_rate": 0.00014744583066558486, "loss": 0.013, "step": 392350 }, { "epoch": 1.02, "learning_rate": 0.0001474419424492134, "loss": 0.0116, "step": 392360 }, { "epoch": 1.02, "learning_rate": 0.00014743805423284194, "loss": 0.0165, "step": 392370 }, { "epoch": 1.02, "learning_rate": 0.00014743416601647048, "loss": 0.0108, "step": 392380 }, { "epoch": 1.02, "learning_rate": 0.00014743027780009902, "loss": 0.0101, "step": 392390 }, { "epoch": 1.02, "learning_rate": 0.00014742638958372754, "loss": 0.0117, "step": 392400 }, { "epoch": 1.02, "learning_rate": 0.00014742250136735608, "loss": 0.0108, "step": 392410 }, { "epoch": 1.02, "learning_rate": 0.00014741861315098462, "loss": 0.0094, "step": 392420 }, { "epoch": 1.02, "learning_rate": 0.00014741472493461316, "loss": 0.0094, "step": 392430 }, { "epoch": 1.02, "learning_rate": 0.00014741083671824168, "loss": 0.0107, "step": 392440 }, { "epoch": 1.02, "learning_rate": 0.00014740694850187022, "loss": 0.0122, "step": 392450 }, { "epoch": 1.02, "learning_rate": 0.00014740306028549876, "loss": 0.011, "step": 392460 }, { "epoch": 1.02, "learning_rate": 0.0001473991720691273, "loss": 0.0109, "step": 392470 }, { "epoch": 1.02, "learning_rate": 0.00014739528385275582, "loss": 0.0121, "step": 392480 }, { "epoch": 1.02, "learning_rate": 0.00014739139563638436, "loss": 0.0124, "step": 392490 }, { "epoch": 1.02, "learning_rate": 0.0001473875074200129, "loss": 0.0113, "step": 392500 }, { "epoch": 1.02, "learning_rate": 0.0001473836192036414, "loss": 0.0108, "step": 392510 }, { "epoch": 1.02, "learning_rate": 0.00014737973098726995, "loss": 0.0156, "step": 392520 }, { "epoch": 1.02, "learning_rate": 0.0001473758427708985, "loss": 0.0108, "step": 392530 }, { "epoch": 1.02, "learning_rate": 0.00014737195455452704, "loss": 0.0112, "step": 392540 }, { "epoch": 1.02, "learning_rate": 0.00014736806633815555, "loss": 0.0124, "step": 392550 }, { "epoch": 1.02, "learning_rate": 0.00014736417812178412, "loss": 0.0158, "step": 392560 }, { "epoch": 1.02, "learning_rate": 0.00014736028990541264, "loss": 0.0111, "step": 392570 }, { "epoch": 1.02, "learning_rate": 0.00014735640168904118, "loss": 0.0122, "step": 392580 }, { "epoch": 1.02, "learning_rate": 0.00014735251347266972, "loss": 0.0242, "step": 392590 }, { "epoch": 1.02, "learning_rate": 0.00014734862525629826, "loss": 0.0129, "step": 392600 }, { "epoch": 1.02, "learning_rate": 0.00014734473703992678, "loss": 0.0103, "step": 392610 }, { "epoch": 1.02, "learning_rate": 0.00014734084882355532, "loss": 0.0083, "step": 392620 }, { "epoch": 1.02, "learning_rate": 0.00014733696060718386, "loss": 0.01, "step": 392630 }, { "epoch": 1.02, "learning_rate": 0.0001473330723908124, "loss": 0.0101, "step": 392640 }, { "epoch": 1.02, "learning_rate": 0.00014732918417444091, "loss": 0.0102, "step": 392650 }, { "epoch": 1.02, "learning_rate": 0.00014732529595806946, "loss": 0.0097, "step": 392660 }, { "epoch": 1.02, "learning_rate": 0.000147321407741698, "loss": 0.0113, "step": 392670 }, { "epoch": 1.02, "learning_rate": 0.00014731751952532654, "loss": 0.0149, "step": 392680 }, { "epoch": 1.02, "learning_rate": 0.00014731363130895505, "loss": 0.0152, "step": 392690 }, { "epoch": 1.02, "learning_rate": 0.00014730974309258362, "loss": 0.009, "step": 392700 }, { "epoch": 1.02, "learning_rate": 0.00014730585487621214, "loss": 0.0104, "step": 392710 }, { "epoch": 1.02, "learning_rate": 0.00014730196665984068, "loss": 0.0108, "step": 392720 }, { "epoch": 1.02, "learning_rate": 0.00014729807844346922, "loss": 0.0116, "step": 392730 }, { "epoch": 1.02, "learning_rate": 0.00014729419022709776, "loss": 0.0109, "step": 392740 }, { "epoch": 1.02, "learning_rate": 0.00014729030201072628, "loss": 0.0178, "step": 392750 }, { "epoch": 1.02, "learning_rate": 0.00014728641379435482, "loss": 0.0109, "step": 392760 }, { "epoch": 1.02, "learning_rate": 0.00014728252557798336, "loss": 0.0183, "step": 392770 }, { "epoch": 1.02, "learning_rate": 0.00014727863736161187, "loss": 0.0121, "step": 392780 }, { "epoch": 1.02, "learning_rate": 0.00014727474914524042, "loss": 0.0158, "step": 392790 }, { "epoch": 1.02, "learning_rate": 0.00014727086092886896, "loss": 0.0121, "step": 392800 }, { "epoch": 1.02, "learning_rate": 0.0001472669727124975, "loss": 0.0103, "step": 392810 }, { "epoch": 1.02, "learning_rate": 0.00014726308449612601, "loss": 0.0108, "step": 392820 }, { "epoch": 1.02, "learning_rate": 0.00014725919627975456, "loss": 0.0129, "step": 392830 }, { "epoch": 1.02, "learning_rate": 0.0001472553080633831, "loss": 0.0106, "step": 392840 }, { "epoch": 1.02, "learning_rate": 0.00014725141984701164, "loss": 0.0119, "step": 392850 }, { "epoch": 1.02, "learning_rate": 0.00014724753163064015, "loss": 0.0109, "step": 392860 }, { "epoch": 1.02, "learning_rate": 0.0001472436434142687, "loss": 0.0088, "step": 392870 }, { "epoch": 1.02, "learning_rate": 0.00014723975519789724, "loss": 0.0107, "step": 392880 }, { "epoch": 1.02, "learning_rate": 0.00014723586698152578, "loss": 0.0113, "step": 392890 }, { "epoch": 1.02, "learning_rate": 0.00014723197876515432, "loss": 0.015, "step": 392900 }, { "epoch": 1.02, "learning_rate": 0.00014722809054878286, "loss": 0.0119, "step": 392910 }, { "epoch": 1.02, "learning_rate": 0.00014722420233241138, "loss": 0.0132, "step": 392920 }, { "epoch": 1.02, "learning_rate": 0.00014722031411603992, "loss": 0.0159, "step": 392930 }, { "epoch": 1.02, "learning_rate": 0.00014721642589966846, "loss": 0.0097, "step": 392940 }, { "epoch": 1.02, "learning_rate": 0.000147212537683297, "loss": 0.0112, "step": 392950 }, { "epoch": 1.02, "learning_rate": 0.00014720864946692552, "loss": 0.0129, "step": 392960 }, { "epoch": 1.02, "learning_rate": 0.00014720476125055406, "loss": 0.0189, "step": 392970 }, { "epoch": 1.02, "learning_rate": 0.0001472008730341826, "loss": 0.0119, "step": 392980 }, { "epoch": 1.02, "learning_rate": 0.00014719698481781114, "loss": 0.0102, "step": 392990 }, { "epoch": 1.02, "learning_rate": 0.00014719309660143966, "loss": 0.0101, "step": 393000 }, { "epoch": 1.02, "eval_cer": 0.8817138834186412, "eval_loss": 0.008117906749248505, "eval_runtime": 107.5812, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 393000 }, { "epoch": 1.02, "learning_rate": 0.0001471892083850682, "loss": 0.0108, "step": 393010 }, { "epoch": 1.02, "learning_rate": 0.00014718532016869674, "loss": 0.013, "step": 393020 }, { "epoch": 1.02, "learning_rate": 0.00014718143195232525, "loss": 0.0116, "step": 393030 }, { "epoch": 1.02, "learning_rate": 0.0001471775437359538, "loss": 0.0129, "step": 393040 }, { "epoch": 1.02, "learning_rate": 0.00014717365551958234, "loss": 0.0113, "step": 393050 }, { "epoch": 1.02, "learning_rate": 0.00014716976730321088, "loss": 0.0117, "step": 393060 }, { "epoch": 1.02, "learning_rate": 0.0001471658790868394, "loss": 0.0105, "step": 393070 }, { "epoch": 1.02, "learning_rate": 0.00014716199087046796, "loss": 0.0118, "step": 393080 }, { "epoch": 1.02, "learning_rate": 0.00014715810265409648, "loss": 0.0078, "step": 393090 }, { "epoch": 1.02, "learning_rate": 0.00014715421443772502, "loss": 0.0121, "step": 393100 }, { "epoch": 1.02, "learning_rate": 0.00014715032622135356, "loss": 0.0067, "step": 393110 }, { "epoch": 1.02, "learning_rate": 0.0001471464380049821, "loss": 0.0152, "step": 393120 }, { "epoch": 1.02, "learning_rate": 0.00014714254978861062, "loss": 0.0113, "step": 393130 }, { "epoch": 1.02, "learning_rate": 0.00014713866157223916, "loss": 0.0106, "step": 393140 }, { "epoch": 1.02, "learning_rate": 0.0001471347733558677, "loss": 0.0112, "step": 393150 }, { "epoch": 1.02, "learning_rate": 0.00014713088513949624, "loss": 0.0106, "step": 393160 }, { "epoch": 1.02, "learning_rate": 0.00014712699692312475, "loss": 0.0126, "step": 393170 }, { "epoch": 1.02, "learning_rate": 0.0001471231087067533, "loss": 0.0094, "step": 393180 }, { "epoch": 1.02, "learning_rate": 0.00014711922049038184, "loss": 0.0104, "step": 393190 }, { "epoch": 1.02, "learning_rate": 0.00014711533227401038, "loss": 0.0119, "step": 393200 }, { "epoch": 1.02, "learning_rate": 0.0001471114440576389, "loss": 0.0141, "step": 393210 }, { "epoch": 1.02, "learning_rate": 0.00014710755584126746, "loss": 0.0102, "step": 393220 }, { "epoch": 1.02, "learning_rate": 0.00014710366762489598, "loss": 0.0144, "step": 393230 }, { "epoch": 1.02, "learning_rate": 0.00014709977940852452, "loss": 0.0084, "step": 393240 }, { "epoch": 1.02, "learning_rate": 0.00014709589119215306, "loss": 0.014, "step": 393250 }, { "epoch": 1.02, "learning_rate": 0.00014709200297578158, "loss": 0.0253, "step": 393260 }, { "epoch": 1.02, "learning_rate": 0.00014708811475941012, "loss": 0.0128, "step": 393270 }, { "epoch": 1.02, "learning_rate": 0.00014708422654303866, "loss": 0.0135, "step": 393280 }, { "epoch": 1.02, "learning_rate": 0.0001470803383266672, "loss": 0.0145, "step": 393290 }, { "epoch": 1.02, "learning_rate": 0.00014707645011029571, "loss": 0.012, "step": 393300 }, { "epoch": 1.02, "learning_rate": 0.00014707256189392426, "loss": 0.0116, "step": 393310 }, { "epoch": 1.02, "learning_rate": 0.0001470686736775528, "loss": 0.013, "step": 393320 }, { "epoch": 1.02, "learning_rate": 0.00014706478546118134, "loss": 0.016, "step": 393330 }, { "epoch": 1.02, "learning_rate": 0.00014706089724480985, "loss": 0.0117, "step": 393340 }, { "epoch": 1.02, "learning_rate": 0.0001470570090284384, "loss": 0.0104, "step": 393350 }, { "epoch": 1.02, "learning_rate": 0.00014705312081206694, "loss": 0.0131, "step": 393360 }, { "epoch": 1.02, "learning_rate": 0.00014704923259569548, "loss": 0.0127, "step": 393370 }, { "epoch": 1.02, "learning_rate": 0.000147045344379324, "loss": 0.0167, "step": 393380 }, { "epoch": 1.02, "learning_rate": 0.00014704145616295253, "loss": 0.0107, "step": 393390 }, { "epoch": 1.02, "learning_rate": 0.00014703756794658108, "loss": 0.0106, "step": 393400 }, { "epoch": 1.02, "learning_rate": 0.00014703367973020962, "loss": 0.0121, "step": 393410 }, { "epoch": 1.02, "learning_rate": 0.00014702979151383816, "loss": 0.0146, "step": 393420 }, { "epoch": 1.02, "learning_rate": 0.0001470259032974667, "loss": 0.0105, "step": 393430 }, { "epoch": 1.02, "learning_rate": 0.00014702201508109522, "loss": 0.0117, "step": 393440 }, { "epoch": 1.02, "learning_rate": 0.00014701812686472376, "loss": 0.0119, "step": 393450 }, { "epoch": 1.02, "learning_rate": 0.0001470142386483523, "loss": 0.0118, "step": 393460 }, { "epoch": 1.02, "learning_rate": 0.00014701035043198084, "loss": 0.0124, "step": 393470 }, { "epoch": 1.02, "learning_rate": 0.00014700646221560936, "loss": 0.0104, "step": 393480 }, { "epoch": 1.02, "learning_rate": 0.0001470025739992379, "loss": 0.0119, "step": 393490 }, { "epoch": 1.02, "learning_rate": 0.00014699868578286644, "loss": 0.011, "step": 393500 }, { "epoch": 1.02, "learning_rate": 0.00014699479756649495, "loss": 0.0093, "step": 393510 }, { "epoch": 1.02, "learning_rate": 0.0001469909093501235, "loss": 0.0163, "step": 393520 }, { "epoch": 1.02, "learning_rate": 0.00014698702113375204, "loss": 0.0088, "step": 393530 }, { "epoch": 1.02, "learning_rate": 0.00014698313291738058, "loss": 0.0121, "step": 393540 }, { "epoch": 1.02, "learning_rate": 0.0001469792447010091, "loss": 0.0097, "step": 393550 }, { "epoch": 1.02, "learning_rate": 0.00014697535648463763, "loss": 0.0091, "step": 393560 }, { "epoch": 1.02, "learning_rate": 0.00014697146826826618, "loss": 0.0121, "step": 393570 }, { "epoch": 1.02, "learning_rate": 0.00014696758005189472, "loss": 0.0107, "step": 393580 }, { "epoch": 1.02, "learning_rate": 0.00014696369183552323, "loss": 0.0153, "step": 393590 }, { "epoch": 1.02, "learning_rate": 0.0001469598036191518, "loss": 0.013, "step": 393600 }, { "epoch": 1.02, "learning_rate": 0.00014695591540278032, "loss": 0.013, "step": 393610 }, { "epoch": 1.02, "learning_rate": 0.00014695202718640886, "loss": 0.0151, "step": 393620 }, { "epoch": 1.02, "learning_rate": 0.0001469481389700374, "loss": 0.0108, "step": 393630 }, { "epoch": 1.02, "learning_rate": 0.00014694425075366594, "loss": 0.0098, "step": 393640 }, { "epoch": 1.02, "learning_rate": 0.00014694036253729445, "loss": 0.0117, "step": 393650 }, { "epoch": 1.02, "learning_rate": 0.000146936474320923, "loss": 0.0129, "step": 393660 }, { "epoch": 1.02, "learning_rate": 0.00014693258610455154, "loss": 0.0129, "step": 393670 }, { "epoch": 1.02, "learning_rate": 0.00014692869788818008, "loss": 0.0133, "step": 393680 }, { "epoch": 1.02, "learning_rate": 0.0001469248096718086, "loss": 0.0107, "step": 393690 }, { "epoch": 1.02, "learning_rate": 0.00014692092145543714, "loss": 0.0112, "step": 393700 }, { "epoch": 1.02, "learning_rate": 0.00014691703323906568, "loss": 0.0129, "step": 393710 }, { "epoch": 1.02, "learning_rate": 0.00014691314502269422, "loss": 0.01, "step": 393720 }, { "epoch": 1.02, "learning_rate": 0.00014690925680632273, "loss": 0.0106, "step": 393730 }, { "epoch": 1.02, "learning_rate": 0.00014690536858995128, "loss": 0.0106, "step": 393740 }, { "epoch": 1.02, "learning_rate": 0.00014690148037357982, "loss": 0.0086, "step": 393750 }, { "epoch": 1.02, "learning_rate": 0.00014689759215720833, "loss": 0.0109, "step": 393760 }, { "epoch": 1.02, "learning_rate": 0.0001468937039408369, "loss": 0.0121, "step": 393770 }, { "epoch": 1.02, "learning_rate": 0.00014688981572446541, "loss": 0.0094, "step": 393780 }, { "epoch": 1.02, "learning_rate": 0.00014688592750809396, "loss": 0.0123, "step": 393790 }, { "epoch": 1.02, "learning_rate": 0.0001468820392917225, "loss": 0.0116, "step": 393800 }, { "epoch": 1.02, "learning_rate": 0.00014687815107535104, "loss": 0.0106, "step": 393810 }, { "epoch": 1.02, "learning_rate": 0.00014687426285897955, "loss": 0.0104, "step": 393820 }, { "epoch": 1.02, "learning_rate": 0.0001468703746426081, "loss": 0.0098, "step": 393830 }, { "epoch": 1.02, "learning_rate": 0.00014686648642623664, "loss": 0.0142, "step": 393840 }, { "epoch": 1.02, "learning_rate": 0.00014686259820986518, "loss": 0.0129, "step": 393850 }, { "epoch": 1.02, "learning_rate": 0.0001468587099934937, "loss": 0.0133, "step": 393860 }, { "epoch": 1.02, "learning_rate": 0.00014685482177712224, "loss": 0.0103, "step": 393870 }, { "epoch": 1.02, "learning_rate": 0.00014685093356075078, "loss": 0.0097, "step": 393880 }, { "epoch": 1.02, "learning_rate": 0.00014684704534437932, "loss": 0.0123, "step": 393890 }, { "epoch": 1.02, "learning_rate": 0.00014684315712800783, "loss": 0.0089, "step": 393900 }, { "epoch": 1.02, "learning_rate": 0.00014683926891163637, "loss": 0.0111, "step": 393910 }, { "epoch": 1.02, "learning_rate": 0.00014683538069526492, "loss": 0.0102, "step": 393920 }, { "epoch": 1.02, "learning_rate": 0.00014683149247889346, "loss": 0.0106, "step": 393930 }, { "epoch": 1.02, "learning_rate": 0.00014682760426252197, "loss": 0.0149, "step": 393940 }, { "epoch": 1.02, "learning_rate": 0.00014682371604615054, "loss": 0.0102, "step": 393950 }, { "epoch": 1.02, "learning_rate": 0.00014681982782977906, "loss": 0.0166, "step": 393960 }, { "epoch": 1.02, "learning_rate": 0.0001468159396134076, "loss": 0.0136, "step": 393970 }, { "epoch": 1.02, "learning_rate": 0.00014681205139703614, "loss": 0.0137, "step": 393980 }, { "epoch": 1.02, "learning_rate": 0.00014680816318066468, "loss": 0.0101, "step": 393990 }, { "epoch": 1.02, "learning_rate": 0.0001468042749642932, "loss": 0.0095, "step": 394000 }, { "epoch": 1.02, "eval_cer": 0.8816858906799576, "eval_loss": 0.0077973357401788235, "eval_runtime": 107.7965, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 394000 }, { "epoch": 1.02, "learning_rate": 0.00014680038674792174, "loss": 0.0125, "step": 394010 }, { "epoch": 1.02, "learning_rate": 0.00014679649853155028, "loss": 0.0099, "step": 394020 }, { "epoch": 1.02, "learning_rate": 0.0001467926103151788, "loss": 0.0104, "step": 394030 }, { "epoch": 1.02, "learning_rate": 0.00014678872209880733, "loss": 0.0111, "step": 394040 }, { "epoch": 1.02, "learning_rate": 0.00014678483388243588, "loss": 0.01, "step": 394050 }, { "epoch": 1.02, "learning_rate": 0.00014678094566606442, "loss": 0.0101, "step": 394060 }, { "epoch": 1.02, "learning_rate": 0.00014677705744969293, "loss": 0.0164, "step": 394070 }, { "epoch": 1.02, "learning_rate": 0.00014677316923332147, "loss": 0.009, "step": 394080 }, { "epoch": 1.02, "learning_rate": 0.00014676928101695002, "loss": 0.0151, "step": 394090 }, { "epoch": 1.02, "learning_rate": 0.00014676539280057856, "loss": 0.0094, "step": 394100 }, { "epoch": 1.02, "learning_rate": 0.00014676150458420707, "loss": 0.0092, "step": 394110 }, { "epoch": 1.02, "learning_rate": 0.00014675761636783564, "loss": 0.0146, "step": 394120 }, { "epoch": 1.02, "learning_rate": 0.00014675372815146416, "loss": 0.0123, "step": 394130 }, { "epoch": 1.02, "learning_rate": 0.0001467498399350927, "loss": 0.017, "step": 394140 }, { "epoch": 1.02, "learning_rate": 0.00014674595171872124, "loss": 0.012, "step": 394150 }, { "epoch": 1.02, "learning_rate": 0.00014674206350234978, "loss": 0.0138, "step": 394160 }, { "epoch": 1.02, "learning_rate": 0.0001467381752859783, "loss": 0.0136, "step": 394170 }, { "epoch": 1.02, "learning_rate": 0.00014673428706960684, "loss": 0.0111, "step": 394180 }, { "epoch": 1.02, "learning_rate": 0.00014673039885323538, "loss": 0.0125, "step": 394190 }, { "epoch": 1.02, "learning_rate": 0.00014672651063686392, "loss": 0.0134, "step": 394200 }, { "epoch": 1.02, "learning_rate": 0.00014672262242049243, "loss": 0.0101, "step": 394210 }, { "epoch": 1.02, "learning_rate": 0.00014671873420412098, "loss": 0.0117, "step": 394220 }, { "epoch": 1.02, "learning_rate": 0.00014671484598774952, "loss": 0.012, "step": 394230 }, { "epoch": 1.02, "learning_rate": 0.00014671095777137806, "loss": 0.0093, "step": 394240 }, { "epoch": 1.02, "learning_rate": 0.00014670706955500657, "loss": 0.0096, "step": 394250 }, { "epoch": 1.02, "learning_rate": 0.00014670318133863512, "loss": 0.0127, "step": 394260 }, { "epoch": 1.02, "learning_rate": 0.00014669929312226366, "loss": 0.0117, "step": 394270 }, { "epoch": 1.02, "learning_rate": 0.00014669540490589217, "loss": 0.0114, "step": 394280 }, { "epoch": 1.02, "learning_rate": 0.00014669151668952074, "loss": 0.0123, "step": 394290 }, { "epoch": 1.02, "learning_rate": 0.00014668762847314925, "loss": 0.0125, "step": 394300 }, { "epoch": 1.02, "learning_rate": 0.0001466837402567778, "loss": 0.011, "step": 394310 }, { "epoch": 1.02, "learning_rate": 0.00014667985204040634, "loss": 0.0126, "step": 394320 }, { "epoch": 1.02, "learning_rate": 0.00014667596382403488, "loss": 0.0115, "step": 394330 }, { "epoch": 1.02, "learning_rate": 0.0001466720756076634, "loss": 0.0103, "step": 394340 }, { "epoch": 1.02, "learning_rate": 0.00014666818739129194, "loss": 0.0133, "step": 394350 }, { "epoch": 1.02, "learning_rate": 0.00014666429917492048, "loss": 0.0096, "step": 394360 }, { "epoch": 1.02, "learning_rate": 0.00014666041095854902, "loss": 0.0133, "step": 394370 }, { "epoch": 1.02, "learning_rate": 0.00014665652274217753, "loss": 0.0121, "step": 394380 }, { "epoch": 1.02, "learning_rate": 0.00014665263452580608, "loss": 0.0149, "step": 394390 }, { "epoch": 1.02, "learning_rate": 0.00014664874630943462, "loss": 0.0158, "step": 394400 }, { "epoch": 1.02, "learning_rate": 0.00014664485809306316, "loss": 0.0102, "step": 394410 }, { "epoch": 1.02, "learning_rate": 0.00014664096987669167, "loss": 0.01, "step": 394420 }, { "epoch": 1.02, "learning_rate": 0.00014663708166032021, "loss": 0.0121, "step": 394430 }, { "epoch": 1.02, "learning_rate": 0.00014663319344394876, "loss": 0.0092, "step": 394440 }, { "epoch": 1.02, "learning_rate": 0.0001466293052275773, "loss": 0.0124, "step": 394450 }, { "epoch": 1.02, "learning_rate": 0.0001466254170112058, "loss": 0.0126, "step": 394460 }, { "epoch": 1.02, "learning_rate": 0.00014662152879483438, "loss": 0.0124, "step": 394470 }, { "epoch": 1.02, "learning_rate": 0.0001466176405784629, "loss": 0.0084, "step": 394480 }, { "epoch": 1.02, "learning_rate": 0.00014661375236209144, "loss": 0.0112, "step": 394490 }, { "epoch": 1.02, "learning_rate": 0.00014660986414571998, "loss": 0.0109, "step": 394500 }, { "epoch": 1.02, "learning_rate": 0.0001466059759293485, "loss": 0.0112, "step": 394510 }, { "epoch": 1.02, "learning_rate": 0.00014660208771297704, "loss": 0.012, "step": 394520 }, { "epoch": 1.02, "learning_rate": 0.00014659819949660558, "loss": 0.0111, "step": 394530 }, { "epoch": 1.02, "learning_rate": 0.00014659431128023412, "loss": 0.0095, "step": 394540 }, { "epoch": 1.02, "learning_rate": 0.00014659042306386263, "loss": 0.0099, "step": 394550 }, { "epoch": 1.02, "learning_rate": 0.00014658653484749117, "loss": 0.0102, "step": 394560 }, { "epoch": 1.02, "learning_rate": 0.00014658264663111972, "loss": 0.0119, "step": 394570 }, { "epoch": 1.02, "learning_rate": 0.00014657875841474826, "loss": 0.0127, "step": 394580 }, { "epoch": 1.02, "learning_rate": 0.00014657487019837677, "loss": 0.0103, "step": 394590 }, { "epoch": 1.02, "learning_rate": 0.00014657098198200531, "loss": 0.0109, "step": 394600 }, { "epoch": 1.02, "learning_rate": 0.00014656709376563386, "loss": 0.0098, "step": 394610 }, { "epoch": 1.02, "learning_rate": 0.0001465632055492624, "loss": 0.0085, "step": 394620 }, { "epoch": 1.02, "learning_rate": 0.0001465593173328909, "loss": 0.0109, "step": 394630 }, { "epoch": 1.02, "learning_rate": 0.00014655542911651948, "loss": 0.0106, "step": 394640 }, { "epoch": 1.02, "learning_rate": 0.000146551540900148, "loss": 0.0137, "step": 394650 }, { "epoch": 1.02, "learning_rate": 0.00014654765268377654, "loss": 0.013, "step": 394660 }, { "epoch": 1.02, "learning_rate": 0.00014654376446740508, "loss": 0.0112, "step": 394670 }, { "epoch": 1.02, "learning_rate": 0.00014653987625103362, "loss": 0.0096, "step": 394680 }, { "epoch": 1.02, "learning_rate": 0.00014653598803466213, "loss": 0.0127, "step": 394690 }, { "epoch": 1.02, "learning_rate": 0.00014653209981829068, "loss": 0.0107, "step": 394700 }, { "epoch": 1.02, "learning_rate": 0.00014652821160191922, "loss": 0.0119, "step": 394710 }, { "epoch": 1.02, "learning_rate": 0.00014652432338554776, "loss": 0.018, "step": 394720 }, { "epoch": 1.02, "learning_rate": 0.00014652043516917627, "loss": 0.0127, "step": 394730 }, { "epoch": 1.02, "learning_rate": 0.00014651654695280482, "loss": 0.0165, "step": 394740 }, { "epoch": 1.02, "learning_rate": 0.00014651265873643336, "loss": 0.013, "step": 394750 }, { "epoch": 1.02, "learning_rate": 0.00014650877052006187, "loss": 0.0118, "step": 394760 }, { "epoch": 1.02, "learning_rate": 0.00014650488230369041, "loss": 0.0146, "step": 394770 }, { "epoch": 1.02, "learning_rate": 0.00014650099408731896, "loss": 0.0147, "step": 394780 }, { "epoch": 1.02, "learning_rate": 0.0001464971058709475, "loss": 0.009, "step": 394790 }, { "epoch": 1.02, "learning_rate": 0.000146493217654576, "loss": 0.0119, "step": 394800 }, { "epoch": 1.02, "learning_rate": 0.00014648932943820458, "loss": 0.0097, "step": 394810 }, { "epoch": 1.02, "learning_rate": 0.0001464854412218331, "loss": 0.0115, "step": 394820 }, { "epoch": 1.02, "learning_rate": 0.00014648155300546164, "loss": 0.0144, "step": 394830 }, { "epoch": 1.02, "learning_rate": 0.00014647766478909018, "loss": 0.0145, "step": 394840 }, { "epoch": 1.02, "learning_rate": 0.00014647377657271872, "loss": 0.0078, "step": 394850 }, { "epoch": 1.02, "learning_rate": 0.00014646988835634723, "loss": 0.0091, "step": 394860 }, { "epoch": 1.02, "learning_rate": 0.00014646600013997578, "loss": 0.0113, "step": 394870 }, { "epoch": 1.02, "learning_rate": 0.00014646211192360432, "loss": 0.0107, "step": 394880 }, { "epoch": 1.02, "learning_rate": 0.00014645822370723286, "loss": 0.0121, "step": 394890 }, { "epoch": 1.02, "learning_rate": 0.00014645433549086137, "loss": 0.0113, "step": 394900 }, { "epoch": 1.02, "learning_rate": 0.00014645044727448992, "loss": 0.0122, "step": 394910 }, { "epoch": 1.02, "learning_rate": 0.00014644655905811846, "loss": 0.0102, "step": 394920 }, { "epoch": 1.02, "learning_rate": 0.000146442670841747, "loss": 0.0107, "step": 394930 }, { "epoch": 1.02, "learning_rate": 0.0001464387826253755, "loss": 0.0129, "step": 394940 }, { "epoch": 1.02, "learning_rate": 0.00014643489440900405, "loss": 0.0101, "step": 394950 }, { "epoch": 1.02, "learning_rate": 0.0001464310061926326, "loss": 0.0158, "step": 394960 }, { "epoch": 1.02, "learning_rate": 0.00014642711797626114, "loss": 0.0127, "step": 394970 }, { "epoch": 1.02, "learning_rate": 0.00014642322975988965, "loss": 0.0098, "step": 394980 }, { "epoch": 1.02, "learning_rate": 0.0001464193415435182, "loss": 0.0129, "step": 394990 }, { "epoch": 1.02, "learning_rate": 0.00014641545332714674, "loss": 0.0121, "step": 395000 }, { "epoch": 1.02, "eval_cer": 0.8816970877754311, "eval_loss": 0.007893171161413193, "eval_runtime": 107.5146, "eval_samples_per_second": 18.602, "eval_steps_per_second": 4.651, "step": 395000 }, { "epoch": 1.02, "learning_rate": 0.00014641156511077528, "loss": 0.0108, "step": 395010 }, { "epoch": 1.02, "learning_rate": 0.00014640767689440382, "loss": 0.0098, "step": 395020 }, { "epoch": 1.02, "learning_rate": 0.00014640378867803233, "loss": 0.0089, "step": 395030 }, { "epoch": 1.02, "learning_rate": 0.00014639990046166088, "loss": 0.0092, "step": 395040 }, { "epoch": 1.02, "learning_rate": 0.00014639601224528942, "loss": 0.0132, "step": 395050 }, { "epoch": 1.02, "learning_rate": 0.00014639212402891796, "loss": 0.0141, "step": 395060 }, { "epoch": 1.02, "learning_rate": 0.00014638823581254647, "loss": 0.0105, "step": 395070 }, { "epoch": 1.02, "learning_rate": 0.00014638434759617501, "loss": 0.0146, "step": 395080 }, { "epoch": 1.02, "learning_rate": 0.00014638045937980356, "loss": 0.0109, "step": 395090 }, { "epoch": 1.02, "learning_rate": 0.0001463765711634321, "loss": 0.0114, "step": 395100 }, { "epoch": 1.02, "learning_rate": 0.0001463726829470606, "loss": 0.0095, "step": 395110 }, { "epoch": 1.02, "learning_rate": 0.00014636879473068915, "loss": 0.0136, "step": 395120 }, { "epoch": 1.02, "learning_rate": 0.0001463649065143177, "loss": 0.0113, "step": 395130 }, { "epoch": 1.02, "learning_rate": 0.00014636101829794624, "loss": 0.0118, "step": 395140 }, { "epoch": 1.02, "learning_rate": 0.00014635713008157475, "loss": 0.0162, "step": 395150 }, { "epoch": 1.02, "learning_rate": 0.00014635324186520332, "loss": 0.0162, "step": 395160 }, { "epoch": 1.02, "learning_rate": 0.00014634935364883184, "loss": 0.0122, "step": 395170 }, { "epoch": 1.02, "learning_rate": 0.00014634546543246038, "loss": 0.0096, "step": 395180 }, { "epoch": 1.02, "learning_rate": 0.00014634157721608892, "loss": 0.0144, "step": 395190 }, { "epoch": 1.02, "learning_rate": 0.00014633768899971746, "loss": 0.012, "step": 395200 }, { "epoch": 1.02, "learning_rate": 0.00014633380078334597, "loss": 0.0099, "step": 395210 }, { "epoch": 1.02, "learning_rate": 0.00014632991256697452, "loss": 0.012, "step": 395220 }, { "epoch": 1.02, "learning_rate": 0.00014632602435060306, "loss": 0.0088, "step": 395230 }, { "epoch": 1.02, "learning_rate": 0.00014632213613423157, "loss": 0.0105, "step": 395240 }, { "epoch": 1.02, "learning_rate": 0.00014631824791786011, "loss": 0.0104, "step": 395250 }, { "epoch": 1.02, "learning_rate": 0.00014631435970148866, "loss": 0.0086, "step": 395260 }, { "epoch": 1.02, "learning_rate": 0.0001463104714851172, "loss": 0.011, "step": 395270 }, { "epoch": 1.02, "learning_rate": 0.0001463065832687457, "loss": 0.0154, "step": 395280 }, { "epoch": 1.02, "learning_rate": 0.00014630269505237425, "loss": 0.0138, "step": 395290 }, { "epoch": 1.02, "learning_rate": 0.0001462988068360028, "loss": 0.0148, "step": 395300 }, { "epoch": 1.02, "learning_rate": 0.00014629491861963134, "loss": 0.0153, "step": 395310 }, { "epoch": 1.02, "learning_rate": 0.00014629103040325985, "loss": 0.0109, "step": 395320 }, { "epoch": 1.02, "learning_rate": 0.0001462871421868884, "loss": 0.0106, "step": 395330 }, { "epoch": 1.02, "learning_rate": 0.00014628325397051693, "loss": 0.0115, "step": 395340 }, { "epoch": 1.02, "learning_rate": 0.00014627936575414548, "loss": 0.0157, "step": 395350 }, { "epoch": 1.02, "learning_rate": 0.00014627547753777402, "loss": 0.0137, "step": 395360 }, { "epoch": 1.02, "learning_rate": 0.00014627158932140256, "loss": 0.0135, "step": 395370 }, { "epoch": 1.02, "learning_rate": 0.00014626770110503107, "loss": 0.0105, "step": 395380 }, { "epoch": 1.02, "learning_rate": 0.00014626381288865962, "loss": 0.0096, "step": 395390 }, { "epoch": 1.02, "learning_rate": 0.00014625992467228816, "loss": 0.0081, "step": 395400 }, { "epoch": 1.02, "learning_rate": 0.0001462560364559167, "loss": 0.0107, "step": 395410 }, { "epoch": 1.02, "learning_rate": 0.0001462521482395452, "loss": 0.0096, "step": 395420 }, { "epoch": 1.03, "learning_rate": 0.00014624826002317376, "loss": 0.0082, "step": 395430 }, { "epoch": 1.03, "learning_rate": 0.0001462443718068023, "loss": 0.0105, "step": 395440 }, { "epoch": 1.03, "learning_rate": 0.00014624048359043084, "loss": 0.0102, "step": 395450 }, { "epoch": 1.03, "learning_rate": 0.00014623659537405935, "loss": 0.0138, "step": 395460 }, { "epoch": 1.03, "learning_rate": 0.0001462327071576879, "loss": 0.0094, "step": 395470 }, { "epoch": 1.03, "learning_rate": 0.00014622881894131644, "loss": 0.0124, "step": 395480 }, { "epoch": 1.03, "learning_rate": 0.00014622493072494495, "loss": 0.0095, "step": 395490 }, { "epoch": 1.03, "learning_rate": 0.0001462210425085735, "loss": 0.0096, "step": 395500 }, { "epoch": 1.03, "learning_rate": 0.00014621715429220203, "loss": 0.0096, "step": 395510 }, { "epoch": 1.03, "learning_rate": 0.00014621326607583058, "loss": 0.0104, "step": 395520 }, { "epoch": 1.03, "learning_rate": 0.0001462093778594591, "loss": 0.0123, "step": 395530 }, { "epoch": 1.03, "learning_rate": 0.00014620548964308766, "loss": 0.0138, "step": 395540 }, { "epoch": 1.03, "learning_rate": 0.00014620160142671617, "loss": 0.0106, "step": 395550 }, { "epoch": 1.03, "learning_rate": 0.00014619771321034472, "loss": 0.0118, "step": 395560 }, { "epoch": 1.03, "learning_rate": 0.00014619382499397326, "loss": 0.014, "step": 395570 }, { "epoch": 1.03, "learning_rate": 0.0001461899367776018, "loss": 0.0106, "step": 395580 }, { "epoch": 1.03, "learning_rate": 0.0001461860485612303, "loss": 0.0107, "step": 395590 }, { "epoch": 1.03, "learning_rate": 0.00014618216034485885, "loss": 0.0124, "step": 395600 }, { "epoch": 1.03, "learning_rate": 0.0001461782721284874, "loss": 0.0123, "step": 395610 }, { "epoch": 1.03, "learning_rate": 0.00014617438391211594, "loss": 0.0106, "step": 395620 }, { "epoch": 1.03, "learning_rate": 0.00014617049569574445, "loss": 0.0124, "step": 395630 }, { "epoch": 1.03, "learning_rate": 0.000146166607479373, "loss": 0.0164, "step": 395640 }, { "epoch": 1.03, "learning_rate": 0.00014616271926300154, "loss": 0.0101, "step": 395650 }, { "epoch": 1.03, "learning_rate": 0.00014615883104663008, "loss": 0.0131, "step": 395660 }, { "epoch": 1.03, "learning_rate": 0.0001461549428302586, "loss": 0.0108, "step": 395670 }, { "epoch": 1.03, "learning_rate": 0.00014615105461388716, "loss": 0.0113, "step": 395680 }, { "epoch": 1.03, "learning_rate": 0.00014614716639751568, "loss": 0.0154, "step": 395690 }, { "epoch": 1.03, "learning_rate": 0.00014614327818114422, "loss": 0.0112, "step": 395700 }, { "epoch": 1.03, "learning_rate": 0.00014613938996477276, "loss": 0.0126, "step": 395710 }, { "epoch": 1.03, "learning_rate": 0.0001461355017484013, "loss": 0.0123, "step": 395720 }, { "epoch": 1.03, "learning_rate": 0.00014613161353202981, "loss": 0.0117, "step": 395730 }, { "epoch": 1.03, "learning_rate": 0.00014612772531565836, "loss": 0.011, "step": 395740 }, { "epoch": 1.03, "learning_rate": 0.0001461238370992869, "loss": 0.0091, "step": 395750 }, { "epoch": 1.03, "learning_rate": 0.0001461199488829154, "loss": 0.0092, "step": 395760 }, { "epoch": 1.03, "learning_rate": 0.00014611606066654395, "loss": 0.0135, "step": 395770 }, { "epoch": 1.03, "learning_rate": 0.0001461121724501725, "loss": 0.0143, "step": 395780 }, { "epoch": 1.03, "learning_rate": 0.00014610828423380104, "loss": 0.0124, "step": 395790 }, { "epoch": 1.03, "learning_rate": 0.00014610439601742955, "loss": 0.0131, "step": 395800 }, { "epoch": 1.03, "learning_rate": 0.0001461005078010581, "loss": 0.0164, "step": 395810 }, { "epoch": 1.03, "learning_rate": 0.00014609661958468664, "loss": 0.0155, "step": 395820 }, { "epoch": 1.03, "learning_rate": 0.00014609273136831518, "loss": 0.0131, "step": 395830 }, { "epoch": 1.03, "learning_rate": 0.0001460888431519437, "loss": 0.0121, "step": 395840 }, { "epoch": 1.03, "learning_rate": 0.00014608495493557223, "loss": 0.01, "step": 395850 }, { "epoch": 1.03, "learning_rate": 0.00014608106671920077, "loss": 0.0124, "step": 395860 }, { "epoch": 1.03, "learning_rate": 0.00014607717850282932, "loss": 0.0123, "step": 395870 }, { "epoch": 1.03, "learning_rate": 0.00014607329028645786, "loss": 0.01, "step": 395880 }, { "epoch": 1.03, "learning_rate": 0.0001460694020700864, "loss": 0.012, "step": 395890 }, { "epoch": 1.03, "learning_rate": 0.00014606551385371491, "loss": 0.0111, "step": 395900 }, { "epoch": 1.03, "learning_rate": 0.00014606162563734346, "loss": 0.0118, "step": 395910 }, { "epoch": 1.03, "learning_rate": 0.000146057737420972, "loss": 0.0101, "step": 395920 }, { "epoch": 1.03, "learning_rate": 0.00014605384920460054, "loss": 0.0133, "step": 395930 }, { "epoch": 1.03, "learning_rate": 0.00014604996098822905, "loss": 0.0113, "step": 395940 }, { "epoch": 1.03, "learning_rate": 0.0001460460727718576, "loss": 0.011, "step": 395950 }, { "epoch": 1.03, "learning_rate": 0.00014604218455548614, "loss": 0.0128, "step": 395960 }, { "epoch": 1.03, "learning_rate": 0.00014603829633911468, "loss": 0.0113, "step": 395970 }, { "epoch": 1.03, "learning_rate": 0.0001460344081227432, "loss": 0.0113, "step": 395980 }, { "epoch": 1.03, "learning_rate": 0.00014603051990637173, "loss": 0.011, "step": 395990 }, { "epoch": 1.03, "learning_rate": 0.00014602663169000028, "loss": 0.0115, "step": 396000 }, { "epoch": 1.03, "eval_cer": 0.8817082848709045, "eval_loss": 0.007747070398181677, "eval_runtime": 107.5107, "eval_samples_per_second": 18.603, "eval_steps_per_second": 4.651, "step": 396000 }, { "epoch": 1.03, "learning_rate": 0.0001460227434736288, "loss": 0.0157, "step": 396010 }, { "epoch": 1.03, "learning_rate": 0.00014601885525725733, "loss": 0.0104, "step": 396020 }, { "epoch": 1.03, "learning_rate": 0.00014601496704088587, "loss": 0.0117, "step": 396030 }, { "epoch": 1.03, "learning_rate": 0.00014601107882451442, "loss": 0.0098, "step": 396040 }, { "epoch": 1.03, "learning_rate": 0.00014600719060814293, "loss": 0.0116, "step": 396050 }, { "epoch": 1.03, "learning_rate": 0.0001460033023917715, "loss": 0.0115, "step": 396060 }, { "epoch": 1.03, "learning_rate": 0.0001459994141754, "loss": 0.0131, "step": 396070 }, { "epoch": 1.03, "learning_rate": 0.00014599552595902856, "loss": 0.0111, "step": 396080 }, { "epoch": 1.03, "learning_rate": 0.0001459916377426571, "loss": 0.0116, "step": 396090 }, { "epoch": 1.03, "learning_rate": 0.00014598774952628564, "loss": 0.0098, "step": 396100 }, { "epoch": 1.03, "learning_rate": 0.00014598386130991415, "loss": 0.0134, "step": 396110 }, { "epoch": 1.03, "learning_rate": 0.0001459799730935427, "loss": 0.0119, "step": 396120 }, { "epoch": 1.03, "learning_rate": 0.00014597608487717124, "loss": 0.0103, "step": 396130 }, { "epoch": 1.03, "learning_rate": 0.00014597219666079978, "loss": 0.0105, "step": 396140 }, { "epoch": 1.03, "learning_rate": 0.0001459683084444283, "loss": 0.0115, "step": 396150 }, { "epoch": 1.03, "learning_rate": 0.00014596442022805683, "loss": 0.0096, "step": 396160 }, { "epoch": 1.03, "learning_rate": 0.00014596053201168538, "loss": 0.0109, "step": 396170 }, { "epoch": 1.03, "learning_rate": 0.00014595664379531392, "loss": 0.0099, "step": 396180 }, { "epoch": 1.03, "learning_rate": 0.00014595275557894243, "loss": 0.0133, "step": 396190 }, { "epoch": 1.03, "learning_rate": 0.000145948867362571, "loss": 0.0109, "step": 396200 }, { "epoch": 1.03, "learning_rate": 0.00014594497914619952, "loss": 0.0121, "step": 396210 }, { "epoch": 1.03, "learning_rate": 0.00014594109092982806, "loss": 0.0104, "step": 396220 }, { "epoch": 1.03, "learning_rate": 0.0001459372027134566, "loss": 0.0121, "step": 396230 }, { "epoch": 1.03, "learning_rate": 0.0001459333144970851, "loss": 0.0124, "step": 396240 }, { "epoch": 1.03, "learning_rate": 0.00014592942628071365, "loss": 0.0104, "step": 396250 }, { "epoch": 1.03, "learning_rate": 0.0001459255380643422, "loss": 0.0087, "step": 396260 }, { "epoch": 1.03, "learning_rate": 0.00014592164984797074, "loss": 0.0103, "step": 396270 }, { "epoch": 1.03, "learning_rate": 0.00014591776163159925, "loss": 0.013, "step": 396280 }, { "epoch": 1.03, "learning_rate": 0.0001459138734152278, "loss": 0.0166, "step": 396290 }, { "epoch": 1.03, "learning_rate": 0.00014590998519885634, "loss": 0.0096, "step": 396300 }, { "epoch": 1.03, "learning_rate": 0.00014590609698248488, "loss": 0.0099, "step": 396310 }, { "epoch": 1.03, "learning_rate": 0.0001459022087661134, "loss": 0.0163, "step": 396320 }, { "epoch": 1.03, "learning_rate": 0.00014589832054974193, "loss": 0.0089, "step": 396330 }, { "epoch": 1.03, "learning_rate": 0.00014589443233337047, "loss": 0.0099, "step": 396340 }, { "epoch": 1.03, "learning_rate": 0.00014589054411699902, "loss": 0.0123, "step": 396350 }, { "epoch": 1.03, "learning_rate": 0.00014588665590062753, "loss": 0.0176, "step": 396360 }, { "epoch": 1.03, "learning_rate": 0.00014588276768425607, "loss": 0.0147, "step": 396370 }, { "epoch": 1.03, "learning_rate": 0.00014587887946788461, "loss": 0.0138, "step": 396380 }, { "epoch": 1.03, "learning_rate": 0.00014587499125151316, "loss": 0.01, "step": 396390 }, { "epoch": 1.03, "learning_rate": 0.0001458711030351417, "loss": 0.0144, "step": 396400 }, { "epoch": 1.03, "learning_rate": 0.00014586721481877024, "loss": 0.0104, "step": 396410 }, { "epoch": 1.03, "learning_rate": 0.00014586332660239875, "loss": 0.0119, "step": 396420 }, { "epoch": 1.03, "learning_rate": 0.0001458594383860273, "loss": 0.009, "step": 396430 }, { "epoch": 1.03, "learning_rate": 0.00014585555016965584, "loss": 0.0163, "step": 396440 }, { "epoch": 1.03, "learning_rate": 0.00014585166195328438, "loss": 0.011, "step": 396450 }, { "epoch": 1.03, "learning_rate": 0.0001458477737369129, "loss": 0.0087, "step": 396460 }, { "epoch": 1.03, "learning_rate": 0.00014584388552054143, "loss": 0.0124, "step": 396470 }, { "epoch": 1.03, "learning_rate": 0.00014583999730416998, "loss": 0.0108, "step": 396480 }, { "epoch": 1.03, "learning_rate": 0.0001458361090877985, "loss": 0.013, "step": 396490 }, { "epoch": 1.03, "learning_rate": 0.00014583222087142703, "loss": 0.0144, "step": 396500 }, { "epoch": 1.03, "learning_rate": 0.00014582833265505557, "loss": 0.0117, "step": 396510 }, { "epoch": 1.03, "learning_rate": 0.00014582444443868412, "loss": 0.0139, "step": 396520 }, { "epoch": 1.03, "learning_rate": 0.00014582055622231263, "loss": 0.0129, "step": 396530 }, { "epoch": 1.03, "learning_rate": 0.00014581666800594117, "loss": 0.0093, "step": 396540 }, { "epoch": 1.03, "learning_rate": 0.00014581277978956971, "loss": 0.0179, "step": 396550 }, { "epoch": 1.03, "learning_rate": 0.00014580889157319826, "loss": 0.0099, "step": 396560 }, { "epoch": 1.03, "learning_rate": 0.00014580500335682677, "loss": 0.0105, "step": 396570 }, { "epoch": 1.03, "learning_rate": 0.00014580111514045534, "loss": 0.011, "step": 396580 }, { "epoch": 1.03, "learning_rate": 0.00014579722692408385, "loss": 0.0115, "step": 396590 }, { "epoch": 1.03, "learning_rate": 0.0001457933387077124, "loss": 0.0117, "step": 396600 }, { "epoch": 1.03, "learning_rate": 0.00014578945049134094, "loss": 0.0092, "step": 396610 }, { "epoch": 1.03, "learning_rate": 0.00014578556227496948, "loss": 0.0098, "step": 396620 }, { "epoch": 1.03, "learning_rate": 0.000145781674058598, "loss": 0.0106, "step": 396630 }, { "epoch": 1.03, "learning_rate": 0.00014577778584222653, "loss": 0.0104, "step": 396640 }, { "epoch": 1.03, "learning_rate": 0.00014577389762585508, "loss": 0.0118, "step": 396650 }, { "epoch": 1.03, "learning_rate": 0.00014577000940948362, "loss": 0.012, "step": 396660 }, { "epoch": 1.03, "learning_rate": 0.00014576612119311213, "loss": 0.0113, "step": 396670 }, { "epoch": 1.03, "learning_rate": 0.00014576223297674067, "loss": 0.0112, "step": 396680 }, { "epoch": 1.03, "learning_rate": 0.00014575834476036922, "loss": 0.0143, "step": 396690 }, { "epoch": 1.03, "learning_rate": 0.00014575445654399776, "loss": 0.0091, "step": 396700 }, { "epoch": 1.03, "learning_rate": 0.00014575056832762627, "loss": 0.0107, "step": 396710 }, { "epoch": 1.03, "learning_rate": 0.0001457466801112548, "loss": 0.013, "step": 396720 }, { "epoch": 1.03, "learning_rate": 0.00014574279189488335, "loss": 0.0148, "step": 396730 }, { "epoch": 1.03, "learning_rate": 0.00014573890367851187, "loss": 0.0124, "step": 396740 }, { "epoch": 1.03, "learning_rate": 0.00014573501546214044, "loss": 0.0092, "step": 396750 }, { "epoch": 1.03, "learning_rate": 0.00014573112724576895, "loss": 0.0105, "step": 396760 }, { "epoch": 1.03, "learning_rate": 0.0001457272390293975, "loss": 0.0115, "step": 396770 }, { "epoch": 1.03, "learning_rate": 0.00014572335081302604, "loss": 0.009, "step": 396780 }, { "epoch": 1.03, "learning_rate": 0.00014571946259665458, "loss": 0.0101, "step": 396790 }, { "epoch": 1.03, "learning_rate": 0.0001457155743802831, "loss": 0.0116, "step": 396800 }, { "epoch": 1.03, "learning_rate": 0.00014571168616391163, "loss": 0.0097, "step": 396810 }, { "epoch": 1.03, "learning_rate": 0.00014570779794754018, "loss": 0.0093, "step": 396820 }, { "epoch": 1.03, "learning_rate": 0.00014570390973116872, "loss": 0.0121, "step": 396830 }, { "epoch": 1.03, "learning_rate": 0.00014570002151479723, "loss": 0.0094, "step": 396840 }, { "epoch": 1.03, "learning_rate": 0.00014569613329842577, "loss": 0.0161, "step": 396850 }, { "epoch": 1.03, "learning_rate": 0.00014569224508205431, "loss": 0.0121, "step": 396860 }, { "epoch": 1.03, "learning_rate": 0.00014568835686568286, "loss": 0.0141, "step": 396870 }, { "epoch": 1.03, "learning_rate": 0.00014568446864931137, "loss": 0.0156, "step": 396880 }, { "epoch": 1.03, "learning_rate": 0.0001456805804329399, "loss": 0.0107, "step": 396890 }, { "epoch": 1.03, "learning_rate": 0.00014567669221656845, "loss": 0.0145, "step": 396900 }, { "epoch": 1.03, "learning_rate": 0.000145672804000197, "loss": 0.0125, "step": 396910 }, { "epoch": 1.03, "learning_rate": 0.0001456689157838255, "loss": 0.011, "step": 396920 }, { "epoch": 1.03, "learning_rate": 0.00014566502756745408, "loss": 0.0105, "step": 396930 }, { "epoch": 1.03, "learning_rate": 0.0001456611393510826, "loss": 0.0137, "step": 396940 }, { "epoch": 1.03, "learning_rate": 0.00014565725113471114, "loss": 0.0119, "step": 396950 }, { "epoch": 1.03, "learning_rate": 0.00014565336291833968, "loss": 0.0089, "step": 396960 }, { "epoch": 1.03, "learning_rate": 0.00014564947470196822, "loss": 0.0124, "step": 396970 }, { "epoch": 1.03, "learning_rate": 0.00014564558648559673, "loss": 0.0098, "step": 396980 }, { "epoch": 1.03, "learning_rate": 0.00014564169826922527, "loss": 0.0139, "step": 396990 }, { "epoch": 1.03, "learning_rate": 0.00014563781005285382, "loss": 0.0146, "step": 397000 }, { "epoch": 1.03, "eval_cer": 0.8817628707113375, "eval_loss": 0.0079797999933362, "eval_runtime": 107.7727, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.639, "step": 397000 }, { "epoch": 1.03, "learning_rate": 0.00014563392183648233, "loss": 0.0106, "step": 397010 }, { "epoch": 1.03, "learning_rate": 0.00014563003362011087, "loss": 0.0102, "step": 397020 }, { "epoch": 1.03, "learning_rate": 0.00014562614540373941, "loss": 0.0144, "step": 397030 }, { "epoch": 1.03, "learning_rate": 0.00014562225718736796, "loss": 0.0096, "step": 397040 }, { "epoch": 1.03, "learning_rate": 0.00014561836897099647, "loss": 0.0112, "step": 397050 }, { "epoch": 1.03, "learning_rate": 0.000145614480754625, "loss": 0.0101, "step": 397060 }, { "epoch": 1.03, "learning_rate": 0.00014561059253825355, "loss": 0.0097, "step": 397070 }, { "epoch": 1.03, "learning_rate": 0.0001456067043218821, "loss": 0.0144, "step": 397080 }, { "epoch": 1.03, "learning_rate": 0.0001456028161055106, "loss": 0.0122, "step": 397090 }, { "epoch": 1.03, "learning_rate": 0.00014559892788913918, "loss": 0.0098, "step": 397100 }, { "epoch": 1.03, "learning_rate": 0.0001455950396727677, "loss": 0.0112, "step": 397110 }, { "epoch": 1.03, "learning_rate": 0.00014559115145639623, "loss": 0.0129, "step": 397120 }, { "epoch": 1.03, "learning_rate": 0.00014558726324002478, "loss": 0.0112, "step": 397130 }, { "epoch": 1.03, "learning_rate": 0.00014558337502365332, "loss": 0.0094, "step": 397140 }, { "epoch": 1.03, "learning_rate": 0.00014557948680728183, "loss": 0.0115, "step": 397150 }, { "epoch": 1.03, "learning_rate": 0.00014557559859091037, "loss": 0.0088, "step": 397160 }, { "epoch": 1.03, "learning_rate": 0.00014557171037453892, "loss": 0.0196, "step": 397170 }, { "epoch": 1.03, "learning_rate": 0.00014556782215816746, "loss": 0.0154, "step": 397180 }, { "epoch": 1.03, "learning_rate": 0.00014556393394179597, "loss": 0.0133, "step": 397190 }, { "epoch": 1.03, "learning_rate": 0.00014556004572542451, "loss": 0.0134, "step": 397200 }, { "epoch": 1.03, "learning_rate": 0.00014555615750905306, "loss": 0.0106, "step": 397210 }, { "epoch": 1.03, "learning_rate": 0.00014555226929268157, "loss": 0.0135, "step": 397220 }, { "epoch": 1.03, "learning_rate": 0.0001455483810763101, "loss": 0.0116, "step": 397230 }, { "epoch": 1.03, "learning_rate": 0.00014554449285993865, "loss": 0.0142, "step": 397240 }, { "epoch": 1.03, "learning_rate": 0.0001455406046435672, "loss": 0.0137, "step": 397250 }, { "epoch": 1.03, "learning_rate": 0.0001455367164271957, "loss": 0.0117, "step": 397260 }, { "epoch": 1.03, "learning_rate": 0.00014553282821082428, "loss": 0.0137, "step": 397270 }, { "epoch": 1.03, "learning_rate": 0.0001455289399944528, "loss": 0.0094, "step": 397280 }, { "epoch": 1.03, "learning_rate": 0.00014552505177808133, "loss": 0.012, "step": 397290 }, { "epoch": 1.03, "learning_rate": 0.00014552116356170988, "loss": 0.0093, "step": 397300 }, { "epoch": 1.03, "learning_rate": 0.00014551727534533842, "loss": 0.0125, "step": 397310 }, { "epoch": 1.03, "learning_rate": 0.00014551338712896693, "loss": 0.0097, "step": 397320 }, { "epoch": 1.03, "learning_rate": 0.00014550949891259547, "loss": 0.0096, "step": 397330 }, { "epoch": 1.03, "learning_rate": 0.00014550561069622402, "loss": 0.0122, "step": 397340 }, { "epoch": 1.03, "learning_rate": 0.00014550172247985256, "loss": 0.0096, "step": 397350 }, { "epoch": 1.03, "learning_rate": 0.00014549783426348107, "loss": 0.012, "step": 397360 }, { "epoch": 1.03, "learning_rate": 0.0001454939460471096, "loss": 0.0117, "step": 397370 }, { "epoch": 1.03, "learning_rate": 0.00014549005783073815, "loss": 0.0176, "step": 397380 }, { "epoch": 1.03, "learning_rate": 0.0001454861696143667, "loss": 0.0084, "step": 397390 }, { "epoch": 1.03, "learning_rate": 0.0001454822813979952, "loss": 0.0077, "step": 397400 }, { "epoch": 1.03, "learning_rate": 0.00014547839318162375, "loss": 0.0129, "step": 397410 }, { "epoch": 1.03, "learning_rate": 0.0001454745049652523, "loss": 0.0118, "step": 397420 }, { "epoch": 1.03, "learning_rate": 0.00014547061674888084, "loss": 0.0101, "step": 397430 }, { "epoch": 1.03, "learning_rate": 0.00014546672853250935, "loss": 0.0123, "step": 397440 }, { "epoch": 1.03, "learning_rate": 0.00014546284031613792, "loss": 0.0196, "step": 397450 }, { "epoch": 1.03, "learning_rate": 0.00014545895209976643, "loss": 0.0125, "step": 397460 }, { "epoch": 1.03, "learning_rate": 0.00014545506388339498, "loss": 0.0099, "step": 397470 }, { "epoch": 1.03, "learning_rate": 0.00014545117566702352, "loss": 0.0095, "step": 397480 }, { "epoch": 1.03, "learning_rate": 0.00014544728745065203, "loss": 0.0112, "step": 397490 }, { "epoch": 1.03, "learning_rate": 0.00014544339923428057, "loss": 0.0139, "step": 397500 }, { "epoch": 1.03, "learning_rate": 0.00014543951101790911, "loss": 0.0115, "step": 397510 }, { "epoch": 1.03, "learning_rate": 0.00014543562280153766, "loss": 0.0089, "step": 397520 }, { "epoch": 1.03, "learning_rate": 0.00014543173458516617, "loss": 0.0081, "step": 397530 }, { "epoch": 1.03, "learning_rate": 0.0001454278463687947, "loss": 0.0097, "step": 397540 }, { "epoch": 1.03, "learning_rate": 0.00014542395815242325, "loss": 0.0095, "step": 397550 }, { "epoch": 1.03, "learning_rate": 0.0001454200699360518, "loss": 0.0124, "step": 397560 }, { "epoch": 1.03, "learning_rate": 0.0001454161817196803, "loss": 0.0132, "step": 397570 }, { "epoch": 1.03, "learning_rate": 0.00014541229350330885, "loss": 0.0108, "step": 397580 }, { "epoch": 1.03, "learning_rate": 0.0001454084052869374, "loss": 0.0162, "step": 397590 }, { "epoch": 1.03, "learning_rate": 0.00014540451707056594, "loss": 0.0102, "step": 397600 }, { "epoch": 1.03, "learning_rate": 0.00014540062885419445, "loss": 0.0128, "step": 397610 }, { "epoch": 1.03, "learning_rate": 0.00014539674063782302, "loss": 0.0097, "step": 397620 }, { "epoch": 1.03, "learning_rate": 0.00014539285242145153, "loss": 0.0111, "step": 397630 }, { "epoch": 1.03, "learning_rate": 0.00014538896420508007, "loss": 0.0123, "step": 397640 }, { "epoch": 1.03, "learning_rate": 0.00014538507598870862, "loss": 0.0124, "step": 397650 }, { "epoch": 1.03, "learning_rate": 0.00014538118777233716, "loss": 0.0096, "step": 397660 }, { "epoch": 1.03, "learning_rate": 0.00014537729955596567, "loss": 0.0093, "step": 397670 }, { "epoch": 1.03, "learning_rate": 0.00014537341133959421, "loss": 0.0138, "step": 397680 }, { "epoch": 1.03, "learning_rate": 0.00014536952312322276, "loss": 0.0126, "step": 397690 }, { "epoch": 1.03, "learning_rate": 0.0001453656349068513, "loss": 0.0122, "step": 397700 }, { "epoch": 1.03, "learning_rate": 0.0001453617466904798, "loss": 0.0137, "step": 397710 }, { "epoch": 1.03, "learning_rate": 0.00014535785847410835, "loss": 0.0134, "step": 397720 }, { "epoch": 1.03, "learning_rate": 0.0001453539702577369, "loss": 0.0135, "step": 397730 }, { "epoch": 1.03, "learning_rate": 0.0001453500820413654, "loss": 0.0128, "step": 397740 }, { "epoch": 1.03, "learning_rate": 0.00014534619382499395, "loss": 0.0118, "step": 397750 }, { "epoch": 1.03, "learning_rate": 0.0001453423056086225, "loss": 0.0126, "step": 397760 }, { "epoch": 1.03, "learning_rate": 0.00014533841739225103, "loss": 0.0146, "step": 397770 }, { "epoch": 1.03, "learning_rate": 0.00014533452917587955, "loss": 0.014, "step": 397780 }, { "epoch": 1.03, "learning_rate": 0.00014533064095950812, "loss": 0.0128, "step": 397790 }, { "epoch": 1.03, "learning_rate": 0.00014532675274313663, "loss": 0.012, "step": 397800 }, { "epoch": 1.03, "learning_rate": 0.00014532286452676517, "loss": 0.015, "step": 397810 }, { "epoch": 1.03, "learning_rate": 0.00014531897631039372, "loss": 0.0157, "step": 397820 }, { "epoch": 1.03, "learning_rate": 0.00014531508809402226, "loss": 0.0113, "step": 397830 }, { "epoch": 1.03, "learning_rate": 0.00014531119987765077, "loss": 0.0119, "step": 397840 }, { "epoch": 1.03, "learning_rate": 0.00014530731166127931, "loss": 0.0112, "step": 397850 }, { "epoch": 1.03, "learning_rate": 0.00014530342344490786, "loss": 0.0115, "step": 397860 }, { "epoch": 1.03, "learning_rate": 0.0001452995352285364, "loss": 0.013, "step": 397870 }, { "epoch": 1.03, "learning_rate": 0.0001452956470121649, "loss": 0.0126, "step": 397880 }, { "epoch": 1.03, "learning_rate": 0.00014529175879579345, "loss": 0.012, "step": 397890 }, { "epoch": 1.03, "learning_rate": 0.000145287870579422, "loss": 0.01, "step": 397900 }, { "epoch": 1.03, "learning_rate": 0.00014528398236305054, "loss": 0.0119, "step": 397910 }, { "epoch": 1.03, "learning_rate": 0.00014528009414667905, "loss": 0.0125, "step": 397920 }, { "epoch": 1.03, "learning_rate": 0.0001452762059303076, "loss": 0.0115, "step": 397930 }, { "epoch": 1.03, "learning_rate": 0.00014527231771393613, "loss": 0.0134, "step": 397940 }, { "epoch": 1.03, "learning_rate": 0.00014526842949756468, "loss": 0.0112, "step": 397950 }, { "epoch": 1.03, "learning_rate": 0.0001452645412811932, "loss": 0.0109, "step": 397960 }, { "epoch": 1.03, "learning_rate": 0.00014526065306482173, "loss": 0.0136, "step": 397970 }, { "epoch": 1.03, "learning_rate": 0.00014525676484845027, "loss": 0.0115, "step": 397980 }, { "epoch": 1.03, "learning_rate": 0.00014525287663207882, "loss": 0.0101, "step": 397990 }, { "epoch": 1.03, "learning_rate": 0.00014524898841570736, "loss": 0.012, "step": 398000 }, { "epoch": 1.03, "eval_cer": 0.8816830914060892, "eval_loss": 0.007515719626098871, "eval_runtime": 107.6857, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 398000 }, { "epoch": 1.03, "learning_rate": 0.00014524510019933587, "loss": 0.0112, "step": 398010 }, { "epoch": 1.03, "learning_rate": 0.0001452412119829644, "loss": 0.01, "step": 398020 }, { "epoch": 1.03, "learning_rate": 0.00014523732376659295, "loss": 0.0098, "step": 398030 }, { "epoch": 1.03, "learning_rate": 0.0001452334355502215, "loss": 0.0124, "step": 398040 }, { "epoch": 1.03, "learning_rate": 0.00014522954733385, "loss": 0.011, "step": 398050 }, { "epoch": 1.03, "learning_rate": 0.00014522565911747855, "loss": 0.0139, "step": 398060 }, { "epoch": 1.03, "learning_rate": 0.0001452217709011071, "loss": 0.0128, "step": 398070 }, { "epoch": 1.03, "learning_rate": 0.00014521788268473564, "loss": 0.011, "step": 398080 }, { "epoch": 1.03, "learning_rate": 0.00014521399446836415, "loss": 0.0109, "step": 398090 }, { "epoch": 1.03, "learning_rate": 0.0001452101062519927, "loss": 0.0123, "step": 398100 }, { "epoch": 1.03, "learning_rate": 0.00014520621803562123, "loss": 0.0112, "step": 398110 }, { "epoch": 1.03, "learning_rate": 0.00014520232981924978, "loss": 0.0102, "step": 398120 }, { "epoch": 1.03, "learning_rate": 0.0001451984416028783, "loss": 0.0119, "step": 398130 }, { "epoch": 1.03, "learning_rate": 0.00014519455338650686, "loss": 0.0142, "step": 398140 }, { "epoch": 1.03, "learning_rate": 0.00014519066517013537, "loss": 0.0117, "step": 398150 }, { "epoch": 1.03, "learning_rate": 0.00014518677695376391, "loss": 0.0111, "step": 398160 }, { "epoch": 1.03, "learning_rate": 0.00014518288873739246, "loss": 0.011, "step": 398170 }, { "epoch": 1.03, "learning_rate": 0.000145179000521021, "loss": 0.0106, "step": 398180 }, { "epoch": 1.03, "learning_rate": 0.0001451751123046495, "loss": 0.0127, "step": 398190 }, { "epoch": 1.03, "learning_rate": 0.00014517122408827805, "loss": 0.0103, "step": 398200 }, { "epoch": 1.03, "learning_rate": 0.0001451673358719066, "loss": 0.0116, "step": 398210 }, { "epoch": 1.03, "learning_rate": 0.0001451634476555351, "loss": 0.0123, "step": 398220 }, { "epoch": 1.03, "learning_rate": 0.00014515955943916365, "loss": 0.0099, "step": 398230 }, { "epoch": 1.03, "learning_rate": 0.0001451556712227922, "loss": 0.0111, "step": 398240 }, { "epoch": 1.03, "learning_rate": 0.00014515178300642074, "loss": 0.0095, "step": 398250 }, { "epoch": 1.03, "learning_rate": 0.00014514789479004925, "loss": 0.0118, "step": 398260 }, { "epoch": 1.03, "learning_rate": 0.0001451440065736778, "loss": 0.0091, "step": 398270 }, { "epoch": 1.03, "learning_rate": 0.00014514011835730633, "loss": 0.0126, "step": 398280 }, { "epoch": 1.03, "learning_rate": 0.00014513623014093487, "loss": 0.0106, "step": 398290 }, { "epoch": 1.03, "learning_rate": 0.0001451323419245634, "loss": 0.0129, "step": 398300 }, { "epoch": 1.03, "learning_rate": 0.00014512845370819193, "loss": 0.0118, "step": 398310 }, { "epoch": 1.03, "learning_rate": 0.00014512456549182047, "loss": 0.0117, "step": 398320 }, { "epoch": 1.03, "learning_rate": 0.00014512067727544901, "loss": 0.0117, "step": 398330 }, { "epoch": 1.03, "learning_rate": 0.00014511678905907756, "loss": 0.0087, "step": 398340 }, { "epoch": 1.03, "learning_rate": 0.0001451129008427061, "loss": 0.0086, "step": 398350 }, { "epoch": 1.03, "learning_rate": 0.0001451090126263346, "loss": 0.0119, "step": 398360 }, { "epoch": 1.03, "learning_rate": 0.00014510512440996315, "loss": 0.0105, "step": 398370 }, { "epoch": 1.03, "learning_rate": 0.0001451012361935917, "loss": 0.0115, "step": 398380 }, { "epoch": 1.03, "learning_rate": 0.00014509734797722024, "loss": 0.0101, "step": 398390 }, { "epoch": 1.03, "learning_rate": 0.00014509345976084875, "loss": 0.0126, "step": 398400 }, { "epoch": 1.03, "learning_rate": 0.0001450895715444773, "loss": 0.0085, "step": 398410 }, { "epoch": 1.03, "learning_rate": 0.00014508568332810583, "loss": 0.0099, "step": 398420 }, { "epoch": 1.03, "learning_rate": 0.00014508179511173438, "loss": 0.0108, "step": 398430 }, { "epoch": 1.03, "learning_rate": 0.0001450779068953629, "loss": 0.0113, "step": 398440 }, { "epoch": 1.03, "learning_rate": 0.00014507401867899143, "loss": 0.0125, "step": 398450 }, { "epoch": 1.03, "learning_rate": 0.00014507013046261997, "loss": 0.0106, "step": 398460 }, { "epoch": 1.03, "learning_rate": 0.0001450662422462485, "loss": 0.0104, "step": 398470 }, { "epoch": 1.03, "learning_rate": 0.00014506235402987703, "loss": 0.012, "step": 398480 }, { "epoch": 1.03, "learning_rate": 0.00014505846581350557, "loss": 0.0142, "step": 398490 }, { "epoch": 1.03, "learning_rate": 0.0001450545775971341, "loss": 0.0114, "step": 398500 }, { "epoch": 1.03, "learning_rate": 0.00014505068938076263, "loss": 0.0119, "step": 398510 }, { "epoch": 1.03, "learning_rate": 0.0001450468011643912, "loss": 0.0121, "step": 398520 }, { "epoch": 1.03, "learning_rate": 0.0001450429129480197, "loss": 0.0113, "step": 398530 }, { "epoch": 1.03, "learning_rate": 0.00014503902473164825, "loss": 0.0129, "step": 398540 }, { "epoch": 1.03, "learning_rate": 0.0001450351365152768, "loss": 0.0125, "step": 398550 }, { "epoch": 1.03, "learning_rate": 0.00014503124829890534, "loss": 0.0099, "step": 398560 }, { "epoch": 1.03, "learning_rate": 0.00014502736008253385, "loss": 0.0119, "step": 398570 }, { "epoch": 1.03, "learning_rate": 0.0001450234718661624, "loss": 0.0142, "step": 398580 }, { "epoch": 1.03, "learning_rate": 0.00014501958364979093, "loss": 0.01, "step": 398590 }, { "epoch": 1.03, "learning_rate": 0.00014501569543341948, "loss": 0.0131, "step": 398600 }, { "epoch": 1.03, "learning_rate": 0.000145011807217048, "loss": 0.0131, "step": 398610 }, { "epoch": 1.03, "learning_rate": 0.00014500791900067653, "loss": 0.0114, "step": 398620 }, { "epoch": 1.03, "learning_rate": 0.00014500403078430507, "loss": 0.0114, "step": 398630 }, { "epoch": 1.03, "learning_rate": 0.00014500014256793362, "loss": 0.0098, "step": 398640 }, { "epoch": 1.03, "learning_rate": 0.00014499625435156213, "loss": 0.0133, "step": 398650 }, { "epoch": 1.03, "learning_rate": 0.0001449923661351907, "loss": 0.013, "step": 398660 }, { "epoch": 1.03, "learning_rate": 0.0001449884779188192, "loss": 0.0106, "step": 398670 }, { "epoch": 1.03, "learning_rate": 0.00014498458970244775, "loss": 0.0123, "step": 398680 }, { "epoch": 1.03, "learning_rate": 0.0001449807014860763, "loss": 0.0089, "step": 398690 }, { "epoch": 1.03, "learning_rate": 0.00014497681326970484, "loss": 0.0132, "step": 398700 }, { "epoch": 1.03, "learning_rate": 0.00014497292505333335, "loss": 0.0186, "step": 398710 }, { "epoch": 1.03, "learning_rate": 0.0001449690368369619, "loss": 0.0115, "step": 398720 }, { "epoch": 1.03, "learning_rate": 0.00014496514862059044, "loss": 0.0127, "step": 398730 }, { "epoch": 1.03, "learning_rate": 0.00014496126040421895, "loss": 0.011, "step": 398740 }, { "epoch": 1.03, "learning_rate": 0.0001449573721878475, "loss": 0.0147, "step": 398750 }, { "epoch": 1.03, "learning_rate": 0.00014495348397147603, "loss": 0.0105, "step": 398760 }, { "epoch": 1.03, "learning_rate": 0.00014494959575510458, "loss": 0.0102, "step": 398770 }, { "epoch": 1.03, "learning_rate": 0.0001449457075387331, "loss": 0.0102, "step": 398780 }, { "epoch": 1.03, "learning_rate": 0.00014494181932236163, "loss": 0.0085, "step": 398790 }, { "epoch": 1.03, "learning_rate": 0.00014493793110599017, "loss": 0.0149, "step": 398800 }, { "epoch": 1.03, "learning_rate": 0.00014493404288961871, "loss": 0.0146, "step": 398810 }, { "epoch": 1.03, "learning_rate": 0.00014493015467324723, "loss": 0.0116, "step": 398820 }, { "epoch": 1.03, "learning_rate": 0.00014492626645687577, "loss": 0.01, "step": 398830 }, { "epoch": 1.03, "learning_rate": 0.0001449223782405043, "loss": 0.0092, "step": 398840 }, { "epoch": 1.03, "learning_rate": 0.00014491849002413285, "loss": 0.0131, "step": 398850 }, { "epoch": 1.03, "learning_rate": 0.0001449146018077614, "loss": 0.0103, "step": 398860 }, { "epoch": 1.03, "learning_rate": 0.00014491071359138994, "loss": 0.0171, "step": 398870 }, { "epoch": 1.03, "learning_rate": 0.00014490682537501845, "loss": 0.0115, "step": 398880 }, { "epoch": 1.03, "learning_rate": 0.000144902937158647, "loss": 0.012, "step": 398890 }, { "epoch": 1.03, "learning_rate": 0.00014489904894227554, "loss": 0.0137, "step": 398900 }, { "epoch": 1.03, "learning_rate": 0.00014489516072590408, "loss": 0.0117, "step": 398910 }, { "epoch": 1.03, "learning_rate": 0.0001448912725095326, "loss": 0.0114, "step": 398920 }, { "epoch": 1.03, "learning_rate": 0.00014488738429316113, "loss": 0.0101, "step": 398930 }, { "epoch": 1.03, "learning_rate": 0.00014488349607678967, "loss": 0.0084, "step": 398940 }, { "epoch": 1.03, "learning_rate": 0.00014487960786041822, "loss": 0.011, "step": 398950 }, { "epoch": 1.03, "learning_rate": 0.00014487571964404673, "loss": 0.0117, "step": 398960 }, { "epoch": 1.03, "learning_rate": 0.00014487183142767527, "loss": 0.012, "step": 398970 }, { "epoch": 1.03, "learning_rate": 0.00014486794321130381, "loss": 0.013, "step": 398980 }, { "epoch": 1.03, "learning_rate": 0.00014486405499493233, "loss": 0.0093, "step": 398990 }, { "epoch": 1.03, "learning_rate": 0.00014486016677856087, "loss": 0.0127, "step": 399000 }, { "epoch": 1.03, "eval_cer": 0.881688689953826, "eval_loss": 0.00787573866546154, "eval_runtime": 107.4938, "eval_samples_per_second": 18.606, "eval_steps_per_second": 4.651, "step": 399000 }, { "epoch": 1.03, "learning_rate": 0.0001448562785621894, "loss": 0.01, "step": 399010 }, { "epoch": 1.03, "learning_rate": 0.00014485239034581795, "loss": 0.0104, "step": 399020 }, { "epoch": 1.03, "learning_rate": 0.00014484850212944647, "loss": 0.0176, "step": 399030 }, { "epoch": 1.03, "learning_rate": 0.00014484461391307504, "loss": 0.0113, "step": 399040 }, { "epoch": 1.03, "learning_rate": 0.00014484072569670355, "loss": 0.0124, "step": 399050 }, { "epoch": 1.03, "learning_rate": 0.0001448368374803321, "loss": 0.0111, "step": 399060 }, { "epoch": 1.03, "learning_rate": 0.00014483294926396063, "loss": 0.0093, "step": 399070 }, { "epoch": 1.03, "learning_rate": 0.00014482906104758918, "loss": 0.0124, "step": 399080 }, { "epoch": 1.03, "learning_rate": 0.0001448251728312177, "loss": 0.0113, "step": 399090 }, { "epoch": 1.03, "learning_rate": 0.00014482128461484623, "loss": 0.0114, "step": 399100 }, { "epoch": 1.03, "learning_rate": 0.00014481739639847477, "loss": 0.0141, "step": 399110 }, { "epoch": 1.03, "learning_rate": 0.00014481350818210332, "loss": 0.0202, "step": 399120 }, { "epoch": 1.03, "learning_rate": 0.00014480961996573183, "loss": 0.0132, "step": 399130 }, { "epoch": 1.03, "learning_rate": 0.00014480573174936037, "loss": 0.017, "step": 399140 }, { "epoch": 1.03, "learning_rate": 0.0001448018435329889, "loss": 0.0103, "step": 399150 }, { "epoch": 1.03, "learning_rate": 0.00014479795531661746, "loss": 0.0122, "step": 399160 }, { "epoch": 1.03, "learning_rate": 0.00014479406710024597, "loss": 0.0123, "step": 399170 }, { "epoch": 1.03, "learning_rate": 0.0001447901788838745, "loss": 0.0104, "step": 399180 }, { "epoch": 1.03, "learning_rate": 0.00014478629066750305, "loss": 0.0118, "step": 399190 }, { "epoch": 1.03, "learning_rate": 0.0001447824024511316, "loss": 0.0107, "step": 399200 }, { "epoch": 1.03, "learning_rate": 0.00014477851423476014, "loss": 0.0094, "step": 399210 }, { "epoch": 1.03, "learning_rate": 0.00014477462601838865, "loss": 0.0131, "step": 399220 }, { "epoch": 1.03, "learning_rate": 0.0001447707378020172, "loss": 0.0133, "step": 399230 }, { "epoch": 1.03, "learning_rate": 0.00014476684958564573, "loss": 0.0155, "step": 399240 }, { "epoch": 1.03, "learning_rate": 0.00014476296136927428, "loss": 0.0128, "step": 399250 }, { "epoch": 1.03, "learning_rate": 0.0001447590731529028, "loss": 0.0135, "step": 399260 }, { "epoch": 1.03, "learning_rate": 0.00014475518493653133, "loss": 0.0159, "step": 399270 }, { "epoch": 1.03, "learning_rate": 0.00014475129672015987, "loss": 0.0115, "step": 399280 }, { "epoch": 1.04, "learning_rate": 0.00014474740850378841, "loss": 0.0098, "step": 399290 }, { "epoch": 1.04, "learning_rate": 0.00014474352028741693, "loss": 0.0088, "step": 399300 }, { "epoch": 1.04, "learning_rate": 0.00014473963207104547, "loss": 0.0103, "step": 399310 }, { "epoch": 1.04, "learning_rate": 0.000144735743854674, "loss": 0.0176, "step": 399320 }, { "epoch": 1.04, "learning_rate": 0.00014473185563830255, "loss": 0.0124, "step": 399330 }, { "epoch": 1.04, "learning_rate": 0.00014472796742193107, "loss": 0.0111, "step": 399340 }, { "epoch": 1.04, "learning_rate": 0.0001447240792055596, "loss": 0.0118, "step": 399350 }, { "epoch": 1.04, "learning_rate": 0.00014472019098918815, "loss": 0.0105, "step": 399360 }, { "epoch": 1.04, "learning_rate": 0.0001447163027728167, "loss": 0.0116, "step": 399370 }, { "epoch": 1.04, "learning_rate": 0.00014471241455644524, "loss": 0.0103, "step": 399380 }, { "epoch": 1.04, "learning_rate": 0.00014470852634007378, "loss": 0.0112, "step": 399390 }, { "epoch": 1.04, "learning_rate": 0.0001447046381237023, "loss": 0.012, "step": 399400 }, { "epoch": 1.04, "learning_rate": 0.00014470074990733083, "loss": 0.0118, "step": 399410 }, { "epoch": 1.04, "learning_rate": 0.00014469686169095937, "loss": 0.0126, "step": 399420 }, { "epoch": 1.04, "learning_rate": 0.00014469297347458792, "loss": 0.0105, "step": 399430 }, { "epoch": 1.04, "learning_rate": 0.00014468908525821643, "loss": 0.0108, "step": 399440 }, { "epoch": 1.04, "learning_rate": 0.00014468519704184497, "loss": 0.0112, "step": 399450 }, { "epoch": 1.04, "learning_rate": 0.00014468130882547351, "loss": 0.0143, "step": 399460 }, { "epoch": 1.04, "learning_rate": 0.00014467742060910203, "loss": 0.0185, "step": 399470 }, { "epoch": 1.04, "learning_rate": 0.00014467353239273057, "loss": 0.0149, "step": 399480 }, { "epoch": 1.04, "learning_rate": 0.0001446696441763591, "loss": 0.0129, "step": 399490 }, { "epoch": 1.04, "learning_rate": 0.00014466575595998765, "loss": 0.0111, "step": 399500 }, { "epoch": 1.04, "learning_rate": 0.00014466186774361617, "loss": 0.0136, "step": 399510 }, { "epoch": 1.04, "learning_rate": 0.0001446579795272447, "loss": 0.0133, "step": 399520 }, { "epoch": 1.04, "learning_rate": 0.00014465409131087325, "loss": 0.0121, "step": 399530 }, { "epoch": 1.04, "learning_rate": 0.0001446502030945018, "loss": 0.0173, "step": 399540 }, { "epoch": 1.04, "learning_rate": 0.0001446463148781303, "loss": 0.0133, "step": 399550 }, { "epoch": 1.04, "learning_rate": 0.00014464242666175888, "loss": 0.0104, "step": 399560 }, { "epoch": 1.04, "learning_rate": 0.0001446385384453874, "loss": 0.0134, "step": 399570 }, { "epoch": 1.04, "learning_rate": 0.00014463465022901593, "loss": 0.0093, "step": 399580 }, { "epoch": 1.04, "learning_rate": 0.00014463076201264447, "loss": 0.0128, "step": 399590 }, { "epoch": 1.04, "learning_rate": 0.00014462687379627302, "loss": 0.0131, "step": 399600 }, { "epoch": 1.04, "learning_rate": 0.00014462298557990153, "loss": 0.0138, "step": 399610 }, { "epoch": 1.04, "learning_rate": 0.00014461909736353007, "loss": 0.0101, "step": 399620 }, { "epoch": 1.04, "learning_rate": 0.00014461520914715861, "loss": 0.0103, "step": 399630 }, { "epoch": 1.04, "learning_rate": 0.00014461132093078716, "loss": 0.0118, "step": 399640 }, { "epoch": 1.04, "learning_rate": 0.00014460743271441567, "loss": 0.0117, "step": 399650 }, { "epoch": 1.04, "learning_rate": 0.0001446035444980442, "loss": 0.013, "step": 399660 }, { "epoch": 1.04, "learning_rate": 0.00014459965628167275, "loss": 0.0128, "step": 399670 }, { "epoch": 1.04, "learning_rate": 0.0001445957680653013, "loss": 0.0114, "step": 399680 }, { "epoch": 1.04, "learning_rate": 0.0001445918798489298, "loss": 0.0102, "step": 399690 }, { "epoch": 1.04, "learning_rate": 0.00014458799163255835, "loss": 0.0138, "step": 399700 }, { "epoch": 1.04, "learning_rate": 0.0001445841034161869, "loss": 0.0111, "step": 399710 }, { "epoch": 1.04, "learning_rate": 0.0001445802151998154, "loss": 0.0146, "step": 399720 }, { "epoch": 1.04, "learning_rate": 0.00014457632698344398, "loss": 0.0144, "step": 399730 }, { "epoch": 1.04, "learning_rate": 0.0001445724387670725, "loss": 0.0138, "step": 399740 }, { "epoch": 1.04, "learning_rate": 0.00014456855055070103, "loss": 0.0107, "step": 399750 }, { "epoch": 1.04, "learning_rate": 0.00014456466233432957, "loss": 0.0125, "step": 399760 }, { "epoch": 1.04, "learning_rate": 0.00014456077411795812, "loss": 0.0122, "step": 399770 }, { "epoch": 1.04, "learning_rate": 0.00014455688590158663, "loss": 0.0127, "step": 399780 }, { "epoch": 1.04, "learning_rate": 0.00014455299768521517, "loss": 0.009, "step": 399790 }, { "epoch": 1.04, "learning_rate": 0.0001445491094688437, "loss": 0.0102, "step": 399800 }, { "epoch": 1.04, "learning_rate": 0.00014454522125247225, "loss": 0.0122, "step": 399810 }, { "epoch": 1.04, "learning_rate": 0.00014454133303610077, "loss": 0.0112, "step": 399820 }, { "epoch": 1.04, "learning_rate": 0.0001445374448197293, "loss": 0.0138, "step": 399830 }, { "epoch": 1.04, "learning_rate": 0.00014453355660335785, "loss": 0.0135, "step": 399840 }, { "epoch": 1.04, "learning_rate": 0.0001445296683869864, "loss": 0.0162, "step": 399850 }, { "epoch": 1.04, "learning_rate": 0.0001445257801706149, "loss": 0.0101, "step": 399860 }, { "epoch": 1.04, "learning_rate": 0.00014452189195424345, "loss": 0.0126, "step": 399870 }, { "epoch": 1.04, "learning_rate": 0.000144518003737872, "loss": 0.0135, "step": 399880 }, { "epoch": 1.04, "learning_rate": 0.00014451411552150053, "loss": 0.0116, "step": 399890 }, { "epoch": 1.04, "learning_rate": 0.00014451022730512905, "loss": 0.0154, "step": 399900 }, { "epoch": 1.04, "learning_rate": 0.00014450633908875762, "loss": 0.0142, "step": 399910 }, { "epoch": 1.04, "learning_rate": 0.00014450245087238613, "loss": 0.0149, "step": 399920 }, { "epoch": 1.04, "learning_rate": 0.00014449856265601467, "loss": 0.0517, "step": 399930 }, { "epoch": 1.04, "learning_rate": 0.00014449467443964321, "loss": 0.0142, "step": 399940 }, { "epoch": 1.04, "learning_rate": 0.00014449078622327173, "loss": 0.0147, "step": 399950 }, { "epoch": 1.04, "learning_rate": 0.00014448689800690027, "loss": 0.0106, "step": 399960 }, { "epoch": 1.04, "learning_rate": 0.0001444830097905288, "loss": 0.0115, "step": 399970 }, { "epoch": 1.04, "learning_rate": 0.00014447912157415735, "loss": 0.0116, "step": 399980 }, { "epoch": 1.04, "learning_rate": 0.00014447523335778587, "loss": 0.0112, "step": 399990 }, { "epoch": 1.04, "learning_rate": 0.0001444713451414144, "loss": 0.0136, "step": 400000 }, { "epoch": 1.04, "eval_cer": 0.8816774928583525, "eval_loss": 0.007727402728050947, "eval_runtime": 107.7237, "eval_samples_per_second": 18.566, "eval_steps_per_second": 4.642, "step": 400000 }, { "epoch": 1.04, "learning_rate": 0.00014446745692504295, "loss": 0.0131, "step": 400010 }, { "epoch": 1.04, "learning_rate": 0.0001444635687086715, "loss": 0.0137, "step": 400020 }, { "epoch": 1.04, "learning_rate": 0.0001444596804923, "loss": 0.0108, "step": 400030 }, { "epoch": 1.04, "learning_rate": 0.00014445579227592855, "loss": 0.0106, "step": 400040 }, { "epoch": 1.04, "learning_rate": 0.0001444519040595571, "loss": 0.0098, "step": 400050 }, { "epoch": 1.04, "learning_rate": 0.00014444801584318563, "loss": 0.0097, "step": 400060 }, { "epoch": 1.04, "learning_rate": 0.00014444412762681415, "loss": 0.0143, "step": 400070 }, { "epoch": 1.04, "learning_rate": 0.00014444023941044272, "loss": 0.0122, "step": 400080 }, { "epoch": 1.04, "learning_rate": 0.00014443635119407123, "loss": 0.0131, "step": 400090 }, { "epoch": 1.04, "learning_rate": 0.00014443246297769977, "loss": 0.0135, "step": 400100 }, { "epoch": 1.04, "learning_rate": 0.00014442857476132831, "loss": 0.0105, "step": 400110 }, { "epoch": 1.04, "learning_rate": 0.00014442468654495686, "loss": 0.0139, "step": 400120 }, { "epoch": 1.04, "learning_rate": 0.00014442079832858537, "loss": 0.0162, "step": 400130 }, { "epoch": 1.04, "learning_rate": 0.0001444169101122139, "loss": 0.0137, "step": 400140 }, { "epoch": 1.04, "learning_rate": 0.00014441302189584245, "loss": 0.0119, "step": 400150 }, { "epoch": 1.04, "learning_rate": 0.000144409133679471, "loss": 0.0113, "step": 400160 }, { "epoch": 1.04, "learning_rate": 0.0001444052454630995, "loss": 0.0127, "step": 400170 }, { "epoch": 1.04, "learning_rate": 0.00014440135724672805, "loss": 0.0168, "step": 400180 }, { "epoch": 1.04, "learning_rate": 0.0001443974690303566, "loss": 0.0116, "step": 400190 }, { "epoch": 1.04, "learning_rate": 0.0001443935808139851, "loss": 0.011, "step": 400200 }, { "epoch": 1.04, "learning_rate": 0.00014438969259761365, "loss": 0.0097, "step": 400210 }, { "epoch": 1.04, "learning_rate": 0.0001443858043812422, "loss": 0.012, "step": 400220 }, { "epoch": 1.04, "learning_rate": 0.00014438191616487073, "loss": 0.0111, "step": 400230 }, { "epoch": 1.04, "learning_rate": 0.00014437802794849925, "loss": 0.0112, "step": 400240 }, { "epoch": 1.04, "learning_rate": 0.00014437413973212782, "loss": 0.0092, "step": 400250 }, { "epoch": 1.04, "learning_rate": 0.00014437025151575633, "loss": 0.0112, "step": 400260 }, { "epoch": 1.04, "learning_rate": 0.00014436636329938487, "loss": 0.015, "step": 400270 }, { "epoch": 1.04, "learning_rate": 0.00014436247508301341, "loss": 0.0114, "step": 400280 }, { "epoch": 1.04, "learning_rate": 0.00014435858686664196, "loss": 0.0124, "step": 400290 }, { "epoch": 1.04, "learning_rate": 0.00014435469865027047, "loss": 0.0116, "step": 400300 }, { "epoch": 1.04, "learning_rate": 0.000144350810433899, "loss": 0.0166, "step": 400310 }, { "epoch": 1.04, "learning_rate": 0.00014434692221752755, "loss": 0.0101, "step": 400320 }, { "epoch": 1.04, "learning_rate": 0.0001443430340011561, "loss": 0.0121, "step": 400330 }, { "epoch": 1.04, "learning_rate": 0.0001443391457847846, "loss": 0.0088, "step": 400340 }, { "epoch": 1.04, "learning_rate": 0.00014433525756841315, "loss": 0.0091, "step": 400350 }, { "epoch": 1.04, "learning_rate": 0.0001443313693520417, "loss": 0.0121, "step": 400360 }, { "epoch": 1.04, "learning_rate": 0.00014432748113567023, "loss": 0.0117, "step": 400370 }, { "epoch": 1.04, "learning_rate": 0.00014432359291929875, "loss": 0.0122, "step": 400380 }, { "epoch": 1.04, "learning_rate": 0.0001443197047029273, "loss": 0.0096, "step": 400390 }, { "epoch": 1.04, "learning_rate": 0.00014431581648655583, "loss": 0.0109, "step": 400400 }, { "epoch": 1.04, "learning_rate": 0.00014431192827018437, "loss": 0.0113, "step": 400410 }, { "epoch": 1.04, "learning_rate": 0.0001443080400538129, "loss": 0.0111, "step": 400420 }, { "epoch": 1.04, "learning_rate": 0.00014430415183744146, "loss": 0.0133, "step": 400430 }, { "epoch": 1.04, "learning_rate": 0.00014430026362106997, "loss": 0.0129, "step": 400440 }, { "epoch": 1.04, "learning_rate": 0.0001442963754046985, "loss": 0.0127, "step": 400450 }, { "epoch": 1.04, "learning_rate": 0.00014429248718832705, "loss": 0.0137, "step": 400460 }, { "epoch": 1.04, "learning_rate": 0.00014428859897195557, "loss": 0.01, "step": 400470 }, { "epoch": 1.04, "learning_rate": 0.0001442847107555841, "loss": 0.0116, "step": 400480 }, { "epoch": 1.04, "learning_rate": 0.00014428082253921265, "loss": 0.0105, "step": 400490 }, { "epoch": 1.04, "learning_rate": 0.0001442769343228412, "loss": 0.0146, "step": 400500 }, { "epoch": 1.04, "learning_rate": 0.0001442730461064697, "loss": 0.0099, "step": 400510 }, { "epoch": 1.04, "learning_rate": 0.00014426915789009825, "loss": 0.0084, "step": 400520 }, { "epoch": 1.04, "learning_rate": 0.0001442652696737268, "loss": 0.0107, "step": 400530 }, { "epoch": 1.04, "learning_rate": 0.00014426138145735533, "loss": 0.0099, "step": 400540 }, { "epoch": 1.04, "learning_rate": 0.00014425749324098385, "loss": 0.0098, "step": 400550 }, { "epoch": 1.04, "learning_rate": 0.0001442536050246124, "loss": 0.0087, "step": 400560 }, { "epoch": 1.04, "learning_rate": 0.00014424971680824093, "loss": 0.0093, "step": 400570 }, { "epoch": 1.04, "learning_rate": 0.00014424582859186947, "loss": 0.0104, "step": 400580 }, { "epoch": 1.04, "learning_rate": 0.000144241940375498, "loss": 0.0126, "step": 400590 }, { "epoch": 1.04, "learning_rate": 0.00014423805215912656, "loss": 0.0133, "step": 400600 }, { "epoch": 1.04, "learning_rate": 0.00014423416394275507, "loss": 0.0099, "step": 400610 }, { "epoch": 1.04, "learning_rate": 0.0001442302757263836, "loss": 0.0108, "step": 400620 }, { "epoch": 1.04, "learning_rate": 0.00014422638751001215, "loss": 0.0114, "step": 400630 }, { "epoch": 1.04, "learning_rate": 0.0001442224992936407, "loss": 0.0115, "step": 400640 }, { "epoch": 1.04, "learning_rate": 0.0001442186110772692, "loss": 0.0129, "step": 400650 }, { "epoch": 1.04, "learning_rate": 0.00014421472286089775, "loss": 0.0108, "step": 400660 }, { "epoch": 1.04, "learning_rate": 0.0001442108346445263, "loss": 0.0133, "step": 400670 }, { "epoch": 1.04, "learning_rate": 0.00014420694642815484, "loss": 0.0108, "step": 400680 }, { "epoch": 1.04, "learning_rate": 0.00014420305821178335, "loss": 0.0135, "step": 400690 }, { "epoch": 1.04, "learning_rate": 0.0001441991699954119, "loss": 0.0141, "step": 400700 }, { "epoch": 1.04, "learning_rate": 0.00014419528177904043, "loss": 0.0151, "step": 400710 }, { "epoch": 1.04, "learning_rate": 0.00014419139356266895, "loss": 0.0105, "step": 400720 }, { "epoch": 1.04, "learning_rate": 0.0001441875053462975, "loss": 0.0132, "step": 400730 }, { "epoch": 1.04, "learning_rate": 0.00014418361712992603, "loss": 0.0124, "step": 400740 }, { "epoch": 1.04, "learning_rate": 0.00014417972891355457, "loss": 0.0133, "step": 400750 }, { "epoch": 1.04, "learning_rate": 0.0001441758406971831, "loss": 0.0147, "step": 400760 }, { "epoch": 1.04, "learning_rate": 0.00014417195248081163, "loss": 0.0129, "step": 400770 }, { "epoch": 1.04, "learning_rate": 0.00014416806426444017, "loss": 0.0116, "step": 400780 }, { "epoch": 1.04, "learning_rate": 0.0001441641760480687, "loss": 0.0113, "step": 400790 }, { "epoch": 1.04, "learning_rate": 0.00014416028783169725, "loss": 0.0113, "step": 400800 }, { "epoch": 1.04, "learning_rate": 0.0001441563996153258, "loss": 0.0108, "step": 400810 }, { "epoch": 1.04, "learning_rate": 0.0001441525113989543, "loss": 0.0157, "step": 400820 }, { "epoch": 1.04, "learning_rate": 0.00014414862318258285, "loss": 0.0129, "step": 400830 }, { "epoch": 1.04, "learning_rate": 0.0001441447349662114, "loss": 0.0138, "step": 400840 }, { "epoch": 1.04, "learning_rate": 0.00014414084674983993, "loss": 0.0116, "step": 400850 }, { "epoch": 1.04, "learning_rate": 0.00014413695853346845, "loss": 0.0175, "step": 400860 }, { "epoch": 1.04, "learning_rate": 0.000144133070317097, "loss": 0.014, "step": 400870 }, { "epoch": 1.04, "learning_rate": 0.00014412918210072553, "loss": 0.0163, "step": 400880 }, { "epoch": 1.04, "learning_rate": 0.00014412529388435407, "loss": 0.0134, "step": 400890 }, { "epoch": 1.04, "learning_rate": 0.0001441214056679826, "loss": 0.0128, "step": 400900 }, { "epoch": 1.04, "learning_rate": 0.00014411751745161113, "loss": 0.0103, "step": 400910 }, { "epoch": 1.04, "learning_rate": 0.00014411362923523967, "loss": 0.011, "step": 400920 }, { "epoch": 1.04, "learning_rate": 0.00014410974101886821, "loss": 0.0121, "step": 400930 }, { "epoch": 1.04, "learning_rate": 0.00014410585280249673, "loss": 0.0134, "step": 400940 }, { "epoch": 1.04, "learning_rate": 0.00014410196458612527, "loss": 0.0096, "step": 400950 }, { "epoch": 1.04, "learning_rate": 0.0001440980763697538, "loss": 0.0099, "step": 400960 }, { "epoch": 1.04, "learning_rate": 0.00014409418815338233, "loss": 0.0106, "step": 400970 }, { "epoch": 1.04, "learning_rate": 0.0001440902999370109, "loss": 0.0157, "step": 400980 }, { "epoch": 1.04, "learning_rate": 0.0001440864117206394, "loss": 0.0118, "step": 400990 }, { "epoch": 1.04, "learning_rate": 0.00014408252350426795, "loss": 0.0129, "step": 401000 }, { "epoch": 1.04, "eval_cer": 0.8817012866862336, "eval_loss": 0.0077420733869075775, "eval_runtime": 107.3386, "eval_samples_per_second": 18.633, "eval_steps_per_second": 4.658, "step": 401000 }, { "epoch": 1.04, "learning_rate": 0.0001440786352878965, "loss": 0.0098, "step": 401010 }, { "epoch": 1.04, "learning_rate": 0.00014407474707152503, "loss": 0.0108, "step": 401020 }, { "epoch": 1.04, "learning_rate": 0.00014407085885515355, "loss": 0.0123, "step": 401030 }, { "epoch": 1.04, "learning_rate": 0.0001440669706387821, "loss": 0.0113, "step": 401040 }, { "epoch": 1.04, "learning_rate": 0.00014406308242241063, "loss": 0.0136, "step": 401050 }, { "epoch": 1.04, "learning_rate": 0.00014405919420603917, "loss": 0.0139, "step": 401060 }, { "epoch": 1.04, "learning_rate": 0.0001440553059896677, "loss": 0.012, "step": 401070 }, { "epoch": 1.04, "learning_rate": 0.00014405141777329623, "loss": 0.0114, "step": 401080 }, { "epoch": 1.04, "learning_rate": 0.00014404752955692477, "loss": 0.0121, "step": 401090 }, { "epoch": 1.04, "learning_rate": 0.0001440436413405533, "loss": 0.0103, "step": 401100 }, { "epoch": 1.04, "learning_rate": 0.00014403975312418183, "loss": 0.0108, "step": 401110 }, { "epoch": 1.04, "learning_rate": 0.0001440358649078104, "loss": 0.0104, "step": 401120 }, { "epoch": 1.04, "learning_rate": 0.0001440319766914389, "loss": 0.0106, "step": 401130 }, { "epoch": 1.04, "learning_rate": 0.00014402808847506745, "loss": 0.0133, "step": 401140 }, { "epoch": 1.04, "learning_rate": 0.000144024200258696, "loss": 0.0123, "step": 401150 }, { "epoch": 1.04, "learning_rate": 0.00014402031204232454, "loss": 0.0206, "step": 401160 }, { "epoch": 1.04, "learning_rate": 0.00014401642382595305, "loss": 0.0103, "step": 401170 }, { "epoch": 1.04, "learning_rate": 0.0001440125356095816, "loss": 0.0095, "step": 401180 }, { "epoch": 1.04, "learning_rate": 0.00014400864739321013, "loss": 0.011, "step": 401190 }, { "epoch": 1.04, "learning_rate": 0.00014400475917683865, "loss": 0.0082, "step": 401200 }, { "epoch": 1.04, "learning_rate": 0.0001440008709604672, "loss": 0.0112, "step": 401210 }, { "epoch": 1.04, "learning_rate": 0.00014399698274409573, "loss": 0.0095, "step": 401220 }, { "epoch": 1.04, "learning_rate": 0.00014399309452772427, "loss": 0.0129, "step": 401230 }, { "epoch": 1.04, "learning_rate": 0.0001439892063113528, "loss": 0.0135, "step": 401240 }, { "epoch": 1.04, "learning_rate": 0.00014398531809498133, "loss": 0.0107, "step": 401250 }, { "epoch": 1.04, "learning_rate": 0.00014398142987860987, "loss": 0.0108, "step": 401260 }, { "epoch": 1.04, "learning_rate": 0.0001439775416622384, "loss": 0.0103, "step": 401270 }, { "epoch": 1.04, "learning_rate": 0.00014397365344586693, "loss": 0.0128, "step": 401280 }, { "epoch": 1.04, "learning_rate": 0.00014396976522949547, "loss": 0.0114, "step": 401290 }, { "epoch": 1.04, "learning_rate": 0.000143965877013124, "loss": 0.0121, "step": 401300 }, { "epoch": 1.04, "learning_rate": 0.00014396198879675255, "loss": 0.013, "step": 401310 }, { "epoch": 1.04, "learning_rate": 0.0001439581005803811, "loss": 0.01, "step": 401320 }, { "epoch": 1.04, "learning_rate": 0.00014395421236400964, "loss": 0.0081, "step": 401330 }, { "epoch": 1.04, "learning_rate": 0.00014395032414763815, "loss": 0.0107, "step": 401340 }, { "epoch": 1.04, "learning_rate": 0.0001439464359312667, "loss": 0.01, "step": 401350 }, { "epoch": 1.04, "learning_rate": 0.00014394254771489523, "loss": 0.0113, "step": 401360 }, { "epoch": 1.04, "learning_rate": 0.00014393865949852377, "loss": 0.0146, "step": 401370 }, { "epoch": 1.04, "learning_rate": 0.0001439347712821523, "loss": 0.0116, "step": 401380 }, { "epoch": 1.04, "learning_rate": 0.00014393088306578083, "loss": 0.014, "step": 401390 }, { "epoch": 1.04, "learning_rate": 0.00014392699484940937, "loss": 0.0109, "step": 401400 }, { "epoch": 1.04, "learning_rate": 0.00014392310663303791, "loss": 0.0094, "step": 401410 }, { "epoch": 1.04, "learning_rate": 0.00014391921841666643, "loss": 0.015, "step": 401420 }, { "epoch": 1.04, "learning_rate": 0.00014391533020029497, "loss": 0.0135, "step": 401430 }, { "epoch": 1.04, "learning_rate": 0.0001439114419839235, "loss": 0.0099, "step": 401440 }, { "epoch": 1.04, "learning_rate": 0.00014390755376755203, "loss": 0.014, "step": 401450 }, { "epoch": 1.04, "learning_rate": 0.00014390366555118057, "loss": 0.015, "step": 401460 }, { "epoch": 1.04, "learning_rate": 0.0001438997773348091, "loss": 0.0126, "step": 401470 }, { "epoch": 1.04, "learning_rate": 0.00014389588911843765, "loss": 0.0114, "step": 401480 }, { "epoch": 1.04, "learning_rate": 0.00014389200090206617, "loss": 0.0104, "step": 401490 }, { "epoch": 1.04, "learning_rate": 0.00014388811268569473, "loss": 0.0112, "step": 401500 }, { "epoch": 1.04, "learning_rate": 0.00014388422446932325, "loss": 0.0114, "step": 401510 }, { "epoch": 1.04, "learning_rate": 0.0001438803362529518, "loss": 0.0129, "step": 401520 }, { "epoch": 1.04, "learning_rate": 0.00014387644803658033, "loss": 0.0089, "step": 401530 }, { "epoch": 1.04, "learning_rate": 0.00014387255982020887, "loss": 0.0103, "step": 401540 }, { "epoch": 1.04, "learning_rate": 0.0001438686716038374, "loss": 0.0138, "step": 401550 }, { "epoch": 1.04, "learning_rate": 0.00014386478338746593, "loss": 0.0084, "step": 401560 }, { "epoch": 1.04, "learning_rate": 0.00014386089517109447, "loss": 0.0115, "step": 401570 }, { "epoch": 1.04, "learning_rate": 0.000143857006954723, "loss": 0.0097, "step": 401580 }, { "epoch": 1.04, "learning_rate": 0.00014385311873835153, "loss": 0.0126, "step": 401590 }, { "epoch": 1.04, "learning_rate": 0.00014384923052198007, "loss": 0.0129, "step": 401600 }, { "epoch": 1.04, "learning_rate": 0.0001438453423056086, "loss": 0.0109, "step": 401610 }, { "epoch": 1.04, "learning_rate": 0.00014384145408923715, "loss": 0.0107, "step": 401620 }, { "epoch": 1.04, "learning_rate": 0.00014383756587286567, "loss": 0.0112, "step": 401630 }, { "epoch": 1.04, "learning_rate": 0.00014383367765649424, "loss": 0.0111, "step": 401640 }, { "epoch": 1.04, "learning_rate": 0.00014382978944012275, "loss": 0.0135, "step": 401650 }, { "epoch": 1.04, "learning_rate": 0.0001438259012237513, "loss": 0.0098, "step": 401660 }, { "epoch": 1.04, "learning_rate": 0.00014382201300737983, "loss": 0.0123, "step": 401670 }, { "epoch": 1.04, "learning_rate": 0.00014381812479100838, "loss": 0.0112, "step": 401680 }, { "epoch": 1.04, "learning_rate": 0.0001438142365746369, "loss": 0.0154, "step": 401690 }, { "epoch": 1.04, "learning_rate": 0.00014381034835826543, "loss": 0.0111, "step": 401700 }, { "epoch": 1.04, "learning_rate": 0.00014380646014189397, "loss": 0.0135, "step": 401710 }, { "epoch": 1.04, "learning_rate": 0.0001438025719255225, "loss": 0.0096, "step": 401720 }, { "epoch": 1.04, "learning_rate": 0.00014379868370915103, "loss": 0.0123, "step": 401730 }, { "epoch": 1.04, "learning_rate": 0.00014379479549277957, "loss": 0.0127, "step": 401740 }, { "epoch": 1.04, "learning_rate": 0.0001437909072764081, "loss": 0.0118, "step": 401750 }, { "epoch": 1.04, "learning_rate": 0.00014378701906003663, "loss": 0.0143, "step": 401760 }, { "epoch": 1.04, "learning_rate": 0.00014378313084366517, "loss": 0.0123, "step": 401770 }, { "epoch": 1.04, "learning_rate": 0.0001437792426272937, "loss": 0.0115, "step": 401780 }, { "epoch": 1.04, "learning_rate": 0.00014377535441092225, "loss": 0.0145, "step": 401790 }, { "epoch": 1.04, "learning_rate": 0.00014377146619455077, "loss": 0.0107, "step": 401800 }, { "epoch": 1.04, "learning_rate": 0.0001437675779781793, "loss": 0.0092, "step": 401810 }, { "epoch": 1.04, "learning_rate": 0.00014376368976180785, "loss": 0.0133, "step": 401820 }, { "epoch": 1.04, "learning_rate": 0.0001437598015454364, "loss": 0.0115, "step": 401830 }, { "epoch": 1.04, "learning_rate": 0.00014375591332906493, "loss": 0.0125, "step": 401840 }, { "epoch": 1.04, "learning_rate": 0.00014375202511269348, "loss": 0.0126, "step": 401850 }, { "epoch": 1.04, "learning_rate": 0.000143748136896322, "loss": 0.0159, "step": 401860 }, { "epoch": 1.04, "learning_rate": 0.00014374424867995053, "loss": 0.0106, "step": 401870 }, { "epoch": 1.04, "learning_rate": 0.00014374036046357907, "loss": 0.0127, "step": 401880 }, { "epoch": 1.04, "learning_rate": 0.00014373647224720761, "loss": 0.0112, "step": 401890 }, { "epoch": 1.04, "learning_rate": 0.00014373258403083613, "loss": 0.0127, "step": 401900 }, { "epoch": 1.04, "learning_rate": 0.00014372869581446467, "loss": 0.0109, "step": 401910 }, { "epoch": 1.04, "learning_rate": 0.0001437248075980932, "loss": 0.0124, "step": 401920 }, { "epoch": 1.04, "learning_rate": 0.00014372091938172175, "loss": 0.0147, "step": 401930 }, { "epoch": 1.04, "learning_rate": 0.00014371703116535027, "loss": 0.0097, "step": 401940 }, { "epoch": 1.04, "learning_rate": 0.0001437131429489788, "loss": 0.0152, "step": 401950 }, { "epoch": 1.04, "learning_rate": 0.00014370925473260735, "loss": 0.0126, "step": 401960 }, { "epoch": 1.04, "learning_rate": 0.00014370536651623587, "loss": 0.0107, "step": 401970 }, { "epoch": 1.04, "learning_rate": 0.0001437014782998644, "loss": 0.0108, "step": 401980 }, { "epoch": 1.04, "learning_rate": 0.00014369759008349295, "loss": 0.0128, "step": 401990 }, { "epoch": 1.04, "learning_rate": 0.0001436937018671215, "loss": 0.0132, "step": 402000 }, { "epoch": 1.04, "eval_cer": 0.8817012866862336, "eval_loss": 0.007718118838965893, "eval_runtime": 107.504, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 402000 }, { "epoch": 1.04, "learning_rate": 0.00014368981365075, "loss": 0.0112, "step": 402010 }, { "epoch": 1.04, "learning_rate": 0.00014368592543437857, "loss": 0.0122, "step": 402020 }, { "epoch": 1.04, "learning_rate": 0.0001436820372180071, "loss": 0.0119, "step": 402030 }, { "epoch": 1.04, "learning_rate": 0.00014367814900163563, "loss": 0.0127, "step": 402040 }, { "epoch": 1.04, "learning_rate": 0.00014367426078526417, "loss": 0.015, "step": 402050 }, { "epoch": 1.04, "learning_rate": 0.00014367037256889271, "loss": 0.0107, "step": 402060 }, { "epoch": 1.04, "learning_rate": 0.00014366648435252123, "loss": 0.0101, "step": 402070 }, { "epoch": 1.04, "learning_rate": 0.00014366259613614977, "loss": 0.0134, "step": 402080 }, { "epoch": 1.04, "learning_rate": 0.0001436587079197783, "loss": 0.0112, "step": 402090 }, { "epoch": 1.04, "learning_rate": 0.00014365481970340685, "loss": 0.0122, "step": 402100 }, { "epoch": 1.04, "learning_rate": 0.00014365093148703537, "loss": 0.0117, "step": 402110 }, { "epoch": 1.04, "learning_rate": 0.0001436470432706639, "loss": 0.0133, "step": 402120 }, { "epoch": 1.04, "learning_rate": 0.00014364315505429245, "loss": 0.0239, "step": 402130 }, { "epoch": 1.04, "learning_rate": 0.000143639266837921, "loss": 0.0099, "step": 402140 }, { "epoch": 1.04, "learning_rate": 0.0001436353786215495, "loss": 0.0097, "step": 402150 }, { "epoch": 1.04, "learning_rate": 0.00014363149040517805, "loss": 0.0091, "step": 402160 }, { "epoch": 1.04, "learning_rate": 0.0001436276021888066, "loss": 0.013, "step": 402170 }, { "epoch": 1.04, "learning_rate": 0.00014362371397243513, "loss": 0.0135, "step": 402180 }, { "epoch": 1.04, "learning_rate": 0.00014361982575606367, "loss": 0.0119, "step": 402190 }, { "epoch": 1.04, "learning_rate": 0.0001436159375396922, "loss": 0.0097, "step": 402200 }, { "epoch": 1.04, "learning_rate": 0.00014361204932332073, "loss": 0.0092, "step": 402210 }, { "epoch": 1.04, "learning_rate": 0.00014360816110694927, "loss": 0.0136, "step": 402220 }, { "epoch": 1.04, "learning_rate": 0.0001436042728905778, "loss": 0.0113, "step": 402230 }, { "epoch": 1.04, "learning_rate": 0.00014360038467420633, "loss": 0.0137, "step": 402240 }, { "epoch": 1.04, "learning_rate": 0.00014359649645783487, "loss": 0.0137, "step": 402250 }, { "epoch": 1.04, "learning_rate": 0.0001435926082414634, "loss": 0.0111, "step": 402260 }, { "epoch": 1.04, "learning_rate": 0.00014358872002509195, "loss": 0.0108, "step": 402270 }, { "epoch": 1.04, "learning_rate": 0.00014358483180872047, "loss": 0.0128, "step": 402280 }, { "epoch": 1.04, "learning_rate": 0.000143580943592349, "loss": 0.0156, "step": 402290 }, { "epoch": 1.04, "learning_rate": 0.00014357705537597755, "loss": 0.0102, "step": 402300 }, { "epoch": 1.04, "learning_rate": 0.0001435731671596061, "loss": 0.01, "step": 402310 }, { "epoch": 1.04, "learning_rate": 0.0001435692789432346, "loss": 0.011, "step": 402320 }, { "epoch": 1.04, "learning_rate": 0.00014356539072686315, "loss": 0.0101, "step": 402330 }, { "epoch": 1.04, "learning_rate": 0.0001435615025104917, "loss": 0.0103, "step": 402340 }, { "epoch": 1.04, "learning_rate": 0.00014355761429412023, "loss": 0.0121, "step": 402350 }, { "epoch": 1.04, "learning_rate": 0.00014355372607774875, "loss": 0.011, "step": 402360 }, { "epoch": 1.04, "learning_rate": 0.00014354983786137731, "loss": 0.0209, "step": 402370 }, { "epoch": 1.04, "learning_rate": 0.00014354594964500583, "loss": 0.0137, "step": 402380 }, { "epoch": 1.04, "learning_rate": 0.00014354206142863437, "loss": 0.012, "step": 402390 }, { "epoch": 1.04, "learning_rate": 0.0001435381732122629, "loss": 0.0121, "step": 402400 }, { "epoch": 1.04, "learning_rate": 0.00014353428499589145, "loss": 0.0219, "step": 402410 }, { "epoch": 1.04, "learning_rate": 0.00014353039677951997, "loss": 0.0112, "step": 402420 }, { "epoch": 1.04, "learning_rate": 0.0001435265085631485, "loss": 0.0123, "step": 402430 }, { "epoch": 1.04, "learning_rate": 0.00014352262034677705, "loss": 0.0112, "step": 402440 }, { "epoch": 1.04, "learning_rate": 0.00014351873213040557, "loss": 0.0095, "step": 402450 }, { "epoch": 1.04, "learning_rate": 0.0001435148439140341, "loss": 0.0113, "step": 402460 }, { "epoch": 1.04, "learning_rate": 0.00014351095569766265, "loss": 0.0094, "step": 402470 }, { "epoch": 1.04, "learning_rate": 0.0001435070674812912, "loss": 0.0114, "step": 402480 }, { "epoch": 1.04, "learning_rate": 0.0001435031792649197, "loss": 0.0123, "step": 402490 }, { "epoch": 1.04, "learning_rate": 0.00014349929104854825, "loss": 0.0138, "step": 402500 }, { "epoch": 1.04, "learning_rate": 0.0001434954028321768, "loss": 0.0132, "step": 402510 }, { "epoch": 1.04, "learning_rate": 0.00014349151461580533, "loss": 0.0116, "step": 402520 }, { "epoch": 1.04, "learning_rate": 0.00014348762639943385, "loss": 0.0112, "step": 402530 }, { "epoch": 1.04, "learning_rate": 0.00014348373818306241, "loss": 0.0109, "step": 402540 }, { "epoch": 1.04, "learning_rate": 0.00014347984996669093, "loss": 0.0109, "step": 402550 }, { "epoch": 1.04, "learning_rate": 0.00014347596175031947, "loss": 0.0104, "step": 402560 }, { "epoch": 1.04, "learning_rate": 0.000143472073533948, "loss": 0.0093, "step": 402570 }, { "epoch": 1.04, "learning_rate": 0.00014346818531757655, "loss": 0.0096, "step": 402580 }, { "epoch": 1.04, "learning_rate": 0.00014346429710120507, "loss": 0.0094, "step": 402590 }, { "epoch": 1.04, "learning_rate": 0.0001434604088848336, "loss": 0.0146, "step": 402600 }, { "epoch": 1.04, "learning_rate": 0.00014345652066846215, "loss": 0.0145, "step": 402610 }, { "epoch": 1.04, "learning_rate": 0.0001434526324520907, "loss": 0.0116, "step": 402620 }, { "epoch": 1.04, "learning_rate": 0.0001434487442357192, "loss": 0.0107, "step": 402630 }, { "epoch": 1.04, "learning_rate": 0.00014344485601934775, "loss": 0.0143, "step": 402640 }, { "epoch": 1.04, "learning_rate": 0.0001434409678029763, "loss": 0.0097, "step": 402650 }, { "epoch": 1.04, "learning_rate": 0.00014343707958660483, "loss": 0.0109, "step": 402660 }, { "epoch": 1.04, "learning_rate": 0.00014343319137023335, "loss": 0.0112, "step": 402670 }, { "epoch": 1.04, "learning_rate": 0.0001434293031538619, "loss": 0.0098, "step": 402680 }, { "epoch": 1.04, "learning_rate": 0.00014342541493749043, "loss": 0.011, "step": 402690 }, { "epoch": 1.04, "learning_rate": 0.00014342152672111895, "loss": 0.0111, "step": 402700 }, { "epoch": 1.04, "learning_rate": 0.00014341763850474751, "loss": 0.0112, "step": 402710 }, { "epoch": 1.04, "learning_rate": 0.00014341375028837603, "loss": 0.008, "step": 402720 }, { "epoch": 1.04, "learning_rate": 0.00014340986207200457, "loss": 0.0117, "step": 402730 }, { "epoch": 1.04, "learning_rate": 0.0001434059738556331, "loss": 0.013, "step": 402740 }, { "epoch": 1.04, "learning_rate": 0.00014340208563926165, "loss": 0.0099, "step": 402750 }, { "epoch": 1.04, "learning_rate": 0.00014339819742289017, "loss": 0.0122, "step": 402760 }, { "epoch": 1.04, "learning_rate": 0.0001433943092065187, "loss": 0.0108, "step": 402770 }, { "epoch": 1.04, "learning_rate": 0.00014339042099014725, "loss": 0.0102, "step": 402780 }, { "epoch": 1.04, "learning_rate": 0.0001433865327737758, "loss": 0.0122, "step": 402790 }, { "epoch": 1.04, "learning_rate": 0.0001433826445574043, "loss": 0.013, "step": 402800 }, { "epoch": 1.04, "learning_rate": 0.00014337875634103285, "loss": 0.0122, "step": 402810 }, { "epoch": 1.04, "learning_rate": 0.0001433748681246614, "loss": 0.0118, "step": 402820 }, { "epoch": 1.04, "learning_rate": 0.00014337097990828993, "loss": 0.0103, "step": 402830 }, { "epoch": 1.04, "learning_rate": 0.00014336709169191845, "loss": 0.0136, "step": 402840 }, { "epoch": 1.04, "learning_rate": 0.000143363203475547, "loss": 0.0106, "step": 402850 }, { "epoch": 1.04, "learning_rate": 0.00014335931525917553, "loss": 0.0115, "step": 402860 }, { "epoch": 1.04, "learning_rate": 0.00014335542704280407, "loss": 0.0117, "step": 402870 }, { "epoch": 1.04, "learning_rate": 0.00014335153882643259, "loss": 0.0158, "step": 402880 }, { "epoch": 1.04, "learning_rate": 0.00014334765061006115, "loss": 0.0115, "step": 402890 }, { "epoch": 1.04, "learning_rate": 0.00014334376239368967, "loss": 0.0135, "step": 402900 }, { "epoch": 1.04, "learning_rate": 0.0001433398741773182, "loss": 0.0132, "step": 402910 }, { "epoch": 1.04, "learning_rate": 0.00014333598596094675, "loss": 0.0134, "step": 402920 }, { "epoch": 1.04, "learning_rate": 0.00014333209774457527, "loss": 0.0124, "step": 402930 }, { "epoch": 1.04, "learning_rate": 0.0001433282095282038, "loss": 0.0178, "step": 402940 }, { "epoch": 1.04, "learning_rate": 0.00014332432131183235, "loss": 0.0131, "step": 402950 }, { "epoch": 1.04, "learning_rate": 0.0001433204330954609, "loss": 0.0136, "step": 402960 }, { "epoch": 1.04, "learning_rate": 0.0001433165448790894, "loss": 0.0152, "step": 402970 }, { "epoch": 1.04, "learning_rate": 0.00014331265666271795, "loss": 0.012, "step": 402980 }, { "epoch": 1.04, "learning_rate": 0.0001433087684463465, "loss": 0.0107, "step": 402990 }, { "epoch": 1.04, "learning_rate": 0.00014330488022997503, "loss": 0.0077, "step": 403000 }, { "epoch": 1.04, "eval_cer": 0.8816970877754311, "eval_loss": 0.007720929104834795, "eval_runtime": 107.8049, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 403000 }, { "epoch": 1.04, "learning_rate": 0.00014330099201360355, "loss": 0.0107, "step": 403010 }, { "epoch": 1.04, "learning_rate": 0.0001432971037972321, "loss": 0.0111, "step": 403020 }, { "epoch": 1.04, "learning_rate": 0.00014329321558086063, "loss": 0.0138, "step": 403030 }, { "epoch": 1.04, "learning_rate": 0.00014328932736448917, "loss": 0.008, "step": 403040 }, { "epoch": 1.04, "learning_rate": 0.00014328543914811769, "loss": 0.0087, "step": 403050 }, { "epoch": 1.04, "learning_rate": 0.00014328155093174625, "loss": 0.0101, "step": 403060 }, { "epoch": 1.04, "learning_rate": 0.00014327766271537477, "loss": 0.0132, "step": 403070 }, { "epoch": 1.04, "learning_rate": 0.0001432737744990033, "loss": 0.0115, "step": 403080 }, { "epoch": 1.04, "learning_rate": 0.00014326988628263185, "loss": 0.0084, "step": 403090 }, { "epoch": 1.04, "learning_rate": 0.0001432659980662604, "loss": 0.0103, "step": 403100 }, { "epoch": 1.04, "learning_rate": 0.0001432621098498889, "loss": 0.0095, "step": 403110 }, { "epoch": 1.04, "learning_rate": 0.00014325822163351745, "loss": 0.0136, "step": 403120 }, { "epoch": 1.04, "learning_rate": 0.000143254333417146, "loss": 0.0102, "step": 403130 }, { "epoch": 1.04, "learning_rate": 0.00014325044520077453, "loss": 0.0103, "step": 403140 }, { "epoch": 1.05, "learning_rate": 0.00014324655698440305, "loss": 0.0094, "step": 403150 }, { "epoch": 1.05, "learning_rate": 0.0001432426687680316, "loss": 0.0145, "step": 403160 }, { "epoch": 1.05, "learning_rate": 0.00014323878055166013, "loss": 0.0154, "step": 403170 }, { "epoch": 1.05, "learning_rate": 0.00014323489233528865, "loss": 0.0099, "step": 403180 }, { "epoch": 1.05, "learning_rate": 0.0001432310041189172, "loss": 0.0122, "step": 403190 }, { "epoch": 1.05, "learning_rate": 0.00014322711590254573, "loss": 0.0112, "step": 403200 }, { "epoch": 1.05, "learning_rate": 0.00014322322768617427, "loss": 0.0112, "step": 403210 }, { "epoch": 1.05, "learning_rate": 0.00014321933946980278, "loss": 0.0108, "step": 403220 }, { "epoch": 1.05, "learning_rate": 0.00014321545125343135, "loss": 0.0093, "step": 403230 }, { "epoch": 1.05, "learning_rate": 0.00014321156303705987, "loss": 0.0107, "step": 403240 }, { "epoch": 1.05, "learning_rate": 0.0001432076748206884, "loss": 0.0107, "step": 403250 }, { "epoch": 1.05, "learning_rate": 0.00014320378660431695, "loss": 0.0104, "step": 403260 }, { "epoch": 1.05, "learning_rate": 0.0001431998983879455, "loss": 0.0138, "step": 403270 }, { "epoch": 1.05, "learning_rate": 0.000143196010171574, "loss": 0.0144, "step": 403280 }, { "epoch": 1.05, "learning_rate": 0.00014319212195520255, "loss": 0.014, "step": 403290 }, { "epoch": 1.05, "learning_rate": 0.0001431882337388311, "loss": 0.0103, "step": 403300 }, { "epoch": 1.05, "learning_rate": 0.00014318434552245963, "loss": 0.0149, "step": 403310 }, { "epoch": 1.05, "learning_rate": 0.00014318045730608815, "loss": 0.0101, "step": 403320 }, { "epoch": 1.05, "learning_rate": 0.0001431765690897167, "loss": 0.0097, "step": 403330 }, { "epoch": 1.05, "learning_rate": 0.00014317268087334523, "loss": 0.0112, "step": 403340 }, { "epoch": 1.05, "learning_rate": 0.00014316879265697377, "loss": 0.0095, "step": 403350 }, { "epoch": 1.05, "learning_rate": 0.0001431649044406023, "loss": 0.0108, "step": 403360 }, { "epoch": 1.05, "learning_rate": 0.00014316101622423083, "loss": 0.0119, "step": 403370 }, { "epoch": 1.05, "learning_rate": 0.00014315712800785937, "loss": 0.0129, "step": 403380 }, { "epoch": 1.05, "learning_rate": 0.0001431532397914879, "loss": 0.0144, "step": 403390 }, { "epoch": 1.05, "learning_rate": 0.00014314935157511643, "loss": 0.0113, "step": 403400 }, { "epoch": 1.05, "learning_rate": 0.000143145463358745, "loss": 0.0107, "step": 403410 }, { "epoch": 1.05, "learning_rate": 0.0001431415751423735, "loss": 0.0126, "step": 403420 }, { "epoch": 1.05, "learning_rate": 0.00014313768692600205, "loss": 0.0111, "step": 403430 }, { "epoch": 1.05, "learning_rate": 0.0001431337987096306, "loss": 0.0306, "step": 403440 }, { "epoch": 1.05, "learning_rate": 0.0001431299104932591, "loss": 0.0085, "step": 403450 }, { "epoch": 1.05, "learning_rate": 0.00014312602227688765, "loss": 0.0121, "step": 403460 }, { "epoch": 1.05, "learning_rate": 0.0001431221340605162, "loss": 0.0107, "step": 403470 }, { "epoch": 1.05, "learning_rate": 0.00014311824584414473, "loss": 0.01, "step": 403480 }, { "epoch": 1.05, "learning_rate": 0.00014311435762777325, "loss": 0.0124, "step": 403490 }, { "epoch": 1.05, "learning_rate": 0.0001431104694114018, "loss": 0.0091, "step": 403500 }, { "epoch": 1.05, "learning_rate": 0.00014310658119503033, "loss": 0.013, "step": 403510 }, { "epoch": 1.05, "learning_rate": 0.00014310269297865887, "loss": 0.0111, "step": 403520 }, { "epoch": 1.05, "learning_rate": 0.00014309880476228739, "loss": 0.0124, "step": 403530 }, { "epoch": 1.05, "learning_rate": 0.00014309491654591593, "loss": 0.0106, "step": 403540 }, { "epoch": 1.05, "learning_rate": 0.00014309102832954447, "loss": 0.0112, "step": 403550 }, { "epoch": 1.05, "learning_rate": 0.000143087140113173, "loss": 0.0156, "step": 403560 }, { "epoch": 1.05, "learning_rate": 0.00014308325189680153, "loss": 0.013, "step": 403570 }, { "epoch": 1.05, "learning_rate": 0.0001430793636804301, "loss": 0.0094, "step": 403580 }, { "epoch": 1.05, "learning_rate": 0.0001430754754640586, "loss": 0.0148, "step": 403590 }, { "epoch": 1.05, "learning_rate": 0.00014307158724768715, "loss": 0.0122, "step": 403600 }, { "epoch": 1.05, "learning_rate": 0.0001430676990313157, "loss": 0.0107, "step": 403610 }, { "epoch": 1.05, "learning_rate": 0.00014306381081494423, "loss": 0.0131, "step": 403620 }, { "epoch": 1.05, "learning_rate": 0.00014305992259857275, "loss": 0.0102, "step": 403630 }, { "epoch": 1.05, "learning_rate": 0.0001430560343822013, "loss": 0.0103, "step": 403640 }, { "epoch": 1.05, "learning_rate": 0.00014305214616582983, "loss": 0.0129, "step": 403650 }, { "epoch": 1.05, "learning_rate": 0.00014304825794945837, "loss": 0.0125, "step": 403660 }, { "epoch": 1.05, "learning_rate": 0.0001430443697330869, "loss": 0.0111, "step": 403670 }, { "epoch": 1.05, "learning_rate": 0.00014304048151671543, "loss": 0.009, "step": 403680 }, { "epoch": 1.05, "learning_rate": 0.00014303659330034397, "loss": 0.0108, "step": 403690 }, { "epoch": 1.05, "learning_rate": 0.00014303270508397249, "loss": 0.0211, "step": 403700 }, { "epoch": 1.05, "learning_rate": 0.00014302881686760103, "loss": 0.0147, "step": 403710 }, { "epoch": 1.05, "learning_rate": 0.00014302492865122957, "loss": 0.0113, "step": 403720 }, { "epoch": 1.05, "learning_rate": 0.0001430210404348581, "loss": 0.01, "step": 403730 }, { "epoch": 1.05, "learning_rate": 0.00014301715221848662, "loss": 0.01, "step": 403740 }, { "epoch": 1.05, "learning_rate": 0.00014301326400211517, "loss": 0.0126, "step": 403750 }, { "epoch": 1.05, "learning_rate": 0.0001430093757857437, "loss": 0.0145, "step": 403760 }, { "epoch": 1.05, "learning_rate": 0.00014300548756937225, "loss": 0.0125, "step": 403770 }, { "epoch": 1.05, "learning_rate": 0.0001430015993530008, "loss": 0.0131, "step": 403780 }, { "epoch": 1.05, "learning_rate": 0.00014299771113662933, "loss": 0.0109, "step": 403790 }, { "epoch": 1.05, "learning_rate": 0.00014299382292025785, "loss": 0.0162, "step": 403800 }, { "epoch": 1.05, "learning_rate": 0.0001429899347038864, "loss": 0.0147, "step": 403810 }, { "epoch": 1.05, "learning_rate": 0.00014298604648751493, "loss": 0.0132, "step": 403820 }, { "epoch": 1.05, "learning_rate": 0.00014298215827114347, "loss": 0.012, "step": 403830 }, { "epoch": 1.05, "learning_rate": 0.000142978270054772, "loss": 0.0087, "step": 403840 }, { "epoch": 1.05, "learning_rate": 0.00014297438183840053, "loss": 0.0114, "step": 403850 }, { "epoch": 1.05, "learning_rate": 0.00014297049362202907, "loss": 0.0104, "step": 403860 }, { "epoch": 1.05, "learning_rate": 0.0001429666054056576, "loss": 0.0109, "step": 403870 }, { "epoch": 1.05, "learning_rate": 0.00014296271718928613, "loss": 0.0106, "step": 403880 }, { "epoch": 1.05, "learning_rate": 0.00014295882897291467, "loss": 0.0103, "step": 403890 }, { "epoch": 1.05, "learning_rate": 0.0001429549407565432, "loss": 0.0115, "step": 403900 }, { "epoch": 1.05, "learning_rate": 0.00014295105254017175, "loss": 0.0131, "step": 403910 }, { "epoch": 1.05, "learning_rate": 0.00014294716432380027, "loss": 0.0182, "step": 403920 }, { "epoch": 1.05, "learning_rate": 0.0001429432761074288, "loss": 0.0115, "step": 403930 }, { "epoch": 1.05, "learning_rate": 0.00014293938789105735, "loss": 0.0114, "step": 403940 }, { "epoch": 1.05, "learning_rate": 0.00014293549967468586, "loss": 0.0105, "step": 403950 }, { "epoch": 1.05, "learning_rate": 0.00014293161145831443, "loss": 0.015, "step": 403960 }, { "epoch": 1.05, "learning_rate": 0.00014292772324194295, "loss": 0.0111, "step": 403970 }, { "epoch": 1.05, "learning_rate": 0.0001429238350255715, "loss": 0.0101, "step": 403980 }, { "epoch": 1.05, "learning_rate": 0.00014291994680920003, "loss": 0.0112, "step": 403990 }, { "epoch": 1.05, "learning_rate": 0.00014291605859282857, "loss": 0.013, "step": 404000 }, { "epoch": 1.05, "eval_cer": 0.8817110841447728, "eval_loss": 0.009204316884279251, "eval_runtime": 107.4647, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 404000 }, { "epoch": 1.05, "learning_rate": 0.0001429121703764571, "loss": 0.0083, "step": 404010 }, { "epoch": 1.05, "learning_rate": 0.00014290828216008563, "loss": 0.0128, "step": 404020 }, { "epoch": 1.05, "learning_rate": 0.00014290439394371417, "loss": 0.0101, "step": 404030 }, { "epoch": 1.05, "learning_rate": 0.0001429005057273427, "loss": 0.0138, "step": 404040 }, { "epoch": 1.05, "learning_rate": 0.00014289661751097123, "loss": 0.0102, "step": 404050 }, { "epoch": 1.05, "learning_rate": 0.00014289272929459977, "loss": 0.0119, "step": 404060 }, { "epoch": 1.05, "learning_rate": 0.0001428888410782283, "loss": 0.0117, "step": 404070 }, { "epoch": 1.05, "learning_rate": 0.00014288495286185685, "loss": 0.0124, "step": 404080 }, { "epoch": 1.05, "learning_rate": 0.00014288106464548537, "loss": 0.0108, "step": 404090 }, { "epoch": 1.05, "learning_rate": 0.00014287717642911393, "loss": 0.015, "step": 404100 }, { "epoch": 1.05, "learning_rate": 0.00014287328821274245, "loss": 0.0166, "step": 404110 }, { "epoch": 1.05, "learning_rate": 0.000142869399996371, "loss": 0.0108, "step": 404120 }, { "epoch": 1.05, "learning_rate": 0.00014286551177999953, "loss": 0.0132, "step": 404130 }, { "epoch": 1.05, "learning_rate": 0.00014286162356362807, "loss": 0.0122, "step": 404140 }, { "epoch": 1.05, "learning_rate": 0.0001428577353472566, "loss": 0.0121, "step": 404150 }, { "epoch": 1.05, "learning_rate": 0.00014285384713088513, "loss": 0.0105, "step": 404160 }, { "epoch": 1.05, "learning_rate": 0.00014284995891451367, "loss": 0.0111, "step": 404170 }, { "epoch": 1.05, "learning_rate": 0.00014284607069814219, "loss": 0.0119, "step": 404180 }, { "epoch": 1.05, "learning_rate": 0.00014284218248177073, "loss": 0.013, "step": 404190 }, { "epoch": 1.05, "learning_rate": 0.00014283829426539927, "loss": 0.0094, "step": 404200 }, { "epoch": 1.05, "learning_rate": 0.0001428344060490278, "loss": 0.0089, "step": 404210 }, { "epoch": 1.05, "learning_rate": 0.00014283051783265633, "loss": 0.0096, "step": 404220 }, { "epoch": 1.05, "learning_rate": 0.00014282662961628487, "loss": 0.0115, "step": 404230 }, { "epoch": 1.05, "learning_rate": 0.0001428227413999134, "loss": 0.0106, "step": 404240 }, { "epoch": 1.05, "learning_rate": 0.00014281885318354195, "loss": 0.0084, "step": 404250 }, { "epoch": 1.05, "learning_rate": 0.00014281496496717046, "loss": 0.0134, "step": 404260 }, { "epoch": 1.05, "learning_rate": 0.000142811076750799, "loss": 0.0113, "step": 404270 }, { "epoch": 1.05, "learning_rate": 0.00014280718853442755, "loss": 0.0116, "step": 404280 }, { "epoch": 1.05, "learning_rate": 0.0001428033003180561, "loss": 0.0122, "step": 404290 }, { "epoch": 1.05, "learning_rate": 0.00014279941210168463, "loss": 0.0106, "step": 404300 }, { "epoch": 1.05, "learning_rate": 0.00014279552388531317, "loss": 0.0118, "step": 404310 }, { "epoch": 1.05, "learning_rate": 0.0001427916356689417, "loss": 0.0105, "step": 404320 }, { "epoch": 1.05, "learning_rate": 0.00014278774745257023, "loss": 0.01, "step": 404330 }, { "epoch": 1.05, "learning_rate": 0.00014278385923619877, "loss": 0.0121, "step": 404340 }, { "epoch": 1.05, "learning_rate": 0.0001427799710198273, "loss": 0.0087, "step": 404350 }, { "epoch": 1.05, "learning_rate": 0.00014277608280345583, "loss": 0.0092, "step": 404360 }, { "epoch": 1.05, "learning_rate": 0.00014277219458708437, "loss": 0.012, "step": 404370 }, { "epoch": 1.05, "learning_rate": 0.0001427683063707129, "loss": 0.0119, "step": 404380 }, { "epoch": 1.05, "learning_rate": 0.00014276441815434145, "loss": 0.0101, "step": 404390 }, { "epoch": 1.05, "learning_rate": 0.00014276052993796997, "loss": 0.0152, "step": 404400 }, { "epoch": 1.05, "learning_rate": 0.0001427566417215985, "loss": 0.0114, "step": 404410 }, { "epoch": 1.05, "learning_rate": 0.00014275275350522705, "loss": 0.01, "step": 404420 }, { "epoch": 1.05, "learning_rate": 0.00014274886528885556, "loss": 0.0132, "step": 404430 }, { "epoch": 1.05, "learning_rate": 0.0001427449770724841, "loss": 0.0094, "step": 404440 }, { "epoch": 1.05, "learning_rate": 0.00014274108885611265, "loss": 0.0129, "step": 404450 }, { "epoch": 1.05, "learning_rate": 0.0001427372006397412, "loss": 0.0131, "step": 404460 }, { "epoch": 1.05, "learning_rate": 0.0001427333124233697, "loss": 0.0108, "step": 404470 }, { "epoch": 1.05, "learning_rate": 0.00014272942420699827, "loss": 0.0101, "step": 404480 }, { "epoch": 1.05, "learning_rate": 0.0001427255359906268, "loss": 0.012, "step": 404490 }, { "epoch": 1.05, "learning_rate": 0.00014272164777425533, "loss": 0.0104, "step": 404500 }, { "epoch": 1.05, "learning_rate": 0.00014271775955788387, "loss": 0.0117, "step": 404510 }, { "epoch": 1.05, "learning_rate": 0.0001427138713415124, "loss": 0.0105, "step": 404520 }, { "epoch": 1.05, "learning_rate": 0.00014270998312514093, "loss": 0.0119, "step": 404530 }, { "epoch": 1.05, "learning_rate": 0.00014270609490876947, "loss": 0.0114, "step": 404540 }, { "epoch": 1.05, "learning_rate": 0.000142702206692398, "loss": 0.0168, "step": 404550 }, { "epoch": 1.05, "learning_rate": 0.00014269831847602655, "loss": 0.0119, "step": 404560 }, { "epoch": 1.05, "learning_rate": 0.00014269443025965507, "loss": 0.012, "step": 404570 }, { "epoch": 1.05, "learning_rate": 0.0001426905420432836, "loss": 0.0149, "step": 404580 }, { "epoch": 1.05, "learning_rate": 0.00014268665382691215, "loss": 0.0116, "step": 404590 }, { "epoch": 1.05, "learning_rate": 0.0001426827656105407, "loss": 0.0127, "step": 404600 }, { "epoch": 1.05, "learning_rate": 0.0001426788773941692, "loss": 0.0111, "step": 404610 }, { "epoch": 1.05, "learning_rate": 0.00014267498917779777, "loss": 0.0088, "step": 404620 }, { "epoch": 1.05, "learning_rate": 0.0001426711009614263, "loss": 0.0171, "step": 404630 }, { "epoch": 1.05, "learning_rate": 0.00014266721274505483, "loss": 0.0111, "step": 404640 }, { "epoch": 1.05, "learning_rate": 0.00014266332452868337, "loss": 0.0119, "step": 404650 }, { "epoch": 1.05, "learning_rate": 0.0001426594363123119, "loss": 0.012, "step": 404660 }, { "epoch": 1.05, "learning_rate": 0.00014265554809594043, "loss": 0.0121, "step": 404670 }, { "epoch": 1.05, "learning_rate": 0.00014265165987956897, "loss": 0.0118, "step": 404680 }, { "epoch": 1.05, "learning_rate": 0.0001426477716631975, "loss": 0.0108, "step": 404690 }, { "epoch": 1.05, "learning_rate": 0.00014264388344682603, "loss": 0.0115, "step": 404700 }, { "epoch": 1.05, "learning_rate": 0.00014263999523045457, "loss": 0.0109, "step": 404710 }, { "epoch": 1.05, "learning_rate": 0.0001426361070140831, "loss": 0.0099, "step": 404720 }, { "epoch": 1.05, "learning_rate": 0.00014263221879771165, "loss": 0.0116, "step": 404730 }, { "epoch": 1.05, "learning_rate": 0.00014262833058134017, "loss": 0.0108, "step": 404740 }, { "epoch": 1.05, "learning_rate": 0.0001426244423649687, "loss": 0.0106, "step": 404750 }, { "epoch": 1.05, "learning_rate": 0.00014262055414859725, "loss": 0.0127, "step": 404760 }, { "epoch": 1.05, "learning_rate": 0.0001426166659322258, "loss": 0.0138, "step": 404770 }, { "epoch": 1.05, "learning_rate": 0.0001426127777158543, "loss": 0.014, "step": 404780 }, { "epoch": 1.05, "learning_rate": 0.00014260888949948285, "loss": 0.0096, "step": 404790 }, { "epoch": 1.05, "learning_rate": 0.0001426050012831114, "loss": 0.0117, "step": 404800 }, { "epoch": 1.05, "learning_rate": 0.00014260111306673993, "loss": 0.0112, "step": 404810 }, { "epoch": 1.05, "learning_rate": 0.00014259722485036847, "loss": 0.0106, "step": 404820 }, { "epoch": 1.05, "learning_rate": 0.000142593336633997, "loss": 0.0127, "step": 404830 }, { "epoch": 1.05, "learning_rate": 0.00014258944841762553, "loss": 0.0151, "step": 404840 }, { "epoch": 1.05, "learning_rate": 0.00014258556020125407, "loss": 0.0165, "step": 404850 }, { "epoch": 1.05, "learning_rate": 0.0001425816719848826, "loss": 0.0115, "step": 404860 }, { "epoch": 1.05, "learning_rate": 0.00014257778376851115, "loss": 0.0102, "step": 404870 }, { "epoch": 1.05, "learning_rate": 0.00014257389555213967, "loss": 0.0099, "step": 404880 }, { "epoch": 1.05, "learning_rate": 0.0001425700073357682, "loss": 0.0107, "step": 404890 }, { "epoch": 1.05, "learning_rate": 0.00014256611911939675, "loss": 0.0127, "step": 404900 }, { "epoch": 1.05, "learning_rate": 0.0001425622309030253, "loss": 0.0124, "step": 404910 }, { "epoch": 1.05, "learning_rate": 0.0001425583426866538, "loss": 0.0148, "step": 404920 }, { "epoch": 1.05, "learning_rate": 0.00014255445447028235, "loss": 0.0115, "step": 404930 }, { "epoch": 1.05, "learning_rate": 0.0001425505662539109, "loss": 0.0111, "step": 404940 }, { "epoch": 1.05, "learning_rate": 0.0001425466780375394, "loss": 0.0123, "step": 404950 }, { "epoch": 1.05, "learning_rate": 0.00014254278982116795, "loss": 0.012, "step": 404960 }, { "epoch": 1.05, "learning_rate": 0.0001425389016047965, "loss": 0.0147, "step": 404970 }, { "epoch": 1.05, "learning_rate": 0.00014253501338842503, "loss": 0.0133, "step": 404980 }, { "epoch": 1.05, "learning_rate": 0.00014253112517205354, "loss": 0.0122, "step": 404990 }, { "epoch": 1.05, "learning_rate": 0.0001425272369556821, "loss": 0.0136, "step": 405000 }, { "epoch": 1.05, "eval_cer": 0.8816928888646285, "eval_loss": 0.007998434826731682, "eval_runtime": 107.3073, "eval_samples_per_second": 18.638, "eval_steps_per_second": 4.66, "step": 405000 }, { "epoch": 1.05, "learning_rate": 0.00014252334873931063, "loss": 0.0107, "step": 405010 }, { "epoch": 1.05, "learning_rate": 0.00014251946052293917, "loss": 0.0139, "step": 405020 }, { "epoch": 1.05, "learning_rate": 0.0001425155723065677, "loss": 0.0128, "step": 405030 }, { "epoch": 1.05, "learning_rate": 0.00014251168409019625, "loss": 0.015, "step": 405040 }, { "epoch": 1.05, "learning_rate": 0.00014250779587382477, "loss": 0.0122, "step": 405050 }, { "epoch": 1.05, "learning_rate": 0.0001425039076574533, "loss": 0.009, "step": 405060 }, { "epoch": 1.05, "learning_rate": 0.00014250001944108185, "loss": 0.0099, "step": 405070 }, { "epoch": 1.05, "learning_rate": 0.0001424961312247104, "loss": 0.013, "step": 405080 }, { "epoch": 1.05, "learning_rate": 0.0001424922430083389, "loss": 0.0091, "step": 405090 }, { "epoch": 1.05, "learning_rate": 0.00014248835479196745, "loss": 0.01, "step": 405100 }, { "epoch": 1.05, "learning_rate": 0.000142484466575596, "loss": 0.012, "step": 405110 }, { "epoch": 1.05, "learning_rate": 0.00014248057835922453, "loss": 0.0132, "step": 405120 }, { "epoch": 1.05, "learning_rate": 0.00014247669014285305, "loss": 0.0106, "step": 405130 }, { "epoch": 1.05, "learning_rate": 0.0001424728019264816, "loss": 0.0117, "step": 405140 }, { "epoch": 1.05, "learning_rate": 0.00014246891371011013, "loss": 0.0139, "step": 405150 }, { "epoch": 1.05, "learning_rate": 0.00014246502549373864, "loss": 0.0142, "step": 405160 }, { "epoch": 1.05, "learning_rate": 0.0001424611372773672, "loss": 0.016, "step": 405170 }, { "epoch": 1.05, "learning_rate": 0.00014245724906099573, "loss": 0.0184, "step": 405180 }, { "epoch": 1.05, "learning_rate": 0.00014245336084462427, "loss": 0.0111, "step": 405190 }, { "epoch": 1.05, "learning_rate": 0.0001424494726282528, "loss": 0.0112, "step": 405200 }, { "epoch": 1.05, "learning_rate": 0.00014244558441188135, "loss": 0.0134, "step": 405210 }, { "epoch": 1.05, "learning_rate": 0.00014244169619550987, "loss": 0.0132, "step": 405220 }, { "epoch": 1.05, "learning_rate": 0.0001424378079791384, "loss": 0.0105, "step": 405230 }, { "epoch": 1.05, "learning_rate": 0.00014243391976276695, "loss": 0.0115, "step": 405240 }, { "epoch": 1.05, "learning_rate": 0.0001424300315463955, "loss": 0.0137, "step": 405250 }, { "epoch": 1.05, "learning_rate": 0.000142426143330024, "loss": 0.0123, "step": 405260 }, { "epoch": 1.05, "learning_rate": 0.00014242225511365255, "loss": 0.0089, "step": 405270 }, { "epoch": 1.05, "learning_rate": 0.0001424183668972811, "loss": 0.01, "step": 405280 }, { "epoch": 1.05, "learning_rate": 0.00014241447868090963, "loss": 0.0095, "step": 405290 }, { "epoch": 1.05, "learning_rate": 0.00014241059046453814, "loss": 0.015, "step": 405300 }, { "epoch": 1.05, "learning_rate": 0.00014240670224816669, "loss": 0.0132, "step": 405310 }, { "epoch": 1.05, "learning_rate": 0.00014240281403179523, "loss": 0.0126, "step": 405320 }, { "epoch": 1.05, "learning_rate": 0.00014239892581542377, "loss": 0.0146, "step": 405330 }, { "epoch": 1.05, "learning_rate": 0.00014239503759905228, "loss": 0.0132, "step": 405340 }, { "epoch": 1.05, "learning_rate": 0.00014239114938268085, "loss": 0.0131, "step": 405350 }, { "epoch": 1.05, "learning_rate": 0.00014238726116630937, "loss": 0.0116, "step": 405360 }, { "epoch": 1.05, "learning_rate": 0.0001423833729499379, "loss": 0.0126, "step": 405370 }, { "epoch": 1.05, "learning_rate": 0.00014237948473356645, "loss": 0.0123, "step": 405380 }, { "epoch": 1.05, "learning_rate": 0.000142375596517195, "loss": 0.01, "step": 405390 }, { "epoch": 1.05, "learning_rate": 0.0001423717083008235, "loss": 0.0118, "step": 405400 }, { "epoch": 1.05, "learning_rate": 0.00014236782008445205, "loss": 0.0141, "step": 405410 }, { "epoch": 1.05, "learning_rate": 0.0001423639318680806, "loss": 0.0122, "step": 405420 }, { "epoch": 1.05, "learning_rate": 0.0001423600436517091, "loss": 0.0133, "step": 405430 }, { "epoch": 1.05, "learning_rate": 0.00014235615543533765, "loss": 0.0119, "step": 405440 }, { "epoch": 1.05, "learning_rate": 0.0001423522672189662, "loss": 0.011, "step": 405450 }, { "epoch": 1.05, "learning_rate": 0.00014234837900259473, "loss": 0.011, "step": 405460 }, { "epoch": 1.05, "learning_rate": 0.00014234449078622324, "loss": 0.0124, "step": 405470 }, { "epoch": 1.05, "learning_rate": 0.00014234060256985179, "loss": 0.0097, "step": 405480 }, { "epoch": 1.05, "learning_rate": 0.00014233671435348033, "loss": 0.0121, "step": 405490 }, { "epoch": 1.05, "learning_rate": 0.00014233282613710887, "loss": 0.0109, "step": 405500 }, { "epoch": 1.05, "learning_rate": 0.00014232893792073738, "loss": 0.0128, "step": 405510 }, { "epoch": 1.05, "learning_rate": 0.00014232504970436595, "loss": 0.0092, "step": 405520 }, { "epoch": 1.05, "learning_rate": 0.00014232116148799447, "loss": 0.0108, "step": 405530 }, { "epoch": 1.05, "learning_rate": 0.000142317273271623, "loss": 0.0102, "step": 405540 }, { "epoch": 1.05, "learning_rate": 0.00014231338505525155, "loss": 0.0127, "step": 405550 }, { "epoch": 1.05, "learning_rate": 0.0001423094968388801, "loss": 0.0124, "step": 405560 }, { "epoch": 1.05, "learning_rate": 0.0001423056086225086, "loss": 0.0149, "step": 405570 }, { "epoch": 1.05, "learning_rate": 0.00014230172040613715, "loss": 0.0128, "step": 405580 }, { "epoch": 1.05, "learning_rate": 0.0001422978321897657, "loss": 0.0114, "step": 405590 }, { "epoch": 1.05, "learning_rate": 0.00014229394397339423, "loss": 0.0136, "step": 405600 }, { "epoch": 1.05, "learning_rate": 0.00014229005575702275, "loss": 0.0089, "step": 405610 }, { "epoch": 1.05, "learning_rate": 0.0001422861675406513, "loss": 0.0156, "step": 405620 }, { "epoch": 1.05, "learning_rate": 0.00014228227932427983, "loss": 0.0104, "step": 405630 }, { "epoch": 1.05, "learning_rate": 0.00014227839110790837, "loss": 0.0104, "step": 405640 }, { "epoch": 1.05, "learning_rate": 0.00014227450289153689, "loss": 0.0101, "step": 405650 }, { "epoch": 1.05, "learning_rate": 0.00014227061467516543, "loss": 0.0131, "step": 405660 }, { "epoch": 1.05, "learning_rate": 0.00014226672645879397, "loss": 0.0117, "step": 405670 }, { "epoch": 1.05, "learning_rate": 0.00014226283824242248, "loss": 0.013, "step": 405680 }, { "epoch": 1.05, "learning_rate": 0.00014225895002605105, "loss": 0.0149, "step": 405690 }, { "epoch": 1.05, "learning_rate": 0.00014225506180967957, "loss": 0.0088, "step": 405700 }, { "epoch": 1.05, "learning_rate": 0.0001422511735933081, "loss": 0.0117, "step": 405710 }, { "epoch": 1.05, "learning_rate": 0.00014224728537693665, "loss": 0.0096, "step": 405720 }, { "epoch": 1.05, "learning_rate": 0.0001422433971605652, "loss": 0.0143, "step": 405730 }, { "epoch": 1.05, "learning_rate": 0.0001422395089441937, "loss": 0.0142, "step": 405740 }, { "epoch": 1.05, "learning_rate": 0.00014223562072782225, "loss": 0.0109, "step": 405750 }, { "epoch": 1.05, "learning_rate": 0.0001422317325114508, "loss": 0.0119, "step": 405760 }, { "epoch": 1.05, "learning_rate": 0.00014222784429507933, "loss": 0.0113, "step": 405770 }, { "epoch": 1.05, "learning_rate": 0.00014222395607870785, "loss": 0.0134, "step": 405780 }, { "epoch": 1.05, "learning_rate": 0.0001422200678623364, "loss": 0.0101, "step": 405790 }, { "epoch": 1.05, "learning_rate": 0.00014221617964596493, "loss": 0.011, "step": 405800 }, { "epoch": 1.05, "learning_rate": 0.00014221229142959347, "loss": 0.0123, "step": 405810 }, { "epoch": 1.05, "learning_rate": 0.00014220840321322198, "loss": 0.0114, "step": 405820 }, { "epoch": 1.05, "learning_rate": 0.00014220451499685053, "loss": 0.0109, "step": 405830 }, { "epoch": 1.05, "learning_rate": 0.00014220062678047907, "loss": 0.0121, "step": 405840 }, { "epoch": 1.05, "learning_rate": 0.0001421967385641076, "loss": 0.015, "step": 405850 }, { "epoch": 1.05, "learning_rate": 0.00014219285034773612, "loss": 0.0117, "step": 405860 }, { "epoch": 1.05, "learning_rate": 0.0001421889621313647, "loss": 0.0109, "step": 405870 }, { "epoch": 1.05, "learning_rate": 0.0001421850739149932, "loss": 0.0093, "step": 405880 }, { "epoch": 1.05, "learning_rate": 0.00014218118569862175, "loss": 0.0101, "step": 405890 }, { "epoch": 1.05, "learning_rate": 0.0001421772974822503, "loss": 0.0116, "step": 405900 }, { "epoch": 1.05, "learning_rate": 0.0001421734092658788, "loss": 0.0104, "step": 405910 }, { "epoch": 1.05, "learning_rate": 0.00014216952104950735, "loss": 0.0101, "step": 405920 }, { "epoch": 1.05, "learning_rate": 0.0001421656328331359, "loss": 0.0102, "step": 405930 }, { "epoch": 1.05, "learning_rate": 0.00014216174461676443, "loss": 0.0124, "step": 405940 }, { "epoch": 1.05, "learning_rate": 0.00014215785640039294, "loss": 0.0129, "step": 405950 }, { "epoch": 1.05, "learning_rate": 0.00014215396818402149, "loss": 0.0106, "step": 405960 }, { "epoch": 1.05, "learning_rate": 0.00014215007996765003, "loss": 0.0112, "step": 405970 }, { "epoch": 1.05, "learning_rate": 0.00014214619175127857, "loss": 0.0135, "step": 405980 }, { "epoch": 1.05, "learning_rate": 0.00014214230353490708, "loss": 0.0132, "step": 405990 }, { "epoch": 1.05, "learning_rate": 0.00014213841531853563, "loss": 0.012, "step": 406000 }, { "epoch": 1.05, "eval_cer": 0.8817180823294437, "eval_loss": 0.007497414480894804, "eval_runtime": 107.7608, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 406000 }, { "epoch": 1.05, "learning_rate": 0.00014213452710216417, "loss": 0.0128, "step": 406010 }, { "epoch": 1.05, "learning_rate": 0.0001421306388857927, "loss": 0.0107, "step": 406020 }, { "epoch": 1.05, "learning_rate": 0.00014212675066942122, "loss": 0.0152, "step": 406030 }, { "epoch": 1.05, "learning_rate": 0.0001421228624530498, "loss": 0.0119, "step": 406040 }, { "epoch": 1.05, "learning_rate": 0.0001421189742366783, "loss": 0.0126, "step": 406050 }, { "epoch": 1.05, "learning_rate": 0.00014211508602030685, "loss": 0.0116, "step": 406060 }, { "epoch": 1.05, "learning_rate": 0.0001421111978039354, "loss": 0.0119, "step": 406070 }, { "epoch": 1.05, "learning_rate": 0.00014210730958756393, "loss": 0.0136, "step": 406080 }, { "epoch": 1.05, "learning_rate": 0.00014210342137119245, "loss": 0.0139, "step": 406090 }, { "epoch": 1.05, "learning_rate": 0.000142099533154821, "loss": 0.014, "step": 406100 }, { "epoch": 1.05, "learning_rate": 0.00014209564493844953, "loss": 0.0115, "step": 406110 }, { "epoch": 1.05, "learning_rate": 0.00014209175672207807, "loss": 0.017, "step": 406120 }, { "epoch": 1.05, "learning_rate": 0.00014208786850570659, "loss": 0.0111, "step": 406130 }, { "epoch": 1.05, "learning_rate": 0.00014208398028933513, "loss": 0.0098, "step": 406140 }, { "epoch": 1.05, "learning_rate": 0.00014208009207296367, "loss": 0.0105, "step": 406150 }, { "epoch": 1.05, "learning_rate": 0.00014207620385659218, "loss": 0.011, "step": 406160 }, { "epoch": 1.05, "learning_rate": 0.00014207231564022072, "loss": 0.0116, "step": 406170 }, { "epoch": 1.05, "learning_rate": 0.00014206842742384927, "loss": 0.0132, "step": 406180 }, { "epoch": 1.05, "learning_rate": 0.0001420645392074778, "loss": 0.01, "step": 406190 }, { "epoch": 1.05, "learning_rate": 0.00014206065099110632, "loss": 0.0115, "step": 406200 }, { "epoch": 1.05, "learning_rate": 0.0001420567627747349, "loss": 0.01, "step": 406210 }, { "epoch": 1.05, "learning_rate": 0.0001420528745583634, "loss": 0.011, "step": 406220 }, { "epoch": 1.05, "learning_rate": 0.00014204898634199195, "loss": 0.0161, "step": 406230 }, { "epoch": 1.05, "learning_rate": 0.0001420450981256205, "loss": 0.0157, "step": 406240 }, { "epoch": 1.05, "learning_rate": 0.00014204120990924903, "loss": 0.0112, "step": 406250 }, { "epoch": 1.05, "learning_rate": 0.00014203732169287755, "loss": 0.0123, "step": 406260 }, { "epoch": 1.05, "learning_rate": 0.0001420334334765061, "loss": 0.012, "step": 406270 }, { "epoch": 1.05, "learning_rate": 0.00014202954526013463, "loss": 0.0105, "step": 406280 }, { "epoch": 1.05, "learning_rate": 0.00014202565704376317, "loss": 0.0137, "step": 406290 }, { "epoch": 1.05, "learning_rate": 0.00014202176882739168, "loss": 0.0122, "step": 406300 }, { "epoch": 1.05, "learning_rate": 0.00014201788061102023, "loss": 0.013, "step": 406310 }, { "epoch": 1.05, "learning_rate": 0.00014201399239464877, "loss": 0.0079, "step": 406320 }, { "epoch": 1.05, "learning_rate": 0.0001420101041782773, "loss": 0.0168, "step": 406330 }, { "epoch": 1.05, "learning_rate": 0.00014200621596190582, "loss": 0.0092, "step": 406340 }, { "epoch": 1.05, "learning_rate": 0.00014200232774553437, "loss": 0.0131, "step": 406350 }, { "epoch": 1.05, "learning_rate": 0.0001419984395291629, "loss": 0.0092, "step": 406360 }, { "epoch": 1.05, "learning_rate": 0.00014199455131279145, "loss": 0.0099, "step": 406370 }, { "epoch": 1.05, "learning_rate": 0.00014199066309641996, "loss": 0.0088, "step": 406380 }, { "epoch": 1.05, "learning_rate": 0.00014198677488004853, "loss": 0.0132, "step": 406390 }, { "epoch": 1.05, "learning_rate": 0.00014198288666367705, "loss": 0.0105, "step": 406400 }, { "epoch": 1.05, "learning_rate": 0.0001419789984473056, "loss": 0.0107, "step": 406410 }, { "epoch": 1.05, "learning_rate": 0.00014197511023093413, "loss": 0.0108, "step": 406420 }, { "epoch": 1.05, "learning_rate": 0.00014197122201456264, "loss": 0.0137, "step": 406430 }, { "epoch": 1.05, "learning_rate": 0.0001419673337981912, "loss": 0.012, "step": 406440 }, { "epoch": 1.05, "learning_rate": 0.00014196344558181973, "loss": 0.0148, "step": 406450 }, { "epoch": 1.05, "learning_rate": 0.00014195955736544827, "loss": 0.0118, "step": 406460 }, { "epoch": 1.05, "learning_rate": 0.00014195566914907678, "loss": 0.009, "step": 406470 }, { "epoch": 1.05, "learning_rate": 0.00014195178093270533, "loss": 0.0156, "step": 406480 }, { "epoch": 1.05, "learning_rate": 0.00014194789271633387, "loss": 0.011, "step": 406490 }, { "epoch": 1.05, "learning_rate": 0.0001419440044999624, "loss": 0.0109, "step": 406500 }, { "epoch": 1.05, "learning_rate": 0.00014194011628359092, "loss": 0.0107, "step": 406510 }, { "epoch": 1.05, "learning_rate": 0.00014193622806721947, "loss": 0.0132, "step": 406520 }, { "epoch": 1.05, "learning_rate": 0.000141932339850848, "loss": 0.0116, "step": 406530 }, { "epoch": 1.05, "learning_rate": 0.00014192845163447655, "loss": 0.011, "step": 406540 }, { "epoch": 1.05, "learning_rate": 0.00014192456341810506, "loss": 0.0113, "step": 406550 }, { "epoch": 1.05, "learning_rate": 0.00014192067520173363, "loss": 0.0112, "step": 406560 }, { "epoch": 1.05, "learning_rate": 0.00014191678698536215, "loss": 0.0099, "step": 406570 }, { "epoch": 1.05, "learning_rate": 0.0001419128987689907, "loss": 0.013, "step": 406580 }, { "epoch": 1.05, "learning_rate": 0.00014190901055261923, "loss": 0.0127, "step": 406590 }, { "epoch": 1.05, "learning_rate": 0.00014190512233624777, "loss": 0.0097, "step": 406600 }, { "epoch": 1.05, "learning_rate": 0.00014190123411987629, "loss": 0.0116, "step": 406610 }, { "epoch": 1.05, "learning_rate": 0.00014189734590350483, "loss": 0.0133, "step": 406620 }, { "epoch": 1.05, "learning_rate": 0.00014189345768713337, "loss": 0.0106, "step": 406630 }, { "epoch": 1.05, "learning_rate": 0.0001418895694707619, "loss": 0.0105, "step": 406640 }, { "epoch": 1.05, "learning_rate": 0.00014188568125439043, "loss": 0.0132, "step": 406650 }, { "epoch": 1.05, "learning_rate": 0.00014188179303801897, "loss": 0.0108, "step": 406660 }, { "epoch": 1.05, "learning_rate": 0.0001418779048216475, "loss": 0.0167, "step": 406670 }, { "epoch": 1.05, "learning_rate": 0.00014187401660527602, "loss": 0.0084, "step": 406680 }, { "epoch": 1.05, "learning_rate": 0.00014187012838890456, "loss": 0.0105, "step": 406690 }, { "epoch": 1.05, "learning_rate": 0.0001418662401725331, "loss": 0.0094, "step": 406700 }, { "epoch": 1.05, "learning_rate": 0.00014186235195616165, "loss": 0.0116, "step": 406710 }, { "epoch": 1.05, "learning_rate": 0.00014185846373979016, "loss": 0.0113, "step": 406720 }, { "epoch": 1.05, "learning_rate": 0.0001418545755234187, "loss": 0.0139, "step": 406730 }, { "epoch": 1.05, "learning_rate": 0.00014185068730704725, "loss": 0.0092, "step": 406740 }, { "epoch": 1.05, "learning_rate": 0.0001418467990906758, "loss": 0.0123, "step": 406750 }, { "epoch": 1.05, "learning_rate": 0.00014184291087430433, "loss": 0.0134, "step": 406760 }, { "epoch": 1.05, "learning_rate": 0.00014183902265793287, "loss": 0.0106, "step": 406770 }, { "epoch": 1.05, "learning_rate": 0.00014183513444156139, "loss": 0.0132, "step": 406780 }, { "epoch": 1.05, "learning_rate": 0.00014183124622518993, "loss": 0.0121, "step": 406790 }, { "epoch": 1.05, "learning_rate": 0.00014182735800881847, "loss": 0.0104, "step": 406800 }, { "epoch": 1.05, "learning_rate": 0.000141823469792447, "loss": 0.0101, "step": 406810 }, { "epoch": 1.05, "learning_rate": 0.00014181958157607552, "loss": 0.0115, "step": 406820 }, { "epoch": 1.05, "learning_rate": 0.00014181569335970407, "loss": 0.0159, "step": 406830 }, { "epoch": 1.05, "learning_rate": 0.0001418118051433326, "loss": 0.0128, "step": 406840 }, { "epoch": 1.05, "learning_rate": 0.00014180791692696115, "loss": 0.0097, "step": 406850 }, { "epoch": 1.05, "learning_rate": 0.00014180402871058966, "loss": 0.0114, "step": 406860 }, { "epoch": 1.05, "learning_rate": 0.0001418001404942182, "loss": 0.0098, "step": 406870 }, { "epoch": 1.05, "learning_rate": 0.00014179625227784675, "loss": 0.0156, "step": 406880 }, { "epoch": 1.05, "learning_rate": 0.0001417923640614753, "loss": 0.0132, "step": 406890 }, { "epoch": 1.05, "learning_rate": 0.0001417884758451038, "loss": 0.0096, "step": 406900 }, { "epoch": 1.05, "learning_rate": 0.00014178458762873235, "loss": 0.0116, "step": 406910 }, { "epoch": 1.05, "learning_rate": 0.0001417806994123609, "loss": 0.0162, "step": 406920 }, { "epoch": 1.05, "learning_rate": 0.0001417768111959894, "loss": 0.0105, "step": 406930 }, { "epoch": 1.05, "learning_rate": 0.00014177292297961797, "loss": 0.0137, "step": 406940 }, { "epoch": 1.05, "learning_rate": 0.00014176903476324648, "loss": 0.0141, "step": 406950 }, { "epoch": 1.05, "learning_rate": 0.00014176514654687503, "loss": 0.0113, "step": 406960 }, { "epoch": 1.05, "learning_rate": 0.00014176125833050357, "loss": 0.0116, "step": 406970 }, { "epoch": 1.05, "learning_rate": 0.0001417573701141321, "loss": 0.0102, "step": 406980 }, { "epoch": 1.05, "learning_rate": 0.00014175348189776062, "loss": 0.0113, "step": 406990 }, { "epoch": 1.06, "learning_rate": 0.00014174959368138917, "loss": 0.013, "step": 407000 }, { "epoch": 1.06, "eval_cer": 0.8816830914060892, "eval_loss": 0.007594889495521784, "eval_runtime": 107.3439, "eval_samples_per_second": 18.632, "eval_steps_per_second": 4.658, "step": 407000 }, { "epoch": 1.06, "learning_rate": 0.0001417457054650177, "loss": 0.0087, "step": 407010 }, { "epoch": 1.06, "learning_rate": 0.00014174181724864625, "loss": 0.0162, "step": 407020 }, { "epoch": 1.06, "learning_rate": 0.00014173792903227476, "loss": 0.0139, "step": 407030 }, { "epoch": 1.06, "learning_rate": 0.0001417340408159033, "loss": 0.0108, "step": 407040 }, { "epoch": 1.06, "learning_rate": 0.00014173015259953185, "loss": 0.014, "step": 407050 }, { "epoch": 1.06, "learning_rate": 0.0001417262643831604, "loss": 0.0138, "step": 407060 }, { "epoch": 1.06, "learning_rate": 0.0001417223761667889, "loss": 0.0109, "step": 407070 }, { "epoch": 1.06, "learning_rate": 0.00014171848795041747, "loss": 0.0123, "step": 407080 }, { "epoch": 1.06, "learning_rate": 0.00014171459973404599, "loss": 0.0127, "step": 407090 }, { "epoch": 1.06, "learning_rate": 0.00014171071151767453, "loss": 0.0178, "step": 407100 }, { "epoch": 1.06, "learning_rate": 0.00014170682330130307, "loss": 0.0093, "step": 407110 }, { "epoch": 1.06, "learning_rate": 0.0001417029350849316, "loss": 0.0131, "step": 407120 }, { "epoch": 1.06, "learning_rate": 0.00014169904686856013, "loss": 0.0124, "step": 407130 }, { "epoch": 1.06, "learning_rate": 0.00014169515865218867, "loss": 0.013, "step": 407140 }, { "epoch": 1.06, "learning_rate": 0.0001416912704358172, "loss": 0.0113, "step": 407150 }, { "epoch": 1.06, "learning_rate": 0.00014168738221944572, "loss": 0.0101, "step": 407160 }, { "epoch": 1.06, "learning_rate": 0.00014168349400307427, "loss": 0.0139, "step": 407170 }, { "epoch": 1.06, "learning_rate": 0.0001416796057867028, "loss": 0.0121, "step": 407180 }, { "epoch": 1.06, "learning_rate": 0.00014167571757033135, "loss": 0.0101, "step": 407190 }, { "epoch": 1.06, "learning_rate": 0.00014167182935395986, "loss": 0.0114, "step": 407200 }, { "epoch": 1.06, "learning_rate": 0.0001416679411375884, "loss": 0.0149, "step": 407210 }, { "epoch": 1.06, "learning_rate": 0.00014166405292121695, "loss": 0.0091, "step": 407220 }, { "epoch": 1.06, "learning_rate": 0.0001416601647048455, "loss": 0.0167, "step": 407230 }, { "epoch": 1.06, "learning_rate": 0.000141656276488474, "loss": 0.0107, "step": 407240 }, { "epoch": 1.06, "learning_rate": 0.00014165238827210254, "loss": 0.016, "step": 407250 }, { "epoch": 1.06, "learning_rate": 0.00014164850005573109, "loss": 0.0173, "step": 407260 }, { "epoch": 1.06, "learning_rate": 0.00014164461183935963, "loss": 0.0087, "step": 407270 }, { "epoch": 1.06, "learning_rate": 0.00014164072362298817, "loss": 0.0141, "step": 407280 }, { "epoch": 1.06, "learning_rate": 0.0001416368354066167, "loss": 0.0083, "step": 407290 }, { "epoch": 1.06, "learning_rate": 0.00014163294719024523, "loss": 0.0132, "step": 407300 }, { "epoch": 1.06, "learning_rate": 0.00014162905897387377, "loss": 0.0146, "step": 407310 }, { "epoch": 1.06, "learning_rate": 0.0001416251707575023, "loss": 0.0137, "step": 407320 }, { "epoch": 1.06, "learning_rate": 0.00014162128254113085, "loss": 0.0131, "step": 407330 }, { "epoch": 1.06, "learning_rate": 0.00014161739432475936, "loss": 0.0123, "step": 407340 }, { "epoch": 1.06, "learning_rate": 0.0001416135061083879, "loss": 0.011, "step": 407350 }, { "epoch": 1.06, "learning_rate": 0.00014160961789201645, "loss": 0.0142, "step": 407360 }, { "epoch": 1.06, "learning_rate": 0.000141605729675645, "loss": 0.0123, "step": 407370 }, { "epoch": 1.06, "learning_rate": 0.0001416018414592735, "loss": 0.0114, "step": 407380 }, { "epoch": 1.06, "learning_rate": 0.00014159795324290205, "loss": 0.0137, "step": 407390 }, { "epoch": 1.06, "learning_rate": 0.0001415940650265306, "loss": 0.0129, "step": 407400 }, { "epoch": 1.06, "learning_rate": 0.0001415901768101591, "loss": 0.0157, "step": 407410 }, { "epoch": 1.06, "learning_rate": 0.00014158628859378764, "loss": 0.0139, "step": 407420 }, { "epoch": 1.06, "learning_rate": 0.00014158240037741619, "loss": 0.0131, "step": 407430 }, { "epoch": 1.06, "learning_rate": 0.00014157851216104473, "loss": 0.0113, "step": 407440 }, { "epoch": 1.06, "learning_rate": 0.00014157462394467324, "loss": 0.0114, "step": 407450 }, { "epoch": 1.06, "learning_rate": 0.0001415707357283018, "loss": 0.0119, "step": 407460 }, { "epoch": 1.06, "learning_rate": 0.00014156684751193032, "loss": 0.0183, "step": 407470 }, { "epoch": 1.06, "learning_rate": 0.00014156295929555887, "loss": 0.0099, "step": 407480 }, { "epoch": 1.06, "learning_rate": 0.0001415590710791874, "loss": 0.0103, "step": 407490 }, { "epoch": 1.06, "learning_rate": 0.00014155518286281595, "loss": 0.012, "step": 407500 }, { "epoch": 1.06, "learning_rate": 0.00014155129464644446, "loss": 0.0117, "step": 407510 }, { "epoch": 1.06, "learning_rate": 0.000141547406430073, "loss": 0.0112, "step": 407520 }, { "epoch": 1.06, "learning_rate": 0.00014154351821370155, "loss": 0.0108, "step": 407530 }, { "epoch": 1.06, "learning_rate": 0.0001415396299973301, "loss": 0.0098, "step": 407540 }, { "epoch": 1.06, "learning_rate": 0.0001415357417809586, "loss": 0.0096, "step": 407550 }, { "epoch": 1.06, "learning_rate": 0.00014153185356458715, "loss": 0.0111, "step": 407560 }, { "epoch": 1.06, "learning_rate": 0.0001415279653482157, "loss": 0.0113, "step": 407570 }, { "epoch": 1.06, "learning_rate": 0.00014152407713184423, "loss": 0.0106, "step": 407580 }, { "epoch": 1.06, "learning_rate": 0.00014152018891547274, "loss": 0.0091, "step": 407590 }, { "epoch": 1.06, "learning_rate": 0.00014151630069910128, "loss": 0.0131, "step": 407600 }, { "epoch": 1.06, "learning_rate": 0.00014151241248272983, "loss": 0.0143, "step": 407610 }, { "epoch": 1.06, "learning_rate": 0.00014150852426635837, "loss": 0.0101, "step": 407620 }, { "epoch": 1.06, "learning_rate": 0.0001415046360499869, "loss": 0.01, "step": 407630 }, { "epoch": 1.06, "learning_rate": 0.00014150074783361542, "loss": 0.0109, "step": 407640 }, { "epoch": 1.06, "learning_rate": 0.00014149685961724397, "loss": 0.0154, "step": 407650 }, { "epoch": 1.06, "learning_rate": 0.0001414929714008725, "loss": 0.0113, "step": 407660 }, { "epoch": 1.06, "learning_rate": 0.00014148908318450105, "loss": 0.012, "step": 407670 }, { "epoch": 1.06, "learning_rate": 0.00014148519496812956, "loss": 0.0108, "step": 407680 }, { "epoch": 1.06, "learning_rate": 0.0001414813067517581, "loss": 0.0128, "step": 407690 }, { "epoch": 1.06, "learning_rate": 0.00014147741853538665, "loss": 0.0078, "step": 407700 }, { "epoch": 1.06, "learning_rate": 0.0001414735303190152, "loss": 0.0108, "step": 407710 }, { "epoch": 1.06, "learning_rate": 0.0001414696421026437, "loss": 0.0106, "step": 407720 }, { "epoch": 1.06, "learning_rate": 0.00014146575388627224, "loss": 0.0113, "step": 407730 }, { "epoch": 1.06, "learning_rate": 0.00014146186566990079, "loss": 0.0105, "step": 407740 }, { "epoch": 1.06, "learning_rate": 0.00014145797745352933, "loss": 0.012, "step": 407750 }, { "epoch": 1.06, "learning_rate": 0.00014145408923715784, "loss": 0.0097, "step": 407760 }, { "epoch": 1.06, "learning_rate": 0.00014145020102078638, "loss": 0.0098, "step": 407770 }, { "epoch": 1.06, "learning_rate": 0.00014144631280441493, "loss": 0.0126, "step": 407780 }, { "epoch": 1.06, "learning_rate": 0.00014144242458804347, "loss": 0.0087, "step": 407790 }, { "epoch": 1.06, "learning_rate": 0.00014143853637167198, "loss": 0.0118, "step": 407800 }, { "epoch": 1.06, "learning_rate": 0.00014143464815530055, "loss": 0.0077, "step": 407810 }, { "epoch": 1.06, "learning_rate": 0.00014143075993892907, "loss": 0.0144, "step": 407820 }, { "epoch": 1.06, "learning_rate": 0.0001414268717225576, "loss": 0.0117, "step": 407830 }, { "epoch": 1.06, "learning_rate": 0.00014142298350618615, "loss": 0.0113, "step": 407840 }, { "epoch": 1.06, "learning_rate": 0.0001414190952898147, "loss": 0.0144, "step": 407850 }, { "epoch": 1.06, "learning_rate": 0.0001414152070734432, "loss": 0.0116, "step": 407860 }, { "epoch": 1.06, "learning_rate": 0.00014141131885707175, "loss": 0.0131, "step": 407870 }, { "epoch": 1.06, "learning_rate": 0.0001414074306407003, "loss": 0.0109, "step": 407880 }, { "epoch": 1.06, "learning_rate": 0.0001414035424243288, "loss": 0.0107, "step": 407890 }, { "epoch": 1.06, "learning_rate": 0.00014139965420795734, "loss": 0.0107, "step": 407900 }, { "epoch": 1.06, "learning_rate": 0.00014139576599158589, "loss": 0.0117, "step": 407910 }, { "epoch": 1.06, "learning_rate": 0.00014139187777521443, "loss": 0.0098, "step": 407920 }, { "epoch": 1.06, "learning_rate": 0.00014138798955884294, "loss": 0.0131, "step": 407930 }, { "epoch": 1.06, "learning_rate": 0.00014138410134247148, "loss": 0.0137, "step": 407940 }, { "epoch": 1.06, "learning_rate": 0.00014138021312610003, "loss": 0.0132, "step": 407950 }, { "epoch": 1.06, "learning_rate": 0.00014137632490972857, "loss": 0.0112, "step": 407960 }, { "epoch": 1.06, "learning_rate": 0.00014137243669335708, "loss": 0.0102, "step": 407970 }, { "epoch": 1.06, "learning_rate": 0.00014136854847698565, "loss": 0.0101, "step": 407980 }, { "epoch": 1.06, "learning_rate": 0.00014136466026061416, "loss": 0.0118, "step": 407990 }, { "epoch": 1.06, "learning_rate": 0.0001413607720442427, "loss": 0.0123, "step": 408000 }, { "epoch": 1.06, "eval_cer": 0.8817292794249172, "eval_loss": 0.007572217844426632, "eval_runtime": 107.5486, "eval_samples_per_second": 18.596, "eval_steps_per_second": 4.649, "step": 408000 }, { "epoch": 1.06, "learning_rate": 0.00014135688382787125, "loss": 0.0114, "step": 408010 }, { "epoch": 1.06, "learning_rate": 0.0001413529956114998, "loss": 0.0106, "step": 408020 }, { "epoch": 1.06, "learning_rate": 0.0001413491073951283, "loss": 0.0138, "step": 408030 }, { "epoch": 1.06, "learning_rate": 0.00014134521917875685, "loss": 0.0118, "step": 408040 }, { "epoch": 1.06, "learning_rate": 0.0001413413309623854, "loss": 0.0105, "step": 408050 }, { "epoch": 1.06, "learning_rate": 0.00014133744274601393, "loss": 0.0108, "step": 408060 }, { "epoch": 1.06, "learning_rate": 0.00014133355452964244, "loss": 0.0114, "step": 408070 }, { "epoch": 1.06, "learning_rate": 0.00014132966631327099, "loss": 0.0082, "step": 408080 }, { "epoch": 1.06, "learning_rate": 0.00014132577809689953, "loss": 0.0138, "step": 408090 }, { "epoch": 1.06, "learning_rate": 0.00014132188988052807, "loss": 0.0126, "step": 408100 }, { "epoch": 1.06, "learning_rate": 0.00014131800166415658, "loss": 0.0133, "step": 408110 }, { "epoch": 1.06, "learning_rate": 0.00014131411344778512, "loss": 0.0138, "step": 408120 }, { "epoch": 1.06, "learning_rate": 0.00014131022523141367, "loss": 0.0125, "step": 408130 }, { "epoch": 1.06, "learning_rate": 0.00014130633701504218, "loss": 0.013, "step": 408140 }, { "epoch": 1.06, "learning_rate": 0.00014130244879867075, "loss": 0.011, "step": 408150 }, { "epoch": 1.06, "learning_rate": 0.00014129856058229926, "loss": 0.0096, "step": 408160 }, { "epoch": 1.06, "learning_rate": 0.0001412946723659278, "loss": 0.0136, "step": 408170 }, { "epoch": 1.06, "learning_rate": 0.00014129078414955635, "loss": 0.0118, "step": 408180 }, { "epoch": 1.06, "learning_rate": 0.0001412868959331849, "loss": 0.0135, "step": 408190 }, { "epoch": 1.06, "learning_rate": 0.0001412830077168134, "loss": 0.0132, "step": 408200 }, { "epoch": 1.06, "learning_rate": 0.00014127911950044195, "loss": 0.0131, "step": 408210 }, { "epoch": 1.06, "learning_rate": 0.0001412752312840705, "loss": 0.0093, "step": 408220 }, { "epoch": 1.06, "learning_rate": 0.00014127134306769903, "loss": 0.0148, "step": 408230 }, { "epoch": 1.06, "learning_rate": 0.00014126745485132754, "loss": 0.0232, "step": 408240 }, { "epoch": 1.06, "learning_rate": 0.00014126356663495608, "loss": 0.0235, "step": 408250 }, { "epoch": 1.06, "learning_rate": 0.00014125967841858463, "loss": 0.0115, "step": 408260 }, { "epoch": 1.06, "learning_rate": 0.00014125579020221317, "loss": 0.0107, "step": 408270 }, { "epoch": 1.06, "learning_rate": 0.00014125190198584168, "loss": 0.0121, "step": 408280 }, { "epoch": 1.06, "learning_rate": 0.00014124801376947022, "loss": 0.0111, "step": 408290 }, { "epoch": 1.06, "learning_rate": 0.00014124412555309877, "loss": 0.0127, "step": 408300 }, { "epoch": 1.06, "learning_rate": 0.0001412402373367273, "loss": 0.0107, "step": 408310 }, { "epoch": 1.06, "learning_rate": 0.00014123634912035582, "loss": 0.0079, "step": 408320 }, { "epoch": 1.06, "learning_rate": 0.0001412324609039844, "loss": 0.017, "step": 408330 }, { "epoch": 1.06, "learning_rate": 0.0001412285726876129, "loss": 0.0157, "step": 408340 }, { "epoch": 1.06, "learning_rate": 0.00014122468447124145, "loss": 0.008, "step": 408350 }, { "epoch": 1.06, "learning_rate": 0.00014122079625487, "loss": 0.0131, "step": 408360 }, { "epoch": 1.06, "learning_rate": 0.00014121690803849853, "loss": 0.0136, "step": 408370 }, { "epoch": 1.06, "learning_rate": 0.00014121301982212704, "loss": 0.0107, "step": 408380 }, { "epoch": 1.06, "learning_rate": 0.00014120913160575559, "loss": 0.0105, "step": 408390 }, { "epoch": 1.06, "learning_rate": 0.00014120524338938413, "loss": 0.0094, "step": 408400 }, { "epoch": 1.06, "learning_rate": 0.00014120135517301264, "loss": 0.0084, "step": 408410 }, { "epoch": 1.06, "learning_rate": 0.00014119746695664118, "loss": 0.0101, "step": 408420 }, { "epoch": 1.06, "learning_rate": 0.00014119357874026973, "loss": 0.0112, "step": 408430 }, { "epoch": 1.06, "learning_rate": 0.00014118969052389827, "loss": 0.0124, "step": 408440 }, { "epoch": 1.06, "learning_rate": 0.00014118580230752678, "loss": 0.0142, "step": 408450 }, { "epoch": 1.06, "learning_rate": 0.00014118191409115532, "loss": 0.0113, "step": 408460 }, { "epoch": 1.06, "learning_rate": 0.00014117802587478387, "loss": 0.012, "step": 408470 }, { "epoch": 1.06, "learning_rate": 0.0001411741376584124, "loss": 0.0104, "step": 408480 }, { "epoch": 1.06, "learning_rate": 0.00014117024944204092, "loss": 0.0113, "step": 408490 }, { "epoch": 1.06, "learning_rate": 0.0001411663612256695, "loss": 0.0148, "step": 408500 }, { "epoch": 1.06, "learning_rate": 0.000141162473009298, "loss": 0.0112, "step": 408510 }, { "epoch": 1.06, "learning_rate": 0.00014115858479292655, "loss": 0.0114, "step": 408520 }, { "epoch": 1.06, "learning_rate": 0.0001411546965765551, "loss": 0.0106, "step": 408530 }, { "epoch": 1.06, "learning_rate": 0.00014115080836018363, "loss": 0.0089, "step": 408540 }, { "epoch": 1.06, "learning_rate": 0.00014114692014381214, "loss": 0.0146, "step": 408550 }, { "epoch": 1.06, "learning_rate": 0.00014114303192744069, "loss": 0.0118, "step": 408560 }, { "epoch": 1.06, "learning_rate": 0.00014113914371106923, "loss": 0.0089, "step": 408570 }, { "epoch": 1.06, "learning_rate": 0.00014113525549469777, "loss": 0.0123, "step": 408580 }, { "epoch": 1.06, "learning_rate": 0.00014113136727832628, "loss": 0.0141, "step": 408590 }, { "epoch": 1.06, "learning_rate": 0.00014112747906195483, "loss": 0.0107, "step": 408600 }, { "epoch": 1.06, "learning_rate": 0.00014112359084558337, "loss": 0.0108, "step": 408610 }, { "epoch": 1.06, "learning_rate": 0.0001411197026292119, "loss": 0.0107, "step": 408620 }, { "epoch": 1.06, "learning_rate": 0.00014111581441284042, "loss": 0.0113, "step": 408630 }, { "epoch": 1.06, "learning_rate": 0.00014111192619646896, "loss": 0.0109, "step": 408640 }, { "epoch": 1.06, "learning_rate": 0.0001411080379800975, "loss": 0.0093, "step": 408650 }, { "epoch": 1.06, "learning_rate": 0.00014110414976372602, "loss": 0.011, "step": 408660 }, { "epoch": 1.06, "learning_rate": 0.0001411002615473546, "loss": 0.011, "step": 408670 }, { "epoch": 1.06, "learning_rate": 0.0001410963733309831, "loss": 0.01, "step": 408680 }, { "epoch": 1.06, "learning_rate": 0.00014109248511461165, "loss": 0.0129, "step": 408690 }, { "epoch": 1.06, "learning_rate": 0.0001410885968982402, "loss": 0.0113, "step": 408700 }, { "epoch": 1.06, "learning_rate": 0.00014108470868186873, "loss": 0.0203, "step": 408710 }, { "epoch": 1.06, "learning_rate": 0.00014108082046549724, "loss": 0.0108, "step": 408720 }, { "epoch": 1.06, "learning_rate": 0.00014107693224912579, "loss": 0.0159, "step": 408730 }, { "epoch": 1.06, "learning_rate": 0.00014107304403275433, "loss": 0.0116, "step": 408740 }, { "epoch": 1.06, "learning_rate": 0.00014106915581638287, "loss": 0.0095, "step": 408750 }, { "epoch": 1.06, "learning_rate": 0.00014106526760001138, "loss": 0.0102, "step": 408760 }, { "epoch": 1.06, "learning_rate": 0.00014106137938363992, "loss": 0.0127, "step": 408770 }, { "epoch": 1.06, "learning_rate": 0.00014105749116726847, "loss": 0.0146, "step": 408780 }, { "epoch": 1.06, "learning_rate": 0.000141053602950897, "loss": 0.0101, "step": 408790 }, { "epoch": 1.06, "learning_rate": 0.00014104971473452552, "loss": 0.0122, "step": 408800 }, { "epoch": 1.06, "learning_rate": 0.00014104582651815406, "loss": 0.0124, "step": 408810 }, { "epoch": 1.06, "learning_rate": 0.0001410419383017826, "loss": 0.0116, "step": 408820 }, { "epoch": 1.06, "learning_rate": 0.00014103805008541115, "loss": 0.012, "step": 408830 }, { "epoch": 1.06, "learning_rate": 0.00014103416186903966, "loss": 0.0126, "step": 408840 }, { "epoch": 1.06, "learning_rate": 0.00014103027365266823, "loss": 0.011, "step": 408850 }, { "epoch": 1.06, "learning_rate": 0.00014102638543629675, "loss": 0.0142, "step": 408860 }, { "epoch": 1.06, "learning_rate": 0.0001410224972199253, "loss": 0.0117, "step": 408870 }, { "epoch": 1.06, "learning_rate": 0.00014101860900355383, "loss": 0.0111, "step": 408880 }, { "epoch": 1.06, "learning_rate": 0.00014101472078718234, "loss": 0.0107, "step": 408890 }, { "epoch": 1.06, "learning_rate": 0.00014101083257081088, "loss": 0.0111, "step": 408900 }, { "epoch": 1.06, "learning_rate": 0.00014100694435443943, "loss": 0.0112, "step": 408910 }, { "epoch": 1.06, "learning_rate": 0.00014100305613806797, "loss": 0.0084, "step": 408920 }, { "epoch": 1.06, "learning_rate": 0.00014099916792169648, "loss": 0.0113, "step": 408930 }, { "epoch": 1.06, "learning_rate": 0.00014099527970532502, "loss": 0.01, "step": 408940 }, { "epoch": 1.06, "learning_rate": 0.00014099139148895357, "loss": 0.0087, "step": 408950 }, { "epoch": 1.06, "learning_rate": 0.0001409875032725821, "loss": 0.0111, "step": 408960 }, { "epoch": 1.06, "learning_rate": 0.00014098361505621062, "loss": 0.0098, "step": 408970 }, { "epoch": 1.06, "learning_rate": 0.00014097972683983916, "loss": 0.013, "step": 408980 }, { "epoch": 1.06, "learning_rate": 0.0001409758386234677, "loss": 0.0111, "step": 408990 }, { "epoch": 1.06, "learning_rate": 0.00014097195040709625, "loss": 0.0106, "step": 409000 }, { "epoch": 1.06, "eval_cer": 0.8817390768834564, "eval_loss": 0.007736441679298878, "eval_runtime": 107.4459, "eval_samples_per_second": 18.614, "eval_steps_per_second": 4.654, "step": 409000 }, { "epoch": 1.06, "learning_rate": 0.00014096806219072476, "loss": 0.0107, "step": 409010 }, { "epoch": 1.06, "learning_rate": 0.00014096417397435333, "loss": 0.0108, "step": 409020 }, { "epoch": 1.06, "learning_rate": 0.00014096028575798184, "loss": 0.0295, "step": 409030 }, { "epoch": 1.06, "learning_rate": 0.00014095639754161039, "loss": 0.0122, "step": 409040 }, { "epoch": 1.06, "learning_rate": 0.00014095250932523893, "loss": 0.0106, "step": 409050 }, { "epoch": 1.06, "learning_rate": 0.00014094862110886747, "loss": 0.0121, "step": 409060 }, { "epoch": 1.06, "learning_rate": 0.00014094473289249598, "loss": 0.0162, "step": 409070 }, { "epoch": 1.06, "learning_rate": 0.00014094084467612453, "loss": 0.0128, "step": 409080 }, { "epoch": 1.06, "learning_rate": 0.00014093695645975307, "loss": 0.0122, "step": 409090 }, { "epoch": 1.06, "learning_rate": 0.0001409330682433816, "loss": 0.0106, "step": 409100 }, { "epoch": 1.06, "learning_rate": 0.00014092918002701012, "loss": 0.0108, "step": 409110 }, { "epoch": 1.06, "learning_rate": 0.00014092529181063866, "loss": 0.0102, "step": 409120 }, { "epoch": 1.06, "learning_rate": 0.0001409214035942672, "loss": 0.0117, "step": 409130 }, { "epoch": 1.06, "learning_rate": 0.00014091751537789572, "loss": 0.0119, "step": 409140 }, { "epoch": 1.06, "learning_rate": 0.00014091362716152426, "loss": 0.0117, "step": 409150 }, { "epoch": 1.06, "learning_rate": 0.0001409097389451528, "loss": 0.0105, "step": 409160 }, { "epoch": 1.06, "learning_rate": 0.00014090585072878135, "loss": 0.0118, "step": 409170 }, { "epoch": 1.06, "learning_rate": 0.00014090196251240986, "loss": 0.0094, "step": 409180 }, { "epoch": 1.06, "learning_rate": 0.0001408980742960384, "loss": 0.0104, "step": 409190 }, { "epoch": 1.06, "learning_rate": 0.00014089418607966694, "loss": 0.013, "step": 409200 }, { "epoch": 1.06, "learning_rate": 0.00014089029786329549, "loss": 0.0082, "step": 409210 }, { "epoch": 1.06, "learning_rate": 0.00014088640964692403, "loss": 0.0119, "step": 409220 }, { "epoch": 1.06, "learning_rate": 0.00014088252143055257, "loss": 0.011, "step": 409230 }, { "epoch": 1.06, "learning_rate": 0.00014087863321418108, "loss": 0.0126, "step": 409240 }, { "epoch": 1.06, "learning_rate": 0.00014087474499780962, "loss": 0.0122, "step": 409250 }, { "epoch": 1.06, "learning_rate": 0.00014087085678143817, "loss": 0.0097, "step": 409260 }, { "epoch": 1.06, "learning_rate": 0.0001408669685650667, "loss": 0.0118, "step": 409270 }, { "epoch": 1.06, "learning_rate": 0.00014086308034869522, "loss": 0.0099, "step": 409280 }, { "epoch": 1.06, "learning_rate": 0.00014085919213232376, "loss": 0.0092, "step": 409290 }, { "epoch": 1.06, "learning_rate": 0.0001408553039159523, "loss": 0.0106, "step": 409300 }, { "epoch": 1.06, "learning_rate": 0.00014085141569958085, "loss": 0.0134, "step": 409310 }, { "epoch": 1.06, "learning_rate": 0.00014084752748320936, "loss": 0.0134, "step": 409320 }, { "epoch": 1.06, "learning_rate": 0.0001408436392668379, "loss": 0.0091, "step": 409330 }, { "epoch": 1.06, "learning_rate": 0.00014083975105046645, "loss": 0.014, "step": 409340 }, { "epoch": 1.06, "learning_rate": 0.000140835862834095, "loss": 0.0096, "step": 409350 }, { "epoch": 1.06, "learning_rate": 0.0001408319746177235, "loss": 0.0096, "step": 409360 }, { "epoch": 1.06, "learning_rate": 0.00014082808640135207, "loss": 0.009, "step": 409370 }, { "epoch": 1.06, "learning_rate": 0.00014082419818498058, "loss": 0.0101, "step": 409380 }, { "epoch": 1.06, "learning_rate": 0.0001408203099686091, "loss": 0.0122, "step": 409390 }, { "epoch": 1.06, "learning_rate": 0.00014081642175223767, "loss": 0.0096, "step": 409400 }, { "epoch": 1.06, "learning_rate": 0.00014081253353586618, "loss": 0.0122, "step": 409410 }, { "epoch": 1.06, "learning_rate": 0.00014080864531949472, "loss": 0.0091, "step": 409420 }, { "epoch": 1.06, "learning_rate": 0.00014080475710312327, "loss": 0.0134, "step": 409430 }, { "epoch": 1.06, "learning_rate": 0.0001408008688867518, "loss": 0.0109, "step": 409440 }, { "epoch": 1.06, "learning_rate": 0.00014079698067038032, "loss": 0.011, "step": 409450 }, { "epoch": 1.06, "learning_rate": 0.00014079309245400886, "loss": 0.0118, "step": 409460 }, { "epoch": 1.06, "learning_rate": 0.0001407892042376374, "loss": 0.0158, "step": 409470 }, { "epoch": 1.06, "learning_rate": 0.00014078531602126595, "loss": 0.0095, "step": 409480 }, { "epoch": 1.06, "learning_rate": 0.00014078142780489446, "loss": 0.0161, "step": 409490 }, { "epoch": 1.06, "learning_rate": 0.000140777539588523, "loss": 0.0106, "step": 409500 }, { "epoch": 1.06, "learning_rate": 0.00014077365137215154, "loss": 0.0097, "step": 409510 }, { "epoch": 1.06, "learning_rate": 0.0001407697631557801, "loss": 0.0137, "step": 409520 }, { "epoch": 1.06, "learning_rate": 0.0001407658749394086, "loss": 0.0104, "step": 409530 }, { "epoch": 1.06, "learning_rate": 0.00014076198672303717, "loss": 0.011, "step": 409540 }, { "epoch": 1.06, "learning_rate": 0.00014075809850666568, "loss": 0.0114, "step": 409550 }, { "epoch": 1.06, "learning_rate": 0.00014075421029029423, "loss": 0.011, "step": 409560 }, { "epoch": 1.06, "learning_rate": 0.00014075032207392277, "loss": 0.0125, "step": 409570 }, { "epoch": 1.06, "learning_rate": 0.0001407464338575513, "loss": 0.0103, "step": 409580 }, { "epoch": 1.06, "learning_rate": 0.00014074254564117982, "loss": 0.0114, "step": 409590 }, { "epoch": 1.06, "learning_rate": 0.00014073865742480837, "loss": 0.0117, "step": 409600 }, { "epoch": 1.06, "learning_rate": 0.0001407347692084369, "loss": 0.0157, "step": 409610 }, { "epoch": 1.06, "learning_rate": 0.00014073088099206545, "loss": 0.0108, "step": 409620 }, { "epoch": 1.06, "learning_rate": 0.00014072699277569396, "loss": 0.0106, "step": 409630 }, { "epoch": 1.06, "learning_rate": 0.0001407231045593225, "loss": 0.0162, "step": 409640 }, { "epoch": 1.06, "learning_rate": 0.00014071921634295105, "loss": 0.0152, "step": 409650 }, { "epoch": 1.06, "learning_rate": 0.00014071532812657956, "loss": 0.0097, "step": 409660 }, { "epoch": 1.06, "learning_rate": 0.0001407114399102081, "loss": 0.0128, "step": 409670 }, { "epoch": 1.06, "learning_rate": 0.00014070755169383664, "loss": 0.0119, "step": 409680 }, { "epoch": 1.06, "learning_rate": 0.00014070366347746519, "loss": 0.0112, "step": 409690 }, { "epoch": 1.06, "learning_rate": 0.0001406997752610937, "loss": 0.0118, "step": 409700 }, { "epoch": 1.06, "learning_rate": 0.00014069588704472224, "loss": 0.0206, "step": 409710 }, { "epoch": 1.06, "learning_rate": 0.00014069199882835078, "loss": 0.0131, "step": 409720 }, { "epoch": 1.06, "learning_rate": 0.00014068811061197933, "loss": 0.0112, "step": 409730 }, { "epoch": 1.06, "learning_rate": 0.00014068422239560787, "loss": 0.0119, "step": 409740 }, { "epoch": 1.06, "learning_rate": 0.0001406803341792364, "loss": 0.0098, "step": 409750 }, { "epoch": 1.06, "learning_rate": 0.00014067644596286492, "loss": 0.0117, "step": 409760 }, { "epoch": 1.06, "learning_rate": 0.00014067255774649346, "loss": 0.013, "step": 409770 }, { "epoch": 1.06, "learning_rate": 0.000140668669530122, "loss": 0.0131, "step": 409780 }, { "epoch": 1.06, "learning_rate": 0.00014066478131375055, "loss": 0.0109, "step": 409790 }, { "epoch": 1.06, "learning_rate": 0.00014066089309737906, "loss": 0.008, "step": 409800 }, { "epoch": 1.06, "learning_rate": 0.0001406570048810076, "loss": 0.0113, "step": 409810 }, { "epoch": 1.06, "learning_rate": 0.00014065311666463615, "loss": 0.0133, "step": 409820 }, { "epoch": 1.06, "learning_rate": 0.0001406492284482647, "loss": 0.01, "step": 409830 }, { "epoch": 1.06, "learning_rate": 0.0001406453402318932, "loss": 0.0107, "step": 409840 }, { "epoch": 1.06, "learning_rate": 0.00014064145201552174, "loss": 0.0119, "step": 409850 }, { "epoch": 1.06, "learning_rate": 0.00014063756379915029, "loss": 0.0107, "step": 409860 }, { "epoch": 1.06, "learning_rate": 0.00014063367558277883, "loss": 0.0092, "step": 409870 }, { "epoch": 1.06, "learning_rate": 0.00014062978736640734, "loss": 0.0131, "step": 409880 }, { "epoch": 1.06, "learning_rate": 0.00014062589915003588, "loss": 0.0119, "step": 409890 }, { "epoch": 1.06, "learning_rate": 0.00014062201093366442, "loss": 0.0112, "step": 409900 }, { "epoch": 1.06, "learning_rate": 0.00014061812271729294, "loss": 0.0101, "step": 409910 }, { "epoch": 1.06, "learning_rate": 0.0001406142345009215, "loss": 0.0114, "step": 409920 }, { "epoch": 1.06, "learning_rate": 0.00014061034628455002, "loss": 0.0106, "step": 409930 }, { "epoch": 1.06, "learning_rate": 0.00014060645806817856, "loss": 0.0097, "step": 409940 }, { "epoch": 1.06, "learning_rate": 0.0001406025698518071, "loss": 0.01, "step": 409950 }, { "epoch": 1.06, "learning_rate": 0.00014059868163543565, "loss": 0.014, "step": 409960 }, { "epoch": 1.06, "learning_rate": 0.00014059479341906416, "loss": 0.0108, "step": 409970 }, { "epoch": 1.06, "learning_rate": 0.0001405909052026927, "loss": 0.0108, "step": 409980 }, { "epoch": 1.06, "learning_rate": 0.00014058701698632125, "loss": 0.0125, "step": 409990 }, { "epoch": 1.06, "learning_rate": 0.0001405831287699498, "loss": 0.0103, "step": 410000 }, { "epoch": 1.06, "eval_cer": 0.8817068852339703, "eval_loss": 0.007638953160494566, "eval_runtime": 107.3836, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 410000 }, { "epoch": 1.06, "learning_rate": 0.0001405792405535783, "loss": 0.0136, "step": 410010 }, { "epoch": 1.06, "learning_rate": 0.00014057535233720684, "loss": 0.0094, "step": 410020 }, { "epoch": 1.06, "learning_rate": 0.00014057146412083538, "loss": 0.0103, "step": 410030 }, { "epoch": 1.06, "learning_rate": 0.00014056757590446393, "loss": 0.0122, "step": 410040 }, { "epoch": 1.06, "learning_rate": 0.00014056368768809244, "loss": 0.0133, "step": 410050 }, { "epoch": 1.06, "learning_rate": 0.000140559799471721, "loss": 0.0119, "step": 410060 }, { "epoch": 1.06, "learning_rate": 0.00014055591125534952, "loss": 0.009, "step": 410070 }, { "epoch": 1.06, "learning_rate": 0.00014055202303897807, "loss": 0.009, "step": 410080 }, { "epoch": 1.06, "learning_rate": 0.0001405481348226066, "loss": 0.0118, "step": 410090 }, { "epoch": 1.06, "learning_rate": 0.00014054424660623515, "loss": 0.0096, "step": 410100 }, { "epoch": 1.06, "learning_rate": 0.00014054035838986366, "loss": 0.0156, "step": 410110 }, { "epoch": 1.06, "learning_rate": 0.0001405364701734922, "loss": 0.0137, "step": 410120 }, { "epoch": 1.06, "learning_rate": 0.00014053258195712075, "loss": 0.0084, "step": 410130 }, { "epoch": 1.06, "learning_rate": 0.00014052869374074926, "loss": 0.0121, "step": 410140 }, { "epoch": 1.06, "learning_rate": 0.0001405248055243778, "loss": 0.0163, "step": 410150 }, { "epoch": 1.06, "learning_rate": 0.00014052091730800634, "loss": 0.0128, "step": 410160 }, { "epoch": 1.06, "learning_rate": 0.00014051702909163489, "loss": 0.0118, "step": 410170 }, { "epoch": 1.06, "learning_rate": 0.0001405131408752634, "loss": 0.009, "step": 410180 }, { "epoch": 1.06, "learning_rate": 0.00014050925265889194, "loss": 0.0113, "step": 410190 }, { "epoch": 1.06, "learning_rate": 0.00014050536444252048, "loss": 0.0081, "step": 410200 }, { "epoch": 1.06, "learning_rate": 0.00014050147622614903, "loss": 0.0132, "step": 410210 }, { "epoch": 1.06, "learning_rate": 0.00014049758800977754, "loss": 0.0145, "step": 410220 }, { "epoch": 1.06, "learning_rate": 0.00014049369979340608, "loss": 0.0157, "step": 410230 }, { "epoch": 1.06, "learning_rate": 0.00014048981157703462, "loss": 0.0096, "step": 410240 }, { "epoch": 1.06, "learning_rate": 0.00014048592336066317, "loss": 0.0114, "step": 410250 }, { "epoch": 1.06, "learning_rate": 0.0001404820351442917, "loss": 0.0117, "step": 410260 }, { "epoch": 1.06, "learning_rate": 0.00014047814692792025, "loss": 0.0152, "step": 410270 }, { "epoch": 1.06, "learning_rate": 0.00014047425871154876, "loss": 0.013, "step": 410280 }, { "epoch": 1.06, "learning_rate": 0.0001404703704951773, "loss": 0.0112, "step": 410290 }, { "epoch": 1.06, "learning_rate": 0.00014046648227880585, "loss": 0.0166, "step": 410300 }, { "epoch": 1.06, "learning_rate": 0.0001404625940624344, "loss": 0.0113, "step": 410310 }, { "epoch": 1.06, "learning_rate": 0.0001404587058460629, "loss": 0.0243, "step": 410320 }, { "epoch": 1.06, "learning_rate": 0.00014045481762969144, "loss": 0.0102, "step": 410330 }, { "epoch": 1.06, "learning_rate": 0.00014045092941331999, "loss": 0.0138, "step": 410340 }, { "epoch": 1.06, "learning_rate": 0.00014044704119694853, "loss": 0.0104, "step": 410350 }, { "epoch": 1.06, "learning_rate": 0.00014044315298057704, "loss": 0.0116, "step": 410360 }, { "epoch": 1.06, "learning_rate": 0.00014043926476420558, "loss": 0.0093, "step": 410370 }, { "epoch": 1.06, "learning_rate": 0.00014043537654783413, "loss": 0.0136, "step": 410380 }, { "epoch": 1.06, "learning_rate": 0.00014043148833146264, "loss": 0.0104, "step": 410390 }, { "epoch": 1.06, "learning_rate": 0.00014042760011509118, "loss": 0.0098, "step": 410400 }, { "epoch": 1.06, "learning_rate": 0.00014042371189871972, "loss": 0.0099, "step": 410410 }, { "epoch": 1.06, "learning_rate": 0.00014041982368234826, "loss": 0.0122, "step": 410420 }, { "epoch": 1.06, "learning_rate": 0.00014041593546597678, "loss": 0.0111, "step": 410430 }, { "epoch": 1.06, "learning_rate": 0.00014041204724960535, "loss": 0.014, "step": 410440 }, { "epoch": 1.06, "learning_rate": 0.00014040815903323386, "loss": 0.0109, "step": 410450 }, { "epoch": 1.06, "learning_rate": 0.0001404042708168624, "loss": 0.0094, "step": 410460 }, { "epoch": 1.06, "learning_rate": 0.00014040038260049095, "loss": 0.0124, "step": 410470 }, { "epoch": 1.06, "learning_rate": 0.0001403964943841195, "loss": 0.0113, "step": 410480 }, { "epoch": 1.06, "learning_rate": 0.000140392606167748, "loss": 0.0121, "step": 410490 }, { "epoch": 1.06, "learning_rate": 0.00014038871795137654, "loss": 0.0104, "step": 410500 }, { "epoch": 1.06, "learning_rate": 0.00014038482973500509, "loss": 0.0137, "step": 410510 }, { "epoch": 1.06, "learning_rate": 0.00014038094151863363, "loss": 0.0101, "step": 410520 }, { "epoch": 1.06, "learning_rate": 0.00014037705330226214, "loss": 0.0098, "step": 410530 }, { "epoch": 1.06, "learning_rate": 0.00014037316508589068, "loss": 0.0115, "step": 410540 }, { "epoch": 1.06, "learning_rate": 0.00014036927686951922, "loss": 0.0112, "step": 410550 }, { "epoch": 1.06, "learning_rate": 0.00014036538865314777, "loss": 0.0101, "step": 410560 }, { "epoch": 1.06, "learning_rate": 0.00014036150043677628, "loss": 0.013, "step": 410570 }, { "epoch": 1.06, "learning_rate": 0.00014035761222040482, "loss": 0.0087, "step": 410580 }, { "epoch": 1.06, "learning_rate": 0.00014035372400403336, "loss": 0.0102, "step": 410590 }, { "epoch": 1.06, "learning_rate": 0.0001403498357876619, "loss": 0.0081, "step": 410600 }, { "epoch": 1.06, "learning_rate": 0.00014034594757129045, "loss": 0.0206, "step": 410610 }, { "epoch": 1.06, "learning_rate": 0.00014034205935491896, "loss": 0.0113, "step": 410620 }, { "epoch": 1.06, "learning_rate": 0.0001403381711385475, "loss": 0.0105, "step": 410630 }, { "epoch": 1.06, "learning_rate": 0.00014033428292217605, "loss": 0.0188, "step": 410640 }, { "epoch": 1.06, "learning_rate": 0.0001403303947058046, "loss": 0.012, "step": 410650 }, { "epoch": 1.06, "learning_rate": 0.0001403265064894331, "loss": 0.0112, "step": 410660 }, { "epoch": 1.06, "learning_rate": 0.00014032261827306164, "loss": 0.0112, "step": 410670 }, { "epoch": 1.06, "learning_rate": 0.00014031873005669018, "loss": 0.0111, "step": 410680 }, { "epoch": 1.06, "learning_rate": 0.00014031484184031873, "loss": 0.0138, "step": 410690 }, { "epoch": 1.06, "learning_rate": 0.00014031095362394724, "loss": 0.0128, "step": 410700 }, { "epoch": 1.06, "learning_rate": 0.00014030706540757578, "loss": 0.0132, "step": 410710 }, { "epoch": 1.06, "learning_rate": 0.00014030317719120432, "loss": 0.013, "step": 410720 }, { "epoch": 1.06, "learning_rate": 0.00014029928897483287, "loss": 0.0135, "step": 410730 }, { "epoch": 1.06, "learning_rate": 0.00014029540075846138, "loss": 0.0117, "step": 410740 }, { "epoch": 1.06, "learning_rate": 0.00014029151254208992, "loss": 0.0109, "step": 410750 }, { "epoch": 1.06, "learning_rate": 0.00014028762432571846, "loss": 0.0088, "step": 410760 }, { "epoch": 1.06, "learning_rate": 0.000140283736109347, "loss": 0.0118, "step": 410770 }, { "epoch": 1.06, "learning_rate": 0.00014027984789297552, "loss": 0.0111, "step": 410780 }, { "epoch": 1.06, "learning_rate": 0.0001402759596766041, "loss": 0.0136, "step": 410790 }, { "epoch": 1.06, "learning_rate": 0.0001402720714602326, "loss": 0.0107, "step": 410800 }, { "epoch": 1.06, "learning_rate": 0.00014026818324386114, "loss": 0.0112, "step": 410810 }, { "epoch": 1.06, "learning_rate": 0.00014026429502748969, "loss": 0.0129, "step": 410820 }, { "epoch": 1.06, "learning_rate": 0.00014026040681111823, "loss": 0.0153, "step": 410830 }, { "epoch": 1.06, "learning_rate": 0.00014025651859474674, "loss": 0.015, "step": 410840 }, { "epoch": 1.06, "learning_rate": 0.00014025263037837528, "loss": 0.0126, "step": 410850 }, { "epoch": 1.07, "learning_rate": 0.00014024874216200383, "loss": 0.0112, "step": 410860 }, { "epoch": 1.07, "learning_rate": 0.00014024485394563234, "loss": 0.0092, "step": 410870 }, { "epoch": 1.07, "learning_rate": 0.00014024096572926088, "loss": 0.0113, "step": 410880 }, { "epoch": 1.07, "learning_rate": 0.00014023707751288942, "loss": 0.0109, "step": 410890 }, { "epoch": 1.07, "learning_rate": 0.00014023318929651797, "loss": 0.01, "step": 410900 }, { "epoch": 1.07, "learning_rate": 0.00014022930108014648, "loss": 0.0141, "step": 410910 }, { "epoch": 1.07, "learning_rate": 0.00014022541286377502, "loss": 0.0136, "step": 410920 }, { "epoch": 1.07, "learning_rate": 0.00014022152464740356, "loss": 0.0113, "step": 410930 }, { "epoch": 1.07, "learning_rate": 0.0001402176364310321, "loss": 0.0134, "step": 410940 }, { "epoch": 1.07, "learning_rate": 0.00014021374821466062, "loss": 0.0116, "step": 410950 }, { "epoch": 1.07, "learning_rate": 0.0001402098599982892, "loss": 0.0121, "step": 410960 }, { "epoch": 1.07, "learning_rate": 0.0001402059717819177, "loss": 0.0107, "step": 410970 }, { "epoch": 1.07, "learning_rate": 0.00014020208356554624, "loss": 0.0095, "step": 410980 }, { "epoch": 1.07, "learning_rate": 0.00014019819534917479, "loss": 0.0158, "step": 410990 }, { "epoch": 1.07, "learning_rate": 0.00014019430713280333, "loss": 0.0111, "step": 411000 }, { "epoch": 1.07, "eval_cer": 0.8816830914060892, "eval_loss": 0.007736830040812492, "eval_runtime": 107.3663, "eval_samples_per_second": 18.628, "eval_steps_per_second": 4.657, "step": 411000 }, { "epoch": 1.07, "learning_rate": 0.00014019041891643184, "loss": 0.0112, "step": 411010 }, { "epoch": 1.07, "learning_rate": 0.00014018653070006038, "loss": 0.0119, "step": 411020 }, { "epoch": 1.07, "learning_rate": 0.00014018264248368893, "loss": 0.0118, "step": 411030 }, { "epoch": 1.07, "learning_rate": 0.00014017875426731747, "loss": 0.0093, "step": 411040 }, { "epoch": 1.07, "learning_rate": 0.00014017486605094598, "loss": 0.0111, "step": 411050 }, { "epoch": 1.07, "learning_rate": 0.00014017097783457452, "loss": 0.0127, "step": 411060 }, { "epoch": 1.07, "learning_rate": 0.00014016708961820306, "loss": 0.0084, "step": 411070 }, { "epoch": 1.07, "learning_rate": 0.0001401632014018316, "loss": 0.0106, "step": 411080 }, { "epoch": 1.07, "learning_rate": 0.00014015931318546012, "loss": 0.0093, "step": 411090 }, { "epoch": 1.07, "learning_rate": 0.00014015542496908866, "loss": 0.0106, "step": 411100 }, { "epoch": 1.07, "learning_rate": 0.0001401515367527172, "loss": 0.0092, "step": 411110 }, { "epoch": 1.07, "learning_rate": 0.00014014764853634572, "loss": 0.0113, "step": 411120 }, { "epoch": 1.07, "learning_rate": 0.0001401437603199743, "loss": 0.011, "step": 411130 }, { "epoch": 1.07, "learning_rate": 0.0001401398721036028, "loss": 0.0104, "step": 411140 }, { "epoch": 1.07, "learning_rate": 0.00014013598388723134, "loss": 0.0101, "step": 411150 }, { "epoch": 1.07, "learning_rate": 0.00014013209567085989, "loss": 0.0095, "step": 411160 }, { "epoch": 1.07, "learning_rate": 0.00014012820745448843, "loss": 0.016, "step": 411170 }, { "epoch": 1.07, "learning_rate": 0.00014012431923811694, "loss": 0.0089, "step": 411180 }, { "epoch": 1.07, "learning_rate": 0.00014012043102174548, "loss": 0.0101, "step": 411190 }, { "epoch": 1.07, "learning_rate": 0.00014011654280537402, "loss": 0.0084, "step": 411200 }, { "epoch": 1.07, "learning_rate": 0.00014011265458900257, "loss": 0.0131, "step": 411210 }, { "epoch": 1.07, "learning_rate": 0.00014010876637263108, "loss": 0.0102, "step": 411220 }, { "epoch": 1.07, "learning_rate": 0.00014010487815625962, "loss": 0.0091, "step": 411230 }, { "epoch": 1.07, "learning_rate": 0.00014010098993988816, "loss": 0.0115, "step": 411240 }, { "epoch": 1.07, "learning_rate": 0.0001400971017235167, "loss": 0.0111, "step": 411250 }, { "epoch": 1.07, "learning_rate": 0.00014009321350714522, "loss": 0.0127, "step": 411260 }, { "epoch": 1.07, "learning_rate": 0.00014008932529077376, "loss": 0.0118, "step": 411270 }, { "epoch": 1.07, "learning_rate": 0.0001400854370744023, "loss": 0.0102, "step": 411280 }, { "epoch": 1.07, "learning_rate": 0.00014008154885803085, "loss": 0.0108, "step": 411290 }, { "epoch": 1.07, "learning_rate": 0.00014007766064165936, "loss": 0.0106, "step": 411300 }, { "epoch": 1.07, "learning_rate": 0.00014007377242528793, "loss": 0.0131, "step": 411310 }, { "epoch": 1.07, "learning_rate": 0.00014006988420891644, "loss": 0.0131, "step": 411320 }, { "epoch": 1.07, "learning_rate": 0.00014006599599254498, "loss": 0.013, "step": 411330 }, { "epoch": 1.07, "learning_rate": 0.00014006210777617353, "loss": 0.0115, "step": 411340 }, { "epoch": 1.07, "learning_rate": 0.00014005821955980207, "loss": 0.0148, "step": 411350 }, { "epoch": 1.07, "learning_rate": 0.00014005433134343058, "loss": 0.0154, "step": 411360 }, { "epoch": 1.07, "learning_rate": 0.00014005044312705912, "loss": 0.0117, "step": 411370 }, { "epoch": 1.07, "learning_rate": 0.00014004655491068767, "loss": 0.012, "step": 411380 }, { "epoch": 1.07, "learning_rate": 0.00014004266669431618, "loss": 0.0105, "step": 411390 }, { "epoch": 1.07, "learning_rate": 0.00014003877847794472, "loss": 0.0088, "step": 411400 }, { "epoch": 1.07, "learning_rate": 0.00014003489026157326, "loss": 0.0088, "step": 411410 }, { "epoch": 1.07, "learning_rate": 0.0001400310020452018, "loss": 0.0089, "step": 411420 }, { "epoch": 1.07, "learning_rate": 0.00014002711382883032, "loss": 0.0174, "step": 411430 }, { "epoch": 1.07, "learning_rate": 0.00014002322561245886, "loss": 0.0115, "step": 411440 }, { "epoch": 1.07, "learning_rate": 0.0001400193373960874, "loss": 0.0115, "step": 411450 }, { "epoch": 1.07, "learning_rate": 0.00014001544917971594, "loss": 0.0122, "step": 411460 }, { "epoch": 1.07, "learning_rate": 0.00014001156096334446, "loss": 0.0113, "step": 411470 }, { "epoch": 1.07, "learning_rate": 0.00014000767274697303, "loss": 0.0094, "step": 411480 }, { "epoch": 1.07, "learning_rate": 0.00014000378453060154, "loss": 0.0121, "step": 411490 }, { "epoch": 1.07, "learning_rate": 0.00013999989631423008, "loss": 0.0128, "step": 411500 }, { "epoch": 1.07, "learning_rate": 0.00013999600809785863, "loss": 0.0133, "step": 411510 }, { "epoch": 1.07, "learning_rate": 0.00013999211988148717, "loss": 0.0092, "step": 411520 }, { "epoch": 1.07, "learning_rate": 0.00013998823166511568, "loss": 0.0129, "step": 411530 }, { "epoch": 1.07, "learning_rate": 0.00013998434344874422, "loss": 0.016, "step": 411540 }, { "epoch": 1.07, "learning_rate": 0.00013998045523237277, "loss": 0.0128, "step": 411550 }, { "epoch": 1.07, "learning_rate": 0.0001399765670160013, "loss": 0.0161, "step": 411560 }, { "epoch": 1.07, "learning_rate": 0.00013997267879962982, "loss": 0.01, "step": 411570 }, { "epoch": 1.07, "learning_rate": 0.00013996879058325836, "loss": 0.0125, "step": 411580 }, { "epoch": 1.07, "learning_rate": 0.0001399649023668869, "loss": 0.0125, "step": 411590 }, { "epoch": 1.07, "learning_rate": 0.00013996101415051545, "loss": 0.0089, "step": 411600 }, { "epoch": 1.07, "learning_rate": 0.00013995712593414396, "loss": 0.0124, "step": 411610 }, { "epoch": 1.07, "learning_rate": 0.0001399532377177725, "loss": 0.0089, "step": 411620 }, { "epoch": 1.07, "learning_rate": 0.00013994934950140104, "loss": 0.0077, "step": 411630 }, { "epoch": 1.07, "learning_rate": 0.00013994546128502956, "loss": 0.0096, "step": 411640 }, { "epoch": 1.07, "learning_rate": 0.00013994157306865813, "loss": 0.0095, "step": 411650 }, { "epoch": 1.07, "learning_rate": 0.00013993768485228664, "loss": 0.0123, "step": 411660 }, { "epoch": 1.07, "learning_rate": 0.00013993379663591518, "loss": 0.0094, "step": 411670 }, { "epoch": 1.07, "learning_rate": 0.00013992990841954373, "loss": 0.012, "step": 411680 }, { "epoch": 1.07, "learning_rate": 0.00013992602020317227, "loss": 0.0104, "step": 411690 }, { "epoch": 1.07, "learning_rate": 0.00013992213198680078, "loss": 0.015, "step": 411700 }, { "epoch": 1.07, "learning_rate": 0.00013991824377042932, "loss": 0.014, "step": 411710 }, { "epoch": 1.07, "learning_rate": 0.00013991435555405786, "loss": 0.011, "step": 411720 }, { "epoch": 1.07, "learning_rate": 0.0001399104673376864, "loss": 0.011, "step": 411730 }, { "epoch": 1.07, "learning_rate": 0.00013990657912131492, "loss": 0.0134, "step": 411740 }, { "epoch": 1.07, "learning_rate": 0.00013990269090494346, "loss": 0.0129, "step": 411750 }, { "epoch": 1.07, "learning_rate": 0.000139898802688572, "loss": 0.0087, "step": 411760 }, { "epoch": 1.07, "learning_rate": 0.00013989491447220055, "loss": 0.0129, "step": 411770 }, { "epoch": 1.07, "learning_rate": 0.00013989102625582906, "loss": 0.014, "step": 411780 }, { "epoch": 1.07, "learning_rate": 0.0001398871380394576, "loss": 0.0112, "step": 411790 }, { "epoch": 1.07, "learning_rate": 0.00013988324982308614, "loss": 0.0124, "step": 411800 }, { "epoch": 1.07, "learning_rate": 0.00013987936160671469, "loss": 0.0131, "step": 411810 }, { "epoch": 1.07, "learning_rate": 0.0001398754733903432, "loss": 0.0108, "step": 411820 }, { "epoch": 1.07, "learning_rate": 0.00013987158517397177, "loss": 0.0126, "step": 411830 }, { "epoch": 1.07, "learning_rate": 0.00013986769695760028, "loss": 0.0108, "step": 411840 }, { "epoch": 1.07, "learning_rate": 0.00013986380874122882, "loss": 0.0105, "step": 411850 }, { "epoch": 1.07, "learning_rate": 0.00013985992052485737, "loss": 0.0136, "step": 411860 }, { "epoch": 1.07, "learning_rate": 0.00013985603230848588, "loss": 0.0104, "step": 411870 }, { "epoch": 1.07, "learning_rate": 0.00013985214409211442, "loss": 0.0107, "step": 411880 }, { "epoch": 1.07, "learning_rate": 0.00013984825587574296, "loss": 0.011, "step": 411890 }, { "epoch": 1.07, "learning_rate": 0.0001398443676593715, "loss": 0.0092, "step": 411900 }, { "epoch": 1.07, "learning_rate": 0.00013984047944300002, "loss": 0.0105, "step": 411910 }, { "epoch": 1.07, "learning_rate": 0.00013983659122662856, "loss": 0.0108, "step": 411920 }, { "epoch": 1.07, "learning_rate": 0.0001398327030102571, "loss": 0.0162, "step": 411930 }, { "epoch": 1.07, "learning_rate": 0.00013982881479388564, "loss": 0.0086, "step": 411940 }, { "epoch": 1.07, "learning_rate": 0.00013982492657751416, "loss": 0.0106, "step": 411950 }, { "epoch": 1.07, "learning_rate": 0.0001398210383611427, "loss": 0.0106, "step": 411960 }, { "epoch": 1.07, "learning_rate": 0.00013981715014477124, "loss": 0.0137, "step": 411970 }, { "epoch": 1.07, "learning_rate": 0.00013981326192839978, "loss": 0.0126, "step": 411980 }, { "epoch": 1.07, "learning_rate": 0.0001398093737120283, "loss": 0.0127, "step": 411990 }, { "epoch": 1.07, "learning_rate": 0.00013980548549565687, "loss": 0.0119, "step": 412000 }, { "epoch": 1.07, "eval_cer": 0.8817138834186412, "eval_loss": 0.007703993935137987, "eval_runtime": 107.4229, "eval_samples_per_second": 18.618, "eval_steps_per_second": 4.655, "step": 412000 }, { "epoch": 1.07, "learning_rate": 0.00013980159727928538, "loss": 0.0126, "step": 412010 }, { "epoch": 1.07, "learning_rate": 0.00013979770906291392, "loss": 0.0141, "step": 412020 }, { "epoch": 1.07, "learning_rate": 0.00013979382084654247, "loss": 0.0113, "step": 412030 }, { "epoch": 1.07, "learning_rate": 0.000139789932630171, "loss": 0.0115, "step": 412040 }, { "epoch": 1.07, "learning_rate": 0.00013978604441379952, "loss": 0.0127, "step": 412050 }, { "epoch": 1.07, "learning_rate": 0.00013978215619742806, "loss": 0.0121, "step": 412060 }, { "epoch": 1.07, "learning_rate": 0.0001397782679810566, "loss": 0.0098, "step": 412070 }, { "epoch": 1.07, "learning_rate": 0.00013977437976468515, "loss": 0.0113, "step": 412080 }, { "epoch": 1.07, "learning_rate": 0.00013977049154831366, "loss": 0.0091, "step": 412090 }, { "epoch": 1.07, "learning_rate": 0.0001397666033319422, "loss": 0.0111, "step": 412100 }, { "epoch": 1.07, "learning_rate": 0.00013976271511557074, "loss": 0.0107, "step": 412110 }, { "epoch": 1.07, "learning_rate": 0.00013975882689919926, "loss": 0.0108, "step": 412120 }, { "epoch": 1.07, "learning_rate": 0.0001397549386828278, "loss": 0.012, "step": 412130 }, { "epoch": 1.07, "learning_rate": 0.00013975105046645634, "loss": 0.0107, "step": 412140 }, { "epoch": 1.07, "learning_rate": 0.00013974716225008488, "loss": 0.0114, "step": 412150 }, { "epoch": 1.07, "learning_rate": 0.0001397432740337134, "loss": 0.0097, "step": 412160 }, { "epoch": 1.07, "learning_rate": 0.00013973938581734194, "loss": 0.0086, "step": 412170 }, { "epoch": 1.07, "learning_rate": 0.00013973549760097048, "loss": 0.0117, "step": 412180 }, { "epoch": 1.07, "learning_rate": 0.00013973160938459902, "loss": 0.0095, "step": 412190 }, { "epoch": 1.07, "learning_rate": 0.00013972772116822756, "loss": 0.0128, "step": 412200 }, { "epoch": 1.07, "learning_rate": 0.0001397238329518561, "loss": 0.0105, "step": 412210 }, { "epoch": 1.07, "learning_rate": 0.00013971994473548462, "loss": 0.0105, "step": 412220 }, { "epoch": 1.07, "learning_rate": 0.00013971605651911316, "loss": 0.013, "step": 412230 }, { "epoch": 1.07, "learning_rate": 0.0001397121683027417, "loss": 0.0152, "step": 412240 }, { "epoch": 1.07, "learning_rate": 0.00013970828008637025, "loss": 0.0109, "step": 412250 }, { "epoch": 1.07, "learning_rate": 0.00013970439186999876, "loss": 0.013, "step": 412260 }, { "epoch": 1.07, "learning_rate": 0.0001397005036536273, "loss": 0.0081, "step": 412270 }, { "epoch": 1.07, "learning_rate": 0.00013969661543725584, "loss": 0.0117, "step": 412280 }, { "epoch": 1.07, "learning_rate": 0.00013969272722088439, "loss": 0.0221, "step": 412290 }, { "epoch": 1.07, "learning_rate": 0.0001396888390045129, "loss": 0.0123, "step": 412300 }, { "epoch": 1.07, "learning_rate": 0.00013968495078814144, "loss": 0.0094, "step": 412310 }, { "epoch": 1.07, "learning_rate": 0.00013968106257176998, "loss": 0.0139, "step": 412320 }, { "epoch": 1.07, "learning_rate": 0.00013967717435539852, "loss": 0.0115, "step": 412330 }, { "epoch": 1.07, "learning_rate": 0.00013967328613902704, "loss": 0.0139, "step": 412340 }, { "epoch": 1.07, "learning_rate": 0.0001396693979226556, "loss": 0.0098, "step": 412350 }, { "epoch": 1.07, "learning_rate": 0.00013966550970628412, "loss": 0.011, "step": 412360 }, { "epoch": 1.07, "learning_rate": 0.00013966162148991264, "loss": 0.0091, "step": 412370 }, { "epoch": 1.07, "learning_rate": 0.0001396577332735412, "loss": 0.0116, "step": 412380 }, { "epoch": 1.07, "learning_rate": 0.00013965384505716972, "loss": 0.0117, "step": 412390 }, { "epoch": 1.07, "learning_rate": 0.00013964995684079826, "loss": 0.0135, "step": 412400 }, { "epoch": 1.07, "learning_rate": 0.0001396460686244268, "loss": 0.009, "step": 412410 }, { "epoch": 1.07, "learning_rate": 0.00013964218040805535, "loss": 0.0105, "step": 412420 }, { "epoch": 1.07, "learning_rate": 0.00013963829219168386, "loss": 0.0125, "step": 412430 }, { "epoch": 1.07, "learning_rate": 0.0001396344039753124, "loss": 0.0089, "step": 412440 }, { "epoch": 1.07, "learning_rate": 0.00013963051575894094, "loss": 0.01, "step": 412450 }, { "epoch": 1.07, "learning_rate": 0.00013962662754256948, "loss": 0.0109, "step": 412460 }, { "epoch": 1.07, "learning_rate": 0.000139622739326198, "loss": 0.0104, "step": 412470 }, { "epoch": 1.07, "learning_rate": 0.00013961885110982654, "loss": 0.0119, "step": 412480 }, { "epoch": 1.07, "learning_rate": 0.00013961496289345508, "loss": 0.0161, "step": 412490 }, { "epoch": 1.07, "learning_rate": 0.00013961107467708362, "loss": 0.0092, "step": 412500 }, { "epoch": 1.07, "learning_rate": 0.00013960718646071214, "loss": 0.0131, "step": 412510 }, { "epoch": 1.07, "learning_rate": 0.0001396032982443407, "loss": 0.0108, "step": 412520 }, { "epoch": 1.07, "learning_rate": 0.00013959941002796922, "loss": 0.0097, "step": 412530 }, { "epoch": 1.07, "learning_rate": 0.00013959552181159776, "loss": 0.0123, "step": 412540 }, { "epoch": 1.07, "learning_rate": 0.0001395916335952263, "loss": 0.0092, "step": 412550 }, { "epoch": 1.07, "learning_rate": 0.00013958774537885485, "loss": 0.0115, "step": 412560 }, { "epoch": 1.07, "learning_rate": 0.00013958385716248336, "loss": 0.0113, "step": 412570 }, { "epoch": 1.07, "learning_rate": 0.0001395799689461119, "loss": 0.0135, "step": 412580 }, { "epoch": 1.07, "learning_rate": 0.00013957608072974044, "loss": 0.0149, "step": 412590 }, { "epoch": 1.07, "learning_rate": 0.000139572192513369, "loss": 0.0105, "step": 412600 }, { "epoch": 1.07, "learning_rate": 0.0001395683042969975, "loss": 0.0099, "step": 412610 }, { "epoch": 1.07, "learning_rate": 0.00013956441608062604, "loss": 0.0106, "step": 412620 }, { "epoch": 1.07, "learning_rate": 0.00013956052786425458, "loss": 0.0099, "step": 412630 }, { "epoch": 1.07, "learning_rate": 0.0001395566396478831, "loss": 0.0097, "step": 412640 }, { "epoch": 1.07, "learning_rate": 0.00013955275143151164, "loss": 0.0115, "step": 412650 }, { "epoch": 1.07, "learning_rate": 0.00013954886321514018, "loss": 0.0112, "step": 412660 }, { "epoch": 1.07, "learning_rate": 0.00013954497499876872, "loss": 0.0081, "step": 412670 }, { "epoch": 1.07, "learning_rate": 0.00013954108678239724, "loss": 0.009, "step": 412680 }, { "epoch": 1.07, "learning_rate": 0.00013953719856602578, "loss": 0.0126, "step": 412690 }, { "epoch": 1.07, "learning_rate": 0.00013953331034965432, "loss": 0.0102, "step": 412700 }, { "epoch": 1.07, "learning_rate": 0.00013952942213328286, "loss": 0.0099, "step": 412710 }, { "epoch": 1.07, "learning_rate": 0.0001395255339169114, "loss": 0.0104, "step": 412720 }, { "epoch": 1.07, "learning_rate": 0.00013952164570053995, "loss": 0.0101, "step": 412730 }, { "epoch": 1.07, "learning_rate": 0.00013951775748416846, "loss": 0.0135, "step": 412740 }, { "epoch": 1.07, "learning_rate": 0.000139513869267797, "loss": 0.0141, "step": 412750 }, { "epoch": 1.07, "learning_rate": 0.00013950998105142554, "loss": 0.015, "step": 412760 }, { "epoch": 1.07, "learning_rate": 0.00013950609283505409, "loss": 0.0088, "step": 412770 }, { "epoch": 1.07, "learning_rate": 0.0001395022046186826, "loss": 0.0109, "step": 412780 }, { "epoch": 1.07, "learning_rate": 0.00013949831640231114, "loss": 0.0111, "step": 412790 }, { "epoch": 1.07, "learning_rate": 0.00013949442818593968, "loss": 0.0135, "step": 412800 }, { "epoch": 1.07, "learning_rate": 0.00013949053996956823, "loss": 0.0133, "step": 412810 }, { "epoch": 1.07, "learning_rate": 0.00013948665175319674, "loss": 0.0086, "step": 412820 }, { "epoch": 1.07, "learning_rate": 0.00013948276353682528, "loss": 0.0146, "step": 412830 }, { "epoch": 1.07, "learning_rate": 0.00013947887532045382, "loss": 0.0098, "step": 412840 }, { "epoch": 1.07, "learning_rate": 0.00013947498710408234, "loss": 0.0101, "step": 412850 }, { "epoch": 1.07, "learning_rate": 0.00013947109888771088, "loss": 0.0105, "step": 412860 }, { "epoch": 1.07, "learning_rate": 0.00013946721067133942, "loss": 0.0125, "step": 412870 }, { "epoch": 1.07, "learning_rate": 0.00013946332245496796, "loss": 0.0103, "step": 412880 }, { "epoch": 1.07, "learning_rate": 0.00013945943423859648, "loss": 0.0142, "step": 412890 }, { "epoch": 1.07, "learning_rate": 0.00013945554602222505, "loss": 0.01, "step": 412900 }, { "epoch": 1.07, "learning_rate": 0.00013945165780585356, "loss": 0.0087, "step": 412910 }, { "epoch": 1.07, "learning_rate": 0.0001394477695894821, "loss": 0.0104, "step": 412920 }, { "epoch": 1.07, "learning_rate": 0.00013944388137311064, "loss": 0.0099, "step": 412930 }, { "epoch": 1.07, "learning_rate": 0.00013943999315673919, "loss": 0.0172, "step": 412940 }, { "epoch": 1.07, "learning_rate": 0.0001394361049403677, "loss": 0.0106, "step": 412950 }, { "epoch": 1.07, "learning_rate": 0.00013943221672399624, "loss": 0.0143, "step": 412960 }, { "epoch": 1.07, "learning_rate": 0.00013942832850762478, "loss": 0.0094, "step": 412970 }, { "epoch": 1.07, "learning_rate": 0.00013942444029125332, "loss": 0.0125, "step": 412980 }, { "epoch": 1.07, "learning_rate": 0.00013942055207488184, "loss": 0.0136, "step": 412990 }, { "epoch": 1.07, "learning_rate": 0.00013941666385851038, "loss": 0.0098, "step": 413000 }, { "epoch": 1.07, "eval_cer": 0.8817082848709045, "eval_loss": 0.007829415611922741, "eval_runtime": 107.3445, "eval_samples_per_second": 18.632, "eval_steps_per_second": 4.658, "step": 413000 }, { "epoch": 1.07, "learning_rate": 0.00013941277564213892, "loss": 0.0109, "step": 413010 }, { "epoch": 1.07, "learning_rate": 0.00013940888742576746, "loss": 0.0114, "step": 413020 }, { "epoch": 1.07, "learning_rate": 0.00013940499920939598, "loss": 0.0108, "step": 413030 }, { "epoch": 1.07, "learning_rate": 0.00013940111099302455, "loss": 0.0212, "step": 413040 }, { "epoch": 1.07, "learning_rate": 0.00013939722277665306, "loss": 0.013, "step": 413050 }, { "epoch": 1.07, "learning_rate": 0.0001393933345602816, "loss": 0.012, "step": 413060 }, { "epoch": 1.07, "learning_rate": 0.00013938944634391015, "loss": 0.0123, "step": 413070 }, { "epoch": 1.07, "learning_rate": 0.0001393855581275387, "loss": 0.0132, "step": 413080 }, { "epoch": 1.07, "learning_rate": 0.0001393816699111672, "loss": 0.0112, "step": 413090 }, { "epoch": 1.07, "learning_rate": 0.00013937778169479574, "loss": 0.0124, "step": 413100 }, { "epoch": 1.07, "learning_rate": 0.00013937389347842428, "loss": 0.0118, "step": 413110 }, { "epoch": 1.07, "learning_rate": 0.0001393700052620528, "loss": 0.0135, "step": 413120 }, { "epoch": 1.07, "learning_rate": 0.00013936611704568134, "loss": 0.0162, "step": 413130 }, { "epoch": 1.07, "learning_rate": 0.00013936222882930988, "loss": 0.0097, "step": 413140 }, { "epoch": 1.07, "learning_rate": 0.00013935834061293842, "loss": 0.0102, "step": 413150 }, { "epoch": 1.07, "learning_rate": 0.00013935445239656694, "loss": 0.0098, "step": 413160 }, { "epoch": 1.07, "learning_rate": 0.00013935056418019548, "loss": 0.0163, "step": 413170 }, { "epoch": 1.07, "learning_rate": 0.00013934667596382402, "loss": 0.0092, "step": 413180 }, { "epoch": 1.07, "learning_rate": 0.00013934278774745256, "loss": 0.013, "step": 413190 }, { "epoch": 1.07, "learning_rate": 0.00013933889953108108, "loss": 0.0103, "step": 413200 }, { "epoch": 1.07, "learning_rate": 0.00013933501131470962, "loss": 0.0106, "step": 413210 }, { "epoch": 1.07, "learning_rate": 0.00013933112309833816, "loss": 0.0115, "step": 413220 }, { "epoch": 1.07, "learning_rate": 0.0001393272348819667, "loss": 0.012, "step": 413230 }, { "epoch": 1.07, "learning_rate": 0.00013932334666559524, "loss": 0.0113, "step": 413240 }, { "epoch": 1.07, "learning_rate": 0.00013931945844922379, "loss": 0.0129, "step": 413250 }, { "epoch": 1.07, "learning_rate": 0.0001393155702328523, "loss": 0.0097, "step": 413260 }, { "epoch": 1.07, "learning_rate": 0.00013931168201648084, "loss": 0.0109, "step": 413270 }, { "epoch": 1.07, "learning_rate": 0.00013930779380010938, "loss": 0.0085, "step": 413280 }, { "epoch": 1.07, "learning_rate": 0.00013930390558373793, "loss": 0.0124, "step": 413290 }, { "epoch": 1.07, "learning_rate": 0.00013930001736736644, "loss": 0.0123, "step": 413300 }, { "epoch": 1.07, "learning_rate": 0.00013929612915099498, "loss": 0.0104, "step": 413310 }, { "epoch": 1.07, "learning_rate": 0.00013929224093462352, "loss": 0.013, "step": 413320 }, { "epoch": 1.07, "learning_rate": 0.00013928835271825207, "loss": 0.0119, "step": 413330 }, { "epoch": 1.07, "learning_rate": 0.00013928446450188058, "loss": 0.0135, "step": 413340 }, { "epoch": 1.07, "learning_rate": 0.00013928057628550912, "loss": 0.01, "step": 413350 }, { "epoch": 1.07, "learning_rate": 0.00013927668806913766, "loss": 0.0133, "step": 413360 }, { "epoch": 1.07, "learning_rate": 0.00013927279985276618, "loss": 0.0145, "step": 413370 }, { "epoch": 1.07, "learning_rate": 0.00013926891163639472, "loss": 0.0123, "step": 413380 }, { "epoch": 1.07, "learning_rate": 0.00013926502342002326, "loss": 0.0132, "step": 413390 }, { "epoch": 1.07, "learning_rate": 0.0001392611352036518, "loss": 0.0092, "step": 413400 }, { "epoch": 1.07, "learning_rate": 0.00013925724698728032, "loss": 0.0169, "step": 413410 }, { "epoch": 1.07, "learning_rate": 0.00013925335877090889, "loss": 0.0126, "step": 413420 }, { "epoch": 1.07, "learning_rate": 0.0001392494705545374, "loss": 0.0145, "step": 413430 }, { "epoch": 1.07, "learning_rate": 0.00013924558233816594, "loss": 0.0113, "step": 413440 }, { "epoch": 1.07, "learning_rate": 0.00013924169412179448, "loss": 0.0128, "step": 413450 }, { "epoch": 1.07, "learning_rate": 0.00013923780590542303, "loss": 0.0107, "step": 413460 }, { "epoch": 1.07, "learning_rate": 0.00013923391768905154, "loss": 0.0127, "step": 413470 }, { "epoch": 1.07, "learning_rate": 0.00013923002947268008, "loss": 0.0106, "step": 413480 }, { "epoch": 1.07, "learning_rate": 0.00013922614125630862, "loss": 0.0099, "step": 413490 }, { "epoch": 1.07, "learning_rate": 0.00013922225303993716, "loss": 0.0129, "step": 413500 }, { "epoch": 1.07, "learning_rate": 0.00013921836482356568, "loss": 0.0082, "step": 413510 }, { "epoch": 1.07, "learning_rate": 0.00013921447660719422, "loss": 0.01, "step": 413520 }, { "epoch": 1.07, "learning_rate": 0.00013921058839082276, "loss": 0.0118, "step": 413530 }, { "epoch": 1.07, "learning_rate": 0.0001392067001744513, "loss": 0.0098, "step": 413540 }, { "epoch": 1.07, "learning_rate": 0.00013920281195807982, "loss": 0.0093, "step": 413550 }, { "epoch": 1.07, "learning_rate": 0.00013919892374170836, "loss": 0.0091, "step": 413560 }, { "epoch": 1.07, "learning_rate": 0.0001391950355253369, "loss": 0.0103, "step": 413570 }, { "epoch": 1.07, "learning_rate": 0.00013919114730896544, "loss": 0.0102, "step": 413580 }, { "epoch": 1.07, "learning_rate": 0.00013918725909259399, "loss": 0.0104, "step": 413590 }, { "epoch": 1.07, "learning_rate": 0.0001391833708762225, "loss": 0.0096, "step": 413600 }, { "epoch": 1.07, "learning_rate": 0.00013917948265985104, "loss": 0.0135, "step": 413610 }, { "epoch": 1.07, "learning_rate": 0.00013917559444347958, "loss": 0.0122, "step": 413620 }, { "epoch": 1.07, "learning_rate": 0.00013917170622710812, "loss": 0.0121, "step": 413630 }, { "epoch": 1.07, "learning_rate": 0.00013916781801073664, "loss": 0.0111, "step": 413640 }, { "epoch": 1.07, "learning_rate": 0.00013916392979436518, "loss": 0.013, "step": 413650 }, { "epoch": 1.07, "learning_rate": 0.00013916004157799372, "loss": 0.0157, "step": 413660 }, { "epoch": 1.07, "learning_rate": 0.00013915615336162226, "loss": 0.0099, "step": 413670 }, { "epoch": 1.07, "learning_rate": 0.00013915226514525078, "loss": 0.0085, "step": 413680 }, { "epoch": 1.07, "learning_rate": 0.00013914837692887932, "loss": 0.0143, "step": 413690 }, { "epoch": 1.07, "learning_rate": 0.00013914448871250786, "loss": 0.0139, "step": 413700 }, { "epoch": 1.07, "learning_rate": 0.0001391406004961364, "loss": 0.0122, "step": 413710 }, { "epoch": 1.07, "learning_rate": 0.00013913671227976492, "loss": 0.0116, "step": 413720 }, { "epoch": 1.07, "learning_rate": 0.00013913282406339346, "loss": 0.0135, "step": 413730 }, { "epoch": 1.07, "learning_rate": 0.000139128935847022, "loss": 0.0128, "step": 413740 }, { "epoch": 1.07, "learning_rate": 0.00013912504763065054, "loss": 0.0104, "step": 413750 }, { "epoch": 1.07, "learning_rate": 0.00013912115941427906, "loss": 0.0093, "step": 413760 }, { "epoch": 1.07, "learning_rate": 0.00013911727119790763, "loss": 0.0094, "step": 413770 }, { "epoch": 1.07, "learning_rate": 0.00013911338298153614, "loss": 0.0093, "step": 413780 }, { "epoch": 1.07, "learning_rate": 0.00013910949476516468, "loss": 0.0109, "step": 413790 }, { "epoch": 1.07, "learning_rate": 0.00013910560654879322, "loss": 0.0096, "step": 413800 }, { "epoch": 1.07, "learning_rate": 0.00013910171833242177, "loss": 0.0092, "step": 413810 }, { "epoch": 1.07, "learning_rate": 0.00013909783011605028, "loss": 0.013, "step": 413820 }, { "epoch": 1.07, "learning_rate": 0.00013909394189967882, "loss": 0.0144, "step": 413830 }, { "epoch": 1.07, "learning_rate": 0.00013909005368330736, "loss": 0.0109, "step": 413840 }, { "epoch": 1.07, "learning_rate": 0.00013908616546693588, "loss": 0.0114, "step": 413850 }, { "epoch": 1.07, "learning_rate": 0.00013908227725056442, "loss": 0.0111, "step": 413860 }, { "epoch": 1.07, "learning_rate": 0.00013907838903419296, "loss": 0.0099, "step": 413870 }, { "epoch": 1.07, "learning_rate": 0.0001390745008178215, "loss": 0.0139, "step": 413880 }, { "epoch": 1.07, "learning_rate": 0.00013907061260145002, "loss": 0.0107, "step": 413890 }, { "epoch": 1.07, "learning_rate": 0.00013906672438507856, "loss": 0.0112, "step": 413900 }, { "epoch": 1.07, "learning_rate": 0.0001390628361687071, "loss": 0.0107, "step": 413910 }, { "epoch": 1.07, "learning_rate": 0.00013905894795233564, "loss": 0.011, "step": 413920 }, { "epoch": 1.07, "learning_rate": 0.00013905505973596416, "loss": 0.0111, "step": 413930 }, { "epoch": 1.07, "learning_rate": 0.00013905117151959273, "loss": 0.0132, "step": 413940 }, { "epoch": 1.07, "learning_rate": 0.00013904728330322124, "loss": 0.0143, "step": 413950 }, { "epoch": 1.07, "learning_rate": 0.00013904339508684978, "loss": 0.0126, "step": 413960 }, { "epoch": 1.07, "learning_rate": 0.00013903950687047832, "loss": 0.0098, "step": 413970 }, { "epoch": 1.07, "learning_rate": 0.00013903561865410687, "loss": 0.0108, "step": 413980 }, { "epoch": 1.07, "learning_rate": 0.00013903173043773538, "loss": 0.0113, "step": 413990 }, { "epoch": 1.07, "learning_rate": 0.00013902784222136392, "loss": 0.0139, "step": 414000 }, { "epoch": 1.07, "eval_cer": 0.881704085960102, "eval_loss": 0.007683408912271261, "eval_runtime": 107.5812, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 414000 }, { "epoch": 1.07, "learning_rate": 0.00013902395400499246, "loss": 0.0113, "step": 414010 }, { "epoch": 1.07, "learning_rate": 0.000139020065788621, "loss": 0.0096, "step": 414020 }, { "epoch": 1.07, "learning_rate": 0.00013901617757224952, "loss": 0.0124, "step": 414030 }, { "epoch": 1.07, "learning_rate": 0.00013901228935587806, "loss": 0.0115, "step": 414040 }, { "epoch": 1.07, "learning_rate": 0.0001390084011395066, "loss": 0.0086, "step": 414050 }, { "epoch": 1.07, "learning_rate": 0.00013900451292313514, "loss": 0.0141, "step": 414060 }, { "epoch": 1.07, "learning_rate": 0.00013900062470676366, "loss": 0.0089, "step": 414070 }, { "epoch": 1.07, "learning_rate": 0.0001389967364903922, "loss": 0.0117, "step": 414080 }, { "epoch": 1.07, "learning_rate": 0.00013899284827402074, "loss": 0.0108, "step": 414090 }, { "epoch": 1.07, "learning_rate": 0.00013898896005764926, "loss": 0.011, "step": 414100 }, { "epoch": 1.07, "learning_rate": 0.00013898507184127783, "loss": 0.0145, "step": 414110 }, { "epoch": 1.07, "learning_rate": 0.00013898118362490634, "loss": 0.0109, "step": 414120 }, { "epoch": 1.07, "learning_rate": 0.00013897729540853488, "loss": 0.009, "step": 414130 }, { "epoch": 1.07, "learning_rate": 0.00013897340719216342, "loss": 0.0092, "step": 414140 }, { "epoch": 1.07, "learning_rate": 0.00013896951897579196, "loss": 0.0115, "step": 414150 }, { "epoch": 1.07, "learning_rate": 0.00013896563075942048, "loss": 0.0125, "step": 414160 }, { "epoch": 1.07, "learning_rate": 0.00013896174254304902, "loss": 0.0125, "step": 414170 }, { "epoch": 1.07, "learning_rate": 0.00013895785432667756, "loss": 0.0109, "step": 414180 }, { "epoch": 1.07, "learning_rate": 0.0001389539661103061, "loss": 0.01, "step": 414190 }, { "epoch": 1.07, "learning_rate": 0.00013895007789393462, "loss": 0.0122, "step": 414200 }, { "epoch": 1.07, "learning_rate": 0.00013894618967756316, "loss": 0.0097, "step": 414210 }, { "epoch": 1.07, "learning_rate": 0.0001389423014611917, "loss": 0.0095, "step": 414220 }, { "epoch": 1.07, "learning_rate": 0.00013893841324482024, "loss": 0.0123, "step": 414230 }, { "epoch": 1.07, "learning_rate": 0.00013893452502844876, "loss": 0.0103, "step": 414240 }, { "epoch": 1.07, "learning_rate": 0.0001389306368120773, "loss": 0.0103, "step": 414250 }, { "epoch": 1.07, "learning_rate": 0.00013892674859570584, "loss": 0.0132, "step": 414260 }, { "epoch": 1.07, "learning_rate": 0.00013892286037933438, "loss": 0.0119, "step": 414270 }, { "epoch": 1.07, "learning_rate": 0.0001389189721629629, "loss": 0.0133, "step": 414280 }, { "epoch": 1.07, "learning_rate": 0.00013891508394659147, "loss": 0.0142, "step": 414290 }, { "epoch": 1.07, "learning_rate": 0.00013891119573021998, "loss": 0.0105, "step": 414300 }, { "epoch": 1.07, "learning_rate": 0.00013890730751384852, "loss": 0.0107, "step": 414310 }, { "epoch": 1.07, "learning_rate": 0.00013890341929747706, "loss": 0.0129, "step": 414320 }, { "epoch": 1.07, "learning_rate": 0.0001388995310811056, "loss": 0.0092, "step": 414330 }, { "epoch": 1.07, "learning_rate": 0.00013889564286473412, "loss": 0.0116, "step": 414340 }, { "epoch": 1.07, "learning_rate": 0.00013889175464836266, "loss": 0.0176, "step": 414350 }, { "epoch": 1.07, "learning_rate": 0.0001388878664319912, "loss": 0.0113, "step": 414360 }, { "epoch": 1.07, "learning_rate": 0.00013888397821561972, "loss": 0.0129, "step": 414370 }, { "epoch": 1.07, "learning_rate": 0.00013888008999924826, "loss": 0.017, "step": 414380 }, { "epoch": 1.07, "learning_rate": 0.0001388762017828768, "loss": 0.012, "step": 414390 }, { "epoch": 1.07, "learning_rate": 0.00013887231356650534, "loss": 0.0097, "step": 414400 }, { "epoch": 1.07, "learning_rate": 0.00013886842535013386, "loss": 0.0083, "step": 414410 }, { "epoch": 1.07, "learning_rate": 0.0001388645371337624, "loss": 0.0107, "step": 414420 }, { "epoch": 1.07, "learning_rate": 0.00013886064891739094, "loss": 0.011, "step": 414430 }, { "epoch": 1.07, "learning_rate": 0.00013885676070101948, "loss": 0.0085, "step": 414440 }, { "epoch": 1.07, "learning_rate": 0.000138852872484648, "loss": 0.0128, "step": 414450 }, { "epoch": 1.07, "learning_rate": 0.00013884898426827657, "loss": 0.0096, "step": 414460 }, { "epoch": 1.07, "learning_rate": 0.00013884509605190508, "loss": 0.0141, "step": 414470 }, { "epoch": 1.07, "learning_rate": 0.00013884120783553362, "loss": 0.0181, "step": 414480 }, { "epoch": 1.07, "learning_rate": 0.00013883731961916216, "loss": 0.011, "step": 414490 }, { "epoch": 1.07, "learning_rate": 0.0001388334314027907, "loss": 0.0136, "step": 414500 }, { "epoch": 1.07, "learning_rate": 0.00013882954318641922, "loss": 0.0113, "step": 414510 }, { "epoch": 1.07, "learning_rate": 0.00013882565497004776, "loss": 0.0159, "step": 414520 }, { "epoch": 1.07, "learning_rate": 0.0001388217667536763, "loss": 0.0087, "step": 414530 }, { "epoch": 1.07, "learning_rate": 0.00013881787853730484, "loss": 0.0115, "step": 414540 }, { "epoch": 1.07, "learning_rate": 0.00013881399032093336, "loss": 0.0102, "step": 414550 }, { "epoch": 1.07, "learning_rate": 0.0001388101021045619, "loss": 0.0118, "step": 414560 }, { "epoch": 1.07, "learning_rate": 0.00013880621388819044, "loss": 0.0128, "step": 414570 }, { "epoch": 1.07, "learning_rate": 0.00013880232567181898, "loss": 0.0098, "step": 414580 }, { "epoch": 1.07, "learning_rate": 0.0001387984374554475, "loss": 0.0118, "step": 414590 }, { "epoch": 1.07, "learning_rate": 0.00013879454923907604, "loss": 0.0094, "step": 414600 }, { "epoch": 1.07, "learning_rate": 0.00013879066102270458, "loss": 0.0122, "step": 414610 }, { "epoch": 1.07, "learning_rate": 0.0001387867728063331, "loss": 0.009, "step": 414620 }, { "epoch": 1.07, "learning_rate": 0.00013878288458996167, "loss": 0.0117, "step": 414630 }, { "epoch": 1.07, "learning_rate": 0.00013877899637359018, "loss": 0.0162, "step": 414640 }, { "epoch": 1.07, "learning_rate": 0.00013877510815721872, "loss": 0.0104, "step": 414650 }, { "epoch": 1.07, "learning_rate": 0.00013877121994084726, "loss": 0.0127, "step": 414660 }, { "epoch": 1.07, "learning_rate": 0.0001387673317244758, "loss": 0.0101, "step": 414670 }, { "epoch": 1.07, "learning_rate": 0.00013876344350810432, "loss": 0.0138, "step": 414680 }, { "epoch": 1.07, "learning_rate": 0.00013875955529173286, "loss": 0.0171, "step": 414690 }, { "epoch": 1.07, "learning_rate": 0.0001387556670753614, "loss": 0.0101, "step": 414700 }, { "epoch": 1.07, "learning_rate": 0.00013875177885898994, "loss": 0.011, "step": 414710 }, { "epoch": 1.08, "learning_rate": 0.00013874789064261846, "loss": 0.0127, "step": 414720 }, { "epoch": 1.08, "learning_rate": 0.000138744002426247, "loss": 0.0124, "step": 414730 }, { "epoch": 1.08, "learning_rate": 0.00013874011420987554, "loss": 0.01, "step": 414740 }, { "epoch": 1.08, "learning_rate": 0.00013873622599350408, "loss": 0.0147, "step": 414750 }, { "epoch": 1.08, "learning_rate": 0.0001387323377771326, "loss": 0.0106, "step": 414760 }, { "epoch": 1.08, "learning_rate": 0.00013872844956076114, "loss": 0.01, "step": 414770 }, { "epoch": 1.08, "learning_rate": 0.00013872456134438968, "loss": 0.0108, "step": 414780 }, { "epoch": 1.08, "learning_rate": 0.00013872067312801822, "loss": 0.0119, "step": 414790 }, { "epoch": 1.08, "learning_rate": 0.00013871678491164674, "loss": 0.0118, "step": 414800 }, { "epoch": 1.08, "learning_rate": 0.0001387128966952753, "loss": 0.0108, "step": 414810 }, { "epoch": 1.08, "learning_rate": 0.00013870900847890382, "loss": 0.0102, "step": 414820 }, { "epoch": 1.08, "learning_rate": 0.00013870512026253236, "loss": 0.0078, "step": 414830 }, { "epoch": 1.08, "learning_rate": 0.0001387012320461609, "loss": 0.0094, "step": 414840 }, { "epoch": 1.08, "learning_rate": 0.00013869734382978942, "loss": 0.0106, "step": 414850 }, { "epoch": 1.08, "learning_rate": 0.00013869345561341796, "loss": 0.0125, "step": 414860 }, { "epoch": 1.08, "learning_rate": 0.0001386895673970465, "loss": 0.0107, "step": 414870 }, { "epoch": 1.08, "learning_rate": 0.00013868567918067504, "loss": 0.0102, "step": 414880 }, { "epoch": 1.08, "learning_rate": 0.00013868179096430356, "loss": 0.0111, "step": 414890 }, { "epoch": 1.08, "learning_rate": 0.0001386779027479321, "loss": 0.0109, "step": 414900 }, { "epoch": 1.08, "learning_rate": 0.00013867401453156064, "loss": 0.0123, "step": 414910 }, { "epoch": 1.08, "learning_rate": 0.00013867012631518918, "loss": 0.0114, "step": 414920 }, { "epoch": 1.08, "learning_rate": 0.0001386662380988177, "loss": 0.0103, "step": 414930 }, { "epoch": 1.08, "learning_rate": 0.00013866234988244624, "loss": 0.009, "step": 414940 }, { "epoch": 1.08, "learning_rate": 0.00013865846166607478, "loss": 0.014, "step": 414950 }, { "epoch": 1.08, "learning_rate": 0.00013865457344970332, "loss": 0.0104, "step": 414960 }, { "epoch": 1.08, "learning_rate": 0.00013865068523333184, "loss": 0.0108, "step": 414970 }, { "epoch": 1.08, "learning_rate": 0.0001386467970169604, "loss": 0.0118, "step": 414980 }, { "epoch": 1.08, "learning_rate": 0.00013864290880058892, "loss": 0.0142, "step": 414990 }, { "epoch": 1.08, "learning_rate": 0.00013863902058421746, "loss": 0.0093, "step": 415000 }, { "epoch": 1.08, "eval_cer": 0.881727879787983, "eval_loss": 0.0076110344380140305, "eval_runtime": 107.5209, "eval_samples_per_second": 18.601, "eval_steps_per_second": 4.65, "step": 415000 }, { "epoch": 1.08, "learning_rate": 0.000138635132367846, "loss": 0.0094, "step": 415010 }, { "epoch": 1.08, "learning_rate": 0.00013863124415147454, "loss": 0.0102, "step": 415020 }, { "epoch": 1.08, "learning_rate": 0.00013862735593510306, "loss": 0.0091, "step": 415030 }, { "epoch": 1.08, "learning_rate": 0.0001386234677187316, "loss": 0.0133, "step": 415040 }, { "epoch": 1.08, "learning_rate": 0.00013861957950236014, "loss": 0.0136, "step": 415050 }, { "epoch": 1.08, "learning_rate": 0.00013861569128598868, "loss": 0.0098, "step": 415060 }, { "epoch": 1.08, "learning_rate": 0.0001386118030696172, "loss": 0.0167, "step": 415070 }, { "epoch": 1.08, "learning_rate": 0.00013860791485324574, "loss": 0.0138, "step": 415080 }, { "epoch": 1.08, "learning_rate": 0.00013860402663687428, "loss": 0.011, "step": 415090 }, { "epoch": 1.08, "learning_rate": 0.0001386001384205028, "loss": 0.0099, "step": 415100 }, { "epoch": 1.08, "learning_rate": 0.00013859625020413134, "loss": 0.0093, "step": 415110 }, { "epoch": 1.08, "learning_rate": 0.00013859236198775988, "loss": 0.0076, "step": 415120 }, { "epoch": 1.08, "learning_rate": 0.00013858847377138842, "loss": 0.0085, "step": 415130 }, { "epoch": 1.08, "learning_rate": 0.00013858458555501694, "loss": 0.0129, "step": 415140 }, { "epoch": 1.08, "learning_rate": 0.00013858069733864548, "loss": 0.0121, "step": 415150 }, { "epoch": 1.08, "learning_rate": 0.00013857680912227402, "loss": 0.0108, "step": 415160 }, { "epoch": 1.08, "learning_rate": 0.00013857292090590256, "loss": 0.0104, "step": 415170 }, { "epoch": 1.08, "learning_rate": 0.0001385690326895311, "loss": 0.0142, "step": 415180 }, { "epoch": 1.08, "learning_rate": 0.00013856514447315964, "loss": 0.0109, "step": 415190 }, { "epoch": 1.08, "learning_rate": 0.00013856125625678816, "loss": 0.0106, "step": 415200 }, { "epoch": 1.08, "learning_rate": 0.0001385573680404167, "loss": 0.0147, "step": 415210 }, { "epoch": 1.08, "learning_rate": 0.00013855347982404524, "loss": 0.0149, "step": 415220 }, { "epoch": 1.08, "learning_rate": 0.00013854959160767378, "loss": 0.0111, "step": 415230 }, { "epoch": 1.08, "learning_rate": 0.0001385457033913023, "loss": 0.0104, "step": 415240 }, { "epoch": 1.08, "learning_rate": 0.00013854181517493084, "loss": 0.0117, "step": 415250 }, { "epoch": 1.08, "learning_rate": 0.00013853792695855938, "loss": 0.013, "step": 415260 }, { "epoch": 1.08, "learning_rate": 0.00013853403874218792, "loss": 0.0128, "step": 415270 }, { "epoch": 1.08, "learning_rate": 0.00013853015052581644, "loss": 0.009, "step": 415280 }, { "epoch": 1.08, "learning_rate": 0.00013852626230944498, "loss": 0.0121, "step": 415290 }, { "epoch": 1.08, "learning_rate": 0.00013852237409307352, "loss": 0.013, "step": 415300 }, { "epoch": 1.08, "learning_rate": 0.00013851848587670206, "loss": 0.0073, "step": 415310 }, { "epoch": 1.08, "learning_rate": 0.00013851459766033058, "loss": 0.0116, "step": 415320 }, { "epoch": 1.08, "learning_rate": 0.00013851070944395915, "loss": 0.0112, "step": 415330 }, { "epoch": 1.08, "learning_rate": 0.00013850682122758766, "loss": 0.0134, "step": 415340 }, { "epoch": 1.08, "learning_rate": 0.00013850293301121618, "loss": 0.0121, "step": 415350 }, { "epoch": 1.08, "learning_rate": 0.00013849904479484474, "loss": 0.0122, "step": 415360 }, { "epoch": 1.08, "learning_rate": 0.00013849515657847326, "loss": 0.0138, "step": 415370 }, { "epoch": 1.08, "learning_rate": 0.0001384912683621018, "loss": 0.0135, "step": 415380 }, { "epoch": 1.08, "learning_rate": 0.00013848738014573034, "loss": 0.01, "step": 415390 }, { "epoch": 1.08, "learning_rate": 0.00013848349192935888, "loss": 0.0125, "step": 415400 }, { "epoch": 1.08, "learning_rate": 0.0001384796037129874, "loss": 0.0116, "step": 415410 }, { "epoch": 1.08, "learning_rate": 0.00013847571549661594, "loss": 0.0097, "step": 415420 }, { "epoch": 1.08, "learning_rate": 0.00013847182728024448, "loss": 0.01, "step": 415430 }, { "epoch": 1.08, "learning_rate": 0.00013846793906387302, "loss": 0.0099, "step": 415440 }, { "epoch": 1.08, "learning_rate": 0.00013846405084750154, "loss": 0.0098, "step": 415450 }, { "epoch": 1.08, "learning_rate": 0.00013846016263113008, "loss": 0.0107, "step": 415460 }, { "epoch": 1.08, "learning_rate": 0.00013845627441475862, "loss": 0.0105, "step": 415470 }, { "epoch": 1.08, "learning_rate": 0.00013845238619838716, "loss": 0.0109, "step": 415480 }, { "epoch": 1.08, "learning_rate": 0.00013844849798201568, "loss": 0.0112, "step": 415490 }, { "epoch": 1.08, "learning_rate": 0.00013844460976564425, "loss": 0.0114, "step": 415500 }, { "epoch": 1.08, "learning_rate": 0.00013844072154927276, "loss": 0.0106, "step": 415510 }, { "epoch": 1.08, "learning_rate": 0.0001384368333329013, "loss": 0.011, "step": 415520 }, { "epoch": 1.08, "learning_rate": 0.00013843294511652984, "loss": 0.0131, "step": 415530 }, { "epoch": 1.08, "learning_rate": 0.00013842905690015838, "loss": 0.0193, "step": 415540 }, { "epoch": 1.08, "learning_rate": 0.0001384251686837869, "loss": 0.0167, "step": 415550 }, { "epoch": 1.08, "learning_rate": 0.00013842128046741544, "loss": 0.0155, "step": 415560 }, { "epoch": 1.08, "learning_rate": 0.00013841739225104398, "loss": 0.0115, "step": 415570 }, { "epoch": 1.08, "learning_rate": 0.0001384135040346725, "loss": 0.0099, "step": 415580 }, { "epoch": 1.08, "learning_rate": 0.00013840961581830104, "loss": 0.0126, "step": 415590 }, { "epoch": 1.08, "learning_rate": 0.00013840572760192958, "loss": 0.0106, "step": 415600 }, { "epoch": 1.08, "learning_rate": 0.00013840183938555812, "loss": 0.0115, "step": 415610 }, { "epoch": 1.08, "learning_rate": 0.00013839795116918664, "loss": 0.0133, "step": 415620 }, { "epoch": 1.08, "learning_rate": 0.00013839406295281518, "loss": 0.0131, "step": 415630 }, { "epoch": 1.08, "learning_rate": 0.00013839017473644372, "loss": 0.0133, "step": 415640 }, { "epoch": 1.08, "learning_rate": 0.00013838628652007226, "loss": 0.0109, "step": 415650 }, { "epoch": 1.08, "learning_rate": 0.00013838239830370078, "loss": 0.0121, "step": 415660 }, { "epoch": 1.08, "learning_rate": 0.00013837851008732932, "loss": 0.0133, "step": 415670 }, { "epoch": 1.08, "learning_rate": 0.00013837462187095786, "loss": 0.0105, "step": 415680 }, { "epoch": 1.08, "learning_rate": 0.0001383707336545864, "loss": 0.0093, "step": 415690 }, { "epoch": 1.08, "learning_rate": 0.00013836684543821494, "loss": 0.0128, "step": 415700 }, { "epoch": 1.08, "learning_rate": 0.00013836295722184348, "loss": 0.0114, "step": 415710 }, { "epoch": 1.08, "learning_rate": 0.000138359069005472, "loss": 0.0102, "step": 415720 }, { "epoch": 1.08, "learning_rate": 0.00013835518078910054, "loss": 0.0108, "step": 415730 }, { "epoch": 1.08, "learning_rate": 0.00013835129257272908, "loss": 0.0155, "step": 415740 }, { "epoch": 1.08, "learning_rate": 0.00013834740435635762, "loss": 0.012, "step": 415750 }, { "epoch": 1.08, "learning_rate": 0.00013834351613998614, "loss": 0.0096, "step": 415760 }, { "epoch": 1.08, "learning_rate": 0.00013833962792361468, "loss": 0.0077, "step": 415770 }, { "epoch": 1.08, "learning_rate": 0.00013833573970724322, "loss": 0.015, "step": 415780 }, { "epoch": 1.08, "learning_rate": 0.00013833185149087176, "loss": 0.0105, "step": 415790 }, { "epoch": 1.08, "learning_rate": 0.00013832796327450028, "loss": 0.0073, "step": 415800 }, { "epoch": 1.08, "learning_rate": 0.00013832407505812882, "loss": 0.0136, "step": 415810 }, { "epoch": 1.08, "learning_rate": 0.00013832018684175736, "loss": 0.014, "step": 415820 }, { "epoch": 1.08, "learning_rate": 0.00013831629862538588, "loss": 0.0124, "step": 415830 }, { "epoch": 1.08, "learning_rate": 0.00013831241040901442, "loss": 0.013, "step": 415840 }, { "epoch": 1.08, "learning_rate": 0.00013830852219264296, "loss": 0.0126, "step": 415850 }, { "epoch": 1.08, "learning_rate": 0.0001383046339762715, "loss": 0.0125, "step": 415860 }, { "epoch": 1.08, "learning_rate": 0.00013830074575990001, "loss": 0.014, "step": 415870 }, { "epoch": 1.08, "learning_rate": 0.00013829685754352858, "loss": 0.0122, "step": 415880 }, { "epoch": 1.08, "learning_rate": 0.0001382929693271571, "loss": 0.0096, "step": 415890 }, { "epoch": 1.08, "learning_rate": 0.00013828908111078564, "loss": 0.0118, "step": 415900 }, { "epoch": 1.08, "learning_rate": 0.00013828519289441418, "loss": 0.0103, "step": 415910 }, { "epoch": 1.08, "learning_rate": 0.00013828130467804272, "loss": 0.0101, "step": 415920 }, { "epoch": 1.08, "learning_rate": 0.00013827741646167124, "loss": 0.0127, "step": 415930 }, { "epoch": 1.08, "learning_rate": 0.00013827352824529978, "loss": 0.013, "step": 415940 }, { "epoch": 1.08, "learning_rate": 0.00013826964002892832, "loss": 0.0124, "step": 415950 }, { "epoch": 1.08, "learning_rate": 0.00013826575181255686, "loss": 0.0125, "step": 415960 }, { "epoch": 1.08, "learning_rate": 0.00013826186359618538, "loss": 0.0107, "step": 415970 }, { "epoch": 1.08, "learning_rate": 0.00013825797537981392, "loss": 0.0104, "step": 415980 }, { "epoch": 1.08, "learning_rate": 0.00013825408716344246, "loss": 0.012, "step": 415990 }, { "epoch": 1.08, "learning_rate": 0.000138250198947071, "loss": 0.0121, "step": 416000 }, { "epoch": 1.08, "eval_cer": 0.8816928888646285, "eval_loss": 0.007917557843029499, "eval_runtime": 107.4603, "eval_samples_per_second": 18.612, "eval_steps_per_second": 4.653, "step": 416000 }, { "epoch": 1.08, "learning_rate": 0.00013824631073069952, "loss": 0.0113, "step": 416010 }, { "epoch": 1.08, "learning_rate": 0.00013824242251432806, "loss": 0.0124, "step": 416020 }, { "epoch": 1.08, "learning_rate": 0.0001382385342979566, "loss": 0.0116, "step": 416030 }, { "epoch": 1.08, "learning_rate": 0.00013823464608158514, "loss": 0.0114, "step": 416040 }, { "epoch": 1.08, "learning_rate": 0.00013823075786521368, "loss": 0.0082, "step": 416050 }, { "epoch": 1.08, "learning_rate": 0.00013822686964884222, "loss": 0.0111, "step": 416060 }, { "epoch": 1.08, "learning_rate": 0.00013822298143247074, "loss": 0.0157, "step": 416070 }, { "epoch": 1.08, "learning_rate": 0.00013821909321609928, "loss": 0.0159, "step": 416080 }, { "epoch": 1.08, "learning_rate": 0.00013821520499972782, "loss": 0.012, "step": 416090 }, { "epoch": 1.08, "learning_rate": 0.00013821131678335634, "loss": 0.0164, "step": 416100 }, { "epoch": 1.08, "learning_rate": 0.00013820742856698488, "loss": 0.01, "step": 416110 }, { "epoch": 1.08, "learning_rate": 0.00013820354035061342, "loss": 0.0113, "step": 416120 }, { "epoch": 1.08, "learning_rate": 0.00013819965213424196, "loss": 0.0102, "step": 416130 }, { "epoch": 1.08, "learning_rate": 0.00013819576391787048, "loss": 0.0105, "step": 416140 }, { "epoch": 1.08, "learning_rate": 0.00013819187570149902, "loss": 0.0106, "step": 416150 }, { "epoch": 1.08, "learning_rate": 0.00013818798748512756, "loss": 0.0103, "step": 416160 }, { "epoch": 1.08, "learning_rate": 0.0001381840992687561, "loss": 0.0087, "step": 416170 }, { "epoch": 1.08, "learning_rate": 0.00013818021105238462, "loss": 0.0135, "step": 416180 }, { "epoch": 1.08, "learning_rate": 0.00013817632283601316, "loss": 0.0125, "step": 416190 }, { "epoch": 1.08, "learning_rate": 0.0001381724346196417, "loss": 0.0094, "step": 416200 }, { "epoch": 1.08, "learning_rate": 0.00013816854640327024, "loss": 0.0132, "step": 416210 }, { "epoch": 1.08, "learning_rate": 0.00013816465818689876, "loss": 0.0126, "step": 416220 }, { "epoch": 1.08, "learning_rate": 0.00013816076997052732, "loss": 0.0114, "step": 416230 }, { "epoch": 1.08, "learning_rate": 0.00013815688175415584, "loss": 0.0118, "step": 416240 }, { "epoch": 1.08, "learning_rate": 0.00013815299353778438, "loss": 0.0086, "step": 416250 }, { "epoch": 1.08, "learning_rate": 0.00013814910532141292, "loss": 0.011, "step": 416260 }, { "epoch": 1.08, "learning_rate": 0.00013814521710504146, "loss": 0.0107, "step": 416270 }, { "epoch": 1.08, "learning_rate": 0.00013814132888866998, "loss": 0.0087, "step": 416280 }, { "epoch": 1.08, "learning_rate": 0.00013813744067229852, "loss": 0.0118, "step": 416290 }, { "epoch": 1.08, "learning_rate": 0.00013813355245592706, "loss": 0.0108, "step": 416300 }, { "epoch": 1.08, "learning_rate": 0.0001381296642395556, "loss": 0.0087, "step": 416310 }, { "epoch": 1.08, "learning_rate": 0.00013812577602318412, "loss": 0.0134, "step": 416320 }, { "epoch": 1.08, "learning_rate": 0.00013812188780681266, "loss": 0.0106, "step": 416330 }, { "epoch": 1.08, "learning_rate": 0.0001381179995904412, "loss": 0.0123, "step": 416340 }, { "epoch": 1.08, "learning_rate": 0.00013811411137406972, "loss": 0.0122, "step": 416350 }, { "epoch": 1.08, "learning_rate": 0.00013811022315769826, "loss": 0.0137, "step": 416360 }, { "epoch": 1.08, "learning_rate": 0.0001381063349413268, "loss": 0.0127, "step": 416370 }, { "epoch": 1.08, "learning_rate": 0.00013810244672495534, "loss": 0.0105, "step": 416380 }, { "epoch": 1.08, "learning_rate": 0.00013809855850858385, "loss": 0.0132, "step": 416390 }, { "epoch": 1.08, "learning_rate": 0.00013809467029221242, "loss": 0.0132, "step": 416400 }, { "epoch": 1.08, "learning_rate": 0.00013809078207584094, "loss": 0.0131, "step": 416410 }, { "epoch": 1.08, "learning_rate": 0.00013808689385946948, "loss": 0.0093, "step": 416420 }, { "epoch": 1.08, "learning_rate": 0.00013808300564309802, "loss": 0.0096, "step": 416430 }, { "epoch": 1.08, "learning_rate": 0.00013807911742672656, "loss": 0.012, "step": 416440 }, { "epoch": 1.08, "learning_rate": 0.00013807522921035508, "loss": 0.01, "step": 416450 }, { "epoch": 1.08, "learning_rate": 0.00013807134099398362, "loss": 0.0105, "step": 416460 }, { "epoch": 1.08, "learning_rate": 0.00013806745277761216, "loss": 0.0114, "step": 416470 }, { "epoch": 1.08, "learning_rate": 0.0001380635645612407, "loss": 0.0098, "step": 416480 }, { "epoch": 1.08, "learning_rate": 0.00013805967634486922, "loss": 0.0128, "step": 416490 }, { "epoch": 1.08, "learning_rate": 0.00013805578812849776, "loss": 0.0094, "step": 416500 }, { "epoch": 1.08, "learning_rate": 0.0001380518999121263, "loss": 0.0118, "step": 416510 }, { "epoch": 1.08, "learning_rate": 0.00013804801169575484, "loss": 0.0118, "step": 416520 }, { "epoch": 1.08, "learning_rate": 0.00013804412347938336, "loss": 0.0109, "step": 416530 }, { "epoch": 1.08, "learning_rate": 0.0001380402352630119, "loss": 0.0082, "step": 416540 }, { "epoch": 1.08, "learning_rate": 0.00013803634704664044, "loss": 0.0131, "step": 416550 }, { "epoch": 1.08, "learning_rate": 0.00013803245883026898, "loss": 0.0107, "step": 416560 }, { "epoch": 1.08, "learning_rate": 0.00013802857061389752, "loss": 0.0123, "step": 416570 }, { "epoch": 1.08, "learning_rate": 0.00013802468239752604, "loss": 0.0125, "step": 416580 }, { "epoch": 1.08, "learning_rate": 0.00013802079418115458, "loss": 0.0119, "step": 416590 }, { "epoch": 1.08, "learning_rate": 0.00013801690596478312, "loss": 0.0138, "step": 416600 }, { "epoch": 1.08, "learning_rate": 0.00013801301774841166, "loss": 0.011, "step": 416610 }, { "epoch": 1.08, "learning_rate": 0.00013800912953204018, "loss": 0.0119, "step": 416620 }, { "epoch": 1.08, "learning_rate": 0.00013800524131566872, "loss": 0.0133, "step": 416630 }, { "epoch": 1.08, "learning_rate": 0.00013800135309929726, "loss": 0.011, "step": 416640 }, { "epoch": 1.08, "learning_rate": 0.0001379974648829258, "loss": 0.0097, "step": 416650 }, { "epoch": 1.08, "learning_rate": 0.00013799357666655432, "loss": 0.0117, "step": 416660 }, { "epoch": 1.08, "learning_rate": 0.00013798968845018286, "loss": 0.0125, "step": 416670 }, { "epoch": 1.08, "learning_rate": 0.0001379858002338114, "loss": 0.0107, "step": 416680 }, { "epoch": 1.08, "learning_rate": 0.00013798191201743994, "loss": 0.0138, "step": 416690 }, { "epoch": 1.08, "learning_rate": 0.00013797802380106846, "loss": 0.0105, "step": 416700 }, { "epoch": 1.08, "learning_rate": 0.000137974135584697, "loss": 0.0081, "step": 416710 }, { "epoch": 1.08, "learning_rate": 0.00013797024736832554, "loss": 0.0084, "step": 416720 }, { "epoch": 1.08, "learning_rate": 0.00013796635915195408, "loss": 0.0151, "step": 416730 }, { "epoch": 1.08, "learning_rate": 0.0001379624709355826, "loss": 0.0109, "step": 416740 }, { "epoch": 1.08, "learning_rate": 0.00013795858271921116, "loss": 0.0111, "step": 416750 }, { "epoch": 1.08, "learning_rate": 0.00013795469450283968, "loss": 0.0118, "step": 416760 }, { "epoch": 1.08, "learning_rate": 0.00013795080628646822, "loss": 0.0107, "step": 416770 }, { "epoch": 1.08, "learning_rate": 0.00013794691807009676, "loss": 0.0101, "step": 416780 }, { "epoch": 1.08, "learning_rate": 0.0001379430298537253, "loss": 0.0115, "step": 416790 }, { "epoch": 1.08, "learning_rate": 0.00013793914163735382, "loss": 0.0111, "step": 416800 }, { "epoch": 1.08, "learning_rate": 0.00013793525342098236, "loss": 0.0085, "step": 416810 }, { "epoch": 1.08, "learning_rate": 0.0001379313652046109, "loss": 0.0093, "step": 416820 }, { "epoch": 1.08, "learning_rate": 0.00013792747698823942, "loss": 0.012, "step": 416830 }, { "epoch": 1.08, "learning_rate": 0.00013792358877186796, "loss": 0.0101, "step": 416840 }, { "epoch": 1.08, "learning_rate": 0.0001379197005554965, "loss": 0.0101, "step": 416850 }, { "epoch": 1.08, "learning_rate": 0.00013791581233912504, "loss": 0.0115, "step": 416860 }, { "epoch": 1.08, "learning_rate": 0.00013791192412275356, "loss": 0.0096, "step": 416870 }, { "epoch": 1.08, "learning_rate": 0.0001379080359063821, "loss": 0.0119, "step": 416880 }, { "epoch": 1.08, "learning_rate": 0.00013790414769001064, "loss": 0.0117, "step": 416890 }, { "epoch": 1.08, "learning_rate": 0.00013790025947363918, "loss": 0.0133, "step": 416900 }, { "epoch": 1.08, "learning_rate": 0.0001378963712572677, "loss": 0.0114, "step": 416910 }, { "epoch": 1.08, "learning_rate": 0.00013789248304089626, "loss": 0.0099, "step": 416920 }, { "epoch": 1.08, "learning_rate": 0.00013788859482452478, "loss": 0.0133, "step": 416930 }, { "epoch": 1.08, "learning_rate": 0.00013788470660815332, "loss": 0.0095, "step": 416940 }, { "epoch": 1.08, "learning_rate": 0.00013788081839178186, "loss": 0.0124, "step": 416950 }, { "epoch": 1.08, "learning_rate": 0.0001378769301754104, "loss": 0.0125, "step": 416960 }, { "epoch": 1.08, "learning_rate": 0.00013787304195903892, "loss": 0.012, "step": 416970 }, { "epoch": 1.08, "learning_rate": 0.00013786915374266746, "loss": 0.0104, "step": 416980 }, { "epoch": 1.08, "learning_rate": 0.000137865265526296, "loss": 0.0096, "step": 416990 }, { "epoch": 1.08, "learning_rate": 0.00013786137730992454, "loss": 0.014, "step": 417000 }, { "epoch": 1.08, "eval_cer": 0.8817166826925096, "eval_loss": 0.007632073480635881, "eval_runtime": 107.6798, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 417000 }, { "epoch": 1.08, "learning_rate": 0.00013785748909355306, "loss": 0.0112, "step": 417010 }, { "epoch": 1.08, "learning_rate": 0.0001378536008771816, "loss": 0.0123, "step": 417020 }, { "epoch": 1.08, "learning_rate": 0.00013784971266081014, "loss": 0.0114, "step": 417030 }, { "epoch": 1.08, "learning_rate": 0.00013784582444443868, "loss": 0.0165, "step": 417040 }, { "epoch": 1.08, "learning_rate": 0.0001378419362280672, "loss": 0.0085, "step": 417050 }, { "epoch": 1.08, "learning_rate": 0.00013783804801169574, "loss": 0.01, "step": 417060 }, { "epoch": 1.08, "learning_rate": 0.00013783415979532428, "loss": 0.0106, "step": 417070 }, { "epoch": 1.08, "learning_rate": 0.0001378302715789528, "loss": 0.0113, "step": 417080 }, { "epoch": 1.08, "learning_rate": 0.00013782638336258136, "loss": 0.0136, "step": 417090 }, { "epoch": 1.08, "learning_rate": 0.00013782249514620988, "loss": 0.009, "step": 417100 }, { "epoch": 1.08, "learning_rate": 0.00013781860692983842, "loss": 0.012, "step": 417110 }, { "epoch": 1.08, "learning_rate": 0.00013781471871346696, "loss": 0.0126, "step": 417120 }, { "epoch": 1.08, "learning_rate": 0.0001378108304970955, "loss": 0.0127, "step": 417130 }, { "epoch": 1.08, "learning_rate": 0.00013780694228072402, "loss": 0.0091, "step": 417140 }, { "epoch": 1.08, "learning_rate": 0.00013780305406435256, "loss": 0.0106, "step": 417150 }, { "epoch": 1.08, "learning_rate": 0.0001377991658479811, "loss": 0.0101, "step": 417160 }, { "epoch": 1.08, "learning_rate": 0.00013779527763160964, "loss": 0.0105, "step": 417170 }, { "epoch": 1.08, "learning_rate": 0.00013779138941523816, "loss": 0.0117, "step": 417180 }, { "epoch": 1.08, "learning_rate": 0.0001377875011988667, "loss": 0.0099, "step": 417190 }, { "epoch": 1.08, "learning_rate": 0.00013778361298249524, "loss": 0.0113, "step": 417200 }, { "epoch": 1.08, "learning_rate": 0.00013777972476612378, "loss": 0.0102, "step": 417210 }, { "epoch": 1.08, "learning_rate": 0.0001377758365497523, "loss": 0.0112, "step": 417220 }, { "epoch": 1.08, "learning_rate": 0.00013777194833338084, "loss": 0.011, "step": 417230 }, { "epoch": 1.08, "learning_rate": 0.00013776806011700938, "loss": 0.0112, "step": 417240 }, { "epoch": 1.08, "learning_rate": 0.00013776417190063792, "loss": 0.0118, "step": 417250 }, { "epoch": 1.08, "learning_rate": 0.00013776028368426644, "loss": 0.0083, "step": 417260 }, { "epoch": 1.08, "learning_rate": 0.000137756395467895, "loss": 0.0105, "step": 417270 }, { "epoch": 1.08, "learning_rate": 0.00013775250725152352, "loss": 0.0124, "step": 417280 }, { "epoch": 1.08, "learning_rate": 0.00013774861903515206, "loss": 0.0113, "step": 417290 }, { "epoch": 1.08, "learning_rate": 0.0001377447308187806, "loss": 0.0125, "step": 417300 }, { "epoch": 1.08, "learning_rate": 0.00013774084260240914, "loss": 0.0103, "step": 417310 }, { "epoch": 1.08, "learning_rate": 0.00013773695438603766, "loss": 0.0111, "step": 417320 }, { "epoch": 1.08, "learning_rate": 0.0001377330661696662, "loss": 0.012, "step": 417330 }, { "epoch": 1.08, "learning_rate": 0.00013772917795329474, "loss": 0.0115, "step": 417340 }, { "epoch": 1.08, "learning_rate": 0.00013772528973692326, "loss": 0.0099, "step": 417350 }, { "epoch": 1.08, "learning_rate": 0.0001377214015205518, "loss": 0.0122, "step": 417360 }, { "epoch": 1.08, "learning_rate": 0.00013771751330418034, "loss": 0.0138, "step": 417370 }, { "epoch": 1.08, "learning_rate": 0.00013771362508780888, "loss": 0.0103, "step": 417380 }, { "epoch": 1.08, "learning_rate": 0.0001377097368714374, "loss": 0.0098, "step": 417390 }, { "epoch": 1.08, "learning_rate": 0.00013770584865506594, "loss": 0.0112, "step": 417400 }, { "epoch": 1.08, "learning_rate": 0.00013770196043869448, "loss": 0.0122, "step": 417410 }, { "epoch": 1.08, "learning_rate": 0.00013769807222232302, "loss": 0.011, "step": 417420 }, { "epoch": 1.08, "learning_rate": 0.00013769418400595153, "loss": 0.0091, "step": 417430 }, { "epoch": 1.08, "learning_rate": 0.0001376902957895801, "loss": 0.0136, "step": 417440 }, { "epoch": 1.08, "learning_rate": 0.00013768640757320862, "loss": 0.0104, "step": 417450 }, { "epoch": 1.08, "learning_rate": 0.00013768251935683716, "loss": 0.0174, "step": 417460 }, { "epoch": 1.08, "learning_rate": 0.0001376786311404657, "loss": 0.0119, "step": 417470 }, { "epoch": 1.08, "learning_rate": 0.00013767474292409424, "loss": 0.0112, "step": 417480 }, { "epoch": 1.08, "learning_rate": 0.00013767085470772276, "loss": 0.0085, "step": 417490 }, { "epoch": 1.08, "learning_rate": 0.0001376669664913513, "loss": 0.0125, "step": 417500 }, { "epoch": 1.08, "learning_rate": 0.00013766307827497984, "loss": 0.0083, "step": 417510 }, { "epoch": 1.08, "learning_rate": 0.00013765919005860838, "loss": 0.0131, "step": 417520 }, { "epoch": 1.08, "learning_rate": 0.0001376553018422369, "loss": 0.0104, "step": 417530 }, { "epoch": 1.08, "learning_rate": 0.00013765141362586544, "loss": 0.0129, "step": 417540 }, { "epoch": 1.08, "learning_rate": 0.00013764752540949398, "loss": 0.0137, "step": 417550 }, { "epoch": 1.08, "learning_rate": 0.00013764363719312252, "loss": 0.0127, "step": 417560 }, { "epoch": 1.08, "learning_rate": 0.00013763974897675104, "loss": 0.0168, "step": 417570 }, { "epoch": 1.08, "learning_rate": 0.00013763586076037958, "loss": 0.0111, "step": 417580 }, { "epoch": 1.08, "learning_rate": 0.00013763197254400812, "loss": 0.0102, "step": 417590 }, { "epoch": 1.08, "learning_rate": 0.00013762808432763663, "loss": 0.0119, "step": 417600 }, { "epoch": 1.08, "learning_rate": 0.00013762419611126518, "loss": 0.012, "step": 417610 }, { "epoch": 1.08, "learning_rate": 0.00013762030789489372, "loss": 0.0102, "step": 417620 }, { "epoch": 1.08, "learning_rate": 0.00013761641967852226, "loss": 0.0118, "step": 417630 }, { "epoch": 1.08, "learning_rate": 0.0001376125314621508, "loss": 0.0122, "step": 417640 }, { "epoch": 1.08, "learning_rate": 0.00013760864324577934, "loss": 0.0111, "step": 417650 }, { "epoch": 1.08, "learning_rate": 0.00013760475502940786, "loss": 0.0082, "step": 417660 }, { "epoch": 1.08, "learning_rate": 0.0001376008668130364, "loss": 0.0114, "step": 417670 }, { "epoch": 1.08, "learning_rate": 0.00013759697859666494, "loss": 0.0082, "step": 417680 }, { "epoch": 1.08, "learning_rate": 0.00013759309038029348, "loss": 0.0144, "step": 417690 }, { "epoch": 1.08, "learning_rate": 0.000137589202163922, "loss": 0.012, "step": 417700 }, { "epoch": 1.08, "learning_rate": 0.00013758531394755054, "loss": 0.022, "step": 417710 }, { "epoch": 1.08, "learning_rate": 0.00013758142573117908, "loss": 0.0142, "step": 417720 }, { "epoch": 1.08, "learning_rate": 0.00013757753751480762, "loss": 0.0105, "step": 417730 }, { "epoch": 1.08, "learning_rate": 0.00013757364929843614, "loss": 0.0122, "step": 417740 }, { "epoch": 1.08, "learning_rate": 0.00013756976108206468, "loss": 0.0131, "step": 417750 }, { "epoch": 1.08, "learning_rate": 0.00013756587286569322, "loss": 0.0122, "step": 417760 }, { "epoch": 1.08, "learning_rate": 0.00013756198464932176, "loss": 0.0097, "step": 417770 }, { "epoch": 1.08, "learning_rate": 0.00013755809643295028, "loss": 0.0123, "step": 417780 }, { "epoch": 1.08, "learning_rate": 0.00013755420821657884, "loss": 0.0136, "step": 417790 }, { "epoch": 1.08, "learning_rate": 0.00013755032000020736, "loss": 0.0113, "step": 417800 }, { "epoch": 1.08, "learning_rate": 0.0001375464317838359, "loss": 0.0126, "step": 417810 }, { "epoch": 1.08, "learning_rate": 0.00013754254356746444, "loss": 0.0112, "step": 417820 }, { "epoch": 1.08, "learning_rate": 0.00013753865535109296, "loss": 0.0132, "step": 417830 }, { "epoch": 1.08, "learning_rate": 0.0001375347671347215, "loss": 0.0092, "step": 417840 }, { "epoch": 1.08, "learning_rate": 0.00013753087891835004, "loss": 0.011, "step": 417850 }, { "epoch": 1.08, "learning_rate": 0.00013752699070197858, "loss": 0.0095, "step": 417860 }, { "epoch": 1.08, "learning_rate": 0.0001375231024856071, "loss": 0.0114, "step": 417870 }, { "epoch": 1.08, "learning_rate": 0.00013751921426923564, "loss": 0.0104, "step": 417880 }, { "epoch": 1.08, "learning_rate": 0.00013751532605286418, "loss": 0.0113, "step": 417890 }, { "epoch": 1.08, "learning_rate": 0.00013751143783649272, "loss": 0.0147, "step": 417900 }, { "epoch": 1.08, "learning_rate": 0.00013750754962012124, "loss": 0.0111, "step": 417910 }, { "epoch": 1.08, "learning_rate": 0.00013750366140374978, "loss": 0.0127, "step": 417920 }, { "epoch": 1.08, "learning_rate": 0.00013749977318737832, "loss": 0.0083, "step": 417930 }, { "epoch": 1.08, "learning_rate": 0.00013749588497100686, "loss": 0.0104, "step": 417940 }, { "epoch": 1.08, "learning_rate": 0.00013749199675463537, "loss": 0.0103, "step": 417950 }, { "epoch": 1.08, "learning_rate": 0.00013748810853826394, "loss": 0.0108, "step": 417960 }, { "epoch": 1.08, "learning_rate": 0.00013748422032189246, "loss": 0.0093, "step": 417970 }, { "epoch": 1.08, "learning_rate": 0.000137480332105521, "loss": 0.0108, "step": 417980 }, { "epoch": 1.08, "learning_rate": 0.00013747644388914954, "loss": 0.0118, "step": 417990 }, { "epoch": 1.08, "learning_rate": 0.00013747255567277808, "loss": 0.0118, "step": 418000 }, { "epoch": 1.08, "eval_cer": 0.8817082848709045, "eval_loss": 0.007763538043946028, "eval_runtime": 107.433, "eval_samples_per_second": 18.616, "eval_steps_per_second": 4.654, "step": 418000 }, { "epoch": 1.08, "learning_rate": 0.0001374686674564066, "loss": 0.0093, "step": 418010 }, { "epoch": 1.08, "learning_rate": 0.00013746477924003514, "loss": 0.0115, "step": 418020 }, { "epoch": 1.08, "learning_rate": 0.00013746089102366368, "loss": 0.0112, "step": 418030 }, { "epoch": 1.08, "learning_rate": 0.00013745700280729222, "loss": 0.01, "step": 418040 }, { "epoch": 1.08, "learning_rate": 0.00013745311459092074, "loss": 0.0095, "step": 418050 }, { "epoch": 1.08, "learning_rate": 0.00013744922637454928, "loss": 0.0094, "step": 418060 }, { "epoch": 1.08, "learning_rate": 0.00013744533815817782, "loss": 0.0164, "step": 418070 }, { "epoch": 1.08, "learning_rate": 0.00013744144994180633, "loss": 0.0117, "step": 418080 }, { "epoch": 1.08, "learning_rate": 0.00013743756172543488, "loss": 0.0096, "step": 418090 }, { "epoch": 1.08, "learning_rate": 0.00013743367350906342, "loss": 0.0119, "step": 418100 }, { "epoch": 1.08, "learning_rate": 0.00013742978529269196, "loss": 0.0086, "step": 418110 }, { "epoch": 1.08, "learning_rate": 0.00013742589707632047, "loss": 0.0104, "step": 418120 }, { "epoch": 1.08, "learning_rate": 0.00013742200885994902, "loss": 0.008, "step": 418130 }, { "epoch": 1.08, "learning_rate": 0.00013741812064357756, "loss": 0.0102, "step": 418140 }, { "epoch": 1.08, "learning_rate": 0.0001374142324272061, "loss": 0.0108, "step": 418150 }, { "epoch": 1.08, "learning_rate": 0.00013741034421083464, "loss": 0.0105, "step": 418160 }, { "epoch": 1.08, "learning_rate": 0.00013740645599446318, "loss": 0.0122, "step": 418170 }, { "epoch": 1.08, "learning_rate": 0.0001374025677780917, "loss": 0.0093, "step": 418180 }, { "epoch": 1.08, "learning_rate": 0.00013739867956172024, "loss": 0.0087, "step": 418190 }, { "epoch": 1.08, "learning_rate": 0.00013739479134534878, "loss": 0.0154, "step": 418200 }, { "epoch": 1.08, "learning_rate": 0.00013739090312897732, "loss": 0.0109, "step": 418210 }, { "epoch": 1.08, "learning_rate": 0.00013738701491260584, "loss": 0.0095, "step": 418220 }, { "epoch": 1.08, "learning_rate": 0.00013738312669623438, "loss": 0.0103, "step": 418230 }, { "epoch": 1.08, "learning_rate": 0.00013737923847986292, "loss": 0.01, "step": 418240 }, { "epoch": 1.08, "learning_rate": 0.00013737535026349146, "loss": 0.0101, "step": 418250 }, { "epoch": 1.08, "learning_rate": 0.00013737146204711998, "loss": 0.014, "step": 418260 }, { "epoch": 1.08, "learning_rate": 0.00013736757383074852, "loss": 0.0135, "step": 418270 }, { "epoch": 1.08, "learning_rate": 0.00013736368561437706, "loss": 0.0136, "step": 418280 }, { "epoch": 1.08, "learning_rate": 0.0001373597973980056, "loss": 0.0133, "step": 418290 }, { "epoch": 1.08, "learning_rate": 0.00013735590918163412, "loss": 0.0096, "step": 418300 }, { "epoch": 1.08, "learning_rate": 0.00013735202096526266, "loss": 0.0096, "step": 418310 }, { "epoch": 1.08, "learning_rate": 0.0001373481327488912, "loss": 0.0131, "step": 418320 }, { "epoch": 1.08, "learning_rate": 0.0001373442445325197, "loss": 0.0119, "step": 418330 }, { "epoch": 1.08, "learning_rate": 0.00013734035631614828, "loss": 0.0113, "step": 418340 }, { "epoch": 1.08, "learning_rate": 0.0001373364680997768, "loss": 0.0089, "step": 418350 }, { "epoch": 1.08, "learning_rate": 0.00013733257988340534, "loss": 0.0114, "step": 418360 }, { "epoch": 1.08, "learning_rate": 0.00013732869166703388, "loss": 0.0111, "step": 418370 }, { "epoch": 1.08, "learning_rate": 0.00013732480345066242, "loss": 0.0155, "step": 418380 }, { "epoch": 1.08, "learning_rate": 0.00013732091523429094, "loss": 0.0113, "step": 418390 }, { "epoch": 1.08, "learning_rate": 0.00013731702701791948, "loss": 0.01, "step": 418400 }, { "epoch": 1.08, "learning_rate": 0.00013731313880154802, "loss": 0.0101, "step": 418410 }, { "epoch": 1.08, "learning_rate": 0.00013730925058517656, "loss": 0.0123, "step": 418420 }, { "epoch": 1.08, "learning_rate": 0.00013730536236880508, "loss": 0.0149, "step": 418430 }, { "epoch": 1.08, "learning_rate": 0.00013730147415243362, "loss": 0.0118, "step": 418440 }, { "epoch": 1.08, "learning_rate": 0.00013729758593606216, "loss": 0.0108, "step": 418450 }, { "epoch": 1.08, "learning_rate": 0.0001372936977196907, "loss": 0.0111, "step": 418460 }, { "epoch": 1.08, "learning_rate": 0.00013728980950331921, "loss": 0.0139, "step": 418470 }, { "epoch": 1.08, "learning_rate": 0.00013728592128694778, "loss": 0.0101, "step": 418480 }, { "epoch": 1.08, "learning_rate": 0.0001372820330705763, "loss": 0.0114, "step": 418490 }, { "epoch": 1.08, "learning_rate": 0.00013727814485420484, "loss": 0.0109, "step": 418500 }, { "epoch": 1.08, "learning_rate": 0.00013727425663783338, "loss": 0.0124, "step": 418510 }, { "epoch": 1.08, "learning_rate": 0.00013727036842146192, "loss": 0.0115, "step": 418520 }, { "epoch": 1.08, "learning_rate": 0.00013726648020509044, "loss": 0.0121, "step": 418530 }, { "epoch": 1.08, "learning_rate": 0.00013726259198871898, "loss": 0.0097, "step": 418540 }, { "epoch": 1.08, "learning_rate": 0.00013725870377234752, "loss": 0.0101, "step": 418550 }, { "epoch": 1.08, "learning_rate": 0.00013725481555597604, "loss": 0.014, "step": 418560 }, { "epoch": 1.08, "learning_rate": 0.00013725092733960458, "loss": 0.0087, "step": 418570 }, { "epoch": 1.09, "learning_rate": 0.00013724703912323312, "loss": 0.0113, "step": 418580 }, { "epoch": 1.09, "learning_rate": 0.00013724315090686166, "loss": 0.0099, "step": 418590 }, { "epoch": 1.09, "learning_rate": 0.00013723926269049017, "loss": 0.014, "step": 418600 }, { "epoch": 1.09, "learning_rate": 0.00013723537447411872, "loss": 0.0098, "step": 418610 }, { "epoch": 1.09, "learning_rate": 0.00013723148625774726, "loss": 0.0111, "step": 418620 }, { "epoch": 1.09, "learning_rate": 0.0001372275980413758, "loss": 0.0114, "step": 418630 }, { "epoch": 1.09, "learning_rate": 0.00013722370982500431, "loss": 0.0142, "step": 418640 }, { "epoch": 1.09, "learning_rate": 0.00013721982160863286, "loss": 0.0105, "step": 418650 }, { "epoch": 1.09, "learning_rate": 0.0001372159333922614, "loss": 0.0102, "step": 418660 }, { "epoch": 1.09, "learning_rate": 0.00013721204517588994, "loss": 0.0128, "step": 418670 }, { "epoch": 1.09, "learning_rate": 0.00013720815695951848, "loss": 0.01, "step": 418680 }, { "epoch": 1.09, "learning_rate": 0.00013720426874314702, "loss": 0.0107, "step": 418690 }, { "epoch": 1.09, "learning_rate": 0.00013720038052677554, "loss": 0.0115, "step": 418700 }, { "epoch": 1.09, "learning_rate": 0.00013719649231040408, "loss": 0.0114, "step": 418710 }, { "epoch": 1.09, "learning_rate": 0.00013719260409403262, "loss": 0.0127, "step": 418720 }, { "epoch": 1.09, "learning_rate": 0.00013718871587766116, "loss": 0.0114, "step": 418730 }, { "epoch": 1.09, "learning_rate": 0.00013718482766128968, "loss": 0.0127, "step": 418740 }, { "epoch": 1.09, "learning_rate": 0.00013718093944491822, "loss": 0.0117, "step": 418750 }, { "epoch": 1.09, "learning_rate": 0.00013717705122854676, "loss": 0.0131, "step": 418760 }, { "epoch": 1.09, "learning_rate": 0.0001371731630121753, "loss": 0.0126, "step": 418770 }, { "epoch": 1.09, "learning_rate": 0.00013716927479580382, "loss": 0.0076, "step": 418780 }, { "epoch": 1.09, "learning_rate": 0.00013716538657943236, "loss": 0.0134, "step": 418790 }, { "epoch": 1.09, "learning_rate": 0.0001371614983630609, "loss": 0.0105, "step": 418800 }, { "epoch": 1.09, "learning_rate": 0.0001371576101466894, "loss": 0.0105, "step": 418810 }, { "epoch": 1.09, "learning_rate": 0.00013715372193031795, "loss": 0.0109, "step": 418820 }, { "epoch": 1.09, "learning_rate": 0.0001371498337139465, "loss": 0.0172, "step": 418830 }, { "epoch": 1.09, "learning_rate": 0.00013714594549757504, "loss": 0.0135, "step": 418840 }, { "epoch": 1.09, "learning_rate": 0.00013714205728120355, "loss": 0.0117, "step": 418850 }, { "epoch": 1.09, "learning_rate": 0.00013713816906483212, "loss": 0.0133, "step": 418860 }, { "epoch": 1.09, "learning_rate": 0.00013713428084846064, "loss": 0.0128, "step": 418870 }, { "epoch": 1.09, "learning_rate": 0.00013713039263208918, "loss": 0.0154, "step": 418880 }, { "epoch": 1.09, "learning_rate": 0.00013712650441571772, "loss": 0.0158, "step": 418890 }, { "epoch": 1.09, "learning_rate": 0.00013712261619934626, "loss": 0.0123, "step": 418900 }, { "epoch": 1.09, "learning_rate": 0.00013711872798297478, "loss": 0.0087, "step": 418910 }, { "epoch": 1.09, "learning_rate": 0.00013711483976660332, "loss": 0.0095, "step": 418920 }, { "epoch": 1.09, "learning_rate": 0.00013711095155023186, "loss": 0.0117, "step": 418930 }, { "epoch": 1.09, "learning_rate": 0.0001371070633338604, "loss": 0.0098, "step": 418940 }, { "epoch": 1.09, "learning_rate": 0.00013710317511748891, "loss": 0.0119, "step": 418950 }, { "epoch": 1.09, "learning_rate": 0.00013709928690111746, "loss": 0.0071, "step": 418960 }, { "epoch": 1.09, "learning_rate": 0.000137095398684746, "loss": 0.0103, "step": 418970 }, { "epoch": 1.09, "learning_rate": 0.00013709151046837454, "loss": 0.009, "step": 418980 }, { "epoch": 1.09, "learning_rate": 0.00013708762225200305, "loss": 0.013, "step": 418990 }, { "epoch": 1.09, "learning_rate": 0.0001370837340356316, "loss": 0.0105, "step": 419000 }, { "epoch": 1.09, "eval_cer": 0.881751673615864, "eval_loss": 0.007565063424408436, "eval_runtime": 107.4764, "eval_samples_per_second": 18.609, "eval_steps_per_second": 4.652, "step": 419000 }, { "epoch": 1.09, "learning_rate": 0.00013707984581926014, "loss": 0.0118, "step": 419010 }, { "epoch": 1.09, "learning_rate": 0.00013707595760288868, "loss": 0.0109, "step": 419020 }, { "epoch": 1.09, "learning_rate": 0.00013707206938651722, "loss": 0.0136, "step": 419030 }, { "epoch": 1.09, "learning_rate": 0.00013706818117014576, "loss": 0.0149, "step": 419040 }, { "epoch": 1.09, "learning_rate": 0.00013706429295377428, "loss": 0.0147, "step": 419050 }, { "epoch": 1.09, "learning_rate": 0.00013706040473740282, "loss": 0.0107, "step": 419060 }, { "epoch": 1.09, "learning_rate": 0.00013705651652103136, "loss": 0.0127, "step": 419070 }, { "epoch": 1.09, "learning_rate": 0.00013705262830465987, "loss": 0.0123, "step": 419080 }, { "epoch": 1.09, "learning_rate": 0.00013704874008828842, "loss": 0.0099, "step": 419090 }, { "epoch": 1.09, "learning_rate": 0.00013704485187191696, "loss": 0.0125, "step": 419100 }, { "epoch": 1.09, "learning_rate": 0.0001370409636555455, "loss": 0.0126, "step": 419110 }, { "epoch": 1.09, "learning_rate": 0.00013703707543917401, "loss": 0.0132, "step": 419120 }, { "epoch": 1.09, "learning_rate": 0.00013703318722280256, "loss": 0.0143, "step": 419130 }, { "epoch": 1.09, "learning_rate": 0.0001370292990064311, "loss": 0.0122, "step": 419140 }, { "epoch": 1.09, "learning_rate": 0.00013702541079005964, "loss": 0.0128, "step": 419150 }, { "epoch": 1.09, "learning_rate": 0.00013702152257368815, "loss": 0.011, "step": 419160 }, { "epoch": 1.09, "learning_rate": 0.0001370176343573167, "loss": 0.0135, "step": 419170 }, { "epoch": 1.09, "learning_rate": 0.00013701374614094524, "loss": 0.0114, "step": 419180 }, { "epoch": 1.09, "learning_rate": 0.00013700985792457378, "loss": 0.0133, "step": 419190 }, { "epoch": 1.09, "learning_rate": 0.0001370059697082023, "loss": 0.0115, "step": 419200 }, { "epoch": 1.09, "learning_rate": 0.00013700208149183086, "loss": 0.0095, "step": 419210 }, { "epoch": 1.09, "learning_rate": 0.00013699819327545938, "loss": 0.0113, "step": 419220 }, { "epoch": 1.09, "learning_rate": 0.00013699430505908792, "loss": 0.0114, "step": 419230 }, { "epoch": 1.09, "learning_rate": 0.00013699041684271646, "loss": 0.0094, "step": 419240 }, { "epoch": 1.09, "learning_rate": 0.000136986528626345, "loss": 0.0091, "step": 419250 }, { "epoch": 1.09, "learning_rate": 0.00013698264040997352, "loss": 0.012, "step": 419260 }, { "epoch": 1.09, "learning_rate": 0.00013697875219360206, "loss": 0.0098, "step": 419270 }, { "epoch": 1.09, "learning_rate": 0.0001369748639772306, "loss": 0.0114, "step": 419280 }, { "epoch": 1.09, "learning_rate": 0.00013697097576085914, "loss": 0.0099, "step": 419290 }, { "epoch": 1.09, "learning_rate": 0.00013696708754448766, "loss": 0.0099, "step": 419300 }, { "epoch": 1.09, "learning_rate": 0.0001369631993281162, "loss": 0.0114, "step": 419310 }, { "epoch": 1.09, "learning_rate": 0.00013695931111174474, "loss": 0.0107, "step": 419320 }, { "epoch": 1.09, "learning_rate": 0.00013695542289537325, "loss": 0.0091, "step": 419330 }, { "epoch": 1.09, "learning_rate": 0.0001369515346790018, "loss": 0.0151, "step": 419340 }, { "epoch": 1.09, "learning_rate": 0.00013694764646263034, "loss": 0.0151, "step": 419350 }, { "epoch": 1.09, "learning_rate": 0.00013694375824625888, "loss": 0.0122, "step": 419360 }, { "epoch": 1.09, "learning_rate": 0.0001369398700298874, "loss": 0.0112, "step": 419370 }, { "epoch": 1.09, "learning_rate": 0.00013693598181351596, "loss": 0.0144, "step": 419380 }, { "epoch": 1.09, "learning_rate": 0.00013693209359714448, "loss": 0.0117, "step": 419390 }, { "epoch": 1.09, "learning_rate": 0.00013692820538077302, "loss": 0.0116, "step": 419400 }, { "epoch": 1.09, "learning_rate": 0.00013692431716440156, "loss": 0.0165, "step": 419410 }, { "epoch": 1.09, "learning_rate": 0.0001369204289480301, "loss": 0.0112, "step": 419420 }, { "epoch": 1.09, "learning_rate": 0.00013691654073165862, "loss": 0.0115, "step": 419430 }, { "epoch": 1.09, "learning_rate": 0.00013691265251528716, "loss": 0.0115, "step": 419440 }, { "epoch": 1.09, "learning_rate": 0.0001369087642989157, "loss": 0.0104, "step": 419450 }, { "epoch": 1.09, "learning_rate": 0.00013690487608254424, "loss": 0.0104, "step": 419460 }, { "epoch": 1.09, "learning_rate": 0.00013690098786617275, "loss": 0.0117, "step": 419470 }, { "epoch": 1.09, "learning_rate": 0.0001368970996498013, "loss": 0.0122, "step": 419480 }, { "epoch": 1.09, "learning_rate": 0.00013689321143342984, "loss": 0.012, "step": 419490 }, { "epoch": 1.09, "learning_rate": 0.00013688932321705838, "loss": 0.0109, "step": 419500 }, { "epoch": 1.09, "learning_rate": 0.0001368854350006869, "loss": 0.0145, "step": 419510 }, { "epoch": 1.09, "learning_rate": 0.00013688154678431544, "loss": 0.0105, "step": 419520 }, { "epoch": 1.09, "learning_rate": 0.00013687765856794398, "loss": 0.0119, "step": 419530 }, { "epoch": 1.09, "learning_rate": 0.00013687377035157252, "loss": 0.0121, "step": 419540 }, { "epoch": 1.09, "learning_rate": 0.00013686988213520106, "loss": 0.011, "step": 419550 }, { "epoch": 1.09, "learning_rate": 0.00013686599391882958, "loss": 0.0116, "step": 419560 }, { "epoch": 1.09, "learning_rate": 0.00013686210570245812, "loss": 0.0112, "step": 419570 }, { "epoch": 1.09, "learning_rate": 0.00013685821748608666, "loss": 0.0103, "step": 419580 }, { "epoch": 1.09, "learning_rate": 0.0001368543292697152, "loss": 0.0132, "step": 419590 }, { "epoch": 1.09, "learning_rate": 0.00013685044105334371, "loss": 0.0101, "step": 419600 }, { "epoch": 1.09, "learning_rate": 0.00013684655283697226, "loss": 0.0132, "step": 419610 }, { "epoch": 1.09, "learning_rate": 0.0001368426646206008, "loss": 0.0117, "step": 419620 }, { "epoch": 1.09, "learning_rate": 0.00013683877640422934, "loss": 0.0124, "step": 419630 }, { "epoch": 1.09, "learning_rate": 0.00013683488818785785, "loss": 0.0118, "step": 419640 }, { "epoch": 1.09, "learning_rate": 0.0001368309999714864, "loss": 0.009, "step": 419650 }, { "epoch": 1.09, "learning_rate": 0.00013682711175511494, "loss": 0.012, "step": 419660 }, { "epoch": 1.09, "learning_rate": 0.00013682322353874348, "loss": 0.011, "step": 419670 }, { "epoch": 1.09, "learning_rate": 0.000136819335322372, "loss": 0.0125, "step": 419680 }, { "epoch": 1.09, "learning_rate": 0.00013681544710600054, "loss": 0.0119, "step": 419690 }, { "epoch": 1.09, "learning_rate": 0.00013681155888962908, "loss": 0.0133, "step": 419700 }, { "epoch": 1.09, "learning_rate": 0.00013680767067325762, "loss": 0.0096, "step": 419710 }, { "epoch": 1.09, "learning_rate": 0.00013680378245688613, "loss": 0.0112, "step": 419720 }, { "epoch": 1.09, "learning_rate": 0.0001367998942405147, "loss": 0.0152, "step": 419730 }, { "epoch": 1.09, "learning_rate": 0.00013679600602414322, "loss": 0.0113, "step": 419740 }, { "epoch": 1.09, "learning_rate": 0.00013679211780777176, "loss": 0.0081, "step": 419750 }, { "epoch": 1.09, "learning_rate": 0.0001367882295914003, "loss": 0.0124, "step": 419760 }, { "epoch": 1.09, "learning_rate": 0.00013678434137502884, "loss": 0.0077, "step": 419770 }, { "epoch": 1.09, "learning_rate": 0.00013678045315865736, "loss": 0.0116, "step": 419780 }, { "epoch": 1.09, "learning_rate": 0.0001367765649422859, "loss": 0.0109, "step": 419790 }, { "epoch": 1.09, "learning_rate": 0.00013677267672591444, "loss": 0.0109, "step": 419800 }, { "epoch": 1.09, "learning_rate": 0.00013676878850954295, "loss": 0.0118, "step": 419810 }, { "epoch": 1.09, "learning_rate": 0.0001367649002931715, "loss": 0.0112, "step": 419820 }, { "epoch": 1.09, "learning_rate": 0.00013676101207680004, "loss": 0.0125, "step": 419830 }, { "epoch": 1.09, "learning_rate": 0.00013675712386042858, "loss": 0.0096, "step": 419840 }, { "epoch": 1.09, "learning_rate": 0.0001367532356440571, "loss": 0.0105, "step": 419850 }, { "epoch": 1.09, "learning_rate": 0.00013674934742768563, "loss": 0.0094, "step": 419860 }, { "epoch": 1.09, "learning_rate": 0.00013674545921131418, "loss": 0.0135, "step": 419870 }, { "epoch": 1.09, "learning_rate": 0.00013674157099494272, "loss": 0.0085, "step": 419880 }, { "epoch": 1.09, "learning_rate": 0.00013673768277857123, "loss": 0.0116, "step": 419890 }, { "epoch": 1.09, "learning_rate": 0.0001367337945621998, "loss": 0.0147, "step": 419900 }, { "epoch": 1.09, "learning_rate": 0.00013672990634582832, "loss": 0.0099, "step": 419910 }, { "epoch": 1.09, "learning_rate": 0.00013672601812945686, "loss": 0.01, "step": 419920 }, { "epoch": 1.09, "learning_rate": 0.0001367221299130854, "loss": 0.0105, "step": 419930 }, { "epoch": 1.09, "learning_rate": 0.00013671824169671394, "loss": 0.0147, "step": 419940 }, { "epoch": 1.09, "learning_rate": 0.00013671435348034246, "loss": 0.0133, "step": 419950 }, { "epoch": 1.09, "learning_rate": 0.000136710465263971, "loss": 0.013, "step": 419960 }, { "epoch": 1.09, "learning_rate": 0.00013670657704759954, "loss": 0.0112, "step": 419970 }, { "epoch": 1.09, "learning_rate": 0.00013670268883122808, "loss": 0.0096, "step": 419980 }, { "epoch": 1.09, "learning_rate": 0.0001366988006148566, "loss": 0.0123, "step": 419990 }, { "epoch": 1.09, "learning_rate": 0.00013669491239848514, "loss": 0.0102, "step": 420000 }, { "epoch": 1.09, "eval_cer": 0.8817488743419957, "eval_loss": 0.007611589971929789, "eval_runtime": 107.4861, "eval_samples_per_second": 18.607, "eval_steps_per_second": 4.652, "step": 420000 }, { "epoch": 1.09, "learning_rate": 0.00013669102418211368, "loss": 0.0117, "step": 420010 }, { "epoch": 1.09, "learning_rate": 0.00013668713596574222, "loss": 0.0129, "step": 420020 }, { "epoch": 1.09, "learning_rate": 0.00013668324774937073, "loss": 0.0097, "step": 420030 }, { "epoch": 1.09, "learning_rate": 0.00013667935953299928, "loss": 0.0129, "step": 420040 }, { "epoch": 1.09, "learning_rate": 0.00013667547131662782, "loss": 0.0102, "step": 420050 }, { "epoch": 1.09, "learning_rate": 0.00013667158310025633, "loss": 0.0096, "step": 420060 }, { "epoch": 1.09, "learning_rate": 0.0001366676948838849, "loss": 0.0111, "step": 420070 }, { "epoch": 1.09, "learning_rate": 0.00013666380666751342, "loss": 0.0146, "step": 420080 }, { "epoch": 1.09, "learning_rate": 0.00013665991845114196, "loss": 0.0143, "step": 420090 }, { "epoch": 1.09, "learning_rate": 0.0001366560302347705, "loss": 0.0131, "step": 420100 }, { "epoch": 1.09, "learning_rate": 0.00013665214201839904, "loss": 0.0138, "step": 420110 }, { "epoch": 1.09, "learning_rate": 0.00013664825380202755, "loss": 0.0088, "step": 420120 }, { "epoch": 1.09, "learning_rate": 0.0001366443655856561, "loss": 0.0106, "step": 420130 }, { "epoch": 1.09, "learning_rate": 0.00013664047736928464, "loss": 0.008, "step": 420140 }, { "epoch": 1.09, "learning_rate": 0.00013663658915291318, "loss": 0.01, "step": 420150 }, { "epoch": 1.09, "learning_rate": 0.0001366327009365417, "loss": 0.0103, "step": 420160 }, { "epoch": 1.09, "learning_rate": 0.00013662881272017024, "loss": 0.0104, "step": 420170 }, { "epoch": 1.09, "learning_rate": 0.00013662492450379878, "loss": 0.0111, "step": 420180 }, { "epoch": 1.09, "learning_rate": 0.00013662103628742732, "loss": 0.0116, "step": 420190 }, { "epoch": 1.09, "learning_rate": 0.00013661714807105583, "loss": 0.0116, "step": 420200 }, { "epoch": 1.09, "learning_rate": 0.00013661325985468438, "loss": 0.0079, "step": 420210 }, { "epoch": 1.09, "learning_rate": 0.00013660937163831292, "loss": 0.0097, "step": 420220 }, { "epoch": 1.09, "learning_rate": 0.00013660548342194146, "loss": 0.0124, "step": 420230 }, { "epoch": 1.09, "learning_rate": 0.00013660159520556997, "loss": 0.0116, "step": 420240 }, { "epoch": 1.09, "learning_rate": 0.00013659770698919854, "loss": 0.0084, "step": 420250 }, { "epoch": 1.09, "learning_rate": 0.00013659381877282706, "loss": 0.0124, "step": 420260 }, { "epoch": 1.09, "learning_rate": 0.0001365899305564556, "loss": 0.0115, "step": 420270 }, { "epoch": 1.09, "learning_rate": 0.00013658604234008414, "loss": 0.0107, "step": 420280 }, { "epoch": 1.09, "learning_rate": 0.00013658215412371268, "loss": 0.0093, "step": 420290 }, { "epoch": 1.09, "learning_rate": 0.0001365782659073412, "loss": 0.013, "step": 420300 }, { "epoch": 1.09, "learning_rate": 0.00013657437769096974, "loss": 0.0107, "step": 420310 }, { "epoch": 1.09, "learning_rate": 0.00013657048947459828, "loss": 0.0085, "step": 420320 }, { "epoch": 1.09, "learning_rate": 0.0001365666012582268, "loss": 0.013, "step": 420330 }, { "epoch": 1.09, "learning_rate": 0.00013656271304185534, "loss": 0.0153, "step": 420340 }, { "epoch": 1.09, "learning_rate": 0.00013655882482548388, "loss": 0.0124, "step": 420350 }, { "epoch": 1.09, "learning_rate": 0.00013655493660911242, "loss": 0.0109, "step": 420360 }, { "epoch": 1.09, "learning_rate": 0.00013655104839274093, "loss": 0.009, "step": 420370 }, { "epoch": 1.09, "learning_rate": 0.00013654716017636947, "loss": 0.0109, "step": 420380 }, { "epoch": 1.09, "learning_rate": 0.00013654327195999802, "loss": 0.0107, "step": 420390 }, { "epoch": 1.09, "learning_rate": 0.00013653938374362656, "loss": 0.0106, "step": 420400 }, { "epoch": 1.09, "learning_rate": 0.00013653549552725507, "loss": 0.01, "step": 420410 }, { "epoch": 1.09, "learning_rate": 0.00013653160731088364, "loss": 0.013, "step": 420420 }, { "epoch": 1.09, "learning_rate": 0.00013652771909451216, "loss": 0.0118, "step": 420430 }, { "epoch": 1.09, "learning_rate": 0.0001365238308781407, "loss": 0.013, "step": 420440 }, { "epoch": 1.09, "learning_rate": 0.00013651994266176924, "loss": 0.0107, "step": 420450 }, { "epoch": 1.09, "learning_rate": 0.00013651605444539778, "loss": 0.0113, "step": 420460 }, { "epoch": 1.09, "learning_rate": 0.0001365121662290263, "loss": 0.0109, "step": 420470 }, { "epoch": 1.09, "learning_rate": 0.00013650827801265484, "loss": 0.0151, "step": 420480 }, { "epoch": 1.09, "learning_rate": 0.00013650438979628338, "loss": 0.0115, "step": 420490 }, { "epoch": 1.09, "learning_rate": 0.00013650050157991192, "loss": 0.0174, "step": 420500 }, { "epoch": 1.09, "learning_rate": 0.00013649661336354043, "loss": 0.0088, "step": 420510 }, { "epoch": 1.09, "learning_rate": 0.00013649272514716898, "loss": 0.011, "step": 420520 }, { "epoch": 1.09, "learning_rate": 0.00013648883693079752, "loss": 0.0112, "step": 420530 }, { "epoch": 1.09, "learning_rate": 0.00013648494871442606, "loss": 0.0126, "step": 420540 }, { "epoch": 1.09, "learning_rate": 0.00013648106049805457, "loss": 0.0098, "step": 420550 }, { "epoch": 1.09, "learning_rate": 0.00013647717228168312, "loss": 0.0117, "step": 420560 }, { "epoch": 1.09, "learning_rate": 0.00013647328406531166, "loss": 0.0083, "step": 420570 }, { "epoch": 1.09, "learning_rate": 0.00013646939584894017, "loss": 0.0142, "step": 420580 }, { "epoch": 1.09, "learning_rate": 0.00013646550763256871, "loss": 0.0152, "step": 420590 }, { "epoch": 1.09, "learning_rate": 0.00013646161941619726, "loss": 0.0096, "step": 420600 }, { "epoch": 1.09, "learning_rate": 0.0001364577311998258, "loss": 0.0108, "step": 420610 }, { "epoch": 1.09, "learning_rate": 0.00013645384298345434, "loss": 0.0076, "step": 420620 }, { "epoch": 1.09, "learning_rate": 0.00013644995476708288, "loss": 0.0107, "step": 420630 }, { "epoch": 1.09, "learning_rate": 0.0001364460665507114, "loss": 0.012, "step": 420640 }, { "epoch": 1.09, "learning_rate": 0.00013644217833433994, "loss": 0.0106, "step": 420650 }, { "epoch": 1.09, "learning_rate": 0.00013643829011796848, "loss": 0.0139, "step": 420660 }, { "epoch": 1.09, "learning_rate": 0.00013643440190159702, "loss": 0.0152, "step": 420670 }, { "epoch": 1.09, "learning_rate": 0.00013643051368522553, "loss": 0.0124, "step": 420680 }, { "epoch": 1.09, "learning_rate": 0.00013642662546885408, "loss": 0.0087, "step": 420690 }, { "epoch": 1.09, "learning_rate": 0.00013642273725248262, "loss": 0.0093, "step": 420700 }, { "epoch": 1.09, "learning_rate": 0.00013641884903611116, "loss": 0.0094, "step": 420710 }, { "epoch": 1.09, "learning_rate": 0.00013641496081973967, "loss": 0.0126, "step": 420720 }, { "epoch": 1.09, "learning_rate": 0.00013641107260336822, "loss": 0.0087, "step": 420730 }, { "epoch": 1.09, "learning_rate": 0.00013640718438699676, "loss": 0.0114, "step": 420740 }, { "epoch": 1.09, "learning_rate": 0.0001364032961706253, "loss": 0.0163, "step": 420750 }, { "epoch": 1.09, "learning_rate": 0.0001363994079542538, "loss": 0.0115, "step": 420760 }, { "epoch": 1.09, "learning_rate": 0.00013639551973788238, "loss": 0.0113, "step": 420770 }, { "epoch": 1.09, "learning_rate": 0.0001363916315215109, "loss": 0.0144, "step": 420780 }, { "epoch": 1.09, "learning_rate": 0.0001363877433051394, "loss": 0.014, "step": 420790 }, { "epoch": 1.09, "learning_rate": 0.00013638385508876798, "loss": 0.0111, "step": 420800 }, { "epoch": 1.09, "learning_rate": 0.0001363799668723965, "loss": 0.0123, "step": 420810 }, { "epoch": 1.09, "learning_rate": 0.00013637607865602504, "loss": 0.014, "step": 420820 }, { "epoch": 1.09, "learning_rate": 0.00013637219043965358, "loss": 0.0094, "step": 420830 }, { "epoch": 1.09, "learning_rate": 0.00013636830222328212, "loss": 0.0086, "step": 420840 }, { "epoch": 1.09, "learning_rate": 0.00013636441400691063, "loss": 0.0145, "step": 420850 }, { "epoch": 1.09, "learning_rate": 0.00013636052579053918, "loss": 0.0122, "step": 420860 }, { "epoch": 1.09, "learning_rate": 0.00013635663757416772, "loss": 0.01, "step": 420870 }, { "epoch": 1.09, "learning_rate": 0.00013635274935779626, "loss": 0.0112, "step": 420880 }, { "epoch": 1.09, "learning_rate": 0.00013634886114142477, "loss": 0.0106, "step": 420890 }, { "epoch": 1.09, "learning_rate": 0.00013634497292505331, "loss": 0.009, "step": 420900 }, { "epoch": 1.09, "learning_rate": 0.00013634108470868186, "loss": 0.0108, "step": 420910 }, { "epoch": 1.09, "learning_rate": 0.0001363371964923104, "loss": 0.0095, "step": 420920 }, { "epoch": 1.09, "learning_rate": 0.0001363333082759389, "loss": 0.0111, "step": 420930 }, { "epoch": 1.09, "learning_rate": 0.00013632942005956748, "loss": 0.013, "step": 420940 }, { "epoch": 1.09, "learning_rate": 0.000136325531843196, "loss": 0.0125, "step": 420950 }, { "epoch": 1.09, "learning_rate": 0.00013632164362682454, "loss": 0.0101, "step": 420960 }, { "epoch": 1.09, "learning_rate": 0.00013631775541045308, "loss": 0.0163, "step": 420970 }, { "epoch": 1.09, "learning_rate": 0.00013631386719408162, "loss": 0.0112, "step": 420980 }, { "epoch": 1.09, "learning_rate": 0.00013630997897771014, "loss": 0.0112, "step": 420990 }, { "epoch": 1.09, "learning_rate": 0.00013630609076133868, "loss": 0.0104, "step": 421000 }, { "epoch": 1.09, "eval_cer": 0.8817152830555753, "eval_loss": 0.007646199781447649, "eval_runtime": 107.458, "eval_samples_per_second": 18.612, "eval_steps_per_second": 4.653, "step": 421000 }, { "epoch": 1.09, "learning_rate": 0.00013630220254496722, "loss": 0.0119, "step": 421010 }, { "epoch": 1.09, "learning_rate": 0.00013629831432859576, "loss": 0.0128, "step": 421020 }, { "epoch": 1.09, "learning_rate": 0.00013629442611222427, "loss": 0.0133, "step": 421030 }, { "epoch": 1.09, "learning_rate": 0.00013629053789585282, "loss": 0.0121, "step": 421040 }, { "epoch": 1.09, "learning_rate": 0.00013628664967948136, "loss": 0.0104, "step": 421050 }, { "epoch": 1.09, "learning_rate": 0.00013628276146310987, "loss": 0.0098, "step": 421060 }, { "epoch": 1.09, "learning_rate": 0.00013627887324673841, "loss": 0.0097, "step": 421070 }, { "epoch": 1.09, "learning_rate": 0.00013627498503036696, "loss": 0.0118, "step": 421080 }, { "epoch": 1.09, "learning_rate": 0.0001362710968139955, "loss": 0.0115, "step": 421090 }, { "epoch": 1.09, "learning_rate": 0.000136267208597624, "loss": 0.0111, "step": 421100 }, { "epoch": 1.09, "learning_rate": 0.00013626332038125255, "loss": 0.0096, "step": 421110 }, { "epoch": 1.09, "learning_rate": 0.0001362594321648811, "loss": 0.0156, "step": 421120 }, { "epoch": 1.09, "learning_rate": 0.00013625554394850964, "loss": 0.011, "step": 421130 }, { "epoch": 1.09, "learning_rate": 0.00013625165573213818, "loss": 0.0128, "step": 421140 }, { "epoch": 1.09, "learning_rate": 0.00013624776751576672, "loss": 0.0106, "step": 421150 }, { "epoch": 1.09, "learning_rate": 0.00013624387929939523, "loss": 0.0103, "step": 421160 }, { "epoch": 1.09, "learning_rate": 0.00013623999108302378, "loss": 0.0081, "step": 421170 }, { "epoch": 1.09, "learning_rate": 0.00013623610286665232, "loss": 0.0111, "step": 421180 }, { "epoch": 1.09, "learning_rate": 0.00013623221465028086, "loss": 0.0091, "step": 421190 }, { "epoch": 1.09, "learning_rate": 0.00013622832643390937, "loss": 0.0152, "step": 421200 }, { "epoch": 1.09, "learning_rate": 0.00013622443821753792, "loss": 0.0138, "step": 421210 }, { "epoch": 1.09, "learning_rate": 0.00013622055000116646, "loss": 0.0132, "step": 421220 }, { "epoch": 1.09, "learning_rate": 0.000136216661784795, "loss": 0.0112, "step": 421230 }, { "epoch": 1.09, "learning_rate": 0.0001362127735684235, "loss": 0.0268, "step": 421240 }, { "epoch": 1.09, "learning_rate": 0.00013620888535205206, "loss": 0.0143, "step": 421250 }, { "epoch": 1.09, "learning_rate": 0.0001362049971356806, "loss": 0.0121, "step": 421260 }, { "epoch": 1.09, "learning_rate": 0.00013620110891930914, "loss": 0.0105, "step": 421270 }, { "epoch": 1.09, "learning_rate": 0.00013619722070293765, "loss": 0.0097, "step": 421280 }, { "epoch": 1.09, "learning_rate": 0.0001361933324865662, "loss": 0.0149, "step": 421290 }, { "epoch": 1.09, "learning_rate": 0.00013618944427019474, "loss": 0.0101, "step": 421300 }, { "epoch": 1.09, "learning_rate": 0.00013618555605382325, "loss": 0.0108, "step": 421310 }, { "epoch": 1.09, "learning_rate": 0.00013618166783745182, "loss": 0.0097, "step": 421320 }, { "epoch": 1.09, "learning_rate": 0.00013617777962108033, "loss": 0.0132, "step": 421330 }, { "epoch": 1.09, "learning_rate": 0.00013617389140470888, "loss": 0.011, "step": 421340 }, { "epoch": 1.09, "learning_rate": 0.00013617000318833742, "loss": 0.0149, "step": 421350 }, { "epoch": 1.09, "learning_rate": 0.00013616611497196596, "loss": 0.0117, "step": 421360 }, { "epoch": 1.09, "learning_rate": 0.00013616222675559447, "loss": 0.0146, "step": 421370 }, { "epoch": 1.09, "learning_rate": 0.00013615833853922302, "loss": 0.0124, "step": 421380 }, { "epoch": 1.09, "learning_rate": 0.00013615445032285156, "loss": 0.0149, "step": 421390 }, { "epoch": 1.09, "learning_rate": 0.0001361505621064801, "loss": 0.0121, "step": 421400 }, { "epoch": 1.09, "learning_rate": 0.0001361466738901086, "loss": 0.0101, "step": 421410 }, { "epoch": 1.09, "learning_rate": 0.00013614278567373715, "loss": 0.0097, "step": 421420 }, { "epoch": 1.09, "learning_rate": 0.0001361388974573657, "loss": 0.0121, "step": 421430 }, { "epoch": 1.09, "learning_rate": 0.00013613500924099424, "loss": 0.0115, "step": 421440 }, { "epoch": 1.09, "learning_rate": 0.00013613112102462275, "loss": 0.012, "step": 421450 }, { "epoch": 1.09, "learning_rate": 0.00013612723280825132, "loss": 0.0152, "step": 421460 }, { "epoch": 1.09, "learning_rate": 0.00013612334459187984, "loss": 0.0097, "step": 421470 }, { "epoch": 1.09, "learning_rate": 0.00013611945637550838, "loss": 0.0109, "step": 421480 }, { "epoch": 1.09, "learning_rate": 0.00013611556815913692, "loss": 0.0128, "step": 421490 }, { "epoch": 1.09, "learning_rate": 0.00013611167994276546, "loss": 0.0091, "step": 421500 }, { "epoch": 1.09, "learning_rate": 0.00013610779172639398, "loss": 0.0102, "step": 421510 }, { "epoch": 1.09, "learning_rate": 0.00013610390351002252, "loss": 0.0126, "step": 421520 }, { "epoch": 1.09, "learning_rate": 0.00013610001529365106, "loss": 0.0109, "step": 421530 }, { "epoch": 1.09, "learning_rate": 0.00013609612707727957, "loss": 0.0122, "step": 421540 }, { "epoch": 1.09, "learning_rate": 0.00013609223886090811, "loss": 0.0121, "step": 421550 }, { "epoch": 1.09, "learning_rate": 0.00013608835064453666, "loss": 0.0137, "step": 421560 }, { "epoch": 1.09, "learning_rate": 0.0001360844624281652, "loss": 0.0123, "step": 421570 }, { "epoch": 1.09, "learning_rate": 0.0001360805742117937, "loss": 0.0101, "step": 421580 }, { "epoch": 1.09, "learning_rate": 0.00013607668599542225, "loss": 0.0098, "step": 421590 }, { "epoch": 1.09, "learning_rate": 0.0001360727977790508, "loss": 0.0108, "step": 421600 }, { "epoch": 1.09, "learning_rate": 0.00013606890956267934, "loss": 0.0129, "step": 421610 }, { "epoch": 1.09, "learning_rate": 0.00013606502134630785, "loss": 0.0142, "step": 421620 }, { "epoch": 1.09, "learning_rate": 0.0001360611331299364, "loss": 0.0136, "step": 421630 }, { "epoch": 1.09, "learning_rate": 0.00013605724491356493, "loss": 0.0093, "step": 421640 }, { "epoch": 1.09, "learning_rate": 0.00013605335669719348, "loss": 0.0121, "step": 421650 }, { "epoch": 1.09, "learning_rate": 0.00013604946848082202, "loss": 0.0104, "step": 421660 }, { "epoch": 1.09, "learning_rate": 0.00013604558026445056, "loss": 0.0128, "step": 421670 }, { "epoch": 1.09, "learning_rate": 0.00013604169204807907, "loss": 0.0102, "step": 421680 }, { "epoch": 1.09, "learning_rate": 0.00013603780383170762, "loss": 0.0142, "step": 421690 }, { "epoch": 1.09, "learning_rate": 0.00013603391561533616, "loss": 0.0118, "step": 421700 }, { "epoch": 1.09, "learning_rate": 0.0001360300273989647, "loss": 0.0103, "step": 421710 }, { "epoch": 1.09, "learning_rate": 0.00013602613918259321, "loss": 0.0103, "step": 421720 }, { "epoch": 1.09, "learning_rate": 0.00013602225096622176, "loss": 0.0088, "step": 421730 }, { "epoch": 1.09, "learning_rate": 0.0001360183627498503, "loss": 0.0109, "step": 421740 }, { "epoch": 1.09, "learning_rate": 0.00013601447453347884, "loss": 0.0116, "step": 421750 }, { "epoch": 1.09, "learning_rate": 0.00013601058631710735, "loss": 0.0136, "step": 421760 }, { "epoch": 1.09, "learning_rate": 0.0001360066981007359, "loss": 0.0093, "step": 421770 }, { "epoch": 1.09, "learning_rate": 0.00013600280988436444, "loss": 0.0097, "step": 421780 }, { "epoch": 1.09, "learning_rate": 0.00013599892166799295, "loss": 0.0122, "step": 421790 }, { "epoch": 1.09, "learning_rate": 0.0001359950334516215, "loss": 0.0092, "step": 421800 }, { "epoch": 1.09, "learning_rate": 0.00013599114523525003, "loss": 0.01, "step": 421810 }, { "epoch": 1.09, "learning_rate": 0.00013598725701887858, "loss": 0.0095, "step": 421820 }, { "epoch": 1.09, "learning_rate": 0.0001359833688025071, "loss": 0.0147, "step": 421830 }, { "epoch": 1.09, "learning_rate": 0.00013597948058613566, "loss": 0.0101, "step": 421840 }, { "epoch": 1.09, "learning_rate": 0.00013597559236976417, "loss": 0.014, "step": 421850 }, { "epoch": 1.09, "learning_rate": 0.00013597170415339272, "loss": 0.0105, "step": 421860 }, { "epoch": 1.09, "learning_rate": 0.00013596781593702126, "loss": 0.0111, "step": 421870 }, { "epoch": 1.09, "learning_rate": 0.0001359639277206498, "loss": 0.0108, "step": 421880 }, { "epoch": 1.09, "learning_rate": 0.0001359600395042783, "loss": 0.0105, "step": 421890 }, { "epoch": 1.09, "learning_rate": 0.00013595615128790685, "loss": 0.0139, "step": 421900 }, { "epoch": 1.09, "learning_rate": 0.0001359522630715354, "loss": 0.0119, "step": 421910 }, { "epoch": 1.09, "learning_rate": 0.00013594837485516394, "loss": 0.0099, "step": 421920 }, { "epoch": 1.09, "learning_rate": 0.00013594448663879245, "loss": 0.0104, "step": 421930 }, { "epoch": 1.09, "learning_rate": 0.000135940598422421, "loss": 0.0103, "step": 421940 }, { "epoch": 1.09, "learning_rate": 0.00013593671020604954, "loss": 0.0123, "step": 421950 }, { "epoch": 1.09, "learning_rate": 0.00013593282198967808, "loss": 0.0127, "step": 421960 }, { "epoch": 1.09, "learning_rate": 0.0001359289337733066, "loss": 0.0127, "step": 421970 }, { "epoch": 1.09, "learning_rate": 0.00013592504555693513, "loss": 0.0106, "step": 421980 }, { "epoch": 1.09, "learning_rate": 0.00013592115734056368, "loss": 0.0132, "step": 421990 }, { "epoch": 1.09, "learning_rate": 0.00013591726912419222, "loss": 0.0109, "step": 422000 }, { "epoch": 1.09, "eval_cer": 0.881727879787983, "eval_loss": 0.008169938810169697, "eval_runtime": 107.7698, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.64, "step": 422000 }, { "epoch": 1.09, "learning_rate": 0.00013591338090782076, "loss": 0.0138, "step": 422010 }, { "epoch": 1.09, "learning_rate": 0.0001359094926914493, "loss": 0.0087, "step": 422020 }, { "epoch": 1.09, "learning_rate": 0.00013590560447507781, "loss": 0.0119, "step": 422030 }, { "epoch": 1.09, "learning_rate": 0.00013590171625870636, "loss": 0.0113, "step": 422040 }, { "epoch": 1.09, "learning_rate": 0.0001358978280423349, "loss": 0.0149, "step": 422050 }, { "epoch": 1.09, "learning_rate": 0.0001358939398259634, "loss": 0.0113, "step": 422060 }, { "epoch": 1.09, "learning_rate": 0.00013589005160959195, "loss": 0.0162, "step": 422070 }, { "epoch": 1.09, "learning_rate": 0.0001358861633932205, "loss": 0.0132, "step": 422080 }, { "epoch": 1.09, "learning_rate": 0.00013588227517684904, "loss": 0.0106, "step": 422090 }, { "epoch": 1.09, "learning_rate": 0.00013587838696047755, "loss": 0.0094, "step": 422100 }, { "epoch": 1.09, "learning_rate": 0.0001358744987441061, "loss": 0.0141, "step": 422110 }, { "epoch": 1.09, "learning_rate": 0.00013587061052773464, "loss": 0.0109, "step": 422120 }, { "epoch": 1.09, "learning_rate": 0.00013586672231136318, "loss": 0.0126, "step": 422130 }, { "epoch": 1.09, "learning_rate": 0.0001358628340949917, "loss": 0.0124, "step": 422140 }, { "epoch": 1.09, "learning_rate": 0.00013585894587862023, "loss": 0.0116, "step": 422150 }, { "epoch": 1.09, "learning_rate": 0.00013585505766224877, "loss": 0.0092, "step": 422160 }, { "epoch": 1.09, "learning_rate": 0.00013585116944587732, "loss": 0.0088, "step": 422170 }, { "epoch": 1.09, "learning_rate": 0.00013584728122950583, "loss": 0.0134, "step": 422180 }, { "epoch": 1.09, "learning_rate": 0.0001358433930131344, "loss": 0.0127, "step": 422190 }, { "epoch": 1.09, "learning_rate": 0.00013583950479676291, "loss": 0.0114, "step": 422200 }, { "epoch": 1.09, "learning_rate": 0.00013583561658039146, "loss": 0.0095, "step": 422210 }, { "epoch": 1.09, "learning_rate": 0.00013583172836402, "loss": 0.0111, "step": 422220 }, { "epoch": 1.09, "learning_rate": 0.00013582784014764854, "loss": 0.0096, "step": 422230 }, { "epoch": 1.09, "learning_rate": 0.00013582395193127705, "loss": 0.0134, "step": 422240 }, { "epoch": 1.09, "learning_rate": 0.0001358200637149056, "loss": 0.0096, "step": 422250 }, { "epoch": 1.09, "learning_rate": 0.00013581617549853414, "loss": 0.0081, "step": 422260 }, { "epoch": 1.09, "learning_rate": 0.00013581228728216268, "loss": 0.0132, "step": 422270 }, { "epoch": 1.09, "learning_rate": 0.0001358083990657912, "loss": 0.0128, "step": 422280 }, { "epoch": 1.09, "learning_rate": 0.00013580451084941973, "loss": 0.0115, "step": 422290 }, { "epoch": 1.09, "learning_rate": 0.00013580062263304828, "loss": 0.01, "step": 422300 }, { "epoch": 1.09, "learning_rate": 0.0001357967344166768, "loss": 0.0108, "step": 422310 }, { "epoch": 1.09, "learning_rate": 0.00013579284620030533, "loss": 0.0108, "step": 422320 }, { "epoch": 1.09, "learning_rate": 0.00013578895798393387, "loss": 0.0104, "step": 422330 }, { "epoch": 1.09, "learning_rate": 0.00013578506976756242, "loss": 0.0118, "step": 422340 }, { "epoch": 1.09, "learning_rate": 0.00013578118155119093, "loss": 0.0121, "step": 422350 }, { "epoch": 1.09, "learning_rate": 0.0001357772933348195, "loss": 0.0112, "step": 422360 }, { "epoch": 1.09, "learning_rate": 0.00013577340511844801, "loss": 0.0097, "step": 422370 }, { "epoch": 1.09, "learning_rate": 0.00013576951690207656, "loss": 0.0143, "step": 422380 }, { "epoch": 1.09, "learning_rate": 0.0001357656286857051, "loss": 0.0129, "step": 422390 }, { "epoch": 1.09, "learning_rate": 0.00013576174046933364, "loss": 0.0097, "step": 422400 }, { "epoch": 1.09, "learning_rate": 0.00013575785225296215, "loss": 0.0183, "step": 422410 }, { "epoch": 1.09, "learning_rate": 0.0001357539640365907, "loss": 0.0093, "step": 422420 }, { "epoch": 1.09, "learning_rate": 0.00013575007582021924, "loss": 0.0154, "step": 422430 }, { "epoch": 1.1, "learning_rate": 0.00013574618760384778, "loss": 0.0124, "step": 422440 }, { "epoch": 1.1, "learning_rate": 0.0001357422993874763, "loss": 0.0104, "step": 422450 }, { "epoch": 1.1, "learning_rate": 0.00013573841117110483, "loss": 0.0142, "step": 422460 }, { "epoch": 1.1, "learning_rate": 0.00013573452295473338, "loss": 0.009, "step": 422470 }, { "epoch": 1.1, "learning_rate": 0.00013573063473836192, "loss": 0.0098, "step": 422480 }, { "epoch": 1.1, "learning_rate": 0.00013572674652199043, "loss": 0.0116, "step": 422490 }, { "epoch": 1.1, "learning_rate": 0.00013572285830561897, "loss": 0.0114, "step": 422500 }, { "epoch": 1.1, "learning_rate": 0.00013571897008924752, "loss": 0.0112, "step": 422510 }, { "epoch": 1.1, "learning_rate": 0.00013571508187287606, "loss": 0.0108, "step": 422520 }, { "epoch": 1.1, "learning_rate": 0.0001357111936565046, "loss": 0.0147, "step": 422530 }, { "epoch": 1.1, "learning_rate": 0.0001357073054401331, "loss": 0.0148, "step": 422540 }, { "epoch": 1.1, "learning_rate": 0.00013570341722376165, "loss": 0.011, "step": 422550 }, { "epoch": 1.1, "learning_rate": 0.0001356995290073902, "loss": 0.0103, "step": 422560 }, { "epoch": 1.1, "learning_rate": 0.00013569564079101874, "loss": 0.0127, "step": 422570 }, { "epoch": 1.1, "learning_rate": 0.00013569175257464725, "loss": 0.0128, "step": 422580 }, { "epoch": 1.1, "learning_rate": 0.0001356878643582758, "loss": 0.0113, "step": 422590 }, { "epoch": 1.1, "learning_rate": 0.00013568397614190434, "loss": 0.0112, "step": 422600 }, { "epoch": 1.1, "learning_rate": 0.00013568008792553288, "loss": 0.0092, "step": 422610 }, { "epoch": 1.1, "learning_rate": 0.0001356761997091614, "loss": 0.0096, "step": 422620 }, { "epoch": 1.1, "learning_rate": 0.00013567231149278993, "loss": 0.0098, "step": 422630 }, { "epoch": 1.1, "learning_rate": 0.00013566842327641848, "loss": 0.0096, "step": 422640 }, { "epoch": 1.1, "learning_rate": 0.00013566453506004702, "loss": 0.0105, "step": 422650 }, { "epoch": 1.1, "learning_rate": 0.00013566064684367553, "loss": 0.0112, "step": 422660 }, { "epoch": 1.1, "learning_rate": 0.00013565675862730407, "loss": 0.0101, "step": 422670 }, { "epoch": 1.1, "learning_rate": 0.00013565287041093261, "loss": 0.0095, "step": 422680 }, { "epoch": 1.1, "learning_rate": 0.00013564898219456116, "loss": 0.0112, "step": 422690 }, { "epoch": 1.1, "learning_rate": 0.00013564509397818967, "loss": 0.0126, "step": 422700 }, { "epoch": 1.1, "learning_rate": 0.00013564120576181824, "loss": 0.01, "step": 422710 }, { "epoch": 1.1, "learning_rate": 0.00013563731754544675, "loss": 0.0131, "step": 422720 }, { "epoch": 1.1, "learning_rate": 0.0001356334293290753, "loss": 0.0137, "step": 422730 }, { "epoch": 1.1, "learning_rate": 0.00013562954111270384, "loss": 0.0095, "step": 422740 }, { "epoch": 1.1, "learning_rate": 0.00013562565289633238, "loss": 0.0095, "step": 422750 }, { "epoch": 1.1, "learning_rate": 0.0001356217646799609, "loss": 0.0113, "step": 422760 }, { "epoch": 1.1, "learning_rate": 0.00013561787646358944, "loss": 0.0111, "step": 422770 }, { "epoch": 1.1, "learning_rate": 0.00013561398824721798, "loss": 0.0113, "step": 422780 }, { "epoch": 1.1, "learning_rate": 0.0001356101000308465, "loss": 0.0113, "step": 422790 }, { "epoch": 1.1, "learning_rate": 0.00013560621181447503, "loss": 0.0109, "step": 422800 }, { "epoch": 1.1, "learning_rate": 0.00013560232359810357, "loss": 0.01, "step": 422810 }, { "epoch": 1.1, "learning_rate": 0.00013559843538173212, "loss": 0.0142, "step": 422820 }, { "epoch": 1.1, "learning_rate": 0.00013559454716536063, "loss": 0.0166, "step": 422830 }, { "epoch": 1.1, "learning_rate": 0.00013559065894898917, "loss": 0.01, "step": 422840 }, { "epoch": 1.1, "learning_rate": 0.00013558677073261771, "loss": 0.0132, "step": 422850 }, { "epoch": 1.1, "learning_rate": 0.00013558288251624626, "loss": 0.0109, "step": 422860 }, { "epoch": 1.1, "learning_rate": 0.00013557899429987477, "loss": 0.0124, "step": 422870 }, { "epoch": 1.1, "learning_rate": 0.00013557510608350334, "loss": 0.0118, "step": 422880 }, { "epoch": 1.1, "learning_rate": 0.00013557121786713185, "loss": 0.0095, "step": 422890 }, { "epoch": 1.1, "learning_rate": 0.0001355673296507604, "loss": 0.0126, "step": 422900 }, { "epoch": 1.1, "learning_rate": 0.00013556344143438894, "loss": 0.0109, "step": 422910 }, { "epoch": 1.1, "learning_rate": 0.00013555955321801748, "loss": 0.0125, "step": 422920 }, { "epoch": 1.1, "learning_rate": 0.000135555665001646, "loss": 0.0116, "step": 422930 }, { "epoch": 1.1, "learning_rate": 0.00013555177678527453, "loss": 0.01, "step": 422940 }, { "epoch": 1.1, "learning_rate": 0.00013554788856890308, "loss": 0.01, "step": 422950 }, { "epoch": 1.1, "learning_rate": 0.00013554400035253162, "loss": 0.0115, "step": 422960 }, { "epoch": 1.1, "learning_rate": 0.00013554011213616013, "loss": 0.0109, "step": 422970 }, { "epoch": 1.1, "learning_rate": 0.00013553622391978867, "loss": 0.0106, "step": 422980 }, { "epoch": 1.1, "learning_rate": 0.00013553233570341722, "loss": 0.0113, "step": 422990 }, { "epoch": 1.1, "learning_rate": 0.00013552844748704576, "loss": 0.0092, "step": 423000 }, { "epoch": 1.1, "eval_cer": 0.8817054855970361, "eval_loss": 0.007950132712721825, "eval_runtime": 107.536, "eval_samples_per_second": 18.598, "eval_steps_per_second": 4.65, "step": 423000 }, { "epoch": 1.1, "learning_rate": 0.00013552455927067427, "loss": 0.0104, "step": 423010 }, { "epoch": 1.1, "learning_rate": 0.00013552067105430281, "loss": 0.0089, "step": 423020 }, { "epoch": 1.1, "learning_rate": 0.00013551678283793136, "loss": 0.0105, "step": 423030 }, { "epoch": 1.1, "learning_rate": 0.00013551289462155987, "loss": 0.0116, "step": 423040 }, { "epoch": 1.1, "learning_rate": 0.0001355090064051884, "loss": 0.0084, "step": 423050 }, { "epoch": 1.1, "learning_rate": 0.00013550511818881695, "loss": 0.0116, "step": 423060 }, { "epoch": 1.1, "learning_rate": 0.0001355012299724455, "loss": 0.012, "step": 423070 }, { "epoch": 1.1, "learning_rate": 0.00013549734175607404, "loss": 0.0133, "step": 423080 }, { "epoch": 1.1, "learning_rate": 0.00013549345353970258, "loss": 0.0111, "step": 423090 }, { "epoch": 1.1, "learning_rate": 0.0001354895653233311, "loss": 0.0091, "step": 423100 }, { "epoch": 1.1, "learning_rate": 0.00013548567710695963, "loss": 0.0142, "step": 423110 }, { "epoch": 1.1, "learning_rate": 0.00013548178889058818, "loss": 0.0102, "step": 423120 }, { "epoch": 1.1, "learning_rate": 0.00013547790067421672, "loss": 0.0116, "step": 423130 }, { "epoch": 1.1, "learning_rate": 0.00013547401245784523, "loss": 0.0137, "step": 423140 }, { "epoch": 1.1, "learning_rate": 0.00013547012424147377, "loss": 0.0152, "step": 423150 }, { "epoch": 1.1, "learning_rate": 0.00013546623602510232, "loss": 0.0102, "step": 423160 }, { "epoch": 1.1, "learning_rate": 0.00013546234780873086, "loss": 0.0102, "step": 423170 }, { "epoch": 1.1, "learning_rate": 0.00013545845959235937, "loss": 0.0116, "step": 423180 }, { "epoch": 1.1, "learning_rate": 0.0001354545713759879, "loss": 0.0096, "step": 423190 }, { "epoch": 1.1, "learning_rate": 0.00013545068315961645, "loss": 0.0098, "step": 423200 }, { "epoch": 1.1, "learning_rate": 0.000135446794943245, "loss": 0.0115, "step": 423210 }, { "epoch": 1.1, "learning_rate": 0.0001354429067268735, "loss": 0.0112, "step": 423220 }, { "epoch": 1.1, "learning_rate": 0.00013543901851050208, "loss": 0.0104, "step": 423230 }, { "epoch": 1.1, "learning_rate": 0.0001354351302941306, "loss": 0.0092, "step": 423240 }, { "epoch": 1.1, "learning_rate": 0.00013543124207775914, "loss": 0.0097, "step": 423250 }, { "epoch": 1.1, "learning_rate": 0.00013542735386138768, "loss": 0.0135, "step": 423260 }, { "epoch": 1.1, "learning_rate": 0.0001354234656450162, "loss": 0.0107, "step": 423270 }, { "epoch": 1.1, "learning_rate": 0.00013541957742864473, "loss": 0.0084, "step": 423280 }, { "epoch": 1.1, "learning_rate": 0.00013541568921227328, "loss": 0.0094, "step": 423290 }, { "epoch": 1.1, "learning_rate": 0.00013541180099590182, "loss": 0.0132, "step": 423300 }, { "epoch": 1.1, "learning_rate": 0.00013540791277953033, "loss": 0.0111, "step": 423310 }, { "epoch": 1.1, "learning_rate": 0.00013540402456315887, "loss": 0.0154, "step": 423320 }, { "epoch": 1.1, "learning_rate": 0.00013540013634678741, "loss": 0.011, "step": 423330 }, { "epoch": 1.1, "learning_rate": 0.00013539624813041596, "loss": 0.011, "step": 423340 }, { "epoch": 1.1, "learning_rate": 0.00013539235991404447, "loss": 0.0139, "step": 423350 }, { "epoch": 1.1, "learning_rate": 0.000135388471697673, "loss": 0.0133, "step": 423360 }, { "epoch": 1.1, "learning_rate": 0.00013538458348130155, "loss": 0.0131, "step": 423370 }, { "epoch": 1.1, "learning_rate": 0.0001353806952649301, "loss": 0.0077, "step": 423380 }, { "epoch": 1.1, "learning_rate": 0.0001353768070485586, "loss": 0.0126, "step": 423390 }, { "epoch": 1.1, "learning_rate": 0.00013537291883218718, "loss": 0.0077, "step": 423400 }, { "epoch": 1.1, "learning_rate": 0.0001353690306158157, "loss": 0.0101, "step": 423410 }, { "epoch": 1.1, "learning_rate": 0.00013536514239944424, "loss": 0.0099, "step": 423420 }, { "epoch": 1.1, "learning_rate": 0.00013536125418307278, "loss": 0.0103, "step": 423430 }, { "epoch": 1.1, "learning_rate": 0.00013535736596670132, "loss": 0.0125, "step": 423440 }, { "epoch": 1.1, "learning_rate": 0.00013535347775032983, "loss": 0.0092, "step": 423450 }, { "epoch": 1.1, "learning_rate": 0.00013534958953395837, "loss": 0.012, "step": 423460 }, { "epoch": 1.1, "learning_rate": 0.00013534570131758692, "loss": 0.0106, "step": 423470 }, { "epoch": 1.1, "learning_rate": 0.00013534181310121546, "loss": 0.013, "step": 423480 }, { "epoch": 1.1, "learning_rate": 0.00013533792488484397, "loss": 0.0109, "step": 423490 }, { "epoch": 1.1, "learning_rate": 0.00013533403666847251, "loss": 0.0122, "step": 423500 }, { "epoch": 1.1, "learning_rate": 0.00013533014845210106, "loss": 0.0147, "step": 423510 }, { "epoch": 1.1, "learning_rate": 0.00013532626023572957, "loss": 0.0101, "step": 423520 }, { "epoch": 1.1, "learning_rate": 0.0001353223720193581, "loss": 0.0123, "step": 423530 }, { "epoch": 1.1, "learning_rate": 0.00013531848380298665, "loss": 0.0094, "step": 423540 }, { "epoch": 1.1, "learning_rate": 0.0001353145955866152, "loss": 0.0134, "step": 423550 }, { "epoch": 1.1, "learning_rate": 0.0001353107073702437, "loss": 0.0101, "step": 423560 }, { "epoch": 1.1, "learning_rate": 0.00013530681915387225, "loss": 0.0117, "step": 423570 }, { "epoch": 1.1, "learning_rate": 0.0001353029309375008, "loss": 0.0129, "step": 423580 }, { "epoch": 1.1, "learning_rate": 0.00013529904272112933, "loss": 0.0107, "step": 423590 }, { "epoch": 1.1, "learning_rate": 0.00013529515450475788, "loss": 0.0144, "step": 423600 }, { "epoch": 1.1, "learning_rate": 0.00013529126628838642, "loss": 0.0092, "step": 423610 }, { "epoch": 1.1, "learning_rate": 0.00013528737807201493, "loss": 0.01, "step": 423620 }, { "epoch": 1.1, "learning_rate": 0.00013528348985564347, "loss": 0.0089, "step": 423630 }, { "epoch": 1.1, "learning_rate": 0.00013527960163927202, "loss": 0.0146, "step": 423640 }, { "epoch": 1.1, "learning_rate": 0.00013527571342290056, "loss": 0.0142, "step": 423650 }, { "epoch": 1.1, "learning_rate": 0.00013527182520652907, "loss": 0.0144, "step": 423660 }, { "epoch": 1.1, "learning_rate": 0.0001352679369901576, "loss": 0.0122, "step": 423670 }, { "epoch": 1.1, "learning_rate": 0.00013526404877378616, "loss": 0.0082, "step": 423680 }, { "epoch": 1.1, "learning_rate": 0.0001352601605574147, "loss": 0.0111, "step": 423690 }, { "epoch": 1.1, "learning_rate": 0.0001352562723410432, "loss": 0.0112, "step": 423700 }, { "epoch": 1.1, "learning_rate": 0.00013525238412467175, "loss": 0.014, "step": 423710 }, { "epoch": 1.1, "learning_rate": 0.0001352484959083003, "loss": 0.0098, "step": 423720 }, { "epoch": 1.1, "learning_rate": 0.00013524460769192884, "loss": 0.0112, "step": 423730 }, { "epoch": 1.1, "learning_rate": 0.00013524071947555735, "loss": 0.0092, "step": 423740 }, { "epoch": 1.1, "learning_rate": 0.00013523683125918592, "loss": 0.0144, "step": 423750 }, { "epoch": 1.1, "learning_rate": 0.00013523294304281443, "loss": 0.0126, "step": 423760 }, { "epoch": 1.1, "learning_rate": 0.00013522905482644295, "loss": 0.0083, "step": 423770 }, { "epoch": 1.1, "learning_rate": 0.00013522516661007152, "loss": 0.0125, "step": 423780 }, { "epoch": 1.1, "learning_rate": 0.00013522127839370003, "loss": 0.0141, "step": 423790 }, { "epoch": 1.1, "learning_rate": 0.00013521739017732857, "loss": 0.0122, "step": 423800 }, { "epoch": 1.1, "learning_rate": 0.00013521350196095712, "loss": 0.0114, "step": 423810 }, { "epoch": 1.1, "learning_rate": 0.00013520961374458566, "loss": 0.0129, "step": 423820 }, { "epoch": 1.1, "learning_rate": 0.00013520572552821417, "loss": 0.0092, "step": 423830 }, { "epoch": 1.1, "learning_rate": 0.0001352018373118427, "loss": 0.01, "step": 423840 }, { "epoch": 1.1, "learning_rate": 0.00013519794909547125, "loss": 0.0079, "step": 423850 }, { "epoch": 1.1, "learning_rate": 0.0001351940608790998, "loss": 0.0105, "step": 423860 }, { "epoch": 1.1, "learning_rate": 0.0001351901726627283, "loss": 0.013, "step": 423870 }, { "epoch": 1.1, "learning_rate": 0.00013518628444635685, "loss": 0.0121, "step": 423880 }, { "epoch": 1.1, "learning_rate": 0.0001351823962299854, "loss": 0.0118, "step": 423890 }, { "epoch": 1.1, "learning_rate": 0.00013517850801361394, "loss": 0.0114, "step": 423900 }, { "epoch": 1.1, "learning_rate": 0.00013517461979724245, "loss": 0.0119, "step": 423910 }, { "epoch": 1.1, "learning_rate": 0.00013517073158087102, "loss": 0.0144, "step": 423920 }, { "epoch": 1.1, "learning_rate": 0.00013516684336449953, "loss": 0.0137, "step": 423930 }, { "epoch": 1.1, "learning_rate": 0.00013516295514812808, "loss": 0.0137, "step": 423940 }, { "epoch": 1.1, "learning_rate": 0.00013515906693175662, "loss": 0.0109, "step": 423950 }, { "epoch": 1.1, "learning_rate": 0.00013515517871538516, "loss": 0.0091, "step": 423960 }, { "epoch": 1.1, "learning_rate": 0.00013515129049901367, "loss": 0.0111, "step": 423970 }, { "epoch": 1.1, "learning_rate": 0.00013514740228264221, "loss": 0.0134, "step": 423980 }, { "epoch": 1.1, "learning_rate": 0.00013514351406627076, "loss": 0.0105, "step": 423990 }, { "epoch": 1.1, "learning_rate": 0.0001351396258498993, "loss": 0.0127, "step": 424000 }, { "epoch": 1.1, "eval_cer": 0.8817026863231677, "eval_loss": 0.007645982783287764, "eval_runtime": 107.6093, "eval_samples_per_second": 18.586, "eval_steps_per_second": 4.646, "step": 424000 }, { "epoch": 1.1, "learning_rate": 0.0001351357376335278, "loss": 0.0093, "step": 424010 }, { "epoch": 1.1, "learning_rate": 0.00013513184941715635, "loss": 0.0107, "step": 424020 }, { "epoch": 1.1, "learning_rate": 0.0001351279612007849, "loss": 0.0145, "step": 424030 }, { "epoch": 1.1, "learning_rate": 0.0001351240729844134, "loss": 0.0112, "step": 424040 }, { "epoch": 1.1, "learning_rate": 0.00013512018476804195, "loss": 0.0108, "step": 424050 }, { "epoch": 1.1, "learning_rate": 0.0001351162965516705, "loss": 0.0096, "step": 424060 }, { "epoch": 1.1, "learning_rate": 0.00013511240833529904, "loss": 0.0136, "step": 424070 }, { "epoch": 1.1, "learning_rate": 0.00013510852011892755, "loss": 0.0087, "step": 424080 }, { "epoch": 1.1, "learning_rate": 0.0001351046319025561, "loss": 0.0102, "step": 424090 }, { "epoch": 1.1, "learning_rate": 0.00013510074368618463, "loss": 0.0164, "step": 424100 }, { "epoch": 1.1, "learning_rate": 0.00013509685546981317, "loss": 0.0145, "step": 424110 }, { "epoch": 1.1, "learning_rate": 0.00013509296725344172, "loss": 0.0113, "step": 424120 }, { "epoch": 1.1, "learning_rate": 0.00013508907903707026, "loss": 0.011, "step": 424130 }, { "epoch": 1.1, "learning_rate": 0.00013508519082069877, "loss": 0.0113, "step": 424140 }, { "epoch": 1.1, "learning_rate": 0.00013508130260432731, "loss": 0.0121, "step": 424150 }, { "epoch": 1.1, "learning_rate": 0.00013507741438795586, "loss": 0.0123, "step": 424160 }, { "epoch": 1.1, "learning_rate": 0.0001350735261715844, "loss": 0.0094, "step": 424170 }, { "epoch": 1.1, "learning_rate": 0.0001350696379552129, "loss": 0.0125, "step": 424180 }, { "epoch": 1.1, "learning_rate": 0.00013506574973884145, "loss": 0.0121, "step": 424190 }, { "epoch": 1.1, "learning_rate": 0.00013506186152247, "loss": 0.0111, "step": 424200 }, { "epoch": 1.1, "learning_rate": 0.00013505797330609854, "loss": 0.0129, "step": 424210 }, { "epoch": 1.1, "learning_rate": 0.00013505408508972705, "loss": 0.0124, "step": 424220 }, { "epoch": 1.1, "learning_rate": 0.0001350501968733556, "loss": 0.013, "step": 424230 }, { "epoch": 1.1, "learning_rate": 0.00013504630865698413, "loss": 0.018, "step": 424240 }, { "epoch": 1.1, "learning_rate": 0.00013504242044061268, "loss": 0.0087, "step": 424250 }, { "epoch": 1.1, "learning_rate": 0.0001350385322242412, "loss": 0.0085, "step": 424260 }, { "epoch": 1.1, "learning_rate": 0.00013503464400786973, "loss": 0.0092, "step": 424270 }, { "epoch": 1.1, "learning_rate": 0.00013503075579149827, "loss": 0.0099, "step": 424280 }, { "epoch": 1.1, "learning_rate": 0.0001350268675751268, "loss": 0.0129, "step": 424290 }, { "epoch": 1.1, "learning_rate": 0.00013502297935875536, "loss": 0.0123, "step": 424300 }, { "epoch": 1.1, "learning_rate": 0.00013501909114238387, "loss": 0.0112, "step": 424310 }, { "epoch": 1.1, "learning_rate": 0.0001350152029260124, "loss": 0.0093, "step": 424320 }, { "epoch": 1.1, "learning_rate": 0.00013501131470964096, "loss": 0.0092, "step": 424330 }, { "epoch": 1.1, "learning_rate": 0.0001350074264932695, "loss": 0.0123, "step": 424340 }, { "epoch": 1.1, "learning_rate": 0.000135003538276898, "loss": 0.012, "step": 424350 }, { "epoch": 1.1, "learning_rate": 0.00013499965006052655, "loss": 0.0111, "step": 424360 }, { "epoch": 1.1, "learning_rate": 0.0001349957618441551, "loss": 0.0119, "step": 424370 }, { "epoch": 1.1, "learning_rate": 0.00013499187362778364, "loss": 0.0127, "step": 424380 }, { "epoch": 1.1, "learning_rate": 0.00013498798541141215, "loss": 0.0103, "step": 424390 }, { "epoch": 1.1, "learning_rate": 0.0001349840971950407, "loss": 0.011, "step": 424400 }, { "epoch": 1.1, "learning_rate": 0.00013498020897866923, "loss": 0.0115, "step": 424410 }, { "epoch": 1.1, "learning_rate": 0.00013497632076229778, "loss": 0.0107, "step": 424420 }, { "epoch": 1.1, "learning_rate": 0.0001349724325459263, "loss": 0.013, "step": 424430 }, { "epoch": 1.1, "learning_rate": 0.00013496854432955483, "loss": 0.0129, "step": 424440 }, { "epoch": 1.1, "learning_rate": 0.00013496465611318337, "loss": 0.0094, "step": 424450 }, { "epoch": 1.1, "learning_rate": 0.00013496076789681192, "loss": 0.0113, "step": 424460 }, { "epoch": 1.1, "learning_rate": 0.00013495687968044046, "loss": 0.0093, "step": 424470 }, { "epoch": 1.1, "learning_rate": 0.000134952991464069, "loss": 0.0094, "step": 424480 }, { "epoch": 1.1, "learning_rate": 0.0001349491032476975, "loss": 0.0106, "step": 424490 }, { "epoch": 1.1, "learning_rate": 0.00013494521503132605, "loss": 0.0098, "step": 424500 }, { "epoch": 1.1, "learning_rate": 0.0001349413268149546, "loss": 0.0104, "step": 424510 }, { "epoch": 1.1, "learning_rate": 0.0001349374385985831, "loss": 0.0105, "step": 424520 }, { "epoch": 1.1, "learning_rate": 0.00013493355038221165, "loss": 0.0102, "step": 424530 }, { "epoch": 1.1, "learning_rate": 0.0001349296621658402, "loss": 0.0142, "step": 424540 }, { "epoch": 1.1, "learning_rate": 0.00013492577394946874, "loss": 0.0098, "step": 424550 }, { "epoch": 1.1, "learning_rate": 0.00013492188573309725, "loss": 0.0142, "step": 424560 }, { "epoch": 1.1, "learning_rate": 0.0001349179975167258, "loss": 0.0088, "step": 424570 }, { "epoch": 1.1, "learning_rate": 0.00013491410930035433, "loss": 0.0119, "step": 424580 }, { "epoch": 1.1, "learning_rate": 0.00013491022108398287, "loss": 0.0126, "step": 424590 }, { "epoch": 1.1, "learning_rate": 0.0001349063328676114, "loss": 0.0084, "step": 424600 }, { "epoch": 1.1, "learning_rate": 0.00013490244465123993, "loss": 0.0092, "step": 424610 }, { "epoch": 1.1, "learning_rate": 0.00013489855643486847, "loss": 0.0114, "step": 424620 }, { "epoch": 1.1, "learning_rate": 0.00013489466821849701, "loss": 0.0101, "step": 424630 }, { "epoch": 1.1, "learning_rate": 0.00013489078000212553, "loss": 0.0098, "step": 424640 }, { "epoch": 1.1, "learning_rate": 0.0001348868917857541, "loss": 0.0105, "step": 424650 }, { "epoch": 1.1, "learning_rate": 0.0001348830035693826, "loss": 0.0094, "step": 424660 }, { "epoch": 1.1, "learning_rate": 0.00013487911535301115, "loss": 0.0091, "step": 424670 }, { "epoch": 1.1, "learning_rate": 0.0001348752271366397, "loss": 0.0117, "step": 424680 }, { "epoch": 1.1, "learning_rate": 0.00013487133892026824, "loss": 0.0085, "step": 424690 }, { "epoch": 1.1, "learning_rate": 0.00013486745070389675, "loss": 0.0096, "step": 424700 }, { "epoch": 1.1, "learning_rate": 0.0001348635624875253, "loss": 0.0092, "step": 424710 }, { "epoch": 1.1, "learning_rate": 0.00013485967427115383, "loss": 0.0135, "step": 424720 }, { "epoch": 1.1, "learning_rate": 0.00013485578605478238, "loss": 0.0113, "step": 424730 }, { "epoch": 1.1, "learning_rate": 0.0001348518978384109, "loss": 0.0111, "step": 424740 }, { "epoch": 1.1, "learning_rate": 0.00013484800962203943, "loss": 0.0101, "step": 424750 }, { "epoch": 1.1, "learning_rate": 0.00013484412140566797, "loss": 0.0111, "step": 424760 }, { "epoch": 1.1, "learning_rate": 0.0001348402331892965, "loss": 0.008, "step": 424770 }, { "epoch": 1.1, "learning_rate": 0.00013483634497292503, "loss": 0.0074, "step": 424780 }, { "epoch": 1.1, "learning_rate": 0.00013483245675655357, "loss": 0.0113, "step": 424790 }, { "epoch": 1.1, "learning_rate": 0.00013482856854018211, "loss": 0.0114, "step": 424800 }, { "epoch": 1.1, "learning_rate": 0.00013482468032381063, "loss": 0.0102, "step": 424810 }, { "epoch": 1.1, "learning_rate": 0.0001348207921074392, "loss": 0.0133, "step": 424820 }, { "epoch": 1.1, "learning_rate": 0.0001348169038910677, "loss": 0.009, "step": 424830 }, { "epoch": 1.1, "learning_rate": 0.00013481301567469625, "loss": 0.0101, "step": 424840 }, { "epoch": 1.1, "learning_rate": 0.0001348091274583248, "loss": 0.0105, "step": 424850 }, { "epoch": 1.1, "learning_rate": 0.00013480523924195334, "loss": 0.0143, "step": 424860 }, { "epoch": 1.1, "learning_rate": 0.00013480135102558185, "loss": 0.0113, "step": 424870 }, { "epoch": 1.1, "learning_rate": 0.0001347974628092104, "loss": 0.0131, "step": 424880 }, { "epoch": 1.1, "learning_rate": 0.00013479357459283893, "loss": 0.0131, "step": 424890 }, { "epoch": 1.1, "learning_rate": 0.00013478968637646748, "loss": 0.0123, "step": 424900 }, { "epoch": 1.1, "learning_rate": 0.000134785798160096, "loss": 0.012, "step": 424910 }, { "epoch": 1.1, "learning_rate": 0.00013478190994372453, "loss": 0.0137, "step": 424920 }, { "epoch": 1.1, "learning_rate": 0.00013477802172735307, "loss": 0.0111, "step": 424930 }, { "epoch": 1.1, "learning_rate": 0.00013477413351098162, "loss": 0.0145, "step": 424940 }, { "epoch": 1.1, "learning_rate": 0.00013477024529461013, "loss": 0.0105, "step": 424950 }, { "epoch": 1.1, "learning_rate": 0.00013476635707823867, "loss": 0.0157, "step": 424960 }, { "epoch": 1.1, "learning_rate": 0.0001347624688618672, "loss": 0.0083, "step": 424970 }, { "epoch": 1.1, "learning_rate": 0.00013475858064549575, "loss": 0.0094, "step": 424980 }, { "epoch": 1.1, "learning_rate": 0.0001347546924291243, "loss": 0.0105, "step": 424990 }, { "epoch": 1.1, "learning_rate": 0.00013475080421275284, "loss": 0.0111, "step": 425000 }, { "epoch": 1.1, "eval_cer": 0.8817292794249172, "eval_loss": 0.007522050756961107, "eval_runtime": 107.5853, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.647, "step": 425000 }, { "epoch": 1.1, "learning_rate": 0.00013474691599638135, "loss": 0.0102, "step": 425010 }, { "epoch": 1.1, "learning_rate": 0.0001347430277800099, "loss": 0.0075, "step": 425020 }, { "epoch": 1.1, "learning_rate": 0.00013473913956363844, "loss": 0.0116, "step": 425030 }, { "epoch": 1.1, "learning_rate": 0.00013473525134726695, "loss": 0.0116, "step": 425040 }, { "epoch": 1.1, "learning_rate": 0.0001347313631308955, "loss": 0.0105, "step": 425050 }, { "epoch": 1.1, "learning_rate": 0.00013472747491452403, "loss": 0.0097, "step": 425060 }, { "epoch": 1.1, "learning_rate": 0.00013472358669815258, "loss": 0.0106, "step": 425070 }, { "epoch": 1.1, "learning_rate": 0.0001347196984817811, "loss": 0.0115, "step": 425080 }, { "epoch": 1.1, "learning_rate": 0.00013471581026540963, "loss": 0.0089, "step": 425090 }, { "epoch": 1.1, "learning_rate": 0.00013471192204903817, "loss": 0.0121, "step": 425100 }, { "epoch": 1.1, "learning_rate": 0.00013470803383266671, "loss": 0.0117, "step": 425110 }, { "epoch": 1.1, "learning_rate": 0.00013470414561629523, "loss": 0.0117, "step": 425120 }, { "epoch": 1.1, "learning_rate": 0.00013470025739992377, "loss": 0.0109, "step": 425130 }, { "epoch": 1.1, "learning_rate": 0.0001346963691835523, "loss": 0.0134, "step": 425140 }, { "epoch": 1.1, "learning_rate": 0.00013469248096718085, "loss": 0.0124, "step": 425150 }, { "epoch": 1.1, "learning_rate": 0.00013468859275080937, "loss": 0.012, "step": 425160 }, { "epoch": 1.1, "learning_rate": 0.00013468470453443794, "loss": 0.0103, "step": 425170 }, { "epoch": 1.1, "learning_rate": 0.00013468081631806645, "loss": 0.0102, "step": 425180 }, { "epoch": 1.1, "learning_rate": 0.000134676928101695, "loss": 0.0112, "step": 425190 }, { "epoch": 1.1, "learning_rate": 0.00013467303988532354, "loss": 0.0091, "step": 425200 }, { "epoch": 1.1, "learning_rate": 0.00013466915166895208, "loss": 0.0111, "step": 425210 }, { "epoch": 1.1, "learning_rate": 0.0001346652634525806, "loss": 0.0105, "step": 425220 }, { "epoch": 1.1, "learning_rate": 0.00013466137523620913, "loss": 0.0122, "step": 425230 }, { "epoch": 1.1, "learning_rate": 0.00013465748701983767, "loss": 0.0147, "step": 425240 }, { "epoch": 1.1, "learning_rate": 0.00013465359880346622, "loss": 0.0101, "step": 425250 }, { "epoch": 1.1, "learning_rate": 0.00013464971058709473, "loss": 0.0099, "step": 425260 }, { "epoch": 1.1, "learning_rate": 0.00013464582237072327, "loss": 0.0137, "step": 425270 }, { "epoch": 1.1, "learning_rate": 0.00013464193415435181, "loss": 0.0115, "step": 425280 }, { "epoch": 1.1, "learning_rate": 0.00013463804593798033, "loss": 0.0119, "step": 425290 }, { "epoch": 1.1, "learning_rate": 0.00013463415772160887, "loss": 0.011, "step": 425300 }, { "epoch": 1.1, "learning_rate": 0.0001346302695052374, "loss": 0.0114, "step": 425310 }, { "epoch": 1.1, "learning_rate": 0.00013462638128886595, "loss": 0.0097, "step": 425320 }, { "epoch": 1.1, "learning_rate": 0.00013462249307249447, "loss": 0.0113, "step": 425330 }, { "epoch": 1.1, "learning_rate": 0.00013461860485612304, "loss": 0.0113, "step": 425340 }, { "epoch": 1.1, "learning_rate": 0.00013461471663975155, "loss": 0.0112, "step": 425350 }, { "epoch": 1.1, "learning_rate": 0.0001346108284233801, "loss": 0.0128, "step": 425360 }, { "epoch": 1.1, "learning_rate": 0.00013460694020700863, "loss": 0.0114, "step": 425370 }, { "epoch": 1.1, "learning_rate": 0.00013460305199063718, "loss": 0.0106, "step": 425380 }, { "epoch": 1.1, "learning_rate": 0.0001345991637742657, "loss": 0.0103, "step": 425390 }, { "epoch": 1.1, "learning_rate": 0.00013459527555789423, "loss": 0.0095, "step": 425400 }, { "epoch": 1.1, "learning_rate": 0.00013459138734152277, "loss": 0.0111, "step": 425410 }, { "epoch": 1.1, "learning_rate": 0.00013458749912515132, "loss": 0.0109, "step": 425420 }, { "epoch": 1.1, "learning_rate": 0.00013458361090877983, "loss": 0.0119, "step": 425430 }, { "epoch": 1.1, "learning_rate": 0.00013457972269240837, "loss": 0.0106, "step": 425440 }, { "epoch": 1.1, "learning_rate": 0.00013457583447603691, "loss": 0.0164, "step": 425450 }, { "epoch": 1.1, "learning_rate": 0.00013457194625966546, "loss": 0.0108, "step": 425460 }, { "epoch": 1.1, "learning_rate": 0.00013456805804329397, "loss": 0.0121, "step": 425470 }, { "epoch": 1.1, "learning_rate": 0.0001345641698269225, "loss": 0.0179, "step": 425480 }, { "epoch": 1.1, "learning_rate": 0.00013456028161055105, "loss": 0.01, "step": 425490 }, { "epoch": 1.1, "learning_rate": 0.0001345563933941796, "loss": 0.0112, "step": 425500 }, { "epoch": 1.1, "learning_rate": 0.00013455250517780814, "loss": 0.0107, "step": 425510 }, { "epoch": 1.1, "learning_rate": 0.00013454861696143665, "loss": 0.0124, "step": 425520 }, { "epoch": 1.1, "learning_rate": 0.0001345447287450652, "loss": 0.012, "step": 425530 }, { "epoch": 1.1, "learning_rate": 0.00013454084052869373, "loss": 0.0106, "step": 425540 }, { "epoch": 1.1, "learning_rate": 0.00013453695231232228, "loss": 0.0109, "step": 425550 }, { "epoch": 1.1, "learning_rate": 0.0001345330640959508, "loss": 0.0087, "step": 425560 }, { "epoch": 1.1, "learning_rate": 0.00013452917587957933, "loss": 0.0095, "step": 425570 }, { "epoch": 1.1, "learning_rate": 0.00013452528766320787, "loss": 0.0125, "step": 425580 }, { "epoch": 1.1, "learning_rate": 0.00013452139944683642, "loss": 0.0091, "step": 425590 }, { "epoch": 1.1, "learning_rate": 0.00013451751123046493, "loss": 0.0138, "step": 425600 }, { "epoch": 1.1, "learning_rate": 0.00013451362301409347, "loss": 0.0132, "step": 425610 }, { "epoch": 1.1, "learning_rate": 0.000134509734797722, "loss": 0.0207, "step": 425620 }, { "epoch": 1.1, "learning_rate": 0.00013450584658135055, "loss": 0.0106, "step": 425630 }, { "epoch": 1.1, "learning_rate": 0.00013450195836497907, "loss": 0.0119, "step": 425640 }, { "epoch": 1.1, "learning_rate": 0.0001344980701486076, "loss": 0.0146, "step": 425650 }, { "epoch": 1.1, "learning_rate": 0.00013449418193223615, "loss": 0.0158, "step": 425660 }, { "epoch": 1.1, "learning_rate": 0.0001344902937158647, "loss": 0.0111, "step": 425670 }, { "epoch": 1.1, "learning_rate": 0.0001344864054994932, "loss": 0.0094, "step": 425680 }, { "epoch": 1.1, "learning_rate": 0.00013448251728312178, "loss": 0.0098, "step": 425690 }, { "epoch": 1.1, "learning_rate": 0.0001344786290667503, "loss": 0.0112, "step": 425700 }, { "epoch": 1.1, "learning_rate": 0.00013447474085037883, "loss": 0.0102, "step": 425710 }, { "epoch": 1.1, "learning_rate": 0.00013447085263400738, "loss": 0.0146, "step": 425720 }, { "epoch": 1.1, "learning_rate": 0.00013446696441763592, "loss": 0.0103, "step": 425730 }, { "epoch": 1.1, "learning_rate": 0.00013446307620126443, "loss": 0.0112, "step": 425740 }, { "epoch": 1.1, "learning_rate": 0.00013445918798489297, "loss": 0.012, "step": 425750 }, { "epoch": 1.1, "learning_rate": 0.00013445529976852151, "loss": 0.0109, "step": 425760 }, { "epoch": 1.1, "learning_rate": 0.00013445141155215003, "loss": 0.0128, "step": 425770 }, { "epoch": 1.1, "learning_rate": 0.00013444752333577857, "loss": 0.0125, "step": 425780 }, { "epoch": 1.1, "learning_rate": 0.0001344436351194071, "loss": 0.0101, "step": 425790 }, { "epoch": 1.1, "learning_rate": 0.00013443974690303565, "loss": 0.0091, "step": 425800 }, { "epoch": 1.1, "learning_rate": 0.00013443585868666417, "loss": 0.0104, "step": 425810 }, { "epoch": 1.1, "learning_rate": 0.0001344319704702927, "loss": 0.0149, "step": 425820 }, { "epoch": 1.1, "learning_rate": 0.00013442808225392125, "loss": 0.0106, "step": 425830 }, { "epoch": 1.1, "learning_rate": 0.0001344241940375498, "loss": 0.0111, "step": 425840 }, { "epoch": 1.1, "learning_rate": 0.0001344203058211783, "loss": 0.0111, "step": 425850 }, { "epoch": 1.1, "learning_rate": 0.00013441641760480688, "loss": 0.0097, "step": 425860 }, { "epoch": 1.1, "learning_rate": 0.0001344125293884354, "loss": 0.0087, "step": 425870 }, { "epoch": 1.1, "learning_rate": 0.00013440864117206393, "loss": 0.0106, "step": 425880 }, { "epoch": 1.1, "learning_rate": 0.00013440475295569247, "loss": 0.0099, "step": 425890 }, { "epoch": 1.1, "learning_rate": 0.00013440086473932102, "loss": 0.0136, "step": 425900 }, { "epoch": 1.1, "learning_rate": 0.00013439697652294953, "loss": 0.0106, "step": 425910 }, { "epoch": 1.1, "learning_rate": 0.00013439308830657807, "loss": 0.0117, "step": 425920 }, { "epoch": 1.1, "learning_rate": 0.00013438920009020661, "loss": 0.011, "step": 425930 }, { "epoch": 1.1, "learning_rate": 0.00013438531187383516, "loss": 0.0112, "step": 425940 }, { "epoch": 1.1, "learning_rate": 0.00013438142365746367, "loss": 0.0099, "step": 425950 }, { "epoch": 1.1, "learning_rate": 0.0001343775354410922, "loss": 0.0111, "step": 425960 }, { "epoch": 1.1, "learning_rate": 0.00013437364722472075, "loss": 0.0096, "step": 425970 }, { "epoch": 1.1, "learning_rate": 0.0001343697590083493, "loss": 0.0128, "step": 425980 }, { "epoch": 1.1, "learning_rate": 0.0001343658707919778, "loss": 0.0134, "step": 425990 }, { "epoch": 1.1, "learning_rate": 0.00013436198257560635, "loss": 0.0125, "step": 426000 }, { "epoch": 1.1, "eval_cer": 0.8816802921322209, "eval_loss": 0.007685732562094927, "eval_runtime": 107.9705, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 426000 }, { "epoch": 1.1, "learning_rate": 0.0001343580943592349, "loss": 0.009, "step": 426010 }, { "epoch": 1.1, "learning_rate": 0.0001343542061428634, "loss": 0.0102, "step": 426020 }, { "epoch": 1.1, "learning_rate": 0.00013435031792649195, "loss": 0.0105, "step": 426030 }, { "epoch": 1.1, "learning_rate": 0.0001343464297101205, "loss": 0.0089, "step": 426040 }, { "epoch": 1.1, "learning_rate": 0.00013434254149374903, "loss": 0.0133, "step": 426050 }, { "epoch": 1.1, "learning_rate": 0.00013433865327737757, "loss": 0.0111, "step": 426060 }, { "epoch": 1.1, "learning_rate": 0.00013433476506100612, "loss": 0.0095, "step": 426070 }, { "epoch": 1.1, "learning_rate": 0.00013433087684463463, "loss": 0.0142, "step": 426080 }, { "epoch": 1.1, "learning_rate": 0.00013432698862826317, "loss": 0.0077, "step": 426090 }, { "epoch": 1.1, "learning_rate": 0.00013432310041189171, "loss": 0.0102, "step": 426100 }, { "epoch": 1.1, "learning_rate": 0.00013431921219552026, "loss": 0.0079, "step": 426110 }, { "epoch": 1.1, "learning_rate": 0.00013431532397914877, "loss": 0.0128, "step": 426120 }, { "epoch": 1.1, "learning_rate": 0.0001343114357627773, "loss": 0.0141, "step": 426130 }, { "epoch": 1.1, "learning_rate": 0.00013430754754640585, "loss": 0.0148, "step": 426140 }, { "epoch": 1.1, "learning_rate": 0.0001343036593300344, "loss": 0.0076, "step": 426150 }, { "epoch": 1.1, "learning_rate": 0.0001342997711136629, "loss": 0.0092, "step": 426160 }, { "epoch": 1.1, "learning_rate": 0.00013429588289729145, "loss": 0.0122, "step": 426170 }, { "epoch": 1.1, "learning_rate": 0.00013429199468092, "loss": 0.0154, "step": 426180 }, { "epoch": 1.1, "learning_rate": 0.00013428810646454853, "loss": 0.0121, "step": 426190 }, { "epoch": 1.1, "learning_rate": 0.00013428421824817705, "loss": 0.0095, "step": 426200 }, { "epoch": 1.1, "learning_rate": 0.00013428033003180562, "loss": 0.0119, "step": 426210 }, { "epoch": 1.1, "learning_rate": 0.00013427644181543413, "loss": 0.0135, "step": 426220 }, { "epoch": 1.1, "learning_rate": 0.00013427255359906267, "loss": 0.0099, "step": 426230 }, { "epoch": 1.1, "learning_rate": 0.00013426866538269122, "loss": 0.011, "step": 426240 }, { "epoch": 1.1, "learning_rate": 0.00013426477716631973, "loss": 0.0129, "step": 426250 }, { "epoch": 1.1, "learning_rate": 0.00013426088894994827, "loss": 0.0117, "step": 426260 }, { "epoch": 1.1, "learning_rate": 0.0001342570007335768, "loss": 0.0156, "step": 426270 }, { "epoch": 1.1, "learning_rate": 0.00013425311251720535, "loss": 0.0117, "step": 426280 }, { "epoch": 1.11, "learning_rate": 0.00013424922430083387, "loss": 0.0125, "step": 426290 }, { "epoch": 1.11, "learning_rate": 0.0001342453360844624, "loss": 0.0122, "step": 426300 }, { "epoch": 1.11, "learning_rate": 0.00013424144786809095, "loss": 0.0155, "step": 426310 }, { "epoch": 1.11, "learning_rate": 0.0001342375596517195, "loss": 0.0169, "step": 426320 }, { "epoch": 1.11, "learning_rate": 0.000134233671435348, "loss": 0.0137, "step": 426330 }, { "epoch": 1.11, "learning_rate": 0.00013422978321897655, "loss": 0.0092, "step": 426340 }, { "epoch": 1.11, "learning_rate": 0.0001342258950026051, "loss": 0.0126, "step": 426350 }, { "epoch": 1.11, "learning_rate": 0.00013422200678623363, "loss": 0.0127, "step": 426360 }, { "epoch": 1.11, "learning_rate": 0.00013421811856986215, "loss": 0.0112, "step": 426370 }, { "epoch": 1.11, "learning_rate": 0.00013421423035349072, "loss": 0.0139, "step": 426380 }, { "epoch": 1.11, "learning_rate": 0.00013421034213711923, "loss": 0.0098, "step": 426390 }, { "epoch": 1.11, "learning_rate": 0.00013420645392074777, "loss": 0.0106, "step": 426400 }, { "epoch": 1.11, "learning_rate": 0.00013420256570437631, "loss": 0.011, "step": 426410 }, { "epoch": 1.11, "learning_rate": 0.00013419867748800486, "loss": 0.0104, "step": 426420 }, { "epoch": 1.11, "learning_rate": 0.00013419478927163337, "loss": 0.0128, "step": 426430 }, { "epoch": 1.11, "learning_rate": 0.0001341909010552619, "loss": 0.0111, "step": 426440 }, { "epoch": 1.11, "learning_rate": 0.00013418701283889045, "loss": 0.0156, "step": 426450 }, { "epoch": 1.11, "learning_rate": 0.000134183124622519, "loss": 0.0098, "step": 426460 }, { "epoch": 1.11, "learning_rate": 0.0001341792364061475, "loss": 0.0107, "step": 426470 }, { "epoch": 1.11, "learning_rate": 0.00013417534818977605, "loss": 0.0101, "step": 426480 }, { "epoch": 1.11, "learning_rate": 0.0001341714599734046, "loss": 0.0128, "step": 426490 }, { "epoch": 1.11, "learning_rate": 0.0001341675717570331, "loss": 0.0122, "step": 426500 }, { "epoch": 1.11, "learning_rate": 0.00013416368354066165, "loss": 0.0094, "step": 426510 }, { "epoch": 1.11, "learning_rate": 0.0001341597953242902, "loss": 0.0121, "step": 426520 }, { "epoch": 1.11, "learning_rate": 0.00013415590710791873, "loss": 0.0123, "step": 426530 }, { "epoch": 1.11, "learning_rate": 0.00013415201889154725, "loss": 0.0129, "step": 426540 }, { "epoch": 1.11, "learning_rate": 0.0001341481306751758, "loss": 0.0124, "step": 426550 }, { "epoch": 1.11, "learning_rate": 0.00013414424245880433, "loss": 0.0091, "step": 426560 }, { "epoch": 1.11, "learning_rate": 0.00013414035424243287, "loss": 0.0151, "step": 426570 }, { "epoch": 1.11, "learning_rate": 0.00013413646602606141, "loss": 0.0147, "step": 426580 }, { "epoch": 1.11, "learning_rate": 0.00013413257780968996, "loss": 0.0104, "step": 426590 }, { "epoch": 1.11, "learning_rate": 0.00013412868959331847, "loss": 0.0104, "step": 426600 }, { "epoch": 1.11, "learning_rate": 0.000134124801376947, "loss": 0.0089, "step": 426610 }, { "epoch": 1.11, "learning_rate": 0.00013412091316057555, "loss": 0.0141, "step": 426620 }, { "epoch": 1.11, "learning_rate": 0.0001341170249442041, "loss": 0.0096, "step": 426630 }, { "epoch": 1.11, "learning_rate": 0.0001341131367278326, "loss": 0.0108, "step": 426640 }, { "epoch": 1.11, "learning_rate": 0.00013410924851146115, "loss": 0.0103, "step": 426650 }, { "epoch": 1.11, "learning_rate": 0.0001341053602950897, "loss": 0.0132, "step": 426660 }, { "epoch": 1.11, "learning_rate": 0.00013410147207871823, "loss": 0.0118, "step": 426670 }, { "epoch": 1.11, "learning_rate": 0.00013409758386234675, "loss": 0.0111, "step": 426680 }, { "epoch": 1.11, "learning_rate": 0.0001340936956459753, "loss": 0.0093, "step": 426690 }, { "epoch": 1.11, "learning_rate": 0.00013408980742960383, "loss": 0.0126, "step": 426700 }, { "epoch": 1.11, "learning_rate": 0.00013408591921323237, "loss": 0.0091, "step": 426710 }, { "epoch": 1.11, "learning_rate": 0.0001340820309968609, "loss": 0.0073, "step": 426720 }, { "epoch": 1.11, "learning_rate": 0.00013407814278048946, "loss": 0.0079, "step": 426730 }, { "epoch": 1.11, "learning_rate": 0.00013407425456411797, "loss": 0.012, "step": 426740 }, { "epoch": 1.11, "learning_rate": 0.00013407036634774649, "loss": 0.0106, "step": 426750 }, { "epoch": 1.11, "learning_rate": 0.00013406647813137506, "loss": 0.0113, "step": 426760 }, { "epoch": 1.11, "learning_rate": 0.00013406258991500357, "loss": 0.0109, "step": 426770 }, { "epoch": 1.11, "learning_rate": 0.0001340587016986321, "loss": 0.0131, "step": 426780 }, { "epoch": 1.11, "learning_rate": 0.00013405481348226065, "loss": 0.0136, "step": 426790 }, { "epoch": 1.11, "learning_rate": 0.0001340509252658892, "loss": 0.0116, "step": 426800 }, { "epoch": 1.11, "learning_rate": 0.0001340470370495177, "loss": 0.0131, "step": 426810 }, { "epoch": 1.11, "learning_rate": 0.00013404314883314625, "loss": 0.0145, "step": 426820 }, { "epoch": 1.11, "learning_rate": 0.0001340392606167748, "loss": 0.0107, "step": 426830 }, { "epoch": 1.11, "learning_rate": 0.00013403537240040333, "loss": 0.01, "step": 426840 }, { "epoch": 1.11, "learning_rate": 0.00013403148418403185, "loss": 0.013, "step": 426850 }, { "epoch": 1.11, "learning_rate": 0.0001340275959676604, "loss": 0.0098, "step": 426860 }, { "epoch": 1.11, "learning_rate": 0.00013402370775128893, "loss": 0.0081, "step": 426870 }, { "epoch": 1.11, "learning_rate": 0.00013401981953491747, "loss": 0.009, "step": 426880 }, { "epoch": 1.11, "learning_rate": 0.000134015931318546, "loss": 0.011, "step": 426890 }, { "epoch": 1.11, "learning_rate": 0.00013401204310217456, "loss": 0.0131, "step": 426900 }, { "epoch": 1.11, "learning_rate": 0.00013400815488580307, "loss": 0.0125, "step": 426910 }, { "epoch": 1.11, "learning_rate": 0.0001340042666694316, "loss": 0.0097, "step": 426920 }, { "epoch": 1.11, "learning_rate": 0.00013400037845306015, "loss": 0.0118, "step": 426930 }, { "epoch": 1.11, "learning_rate": 0.0001339964902366887, "loss": 0.0129, "step": 426940 }, { "epoch": 1.11, "learning_rate": 0.0001339926020203172, "loss": 0.01, "step": 426950 }, { "epoch": 1.11, "learning_rate": 0.00013398871380394575, "loss": 0.0107, "step": 426960 }, { "epoch": 1.11, "learning_rate": 0.0001339848255875743, "loss": 0.0094, "step": 426970 }, { "epoch": 1.11, "learning_rate": 0.00013398093737120284, "loss": 0.0143, "step": 426980 }, { "epoch": 1.11, "learning_rate": 0.00013397704915483135, "loss": 0.0142, "step": 426990 }, { "epoch": 1.11, "learning_rate": 0.0001339731609384599, "loss": 0.0135, "step": 427000 }, { "epoch": 1.11, "eval_cer": 0.8816872903168917, "eval_loss": 0.007585541810840368, "eval_runtime": 107.5996, "eval_samples_per_second": 18.587, "eval_steps_per_second": 4.647, "step": 427000 }, { "epoch": 1.11, "learning_rate": 0.00013396927272208843, "loss": 0.0115, "step": 427010 }, { "epoch": 1.11, "learning_rate": 0.00013396538450571695, "loss": 0.0112, "step": 427020 }, { "epoch": 1.11, "learning_rate": 0.0001339614962893455, "loss": 0.0111, "step": 427030 }, { "epoch": 1.11, "learning_rate": 0.00013395760807297403, "loss": 0.0109, "step": 427040 }, { "epoch": 1.11, "learning_rate": 0.00013395371985660257, "loss": 0.0094, "step": 427050 }, { "epoch": 1.11, "learning_rate": 0.0001339498316402311, "loss": 0.0112, "step": 427060 }, { "epoch": 1.11, "learning_rate": 0.00013394594342385963, "loss": 0.0126, "step": 427070 }, { "epoch": 1.11, "learning_rate": 0.00013394205520748817, "loss": 0.0137, "step": 427080 }, { "epoch": 1.11, "learning_rate": 0.0001339381669911167, "loss": 0.0127, "step": 427090 }, { "epoch": 1.11, "learning_rate": 0.00013393427877474525, "loss": 0.0127, "step": 427100 }, { "epoch": 1.11, "learning_rate": 0.0001339303905583738, "loss": 0.0132, "step": 427110 }, { "epoch": 1.11, "learning_rate": 0.0001339265023420023, "loss": 0.0089, "step": 427120 }, { "epoch": 1.11, "learning_rate": 0.00013392261412563085, "loss": 0.0097, "step": 427130 }, { "epoch": 1.11, "learning_rate": 0.0001339187259092594, "loss": 0.0116, "step": 427140 }, { "epoch": 1.11, "learning_rate": 0.00013391483769288794, "loss": 0.0109, "step": 427150 }, { "epoch": 1.11, "learning_rate": 0.00013391094947651645, "loss": 0.0101, "step": 427160 }, { "epoch": 1.11, "learning_rate": 0.000133907061260145, "loss": 0.0113, "step": 427170 }, { "epoch": 1.11, "learning_rate": 0.00013390317304377353, "loss": 0.0134, "step": 427180 }, { "epoch": 1.11, "learning_rate": 0.00013389928482740207, "loss": 0.012, "step": 427190 }, { "epoch": 1.11, "learning_rate": 0.0001338953966110306, "loss": 0.0121, "step": 427200 }, { "epoch": 1.11, "learning_rate": 0.00013389150839465913, "loss": 0.0115, "step": 427210 }, { "epoch": 1.11, "learning_rate": 0.00013388762017828767, "loss": 0.0135, "step": 427220 }, { "epoch": 1.11, "learning_rate": 0.00013388373196191621, "loss": 0.0126, "step": 427230 }, { "epoch": 1.11, "learning_rate": 0.00013387984374554473, "loss": 0.0076, "step": 427240 }, { "epoch": 1.11, "learning_rate": 0.00013387595552917327, "loss": 0.0115, "step": 427250 }, { "epoch": 1.11, "learning_rate": 0.0001338720673128018, "loss": 0.0099, "step": 427260 }, { "epoch": 1.11, "learning_rate": 0.00013386817909643033, "loss": 0.009, "step": 427270 }, { "epoch": 1.11, "learning_rate": 0.0001338642908800589, "loss": 0.0136, "step": 427280 }, { "epoch": 1.11, "learning_rate": 0.0001338604026636874, "loss": 0.0144, "step": 427290 }, { "epoch": 1.11, "learning_rate": 0.00013385651444731595, "loss": 0.0109, "step": 427300 }, { "epoch": 1.11, "learning_rate": 0.0001338526262309445, "loss": 0.0111, "step": 427310 }, { "epoch": 1.11, "learning_rate": 0.00013384873801457303, "loss": 0.0114, "step": 427320 }, { "epoch": 1.11, "learning_rate": 0.00013384484979820155, "loss": 0.0105, "step": 427330 }, { "epoch": 1.11, "learning_rate": 0.0001338409615818301, "loss": 0.0093, "step": 427340 }, { "epoch": 1.11, "learning_rate": 0.00013383707336545863, "loss": 0.0096, "step": 427350 }, { "epoch": 1.11, "learning_rate": 0.00013383318514908717, "loss": 0.0107, "step": 427360 }, { "epoch": 1.11, "learning_rate": 0.0001338292969327157, "loss": 0.015, "step": 427370 }, { "epoch": 1.11, "learning_rate": 0.00013382540871634423, "loss": 0.0113, "step": 427380 }, { "epoch": 1.11, "learning_rate": 0.00013382152049997277, "loss": 0.0099, "step": 427390 }, { "epoch": 1.11, "learning_rate": 0.0001338176322836013, "loss": 0.0105, "step": 427400 }, { "epoch": 1.11, "learning_rate": 0.00013381374406722983, "loss": 0.013, "step": 427410 }, { "epoch": 1.11, "learning_rate": 0.00013380985585085837, "loss": 0.0133, "step": 427420 }, { "epoch": 1.11, "learning_rate": 0.0001338059676344869, "loss": 0.0149, "step": 427430 }, { "epoch": 1.11, "learning_rate": 0.00013380207941811545, "loss": 0.0112, "step": 427440 }, { "epoch": 1.11, "learning_rate": 0.000133798191201744, "loss": 0.0106, "step": 427450 }, { "epoch": 1.11, "learning_rate": 0.00013379430298537254, "loss": 0.0102, "step": 427460 }, { "epoch": 1.11, "learning_rate": 0.00013379041476900105, "loss": 0.0092, "step": 427470 }, { "epoch": 1.11, "learning_rate": 0.0001337865265526296, "loss": 0.0107, "step": 427480 }, { "epoch": 1.11, "learning_rate": 0.00013378263833625813, "loss": 0.0103, "step": 427490 }, { "epoch": 1.11, "learning_rate": 0.00013377875011988665, "loss": 0.0092, "step": 427500 }, { "epoch": 1.11, "learning_rate": 0.0001337748619035152, "loss": 0.0139, "step": 427510 }, { "epoch": 1.11, "learning_rate": 0.00013377097368714373, "loss": 0.0194, "step": 427520 }, { "epoch": 1.11, "learning_rate": 0.00013376708547077227, "loss": 0.0087, "step": 427530 }, { "epoch": 1.11, "learning_rate": 0.0001337631972544008, "loss": 0.0119, "step": 427540 }, { "epoch": 1.11, "learning_rate": 0.00013375930903802933, "loss": 0.0089, "step": 427550 }, { "epoch": 1.11, "learning_rate": 0.00013375542082165787, "loss": 0.0108, "step": 427560 }, { "epoch": 1.11, "learning_rate": 0.0001337515326052864, "loss": 0.0114, "step": 427570 }, { "epoch": 1.11, "learning_rate": 0.00013374764438891493, "loss": 0.0108, "step": 427580 }, { "epoch": 1.11, "learning_rate": 0.00013374375617254347, "loss": 0.0111, "step": 427590 }, { "epoch": 1.11, "learning_rate": 0.000133739867956172, "loss": 0.0109, "step": 427600 }, { "epoch": 1.11, "learning_rate": 0.00013373597973980055, "loss": 0.009, "step": 427610 }, { "epoch": 1.11, "learning_rate": 0.00013373209152342907, "loss": 0.0128, "step": 427620 }, { "epoch": 1.11, "learning_rate": 0.00013372820330705764, "loss": 0.0114, "step": 427630 }, { "epoch": 1.11, "learning_rate": 0.00013372431509068615, "loss": 0.0097, "step": 427640 }, { "epoch": 1.11, "learning_rate": 0.0001337204268743147, "loss": 0.0129, "step": 427650 }, { "epoch": 1.11, "learning_rate": 0.00013371653865794323, "loss": 0.0106, "step": 427660 }, { "epoch": 1.11, "learning_rate": 0.00013371265044157177, "loss": 0.0099, "step": 427670 }, { "epoch": 1.11, "learning_rate": 0.0001337087622252003, "loss": 0.0118, "step": 427680 }, { "epoch": 1.11, "learning_rate": 0.00013370487400882883, "loss": 0.0078, "step": 427690 }, { "epoch": 1.11, "learning_rate": 0.00013370098579245737, "loss": 0.0132, "step": 427700 }, { "epoch": 1.11, "learning_rate": 0.00013369709757608591, "loss": 0.0107, "step": 427710 }, { "epoch": 1.11, "learning_rate": 0.00013369320935971443, "loss": 0.0097, "step": 427720 }, { "epoch": 1.11, "learning_rate": 0.00013368932114334297, "loss": 0.0121, "step": 427730 }, { "epoch": 1.11, "learning_rate": 0.0001336854329269715, "loss": 0.011, "step": 427740 }, { "epoch": 1.11, "learning_rate": 0.00013368154471060003, "loss": 0.0091, "step": 427750 }, { "epoch": 1.11, "learning_rate": 0.00013367765649422857, "loss": 0.0093, "step": 427760 }, { "epoch": 1.11, "learning_rate": 0.0001336737682778571, "loss": 0.0094, "step": 427770 }, { "epoch": 1.11, "learning_rate": 0.00013366988006148565, "loss": 0.0095, "step": 427780 }, { "epoch": 1.11, "learning_rate": 0.00013366599184511417, "loss": 0.0094, "step": 427790 }, { "epoch": 1.11, "learning_rate": 0.00013366210362874273, "loss": 0.0143, "step": 427800 }, { "epoch": 1.11, "learning_rate": 0.00013365821541237125, "loss": 0.0138, "step": 427810 }, { "epoch": 1.11, "learning_rate": 0.0001336543271959998, "loss": 0.0105, "step": 427820 }, { "epoch": 1.11, "learning_rate": 0.00013365043897962833, "loss": 0.0092, "step": 427830 }, { "epoch": 1.11, "learning_rate": 0.00013364655076325687, "loss": 0.01, "step": 427840 }, { "epoch": 1.11, "learning_rate": 0.0001336426625468854, "loss": 0.012, "step": 427850 }, { "epoch": 1.11, "learning_rate": 0.00013363877433051393, "loss": 0.0086, "step": 427860 }, { "epoch": 1.11, "learning_rate": 0.00013363488611414247, "loss": 0.0114, "step": 427870 }, { "epoch": 1.11, "learning_rate": 0.00013363099789777101, "loss": 0.0131, "step": 427880 }, { "epoch": 1.11, "learning_rate": 0.00013362710968139953, "loss": 0.0105, "step": 427890 }, { "epoch": 1.11, "learning_rate": 0.00013362322146502807, "loss": 0.0121, "step": 427900 }, { "epoch": 1.11, "learning_rate": 0.0001336193332486566, "loss": 0.0098, "step": 427910 }, { "epoch": 1.11, "learning_rate": 0.00013361544503228515, "loss": 0.0106, "step": 427920 }, { "epoch": 1.11, "learning_rate": 0.00013361155681591367, "loss": 0.0106, "step": 427930 }, { "epoch": 1.11, "learning_rate": 0.0001336076685995422, "loss": 0.0109, "step": 427940 }, { "epoch": 1.11, "learning_rate": 0.00013360378038317075, "loss": 0.012, "step": 427950 }, { "epoch": 1.11, "learning_rate": 0.0001335998921667993, "loss": 0.0112, "step": 427960 }, { "epoch": 1.11, "learning_rate": 0.00013359600395042783, "loss": 0.0117, "step": 427970 }, { "epoch": 1.11, "learning_rate": 0.00013359211573405638, "loss": 0.0117, "step": 427980 }, { "epoch": 1.11, "learning_rate": 0.0001335882275176849, "loss": 0.0095, "step": 427990 }, { "epoch": 1.11, "learning_rate": 0.00013358433930131343, "loss": 0.012, "step": 428000 }, { "epoch": 1.11, "eval_cer": 0.8816788924952867, "eval_loss": 0.007801650557667017, "eval_runtime": 107.5281, "eval_samples_per_second": 18.6, "eval_steps_per_second": 4.65, "step": 428000 }, { "epoch": 1.11, "learning_rate": 0.00013358045108494197, "loss": 0.0129, "step": 428010 }, { "epoch": 1.11, "learning_rate": 0.0001335765628685705, "loss": 0.0122, "step": 428020 }, { "epoch": 1.11, "learning_rate": 0.00013357267465219903, "loss": 0.0098, "step": 428030 }, { "epoch": 1.11, "learning_rate": 0.00013356878643582757, "loss": 0.0117, "step": 428040 }, { "epoch": 1.11, "learning_rate": 0.0001335648982194561, "loss": 0.011, "step": 428050 }, { "epoch": 1.11, "learning_rate": 0.00013356101000308463, "loss": 0.0077, "step": 428060 }, { "epoch": 1.11, "learning_rate": 0.00013355712178671317, "loss": 0.0088, "step": 428070 }, { "epoch": 1.11, "learning_rate": 0.0001335532335703417, "loss": 0.011, "step": 428080 }, { "epoch": 1.11, "learning_rate": 0.00013354934535397025, "loss": 0.0084, "step": 428090 }, { "epoch": 1.11, "learning_rate": 0.00013354545713759877, "loss": 0.0117, "step": 428100 }, { "epoch": 1.11, "learning_rate": 0.0001335415689212273, "loss": 0.0096, "step": 428110 }, { "epoch": 1.11, "learning_rate": 0.00013353768070485585, "loss": 0.0105, "step": 428120 }, { "epoch": 1.11, "learning_rate": 0.0001335337924884844, "loss": 0.0105, "step": 428130 }, { "epoch": 1.11, "learning_rate": 0.0001335299042721129, "loss": 0.0099, "step": 428140 }, { "epoch": 1.11, "learning_rate": 0.00013352601605574148, "loss": 0.0105, "step": 428150 }, { "epoch": 1.11, "learning_rate": 0.00013352212783937, "loss": 0.0118, "step": 428160 }, { "epoch": 1.11, "learning_rate": 0.00013351823962299853, "loss": 0.0111, "step": 428170 }, { "epoch": 1.11, "learning_rate": 0.00013351435140662707, "loss": 0.0133, "step": 428180 }, { "epoch": 1.11, "learning_rate": 0.00013351046319025561, "loss": 0.0111, "step": 428190 }, { "epoch": 1.11, "learning_rate": 0.00013350657497388413, "loss": 0.0107, "step": 428200 }, { "epoch": 1.11, "learning_rate": 0.00013350268675751267, "loss": 0.0152, "step": 428210 }, { "epoch": 1.11, "learning_rate": 0.0001334987985411412, "loss": 0.0153, "step": 428220 }, { "epoch": 1.11, "learning_rate": 0.00013349491032476975, "loss": 0.0105, "step": 428230 }, { "epoch": 1.11, "learning_rate": 0.00013349102210839827, "loss": 0.0135, "step": 428240 }, { "epoch": 1.11, "learning_rate": 0.0001334871338920268, "loss": 0.0108, "step": 428250 }, { "epoch": 1.11, "learning_rate": 0.00013348324567565535, "loss": 0.0122, "step": 428260 }, { "epoch": 1.11, "learning_rate": 0.00013347935745928387, "loss": 0.0118, "step": 428270 }, { "epoch": 1.11, "learning_rate": 0.0001334754692429124, "loss": 0.0106, "step": 428280 }, { "epoch": 1.11, "learning_rate": 0.00013347158102654095, "loss": 0.0097, "step": 428290 }, { "epoch": 1.11, "learning_rate": 0.0001334676928101695, "loss": 0.0079, "step": 428300 }, { "epoch": 1.11, "learning_rate": 0.000133463804593798, "loss": 0.0103, "step": 428310 }, { "epoch": 1.11, "learning_rate": 0.00013345991637742657, "loss": 0.0221, "step": 428320 }, { "epoch": 1.11, "learning_rate": 0.0001334560281610551, "loss": 0.0112, "step": 428330 }, { "epoch": 1.11, "learning_rate": 0.00013345213994468363, "loss": 0.0089, "step": 428340 }, { "epoch": 1.11, "learning_rate": 0.00013344825172831217, "loss": 0.0085, "step": 428350 }, { "epoch": 1.11, "learning_rate": 0.00013344436351194071, "loss": 0.011, "step": 428360 }, { "epoch": 1.11, "learning_rate": 0.00013344047529556923, "loss": 0.0098, "step": 428370 }, { "epoch": 1.11, "learning_rate": 0.00013343658707919777, "loss": 0.0087, "step": 428380 }, { "epoch": 1.11, "learning_rate": 0.0001334326988628263, "loss": 0.0105, "step": 428390 }, { "epoch": 1.11, "learning_rate": 0.00013342881064645485, "loss": 0.0123, "step": 428400 }, { "epoch": 1.11, "learning_rate": 0.00013342492243008337, "loss": 0.0099, "step": 428410 }, { "epoch": 1.11, "learning_rate": 0.0001334210342137119, "loss": 0.0113, "step": 428420 }, { "epoch": 1.11, "learning_rate": 0.00013341714599734045, "loss": 0.0121, "step": 428430 }, { "epoch": 1.11, "learning_rate": 0.000133413257780969, "loss": 0.0097, "step": 428440 }, { "epoch": 1.11, "learning_rate": 0.0001334093695645975, "loss": 0.0091, "step": 428450 }, { "epoch": 1.11, "learning_rate": 0.00013340548134822605, "loss": 0.0145, "step": 428460 }, { "epoch": 1.11, "learning_rate": 0.0001334015931318546, "loss": 0.0103, "step": 428470 }, { "epoch": 1.11, "learning_rate": 0.00013339770491548313, "loss": 0.01, "step": 428480 }, { "epoch": 1.11, "learning_rate": 0.00013339381669911167, "loss": 0.0132, "step": 428490 }, { "epoch": 1.11, "learning_rate": 0.0001333899284827402, "loss": 0.0103, "step": 428500 }, { "epoch": 1.11, "learning_rate": 0.00013338604026636873, "loss": 0.0115, "step": 428510 }, { "epoch": 1.11, "learning_rate": 0.00013338215204999727, "loss": 0.0107, "step": 428520 }, { "epoch": 1.11, "learning_rate": 0.00013337826383362581, "loss": 0.0113, "step": 428530 }, { "epoch": 1.11, "learning_rate": 0.00013337437561725433, "loss": 0.0123, "step": 428540 }, { "epoch": 1.11, "learning_rate": 0.00013337048740088287, "loss": 0.0093, "step": 428550 }, { "epoch": 1.11, "learning_rate": 0.0001333665991845114, "loss": 0.0105, "step": 428560 }, { "epoch": 1.11, "learning_rate": 0.00013336271096813995, "loss": 0.0122, "step": 428570 }, { "epoch": 1.11, "learning_rate": 0.00013335882275176847, "loss": 0.0132, "step": 428580 }, { "epoch": 1.11, "learning_rate": 0.000133354934535397, "loss": 0.0109, "step": 428590 }, { "epoch": 1.11, "learning_rate": 0.00013335104631902555, "loss": 0.0137, "step": 428600 }, { "epoch": 1.11, "learning_rate": 0.0001333471581026541, "loss": 0.0135, "step": 428610 }, { "epoch": 1.11, "learning_rate": 0.0001333432698862826, "loss": 0.0103, "step": 428620 }, { "epoch": 1.11, "learning_rate": 0.00013333938166991115, "loss": 0.0094, "step": 428630 }, { "epoch": 1.11, "learning_rate": 0.0001333354934535397, "loss": 0.0104, "step": 428640 }, { "epoch": 1.11, "learning_rate": 0.00013333160523716823, "loss": 0.014, "step": 428650 }, { "epoch": 1.11, "learning_rate": 0.00013332771702079675, "loss": 0.0112, "step": 428660 }, { "epoch": 1.11, "learning_rate": 0.00013332382880442532, "loss": 0.0073, "step": 428670 }, { "epoch": 1.11, "learning_rate": 0.00013331994058805383, "loss": 0.0142, "step": 428680 }, { "epoch": 1.11, "learning_rate": 0.00013331605237168237, "loss": 0.0117, "step": 428690 }, { "epoch": 1.11, "learning_rate": 0.0001333121641553109, "loss": 0.0114, "step": 428700 }, { "epoch": 1.11, "learning_rate": 0.00013330827593893945, "loss": 0.0109, "step": 428710 }, { "epoch": 1.11, "learning_rate": 0.00013330438772256797, "loss": 0.0123, "step": 428720 }, { "epoch": 1.11, "learning_rate": 0.0001333004995061965, "loss": 0.0111, "step": 428730 }, { "epoch": 1.11, "learning_rate": 0.00013329661128982505, "loss": 0.0101, "step": 428740 }, { "epoch": 1.11, "learning_rate": 0.00013329272307345357, "loss": 0.0089, "step": 428750 }, { "epoch": 1.11, "learning_rate": 0.0001332888348570821, "loss": 0.0127, "step": 428760 }, { "epoch": 1.11, "learning_rate": 0.00013328494664071065, "loss": 0.0134, "step": 428770 }, { "epoch": 1.11, "learning_rate": 0.0001332810584243392, "loss": 0.0099, "step": 428780 }, { "epoch": 1.11, "learning_rate": 0.0001332771702079677, "loss": 0.0128, "step": 428790 }, { "epoch": 1.11, "learning_rate": 0.00013327328199159625, "loss": 0.0088, "step": 428800 }, { "epoch": 1.11, "learning_rate": 0.0001332693937752248, "loss": 0.0098, "step": 428810 }, { "epoch": 1.11, "learning_rate": 0.00013326550555885333, "loss": 0.0075, "step": 428820 }, { "epoch": 1.11, "learning_rate": 0.00013326161734248185, "loss": 0.0127, "step": 428830 }, { "epoch": 1.11, "learning_rate": 0.00013325772912611041, "loss": 0.0122, "step": 428840 }, { "epoch": 1.11, "learning_rate": 0.00013325384090973893, "loss": 0.0126, "step": 428850 }, { "epoch": 1.11, "learning_rate": 0.00013324995269336747, "loss": 0.0093, "step": 428860 }, { "epoch": 1.11, "learning_rate": 0.000133246064476996, "loss": 0.0105, "step": 428870 }, { "epoch": 1.11, "learning_rate": 0.00013324217626062455, "loss": 0.0125, "step": 428880 }, { "epoch": 1.11, "learning_rate": 0.00013323828804425307, "loss": 0.0107, "step": 428890 }, { "epoch": 1.11, "learning_rate": 0.0001332343998278816, "loss": 0.0136, "step": 428900 }, { "epoch": 1.11, "learning_rate": 0.00013323051161151015, "loss": 0.011, "step": 428910 }, { "epoch": 1.11, "learning_rate": 0.0001332266233951387, "loss": 0.0086, "step": 428920 }, { "epoch": 1.11, "learning_rate": 0.0001332227351787672, "loss": 0.0124, "step": 428930 }, { "epoch": 1.11, "learning_rate": 0.00013321884696239575, "loss": 0.0107, "step": 428940 }, { "epoch": 1.11, "learning_rate": 0.0001332149587460243, "loss": 0.0113, "step": 428950 }, { "epoch": 1.11, "learning_rate": 0.00013321107052965283, "loss": 0.0123, "step": 428960 }, { "epoch": 1.11, "learning_rate": 0.00013320718231328135, "loss": 0.0123, "step": 428970 }, { "epoch": 1.11, "learning_rate": 0.0001332032940969099, "loss": 0.0124, "step": 428980 }, { "epoch": 1.11, "learning_rate": 0.00013319940588053843, "loss": 0.0139, "step": 428990 }, { "epoch": 1.11, "learning_rate": 0.00013319551766416695, "loss": 0.0133, "step": 429000 }, { "epoch": 1.11, "eval_cer": 0.8816914892276944, "eval_loss": 0.007387722842395306, "eval_runtime": 107.4783, "eval_samples_per_second": 18.608, "eval_steps_per_second": 4.652, "step": 429000 }, { "epoch": 1.11, "learning_rate": 0.0001331916294477955, "loss": 0.0122, "step": 429010 }, { "epoch": 1.11, "learning_rate": 0.00013318774123142403, "loss": 0.01, "step": 429020 }, { "epoch": 1.11, "learning_rate": 0.00013318385301505257, "loss": 0.0116, "step": 429030 }, { "epoch": 1.11, "learning_rate": 0.0001331799647986811, "loss": 0.0109, "step": 429040 }, { "epoch": 1.11, "learning_rate": 0.00013317607658230965, "loss": 0.0122, "step": 429050 }, { "epoch": 1.11, "learning_rate": 0.00013317218836593817, "loss": 0.0097, "step": 429060 }, { "epoch": 1.11, "learning_rate": 0.0001331683001495667, "loss": 0.0111, "step": 429070 }, { "epoch": 1.11, "learning_rate": 0.00013316441193319525, "loss": 0.0142, "step": 429080 }, { "epoch": 1.11, "learning_rate": 0.0001331605237168238, "loss": 0.0139, "step": 429090 }, { "epoch": 1.11, "learning_rate": 0.0001331566355004523, "loss": 0.0125, "step": 429100 }, { "epoch": 1.11, "learning_rate": 0.00013315274728408085, "loss": 0.011, "step": 429110 }, { "epoch": 1.11, "learning_rate": 0.0001331488590677094, "loss": 0.0124, "step": 429120 }, { "epoch": 1.11, "learning_rate": 0.00013314497085133793, "loss": 0.0101, "step": 429130 }, { "epoch": 1.11, "learning_rate": 0.00013314108263496645, "loss": 0.015, "step": 429140 }, { "epoch": 1.11, "learning_rate": 0.000133137194418595, "loss": 0.0101, "step": 429150 }, { "epoch": 1.11, "learning_rate": 0.00013313330620222353, "loss": 0.0129, "step": 429160 }, { "epoch": 1.11, "learning_rate": 0.00013312941798585207, "loss": 0.0142, "step": 429170 }, { "epoch": 1.11, "learning_rate": 0.0001331255297694806, "loss": 0.0092, "step": 429180 }, { "epoch": 1.11, "learning_rate": 0.00013312164155310916, "loss": 0.0106, "step": 429190 }, { "epoch": 1.11, "learning_rate": 0.00013311775333673767, "loss": 0.0097, "step": 429200 }, { "epoch": 1.11, "learning_rate": 0.0001331138651203662, "loss": 0.0116, "step": 429210 }, { "epoch": 1.11, "learning_rate": 0.00013310997690399475, "loss": 0.01, "step": 429220 }, { "epoch": 1.11, "learning_rate": 0.00013310608868762327, "loss": 0.0091, "step": 429230 }, { "epoch": 1.11, "learning_rate": 0.0001331022004712518, "loss": 0.0111, "step": 429240 }, { "epoch": 1.11, "learning_rate": 0.00013309831225488035, "loss": 0.0108, "step": 429250 }, { "epoch": 1.11, "learning_rate": 0.0001330944240385089, "loss": 0.0103, "step": 429260 }, { "epoch": 1.11, "learning_rate": 0.0001330905358221374, "loss": 0.0117, "step": 429270 }, { "epoch": 1.11, "learning_rate": 0.00013308664760576595, "loss": 0.0104, "step": 429280 }, { "epoch": 1.11, "learning_rate": 0.0001330827593893945, "loss": 0.0089, "step": 429290 }, { "epoch": 1.11, "learning_rate": 0.00013307887117302303, "loss": 0.0112, "step": 429300 }, { "epoch": 1.11, "learning_rate": 0.00013307498295665155, "loss": 0.0122, "step": 429310 }, { "epoch": 1.11, "learning_rate": 0.0001330710947402801, "loss": 0.013, "step": 429320 }, { "epoch": 1.11, "learning_rate": 0.00013306720652390863, "loss": 0.0126, "step": 429330 }, { "epoch": 1.11, "learning_rate": 0.00013306331830753717, "loss": 0.0094, "step": 429340 }, { "epoch": 1.11, "learning_rate": 0.00013305943009116569, "loss": 0.0095, "step": 429350 }, { "epoch": 1.11, "learning_rate": 0.00013305554187479425, "loss": 0.0122, "step": 429360 }, { "epoch": 1.11, "learning_rate": 0.00013305165365842277, "loss": 0.0113, "step": 429370 }, { "epoch": 1.11, "learning_rate": 0.0001330477654420513, "loss": 0.0107, "step": 429380 }, { "epoch": 1.11, "learning_rate": 0.00013304387722567985, "loss": 0.0138, "step": 429390 }, { "epoch": 1.11, "learning_rate": 0.0001330399890093084, "loss": 0.0109, "step": 429400 }, { "epoch": 1.11, "learning_rate": 0.0001330361007929369, "loss": 0.0111, "step": 429410 }, { "epoch": 1.11, "learning_rate": 0.00013303221257656545, "loss": 0.0098, "step": 429420 }, { "epoch": 1.11, "learning_rate": 0.000133028324360194, "loss": 0.0109, "step": 429430 }, { "epoch": 1.11, "learning_rate": 0.00013302443614382253, "loss": 0.0149, "step": 429440 }, { "epoch": 1.11, "learning_rate": 0.00013302054792745105, "loss": 0.0096, "step": 429450 }, { "epoch": 1.11, "learning_rate": 0.0001330166597110796, "loss": 0.0101, "step": 429460 }, { "epoch": 1.11, "learning_rate": 0.00013301277149470813, "loss": 0.0115, "step": 429470 }, { "epoch": 1.11, "learning_rate": 0.00013300888327833665, "loss": 0.0117, "step": 429480 }, { "epoch": 1.11, "learning_rate": 0.0001330049950619652, "loss": 0.0131, "step": 429490 }, { "epoch": 1.11, "learning_rate": 0.00013300110684559373, "loss": 0.0085, "step": 429500 }, { "epoch": 1.11, "learning_rate": 0.00013299721862922227, "loss": 0.0127, "step": 429510 }, { "epoch": 1.11, "learning_rate": 0.00013299333041285079, "loss": 0.0107, "step": 429520 }, { "epoch": 1.11, "learning_rate": 0.00013298944219647933, "loss": 0.0102, "step": 429530 }, { "epoch": 1.11, "learning_rate": 0.00013298555398010787, "loss": 0.0123, "step": 429540 }, { "epoch": 1.11, "learning_rate": 0.0001329816657637364, "loss": 0.0095, "step": 429550 }, { "epoch": 1.11, "learning_rate": 0.00013297777754736495, "loss": 0.0087, "step": 429560 }, { "epoch": 1.11, "learning_rate": 0.0001329738893309935, "loss": 0.0116, "step": 429570 }, { "epoch": 1.11, "learning_rate": 0.000132970001114622, "loss": 0.01, "step": 429580 }, { "epoch": 1.11, "learning_rate": 0.00013296611289825055, "loss": 0.0098, "step": 429590 }, { "epoch": 1.11, "learning_rate": 0.0001329622246818791, "loss": 0.0083, "step": 429600 }, { "epoch": 1.11, "learning_rate": 0.00013295833646550763, "loss": 0.013, "step": 429610 }, { "epoch": 1.11, "learning_rate": 0.00013295444824913615, "loss": 0.0135, "step": 429620 }, { "epoch": 1.11, "learning_rate": 0.0001329505600327647, "loss": 0.013, "step": 429630 }, { "epoch": 1.11, "learning_rate": 0.00013294667181639323, "loss": 0.01, "step": 429640 }, { "epoch": 1.11, "learning_rate": 0.00013294278360002177, "loss": 0.0165, "step": 429650 }, { "epoch": 1.11, "learning_rate": 0.0001329388953836503, "loss": 0.0087, "step": 429660 }, { "epoch": 1.11, "learning_rate": 0.00013293500716727883, "loss": 0.0119, "step": 429670 }, { "epoch": 1.11, "learning_rate": 0.00013293111895090737, "loss": 0.0135, "step": 429680 }, { "epoch": 1.11, "learning_rate": 0.0001329272307345359, "loss": 0.0114, "step": 429690 }, { "epoch": 1.11, "learning_rate": 0.00013292334251816443, "loss": 0.0129, "step": 429700 }, { "epoch": 1.11, "learning_rate": 0.000132919454301793, "loss": 0.0099, "step": 429710 }, { "epoch": 1.11, "learning_rate": 0.0001329155660854215, "loss": 0.0076, "step": 429720 }, { "epoch": 1.11, "learning_rate": 0.00013291167786905002, "loss": 0.0121, "step": 429730 }, { "epoch": 1.11, "learning_rate": 0.0001329077896526786, "loss": 0.0084, "step": 429740 }, { "epoch": 1.11, "learning_rate": 0.0001329039014363071, "loss": 0.0109, "step": 429750 }, { "epoch": 1.11, "learning_rate": 0.00013290001321993565, "loss": 0.0086, "step": 429760 }, { "epoch": 1.11, "learning_rate": 0.0001328961250035642, "loss": 0.0153, "step": 429770 }, { "epoch": 1.11, "learning_rate": 0.00013289223678719273, "loss": 0.0116, "step": 429780 }, { "epoch": 1.11, "learning_rate": 0.00013288834857082125, "loss": 0.0095, "step": 429790 }, { "epoch": 1.11, "learning_rate": 0.0001328844603544498, "loss": 0.0177, "step": 429800 }, { "epoch": 1.11, "learning_rate": 0.00013288057213807833, "loss": 0.0157, "step": 429810 }, { "epoch": 1.11, "learning_rate": 0.00013287668392170687, "loss": 0.0118, "step": 429820 }, { "epoch": 1.11, "learning_rate": 0.00013287279570533539, "loss": 0.0108, "step": 429830 }, { "epoch": 1.11, "learning_rate": 0.00013286890748896393, "loss": 0.009, "step": 429840 }, { "epoch": 1.11, "learning_rate": 0.00013286501927259247, "loss": 0.0138, "step": 429850 }, { "epoch": 1.11, "learning_rate": 0.000132861131056221, "loss": 0.0115, "step": 429860 }, { "epoch": 1.11, "learning_rate": 0.00013285724283984953, "loss": 0.0095, "step": 429870 }, { "epoch": 1.11, "learning_rate": 0.0001328533546234781, "loss": 0.0112, "step": 429880 }, { "epoch": 1.11, "learning_rate": 0.0001328494664071066, "loss": 0.0109, "step": 429890 }, { "epoch": 1.11, "learning_rate": 0.00013284557819073515, "loss": 0.0089, "step": 429900 }, { "epoch": 1.11, "learning_rate": 0.0001328416899743637, "loss": 0.0119, "step": 429910 }, { "epoch": 1.11, "learning_rate": 0.00013283780175799223, "loss": 0.016, "step": 429920 }, { "epoch": 1.11, "learning_rate": 0.00013283391354162075, "loss": 0.0147, "step": 429930 }, { "epoch": 1.11, "learning_rate": 0.0001328300253252493, "loss": 0.015, "step": 429940 }, { "epoch": 1.11, "learning_rate": 0.00013282613710887783, "loss": 0.0123, "step": 429950 }, { "epoch": 1.11, "learning_rate": 0.00013282224889250637, "loss": 0.012, "step": 429960 }, { "epoch": 1.11, "learning_rate": 0.0001328183606761349, "loss": 0.0113, "step": 429970 }, { "epoch": 1.11, "learning_rate": 0.00013281447245976343, "loss": 0.0128, "step": 429980 }, { "epoch": 1.11, "learning_rate": 0.00013281058424339197, "loss": 0.011, "step": 429990 }, { "epoch": 1.11, "learning_rate": 0.00013280669602702049, "loss": 0.0108, "step": 430000 }, { "epoch": 1.11, "eval_cer": 0.8817124837817071, "eval_loss": 0.007531081326305866, "eval_runtime": 107.5849, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.647, "step": 430000 }, { "epoch": 1.11, "learning_rate": 0.00013280280781064903, "loss": 0.0092, "step": 430010 }, { "epoch": 1.11, "learning_rate": 0.00013279891959427757, "loss": 0.0132, "step": 430020 }, { "epoch": 1.11, "learning_rate": 0.0001327950313779061, "loss": 0.0124, "step": 430030 }, { "epoch": 1.11, "learning_rate": 0.00013279114316153463, "loss": 0.0084, "step": 430040 }, { "epoch": 1.11, "learning_rate": 0.00013278725494516317, "loss": 0.0094, "step": 430050 }, { "epoch": 1.11, "learning_rate": 0.0001327833667287917, "loss": 0.0163, "step": 430060 }, { "epoch": 1.11, "learning_rate": 0.00013277947851242025, "loss": 0.0102, "step": 430070 }, { "epoch": 1.11, "learning_rate": 0.0001327755902960488, "loss": 0.0117, "step": 430080 }, { "epoch": 1.11, "learning_rate": 0.00013277170207967733, "loss": 0.0113, "step": 430090 }, { "epoch": 1.11, "learning_rate": 0.00013276781386330585, "loss": 0.0085, "step": 430100 }, { "epoch": 1.11, "learning_rate": 0.0001327639256469344, "loss": 0.0147, "step": 430110 }, { "epoch": 1.11, "learning_rate": 0.00013276003743056293, "loss": 0.0139, "step": 430120 }, { "epoch": 1.11, "learning_rate": 0.00013275614921419147, "loss": 0.0114, "step": 430130 }, { "epoch": 1.11, "learning_rate": 0.00013275226099782, "loss": 0.0131, "step": 430140 }, { "epoch": 1.12, "learning_rate": 0.00013274837278144853, "loss": 0.0093, "step": 430150 }, { "epoch": 1.12, "learning_rate": 0.00013274448456507707, "loss": 0.0086, "step": 430160 }, { "epoch": 1.12, "learning_rate": 0.0001327405963487056, "loss": 0.0111, "step": 430170 }, { "epoch": 1.12, "learning_rate": 0.00013273670813233413, "loss": 0.0106, "step": 430180 }, { "epoch": 1.12, "learning_rate": 0.00013273281991596267, "loss": 0.0076, "step": 430190 }, { "epoch": 1.12, "learning_rate": 0.0001327289316995912, "loss": 0.0124, "step": 430200 }, { "epoch": 1.12, "learning_rate": 0.00013272504348321975, "loss": 0.0148, "step": 430210 }, { "epoch": 1.12, "learning_rate": 0.00013272115526684827, "loss": 0.0093, "step": 430220 }, { "epoch": 1.12, "learning_rate": 0.0001327172670504768, "loss": 0.0111, "step": 430230 }, { "epoch": 1.12, "learning_rate": 0.00013271337883410535, "loss": 0.0109, "step": 430240 }, { "epoch": 1.12, "learning_rate": 0.00013270949061773386, "loss": 0.0114, "step": 430250 }, { "epoch": 1.12, "learning_rate": 0.00013270560240136243, "loss": 0.0106, "step": 430260 }, { "epoch": 1.12, "learning_rate": 0.00013270171418499095, "loss": 0.0105, "step": 430270 }, { "epoch": 1.12, "learning_rate": 0.0001326978259686195, "loss": 0.0095, "step": 430280 }, { "epoch": 1.12, "learning_rate": 0.00013269393775224803, "loss": 0.0093, "step": 430290 }, { "epoch": 1.12, "learning_rate": 0.00013269004953587657, "loss": 0.0111, "step": 430300 }, { "epoch": 1.12, "learning_rate": 0.0001326861613195051, "loss": 0.0088, "step": 430310 }, { "epoch": 1.12, "learning_rate": 0.00013268227310313363, "loss": 0.0115, "step": 430320 }, { "epoch": 1.12, "learning_rate": 0.00013267838488676217, "loss": 0.0112, "step": 430330 }, { "epoch": 1.12, "learning_rate": 0.0001326744966703907, "loss": 0.0115, "step": 430340 }, { "epoch": 1.12, "learning_rate": 0.00013267060845401923, "loss": 0.0099, "step": 430350 }, { "epoch": 1.12, "learning_rate": 0.00013266672023764777, "loss": 0.0149, "step": 430360 }, { "epoch": 1.12, "learning_rate": 0.0001326628320212763, "loss": 0.0101, "step": 430370 }, { "epoch": 1.12, "learning_rate": 0.00013265894380490485, "loss": 0.0133, "step": 430380 }, { "epoch": 1.12, "learning_rate": 0.00013265505558853337, "loss": 0.014, "step": 430390 }, { "epoch": 1.12, "learning_rate": 0.0001326511673721619, "loss": 0.0124, "step": 430400 }, { "epoch": 1.12, "learning_rate": 0.00013264727915579045, "loss": 0.0112, "step": 430410 }, { "epoch": 1.12, "learning_rate": 0.000132643390939419, "loss": 0.013, "step": 430420 }, { "epoch": 1.12, "learning_rate": 0.00013263950272304753, "loss": 0.0098, "step": 430430 }, { "epoch": 1.12, "learning_rate": 0.00013263561450667607, "loss": 0.0117, "step": 430440 }, { "epoch": 1.12, "learning_rate": 0.0001326317262903046, "loss": 0.0132, "step": 430450 }, { "epoch": 1.12, "learning_rate": 0.00013262783807393313, "loss": 0.0094, "step": 430460 }, { "epoch": 1.12, "learning_rate": 0.00013262394985756167, "loss": 0.0153, "step": 430470 }, { "epoch": 1.12, "learning_rate": 0.00013262006164119019, "loss": 0.009, "step": 430480 }, { "epoch": 1.12, "learning_rate": 0.00013261617342481873, "loss": 0.01, "step": 430490 }, { "epoch": 1.12, "learning_rate": 0.00013261228520844727, "loss": 0.0119, "step": 430500 }, { "epoch": 1.12, "learning_rate": 0.0001326083969920758, "loss": 0.015, "step": 430510 }, { "epoch": 1.12, "learning_rate": 0.00013260450877570433, "loss": 0.0104, "step": 430520 }, { "epoch": 1.12, "learning_rate": 0.00013260062055933287, "loss": 0.0154, "step": 430530 }, { "epoch": 1.12, "learning_rate": 0.0001325967323429614, "loss": 0.0092, "step": 430540 }, { "epoch": 1.12, "learning_rate": 0.00013259284412658995, "loss": 0.0094, "step": 430550 }, { "epoch": 1.12, "learning_rate": 0.00013258895591021847, "loss": 0.0099, "step": 430560 }, { "epoch": 1.12, "learning_rate": 0.000132585067693847, "loss": 0.0094, "step": 430570 }, { "epoch": 1.12, "learning_rate": 0.00013258117947747555, "loss": 0.0114, "step": 430580 }, { "epoch": 1.12, "learning_rate": 0.0001325772912611041, "loss": 0.009, "step": 430590 }, { "epoch": 1.12, "learning_rate": 0.0001325734030447326, "loss": 0.0141, "step": 430600 }, { "epoch": 1.12, "learning_rate": 0.00013256951482836117, "loss": 0.0113, "step": 430610 }, { "epoch": 1.12, "learning_rate": 0.0001325656266119897, "loss": 0.0136, "step": 430620 }, { "epoch": 1.12, "learning_rate": 0.00013256173839561823, "loss": 0.0085, "step": 430630 }, { "epoch": 1.12, "learning_rate": 0.00013255785017924677, "loss": 0.0109, "step": 430640 }, { "epoch": 1.12, "learning_rate": 0.0001325539619628753, "loss": 0.0094, "step": 430650 }, { "epoch": 1.12, "learning_rate": 0.00013255007374650383, "loss": 0.0128, "step": 430660 }, { "epoch": 1.12, "learning_rate": 0.00013254618553013237, "loss": 0.0086, "step": 430670 }, { "epoch": 1.12, "learning_rate": 0.0001325422973137609, "loss": 0.011, "step": 430680 }, { "epoch": 1.12, "learning_rate": 0.00013253840909738945, "loss": 0.0084, "step": 430690 }, { "epoch": 1.12, "learning_rate": 0.00013253452088101797, "loss": 0.0123, "step": 430700 }, { "epoch": 1.12, "learning_rate": 0.0001325306326646465, "loss": 0.0107, "step": 430710 }, { "epoch": 1.12, "learning_rate": 0.00013252674444827505, "loss": 0.0127, "step": 430720 }, { "epoch": 1.12, "learning_rate": 0.00013252285623190356, "loss": 0.01, "step": 430730 }, { "epoch": 1.12, "learning_rate": 0.0001325189680155321, "loss": 0.0102, "step": 430740 }, { "epoch": 1.12, "learning_rate": 0.00013251507979916065, "loss": 0.0098, "step": 430750 }, { "epoch": 1.12, "learning_rate": 0.0001325111915827892, "loss": 0.01, "step": 430760 }, { "epoch": 1.12, "learning_rate": 0.0001325073033664177, "loss": 0.0105, "step": 430770 }, { "epoch": 1.12, "learning_rate": 0.00013250341515004627, "loss": 0.0103, "step": 430780 }, { "epoch": 1.12, "learning_rate": 0.0001324995269336748, "loss": 0.0099, "step": 430790 }, { "epoch": 1.12, "learning_rate": 0.00013249563871730333, "loss": 0.0148, "step": 430800 }, { "epoch": 1.12, "learning_rate": 0.00013249175050093187, "loss": 0.0131, "step": 430810 }, { "epoch": 1.12, "learning_rate": 0.0001324878622845604, "loss": 0.0128, "step": 430820 }, { "epoch": 1.12, "learning_rate": 0.00013248397406818893, "loss": 0.0101, "step": 430830 }, { "epoch": 1.12, "learning_rate": 0.00013248008585181747, "loss": 0.012, "step": 430840 }, { "epoch": 1.12, "learning_rate": 0.000132476197635446, "loss": 0.0129, "step": 430850 }, { "epoch": 1.12, "learning_rate": 0.00013247230941907455, "loss": 0.0117, "step": 430860 }, { "epoch": 1.12, "learning_rate": 0.00013246842120270307, "loss": 0.0125, "step": 430870 }, { "epoch": 1.12, "learning_rate": 0.0001324645329863316, "loss": 0.0086, "step": 430880 }, { "epoch": 1.12, "learning_rate": 0.00013246064476996015, "loss": 0.0084, "step": 430890 }, { "epoch": 1.12, "learning_rate": 0.0001324567565535887, "loss": 0.0109, "step": 430900 }, { "epoch": 1.12, "learning_rate": 0.0001324528683372172, "loss": 0.0105, "step": 430910 }, { "epoch": 1.12, "learning_rate": 0.00013244898012084575, "loss": 0.0121, "step": 430920 }, { "epoch": 1.12, "learning_rate": 0.0001324450919044743, "loss": 0.0108, "step": 430930 }, { "epoch": 1.12, "learning_rate": 0.00013244120368810283, "loss": 0.0142, "step": 430940 }, { "epoch": 1.12, "learning_rate": 0.00013243731547173137, "loss": 0.0116, "step": 430950 }, { "epoch": 1.12, "learning_rate": 0.00013243342725535991, "loss": 0.0109, "step": 430960 }, { "epoch": 1.12, "learning_rate": 0.00013242953903898843, "loss": 0.0093, "step": 430970 }, { "epoch": 1.12, "learning_rate": 0.00013242565082261697, "loss": 0.0123, "step": 430980 }, { "epoch": 1.12, "learning_rate": 0.0001324217626062455, "loss": 0.0132, "step": 430990 }, { "epoch": 1.12, "learning_rate": 0.00013241787438987403, "loss": 0.0104, "step": 431000 }, { "epoch": 1.12, "eval_cer": 0.881719481966378, "eval_loss": 0.007422698196023703, "eval_runtime": 107.6404, "eval_samples_per_second": 18.58, "eval_steps_per_second": 4.645, "step": 431000 }, { "epoch": 1.12, "learning_rate": 0.00013241398617350257, "loss": 0.0093, "step": 431010 }, { "epoch": 1.12, "learning_rate": 0.0001324100979571311, "loss": 0.0085, "step": 431020 }, { "epoch": 1.12, "learning_rate": 0.00013240620974075965, "loss": 0.0123, "step": 431030 }, { "epoch": 1.12, "learning_rate": 0.00013240232152438817, "loss": 0.0102, "step": 431040 }, { "epoch": 1.12, "learning_rate": 0.0001323984333080167, "loss": 0.0128, "step": 431050 }, { "epoch": 1.12, "learning_rate": 0.00013239454509164525, "loss": 0.0095, "step": 431060 }, { "epoch": 1.12, "learning_rate": 0.0001323906568752738, "loss": 0.0105, "step": 431070 }, { "epoch": 1.12, "learning_rate": 0.0001323867686589023, "loss": 0.0103, "step": 431080 }, { "epoch": 1.12, "learning_rate": 0.00013238288044253085, "loss": 0.0083, "step": 431090 }, { "epoch": 1.12, "learning_rate": 0.0001323789922261594, "loss": 0.0148, "step": 431100 }, { "epoch": 1.12, "learning_rate": 0.00013237510400978793, "loss": 0.0108, "step": 431110 }, { "epoch": 1.12, "learning_rate": 0.00013237121579341644, "loss": 0.0113, "step": 431120 }, { "epoch": 1.12, "learning_rate": 0.000132367327577045, "loss": 0.009, "step": 431130 }, { "epoch": 1.12, "learning_rate": 0.00013236343936067353, "loss": 0.0105, "step": 431140 }, { "epoch": 1.12, "learning_rate": 0.00013235955114430207, "loss": 0.0095, "step": 431150 }, { "epoch": 1.12, "learning_rate": 0.0001323556629279306, "loss": 0.0112, "step": 431160 }, { "epoch": 1.12, "learning_rate": 0.00013235177471155915, "loss": 0.0105, "step": 431170 }, { "epoch": 1.12, "learning_rate": 0.00013234788649518767, "loss": 0.0133, "step": 431180 }, { "epoch": 1.12, "learning_rate": 0.0001323439982788162, "loss": 0.0109, "step": 431190 }, { "epoch": 1.12, "learning_rate": 0.00013234011006244475, "loss": 0.0128, "step": 431200 }, { "epoch": 1.12, "learning_rate": 0.00013233622184607327, "loss": 0.0114, "step": 431210 }, { "epoch": 1.12, "learning_rate": 0.0001323323336297018, "loss": 0.0106, "step": 431220 }, { "epoch": 1.12, "learning_rate": 0.00013232844541333035, "loss": 0.0128, "step": 431230 }, { "epoch": 1.12, "learning_rate": 0.0001323245571969589, "loss": 0.0109, "step": 431240 }, { "epoch": 1.12, "learning_rate": 0.0001323206689805874, "loss": 0.0119, "step": 431250 }, { "epoch": 1.12, "learning_rate": 0.00013231678076421595, "loss": 0.0104, "step": 431260 }, { "epoch": 1.12, "learning_rate": 0.0001323128925478445, "loss": 0.0119, "step": 431270 }, { "epoch": 1.12, "learning_rate": 0.00013230900433147303, "loss": 0.0098, "step": 431280 }, { "epoch": 1.12, "learning_rate": 0.00013230511611510154, "loss": 0.0103, "step": 431290 }, { "epoch": 1.12, "learning_rate": 0.0001323012278987301, "loss": 0.0091, "step": 431300 }, { "epoch": 1.12, "learning_rate": 0.00013229733968235863, "loss": 0.0132, "step": 431310 }, { "epoch": 1.12, "learning_rate": 0.00013229345146598717, "loss": 0.0103, "step": 431320 }, { "epoch": 1.12, "learning_rate": 0.0001322895632496157, "loss": 0.0112, "step": 431330 }, { "epoch": 1.12, "learning_rate": 0.00013228567503324425, "loss": 0.0105, "step": 431340 }, { "epoch": 1.12, "learning_rate": 0.00013228178681687277, "loss": 0.0094, "step": 431350 }, { "epoch": 1.12, "learning_rate": 0.0001322778986005013, "loss": 0.0124, "step": 431360 }, { "epoch": 1.12, "learning_rate": 0.00013227401038412985, "loss": 0.009, "step": 431370 }, { "epoch": 1.12, "learning_rate": 0.0001322701221677584, "loss": 0.0106, "step": 431380 }, { "epoch": 1.12, "learning_rate": 0.0001322662339513869, "loss": 0.0118, "step": 431390 }, { "epoch": 1.12, "learning_rate": 0.00013226234573501545, "loss": 0.0149, "step": 431400 }, { "epoch": 1.12, "learning_rate": 0.000132258457518644, "loss": 0.0118, "step": 431410 }, { "epoch": 1.12, "learning_rate": 0.00013225456930227253, "loss": 0.0135, "step": 431420 }, { "epoch": 1.12, "learning_rate": 0.00013225068108590105, "loss": 0.0135, "step": 431430 }, { "epoch": 1.12, "learning_rate": 0.0001322467928695296, "loss": 0.0113, "step": 431440 }, { "epoch": 1.12, "learning_rate": 0.00013224290465315813, "loss": 0.0159, "step": 431450 }, { "epoch": 1.12, "learning_rate": 0.00013223901643678664, "loss": 0.0099, "step": 431460 }, { "epoch": 1.12, "learning_rate": 0.00013223512822041518, "loss": 0.0114, "step": 431470 }, { "epoch": 1.12, "learning_rate": 0.00013223124000404373, "loss": 0.0115, "step": 431480 }, { "epoch": 1.12, "learning_rate": 0.00013222735178767227, "loss": 0.0093, "step": 431490 }, { "epoch": 1.12, "learning_rate": 0.0001322234635713008, "loss": 0.0123, "step": 431500 }, { "epoch": 1.12, "learning_rate": 0.00013221957535492935, "loss": 0.0087, "step": 431510 }, { "epoch": 1.12, "learning_rate": 0.00013221568713855787, "loss": 0.0104, "step": 431520 }, { "epoch": 1.12, "learning_rate": 0.0001322117989221864, "loss": 0.0105, "step": 431530 }, { "epoch": 1.12, "learning_rate": 0.00013220791070581495, "loss": 0.0111, "step": 431540 }, { "epoch": 1.12, "learning_rate": 0.0001322040224894435, "loss": 0.0095, "step": 431550 }, { "epoch": 1.12, "learning_rate": 0.000132200134273072, "loss": 0.0118, "step": 431560 }, { "epoch": 1.12, "learning_rate": 0.00013219624605670055, "loss": 0.0107, "step": 431570 }, { "epoch": 1.12, "learning_rate": 0.0001321923578403291, "loss": 0.0117, "step": 431580 }, { "epoch": 1.12, "learning_rate": 0.00013218846962395763, "loss": 0.0118, "step": 431590 }, { "epoch": 1.12, "learning_rate": 0.00013218458140758614, "loss": 0.0117, "step": 431600 }, { "epoch": 1.12, "learning_rate": 0.0001321806931912147, "loss": 0.0094, "step": 431610 }, { "epoch": 1.12, "learning_rate": 0.00013217680497484323, "loss": 0.0097, "step": 431620 }, { "epoch": 1.12, "learning_rate": 0.00013217291675847177, "loss": 0.0112, "step": 431630 }, { "epoch": 1.12, "learning_rate": 0.00013216902854210028, "loss": 0.012, "step": 431640 }, { "epoch": 1.12, "learning_rate": 0.00013216514032572885, "loss": 0.0109, "step": 431650 }, { "epoch": 1.12, "learning_rate": 0.00013216125210935737, "loss": 0.0111, "step": 431660 }, { "epoch": 1.12, "learning_rate": 0.0001321573638929859, "loss": 0.0114, "step": 431670 }, { "epoch": 1.12, "learning_rate": 0.00013215347567661445, "loss": 0.0137, "step": 431680 }, { "epoch": 1.12, "learning_rate": 0.000132149587460243, "loss": 0.0108, "step": 431690 }, { "epoch": 1.12, "learning_rate": 0.0001321456992438715, "loss": 0.0083, "step": 431700 }, { "epoch": 1.12, "learning_rate": 0.00013214181102750005, "loss": 0.01, "step": 431710 }, { "epoch": 1.12, "learning_rate": 0.0001321379228111286, "loss": 0.0107, "step": 431720 }, { "epoch": 1.12, "learning_rate": 0.0001321340345947571, "loss": 0.0135, "step": 431730 }, { "epoch": 1.12, "learning_rate": 0.00013213014637838565, "loss": 0.012, "step": 431740 }, { "epoch": 1.12, "learning_rate": 0.0001321262581620142, "loss": 0.0097, "step": 431750 }, { "epoch": 1.12, "learning_rate": 0.00013212236994564273, "loss": 0.0113, "step": 431760 }, { "epoch": 1.12, "learning_rate": 0.00013211848172927124, "loss": 0.0121, "step": 431770 }, { "epoch": 1.12, "learning_rate": 0.00013211459351289979, "loss": 0.0108, "step": 431780 }, { "epoch": 1.12, "learning_rate": 0.00013211070529652833, "loss": 0.0104, "step": 431790 }, { "epoch": 1.12, "learning_rate": 0.00013210681708015687, "loss": 0.0099, "step": 431800 }, { "epoch": 1.12, "learning_rate": 0.00013210292886378538, "loss": 0.0083, "step": 431810 }, { "epoch": 1.12, "learning_rate": 0.00013209904064741395, "loss": 0.0097, "step": 431820 }, { "epoch": 1.12, "learning_rate": 0.00013209515243104247, "loss": 0.011, "step": 431830 }, { "epoch": 1.12, "learning_rate": 0.000132091264214671, "loss": 0.0104, "step": 431840 }, { "epoch": 1.12, "learning_rate": 0.00013208737599829955, "loss": 0.0105, "step": 431850 }, { "epoch": 1.12, "learning_rate": 0.0001320834877819281, "loss": 0.0125, "step": 431860 }, { "epoch": 1.12, "learning_rate": 0.0001320795995655566, "loss": 0.0127, "step": 431870 }, { "epoch": 1.12, "learning_rate": 0.00013207571134918515, "loss": 0.0131, "step": 431880 }, { "epoch": 1.12, "learning_rate": 0.0001320718231328137, "loss": 0.013, "step": 431890 }, { "epoch": 1.12, "learning_rate": 0.00013206793491644223, "loss": 0.0085, "step": 431900 }, { "epoch": 1.12, "learning_rate": 0.00013206404670007075, "loss": 0.0102, "step": 431910 }, { "epoch": 1.12, "learning_rate": 0.0001320601584836993, "loss": 0.0111, "step": 431920 }, { "epoch": 1.12, "learning_rate": 0.00013205627026732783, "loss": 0.0128, "step": 431930 }, { "epoch": 1.12, "learning_rate": 0.00013205238205095637, "loss": 0.0107, "step": 431940 }, { "epoch": 1.12, "learning_rate": 0.00013204849383458489, "loss": 0.0133, "step": 431950 }, { "epoch": 1.12, "learning_rate": 0.00013204460561821343, "loss": 0.0127, "step": 431960 }, { "epoch": 1.12, "learning_rate": 0.00013204071740184197, "loss": 0.0147, "step": 431970 }, { "epoch": 1.12, "learning_rate": 0.00013203682918547048, "loss": 0.0122, "step": 431980 }, { "epoch": 1.12, "learning_rate": 0.00013203294096909902, "loss": 0.0154, "step": 431990 }, { "epoch": 1.12, "learning_rate": 0.00013202905275272757, "loss": 0.0126, "step": 432000 }, { "epoch": 1.12, "eval_cer": 0.8816984874123652, "eval_loss": 0.007582567632198334, "eval_runtime": 107.5055, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 432000 }, { "epoch": 1.12, "learning_rate": 0.0001320251645363561, "loss": 0.0113, "step": 432010 }, { "epoch": 1.12, "learning_rate": 0.00013202127631998465, "loss": 0.0096, "step": 432020 }, { "epoch": 1.12, "learning_rate": 0.0001320173881036132, "loss": 0.0113, "step": 432030 }, { "epoch": 1.12, "learning_rate": 0.0001320134998872417, "loss": 0.0116, "step": 432040 }, { "epoch": 1.12, "learning_rate": 0.00013200961167087025, "loss": 0.0132, "step": 432050 }, { "epoch": 1.12, "learning_rate": 0.0001320057234544988, "loss": 0.0098, "step": 432060 }, { "epoch": 1.12, "learning_rate": 0.00013200183523812733, "loss": 0.0099, "step": 432070 }, { "epoch": 1.12, "learning_rate": 0.00013199794702175585, "loss": 0.0152, "step": 432080 }, { "epoch": 1.12, "learning_rate": 0.0001319940588053844, "loss": 0.0102, "step": 432090 }, { "epoch": 1.12, "learning_rate": 0.00013199017058901293, "loss": 0.0114, "step": 432100 }, { "epoch": 1.12, "learning_rate": 0.00013198628237264147, "loss": 0.0125, "step": 432110 }, { "epoch": 1.12, "learning_rate": 0.00013198239415626998, "loss": 0.0135, "step": 432120 }, { "epoch": 1.12, "learning_rate": 0.00013197850593989853, "loss": 0.0118, "step": 432130 }, { "epoch": 1.12, "learning_rate": 0.00013197461772352707, "loss": 0.0122, "step": 432140 }, { "epoch": 1.12, "learning_rate": 0.0001319707295071556, "loss": 0.01, "step": 432150 }, { "epoch": 1.12, "learning_rate": 0.00013196684129078412, "loss": 0.0138, "step": 432160 }, { "epoch": 1.12, "learning_rate": 0.0001319629530744127, "loss": 0.0121, "step": 432170 }, { "epoch": 1.12, "learning_rate": 0.0001319590648580412, "loss": 0.0182, "step": 432180 }, { "epoch": 1.12, "learning_rate": 0.00013195517664166975, "loss": 0.0144, "step": 432190 }, { "epoch": 1.12, "learning_rate": 0.0001319512884252983, "loss": 0.0114, "step": 432200 }, { "epoch": 1.12, "learning_rate": 0.0001319474002089268, "loss": 0.0142, "step": 432210 }, { "epoch": 1.12, "learning_rate": 0.00013194351199255535, "loss": 0.0086, "step": 432220 }, { "epoch": 1.12, "learning_rate": 0.0001319396237761839, "loss": 0.0146, "step": 432230 }, { "epoch": 1.12, "learning_rate": 0.00013193573555981243, "loss": 0.0116, "step": 432240 }, { "epoch": 1.12, "learning_rate": 0.00013193184734344094, "loss": 0.0117, "step": 432250 }, { "epoch": 1.12, "learning_rate": 0.0001319279591270695, "loss": 0.0091, "step": 432260 }, { "epoch": 1.12, "learning_rate": 0.00013192407091069803, "loss": 0.0142, "step": 432270 }, { "epoch": 1.12, "learning_rate": 0.00013192018269432657, "loss": 0.0149, "step": 432280 }, { "epoch": 1.12, "learning_rate": 0.00013191629447795508, "loss": 0.0137, "step": 432290 }, { "epoch": 1.12, "learning_rate": 0.00013191240626158363, "loss": 0.0114, "step": 432300 }, { "epoch": 1.12, "learning_rate": 0.00013190851804521217, "loss": 0.0094, "step": 432310 }, { "epoch": 1.12, "learning_rate": 0.0001319046298288407, "loss": 0.0161, "step": 432320 }, { "epoch": 1.12, "learning_rate": 0.00013190074161246922, "loss": 0.0083, "step": 432330 }, { "epoch": 1.12, "learning_rate": 0.0001318968533960978, "loss": 0.0113, "step": 432340 }, { "epoch": 1.12, "learning_rate": 0.0001318929651797263, "loss": 0.0089, "step": 432350 }, { "epoch": 1.12, "learning_rate": 0.00013188907696335485, "loss": 0.0152, "step": 432360 }, { "epoch": 1.12, "learning_rate": 0.0001318851887469834, "loss": 0.0116, "step": 432370 }, { "epoch": 1.12, "learning_rate": 0.00013188130053061193, "loss": 0.0115, "step": 432380 }, { "epoch": 1.12, "learning_rate": 0.00013187741231424045, "loss": 0.0104, "step": 432390 }, { "epoch": 1.12, "learning_rate": 0.000131873524097869, "loss": 0.0154, "step": 432400 }, { "epoch": 1.12, "learning_rate": 0.00013186963588149753, "loss": 0.0108, "step": 432410 }, { "epoch": 1.12, "learning_rate": 0.00013186574766512607, "loss": 0.0108, "step": 432420 }, { "epoch": 1.12, "learning_rate": 0.00013186185944875459, "loss": 0.014, "step": 432430 }, { "epoch": 1.12, "learning_rate": 0.00013185797123238313, "loss": 0.0097, "step": 432440 }, { "epoch": 1.12, "learning_rate": 0.00013185408301601167, "loss": 0.008, "step": 432450 }, { "epoch": 1.12, "learning_rate": 0.00013185019479964018, "loss": 0.0114, "step": 432460 }, { "epoch": 1.12, "learning_rate": 0.00013184630658326873, "loss": 0.013, "step": 432470 }, { "epoch": 1.12, "learning_rate": 0.00013184241836689727, "loss": 0.01, "step": 432480 }, { "epoch": 1.12, "learning_rate": 0.0001318385301505258, "loss": 0.0087, "step": 432490 }, { "epoch": 1.12, "learning_rate": 0.00013183464193415432, "loss": 0.011, "step": 432500 }, { "epoch": 1.12, "learning_rate": 0.00013183075371778286, "loss": 0.0102, "step": 432510 }, { "epoch": 1.12, "learning_rate": 0.0001318268655014114, "loss": 0.011, "step": 432520 }, { "epoch": 1.12, "learning_rate": 0.00013182297728503995, "loss": 0.0091, "step": 432530 }, { "epoch": 1.12, "learning_rate": 0.0001318190890686685, "loss": 0.0105, "step": 432540 }, { "epoch": 1.12, "learning_rate": 0.00013181520085229703, "loss": 0.0125, "step": 432550 }, { "epoch": 1.12, "learning_rate": 0.00013181131263592555, "loss": 0.0109, "step": 432560 }, { "epoch": 1.12, "learning_rate": 0.0001318074244195541, "loss": 0.0151, "step": 432570 }, { "epoch": 1.12, "learning_rate": 0.00013180353620318263, "loss": 0.0098, "step": 432580 }, { "epoch": 1.12, "learning_rate": 0.00013179964798681117, "loss": 0.0103, "step": 432590 }, { "epoch": 1.12, "learning_rate": 0.00013179575977043969, "loss": 0.0096, "step": 432600 }, { "epoch": 1.12, "learning_rate": 0.00013179187155406823, "loss": 0.0109, "step": 432610 }, { "epoch": 1.12, "learning_rate": 0.00013178798333769677, "loss": 0.0071, "step": 432620 }, { "epoch": 1.12, "learning_rate": 0.0001317840951213253, "loss": 0.0148, "step": 432630 }, { "epoch": 1.12, "learning_rate": 0.00013178020690495382, "loss": 0.0115, "step": 432640 }, { "epoch": 1.12, "learning_rate": 0.00013177631868858237, "loss": 0.016, "step": 432650 }, { "epoch": 1.12, "learning_rate": 0.0001317724304722109, "loss": 0.0133, "step": 432660 }, { "epoch": 1.12, "learning_rate": 0.00013176854225583945, "loss": 0.0111, "step": 432670 }, { "epoch": 1.12, "learning_rate": 0.00013176465403946796, "loss": 0.0123, "step": 432680 }, { "epoch": 1.12, "learning_rate": 0.00013176076582309653, "loss": 0.0149, "step": 432690 }, { "epoch": 1.12, "learning_rate": 0.00013175687760672505, "loss": 0.0127, "step": 432700 }, { "epoch": 1.12, "learning_rate": 0.00013175298939035356, "loss": 0.0105, "step": 432710 }, { "epoch": 1.12, "learning_rate": 0.00013174910117398213, "loss": 0.0104, "step": 432720 }, { "epoch": 1.12, "learning_rate": 0.00013174521295761065, "loss": 0.011, "step": 432730 }, { "epoch": 1.12, "learning_rate": 0.0001317413247412392, "loss": 0.0105, "step": 432740 }, { "epoch": 1.12, "learning_rate": 0.00013173743652486773, "loss": 0.0109, "step": 432750 }, { "epoch": 1.12, "learning_rate": 0.00013173354830849627, "loss": 0.0099, "step": 432760 }, { "epoch": 1.12, "learning_rate": 0.00013172966009212478, "loss": 0.0076, "step": 432770 }, { "epoch": 1.12, "learning_rate": 0.00013172577187575333, "loss": 0.0111, "step": 432780 }, { "epoch": 1.12, "learning_rate": 0.00013172188365938187, "loss": 0.0119, "step": 432790 }, { "epoch": 1.12, "learning_rate": 0.0001317179954430104, "loss": 0.0144, "step": 432800 }, { "epoch": 1.12, "learning_rate": 0.00013171410722663892, "loss": 0.011, "step": 432810 }, { "epoch": 1.12, "learning_rate": 0.00013171021901026747, "loss": 0.0094, "step": 432820 }, { "epoch": 1.12, "learning_rate": 0.000131706330793896, "loss": 0.0097, "step": 432830 }, { "epoch": 1.12, "learning_rate": 0.00013170244257752455, "loss": 0.0131, "step": 432840 }, { "epoch": 1.12, "learning_rate": 0.00013169855436115306, "loss": 0.0112, "step": 432850 }, { "epoch": 1.12, "learning_rate": 0.0001316946661447816, "loss": 0.0139, "step": 432860 }, { "epoch": 1.12, "learning_rate": 0.00013169077792841015, "loss": 0.0106, "step": 432870 }, { "epoch": 1.12, "learning_rate": 0.0001316868897120387, "loss": 0.0113, "step": 432880 }, { "epoch": 1.12, "learning_rate": 0.00013168300149566723, "loss": 0.0121, "step": 432890 }, { "epoch": 1.12, "learning_rate": 0.00013167911327929577, "loss": 0.0181, "step": 432900 }, { "epoch": 1.12, "learning_rate": 0.00013167522506292429, "loss": 0.0156, "step": 432910 }, { "epoch": 1.12, "learning_rate": 0.00013167133684655283, "loss": 0.011, "step": 432920 }, { "epoch": 1.12, "learning_rate": 0.00013166744863018137, "loss": 0.0106, "step": 432930 }, { "epoch": 1.12, "learning_rate": 0.0001316635604138099, "loss": 0.0107, "step": 432940 }, { "epoch": 1.12, "learning_rate": 0.00013165967219743843, "loss": 0.0119, "step": 432950 }, { "epoch": 1.12, "learning_rate": 0.00013165578398106697, "loss": 0.0126, "step": 432960 }, { "epoch": 1.12, "learning_rate": 0.0001316518957646955, "loss": 0.0121, "step": 432970 }, { "epoch": 1.12, "learning_rate": 0.00013164800754832402, "loss": 0.0111, "step": 432980 }, { "epoch": 1.12, "learning_rate": 0.00013164411933195257, "loss": 0.0116, "step": 432990 }, { "epoch": 1.12, "learning_rate": 0.0001316402311155811, "loss": 0.0123, "step": 433000 }, { "epoch": 1.12, "eval_cer": 0.8817138834186412, "eval_loss": 0.0072698756121098995, "eval_runtime": 107.5529, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 433000 }, { "epoch": 1.12, "learning_rate": 0.00013163634289920965, "loss": 0.0104, "step": 433010 }, { "epoch": 1.12, "learning_rate": 0.00013163245468283816, "loss": 0.0115, "step": 433020 }, { "epoch": 1.12, "learning_rate": 0.0001316285664664667, "loss": 0.0112, "step": 433030 }, { "epoch": 1.12, "learning_rate": 0.00013162467825009525, "loss": 0.012, "step": 433040 }, { "epoch": 1.12, "learning_rate": 0.0001316207900337238, "loss": 0.0158, "step": 433050 }, { "epoch": 1.12, "learning_rate": 0.0001316169018173523, "loss": 0.01, "step": 433060 }, { "epoch": 1.12, "learning_rate": 0.00013161301360098087, "loss": 0.0142, "step": 433070 }, { "epoch": 1.12, "learning_rate": 0.00013160912538460939, "loss": 0.0084, "step": 433080 }, { "epoch": 1.12, "learning_rate": 0.00013160523716823793, "loss": 0.0111, "step": 433090 }, { "epoch": 1.12, "learning_rate": 0.00013160134895186647, "loss": 0.0114, "step": 433100 }, { "epoch": 1.12, "learning_rate": 0.000131597460735495, "loss": 0.0125, "step": 433110 }, { "epoch": 1.12, "learning_rate": 0.00013159357251912353, "loss": 0.0112, "step": 433120 }, { "epoch": 1.12, "learning_rate": 0.00013158968430275207, "loss": 0.0134, "step": 433130 }, { "epoch": 1.12, "learning_rate": 0.0001315857960863806, "loss": 0.0112, "step": 433140 }, { "epoch": 1.12, "learning_rate": 0.00013158190787000915, "loss": 0.014, "step": 433150 }, { "epoch": 1.12, "learning_rate": 0.00013157801965363766, "loss": 0.01, "step": 433160 }, { "epoch": 1.12, "learning_rate": 0.0001315741314372662, "loss": 0.0109, "step": 433170 }, { "epoch": 1.12, "learning_rate": 0.00013157024322089475, "loss": 0.0117, "step": 433180 }, { "epoch": 1.12, "learning_rate": 0.0001315663550045233, "loss": 0.0147, "step": 433190 }, { "epoch": 1.12, "learning_rate": 0.0001315624667881518, "loss": 0.0109, "step": 433200 }, { "epoch": 1.12, "learning_rate": 0.00013155857857178035, "loss": 0.0097, "step": 433210 }, { "epoch": 1.12, "learning_rate": 0.0001315546903554089, "loss": 0.0141, "step": 433220 }, { "epoch": 1.12, "learning_rate": 0.0001315508021390374, "loss": 0.0117, "step": 433230 }, { "epoch": 1.12, "learning_rate": 0.00013154691392266597, "loss": 0.0148, "step": 433240 }, { "epoch": 1.12, "learning_rate": 0.00013154302570629449, "loss": 0.0102, "step": 433250 }, { "epoch": 1.12, "learning_rate": 0.00013153913748992303, "loss": 0.011, "step": 433260 }, { "epoch": 1.12, "learning_rate": 0.00013153524927355157, "loss": 0.0123, "step": 433270 }, { "epoch": 1.12, "learning_rate": 0.0001315313610571801, "loss": 0.0098, "step": 433280 }, { "epoch": 1.12, "learning_rate": 0.00013152747284080862, "loss": 0.0088, "step": 433290 }, { "epoch": 1.12, "learning_rate": 0.00013152358462443717, "loss": 0.0094, "step": 433300 }, { "epoch": 1.12, "learning_rate": 0.0001315196964080657, "loss": 0.0122, "step": 433310 }, { "epoch": 1.12, "learning_rate": 0.00013151580819169425, "loss": 0.009, "step": 433320 }, { "epoch": 1.12, "learning_rate": 0.00013151191997532276, "loss": 0.0104, "step": 433330 }, { "epoch": 1.12, "learning_rate": 0.0001315080317589513, "loss": 0.011, "step": 433340 }, { "epoch": 1.12, "learning_rate": 0.00013150414354257985, "loss": 0.0121, "step": 433350 }, { "epoch": 1.12, "learning_rate": 0.0001315002553262084, "loss": 0.0105, "step": 433360 }, { "epoch": 1.12, "learning_rate": 0.0001314963671098369, "loss": 0.0087, "step": 433370 }, { "epoch": 1.12, "learning_rate": 0.00013149247889346545, "loss": 0.0147, "step": 433380 }, { "epoch": 1.12, "learning_rate": 0.000131488590677094, "loss": 0.0138, "step": 433390 }, { "epoch": 1.12, "learning_rate": 0.00013148470246072253, "loss": 0.0132, "step": 433400 }, { "epoch": 1.12, "learning_rate": 0.00013148081424435107, "loss": 0.0113, "step": 433410 }, { "epoch": 1.12, "learning_rate": 0.0001314769260279796, "loss": 0.014, "step": 433420 }, { "epoch": 1.12, "learning_rate": 0.00013147303781160813, "loss": 0.0103, "step": 433430 }, { "epoch": 1.12, "learning_rate": 0.00013146914959523667, "loss": 0.0134, "step": 433440 }, { "epoch": 1.12, "learning_rate": 0.0001314652613788652, "loss": 0.0119, "step": 433450 }, { "epoch": 1.12, "learning_rate": 0.00013146137316249372, "loss": 0.0115, "step": 433460 }, { "epoch": 1.12, "learning_rate": 0.00013145748494612227, "loss": 0.01, "step": 433470 }, { "epoch": 1.12, "learning_rate": 0.0001314535967297508, "loss": 0.0151, "step": 433480 }, { "epoch": 1.12, "learning_rate": 0.00013144970851337935, "loss": 0.0105, "step": 433490 }, { "epoch": 1.12, "learning_rate": 0.00013144582029700786, "loss": 0.011, "step": 433500 }, { "epoch": 1.12, "learning_rate": 0.0001314419320806364, "loss": 0.0128, "step": 433510 }, { "epoch": 1.12, "learning_rate": 0.00013143804386426495, "loss": 0.0145, "step": 433520 }, { "epoch": 1.12, "learning_rate": 0.0001314341556478935, "loss": 0.0104, "step": 433530 }, { "epoch": 1.12, "learning_rate": 0.000131430267431522, "loss": 0.0128, "step": 433540 }, { "epoch": 1.12, "learning_rate": 0.00013142637921515054, "loss": 0.0097, "step": 433550 }, { "epoch": 1.12, "learning_rate": 0.00013142249099877909, "loss": 0.0111, "step": 433560 }, { "epoch": 1.12, "learning_rate": 0.00013141860278240763, "loss": 0.0113, "step": 433570 }, { "epoch": 1.12, "learning_rate": 0.00013141471456603614, "loss": 0.0092, "step": 433580 }, { "epoch": 1.12, "learning_rate": 0.0001314108263496647, "loss": 0.0106, "step": 433590 }, { "epoch": 1.12, "learning_rate": 0.00013140693813329323, "loss": 0.011, "step": 433600 }, { "epoch": 1.12, "learning_rate": 0.00013140304991692177, "loss": 0.0106, "step": 433610 }, { "epoch": 1.12, "learning_rate": 0.0001313991617005503, "loss": 0.0107, "step": 433620 }, { "epoch": 1.12, "learning_rate": 0.00013139527348417885, "loss": 0.0109, "step": 433630 }, { "epoch": 1.12, "learning_rate": 0.00013139138526780737, "loss": 0.0111, "step": 433640 }, { "epoch": 1.12, "learning_rate": 0.0001313874970514359, "loss": 0.0111, "step": 433650 }, { "epoch": 1.12, "learning_rate": 0.00013138360883506445, "loss": 0.0139, "step": 433660 }, { "epoch": 1.12, "learning_rate": 0.000131379720618693, "loss": 0.0138, "step": 433670 }, { "epoch": 1.12, "learning_rate": 0.0001313758324023215, "loss": 0.0126, "step": 433680 }, { "epoch": 1.12, "learning_rate": 0.00013137194418595005, "loss": 0.0127, "step": 433690 }, { "epoch": 1.12, "learning_rate": 0.0001313680559695786, "loss": 0.0105, "step": 433700 }, { "epoch": 1.12, "learning_rate": 0.0001313641677532071, "loss": 0.0113, "step": 433710 }, { "epoch": 1.12, "learning_rate": 0.00013136027953683564, "loss": 0.01, "step": 433720 }, { "epoch": 1.12, "learning_rate": 0.00013135639132046419, "loss": 0.0105, "step": 433730 }, { "epoch": 1.12, "learning_rate": 0.00013135250310409273, "loss": 0.0108, "step": 433740 }, { "epoch": 1.12, "learning_rate": 0.00013134861488772124, "loss": 0.0106, "step": 433750 }, { "epoch": 1.12, "learning_rate": 0.0001313447266713498, "loss": 0.0095, "step": 433760 }, { "epoch": 1.12, "learning_rate": 0.00013134083845497833, "loss": 0.0093, "step": 433770 }, { "epoch": 1.12, "learning_rate": 0.00013133695023860687, "loss": 0.0089, "step": 433780 }, { "epoch": 1.12, "learning_rate": 0.0001313330620222354, "loss": 0.0107, "step": 433790 }, { "epoch": 1.12, "learning_rate": 0.00013132917380586395, "loss": 0.0135, "step": 433800 }, { "epoch": 1.12, "learning_rate": 0.00013132528558949246, "loss": 0.0118, "step": 433810 }, { "epoch": 1.12, "learning_rate": 0.000131321397373121, "loss": 0.0094, "step": 433820 }, { "epoch": 1.12, "learning_rate": 0.00013131750915674955, "loss": 0.01, "step": 433830 }, { "epoch": 1.12, "learning_rate": 0.0001313136209403781, "loss": 0.0091, "step": 433840 }, { "epoch": 1.12, "learning_rate": 0.0001313097327240066, "loss": 0.0126, "step": 433850 }, { "epoch": 1.12, "learning_rate": 0.00013130584450763515, "loss": 0.0136, "step": 433860 }, { "epoch": 1.12, "learning_rate": 0.0001313019562912637, "loss": 0.0083, "step": 433870 }, { "epoch": 1.12, "learning_rate": 0.00013129806807489223, "loss": 0.0107, "step": 433880 }, { "epoch": 1.12, "learning_rate": 0.00013129417985852074, "loss": 0.0137, "step": 433890 }, { "epoch": 1.12, "learning_rate": 0.00013129029164214929, "loss": 0.0109, "step": 433900 }, { "epoch": 1.12, "learning_rate": 0.00013128640342577783, "loss": 0.0094, "step": 433910 }, { "epoch": 1.12, "learning_rate": 0.00013128251520940637, "loss": 0.012, "step": 433920 }, { "epoch": 1.12, "learning_rate": 0.0001312786269930349, "loss": 0.0125, "step": 433930 }, { "epoch": 1.12, "learning_rate": 0.00013127473877666342, "loss": 0.011, "step": 433940 }, { "epoch": 1.12, "learning_rate": 0.00013127085056029197, "loss": 0.0152, "step": 433950 }, { "epoch": 1.12, "learning_rate": 0.0001312669623439205, "loss": 0.0104, "step": 433960 }, { "epoch": 1.12, "learning_rate": 0.00013126307412754905, "loss": 0.0109, "step": 433970 }, { "epoch": 1.12, "learning_rate": 0.00013125918591117756, "loss": 0.0133, "step": 433980 }, { "epoch": 1.12, "learning_rate": 0.0001312552976948061, "loss": 0.0126, "step": 433990 }, { "epoch": 1.12, "learning_rate": 0.00013125140947843465, "loss": 0.0104, "step": 434000 }, { "epoch": 1.12, "eval_cer": 0.8817334783357197, "eval_loss": 0.007528600748628378, "eval_runtime": 107.4782, "eval_samples_per_second": 18.608, "eval_steps_per_second": 4.652, "step": 434000 }, { "epoch": 1.13, "learning_rate": 0.0001312475212620632, "loss": 0.0124, "step": 434010 }, { "epoch": 1.13, "learning_rate": 0.0001312436330456917, "loss": 0.0109, "step": 434020 }, { "epoch": 1.13, "learning_rate": 0.00013123974482932025, "loss": 0.0125, "step": 434030 }, { "epoch": 1.13, "learning_rate": 0.0001312358566129488, "loss": 0.0147, "step": 434040 }, { "epoch": 1.13, "learning_rate": 0.00013123196839657733, "loss": 0.014, "step": 434050 }, { "epoch": 1.13, "learning_rate": 0.00013122808018020584, "loss": 0.0158, "step": 434060 }, { "epoch": 1.13, "learning_rate": 0.00013122419196383438, "loss": 0.0117, "step": 434070 }, { "epoch": 1.13, "learning_rate": 0.00013122030374746293, "loss": 0.0135, "step": 434080 }, { "epoch": 1.13, "learning_rate": 0.00013121641553109147, "loss": 0.0116, "step": 434090 }, { "epoch": 1.13, "learning_rate": 0.00013121252731471998, "loss": 0.0102, "step": 434100 }, { "epoch": 1.13, "learning_rate": 0.00013120863909834855, "loss": 0.0103, "step": 434110 }, { "epoch": 1.13, "learning_rate": 0.00013120475088197707, "loss": 0.0127, "step": 434120 }, { "epoch": 1.13, "learning_rate": 0.0001312008626656056, "loss": 0.0122, "step": 434130 }, { "epoch": 1.13, "learning_rate": 0.00013119697444923415, "loss": 0.0131, "step": 434140 }, { "epoch": 1.13, "learning_rate": 0.0001311930862328627, "loss": 0.0094, "step": 434150 }, { "epoch": 1.13, "learning_rate": 0.0001311891980164912, "loss": 0.0115, "step": 434160 }, { "epoch": 1.13, "learning_rate": 0.00013118530980011975, "loss": 0.0125, "step": 434170 }, { "epoch": 1.13, "learning_rate": 0.0001311814215837483, "loss": 0.0123, "step": 434180 }, { "epoch": 1.13, "learning_rate": 0.0001311775333673768, "loss": 0.0129, "step": 434190 }, { "epoch": 1.13, "learning_rate": 0.00013117364515100534, "loss": 0.012, "step": 434200 }, { "epoch": 1.13, "learning_rate": 0.00013116975693463389, "loss": 0.0117, "step": 434210 }, { "epoch": 1.13, "learning_rate": 0.00013116586871826243, "loss": 0.0117, "step": 434220 }, { "epoch": 1.13, "learning_rate": 0.00013116198050189094, "loss": 0.0108, "step": 434230 }, { "epoch": 1.13, "learning_rate": 0.00013115809228551948, "loss": 0.0112, "step": 434240 }, { "epoch": 1.13, "learning_rate": 0.00013115420406914803, "loss": 0.0106, "step": 434250 }, { "epoch": 1.13, "learning_rate": 0.00013115031585277657, "loss": 0.0093, "step": 434260 }, { "epoch": 1.13, "learning_rate": 0.00013114642763640508, "loss": 0.0105, "step": 434270 }, { "epoch": 1.13, "learning_rate": 0.00013114253942003365, "loss": 0.0142, "step": 434280 }, { "epoch": 1.13, "learning_rate": 0.00013113865120366217, "loss": 0.0136, "step": 434290 }, { "epoch": 1.13, "learning_rate": 0.0001311347629872907, "loss": 0.0104, "step": 434300 }, { "epoch": 1.13, "learning_rate": 0.00013113087477091925, "loss": 0.0129, "step": 434310 }, { "epoch": 1.13, "learning_rate": 0.0001311269865545478, "loss": 0.009, "step": 434320 }, { "epoch": 1.13, "learning_rate": 0.0001311230983381763, "loss": 0.0111, "step": 434330 }, { "epoch": 1.13, "learning_rate": 0.00013111921012180485, "loss": 0.0152, "step": 434340 }, { "epoch": 1.13, "learning_rate": 0.0001311153219054334, "loss": 0.01, "step": 434350 }, { "epoch": 1.13, "learning_rate": 0.00013111143368906193, "loss": 0.0089, "step": 434360 }, { "epoch": 1.13, "learning_rate": 0.00013110754547269044, "loss": 0.0097, "step": 434370 }, { "epoch": 1.13, "learning_rate": 0.00013110365725631899, "loss": 0.0097, "step": 434380 }, { "epoch": 1.13, "learning_rate": 0.00013109976903994753, "loss": 0.013, "step": 434390 }, { "epoch": 1.13, "learning_rate": 0.00013109588082357607, "loss": 0.0118, "step": 434400 }, { "epoch": 1.13, "learning_rate": 0.00013109199260720458, "loss": 0.011, "step": 434410 }, { "epoch": 1.13, "learning_rate": 0.00013108810439083312, "loss": 0.0097, "step": 434420 }, { "epoch": 1.13, "learning_rate": 0.00013108421617446167, "loss": 0.0163, "step": 434430 }, { "epoch": 1.13, "learning_rate": 0.00013108032795809018, "loss": 0.0118, "step": 434440 }, { "epoch": 1.13, "learning_rate": 0.00013107643974171872, "loss": 0.0143, "step": 434450 }, { "epoch": 1.13, "learning_rate": 0.00013107255152534726, "loss": 0.009, "step": 434460 }, { "epoch": 1.13, "learning_rate": 0.0001310686633089758, "loss": 0.0138, "step": 434470 }, { "epoch": 1.13, "learning_rate": 0.00013106477509260435, "loss": 0.0099, "step": 434480 }, { "epoch": 1.13, "learning_rate": 0.0001310608868762329, "loss": 0.0105, "step": 434490 }, { "epoch": 1.13, "learning_rate": 0.0001310569986598614, "loss": 0.0129, "step": 434500 }, { "epoch": 1.13, "learning_rate": 0.00013105311044348995, "loss": 0.0128, "step": 434510 }, { "epoch": 1.13, "learning_rate": 0.0001310492222271185, "loss": 0.0168, "step": 434520 }, { "epoch": 1.13, "learning_rate": 0.00013104533401074703, "loss": 0.0144, "step": 434530 }, { "epoch": 1.13, "learning_rate": 0.00013104144579437554, "loss": 0.0075, "step": 434540 }, { "epoch": 1.13, "learning_rate": 0.00013103755757800408, "loss": 0.0189, "step": 434550 }, { "epoch": 1.13, "learning_rate": 0.00013103366936163263, "loss": 0.0122, "step": 434560 }, { "epoch": 1.13, "learning_rate": 0.00013102978114526117, "loss": 0.01, "step": 434570 }, { "epoch": 1.13, "learning_rate": 0.00013102589292888968, "loss": 0.0125, "step": 434580 }, { "epoch": 1.13, "learning_rate": 0.00013102200471251822, "loss": 0.0094, "step": 434590 }, { "epoch": 1.13, "learning_rate": 0.00013101811649614677, "loss": 0.0141, "step": 434600 }, { "epoch": 1.13, "learning_rate": 0.0001310142282797753, "loss": 0.0111, "step": 434610 }, { "epoch": 1.13, "learning_rate": 0.00013101034006340382, "loss": 0.0106, "step": 434620 }, { "epoch": 1.13, "learning_rate": 0.0001310064518470324, "loss": 0.0115, "step": 434630 }, { "epoch": 1.13, "learning_rate": 0.0001310025636306609, "loss": 0.0119, "step": 434640 }, { "epoch": 1.13, "learning_rate": 0.00013099867541428945, "loss": 0.0135, "step": 434650 }, { "epoch": 1.13, "learning_rate": 0.000130994787197918, "loss": 0.0132, "step": 434660 }, { "epoch": 1.13, "learning_rate": 0.00013099089898154653, "loss": 0.0118, "step": 434670 }, { "epoch": 1.13, "learning_rate": 0.00013098701076517504, "loss": 0.0115, "step": 434680 }, { "epoch": 1.13, "learning_rate": 0.0001309831225488036, "loss": 0.0095, "step": 434690 }, { "epoch": 1.13, "learning_rate": 0.00013097923433243213, "loss": 0.0135, "step": 434700 }, { "epoch": 1.13, "learning_rate": 0.00013097534611606064, "loss": 0.0116, "step": 434710 }, { "epoch": 1.13, "learning_rate": 0.00013097145789968918, "loss": 0.0111, "step": 434720 }, { "epoch": 1.13, "learning_rate": 0.00013096756968331773, "loss": 0.0104, "step": 434730 }, { "epoch": 1.13, "learning_rate": 0.00013096368146694627, "loss": 0.0103, "step": 434740 }, { "epoch": 1.13, "learning_rate": 0.00013095979325057478, "loss": 0.0094, "step": 434750 }, { "epoch": 1.13, "learning_rate": 0.00013095590503420332, "loss": 0.0107, "step": 434760 }, { "epoch": 1.13, "learning_rate": 0.00013095201681783187, "loss": 0.0087, "step": 434770 }, { "epoch": 1.13, "learning_rate": 0.0001309481286014604, "loss": 0.0136, "step": 434780 }, { "epoch": 1.13, "learning_rate": 0.00013094424038508892, "loss": 0.0113, "step": 434790 }, { "epoch": 1.13, "learning_rate": 0.0001309403521687175, "loss": 0.0123, "step": 434800 }, { "epoch": 1.13, "learning_rate": 0.000130936463952346, "loss": 0.0138, "step": 434810 }, { "epoch": 1.13, "learning_rate": 0.00013093257573597455, "loss": 0.0105, "step": 434820 }, { "epoch": 1.13, "learning_rate": 0.0001309286875196031, "loss": 0.0095, "step": 434830 }, { "epoch": 1.13, "learning_rate": 0.00013092479930323163, "loss": 0.0091, "step": 434840 }, { "epoch": 1.13, "learning_rate": 0.00013092091108686014, "loss": 0.0108, "step": 434850 }, { "epoch": 1.13, "learning_rate": 0.00013091702287048869, "loss": 0.0103, "step": 434860 }, { "epoch": 1.13, "learning_rate": 0.00013091313465411723, "loss": 0.0103, "step": 434870 }, { "epoch": 1.13, "learning_rate": 0.00013090924643774577, "loss": 0.0116, "step": 434880 }, { "epoch": 1.13, "learning_rate": 0.00013090535822137428, "loss": 0.0085, "step": 434890 }, { "epoch": 1.13, "learning_rate": 0.00013090147000500283, "loss": 0.0131, "step": 434900 }, { "epoch": 1.13, "learning_rate": 0.00013089758178863137, "loss": 0.0096, "step": 434910 }, { "epoch": 1.13, "learning_rate": 0.0001308936935722599, "loss": 0.0143, "step": 434920 }, { "epoch": 1.13, "learning_rate": 0.00013088980535588842, "loss": 0.0158, "step": 434930 }, { "epoch": 1.13, "learning_rate": 0.00013088591713951696, "loss": 0.0126, "step": 434940 }, { "epoch": 1.13, "learning_rate": 0.0001308820289231455, "loss": 0.0105, "step": 434950 }, { "epoch": 1.13, "learning_rate": 0.00013087814070677402, "loss": 0.007, "step": 434960 }, { "epoch": 1.13, "learning_rate": 0.00013087425249040256, "loss": 0.0143, "step": 434970 }, { "epoch": 1.13, "learning_rate": 0.0001308703642740311, "loss": 0.0103, "step": 434980 }, { "epoch": 1.13, "learning_rate": 0.00013086647605765965, "loss": 0.0142, "step": 434990 }, { "epoch": 1.13, "learning_rate": 0.0001308625878412882, "loss": 0.0142, "step": 435000 }, { "epoch": 1.13, "eval_cer": 0.8816928888646285, "eval_loss": 0.007556126918643713, "eval_runtime": 107.935, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.632, "step": 435000 }, { "epoch": 1.13, "learning_rate": 0.00013085869962491673, "loss": 0.0123, "step": 435010 }, { "epoch": 1.13, "learning_rate": 0.00013085481140854524, "loss": 0.0085, "step": 435020 }, { "epoch": 1.13, "learning_rate": 0.00013085092319217379, "loss": 0.014, "step": 435030 }, { "epoch": 1.13, "learning_rate": 0.00013084703497580233, "loss": 0.0111, "step": 435040 }, { "epoch": 1.13, "learning_rate": 0.00013084314675943087, "loss": 0.0114, "step": 435050 }, { "epoch": 1.13, "learning_rate": 0.00013083925854305938, "loss": 0.0089, "step": 435060 }, { "epoch": 1.13, "learning_rate": 0.00013083537032668792, "loss": 0.0106, "step": 435070 }, { "epoch": 1.13, "learning_rate": 0.00013083148211031647, "loss": 0.0092, "step": 435080 }, { "epoch": 1.13, "learning_rate": 0.000130827593893945, "loss": 0.0124, "step": 435090 }, { "epoch": 1.13, "learning_rate": 0.00013082370567757352, "loss": 0.0149, "step": 435100 }, { "epoch": 1.13, "learning_rate": 0.00013081981746120206, "loss": 0.0098, "step": 435110 }, { "epoch": 1.13, "learning_rate": 0.0001308159292448306, "loss": 0.0104, "step": 435120 }, { "epoch": 1.13, "learning_rate": 0.00013081204102845915, "loss": 0.0115, "step": 435130 }, { "epoch": 1.13, "learning_rate": 0.00013080815281208766, "loss": 0.01, "step": 435140 }, { "epoch": 1.13, "learning_rate": 0.00013080426459571623, "loss": 0.01, "step": 435150 }, { "epoch": 1.13, "learning_rate": 0.00013080037637934475, "loss": 0.0099, "step": 435160 }, { "epoch": 1.13, "learning_rate": 0.0001307964881629733, "loss": 0.0108, "step": 435170 }, { "epoch": 1.13, "learning_rate": 0.00013079259994660183, "loss": 0.0085, "step": 435180 }, { "epoch": 1.13, "learning_rate": 0.00013078871173023034, "loss": 0.0119, "step": 435190 }, { "epoch": 1.13, "learning_rate": 0.00013078482351385888, "loss": 0.0134, "step": 435200 }, { "epoch": 1.13, "learning_rate": 0.00013078093529748743, "loss": 0.0187, "step": 435210 }, { "epoch": 1.13, "learning_rate": 0.00013077704708111597, "loss": 0.0138, "step": 435220 }, { "epoch": 1.13, "learning_rate": 0.00013077315886474448, "loss": 0.012, "step": 435230 }, { "epoch": 1.13, "learning_rate": 0.00013076927064837302, "loss": 0.0239, "step": 435240 }, { "epoch": 1.13, "learning_rate": 0.00013076538243200157, "loss": 0.0131, "step": 435250 }, { "epoch": 1.13, "learning_rate": 0.0001307614942156301, "loss": 0.0108, "step": 435260 }, { "epoch": 1.13, "learning_rate": 0.00013075760599925862, "loss": 0.0128, "step": 435270 }, { "epoch": 1.13, "learning_rate": 0.00013075371778288716, "loss": 0.015, "step": 435280 }, { "epoch": 1.13, "learning_rate": 0.0001307498295665157, "loss": 0.0097, "step": 435290 }, { "epoch": 1.13, "learning_rate": 0.00013074594135014425, "loss": 0.0085, "step": 435300 }, { "epoch": 1.13, "learning_rate": 0.00013074205313377276, "loss": 0.0103, "step": 435310 }, { "epoch": 1.13, "learning_rate": 0.00013073816491740133, "loss": 0.0157, "step": 435320 }, { "epoch": 1.13, "learning_rate": 0.00013073427670102984, "loss": 0.0266, "step": 435330 }, { "epoch": 1.13, "learning_rate": 0.00013073038848465839, "loss": 0.0214, "step": 435340 }, { "epoch": 1.13, "learning_rate": 0.00013072650026828693, "loss": 0.0147, "step": 435350 }, { "epoch": 1.13, "learning_rate": 0.00013072261205191547, "loss": 0.0114, "step": 435360 }, { "epoch": 1.13, "learning_rate": 0.00013071872383554398, "loss": 0.0088, "step": 435370 }, { "epoch": 1.13, "learning_rate": 0.00013071483561917253, "loss": 0.0128, "step": 435380 }, { "epoch": 1.13, "learning_rate": 0.00013071094740280107, "loss": 0.018, "step": 435390 }, { "epoch": 1.13, "learning_rate": 0.0001307070591864296, "loss": 0.0095, "step": 435400 }, { "epoch": 1.13, "learning_rate": 0.00013070317097005812, "loss": 0.0111, "step": 435410 }, { "epoch": 1.13, "learning_rate": 0.00013069928275368667, "loss": 0.0098, "step": 435420 }, { "epoch": 1.13, "learning_rate": 0.0001306953945373152, "loss": 0.0138, "step": 435430 }, { "epoch": 1.13, "learning_rate": 0.00013069150632094372, "loss": 0.0126, "step": 435440 }, { "epoch": 1.13, "learning_rate": 0.00013068761810457226, "loss": 0.012, "step": 435450 }, { "epoch": 1.13, "learning_rate": 0.0001306837298882008, "loss": 0.0107, "step": 435460 }, { "epoch": 1.13, "learning_rate": 0.00013067984167182935, "loss": 0.0114, "step": 435470 }, { "epoch": 1.13, "learning_rate": 0.00013067595345545786, "loss": 0.0129, "step": 435480 }, { "epoch": 1.13, "learning_rate": 0.0001306720652390864, "loss": 0.0131, "step": 435490 }, { "epoch": 1.13, "learning_rate": 0.00013066817702271494, "loss": 0.0129, "step": 435500 }, { "epoch": 1.13, "learning_rate": 0.00013066428880634349, "loss": 0.0119, "step": 435510 }, { "epoch": 1.13, "learning_rate": 0.00013066040058997203, "loss": 0.0121, "step": 435520 }, { "epoch": 1.13, "learning_rate": 0.00013065651237360057, "loss": 0.0106, "step": 435530 }, { "epoch": 1.13, "learning_rate": 0.00013065262415722908, "loss": 0.0098, "step": 435540 }, { "epoch": 1.13, "learning_rate": 0.00013064873594085763, "loss": 0.0117, "step": 435550 }, { "epoch": 1.13, "learning_rate": 0.00013064484772448617, "loss": 0.0131, "step": 435560 }, { "epoch": 1.13, "learning_rate": 0.0001306409595081147, "loss": 0.0116, "step": 435570 }, { "epoch": 1.13, "learning_rate": 0.00013063707129174322, "loss": 0.0124, "step": 435580 }, { "epoch": 1.13, "learning_rate": 0.00013063318307537176, "loss": 0.0104, "step": 435590 }, { "epoch": 1.13, "learning_rate": 0.0001306292948590003, "loss": 0.0134, "step": 435600 }, { "epoch": 1.13, "learning_rate": 0.00013062540664262885, "loss": 0.0086, "step": 435610 }, { "epoch": 1.13, "learning_rate": 0.00013062151842625736, "loss": 0.0086, "step": 435620 }, { "epoch": 1.13, "learning_rate": 0.0001306176302098859, "loss": 0.0154, "step": 435630 }, { "epoch": 1.13, "learning_rate": 0.00013061374199351445, "loss": 0.0098, "step": 435640 }, { "epoch": 1.13, "learning_rate": 0.000130609853777143, "loss": 0.013, "step": 435650 }, { "epoch": 1.13, "learning_rate": 0.0001306059655607715, "loss": 0.0123, "step": 435660 }, { "epoch": 1.13, "learning_rate": 0.00013060207734440007, "loss": 0.0112, "step": 435670 }, { "epoch": 1.13, "learning_rate": 0.00013059818912802859, "loss": 0.0124, "step": 435680 }, { "epoch": 1.13, "learning_rate": 0.0001305943009116571, "loss": 0.0158, "step": 435690 }, { "epoch": 1.13, "learning_rate": 0.00013059041269528567, "loss": 0.0115, "step": 435700 }, { "epoch": 1.13, "learning_rate": 0.00013058652447891418, "loss": 0.0153, "step": 435710 }, { "epoch": 1.13, "learning_rate": 0.00013058263626254272, "loss": 0.0124, "step": 435720 }, { "epoch": 1.13, "learning_rate": 0.00013057874804617127, "loss": 0.0093, "step": 435730 }, { "epoch": 1.13, "learning_rate": 0.0001305748598297998, "loss": 0.011, "step": 435740 }, { "epoch": 1.13, "learning_rate": 0.00013057097161342832, "loss": 0.0113, "step": 435750 }, { "epoch": 1.13, "learning_rate": 0.00013056708339705686, "loss": 0.0117, "step": 435760 }, { "epoch": 1.13, "learning_rate": 0.0001305631951806854, "loss": 0.0102, "step": 435770 }, { "epoch": 1.13, "learning_rate": 0.00013055930696431395, "loss": 0.0128, "step": 435780 }, { "epoch": 1.13, "learning_rate": 0.00013055541874794246, "loss": 0.0093, "step": 435790 }, { "epoch": 1.13, "learning_rate": 0.000130551530531571, "loss": 0.0109, "step": 435800 }, { "epoch": 1.13, "learning_rate": 0.00013054764231519955, "loss": 0.0116, "step": 435810 }, { "epoch": 1.13, "learning_rate": 0.0001305437540988281, "loss": 0.0201, "step": 435820 }, { "epoch": 1.13, "learning_rate": 0.0001305398658824566, "loss": 0.0126, "step": 435830 }, { "epoch": 1.13, "learning_rate": 0.00013053597766608514, "loss": 0.0138, "step": 435840 }, { "epoch": 1.13, "learning_rate": 0.00013053208944971368, "loss": 0.0118, "step": 435850 }, { "epoch": 1.13, "learning_rate": 0.00013052820123334223, "loss": 0.0119, "step": 435860 }, { "epoch": 1.13, "learning_rate": 0.00013052431301697077, "loss": 0.0088, "step": 435870 }, { "epoch": 1.13, "learning_rate": 0.0001305204248005993, "loss": 0.0101, "step": 435880 }, { "epoch": 1.13, "learning_rate": 0.00013051653658422782, "loss": 0.0092, "step": 435890 }, { "epoch": 1.13, "learning_rate": 0.00013051264836785637, "loss": 0.0092, "step": 435900 }, { "epoch": 1.13, "learning_rate": 0.0001305087601514849, "loss": 0.0247, "step": 435910 }, { "epoch": 1.13, "learning_rate": 0.00013050487193511345, "loss": 0.0105, "step": 435920 }, { "epoch": 1.13, "learning_rate": 0.00013050098371874196, "loss": 0.0089, "step": 435930 }, { "epoch": 1.13, "learning_rate": 0.0001304970955023705, "loss": 0.0091, "step": 435940 }, { "epoch": 1.13, "learning_rate": 0.00013049320728599905, "loss": 0.0141, "step": 435950 }, { "epoch": 1.13, "learning_rate": 0.00013048931906962756, "loss": 0.0117, "step": 435960 }, { "epoch": 1.13, "learning_rate": 0.0001304854308532561, "loss": 0.0121, "step": 435970 }, { "epoch": 1.13, "learning_rate": 0.00013048154263688464, "loss": 0.0117, "step": 435980 }, { "epoch": 1.13, "learning_rate": 0.00013047765442051319, "loss": 0.0098, "step": 435990 }, { "epoch": 1.13, "learning_rate": 0.0001304737662041417, "loss": 0.0133, "step": 436000 }, { "epoch": 1.13, "eval_cer": 0.8816830914060892, "eval_loss": 0.007555661257356405, "eval_runtime": 107.5039, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 436000 }, { "epoch": 1.13, "learning_rate": 0.00013046987798777024, "loss": 0.0105, "step": 436010 }, { "epoch": 1.13, "learning_rate": 0.00013046598977139878, "loss": 0.0112, "step": 436020 }, { "epoch": 1.13, "learning_rate": 0.00013046210155502733, "loss": 0.0091, "step": 436030 }, { "epoch": 1.13, "learning_rate": 0.00013045821333865584, "loss": 0.0123, "step": 436040 }, { "epoch": 1.13, "learning_rate": 0.0001304543251222844, "loss": 0.0092, "step": 436050 }, { "epoch": 1.13, "learning_rate": 0.00013045043690591292, "loss": 0.0114, "step": 436060 }, { "epoch": 1.13, "learning_rate": 0.00013044654868954147, "loss": 0.0106, "step": 436070 }, { "epoch": 1.13, "learning_rate": 0.00013044266047317, "loss": 0.0103, "step": 436080 }, { "epoch": 1.13, "learning_rate": 0.00013043877225679855, "loss": 0.0115, "step": 436090 }, { "epoch": 1.13, "learning_rate": 0.00013043488404042706, "loss": 0.0082, "step": 436100 }, { "epoch": 1.13, "learning_rate": 0.0001304309958240556, "loss": 0.01, "step": 436110 }, { "epoch": 1.13, "learning_rate": 0.00013042710760768415, "loss": 0.0144, "step": 436120 }, { "epoch": 1.13, "learning_rate": 0.0001304232193913127, "loss": 0.0134, "step": 436130 }, { "epoch": 1.13, "learning_rate": 0.0001304193311749412, "loss": 0.0102, "step": 436140 }, { "epoch": 1.13, "learning_rate": 0.00013041544295856974, "loss": 0.0113, "step": 436150 }, { "epoch": 1.13, "learning_rate": 0.00013041155474219829, "loss": 0.009, "step": 436160 }, { "epoch": 1.13, "learning_rate": 0.00013040766652582683, "loss": 0.0119, "step": 436170 }, { "epoch": 1.13, "learning_rate": 0.00013040377830945534, "loss": 0.0096, "step": 436180 }, { "epoch": 1.13, "learning_rate": 0.00013039989009308388, "loss": 0.0156, "step": 436190 }, { "epoch": 1.13, "learning_rate": 0.00013039600187671243, "loss": 0.0111, "step": 436200 }, { "epoch": 1.13, "learning_rate": 0.00013039211366034094, "loss": 0.0132, "step": 436210 }, { "epoch": 1.13, "learning_rate": 0.0001303882254439695, "loss": 0.0107, "step": 436220 }, { "epoch": 1.13, "learning_rate": 0.00013038433722759802, "loss": 0.0095, "step": 436230 }, { "epoch": 1.13, "learning_rate": 0.00013038044901122656, "loss": 0.0117, "step": 436240 }, { "epoch": 1.13, "learning_rate": 0.0001303765607948551, "loss": 0.0095, "step": 436250 }, { "epoch": 1.13, "learning_rate": 0.00013037267257848365, "loss": 0.0146, "step": 436260 }, { "epoch": 1.13, "learning_rate": 0.00013036878436211216, "loss": 0.0114, "step": 436270 }, { "epoch": 1.13, "learning_rate": 0.0001303648961457407, "loss": 0.0121, "step": 436280 }, { "epoch": 1.13, "learning_rate": 0.00013036100792936925, "loss": 0.0109, "step": 436290 }, { "epoch": 1.13, "learning_rate": 0.0001303571197129978, "loss": 0.0143, "step": 436300 }, { "epoch": 1.13, "learning_rate": 0.0001303532314966263, "loss": 0.0101, "step": 436310 }, { "epoch": 1.13, "learning_rate": 0.00013034934328025484, "loss": 0.0122, "step": 436320 }, { "epoch": 1.13, "learning_rate": 0.00013034545506388339, "loss": 0.011, "step": 436330 }, { "epoch": 1.13, "learning_rate": 0.00013034156684751193, "loss": 0.0088, "step": 436340 }, { "epoch": 1.13, "learning_rate": 0.00013033767863114044, "loss": 0.015, "step": 436350 }, { "epoch": 1.13, "learning_rate": 0.00013033379041476898, "loss": 0.0115, "step": 436360 }, { "epoch": 1.13, "learning_rate": 0.00013032990219839752, "loss": 0.0121, "step": 436370 }, { "epoch": 1.13, "learning_rate": 0.00013032601398202607, "loss": 0.014, "step": 436380 }, { "epoch": 1.13, "learning_rate": 0.0001303221257656546, "loss": 0.0133, "step": 436390 }, { "epoch": 1.13, "learning_rate": 0.00013031823754928315, "loss": 0.0103, "step": 436400 }, { "epoch": 1.13, "learning_rate": 0.00013031434933291166, "loss": 0.0095, "step": 436410 }, { "epoch": 1.13, "learning_rate": 0.0001303104611165402, "loss": 0.0108, "step": 436420 }, { "epoch": 1.13, "learning_rate": 0.00013030657290016875, "loss": 0.0091, "step": 436430 }, { "epoch": 1.13, "learning_rate": 0.00013030268468379726, "loss": 0.01, "step": 436440 }, { "epoch": 1.13, "learning_rate": 0.0001302987964674258, "loss": 0.0111, "step": 436450 }, { "epoch": 1.13, "learning_rate": 0.00013029490825105435, "loss": 0.0132, "step": 436460 }, { "epoch": 1.13, "learning_rate": 0.0001302910200346829, "loss": 0.0146, "step": 436470 }, { "epoch": 1.13, "learning_rate": 0.0001302871318183114, "loss": 0.0099, "step": 436480 }, { "epoch": 1.13, "learning_rate": 0.00013028324360193994, "loss": 0.0113, "step": 436490 }, { "epoch": 1.13, "learning_rate": 0.00013027935538556848, "loss": 0.0113, "step": 436500 }, { "epoch": 1.13, "learning_rate": 0.00013027546716919703, "loss": 0.025, "step": 436510 }, { "epoch": 1.13, "learning_rate": 0.00013027157895282554, "loss": 0.0114, "step": 436520 }, { "epoch": 1.13, "learning_rate": 0.00013026769073645408, "loss": 0.0107, "step": 436530 }, { "epoch": 1.13, "learning_rate": 0.00013026380252008262, "loss": 0.0093, "step": 436540 }, { "epoch": 1.13, "learning_rate": 0.00013025991430371117, "loss": 0.0113, "step": 436550 }, { "epoch": 1.13, "learning_rate": 0.00013025602608733968, "loss": 0.013, "step": 436560 }, { "epoch": 1.13, "learning_rate": 0.00013025213787096825, "loss": 0.0129, "step": 436570 }, { "epoch": 1.13, "learning_rate": 0.00013024824965459676, "loss": 0.0074, "step": 436580 }, { "epoch": 1.13, "learning_rate": 0.0001302443614382253, "loss": 0.016, "step": 436590 }, { "epoch": 1.13, "learning_rate": 0.00013024047322185385, "loss": 0.0109, "step": 436600 }, { "epoch": 1.13, "learning_rate": 0.0001302365850054824, "loss": 0.0151, "step": 436610 }, { "epoch": 1.13, "learning_rate": 0.0001302326967891109, "loss": 0.0119, "step": 436620 }, { "epoch": 1.13, "learning_rate": 0.00013022880857273944, "loss": 0.0101, "step": 436630 }, { "epoch": 1.13, "learning_rate": 0.00013022492035636799, "loss": 0.0126, "step": 436640 }, { "epoch": 1.13, "learning_rate": 0.00013022103213999653, "loss": 0.0124, "step": 436650 }, { "epoch": 1.13, "learning_rate": 0.00013021714392362504, "loss": 0.0105, "step": 436660 }, { "epoch": 1.13, "learning_rate": 0.00013021325570725358, "loss": 0.0103, "step": 436670 }, { "epoch": 1.13, "learning_rate": 0.00013020936749088213, "loss": 0.0115, "step": 436680 }, { "epoch": 1.13, "learning_rate": 0.00013020547927451064, "loss": 0.014, "step": 436690 }, { "epoch": 1.13, "learning_rate": 0.00013020159105813918, "loss": 0.0138, "step": 436700 }, { "epoch": 1.13, "learning_rate": 0.00013019770284176772, "loss": 0.0305, "step": 436710 }, { "epoch": 1.13, "learning_rate": 0.00013019381462539627, "loss": 0.0112, "step": 436720 }, { "epoch": 1.13, "learning_rate": 0.00013018992640902478, "loss": 0.0117, "step": 436730 }, { "epoch": 1.13, "learning_rate": 0.00013018603819265335, "loss": 0.011, "step": 436740 }, { "epoch": 1.13, "learning_rate": 0.00013018214997628186, "loss": 0.0111, "step": 436750 }, { "epoch": 1.13, "learning_rate": 0.0001301782617599104, "loss": 0.0097, "step": 436760 }, { "epoch": 1.13, "learning_rate": 0.00013017437354353895, "loss": 0.0162, "step": 436770 }, { "epoch": 1.13, "learning_rate": 0.0001301704853271675, "loss": 0.0117, "step": 436780 }, { "epoch": 1.13, "learning_rate": 0.000130166597110796, "loss": 0.0116, "step": 436790 }, { "epoch": 1.13, "learning_rate": 0.00013016270889442454, "loss": 0.0094, "step": 436800 }, { "epoch": 1.13, "learning_rate": 0.00013015882067805309, "loss": 0.0096, "step": 436810 }, { "epoch": 1.13, "learning_rate": 0.00013015493246168163, "loss": 0.0092, "step": 436820 }, { "epoch": 1.13, "learning_rate": 0.00013015104424531014, "loss": 0.0098, "step": 436830 }, { "epoch": 1.13, "learning_rate": 0.00013014715602893868, "loss": 0.0107, "step": 436840 }, { "epoch": 1.13, "learning_rate": 0.00013014326781256723, "loss": 0.0103, "step": 436850 }, { "epoch": 1.13, "learning_rate": 0.00013013937959619577, "loss": 0.0092, "step": 436860 }, { "epoch": 1.13, "learning_rate": 0.00013013549137982428, "loss": 0.0124, "step": 436870 }, { "epoch": 1.13, "learning_rate": 0.00013013160316345282, "loss": 0.0113, "step": 436880 }, { "epoch": 1.13, "learning_rate": 0.00013012771494708136, "loss": 0.0114, "step": 436890 }, { "epoch": 1.13, "learning_rate": 0.0001301238267307099, "loss": 0.0112, "step": 436900 }, { "epoch": 1.13, "learning_rate": 0.00013011993851433845, "loss": 0.0175, "step": 436910 }, { "epoch": 1.13, "learning_rate": 0.00013011605029796696, "loss": 0.0118, "step": 436920 }, { "epoch": 1.13, "learning_rate": 0.0001301121620815955, "loss": 0.0118, "step": 436930 }, { "epoch": 1.13, "learning_rate": 0.00013010827386522405, "loss": 0.0128, "step": 436940 }, { "epoch": 1.13, "learning_rate": 0.0001301043856488526, "loss": 0.0083, "step": 436950 }, { "epoch": 1.13, "learning_rate": 0.0001301004974324811, "loss": 0.0137, "step": 436960 }, { "epoch": 1.13, "learning_rate": 0.00013009660921610964, "loss": 0.0101, "step": 436970 }, { "epoch": 1.13, "learning_rate": 0.00013009272099973819, "loss": 0.0151, "step": 436980 }, { "epoch": 1.13, "learning_rate": 0.00013008883278336673, "loss": 0.0092, "step": 436990 }, { "epoch": 1.13, "learning_rate": 0.00013008494456699524, "loss": 0.0111, "step": 437000 }, { "epoch": 1.13, "eval_cer": 0.8817096845078387, "eval_loss": 0.007372898980975151, "eval_runtime": 107.4604, "eval_samples_per_second": 18.612, "eval_steps_per_second": 4.653, "step": 437000 }, { "epoch": 1.13, "learning_rate": 0.00013008105635062378, "loss": 0.0105, "step": 437010 }, { "epoch": 1.13, "learning_rate": 0.00013007716813425232, "loss": 0.0099, "step": 437020 }, { "epoch": 1.13, "learning_rate": 0.00013007327991788087, "loss": 0.0135, "step": 437030 }, { "epoch": 1.13, "learning_rate": 0.00013006939170150938, "loss": 0.0106, "step": 437040 }, { "epoch": 1.13, "learning_rate": 0.00013006550348513792, "loss": 0.0103, "step": 437050 }, { "epoch": 1.13, "learning_rate": 0.00013006161526876646, "loss": 0.0108, "step": 437060 }, { "epoch": 1.13, "learning_rate": 0.000130057727052395, "loss": 0.0107, "step": 437070 }, { "epoch": 1.13, "learning_rate": 0.00013005383883602352, "loss": 0.0159, "step": 437080 }, { "epoch": 1.13, "learning_rate": 0.0001300499506196521, "loss": 0.0108, "step": 437090 }, { "epoch": 1.13, "learning_rate": 0.0001300460624032806, "loss": 0.0128, "step": 437100 }, { "epoch": 1.13, "learning_rate": 0.00013004217418690915, "loss": 0.0092, "step": 437110 }, { "epoch": 1.13, "learning_rate": 0.0001300382859705377, "loss": 0.0106, "step": 437120 }, { "epoch": 1.13, "learning_rate": 0.00013003439775416623, "loss": 0.0124, "step": 437130 }, { "epoch": 1.13, "learning_rate": 0.00013003050953779474, "loss": 0.0121, "step": 437140 }, { "epoch": 1.13, "learning_rate": 0.00013002662132142328, "loss": 0.0115, "step": 437150 }, { "epoch": 1.13, "learning_rate": 0.00013002273310505183, "loss": 0.0091, "step": 437160 }, { "epoch": 1.13, "learning_rate": 0.00013001884488868034, "loss": 0.0091, "step": 437170 }, { "epoch": 1.13, "learning_rate": 0.00013001495667230888, "loss": 0.0107, "step": 437180 }, { "epoch": 1.13, "learning_rate": 0.00013001106845593742, "loss": 0.0112, "step": 437190 }, { "epoch": 1.13, "learning_rate": 0.00013000718023956597, "loss": 0.0155, "step": 437200 }, { "epoch": 1.13, "learning_rate": 0.00013000329202319448, "loss": 0.0108, "step": 437210 }, { "epoch": 1.13, "learning_rate": 0.00012999940380682302, "loss": 0.0127, "step": 437220 }, { "epoch": 1.13, "learning_rate": 0.00012999551559045156, "loss": 0.0095, "step": 437230 }, { "epoch": 1.13, "learning_rate": 0.0001299916273740801, "loss": 0.0117, "step": 437240 }, { "epoch": 1.13, "learning_rate": 0.00012998773915770862, "loss": 0.0114, "step": 437250 }, { "epoch": 1.13, "learning_rate": 0.0001299838509413372, "loss": 0.0098, "step": 437260 }, { "epoch": 1.13, "learning_rate": 0.0001299799627249657, "loss": 0.0116, "step": 437270 }, { "epoch": 1.13, "learning_rate": 0.00012997607450859424, "loss": 0.0145, "step": 437280 }, { "epoch": 1.13, "learning_rate": 0.00012997218629222279, "loss": 0.01, "step": 437290 }, { "epoch": 1.13, "learning_rate": 0.00012996829807585133, "loss": 0.0097, "step": 437300 }, { "epoch": 1.13, "learning_rate": 0.00012996440985947984, "loss": 0.009, "step": 437310 }, { "epoch": 1.13, "learning_rate": 0.00012996052164310838, "loss": 0.0123, "step": 437320 }, { "epoch": 1.13, "learning_rate": 0.00012995663342673693, "loss": 0.0117, "step": 437330 }, { "epoch": 1.13, "learning_rate": 0.00012995274521036547, "loss": 0.0095, "step": 437340 }, { "epoch": 1.13, "learning_rate": 0.00012994885699399398, "loss": 0.0092, "step": 437350 }, { "epoch": 1.13, "learning_rate": 0.00012994496877762252, "loss": 0.0128, "step": 437360 }, { "epoch": 1.13, "learning_rate": 0.00012994108056125106, "loss": 0.01, "step": 437370 }, { "epoch": 1.13, "learning_rate": 0.0001299371923448796, "loss": 0.0095, "step": 437380 }, { "epoch": 1.13, "learning_rate": 0.00012993330412850812, "loss": 0.0117, "step": 437390 }, { "epoch": 1.13, "learning_rate": 0.00012992941591213666, "loss": 0.0088, "step": 437400 }, { "epoch": 1.13, "learning_rate": 0.0001299255276957652, "loss": 0.0097, "step": 437410 }, { "epoch": 1.13, "learning_rate": 0.00012992163947939372, "loss": 0.0111, "step": 437420 }, { "epoch": 1.13, "learning_rate": 0.00012991775126302226, "loss": 0.0086, "step": 437430 }, { "epoch": 1.13, "learning_rate": 0.0001299138630466508, "loss": 0.008, "step": 437440 }, { "epoch": 1.13, "learning_rate": 0.00012990997483027934, "loss": 0.0089, "step": 437450 }, { "epoch": 1.13, "learning_rate": 0.00012990608661390789, "loss": 0.0084, "step": 437460 }, { "epoch": 1.13, "learning_rate": 0.00012990219839753643, "loss": 0.0134, "step": 437470 }, { "epoch": 1.13, "learning_rate": 0.00012989831018116494, "loss": 0.0092, "step": 437480 }, { "epoch": 1.13, "learning_rate": 0.00012989442196479348, "loss": 0.0119, "step": 437490 }, { "epoch": 1.13, "learning_rate": 0.00012989053374842202, "loss": 0.0132, "step": 437500 }, { "epoch": 1.13, "learning_rate": 0.00012988664553205057, "loss": 0.0121, "step": 437510 }, { "epoch": 1.13, "learning_rate": 0.00012988275731567908, "loss": 0.0096, "step": 437520 }, { "epoch": 1.13, "learning_rate": 0.00012987886909930762, "loss": 0.01, "step": 437530 }, { "epoch": 1.13, "learning_rate": 0.00012987498088293616, "loss": 0.0111, "step": 437540 }, { "epoch": 1.13, "learning_rate": 0.0001298710926665647, "loss": 0.0105, "step": 437550 }, { "epoch": 1.13, "learning_rate": 0.00012986720445019322, "loss": 0.0276, "step": 437560 }, { "epoch": 1.13, "learning_rate": 0.00012986331623382176, "loss": 0.0106, "step": 437570 }, { "epoch": 1.13, "learning_rate": 0.0001298594280174503, "loss": 0.0104, "step": 437580 }, { "epoch": 1.13, "learning_rate": 0.00012985553980107885, "loss": 0.0125, "step": 437590 }, { "epoch": 1.13, "learning_rate": 0.00012985165158470736, "loss": 0.0111, "step": 437600 }, { "epoch": 1.13, "learning_rate": 0.00012984776336833593, "loss": 0.011, "step": 437610 }, { "epoch": 1.13, "learning_rate": 0.00012984387515196444, "loss": 0.0089, "step": 437620 }, { "epoch": 1.13, "learning_rate": 0.00012983998693559298, "loss": 0.0104, "step": 437630 }, { "epoch": 1.13, "learning_rate": 0.00012983609871922153, "loss": 0.0118, "step": 437640 }, { "epoch": 1.13, "learning_rate": 0.00012983221050285007, "loss": 0.0108, "step": 437650 }, { "epoch": 1.13, "learning_rate": 0.00012982832228647858, "loss": 0.0085, "step": 437660 }, { "epoch": 1.13, "learning_rate": 0.00012982443407010712, "loss": 0.0126, "step": 437670 }, { "epoch": 1.13, "learning_rate": 0.00012982054585373567, "loss": 0.0119, "step": 437680 }, { "epoch": 1.13, "learning_rate": 0.00012981665763736418, "loss": 0.0092, "step": 437690 }, { "epoch": 1.13, "learning_rate": 0.00012981276942099272, "loss": 0.0135, "step": 437700 }, { "epoch": 1.13, "learning_rate": 0.00012980888120462126, "loss": 0.0084, "step": 437710 }, { "epoch": 1.13, "learning_rate": 0.0001298049929882498, "loss": 0.0108, "step": 437720 }, { "epoch": 1.13, "learning_rate": 0.00012980110477187832, "loss": 0.0156, "step": 437730 }, { "epoch": 1.13, "learning_rate": 0.00012979721655550686, "loss": 0.0116, "step": 437740 }, { "epoch": 1.13, "learning_rate": 0.0001297933283391354, "loss": 0.0109, "step": 437750 }, { "epoch": 1.13, "learning_rate": 0.00012978944012276394, "loss": 0.0092, "step": 437760 }, { "epoch": 1.13, "learning_rate": 0.00012978555190639246, "loss": 0.0141, "step": 437770 }, { "epoch": 1.13, "learning_rate": 0.00012978166369002103, "loss": 0.0112, "step": 437780 }, { "epoch": 1.13, "learning_rate": 0.00012977777547364954, "loss": 0.0106, "step": 437790 }, { "epoch": 1.13, "learning_rate": 0.00012977388725727808, "loss": 0.0129, "step": 437800 }, { "epoch": 1.13, "learning_rate": 0.00012976999904090663, "loss": 0.0097, "step": 437810 }, { "epoch": 1.13, "learning_rate": 0.00012976611082453517, "loss": 0.0109, "step": 437820 }, { "epoch": 1.13, "learning_rate": 0.00012976222260816368, "loss": 0.0119, "step": 437830 }, { "epoch": 1.13, "learning_rate": 0.00012975833439179222, "loss": 0.0114, "step": 437840 }, { "epoch": 1.13, "learning_rate": 0.00012975444617542077, "loss": 0.0107, "step": 437850 }, { "epoch": 1.13, "learning_rate": 0.0001297505579590493, "loss": 0.0133, "step": 437860 }, { "epoch": 1.14, "learning_rate": 0.00012974666974267782, "loss": 0.0146, "step": 437870 }, { "epoch": 1.14, "learning_rate": 0.00012974278152630636, "loss": 0.0092, "step": 437880 }, { "epoch": 1.14, "learning_rate": 0.0001297388933099349, "loss": 0.0099, "step": 437890 }, { "epoch": 1.14, "learning_rate": 0.00012973500509356345, "loss": 0.0124, "step": 437900 }, { "epoch": 1.14, "learning_rate": 0.00012973111687719196, "loss": 0.01, "step": 437910 }, { "epoch": 1.14, "learning_rate": 0.0001297272286608205, "loss": 0.0102, "step": 437920 }, { "epoch": 1.14, "learning_rate": 0.00012972334044444904, "loss": 0.0119, "step": 437930 }, { "epoch": 1.14, "learning_rate": 0.00012971945222807756, "loss": 0.0116, "step": 437940 }, { "epoch": 1.14, "learning_rate": 0.0001297155640117061, "loss": 0.0102, "step": 437950 }, { "epoch": 1.14, "learning_rate": 0.00012971167579533464, "loss": 0.0133, "step": 437960 }, { "epoch": 1.14, "learning_rate": 0.00012970778757896318, "loss": 0.0099, "step": 437970 }, { "epoch": 1.14, "learning_rate": 0.00012970389936259173, "loss": 0.0105, "step": 437980 }, { "epoch": 1.14, "learning_rate": 0.00012970001114622027, "loss": 0.0137, "step": 437990 }, { "epoch": 1.14, "learning_rate": 0.00012969612292984878, "loss": 0.0114, "step": 438000 }, { "epoch": 1.14, "eval_cer": 0.8816746935844841, "eval_loss": 0.007308073341846466, "eval_runtime": 107.3816, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 438000 }, { "epoch": 1.14, "learning_rate": 0.00012969223471347732, "loss": 0.0099, "step": 438010 }, { "epoch": 1.14, "learning_rate": 0.00012968834649710586, "loss": 0.0121, "step": 438020 }, { "epoch": 1.14, "learning_rate": 0.0001296844582807344, "loss": 0.0094, "step": 438030 }, { "epoch": 1.14, "learning_rate": 0.00012968057006436292, "loss": 0.0107, "step": 438040 }, { "epoch": 1.14, "learning_rate": 0.00012967668184799146, "loss": 0.0106, "step": 438050 }, { "epoch": 1.14, "learning_rate": 0.00012967279363162, "loss": 0.0119, "step": 438060 }, { "epoch": 1.14, "learning_rate": 0.00012966890541524855, "loss": 0.0148, "step": 438070 }, { "epoch": 1.14, "learning_rate": 0.00012966501719887706, "loss": 0.0123, "step": 438080 }, { "epoch": 1.14, "learning_rate": 0.0001296611289825056, "loss": 0.0105, "step": 438090 }, { "epoch": 1.14, "learning_rate": 0.00012965724076613414, "loss": 0.01, "step": 438100 }, { "epoch": 1.14, "learning_rate": 0.00012965335254976269, "loss": 0.0088, "step": 438110 }, { "epoch": 1.14, "learning_rate": 0.0001296494643333912, "loss": 0.0266, "step": 438120 }, { "epoch": 1.14, "learning_rate": 0.00012964557611701977, "loss": 0.0132, "step": 438130 }, { "epoch": 1.14, "learning_rate": 0.00012964168790064828, "loss": 0.0119, "step": 438140 }, { "epoch": 1.14, "learning_rate": 0.00012963779968427682, "loss": 0.009, "step": 438150 }, { "epoch": 1.14, "learning_rate": 0.00012963391146790537, "loss": 0.0111, "step": 438160 }, { "epoch": 1.14, "learning_rate": 0.00012963002325153388, "loss": 0.0114, "step": 438170 }, { "epoch": 1.14, "learning_rate": 0.00012962613503516242, "loss": 0.013, "step": 438180 }, { "epoch": 1.14, "learning_rate": 0.00012962224681879096, "loss": 0.0118, "step": 438190 }, { "epoch": 1.14, "learning_rate": 0.0001296183586024195, "loss": 0.0108, "step": 438200 }, { "epoch": 1.14, "learning_rate": 0.00012961447038604802, "loss": 0.0191, "step": 438210 }, { "epoch": 1.14, "learning_rate": 0.00012961058216967656, "loss": 0.0124, "step": 438220 }, { "epoch": 1.14, "learning_rate": 0.0001296066939533051, "loss": 0.0107, "step": 438230 }, { "epoch": 1.14, "learning_rate": 0.00012960280573693365, "loss": 0.0139, "step": 438240 }, { "epoch": 1.14, "learning_rate": 0.00012959891752056216, "loss": 0.0098, "step": 438250 }, { "epoch": 1.14, "learning_rate": 0.0001295950293041907, "loss": 0.0108, "step": 438260 }, { "epoch": 1.14, "learning_rate": 0.00012959114108781924, "loss": 0.0091, "step": 438270 }, { "epoch": 1.14, "learning_rate": 0.00012958725287144778, "loss": 0.0093, "step": 438280 }, { "epoch": 1.14, "learning_rate": 0.0001295833646550763, "loss": 0.0116, "step": 438290 }, { "epoch": 1.14, "learning_rate": 0.00012957947643870484, "loss": 0.0089, "step": 438300 }, { "epoch": 1.14, "learning_rate": 0.00012957558822233338, "loss": 0.0093, "step": 438310 }, { "epoch": 1.14, "learning_rate": 0.00012957170000596192, "loss": 0.0146, "step": 438320 }, { "epoch": 1.14, "learning_rate": 0.00012956781178959047, "loss": 0.0116, "step": 438330 }, { "epoch": 1.14, "learning_rate": 0.000129563923573219, "loss": 0.0116, "step": 438340 }, { "epoch": 1.14, "learning_rate": 0.00012956003535684752, "loss": 0.0093, "step": 438350 }, { "epoch": 1.14, "learning_rate": 0.00012955614714047606, "loss": 0.0109, "step": 438360 }, { "epoch": 1.14, "learning_rate": 0.0001295522589241046, "loss": 0.0102, "step": 438370 }, { "epoch": 1.14, "learning_rate": 0.00012954837070773315, "loss": 0.0113, "step": 438380 }, { "epoch": 1.14, "learning_rate": 0.00012954448249136166, "loss": 0.0091, "step": 438390 }, { "epoch": 1.14, "learning_rate": 0.0001295405942749902, "loss": 0.0098, "step": 438400 }, { "epoch": 1.14, "learning_rate": 0.00012953670605861874, "loss": 0.0112, "step": 438410 }, { "epoch": 1.14, "learning_rate": 0.00012953281784224726, "loss": 0.0102, "step": 438420 }, { "epoch": 1.14, "learning_rate": 0.0001295289296258758, "loss": 0.0118, "step": 438430 }, { "epoch": 1.14, "learning_rate": 0.00012952504140950434, "loss": 0.0117, "step": 438440 }, { "epoch": 1.14, "learning_rate": 0.00012952115319313288, "loss": 0.0121, "step": 438450 }, { "epoch": 1.14, "learning_rate": 0.0001295172649767614, "loss": 0.01, "step": 438460 }, { "epoch": 1.14, "learning_rate": 0.00012951337676038994, "loss": 0.0162, "step": 438470 }, { "epoch": 1.14, "learning_rate": 0.00012950948854401848, "loss": 0.0125, "step": 438480 }, { "epoch": 1.14, "learning_rate": 0.00012950560032764702, "loss": 0.0135, "step": 438490 }, { "epoch": 1.14, "learning_rate": 0.00012950171211127557, "loss": 0.0098, "step": 438500 }, { "epoch": 1.14, "learning_rate": 0.0001294978238949041, "loss": 0.01, "step": 438510 }, { "epoch": 1.14, "learning_rate": 0.00012949393567853262, "loss": 0.0102, "step": 438520 }, { "epoch": 1.14, "learning_rate": 0.00012949004746216116, "loss": 0.0112, "step": 438530 }, { "epoch": 1.14, "learning_rate": 0.0001294861592457897, "loss": 0.011, "step": 438540 }, { "epoch": 1.14, "learning_rate": 0.00012948227102941825, "loss": 0.0104, "step": 438550 }, { "epoch": 1.14, "learning_rate": 0.00012947838281304676, "loss": 0.0108, "step": 438560 }, { "epoch": 1.14, "learning_rate": 0.0001294744945966753, "loss": 0.0108, "step": 438570 }, { "epoch": 1.14, "learning_rate": 0.00012947060638030384, "loss": 0.0131, "step": 438580 }, { "epoch": 1.14, "learning_rate": 0.00012946671816393239, "loss": 0.01, "step": 438590 }, { "epoch": 1.14, "learning_rate": 0.0001294628299475609, "loss": 0.0114, "step": 438600 }, { "epoch": 1.14, "learning_rate": 0.00012945894173118944, "loss": 0.0091, "step": 438610 }, { "epoch": 1.14, "learning_rate": 0.00012945505351481798, "loss": 0.0109, "step": 438620 }, { "epoch": 1.14, "learning_rate": 0.00012945116529844653, "loss": 0.0115, "step": 438630 }, { "epoch": 1.14, "learning_rate": 0.00012944727708207504, "loss": 0.0128, "step": 438640 }, { "epoch": 1.14, "learning_rate": 0.0001294433888657036, "loss": 0.0123, "step": 438650 }, { "epoch": 1.14, "learning_rate": 0.00012943950064933212, "loss": 0.0121, "step": 438660 }, { "epoch": 1.14, "learning_rate": 0.00012943561243296064, "loss": 0.0113, "step": 438670 }, { "epoch": 1.14, "learning_rate": 0.0001294317242165892, "loss": 0.0108, "step": 438680 }, { "epoch": 1.14, "learning_rate": 0.00012942783600021772, "loss": 0.0161, "step": 438690 }, { "epoch": 1.14, "learning_rate": 0.00012942394778384626, "loss": 0.0114, "step": 438700 }, { "epoch": 1.14, "learning_rate": 0.0001294200595674748, "loss": 0.0133, "step": 438710 }, { "epoch": 1.14, "learning_rate": 0.00012941617135110335, "loss": 0.017, "step": 438720 }, { "epoch": 1.14, "learning_rate": 0.00012941228313473186, "loss": 0.0101, "step": 438730 }, { "epoch": 1.14, "learning_rate": 0.0001294083949183604, "loss": 0.0112, "step": 438740 }, { "epoch": 1.14, "learning_rate": 0.00012940450670198894, "loss": 0.0095, "step": 438750 }, { "epoch": 1.14, "learning_rate": 0.00012940061848561749, "loss": 0.0117, "step": 438760 }, { "epoch": 1.14, "learning_rate": 0.000129396730269246, "loss": 0.0089, "step": 438770 }, { "epoch": 1.14, "learning_rate": 0.00012939284205287454, "loss": 0.013, "step": 438780 }, { "epoch": 1.14, "learning_rate": 0.00012938895383650308, "loss": 0.0105, "step": 438790 }, { "epoch": 1.14, "learning_rate": 0.00012938506562013162, "loss": 0.0091, "step": 438800 }, { "epoch": 1.14, "learning_rate": 0.00012938117740376014, "loss": 0.0086, "step": 438810 }, { "epoch": 1.14, "learning_rate": 0.00012937728918738868, "loss": 0.0084, "step": 438820 }, { "epoch": 1.14, "learning_rate": 0.00012937340097101722, "loss": 0.0111, "step": 438830 }, { "epoch": 1.14, "learning_rate": 0.00012936951275464576, "loss": 0.0109, "step": 438840 }, { "epoch": 1.14, "learning_rate": 0.0001293656245382743, "loss": 0.0079, "step": 438850 }, { "epoch": 1.14, "learning_rate": 0.00012936173632190285, "loss": 0.013, "step": 438860 }, { "epoch": 1.14, "learning_rate": 0.00012935784810553136, "loss": 0.0115, "step": 438870 }, { "epoch": 1.14, "learning_rate": 0.0001293539598891599, "loss": 0.0139, "step": 438880 }, { "epoch": 1.14, "learning_rate": 0.00012935007167278845, "loss": 0.0094, "step": 438890 }, { "epoch": 1.14, "learning_rate": 0.000129346183456417, "loss": 0.0093, "step": 438900 }, { "epoch": 1.14, "learning_rate": 0.0001293422952400455, "loss": 0.0121, "step": 438910 }, { "epoch": 1.14, "learning_rate": 0.00012933840702367404, "loss": 0.0126, "step": 438920 }, { "epoch": 1.14, "learning_rate": 0.00012933451880730258, "loss": 0.0105, "step": 438930 }, { "epoch": 1.14, "learning_rate": 0.0001293306305909311, "loss": 0.0116, "step": 438940 }, { "epoch": 1.14, "learning_rate": 0.00012932674237455964, "loss": 0.0173, "step": 438950 }, { "epoch": 1.14, "learning_rate": 0.00012932285415818818, "loss": 0.0117, "step": 438960 }, { "epoch": 1.14, "learning_rate": 0.00012931896594181672, "loss": 0.0126, "step": 438970 }, { "epoch": 1.14, "learning_rate": 0.00012931507772544524, "loss": 0.0154, "step": 438980 }, { "epoch": 1.14, "learning_rate": 0.00012931118950907378, "loss": 0.0102, "step": 438990 }, { "epoch": 1.14, "learning_rate": 0.00012930730129270232, "loss": 0.0122, "step": 439000 }, { "epoch": 1.14, "eval_cer": 0.8817180823294437, "eval_loss": 0.0074248588643968105, "eval_runtime": 107.7068, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 439000 }, { "epoch": 1.14, "learning_rate": 0.00012930341307633086, "loss": 0.0102, "step": 439010 }, { "epoch": 1.14, "learning_rate": 0.00012929952485995938, "loss": 0.0084, "step": 439020 }, { "epoch": 1.14, "learning_rate": 0.00012929563664358795, "loss": 0.0113, "step": 439030 }, { "epoch": 1.14, "learning_rate": 0.00012929174842721646, "loss": 0.0119, "step": 439040 }, { "epoch": 1.14, "learning_rate": 0.000129287860210845, "loss": 0.0124, "step": 439050 }, { "epoch": 1.14, "learning_rate": 0.00012928397199447354, "loss": 0.0099, "step": 439060 }, { "epoch": 1.14, "learning_rate": 0.00012928008377810209, "loss": 0.0089, "step": 439070 }, { "epoch": 1.14, "learning_rate": 0.0001292761955617306, "loss": 0.009, "step": 439080 }, { "epoch": 1.14, "learning_rate": 0.00012927230734535914, "loss": 0.0136, "step": 439090 }, { "epoch": 1.14, "learning_rate": 0.00012926841912898768, "loss": 0.0106, "step": 439100 }, { "epoch": 1.14, "learning_rate": 0.00012926453091261623, "loss": 0.009, "step": 439110 }, { "epoch": 1.14, "learning_rate": 0.00012926064269624474, "loss": 0.0099, "step": 439120 }, { "epoch": 1.14, "learning_rate": 0.00012925675447987328, "loss": 0.0096, "step": 439130 }, { "epoch": 1.14, "learning_rate": 0.00012925286626350182, "loss": 0.0097, "step": 439140 }, { "epoch": 1.14, "learning_rate": 0.00012924897804713034, "loss": 0.0116, "step": 439150 }, { "epoch": 1.14, "learning_rate": 0.00012924508983075888, "loss": 0.0085, "step": 439160 }, { "epoch": 1.14, "learning_rate": 0.00012924120161438742, "loss": 0.012, "step": 439170 }, { "epoch": 1.14, "learning_rate": 0.00012923731339801596, "loss": 0.0107, "step": 439180 }, { "epoch": 1.14, "learning_rate": 0.00012923342518164448, "loss": 0.0118, "step": 439190 }, { "epoch": 1.14, "learning_rate": 0.00012922953696527305, "loss": 0.0086, "step": 439200 }, { "epoch": 1.14, "learning_rate": 0.00012922564874890156, "loss": 0.0145, "step": 439210 }, { "epoch": 1.14, "learning_rate": 0.0001292217605325301, "loss": 0.012, "step": 439220 }, { "epoch": 1.14, "learning_rate": 0.00012921787231615864, "loss": 0.0107, "step": 439230 }, { "epoch": 1.14, "learning_rate": 0.00012921398409978719, "loss": 0.0089, "step": 439240 }, { "epoch": 1.14, "learning_rate": 0.0001292100958834157, "loss": 0.0119, "step": 439250 }, { "epoch": 1.14, "learning_rate": 0.00012920620766704424, "loss": 0.012, "step": 439260 }, { "epoch": 1.14, "learning_rate": 0.00012920231945067278, "loss": 0.0102, "step": 439270 }, { "epoch": 1.14, "learning_rate": 0.00012919843123430133, "loss": 0.0109, "step": 439280 }, { "epoch": 1.14, "learning_rate": 0.00012919454301792984, "loss": 0.0107, "step": 439290 }, { "epoch": 1.14, "learning_rate": 0.00012919065480155838, "loss": 0.0107, "step": 439300 }, { "epoch": 1.14, "learning_rate": 0.00012918676658518692, "loss": 0.0129, "step": 439310 }, { "epoch": 1.14, "learning_rate": 0.00012918287836881546, "loss": 0.0098, "step": 439320 }, { "epoch": 1.14, "learning_rate": 0.00012917899015244398, "loss": 0.012, "step": 439330 }, { "epoch": 1.14, "learning_rate": 0.00012917510193607252, "loss": 0.0135, "step": 439340 }, { "epoch": 1.14, "learning_rate": 0.00012917121371970106, "loss": 0.0105, "step": 439350 }, { "epoch": 1.14, "learning_rate": 0.0001291673255033296, "loss": 0.01, "step": 439360 }, { "epoch": 1.14, "learning_rate": 0.00012916343728695815, "loss": 0.0087, "step": 439370 }, { "epoch": 1.14, "learning_rate": 0.0001291595490705867, "loss": 0.0097, "step": 439380 }, { "epoch": 1.14, "learning_rate": 0.0001291556608542152, "loss": 0.0107, "step": 439390 }, { "epoch": 1.14, "learning_rate": 0.00012915177263784374, "loss": 0.011, "step": 439400 }, { "epoch": 1.14, "learning_rate": 0.00012914788442147229, "loss": 0.0109, "step": 439410 }, { "epoch": 1.14, "learning_rate": 0.0001291439962051008, "loss": 0.0133, "step": 439420 }, { "epoch": 1.14, "learning_rate": 0.00012914010798872934, "loss": 0.0154, "step": 439430 }, { "epoch": 1.14, "learning_rate": 0.00012913621977235788, "loss": 0.0118, "step": 439440 }, { "epoch": 1.14, "learning_rate": 0.00012913233155598642, "loss": 0.0118, "step": 439450 }, { "epoch": 1.14, "learning_rate": 0.00012912844333961494, "loss": 0.0101, "step": 439460 }, { "epoch": 1.14, "learning_rate": 0.00012912455512324348, "loss": 0.012, "step": 439470 }, { "epoch": 1.14, "learning_rate": 0.00012912066690687202, "loss": 0.0099, "step": 439480 }, { "epoch": 1.14, "learning_rate": 0.00012911677869050056, "loss": 0.0101, "step": 439490 }, { "epoch": 1.14, "learning_rate": 0.00012911289047412908, "loss": 0.0117, "step": 439500 }, { "epoch": 1.14, "learning_rate": 0.00012910900225775762, "loss": 0.0128, "step": 439510 }, { "epoch": 1.14, "learning_rate": 0.00012910511404138616, "loss": 0.0117, "step": 439520 }, { "epoch": 1.14, "learning_rate": 0.0001291012258250147, "loss": 0.0119, "step": 439530 }, { "epoch": 1.14, "learning_rate": 0.00012909733760864322, "loss": 0.011, "step": 439540 }, { "epoch": 1.14, "learning_rate": 0.0001290934493922718, "loss": 0.0157, "step": 439550 }, { "epoch": 1.14, "learning_rate": 0.0001290895611759003, "loss": 0.009, "step": 439560 }, { "epoch": 1.14, "learning_rate": 0.00012908567295952884, "loss": 0.0162, "step": 439570 }, { "epoch": 1.14, "learning_rate": 0.00012908178474315738, "loss": 0.013, "step": 439580 }, { "epoch": 1.14, "learning_rate": 0.00012907789652678593, "loss": 0.0101, "step": 439590 }, { "epoch": 1.14, "learning_rate": 0.00012907400831041444, "loss": 0.0105, "step": 439600 }, { "epoch": 1.14, "learning_rate": 0.00012907012009404298, "loss": 0.0116, "step": 439610 }, { "epoch": 1.14, "learning_rate": 0.00012906623187767152, "loss": 0.0096, "step": 439620 }, { "epoch": 1.14, "learning_rate": 0.00012906234366130007, "loss": 0.0103, "step": 439630 }, { "epoch": 1.14, "learning_rate": 0.00012905845544492858, "loss": 0.0098, "step": 439640 }, { "epoch": 1.14, "learning_rate": 0.00012905456722855712, "loss": 0.0104, "step": 439650 }, { "epoch": 1.14, "learning_rate": 0.00012905067901218566, "loss": 0.0102, "step": 439660 }, { "epoch": 1.14, "learning_rate": 0.00012904679079581418, "loss": 0.012, "step": 439670 }, { "epoch": 1.14, "learning_rate": 0.00012904290257944272, "loss": 0.011, "step": 439680 }, { "epoch": 1.14, "learning_rate": 0.00012903901436307126, "loss": 0.0089, "step": 439690 }, { "epoch": 1.14, "learning_rate": 0.0001290351261466998, "loss": 0.0124, "step": 439700 }, { "epoch": 1.14, "learning_rate": 0.00012903123793032832, "loss": 0.0089, "step": 439710 }, { "epoch": 1.14, "learning_rate": 0.00012902734971395689, "loss": 0.0111, "step": 439720 }, { "epoch": 1.14, "learning_rate": 0.0001290234614975854, "loss": 0.0122, "step": 439730 }, { "epoch": 1.14, "learning_rate": 0.00012901957328121394, "loss": 0.0128, "step": 439740 }, { "epoch": 1.14, "learning_rate": 0.00012901568506484248, "loss": 0.0115, "step": 439750 }, { "epoch": 1.14, "learning_rate": 0.00012901179684847103, "loss": 0.0129, "step": 439760 }, { "epoch": 1.14, "learning_rate": 0.00012900790863209954, "loss": 0.01, "step": 439770 }, { "epoch": 1.14, "learning_rate": 0.00012900402041572808, "loss": 0.0097, "step": 439780 }, { "epoch": 1.14, "learning_rate": 0.00012900013219935662, "loss": 0.0119, "step": 439790 }, { "epoch": 1.14, "learning_rate": 0.00012899624398298517, "loss": 0.016, "step": 439800 }, { "epoch": 1.14, "learning_rate": 0.00012899235576661368, "loss": 0.0095, "step": 439810 }, { "epoch": 1.14, "learning_rate": 0.00012898846755024222, "loss": 0.0122, "step": 439820 }, { "epoch": 1.14, "learning_rate": 0.00012898457933387076, "loss": 0.0113, "step": 439830 }, { "epoch": 1.14, "learning_rate": 0.0001289806911174993, "loss": 0.0087, "step": 439840 }, { "epoch": 1.14, "learning_rate": 0.00012897680290112782, "loss": 0.0098, "step": 439850 }, { "epoch": 1.14, "learning_rate": 0.00012897291468475636, "loss": 0.0101, "step": 439860 }, { "epoch": 1.14, "learning_rate": 0.0001289690264683849, "loss": 0.013, "step": 439870 }, { "epoch": 1.14, "learning_rate": 0.00012896513825201344, "loss": 0.0123, "step": 439880 }, { "epoch": 1.14, "learning_rate": 0.00012896125003564196, "loss": 0.0103, "step": 439890 }, { "epoch": 1.14, "learning_rate": 0.0001289573618192705, "loss": 0.0124, "step": 439900 }, { "epoch": 1.14, "learning_rate": 0.00012895347360289904, "loss": 0.011, "step": 439910 }, { "epoch": 1.14, "learning_rate": 0.00012894958538652758, "loss": 0.0088, "step": 439920 }, { "epoch": 1.14, "learning_rate": 0.00012894569717015613, "loss": 0.0147, "step": 439930 }, { "epoch": 1.14, "learning_rate": 0.00012894180895378464, "loss": 0.0117, "step": 439940 }, { "epoch": 1.14, "learning_rate": 0.00012893792073741318, "loss": 0.0141, "step": 439950 }, { "epoch": 1.14, "learning_rate": 0.00012893403252104172, "loss": 0.0102, "step": 439960 }, { "epoch": 1.14, "learning_rate": 0.00012893014430467026, "loss": 0.012, "step": 439970 }, { "epoch": 1.14, "learning_rate": 0.00012892625608829878, "loss": 0.013, "step": 439980 }, { "epoch": 1.14, "learning_rate": 0.00012892236787192732, "loss": 0.0117, "step": 439990 }, { "epoch": 1.14, "learning_rate": 0.00012891847965555586, "loss": 0.0118, "step": 440000 }, { "epoch": 1.14, "eval_cer": 0.8817236808771804, "eval_loss": 0.007295154966413975, "eval_runtime": 107.4949, "eval_samples_per_second": 18.606, "eval_steps_per_second": 4.651, "step": 440000 }, { "epoch": 1.14, "learning_rate": 0.0001289145914391844, "loss": 0.0117, "step": 440010 }, { "epoch": 1.14, "learning_rate": 0.00012891070322281292, "loss": 0.0141, "step": 440020 }, { "epoch": 1.14, "learning_rate": 0.00012890681500644146, "loss": 0.0151, "step": 440030 }, { "epoch": 1.14, "learning_rate": 0.00012890292679007, "loss": 0.0126, "step": 440040 }, { "epoch": 1.14, "learning_rate": 0.00012889903857369854, "loss": 0.0107, "step": 440050 }, { "epoch": 1.14, "learning_rate": 0.00012889515035732706, "loss": 0.0065, "step": 440060 }, { "epoch": 1.14, "learning_rate": 0.00012889126214095563, "loss": 0.0108, "step": 440070 }, { "epoch": 1.14, "learning_rate": 0.00012888737392458414, "loss": 0.0132, "step": 440080 }, { "epoch": 1.14, "learning_rate": 0.00012888348570821268, "loss": 0.0119, "step": 440090 }, { "epoch": 1.14, "learning_rate": 0.00012887959749184122, "loss": 0.0106, "step": 440100 }, { "epoch": 1.14, "learning_rate": 0.00012887570927546977, "loss": 0.0112, "step": 440110 }, { "epoch": 1.14, "learning_rate": 0.00012887182105909828, "loss": 0.0088, "step": 440120 }, { "epoch": 1.14, "learning_rate": 0.00012886793284272682, "loss": 0.011, "step": 440130 }, { "epoch": 1.14, "learning_rate": 0.00012886404462635536, "loss": 0.0088, "step": 440140 }, { "epoch": 1.14, "learning_rate": 0.00012886015640998388, "loss": 0.0101, "step": 440150 }, { "epoch": 1.14, "learning_rate": 0.00012885626819361242, "loss": 0.0114, "step": 440160 }, { "epoch": 1.14, "learning_rate": 0.00012885237997724096, "loss": 0.0139, "step": 440170 }, { "epoch": 1.14, "learning_rate": 0.0001288484917608695, "loss": 0.012, "step": 440180 }, { "epoch": 1.14, "learning_rate": 0.00012884460354449802, "loss": 0.0116, "step": 440190 }, { "epoch": 1.14, "learning_rate": 0.00012884071532812656, "loss": 0.0139, "step": 440200 }, { "epoch": 1.14, "learning_rate": 0.0001288368271117551, "loss": 0.0104, "step": 440210 }, { "epoch": 1.14, "learning_rate": 0.00012883293889538364, "loss": 0.0098, "step": 440220 }, { "epoch": 1.14, "learning_rate": 0.00012882905067901216, "loss": 0.0114, "step": 440230 }, { "epoch": 1.14, "learning_rate": 0.00012882516246264073, "loss": 0.0086, "step": 440240 }, { "epoch": 1.14, "learning_rate": 0.00012882127424626924, "loss": 0.0134, "step": 440250 }, { "epoch": 1.14, "learning_rate": 0.00012881738602989778, "loss": 0.0128, "step": 440260 }, { "epoch": 1.14, "learning_rate": 0.00012881349781352632, "loss": 0.0148, "step": 440270 }, { "epoch": 1.14, "learning_rate": 0.00012880960959715487, "loss": 0.0115, "step": 440280 }, { "epoch": 1.14, "learning_rate": 0.00012880572138078338, "loss": 0.0107, "step": 440290 }, { "epoch": 1.14, "learning_rate": 0.00012880183316441192, "loss": 0.0086, "step": 440300 }, { "epoch": 1.14, "learning_rate": 0.00012879794494804046, "loss": 0.0086, "step": 440310 }, { "epoch": 1.14, "learning_rate": 0.000128794056731669, "loss": 0.0128, "step": 440320 }, { "epoch": 1.14, "learning_rate": 0.00012879016851529752, "loss": 0.0106, "step": 440330 }, { "epoch": 1.14, "learning_rate": 0.00012878628029892606, "loss": 0.0121, "step": 440340 }, { "epoch": 1.14, "learning_rate": 0.0001287823920825546, "loss": 0.0103, "step": 440350 }, { "epoch": 1.14, "learning_rate": 0.00012877850386618314, "loss": 0.0107, "step": 440360 }, { "epoch": 1.14, "learning_rate": 0.00012877461564981166, "loss": 0.0102, "step": 440370 }, { "epoch": 1.14, "learning_rate": 0.0001287707274334402, "loss": 0.0087, "step": 440380 }, { "epoch": 1.14, "learning_rate": 0.00012876683921706874, "loss": 0.0125, "step": 440390 }, { "epoch": 1.14, "learning_rate": 0.00012876295100069726, "loss": 0.0131, "step": 440400 }, { "epoch": 1.14, "learning_rate": 0.0001287590627843258, "loss": 0.0092, "step": 440410 }, { "epoch": 1.14, "learning_rate": 0.00012875517456795434, "loss": 0.0098, "step": 440420 }, { "epoch": 1.14, "learning_rate": 0.00012875128635158288, "loss": 0.0113, "step": 440430 }, { "epoch": 1.14, "learning_rate": 0.00012874739813521142, "loss": 0.0091, "step": 440440 }, { "epoch": 1.14, "learning_rate": 0.00012874350991883996, "loss": 0.0119, "step": 440450 }, { "epoch": 1.14, "learning_rate": 0.00012873962170246848, "loss": 0.0106, "step": 440460 }, { "epoch": 1.14, "learning_rate": 0.00012873573348609702, "loss": 0.0119, "step": 440470 }, { "epoch": 1.14, "learning_rate": 0.00012873184526972556, "loss": 0.0144, "step": 440480 }, { "epoch": 1.14, "learning_rate": 0.0001287279570533541, "loss": 0.0109, "step": 440490 }, { "epoch": 1.14, "learning_rate": 0.00012872406883698262, "loss": 0.0137, "step": 440500 }, { "epoch": 1.14, "learning_rate": 0.00012872018062061116, "loss": 0.0115, "step": 440510 }, { "epoch": 1.14, "learning_rate": 0.0001287162924042397, "loss": 0.0123, "step": 440520 }, { "epoch": 1.14, "learning_rate": 0.00012871240418786824, "loss": 0.0111, "step": 440530 }, { "epoch": 1.14, "learning_rate": 0.00012870851597149676, "loss": 0.0096, "step": 440540 }, { "epoch": 1.14, "learning_rate": 0.0001287046277551253, "loss": 0.0094, "step": 440550 }, { "epoch": 1.14, "learning_rate": 0.00012870073953875384, "loss": 0.0109, "step": 440560 }, { "epoch": 1.14, "learning_rate": 0.00012869685132238238, "loss": 0.0099, "step": 440570 }, { "epoch": 1.14, "learning_rate": 0.0001286929631060109, "loss": 0.0094, "step": 440580 }, { "epoch": 1.14, "learning_rate": 0.00012868907488963947, "loss": 0.0122, "step": 440590 }, { "epoch": 1.14, "learning_rate": 0.00012868518667326798, "loss": 0.0098, "step": 440600 }, { "epoch": 1.14, "learning_rate": 0.00012868129845689652, "loss": 0.0093, "step": 440610 }, { "epoch": 1.14, "learning_rate": 0.00012867741024052506, "loss": 0.0091, "step": 440620 }, { "epoch": 1.14, "learning_rate": 0.0001286735220241536, "loss": 0.0129, "step": 440630 }, { "epoch": 1.14, "learning_rate": 0.00012866963380778212, "loss": 0.0097, "step": 440640 }, { "epoch": 1.14, "learning_rate": 0.00012866574559141066, "loss": 0.0123, "step": 440650 }, { "epoch": 1.14, "learning_rate": 0.0001286618573750392, "loss": 0.0121, "step": 440660 }, { "epoch": 1.14, "learning_rate": 0.00012865796915866772, "loss": 0.011, "step": 440670 }, { "epoch": 1.14, "learning_rate": 0.00012865408094229626, "loss": 0.0092, "step": 440680 }, { "epoch": 1.14, "learning_rate": 0.0001286501927259248, "loss": 0.0111, "step": 440690 }, { "epoch": 1.14, "learning_rate": 0.00012864630450955334, "loss": 0.0127, "step": 440700 }, { "epoch": 1.14, "learning_rate": 0.00012864241629318186, "loss": 0.0108, "step": 440710 }, { "epoch": 1.14, "learning_rate": 0.0001286385280768104, "loss": 0.0122, "step": 440720 }, { "epoch": 1.14, "learning_rate": 0.00012863463986043894, "loss": 0.009, "step": 440730 }, { "epoch": 1.14, "learning_rate": 0.00012863075164406748, "loss": 0.0115, "step": 440740 }, { "epoch": 1.14, "learning_rate": 0.000128626863427696, "loss": 0.0139, "step": 440750 }, { "epoch": 1.14, "learning_rate": 0.00012862297521132457, "loss": 0.01, "step": 440760 }, { "epoch": 1.14, "learning_rate": 0.00012861908699495308, "loss": 0.0178, "step": 440770 }, { "epoch": 1.14, "learning_rate": 0.00012861519877858162, "loss": 0.01, "step": 440780 }, { "epoch": 1.14, "learning_rate": 0.00012861131056221016, "loss": 0.0125, "step": 440790 }, { "epoch": 1.14, "learning_rate": 0.0001286074223458387, "loss": 0.0121, "step": 440800 }, { "epoch": 1.14, "learning_rate": 0.00012860353412946722, "loss": 0.0171, "step": 440810 }, { "epoch": 1.14, "learning_rate": 0.00012859964591309576, "loss": 0.0101, "step": 440820 }, { "epoch": 1.14, "learning_rate": 0.0001285957576967243, "loss": 0.0119, "step": 440830 }, { "epoch": 1.14, "learning_rate": 0.00012859186948035284, "loss": 0.0099, "step": 440840 }, { "epoch": 1.14, "learning_rate": 0.00012858798126398136, "loss": 0.0125, "step": 440850 }, { "epoch": 1.14, "learning_rate": 0.0001285840930476099, "loss": 0.0121, "step": 440860 }, { "epoch": 1.14, "learning_rate": 0.00012858020483123844, "loss": 0.0096, "step": 440870 }, { "epoch": 1.14, "learning_rate": 0.00012857631661486698, "loss": 0.0131, "step": 440880 }, { "epoch": 1.14, "learning_rate": 0.0001285724283984955, "loss": 0.0138, "step": 440890 }, { "epoch": 1.14, "learning_rate": 0.00012856854018212404, "loss": 0.0121, "step": 440900 }, { "epoch": 1.14, "learning_rate": 0.00012856465196575258, "loss": 0.0185, "step": 440910 }, { "epoch": 1.14, "learning_rate": 0.0001285607637493811, "loss": 0.0141, "step": 440920 }, { "epoch": 1.14, "learning_rate": 0.00012855687553300964, "loss": 0.0115, "step": 440930 }, { "epoch": 1.14, "learning_rate": 0.00012855298731663818, "loss": 0.0119, "step": 440940 }, { "epoch": 1.14, "learning_rate": 0.00012854909910026672, "loss": 0.0094, "step": 440950 }, { "epoch": 1.14, "learning_rate": 0.00012854521088389526, "loss": 0.0114, "step": 440960 }, { "epoch": 1.14, "learning_rate": 0.0001285413226675238, "loss": 0.0108, "step": 440970 }, { "epoch": 1.14, "learning_rate": 0.00012853743445115232, "loss": 0.0089, "step": 440980 }, { "epoch": 1.14, "learning_rate": 0.00012853354623478086, "loss": 0.0106, "step": 440990 }, { "epoch": 1.14, "learning_rate": 0.0001285296580184094, "loss": 0.0112, "step": 441000 }, { "epoch": 1.14, "eval_cer": 0.8816592975782083, "eval_loss": 0.007312288507819176, "eval_runtime": 107.3849, "eval_samples_per_second": 18.625, "eval_steps_per_second": 4.656, "step": 441000 }, { "epoch": 1.14, "learning_rate": 0.00012852576980203794, "loss": 0.0139, "step": 441010 }, { "epoch": 1.14, "learning_rate": 0.00012852188158566646, "loss": 0.0109, "step": 441020 }, { "epoch": 1.14, "learning_rate": 0.000128517993369295, "loss": 0.0113, "step": 441030 }, { "epoch": 1.14, "learning_rate": 0.00012851410515292354, "loss": 0.0104, "step": 441040 }, { "epoch": 1.14, "learning_rate": 0.00012851021693655208, "loss": 0.0113, "step": 441050 }, { "epoch": 1.14, "learning_rate": 0.0001285063287201806, "loss": 0.0128, "step": 441060 }, { "epoch": 1.14, "learning_rate": 0.00012850244050380914, "loss": 0.012, "step": 441070 }, { "epoch": 1.14, "learning_rate": 0.00012849855228743768, "loss": 0.0128, "step": 441080 }, { "epoch": 1.14, "learning_rate": 0.00012849466407106622, "loss": 0.0103, "step": 441090 }, { "epoch": 1.14, "learning_rate": 0.00012849077585469474, "loss": 0.0121, "step": 441100 }, { "epoch": 1.14, "learning_rate": 0.0001284868876383233, "loss": 0.0115, "step": 441110 }, { "epoch": 1.14, "learning_rate": 0.00012848299942195182, "loss": 0.0128, "step": 441120 }, { "epoch": 1.14, "learning_rate": 0.00012847911120558036, "loss": 0.0116, "step": 441130 }, { "epoch": 1.14, "learning_rate": 0.0001284752229892089, "loss": 0.0109, "step": 441140 }, { "epoch": 1.14, "learning_rate": 0.00012847133477283742, "loss": 0.0098, "step": 441150 }, { "epoch": 1.14, "learning_rate": 0.00012846744655646596, "loss": 0.0137, "step": 441160 }, { "epoch": 1.14, "learning_rate": 0.0001284635583400945, "loss": 0.0099, "step": 441170 }, { "epoch": 1.14, "learning_rate": 0.00012845967012372304, "loss": 0.016, "step": 441180 }, { "epoch": 1.14, "learning_rate": 0.00012845578190735156, "loss": 0.0096, "step": 441190 }, { "epoch": 1.14, "learning_rate": 0.0001284518936909801, "loss": 0.0092, "step": 441200 }, { "epoch": 1.14, "learning_rate": 0.00012844800547460864, "loss": 0.0124, "step": 441210 }, { "epoch": 1.14, "learning_rate": 0.00012844411725823718, "loss": 0.0116, "step": 441220 }, { "epoch": 1.14, "learning_rate": 0.0001284402290418657, "loss": 0.0114, "step": 441230 }, { "epoch": 1.14, "learning_rate": 0.00012843634082549424, "loss": 0.0112, "step": 441240 }, { "epoch": 1.14, "learning_rate": 0.00012843245260912278, "loss": 0.0104, "step": 441250 }, { "epoch": 1.14, "learning_rate": 0.00012842856439275132, "loss": 0.011, "step": 441260 }, { "epoch": 1.14, "learning_rate": 0.00012842467617637984, "loss": 0.0106, "step": 441270 }, { "epoch": 1.14, "learning_rate": 0.00012842078796000838, "loss": 0.0103, "step": 441280 }, { "epoch": 1.14, "learning_rate": 0.00012841689974363692, "loss": 0.0156, "step": 441290 }, { "epoch": 1.14, "learning_rate": 0.00012841301152726546, "loss": 0.0106, "step": 441300 }, { "epoch": 1.14, "learning_rate": 0.000128409123310894, "loss": 0.0104, "step": 441310 }, { "epoch": 1.14, "learning_rate": 0.00012840523509452255, "loss": 0.0093, "step": 441320 }, { "epoch": 1.14, "learning_rate": 0.00012840134687815106, "loss": 0.0135, "step": 441330 }, { "epoch": 1.14, "learning_rate": 0.0001283974586617796, "loss": 0.0133, "step": 441340 }, { "epoch": 1.14, "learning_rate": 0.00012839357044540814, "loss": 0.0098, "step": 441350 }, { "epoch": 1.14, "learning_rate": 0.00012838968222903668, "loss": 0.0104, "step": 441360 }, { "epoch": 1.14, "learning_rate": 0.0001283857940126652, "loss": 0.0108, "step": 441370 }, { "epoch": 1.14, "learning_rate": 0.00012838190579629374, "loss": 0.0109, "step": 441380 }, { "epoch": 1.14, "learning_rate": 0.00012837801757992228, "loss": 0.0099, "step": 441390 }, { "epoch": 1.14, "learning_rate": 0.0001283741293635508, "loss": 0.0117, "step": 441400 }, { "epoch": 1.14, "learning_rate": 0.00012837024114717934, "loss": 0.0106, "step": 441410 }, { "epoch": 1.14, "learning_rate": 0.00012836635293080788, "loss": 0.011, "step": 441420 }, { "epoch": 1.14, "learning_rate": 0.00012836246471443642, "loss": 0.0156, "step": 441430 }, { "epoch": 1.14, "learning_rate": 0.00012835857649806494, "loss": 0.0121, "step": 441440 }, { "epoch": 1.14, "learning_rate": 0.00012835468828169348, "loss": 0.0135, "step": 441450 }, { "epoch": 1.14, "learning_rate": 0.00012835080006532202, "loss": 0.0111, "step": 441460 }, { "epoch": 1.14, "learning_rate": 0.00012834691184895056, "loss": 0.0154, "step": 441470 }, { "epoch": 1.14, "learning_rate": 0.00012834302363257908, "loss": 0.0102, "step": 441480 }, { "epoch": 1.14, "learning_rate": 0.00012833913541620764, "loss": 0.0122, "step": 441490 }, { "epoch": 1.14, "learning_rate": 0.00012833524719983616, "loss": 0.0097, "step": 441500 }, { "epoch": 1.14, "learning_rate": 0.0001283313589834647, "loss": 0.0115, "step": 441510 }, { "epoch": 1.14, "learning_rate": 0.00012832747076709324, "loss": 0.0138, "step": 441520 }, { "epoch": 1.14, "learning_rate": 0.00012832358255072178, "loss": 0.0107, "step": 441530 }, { "epoch": 1.14, "learning_rate": 0.0001283196943343503, "loss": 0.0113, "step": 441540 }, { "epoch": 1.14, "learning_rate": 0.00012831580611797884, "loss": 0.0109, "step": 441550 }, { "epoch": 1.14, "learning_rate": 0.00012831191790160738, "loss": 0.0141, "step": 441560 }, { "epoch": 1.14, "learning_rate": 0.00012830802968523592, "loss": 0.0081, "step": 441570 }, { "epoch": 1.14, "learning_rate": 0.00012830414146886444, "loss": 0.0094, "step": 441580 }, { "epoch": 1.14, "learning_rate": 0.00012830025325249298, "loss": 0.0106, "step": 441590 }, { "epoch": 1.14, "learning_rate": 0.00012829636503612152, "loss": 0.0117, "step": 441600 }, { "epoch": 1.14, "learning_rate": 0.00012829247681975006, "loss": 0.0147, "step": 441610 }, { "epoch": 1.14, "learning_rate": 0.00012828858860337858, "loss": 0.0101, "step": 441620 }, { "epoch": 1.14, "learning_rate": 0.00012828470038700712, "loss": 0.0097, "step": 441630 }, { "epoch": 1.14, "learning_rate": 0.00012828081217063566, "loss": 0.0091, "step": 441640 }, { "epoch": 1.14, "learning_rate": 0.00012827692395426418, "loss": 0.0086, "step": 441650 }, { "epoch": 1.14, "learning_rate": 0.00012827303573789274, "loss": 0.0125, "step": 441660 }, { "epoch": 1.14, "learning_rate": 0.00012826914752152126, "loss": 0.0111, "step": 441670 }, { "epoch": 1.14, "learning_rate": 0.0001282652593051498, "loss": 0.0122, "step": 441680 }, { "epoch": 1.14, "learning_rate": 0.00012826137108877834, "loss": 0.0152, "step": 441690 }, { "epoch": 1.14, "learning_rate": 0.00012825748287240688, "loss": 0.0112, "step": 441700 }, { "epoch": 1.14, "learning_rate": 0.0001282535946560354, "loss": 0.0089, "step": 441710 }, { "epoch": 1.15, "learning_rate": 0.00012824970643966394, "loss": 0.0126, "step": 441720 }, { "epoch": 1.15, "learning_rate": 0.00012824581822329248, "loss": 0.0112, "step": 441730 }, { "epoch": 1.15, "learning_rate": 0.00012824193000692102, "loss": 0.0091, "step": 441740 }, { "epoch": 1.15, "learning_rate": 0.00012823804179054954, "loss": 0.0096, "step": 441750 }, { "epoch": 1.15, "learning_rate": 0.00012823415357417808, "loss": 0.0106, "step": 441760 }, { "epoch": 1.15, "learning_rate": 0.00012823026535780662, "loss": 0.0111, "step": 441770 }, { "epoch": 1.15, "learning_rate": 0.00012822637714143516, "loss": 0.0076, "step": 441780 }, { "epoch": 1.15, "learning_rate": 0.00012822248892506368, "loss": 0.0109, "step": 441790 }, { "epoch": 1.15, "learning_rate": 0.00012821860070869222, "loss": 0.01, "step": 441800 }, { "epoch": 1.15, "learning_rate": 0.00012821471249232076, "loss": 0.0158, "step": 441810 }, { "epoch": 1.15, "learning_rate": 0.0001282108242759493, "loss": 0.012, "step": 441820 }, { "epoch": 1.15, "learning_rate": 0.00012820693605957784, "loss": 0.0103, "step": 441830 }, { "epoch": 1.15, "learning_rate": 0.00012820304784320639, "loss": 0.0102, "step": 441840 }, { "epoch": 1.15, "learning_rate": 0.0001281991596268349, "loss": 0.0107, "step": 441850 }, { "epoch": 1.15, "learning_rate": 0.00012819527141046344, "loss": 0.0112, "step": 441860 }, { "epoch": 1.15, "learning_rate": 0.00012819138319409198, "loss": 0.0082, "step": 441870 }, { "epoch": 1.15, "learning_rate": 0.0001281874949777205, "loss": 0.0095, "step": 441880 }, { "epoch": 1.15, "learning_rate": 0.00012818360676134904, "loss": 0.0094, "step": 441890 }, { "epoch": 1.15, "learning_rate": 0.00012817971854497758, "loss": 0.0115, "step": 441900 }, { "epoch": 1.15, "learning_rate": 0.00012817583032860612, "loss": 0.0098, "step": 441910 }, { "epoch": 1.15, "learning_rate": 0.00012817194211223464, "loss": 0.0082, "step": 441920 }, { "epoch": 1.15, "learning_rate": 0.00012816805389586318, "loss": 0.0099, "step": 441930 }, { "epoch": 1.15, "learning_rate": 0.00012816416567949172, "loss": 0.0112, "step": 441940 }, { "epoch": 1.15, "learning_rate": 0.00012816027746312026, "loss": 0.0116, "step": 441950 }, { "epoch": 1.15, "learning_rate": 0.00012815638924674878, "loss": 0.0113, "step": 441960 }, { "epoch": 1.15, "learning_rate": 0.00012815250103037732, "loss": 0.009, "step": 441970 }, { "epoch": 1.15, "learning_rate": 0.00012814861281400586, "loss": 0.0099, "step": 441980 }, { "epoch": 1.15, "learning_rate": 0.0001281447245976344, "loss": 0.0111, "step": 441990 }, { "epoch": 1.15, "learning_rate": 0.00012814083638126292, "loss": 0.0101, "step": 442000 }, { "epoch": 1.15, "eval_cer": 0.881688689953826, "eval_loss": 0.007025611121207476, "eval_runtime": 107.5769, "eval_samples_per_second": 18.591, "eval_steps_per_second": 4.648, "step": 442000 }, { "epoch": 1.15, "learning_rate": 0.00012813694816489148, "loss": 0.011, "step": 442010 }, { "epoch": 1.15, "learning_rate": 0.00012813305994852, "loss": 0.0092, "step": 442020 }, { "epoch": 1.15, "learning_rate": 0.00012812917173214854, "loss": 0.015, "step": 442030 }, { "epoch": 1.15, "learning_rate": 0.00012812528351577708, "loss": 0.0092, "step": 442040 }, { "epoch": 1.15, "learning_rate": 0.00012812139529940562, "loss": 0.0105, "step": 442050 }, { "epoch": 1.15, "learning_rate": 0.00012811750708303414, "loss": 0.0116, "step": 442060 }, { "epoch": 1.15, "learning_rate": 0.00012811361886666268, "loss": 0.0118, "step": 442070 }, { "epoch": 1.15, "learning_rate": 0.00012810973065029122, "loss": 0.0145, "step": 442080 }, { "epoch": 1.15, "learning_rate": 0.00012810584243391976, "loss": 0.0097, "step": 442090 }, { "epoch": 1.15, "learning_rate": 0.00012810195421754828, "loss": 0.0126, "step": 442100 }, { "epoch": 1.15, "learning_rate": 0.00012809806600117682, "loss": 0.0117, "step": 442110 }, { "epoch": 1.15, "learning_rate": 0.00012809417778480536, "loss": 0.0105, "step": 442120 }, { "epoch": 1.15, "learning_rate": 0.00012809028956843388, "loss": 0.0093, "step": 442130 }, { "epoch": 1.15, "learning_rate": 0.00012808640135206242, "loss": 0.0134, "step": 442140 }, { "epoch": 1.15, "learning_rate": 0.00012808251313569096, "loss": 0.013, "step": 442150 }, { "epoch": 1.15, "learning_rate": 0.0001280786249193195, "loss": 0.0101, "step": 442160 }, { "epoch": 1.15, "learning_rate": 0.00012807473670294802, "loss": 0.0115, "step": 442170 }, { "epoch": 1.15, "learning_rate": 0.00012807084848657658, "loss": 0.012, "step": 442180 }, { "epoch": 1.15, "learning_rate": 0.0001280669602702051, "loss": 0.0105, "step": 442190 }, { "epoch": 1.15, "learning_rate": 0.00012806307205383364, "loss": 0.0091, "step": 442200 }, { "epoch": 1.15, "learning_rate": 0.00012805918383746218, "loss": 0.0156, "step": 442210 }, { "epoch": 1.15, "learning_rate": 0.00012805529562109072, "loss": 0.0111, "step": 442220 }, { "epoch": 1.15, "learning_rate": 0.00012805140740471924, "loss": 0.0101, "step": 442230 }, { "epoch": 1.15, "learning_rate": 0.00012804751918834778, "loss": 0.0088, "step": 442240 }, { "epoch": 1.15, "learning_rate": 0.00012804363097197632, "loss": 0.0093, "step": 442250 }, { "epoch": 1.15, "learning_rate": 0.00012803974275560486, "loss": 0.0109, "step": 442260 }, { "epoch": 1.15, "learning_rate": 0.00012803585453923338, "loss": 0.0114, "step": 442270 }, { "epoch": 1.15, "learning_rate": 0.00012803196632286192, "loss": 0.0132, "step": 442280 }, { "epoch": 1.15, "learning_rate": 0.00012802807810649046, "loss": 0.0107, "step": 442290 }, { "epoch": 1.15, "learning_rate": 0.000128024189890119, "loss": 0.0114, "step": 442300 }, { "epoch": 1.15, "learning_rate": 0.00012802030167374752, "loss": 0.0108, "step": 442310 }, { "epoch": 1.15, "learning_rate": 0.00012801641345737606, "loss": 0.0121, "step": 442320 }, { "epoch": 1.15, "learning_rate": 0.0001280125252410046, "loss": 0.0111, "step": 442330 }, { "epoch": 1.15, "learning_rate": 0.00012800863702463314, "loss": 0.0063, "step": 442340 }, { "epoch": 1.15, "learning_rate": 0.00012800474880826168, "loss": 0.0134, "step": 442350 }, { "epoch": 1.15, "learning_rate": 0.00012800086059189023, "loss": 0.0102, "step": 442360 }, { "epoch": 1.15, "learning_rate": 0.00012799697237551874, "loss": 0.0081, "step": 442370 }, { "epoch": 1.15, "learning_rate": 0.00012799308415914728, "loss": 0.0097, "step": 442380 }, { "epoch": 1.15, "learning_rate": 0.00012798919594277582, "loss": 0.0103, "step": 442390 }, { "epoch": 1.15, "learning_rate": 0.00012798530772640434, "loss": 0.0123, "step": 442400 }, { "epoch": 1.15, "learning_rate": 0.00012798141951003288, "loss": 0.0082, "step": 442410 }, { "epoch": 1.15, "learning_rate": 0.00012797753129366142, "loss": 0.0134, "step": 442420 }, { "epoch": 1.15, "learning_rate": 0.00012797364307728996, "loss": 0.0114, "step": 442430 }, { "epoch": 1.15, "learning_rate": 0.00012796975486091848, "loss": 0.0117, "step": 442440 }, { "epoch": 1.15, "learning_rate": 0.00012796586664454702, "loss": 0.0108, "step": 442450 }, { "epoch": 1.15, "learning_rate": 0.00012796197842817556, "loss": 0.0124, "step": 442460 }, { "epoch": 1.15, "learning_rate": 0.0001279580902118041, "loss": 0.0134, "step": 442470 }, { "epoch": 1.15, "learning_rate": 0.00012795420199543262, "loss": 0.0108, "step": 442480 }, { "epoch": 1.15, "learning_rate": 0.00012795031377906116, "loss": 0.0118, "step": 442490 }, { "epoch": 1.15, "learning_rate": 0.0001279464255626897, "loss": 0.0126, "step": 442500 }, { "epoch": 1.15, "learning_rate": 0.00012794253734631824, "loss": 0.0105, "step": 442510 }, { "epoch": 1.15, "learning_rate": 0.00012793864912994676, "loss": 0.0118, "step": 442520 }, { "epoch": 1.15, "learning_rate": 0.00012793476091357532, "loss": 0.0111, "step": 442530 }, { "epoch": 1.15, "learning_rate": 0.00012793087269720384, "loss": 0.0102, "step": 442540 }, { "epoch": 1.15, "learning_rate": 0.00012792698448083238, "loss": 0.0113, "step": 442550 }, { "epoch": 1.15, "learning_rate": 0.00012792309626446092, "loss": 0.0093, "step": 442560 }, { "epoch": 1.15, "learning_rate": 0.00012791920804808946, "loss": 0.0117, "step": 442570 }, { "epoch": 1.15, "learning_rate": 0.00012791531983171798, "loss": 0.0128, "step": 442580 }, { "epoch": 1.15, "learning_rate": 0.00012791143161534652, "loss": 0.0111, "step": 442590 }, { "epoch": 1.15, "learning_rate": 0.00012790754339897506, "loss": 0.0105, "step": 442600 }, { "epoch": 1.15, "learning_rate": 0.0001279036551826036, "loss": 0.0117, "step": 442610 }, { "epoch": 1.15, "learning_rate": 0.00012789976696623212, "loss": 0.013, "step": 442620 }, { "epoch": 1.15, "learning_rate": 0.00012789587874986066, "loss": 0.0146, "step": 442630 }, { "epoch": 1.15, "learning_rate": 0.0001278919905334892, "loss": 0.012, "step": 442640 }, { "epoch": 1.15, "learning_rate": 0.00012788810231711772, "loss": 0.0125, "step": 442650 }, { "epoch": 1.15, "learning_rate": 0.00012788421410074626, "loss": 0.011, "step": 442660 }, { "epoch": 1.15, "learning_rate": 0.0001278803258843748, "loss": 0.0108, "step": 442670 }, { "epoch": 1.15, "learning_rate": 0.00012787643766800334, "loss": 0.0098, "step": 442680 }, { "epoch": 1.15, "learning_rate": 0.00012787254945163186, "loss": 0.0115, "step": 442690 }, { "epoch": 1.15, "learning_rate": 0.00012786866123526042, "loss": 0.0149, "step": 442700 }, { "epoch": 1.15, "learning_rate": 0.00012786477301888894, "loss": 0.012, "step": 442710 }, { "epoch": 1.15, "learning_rate": 0.00012786088480251748, "loss": 0.0108, "step": 442720 }, { "epoch": 1.15, "learning_rate": 0.00012785699658614602, "loss": 0.0122, "step": 442730 }, { "epoch": 1.15, "learning_rate": 0.00012785310836977456, "loss": 0.0115, "step": 442740 }, { "epoch": 1.15, "learning_rate": 0.00012784922015340308, "loss": 0.0098, "step": 442750 }, { "epoch": 1.15, "learning_rate": 0.00012784533193703162, "loss": 0.0104, "step": 442760 }, { "epoch": 1.15, "learning_rate": 0.00012784144372066016, "loss": 0.0095, "step": 442770 }, { "epoch": 1.15, "learning_rate": 0.0001278375555042887, "loss": 0.0099, "step": 442780 }, { "epoch": 1.15, "learning_rate": 0.00012783366728791722, "loss": 0.0105, "step": 442790 }, { "epoch": 1.15, "learning_rate": 0.00012782977907154576, "loss": 0.0104, "step": 442800 }, { "epoch": 1.15, "learning_rate": 0.0001278258908551743, "loss": 0.0089, "step": 442810 }, { "epoch": 1.15, "learning_rate": 0.00012782200263880284, "loss": 0.0116, "step": 442820 }, { "epoch": 1.15, "learning_rate": 0.00012781811442243136, "loss": 0.0103, "step": 442830 }, { "epoch": 1.15, "learning_rate": 0.0001278142262060599, "loss": 0.0112, "step": 442840 }, { "epoch": 1.15, "learning_rate": 0.00012781033798968844, "loss": 0.0162, "step": 442850 }, { "epoch": 1.15, "learning_rate": 0.00012780644977331698, "loss": 0.0094, "step": 442860 }, { "epoch": 1.15, "learning_rate": 0.0001278025615569455, "loss": 0.0088, "step": 442870 }, { "epoch": 1.15, "learning_rate": 0.00012779867334057404, "loss": 0.0157, "step": 442880 }, { "epoch": 1.15, "learning_rate": 0.00012779478512420258, "loss": 0.0122, "step": 442890 }, { "epoch": 1.15, "learning_rate": 0.00012779089690783112, "loss": 0.0123, "step": 442900 }, { "epoch": 1.15, "learning_rate": 0.00012778700869145966, "loss": 0.0141, "step": 442910 }, { "epoch": 1.15, "learning_rate": 0.00012778312047508818, "loss": 0.0114, "step": 442920 }, { "epoch": 1.15, "learning_rate": 0.00012777923225871672, "loss": 0.011, "step": 442930 }, { "epoch": 1.15, "learning_rate": 0.00012777534404234526, "loss": 0.0095, "step": 442940 }, { "epoch": 1.15, "learning_rate": 0.0001277714558259738, "loss": 0.0096, "step": 442950 }, { "epoch": 1.15, "learning_rate": 0.00012776756760960232, "loss": 0.0106, "step": 442960 }, { "epoch": 1.15, "learning_rate": 0.00012776367939323086, "loss": 0.0101, "step": 442970 }, { "epoch": 1.15, "learning_rate": 0.0001277597911768594, "loss": 0.0114, "step": 442980 }, { "epoch": 1.15, "learning_rate": 0.00012775590296048794, "loss": 0.0094, "step": 442990 }, { "epoch": 1.15, "learning_rate": 0.00012775201474411646, "loss": 0.0128, "step": 443000 }, { "epoch": 1.15, "eval_cer": 0.8817026863231677, "eval_loss": 0.007168120238929987, "eval_runtime": 107.6791, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 443000 }, { "epoch": 1.15, "learning_rate": 0.000127748126527745, "loss": 0.0116, "step": 443010 }, { "epoch": 1.15, "learning_rate": 0.00012774423831137354, "loss": 0.0096, "step": 443020 }, { "epoch": 1.15, "learning_rate": 0.00012774035009500208, "loss": 0.0092, "step": 443030 }, { "epoch": 1.15, "learning_rate": 0.0001277364618786306, "loss": 0.0109, "step": 443040 }, { "epoch": 1.15, "learning_rate": 0.00012773257366225916, "loss": 0.0077, "step": 443050 }, { "epoch": 1.15, "learning_rate": 0.00012772868544588768, "loss": 0.0146, "step": 443060 }, { "epoch": 1.15, "learning_rate": 0.00012772479722951622, "loss": 0.0157, "step": 443070 }, { "epoch": 1.15, "learning_rate": 0.00012772090901314476, "loss": 0.0078, "step": 443080 }, { "epoch": 1.15, "learning_rate": 0.0001277170207967733, "loss": 0.0119, "step": 443090 }, { "epoch": 1.15, "learning_rate": 0.00012771313258040182, "loss": 0.0102, "step": 443100 }, { "epoch": 1.15, "learning_rate": 0.00012770924436403036, "loss": 0.0125, "step": 443110 }, { "epoch": 1.15, "learning_rate": 0.0001277053561476589, "loss": 0.014, "step": 443120 }, { "epoch": 1.15, "learning_rate": 0.00012770146793128742, "loss": 0.0104, "step": 443130 }, { "epoch": 1.15, "learning_rate": 0.00012769757971491596, "loss": 0.0128, "step": 443140 }, { "epoch": 1.15, "learning_rate": 0.0001276936914985445, "loss": 0.0131, "step": 443150 }, { "epoch": 1.15, "learning_rate": 0.00012768980328217304, "loss": 0.0105, "step": 443160 }, { "epoch": 1.15, "learning_rate": 0.00012768591506580156, "loss": 0.0096, "step": 443170 }, { "epoch": 1.15, "learning_rate": 0.0001276820268494301, "loss": 0.0105, "step": 443180 }, { "epoch": 1.15, "learning_rate": 0.00012767813863305864, "loss": 0.0087, "step": 443190 }, { "epoch": 1.15, "learning_rate": 0.00012767425041668718, "loss": 0.0096, "step": 443200 }, { "epoch": 1.15, "learning_rate": 0.0001276703622003157, "loss": 0.012, "step": 443210 }, { "epoch": 1.15, "learning_rate": 0.00012766647398394426, "loss": 0.0122, "step": 443220 }, { "epoch": 1.15, "learning_rate": 0.00012766258576757278, "loss": 0.0099, "step": 443230 }, { "epoch": 1.15, "learning_rate": 0.00012765869755120132, "loss": 0.0113, "step": 443240 }, { "epoch": 1.15, "learning_rate": 0.00012765480933482986, "loss": 0.0123, "step": 443250 }, { "epoch": 1.15, "learning_rate": 0.0001276509211184584, "loss": 0.0144, "step": 443260 }, { "epoch": 1.15, "learning_rate": 0.00012764703290208692, "loss": 0.011, "step": 443270 }, { "epoch": 1.15, "learning_rate": 0.00012764314468571546, "loss": 0.0116, "step": 443280 }, { "epoch": 1.15, "learning_rate": 0.000127639256469344, "loss": 0.0107, "step": 443290 }, { "epoch": 1.15, "learning_rate": 0.00012763536825297254, "loss": 0.0106, "step": 443300 }, { "epoch": 1.15, "learning_rate": 0.00012763148003660106, "loss": 0.0113, "step": 443310 }, { "epoch": 1.15, "learning_rate": 0.0001276275918202296, "loss": 0.0104, "step": 443320 }, { "epoch": 1.15, "learning_rate": 0.00012762370360385814, "loss": 0.0085, "step": 443330 }, { "epoch": 1.15, "learning_rate": 0.00012761981538748668, "loss": 0.0096, "step": 443340 }, { "epoch": 1.15, "learning_rate": 0.0001276159271711152, "loss": 0.0125, "step": 443350 }, { "epoch": 1.15, "learning_rate": 0.00012761203895474374, "loss": 0.011, "step": 443360 }, { "epoch": 1.15, "learning_rate": 0.00012760815073837228, "loss": 0.0157, "step": 443370 }, { "epoch": 1.15, "learning_rate": 0.0001276042625220008, "loss": 0.0128, "step": 443380 }, { "epoch": 1.15, "learning_rate": 0.00012760037430562934, "loss": 0.0122, "step": 443390 }, { "epoch": 1.15, "learning_rate": 0.00012759648608925788, "loss": 0.0108, "step": 443400 }, { "epoch": 1.15, "learning_rate": 0.00012759259787288642, "loss": 0.0117, "step": 443410 }, { "epoch": 1.15, "learning_rate": 0.00012758870965651496, "loss": 0.0112, "step": 443420 }, { "epoch": 1.15, "learning_rate": 0.0001275848214401435, "loss": 0.0116, "step": 443430 }, { "epoch": 1.15, "learning_rate": 0.00012758093322377202, "loss": 0.012, "step": 443440 }, { "epoch": 1.15, "learning_rate": 0.00012757704500740056, "loss": 0.0099, "step": 443450 }, { "epoch": 1.15, "learning_rate": 0.0001275731567910291, "loss": 0.0105, "step": 443460 }, { "epoch": 1.15, "learning_rate": 0.00012756926857465764, "loss": 0.009, "step": 443470 }, { "epoch": 1.15, "learning_rate": 0.00012756538035828616, "loss": 0.0092, "step": 443480 }, { "epoch": 1.15, "learning_rate": 0.0001275614921419147, "loss": 0.0117, "step": 443490 }, { "epoch": 1.15, "learning_rate": 0.00012755760392554324, "loss": 0.0104, "step": 443500 }, { "epoch": 1.15, "learning_rate": 0.00012755371570917178, "loss": 0.0125, "step": 443510 }, { "epoch": 1.15, "learning_rate": 0.0001275498274928003, "loss": 0.0126, "step": 443520 }, { "epoch": 1.15, "learning_rate": 0.00012754593927642884, "loss": 0.0124, "step": 443530 }, { "epoch": 1.15, "learning_rate": 0.00012754205106005738, "loss": 0.0083, "step": 443540 }, { "epoch": 1.15, "learning_rate": 0.00012753816284368592, "loss": 0.0116, "step": 443550 }, { "epoch": 1.15, "learning_rate": 0.00012753427462731444, "loss": 0.0096, "step": 443560 }, { "epoch": 1.15, "learning_rate": 0.000127530386410943, "loss": 0.0111, "step": 443570 }, { "epoch": 1.15, "learning_rate": 0.00012752649819457152, "loss": 0.0113, "step": 443580 }, { "epoch": 1.15, "learning_rate": 0.00012752260997820006, "loss": 0.0089, "step": 443590 }, { "epoch": 1.15, "learning_rate": 0.0001275187217618286, "loss": 0.0083, "step": 443600 }, { "epoch": 1.15, "learning_rate": 0.00012751483354545714, "loss": 0.0146, "step": 443610 }, { "epoch": 1.15, "learning_rate": 0.00012751094532908566, "loss": 0.008, "step": 443620 }, { "epoch": 1.15, "learning_rate": 0.0001275070571127142, "loss": 0.0099, "step": 443630 }, { "epoch": 1.15, "learning_rate": 0.00012750316889634274, "loss": 0.0111, "step": 443640 }, { "epoch": 1.15, "learning_rate": 0.00012749928067997126, "loss": 0.0106, "step": 443650 }, { "epoch": 1.15, "learning_rate": 0.0001274953924635998, "loss": 0.0124, "step": 443660 }, { "epoch": 1.15, "learning_rate": 0.00012749150424722834, "loss": 0.0103, "step": 443670 }, { "epoch": 1.15, "learning_rate": 0.00012748761603085688, "loss": 0.0351, "step": 443680 }, { "epoch": 1.15, "learning_rate": 0.0001274837278144854, "loss": 0.0102, "step": 443690 }, { "epoch": 1.15, "learning_rate": 0.00012747983959811394, "loss": 0.0114, "step": 443700 }, { "epoch": 1.15, "learning_rate": 0.00012747595138174248, "loss": 0.0117, "step": 443710 }, { "epoch": 1.15, "learning_rate": 0.00012747206316537102, "loss": 0.0104, "step": 443720 }, { "epoch": 1.15, "learning_rate": 0.00012746817494899954, "loss": 0.014, "step": 443730 }, { "epoch": 1.15, "learning_rate": 0.0001274642867326281, "loss": 0.0119, "step": 443740 }, { "epoch": 1.15, "learning_rate": 0.00012746039851625662, "loss": 0.0144, "step": 443750 }, { "epoch": 1.15, "learning_rate": 0.00012745651029988516, "loss": 0.0094, "step": 443760 }, { "epoch": 1.15, "learning_rate": 0.0001274526220835137, "loss": 0.0114, "step": 443770 }, { "epoch": 1.15, "learning_rate": 0.00012744873386714224, "loss": 0.0125, "step": 443780 }, { "epoch": 1.15, "learning_rate": 0.00012744484565077076, "loss": 0.0094, "step": 443790 }, { "epoch": 1.15, "learning_rate": 0.0001274409574343993, "loss": 0.0131, "step": 443800 }, { "epoch": 1.15, "learning_rate": 0.00012743706921802784, "loss": 0.0127, "step": 443810 }, { "epoch": 1.15, "learning_rate": 0.00012743318100165638, "loss": 0.0095, "step": 443820 }, { "epoch": 1.15, "learning_rate": 0.0001274292927852849, "loss": 0.0117, "step": 443830 }, { "epoch": 1.15, "learning_rate": 0.00012742540456891344, "loss": 0.0118, "step": 443840 }, { "epoch": 1.15, "learning_rate": 0.00012742151635254198, "loss": 0.0091, "step": 443850 }, { "epoch": 1.15, "learning_rate": 0.00012741762813617052, "loss": 0.0129, "step": 443860 }, { "epoch": 1.15, "learning_rate": 0.00012741373991979904, "loss": 0.0163, "step": 443870 }, { "epoch": 1.15, "learning_rate": 0.00012740985170342758, "loss": 0.0149, "step": 443880 }, { "epoch": 1.15, "learning_rate": 0.00012740596348705612, "loss": 0.0086, "step": 443890 }, { "epoch": 1.15, "learning_rate": 0.00012740207527068463, "loss": 0.0091, "step": 443900 }, { "epoch": 1.15, "learning_rate": 0.00012739818705431318, "loss": 0.013, "step": 443910 }, { "epoch": 1.15, "learning_rate": 0.00012739429883794172, "loss": 0.0096, "step": 443920 }, { "epoch": 1.15, "learning_rate": 0.00012739041062157026, "loss": 0.0119, "step": 443930 }, { "epoch": 1.15, "learning_rate": 0.0001273865224051988, "loss": 0.0091, "step": 443940 }, { "epoch": 1.15, "learning_rate": 0.00012738263418882734, "loss": 0.0081, "step": 443950 }, { "epoch": 1.15, "learning_rate": 0.00012737874597245586, "loss": 0.012, "step": 443960 }, { "epoch": 1.15, "learning_rate": 0.0001273748577560844, "loss": 0.0125, "step": 443970 }, { "epoch": 1.15, "learning_rate": 0.00012737096953971294, "loss": 0.0105, "step": 443980 }, { "epoch": 1.15, "learning_rate": 0.00012736708132334148, "loss": 0.0178, "step": 443990 }, { "epoch": 1.15, "learning_rate": 0.00012736319310697, "loss": 0.0141, "step": 444000 }, { "epoch": 1.15, "eval_cer": 0.8817026863231677, "eval_loss": 0.007035560440272093, "eval_runtime": 107.7478, "eval_samples_per_second": 18.562, "eval_steps_per_second": 4.64, "step": 444000 }, { "epoch": 1.15, "learning_rate": 0.00012735930489059854, "loss": 0.0124, "step": 444010 }, { "epoch": 1.15, "learning_rate": 0.00012735541667422708, "loss": 0.0107, "step": 444020 }, { "epoch": 1.15, "learning_rate": 0.00012735152845785562, "loss": 0.0163, "step": 444030 }, { "epoch": 1.15, "learning_rate": 0.00012734764024148414, "loss": 0.0098, "step": 444040 }, { "epoch": 1.15, "learning_rate": 0.00012734375202511268, "loss": 0.0118, "step": 444050 }, { "epoch": 1.15, "learning_rate": 0.00012733986380874122, "loss": 0.0108, "step": 444060 }, { "epoch": 1.15, "learning_rate": 0.00012733597559236976, "loss": 0.0104, "step": 444070 }, { "epoch": 1.15, "learning_rate": 0.00012733208737599828, "loss": 0.0145, "step": 444080 }, { "epoch": 1.15, "learning_rate": 0.00012732819915962684, "loss": 0.0127, "step": 444090 }, { "epoch": 1.15, "learning_rate": 0.00012732431094325536, "loss": 0.0088, "step": 444100 }, { "epoch": 1.15, "learning_rate": 0.0001273204227268839, "loss": 0.0096, "step": 444110 }, { "epoch": 1.15, "learning_rate": 0.00012731653451051244, "loss": 0.0098, "step": 444120 }, { "epoch": 1.15, "learning_rate": 0.00012731264629414096, "loss": 0.0095, "step": 444130 }, { "epoch": 1.15, "learning_rate": 0.0001273087580777695, "loss": 0.0112, "step": 444140 }, { "epoch": 1.15, "learning_rate": 0.00012730486986139804, "loss": 0.0103, "step": 444150 }, { "epoch": 1.15, "learning_rate": 0.00012730098164502658, "loss": 0.0141, "step": 444160 }, { "epoch": 1.15, "learning_rate": 0.0001272970934286551, "loss": 0.0092, "step": 444170 }, { "epoch": 1.15, "learning_rate": 0.00012729320521228364, "loss": 0.0117, "step": 444180 }, { "epoch": 1.15, "learning_rate": 0.00012728931699591218, "loss": 0.0121, "step": 444190 }, { "epoch": 1.15, "learning_rate": 0.00012728542877954072, "loss": 0.0131, "step": 444200 }, { "epoch": 1.15, "learning_rate": 0.00012728154056316924, "loss": 0.0091, "step": 444210 }, { "epoch": 1.15, "learning_rate": 0.00012727765234679778, "loss": 0.0123, "step": 444220 }, { "epoch": 1.15, "learning_rate": 0.00012727376413042632, "loss": 0.0092, "step": 444230 }, { "epoch": 1.15, "learning_rate": 0.00012726987591405486, "loss": 0.0111, "step": 444240 }, { "epoch": 1.15, "learning_rate": 0.00012726598769768337, "loss": 0.0126, "step": 444250 }, { "epoch": 1.15, "learning_rate": 0.00012726209948131192, "loss": 0.0115, "step": 444260 }, { "epoch": 1.15, "learning_rate": 0.00012725821126494046, "loss": 0.0089, "step": 444270 }, { "epoch": 1.15, "learning_rate": 0.000127254323048569, "loss": 0.0101, "step": 444280 }, { "epoch": 1.15, "learning_rate": 0.00012725043483219754, "loss": 0.0132, "step": 444290 }, { "epoch": 1.15, "learning_rate": 0.00012724654661582608, "loss": 0.0101, "step": 444300 }, { "epoch": 1.15, "learning_rate": 0.0001272426583994546, "loss": 0.0096, "step": 444310 }, { "epoch": 1.15, "learning_rate": 0.00012723877018308314, "loss": 0.012, "step": 444320 }, { "epoch": 1.15, "learning_rate": 0.00012723488196671168, "loss": 0.0096, "step": 444330 }, { "epoch": 1.15, "learning_rate": 0.00012723099375034022, "loss": 0.0129, "step": 444340 }, { "epoch": 1.15, "learning_rate": 0.00012722710553396874, "loss": 0.012, "step": 444350 }, { "epoch": 1.15, "learning_rate": 0.00012722321731759728, "loss": 0.0125, "step": 444360 }, { "epoch": 1.15, "learning_rate": 0.00012721932910122582, "loss": 0.0102, "step": 444370 }, { "epoch": 1.15, "learning_rate": 0.00012721544088485433, "loss": 0.0095, "step": 444380 }, { "epoch": 1.15, "learning_rate": 0.00012721155266848288, "loss": 0.0132, "step": 444390 }, { "epoch": 1.15, "learning_rate": 0.00012720766445211142, "loss": 0.0067, "step": 444400 }, { "epoch": 1.15, "learning_rate": 0.00012720377623573996, "loss": 0.0117, "step": 444410 }, { "epoch": 1.15, "learning_rate": 0.00012719988801936847, "loss": 0.0104, "step": 444420 }, { "epoch": 1.15, "learning_rate": 0.00012719599980299702, "loss": 0.0121, "step": 444430 }, { "epoch": 1.15, "learning_rate": 0.00012719211158662556, "loss": 0.0094, "step": 444440 }, { "epoch": 1.15, "learning_rate": 0.0001271882233702541, "loss": 0.0105, "step": 444450 }, { "epoch": 1.15, "learning_rate": 0.00012718433515388261, "loss": 0.0123, "step": 444460 }, { "epoch": 1.15, "learning_rate": 0.00012718044693751118, "loss": 0.0106, "step": 444470 }, { "epoch": 1.15, "learning_rate": 0.0001271765587211397, "loss": 0.0089, "step": 444480 }, { "epoch": 1.15, "learning_rate": 0.00012717267050476824, "loss": 0.0103, "step": 444490 }, { "epoch": 1.15, "learning_rate": 0.00012716878228839678, "loss": 0.0105, "step": 444500 }, { "epoch": 1.15, "learning_rate": 0.00012716489407202532, "loss": 0.0138, "step": 444510 }, { "epoch": 1.15, "learning_rate": 0.00012716100585565384, "loss": 0.0117, "step": 444520 }, { "epoch": 1.15, "learning_rate": 0.00012715711763928238, "loss": 0.0118, "step": 444530 }, { "epoch": 1.15, "learning_rate": 0.00012715322942291092, "loss": 0.0109, "step": 444540 }, { "epoch": 1.15, "learning_rate": 0.00012714934120653946, "loss": 0.0084, "step": 444550 }, { "epoch": 1.15, "learning_rate": 0.00012714545299016798, "loss": 0.015, "step": 444560 }, { "epoch": 1.15, "learning_rate": 0.00012714156477379652, "loss": 0.0119, "step": 444570 }, { "epoch": 1.15, "learning_rate": 0.00012713767655742506, "loss": 0.0087, "step": 444580 }, { "epoch": 1.15, "learning_rate": 0.0001271337883410536, "loss": 0.0156, "step": 444590 }, { "epoch": 1.15, "learning_rate": 0.00012712990012468212, "loss": 0.0104, "step": 444600 }, { "epoch": 1.15, "learning_rate": 0.00012712601190831066, "loss": 0.0109, "step": 444610 }, { "epoch": 1.15, "learning_rate": 0.0001271221236919392, "loss": 0.0125, "step": 444620 }, { "epoch": 1.15, "learning_rate": 0.0001271182354755677, "loss": 0.0105, "step": 444630 }, { "epoch": 1.15, "learning_rate": 0.00012711434725919628, "loss": 0.0094, "step": 444640 }, { "epoch": 1.15, "learning_rate": 0.0001271104590428248, "loss": 0.0113, "step": 444650 }, { "epoch": 1.15, "learning_rate": 0.00012710657082645334, "loss": 0.0124, "step": 444660 }, { "epoch": 1.15, "learning_rate": 0.00012710268261008188, "loss": 0.01, "step": 444670 }, { "epoch": 1.15, "learning_rate": 0.00012709879439371042, "loss": 0.0107, "step": 444680 }, { "epoch": 1.15, "learning_rate": 0.00012709490617733894, "loss": 0.0124, "step": 444690 }, { "epoch": 1.15, "learning_rate": 0.00012709101796096748, "loss": 0.012, "step": 444700 }, { "epoch": 1.15, "learning_rate": 0.00012708712974459602, "loss": 0.0126, "step": 444710 }, { "epoch": 1.15, "learning_rate": 0.00012708324152822456, "loss": 0.0099, "step": 444720 }, { "epoch": 1.15, "learning_rate": 0.00012707935331185308, "loss": 0.0183, "step": 444730 }, { "epoch": 1.15, "learning_rate": 0.00012707546509548162, "loss": 0.0119, "step": 444740 }, { "epoch": 1.15, "learning_rate": 0.00012707157687911016, "loss": 0.0145, "step": 444750 }, { "epoch": 1.15, "learning_rate": 0.0001270676886627387, "loss": 0.011, "step": 444760 }, { "epoch": 1.15, "learning_rate": 0.00012706380044636721, "loss": 0.0127, "step": 444770 }, { "epoch": 1.15, "learning_rate": 0.00012705991222999576, "loss": 0.0104, "step": 444780 }, { "epoch": 1.15, "learning_rate": 0.0001270560240136243, "loss": 0.0105, "step": 444790 }, { "epoch": 1.15, "learning_rate": 0.00012705213579725284, "loss": 0.0111, "step": 444800 }, { "epoch": 1.15, "learning_rate": 0.00012704824758088138, "loss": 0.0091, "step": 444810 }, { "epoch": 1.15, "learning_rate": 0.00012704435936450992, "loss": 0.0098, "step": 444820 }, { "epoch": 1.15, "learning_rate": 0.00012704047114813844, "loss": 0.0124, "step": 444830 }, { "epoch": 1.15, "learning_rate": 0.00012703658293176698, "loss": 0.0098, "step": 444840 }, { "epoch": 1.15, "learning_rate": 0.00012703269471539552, "loss": 0.0112, "step": 444850 }, { "epoch": 1.15, "learning_rate": 0.00012702880649902404, "loss": 0.0129, "step": 444860 }, { "epoch": 1.15, "learning_rate": 0.00012702491828265258, "loss": 0.0115, "step": 444870 }, { "epoch": 1.15, "learning_rate": 0.00012702103006628112, "loss": 0.0126, "step": 444880 }, { "epoch": 1.15, "learning_rate": 0.00012701714184990966, "loss": 0.0083, "step": 444890 }, { "epoch": 1.15, "learning_rate": 0.00012701325363353817, "loss": 0.0109, "step": 444900 }, { "epoch": 1.15, "learning_rate": 0.00012700936541716672, "loss": 0.0094, "step": 444910 }, { "epoch": 1.15, "learning_rate": 0.00012700547720079526, "loss": 0.014, "step": 444920 }, { "epoch": 1.15, "learning_rate": 0.0001270015889844238, "loss": 0.0131, "step": 444930 }, { "epoch": 1.15, "learning_rate": 0.00012699770076805231, "loss": 0.0108, "step": 444940 }, { "epoch": 1.15, "learning_rate": 0.00012699381255168086, "loss": 0.0099, "step": 444950 }, { "epoch": 1.15, "learning_rate": 0.0001269899243353094, "loss": 0.0109, "step": 444960 }, { "epoch": 1.15, "learning_rate": 0.00012698603611893794, "loss": 0.0117, "step": 444970 }, { "epoch": 1.15, "learning_rate": 0.00012698214790256645, "loss": 0.0126, "step": 444980 }, { "epoch": 1.15, "learning_rate": 0.00012697825968619502, "loss": 0.0106, "step": 444990 }, { "epoch": 1.15, "learning_rate": 0.00012697437146982354, "loss": 0.0111, "step": 445000 }, { "epoch": 1.15, "eval_cer": 0.8817152830555753, "eval_loss": 0.0074842702597379684, "eval_runtime": 107.1551, "eval_samples_per_second": 18.665, "eval_steps_per_second": 4.666, "step": 445000 }, { "epoch": 1.15, "learning_rate": 0.00012697048325345208, "loss": 0.0119, "step": 445010 }, { "epoch": 1.15, "learning_rate": 0.00012696659503708062, "loss": 0.0057, "step": 445020 }, { "epoch": 1.15, "learning_rate": 0.00012696270682070916, "loss": 0.0092, "step": 445030 }, { "epoch": 1.15, "learning_rate": 0.00012695881860433768, "loss": 0.0106, "step": 445040 }, { "epoch": 1.15, "learning_rate": 0.00012695493038796622, "loss": 0.0132, "step": 445050 }, { "epoch": 1.15, "learning_rate": 0.00012695104217159476, "loss": 0.0132, "step": 445060 }, { "epoch": 1.15, "learning_rate": 0.0001269471539552233, "loss": 0.0126, "step": 445070 }, { "epoch": 1.15, "learning_rate": 0.00012694326573885182, "loss": 0.0109, "step": 445080 }, { "epoch": 1.15, "learning_rate": 0.00012693937752248036, "loss": 0.0095, "step": 445090 }, { "epoch": 1.15, "learning_rate": 0.0001269354893061089, "loss": 0.0139, "step": 445100 }, { "epoch": 1.15, "learning_rate": 0.00012693160108973741, "loss": 0.0123, "step": 445110 }, { "epoch": 1.15, "learning_rate": 0.00012692771287336596, "loss": 0.0115, "step": 445120 }, { "epoch": 1.15, "learning_rate": 0.0001269238246569945, "loss": 0.0115, "step": 445130 }, { "epoch": 1.15, "learning_rate": 0.00012691993644062304, "loss": 0.0086, "step": 445140 }, { "epoch": 1.15, "learning_rate": 0.00012691604822425155, "loss": 0.009, "step": 445150 }, { "epoch": 1.15, "learning_rate": 0.00012691216000788012, "loss": 0.0094, "step": 445160 }, { "epoch": 1.15, "learning_rate": 0.00012690827179150864, "loss": 0.011, "step": 445170 }, { "epoch": 1.15, "learning_rate": 0.00012690438357513718, "loss": 0.0102, "step": 445180 }, { "epoch": 1.15, "learning_rate": 0.00012690049535876572, "loss": 0.0119, "step": 445190 }, { "epoch": 1.15, "learning_rate": 0.00012689660714239426, "loss": 0.0122, "step": 445200 }, { "epoch": 1.15, "learning_rate": 0.00012689271892602278, "loss": 0.0079, "step": 445210 }, { "epoch": 1.15, "learning_rate": 0.00012688883070965132, "loss": 0.0083, "step": 445220 }, { "epoch": 1.15, "learning_rate": 0.00012688494249327986, "loss": 0.0132, "step": 445230 }, { "epoch": 1.15, "learning_rate": 0.0001268810542769084, "loss": 0.0118, "step": 445240 }, { "epoch": 1.15, "learning_rate": 0.00012687716606053692, "loss": 0.0103, "step": 445250 }, { "epoch": 1.15, "learning_rate": 0.00012687327784416546, "loss": 0.013, "step": 445260 }, { "epoch": 1.15, "learning_rate": 0.000126869389627794, "loss": 0.0112, "step": 445270 }, { "epoch": 1.15, "learning_rate": 0.00012686550141142254, "loss": 0.0147, "step": 445280 }, { "epoch": 1.15, "learning_rate": 0.00012686161319505105, "loss": 0.0101, "step": 445290 }, { "epoch": 1.15, "learning_rate": 0.0001268577249786796, "loss": 0.0122, "step": 445300 }, { "epoch": 1.15, "learning_rate": 0.00012685383676230814, "loss": 0.0104, "step": 445310 }, { "epoch": 1.15, "learning_rate": 0.00012684994854593668, "loss": 0.01, "step": 445320 }, { "epoch": 1.15, "learning_rate": 0.00012684606032956522, "loss": 0.0094, "step": 445330 }, { "epoch": 1.15, "learning_rate": 0.00012684217211319376, "loss": 0.0109, "step": 445340 }, { "epoch": 1.15, "learning_rate": 0.00012683828389682228, "loss": 0.0112, "step": 445350 }, { "epoch": 1.15, "learning_rate": 0.00012683439568045082, "loss": 0.0138, "step": 445360 }, { "epoch": 1.15, "learning_rate": 0.00012683050746407936, "loss": 0.011, "step": 445370 }, { "epoch": 1.15, "learning_rate": 0.00012682661924770788, "loss": 0.0109, "step": 445380 }, { "epoch": 1.15, "learning_rate": 0.00012682273103133642, "loss": 0.0129, "step": 445390 }, { "epoch": 1.15, "learning_rate": 0.00012681884281496496, "loss": 0.0098, "step": 445400 }, { "epoch": 1.15, "learning_rate": 0.0001268149545985935, "loss": 0.0134, "step": 445410 }, { "epoch": 1.15, "learning_rate": 0.00012681106638222201, "loss": 0.0109, "step": 445420 }, { "epoch": 1.15, "learning_rate": 0.00012680717816585056, "loss": 0.0103, "step": 445430 }, { "epoch": 1.15, "learning_rate": 0.0001268032899494791, "loss": 0.0109, "step": 445440 }, { "epoch": 1.15, "learning_rate": 0.00012679940173310764, "loss": 0.0103, "step": 445450 }, { "epoch": 1.15, "learning_rate": 0.00012679551351673615, "loss": 0.0138, "step": 445460 }, { "epoch": 1.15, "learning_rate": 0.0001267916253003647, "loss": 0.011, "step": 445470 }, { "epoch": 1.15, "learning_rate": 0.00012678773708399324, "loss": 0.0107, "step": 445480 }, { "epoch": 1.15, "learning_rate": 0.00012678384886762178, "loss": 0.0156, "step": 445490 }, { "epoch": 1.15, "learning_rate": 0.0001267799606512503, "loss": 0.0083, "step": 445500 }, { "epoch": 1.15, "learning_rate": 0.00012677607243487886, "loss": 0.0105, "step": 445510 }, { "epoch": 1.15, "learning_rate": 0.00012677218421850738, "loss": 0.01, "step": 445520 }, { "epoch": 1.15, "learning_rate": 0.00012676829600213592, "loss": 0.0128, "step": 445530 }, { "epoch": 1.15, "learning_rate": 0.00012676440778576446, "loss": 0.0117, "step": 445540 }, { "epoch": 1.15, "learning_rate": 0.000126760519569393, "loss": 0.0102, "step": 445550 }, { "epoch": 1.15, "learning_rate": 0.00012675663135302152, "loss": 0.0099, "step": 445560 }, { "epoch": 1.15, "learning_rate": 0.00012675274313665006, "loss": 0.0099, "step": 445570 }, { "epoch": 1.16, "learning_rate": 0.0001267488549202786, "loss": 0.0102, "step": 445580 }, { "epoch": 1.16, "learning_rate": 0.00012674496670390714, "loss": 0.0117, "step": 445590 }, { "epoch": 1.16, "learning_rate": 0.00012674107848753566, "loss": 0.0091, "step": 445600 }, { "epoch": 1.16, "learning_rate": 0.0001267371902711642, "loss": 0.0095, "step": 445610 }, { "epoch": 1.16, "learning_rate": 0.00012673330205479274, "loss": 0.0104, "step": 445620 }, { "epoch": 1.16, "learning_rate": 0.00012672941383842125, "loss": 0.013, "step": 445630 }, { "epoch": 1.16, "learning_rate": 0.0001267255256220498, "loss": 0.0159, "step": 445640 }, { "epoch": 1.16, "learning_rate": 0.00012672163740567834, "loss": 0.0143, "step": 445650 }, { "epoch": 1.16, "learning_rate": 0.00012671774918930688, "loss": 0.0111, "step": 445660 }, { "epoch": 1.16, "learning_rate": 0.0001267138609729354, "loss": 0.0078, "step": 445670 }, { "epoch": 1.16, "learning_rate": 0.00012670997275656396, "loss": 0.0076, "step": 445680 }, { "epoch": 1.16, "learning_rate": 0.00012670608454019248, "loss": 0.0154, "step": 445690 }, { "epoch": 1.16, "learning_rate": 0.00012670219632382102, "loss": 0.0127, "step": 445700 }, { "epoch": 1.16, "learning_rate": 0.00012669830810744956, "loss": 0.0094, "step": 445710 }, { "epoch": 1.16, "learning_rate": 0.0001266944198910781, "loss": 0.0105, "step": 445720 }, { "epoch": 1.16, "learning_rate": 0.00012669053167470662, "loss": 0.0108, "step": 445730 }, { "epoch": 1.16, "learning_rate": 0.00012668664345833516, "loss": 0.0092, "step": 445740 }, { "epoch": 1.16, "learning_rate": 0.0001266827552419637, "loss": 0.0108, "step": 445750 }, { "epoch": 1.16, "learning_rate": 0.00012667886702559224, "loss": 0.01, "step": 445760 }, { "epoch": 1.16, "learning_rate": 0.00012667497880922076, "loss": 0.0108, "step": 445770 }, { "epoch": 1.16, "learning_rate": 0.0001266710905928493, "loss": 0.0107, "step": 445780 }, { "epoch": 1.16, "learning_rate": 0.00012666720237647784, "loss": 0.0114, "step": 445790 }, { "epoch": 1.16, "learning_rate": 0.00012666331416010638, "loss": 0.0092, "step": 445800 }, { "epoch": 1.16, "learning_rate": 0.0001266594259437349, "loss": 0.0145, "step": 445810 }, { "epoch": 1.16, "learning_rate": 0.00012665553772736344, "loss": 0.0143, "step": 445820 }, { "epoch": 1.16, "learning_rate": 0.00012665164951099198, "loss": 0.0114, "step": 445830 }, { "epoch": 1.16, "learning_rate": 0.00012664776129462052, "loss": 0.0116, "step": 445840 }, { "epoch": 1.16, "learning_rate": 0.00012664387307824903, "loss": 0.0125, "step": 445850 }, { "epoch": 1.16, "learning_rate": 0.00012663998486187758, "loss": 0.0113, "step": 445860 }, { "epoch": 1.16, "learning_rate": 0.00012663609664550612, "loss": 0.0071, "step": 445870 }, { "epoch": 1.16, "learning_rate": 0.00012663220842913466, "loss": 0.022, "step": 445880 }, { "epoch": 1.16, "learning_rate": 0.0001266283202127632, "loss": 0.0099, "step": 445890 }, { "epoch": 1.16, "learning_rate": 0.00012662443199639172, "loss": 0.013, "step": 445900 }, { "epoch": 1.16, "learning_rate": 0.00012662054378002026, "loss": 0.0106, "step": 445910 }, { "epoch": 1.16, "learning_rate": 0.0001266166555636488, "loss": 0.0121, "step": 445920 }, { "epoch": 1.16, "learning_rate": 0.00012661276734727734, "loss": 0.0152, "step": 445930 }, { "epoch": 1.16, "learning_rate": 0.00012660887913090585, "loss": 0.0137, "step": 445940 }, { "epoch": 1.16, "learning_rate": 0.0001266049909145344, "loss": 0.0101, "step": 445950 }, { "epoch": 1.16, "learning_rate": 0.00012660110269816294, "loss": 0.011, "step": 445960 }, { "epoch": 1.16, "learning_rate": 0.00012659721448179148, "loss": 0.0117, "step": 445970 }, { "epoch": 1.16, "learning_rate": 0.00012659332626542, "loss": 0.0094, "step": 445980 }, { "epoch": 1.16, "learning_rate": 0.00012658943804904854, "loss": 0.0074, "step": 445990 }, { "epoch": 1.16, "learning_rate": 0.00012658554983267708, "loss": 0.0116, "step": 446000 }, { "epoch": 1.16, "eval_cer": 0.8816648961259449, "eval_loss": 0.007201557978987694, "eval_runtime": 107.397, "eval_samples_per_second": 18.622, "eval_steps_per_second": 4.656, "step": 446000 }, { "epoch": 1.16, "learning_rate": 0.00012658166161630562, "loss": 0.0083, "step": 446010 }, { "epoch": 1.16, "learning_rate": 0.00012657777339993413, "loss": 0.0113, "step": 446020 }, { "epoch": 1.16, "learning_rate": 0.0001265738851835627, "loss": 0.0161, "step": 446030 }, { "epoch": 1.16, "learning_rate": 0.00012656999696719122, "loss": 0.0103, "step": 446040 }, { "epoch": 1.16, "learning_rate": 0.00012656610875081976, "loss": 0.0126, "step": 446050 }, { "epoch": 1.16, "learning_rate": 0.0001265622205344483, "loss": 0.0123, "step": 446060 }, { "epoch": 1.16, "learning_rate": 0.00012655833231807684, "loss": 0.0102, "step": 446070 }, { "epoch": 1.16, "learning_rate": 0.00012655444410170536, "loss": 0.0115, "step": 446080 }, { "epoch": 1.16, "learning_rate": 0.0001265505558853339, "loss": 0.0106, "step": 446090 }, { "epoch": 1.16, "learning_rate": 0.00012654666766896244, "loss": 0.0116, "step": 446100 }, { "epoch": 1.16, "learning_rate": 0.00012654277945259095, "loss": 0.0133, "step": 446110 }, { "epoch": 1.16, "learning_rate": 0.0001265388912362195, "loss": 0.0136, "step": 446120 }, { "epoch": 1.16, "learning_rate": 0.00012653500301984804, "loss": 0.0127, "step": 446130 }, { "epoch": 1.16, "learning_rate": 0.00012653111480347658, "loss": 0.0111, "step": 446140 }, { "epoch": 1.16, "learning_rate": 0.0001265272265871051, "loss": 0.0091, "step": 446150 }, { "epoch": 1.16, "learning_rate": 0.00012652333837073364, "loss": 0.0152, "step": 446160 }, { "epoch": 1.16, "learning_rate": 0.00012651945015436218, "loss": 0.0087, "step": 446170 }, { "epoch": 1.16, "learning_rate": 0.00012651556193799072, "loss": 0.0123, "step": 446180 }, { "epoch": 1.16, "learning_rate": 0.00012651167372161923, "loss": 0.0111, "step": 446190 }, { "epoch": 1.16, "learning_rate": 0.0001265077855052478, "loss": 0.0112, "step": 446200 }, { "epoch": 1.16, "learning_rate": 0.00012650389728887632, "loss": 0.0139, "step": 446210 }, { "epoch": 1.16, "learning_rate": 0.00012650000907250486, "loss": 0.014, "step": 446220 }, { "epoch": 1.16, "learning_rate": 0.0001264961208561334, "loss": 0.0096, "step": 446230 }, { "epoch": 1.16, "learning_rate": 0.00012649223263976194, "loss": 0.0118, "step": 446240 }, { "epoch": 1.16, "learning_rate": 0.00012648834442339046, "loss": 0.0156, "step": 446250 }, { "epoch": 1.16, "learning_rate": 0.000126484456207019, "loss": 0.0102, "step": 446260 }, { "epoch": 1.16, "learning_rate": 0.00012648056799064754, "loss": 0.0093, "step": 446270 }, { "epoch": 1.16, "learning_rate": 0.00012647667977427608, "loss": 0.0105, "step": 446280 }, { "epoch": 1.16, "learning_rate": 0.0001264727915579046, "loss": 0.0137, "step": 446290 }, { "epoch": 1.16, "learning_rate": 0.00012646890334153314, "loss": 0.009, "step": 446300 }, { "epoch": 1.16, "learning_rate": 0.00012646501512516168, "loss": 0.0087, "step": 446310 }, { "epoch": 1.16, "learning_rate": 0.00012646112690879022, "loss": 0.0098, "step": 446320 }, { "epoch": 1.16, "learning_rate": 0.00012645723869241873, "loss": 0.0155, "step": 446330 }, { "epoch": 1.16, "learning_rate": 0.00012645335047604728, "loss": 0.0101, "step": 446340 }, { "epoch": 1.16, "learning_rate": 0.00012644946225967582, "loss": 0.0106, "step": 446350 }, { "epoch": 1.16, "learning_rate": 0.00012644557404330433, "loss": 0.0104, "step": 446360 }, { "epoch": 1.16, "learning_rate": 0.00012644168582693287, "loss": 0.0101, "step": 446370 }, { "epoch": 1.16, "learning_rate": 0.00012643779761056142, "loss": 0.01, "step": 446380 }, { "epoch": 1.16, "learning_rate": 0.00012643390939418996, "loss": 0.0109, "step": 446390 }, { "epoch": 1.16, "learning_rate": 0.0001264300211778185, "loss": 0.0098, "step": 446400 }, { "epoch": 1.16, "learning_rate": 0.00012642613296144704, "loss": 0.0098, "step": 446410 }, { "epoch": 1.16, "learning_rate": 0.00012642224474507556, "loss": 0.0118, "step": 446420 }, { "epoch": 1.16, "learning_rate": 0.0001264183565287041, "loss": 0.0109, "step": 446430 }, { "epoch": 1.16, "learning_rate": 0.00012641446831233264, "loss": 0.0113, "step": 446440 }, { "epoch": 1.16, "learning_rate": 0.00012641058009596118, "loss": 0.0082, "step": 446450 }, { "epoch": 1.16, "learning_rate": 0.0001264066918795897, "loss": 0.0118, "step": 446460 }, { "epoch": 1.16, "learning_rate": 0.00012640280366321824, "loss": 0.0127, "step": 446470 }, { "epoch": 1.16, "learning_rate": 0.00012639891544684678, "loss": 0.0111, "step": 446480 }, { "epoch": 1.16, "learning_rate": 0.00012639502723047532, "loss": 0.0103, "step": 446490 }, { "epoch": 1.16, "learning_rate": 0.00012639113901410383, "loss": 0.0139, "step": 446500 }, { "epoch": 1.16, "learning_rate": 0.00012638725079773238, "loss": 0.0137, "step": 446510 }, { "epoch": 1.16, "learning_rate": 0.00012638336258136092, "loss": 0.0123, "step": 446520 }, { "epoch": 1.16, "learning_rate": 0.00012637947436498946, "loss": 0.013, "step": 446530 }, { "epoch": 1.16, "learning_rate": 0.00012637558614861797, "loss": 0.0136, "step": 446540 }, { "epoch": 1.16, "learning_rate": 0.00012637169793224654, "loss": 0.0098, "step": 446550 }, { "epoch": 1.16, "learning_rate": 0.00012636780971587506, "loss": 0.0102, "step": 446560 }, { "epoch": 1.16, "learning_rate": 0.0001263639214995036, "loss": 0.0126, "step": 446570 }, { "epoch": 1.16, "learning_rate": 0.00012636003328313214, "loss": 0.0083, "step": 446580 }, { "epoch": 1.16, "learning_rate": 0.00012635614506676068, "loss": 0.0126, "step": 446590 }, { "epoch": 1.16, "learning_rate": 0.0001263522568503892, "loss": 0.0125, "step": 446600 }, { "epoch": 1.16, "learning_rate": 0.00012634836863401774, "loss": 0.0121, "step": 446610 }, { "epoch": 1.16, "learning_rate": 0.00012634448041764628, "loss": 0.0121, "step": 446620 }, { "epoch": 1.16, "learning_rate": 0.0001263405922012748, "loss": 0.0132, "step": 446630 }, { "epoch": 1.16, "learning_rate": 0.00012633670398490334, "loss": 0.0117, "step": 446640 }, { "epoch": 1.16, "learning_rate": 0.00012633281576853188, "loss": 0.0113, "step": 446650 }, { "epoch": 1.16, "learning_rate": 0.00012632892755216042, "loss": 0.0088, "step": 446660 }, { "epoch": 1.16, "learning_rate": 0.00012632503933578893, "loss": 0.0097, "step": 446670 }, { "epoch": 1.16, "learning_rate": 0.00012632115111941748, "loss": 0.01, "step": 446680 }, { "epoch": 1.16, "learning_rate": 0.00012631726290304602, "loss": 0.0099, "step": 446690 }, { "epoch": 1.16, "learning_rate": 0.00012631337468667456, "loss": 0.01, "step": 446700 }, { "epoch": 1.16, "learning_rate": 0.00012630948647030307, "loss": 0.0099, "step": 446710 }, { "epoch": 1.16, "learning_rate": 0.00012630559825393161, "loss": 0.0136, "step": 446720 }, { "epoch": 1.16, "learning_rate": 0.00012630171003756016, "loss": 0.0112, "step": 446730 }, { "epoch": 1.16, "learning_rate": 0.0001262978218211887, "loss": 0.0101, "step": 446740 }, { "epoch": 1.16, "learning_rate": 0.00012629393360481724, "loss": 0.0108, "step": 446750 }, { "epoch": 1.16, "learning_rate": 0.00012629004538844578, "loss": 0.0086, "step": 446760 }, { "epoch": 1.16, "learning_rate": 0.0001262861571720743, "loss": 0.0108, "step": 446770 }, { "epoch": 1.16, "learning_rate": 0.00012628226895570284, "loss": 0.0128, "step": 446780 }, { "epoch": 1.16, "learning_rate": 0.00012627838073933138, "loss": 0.01, "step": 446790 }, { "epoch": 1.16, "learning_rate": 0.00012627449252295992, "loss": 0.0126, "step": 446800 }, { "epoch": 1.16, "learning_rate": 0.00012627060430658844, "loss": 0.0117, "step": 446810 }, { "epoch": 1.16, "learning_rate": 0.00012626671609021698, "loss": 0.0155, "step": 446820 }, { "epoch": 1.16, "learning_rate": 0.00012626282787384552, "loss": 0.0132, "step": 446830 }, { "epoch": 1.16, "learning_rate": 0.00012625893965747406, "loss": 0.01, "step": 446840 }, { "epoch": 1.16, "learning_rate": 0.00012625505144110257, "loss": 0.0109, "step": 446850 }, { "epoch": 1.16, "learning_rate": 0.00012625116322473112, "loss": 0.0115, "step": 446860 }, { "epoch": 1.16, "learning_rate": 0.00012624727500835966, "loss": 0.0134, "step": 446870 }, { "epoch": 1.16, "learning_rate": 0.00012624338679198817, "loss": 0.009, "step": 446880 }, { "epoch": 1.16, "learning_rate": 0.00012623949857561671, "loss": 0.0109, "step": 446890 }, { "epoch": 1.16, "learning_rate": 0.00012623561035924526, "loss": 0.0089, "step": 446900 }, { "epoch": 1.16, "learning_rate": 0.0001262317221428738, "loss": 0.0101, "step": 446910 }, { "epoch": 1.16, "learning_rate": 0.00012622783392650234, "loss": 0.0096, "step": 446920 }, { "epoch": 1.16, "learning_rate": 0.00012622394571013088, "loss": 0.0117, "step": 446930 }, { "epoch": 1.16, "learning_rate": 0.0001262200574937594, "loss": 0.0086, "step": 446940 }, { "epoch": 1.16, "learning_rate": 0.00012621616927738794, "loss": 0.0111, "step": 446950 }, { "epoch": 1.16, "learning_rate": 0.00012621228106101648, "loss": 0.0108, "step": 446960 }, { "epoch": 1.16, "learning_rate": 0.00012620839284464502, "loss": 0.01, "step": 446970 }, { "epoch": 1.16, "learning_rate": 0.00012620450462827353, "loss": 0.0092, "step": 446980 }, { "epoch": 1.16, "learning_rate": 0.00012620061641190208, "loss": 0.0144, "step": 446990 }, { "epoch": 1.16, "learning_rate": 0.00012619672819553062, "loss": 0.0123, "step": 447000 }, { "epoch": 1.16, "eval_cer": 0.8817054855970361, "eval_loss": 0.007263442501425743, "eval_runtime": 107.2268, "eval_samples_per_second": 18.652, "eval_steps_per_second": 4.663, "step": 447000 }, { "epoch": 1.16, "learning_rate": 0.00012619283997915916, "loss": 0.0073, "step": 447010 }, { "epoch": 1.16, "learning_rate": 0.00012618895176278767, "loss": 0.0123, "step": 447020 }, { "epoch": 1.16, "learning_rate": 0.00012618506354641622, "loss": 0.0104, "step": 447030 }, { "epoch": 1.16, "learning_rate": 0.00012618117533004476, "loss": 0.0112, "step": 447040 }, { "epoch": 1.16, "learning_rate": 0.0001261772871136733, "loss": 0.0092, "step": 447050 }, { "epoch": 1.16, "learning_rate": 0.0001261733988973018, "loss": 0.0101, "step": 447060 }, { "epoch": 1.16, "learning_rate": 0.00012616951068093038, "loss": 0.0117, "step": 447070 }, { "epoch": 1.16, "learning_rate": 0.0001261656224645589, "loss": 0.0119, "step": 447080 }, { "epoch": 1.16, "learning_rate": 0.0001261617342481874, "loss": 0.0108, "step": 447090 }, { "epoch": 1.16, "learning_rate": 0.00012615784603181598, "loss": 0.0097, "step": 447100 }, { "epoch": 1.16, "learning_rate": 0.0001261539578154445, "loss": 0.0115, "step": 447110 }, { "epoch": 1.16, "learning_rate": 0.00012615006959907304, "loss": 0.0137, "step": 447120 }, { "epoch": 1.16, "learning_rate": 0.00012614618138270158, "loss": 0.0121, "step": 447130 }, { "epoch": 1.16, "learning_rate": 0.00012614229316633012, "loss": 0.0108, "step": 447140 }, { "epoch": 1.16, "learning_rate": 0.00012613840494995863, "loss": 0.0075, "step": 447150 }, { "epoch": 1.16, "learning_rate": 0.00012613451673358718, "loss": 0.0086, "step": 447160 }, { "epoch": 1.16, "learning_rate": 0.00012613062851721572, "loss": 0.0083, "step": 447170 }, { "epoch": 1.16, "learning_rate": 0.00012612674030084426, "loss": 0.0128, "step": 447180 }, { "epoch": 1.16, "learning_rate": 0.00012612285208447277, "loss": 0.0112, "step": 447190 }, { "epoch": 1.16, "learning_rate": 0.00012611896386810131, "loss": 0.0136, "step": 447200 }, { "epoch": 1.16, "learning_rate": 0.00012611507565172986, "loss": 0.0101, "step": 447210 }, { "epoch": 1.16, "learning_rate": 0.0001261111874353584, "loss": 0.0096, "step": 447220 }, { "epoch": 1.16, "learning_rate": 0.0001261072992189869, "loss": 0.0114, "step": 447230 }, { "epoch": 1.16, "learning_rate": 0.00012610341100261545, "loss": 0.0103, "step": 447240 }, { "epoch": 1.16, "learning_rate": 0.000126099522786244, "loss": 0.0117, "step": 447250 }, { "epoch": 1.16, "learning_rate": 0.00012609563456987254, "loss": 0.0135, "step": 447260 }, { "epoch": 1.16, "learning_rate": 0.00012609174635350108, "loss": 0.0095, "step": 447270 }, { "epoch": 1.16, "learning_rate": 0.00012608785813712962, "loss": 0.0106, "step": 447280 }, { "epoch": 1.16, "learning_rate": 0.00012608396992075814, "loss": 0.0092, "step": 447290 }, { "epoch": 1.16, "learning_rate": 0.00012608008170438668, "loss": 0.0115, "step": 447300 }, { "epoch": 1.16, "learning_rate": 0.00012607619348801522, "loss": 0.0082, "step": 447310 }, { "epoch": 1.16, "learning_rate": 0.00012607230527164376, "loss": 0.013, "step": 447320 }, { "epoch": 1.16, "learning_rate": 0.00012606841705527227, "loss": 0.0138, "step": 447330 }, { "epoch": 1.16, "learning_rate": 0.00012606452883890082, "loss": 0.0081, "step": 447340 }, { "epoch": 1.16, "learning_rate": 0.00012606064062252936, "loss": 0.0149, "step": 447350 }, { "epoch": 1.16, "learning_rate": 0.00012605675240615787, "loss": 0.0123, "step": 447360 }, { "epoch": 1.16, "learning_rate": 0.00012605286418978641, "loss": 0.0151, "step": 447370 }, { "epoch": 1.16, "learning_rate": 0.00012604897597341496, "loss": 0.0095, "step": 447380 }, { "epoch": 1.16, "learning_rate": 0.0001260450877570435, "loss": 0.0107, "step": 447390 }, { "epoch": 1.16, "learning_rate": 0.000126041199540672, "loss": 0.0082, "step": 447400 }, { "epoch": 1.16, "learning_rate": 0.00012603731132430055, "loss": 0.0115, "step": 447410 }, { "epoch": 1.16, "learning_rate": 0.0001260334231079291, "loss": 0.0109, "step": 447420 }, { "epoch": 1.16, "learning_rate": 0.00012602953489155764, "loss": 0.0106, "step": 447430 }, { "epoch": 1.16, "learning_rate": 0.00012602564667518615, "loss": 0.0127, "step": 447440 }, { "epoch": 1.16, "learning_rate": 0.00012602175845881472, "loss": 0.012, "step": 447450 }, { "epoch": 1.16, "learning_rate": 0.00012601787024244323, "loss": 0.0105, "step": 447460 }, { "epoch": 1.16, "learning_rate": 0.00012601398202607178, "loss": 0.0099, "step": 447470 }, { "epoch": 1.16, "learning_rate": 0.00012601009380970032, "loss": 0.0103, "step": 447480 }, { "epoch": 1.16, "learning_rate": 0.00012600620559332886, "loss": 0.0115, "step": 447490 }, { "epoch": 1.16, "learning_rate": 0.00012600231737695737, "loss": 0.0123, "step": 447500 }, { "epoch": 1.16, "learning_rate": 0.00012599842916058592, "loss": 0.0079, "step": 447510 }, { "epoch": 1.16, "learning_rate": 0.00012599454094421446, "loss": 0.0111, "step": 447520 }, { "epoch": 1.16, "learning_rate": 0.000125990652727843, "loss": 0.0126, "step": 447530 }, { "epoch": 1.16, "learning_rate": 0.00012598676451147151, "loss": 0.008, "step": 447540 }, { "epoch": 1.16, "learning_rate": 0.00012598287629510006, "loss": 0.0124, "step": 447550 }, { "epoch": 1.16, "learning_rate": 0.0001259789880787286, "loss": 0.0078, "step": 447560 }, { "epoch": 1.16, "learning_rate": 0.00012597509986235714, "loss": 0.01, "step": 447570 }, { "epoch": 1.16, "learning_rate": 0.00012597121164598565, "loss": 0.0123, "step": 447580 }, { "epoch": 1.16, "learning_rate": 0.0001259673234296142, "loss": 0.013, "step": 447590 }, { "epoch": 1.16, "learning_rate": 0.00012596343521324274, "loss": 0.0099, "step": 447600 }, { "epoch": 1.16, "learning_rate": 0.00012595954699687125, "loss": 0.0103, "step": 447610 }, { "epoch": 1.16, "learning_rate": 0.00012595565878049982, "loss": 0.0112, "step": 447620 }, { "epoch": 1.16, "learning_rate": 0.00012595177056412833, "loss": 0.012, "step": 447630 }, { "epoch": 1.16, "learning_rate": 0.00012594788234775688, "loss": 0.011, "step": 447640 }, { "epoch": 1.16, "learning_rate": 0.00012594399413138542, "loss": 0.0101, "step": 447650 }, { "epoch": 1.16, "learning_rate": 0.00012594010591501396, "loss": 0.0097, "step": 447660 }, { "epoch": 1.16, "learning_rate": 0.00012593621769864247, "loss": 0.0087, "step": 447670 }, { "epoch": 1.16, "learning_rate": 0.00012593232948227102, "loss": 0.0162, "step": 447680 }, { "epoch": 1.16, "learning_rate": 0.00012592844126589956, "loss": 0.0118, "step": 447690 }, { "epoch": 1.16, "learning_rate": 0.0001259245530495281, "loss": 0.0111, "step": 447700 }, { "epoch": 1.16, "learning_rate": 0.0001259206648331566, "loss": 0.012, "step": 447710 }, { "epoch": 1.16, "learning_rate": 0.00012591677661678515, "loss": 0.0103, "step": 447720 }, { "epoch": 1.16, "learning_rate": 0.0001259128884004137, "loss": 0.0138, "step": 447730 }, { "epoch": 1.16, "learning_rate": 0.00012590900018404224, "loss": 0.0149, "step": 447740 }, { "epoch": 1.16, "learning_rate": 0.00012590511196767075, "loss": 0.0091, "step": 447750 }, { "epoch": 1.16, "learning_rate": 0.0001259012237512993, "loss": 0.0087, "step": 447760 }, { "epoch": 1.16, "learning_rate": 0.00012589733553492784, "loss": 0.0092, "step": 447770 }, { "epoch": 1.16, "learning_rate": 0.00012589344731855638, "loss": 0.0107, "step": 447780 }, { "epoch": 1.16, "learning_rate": 0.00012588955910218492, "loss": 0.0116, "step": 447790 }, { "epoch": 1.16, "learning_rate": 0.00012588567088581346, "loss": 0.0097, "step": 447800 }, { "epoch": 1.16, "learning_rate": 0.00012588178266944198, "loss": 0.0143, "step": 447810 }, { "epoch": 1.16, "learning_rate": 0.00012587789445307052, "loss": 0.0097, "step": 447820 }, { "epoch": 1.16, "learning_rate": 0.00012587400623669906, "loss": 0.013, "step": 447830 }, { "epoch": 1.16, "learning_rate": 0.00012587011802032757, "loss": 0.0096, "step": 447840 }, { "epoch": 1.16, "learning_rate": 0.00012586622980395611, "loss": 0.0113, "step": 447850 }, { "epoch": 1.16, "learning_rate": 0.00012586234158758466, "loss": 0.0124, "step": 447860 }, { "epoch": 1.16, "learning_rate": 0.0001258584533712132, "loss": 0.011, "step": 447870 }, { "epoch": 1.16, "learning_rate": 0.0001258545651548417, "loss": 0.0096, "step": 447880 }, { "epoch": 1.16, "learning_rate": 0.00012585067693847025, "loss": 0.0107, "step": 447890 }, { "epoch": 1.16, "learning_rate": 0.0001258467887220988, "loss": 0.0108, "step": 447900 }, { "epoch": 1.16, "learning_rate": 0.00012584290050572734, "loss": 0.0116, "step": 447910 }, { "epoch": 1.16, "learning_rate": 0.00012583901228935585, "loss": 0.0093, "step": 447920 }, { "epoch": 1.16, "learning_rate": 0.0001258351240729844, "loss": 0.0086, "step": 447930 }, { "epoch": 1.16, "learning_rate": 0.00012583123585661294, "loss": 0.015, "step": 447940 }, { "epoch": 1.16, "learning_rate": 0.00012582734764024148, "loss": 0.0099, "step": 447950 }, { "epoch": 1.16, "learning_rate": 0.00012582345942387, "loss": 0.0121, "step": 447960 }, { "epoch": 1.16, "learning_rate": 0.00012581957120749856, "loss": 0.0101, "step": 447970 }, { "epoch": 1.16, "learning_rate": 0.00012581568299112707, "loss": 0.0119, "step": 447980 }, { "epoch": 1.16, "learning_rate": 0.00012581179477475562, "loss": 0.0151, "step": 447990 }, { "epoch": 1.16, "learning_rate": 0.00012580790655838416, "loss": 0.009, "step": 448000 }, { "epoch": 1.16, "eval_cer": 0.8817068852339703, "eval_loss": 0.007401402574032545, "eval_runtime": 107.5857, "eval_samples_per_second": 18.59, "eval_steps_per_second": 4.647, "step": 448000 }, { "epoch": 1.16, "learning_rate": 0.0001258040183420127, "loss": 0.0098, "step": 448010 }, { "epoch": 1.16, "learning_rate": 0.00012580013012564121, "loss": 0.01, "step": 448020 }, { "epoch": 1.16, "learning_rate": 0.00012579624190926976, "loss": 0.0082, "step": 448030 }, { "epoch": 1.16, "learning_rate": 0.0001257923536928983, "loss": 0.0101, "step": 448040 }, { "epoch": 1.16, "learning_rate": 0.00012578846547652684, "loss": 0.0125, "step": 448050 }, { "epoch": 1.16, "learning_rate": 0.00012578457726015535, "loss": 0.0111, "step": 448060 }, { "epoch": 1.16, "learning_rate": 0.0001257806890437839, "loss": 0.0093, "step": 448070 }, { "epoch": 1.16, "learning_rate": 0.00012577680082741244, "loss": 0.0094, "step": 448080 }, { "epoch": 1.16, "learning_rate": 0.00012577291261104095, "loss": 0.012, "step": 448090 }, { "epoch": 1.16, "learning_rate": 0.0001257690243946695, "loss": 0.0125, "step": 448100 }, { "epoch": 1.16, "learning_rate": 0.00012576513617829803, "loss": 0.0107, "step": 448110 }, { "epoch": 1.16, "learning_rate": 0.00012576124796192658, "loss": 0.0133, "step": 448120 }, { "epoch": 1.16, "learning_rate": 0.0001257573597455551, "loss": 0.0085, "step": 448130 }, { "epoch": 1.16, "learning_rate": 0.00012575347152918366, "loss": 0.0126, "step": 448140 }, { "epoch": 1.16, "learning_rate": 0.00012574958331281217, "loss": 0.0088, "step": 448150 }, { "epoch": 1.16, "learning_rate": 0.00012574569509644072, "loss": 0.0105, "step": 448160 }, { "epoch": 1.16, "learning_rate": 0.00012574180688006926, "loss": 0.0162, "step": 448170 }, { "epoch": 1.16, "learning_rate": 0.0001257379186636978, "loss": 0.0098, "step": 448180 }, { "epoch": 1.16, "learning_rate": 0.00012573403044732631, "loss": 0.0096, "step": 448190 }, { "epoch": 1.16, "learning_rate": 0.00012573014223095486, "loss": 0.0106, "step": 448200 }, { "epoch": 1.16, "learning_rate": 0.0001257262540145834, "loss": 0.0091, "step": 448210 }, { "epoch": 1.16, "learning_rate": 0.00012572236579821194, "loss": 0.008, "step": 448220 }, { "epoch": 1.16, "learning_rate": 0.00012571847758184045, "loss": 0.0126, "step": 448230 }, { "epoch": 1.16, "learning_rate": 0.000125714589365469, "loss": 0.0143, "step": 448240 }, { "epoch": 1.16, "learning_rate": 0.00012571070114909754, "loss": 0.0101, "step": 448250 }, { "epoch": 1.16, "learning_rate": 0.00012570681293272608, "loss": 0.0101, "step": 448260 }, { "epoch": 1.16, "learning_rate": 0.0001257029247163546, "loss": 0.0112, "step": 448270 }, { "epoch": 1.16, "learning_rate": 0.00012569903649998313, "loss": 0.0123, "step": 448280 }, { "epoch": 1.16, "learning_rate": 0.00012569514828361168, "loss": 0.009, "step": 448290 }, { "epoch": 1.16, "learning_rate": 0.00012569126006724022, "loss": 0.0111, "step": 448300 }, { "epoch": 1.16, "learning_rate": 0.00012568737185086873, "loss": 0.0112, "step": 448310 }, { "epoch": 1.16, "learning_rate": 0.0001256834836344973, "loss": 0.0092, "step": 448320 }, { "epoch": 1.16, "learning_rate": 0.00012567959541812582, "loss": 0.0091, "step": 448330 }, { "epoch": 1.16, "learning_rate": 0.00012567570720175436, "loss": 0.0097, "step": 448340 }, { "epoch": 1.16, "learning_rate": 0.0001256718189853829, "loss": 0.0131, "step": 448350 }, { "epoch": 1.16, "learning_rate": 0.0001256679307690114, "loss": 0.0119, "step": 448360 }, { "epoch": 1.16, "learning_rate": 0.00012566404255263995, "loss": 0.0126, "step": 448370 }, { "epoch": 1.16, "learning_rate": 0.0001256601543362685, "loss": 0.0114, "step": 448380 }, { "epoch": 1.16, "learning_rate": 0.00012565626611989704, "loss": 0.0098, "step": 448390 }, { "epoch": 1.16, "learning_rate": 0.00012565237790352555, "loss": 0.0107, "step": 448400 }, { "epoch": 1.16, "learning_rate": 0.0001256484896871541, "loss": 0.0114, "step": 448410 }, { "epoch": 1.16, "learning_rate": 0.00012564460147078264, "loss": 0.0118, "step": 448420 }, { "epoch": 1.16, "learning_rate": 0.00012564071325441118, "loss": 0.0095, "step": 448430 }, { "epoch": 1.16, "learning_rate": 0.0001256368250380397, "loss": 0.0101, "step": 448440 }, { "epoch": 1.16, "learning_rate": 0.00012563293682166823, "loss": 0.0154, "step": 448450 }, { "epoch": 1.16, "learning_rate": 0.00012562904860529678, "loss": 0.0115, "step": 448460 }, { "epoch": 1.16, "learning_rate": 0.00012562516038892532, "loss": 0.0122, "step": 448470 }, { "epoch": 1.16, "learning_rate": 0.00012562127217255383, "loss": 0.01, "step": 448480 }, { "epoch": 1.16, "learning_rate": 0.0001256173839561824, "loss": 0.0115, "step": 448490 }, { "epoch": 1.16, "learning_rate": 0.00012561349573981091, "loss": 0.0113, "step": 448500 }, { "epoch": 1.16, "learning_rate": 0.00012560960752343946, "loss": 0.0087, "step": 448510 }, { "epoch": 1.16, "learning_rate": 0.000125605719307068, "loss": 0.0104, "step": 448520 }, { "epoch": 1.16, "learning_rate": 0.00012560183109069654, "loss": 0.0133, "step": 448530 }, { "epoch": 1.16, "learning_rate": 0.00012559794287432505, "loss": 0.0118, "step": 448540 }, { "epoch": 1.16, "learning_rate": 0.0001255940546579536, "loss": 0.01, "step": 448550 }, { "epoch": 1.16, "learning_rate": 0.00012559016644158214, "loss": 0.0123, "step": 448560 }, { "epoch": 1.16, "learning_rate": 0.00012558627822521068, "loss": 0.0085, "step": 448570 }, { "epoch": 1.16, "learning_rate": 0.0001255823900088392, "loss": 0.0105, "step": 448580 }, { "epoch": 1.16, "learning_rate": 0.00012557850179246774, "loss": 0.0135, "step": 448590 }, { "epoch": 1.16, "learning_rate": 0.00012557461357609628, "loss": 0.0107, "step": 448600 }, { "epoch": 1.16, "learning_rate": 0.0001255707253597248, "loss": 0.0142, "step": 448610 }, { "epoch": 1.16, "learning_rate": 0.00012556683714335333, "loss": 0.0117, "step": 448620 }, { "epoch": 1.16, "learning_rate": 0.00012556294892698187, "loss": 0.0092, "step": 448630 }, { "epoch": 1.16, "learning_rate": 0.00012555906071061042, "loss": 0.0098, "step": 448640 }, { "epoch": 1.16, "learning_rate": 0.00012555517249423893, "loss": 0.0114, "step": 448650 }, { "epoch": 1.16, "learning_rate": 0.0001255512842778675, "loss": 0.0115, "step": 448660 }, { "epoch": 1.16, "learning_rate": 0.00012554739606149601, "loss": 0.0095, "step": 448670 }, { "epoch": 1.16, "learning_rate": 0.00012554350784512456, "loss": 0.0109, "step": 448680 }, { "epoch": 1.16, "learning_rate": 0.0001255396196287531, "loss": 0.0096, "step": 448690 }, { "epoch": 1.16, "learning_rate": 0.00012553573141238164, "loss": 0.0133, "step": 448700 }, { "epoch": 1.16, "learning_rate": 0.00012553184319601015, "loss": 0.0112, "step": 448710 }, { "epoch": 1.16, "learning_rate": 0.0001255279549796387, "loss": 0.011, "step": 448720 }, { "epoch": 1.16, "learning_rate": 0.00012552406676326724, "loss": 0.0081, "step": 448730 }, { "epoch": 1.16, "learning_rate": 0.00012552017854689578, "loss": 0.012, "step": 448740 }, { "epoch": 1.16, "learning_rate": 0.0001255162903305243, "loss": 0.0126, "step": 448750 }, { "epoch": 1.16, "learning_rate": 0.00012551240211415283, "loss": 0.0107, "step": 448760 }, { "epoch": 1.16, "learning_rate": 0.00012550851389778138, "loss": 0.0114, "step": 448770 }, { "epoch": 1.16, "learning_rate": 0.00012550462568140992, "loss": 0.0119, "step": 448780 }, { "epoch": 1.16, "learning_rate": 0.00012550073746503843, "loss": 0.0091, "step": 448790 }, { "epoch": 1.16, "learning_rate": 0.00012549684924866697, "loss": 0.0083, "step": 448800 }, { "epoch": 1.16, "learning_rate": 0.00012549296103229552, "loss": 0.0122, "step": 448810 }, { "epoch": 1.16, "learning_rate": 0.00012548907281592406, "loss": 0.0126, "step": 448820 }, { "epoch": 1.16, "learning_rate": 0.00012548518459955257, "loss": 0.0118, "step": 448830 }, { "epoch": 1.16, "learning_rate": 0.00012548129638318111, "loss": 0.0083, "step": 448840 }, { "epoch": 1.16, "learning_rate": 0.00012547740816680966, "loss": 0.0108, "step": 448850 }, { "epoch": 1.16, "learning_rate": 0.0001254735199504382, "loss": 0.0109, "step": 448860 }, { "epoch": 1.16, "learning_rate": 0.00012546963173406674, "loss": 0.014, "step": 448870 }, { "epoch": 1.16, "learning_rate": 0.00012546574351769525, "loss": 0.0109, "step": 448880 }, { "epoch": 1.16, "learning_rate": 0.0001254618553013238, "loss": 0.0135, "step": 448890 }, { "epoch": 1.16, "learning_rate": 0.00012545796708495234, "loss": 0.0088, "step": 448900 }, { "epoch": 1.16, "learning_rate": 0.00012545407886858088, "loss": 0.011, "step": 448910 }, { "epoch": 1.16, "learning_rate": 0.0001254501906522094, "loss": 0.0118, "step": 448920 }, { "epoch": 1.16, "learning_rate": 0.00012544630243583793, "loss": 0.0097, "step": 448930 }, { "epoch": 1.16, "learning_rate": 0.00012544241421946648, "loss": 0.012, "step": 448940 }, { "epoch": 1.16, "learning_rate": 0.00012543852600309502, "loss": 0.0103, "step": 448950 }, { "epoch": 1.16, "learning_rate": 0.00012543463778672353, "loss": 0.0106, "step": 448960 }, { "epoch": 1.16, "learning_rate": 0.00012543074957035207, "loss": 0.0114, "step": 448970 }, { "epoch": 1.16, "learning_rate": 0.00012542686135398062, "loss": 0.0099, "step": 448980 }, { "epoch": 1.16, "learning_rate": 0.00012542297313760916, "loss": 0.0102, "step": 448990 }, { "epoch": 1.16, "learning_rate": 0.00012541908492123767, "loss": 0.0122, "step": 449000 }, { "epoch": 1.16, "eval_cer": 0.8817446754311932, "eval_loss": 0.0073244315572083, "eval_runtime": 107.5578, "eval_samples_per_second": 18.595, "eval_steps_per_second": 4.649, "step": 449000 }, { "epoch": 1.16, "learning_rate": 0.00012541519670486624, "loss": 0.0118, "step": 449010 }, { "epoch": 1.16, "learning_rate": 0.00012541130848849475, "loss": 0.0152, "step": 449020 }, { "epoch": 1.16, "learning_rate": 0.0001254074202721233, "loss": 0.0105, "step": 449030 }, { "epoch": 1.16, "learning_rate": 0.00012540353205575184, "loss": 0.0114, "step": 449040 }, { "epoch": 1.16, "learning_rate": 0.00012539964383938038, "loss": 0.01, "step": 449050 }, { "epoch": 1.16, "learning_rate": 0.0001253957556230089, "loss": 0.0122, "step": 449060 }, { "epoch": 1.16, "learning_rate": 0.00012539186740663744, "loss": 0.015, "step": 449070 }, { "epoch": 1.16, "learning_rate": 0.00012538797919026598, "loss": 0.0096, "step": 449080 }, { "epoch": 1.16, "learning_rate": 0.0001253840909738945, "loss": 0.0088, "step": 449090 }, { "epoch": 1.16, "learning_rate": 0.00012538020275752303, "loss": 0.0115, "step": 449100 }, { "epoch": 1.16, "learning_rate": 0.00012537631454115158, "loss": 0.0089, "step": 449110 }, { "epoch": 1.16, "learning_rate": 0.00012537242632478012, "loss": 0.0122, "step": 449120 }, { "epoch": 1.16, "learning_rate": 0.00012536853810840863, "loss": 0.0151, "step": 449130 }, { "epoch": 1.16, "learning_rate": 0.00012536464989203717, "loss": 0.0095, "step": 449140 }, { "epoch": 1.16, "learning_rate": 0.00012536076167566571, "loss": 0.0127, "step": 449150 }, { "epoch": 1.16, "learning_rate": 0.00012535687345929426, "loss": 0.0094, "step": 449160 }, { "epoch": 1.16, "learning_rate": 0.00012535298524292277, "loss": 0.0092, "step": 449170 }, { "epoch": 1.16, "learning_rate": 0.00012534909702655134, "loss": 0.0093, "step": 449180 }, { "epoch": 1.16, "learning_rate": 0.00012534520881017985, "loss": 0.0128, "step": 449190 }, { "epoch": 1.16, "learning_rate": 0.0001253413205938084, "loss": 0.0108, "step": 449200 }, { "epoch": 1.16, "learning_rate": 0.00012533743237743694, "loss": 0.0139, "step": 449210 }, { "epoch": 1.16, "learning_rate": 0.00012533354416106548, "loss": 0.013, "step": 449220 }, { "epoch": 1.16, "learning_rate": 0.000125329655944694, "loss": 0.0099, "step": 449230 }, { "epoch": 1.16, "learning_rate": 0.00012532576772832254, "loss": 0.0111, "step": 449240 }, { "epoch": 1.16, "learning_rate": 0.00012532187951195108, "loss": 0.0092, "step": 449250 }, { "epoch": 1.16, "learning_rate": 0.00012531799129557962, "loss": 0.0105, "step": 449260 }, { "epoch": 1.16, "learning_rate": 0.00012531410307920813, "loss": 0.0099, "step": 449270 }, { "epoch": 1.16, "learning_rate": 0.00012531021486283667, "loss": 0.0107, "step": 449280 }, { "epoch": 1.16, "learning_rate": 0.00012530632664646522, "loss": 0.0148, "step": 449290 }, { "epoch": 1.16, "learning_rate": 0.00012530243843009376, "loss": 0.0111, "step": 449300 }, { "epoch": 1.16, "learning_rate": 0.00012529855021372227, "loss": 0.0087, "step": 449310 }, { "epoch": 1.16, "learning_rate": 0.00012529466199735081, "loss": 0.0093, "step": 449320 }, { "epoch": 1.16, "learning_rate": 0.00012529077378097936, "loss": 0.0114, "step": 449330 }, { "epoch": 1.16, "learning_rate": 0.00012528688556460787, "loss": 0.0101, "step": 449340 }, { "epoch": 1.16, "learning_rate": 0.0001252829973482364, "loss": 0.0102, "step": 449350 }, { "epoch": 1.16, "learning_rate": 0.00012527910913186495, "loss": 0.0113, "step": 449360 }, { "epoch": 1.16, "learning_rate": 0.0001252752209154935, "loss": 0.0104, "step": 449370 }, { "epoch": 1.16, "learning_rate": 0.00012527133269912204, "loss": 0.0122, "step": 449380 }, { "epoch": 1.16, "learning_rate": 0.00012526744448275058, "loss": 0.015, "step": 449390 }, { "epoch": 1.16, "learning_rate": 0.0001252635562663791, "loss": 0.012, "step": 449400 }, { "epoch": 1.16, "learning_rate": 0.00012525966805000763, "loss": 0.0101, "step": 449410 }, { "epoch": 1.16, "learning_rate": 0.00012525577983363618, "loss": 0.0087, "step": 449420 }, { "epoch": 1.16, "learning_rate": 0.00012525189161726472, "loss": 0.0107, "step": 449430 }, { "epoch": 1.17, "learning_rate": 0.00012524800340089323, "loss": 0.0097, "step": 449440 }, { "epoch": 1.17, "learning_rate": 0.00012524411518452177, "loss": 0.0124, "step": 449450 }, { "epoch": 1.17, "learning_rate": 0.00012524022696815032, "loss": 0.0111, "step": 449460 }, { "epoch": 1.17, "learning_rate": 0.00012523633875177886, "loss": 0.0137, "step": 449470 }, { "epoch": 1.17, "learning_rate": 0.00012523245053540737, "loss": 0.0114, "step": 449480 }, { "epoch": 1.17, "learning_rate": 0.0001252285623190359, "loss": 0.0128, "step": 449490 }, { "epoch": 1.17, "learning_rate": 0.00012522467410266446, "loss": 0.0098, "step": 449500 }, { "epoch": 1.17, "learning_rate": 0.000125220785886293, "loss": 0.0119, "step": 449510 }, { "epoch": 1.17, "learning_rate": 0.0001252168976699215, "loss": 0.0132, "step": 449520 }, { "epoch": 1.17, "learning_rate": 0.00012521300945355008, "loss": 0.012, "step": 449530 }, { "epoch": 1.17, "learning_rate": 0.0001252091212371786, "loss": 0.0097, "step": 449540 }, { "epoch": 1.17, "learning_rate": 0.00012520523302080714, "loss": 0.0114, "step": 449550 }, { "epoch": 1.17, "learning_rate": 0.00012520134480443568, "loss": 0.0157, "step": 449560 }, { "epoch": 1.17, "learning_rate": 0.0001251974565880642, "loss": 0.0115, "step": 449570 }, { "epoch": 1.17, "learning_rate": 0.00012519356837169273, "loss": 0.0094, "step": 449580 }, { "epoch": 1.17, "learning_rate": 0.00012518968015532128, "loss": 0.0101, "step": 449590 }, { "epoch": 1.17, "learning_rate": 0.00012518579193894982, "loss": 0.0108, "step": 449600 }, { "epoch": 1.17, "learning_rate": 0.00012518190372257833, "loss": 0.0113, "step": 449610 }, { "epoch": 1.17, "learning_rate": 0.00012517801550620687, "loss": 0.0104, "step": 449620 }, { "epoch": 1.17, "learning_rate": 0.00012517412728983542, "loss": 0.0098, "step": 449630 }, { "epoch": 1.17, "learning_rate": 0.00012517023907346396, "loss": 0.0093, "step": 449640 }, { "epoch": 1.17, "learning_rate": 0.00012516635085709247, "loss": 0.0114, "step": 449650 }, { "epoch": 1.17, "learning_rate": 0.000125162462640721, "loss": 0.013, "step": 449660 }, { "epoch": 1.17, "learning_rate": 0.00012515857442434955, "loss": 0.0084, "step": 449670 }, { "epoch": 1.17, "learning_rate": 0.0001251546862079781, "loss": 0.0098, "step": 449680 }, { "epoch": 1.17, "learning_rate": 0.0001251507979916066, "loss": 0.0101, "step": 449690 }, { "epoch": 1.17, "learning_rate": 0.00012514690977523515, "loss": 0.0078, "step": 449700 }, { "epoch": 1.17, "learning_rate": 0.0001251430215588637, "loss": 0.0106, "step": 449710 }, { "epoch": 1.17, "learning_rate": 0.00012513913334249224, "loss": 0.0081, "step": 449720 }, { "epoch": 1.17, "learning_rate": 0.00012513524512612078, "loss": 0.0114, "step": 449730 }, { "epoch": 1.17, "learning_rate": 0.00012513135690974932, "loss": 0.0115, "step": 449740 }, { "epoch": 1.17, "learning_rate": 0.00012512746869337783, "loss": 0.0094, "step": 449750 }, { "epoch": 1.17, "learning_rate": 0.00012512358047700638, "loss": 0.0112, "step": 449760 }, { "epoch": 1.17, "learning_rate": 0.00012511969226063492, "loss": 0.0078, "step": 449770 }, { "epoch": 1.17, "learning_rate": 0.00012511580404426346, "loss": 0.0115, "step": 449780 }, { "epoch": 1.17, "learning_rate": 0.00012511191582789197, "loss": 0.0102, "step": 449790 }, { "epoch": 1.17, "learning_rate": 0.00012510802761152051, "loss": 0.0108, "step": 449800 }, { "epoch": 1.17, "learning_rate": 0.00012510413939514906, "loss": 0.0115, "step": 449810 }, { "epoch": 1.17, "learning_rate": 0.00012510025117877757, "loss": 0.009, "step": 449820 }, { "epoch": 1.17, "learning_rate": 0.0001250963629624061, "loss": 0.0114, "step": 449830 }, { "epoch": 1.17, "learning_rate": 0.00012509247474603465, "loss": 0.0067, "step": 449840 }, { "epoch": 1.17, "learning_rate": 0.0001250885865296632, "loss": 0.0158, "step": 449850 }, { "epoch": 1.17, "learning_rate": 0.0001250846983132917, "loss": 0.0095, "step": 449860 }, { "epoch": 1.17, "learning_rate": 0.00012508081009692025, "loss": 0.0104, "step": 449870 }, { "epoch": 1.17, "learning_rate": 0.0001250769218805488, "loss": 0.0075, "step": 449880 }, { "epoch": 1.17, "learning_rate": 0.00012507303366417734, "loss": 0.0126, "step": 449890 }, { "epoch": 1.17, "learning_rate": 0.00012506914544780585, "loss": 0.0101, "step": 449900 }, { "epoch": 1.17, "learning_rate": 0.00012506525723143442, "loss": 0.0067, "step": 449910 }, { "epoch": 1.17, "learning_rate": 0.00012506136901506293, "loss": 0.034, "step": 449920 }, { "epoch": 1.17, "learning_rate": 0.00012505748079869147, "loss": 0.0121, "step": 449930 }, { "epoch": 1.17, "learning_rate": 0.00012505359258232002, "loss": 0.0121, "step": 449940 }, { "epoch": 1.17, "learning_rate": 0.00012504970436594856, "loss": 0.0097, "step": 449950 }, { "epoch": 1.17, "learning_rate": 0.00012504581614957707, "loss": 0.0093, "step": 449960 }, { "epoch": 1.17, "learning_rate": 0.00012504192793320561, "loss": 0.0113, "step": 449970 }, { "epoch": 1.17, "learning_rate": 0.00012503803971683416, "loss": 0.0149, "step": 449980 }, { "epoch": 1.17, "learning_rate": 0.0001250341515004627, "loss": 0.0106, "step": 449990 }, { "epoch": 1.17, "learning_rate": 0.0001250302632840912, "loss": 0.0107, "step": 450000 }, { "epoch": 1.17, "eval_cer": 0.8816900895907601, "eval_loss": 0.007372671272605658, "eval_runtime": 107.4625, "eval_samples_per_second": 18.611, "eval_steps_per_second": 4.653, "step": 450000 }, { "epoch": 1.17, "learning_rate": 0.00012502637506771975, "loss": 0.0104, "step": 450010 }, { "epoch": 1.17, "learning_rate": 0.0001250224868513483, "loss": 0.012, "step": 450020 }, { "epoch": 1.17, "learning_rate": 0.00012501859863497684, "loss": 0.0088, "step": 450030 }, { "epoch": 1.17, "learning_rate": 0.00012501471041860535, "loss": 0.014, "step": 450040 }, { "epoch": 1.17, "learning_rate": 0.00012501082220223392, "loss": 0.0095, "step": 450050 }, { "epoch": 1.17, "learning_rate": 0.00012500693398586243, "loss": 0.0098, "step": 450060 }, { "epoch": 1.17, "learning_rate": 0.00012500304576949095, "loss": 0.0119, "step": 450070 }, { "epoch": 1.17, "learning_rate": 0.00012499915755311952, "loss": 0.0109, "step": 450080 }, { "epoch": 1.17, "learning_rate": 0.00012499526933674803, "loss": 0.0104, "step": 450090 }, { "epoch": 1.17, "learning_rate": 0.00012499138112037657, "loss": 0.0091, "step": 450100 }, { "epoch": 1.17, "learning_rate": 0.00012498749290400512, "loss": 0.0096, "step": 450110 }, { "epoch": 1.17, "learning_rate": 0.00012498360468763366, "loss": 0.0095, "step": 450120 }, { "epoch": 1.17, "learning_rate": 0.00012497971647126217, "loss": 0.0116, "step": 450130 }, { "epoch": 1.17, "learning_rate": 0.0001249758282548907, "loss": 0.0094, "step": 450140 }, { "epoch": 1.17, "learning_rate": 0.00012497194003851925, "loss": 0.0113, "step": 450150 }, { "epoch": 1.17, "learning_rate": 0.0001249680518221478, "loss": 0.013, "step": 450160 }, { "epoch": 1.17, "learning_rate": 0.0001249641636057763, "loss": 0.0144, "step": 450170 }, { "epoch": 1.17, "learning_rate": 0.00012496027538940485, "loss": 0.0108, "step": 450180 }, { "epoch": 1.17, "learning_rate": 0.0001249563871730334, "loss": 0.0126, "step": 450190 }, { "epoch": 1.17, "learning_rate": 0.00012495249895666194, "loss": 0.0123, "step": 450200 }, { "epoch": 1.17, "learning_rate": 0.00012494861074029045, "loss": 0.0119, "step": 450210 }, { "epoch": 1.17, "learning_rate": 0.000124944722523919, "loss": 0.0117, "step": 450220 }, { "epoch": 1.17, "learning_rate": 0.00012494083430754753, "loss": 0.0107, "step": 450230 }, { "epoch": 1.17, "learning_rate": 0.00012493694609117608, "loss": 0.0118, "step": 450240 }, { "epoch": 1.17, "learning_rate": 0.00012493305787480462, "loss": 0.0107, "step": 450250 }, { "epoch": 1.17, "learning_rate": 0.00012492916965843316, "loss": 0.01, "step": 450260 }, { "epoch": 1.17, "learning_rate": 0.00012492528144206167, "loss": 0.0092, "step": 450270 }, { "epoch": 1.17, "learning_rate": 0.00012492139322569021, "loss": 0.0093, "step": 450280 }, { "epoch": 1.17, "learning_rate": 0.00012491750500931876, "loss": 0.01, "step": 450290 }, { "epoch": 1.17, "learning_rate": 0.0001249136167929473, "loss": 0.0108, "step": 450300 }, { "epoch": 1.17, "learning_rate": 0.0001249097285765758, "loss": 0.0087, "step": 450310 }, { "epoch": 1.17, "learning_rate": 0.00012490584036020435, "loss": 0.011, "step": 450320 }, { "epoch": 1.17, "learning_rate": 0.0001249019521438329, "loss": 0.0115, "step": 450330 }, { "epoch": 1.17, "learning_rate": 0.0001248980639274614, "loss": 0.0129, "step": 450340 }, { "epoch": 1.17, "learning_rate": 0.00012489417571108995, "loss": 0.0112, "step": 450350 }, { "epoch": 1.17, "learning_rate": 0.0001248902874947185, "loss": 0.0112, "step": 450360 }, { "epoch": 1.17, "learning_rate": 0.00012488639927834704, "loss": 0.0102, "step": 450370 }, { "epoch": 1.17, "learning_rate": 0.00012488251106197555, "loss": 0.0139, "step": 450380 }, { "epoch": 1.17, "learning_rate": 0.0001248786228456041, "loss": 0.0105, "step": 450390 }, { "epoch": 1.17, "learning_rate": 0.00012487473462923263, "loss": 0.0154, "step": 450400 }, { "epoch": 1.17, "learning_rate": 0.00012487084641286117, "loss": 0.0134, "step": 450410 }, { "epoch": 1.17, "learning_rate": 0.0001248669581964897, "loss": 0.0113, "step": 450420 }, { "epoch": 1.17, "learning_rate": 0.00012486306998011826, "loss": 0.0114, "step": 450430 }, { "epoch": 1.17, "learning_rate": 0.00012485918176374677, "loss": 0.013, "step": 450440 }, { "epoch": 1.17, "learning_rate": 0.00012485529354737531, "loss": 0.0104, "step": 450450 }, { "epoch": 1.17, "learning_rate": 0.00012485140533100386, "loss": 0.0111, "step": 450460 }, { "epoch": 1.17, "learning_rate": 0.0001248475171146324, "loss": 0.0152, "step": 450470 }, { "epoch": 1.17, "learning_rate": 0.0001248436288982609, "loss": 0.0113, "step": 450480 }, { "epoch": 1.17, "learning_rate": 0.00012483974068188945, "loss": 0.0106, "step": 450490 }, { "epoch": 1.17, "learning_rate": 0.000124835852465518, "loss": 0.0113, "step": 450500 }, { "epoch": 1.17, "learning_rate": 0.00012483196424914654, "loss": 0.0118, "step": 450510 }, { "epoch": 1.17, "learning_rate": 0.00012482807603277505, "loss": 0.0094, "step": 450520 }, { "epoch": 1.17, "learning_rate": 0.0001248241878164036, "loss": 0.0109, "step": 450530 }, { "epoch": 1.17, "learning_rate": 0.00012482029960003213, "loss": 0.0096, "step": 450540 }, { "epoch": 1.17, "learning_rate": 0.00012481641138366068, "loss": 0.0131, "step": 450550 }, { "epoch": 1.17, "learning_rate": 0.0001248125231672892, "loss": 0.0145, "step": 450560 }, { "epoch": 1.17, "learning_rate": 0.00012480863495091773, "loss": 0.0124, "step": 450570 }, { "epoch": 1.17, "learning_rate": 0.00012480474673454627, "loss": 0.0145, "step": 450580 }, { "epoch": 1.17, "learning_rate": 0.0001248008585181748, "loss": 0.0124, "step": 450590 }, { "epoch": 1.17, "learning_rate": 0.00012479697030180336, "loss": 0.0117, "step": 450600 }, { "epoch": 1.17, "learning_rate": 0.00012479308208543187, "loss": 0.0082, "step": 450610 }, { "epoch": 1.17, "learning_rate": 0.00012478919386906041, "loss": 0.0094, "step": 450620 }, { "epoch": 1.17, "learning_rate": 0.00012478530565268896, "loss": 0.01, "step": 450630 }, { "epoch": 1.17, "learning_rate": 0.0001247814174363175, "loss": 0.0077, "step": 450640 }, { "epoch": 1.17, "learning_rate": 0.000124777529219946, "loss": 0.0112, "step": 450650 }, { "epoch": 1.17, "learning_rate": 0.00012477364100357455, "loss": 0.016, "step": 450660 }, { "epoch": 1.17, "learning_rate": 0.0001247697527872031, "loss": 0.009, "step": 450670 }, { "epoch": 1.17, "learning_rate": 0.00012476586457083164, "loss": 0.0117, "step": 450680 }, { "epoch": 1.17, "learning_rate": 0.00012476197635446015, "loss": 0.0106, "step": 450690 }, { "epoch": 1.17, "learning_rate": 0.0001247580881380887, "loss": 0.011, "step": 450700 }, { "epoch": 1.17, "learning_rate": 0.00012475419992171723, "loss": 0.0146, "step": 450710 }, { "epoch": 1.17, "learning_rate": 0.00012475031170534578, "loss": 0.0123, "step": 450720 }, { "epoch": 1.17, "learning_rate": 0.0001247464234889743, "loss": 0.0127, "step": 450730 }, { "epoch": 1.17, "learning_rate": 0.00012474253527260283, "loss": 0.0106, "step": 450740 }, { "epoch": 1.17, "learning_rate": 0.00012473864705623137, "loss": 0.0101, "step": 450750 }, { "epoch": 1.17, "learning_rate": 0.00012473475883985992, "loss": 0.0118, "step": 450760 }, { "epoch": 1.17, "learning_rate": 0.00012473087062348846, "loss": 0.0122, "step": 450770 }, { "epoch": 1.17, "learning_rate": 0.000124726982407117, "loss": 0.0142, "step": 450780 }, { "epoch": 1.17, "learning_rate": 0.0001247230941907455, "loss": 0.0145, "step": 450790 }, { "epoch": 1.17, "learning_rate": 0.00012471920597437405, "loss": 0.0105, "step": 450800 }, { "epoch": 1.17, "learning_rate": 0.0001247153177580026, "loss": 0.0095, "step": 450810 }, { "epoch": 1.17, "learning_rate": 0.0001247114295416311, "loss": 0.0098, "step": 450820 }, { "epoch": 1.17, "learning_rate": 0.00012470754132525965, "loss": 0.0108, "step": 450830 }, { "epoch": 1.17, "learning_rate": 0.0001247036531088882, "loss": 0.0106, "step": 450840 }, { "epoch": 1.17, "learning_rate": 0.00012469976489251674, "loss": 0.0094, "step": 450850 }, { "epoch": 1.17, "learning_rate": 0.00012469587667614525, "loss": 0.0103, "step": 450860 }, { "epoch": 1.17, "learning_rate": 0.0001246919884597738, "loss": 0.0103, "step": 450870 }, { "epoch": 1.17, "learning_rate": 0.00012468810024340233, "loss": 0.0103, "step": 450880 }, { "epoch": 1.17, "learning_rate": 0.00012468421202703088, "loss": 0.0093, "step": 450890 }, { "epoch": 1.17, "learning_rate": 0.0001246803238106594, "loss": 0.0139, "step": 450900 }, { "epoch": 1.17, "learning_rate": 0.00012467643559428793, "loss": 0.0093, "step": 450910 }, { "epoch": 1.17, "learning_rate": 0.00012467254737791647, "loss": 0.0079, "step": 450920 }, { "epoch": 1.17, "learning_rate": 0.00012466865916154501, "loss": 0.0114, "step": 450930 }, { "epoch": 1.17, "learning_rate": 0.00012466477094517353, "loss": 0.0086, "step": 450940 }, { "epoch": 1.17, "learning_rate": 0.0001246608827288021, "loss": 0.0111, "step": 450950 }, { "epoch": 1.17, "learning_rate": 0.0001246569945124306, "loss": 0.0161, "step": 450960 }, { "epoch": 1.17, "learning_rate": 0.00012465310629605915, "loss": 0.0176, "step": 450970 }, { "epoch": 1.17, "learning_rate": 0.0001246492180796877, "loss": 0.012, "step": 450980 }, { "epoch": 1.17, "learning_rate": 0.00012464532986331624, "loss": 0.0102, "step": 450990 }, { "epoch": 1.17, "learning_rate": 0.00012464144164694475, "loss": 0.0114, "step": 451000 }, { "epoch": 1.17, "eval_cer": 0.8817138834186412, "eval_loss": 0.007332668174058199, "eval_runtime": 107.5021, "eval_samples_per_second": 18.604, "eval_steps_per_second": 4.651, "step": 451000 }, { "epoch": 1.17, "learning_rate": 0.0001246375534305733, "loss": 0.0121, "step": 451010 }, { "epoch": 1.17, "learning_rate": 0.00012463366521420184, "loss": 0.0107, "step": 451020 }, { "epoch": 1.17, "learning_rate": 0.00012462977699783038, "loss": 0.0098, "step": 451030 }, { "epoch": 1.17, "learning_rate": 0.0001246258887814589, "loss": 0.0119, "step": 451040 }, { "epoch": 1.17, "learning_rate": 0.00012462200056508743, "loss": 0.0099, "step": 451050 }, { "epoch": 1.17, "learning_rate": 0.00012461811234871597, "loss": 0.0106, "step": 451060 }, { "epoch": 1.17, "learning_rate": 0.0001246142241323445, "loss": 0.0091, "step": 451070 }, { "epoch": 1.17, "learning_rate": 0.00012461033591597303, "loss": 0.0114, "step": 451080 }, { "epoch": 1.17, "learning_rate": 0.00012460644769960157, "loss": 0.0124, "step": 451090 }, { "epoch": 1.17, "learning_rate": 0.00012460255948323011, "loss": 0.0174, "step": 451100 }, { "epoch": 1.17, "learning_rate": 0.00012459867126685863, "loss": 0.0093, "step": 451110 }, { "epoch": 1.17, "learning_rate": 0.0001245947830504872, "loss": 0.0109, "step": 451120 }, { "epoch": 1.17, "learning_rate": 0.0001245908948341157, "loss": 0.0117, "step": 451130 }, { "epoch": 1.17, "learning_rate": 0.00012458700661774425, "loss": 0.0113, "step": 451140 }, { "epoch": 1.17, "learning_rate": 0.0001245831184013728, "loss": 0.0116, "step": 451150 }, { "epoch": 1.17, "learning_rate": 0.00012457923018500134, "loss": 0.0135, "step": 451160 }, { "epoch": 1.17, "learning_rate": 0.00012457534196862985, "loss": 0.0108, "step": 451170 }, { "epoch": 1.17, "learning_rate": 0.0001245714537522584, "loss": 0.0086, "step": 451180 }, { "epoch": 1.17, "learning_rate": 0.00012456756553588693, "loss": 0.0116, "step": 451190 }, { "epoch": 1.17, "learning_rate": 0.00012456367731951548, "loss": 0.0088, "step": 451200 }, { "epoch": 1.17, "learning_rate": 0.000124559789103144, "loss": 0.0119, "step": 451210 }, { "epoch": 1.17, "learning_rate": 0.00012455590088677253, "loss": 0.0111, "step": 451220 }, { "epoch": 1.17, "learning_rate": 0.00012455201267040107, "loss": 0.01, "step": 451230 }, { "epoch": 1.17, "learning_rate": 0.00012454812445402962, "loss": 0.0103, "step": 451240 }, { "epoch": 1.17, "learning_rate": 0.00012454423623765813, "loss": 0.0132, "step": 451250 }, { "epoch": 1.17, "learning_rate": 0.00012454034802128667, "loss": 0.0089, "step": 451260 }, { "epoch": 1.17, "learning_rate": 0.00012453645980491521, "loss": 0.0094, "step": 451270 }, { "epoch": 1.17, "learning_rate": 0.00012453257158854376, "loss": 0.0108, "step": 451280 }, { "epoch": 1.17, "learning_rate": 0.00012452868337217227, "loss": 0.0128, "step": 451290 }, { "epoch": 1.17, "learning_rate": 0.00012452479515580084, "loss": 0.0109, "step": 451300 }, { "epoch": 1.17, "learning_rate": 0.00012452090693942935, "loss": 0.0117, "step": 451310 }, { "epoch": 1.17, "learning_rate": 0.0001245170187230579, "loss": 0.0114, "step": 451320 }, { "epoch": 1.17, "learning_rate": 0.00012451313050668644, "loss": 0.0115, "step": 451330 }, { "epoch": 1.17, "learning_rate": 0.00012450924229031495, "loss": 0.0097, "step": 451340 }, { "epoch": 1.17, "learning_rate": 0.0001245053540739435, "loss": 0.0099, "step": 451350 }, { "epoch": 1.17, "learning_rate": 0.00012450146585757203, "loss": 0.0095, "step": 451360 }, { "epoch": 1.17, "learning_rate": 0.00012449757764120058, "loss": 0.0122, "step": 451370 }, { "epoch": 1.17, "learning_rate": 0.0001244936894248291, "loss": 0.0111, "step": 451380 }, { "epoch": 1.17, "learning_rate": 0.00012448980120845763, "loss": 0.0102, "step": 451390 }, { "epoch": 1.17, "learning_rate": 0.00012448591299208617, "loss": 0.0108, "step": 451400 }, { "epoch": 1.17, "learning_rate": 0.00012448202477571472, "loss": 0.0082, "step": 451410 }, { "epoch": 1.17, "learning_rate": 0.00012447813655934323, "loss": 0.0108, "step": 451420 }, { "epoch": 1.17, "learning_rate": 0.00012447424834297177, "loss": 0.0116, "step": 451430 }, { "epoch": 1.17, "learning_rate": 0.0001244703601266003, "loss": 0.0094, "step": 451440 }, { "epoch": 1.17, "learning_rate": 0.00012446647191022885, "loss": 0.0095, "step": 451450 }, { "epoch": 1.17, "learning_rate": 0.00012446258369385737, "loss": 0.0118, "step": 451460 }, { "epoch": 1.17, "learning_rate": 0.00012445869547748594, "loss": 0.0083, "step": 451470 }, { "epoch": 1.17, "learning_rate": 0.00012445480726111445, "loss": 0.0098, "step": 451480 }, { "epoch": 1.17, "learning_rate": 0.000124450919044743, "loss": 0.0112, "step": 451490 }, { "epoch": 1.17, "learning_rate": 0.00012444703082837154, "loss": 0.0101, "step": 451500 }, { "epoch": 1.17, "learning_rate": 0.00012444314261200008, "loss": 0.0096, "step": 451510 }, { "epoch": 1.17, "learning_rate": 0.0001244392543956286, "loss": 0.0098, "step": 451520 }, { "epoch": 1.17, "learning_rate": 0.00012443536617925713, "loss": 0.0181, "step": 451530 }, { "epoch": 1.17, "learning_rate": 0.00012443147796288568, "loss": 0.0164, "step": 451540 }, { "epoch": 1.17, "learning_rate": 0.00012442758974651422, "loss": 0.0095, "step": 451550 }, { "epoch": 1.17, "learning_rate": 0.00012442370153014273, "loss": 0.0137, "step": 451560 }, { "epoch": 1.17, "learning_rate": 0.00012441981331377127, "loss": 0.0129, "step": 451570 }, { "epoch": 1.17, "learning_rate": 0.00012441592509739981, "loss": 0.0091, "step": 451580 }, { "epoch": 1.17, "learning_rate": 0.00012441203688102833, "loss": 0.0138, "step": 451590 }, { "epoch": 1.17, "learning_rate": 0.00012440814866465687, "loss": 0.0116, "step": 451600 }, { "epoch": 1.17, "learning_rate": 0.0001244042604482854, "loss": 0.0115, "step": 451610 }, { "epoch": 1.17, "learning_rate": 0.00012440037223191395, "loss": 0.0124, "step": 451620 }, { "epoch": 1.17, "learning_rate": 0.00012439648401554247, "loss": 0.0112, "step": 451630 }, { "epoch": 1.17, "learning_rate": 0.00012439259579917104, "loss": 0.0114, "step": 451640 }, { "epoch": 1.17, "learning_rate": 0.00012438870758279955, "loss": 0.009, "step": 451650 }, { "epoch": 1.17, "learning_rate": 0.0001243848193664281, "loss": 0.0091, "step": 451660 }, { "epoch": 1.17, "learning_rate": 0.00012438093115005664, "loss": 0.01, "step": 451670 }, { "epoch": 1.17, "learning_rate": 0.00012437704293368518, "loss": 0.0101, "step": 451680 }, { "epoch": 1.17, "learning_rate": 0.0001243731547173137, "loss": 0.0116, "step": 451690 }, { "epoch": 1.17, "learning_rate": 0.00012436926650094223, "loss": 0.0126, "step": 451700 }, { "epoch": 1.17, "learning_rate": 0.00012436537828457077, "loss": 0.0101, "step": 451710 }, { "epoch": 1.17, "learning_rate": 0.00012436149006819932, "loss": 0.0095, "step": 451720 }, { "epoch": 1.17, "learning_rate": 0.00012435760185182783, "loss": 0.0153, "step": 451730 }, { "epoch": 1.17, "learning_rate": 0.00012435371363545637, "loss": 0.0093, "step": 451740 }, { "epoch": 1.17, "learning_rate": 0.00012434982541908491, "loss": 0.0131, "step": 451750 }, { "epoch": 1.17, "learning_rate": 0.00012434593720271346, "loss": 0.0154, "step": 451760 }, { "epoch": 1.17, "learning_rate": 0.00012434204898634197, "loss": 0.0085, "step": 451770 }, { "epoch": 1.17, "learning_rate": 0.0001243381607699705, "loss": 0.0142, "step": 451780 }, { "epoch": 1.17, "learning_rate": 0.00012433427255359905, "loss": 0.0113, "step": 451790 }, { "epoch": 1.17, "learning_rate": 0.0001243303843372276, "loss": 0.0141, "step": 451800 }, { "epoch": 1.17, "learning_rate": 0.0001243264961208561, "loss": 0.0102, "step": 451810 }, { "epoch": 1.17, "learning_rate": 0.00012432260790448465, "loss": 0.0121, "step": 451820 }, { "epoch": 1.17, "learning_rate": 0.0001243187196881132, "loss": 0.0107, "step": 451830 }, { "epoch": 1.17, "learning_rate": 0.00012431483147174173, "loss": 0.0094, "step": 451840 }, { "epoch": 1.17, "learning_rate": 0.00012431094325537028, "loss": 0.0097, "step": 451850 }, { "epoch": 1.17, "learning_rate": 0.0001243070550389988, "loss": 0.0142, "step": 451860 }, { "epoch": 1.17, "learning_rate": 0.00012430316682262733, "loss": 0.0128, "step": 451870 }, { "epoch": 1.17, "learning_rate": 0.00012429927860625587, "loss": 0.0097, "step": 451880 }, { "epoch": 1.17, "learning_rate": 0.00012429539038988442, "loss": 0.0096, "step": 451890 }, { "epoch": 1.17, "learning_rate": 0.00012429150217351293, "loss": 0.0118, "step": 451900 }, { "epoch": 1.17, "learning_rate": 0.00012428761395714147, "loss": 0.0112, "step": 451910 }, { "epoch": 1.17, "learning_rate": 0.00012428372574077, "loss": 0.0108, "step": 451920 }, { "epoch": 1.17, "learning_rate": 0.00012427983752439856, "loss": 0.0084, "step": 451930 }, { "epoch": 1.17, "learning_rate": 0.00012427594930802707, "loss": 0.0094, "step": 451940 }, { "epoch": 1.17, "learning_rate": 0.0001242720610916556, "loss": 0.01, "step": 451950 }, { "epoch": 1.17, "learning_rate": 0.00012426817287528415, "loss": 0.0119, "step": 451960 }, { "epoch": 1.17, "learning_rate": 0.0001242642846589127, "loss": 0.0117, "step": 451970 }, { "epoch": 1.17, "learning_rate": 0.0001242603964425412, "loss": 0.0094, "step": 451980 }, { "epoch": 1.17, "learning_rate": 0.00012425650822616978, "loss": 0.0125, "step": 451990 }, { "epoch": 1.17, "learning_rate": 0.0001242526200097983, "loss": 0.0134, "step": 452000 }, { "epoch": 1.17, "eval_cer": 0.8816956881384969, "eval_loss": 0.007198153994977474, "eval_runtime": 107.5259, "eval_samples_per_second": 18.6, "eval_steps_per_second": 4.65, "step": 452000 }, { "epoch": 1.17, "learning_rate": 0.00012424873179342683, "loss": 0.0107, "step": 452010 }, { "epoch": 1.17, "learning_rate": 0.00012424484357705538, "loss": 0.0084, "step": 452020 }, { "epoch": 1.17, "learning_rate": 0.00012424095536068392, "loss": 0.0103, "step": 452030 }, { "epoch": 1.17, "learning_rate": 0.00012423706714431243, "loss": 0.0102, "step": 452040 }, { "epoch": 1.17, "learning_rate": 0.00012423317892794097, "loss": 0.0102, "step": 452050 }, { "epoch": 1.17, "learning_rate": 0.00012422929071156952, "loss": 0.0117, "step": 452060 }, { "epoch": 1.17, "learning_rate": 0.00012422540249519803, "loss": 0.0126, "step": 452070 }, { "epoch": 1.17, "learning_rate": 0.00012422151427882657, "loss": 0.0118, "step": 452080 }, { "epoch": 1.17, "learning_rate": 0.0001242176260624551, "loss": 0.0085, "step": 452090 }, { "epoch": 1.17, "learning_rate": 0.00012421373784608365, "loss": 0.0098, "step": 452100 }, { "epoch": 1.17, "learning_rate": 0.00012420984962971217, "loss": 0.0102, "step": 452110 }, { "epoch": 1.17, "learning_rate": 0.0001242059614133407, "loss": 0.0091, "step": 452120 }, { "epoch": 1.17, "learning_rate": 0.00012420207319696925, "loss": 0.0084, "step": 452130 }, { "epoch": 1.17, "learning_rate": 0.0001241981849805978, "loss": 0.0108, "step": 452140 }, { "epoch": 1.17, "learning_rate": 0.0001241942967642263, "loss": 0.0125, "step": 452150 }, { "epoch": 1.17, "learning_rate": 0.00012419040854785488, "loss": 0.0104, "step": 452160 }, { "epoch": 1.17, "learning_rate": 0.0001241865203314834, "loss": 0.0094, "step": 452170 }, { "epoch": 1.17, "learning_rate": 0.00012418263211511193, "loss": 0.0106, "step": 452180 }, { "epoch": 1.17, "learning_rate": 0.00012417874389874048, "loss": 0.0177, "step": 452190 }, { "epoch": 1.17, "learning_rate": 0.00012417485568236902, "loss": 0.0116, "step": 452200 }, { "epoch": 1.17, "learning_rate": 0.00012417096746599753, "loss": 0.0111, "step": 452210 }, { "epoch": 1.17, "learning_rate": 0.00012416707924962607, "loss": 0.0105, "step": 452220 }, { "epoch": 1.17, "learning_rate": 0.00012416319103325461, "loss": 0.0117, "step": 452230 }, { "epoch": 1.17, "learning_rate": 0.00012415930281688316, "loss": 0.0089, "step": 452240 }, { "epoch": 1.17, "learning_rate": 0.00012415541460051167, "loss": 0.0099, "step": 452250 }, { "epoch": 1.17, "learning_rate": 0.0001241515263841402, "loss": 0.0175, "step": 452260 }, { "epoch": 1.17, "learning_rate": 0.00012414763816776875, "loss": 0.0103, "step": 452270 }, { "epoch": 1.17, "learning_rate": 0.0001241437499513973, "loss": 0.0082, "step": 452280 }, { "epoch": 1.17, "learning_rate": 0.0001241398617350258, "loss": 0.0118, "step": 452290 }, { "epoch": 1.17, "learning_rate": 0.00012413597351865435, "loss": 0.0098, "step": 452300 }, { "epoch": 1.17, "learning_rate": 0.0001241320853022829, "loss": 0.0132, "step": 452310 }, { "epoch": 1.17, "learning_rate": 0.0001241281970859114, "loss": 0.0071, "step": 452320 }, { "epoch": 1.17, "learning_rate": 0.00012412430886953995, "loss": 0.0089, "step": 452330 }, { "epoch": 1.17, "learning_rate": 0.0001241204206531685, "loss": 0.0104, "step": 452340 }, { "epoch": 1.17, "learning_rate": 0.00012411653243679703, "loss": 0.0081, "step": 452350 }, { "epoch": 1.17, "learning_rate": 0.00012411264422042557, "loss": 0.0101, "step": 452360 }, { "epoch": 1.17, "learning_rate": 0.00012410875600405412, "loss": 0.0103, "step": 452370 }, { "epoch": 1.17, "learning_rate": 0.00012410486778768263, "loss": 0.0114, "step": 452380 }, { "epoch": 1.17, "learning_rate": 0.00012410097957131117, "loss": 0.0118, "step": 452390 }, { "epoch": 1.17, "learning_rate": 0.00012409709135493971, "loss": 0.0093, "step": 452400 }, { "epoch": 1.17, "learning_rate": 0.00012409320313856826, "loss": 0.0125, "step": 452410 }, { "epoch": 1.17, "learning_rate": 0.00012408931492219677, "loss": 0.0113, "step": 452420 }, { "epoch": 1.17, "learning_rate": 0.0001240854267058253, "loss": 0.0126, "step": 452430 }, { "epoch": 1.17, "learning_rate": 0.00012408153848945385, "loss": 0.0116, "step": 452440 }, { "epoch": 1.17, "learning_rate": 0.0001240776502730824, "loss": 0.01, "step": 452450 }, { "epoch": 1.17, "learning_rate": 0.0001240737620567109, "loss": 0.0098, "step": 452460 }, { "epoch": 1.17, "learning_rate": 0.00012406987384033945, "loss": 0.0109, "step": 452470 }, { "epoch": 1.17, "learning_rate": 0.000124065985623968, "loss": 0.0141, "step": 452480 }, { "epoch": 1.17, "learning_rate": 0.00012406209740759653, "loss": 0.0107, "step": 452490 }, { "epoch": 1.17, "learning_rate": 0.00012405820919122505, "loss": 0.014, "step": 452500 }, { "epoch": 1.17, "learning_rate": 0.00012405432097485362, "loss": 0.0125, "step": 452510 }, { "epoch": 1.17, "learning_rate": 0.00012405043275848213, "loss": 0.0093, "step": 452520 }, { "epoch": 1.17, "learning_rate": 0.00012404654454211067, "loss": 0.0101, "step": 452530 }, { "epoch": 1.17, "learning_rate": 0.00012404265632573922, "loss": 0.0104, "step": 452540 }, { "epoch": 1.17, "learning_rate": 0.00012403876810936773, "loss": 0.0135, "step": 452550 }, { "epoch": 1.17, "learning_rate": 0.00012403487989299627, "loss": 0.0116, "step": 452560 }, { "epoch": 1.17, "learning_rate": 0.0001240309916766248, "loss": 0.0108, "step": 452570 }, { "epoch": 1.17, "learning_rate": 0.00012402710346025336, "loss": 0.0097, "step": 452580 }, { "epoch": 1.17, "learning_rate": 0.00012402321524388187, "loss": 0.0122, "step": 452590 }, { "epoch": 1.17, "learning_rate": 0.0001240193270275104, "loss": 0.0093, "step": 452600 }, { "epoch": 1.17, "learning_rate": 0.00012401543881113895, "loss": 0.011, "step": 452610 }, { "epoch": 1.17, "learning_rate": 0.0001240115505947675, "loss": 0.0077, "step": 452620 }, { "epoch": 1.17, "learning_rate": 0.000124007662378396, "loss": 0.0113, "step": 452630 }, { "epoch": 1.17, "learning_rate": 0.00012400377416202455, "loss": 0.0143, "step": 452640 }, { "epoch": 1.17, "learning_rate": 0.0001239998859456531, "loss": 0.0121, "step": 452650 }, { "epoch": 1.17, "learning_rate": 0.00012399599772928163, "loss": 0.0147, "step": 452660 }, { "epoch": 1.17, "learning_rate": 0.00012399210951291015, "loss": 0.0081, "step": 452670 }, { "epoch": 1.17, "learning_rate": 0.0001239882212965387, "loss": 0.0095, "step": 452680 }, { "epoch": 1.17, "learning_rate": 0.00012398433308016723, "loss": 0.0094, "step": 452690 }, { "epoch": 1.17, "learning_rate": 0.00012398044486379577, "loss": 0.0128, "step": 452700 }, { "epoch": 1.17, "learning_rate": 0.00012397655664742432, "loss": 0.011, "step": 452710 }, { "epoch": 1.17, "learning_rate": 0.00012397266843105286, "loss": 0.0086, "step": 452720 }, { "epoch": 1.17, "learning_rate": 0.00012396878021468137, "loss": 0.0111, "step": 452730 }, { "epoch": 1.17, "learning_rate": 0.0001239648919983099, "loss": 0.0125, "step": 452740 }, { "epoch": 1.17, "learning_rate": 0.00012396100378193845, "loss": 0.0087, "step": 452750 }, { "epoch": 1.17, "learning_rate": 0.000123957115565567, "loss": 0.0088, "step": 452760 }, { "epoch": 1.17, "learning_rate": 0.0001239532273491955, "loss": 0.0099, "step": 452770 }, { "epoch": 1.17, "learning_rate": 0.00012394933913282405, "loss": 0.0111, "step": 452780 }, { "epoch": 1.17, "learning_rate": 0.0001239454509164526, "loss": 0.0102, "step": 452790 }, { "epoch": 1.17, "learning_rate": 0.0001239415627000811, "loss": 0.0103, "step": 452800 }, { "epoch": 1.17, "learning_rate": 0.00012393767448370965, "loss": 0.0082, "step": 452810 }, { "epoch": 1.17, "learning_rate": 0.0001239337862673382, "loss": 0.0094, "step": 452820 }, { "epoch": 1.17, "learning_rate": 0.00012392989805096673, "loss": 0.01, "step": 452830 }, { "epoch": 1.17, "learning_rate": 0.00012392600983459525, "loss": 0.0117, "step": 452840 }, { "epoch": 1.17, "learning_rate": 0.0001239221216182238, "loss": 0.0121, "step": 452850 }, { "epoch": 1.17, "learning_rate": 0.00012391823340185233, "loss": 0.0131, "step": 452860 }, { "epoch": 1.17, "learning_rate": 0.00012391434518548087, "loss": 0.0147, "step": 452870 }, { "epoch": 1.17, "learning_rate": 0.0001239104569691094, "loss": 0.0108, "step": 452880 }, { "epoch": 1.17, "learning_rate": 0.00012390656875273796, "loss": 0.0099, "step": 452890 }, { "epoch": 1.17, "learning_rate": 0.00012390268053636647, "loss": 0.0119, "step": 452900 }, { "epoch": 1.17, "learning_rate": 0.000123898792319995, "loss": 0.0123, "step": 452910 }, { "epoch": 1.17, "learning_rate": 0.00012389490410362355, "loss": 0.0098, "step": 452920 }, { "epoch": 1.17, "learning_rate": 0.0001238910158872521, "loss": 0.0111, "step": 452930 }, { "epoch": 1.17, "learning_rate": 0.0001238871276708806, "loss": 0.012, "step": 452940 }, { "epoch": 1.17, "learning_rate": 0.00012388323945450915, "loss": 0.0106, "step": 452950 }, { "epoch": 1.17, "learning_rate": 0.0001238793512381377, "loss": 0.0093, "step": 452960 }, { "epoch": 1.17, "learning_rate": 0.00012387546302176623, "loss": 0.013, "step": 452970 }, { "epoch": 1.17, "learning_rate": 0.00012387157480539475, "loss": 0.0087, "step": 452980 }, { "epoch": 1.17, "learning_rate": 0.0001238676865890233, "loss": 0.0141, "step": 452990 }, { "epoch": 1.17, "learning_rate": 0.00012386379837265183, "loss": 0.0119, "step": 453000 }, { "epoch": 1.17, "eval_cer": 0.8816914892276944, "eval_loss": 0.007030075415968895, "eval_runtime": 108.0107, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 453000 }, { "epoch": 1.17, "learning_rate": 0.00012385991015628037, "loss": 0.0109, "step": 453010 }, { "epoch": 1.17, "learning_rate": 0.0001238560219399089, "loss": 0.0104, "step": 453020 }, { "epoch": 1.17, "learning_rate": 0.00012385213372353746, "loss": 0.0107, "step": 453030 }, { "epoch": 1.17, "learning_rate": 0.00012384824550716597, "loss": 0.0107, "step": 453040 }, { "epoch": 1.17, "learning_rate": 0.0001238443572907945, "loss": 0.01, "step": 453050 }, { "epoch": 1.17, "learning_rate": 0.00012384046907442306, "loss": 0.0132, "step": 453060 }, { "epoch": 1.17, "learning_rate": 0.00012383658085805157, "loss": 0.0108, "step": 453070 }, { "epoch": 1.17, "learning_rate": 0.0001238326926416801, "loss": 0.0234, "step": 453080 }, { "epoch": 1.17, "learning_rate": 0.00012382880442530865, "loss": 0.0119, "step": 453090 }, { "epoch": 1.17, "learning_rate": 0.0001238249162089372, "loss": 0.0086, "step": 453100 }, { "epoch": 1.17, "learning_rate": 0.0001238210279925657, "loss": 0.0084, "step": 453110 }, { "epoch": 1.17, "learning_rate": 0.00012381713977619425, "loss": 0.0093, "step": 453120 }, { "epoch": 1.17, "learning_rate": 0.0001238132515598228, "loss": 0.0135, "step": 453130 }, { "epoch": 1.17, "learning_rate": 0.00012380936334345133, "loss": 0.0098, "step": 453140 }, { "epoch": 1.17, "learning_rate": 0.00012380547512707985, "loss": 0.0099, "step": 453150 }, { "epoch": 1.17, "learning_rate": 0.0001238015869107084, "loss": 0.0089, "step": 453160 }, { "epoch": 1.17, "learning_rate": 0.00012379769869433693, "loss": 0.016, "step": 453170 }, { "epoch": 1.17, "learning_rate": 0.00012379381047796547, "loss": 0.0116, "step": 453180 }, { "epoch": 1.17, "learning_rate": 0.000123789922261594, "loss": 0.0119, "step": 453190 }, { "epoch": 1.17, "learning_rate": 0.00012378603404522253, "loss": 0.0127, "step": 453200 }, { "epoch": 1.17, "learning_rate": 0.00012378214582885107, "loss": 0.0087, "step": 453210 }, { "epoch": 1.17, "learning_rate": 0.0001237782576124796, "loss": 0.0112, "step": 453220 }, { "epoch": 1.17, "learning_rate": 0.00012377436939610815, "loss": 0.0098, "step": 453230 }, { "epoch": 1.17, "learning_rate": 0.0001237704811797367, "loss": 0.0096, "step": 453240 }, { "epoch": 1.17, "learning_rate": 0.0001237665929633652, "loss": 0.0082, "step": 453250 }, { "epoch": 1.17, "learning_rate": 0.00012376270474699375, "loss": 0.0078, "step": 453260 }, { "epoch": 1.17, "learning_rate": 0.0001237588165306223, "loss": 0.0094, "step": 453270 }, { "epoch": 1.17, "learning_rate": 0.00012375492831425084, "loss": 0.0113, "step": 453280 }, { "epoch": 1.17, "learning_rate": 0.00012375104009787935, "loss": 0.0112, "step": 453290 }, { "epoch": 1.18, "learning_rate": 0.0001237471518815079, "loss": 0.0098, "step": 453300 }, { "epoch": 1.18, "learning_rate": 0.00012374326366513643, "loss": 0.0092, "step": 453310 }, { "epoch": 1.18, "learning_rate": 0.00012373937544876495, "loss": 0.0132, "step": 453320 }, { "epoch": 1.18, "learning_rate": 0.0001237354872323935, "loss": 0.0148, "step": 453330 }, { "epoch": 1.18, "learning_rate": 0.00012373159901602203, "loss": 0.0093, "step": 453340 }, { "epoch": 1.18, "learning_rate": 0.00012372771079965057, "loss": 0.0112, "step": 453350 }, { "epoch": 1.18, "learning_rate": 0.0001237238225832791, "loss": 0.0107, "step": 453360 }, { "epoch": 1.18, "learning_rate": 0.00012371993436690763, "loss": 0.0099, "step": 453370 }, { "epoch": 1.18, "learning_rate": 0.00012371604615053617, "loss": 0.0093, "step": 453380 }, { "epoch": 1.18, "learning_rate": 0.0001237121579341647, "loss": 0.0106, "step": 453390 }, { "epoch": 1.18, "learning_rate": 0.00012370826971779323, "loss": 0.0143, "step": 453400 }, { "epoch": 1.18, "learning_rate": 0.0001237043815014218, "loss": 0.0105, "step": 453410 }, { "epoch": 1.18, "learning_rate": 0.0001237004932850503, "loss": 0.0092, "step": 453420 }, { "epoch": 1.18, "learning_rate": 0.00012369660506867885, "loss": 0.0107, "step": 453430 }, { "epoch": 1.18, "learning_rate": 0.0001236927168523074, "loss": 0.0102, "step": 453440 }, { "epoch": 1.18, "learning_rate": 0.00012368882863593594, "loss": 0.0125, "step": 453450 }, { "epoch": 1.18, "learning_rate": 0.00012368494041956445, "loss": 0.0129, "step": 453460 }, { "epoch": 1.18, "learning_rate": 0.000123681052203193, "loss": 0.014, "step": 453470 }, { "epoch": 1.18, "learning_rate": 0.00012367716398682153, "loss": 0.0145, "step": 453480 }, { "epoch": 1.18, "learning_rate": 0.00012367327577045007, "loss": 0.0088, "step": 453490 }, { "epoch": 1.18, "learning_rate": 0.0001236693875540786, "loss": 0.0109, "step": 453500 }, { "epoch": 1.18, "learning_rate": 0.00012366549933770713, "loss": 0.0113, "step": 453510 }, { "epoch": 1.18, "learning_rate": 0.00012366161112133567, "loss": 0.0101, "step": 453520 }, { "epoch": 1.18, "learning_rate": 0.00012365772290496421, "loss": 0.0123, "step": 453530 }, { "epoch": 1.18, "learning_rate": 0.00012365383468859273, "loss": 0.0127, "step": 453540 }, { "epoch": 1.18, "learning_rate": 0.00012364994647222127, "loss": 0.0146, "step": 453550 }, { "epoch": 1.18, "learning_rate": 0.0001236460582558498, "loss": 0.009, "step": 453560 }, { "epoch": 1.18, "learning_rate": 0.00012364217003947833, "loss": 0.0106, "step": 453570 }, { "epoch": 1.18, "learning_rate": 0.0001236382818231069, "loss": 0.0088, "step": 453580 }, { "epoch": 1.18, "learning_rate": 0.0001236343936067354, "loss": 0.0128, "step": 453590 }, { "epoch": 1.18, "learning_rate": 0.00012363050539036395, "loss": 0.0145, "step": 453600 }, { "epoch": 1.18, "learning_rate": 0.0001236266171739925, "loss": 0.0132, "step": 453610 }, { "epoch": 1.18, "learning_rate": 0.00012362272895762103, "loss": 0.011, "step": 453620 }, { "epoch": 1.18, "learning_rate": 0.00012361884074124955, "loss": 0.0097, "step": 453630 }, { "epoch": 1.18, "learning_rate": 0.0001236149525248781, "loss": 0.017, "step": 453640 }, { "epoch": 1.18, "learning_rate": 0.00012361106430850663, "loss": 0.0106, "step": 453650 }, { "epoch": 1.18, "learning_rate": 0.00012360717609213517, "loss": 0.0094, "step": 453660 }, { "epoch": 1.18, "learning_rate": 0.0001236032878757637, "loss": 0.0123, "step": 453670 }, { "epoch": 1.18, "learning_rate": 0.00012359939965939223, "loss": 0.0082, "step": 453680 }, { "epoch": 1.18, "learning_rate": 0.00012359551144302077, "loss": 0.0104, "step": 453690 }, { "epoch": 1.18, "learning_rate": 0.00012359162322664931, "loss": 0.0141, "step": 453700 }, { "epoch": 1.18, "learning_rate": 0.00012358773501027783, "loss": 0.01, "step": 453710 }, { "epoch": 1.18, "learning_rate": 0.00012358384679390637, "loss": 0.0117, "step": 453720 }, { "epoch": 1.18, "learning_rate": 0.0001235799585775349, "loss": 0.0081, "step": 453730 }, { "epoch": 1.18, "learning_rate": 0.00012357607036116345, "loss": 0.0099, "step": 453740 }, { "epoch": 1.18, "learning_rate": 0.000123572182144792, "loss": 0.0119, "step": 453750 }, { "epoch": 1.18, "learning_rate": 0.00012356829392842054, "loss": 0.0165, "step": 453760 }, { "epoch": 1.18, "learning_rate": 0.00012356440571204905, "loss": 0.0109, "step": 453770 }, { "epoch": 1.18, "learning_rate": 0.0001235605174956776, "loss": 0.0114, "step": 453780 }, { "epoch": 1.18, "learning_rate": 0.00012355662927930613, "loss": 0.0101, "step": 453790 }, { "epoch": 1.18, "learning_rate": 0.00012355274106293465, "loss": 0.0098, "step": 453800 }, { "epoch": 1.18, "learning_rate": 0.0001235488528465632, "loss": 0.0113, "step": 453810 }, { "epoch": 1.18, "learning_rate": 0.00012354496463019173, "loss": 0.0106, "step": 453820 }, { "epoch": 1.18, "learning_rate": 0.00012354107641382027, "loss": 0.0081, "step": 453830 }, { "epoch": 1.18, "learning_rate": 0.0001235371881974488, "loss": 0.0087, "step": 453840 }, { "epoch": 1.18, "learning_rate": 0.00012353329998107733, "loss": 0.009, "step": 453850 }, { "epoch": 1.18, "learning_rate": 0.00012352941176470587, "loss": 0.0094, "step": 453860 }, { "epoch": 1.18, "learning_rate": 0.0001235255235483344, "loss": 0.0125, "step": 453870 }, { "epoch": 1.18, "learning_rate": 0.00012352163533196293, "loss": 0.0093, "step": 453880 }, { "epoch": 1.18, "learning_rate": 0.00012351774711559147, "loss": 0.0105, "step": 453890 }, { "epoch": 1.18, "learning_rate": 0.00012351385889922, "loss": 0.0085, "step": 453900 }, { "epoch": 1.18, "learning_rate": 0.00012350997068284855, "loss": 0.0094, "step": 453910 }, { "epoch": 1.18, "learning_rate": 0.00012350608246647707, "loss": 0.0088, "step": 453920 }, { "epoch": 1.18, "learning_rate": 0.00012350219425010564, "loss": 0.0102, "step": 453930 }, { "epoch": 1.18, "learning_rate": 0.00012349830603373415, "loss": 0.0129, "step": 453940 }, { "epoch": 1.18, "learning_rate": 0.0001234944178173627, "loss": 0.0119, "step": 453950 }, { "epoch": 1.18, "learning_rate": 0.00012349052960099123, "loss": 0.0105, "step": 453960 }, { "epoch": 1.18, "learning_rate": 0.00012348664138461978, "loss": 0.01, "step": 453970 }, { "epoch": 1.18, "learning_rate": 0.0001234827531682483, "loss": 0.0105, "step": 453980 }, { "epoch": 1.18, "learning_rate": 0.00012347886495187683, "loss": 0.0146, "step": 453990 }, { "epoch": 1.18, "learning_rate": 0.00012347497673550537, "loss": 0.0125, "step": 454000 }, { "epoch": 1.18, "eval_cer": 0.8816760932214184, "eval_loss": 0.0068307314068078995, "eval_runtime": 107.3869, "eval_samples_per_second": 18.624, "eval_steps_per_second": 4.656, "step": 454000 }, { "epoch": 1.18, "learning_rate": 0.00012347108851913391, "loss": 0.0114, "step": 454010 }, { "epoch": 1.18, "learning_rate": 0.00012346720030276243, "loss": 0.0114, "step": 454020 }, { "epoch": 1.18, "learning_rate": 0.00012346331208639097, "loss": 0.0146, "step": 454030 }, { "epoch": 1.18, "learning_rate": 0.0001234594238700195, "loss": 0.012, "step": 454040 }, { "epoch": 1.18, "learning_rate": 0.00012345553565364803, "loss": 0.0123, "step": 454050 }, { "epoch": 1.18, "learning_rate": 0.00012345164743727657, "loss": 0.0102, "step": 454060 }, { "epoch": 1.18, "learning_rate": 0.0001234477592209051, "loss": 0.0149, "step": 454070 }, { "epoch": 1.18, "learning_rate": 0.00012344387100453365, "loss": 0.0102, "step": 454080 }, { "epoch": 1.18, "learning_rate": 0.00012343998278816217, "loss": 0.0088, "step": 454090 }, { "epoch": 1.18, "learning_rate": 0.00012343609457179074, "loss": 0.0119, "step": 454100 }, { "epoch": 1.18, "learning_rate": 0.00012343220635541925, "loss": 0.0128, "step": 454110 }, { "epoch": 1.18, "learning_rate": 0.0001234283181390478, "loss": 0.0123, "step": 454120 }, { "epoch": 1.18, "learning_rate": 0.00012342442992267633, "loss": 0.0121, "step": 454130 }, { "epoch": 1.18, "learning_rate": 0.00012342054170630487, "loss": 0.0164, "step": 454140 }, { "epoch": 1.18, "learning_rate": 0.0001234166534899334, "loss": 0.009, "step": 454150 }, { "epoch": 1.18, "learning_rate": 0.00012341276527356193, "loss": 0.0093, "step": 454160 }, { "epoch": 1.18, "learning_rate": 0.00012340887705719047, "loss": 0.013, "step": 454170 }, { "epoch": 1.18, "learning_rate": 0.00012340498884081901, "loss": 0.0111, "step": 454180 }, { "epoch": 1.18, "learning_rate": 0.00012340110062444753, "loss": 0.0098, "step": 454190 }, { "epoch": 1.18, "learning_rate": 0.00012339721240807607, "loss": 0.0097, "step": 454200 }, { "epoch": 1.18, "learning_rate": 0.0001233933241917046, "loss": 0.0127, "step": 454210 }, { "epoch": 1.18, "learning_rate": 0.00012338943597533315, "loss": 0.012, "step": 454220 }, { "epoch": 1.18, "learning_rate": 0.00012338554775896167, "loss": 0.01, "step": 454230 }, { "epoch": 1.18, "learning_rate": 0.0001233816595425902, "loss": 0.0126, "step": 454240 }, { "epoch": 1.18, "learning_rate": 0.00012337777132621875, "loss": 0.0145, "step": 454250 }, { "epoch": 1.18, "learning_rate": 0.0001233738831098473, "loss": 0.0086, "step": 454260 }, { "epoch": 1.18, "learning_rate": 0.0001233699948934758, "loss": 0.0103, "step": 454270 }, { "epoch": 1.18, "learning_rate": 0.00012336610667710438, "loss": 0.0089, "step": 454280 }, { "epoch": 1.18, "learning_rate": 0.0001233622184607329, "loss": 0.0124, "step": 454290 }, { "epoch": 1.18, "learning_rate": 0.00012335833024436143, "loss": 0.0141, "step": 454300 }, { "epoch": 1.18, "learning_rate": 0.00012335444202798997, "loss": 0.0113, "step": 454310 }, { "epoch": 1.18, "learning_rate": 0.0001233505538116185, "loss": 0.012, "step": 454320 }, { "epoch": 1.18, "learning_rate": 0.00012334666559524703, "loss": 0.0123, "step": 454330 }, { "epoch": 1.18, "learning_rate": 0.00012334277737887557, "loss": 0.0104, "step": 454340 }, { "epoch": 1.18, "learning_rate": 0.00012333888916250411, "loss": 0.0101, "step": 454350 }, { "epoch": 1.18, "learning_rate": 0.00012333500094613263, "loss": 0.0123, "step": 454360 }, { "epoch": 1.18, "learning_rate": 0.00012333111272976117, "loss": 0.0132, "step": 454370 }, { "epoch": 1.18, "learning_rate": 0.0001233272245133897, "loss": 0.0103, "step": 454380 }, { "epoch": 1.18, "learning_rate": 0.00012332333629701825, "loss": 0.0133, "step": 454390 }, { "epoch": 1.18, "learning_rate": 0.00012331944808064677, "loss": 0.0114, "step": 454400 }, { "epoch": 1.18, "learning_rate": 0.0001233155598642753, "loss": 0.0108, "step": 454410 }, { "epoch": 1.18, "learning_rate": 0.00012331167164790385, "loss": 0.0108, "step": 454420 }, { "epoch": 1.18, "learning_rate": 0.0001233077834315324, "loss": 0.0094, "step": 454430 }, { "epoch": 1.18, "learning_rate": 0.0001233038952151609, "loss": 0.0127, "step": 454440 }, { "epoch": 1.18, "learning_rate": 0.00012330000699878948, "loss": 0.0104, "step": 454450 }, { "epoch": 1.18, "learning_rate": 0.000123296118782418, "loss": 0.0114, "step": 454460 }, { "epoch": 1.18, "learning_rate": 0.00012329223056604653, "loss": 0.013, "step": 454470 }, { "epoch": 1.18, "learning_rate": 0.00012328834234967507, "loss": 0.0128, "step": 454480 }, { "epoch": 1.18, "learning_rate": 0.00012328445413330362, "loss": 0.0114, "step": 454490 }, { "epoch": 1.18, "learning_rate": 0.00012328056591693213, "loss": 0.0109, "step": 454500 }, { "epoch": 1.18, "learning_rate": 0.00012327667770056067, "loss": 0.0125, "step": 454510 }, { "epoch": 1.18, "learning_rate": 0.0001232727894841892, "loss": 0.0107, "step": 454520 }, { "epoch": 1.18, "learning_rate": 0.00012326890126781775, "loss": 0.0107, "step": 454530 }, { "epoch": 1.18, "learning_rate": 0.00012326501305144627, "loss": 0.0114, "step": 454540 }, { "epoch": 1.18, "learning_rate": 0.0001232611248350748, "loss": 0.0105, "step": 454550 }, { "epoch": 1.18, "learning_rate": 0.00012325723661870335, "loss": 0.011, "step": 454560 }, { "epoch": 1.18, "learning_rate": 0.00012325334840233187, "loss": 0.0111, "step": 454570 }, { "epoch": 1.18, "learning_rate": 0.0001232494601859604, "loss": 0.0134, "step": 454580 }, { "epoch": 1.18, "learning_rate": 0.00012324557196958895, "loss": 0.0115, "step": 454590 }, { "epoch": 1.18, "learning_rate": 0.0001232416837532175, "loss": 0.0104, "step": 454600 }, { "epoch": 1.18, "learning_rate": 0.000123237795536846, "loss": 0.0096, "step": 454610 }, { "epoch": 1.18, "learning_rate": 0.00012323390732047458, "loss": 0.0111, "step": 454620 }, { "epoch": 1.18, "learning_rate": 0.0001232300191041031, "loss": 0.0148, "step": 454630 }, { "epoch": 1.18, "learning_rate": 0.00012322613088773163, "loss": 0.0083, "step": 454640 }, { "epoch": 1.18, "learning_rate": 0.00012322224267136017, "loss": 0.0133, "step": 454650 }, { "epoch": 1.18, "learning_rate": 0.00012321835445498871, "loss": 0.0091, "step": 454660 }, { "epoch": 1.18, "learning_rate": 0.00012321446623861723, "loss": 0.0125, "step": 454670 }, { "epoch": 1.18, "learning_rate": 0.00012321057802224577, "loss": 0.0087, "step": 454680 }, { "epoch": 1.18, "learning_rate": 0.0001232066898058743, "loss": 0.0115, "step": 454690 }, { "epoch": 1.18, "learning_rate": 0.00012320280158950285, "loss": 0.0115, "step": 454700 }, { "epoch": 1.18, "learning_rate": 0.00012319891337313137, "loss": 0.0094, "step": 454710 }, { "epoch": 1.18, "learning_rate": 0.0001231950251567599, "loss": 0.0138, "step": 454720 }, { "epoch": 1.18, "learning_rate": 0.00012319113694038845, "loss": 0.011, "step": 454730 }, { "epoch": 1.18, "learning_rate": 0.000123187248724017, "loss": 0.0101, "step": 454740 }, { "epoch": 1.18, "learning_rate": 0.0001231833605076455, "loss": 0.0102, "step": 454750 }, { "epoch": 1.18, "learning_rate": 0.00012317947229127405, "loss": 0.0099, "step": 454760 }, { "epoch": 1.18, "learning_rate": 0.0001231755840749026, "loss": 0.0108, "step": 454770 }, { "epoch": 1.18, "learning_rate": 0.0001231716958585311, "loss": 0.0082, "step": 454780 }, { "epoch": 1.18, "learning_rate": 0.00012316780764215965, "loss": 0.0151, "step": 454790 }, { "epoch": 1.18, "learning_rate": 0.0001231639194257882, "loss": 0.01, "step": 454800 }, { "epoch": 1.18, "learning_rate": 0.00012316003120941673, "loss": 0.0116, "step": 454810 }, { "epoch": 1.18, "learning_rate": 0.00012315614299304527, "loss": 0.008, "step": 454820 }, { "epoch": 1.18, "learning_rate": 0.00012315225477667381, "loss": 0.0107, "step": 454830 }, { "epoch": 1.18, "learning_rate": 0.00012314836656030233, "loss": 0.0107, "step": 454840 }, { "epoch": 1.18, "learning_rate": 0.00012314447834393087, "loss": 0.0123, "step": 454850 }, { "epoch": 1.18, "learning_rate": 0.0001231405901275594, "loss": 0.0083, "step": 454860 }, { "epoch": 1.18, "learning_rate": 0.00012313670191118795, "loss": 0.0077, "step": 454870 }, { "epoch": 1.18, "learning_rate": 0.00012313281369481647, "loss": 0.0139, "step": 454880 }, { "epoch": 1.18, "learning_rate": 0.000123128925478445, "loss": 0.0129, "step": 454890 }, { "epoch": 1.18, "learning_rate": 0.00012312503726207355, "loss": 0.0095, "step": 454900 }, { "epoch": 1.18, "learning_rate": 0.0001231211490457021, "loss": 0.0173, "step": 454910 }, { "epoch": 1.18, "learning_rate": 0.0001231172608293306, "loss": 0.0107, "step": 454920 }, { "epoch": 1.18, "learning_rate": 0.00012311337261295915, "loss": 0.0097, "step": 454930 }, { "epoch": 1.18, "learning_rate": 0.0001231094843965877, "loss": 0.0109, "step": 454940 }, { "epoch": 1.18, "learning_rate": 0.00012310559618021623, "loss": 0.0122, "step": 454950 }, { "epoch": 1.18, "learning_rate": 0.00012310170796384475, "loss": 0.0111, "step": 454960 }, { "epoch": 1.18, "learning_rate": 0.00012309781974747332, "loss": 0.0079, "step": 454970 }, { "epoch": 1.18, "learning_rate": 0.00012309393153110183, "loss": 0.0104, "step": 454980 }, { "epoch": 1.18, "learning_rate": 0.00012309004331473037, "loss": 0.0108, "step": 454990 }, { "epoch": 1.18, "learning_rate": 0.0001230861550983589, "loss": 0.0104, "step": 455000 }, { "epoch": 1.18, "eval_cer": 0.8816746935844841, "eval_loss": 0.007326171267777681, "eval_runtime": 107.2391, "eval_samples_per_second": 18.65, "eval_steps_per_second": 4.662, "step": 455000 }, { "epoch": 1.18, "learning_rate": 0.00012308226688198746, "loss": 0.0138, "step": 455010 }, { "epoch": 1.18, "learning_rate": 0.00012307837866561597, "loss": 0.0125, "step": 455020 }, { "epoch": 1.18, "learning_rate": 0.0001230744904492445, "loss": 0.0083, "step": 455030 }, { "epoch": 1.18, "learning_rate": 0.00012307060223287305, "loss": 0.0109, "step": 455040 }, { "epoch": 1.18, "learning_rate": 0.00012306671401650157, "loss": 0.0098, "step": 455050 }, { "epoch": 1.18, "learning_rate": 0.0001230628258001301, "loss": 0.0123, "step": 455060 }, { "epoch": 1.18, "learning_rate": 0.00012305893758375865, "loss": 0.0101, "step": 455070 }, { "epoch": 1.18, "learning_rate": 0.0001230550493673872, "loss": 0.0114, "step": 455080 }, { "epoch": 1.18, "learning_rate": 0.0001230511611510157, "loss": 0.0121, "step": 455090 }, { "epoch": 1.18, "learning_rate": 0.00012304727293464425, "loss": 0.0098, "step": 455100 }, { "epoch": 1.18, "learning_rate": 0.0001230433847182728, "loss": 0.0105, "step": 455110 }, { "epoch": 1.18, "learning_rate": 0.00012303949650190133, "loss": 0.0101, "step": 455120 }, { "epoch": 1.18, "learning_rate": 0.00012303560828552985, "loss": 0.0107, "step": 455130 }, { "epoch": 1.18, "learning_rate": 0.0001230317200691584, "loss": 0.0107, "step": 455140 }, { "epoch": 1.18, "learning_rate": 0.00012302783185278693, "loss": 0.0095, "step": 455150 }, { "epoch": 1.18, "learning_rate": 0.00012302394363641547, "loss": 0.0106, "step": 455160 }, { "epoch": 1.18, "learning_rate": 0.000123020055420044, "loss": 0.0105, "step": 455170 }, { "epoch": 1.18, "learning_rate": 0.00012301616720367255, "loss": 0.0109, "step": 455180 }, { "epoch": 1.18, "learning_rate": 0.00012301227898730107, "loss": 0.0092, "step": 455190 }, { "epoch": 1.18, "learning_rate": 0.0001230083907709296, "loss": 0.0095, "step": 455200 }, { "epoch": 1.18, "learning_rate": 0.00012300450255455815, "loss": 0.0092, "step": 455210 }, { "epoch": 1.18, "learning_rate": 0.0001230006143381867, "loss": 0.0129, "step": 455220 }, { "epoch": 1.18, "learning_rate": 0.0001229967261218152, "loss": 0.0115, "step": 455230 }, { "epoch": 1.18, "learning_rate": 0.00012299283790544375, "loss": 0.0108, "step": 455240 }, { "epoch": 1.18, "learning_rate": 0.0001229889496890723, "loss": 0.0091, "step": 455250 }, { "epoch": 1.18, "learning_rate": 0.00012298506147270083, "loss": 0.0121, "step": 455260 }, { "epoch": 1.18, "learning_rate": 0.00012298117325632935, "loss": 0.0136, "step": 455270 }, { "epoch": 1.18, "learning_rate": 0.0001229772850399579, "loss": 0.0081, "step": 455280 }, { "epoch": 1.18, "learning_rate": 0.00012297339682358643, "loss": 0.0125, "step": 455290 }, { "epoch": 1.18, "learning_rate": 0.00012296950860721495, "loss": 0.0136, "step": 455300 }, { "epoch": 1.18, "learning_rate": 0.0001229656203908435, "loss": 0.0074, "step": 455310 }, { "epoch": 1.18, "learning_rate": 0.00012296173217447203, "loss": 0.0088, "step": 455320 }, { "epoch": 1.18, "learning_rate": 0.00012295784395810057, "loss": 0.0113, "step": 455330 }, { "epoch": 1.18, "learning_rate": 0.0001229539557417291, "loss": 0.0115, "step": 455340 }, { "epoch": 1.18, "learning_rate": 0.00012295006752535765, "loss": 0.0096, "step": 455350 }, { "epoch": 1.18, "learning_rate": 0.00012294617930898617, "loss": 0.0107, "step": 455360 }, { "epoch": 1.18, "learning_rate": 0.0001229422910926147, "loss": 0.0099, "step": 455370 }, { "epoch": 1.18, "learning_rate": 0.00012293840287624325, "loss": 0.0125, "step": 455380 }, { "epoch": 1.18, "learning_rate": 0.0001229345146598718, "loss": 0.0094, "step": 455390 }, { "epoch": 1.18, "learning_rate": 0.0001229306264435003, "loss": 0.0132, "step": 455400 }, { "epoch": 1.18, "learning_rate": 0.00012292673822712885, "loss": 0.0115, "step": 455410 }, { "epoch": 1.18, "learning_rate": 0.0001229228500107574, "loss": 0.0097, "step": 455420 }, { "epoch": 1.18, "learning_rate": 0.00012291896179438593, "loss": 0.0118, "step": 455430 }, { "epoch": 1.18, "learning_rate": 0.00012291507357801445, "loss": 0.01, "step": 455440 }, { "epoch": 1.18, "learning_rate": 0.000122911185361643, "loss": 0.013, "step": 455450 }, { "epoch": 1.18, "learning_rate": 0.00012290729714527153, "loss": 0.0133, "step": 455460 }, { "epoch": 1.18, "learning_rate": 0.00012290340892890007, "loss": 0.0093, "step": 455470 }, { "epoch": 1.18, "learning_rate": 0.0001228995207125286, "loss": 0.0099, "step": 455480 }, { "epoch": 1.18, "learning_rate": 0.00012289563249615716, "loss": 0.0081, "step": 455490 }, { "epoch": 1.18, "learning_rate": 0.00012289174427978567, "loss": 0.0085, "step": 455500 }, { "epoch": 1.18, "learning_rate": 0.0001228878560634142, "loss": 0.0111, "step": 455510 }, { "epoch": 1.18, "learning_rate": 0.00012288396784704275, "loss": 0.0113, "step": 455520 }, { "epoch": 1.18, "learning_rate": 0.00012288007963067127, "loss": 0.011, "step": 455530 }, { "epoch": 1.18, "learning_rate": 0.0001228761914142998, "loss": 0.0129, "step": 455540 }, { "epoch": 1.18, "learning_rate": 0.00012287230319792835, "loss": 0.0112, "step": 455550 }, { "epoch": 1.18, "learning_rate": 0.0001228684149815569, "loss": 0.0097, "step": 455560 }, { "epoch": 1.18, "learning_rate": 0.0001228645267651854, "loss": 0.0102, "step": 455570 }, { "epoch": 1.18, "learning_rate": 0.00012286063854881395, "loss": 0.0106, "step": 455580 }, { "epoch": 1.18, "learning_rate": 0.0001228567503324425, "loss": 0.0098, "step": 455590 }, { "epoch": 1.18, "learning_rate": 0.00012285286211607103, "loss": 0.01, "step": 455600 }, { "epoch": 1.18, "learning_rate": 0.00012284897389969955, "loss": 0.0081, "step": 455610 }, { "epoch": 1.18, "learning_rate": 0.0001228450856833281, "loss": 0.0114, "step": 455620 }, { "epoch": 1.18, "learning_rate": 0.00012284119746695663, "loss": 0.014, "step": 455630 }, { "epoch": 1.18, "learning_rate": 0.00012283730925058517, "loss": 0.0079, "step": 455640 }, { "epoch": 1.18, "learning_rate": 0.00012283342103421369, "loss": 0.0133, "step": 455650 }, { "epoch": 1.18, "learning_rate": 0.00012282953281784223, "loss": 0.0116, "step": 455660 }, { "epoch": 1.18, "learning_rate": 0.00012282564460147077, "loss": 0.0094, "step": 455670 }, { "epoch": 1.18, "learning_rate": 0.0001228217563850993, "loss": 0.0122, "step": 455680 }, { "epoch": 1.18, "learning_rate": 0.00012281786816872785, "loss": 0.0079, "step": 455690 }, { "epoch": 1.18, "learning_rate": 0.0001228139799523564, "loss": 0.0106, "step": 455700 }, { "epoch": 1.18, "learning_rate": 0.0001228100917359849, "loss": 0.0104, "step": 455710 }, { "epoch": 1.18, "learning_rate": 0.00012280620351961345, "loss": 0.008, "step": 455720 }, { "epoch": 1.18, "learning_rate": 0.000122802315303242, "loss": 0.0099, "step": 455730 }, { "epoch": 1.18, "learning_rate": 0.00012279842708687053, "loss": 0.0111, "step": 455740 }, { "epoch": 1.18, "learning_rate": 0.00012279453887049905, "loss": 0.0106, "step": 455750 }, { "epoch": 1.18, "learning_rate": 0.0001227906506541276, "loss": 0.0129, "step": 455760 }, { "epoch": 1.18, "learning_rate": 0.00012278676243775613, "loss": 0.0087, "step": 455770 }, { "epoch": 1.18, "learning_rate": 0.00012278287422138465, "loss": 0.0095, "step": 455780 }, { "epoch": 1.18, "learning_rate": 0.0001227789860050132, "loss": 0.0104, "step": 455790 }, { "epoch": 1.18, "learning_rate": 0.00012277509778864173, "loss": 0.0105, "step": 455800 }, { "epoch": 1.18, "learning_rate": 0.00012277120957227027, "loss": 0.0112, "step": 455810 }, { "epoch": 1.18, "learning_rate": 0.00012276732135589879, "loss": 0.0103, "step": 455820 }, { "epoch": 1.18, "learning_rate": 0.00012276343313952733, "loss": 0.0093, "step": 455830 }, { "epoch": 1.18, "learning_rate": 0.00012275954492315587, "loss": 0.0087, "step": 455840 }, { "epoch": 1.18, "learning_rate": 0.0001227556567067844, "loss": 0.0099, "step": 455850 }, { "epoch": 1.18, "learning_rate": 0.00012275176849041293, "loss": 0.0091, "step": 455860 }, { "epoch": 1.18, "learning_rate": 0.0001227478802740415, "loss": 0.0111, "step": 455870 }, { "epoch": 1.18, "learning_rate": 0.00012274399205767, "loss": 0.0103, "step": 455880 }, { "epoch": 1.18, "learning_rate": 0.00012274010384129855, "loss": 0.0111, "step": 455890 }, { "epoch": 1.18, "learning_rate": 0.0001227362156249271, "loss": 0.0122, "step": 455900 }, { "epoch": 1.18, "learning_rate": 0.00012273232740855563, "loss": 0.009, "step": 455910 }, { "epoch": 1.18, "learning_rate": 0.00012272843919218415, "loss": 0.0111, "step": 455920 }, { "epoch": 1.18, "learning_rate": 0.0001227245509758127, "loss": 0.0137, "step": 455930 }, { "epoch": 1.18, "learning_rate": 0.00012272066275944123, "loss": 0.0095, "step": 455940 }, { "epoch": 1.18, "learning_rate": 0.00012271677454306977, "loss": 0.0093, "step": 455950 }, { "epoch": 1.18, "learning_rate": 0.0001227128863266983, "loss": 0.0103, "step": 455960 }, { "epoch": 1.18, "learning_rate": 0.00012270899811032683, "loss": 0.0118, "step": 455970 }, { "epoch": 1.18, "learning_rate": 0.00012270510989395537, "loss": 0.0132, "step": 455980 }, { "epoch": 1.18, "learning_rate": 0.0001227012216775839, "loss": 0.0105, "step": 455990 }, { "epoch": 1.18, "learning_rate": 0.00012269733346121243, "loss": 0.0092, "step": 456000 }, { "epoch": 1.18, "eval_cer": 0.881688689953826, "eval_loss": 0.0070779649540781975, "eval_runtime": 107.4452, "eval_samples_per_second": 18.614, "eval_steps_per_second": 4.654, "step": 456000 }, { "epoch": 1.18, "learning_rate": 0.000122693445244841, "loss": 0.0093, "step": 456010 }, { "epoch": 1.18, "learning_rate": 0.0001226895570284695, "loss": 0.0095, "step": 456020 }, { "epoch": 1.18, "learning_rate": 0.00012268566881209802, "loss": 0.0106, "step": 456030 }, { "epoch": 1.18, "learning_rate": 0.0001226817805957266, "loss": 0.0143, "step": 456040 }, { "epoch": 1.18, "learning_rate": 0.0001226778923793551, "loss": 0.0096, "step": 456050 }, { "epoch": 1.18, "learning_rate": 0.00012267400416298365, "loss": 0.0108, "step": 456060 }, { "epoch": 1.18, "learning_rate": 0.0001226701159466122, "loss": 0.0114, "step": 456070 }, { "epoch": 1.18, "learning_rate": 0.00012266622773024073, "loss": 0.0089, "step": 456080 }, { "epoch": 1.18, "learning_rate": 0.00012266233951386925, "loss": 0.0088, "step": 456090 }, { "epoch": 1.18, "learning_rate": 0.0001226584512974978, "loss": 0.0121, "step": 456100 }, { "epoch": 1.18, "learning_rate": 0.00012265456308112633, "loss": 0.0125, "step": 456110 }, { "epoch": 1.18, "learning_rate": 0.00012265067486475487, "loss": 0.0139, "step": 456120 }, { "epoch": 1.18, "learning_rate": 0.0001226467866483834, "loss": 0.0132, "step": 456130 }, { "epoch": 1.18, "learning_rate": 0.00012264289843201193, "loss": 0.0107, "step": 456140 }, { "epoch": 1.18, "learning_rate": 0.00012263901021564047, "loss": 0.0107, "step": 456150 }, { "epoch": 1.18, "learning_rate": 0.000122635121999269, "loss": 0.0114, "step": 456160 }, { "epoch": 1.18, "learning_rate": 0.00012263123378289753, "loss": 0.0119, "step": 456170 }, { "epoch": 1.18, "learning_rate": 0.00012262734556652607, "loss": 0.0115, "step": 456180 }, { "epoch": 1.18, "learning_rate": 0.0001226234573501546, "loss": 0.0127, "step": 456190 }, { "epoch": 1.18, "learning_rate": 0.00012261956913378315, "loss": 0.0104, "step": 456200 }, { "epoch": 1.18, "learning_rate": 0.0001226156809174117, "loss": 0.0094, "step": 456210 }, { "epoch": 1.18, "learning_rate": 0.00012261179270104023, "loss": 0.0145, "step": 456220 }, { "epoch": 1.18, "learning_rate": 0.00012260790448466875, "loss": 0.0101, "step": 456230 }, { "epoch": 1.18, "learning_rate": 0.0001226040162682973, "loss": 0.0106, "step": 456240 }, { "epoch": 1.18, "learning_rate": 0.00012260012805192583, "loss": 0.0112, "step": 456250 }, { "epoch": 1.18, "learning_rate": 0.00012259623983555437, "loss": 0.0172, "step": 456260 }, { "epoch": 1.18, "learning_rate": 0.0001225923516191829, "loss": 0.01, "step": 456270 }, { "epoch": 1.18, "learning_rate": 0.00012258846340281143, "loss": 0.0092, "step": 456280 }, { "epoch": 1.18, "learning_rate": 0.00012258457518643997, "loss": 0.0113, "step": 456290 }, { "epoch": 1.18, "learning_rate": 0.00012258068697006849, "loss": 0.0099, "step": 456300 }, { "epoch": 1.18, "learning_rate": 0.00012257679875369703, "loss": 0.0145, "step": 456310 }, { "epoch": 1.18, "learning_rate": 0.00012257291053732557, "loss": 0.0087, "step": 456320 }, { "epoch": 1.18, "learning_rate": 0.0001225690223209541, "loss": 0.0134, "step": 456330 }, { "epoch": 1.18, "learning_rate": 0.00012256513410458263, "loss": 0.0121, "step": 456340 }, { "epoch": 1.18, "learning_rate": 0.00012256124588821117, "loss": 0.0109, "step": 456350 }, { "epoch": 1.18, "learning_rate": 0.0001225573576718397, "loss": 0.0111, "step": 456360 }, { "epoch": 1.18, "learning_rate": 0.00012255346945546825, "loss": 0.017, "step": 456370 }, { "epoch": 1.18, "learning_rate": 0.00012254958123909677, "loss": 0.0087, "step": 456380 }, { "epoch": 1.18, "learning_rate": 0.00012254569302272533, "loss": 0.0113, "step": 456390 }, { "epoch": 1.18, "learning_rate": 0.00012254180480635385, "loss": 0.0125, "step": 456400 }, { "epoch": 1.18, "learning_rate": 0.0001225379165899824, "loss": 0.0103, "step": 456410 }, { "epoch": 1.18, "learning_rate": 0.00012253402837361093, "loss": 0.0094, "step": 456420 }, { "epoch": 1.18, "learning_rate": 0.00012253014015723947, "loss": 0.0123, "step": 456430 }, { "epoch": 1.18, "learning_rate": 0.000122526251940868, "loss": 0.0086, "step": 456440 }, { "epoch": 1.18, "learning_rate": 0.00012252236372449653, "loss": 0.0131, "step": 456450 }, { "epoch": 1.18, "learning_rate": 0.00012251847550812507, "loss": 0.0112, "step": 456460 }, { "epoch": 1.18, "learning_rate": 0.0001225145872917536, "loss": 0.0099, "step": 456470 }, { "epoch": 1.18, "learning_rate": 0.00012251069907538213, "loss": 0.0145, "step": 456480 }, { "epoch": 1.18, "learning_rate": 0.00012250681085901067, "loss": 0.0117, "step": 456490 }, { "epoch": 1.18, "learning_rate": 0.0001225029226426392, "loss": 0.0111, "step": 456500 }, { "epoch": 1.18, "learning_rate": 0.00012249903442626775, "loss": 0.011, "step": 456510 }, { "epoch": 1.18, "learning_rate": 0.00012249514620989627, "loss": 0.0151, "step": 456520 }, { "epoch": 1.18, "learning_rate": 0.0001224912579935248, "loss": 0.0102, "step": 456530 }, { "epoch": 1.18, "learning_rate": 0.00012248736977715335, "loss": 0.0138, "step": 456540 }, { "epoch": 1.18, "learning_rate": 0.00012248348156078186, "loss": 0.0093, "step": 456550 }, { "epoch": 1.18, "learning_rate": 0.00012247959334441043, "loss": 0.0102, "step": 456560 }, { "epoch": 1.18, "learning_rate": 0.00012247570512803895, "loss": 0.0145, "step": 456570 }, { "epoch": 1.18, "learning_rate": 0.0001224718169116675, "loss": 0.0119, "step": 456580 }, { "epoch": 1.18, "learning_rate": 0.00012246792869529603, "loss": 0.01, "step": 456590 }, { "epoch": 1.18, "learning_rate": 0.00012246404047892457, "loss": 0.0109, "step": 456600 }, { "epoch": 1.18, "learning_rate": 0.0001224601522625531, "loss": 0.0112, "step": 456610 }, { "epoch": 1.18, "learning_rate": 0.00012245626404618163, "loss": 0.0106, "step": 456620 }, { "epoch": 1.18, "learning_rate": 0.00012245237582981017, "loss": 0.0111, "step": 456630 }, { "epoch": 1.18, "learning_rate": 0.0001224484876134387, "loss": 0.0129, "step": 456640 }, { "epoch": 1.18, "learning_rate": 0.00012244459939706723, "loss": 0.0095, "step": 456650 }, { "epoch": 1.18, "learning_rate": 0.00012244071118069577, "loss": 0.0141, "step": 456660 }, { "epoch": 1.18, "learning_rate": 0.0001224368229643243, "loss": 0.0084, "step": 456670 }, { "epoch": 1.18, "learning_rate": 0.00012243293474795285, "loss": 0.0101, "step": 456680 }, { "epoch": 1.18, "learning_rate": 0.00012242904653158137, "loss": 0.0108, "step": 456690 }, { "epoch": 1.18, "learning_rate": 0.0001224251583152099, "loss": 0.011, "step": 456700 }, { "epoch": 1.18, "learning_rate": 0.00012242127009883845, "loss": 0.0122, "step": 456710 }, { "epoch": 1.18, "learning_rate": 0.000122417381882467, "loss": 0.0172, "step": 456720 }, { "epoch": 1.18, "learning_rate": 0.0001224134936660955, "loss": 0.0114, "step": 456730 }, { "epoch": 1.18, "learning_rate": 0.00012240960544972407, "loss": 0.01, "step": 456740 }, { "epoch": 1.18, "learning_rate": 0.0001224057172333526, "loss": 0.0099, "step": 456750 }, { "epoch": 1.18, "learning_rate": 0.00012240182901698113, "loss": 0.0107, "step": 456760 }, { "epoch": 1.18, "learning_rate": 0.00012239794080060967, "loss": 0.0118, "step": 456770 }, { "epoch": 1.18, "learning_rate": 0.0001223940525842382, "loss": 0.01, "step": 456780 }, { "epoch": 1.18, "learning_rate": 0.00012239016436786673, "loss": 0.0093, "step": 456790 }, { "epoch": 1.18, "learning_rate": 0.00012238627615149527, "loss": 0.0111, "step": 456800 }, { "epoch": 1.18, "learning_rate": 0.0001223823879351238, "loss": 0.0095, "step": 456810 }, { "epoch": 1.18, "learning_rate": 0.00012237849971875233, "loss": 0.0143, "step": 456820 }, { "epoch": 1.18, "learning_rate": 0.00012237461150238087, "loss": 0.0128, "step": 456830 }, { "epoch": 1.18, "learning_rate": 0.0001223707232860094, "loss": 0.0129, "step": 456840 }, { "epoch": 1.18, "learning_rate": 0.00012236683506963795, "loss": 0.0087, "step": 456850 }, { "epoch": 1.18, "learning_rate": 0.00012236294685326647, "loss": 0.0138, "step": 456860 }, { "epoch": 1.18, "learning_rate": 0.000122359058636895, "loss": 0.0134, "step": 456870 }, { "epoch": 1.18, "learning_rate": 0.00012235517042052355, "loss": 0.0131, "step": 456880 }, { "epoch": 1.18, "learning_rate": 0.0001223512822041521, "loss": 0.012, "step": 456890 }, { "epoch": 1.18, "learning_rate": 0.0001223473939877806, "loss": 0.0156, "step": 456900 }, { "epoch": 1.18, "learning_rate": 0.00012234350577140917, "loss": 0.0062, "step": 456910 }, { "epoch": 1.18, "learning_rate": 0.0001223396175550377, "loss": 0.0093, "step": 456920 }, { "epoch": 1.18, "learning_rate": 0.00012233572933866623, "loss": 0.0104, "step": 456930 }, { "epoch": 1.18, "learning_rate": 0.00012233184112229477, "loss": 0.0111, "step": 456940 }, { "epoch": 1.18, "learning_rate": 0.0001223279529059233, "loss": 0.013, "step": 456950 }, { "epoch": 1.18, "learning_rate": 0.00012232406468955183, "loss": 0.0155, "step": 456960 }, { "epoch": 1.18, "learning_rate": 0.00012232017647318037, "loss": 0.0117, "step": 456970 }, { "epoch": 1.18, "learning_rate": 0.0001223162882568089, "loss": 0.0081, "step": 456980 }, { "epoch": 1.18, "learning_rate": 0.00012231240004043745, "loss": 0.0083, "step": 456990 }, { "epoch": 1.18, "learning_rate": 0.00012230851182406597, "loss": 0.0129, "step": 457000 }, { "epoch": 1.18, "eval_cer": 0.8816970877754311, "eval_loss": 0.0070222471840679646, "eval_runtime": 107.5432, "eval_samples_per_second": 18.597, "eval_steps_per_second": 4.649, "step": 457000 }, { "epoch": 1.18, "learning_rate": 0.0001223046236076945, "loss": 0.0156, "step": 457010 }, { "epoch": 1.18, "learning_rate": 0.00012230073539132305, "loss": 0.0108, "step": 457020 }, { "epoch": 1.18, "learning_rate": 0.00012229684717495156, "loss": 0.0125, "step": 457030 }, { "epoch": 1.18, "learning_rate": 0.0001222929589585801, "loss": 0.0118, "step": 457040 }, { "epoch": 1.18, "learning_rate": 0.00012228907074220865, "loss": 0.0109, "step": 457050 }, { "epoch": 1.18, "learning_rate": 0.0001222851825258372, "loss": 0.0089, "step": 457060 }, { "epoch": 1.18, "learning_rate": 0.0001222812943094657, "loss": 0.013, "step": 457070 }, { "epoch": 1.18, "learning_rate": 0.00012227740609309427, "loss": 0.0111, "step": 457080 }, { "epoch": 1.18, "learning_rate": 0.0001222735178767228, "loss": 0.0111, "step": 457090 }, { "epoch": 1.18, "learning_rate": 0.00012226962966035133, "loss": 0.0162, "step": 457100 }, { "epoch": 1.18, "learning_rate": 0.00012226574144397987, "loss": 0.0162, "step": 457110 }, { "epoch": 1.18, "learning_rate": 0.0001222618532276084, "loss": 0.0088, "step": 457120 }, { "epoch": 1.18, "learning_rate": 0.00012225796501123693, "loss": 0.0096, "step": 457130 }, { "epoch": 1.18, "learning_rate": 0.00012225407679486547, "loss": 0.01, "step": 457140 }, { "epoch": 1.18, "learning_rate": 0.000122250188578494, "loss": 0.0115, "step": 457150 }, { "epoch": 1.19, "learning_rate": 0.00012224630036212255, "loss": 0.006, "step": 457160 }, { "epoch": 1.19, "learning_rate": 0.00012224241214575107, "loss": 0.0103, "step": 457170 }, { "epoch": 1.19, "learning_rate": 0.0001222385239293796, "loss": 0.0125, "step": 457180 }, { "epoch": 1.19, "learning_rate": 0.00012223463571300815, "loss": 0.0097, "step": 457190 }, { "epoch": 1.19, "learning_rate": 0.0001222307474966367, "loss": 0.0149, "step": 457200 }, { "epoch": 1.19, "learning_rate": 0.0001222268592802652, "loss": 0.0129, "step": 457210 }, { "epoch": 1.19, "learning_rate": 0.00012222297106389375, "loss": 0.0121, "step": 457220 }, { "epoch": 1.19, "learning_rate": 0.0001222190828475223, "loss": 0.0099, "step": 457230 }, { "epoch": 1.19, "learning_rate": 0.00012221519463115083, "loss": 0.0134, "step": 457240 }, { "epoch": 1.19, "learning_rate": 0.00012221130641477935, "loss": 0.0135, "step": 457250 }, { "epoch": 1.19, "learning_rate": 0.00012220741819840791, "loss": 0.0111, "step": 457260 }, { "epoch": 1.19, "learning_rate": 0.00012220352998203643, "loss": 0.0104, "step": 457270 }, { "epoch": 1.19, "learning_rate": 0.00012219964176566497, "loss": 0.0103, "step": 457280 }, { "epoch": 1.19, "learning_rate": 0.0001221957535492935, "loss": 0.0112, "step": 457290 }, { "epoch": 1.19, "learning_rate": 0.00012219186533292203, "loss": 0.0094, "step": 457300 }, { "epoch": 1.19, "learning_rate": 0.00012218797711655057, "loss": 0.009, "step": 457310 }, { "epoch": 1.19, "learning_rate": 0.0001221840889001791, "loss": 0.01, "step": 457320 }, { "epoch": 1.19, "learning_rate": 0.00012218020068380765, "loss": 0.0093, "step": 457330 }, { "epoch": 1.19, "learning_rate": 0.00012217631246743617, "loss": 0.0089, "step": 457340 }, { "epoch": 1.19, "learning_rate": 0.0001221724242510647, "loss": 0.0115, "step": 457350 }, { "epoch": 1.19, "learning_rate": 0.00012216853603469325, "loss": 0.0126, "step": 457360 }, { "epoch": 1.19, "learning_rate": 0.0001221646478183218, "loss": 0.0129, "step": 457370 }, { "epoch": 1.19, "learning_rate": 0.0001221607596019503, "loss": 0.017, "step": 457380 }, { "epoch": 1.19, "learning_rate": 0.00012215687138557885, "loss": 0.0132, "step": 457390 }, { "epoch": 1.19, "learning_rate": 0.0001221529831692074, "loss": 0.0096, "step": 457400 }, { "epoch": 1.19, "learning_rate": 0.00012214909495283593, "loss": 0.0106, "step": 457410 }, { "epoch": 1.19, "learning_rate": 0.00012214520673646444, "loss": 0.0097, "step": 457420 }, { "epoch": 1.19, "learning_rate": 0.00012214131852009301, "loss": 0.0121, "step": 457430 }, { "epoch": 1.19, "learning_rate": 0.00012213743030372153, "loss": 0.0107, "step": 457440 }, { "epoch": 1.19, "learning_rate": 0.00012213354208735007, "loss": 0.0097, "step": 457450 }, { "epoch": 1.19, "learning_rate": 0.0001221296538709786, "loss": 0.0125, "step": 457460 }, { "epoch": 1.19, "learning_rate": 0.00012212576565460715, "loss": 0.0137, "step": 457470 }, { "epoch": 1.19, "learning_rate": 0.00012212187743823567, "loss": 0.008, "step": 457480 }, { "epoch": 1.19, "learning_rate": 0.0001221179892218642, "loss": 0.0118, "step": 457490 }, { "epoch": 1.19, "learning_rate": 0.00012211410100549275, "loss": 0.0144, "step": 457500 }, { "epoch": 1.19, "learning_rate": 0.00012211021278912127, "loss": 0.0144, "step": 457510 }, { "epoch": 1.19, "learning_rate": 0.0001221063245727498, "loss": 0.0099, "step": 457520 }, { "epoch": 1.19, "learning_rate": 0.00012210243635637835, "loss": 0.0117, "step": 457530 }, { "epoch": 1.19, "learning_rate": 0.0001220985481400069, "loss": 0.0088, "step": 457540 }, { "epoch": 1.19, "learning_rate": 0.0001220946599236354, "loss": 0.0096, "step": 457550 }, { "epoch": 1.19, "learning_rate": 0.00012209077170726395, "loss": 0.0114, "step": 457560 }, { "epoch": 1.19, "learning_rate": 0.0001220868834908925, "loss": 0.0092, "step": 457570 }, { "epoch": 1.19, "learning_rate": 0.00012208299527452103, "loss": 0.0107, "step": 457580 }, { "epoch": 1.19, "learning_rate": 0.00012207910705814954, "loss": 0.0128, "step": 457590 }, { "epoch": 1.19, "learning_rate": 0.0001220752188417781, "loss": 0.012, "step": 457600 }, { "epoch": 1.19, "learning_rate": 0.00012207133062540663, "loss": 0.0146, "step": 457610 }, { "epoch": 1.19, "learning_rate": 0.00012206744240903517, "loss": 0.0147, "step": 457620 }, { "epoch": 1.19, "learning_rate": 0.0001220635541926637, "loss": 0.0121, "step": 457630 }, { "epoch": 1.19, "learning_rate": 0.00012205966597629224, "loss": 0.0138, "step": 457640 }, { "epoch": 1.19, "learning_rate": 0.00012205577775992077, "loss": 0.0119, "step": 457650 }, { "epoch": 1.19, "learning_rate": 0.00012205188954354931, "loss": 0.0133, "step": 457660 }, { "epoch": 1.19, "learning_rate": 0.00012204800132717784, "loss": 0.01, "step": 457670 }, { "epoch": 1.19, "learning_rate": 0.00012204411311080639, "loss": 0.0112, "step": 457680 }, { "epoch": 1.19, "learning_rate": 0.0001220402248944349, "loss": 0.0103, "step": 457690 }, { "epoch": 1.19, "learning_rate": 0.00012203633667806346, "loss": 0.0112, "step": 457700 }, { "epoch": 1.19, "learning_rate": 0.00012203244846169199, "loss": 0.013, "step": 457710 }, { "epoch": 1.19, "learning_rate": 0.00012202856024532053, "loss": 0.0129, "step": 457720 }, { "epoch": 1.19, "learning_rate": 0.00012202467202894906, "loss": 0.0146, "step": 457730 }, { "epoch": 1.19, "learning_rate": 0.0001220207838125776, "loss": 0.012, "step": 457740 }, { "epoch": 1.19, "learning_rate": 0.00012201689559620613, "loss": 0.0095, "step": 457750 }, { "epoch": 1.19, "learning_rate": 0.00012201300737983466, "loss": 0.0114, "step": 457760 }, { "epoch": 1.19, "learning_rate": 0.0001220091191634632, "loss": 0.0119, "step": 457770 }, { "epoch": 1.19, "learning_rate": 0.00012200523094709173, "loss": 0.0098, "step": 457780 }, { "epoch": 1.19, "learning_rate": 0.00012200134273072027, "loss": 0.0116, "step": 457790 }, { "epoch": 1.19, "learning_rate": 0.0001219974545143488, "loss": 0.0115, "step": 457800 }, { "epoch": 1.19, "learning_rate": 0.00012199356629797734, "loss": 0.0101, "step": 457810 }, { "epoch": 1.19, "learning_rate": 0.00012198967808160587, "loss": 0.0085, "step": 457820 }, { "epoch": 1.19, "learning_rate": 0.00012198578986523441, "loss": 0.0096, "step": 457830 }, { "epoch": 1.19, "learning_rate": 0.00012198190164886294, "loss": 0.0154, "step": 457840 }, { "epoch": 1.19, "learning_rate": 0.00012197801343249148, "loss": 0.0128, "step": 457850 }, { "epoch": 1.19, "learning_rate": 0.00012197412521612, "loss": 0.0084, "step": 457860 }, { "epoch": 1.19, "learning_rate": 0.00012197023699974856, "loss": 0.0137, "step": 457870 }, { "epoch": 1.19, "learning_rate": 0.00012196634878337709, "loss": 0.0101, "step": 457880 }, { "epoch": 1.19, "learning_rate": 0.00012196246056700563, "loss": 0.0104, "step": 457890 }, { "epoch": 1.19, "learning_rate": 0.00012195857235063416, "loss": 0.0143, "step": 457900 }, { "epoch": 1.19, "learning_rate": 0.0001219546841342627, "loss": 0.0153, "step": 457910 }, { "epoch": 1.19, "learning_rate": 0.00012195079591789123, "loss": 0.0138, "step": 457920 }, { "epoch": 1.19, "learning_rate": 0.00012194690770151977, "loss": 0.0153, "step": 457930 }, { "epoch": 1.19, "learning_rate": 0.0001219430194851483, "loss": 0.0158, "step": 457940 }, { "epoch": 1.19, "learning_rate": 0.00012193913126877684, "loss": 0.0099, "step": 457950 }, { "epoch": 1.19, "learning_rate": 0.00012193524305240537, "loss": 0.0174, "step": 457960 }, { "epoch": 1.19, "learning_rate": 0.00012193135483603391, "loss": 0.0113, "step": 457970 }, { "epoch": 1.19, "learning_rate": 0.00012192746661966244, "loss": 0.0107, "step": 457980 }, { "epoch": 1.19, "learning_rate": 0.00012192357840329098, "loss": 0.0105, "step": 457990 }, { "epoch": 1.19, "learning_rate": 0.00012191969018691951, "loss": 0.0124, "step": 458000 }, { "epoch": 1.19, "eval_cer": 0.8817250805141147, "eval_loss": 0.007128569763153791, "eval_runtime": 107.4871, "eval_samples_per_second": 18.607, "eval_steps_per_second": 4.652, "step": 458000 }, { "epoch": 1.19, "learning_rate": 0.00012191580197054804, "loss": 0.0095, "step": 458010 }, { "epoch": 1.19, "learning_rate": 0.00012191191375417658, "loss": 0.0121, "step": 458020 }, { "epoch": 1.19, "learning_rate": 0.0001219080255378051, "loss": 0.0137, "step": 458030 }, { "epoch": 1.19, "learning_rate": 0.00012190413732143365, "loss": 0.015, "step": 458040 }, { "epoch": 1.19, "learning_rate": 0.00012190024910506218, "loss": 0.0168, "step": 458050 }, { "epoch": 1.19, "learning_rate": 0.00012189636088869073, "loss": 0.0097, "step": 458060 }, { "epoch": 1.19, "learning_rate": 0.00012189247267231926, "loss": 0.0115, "step": 458070 }, { "epoch": 1.19, "learning_rate": 0.0001218885844559478, "loss": 0.0093, "step": 458080 }, { "epoch": 1.19, "learning_rate": 0.00012188469623957633, "loss": 0.0121, "step": 458090 }, { "epoch": 1.19, "learning_rate": 0.00012188080802320487, "loss": 0.0127, "step": 458100 }, { "epoch": 1.19, "learning_rate": 0.0001218769198068334, "loss": 0.0121, "step": 458110 }, { "epoch": 1.19, "learning_rate": 0.00012187303159046194, "loss": 0.0086, "step": 458120 }, { "epoch": 1.19, "learning_rate": 0.00012186914337409047, "loss": 0.0106, "step": 458130 }, { "epoch": 1.19, "learning_rate": 0.00012186525515771901, "loss": 0.01, "step": 458140 }, { "epoch": 1.19, "learning_rate": 0.00012186136694134754, "loss": 0.0113, "step": 458150 }, { "epoch": 1.19, "learning_rate": 0.00012185747872497608, "loss": 0.0151, "step": 458160 }, { "epoch": 1.19, "learning_rate": 0.00012185359050860461, "loss": 0.0116, "step": 458170 }, { "epoch": 1.19, "learning_rate": 0.00012184970229223315, "loss": 0.015, "step": 458180 }, { "epoch": 1.19, "learning_rate": 0.00012184581407586168, "loss": 0.0115, "step": 458190 }, { "epoch": 1.19, "learning_rate": 0.00012184192585949022, "loss": 0.0121, "step": 458200 }, { "epoch": 1.19, "learning_rate": 0.00012183803764311875, "loss": 0.0115, "step": 458210 }, { "epoch": 1.19, "learning_rate": 0.0001218341494267473, "loss": 0.0109, "step": 458220 }, { "epoch": 1.19, "learning_rate": 0.00012183026121037583, "loss": 0.0116, "step": 458230 }, { "epoch": 1.19, "learning_rate": 0.00012182637299400437, "loss": 0.0092, "step": 458240 }, { "epoch": 1.19, "learning_rate": 0.0001218224847776329, "loss": 0.015, "step": 458250 }, { "epoch": 1.19, "learning_rate": 0.00012181859656126143, "loss": 0.009, "step": 458260 }, { "epoch": 1.19, "learning_rate": 0.00012181470834488997, "loss": 0.0092, "step": 458270 }, { "epoch": 1.19, "learning_rate": 0.0001218108201285185, "loss": 0.0131, "step": 458280 }, { "epoch": 1.19, "learning_rate": 0.00012180693191214704, "loss": 0.0108, "step": 458290 }, { "epoch": 1.19, "learning_rate": 0.00012180304369577557, "loss": 0.01, "step": 458300 }, { "epoch": 1.19, "learning_rate": 0.00012179915547940411, "loss": 0.0135, "step": 458310 }, { "epoch": 1.19, "learning_rate": 0.00012179526726303264, "loss": 0.0133, "step": 458320 }, { "epoch": 1.19, "learning_rate": 0.00012179137904666118, "loss": 0.0135, "step": 458330 }, { "epoch": 1.19, "learning_rate": 0.0001217874908302897, "loss": 0.0089, "step": 458340 }, { "epoch": 1.19, "learning_rate": 0.00012178360261391825, "loss": 0.0113, "step": 458350 }, { "epoch": 1.19, "learning_rate": 0.00012177971439754678, "loss": 0.0138, "step": 458360 }, { "epoch": 1.19, "learning_rate": 0.00012177582618117532, "loss": 0.013, "step": 458370 }, { "epoch": 1.19, "learning_rate": 0.00012177193796480385, "loss": 0.0092, "step": 458380 }, { "epoch": 1.19, "learning_rate": 0.0001217680497484324, "loss": 0.0136, "step": 458390 }, { "epoch": 1.19, "learning_rate": 0.00012176416153206092, "loss": 0.0104, "step": 458400 }, { "epoch": 1.19, "learning_rate": 0.00012176027331568947, "loss": 0.0109, "step": 458410 }, { "epoch": 1.19, "learning_rate": 0.000121756385099318, "loss": 0.0102, "step": 458420 }, { "epoch": 1.19, "learning_rate": 0.00012175249688294654, "loss": 0.0149, "step": 458430 }, { "epoch": 1.19, "learning_rate": 0.00012174860866657507, "loss": 0.0109, "step": 458440 }, { "epoch": 1.19, "learning_rate": 0.00012174472045020361, "loss": 0.0085, "step": 458450 }, { "epoch": 1.19, "learning_rate": 0.00012174083223383214, "loss": 0.0116, "step": 458460 }, { "epoch": 1.19, "learning_rate": 0.00012173694401746068, "loss": 0.0125, "step": 458470 }, { "epoch": 1.19, "learning_rate": 0.00012173305580108921, "loss": 0.0111, "step": 458480 }, { "epoch": 1.19, "learning_rate": 0.00012172916758471775, "loss": 0.0106, "step": 458490 }, { "epoch": 1.19, "learning_rate": 0.00012172527936834628, "loss": 0.0111, "step": 458500 }, { "epoch": 1.19, "learning_rate": 0.0001217213911519748, "loss": 0.0095, "step": 458510 }, { "epoch": 1.19, "learning_rate": 0.00012171750293560335, "loss": 0.0107, "step": 458520 }, { "epoch": 1.19, "learning_rate": 0.00012171361471923188, "loss": 0.0115, "step": 458530 }, { "epoch": 1.19, "learning_rate": 0.00012170972650286042, "loss": 0.0088, "step": 458540 }, { "epoch": 1.19, "learning_rate": 0.00012170583828648895, "loss": 0.0128, "step": 458550 }, { "epoch": 1.19, "learning_rate": 0.00012170195007011749, "loss": 0.014, "step": 458560 }, { "epoch": 1.19, "learning_rate": 0.00012169806185374601, "loss": 0.0138, "step": 458570 }, { "epoch": 1.19, "learning_rate": 0.00012169417363737457, "loss": 0.0085, "step": 458580 }, { "epoch": 1.19, "learning_rate": 0.0001216902854210031, "loss": 0.013, "step": 458590 }, { "epoch": 1.19, "learning_rate": 0.00012168639720463164, "loss": 0.0422, "step": 458600 }, { "epoch": 1.19, "learning_rate": 0.00012168250898826017, "loss": 0.0098, "step": 458610 }, { "epoch": 1.19, "learning_rate": 0.00012167862077188871, "loss": 0.0097, "step": 458620 }, { "epoch": 1.19, "learning_rate": 0.00012167473255551724, "loss": 0.0117, "step": 458630 }, { "epoch": 1.19, "learning_rate": 0.00012167084433914578, "loss": 0.0102, "step": 458640 }, { "epoch": 1.19, "learning_rate": 0.00012166695612277431, "loss": 0.0118, "step": 458650 }, { "epoch": 1.19, "learning_rate": 0.00012166306790640285, "loss": 0.0116, "step": 458660 }, { "epoch": 1.19, "learning_rate": 0.00012165917969003138, "loss": 0.0136, "step": 458670 }, { "epoch": 1.19, "learning_rate": 0.00012165529147365992, "loss": 0.0113, "step": 458680 }, { "epoch": 1.19, "learning_rate": 0.00012165140325728845, "loss": 0.0122, "step": 458690 }, { "epoch": 1.19, "learning_rate": 0.00012164751504091699, "loss": 0.0098, "step": 458700 }, { "epoch": 1.19, "learning_rate": 0.00012164362682454552, "loss": 0.0094, "step": 458710 }, { "epoch": 1.19, "learning_rate": 0.00012163973860817406, "loss": 0.0113, "step": 458720 }, { "epoch": 1.19, "learning_rate": 0.00012163585039180259, "loss": 0.0103, "step": 458730 }, { "epoch": 1.19, "learning_rate": 0.00012163196217543114, "loss": 0.015, "step": 458740 }, { "epoch": 1.19, "learning_rate": 0.00012162807395905967, "loss": 0.0092, "step": 458750 }, { "epoch": 1.19, "learning_rate": 0.00012162418574268818, "loss": 0.0103, "step": 458760 }, { "epoch": 1.19, "learning_rate": 0.00012162029752631674, "loss": 0.0105, "step": 458770 }, { "epoch": 1.19, "learning_rate": 0.00012161640930994527, "loss": 0.0106, "step": 458780 }, { "epoch": 1.19, "learning_rate": 0.00012161252109357381, "loss": 0.0131, "step": 458790 }, { "epoch": 1.19, "learning_rate": 0.00012160863287720234, "loss": 0.0194, "step": 458800 }, { "epoch": 1.19, "learning_rate": 0.00012160474466083088, "loss": 0.0102, "step": 458810 }, { "epoch": 1.19, "learning_rate": 0.00012160085644445941, "loss": 0.0144, "step": 458820 }, { "epoch": 1.19, "learning_rate": 0.00012159696822808795, "loss": 0.0109, "step": 458830 }, { "epoch": 1.19, "learning_rate": 0.00012159308001171648, "loss": 0.0103, "step": 458840 }, { "epoch": 1.19, "learning_rate": 0.00012158919179534502, "loss": 0.0133, "step": 458850 }, { "epoch": 1.19, "learning_rate": 0.00012158530357897355, "loss": 0.013, "step": 458860 }, { "epoch": 1.19, "learning_rate": 0.00012158141536260209, "loss": 0.0116, "step": 458870 }, { "epoch": 1.19, "learning_rate": 0.00012157752714623062, "loss": 0.0107, "step": 458880 }, { "epoch": 1.19, "learning_rate": 0.00012157363892985916, "loss": 0.0109, "step": 458890 }, { "epoch": 1.19, "learning_rate": 0.00012156975071348769, "loss": 0.0122, "step": 458900 }, { "epoch": 1.19, "learning_rate": 0.00012156586249711624, "loss": 0.0098, "step": 458910 }, { "epoch": 1.19, "learning_rate": 0.00012156197428074476, "loss": 0.0106, "step": 458920 }, { "epoch": 1.19, "learning_rate": 0.00012155808606437331, "loss": 0.0077, "step": 458930 }, { "epoch": 1.19, "learning_rate": 0.00012155419784800184, "loss": 0.014, "step": 458940 }, { "epoch": 1.19, "learning_rate": 0.00012155030963163038, "loss": 0.0106, "step": 458950 }, { "epoch": 1.19, "learning_rate": 0.00012154642141525891, "loss": 0.011, "step": 458960 }, { "epoch": 1.19, "learning_rate": 0.00012154253319888745, "loss": 0.0126, "step": 458970 }, { "epoch": 1.19, "learning_rate": 0.00012153864498251598, "loss": 0.008, "step": 458980 }, { "epoch": 1.19, "learning_rate": 0.00012153475676614452, "loss": 0.0212, "step": 458990 }, { "epoch": 1.19, "learning_rate": 0.00012153086854977305, "loss": 0.0102, "step": 459000 }, { "epoch": 1.19, "eval_cer": 0.8816914892276944, "eval_loss": 0.007249526679515839, "eval_runtime": 107.419, "eval_samples_per_second": 18.619, "eval_steps_per_second": 4.655, "step": 459000 }, { "epoch": 1.19, "learning_rate": 0.00012152698033340158, "loss": 0.0112, "step": 459010 }, { "epoch": 1.19, "learning_rate": 0.00012152309211703012, "loss": 0.0101, "step": 459020 }, { "epoch": 1.19, "learning_rate": 0.00012151920390065865, "loss": 0.0127, "step": 459030 }, { "epoch": 1.19, "learning_rate": 0.00012151531568428719, "loss": 0.0084, "step": 459040 }, { "epoch": 1.19, "learning_rate": 0.00012151142746791572, "loss": 0.008, "step": 459050 }, { "epoch": 1.19, "learning_rate": 0.00012150753925154426, "loss": 0.0135, "step": 459060 }, { "epoch": 1.19, "learning_rate": 0.00012150365103517279, "loss": 0.0093, "step": 459070 }, { "epoch": 1.19, "learning_rate": 0.00012149976281880133, "loss": 0.0111, "step": 459080 }, { "epoch": 1.19, "learning_rate": 0.00012149587460242985, "loss": 0.0098, "step": 459090 }, { "epoch": 1.19, "learning_rate": 0.00012149198638605841, "loss": 0.0132, "step": 459100 }, { "epoch": 1.19, "learning_rate": 0.00012148809816968694, "loss": 0.0111, "step": 459110 }, { "epoch": 1.19, "learning_rate": 0.00012148420995331548, "loss": 0.0113, "step": 459120 }, { "epoch": 1.19, "learning_rate": 0.00012148032173694401, "loss": 0.0137, "step": 459130 }, { "epoch": 1.19, "learning_rate": 0.00012147643352057255, "loss": 0.0109, "step": 459140 }, { "epoch": 1.19, "learning_rate": 0.00012147254530420108, "loss": 0.0098, "step": 459150 }, { "epoch": 1.19, "learning_rate": 0.00012146865708782962, "loss": 0.0119, "step": 459160 }, { "epoch": 1.19, "learning_rate": 0.00012146476887145815, "loss": 0.0107, "step": 459170 }, { "epoch": 1.19, "learning_rate": 0.00012146088065508669, "loss": 0.0065, "step": 459180 }, { "epoch": 1.19, "learning_rate": 0.00012145699243871522, "loss": 0.0106, "step": 459190 }, { "epoch": 1.19, "learning_rate": 0.00012145310422234376, "loss": 0.0083, "step": 459200 }, { "epoch": 1.19, "learning_rate": 0.00012144921600597229, "loss": 0.0105, "step": 459210 }, { "epoch": 1.19, "learning_rate": 0.00012144532778960083, "loss": 0.0097, "step": 459220 }, { "epoch": 1.19, "learning_rate": 0.00012144143957322936, "loss": 0.0083, "step": 459230 }, { "epoch": 1.19, "learning_rate": 0.0001214375513568579, "loss": 0.0088, "step": 459240 }, { "epoch": 1.19, "learning_rate": 0.00012143366314048643, "loss": 0.0109, "step": 459250 }, { "epoch": 1.19, "learning_rate": 0.00012142977492411495, "loss": 0.01, "step": 459260 }, { "epoch": 1.19, "learning_rate": 0.00012142588670774351, "loss": 0.0104, "step": 459270 }, { "epoch": 1.19, "learning_rate": 0.00012142199849137202, "loss": 0.0099, "step": 459280 }, { "epoch": 1.19, "learning_rate": 0.00012141811027500058, "loss": 0.0094, "step": 459290 }, { "epoch": 1.19, "learning_rate": 0.00012141422205862911, "loss": 0.0121, "step": 459300 }, { "epoch": 1.19, "learning_rate": 0.00012141033384225765, "loss": 0.0105, "step": 459310 }, { "epoch": 1.19, "learning_rate": 0.00012140644562588618, "loss": 0.0094, "step": 459320 }, { "epoch": 1.19, "learning_rate": 0.00012140255740951472, "loss": 0.0098, "step": 459330 }, { "epoch": 1.19, "learning_rate": 0.00012139866919314325, "loss": 0.0151, "step": 459340 }, { "epoch": 1.19, "learning_rate": 0.00012139478097677179, "loss": 0.0109, "step": 459350 }, { "epoch": 1.19, "learning_rate": 0.00012139089276040032, "loss": 0.0101, "step": 459360 }, { "epoch": 1.19, "learning_rate": 0.00012138700454402886, "loss": 0.0123, "step": 459370 }, { "epoch": 1.19, "learning_rate": 0.00012138311632765739, "loss": 0.0099, "step": 459380 }, { "epoch": 1.19, "learning_rate": 0.00012137922811128593, "loss": 0.0098, "step": 459390 }, { "epoch": 1.19, "learning_rate": 0.00012137533989491446, "loss": 0.0081, "step": 459400 }, { "epoch": 1.19, "learning_rate": 0.000121371451678543, "loss": 0.0147, "step": 459410 }, { "epoch": 1.19, "learning_rate": 0.00012136756346217153, "loss": 0.0095, "step": 459420 }, { "epoch": 1.19, "learning_rate": 0.00012136367524580007, "loss": 0.0138, "step": 459430 }, { "epoch": 1.19, "learning_rate": 0.0001213597870294286, "loss": 0.0122, "step": 459440 }, { "epoch": 1.19, "learning_rate": 0.00012135589881305715, "loss": 0.0096, "step": 459450 }, { "epoch": 1.19, "learning_rate": 0.00012135201059668568, "loss": 0.0145, "step": 459460 }, { "epoch": 1.19, "learning_rate": 0.00012134812238031422, "loss": 0.0125, "step": 459470 }, { "epoch": 1.19, "learning_rate": 0.00012134423416394275, "loss": 0.01, "step": 459480 }, { "epoch": 1.19, "learning_rate": 0.00012134034594757129, "loss": 0.0111, "step": 459490 }, { "epoch": 1.19, "learning_rate": 0.00012133645773119982, "loss": 0.0101, "step": 459500 }, { "epoch": 1.19, "learning_rate": 0.00012133256951482835, "loss": 0.0087, "step": 459510 }, { "epoch": 1.19, "learning_rate": 0.00012132868129845689, "loss": 0.0079, "step": 459520 }, { "epoch": 1.19, "learning_rate": 0.00012132479308208542, "loss": 0.0115, "step": 459530 }, { "epoch": 1.19, "learning_rate": 0.00012132090486571396, "loss": 0.0118, "step": 459540 }, { "epoch": 1.19, "learning_rate": 0.00012131701664934249, "loss": 0.0097, "step": 459550 }, { "epoch": 1.19, "learning_rate": 0.00012131312843297103, "loss": 0.011, "step": 459560 }, { "epoch": 1.19, "learning_rate": 0.00012130924021659956, "loss": 0.0104, "step": 459570 }, { "epoch": 1.19, "learning_rate": 0.0001213053520002281, "loss": 0.011, "step": 459580 }, { "epoch": 1.19, "learning_rate": 0.00012130146378385663, "loss": 0.0102, "step": 459590 }, { "epoch": 1.19, "learning_rate": 0.00012129757556748517, "loss": 0.009, "step": 459600 }, { "epoch": 1.19, "learning_rate": 0.0001212936873511137, "loss": 0.0102, "step": 459610 }, { "epoch": 1.19, "learning_rate": 0.00012128979913474225, "loss": 0.0109, "step": 459620 }, { "epoch": 1.19, "learning_rate": 0.00012128591091837076, "loss": 0.01, "step": 459630 }, { "epoch": 1.19, "learning_rate": 0.00012128202270199932, "loss": 0.0101, "step": 459640 }, { "epoch": 1.19, "learning_rate": 0.00012127813448562785, "loss": 0.0126, "step": 459650 }, { "epoch": 1.19, "learning_rate": 0.00012127424626925639, "loss": 0.0136, "step": 459660 }, { "epoch": 1.19, "learning_rate": 0.00012127035805288492, "loss": 0.0131, "step": 459670 }, { "epoch": 1.19, "learning_rate": 0.00012126646983651346, "loss": 0.0109, "step": 459680 }, { "epoch": 1.19, "learning_rate": 0.00012126258162014199, "loss": 0.0097, "step": 459690 }, { "epoch": 1.19, "learning_rate": 0.00012125869340377053, "loss": 0.014, "step": 459700 }, { "epoch": 1.19, "learning_rate": 0.00012125480518739906, "loss": 0.0123, "step": 459710 }, { "epoch": 1.19, "learning_rate": 0.0001212509169710276, "loss": 0.0098, "step": 459720 }, { "epoch": 1.19, "learning_rate": 0.00012124702875465613, "loss": 0.0112, "step": 459730 }, { "epoch": 1.19, "learning_rate": 0.00012124314053828467, "loss": 0.0105, "step": 459740 }, { "epoch": 1.19, "learning_rate": 0.0001212392523219132, "loss": 0.0122, "step": 459750 }, { "epoch": 1.19, "learning_rate": 0.00012123536410554172, "loss": 0.0088, "step": 459760 }, { "epoch": 1.19, "learning_rate": 0.00012123147588917027, "loss": 0.01, "step": 459770 }, { "epoch": 1.19, "learning_rate": 0.0001212275876727988, "loss": 0.0096, "step": 459780 }, { "epoch": 1.19, "learning_rate": 0.00012122369945642734, "loss": 0.01, "step": 459790 }, { "epoch": 1.19, "learning_rate": 0.00012121981124005586, "loss": 0.0093, "step": 459800 }, { "epoch": 1.19, "learning_rate": 0.00012121592302368442, "loss": 0.0122, "step": 459810 }, { "epoch": 1.19, "learning_rate": 0.00012121203480731295, "loss": 0.0118, "step": 459820 }, { "epoch": 1.19, "learning_rate": 0.00012120814659094149, "loss": 0.0092, "step": 459830 }, { "epoch": 1.19, "learning_rate": 0.00012120425837457002, "loss": 0.008, "step": 459840 }, { "epoch": 1.19, "learning_rate": 0.00012120037015819856, "loss": 0.0093, "step": 459850 }, { "epoch": 1.19, "learning_rate": 0.00012119648194182709, "loss": 0.0102, "step": 459860 }, { "epoch": 1.19, "learning_rate": 0.00012119259372545563, "loss": 0.0117, "step": 459870 }, { "epoch": 1.19, "learning_rate": 0.00012118870550908416, "loss": 0.0136, "step": 459880 }, { "epoch": 1.19, "learning_rate": 0.0001211848172927127, "loss": 0.0093, "step": 459890 }, { "epoch": 1.19, "learning_rate": 0.00012118092907634123, "loss": 0.0111, "step": 459900 }, { "epoch": 1.19, "learning_rate": 0.00012117704085996977, "loss": 0.0108, "step": 459910 }, { "epoch": 1.19, "learning_rate": 0.0001211731526435983, "loss": 0.0122, "step": 459920 }, { "epoch": 1.19, "learning_rate": 0.00012116926442722684, "loss": 0.01, "step": 459930 }, { "epoch": 1.19, "learning_rate": 0.00012116537621085537, "loss": 0.0096, "step": 459940 }, { "epoch": 1.19, "learning_rate": 0.00012116148799448391, "loss": 0.0108, "step": 459950 }, { "epoch": 1.19, "learning_rate": 0.00012115759977811244, "loss": 0.0103, "step": 459960 }, { "epoch": 1.19, "learning_rate": 0.00012115371156174099, "loss": 0.0125, "step": 459970 }, { "epoch": 1.19, "learning_rate": 0.00012114982334536952, "loss": 0.0104, "step": 459980 }, { "epoch": 1.19, "learning_rate": 0.00012114593512899803, "loss": 0.0105, "step": 459990 }, { "epoch": 1.19, "learning_rate": 0.00012114204691262659, "loss": 0.0159, "step": 460000 }, { "epoch": 1.19, "eval_cer": 0.8816718943106159, "eval_loss": 0.007131533697247505, "eval_runtime": 107.4528, "eval_samples_per_second": 18.613, "eval_steps_per_second": 4.653, "step": 460000 }, { "epoch": 1.19, "learning_rate": 0.00012113815869625512, "loss": 0.0106, "step": 460010 }, { "epoch": 1.19, "learning_rate": 0.00012113427047988366, "loss": 0.0105, "step": 460020 }, { "epoch": 1.19, "learning_rate": 0.00012113038226351219, "loss": 0.01, "step": 460030 }, { "epoch": 1.19, "learning_rate": 0.00012112649404714073, "loss": 0.0081, "step": 460040 }, { "epoch": 1.19, "learning_rate": 0.00012112260583076926, "loss": 0.0114, "step": 460050 }, { "epoch": 1.19, "learning_rate": 0.0001211187176143978, "loss": 0.0109, "step": 460060 }, { "epoch": 1.19, "learning_rate": 0.00012111482939802633, "loss": 0.0132, "step": 460070 }, { "epoch": 1.19, "learning_rate": 0.00012111094118165487, "loss": 0.0097, "step": 460080 }, { "epoch": 1.19, "learning_rate": 0.0001211070529652834, "loss": 0.01, "step": 460090 }, { "epoch": 1.19, "learning_rate": 0.00012110316474891194, "loss": 0.0112, "step": 460100 }, { "epoch": 1.19, "learning_rate": 0.00012109927653254046, "loss": 0.0087, "step": 460110 }, { "epoch": 1.19, "learning_rate": 0.000121095388316169, "loss": 0.0103, "step": 460120 }, { "epoch": 1.19, "learning_rate": 0.00012109150009979753, "loss": 0.0178, "step": 460130 }, { "epoch": 1.19, "learning_rate": 0.00012108761188342609, "loss": 0.0128, "step": 460140 }, { "epoch": 1.19, "learning_rate": 0.0001210837236670546, "loss": 0.0132, "step": 460150 }, { "epoch": 1.19, "learning_rate": 0.00012107983545068316, "loss": 0.0094, "step": 460160 }, { "epoch": 1.19, "learning_rate": 0.00012107594723431169, "loss": 0.0142, "step": 460170 }, { "epoch": 1.19, "learning_rate": 0.00012107205901794023, "loss": 0.0124, "step": 460180 }, { "epoch": 1.19, "learning_rate": 0.00012106817080156876, "loss": 0.0123, "step": 460190 }, { "epoch": 1.19, "learning_rate": 0.0001210642825851973, "loss": 0.01, "step": 460200 }, { "epoch": 1.19, "learning_rate": 0.00012106039436882583, "loss": 0.0099, "step": 460210 }, { "epoch": 1.19, "learning_rate": 0.00012105650615245437, "loss": 0.0125, "step": 460220 }, { "epoch": 1.19, "learning_rate": 0.0001210526179360829, "loss": 0.0105, "step": 460230 }, { "epoch": 1.19, "learning_rate": 0.00012104872971971142, "loss": 0.0145, "step": 460240 }, { "epoch": 1.19, "learning_rate": 0.00012104484150333997, "loss": 0.008, "step": 460250 }, { "epoch": 1.19, "learning_rate": 0.0001210409532869685, "loss": 0.0101, "step": 460260 }, { "epoch": 1.19, "learning_rate": 0.00012103706507059704, "loss": 0.0094, "step": 460270 }, { "epoch": 1.19, "learning_rate": 0.00012103317685422556, "loss": 0.0121, "step": 460280 }, { "epoch": 1.19, "learning_rate": 0.0001210292886378541, "loss": 0.0114, "step": 460290 }, { "epoch": 1.19, "learning_rate": 0.00012102540042148263, "loss": 0.009, "step": 460300 }, { "epoch": 1.19, "learning_rate": 0.00012102151220511118, "loss": 0.008, "step": 460310 }, { "epoch": 1.19, "learning_rate": 0.0001210176239887397, "loss": 0.0152, "step": 460320 }, { "epoch": 1.19, "learning_rate": 0.00012101373577236826, "loss": 0.01, "step": 460330 }, { "epoch": 1.19, "learning_rate": 0.00012100984755599679, "loss": 0.0105, "step": 460340 }, { "epoch": 1.19, "learning_rate": 0.00012100595933962533, "loss": 0.0119, "step": 460350 }, { "epoch": 1.19, "learning_rate": 0.00012100207112325386, "loss": 0.0136, "step": 460360 }, { "epoch": 1.19, "learning_rate": 0.0001209981829068824, "loss": 0.0101, "step": 460370 }, { "epoch": 1.19, "learning_rate": 0.00012099429469051093, "loss": 0.0099, "step": 460380 }, { "epoch": 1.19, "learning_rate": 0.00012099040647413947, "loss": 0.0099, "step": 460390 }, { "epoch": 1.19, "learning_rate": 0.000120986518257768, "loss": 0.0109, "step": 460400 }, { "epoch": 1.19, "learning_rate": 0.00012098263004139654, "loss": 0.0082, "step": 460410 }, { "epoch": 1.19, "learning_rate": 0.00012097874182502507, "loss": 0.0096, "step": 460420 }, { "epoch": 1.19, "learning_rate": 0.00012097485360865361, "loss": 0.0113, "step": 460430 }, { "epoch": 1.19, "learning_rate": 0.00012097096539228214, "loss": 0.0101, "step": 460440 }, { "epoch": 1.19, "learning_rate": 0.00012096707717591068, "loss": 0.0102, "step": 460450 }, { "epoch": 1.19, "learning_rate": 0.0001209631889595392, "loss": 0.0106, "step": 460460 }, { "epoch": 1.19, "learning_rate": 0.00012095930074316775, "loss": 0.0106, "step": 460470 }, { "epoch": 1.19, "learning_rate": 0.00012095541252679628, "loss": 0.0101, "step": 460480 }, { "epoch": 1.19, "learning_rate": 0.0001209515243104248, "loss": 0.0091, "step": 460490 }, { "epoch": 1.19, "learning_rate": 0.00012094763609405336, "loss": 0.0118, "step": 460500 }, { "epoch": 1.19, "learning_rate": 0.00012094374787768187, "loss": 0.0092, "step": 460510 }, { "epoch": 1.19, "learning_rate": 0.00012093985966131043, "loss": 0.0119, "step": 460520 }, { "epoch": 1.19, "learning_rate": 0.00012093597144493896, "loss": 0.0105, "step": 460530 }, { "epoch": 1.19, "learning_rate": 0.0001209320832285675, "loss": 0.0082, "step": 460540 }, { "epoch": 1.19, "learning_rate": 0.00012092819501219603, "loss": 0.012, "step": 460550 }, { "epoch": 1.19, "learning_rate": 0.00012092430679582457, "loss": 0.0115, "step": 460560 }, { "epoch": 1.19, "learning_rate": 0.0001209204185794531, "loss": 0.0108, "step": 460570 }, { "epoch": 1.19, "learning_rate": 0.00012091653036308164, "loss": 0.0117, "step": 460580 }, { "epoch": 1.19, "learning_rate": 0.00012091264214671017, "loss": 0.0093, "step": 460590 }, { "epoch": 1.19, "learning_rate": 0.00012090875393033871, "loss": 0.0098, "step": 460600 }, { "epoch": 1.19, "learning_rate": 0.00012090486571396724, "loss": 0.0093, "step": 460610 }, { "epoch": 1.19, "learning_rate": 0.00012090097749759578, "loss": 0.011, "step": 460620 }, { "epoch": 1.19, "learning_rate": 0.0001208970892812243, "loss": 0.0108, "step": 460630 }, { "epoch": 1.19, "learning_rate": 0.00012089320106485285, "loss": 0.0131, "step": 460640 }, { "epoch": 1.19, "learning_rate": 0.00012088931284848137, "loss": 0.0075, "step": 460650 }, { "epoch": 1.19, "learning_rate": 0.00012088542463210992, "loss": 0.0126, "step": 460660 }, { "epoch": 1.19, "learning_rate": 0.00012088153641573844, "loss": 0.0097, "step": 460670 }, { "epoch": 1.19, "learning_rate": 0.000120877648199367, "loss": 0.0125, "step": 460680 }, { "epoch": 1.19, "learning_rate": 0.00012087375998299553, "loss": 0.0121, "step": 460690 }, { "epoch": 1.19, "learning_rate": 0.00012086987176662407, "loss": 0.0119, "step": 460700 }, { "epoch": 1.19, "learning_rate": 0.0001208659835502526, "loss": 0.0087, "step": 460710 }, { "epoch": 1.19, "learning_rate": 0.00012086209533388114, "loss": 0.01, "step": 460720 }, { "epoch": 1.19, "learning_rate": 0.00012085820711750967, "loss": 0.0108, "step": 460730 }, { "epoch": 1.19, "learning_rate": 0.0001208543189011382, "loss": 0.01, "step": 460740 }, { "epoch": 1.19, "learning_rate": 0.00012085043068476674, "loss": 0.0111, "step": 460750 }, { "epoch": 1.19, "learning_rate": 0.00012084654246839526, "loss": 0.0108, "step": 460760 }, { "epoch": 1.19, "learning_rate": 0.0001208426542520238, "loss": 0.0093, "step": 460770 }, { "epoch": 1.19, "learning_rate": 0.00012083876603565233, "loss": 0.0116, "step": 460780 }, { "epoch": 1.19, "learning_rate": 0.00012083487781928088, "loss": 0.0107, "step": 460790 }, { "epoch": 1.19, "learning_rate": 0.0001208309896029094, "loss": 0.0109, "step": 460800 }, { "epoch": 1.19, "learning_rate": 0.00012082710138653795, "loss": 0.0108, "step": 460810 }, { "epoch": 1.19, "learning_rate": 0.00012082321317016647, "loss": 0.0098, "step": 460820 }, { "epoch": 1.19, "learning_rate": 0.00012081932495379502, "loss": 0.0105, "step": 460830 }, { "epoch": 1.19, "learning_rate": 0.00012081543673742354, "loss": 0.0087, "step": 460840 }, { "epoch": 1.19, "learning_rate": 0.0001208115485210521, "loss": 0.0115, "step": 460850 }, { "epoch": 1.19, "learning_rate": 0.00012080766030468063, "loss": 0.0121, "step": 460860 }, { "epoch": 1.19, "learning_rate": 0.00012080377208830917, "loss": 0.0104, "step": 460870 }, { "epoch": 1.19, "learning_rate": 0.0001207998838719377, "loss": 0.0123, "step": 460880 }, { "epoch": 1.19, "learning_rate": 0.00012079599565556624, "loss": 0.0087, "step": 460890 }, { "epoch": 1.19, "learning_rate": 0.00012079210743919477, "loss": 0.0139, "step": 460900 }, { "epoch": 1.19, "learning_rate": 0.00012078821922282331, "loss": 0.013, "step": 460910 }, { "epoch": 1.19, "learning_rate": 0.00012078433100645184, "loss": 0.0092, "step": 460920 }, { "epoch": 1.19, "learning_rate": 0.00012078044279008038, "loss": 0.0127, "step": 460930 }, { "epoch": 1.19, "learning_rate": 0.0001207765545737089, "loss": 0.0106, "step": 460940 }, { "epoch": 1.19, "learning_rate": 0.00012077266635733745, "loss": 0.0123, "step": 460950 }, { "epoch": 1.19, "learning_rate": 0.00012076877814096598, "loss": 0.0125, "step": 460960 }, { "epoch": 1.19, "learning_rate": 0.00012076488992459452, "loss": 0.0176, "step": 460970 }, { "epoch": 1.19, "learning_rate": 0.00012076100170822305, "loss": 0.0107, "step": 460980 }, { "epoch": 1.19, "learning_rate": 0.00012075711349185157, "loss": 0.0092, "step": 460990 }, { "epoch": 1.19, "learning_rate": 0.00012075322527548012, "loss": 0.0109, "step": 461000 }, { "epoch": 1.19, "eval_cer": 0.881719481966378, "eval_loss": 0.0072724465280771255, "eval_runtime": 107.8929, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 461000 }, { "epoch": 1.2, "learning_rate": 0.00012074933705910864, "loss": 0.0117, "step": 461010 }, { "epoch": 1.2, "learning_rate": 0.00012074544884273718, "loss": 0.0106, "step": 461020 }, { "epoch": 1.2, "learning_rate": 0.00012074156062636571, "loss": 0.0139, "step": 461030 }, { "epoch": 1.2, "learning_rate": 0.00012073767240999427, "loss": 0.0107, "step": 461040 }, { "epoch": 1.2, "learning_rate": 0.0001207337841936228, "loss": 0.0116, "step": 461050 }, { "epoch": 1.2, "learning_rate": 0.00012072989597725134, "loss": 0.0112, "step": 461060 }, { "epoch": 1.2, "learning_rate": 0.00012072600776087987, "loss": 0.0116, "step": 461070 }, { "epoch": 1.2, "learning_rate": 0.00012072211954450841, "loss": 0.011, "step": 461080 }, { "epoch": 1.2, "learning_rate": 0.00012071823132813694, "loss": 0.0094, "step": 461090 }, { "epoch": 1.2, "learning_rate": 0.00012071434311176548, "loss": 0.0084, "step": 461100 }, { "epoch": 1.2, "learning_rate": 0.000120710454895394, "loss": 0.0115, "step": 461110 }, { "epoch": 1.2, "learning_rate": 0.00012070656667902255, "loss": 0.0095, "step": 461120 }, { "epoch": 1.2, "learning_rate": 0.00012070267846265107, "loss": 0.0109, "step": 461130 }, { "epoch": 1.2, "learning_rate": 0.00012069879024627962, "loss": 0.0113, "step": 461140 }, { "epoch": 1.2, "learning_rate": 0.00012069490202990814, "loss": 0.0113, "step": 461150 }, { "epoch": 1.2, "learning_rate": 0.00012069101381353669, "loss": 0.0274, "step": 461160 }, { "epoch": 1.2, "learning_rate": 0.00012068712559716521, "loss": 0.0101, "step": 461170 }, { "epoch": 1.2, "learning_rate": 0.00012068323738079376, "loss": 0.0142, "step": 461180 }, { "epoch": 1.2, "learning_rate": 0.00012067934916442228, "loss": 0.0129, "step": 461190 }, { "epoch": 1.2, "learning_rate": 0.00012067546094805084, "loss": 0.0098, "step": 461200 }, { "epoch": 1.2, "learning_rate": 0.00012067157273167937, "loss": 0.0093, "step": 461210 }, { "epoch": 1.2, "learning_rate": 0.00012066768451530791, "loss": 0.0109, "step": 461220 }, { "epoch": 1.2, "learning_rate": 0.00012066379629893644, "loss": 0.0096, "step": 461230 }, { "epoch": 1.2, "learning_rate": 0.00012065990808256497, "loss": 0.0136, "step": 461240 }, { "epoch": 1.2, "learning_rate": 0.00012065601986619351, "loss": 0.0125, "step": 461250 }, { "epoch": 1.2, "learning_rate": 0.00012065213164982203, "loss": 0.0099, "step": 461260 }, { "epoch": 1.2, "learning_rate": 0.00012064824343345058, "loss": 0.0135, "step": 461270 }, { "epoch": 1.2, "learning_rate": 0.0001206443552170791, "loss": 0.0089, "step": 461280 }, { "epoch": 1.2, "learning_rate": 0.00012064046700070765, "loss": 0.0138, "step": 461290 }, { "epoch": 1.2, "learning_rate": 0.00012063657878433617, "loss": 0.0123, "step": 461300 }, { "epoch": 1.2, "learning_rate": 0.00012063269056796472, "loss": 0.0108, "step": 461310 }, { "epoch": 1.2, "learning_rate": 0.00012062880235159324, "loss": 0.0094, "step": 461320 }, { "epoch": 1.2, "learning_rate": 0.00012062491413522179, "loss": 0.0093, "step": 461330 }, { "epoch": 1.2, "learning_rate": 0.00012062102591885031, "loss": 0.0125, "step": 461340 }, { "epoch": 1.2, "learning_rate": 0.00012061713770247886, "loss": 0.0089, "step": 461350 }, { "epoch": 1.2, "learning_rate": 0.00012061324948610738, "loss": 0.0127, "step": 461360 }, { "epoch": 1.2, "learning_rate": 0.00012060936126973594, "loss": 0.0125, "step": 461370 }, { "epoch": 1.2, "learning_rate": 0.00012060547305336445, "loss": 0.0093, "step": 461380 }, { "epoch": 1.2, "learning_rate": 0.00012060158483699301, "loss": 0.0103, "step": 461390 }, { "epoch": 1.2, "learning_rate": 0.00012059769662062154, "loss": 0.0118, "step": 461400 }, { "epoch": 1.2, "learning_rate": 0.00012059380840425008, "loss": 0.0096, "step": 461410 }, { "epoch": 1.2, "learning_rate": 0.0001205899201878786, "loss": 0.0141, "step": 461420 }, { "epoch": 1.2, "learning_rate": 0.00012058603197150715, "loss": 0.0099, "step": 461430 }, { "epoch": 1.2, "learning_rate": 0.00012058214375513568, "loss": 0.0112, "step": 461440 }, { "epoch": 1.2, "learning_rate": 0.00012057825553876422, "loss": 0.0099, "step": 461450 }, { "epoch": 1.2, "learning_rate": 0.00012057436732239275, "loss": 0.0098, "step": 461460 }, { "epoch": 1.2, "learning_rate": 0.00012057047910602129, "loss": 0.0123, "step": 461470 }, { "epoch": 1.2, "learning_rate": 0.00012056659088964982, "loss": 0.0093, "step": 461480 }, { "epoch": 1.2, "learning_rate": 0.00012056270267327834, "loss": 0.0118, "step": 461490 }, { "epoch": 1.2, "learning_rate": 0.00012055881445690689, "loss": 0.0079, "step": 461500 }, { "epoch": 1.2, "learning_rate": 0.00012055492624053541, "loss": 0.0084, "step": 461510 }, { "epoch": 1.2, "learning_rate": 0.00012055103802416395, "loss": 0.0109, "step": 461520 }, { "epoch": 1.2, "learning_rate": 0.00012054714980779248, "loss": 0.0116, "step": 461530 }, { "epoch": 1.2, "learning_rate": 0.00012054326159142102, "loss": 0.0118, "step": 461540 }, { "epoch": 1.2, "learning_rate": 0.00012053937337504955, "loss": 0.0091, "step": 461550 }, { "epoch": 1.2, "learning_rate": 0.00012053548515867811, "loss": 0.0123, "step": 461560 }, { "epoch": 1.2, "learning_rate": 0.00012053159694230664, "loss": 0.0129, "step": 461570 }, { "epoch": 1.2, "learning_rate": 0.00012052770872593518, "loss": 0.0113, "step": 461580 }, { "epoch": 1.2, "learning_rate": 0.0001205238205095637, "loss": 0.0106, "step": 461590 }, { "epoch": 1.2, "learning_rate": 0.00012051993229319225, "loss": 0.0161, "step": 461600 }, { "epoch": 1.2, "learning_rate": 0.00012051604407682078, "loss": 0.0093, "step": 461610 }, { "epoch": 1.2, "learning_rate": 0.00012051215586044932, "loss": 0.0108, "step": 461620 }, { "epoch": 1.2, "learning_rate": 0.00012050826764407785, "loss": 0.0173, "step": 461630 }, { "epoch": 1.2, "learning_rate": 0.00012050437942770639, "loss": 0.0102, "step": 461640 }, { "epoch": 1.2, "learning_rate": 0.00012050049121133491, "loss": 0.0105, "step": 461650 }, { "epoch": 1.2, "learning_rate": 0.00012049660299496346, "loss": 0.0086, "step": 461660 }, { "epoch": 1.2, "learning_rate": 0.00012049271477859198, "loss": 0.0123, "step": 461670 }, { "epoch": 1.2, "learning_rate": 0.00012048882656222053, "loss": 0.01, "step": 461680 }, { "epoch": 1.2, "learning_rate": 0.00012048493834584905, "loss": 0.0142, "step": 461690 }, { "epoch": 1.2, "learning_rate": 0.0001204810501294776, "loss": 0.0109, "step": 461700 }, { "epoch": 1.2, "learning_rate": 0.00012047716191310612, "loss": 0.0096, "step": 461710 }, { "epoch": 1.2, "learning_rate": 0.00012047327369673468, "loss": 0.0131, "step": 461720 }, { "epoch": 1.2, "learning_rate": 0.00012046938548036321, "loss": 0.0108, "step": 461730 }, { "epoch": 1.2, "learning_rate": 0.00012046549726399172, "loss": 0.0104, "step": 461740 }, { "epoch": 1.2, "learning_rate": 0.00012046160904762028, "loss": 0.0118, "step": 461750 }, { "epoch": 1.2, "learning_rate": 0.0001204577208312488, "loss": 0.0104, "step": 461760 }, { "epoch": 1.2, "learning_rate": 0.00012045383261487735, "loss": 0.0104, "step": 461770 }, { "epoch": 1.2, "learning_rate": 0.00012044994439850587, "loss": 0.0124, "step": 461780 }, { "epoch": 1.2, "learning_rate": 0.00012044605618213442, "loss": 0.0088, "step": 461790 }, { "epoch": 1.2, "learning_rate": 0.00012044216796576294, "loss": 0.0126, "step": 461800 }, { "epoch": 1.2, "learning_rate": 0.00012043827974939149, "loss": 0.0079, "step": 461810 }, { "epoch": 1.2, "learning_rate": 0.00012043439153302001, "loss": 0.0106, "step": 461820 }, { "epoch": 1.2, "learning_rate": 0.00012043050331664856, "loss": 0.0126, "step": 461830 }, { "epoch": 1.2, "learning_rate": 0.00012042661510027708, "loss": 0.0119, "step": 461840 }, { "epoch": 1.2, "learning_rate": 0.00012042272688390563, "loss": 0.0098, "step": 461850 }, { "epoch": 1.2, "learning_rate": 0.00012041883866753415, "loss": 0.0169, "step": 461860 }, { "epoch": 1.2, "learning_rate": 0.0001204149504511627, "loss": 0.0126, "step": 461870 }, { "epoch": 1.2, "learning_rate": 0.00012041106223479122, "loss": 0.0113, "step": 461880 }, { "epoch": 1.2, "learning_rate": 0.00012040717401841978, "loss": 0.0096, "step": 461890 }, { "epoch": 1.2, "learning_rate": 0.00012040328580204829, "loss": 0.0117, "step": 461900 }, { "epoch": 1.2, "learning_rate": 0.00012039939758567685, "loss": 0.0209, "step": 461910 }, { "epoch": 1.2, "learning_rate": 0.00012039550936930538, "loss": 0.0093, "step": 461920 }, { "epoch": 1.2, "learning_rate": 0.00012039162115293392, "loss": 0.0106, "step": 461930 }, { "epoch": 1.2, "learning_rate": 0.00012038773293656245, "loss": 0.0118, "step": 461940 }, { "epoch": 1.2, "learning_rate": 0.00012038384472019099, "loss": 0.0105, "step": 461950 }, { "epoch": 1.2, "learning_rate": 0.00012037995650381952, "loss": 0.012, "step": 461960 }, { "epoch": 1.2, "learning_rate": 0.00012037606828744806, "loss": 0.011, "step": 461970 }, { "epoch": 1.2, "learning_rate": 0.00012037218007107659, "loss": 0.0089, "step": 461980 }, { "epoch": 1.2, "learning_rate": 0.00012036829185470511, "loss": 0.0097, "step": 461990 }, { "epoch": 1.2, "learning_rate": 0.00012036440363833366, "loss": 0.0085, "step": 462000 }, { "epoch": 1.2, "eval_cer": 0.8816928888646285, "eval_loss": 0.00711864186450839, "eval_runtime": 107.836, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 462000 }, { "epoch": 1.2, "learning_rate": 0.00012036051542196218, "loss": 0.0141, "step": 462010 }, { "epoch": 1.2, "learning_rate": 0.00012035662720559073, "loss": 0.0089, "step": 462020 }, { "epoch": 1.2, "learning_rate": 0.00012035273898921925, "loss": 0.0109, "step": 462030 }, { "epoch": 1.2, "learning_rate": 0.0001203488507728478, "loss": 0.0099, "step": 462040 }, { "epoch": 1.2, "learning_rate": 0.00012034496255647632, "loss": 0.0109, "step": 462050 }, { "epoch": 1.2, "learning_rate": 0.00012034107434010486, "loss": 0.0159, "step": 462060 }, { "epoch": 1.2, "learning_rate": 0.00012033718612373339, "loss": 0.0113, "step": 462070 }, { "epoch": 1.2, "learning_rate": 0.00012033329790736195, "loss": 0.0114, "step": 462080 }, { "epoch": 1.2, "learning_rate": 0.00012032940969099048, "loss": 0.0097, "step": 462090 }, { "epoch": 1.2, "learning_rate": 0.00012032552147461902, "loss": 0.0115, "step": 462100 }, { "epoch": 1.2, "learning_rate": 0.00012032163325824755, "loss": 0.0127, "step": 462110 }, { "epoch": 1.2, "learning_rate": 0.00012031774504187609, "loss": 0.0108, "step": 462120 }, { "epoch": 1.2, "learning_rate": 0.00012031385682550462, "loss": 0.0113, "step": 462130 }, { "epoch": 1.2, "learning_rate": 0.00012030996860913316, "loss": 0.0119, "step": 462140 }, { "epoch": 1.2, "learning_rate": 0.00012030608039276169, "loss": 0.0115, "step": 462150 }, { "epoch": 1.2, "learning_rate": 0.00012030219217639023, "loss": 0.0119, "step": 462160 }, { "epoch": 1.2, "learning_rate": 0.00012029830396001875, "loss": 0.0102, "step": 462170 }, { "epoch": 1.2, "learning_rate": 0.0001202944157436473, "loss": 0.0099, "step": 462180 }, { "epoch": 1.2, "learning_rate": 0.00012029052752727582, "loss": 0.0119, "step": 462190 }, { "epoch": 1.2, "learning_rate": 0.00012028663931090437, "loss": 0.0126, "step": 462200 }, { "epoch": 1.2, "learning_rate": 0.0001202827510945329, "loss": 0.0102, "step": 462210 }, { "epoch": 1.2, "learning_rate": 0.00012027886287816144, "loss": 0.0098, "step": 462220 }, { "epoch": 1.2, "learning_rate": 0.00012027497466178996, "loss": 0.0113, "step": 462230 }, { "epoch": 1.2, "learning_rate": 0.00012027108644541849, "loss": 0.0092, "step": 462240 }, { "epoch": 1.2, "learning_rate": 0.00012026719822904703, "loss": 0.0135, "step": 462250 }, { "epoch": 1.2, "learning_rate": 0.00012026331001267556, "loss": 0.0105, "step": 462260 }, { "epoch": 1.2, "learning_rate": 0.00012025942179630412, "loss": 0.0117, "step": 462270 }, { "epoch": 1.2, "learning_rate": 0.00012025553357993265, "loss": 0.0123, "step": 462280 }, { "epoch": 1.2, "learning_rate": 0.00012025164536356119, "loss": 0.012, "step": 462290 }, { "epoch": 1.2, "learning_rate": 0.00012024775714718971, "loss": 0.0094, "step": 462300 }, { "epoch": 1.2, "learning_rate": 0.00012024386893081826, "loss": 0.0107, "step": 462310 }, { "epoch": 1.2, "learning_rate": 0.00012023998071444678, "loss": 0.0144, "step": 462320 }, { "epoch": 1.2, "learning_rate": 0.00012023609249807533, "loss": 0.0125, "step": 462330 }, { "epoch": 1.2, "learning_rate": 0.00012023220428170385, "loss": 0.0106, "step": 462340 }, { "epoch": 1.2, "learning_rate": 0.0001202283160653324, "loss": 0.0106, "step": 462350 }, { "epoch": 1.2, "learning_rate": 0.00012022442784896092, "loss": 0.0099, "step": 462360 }, { "epoch": 1.2, "learning_rate": 0.00012022053963258947, "loss": 0.0089, "step": 462370 }, { "epoch": 1.2, "learning_rate": 0.000120216651416218, "loss": 0.0152, "step": 462380 }, { "epoch": 1.2, "learning_rate": 0.00012021276319984654, "loss": 0.014, "step": 462390 }, { "epoch": 1.2, "learning_rate": 0.00012020887498347506, "loss": 0.0116, "step": 462400 }, { "epoch": 1.2, "learning_rate": 0.0001202049867671036, "loss": 0.0103, "step": 462410 }, { "epoch": 1.2, "learning_rate": 0.00012020109855073213, "loss": 0.0091, "step": 462420 }, { "epoch": 1.2, "learning_rate": 0.00012019721033436069, "loss": 0.0097, "step": 462430 }, { "epoch": 1.2, "learning_rate": 0.00012019332211798922, "loss": 0.0109, "step": 462440 }, { "epoch": 1.2, "learning_rate": 0.00012018943390161776, "loss": 0.011, "step": 462450 }, { "epoch": 1.2, "learning_rate": 0.00012018554568524629, "loss": 0.0125, "step": 462460 }, { "epoch": 1.2, "learning_rate": 0.00012018165746887483, "loss": 0.0116, "step": 462470 }, { "epoch": 1.2, "learning_rate": 0.00012017776925250336, "loss": 0.0134, "step": 462480 }, { "epoch": 1.2, "learning_rate": 0.00012017388103613188, "loss": 0.0162, "step": 462490 }, { "epoch": 1.2, "learning_rate": 0.00012016999281976043, "loss": 0.0109, "step": 462500 }, { "epoch": 1.2, "learning_rate": 0.00012016610460338895, "loss": 0.0139, "step": 462510 }, { "epoch": 1.2, "learning_rate": 0.0001201622163870175, "loss": 0.0093, "step": 462520 }, { "epoch": 1.2, "learning_rate": 0.00012015832817064602, "loss": 0.0087, "step": 462530 }, { "epoch": 1.2, "learning_rate": 0.00012015443995427457, "loss": 0.0106, "step": 462540 }, { "epoch": 1.2, "learning_rate": 0.00012015055173790309, "loss": 0.0105, "step": 462550 }, { "epoch": 1.2, "learning_rate": 0.00012014666352153163, "loss": 0.01, "step": 462560 }, { "epoch": 1.2, "learning_rate": 0.00012014277530516016, "loss": 0.0098, "step": 462570 }, { "epoch": 1.2, "learning_rate": 0.0001201388870887887, "loss": 0.0146, "step": 462580 }, { "epoch": 1.2, "learning_rate": 0.00012013499887241723, "loss": 0.0156, "step": 462590 }, { "epoch": 1.2, "learning_rate": 0.00012013111065604579, "loss": 0.0111, "step": 462600 }, { "epoch": 1.2, "learning_rate": 0.0001201272224396743, "loss": 0.0094, "step": 462610 }, { "epoch": 1.2, "learning_rate": 0.00012012333422330286, "loss": 0.0127, "step": 462620 }, { "epoch": 1.2, "learning_rate": 0.00012011944600693139, "loss": 0.0086, "step": 462630 }, { "epoch": 1.2, "learning_rate": 0.00012011555779055993, "loss": 0.008, "step": 462640 }, { "epoch": 1.2, "learning_rate": 0.00012011166957418846, "loss": 0.0089, "step": 462650 }, { "epoch": 1.2, "learning_rate": 0.000120107781357817, "loss": 0.0095, "step": 462660 }, { "epoch": 1.2, "learning_rate": 0.00012010389314144552, "loss": 0.0114, "step": 462670 }, { "epoch": 1.2, "learning_rate": 0.00012010000492507407, "loss": 0.0105, "step": 462680 }, { "epoch": 1.2, "learning_rate": 0.0001200961167087026, "loss": 0.0117, "step": 462690 }, { "epoch": 1.2, "learning_rate": 0.00012009222849233114, "loss": 0.0098, "step": 462700 }, { "epoch": 1.2, "learning_rate": 0.00012008834027595966, "loss": 0.0117, "step": 462710 }, { "epoch": 1.2, "learning_rate": 0.00012008445205958819, "loss": 0.0108, "step": 462720 }, { "epoch": 1.2, "learning_rate": 0.00012008056384321673, "loss": 0.0082, "step": 462730 }, { "epoch": 1.2, "learning_rate": 0.00012007667562684526, "loss": 0.012, "step": 462740 }, { "epoch": 1.2, "learning_rate": 0.0001200727874104738, "loss": 0.0129, "step": 462750 }, { "epoch": 1.2, "learning_rate": 0.00012006889919410233, "loss": 0.0113, "step": 462760 }, { "epoch": 1.2, "learning_rate": 0.00012006501097773087, "loss": 0.0101, "step": 462770 }, { "epoch": 1.2, "learning_rate": 0.0001200611227613594, "loss": 0.0101, "step": 462780 }, { "epoch": 1.2, "learning_rate": 0.00012005723454498796, "loss": 0.0142, "step": 462790 }, { "epoch": 1.2, "learning_rate": 0.00012005334632861648, "loss": 0.0108, "step": 462800 }, { "epoch": 1.2, "learning_rate": 0.00012004945811224503, "loss": 0.012, "step": 462810 }, { "epoch": 1.2, "learning_rate": 0.00012004556989587355, "loss": 0.0087, "step": 462820 }, { "epoch": 1.2, "learning_rate": 0.0001200416816795021, "loss": 0.0108, "step": 462830 }, { "epoch": 1.2, "learning_rate": 0.00012003779346313062, "loss": 0.0109, "step": 462840 }, { "epoch": 1.2, "learning_rate": 0.00012003390524675917, "loss": 0.0086, "step": 462850 }, { "epoch": 1.2, "learning_rate": 0.0001200300170303877, "loss": 0.0086, "step": 462860 }, { "epoch": 1.2, "learning_rate": 0.00012002612881401624, "loss": 0.0142, "step": 462870 }, { "epoch": 1.2, "learning_rate": 0.00012002224059764476, "loss": 0.0117, "step": 462880 }, { "epoch": 1.2, "learning_rate": 0.0001200183523812733, "loss": 0.0102, "step": 462890 }, { "epoch": 1.2, "learning_rate": 0.00012001446416490183, "loss": 0.0096, "step": 462900 }, { "epoch": 1.2, "learning_rate": 0.00012001057594853038, "loss": 0.0102, "step": 462910 }, { "epoch": 1.2, "learning_rate": 0.0001200066877321589, "loss": 0.0105, "step": 462920 }, { "epoch": 1.2, "learning_rate": 0.00012000279951578744, "loss": 0.0077, "step": 462930 }, { "epoch": 1.2, "learning_rate": 0.00011999891129941597, "loss": 0.0125, "step": 462940 }, { "epoch": 1.2, "learning_rate": 0.00011999502308304453, "loss": 0.0121, "step": 462950 }, { "epoch": 1.2, "learning_rate": 0.00011999113486667306, "loss": 0.0109, "step": 462960 }, { "epoch": 1.2, "learning_rate": 0.00011998724665030157, "loss": 0.0113, "step": 462970 }, { "epoch": 1.2, "learning_rate": 0.00011998335843393013, "loss": 0.0108, "step": 462980 }, { "epoch": 1.2, "learning_rate": 0.00011997947021755865, "loss": 0.0168, "step": 462990 }, { "epoch": 1.2, "learning_rate": 0.0001199755820011872, "loss": 0.0126, "step": 463000 }, { "epoch": 1.2, "eval_cer": 0.8817110841447728, "eval_loss": 0.006891580764204264, "eval_runtime": 108.0948, "eval_samples_per_second": 18.502, "eval_steps_per_second": 4.626, "step": 463000 }, { "epoch": 1.2, "learning_rate": 0.00011997169378481572, "loss": 0.0089, "step": 463010 }, { "epoch": 1.2, "learning_rate": 0.00011996780556844427, "loss": 0.0089, "step": 463020 }, { "epoch": 1.2, "learning_rate": 0.0001199639173520728, "loss": 0.0124, "step": 463030 }, { "epoch": 1.2, "learning_rate": 0.00011996002913570134, "loss": 0.0142, "step": 463040 }, { "epoch": 1.2, "learning_rate": 0.00011995614091932986, "loss": 0.0176, "step": 463050 }, { "epoch": 1.2, "learning_rate": 0.0001199522527029584, "loss": 0.0095, "step": 463060 }, { "epoch": 1.2, "learning_rate": 0.00011994836448658693, "loss": 0.0092, "step": 463070 }, { "epoch": 1.2, "learning_rate": 0.00011994447627021547, "loss": 0.0102, "step": 463080 }, { "epoch": 1.2, "learning_rate": 0.000119940588053844, "loss": 0.0098, "step": 463090 }, { "epoch": 1.2, "learning_rate": 0.00011993669983747254, "loss": 0.011, "step": 463100 }, { "epoch": 1.2, "learning_rate": 0.00011993281162110107, "loss": 0.0106, "step": 463110 }, { "epoch": 1.2, "learning_rate": 0.00011992892340472963, "loss": 0.0114, "step": 463120 }, { "epoch": 1.2, "learning_rate": 0.00011992503518835814, "loss": 0.0114, "step": 463130 }, { "epoch": 1.2, "learning_rate": 0.0001199211469719867, "loss": 0.0099, "step": 463140 }, { "epoch": 1.2, "learning_rate": 0.00011991725875561523, "loss": 0.011, "step": 463150 }, { "epoch": 1.2, "learning_rate": 0.00011991337053924377, "loss": 0.0127, "step": 463160 }, { "epoch": 1.2, "learning_rate": 0.0001199094823228723, "loss": 0.0104, "step": 463170 }, { "epoch": 1.2, "learning_rate": 0.00011990559410650084, "loss": 0.0076, "step": 463180 }, { "epoch": 1.2, "learning_rate": 0.00011990170589012936, "loss": 0.0139, "step": 463190 }, { "epoch": 1.2, "learning_rate": 0.0001198978176737579, "loss": 0.0132, "step": 463200 }, { "epoch": 1.2, "learning_rate": 0.00011989392945738643, "loss": 0.0075, "step": 463210 }, { "epoch": 1.2, "learning_rate": 0.00011989004124101496, "loss": 0.0106, "step": 463220 }, { "epoch": 1.2, "learning_rate": 0.0001198861530246435, "loss": 0.0106, "step": 463230 }, { "epoch": 1.2, "learning_rate": 0.00011988226480827203, "loss": 0.0097, "step": 463240 }, { "epoch": 1.2, "learning_rate": 0.00011987837659190057, "loss": 0.0095, "step": 463250 }, { "epoch": 1.2, "learning_rate": 0.0001198744883755291, "loss": 0.0109, "step": 463260 }, { "epoch": 1.2, "learning_rate": 0.00011987060015915764, "loss": 0.0097, "step": 463270 }, { "epoch": 1.2, "learning_rate": 0.00011986671194278617, "loss": 0.0102, "step": 463280 }, { "epoch": 1.2, "learning_rate": 0.00011986282372641471, "loss": 0.0087, "step": 463290 }, { "epoch": 1.2, "learning_rate": 0.00011985893551004324, "loss": 0.0093, "step": 463300 }, { "epoch": 1.2, "learning_rate": 0.0001198550472936718, "loss": 0.0128, "step": 463310 }, { "epoch": 1.2, "learning_rate": 0.00011985115907730032, "loss": 0.0133, "step": 463320 }, { "epoch": 1.2, "learning_rate": 0.00011984727086092887, "loss": 0.0118, "step": 463330 }, { "epoch": 1.2, "learning_rate": 0.0001198433826445574, "loss": 0.0106, "step": 463340 }, { "epoch": 1.2, "learning_rate": 0.00011983949442818594, "loss": 0.0108, "step": 463350 }, { "epoch": 1.2, "learning_rate": 0.00011983560621181446, "loss": 0.0101, "step": 463360 }, { "epoch": 1.2, "learning_rate": 0.000119831717995443, "loss": 0.0105, "step": 463370 }, { "epoch": 1.2, "learning_rate": 0.00011982782977907153, "loss": 0.0131, "step": 463380 }, { "epoch": 1.2, "learning_rate": 0.00011982394156270008, "loss": 0.0084, "step": 463390 }, { "epoch": 1.2, "learning_rate": 0.0001198200533463286, "loss": 0.0111, "step": 463400 }, { "epoch": 1.2, "learning_rate": 0.00011981616512995715, "loss": 0.0095, "step": 463410 }, { "epoch": 1.2, "learning_rate": 0.00011981227691358567, "loss": 0.0095, "step": 463420 }, { "epoch": 1.2, "learning_rate": 0.00011980838869721422, "loss": 0.0084, "step": 463430 }, { "epoch": 1.2, "learning_rate": 0.00011980450048084274, "loss": 0.0112, "step": 463440 }, { "epoch": 1.2, "learning_rate": 0.00011980061226447128, "loss": 0.014, "step": 463450 }, { "epoch": 1.2, "learning_rate": 0.00011979672404809981, "loss": 0.0131, "step": 463460 }, { "epoch": 1.2, "learning_rate": 0.00011979283583172834, "loss": 0.0121, "step": 463470 }, { "epoch": 1.2, "learning_rate": 0.0001197889476153569, "loss": 0.014, "step": 463480 }, { "epoch": 1.2, "learning_rate": 0.00011978505939898541, "loss": 0.0116, "step": 463490 }, { "epoch": 1.2, "learning_rate": 0.00011978117118261397, "loss": 0.0095, "step": 463500 }, { "epoch": 1.2, "learning_rate": 0.0001197772829662425, "loss": 0.0109, "step": 463510 }, { "epoch": 1.2, "learning_rate": 0.00011977339474987104, "loss": 0.0116, "step": 463520 }, { "epoch": 1.2, "learning_rate": 0.00011976950653349956, "loss": 0.0094, "step": 463530 }, { "epoch": 1.2, "learning_rate": 0.0001197656183171281, "loss": 0.0127, "step": 463540 }, { "epoch": 1.2, "learning_rate": 0.00011976173010075663, "loss": 0.0112, "step": 463550 }, { "epoch": 1.2, "learning_rate": 0.00011975784188438518, "loss": 0.0093, "step": 463560 }, { "epoch": 1.2, "learning_rate": 0.0001197539536680137, "loss": 0.0096, "step": 463570 }, { "epoch": 1.2, "learning_rate": 0.00011975006545164224, "loss": 0.0106, "step": 463580 }, { "epoch": 1.2, "learning_rate": 0.00011974617723527077, "loss": 0.0113, "step": 463590 }, { "epoch": 1.2, "learning_rate": 0.00011974228901889931, "loss": 0.0097, "step": 463600 }, { "epoch": 1.2, "learning_rate": 0.00011973840080252784, "loss": 0.0118, "step": 463610 }, { "epoch": 1.2, "learning_rate": 0.00011973451258615638, "loss": 0.0093, "step": 463620 }, { "epoch": 1.2, "learning_rate": 0.00011973062436978491, "loss": 0.0098, "step": 463630 }, { "epoch": 1.2, "learning_rate": 0.00011972673615341345, "loss": 0.0136, "step": 463640 }, { "epoch": 1.2, "learning_rate": 0.00011972284793704198, "loss": 0.0122, "step": 463650 }, { "epoch": 1.2, "learning_rate": 0.00011971895972067054, "loss": 0.0104, "step": 463660 }, { "epoch": 1.2, "learning_rate": 0.00011971507150429907, "loss": 0.0114, "step": 463670 }, { "epoch": 1.2, "learning_rate": 0.00011971118328792761, "loss": 0.013, "step": 463680 }, { "epoch": 1.2, "learning_rate": 0.00011970729507155614, "loss": 0.0132, "step": 463690 }, { "epoch": 1.2, "learning_rate": 0.00011970340685518468, "loss": 0.0091, "step": 463700 }, { "epoch": 1.2, "learning_rate": 0.0001196995186388132, "loss": 0.0116, "step": 463710 }, { "epoch": 1.2, "learning_rate": 0.00011969563042244173, "loss": 0.0113, "step": 463720 }, { "epoch": 1.2, "learning_rate": 0.00011969174220607027, "loss": 0.0091, "step": 463730 }, { "epoch": 1.2, "learning_rate": 0.0001196878539896988, "loss": 0.0125, "step": 463740 }, { "epoch": 1.2, "learning_rate": 0.00011968396577332734, "loss": 0.0126, "step": 463750 }, { "epoch": 1.2, "learning_rate": 0.00011968007755695587, "loss": 0.0099, "step": 463760 }, { "epoch": 1.2, "learning_rate": 0.00011967618934058441, "loss": 0.0145, "step": 463770 }, { "epoch": 1.2, "learning_rate": 0.00011967230112421294, "loss": 0.0099, "step": 463780 }, { "epoch": 1.2, "learning_rate": 0.00011966841290784148, "loss": 0.0195, "step": 463790 }, { "epoch": 1.2, "learning_rate": 0.00011966452469147001, "loss": 0.0156, "step": 463800 }, { "epoch": 1.2, "learning_rate": 0.00011966063647509855, "loss": 0.0087, "step": 463810 }, { "epoch": 1.2, "learning_rate": 0.00011965674825872708, "loss": 0.0101, "step": 463820 }, { "epoch": 1.2, "learning_rate": 0.00011965286004235564, "loss": 0.0102, "step": 463830 }, { "epoch": 1.2, "learning_rate": 0.00011964897182598415, "loss": 0.0083, "step": 463840 }, { "epoch": 1.2, "learning_rate": 0.0001196450836096127, "loss": 0.009, "step": 463850 }, { "epoch": 1.2, "learning_rate": 0.00011964119539324123, "loss": 0.0112, "step": 463860 }, { "epoch": 1.2, "learning_rate": 0.00011963730717686978, "loss": 0.0117, "step": 463870 }, { "epoch": 1.2, "learning_rate": 0.0001196334189604983, "loss": 0.011, "step": 463880 }, { "epoch": 1.2, "learning_rate": 0.00011962953074412685, "loss": 0.0095, "step": 463890 }, { "epoch": 1.2, "learning_rate": 0.00011962564252775537, "loss": 0.0098, "step": 463900 }, { "epoch": 1.2, "learning_rate": 0.00011962175431138392, "loss": 0.0093, "step": 463910 }, { "epoch": 1.2, "learning_rate": 0.00011961786609501244, "loss": 0.0133, "step": 463920 }, { "epoch": 1.2, "learning_rate": 0.00011961397787864099, "loss": 0.0097, "step": 463930 }, { "epoch": 1.2, "learning_rate": 0.00011961008966226951, "loss": 0.0109, "step": 463940 }, { "epoch": 1.2, "learning_rate": 0.00011960620144589806, "loss": 0.0101, "step": 463950 }, { "epoch": 1.2, "learning_rate": 0.00011960231322952658, "loss": 0.0122, "step": 463960 }, { "epoch": 1.2, "learning_rate": 0.00011959842501315511, "loss": 0.009, "step": 463970 }, { "epoch": 1.2, "learning_rate": 0.00011959453679678365, "loss": 0.0079, "step": 463980 }, { "epoch": 1.2, "learning_rate": 0.00011959064858041218, "loss": 0.0137, "step": 463990 }, { "epoch": 1.2, "learning_rate": 0.00011958676036404072, "loss": 0.01, "step": 464000 }, { "epoch": 1.2, "eval_cer": 0.8816718943106159, "eval_loss": 0.0069192503578960896, "eval_runtime": 107.9208, "eval_samples_per_second": 18.532, "eval_steps_per_second": 4.633, "step": 464000 }, { "epoch": 1.2, "learning_rate": 0.00011958287214766925, "loss": 0.0094, "step": 464010 }, { "epoch": 1.2, "learning_rate": 0.0001195789839312978, "loss": 0.012, "step": 464020 }, { "epoch": 1.2, "learning_rate": 0.00011957509571492633, "loss": 0.0083, "step": 464030 }, { "epoch": 1.2, "learning_rate": 0.00011957120749855488, "loss": 0.0109, "step": 464040 }, { "epoch": 1.2, "learning_rate": 0.0001195673192821834, "loss": 0.01, "step": 464050 }, { "epoch": 1.2, "learning_rate": 0.00011956343106581195, "loss": 0.0102, "step": 464060 }, { "epoch": 1.2, "learning_rate": 0.00011955954284944047, "loss": 0.0113, "step": 464070 }, { "epoch": 1.2, "learning_rate": 0.00011955565463306901, "loss": 0.012, "step": 464080 }, { "epoch": 1.2, "learning_rate": 0.00011955176641669754, "loss": 0.0123, "step": 464090 }, { "epoch": 1.2, "learning_rate": 0.00011954787820032608, "loss": 0.0142, "step": 464100 }, { "epoch": 1.2, "learning_rate": 0.00011954398998395461, "loss": 0.009, "step": 464110 }, { "epoch": 1.2, "learning_rate": 0.00011954010176758315, "loss": 0.0111, "step": 464120 }, { "epoch": 1.2, "learning_rate": 0.00011953621355121168, "loss": 0.0104, "step": 464130 }, { "epoch": 1.2, "learning_rate": 0.00011953232533484022, "loss": 0.0137, "step": 464140 }, { "epoch": 1.2, "learning_rate": 0.00011952843711846875, "loss": 0.0103, "step": 464150 }, { "epoch": 1.2, "learning_rate": 0.0001195245489020973, "loss": 0.0089, "step": 464160 }, { "epoch": 1.2, "learning_rate": 0.00011952066068572582, "loss": 0.016, "step": 464170 }, { "epoch": 1.2, "learning_rate": 0.00011951677246935438, "loss": 0.0095, "step": 464180 }, { "epoch": 1.2, "learning_rate": 0.0001195128842529829, "loss": 0.0081, "step": 464190 }, { "epoch": 1.2, "learning_rate": 0.00011950899603661145, "loss": 0.0093, "step": 464200 }, { "epoch": 1.2, "learning_rate": 0.00011950510782023997, "loss": 0.0089, "step": 464210 }, { "epoch": 1.2, "learning_rate": 0.0001195012196038685, "loss": 0.0087, "step": 464220 }, { "epoch": 1.2, "learning_rate": 0.00011949733138749704, "loss": 0.0099, "step": 464230 }, { "epoch": 1.2, "learning_rate": 0.00011949344317112557, "loss": 0.0128, "step": 464240 }, { "epoch": 1.2, "learning_rate": 0.00011948955495475411, "loss": 0.0111, "step": 464250 }, { "epoch": 1.2, "learning_rate": 0.00011948566673838264, "loss": 0.0099, "step": 464260 }, { "epoch": 1.2, "learning_rate": 0.00011948177852201118, "loss": 0.0124, "step": 464270 }, { "epoch": 1.2, "learning_rate": 0.00011947789030563971, "loss": 0.0108, "step": 464280 }, { "epoch": 1.2, "learning_rate": 0.00011947400208926825, "loss": 0.0101, "step": 464290 }, { "epoch": 1.2, "learning_rate": 0.00011947011387289678, "loss": 0.0089, "step": 464300 }, { "epoch": 1.2, "learning_rate": 0.00011946622565652532, "loss": 0.0071, "step": 464310 }, { "epoch": 1.2, "learning_rate": 0.00011946233744015385, "loss": 0.0085, "step": 464320 }, { "epoch": 1.2, "learning_rate": 0.0001194584492237824, "loss": 0.0078, "step": 464330 }, { "epoch": 1.2, "learning_rate": 0.00011945456100741092, "loss": 0.0115, "step": 464340 }, { "epoch": 1.2, "learning_rate": 0.00011945067279103948, "loss": 0.0085, "step": 464350 }, { "epoch": 1.2, "learning_rate": 0.00011944678457466799, "loss": 0.009, "step": 464360 }, { "epoch": 1.2, "learning_rate": 0.00011944289635829655, "loss": 0.0086, "step": 464370 }, { "epoch": 1.2, "learning_rate": 0.00011943900814192507, "loss": 0.0158, "step": 464380 }, { "epoch": 1.2, "learning_rate": 0.00011943511992555362, "loss": 0.0122, "step": 464390 }, { "epoch": 1.2, "learning_rate": 0.00011943123170918214, "loss": 0.0092, "step": 464400 }, { "epoch": 1.2, "learning_rate": 0.00011942734349281069, "loss": 0.0166, "step": 464410 }, { "epoch": 1.2, "learning_rate": 0.00011942345527643921, "loss": 0.014, "step": 464420 }, { "epoch": 1.2, "learning_rate": 0.00011941956706006776, "loss": 0.0125, "step": 464430 }, { "epoch": 1.2, "learning_rate": 0.00011941567884369628, "loss": 0.0119, "step": 464440 }, { "epoch": 1.2, "learning_rate": 0.00011941179062732483, "loss": 0.0125, "step": 464450 }, { "epoch": 1.2, "learning_rate": 0.00011940790241095335, "loss": 0.0144, "step": 464460 }, { "epoch": 1.2, "learning_rate": 0.00011940401419458188, "loss": 0.0101, "step": 464470 }, { "epoch": 1.2, "learning_rate": 0.00011940012597821042, "loss": 0.0104, "step": 464480 }, { "epoch": 1.2, "learning_rate": 0.00011939623776183895, "loss": 0.0171, "step": 464490 }, { "epoch": 1.2, "learning_rate": 0.00011939234954546749, "loss": 0.0109, "step": 464500 }, { "epoch": 1.2, "learning_rate": 0.00011938846132909602, "loss": 0.0108, "step": 464510 }, { "epoch": 1.2, "learning_rate": 0.00011938457311272456, "loss": 0.0124, "step": 464520 }, { "epoch": 1.2, "learning_rate": 0.00011938068489635309, "loss": 0.0107, "step": 464530 }, { "epoch": 1.2, "learning_rate": 0.00011937679667998165, "loss": 0.0098, "step": 464540 }, { "epoch": 1.2, "learning_rate": 0.00011937290846361017, "loss": 0.0167, "step": 464550 }, { "epoch": 1.2, "learning_rate": 0.00011936902024723872, "loss": 0.0102, "step": 464560 }, { "epoch": 1.2, "learning_rate": 0.00011936513203086724, "loss": 0.0104, "step": 464570 }, { "epoch": 1.2, "learning_rate": 0.00011936124381449579, "loss": 0.0102, "step": 464580 }, { "epoch": 1.2, "learning_rate": 0.00011935735559812431, "loss": 0.0089, "step": 464590 }, { "epoch": 1.2, "learning_rate": 0.00011935346738175285, "loss": 0.0109, "step": 464600 }, { "epoch": 1.2, "learning_rate": 0.00011934957916538138, "loss": 0.0087, "step": 464610 }, { "epoch": 1.2, "learning_rate": 0.00011934569094900992, "loss": 0.0108, "step": 464620 }, { "epoch": 1.2, "learning_rate": 0.00011934180273263845, "loss": 0.0098, "step": 464630 }, { "epoch": 1.2, "learning_rate": 0.000119337914516267, "loss": 0.0128, "step": 464640 }, { "epoch": 1.2, "learning_rate": 0.00011933402629989552, "loss": 0.0095, "step": 464650 }, { "epoch": 1.2, "learning_rate": 0.00011933013808352406, "loss": 0.0091, "step": 464660 }, { "epoch": 1.2, "learning_rate": 0.00011932624986715259, "loss": 0.0092, "step": 464670 }, { "epoch": 1.2, "learning_rate": 0.00011932236165078113, "loss": 0.0082, "step": 464680 }, { "epoch": 1.2, "learning_rate": 0.00011931847343440966, "loss": 0.012, "step": 464690 }, { "epoch": 1.2, "learning_rate": 0.00011931458521803822, "loss": 0.0088, "step": 464700 }, { "epoch": 1.2, "learning_rate": 0.00011931069700166675, "loss": 0.0094, "step": 464710 }, { "epoch": 1.2, "learning_rate": 0.00011930680878529526, "loss": 0.0099, "step": 464720 }, { "epoch": 1.2, "learning_rate": 0.00011930292056892381, "loss": 0.015, "step": 464730 }, { "epoch": 1.2, "learning_rate": 0.00011929903235255234, "loss": 0.0103, "step": 464740 }, { "epoch": 1.2, "learning_rate": 0.00011929514413618088, "loss": 0.0112, "step": 464750 }, { "epoch": 1.2, "learning_rate": 0.00011929125591980941, "loss": 0.0113, "step": 464760 }, { "epoch": 1.2, "learning_rate": 0.00011928736770343795, "loss": 0.0093, "step": 464770 }, { "epoch": 1.2, "learning_rate": 0.00011928347948706648, "loss": 0.0123, "step": 464780 }, { "epoch": 1.2, "learning_rate": 0.00011927959127069502, "loss": 0.0123, "step": 464790 }, { "epoch": 1.2, "learning_rate": 0.00011927570305432355, "loss": 0.0137, "step": 464800 }, { "epoch": 1.2, "learning_rate": 0.0001192718148379521, "loss": 0.0088, "step": 464810 }, { "epoch": 1.2, "learning_rate": 0.00011926792662158062, "loss": 0.011, "step": 464820 }, { "epoch": 1.2, "learning_rate": 0.00011926403840520916, "loss": 0.0131, "step": 464830 }, { "epoch": 1.2, "learning_rate": 0.00011926015018883769, "loss": 0.0123, "step": 464840 }, { "epoch": 1.2, "learning_rate": 0.00011925626197246623, "loss": 0.0106, "step": 464850 }, { "epoch": 1.2, "learning_rate": 0.00011925237375609476, "loss": 0.0095, "step": 464860 }, { "epoch": 1.21, "learning_rate": 0.0001192484855397233, "loss": 0.0106, "step": 464870 }, { "epoch": 1.21, "learning_rate": 0.00011924459732335183, "loss": 0.0098, "step": 464880 }, { "epoch": 1.21, "learning_rate": 0.00011924070910698039, "loss": 0.0083, "step": 464890 }, { "epoch": 1.21, "learning_rate": 0.00011923682089060891, "loss": 0.0091, "step": 464900 }, { "epoch": 1.21, "learning_rate": 0.00011923293267423746, "loss": 0.0136, "step": 464910 }, { "epoch": 1.21, "learning_rate": 0.00011922904445786598, "loss": 0.0113, "step": 464920 }, { "epoch": 1.21, "learning_rate": 0.00011922515624149453, "loss": 0.0128, "step": 464930 }, { "epoch": 1.21, "learning_rate": 0.00011922126802512305, "loss": 0.0081, "step": 464940 }, { "epoch": 1.21, "learning_rate": 0.0001192173798087516, "loss": 0.0122, "step": 464950 }, { "epoch": 1.21, "learning_rate": 0.00011921349159238012, "loss": 0.0129, "step": 464960 }, { "epoch": 1.21, "learning_rate": 0.00011920960337600865, "loss": 0.0126, "step": 464970 }, { "epoch": 1.21, "learning_rate": 0.00011920571515963719, "loss": 0.0088, "step": 464980 }, { "epoch": 1.21, "learning_rate": 0.00011920182694326572, "loss": 0.0098, "step": 464990 }, { "epoch": 1.21, "learning_rate": 0.00011919793872689426, "loss": 0.0108, "step": 465000 }, { "epoch": 1.21, "eval_cer": 0.8816802921322209, "eval_loss": 0.006845335941761732, "eval_runtime": 107.9447, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 465000 }, { "epoch": 1.21, "learning_rate": 0.00011919405051052279, "loss": 0.0135, "step": 465010 }, { "epoch": 1.21, "learning_rate": 0.00011919016229415133, "loss": 0.0116, "step": 465020 }, { "epoch": 1.21, "learning_rate": 0.00011918627407777986, "loss": 0.0099, "step": 465030 }, { "epoch": 1.21, "learning_rate": 0.0001191823858614084, "loss": 0.0106, "step": 465040 }, { "epoch": 1.21, "learning_rate": 0.00011917849764503693, "loss": 0.0108, "step": 465050 }, { "epoch": 1.21, "learning_rate": 0.00011917460942866549, "loss": 0.0096, "step": 465060 }, { "epoch": 1.21, "learning_rate": 0.00011917072121229401, "loss": 0.0094, "step": 465070 }, { "epoch": 1.21, "learning_rate": 0.00011916683299592256, "loss": 0.0149, "step": 465080 }, { "epoch": 1.21, "learning_rate": 0.00011916294477955108, "loss": 0.0083, "step": 465090 }, { "epoch": 1.21, "learning_rate": 0.00011915905656317963, "loss": 0.0113, "step": 465100 }, { "epoch": 1.21, "learning_rate": 0.00011915516834680815, "loss": 0.0122, "step": 465110 }, { "epoch": 1.21, "learning_rate": 0.0001191512801304367, "loss": 0.0091, "step": 465120 }, { "epoch": 1.21, "learning_rate": 0.00011914739191406522, "loss": 0.0135, "step": 465130 }, { "epoch": 1.21, "learning_rate": 0.00011914350369769376, "loss": 0.0096, "step": 465140 }, { "epoch": 1.21, "learning_rate": 0.00011913961548132229, "loss": 0.0112, "step": 465150 }, { "epoch": 1.21, "learning_rate": 0.00011913572726495083, "loss": 0.009, "step": 465160 }, { "epoch": 1.21, "learning_rate": 0.00011913183904857936, "loss": 0.0103, "step": 465170 }, { "epoch": 1.21, "learning_rate": 0.0001191279508322079, "loss": 0.0096, "step": 465180 }, { "epoch": 1.21, "learning_rate": 0.00011912406261583643, "loss": 0.0106, "step": 465190 }, { "epoch": 1.21, "learning_rate": 0.00011912017439946496, "loss": 0.01, "step": 465200 }, { "epoch": 1.21, "learning_rate": 0.0001191162861830935, "loss": 0.0095, "step": 465210 }, { "epoch": 1.21, "learning_rate": 0.00011911239796672203, "loss": 0.0122, "step": 465220 }, { "epoch": 1.21, "learning_rate": 0.00011910850975035057, "loss": 0.0114, "step": 465230 }, { "epoch": 1.21, "learning_rate": 0.0001191046215339791, "loss": 0.0116, "step": 465240 }, { "epoch": 1.21, "learning_rate": 0.00011910073331760765, "loss": 0.0111, "step": 465250 }, { "epoch": 1.21, "learning_rate": 0.00011909684510123618, "loss": 0.0102, "step": 465260 }, { "epoch": 1.21, "learning_rate": 0.00011909295688486472, "loss": 0.011, "step": 465270 }, { "epoch": 1.21, "learning_rate": 0.00011908906866849325, "loss": 0.0118, "step": 465280 }, { "epoch": 1.21, "learning_rate": 0.0001190851804521218, "loss": 0.0104, "step": 465290 }, { "epoch": 1.21, "learning_rate": 0.00011908129223575032, "loss": 0.0117, "step": 465300 }, { "epoch": 1.21, "learning_rate": 0.00011907740401937886, "loss": 0.0102, "step": 465310 }, { "epoch": 1.21, "learning_rate": 0.00011907351580300739, "loss": 0.0113, "step": 465320 }, { "epoch": 1.21, "learning_rate": 0.00011906962758663593, "loss": 0.012, "step": 465330 }, { "epoch": 1.21, "learning_rate": 0.00011906573937026446, "loss": 0.0192, "step": 465340 }, { "epoch": 1.21, "learning_rate": 0.000119061851153893, "loss": 0.0087, "step": 465350 }, { "epoch": 1.21, "learning_rate": 0.00011905796293752153, "loss": 0.0188, "step": 465360 }, { "epoch": 1.21, "learning_rate": 0.00011905407472115007, "loss": 0.0102, "step": 465370 }, { "epoch": 1.21, "learning_rate": 0.0001190501865047786, "loss": 0.0099, "step": 465380 }, { "epoch": 1.21, "learning_rate": 0.00011904629828840714, "loss": 0.0086, "step": 465390 }, { "epoch": 1.21, "learning_rate": 0.00011904241007203567, "loss": 0.0121, "step": 465400 }, { "epoch": 1.21, "learning_rate": 0.00011903852185566423, "loss": 0.0136, "step": 465410 }, { "epoch": 1.21, "learning_rate": 0.00011903463363929275, "loss": 0.0113, "step": 465420 }, { "epoch": 1.21, "learning_rate": 0.0001190307454229213, "loss": 0.0148, "step": 465430 }, { "epoch": 1.21, "learning_rate": 0.00011902685720654982, "loss": 0.0096, "step": 465440 }, { "epoch": 1.21, "learning_rate": 0.00011902296899017835, "loss": 0.0105, "step": 465450 }, { "epoch": 1.21, "learning_rate": 0.0001190190807738069, "loss": 0.0109, "step": 465460 }, { "epoch": 1.21, "learning_rate": 0.00011901519255743542, "loss": 0.0112, "step": 465470 }, { "epoch": 1.21, "learning_rate": 0.00011901130434106396, "loss": 0.0124, "step": 465480 }, { "epoch": 1.21, "learning_rate": 0.00011900741612469249, "loss": 0.011, "step": 465490 }, { "epoch": 1.21, "learning_rate": 0.00011900352790832103, "loss": 0.0072, "step": 465500 }, { "epoch": 1.21, "learning_rate": 0.00011899963969194956, "loss": 0.0122, "step": 465510 }, { "epoch": 1.21, "learning_rate": 0.0001189957514755781, "loss": 0.0102, "step": 465520 }, { "epoch": 1.21, "learning_rate": 0.00011899186325920663, "loss": 0.01, "step": 465530 }, { "epoch": 1.21, "learning_rate": 0.00011898797504283517, "loss": 0.0091, "step": 465540 }, { "epoch": 1.21, "learning_rate": 0.0001189840868264637, "loss": 0.0093, "step": 465550 }, { "epoch": 1.21, "learning_rate": 0.00011898019861009224, "loss": 0.0123, "step": 465560 }, { "epoch": 1.21, "learning_rate": 0.00011897631039372077, "loss": 0.011, "step": 465570 }, { "epoch": 1.21, "learning_rate": 0.00011897242217734933, "loss": 0.0088, "step": 465580 }, { "epoch": 1.21, "learning_rate": 0.00011896853396097784, "loss": 0.011, "step": 465590 }, { "epoch": 1.21, "learning_rate": 0.0001189646457446064, "loss": 0.0137, "step": 465600 }, { "epoch": 1.21, "learning_rate": 0.00011896075752823492, "loss": 0.0105, "step": 465610 }, { "epoch": 1.21, "learning_rate": 0.00011895686931186346, "loss": 0.011, "step": 465620 }, { "epoch": 1.21, "learning_rate": 0.00011895298109549199, "loss": 0.0077, "step": 465630 }, { "epoch": 1.21, "learning_rate": 0.00011894909287912053, "loss": 0.0088, "step": 465640 }, { "epoch": 1.21, "learning_rate": 0.00011894520466274906, "loss": 0.0084, "step": 465650 }, { "epoch": 1.21, "learning_rate": 0.0001189413164463776, "loss": 0.0096, "step": 465660 }, { "epoch": 1.21, "learning_rate": 0.00011893742823000613, "loss": 0.0172, "step": 465670 }, { "epoch": 1.21, "learning_rate": 0.00011893354001363467, "loss": 0.0115, "step": 465680 }, { "epoch": 1.21, "learning_rate": 0.0001189296517972632, "loss": 0.0129, "step": 465690 }, { "epoch": 1.21, "learning_rate": 0.00011892576358089173, "loss": 0.0141, "step": 465700 }, { "epoch": 1.21, "learning_rate": 0.00011892187536452027, "loss": 0.012, "step": 465710 }, { "epoch": 1.21, "learning_rate": 0.0001189179871481488, "loss": 0.0123, "step": 465720 }, { "epoch": 1.21, "learning_rate": 0.00011891409893177734, "loss": 0.0096, "step": 465730 }, { "epoch": 1.21, "learning_rate": 0.00011891021071540587, "loss": 0.01, "step": 465740 }, { "epoch": 1.21, "learning_rate": 0.00011890632249903441, "loss": 0.0093, "step": 465750 }, { "epoch": 1.21, "learning_rate": 0.00011890243428266294, "loss": 0.0135, "step": 465760 }, { "epoch": 1.21, "learning_rate": 0.0001188985460662915, "loss": 0.0135, "step": 465770 }, { "epoch": 1.21, "learning_rate": 0.00011889465784992002, "loss": 0.0146, "step": 465780 }, { "epoch": 1.21, "learning_rate": 0.00011889076963354856, "loss": 0.0124, "step": 465790 }, { "epoch": 1.21, "learning_rate": 0.00011888688141717709, "loss": 0.0126, "step": 465800 }, { "epoch": 1.21, "learning_rate": 0.00011888299320080563, "loss": 0.0099, "step": 465810 }, { "epoch": 1.21, "learning_rate": 0.00011887910498443416, "loss": 0.0114, "step": 465820 }, { "epoch": 1.21, "learning_rate": 0.0001188752167680627, "loss": 0.0112, "step": 465830 }, { "epoch": 1.21, "learning_rate": 0.00011887132855169123, "loss": 0.0111, "step": 465840 }, { "epoch": 1.21, "learning_rate": 0.00011886744033531977, "loss": 0.0101, "step": 465850 }, { "epoch": 1.21, "learning_rate": 0.0001188635521189483, "loss": 0.0121, "step": 465860 }, { "epoch": 1.21, "learning_rate": 0.00011885966390257684, "loss": 0.0082, "step": 465870 }, { "epoch": 1.21, "learning_rate": 0.00011885577568620537, "loss": 0.0103, "step": 465880 }, { "epoch": 1.21, "learning_rate": 0.00011885188746983391, "loss": 0.0102, "step": 465890 }, { "epoch": 1.21, "learning_rate": 0.00011884799925346244, "loss": 0.0104, "step": 465900 }, { "epoch": 1.21, "learning_rate": 0.00011884411103709098, "loss": 0.0135, "step": 465910 }, { "epoch": 1.21, "learning_rate": 0.00011884022282071951, "loss": 0.0098, "step": 465920 }, { "epoch": 1.21, "learning_rate": 0.00011883633460434807, "loss": 0.0102, "step": 465930 }, { "epoch": 1.21, "learning_rate": 0.0001188324463879766, "loss": 0.0078, "step": 465940 }, { "epoch": 1.21, "learning_rate": 0.00011882855817160511, "loss": 0.0087, "step": 465950 }, { "epoch": 1.21, "learning_rate": 0.00011882466995523366, "loss": 0.0125, "step": 465960 }, { "epoch": 1.21, "learning_rate": 0.00011882078173886219, "loss": 0.0105, "step": 465970 }, { "epoch": 1.21, "learning_rate": 0.00011881689352249073, "loss": 0.0091, "step": 465980 }, { "epoch": 1.21, "learning_rate": 0.00011881300530611926, "loss": 0.0089, "step": 465990 }, { "epoch": 1.21, "learning_rate": 0.0001188091170897478, "loss": 0.0101, "step": 466000 }, { "epoch": 1.21, "eval_cer": 0.8817138834186412, "eval_loss": 0.00721912644803524, "eval_runtime": 107.9087, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.634, "step": 466000 }, { "epoch": 1.21, "learning_rate": 0.00011880522887337633, "loss": 0.0107, "step": 466010 }, { "epoch": 1.21, "learning_rate": 0.00011880134065700487, "loss": 0.0171, "step": 466020 }, { "epoch": 1.21, "learning_rate": 0.0001187974524406334, "loss": 0.0106, "step": 466030 }, { "epoch": 1.21, "learning_rate": 0.00011879356422426194, "loss": 0.0062, "step": 466040 }, { "epoch": 1.21, "learning_rate": 0.00011878967600789047, "loss": 0.0086, "step": 466050 }, { "epoch": 1.21, "learning_rate": 0.00011878578779151901, "loss": 0.0103, "step": 466060 }, { "epoch": 1.21, "learning_rate": 0.00011878189957514754, "loss": 0.0101, "step": 466070 }, { "epoch": 1.21, "learning_rate": 0.00011877801135877608, "loss": 0.0105, "step": 466080 }, { "epoch": 1.21, "learning_rate": 0.00011877412314240461, "loss": 0.0144, "step": 466090 }, { "epoch": 1.21, "learning_rate": 0.00011877023492603317, "loss": 0.0096, "step": 466100 }, { "epoch": 1.21, "learning_rate": 0.00011876634670966168, "loss": 0.0095, "step": 466110 }, { "epoch": 1.21, "learning_rate": 0.00011876245849329024, "loss": 0.0115, "step": 466120 }, { "epoch": 1.21, "learning_rate": 0.00011875857027691876, "loss": 0.013, "step": 466130 }, { "epoch": 1.21, "learning_rate": 0.0001187546820605473, "loss": 0.0096, "step": 466140 }, { "epoch": 1.21, "learning_rate": 0.00011875079384417583, "loss": 0.0121, "step": 466150 }, { "epoch": 1.21, "learning_rate": 0.00011874690562780437, "loss": 0.0097, "step": 466160 }, { "epoch": 1.21, "learning_rate": 0.0001187430174114329, "loss": 0.0137, "step": 466170 }, { "epoch": 1.21, "learning_rate": 0.00011873912919506144, "loss": 0.0094, "step": 466180 }, { "epoch": 1.21, "learning_rate": 0.00011873524097868997, "loss": 0.0112, "step": 466190 }, { "epoch": 1.21, "learning_rate": 0.0001187313527623185, "loss": 0.0105, "step": 466200 }, { "epoch": 1.21, "learning_rate": 0.00011872746454594704, "loss": 0.0143, "step": 466210 }, { "epoch": 1.21, "learning_rate": 0.00011872357632957557, "loss": 0.0118, "step": 466220 }, { "epoch": 1.21, "learning_rate": 0.00011871968811320411, "loss": 0.0069, "step": 466230 }, { "epoch": 1.21, "learning_rate": 0.00011871579989683264, "loss": 0.0102, "step": 466240 }, { "epoch": 1.21, "learning_rate": 0.00011871191168046118, "loss": 0.0134, "step": 466250 }, { "epoch": 1.21, "learning_rate": 0.00011870802346408971, "loss": 0.009, "step": 466260 }, { "epoch": 1.21, "learning_rate": 0.00011870413524771825, "loss": 0.0103, "step": 466270 }, { "epoch": 1.21, "learning_rate": 0.00011870024703134678, "loss": 0.0102, "step": 466280 }, { "epoch": 1.21, "learning_rate": 0.00011869635881497533, "loss": 0.0108, "step": 466290 }, { "epoch": 1.21, "learning_rate": 0.00011869247059860386, "loss": 0.0132, "step": 466300 }, { "epoch": 1.21, "learning_rate": 0.0001186885823822324, "loss": 0.0108, "step": 466310 }, { "epoch": 1.21, "learning_rate": 0.00011868469416586093, "loss": 0.0094, "step": 466320 }, { "epoch": 1.21, "learning_rate": 0.00011868080594948947, "loss": 0.0098, "step": 466330 }, { "epoch": 1.21, "learning_rate": 0.000118676917733118, "loss": 0.0099, "step": 466340 }, { "epoch": 1.21, "learning_rate": 0.00011867302951674654, "loss": 0.0118, "step": 466350 }, { "epoch": 1.21, "learning_rate": 0.00011866914130037507, "loss": 0.0111, "step": 466360 }, { "epoch": 1.21, "learning_rate": 0.00011866525308400361, "loss": 0.0084, "step": 466370 }, { "epoch": 1.21, "learning_rate": 0.00011866136486763214, "loss": 0.0106, "step": 466380 }, { "epoch": 1.21, "learning_rate": 0.00011865747665126068, "loss": 0.0112, "step": 466390 }, { "epoch": 1.21, "learning_rate": 0.00011865358843488921, "loss": 0.0081, "step": 466400 }, { "epoch": 1.21, "learning_rate": 0.00011864970021851775, "loss": 0.0131, "step": 466410 }, { "epoch": 1.21, "learning_rate": 0.00011864581200214628, "loss": 0.0123, "step": 466420 }, { "epoch": 1.21, "learning_rate": 0.00011864192378577482, "loss": 0.0127, "step": 466430 }, { "epoch": 1.21, "learning_rate": 0.00011863803556940335, "loss": 0.0134, "step": 466440 }, { "epoch": 1.21, "learning_rate": 0.00011863414735303188, "loss": 0.0119, "step": 466450 }, { "epoch": 1.21, "learning_rate": 0.00011863025913666042, "loss": 0.0153, "step": 466460 }, { "epoch": 1.21, "learning_rate": 0.00011862637092028895, "loss": 0.0097, "step": 466470 }, { "epoch": 1.21, "learning_rate": 0.0001186224827039175, "loss": 0.0093, "step": 466480 }, { "epoch": 1.21, "learning_rate": 0.00011861859448754603, "loss": 0.0117, "step": 466490 }, { "epoch": 1.21, "learning_rate": 0.00011861470627117457, "loss": 0.0118, "step": 466500 }, { "epoch": 1.21, "learning_rate": 0.0001186108180548031, "loss": 0.0165, "step": 466510 }, { "epoch": 1.21, "learning_rate": 0.00011860692983843164, "loss": 0.0087, "step": 466520 }, { "epoch": 1.21, "learning_rate": 0.00011860304162206017, "loss": 0.0105, "step": 466530 }, { "epoch": 1.21, "learning_rate": 0.00011859915340568871, "loss": 0.0117, "step": 466540 }, { "epoch": 1.21, "learning_rate": 0.00011859526518931724, "loss": 0.0093, "step": 466550 }, { "epoch": 1.21, "learning_rate": 0.00011859137697294578, "loss": 0.0124, "step": 466560 }, { "epoch": 1.21, "learning_rate": 0.00011858748875657431, "loss": 0.0142, "step": 466570 }, { "epoch": 1.21, "learning_rate": 0.00011858360054020285, "loss": 0.0142, "step": 466580 }, { "epoch": 1.21, "learning_rate": 0.00011857971232383138, "loss": 0.0118, "step": 466590 }, { "epoch": 1.21, "learning_rate": 0.00011857582410745992, "loss": 0.013, "step": 466600 }, { "epoch": 1.21, "learning_rate": 0.00011857193589108845, "loss": 0.0097, "step": 466610 }, { "epoch": 1.21, "learning_rate": 0.00011856804767471699, "loss": 0.0098, "step": 466620 }, { "epoch": 1.21, "learning_rate": 0.00011856415945834552, "loss": 0.0107, "step": 466630 }, { "epoch": 1.21, "learning_rate": 0.00011856027124197408, "loss": 0.0108, "step": 466640 }, { "epoch": 1.21, "learning_rate": 0.0001185563830256026, "loss": 0.0126, "step": 466650 }, { "epoch": 1.21, "learning_rate": 0.00011855249480923114, "loss": 0.0133, "step": 466660 }, { "epoch": 1.21, "learning_rate": 0.00011854860659285967, "loss": 0.011, "step": 466670 }, { "epoch": 1.21, "learning_rate": 0.00011854471837648821, "loss": 0.0081, "step": 466680 }, { "epoch": 1.21, "learning_rate": 0.00011854083016011674, "loss": 0.0101, "step": 466690 }, { "epoch": 1.21, "learning_rate": 0.00011853694194374527, "loss": 0.0103, "step": 466700 }, { "epoch": 1.21, "learning_rate": 0.00011853305372737381, "loss": 0.0097, "step": 466710 }, { "epoch": 1.21, "learning_rate": 0.00011852916551100234, "loss": 0.0096, "step": 466720 }, { "epoch": 1.21, "learning_rate": 0.00011852527729463088, "loss": 0.012, "step": 466730 }, { "epoch": 1.21, "learning_rate": 0.00011852138907825941, "loss": 0.0095, "step": 466740 }, { "epoch": 1.21, "learning_rate": 0.00011851750086188795, "loss": 0.0122, "step": 466750 }, { "epoch": 1.21, "learning_rate": 0.00011851361264551648, "loss": 0.0144, "step": 466760 }, { "epoch": 1.21, "learning_rate": 0.00011850972442914502, "loss": 0.0134, "step": 466770 }, { "epoch": 1.21, "learning_rate": 0.00011850583621277355, "loss": 0.0142, "step": 466780 }, { "epoch": 1.21, "learning_rate": 0.00011850194799640209, "loss": 0.0088, "step": 466790 }, { "epoch": 1.21, "learning_rate": 0.00011849805978003062, "loss": 0.0185, "step": 466800 }, { "epoch": 1.21, "learning_rate": 0.00011849417156365917, "loss": 0.0098, "step": 466810 }, { "epoch": 1.21, "learning_rate": 0.00011849028334728769, "loss": 0.0109, "step": 466820 }, { "epoch": 1.21, "learning_rate": 0.00011848639513091624, "loss": 0.0103, "step": 466830 }, { "epoch": 1.21, "learning_rate": 0.00011848250691454477, "loss": 0.0091, "step": 466840 }, { "epoch": 1.21, "learning_rate": 0.00011847861869817331, "loss": 0.0113, "step": 466850 }, { "epoch": 1.21, "learning_rate": 0.00011847473048180184, "loss": 0.0094, "step": 466860 }, { "epoch": 1.21, "learning_rate": 0.00011847084226543038, "loss": 0.01, "step": 466870 }, { "epoch": 1.21, "learning_rate": 0.00011846695404905891, "loss": 0.0112, "step": 466880 }, { "epoch": 1.21, "learning_rate": 0.00011846306583268745, "loss": 0.0103, "step": 466890 }, { "epoch": 1.21, "learning_rate": 0.00011845917761631598, "loss": 0.0135, "step": 466900 }, { "epoch": 1.21, "learning_rate": 0.00011845528939994452, "loss": 0.0086, "step": 466910 }, { "epoch": 1.21, "learning_rate": 0.00011845140118357305, "loss": 0.0077, "step": 466920 }, { "epoch": 1.21, "learning_rate": 0.00011844751296720159, "loss": 0.012, "step": 466930 }, { "epoch": 1.21, "learning_rate": 0.00011844362475083012, "loss": 0.0095, "step": 466940 }, { "epoch": 1.21, "learning_rate": 0.00011843973653445865, "loss": 0.0102, "step": 466950 }, { "epoch": 1.21, "learning_rate": 0.00011843584831808719, "loss": 0.0123, "step": 466960 }, { "epoch": 1.21, "learning_rate": 0.00011843196010171572, "loss": 0.0098, "step": 466970 }, { "epoch": 1.21, "learning_rate": 0.00011842807188534426, "loss": 0.0085, "step": 466980 }, { "epoch": 1.21, "learning_rate": 0.00011842418366897279, "loss": 0.011, "step": 466990 }, { "epoch": 1.21, "learning_rate": 0.00011842029545260134, "loss": 0.0113, "step": 467000 }, { "epoch": 1.21, "eval_cer": 0.8816648961259449, "eval_loss": 0.006742514204233885, "eval_runtime": 107.864, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 467000 }, { "epoch": 1.21, "learning_rate": 0.00011841640723622987, "loss": 0.0108, "step": 467010 }, { "epoch": 1.21, "learning_rate": 0.00011841251901985841, "loss": 0.0096, "step": 467020 }, { "epoch": 1.21, "learning_rate": 0.00011840863080348694, "loss": 0.009, "step": 467030 }, { "epoch": 1.21, "learning_rate": 0.00011840474258711548, "loss": 0.0076, "step": 467040 }, { "epoch": 1.21, "learning_rate": 0.00011840085437074401, "loss": 0.0111, "step": 467050 }, { "epoch": 1.21, "learning_rate": 0.00011839696615437255, "loss": 0.0119, "step": 467060 }, { "epoch": 1.21, "learning_rate": 0.00011839307793800108, "loss": 0.0098, "step": 467070 }, { "epoch": 1.21, "learning_rate": 0.00011838918972162962, "loss": 0.0166, "step": 467080 }, { "epoch": 1.21, "learning_rate": 0.00011838530150525815, "loss": 0.0122, "step": 467090 }, { "epoch": 1.21, "learning_rate": 0.00011838141328888669, "loss": 0.0095, "step": 467100 }, { "epoch": 1.21, "learning_rate": 0.00011837752507251522, "loss": 0.0101, "step": 467110 }, { "epoch": 1.21, "learning_rate": 0.00011837363685614376, "loss": 0.009, "step": 467120 }, { "epoch": 1.21, "learning_rate": 0.00011836974863977229, "loss": 0.0103, "step": 467130 }, { "epoch": 1.21, "learning_rate": 0.00011836586042340083, "loss": 0.0115, "step": 467140 }, { "epoch": 1.21, "learning_rate": 0.00011836197220702936, "loss": 0.0098, "step": 467150 }, { "epoch": 1.21, "learning_rate": 0.00011835808399065791, "loss": 0.0094, "step": 467160 }, { "epoch": 1.21, "learning_rate": 0.00011835419577428644, "loss": 0.0095, "step": 467170 }, { "epoch": 1.21, "learning_rate": 0.00011835030755791498, "loss": 0.0091, "step": 467180 }, { "epoch": 1.21, "learning_rate": 0.00011834641934154351, "loss": 0.0109, "step": 467190 }, { "epoch": 1.21, "learning_rate": 0.00011834253112517204, "loss": 0.0123, "step": 467200 }, { "epoch": 1.21, "learning_rate": 0.00011833864290880058, "loss": 0.01, "step": 467210 }, { "epoch": 1.21, "learning_rate": 0.00011833475469242911, "loss": 0.013, "step": 467220 }, { "epoch": 1.21, "learning_rate": 0.00011833086647605765, "loss": 0.0127, "step": 467230 }, { "epoch": 1.21, "learning_rate": 0.00011832697825968618, "loss": 0.0085, "step": 467240 }, { "epoch": 1.21, "learning_rate": 0.00011832309004331472, "loss": 0.0114, "step": 467250 }, { "epoch": 1.21, "learning_rate": 0.00011831920182694325, "loss": 0.0112, "step": 467260 }, { "epoch": 1.21, "learning_rate": 0.00011831531361057179, "loss": 0.0098, "step": 467270 }, { "epoch": 1.21, "learning_rate": 0.00011831142539420032, "loss": 0.0095, "step": 467280 }, { "epoch": 1.21, "learning_rate": 0.00011830753717782886, "loss": 0.0112, "step": 467290 }, { "epoch": 1.21, "learning_rate": 0.00011830364896145739, "loss": 0.0081, "step": 467300 }, { "epoch": 1.21, "learning_rate": 0.00011829976074508593, "loss": 0.0088, "step": 467310 }, { "epoch": 1.21, "learning_rate": 0.00011829587252871446, "loss": 0.0092, "step": 467320 }, { "epoch": 1.21, "learning_rate": 0.00011829198431234301, "loss": 0.007, "step": 467330 }, { "epoch": 1.21, "learning_rate": 0.00011828809609597153, "loss": 0.0106, "step": 467340 }, { "epoch": 1.21, "learning_rate": 0.00011828420787960008, "loss": 0.0099, "step": 467350 }, { "epoch": 1.21, "learning_rate": 0.00011828031966322861, "loss": 0.0085, "step": 467360 }, { "epoch": 1.21, "learning_rate": 0.00011827643144685715, "loss": 0.0124, "step": 467370 }, { "epoch": 1.21, "learning_rate": 0.00011827254323048568, "loss": 0.0089, "step": 467380 }, { "epoch": 1.21, "learning_rate": 0.00011826865501411422, "loss": 0.0112, "step": 467390 }, { "epoch": 1.21, "learning_rate": 0.00011826476679774275, "loss": 0.0086, "step": 467400 }, { "epoch": 1.21, "learning_rate": 0.0001182608785813713, "loss": 0.0113, "step": 467410 }, { "epoch": 1.21, "learning_rate": 0.00011825699036499982, "loss": 0.0112, "step": 467420 }, { "epoch": 1.21, "learning_rate": 0.00011825310214862836, "loss": 0.011, "step": 467430 }, { "epoch": 1.21, "learning_rate": 0.00011824921393225689, "loss": 0.01, "step": 467440 }, { "epoch": 1.21, "learning_rate": 0.00011824532571588542, "loss": 0.0102, "step": 467450 }, { "epoch": 1.21, "learning_rate": 0.00011824143749951396, "loss": 0.0083, "step": 467460 }, { "epoch": 1.21, "learning_rate": 0.00011823754928314249, "loss": 0.0122, "step": 467470 }, { "epoch": 1.21, "learning_rate": 0.00011823366106677103, "loss": 0.0091, "step": 467480 }, { "epoch": 1.21, "learning_rate": 0.00011822977285039956, "loss": 0.0101, "step": 467490 }, { "epoch": 1.21, "learning_rate": 0.0001182258846340281, "loss": 0.0106, "step": 467500 }, { "epoch": 1.21, "learning_rate": 0.00011822199641765663, "loss": 0.0119, "step": 467510 }, { "epoch": 1.21, "learning_rate": 0.00011821810820128518, "loss": 0.0098, "step": 467520 }, { "epoch": 1.21, "learning_rate": 0.00011821421998491371, "loss": 0.0147, "step": 467530 }, { "epoch": 1.21, "learning_rate": 0.00011821033176854225, "loss": 0.011, "step": 467540 }, { "epoch": 1.21, "learning_rate": 0.00011820644355217078, "loss": 0.0086, "step": 467550 }, { "epoch": 1.21, "learning_rate": 0.00011820255533579932, "loss": 0.01, "step": 467560 }, { "epoch": 1.21, "learning_rate": 0.00011819866711942785, "loss": 0.0103, "step": 467570 }, { "epoch": 1.21, "learning_rate": 0.00011819477890305639, "loss": 0.0098, "step": 467580 }, { "epoch": 1.21, "learning_rate": 0.00011819089068668492, "loss": 0.01, "step": 467590 }, { "epoch": 1.21, "learning_rate": 0.00011818700247031346, "loss": 0.0134, "step": 467600 }, { "epoch": 1.21, "learning_rate": 0.00011818311425394199, "loss": 0.0083, "step": 467610 }, { "epoch": 1.21, "learning_rate": 0.00011817922603757053, "loss": 0.0126, "step": 467620 }, { "epoch": 1.21, "learning_rate": 0.00011817533782119906, "loss": 0.0104, "step": 467630 }, { "epoch": 1.21, "learning_rate": 0.0001181714496048276, "loss": 0.0106, "step": 467640 }, { "epoch": 1.21, "learning_rate": 0.00011816756138845613, "loss": 0.0105, "step": 467650 }, { "epoch": 1.21, "learning_rate": 0.00011816367317208467, "loss": 0.0113, "step": 467660 }, { "epoch": 1.21, "learning_rate": 0.0001181597849557132, "loss": 0.0092, "step": 467670 }, { "epoch": 1.21, "learning_rate": 0.00011815589673934175, "loss": 0.0105, "step": 467680 }, { "epoch": 1.21, "learning_rate": 0.00011815200852297028, "loss": 0.0122, "step": 467690 }, { "epoch": 1.21, "learning_rate": 0.0001181481203065988, "loss": 0.0103, "step": 467700 }, { "epoch": 1.21, "learning_rate": 0.00011814423209022735, "loss": 0.0128, "step": 467710 }, { "epoch": 1.21, "learning_rate": 0.00011814034387385588, "loss": 0.0102, "step": 467720 }, { "epoch": 1.21, "learning_rate": 0.00011813645565748442, "loss": 0.0083, "step": 467730 }, { "epoch": 1.21, "learning_rate": 0.00011813256744111295, "loss": 0.0139, "step": 467740 }, { "epoch": 1.21, "learning_rate": 0.00011812867922474149, "loss": 0.0095, "step": 467750 }, { "epoch": 1.21, "learning_rate": 0.00011812479100837002, "loss": 0.0133, "step": 467760 }, { "epoch": 1.21, "learning_rate": 0.00011812090279199856, "loss": 0.0087, "step": 467770 }, { "epoch": 1.21, "learning_rate": 0.00011811701457562709, "loss": 0.0127, "step": 467780 }, { "epoch": 1.21, "learning_rate": 0.00011811312635925563, "loss": 0.0083, "step": 467790 }, { "epoch": 1.21, "learning_rate": 0.00011810923814288416, "loss": 0.0092, "step": 467800 }, { "epoch": 1.21, "learning_rate": 0.0001181053499265127, "loss": 0.0119, "step": 467810 }, { "epoch": 1.21, "learning_rate": 0.00011810146171014123, "loss": 0.0123, "step": 467820 }, { "epoch": 1.21, "learning_rate": 0.00011809757349376977, "loss": 0.0113, "step": 467830 }, { "epoch": 1.21, "learning_rate": 0.0001180936852773983, "loss": 0.0091, "step": 467840 }, { "epoch": 1.21, "learning_rate": 0.00011808979706102684, "loss": 0.0102, "step": 467850 }, { "epoch": 1.21, "learning_rate": 0.00011808590884465537, "loss": 0.0118, "step": 467860 }, { "epoch": 1.21, "learning_rate": 0.00011808202062828392, "loss": 0.0129, "step": 467870 }, { "epoch": 1.21, "learning_rate": 0.00011807813241191245, "loss": 0.0098, "step": 467880 }, { "epoch": 1.21, "learning_rate": 0.000118074244195541, "loss": 0.0142, "step": 467890 }, { "epoch": 1.21, "learning_rate": 0.00011807035597916952, "loss": 0.0114, "step": 467900 }, { "epoch": 1.21, "learning_rate": 0.00011806646776279806, "loss": 0.0111, "step": 467910 }, { "epoch": 1.21, "learning_rate": 0.00011806257954642659, "loss": 0.0123, "step": 467920 }, { "epoch": 1.21, "learning_rate": 0.00011805869133005512, "loss": 0.0092, "step": 467930 }, { "epoch": 1.21, "learning_rate": 0.00011805480311368366, "loss": 0.0102, "step": 467940 }, { "epoch": 1.21, "learning_rate": 0.00011805091489731219, "loss": 0.0092, "step": 467950 }, { "epoch": 1.21, "learning_rate": 0.00011804702668094073, "loss": 0.0113, "step": 467960 }, { "epoch": 1.21, "learning_rate": 0.00011804313846456926, "loss": 0.0096, "step": 467970 }, { "epoch": 1.21, "learning_rate": 0.0001180392502481978, "loss": 0.0105, "step": 467980 }, { "epoch": 1.21, "learning_rate": 0.00011803536203182633, "loss": 0.0112, "step": 467990 }, { "epoch": 1.21, "learning_rate": 0.00011803147381545487, "loss": 0.011, "step": 468000 }, { "epoch": 1.21, "eval_cer": 0.8817124837817071, "eval_loss": 0.007058866787701845, "eval_runtime": 107.9524, "eval_samples_per_second": 18.527, "eval_steps_per_second": 4.632, "step": 468000 }, { "epoch": 1.21, "learning_rate": 0.0001180275855990834, "loss": 0.0111, "step": 468010 }, { "epoch": 1.21, "learning_rate": 0.00011802369738271194, "loss": 0.0116, "step": 468020 }, { "epoch": 1.21, "learning_rate": 0.00011801980916634047, "loss": 0.0092, "step": 468030 }, { "epoch": 1.21, "learning_rate": 0.00011801592094996902, "loss": 0.011, "step": 468040 }, { "epoch": 1.21, "learning_rate": 0.00011801203273359754, "loss": 0.0099, "step": 468050 }, { "epoch": 1.21, "learning_rate": 0.00011800814451722609, "loss": 0.0128, "step": 468060 }, { "epoch": 1.21, "learning_rate": 0.00011800425630085462, "loss": 0.0122, "step": 468070 }, { "epoch": 1.21, "learning_rate": 0.00011800036808448316, "loss": 0.0081, "step": 468080 }, { "epoch": 1.21, "learning_rate": 0.00011799647986811169, "loss": 0.0117, "step": 468090 }, { "epoch": 1.21, "learning_rate": 0.00011799259165174023, "loss": 0.0127, "step": 468100 }, { "epoch": 1.21, "learning_rate": 0.00011798870343536876, "loss": 0.0081, "step": 468110 }, { "epoch": 1.21, "learning_rate": 0.0001179848152189973, "loss": 0.0106, "step": 468120 }, { "epoch": 1.21, "learning_rate": 0.00011798092700262583, "loss": 0.0107, "step": 468130 }, { "epoch": 1.21, "learning_rate": 0.00011797703878625437, "loss": 0.0095, "step": 468140 }, { "epoch": 1.21, "learning_rate": 0.0001179731505698829, "loss": 0.0124, "step": 468150 }, { "epoch": 1.21, "learning_rate": 0.00011796926235351144, "loss": 0.0134, "step": 468160 }, { "epoch": 1.21, "learning_rate": 0.00011796537413713997, "loss": 0.0105, "step": 468170 }, { "epoch": 1.21, "learning_rate": 0.0001179614859207685, "loss": 0.0083, "step": 468180 }, { "epoch": 1.21, "learning_rate": 0.00011795759770439704, "loss": 0.0121, "step": 468190 }, { "epoch": 1.21, "learning_rate": 0.00011795370948802557, "loss": 0.0091, "step": 468200 }, { "epoch": 1.21, "learning_rate": 0.00011794982127165411, "loss": 0.0116, "step": 468210 }, { "epoch": 1.21, "learning_rate": 0.00011794593305528264, "loss": 0.0126, "step": 468220 }, { "epoch": 1.21, "learning_rate": 0.00011794204483891119, "loss": 0.0128, "step": 468230 }, { "epoch": 1.21, "learning_rate": 0.00011793815662253972, "loss": 0.0098, "step": 468240 }, { "epoch": 1.21, "learning_rate": 0.00011793426840616826, "loss": 0.0112, "step": 468250 }, { "epoch": 1.21, "learning_rate": 0.00011793038018979679, "loss": 0.0128, "step": 468260 }, { "epoch": 1.21, "learning_rate": 0.00011792649197342533, "loss": 0.0133, "step": 468270 }, { "epoch": 1.21, "learning_rate": 0.00011792260375705386, "loss": 0.0095, "step": 468280 }, { "epoch": 1.21, "learning_rate": 0.0001179187155406824, "loss": 0.0112, "step": 468290 }, { "epoch": 1.21, "learning_rate": 0.00011791482732431093, "loss": 0.0115, "step": 468300 }, { "epoch": 1.21, "learning_rate": 0.00011791093910793947, "loss": 0.0093, "step": 468310 }, { "epoch": 1.21, "learning_rate": 0.000117907050891568, "loss": 0.0124, "step": 468320 }, { "epoch": 1.21, "learning_rate": 0.00011790316267519654, "loss": 0.0091, "step": 468330 }, { "epoch": 1.21, "learning_rate": 0.00011789927445882507, "loss": 0.0105, "step": 468340 }, { "epoch": 1.21, "learning_rate": 0.00011789538624245361, "loss": 0.0104, "step": 468350 }, { "epoch": 1.21, "learning_rate": 0.00011789149802608214, "loss": 0.0127, "step": 468360 }, { "epoch": 1.21, "learning_rate": 0.00011788760980971068, "loss": 0.0088, "step": 468370 }, { "epoch": 1.21, "learning_rate": 0.00011788372159333921, "loss": 0.0114, "step": 468380 }, { "epoch": 1.21, "learning_rate": 0.00011787983337696776, "loss": 0.0174, "step": 468390 }, { "epoch": 1.21, "learning_rate": 0.00011787594516059629, "loss": 0.0123, "step": 468400 }, { "epoch": 1.21, "learning_rate": 0.00011787205694422483, "loss": 0.0094, "step": 468410 }, { "epoch": 1.21, "learning_rate": 0.00011786816872785336, "loss": 0.0093, "step": 468420 }, { "epoch": 1.21, "learning_rate": 0.00011786428051148189, "loss": 0.0119, "step": 468430 }, { "epoch": 1.21, "learning_rate": 0.00011786039229511043, "loss": 0.0082, "step": 468440 }, { "epoch": 1.21, "learning_rate": 0.00011785650407873896, "loss": 0.0131, "step": 468450 }, { "epoch": 1.21, "learning_rate": 0.0001178526158623675, "loss": 0.0099, "step": 468460 }, { "epoch": 1.21, "learning_rate": 0.00011784872764599603, "loss": 0.0106, "step": 468470 }, { "epoch": 1.21, "learning_rate": 0.00011784483942962457, "loss": 0.0111, "step": 468480 }, { "epoch": 1.21, "learning_rate": 0.0001178409512132531, "loss": 0.0107, "step": 468490 }, { "epoch": 1.21, "learning_rate": 0.00011783706299688164, "loss": 0.0108, "step": 468500 }, { "epoch": 1.21, "learning_rate": 0.00011783317478051017, "loss": 0.0111, "step": 468510 }, { "epoch": 1.21, "learning_rate": 0.00011782928656413871, "loss": 0.0098, "step": 468520 }, { "epoch": 1.21, "learning_rate": 0.00011782539834776724, "loss": 0.0134, "step": 468530 }, { "epoch": 1.21, "learning_rate": 0.00011782151013139578, "loss": 0.0103, "step": 468540 }, { "epoch": 1.21, "learning_rate": 0.00011781762191502431, "loss": 0.011, "step": 468550 }, { "epoch": 1.21, "learning_rate": 0.00011781373369865286, "loss": 0.0095, "step": 468560 }, { "epoch": 1.21, "learning_rate": 0.00011780984548228138, "loss": 0.0121, "step": 468570 }, { "epoch": 1.21, "learning_rate": 0.00011780595726590993, "loss": 0.0094, "step": 468580 }, { "epoch": 1.21, "learning_rate": 0.00011780206904953846, "loss": 0.0075, "step": 468590 }, { "epoch": 1.21, "learning_rate": 0.000117798180833167, "loss": 0.0122, "step": 468600 }, { "epoch": 1.21, "learning_rate": 0.00011779429261679553, "loss": 0.0105, "step": 468610 }, { "epoch": 1.21, "learning_rate": 0.00011779040440042407, "loss": 0.0093, "step": 468620 }, { "epoch": 1.21, "learning_rate": 0.0001177865161840526, "loss": 0.0087, "step": 468630 }, { "epoch": 1.21, "learning_rate": 0.00011778262796768114, "loss": 0.0103, "step": 468640 }, { "epoch": 1.21, "learning_rate": 0.00011777873975130967, "loss": 0.0114, "step": 468650 }, { "epoch": 1.21, "learning_rate": 0.00011777485153493821, "loss": 0.0087, "step": 468660 }, { "epoch": 1.21, "learning_rate": 0.00011777096331856674, "loss": 0.0138, "step": 468670 }, { "epoch": 1.21, "learning_rate": 0.00011776707510219527, "loss": 0.0103, "step": 468680 }, { "epoch": 1.21, "learning_rate": 0.00011776318688582381, "loss": 0.0105, "step": 468690 }, { "epoch": 1.21, "learning_rate": 0.00011775929866945234, "loss": 0.0111, "step": 468700 }, { "epoch": 1.21, "learning_rate": 0.00011775541045308088, "loss": 0.0131, "step": 468710 }, { "epoch": 1.21, "learning_rate": 0.00011775152223670941, "loss": 0.0108, "step": 468720 }, { "epoch": 1.22, "learning_rate": 0.00011774763402033795, "loss": 0.0122, "step": 468730 }, { "epoch": 1.22, "learning_rate": 0.00011774374580396648, "loss": 0.0097, "step": 468740 }, { "epoch": 1.22, "learning_rate": 0.00011773985758759503, "loss": 0.01, "step": 468750 }, { "epoch": 1.22, "learning_rate": 0.00011773596937122356, "loss": 0.0103, "step": 468760 }, { "epoch": 1.22, "learning_rate": 0.0001177320811548521, "loss": 0.009, "step": 468770 }, { "epoch": 1.22, "learning_rate": 0.00011772819293848063, "loss": 0.0123, "step": 468780 }, { "epoch": 1.22, "learning_rate": 0.00011772430472210917, "loss": 0.0088, "step": 468790 }, { "epoch": 1.22, "learning_rate": 0.0001177204165057377, "loss": 0.0095, "step": 468800 }, { "epoch": 1.22, "learning_rate": 0.00011771652828936624, "loss": 0.0114, "step": 468810 }, { "epoch": 1.22, "learning_rate": 0.00011771264007299477, "loss": 0.0116, "step": 468820 }, { "epoch": 1.22, "learning_rate": 0.00011770875185662331, "loss": 0.0129, "step": 468830 }, { "epoch": 1.22, "learning_rate": 0.00011770486364025184, "loss": 0.0094, "step": 468840 }, { "epoch": 1.22, "learning_rate": 0.00011770097542388038, "loss": 0.0126, "step": 468850 }, { "epoch": 1.22, "learning_rate": 0.00011769708720750891, "loss": 0.0117, "step": 468860 }, { "epoch": 1.22, "learning_rate": 0.00011769319899113745, "loss": 0.01, "step": 468870 }, { "epoch": 1.22, "learning_rate": 0.00011768931077476598, "loss": 0.0105, "step": 468880 }, { "epoch": 1.22, "learning_rate": 0.00011768542255839452, "loss": 0.0122, "step": 468890 }, { "epoch": 1.22, "learning_rate": 0.00011768153434202305, "loss": 0.0093, "step": 468900 }, { "epoch": 1.22, "learning_rate": 0.0001176776461256516, "loss": 0.0092, "step": 468910 }, { "epoch": 1.22, "learning_rate": 0.00011767375790928013, "loss": 0.0167, "step": 468920 }, { "epoch": 1.22, "learning_rate": 0.00011766986969290865, "loss": 0.0117, "step": 468930 }, { "epoch": 1.22, "learning_rate": 0.0001176659814765372, "loss": 0.0121, "step": 468940 }, { "epoch": 1.22, "learning_rate": 0.00011766209326016573, "loss": 0.0102, "step": 468950 }, { "epoch": 1.22, "learning_rate": 0.00011765820504379427, "loss": 0.0098, "step": 468960 }, { "epoch": 1.22, "learning_rate": 0.0001176543168274228, "loss": 0.011, "step": 468970 }, { "epoch": 1.22, "learning_rate": 0.00011765042861105134, "loss": 0.0135, "step": 468980 }, { "epoch": 1.22, "learning_rate": 0.00011764654039467987, "loss": 0.0092, "step": 468990 }, { "epoch": 1.22, "learning_rate": 0.00011764265217830841, "loss": 0.01, "step": 469000 }, { "epoch": 1.22, "eval_cer": 0.881719481966378, "eval_loss": 0.007160056848078966, "eval_runtime": 107.8978, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 469000 }, { "epoch": 1.22, "learning_rate": 0.00011763876396193694, "loss": 0.0109, "step": 469010 }, { "epoch": 1.22, "learning_rate": 0.00011763487574556548, "loss": 0.0092, "step": 469020 }, { "epoch": 1.22, "learning_rate": 0.00011763098752919401, "loss": 0.0111, "step": 469030 }, { "epoch": 1.22, "learning_rate": 0.00011762709931282255, "loss": 0.0135, "step": 469040 }, { "epoch": 1.22, "learning_rate": 0.00011762321109645108, "loss": 0.0127, "step": 469050 }, { "epoch": 1.22, "learning_rate": 0.00011761932288007962, "loss": 0.0091, "step": 469060 }, { "epoch": 1.22, "learning_rate": 0.00011761543466370815, "loss": 0.0118, "step": 469070 }, { "epoch": 1.22, "learning_rate": 0.00011761154644733669, "loss": 0.0077, "step": 469080 }, { "epoch": 1.22, "learning_rate": 0.00011760765823096522, "loss": 0.0095, "step": 469090 }, { "epoch": 1.22, "learning_rate": 0.00011760377001459377, "loss": 0.0092, "step": 469100 }, { "epoch": 1.22, "learning_rate": 0.0001175998817982223, "loss": 0.0108, "step": 469110 }, { "epoch": 1.22, "learning_rate": 0.00011759599358185084, "loss": 0.0091, "step": 469120 }, { "epoch": 1.22, "learning_rate": 0.00011759210536547937, "loss": 0.008, "step": 469130 }, { "epoch": 1.22, "learning_rate": 0.00011758821714910791, "loss": 0.008, "step": 469140 }, { "epoch": 1.22, "learning_rate": 0.00011758432893273644, "loss": 0.0104, "step": 469150 }, { "epoch": 1.22, "learning_rate": 0.00011758044071636498, "loss": 0.0117, "step": 469160 }, { "epoch": 1.22, "learning_rate": 0.00011757655249999351, "loss": 0.0145, "step": 469170 }, { "epoch": 1.22, "learning_rate": 0.00011757266428362204, "loss": 0.0105, "step": 469180 }, { "epoch": 1.22, "learning_rate": 0.00011756877606725058, "loss": 0.0095, "step": 469190 }, { "epoch": 1.22, "learning_rate": 0.00011756488785087911, "loss": 0.0117, "step": 469200 }, { "epoch": 1.22, "learning_rate": 0.00011756099963450765, "loss": 0.0122, "step": 469210 }, { "epoch": 1.22, "learning_rate": 0.00011755711141813618, "loss": 0.0143, "step": 469220 }, { "epoch": 1.22, "learning_rate": 0.00011755322320176472, "loss": 0.013, "step": 469230 }, { "epoch": 1.22, "learning_rate": 0.00011754933498539325, "loss": 0.0131, "step": 469240 }, { "epoch": 1.22, "learning_rate": 0.00011754544676902179, "loss": 0.0086, "step": 469250 }, { "epoch": 1.22, "learning_rate": 0.00011754155855265032, "loss": 0.0117, "step": 469260 }, { "epoch": 1.22, "learning_rate": 0.00011753767033627887, "loss": 0.0138, "step": 469270 }, { "epoch": 1.22, "learning_rate": 0.00011753378211990739, "loss": 0.0101, "step": 469280 }, { "epoch": 1.22, "learning_rate": 0.00011752989390353594, "loss": 0.0096, "step": 469290 }, { "epoch": 1.22, "learning_rate": 0.00011752600568716447, "loss": 0.0099, "step": 469300 }, { "epoch": 1.22, "learning_rate": 0.00011752211747079301, "loss": 0.0137, "step": 469310 }, { "epoch": 1.22, "learning_rate": 0.00011751822925442154, "loss": 0.0106, "step": 469320 }, { "epoch": 1.22, "learning_rate": 0.00011751434103805008, "loss": 0.0116, "step": 469330 }, { "epoch": 1.22, "learning_rate": 0.00011751045282167861, "loss": 0.0154, "step": 469340 }, { "epoch": 1.22, "learning_rate": 0.00011750656460530715, "loss": 0.0102, "step": 469350 }, { "epoch": 1.22, "learning_rate": 0.00011750267638893568, "loss": 0.0097, "step": 469360 }, { "epoch": 1.22, "learning_rate": 0.00011749878817256422, "loss": 0.0119, "step": 469370 }, { "epoch": 1.22, "learning_rate": 0.00011749489995619275, "loss": 0.0109, "step": 469380 }, { "epoch": 1.22, "learning_rate": 0.00011749101173982129, "loss": 0.0121, "step": 469390 }, { "epoch": 1.22, "learning_rate": 0.00011748712352344982, "loss": 0.0084, "step": 469400 }, { "epoch": 1.22, "learning_rate": 0.00011748323530707836, "loss": 0.0068, "step": 469410 }, { "epoch": 1.22, "learning_rate": 0.00011747934709070689, "loss": 0.0131, "step": 469420 }, { "epoch": 1.22, "learning_rate": 0.00011747545887433542, "loss": 0.0152, "step": 469430 }, { "epoch": 1.22, "learning_rate": 0.00011747157065796396, "loss": 0.0099, "step": 469440 }, { "epoch": 1.22, "learning_rate": 0.00011746768244159249, "loss": 0.0086, "step": 469450 }, { "epoch": 1.22, "learning_rate": 0.00011746379422522104, "loss": 0.0091, "step": 469460 }, { "epoch": 1.22, "learning_rate": 0.00011745990600884957, "loss": 0.0118, "step": 469470 }, { "epoch": 1.22, "learning_rate": 0.00011745601779247811, "loss": 0.0092, "step": 469480 }, { "epoch": 1.22, "learning_rate": 0.00011745212957610664, "loss": 0.0082, "step": 469490 }, { "epoch": 1.22, "learning_rate": 0.00011744824135973518, "loss": 0.013, "step": 469500 }, { "epoch": 1.22, "learning_rate": 0.00011744435314336371, "loss": 0.0094, "step": 469510 }, { "epoch": 1.22, "learning_rate": 0.00011744046492699225, "loss": 0.0088, "step": 469520 }, { "epoch": 1.22, "learning_rate": 0.00011743657671062078, "loss": 0.0125, "step": 469530 }, { "epoch": 1.22, "learning_rate": 0.00011743268849424932, "loss": 0.0123, "step": 469540 }, { "epoch": 1.22, "learning_rate": 0.00011742880027787785, "loss": 0.0109, "step": 469550 }, { "epoch": 1.22, "learning_rate": 0.00011742491206150639, "loss": 0.008, "step": 469560 }, { "epoch": 1.22, "learning_rate": 0.00011742102384513492, "loss": 0.0116, "step": 469570 }, { "epoch": 1.22, "learning_rate": 0.00011741713562876346, "loss": 0.0093, "step": 469580 }, { "epoch": 1.22, "learning_rate": 0.00011741324741239199, "loss": 0.0147, "step": 469590 }, { "epoch": 1.22, "learning_rate": 0.00011740935919602053, "loss": 0.011, "step": 469600 }, { "epoch": 1.22, "learning_rate": 0.00011740547097964906, "loss": 0.0138, "step": 469610 }, { "epoch": 1.22, "learning_rate": 0.00011740158276327761, "loss": 0.0101, "step": 469620 }, { "epoch": 1.22, "learning_rate": 0.00011739769454690614, "loss": 0.0145, "step": 469630 }, { "epoch": 1.22, "learning_rate": 0.00011739380633053468, "loss": 0.0096, "step": 469640 }, { "epoch": 1.22, "learning_rate": 0.00011738991811416321, "loss": 0.0081, "step": 469650 }, { "epoch": 1.22, "learning_rate": 0.00011738602989779175, "loss": 0.0139, "step": 469660 }, { "epoch": 1.22, "learning_rate": 0.00011738214168142028, "loss": 0.0104, "step": 469670 }, { "epoch": 1.22, "learning_rate": 0.00011737825346504881, "loss": 0.0123, "step": 469680 }, { "epoch": 1.22, "learning_rate": 0.00011737436524867735, "loss": 0.0115, "step": 469690 }, { "epoch": 1.22, "learning_rate": 0.00011737047703230588, "loss": 0.0094, "step": 469700 }, { "epoch": 1.22, "learning_rate": 0.00011736658881593442, "loss": 0.0143, "step": 469710 }, { "epoch": 1.22, "learning_rate": 0.00011736270059956295, "loss": 0.0086, "step": 469720 }, { "epoch": 1.22, "learning_rate": 0.00011735881238319149, "loss": 0.0102, "step": 469730 }, { "epoch": 1.22, "learning_rate": 0.00011735492416682002, "loss": 0.0082, "step": 469740 }, { "epoch": 1.22, "learning_rate": 0.00011735103595044856, "loss": 0.0103, "step": 469750 }, { "epoch": 1.22, "learning_rate": 0.00011734714773407709, "loss": 0.0125, "step": 469760 }, { "epoch": 1.22, "learning_rate": 0.00011734325951770563, "loss": 0.0143, "step": 469770 }, { "epoch": 1.22, "learning_rate": 0.00011733937130133416, "loss": 0.01, "step": 469780 }, { "epoch": 1.22, "learning_rate": 0.00011733548308496271, "loss": 0.0128, "step": 469790 }, { "epoch": 1.22, "learning_rate": 0.00011733159486859123, "loss": 0.0118, "step": 469800 }, { "epoch": 1.22, "learning_rate": 0.00011732770665221978, "loss": 0.0115, "step": 469810 }, { "epoch": 1.22, "learning_rate": 0.00011732381843584831, "loss": 0.0114, "step": 469820 }, { "epoch": 1.22, "learning_rate": 0.00011731993021947685, "loss": 0.0102, "step": 469830 }, { "epoch": 1.22, "learning_rate": 0.00011731604200310538, "loss": 0.0122, "step": 469840 }, { "epoch": 1.22, "learning_rate": 0.00011731215378673392, "loss": 0.0135, "step": 469850 }, { "epoch": 1.22, "learning_rate": 0.00011730826557036245, "loss": 0.0102, "step": 469860 }, { "epoch": 1.22, "learning_rate": 0.00011730437735399099, "loss": 0.0118, "step": 469870 }, { "epoch": 1.22, "learning_rate": 0.00011730048913761952, "loss": 0.0117, "step": 469880 }, { "epoch": 1.22, "learning_rate": 0.00011729660092124806, "loss": 0.0098, "step": 469890 }, { "epoch": 1.22, "learning_rate": 0.00011729271270487659, "loss": 0.0102, "step": 469900 }, { "epoch": 1.22, "learning_rate": 0.00011728882448850513, "loss": 0.0114, "step": 469910 }, { "epoch": 1.22, "learning_rate": 0.00011728493627213366, "loss": 0.0088, "step": 469920 }, { "epoch": 1.22, "learning_rate": 0.00011728104805576219, "loss": 0.0114, "step": 469930 }, { "epoch": 1.22, "learning_rate": 0.00011727715983939073, "loss": 0.0157, "step": 469940 }, { "epoch": 1.22, "learning_rate": 0.00011727327162301926, "loss": 0.0126, "step": 469950 }, { "epoch": 1.22, "learning_rate": 0.0001172693834066478, "loss": 0.0141, "step": 469960 }, { "epoch": 1.22, "learning_rate": 0.00011726549519027633, "loss": 0.0138, "step": 469970 }, { "epoch": 1.22, "learning_rate": 0.00011726160697390488, "loss": 0.011, "step": 469980 }, { "epoch": 1.22, "learning_rate": 0.00011725771875753341, "loss": 0.0093, "step": 469990 }, { "epoch": 1.22, "learning_rate": 0.00011725383054116195, "loss": 0.0104, "step": 470000 }, { "epoch": 1.22, "eval_cer": 0.8816942885015627, "eval_loss": 0.007257182616740465, "eval_runtime": 107.971, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 470000 }, { "epoch": 1.22, "learning_rate": 0.00011724994232479048, "loss": 0.0113, "step": 470010 }, { "epoch": 1.22, "learning_rate": 0.00011724605410841902, "loss": 0.0108, "step": 470020 }, { "epoch": 1.22, "learning_rate": 0.00011724216589204755, "loss": 0.0117, "step": 470030 }, { "epoch": 1.22, "learning_rate": 0.00011723827767567609, "loss": 0.0102, "step": 470040 }, { "epoch": 1.22, "learning_rate": 0.00011723438945930462, "loss": 0.0101, "step": 470050 }, { "epoch": 1.22, "learning_rate": 0.00011723050124293316, "loss": 0.0085, "step": 470060 }, { "epoch": 1.22, "learning_rate": 0.00011722661302656169, "loss": 0.0097, "step": 470070 }, { "epoch": 1.22, "learning_rate": 0.00011722272481019023, "loss": 0.0091, "step": 470080 }, { "epoch": 1.22, "learning_rate": 0.00011721883659381876, "loss": 0.0101, "step": 470090 }, { "epoch": 1.22, "learning_rate": 0.0001172149483774473, "loss": 0.01, "step": 470100 }, { "epoch": 1.22, "learning_rate": 0.00011721106016107583, "loss": 0.0114, "step": 470110 }, { "epoch": 1.22, "learning_rate": 0.00011720717194470437, "loss": 0.0123, "step": 470120 }, { "epoch": 1.22, "learning_rate": 0.0001172032837283329, "loss": 0.0109, "step": 470130 }, { "epoch": 1.22, "learning_rate": 0.00011719939551196145, "loss": 0.0113, "step": 470140 }, { "epoch": 1.22, "learning_rate": 0.00011719550729558998, "loss": 0.0117, "step": 470150 }, { "epoch": 1.22, "learning_rate": 0.00011719161907921852, "loss": 0.0087, "step": 470160 }, { "epoch": 1.22, "learning_rate": 0.00011718773086284705, "loss": 0.0133, "step": 470170 }, { "epoch": 1.22, "learning_rate": 0.00011718384264647558, "loss": 0.0117, "step": 470180 }, { "epoch": 1.22, "learning_rate": 0.00011717995443010412, "loss": 0.0124, "step": 470190 }, { "epoch": 1.22, "learning_rate": 0.00011717606621373265, "loss": 0.014, "step": 470200 }, { "epoch": 1.22, "learning_rate": 0.00011717217799736119, "loss": 0.0111, "step": 470210 }, { "epoch": 1.22, "learning_rate": 0.00011716828978098972, "loss": 0.0115, "step": 470220 }, { "epoch": 1.22, "learning_rate": 0.00011716440156461826, "loss": 0.0103, "step": 470230 }, { "epoch": 1.22, "learning_rate": 0.00011716051334824679, "loss": 0.0118, "step": 470240 }, { "epoch": 1.22, "learning_rate": 0.00011715662513187533, "loss": 0.0134, "step": 470250 }, { "epoch": 1.22, "learning_rate": 0.00011715273691550386, "loss": 0.008, "step": 470260 }, { "epoch": 1.22, "learning_rate": 0.0001171488486991324, "loss": 0.0116, "step": 470270 }, { "epoch": 1.22, "learning_rate": 0.00011714496048276093, "loss": 0.0129, "step": 470280 }, { "epoch": 1.22, "learning_rate": 0.00011714107226638947, "loss": 0.0128, "step": 470290 }, { "epoch": 1.22, "learning_rate": 0.000117137184050018, "loss": 0.0095, "step": 470300 }, { "epoch": 1.22, "learning_rate": 0.00011713329583364655, "loss": 0.0102, "step": 470310 }, { "epoch": 1.22, "learning_rate": 0.00011712940761727507, "loss": 0.0107, "step": 470320 }, { "epoch": 1.22, "learning_rate": 0.00011712551940090362, "loss": 0.0098, "step": 470330 }, { "epoch": 1.22, "learning_rate": 0.00011712163118453215, "loss": 0.0075, "step": 470340 }, { "epoch": 1.22, "learning_rate": 0.00011711774296816069, "loss": 0.0107, "step": 470350 }, { "epoch": 1.22, "learning_rate": 0.00011711385475178922, "loss": 0.0111, "step": 470360 }, { "epoch": 1.22, "learning_rate": 0.00011710996653541776, "loss": 0.0105, "step": 470370 }, { "epoch": 1.22, "learning_rate": 0.00011710607831904629, "loss": 0.0099, "step": 470380 }, { "epoch": 1.22, "learning_rate": 0.00011710219010267483, "loss": 0.0095, "step": 470390 }, { "epoch": 1.22, "learning_rate": 0.00011709830188630336, "loss": 0.0102, "step": 470400 }, { "epoch": 1.22, "learning_rate": 0.0001170944136699319, "loss": 0.0093, "step": 470410 }, { "epoch": 1.22, "learning_rate": 0.00011709052545356043, "loss": 0.0088, "step": 470420 }, { "epoch": 1.22, "learning_rate": 0.00011708663723718896, "loss": 0.0155, "step": 470430 }, { "epoch": 1.22, "learning_rate": 0.0001170827490208175, "loss": 0.0159, "step": 470440 }, { "epoch": 1.22, "learning_rate": 0.00011707886080444603, "loss": 0.0127, "step": 470450 }, { "epoch": 1.22, "learning_rate": 0.00011707497258807457, "loss": 0.0105, "step": 470460 }, { "epoch": 1.22, "learning_rate": 0.0001170710843717031, "loss": 0.0112, "step": 470470 }, { "epoch": 1.22, "learning_rate": 0.00011706719615533164, "loss": 0.0121, "step": 470480 }, { "epoch": 1.22, "learning_rate": 0.00011706330793896017, "loss": 0.0153, "step": 470490 }, { "epoch": 1.22, "learning_rate": 0.00011705941972258872, "loss": 0.0085, "step": 470500 }, { "epoch": 1.22, "learning_rate": 0.00011705553150621725, "loss": 0.0112, "step": 470510 }, { "epoch": 1.22, "learning_rate": 0.00011705164328984579, "loss": 0.0106, "step": 470520 }, { "epoch": 1.22, "learning_rate": 0.00011704775507347432, "loss": 0.009, "step": 470530 }, { "epoch": 1.22, "learning_rate": 0.00011704386685710286, "loss": 0.016, "step": 470540 }, { "epoch": 1.22, "learning_rate": 0.00011703997864073139, "loss": 0.0089, "step": 470550 }, { "epoch": 1.22, "learning_rate": 0.00011703609042435993, "loss": 0.0131, "step": 470560 }, { "epoch": 1.22, "learning_rate": 0.00011703220220798846, "loss": 0.0095, "step": 470570 }, { "epoch": 1.22, "learning_rate": 0.000117028313991617, "loss": 0.0096, "step": 470580 }, { "epoch": 1.22, "learning_rate": 0.00011702442577524553, "loss": 0.0103, "step": 470590 }, { "epoch": 1.22, "learning_rate": 0.00011702053755887407, "loss": 0.0138, "step": 470600 }, { "epoch": 1.22, "learning_rate": 0.0001170166493425026, "loss": 0.0098, "step": 470610 }, { "epoch": 1.22, "learning_rate": 0.00011701276112613114, "loss": 0.0094, "step": 470620 }, { "epoch": 1.22, "learning_rate": 0.00011700887290975967, "loss": 0.0092, "step": 470630 }, { "epoch": 1.22, "learning_rate": 0.00011700498469338821, "loss": 0.0097, "step": 470640 }, { "epoch": 1.22, "learning_rate": 0.00011700109647701674, "loss": 0.0122, "step": 470650 }, { "epoch": 1.22, "learning_rate": 0.00011699720826064527, "loss": 0.01, "step": 470660 }, { "epoch": 1.22, "learning_rate": 0.00011699332004427381, "loss": 0.0102, "step": 470670 }, { "epoch": 1.22, "learning_rate": 0.00011698943182790234, "loss": 0.0121, "step": 470680 }, { "epoch": 1.22, "learning_rate": 0.00011698554361153089, "loss": 0.0107, "step": 470690 }, { "epoch": 1.22, "learning_rate": 0.00011698165539515942, "loss": 0.0117, "step": 470700 }, { "epoch": 1.22, "learning_rate": 0.00011697776717878796, "loss": 0.0084, "step": 470710 }, { "epoch": 1.22, "learning_rate": 0.00011697387896241649, "loss": 0.0145, "step": 470720 }, { "epoch": 1.22, "learning_rate": 0.00011696999074604503, "loss": 0.012, "step": 470730 }, { "epoch": 1.22, "learning_rate": 0.00011696610252967356, "loss": 0.0094, "step": 470740 }, { "epoch": 1.22, "learning_rate": 0.0001169622143133021, "loss": 0.0116, "step": 470750 }, { "epoch": 1.22, "learning_rate": 0.00011695832609693063, "loss": 0.0093, "step": 470760 }, { "epoch": 1.22, "learning_rate": 0.00011695443788055917, "loss": 0.0104, "step": 470770 }, { "epoch": 1.22, "learning_rate": 0.0001169505496641877, "loss": 0.0139, "step": 470780 }, { "epoch": 1.22, "learning_rate": 0.00011694666144781624, "loss": 0.0139, "step": 470790 }, { "epoch": 1.22, "learning_rate": 0.00011694277323144477, "loss": 0.0106, "step": 470800 }, { "epoch": 1.22, "learning_rate": 0.00011693888501507331, "loss": 0.0099, "step": 470810 }, { "epoch": 1.22, "learning_rate": 0.00011693499679870184, "loss": 0.0102, "step": 470820 }, { "epoch": 1.22, "learning_rate": 0.00011693110858233038, "loss": 0.0093, "step": 470830 }, { "epoch": 1.22, "learning_rate": 0.0001169272203659589, "loss": 0.0102, "step": 470840 }, { "epoch": 1.22, "learning_rate": 0.00011692333214958746, "loss": 0.01, "step": 470850 }, { "epoch": 1.22, "learning_rate": 0.00011691944393321599, "loss": 0.0122, "step": 470860 }, { "epoch": 1.22, "learning_rate": 0.00011691555571684453, "loss": 0.0106, "step": 470870 }, { "epoch": 1.22, "learning_rate": 0.00011691166750047306, "loss": 0.0096, "step": 470880 }, { "epoch": 1.22, "learning_rate": 0.0001169077792841016, "loss": 0.0113, "step": 470890 }, { "epoch": 1.22, "learning_rate": 0.00011690389106773013, "loss": 0.0125, "step": 470900 }, { "epoch": 1.22, "learning_rate": 0.00011690000285135866, "loss": 0.011, "step": 470910 }, { "epoch": 1.22, "learning_rate": 0.0001168961146349872, "loss": 0.0096, "step": 470920 }, { "epoch": 1.22, "learning_rate": 0.00011689222641861573, "loss": 0.0113, "step": 470930 }, { "epoch": 1.22, "learning_rate": 0.00011688833820224427, "loss": 0.0124, "step": 470940 }, { "epoch": 1.22, "learning_rate": 0.0001168844499858728, "loss": 0.0082, "step": 470950 }, { "epoch": 1.22, "learning_rate": 0.00011688056176950134, "loss": 0.0073, "step": 470960 }, { "epoch": 1.22, "learning_rate": 0.00011687667355312987, "loss": 0.0117, "step": 470970 }, { "epoch": 1.22, "learning_rate": 0.00011687278533675841, "loss": 0.0121, "step": 470980 }, { "epoch": 1.22, "learning_rate": 0.00011686889712038694, "loss": 0.0088, "step": 470990 }, { "epoch": 1.22, "learning_rate": 0.00011686500890401548, "loss": 0.0131, "step": 471000 }, { "epoch": 1.22, "eval_cer": 0.8816844910430235, "eval_loss": 0.007188483607023954, "eval_runtime": 107.8616, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.636, "step": 471000 }, { "epoch": 1.22, "learning_rate": 0.000116861120687644, "loss": 0.0163, "step": 471010 }, { "epoch": 1.22, "learning_rate": 0.00011685723247127256, "loss": 0.0105, "step": 471020 }, { "epoch": 1.22, "learning_rate": 0.00011685334425490108, "loss": 0.0102, "step": 471030 }, { "epoch": 1.22, "learning_rate": 0.00011684945603852963, "loss": 0.008, "step": 471040 }, { "epoch": 1.22, "learning_rate": 0.00011684556782215816, "loss": 0.0135, "step": 471050 }, { "epoch": 1.22, "learning_rate": 0.0001168416796057867, "loss": 0.0144, "step": 471060 }, { "epoch": 1.22, "learning_rate": 0.00011683779138941523, "loss": 0.0104, "step": 471070 }, { "epoch": 1.22, "learning_rate": 0.00011683390317304377, "loss": 0.0133, "step": 471080 }, { "epoch": 1.22, "learning_rate": 0.0001168300149566723, "loss": 0.0118, "step": 471090 }, { "epoch": 1.22, "learning_rate": 0.00011682612674030084, "loss": 0.009, "step": 471100 }, { "epoch": 1.22, "learning_rate": 0.00011682223852392937, "loss": 0.0094, "step": 471110 }, { "epoch": 1.22, "learning_rate": 0.00011681835030755791, "loss": 0.0104, "step": 471120 }, { "epoch": 1.22, "learning_rate": 0.00011681446209118644, "loss": 0.0109, "step": 471130 }, { "epoch": 1.22, "learning_rate": 0.00011681057387481498, "loss": 0.0118, "step": 471140 }, { "epoch": 1.22, "learning_rate": 0.00011680668565844351, "loss": 0.0102, "step": 471150 }, { "epoch": 1.22, "learning_rate": 0.00011680279744207204, "loss": 0.0119, "step": 471160 }, { "epoch": 1.22, "learning_rate": 0.00011679890922570058, "loss": 0.0116, "step": 471170 }, { "epoch": 1.22, "learning_rate": 0.0001167950210093291, "loss": 0.0065, "step": 471180 }, { "epoch": 1.22, "learning_rate": 0.00011679113279295765, "loss": 0.0106, "step": 471190 }, { "epoch": 1.22, "learning_rate": 0.00011678724457658618, "loss": 0.0131, "step": 471200 }, { "epoch": 1.22, "learning_rate": 0.00011678335636021473, "loss": 0.0098, "step": 471210 }, { "epoch": 1.22, "learning_rate": 0.00011677946814384326, "loss": 0.0146, "step": 471220 }, { "epoch": 1.22, "learning_rate": 0.0001167755799274718, "loss": 0.0099, "step": 471230 }, { "epoch": 1.22, "learning_rate": 0.00011677169171110033, "loss": 0.0098, "step": 471240 }, { "epoch": 1.22, "learning_rate": 0.00011676780349472887, "loss": 0.011, "step": 471250 }, { "epoch": 1.22, "learning_rate": 0.0001167639152783574, "loss": 0.0087, "step": 471260 }, { "epoch": 1.22, "learning_rate": 0.00011676002706198594, "loss": 0.0115, "step": 471270 }, { "epoch": 1.22, "learning_rate": 0.00011675613884561447, "loss": 0.008, "step": 471280 }, { "epoch": 1.22, "learning_rate": 0.00011675225062924301, "loss": 0.0109, "step": 471290 }, { "epoch": 1.22, "learning_rate": 0.00011674836241287154, "loss": 0.007, "step": 471300 }, { "epoch": 1.22, "learning_rate": 0.00011674447419650008, "loss": 0.0102, "step": 471310 }, { "epoch": 1.22, "learning_rate": 0.00011674058598012861, "loss": 0.0103, "step": 471320 }, { "epoch": 1.22, "learning_rate": 0.00011673669776375715, "loss": 0.0093, "step": 471330 }, { "epoch": 1.22, "learning_rate": 0.00011673280954738568, "loss": 0.0138, "step": 471340 }, { "epoch": 1.22, "learning_rate": 0.00011672892133101422, "loss": 0.0085, "step": 471350 }, { "epoch": 1.22, "learning_rate": 0.00011672503311464275, "loss": 0.0087, "step": 471360 }, { "epoch": 1.22, "learning_rate": 0.0001167211448982713, "loss": 0.0082, "step": 471370 }, { "epoch": 1.22, "learning_rate": 0.00011671725668189983, "loss": 0.0121, "step": 471380 }, { "epoch": 1.22, "learning_rate": 0.00011671336846552837, "loss": 0.0089, "step": 471390 }, { "epoch": 1.22, "learning_rate": 0.0001167094802491569, "loss": 0.011, "step": 471400 }, { "epoch": 1.22, "learning_rate": 0.00011670559203278543, "loss": 0.0112, "step": 471410 }, { "epoch": 1.22, "learning_rate": 0.00011670170381641397, "loss": 0.0121, "step": 471420 }, { "epoch": 1.22, "learning_rate": 0.0001166978156000425, "loss": 0.0129, "step": 471430 }, { "epoch": 1.22, "learning_rate": 0.00011669392738367104, "loss": 0.0092, "step": 471440 }, { "epoch": 1.22, "learning_rate": 0.00011669003916729957, "loss": 0.0152, "step": 471450 }, { "epoch": 1.22, "learning_rate": 0.00011668615095092811, "loss": 0.0086, "step": 471460 }, { "epoch": 1.22, "learning_rate": 0.00011668226273455664, "loss": 0.011, "step": 471470 }, { "epoch": 1.22, "learning_rate": 0.00011667837451818518, "loss": 0.014, "step": 471480 }, { "epoch": 1.22, "learning_rate": 0.0001166744863018137, "loss": 0.0086, "step": 471490 }, { "epoch": 1.22, "learning_rate": 0.00011667059808544225, "loss": 0.0098, "step": 471500 }, { "epoch": 1.22, "learning_rate": 0.00011666670986907078, "loss": 0.0107, "step": 471510 }, { "epoch": 1.22, "learning_rate": 0.00011666282165269932, "loss": 0.0123, "step": 471520 }, { "epoch": 1.22, "learning_rate": 0.00011665893343632785, "loss": 0.0103, "step": 471530 }, { "epoch": 1.22, "learning_rate": 0.0001166550452199564, "loss": 0.01, "step": 471540 }, { "epoch": 1.22, "learning_rate": 0.00011665115700358492, "loss": 0.0106, "step": 471550 }, { "epoch": 1.22, "learning_rate": 0.00011664726878721347, "loss": 0.0091, "step": 471560 }, { "epoch": 1.22, "learning_rate": 0.000116643380570842, "loss": 0.013, "step": 471570 }, { "epoch": 1.22, "learning_rate": 0.00011663949235447054, "loss": 0.015, "step": 471580 }, { "epoch": 1.22, "learning_rate": 0.00011663560413809907, "loss": 0.0076, "step": 471590 }, { "epoch": 1.22, "learning_rate": 0.00011663171592172761, "loss": 0.0092, "step": 471600 }, { "epoch": 1.22, "learning_rate": 0.00011662782770535614, "loss": 0.0129, "step": 471610 }, { "epoch": 1.22, "learning_rate": 0.00011662393948898468, "loss": 0.0096, "step": 471620 }, { "epoch": 1.22, "learning_rate": 0.00011662005127261321, "loss": 0.0089, "step": 471630 }, { "epoch": 1.22, "learning_rate": 0.00011661616305624175, "loss": 0.009, "step": 471640 }, { "epoch": 1.22, "learning_rate": 0.00011661227483987028, "loss": 0.0104, "step": 471650 }, { "epoch": 1.22, "learning_rate": 0.0001166083866234988, "loss": 0.0093, "step": 471660 }, { "epoch": 1.22, "learning_rate": 0.00011660449840712735, "loss": 0.0079, "step": 471670 }, { "epoch": 1.22, "learning_rate": 0.00011660061019075588, "loss": 0.0132, "step": 471680 }, { "epoch": 1.22, "learning_rate": 0.00011659672197438442, "loss": 0.014, "step": 471690 }, { "epoch": 1.22, "learning_rate": 0.00011659283375801295, "loss": 0.0104, "step": 471700 }, { "epoch": 1.22, "learning_rate": 0.00011658894554164149, "loss": 0.0107, "step": 471710 }, { "epoch": 1.22, "learning_rate": 0.00011658505732527002, "loss": 0.0097, "step": 471720 }, { "epoch": 1.22, "learning_rate": 0.00011658116910889857, "loss": 0.0096, "step": 471730 }, { "epoch": 1.22, "learning_rate": 0.0001165772808925271, "loss": 0.0134, "step": 471740 }, { "epoch": 1.22, "learning_rate": 0.00011657339267615564, "loss": 0.0121, "step": 471750 }, { "epoch": 1.22, "learning_rate": 0.00011656950445978417, "loss": 0.0101, "step": 471760 }, { "epoch": 1.22, "learning_rate": 0.00011656561624341271, "loss": 0.0105, "step": 471770 }, { "epoch": 1.22, "learning_rate": 0.00011656172802704124, "loss": 0.0124, "step": 471780 }, { "epoch": 1.22, "learning_rate": 0.00011655783981066978, "loss": 0.0125, "step": 471790 }, { "epoch": 1.22, "learning_rate": 0.00011655395159429831, "loss": 0.0082, "step": 471800 }, { "epoch": 1.22, "learning_rate": 0.00011655006337792685, "loss": 0.0115, "step": 471810 }, { "epoch": 1.22, "learning_rate": 0.00011654617516155538, "loss": 0.0134, "step": 471820 }, { "epoch": 1.22, "learning_rate": 0.00011654228694518392, "loss": 0.0094, "step": 471830 }, { "epoch": 1.22, "learning_rate": 0.00011653839872881245, "loss": 0.009, "step": 471840 }, { "epoch": 1.22, "learning_rate": 0.00011653451051244099, "loss": 0.0125, "step": 471850 }, { "epoch": 1.22, "learning_rate": 0.00011653062229606952, "loss": 0.0095, "step": 471860 }, { "epoch": 1.22, "learning_rate": 0.00011652673407969806, "loss": 0.0119, "step": 471870 }, { "epoch": 1.22, "learning_rate": 0.00011652284586332659, "loss": 0.0106, "step": 471880 }, { "epoch": 1.22, "learning_rate": 0.00011651895764695514, "loss": 0.01, "step": 471890 }, { "epoch": 1.22, "learning_rate": 0.00011651506943058367, "loss": 0.0109, "step": 471900 }, { "epoch": 1.22, "learning_rate": 0.00011651118121421218, "loss": 0.0118, "step": 471910 }, { "epoch": 1.22, "learning_rate": 0.00011650729299784074, "loss": 0.007, "step": 471920 }, { "epoch": 1.22, "learning_rate": 0.00011650340478146927, "loss": 0.0105, "step": 471930 }, { "epoch": 1.22, "learning_rate": 0.00011649951656509781, "loss": 0.0083, "step": 471940 }, { "epoch": 1.22, "learning_rate": 0.00011649562834872634, "loss": 0.0106, "step": 471950 }, { "epoch": 1.22, "learning_rate": 0.00011649174013235488, "loss": 0.011, "step": 471960 }, { "epoch": 1.22, "learning_rate": 0.00011648785191598341, "loss": 0.0095, "step": 471970 }, { "epoch": 1.22, "learning_rate": 0.00011648396369961195, "loss": 0.0096, "step": 471980 }, { "epoch": 1.22, "learning_rate": 0.00011648007548324048, "loss": 0.0129, "step": 471990 }, { "epoch": 1.22, "learning_rate": 0.00011647618726686902, "loss": 0.0108, "step": 472000 }, { "epoch": 1.22, "eval_cer": 0.8817012866862336, "eval_loss": 0.007290003355592489, "eval_runtime": 108.0416, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 472000 }, { "epoch": 1.22, "learning_rate": 0.00011647229905049755, "loss": 0.0118, "step": 472010 }, { "epoch": 1.22, "learning_rate": 0.00011646841083412609, "loss": 0.0106, "step": 472020 }, { "epoch": 1.22, "learning_rate": 0.00011646452261775462, "loss": 0.0121, "step": 472030 }, { "epoch": 1.22, "learning_rate": 0.00011646063440138316, "loss": 0.011, "step": 472040 }, { "epoch": 1.22, "learning_rate": 0.00011645674618501169, "loss": 0.012, "step": 472050 }, { "epoch": 1.22, "learning_rate": 0.00011645285796864023, "loss": 0.0146, "step": 472060 }, { "epoch": 1.22, "learning_rate": 0.00011644896975226876, "loss": 0.0111, "step": 472070 }, { "epoch": 1.22, "learning_rate": 0.00011644508153589731, "loss": 0.0118, "step": 472080 }, { "epoch": 1.22, "learning_rate": 0.00011644119331952584, "loss": 0.0142, "step": 472090 }, { "epoch": 1.22, "learning_rate": 0.00011643730510315438, "loss": 0.0111, "step": 472100 }, { "epoch": 1.22, "learning_rate": 0.00011643341688678291, "loss": 0.0095, "step": 472110 }, { "epoch": 1.22, "learning_rate": 0.00011642952867041145, "loss": 0.0083, "step": 472120 }, { "epoch": 1.22, "learning_rate": 0.00011642564045403998, "loss": 0.0081, "step": 472130 }, { "epoch": 1.22, "learning_rate": 0.00011642175223766852, "loss": 0.0076, "step": 472140 }, { "epoch": 1.22, "learning_rate": 0.00011641786402129705, "loss": 0.0111, "step": 472150 }, { "epoch": 1.22, "learning_rate": 0.00011641397580492558, "loss": 0.0105, "step": 472160 }, { "epoch": 1.22, "learning_rate": 0.00011641008758855412, "loss": 0.0092, "step": 472170 }, { "epoch": 1.22, "learning_rate": 0.00011640619937218265, "loss": 0.0163, "step": 472180 }, { "epoch": 1.22, "learning_rate": 0.00011640231115581119, "loss": 0.0099, "step": 472190 }, { "epoch": 1.22, "learning_rate": 0.00011639842293943972, "loss": 0.0103, "step": 472200 }, { "epoch": 1.22, "learning_rate": 0.00011639453472306826, "loss": 0.0085, "step": 472210 }, { "epoch": 1.22, "learning_rate": 0.00011639064650669679, "loss": 0.0092, "step": 472220 }, { "epoch": 1.22, "learning_rate": 0.00011638675829032533, "loss": 0.0109, "step": 472230 }, { "epoch": 1.22, "learning_rate": 0.00011638287007395386, "loss": 0.0086, "step": 472240 }, { "epoch": 1.22, "learning_rate": 0.00011637898185758241, "loss": 0.0108, "step": 472250 }, { "epoch": 1.22, "learning_rate": 0.00011637509364121092, "loss": 0.0104, "step": 472260 }, { "epoch": 1.22, "learning_rate": 0.00011637120542483948, "loss": 0.0083, "step": 472270 }, { "epoch": 1.22, "learning_rate": 0.00011636731720846801, "loss": 0.0093, "step": 472280 }, { "epoch": 1.22, "learning_rate": 0.00011636342899209655, "loss": 0.0113, "step": 472290 }, { "epoch": 1.22, "learning_rate": 0.00011635954077572508, "loss": 0.0061, "step": 472300 }, { "epoch": 1.22, "learning_rate": 0.00011635565255935362, "loss": 0.011, "step": 472310 }, { "epoch": 1.22, "learning_rate": 0.00011635176434298215, "loss": 0.0099, "step": 472320 }, { "epoch": 1.22, "learning_rate": 0.00011634787612661069, "loss": 0.012, "step": 472330 }, { "epoch": 1.22, "learning_rate": 0.00011634398791023922, "loss": 0.009, "step": 472340 }, { "epoch": 1.22, "learning_rate": 0.00011634009969386776, "loss": 0.0075, "step": 472350 }, { "epoch": 1.22, "learning_rate": 0.00011633621147749629, "loss": 0.0117, "step": 472360 }, { "epoch": 1.22, "learning_rate": 0.00011633232326112483, "loss": 0.0147, "step": 472370 }, { "epoch": 1.22, "learning_rate": 0.00011632843504475336, "loss": 0.0099, "step": 472380 }, { "epoch": 1.22, "learning_rate": 0.0001163245468283819, "loss": 0.0107, "step": 472390 }, { "epoch": 1.22, "learning_rate": 0.00011632065861201043, "loss": 0.0115, "step": 472400 }, { "epoch": 1.22, "learning_rate": 0.00011631677039563895, "loss": 0.0101, "step": 472410 }, { "epoch": 1.22, "learning_rate": 0.0001163128821792675, "loss": 0.0107, "step": 472420 }, { "epoch": 1.22, "learning_rate": 0.00011630899396289602, "loss": 0.0137, "step": 472430 }, { "epoch": 1.22, "learning_rate": 0.00011630510574652458, "loss": 0.0089, "step": 472440 }, { "epoch": 1.22, "learning_rate": 0.00011630121753015311, "loss": 0.0112, "step": 472450 }, { "epoch": 1.22, "learning_rate": 0.00011629732931378165, "loss": 0.0127, "step": 472460 }, { "epoch": 1.22, "learning_rate": 0.00011629344109741018, "loss": 0.012, "step": 472470 }, { "epoch": 1.22, "learning_rate": 0.00011628955288103872, "loss": 0.0101, "step": 472480 }, { "epoch": 1.22, "learning_rate": 0.00011628566466466725, "loss": 0.0116, "step": 472490 }, { "epoch": 1.22, "learning_rate": 0.00011628177644829579, "loss": 0.0102, "step": 472500 }, { "epoch": 1.22, "learning_rate": 0.00011627788823192432, "loss": 0.0094, "step": 472510 }, { "epoch": 1.22, "learning_rate": 0.00011627400001555286, "loss": 0.0098, "step": 472520 }, { "epoch": 1.22, "learning_rate": 0.00011627011179918139, "loss": 0.0099, "step": 472530 }, { "epoch": 1.22, "learning_rate": 0.00011626622358280993, "loss": 0.012, "step": 472540 }, { "epoch": 1.22, "learning_rate": 0.00011626233536643846, "loss": 0.0102, "step": 472550 }, { "epoch": 1.22, "learning_rate": 0.000116258447150067, "loss": 0.0109, "step": 472560 }, { "epoch": 1.22, "learning_rate": 0.00011625455893369553, "loss": 0.0086, "step": 472570 }, { "epoch": 1.22, "learning_rate": 0.00011625067071732407, "loss": 0.0086, "step": 472580 }, { "epoch": 1.23, "learning_rate": 0.0001162467825009526, "loss": 0.0132, "step": 472590 }, { "epoch": 1.23, "learning_rate": 0.00011624289428458115, "loss": 0.0092, "step": 472600 }, { "epoch": 1.23, "learning_rate": 0.00011623900606820968, "loss": 0.0114, "step": 472610 }, { "epoch": 1.23, "learning_rate": 0.00011623511785183822, "loss": 0.0078, "step": 472620 }, { "epoch": 1.23, "learning_rate": 0.00011623122963546675, "loss": 0.0095, "step": 472630 }, { "epoch": 1.23, "learning_rate": 0.00011622734141909529, "loss": 0.01, "step": 472640 }, { "epoch": 1.23, "learning_rate": 0.00011622345320272382, "loss": 0.0094, "step": 472650 }, { "epoch": 1.23, "learning_rate": 0.00011621956498635235, "loss": 0.0118, "step": 472660 }, { "epoch": 1.23, "learning_rate": 0.00011621567676998089, "loss": 0.009, "step": 472670 }, { "epoch": 1.23, "learning_rate": 0.00011621178855360942, "loss": 0.009, "step": 472680 }, { "epoch": 1.23, "learning_rate": 0.00011620790033723796, "loss": 0.0107, "step": 472690 }, { "epoch": 1.23, "learning_rate": 0.00011620401212086649, "loss": 0.0089, "step": 472700 }, { "epoch": 1.23, "learning_rate": 0.00011620012390449503, "loss": 0.0097, "step": 472710 }, { "epoch": 1.23, "learning_rate": 0.00011619623568812356, "loss": 0.0091, "step": 472720 }, { "epoch": 1.23, "learning_rate": 0.0001161923474717521, "loss": 0.0121, "step": 472730 }, { "epoch": 1.23, "learning_rate": 0.00011618845925538063, "loss": 0.0141, "step": 472740 }, { "epoch": 1.23, "learning_rate": 0.00011618457103900917, "loss": 0.0146, "step": 472750 }, { "epoch": 1.23, "learning_rate": 0.0001161806828226377, "loss": 0.0104, "step": 472760 }, { "epoch": 1.23, "learning_rate": 0.00011617679460626625, "loss": 0.0102, "step": 472770 }, { "epoch": 1.23, "learning_rate": 0.00011617290638989476, "loss": 0.0114, "step": 472780 }, { "epoch": 1.23, "learning_rate": 0.00011616901817352332, "loss": 0.0102, "step": 472790 }, { "epoch": 1.23, "learning_rate": 0.00011616512995715185, "loss": 0.0081, "step": 472800 }, { "epoch": 1.23, "learning_rate": 0.00011616124174078039, "loss": 0.0094, "step": 472810 }, { "epoch": 1.23, "learning_rate": 0.00011615735352440892, "loss": 0.0127, "step": 472820 }, { "epoch": 1.23, "learning_rate": 0.00011615346530803746, "loss": 0.0087, "step": 472830 }, { "epoch": 1.23, "learning_rate": 0.00011614957709166599, "loss": 0.0083, "step": 472840 }, { "epoch": 1.23, "learning_rate": 0.00011614568887529453, "loss": 0.0114, "step": 472850 }, { "epoch": 1.23, "learning_rate": 0.00011614180065892306, "loss": 0.0104, "step": 472860 }, { "epoch": 1.23, "learning_rate": 0.0001161379124425516, "loss": 0.0096, "step": 472870 }, { "epoch": 1.23, "learning_rate": 0.00011613402422618013, "loss": 0.0097, "step": 472880 }, { "epoch": 1.23, "learning_rate": 0.00011613013600980867, "loss": 0.011, "step": 472890 }, { "epoch": 1.23, "learning_rate": 0.0001161262477934372, "loss": 0.01, "step": 472900 }, { "epoch": 1.23, "learning_rate": 0.00011612235957706572, "loss": 0.0102, "step": 472910 }, { "epoch": 1.23, "learning_rate": 0.00011611847136069427, "loss": 0.008, "step": 472920 }, { "epoch": 1.23, "learning_rate": 0.0001161145831443228, "loss": 0.0114, "step": 472930 }, { "epoch": 1.23, "learning_rate": 0.00011611069492795134, "loss": 0.01, "step": 472940 }, { "epoch": 1.23, "learning_rate": 0.00011610680671157986, "loss": 0.0101, "step": 472950 }, { "epoch": 1.23, "learning_rate": 0.00011610291849520842, "loss": 0.0109, "step": 472960 }, { "epoch": 1.23, "learning_rate": 0.00011609903027883695, "loss": 0.0114, "step": 472970 }, { "epoch": 1.23, "learning_rate": 0.00011609514206246549, "loss": 0.0085, "step": 472980 }, { "epoch": 1.23, "learning_rate": 0.00011609125384609402, "loss": 0.0132, "step": 472990 }, { "epoch": 1.23, "learning_rate": 0.00011608736562972256, "loss": 0.0106, "step": 473000 }, { "epoch": 1.23, "eval_cer": 0.8816858906799576, "eval_loss": 0.0070616379380226135, "eval_runtime": 108.0667, "eval_samples_per_second": 18.507, "eval_steps_per_second": 4.627, "step": 473000 }, { "epoch": 1.23, "learning_rate": 0.00011608347741335109, "loss": 0.0117, "step": 473010 }, { "epoch": 1.23, "learning_rate": 0.00011607958919697963, "loss": 0.0147, "step": 473020 }, { "epoch": 1.23, "learning_rate": 0.00011607570098060816, "loss": 0.0096, "step": 473030 }, { "epoch": 1.23, "learning_rate": 0.0001160718127642367, "loss": 0.0139, "step": 473040 }, { "epoch": 1.23, "learning_rate": 0.00011606792454786523, "loss": 0.0106, "step": 473050 }, { "epoch": 1.23, "learning_rate": 0.00011606403633149377, "loss": 0.0097, "step": 473060 }, { "epoch": 1.23, "learning_rate": 0.0001160601481151223, "loss": 0.0086, "step": 473070 }, { "epoch": 1.23, "learning_rate": 0.00011605625989875084, "loss": 0.0143, "step": 473080 }, { "epoch": 1.23, "learning_rate": 0.00011605237168237937, "loss": 0.0095, "step": 473090 }, { "epoch": 1.23, "learning_rate": 0.00011604848346600791, "loss": 0.0099, "step": 473100 }, { "epoch": 1.23, "learning_rate": 0.00011604459524963644, "loss": 0.011, "step": 473110 }, { "epoch": 1.23, "learning_rate": 0.00011604070703326499, "loss": 0.0092, "step": 473120 }, { "epoch": 1.23, "learning_rate": 0.00011603681881689352, "loss": 0.0095, "step": 473130 }, { "epoch": 1.23, "learning_rate": 0.00011603293060052203, "loss": 0.0106, "step": 473140 }, { "epoch": 1.23, "learning_rate": 0.00011602904238415059, "loss": 0.01, "step": 473150 }, { "epoch": 1.23, "learning_rate": 0.00011602515416777912, "loss": 0.0101, "step": 473160 }, { "epoch": 1.23, "learning_rate": 0.00011602126595140766, "loss": 0.0098, "step": 473170 }, { "epoch": 1.23, "learning_rate": 0.00011601737773503619, "loss": 0.0099, "step": 473180 }, { "epoch": 1.23, "learning_rate": 0.00011601348951866473, "loss": 0.0102, "step": 473190 }, { "epoch": 1.23, "learning_rate": 0.00011600960130229326, "loss": 0.0097, "step": 473200 }, { "epoch": 1.23, "learning_rate": 0.0001160057130859218, "loss": 0.0098, "step": 473210 }, { "epoch": 1.23, "learning_rate": 0.00011600182486955033, "loss": 0.0097, "step": 473220 }, { "epoch": 1.23, "learning_rate": 0.00011599793665317887, "loss": 0.0095, "step": 473230 }, { "epoch": 1.23, "learning_rate": 0.0001159940484368074, "loss": 0.0129, "step": 473240 }, { "epoch": 1.23, "learning_rate": 0.00011599016022043594, "loss": 0.0122, "step": 473250 }, { "epoch": 1.23, "learning_rate": 0.00011598627200406447, "loss": 0.0108, "step": 473260 }, { "epoch": 1.23, "learning_rate": 0.000115982383787693, "loss": 0.0131, "step": 473270 }, { "epoch": 1.23, "learning_rate": 0.00011597849557132153, "loss": 0.0121, "step": 473280 }, { "epoch": 1.23, "learning_rate": 0.00011597460735495008, "loss": 0.011, "step": 473290 }, { "epoch": 1.23, "learning_rate": 0.0001159707191385786, "loss": 0.0137, "step": 473300 }, { "epoch": 1.23, "learning_rate": 0.00011596683092220716, "loss": 0.0117, "step": 473310 }, { "epoch": 1.23, "learning_rate": 0.00011596294270583569, "loss": 0.009, "step": 473320 }, { "epoch": 1.23, "learning_rate": 0.00011595905448946423, "loss": 0.008, "step": 473330 }, { "epoch": 1.23, "learning_rate": 0.00011595516627309276, "loss": 0.0303, "step": 473340 }, { "epoch": 1.23, "learning_rate": 0.0001159512780567213, "loss": 0.0126, "step": 473350 }, { "epoch": 1.23, "learning_rate": 0.00011594738984034983, "loss": 0.0102, "step": 473360 }, { "epoch": 1.23, "learning_rate": 0.00011594350162397837, "loss": 0.0107, "step": 473370 }, { "epoch": 1.23, "learning_rate": 0.0001159396134076069, "loss": 0.0081, "step": 473380 }, { "epoch": 1.23, "learning_rate": 0.00011593572519123543, "loss": 0.0107, "step": 473390 }, { "epoch": 1.23, "learning_rate": 0.00011593183697486397, "loss": 0.0087, "step": 473400 }, { "epoch": 1.23, "learning_rate": 0.0001159279487584925, "loss": 0.0082, "step": 473410 }, { "epoch": 1.23, "learning_rate": 0.00011592406054212104, "loss": 0.0106, "step": 473420 }, { "epoch": 1.23, "learning_rate": 0.00011592017232574956, "loss": 0.0091, "step": 473430 }, { "epoch": 1.23, "learning_rate": 0.0001159162841093781, "loss": 0.0083, "step": 473440 }, { "epoch": 1.23, "learning_rate": 0.00011591239589300663, "loss": 0.0126, "step": 473450 }, { "epoch": 1.23, "learning_rate": 0.00011590850767663518, "loss": 0.0106, "step": 473460 }, { "epoch": 1.23, "learning_rate": 0.0001159046194602637, "loss": 0.0069, "step": 473470 }, { "epoch": 1.23, "learning_rate": 0.00011590073124389226, "loss": 0.0116, "step": 473480 }, { "epoch": 1.23, "learning_rate": 0.00011589684302752077, "loss": 0.012, "step": 473490 }, { "epoch": 1.23, "learning_rate": 0.00011589295481114933, "loss": 0.0114, "step": 473500 }, { "epoch": 1.23, "learning_rate": 0.00011588906659477786, "loss": 0.0128, "step": 473510 }, { "epoch": 1.23, "learning_rate": 0.0001158851783784064, "loss": 0.0103, "step": 473520 }, { "epoch": 1.23, "learning_rate": 0.00011588129016203493, "loss": 0.0118, "step": 473530 }, { "epoch": 1.23, "learning_rate": 0.00011587740194566347, "loss": 0.0109, "step": 473540 }, { "epoch": 1.23, "learning_rate": 0.000115873513729292, "loss": 0.0093, "step": 473550 }, { "epoch": 1.23, "learning_rate": 0.00011586962551292054, "loss": 0.0131, "step": 473560 }, { "epoch": 1.23, "learning_rate": 0.00011586573729654907, "loss": 0.0129, "step": 473570 }, { "epoch": 1.23, "learning_rate": 0.00011586184908017761, "loss": 0.0074, "step": 473580 }, { "epoch": 1.23, "learning_rate": 0.00011585796086380614, "loss": 0.008, "step": 473590 }, { "epoch": 1.23, "learning_rate": 0.00011585407264743468, "loss": 0.0114, "step": 473600 }, { "epoch": 1.23, "learning_rate": 0.0001158501844310632, "loss": 0.0106, "step": 473610 }, { "epoch": 1.23, "learning_rate": 0.00011584629621469175, "loss": 0.0108, "step": 473620 }, { "epoch": 1.23, "learning_rate": 0.00011584240799832028, "loss": 0.0098, "step": 473630 }, { "epoch": 1.23, "learning_rate": 0.0001158385197819488, "loss": 0.0075, "step": 473640 }, { "epoch": 1.23, "learning_rate": 0.00011583463156557735, "loss": 0.0081, "step": 473650 }, { "epoch": 1.23, "learning_rate": 0.00011583074334920587, "loss": 0.0127, "step": 473660 }, { "epoch": 1.23, "learning_rate": 0.00011582685513283443, "loss": 0.01, "step": 473670 }, { "epoch": 1.23, "learning_rate": 0.00011582296691646296, "loss": 0.0093, "step": 473680 }, { "epoch": 1.23, "learning_rate": 0.0001158190787000915, "loss": 0.011, "step": 473690 }, { "epoch": 1.23, "learning_rate": 0.00011581519048372003, "loss": 0.0124, "step": 473700 }, { "epoch": 1.23, "learning_rate": 0.00011581130226734857, "loss": 0.0126, "step": 473710 }, { "epoch": 1.23, "learning_rate": 0.0001158074140509771, "loss": 0.0095, "step": 473720 }, { "epoch": 1.23, "learning_rate": 0.00011580352583460564, "loss": 0.0108, "step": 473730 }, { "epoch": 1.23, "learning_rate": 0.00011579963761823417, "loss": 0.0099, "step": 473740 }, { "epoch": 1.23, "learning_rate": 0.00011579574940186271, "loss": 0.0108, "step": 473750 }, { "epoch": 1.23, "learning_rate": 0.00011579186118549124, "loss": 0.0118, "step": 473760 }, { "epoch": 1.23, "learning_rate": 0.00011578797296911978, "loss": 0.0112, "step": 473770 }, { "epoch": 1.23, "learning_rate": 0.0001157840847527483, "loss": 0.0118, "step": 473780 }, { "epoch": 1.23, "learning_rate": 0.00011578019653637685, "loss": 0.0106, "step": 473790 }, { "epoch": 1.23, "learning_rate": 0.00011577630832000537, "loss": 0.0141, "step": 473800 }, { "epoch": 1.23, "learning_rate": 0.00011577242010363392, "loss": 0.0141, "step": 473810 }, { "epoch": 1.23, "learning_rate": 0.00011576853188726244, "loss": 0.0116, "step": 473820 }, { "epoch": 1.23, "learning_rate": 0.000115764643670891, "loss": 0.0095, "step": 473830 }, { "epoch": 1.23, "learning_rate": 0.00011576075545451953, "loss": 0.0099, "step": 473840 }, { "epoch": 1.23, "learning_rate": 0.00011575686723814807, "loss": 0.0089, "step": 473850 }, { "epoch": 1.23, "learning_rate": 0.0001157529790217766, "loss": 0.0133, "step": 473860 }, { "epoch": 1.23, "learning_rate": 0.00011574909080540514, "loss": 0.0088, "step": 473870 }, { "epoch": 1.23, "learning_rate": 0.00011574520258903367, "loss": 0.0131, "step": 473880 }, { "epoch": 1.23, "learning_rate": 0.0001157413143726622, "loss": 0.0132, "step": 473890 }, { "epoch": 1.23, "learning_rate": 0.00011573742615629074, "loss": 0.0099, "step": 473900 }, { "epoch": 1.23, "learning_rate": 0.00011573353793991926, "loss": 0.0108, "step": 473910 }, { "epoch": 1.23, "learning_rate": 0.0001157296497235478, "loss": 0.0103, "step": 473920 }, { "epoch": 1.23, "learning_rate": 0.00011572576150717633, "loss": 0.0101, "step": 473930 }, { "epoch": 1.23, "learning_rate": 0.00011572187329080488, "loss": 0.0101, "step": 473940 }, { "epoch": 1.23, "learning_rate": 0.0001157179850744334, "loss": 0.0117, "step": 473950 }, { "epoch": 1.23, "learning_rate": 0.00011571409685806195, "loss": 0.0123, "step": 473960 }, { "epoch": 1.23, "learning_rate": 0.00011571020864169047, "loss": 0.0114, "step": 473970 }, { "epoch": 1.23, "learning_rate": 0.00011570632042531902, "loss": 0.0123, "step": 473980 }, { "epoch": 1.23, "learning_rate": 0.00011570243220894754, "loss": 0.0127, "step": 473990 }, { "epoch": 1.23, "learning_rate": 0.0001156985439925761, "loss": 0.0116, "step": 474000 }, { "epoch": 1.23, "eval_cer": 0.8816844910430235, "eval_loss": 0.007081829011440277, "eval_runtime": 107.9934, "eval_samples_per_second": 18.52, "eval_steps_per_second": 4.63, "step": 474000 }, { "epoch": 1.23, "learning_rate": 0.00011569465577620461, "loss": 0.0095, "step": 474010 }, { "epoch": 1.23, "learning_rate": 0.00011569076755983317, "loss": 0.0094, "step": 474020 }, { "epoch": 1.23, "learning_rate": 0.0001156868793434617, "loss": 0.0109, "step": 474030 }, { "epoch": 1.23, "learning_rate": 0.00011568299112709024, "loss": 0.0108, "step": 474040 }, { "epoch": 1.23, "learning_rate": 0.00011567910291071877, "loss": 0.0091, "step": 474050 }, { "epoch": 1.23, "learning_rate": 0.00011567521469434731, "loss": 0.0075, "step": 474060 }, { "epoch": 1.23, "learning_rate": 0.00011567132647797584, "loss": 0.0091, "step": 474070 }, { "epoch": 1.23, "learning_rate": 0.00011566743826160438, "loss": 0.0106, "step": 474080 }, { "epoch": 1.23, "learning_rate": 0.0001156635500452329, "loss": 0.0118, "step": 474090 }, { "epoch": 1.23, "learning_rate": 0.00011565966182886145, "loss": 0.0143, "step": 474100 }, { "epoch": 1.23, "learning_rate": 0.00011565577361248998, "loss": 0.0089, "step": 474110 }, { "epoch": 1.23, "learning_rate": 0.00011565188539611852, "loss": 0.0117, "step": 474120 }, { "epoch": 1.23, "learning_rate": 0.00011564799717974705, "loss": 0.0122, "step": 474130 }, { "epoch": 1.23, "learning_rate": 0.00011564410896337557, "loss": 0.0117, "step": 474140 }, { "epoch": 1.23, "learning_rate": 0.00011564022074700412, "loss": 0.0109, "step": 474150 }, { "epoch": 1.23, "learning_rate": 0.00011563633253063264, "loss": 0.0132, "step": 474160 }, { "epoch": 1.23, "learning_rate": 0.00011563244431426118, "loss": 0.0118, "step": 474170 }, { "epoch": 1.23, "learning_rate": 0.00011562855609788971, "loss": 0.0095, "step": 474180 }, { "epoch": 1.23, "learning_rate": 0.00011562466788151827, "loss": 0.0138, "step": 474190 }, { "epoch": 1.23, "learning_rate": 0.0001156207796651468, "loss": 0.0153, "step": 474200 }, { "epoch": 1.23, "learning_rate": 0.00011561689144877534, "loss": 0.0141, "step": 474210 }, { "epoch": 1.23, "learning_rate": 0.00011561300323240387, "loss": 0.0108, "step": 474220 }, { "epoch": 1.23, "learning_rate": 0.00011560911501603241, "loss": 0.0085, "step": 474230 }, { "epoch": 1.23, "learning_rate": 0.00011560522679966094, "loss": 0.0122, "step": 474240 }, { "epoch": 1.23, "learning_rate": 0.00011560133858328948, "loss": 0.0091, "step": 474250 }, { "epoch": 1.23, "learning_rate": 0.000115597450366918, "loss": 0.008, "step": 474260 }, { "epoch": 1.23, "learning_rate": 0.00011559356215054655, "loss": 0.0108, "step": 474270 }, { "epoch": 1.23, "learning_rate": 0.00011558967393417508, "loss": 0.01, "step": 474280 }, { "epoch": 1.23, "learning_rate": 0.00011558578571780362, "loss": 0.0077, "step": 474290 }, { "epoch": 1.23, "learning_rate": 0.00011558189750143214, "loss": 0.0114, "step": 474300 }, { "epoch": 1.23, "learning_rate": 0.00011557800928506069, "loss": 0.0099, "step": 474310 }, { "epoch": 1.23, "learning_rate": 0.00011557412106868921, "loss": 0.0098, "step": 474320 }, { "epoch": 1.23, "learning_rate": 0.00011557023285231776, "loss": 0.0099, "step": 474330 }, { "epoch": 1.23, "learning_rate": 0.00011556634463594628, "loss": 0.0107, "step": 474340 }, { "epoch": 1.23, "learning_rate": 0.00011556245641957484, "loss": 0.0116, "step": 474350 }, { "epoch": 1.23, "learning_rate": 0.00011555856820320337, "loss": 0.0121, "step": 474360 }, { "epoch": 1.23, "learning_rate": 0.00011555467998683191, "loss": 0.0104, "step": 474370 }, { "epoch": 1.23, "learning_rate": 0.00011555079177046044, "loss": 0.0117, "step": 474380 }, { "epoch": 1.23, "learning_rate": 0.00011554690355408897, "loss": 0.0096, "step": 474390 }, { "epoch": 1.23, "learning_rate": 0.00011554301533771751, "loss": 0.0129, "step": 474400 }, { "epoch": 1.23, "learning_rate": 0.00011553912712134604, "loss": 0.0087, "step": 474410 }, { "epoch": 1.23, "learning_rate": 0.00011553523890497458, "loss": 0.0083, "step": 474420 }, { "epoch": 1.23, "learning_rate": 0.0001155313506886031, "loss": 0.0103, "step": 474430 }, { "epoch": 1.23, "learning_rate": 0.00011552746247223165, "loss": 0.0121, "step": 474440 }, { "epoch": 1.23, "learning_rate": 0.00011552357425586017, "loss": 0.0127, "step": 474450 }, { "epoch": 1.23, "learning_rate": 0.00011551968603948872, "loss": 0.0091, "step": 474460 }, { "epoch": 1.23, "learning_rate": 0.00011551579782311724, "loss": 0.0105, "step": 474470 }, { "epoch": 1.23, "learning_rate": 0.00011551190960674579, "loss": 0.0104, "step": 474480 }, { "epoch": 1.23, "learning_rate": 0.00011550802139037431, "loss": 0.0129, "step": 474490 }, { "epoch": 1.23, "learning_rate": 0.00011550413317400286, "loss": 0.0094, "step": 474500 }, { "epoch": 1.23, "learning_rate": 0.00011550024495763138, "loss": 0.0093, "step": 474510 }, { "epoch": 1.23, "learning_rate": 0.00011549635674125994, "loss": 0.0139, "step": 474520 }, { "epoch": 1.23, "learning_rate": 0.00011549246852488845, "loss": 0.0091, "step": 474530 }, { "epoch": 1.23, "learning_rate": 0.00011548858030851701, "loss": 0.0145, "step": 474540 }, { "epoch": 1.23, "learning_rate": 0.00011548469209214554, "loss": 0.0105, "step": 474550 }, { "epoch": 1.23, "learning_rate": 0.00011548080387577408, "loss": 0.0144, "step": 474560 }, { "epoch": 1.23, "learning_rate": 0.0001154769156594026, "loss": 0.0101, "step": 474570 }, { "epoch": 1.23, "learning_rate": 0.00011547302744303115, "loss": 0.0084, "step": 474580 }, { "epoch": 1.23, "learning_rate": 0.00011546913922665968, "loss": 0.0113, "step": 474590 }, { "epoch": 1.23, "learning_rate": 0.00011546525101028822, "loss": 0.0098, "step": 474600 }, { "epoch": 1.23, "learning_rate": 0.00011546136279391675, "loss": 0.0103, "step": 474610 }, { "epoch": 1.23, "learning_rate": 0.00011545747457754529, "loss": 0.0104, "step": 474620 }, { "epoch": 1.23, "learning_rate": 0.00011545358636117382, "loss": 0.0092, "step": 474630 }, { "epoch": 1.23, "learning_rate": 0.00011544969814480234, "loss": 0.0134, "step": 474640 }, { "epoch": 1.23, "learning_rate": 0.00011544580992843089, "loss": 0.0086, "step": 474650 }, { "epoch": 1.23, "learning_rate": 0.00011544192171205941, "loss": 0.0106, "step": 474660 }, { "epoch": 1.23, "learning_rate": 0.00011543803349568796, "loss": 0.0086, "step": 474670 }, { "epoch": 1.23, "learning_rate": 0.00011543414527931648, "loss": 0.0087, "step": 474680 }, { "epoch": 1.23, "learning_rate": 0.00011543025706294502, "loss": 0.0119, "step": 474690 }, { "epoch": 1.23, "learning_rate": 0.00011542636884657355, "loss": 0.0076, "step": 474700 }, { "epoch": 1.23, "learning_rate": 0.00011542248063020211, "loss": 0.0078, "step": 474710 }, { "epoch": 1.23, "learning_rate": 0.00011541859241383064, "loss": 0.0114, "step": 474720 }, { "epoch": 1.23, "learning_rate": 0.00011541470419745918, "loss": 0.0121, "step": 474730 }, { "epoch": 1.23, "learning_rate": 0.0001154108159810877, "loss": 0.009, "step": 474740 }, { "epoch": 1.23, "learning_rate": 0.00011540692776471625, "loss": 0.0111, "step": 474750 }, { "epoch": 1.23, "learning_rate": 0.00011540303954834478, "loss": 0.0133, "step": 474760 }, { "epoch": 1.23, "learning_rate": 0.00011539915133197332, "loss": 0.0122, "step": 474770 }, { "epoch": 1.23, "learning_rate": 0.00011539526311560185, "loss": 0.0121, "step": 474780 }, { "epoch": 1.23, "learning_rate": 0.00011539137489923039, "loss": 0.0111, "step": 474790 }, { "epoch": 1.23, "learning_rate": 0.00011538748668285892, "loss": 0.0133, "step": 474800 }, { "epoch": 1.23, "learning_rate": 0.00011538359846648746, "loss": 0.0128, "step": 474810 }, { "epoch": 1.23, "learning_rate": 0.00011537971025011598, "loss": 0.0151, "step": 474820 }, { "epoch": 1.23, "learning_rate": 0.00011537582203374453, "loss": 0.0098, "step": 474830 }, { "epoch": 1.23, "learning_rate": 0.00011537193381737305, "loss": 0.0105, "step": 474840 }, { "epoch": 1.23, "learning_rate": 0.0001153680456010016, "loss": 0.0104, "step": 474850 }, { "epoch": 1.23, "learning_rate": 0.00011536415738463012, "loss": 0.0109, "step": 474860 }, { "epoch": 1.23, "learning_rate": 0.00011536026916825868, "loss": 0.0111, "step": 474870 }, { "epoch": 1.23, "learning_rate": 0.0001153563809518872, "loss": 0.0108, "step": 474880 }, { "epoch": 1.23, "learning_rate": 0.00011535249273551572, "loss": 0.0101, "step": 474890 }, { "epoch": 1.23, "learning_rate": 0.00011534860451914428, "loss": 0.014, "step": 474900 }, { "epoch": 1.23, "learning_rate": 0.0001153447163027728, "loss": 0.0122, "step": 474910 }, { "epoch": 1.23, "learning_rate": 0.00011534082808640135, "loss": 0.0107, "step": 474920 }, { "epoch": 1.23, "learning_rate": 0.00011533693987002988, "loss": 0.01, "step": 474930 }, { "epoch": 1.23, "learning_rate": 0.00011533305165365842, "loss": 0.0078, "step": 474940 }, { "epoch": 1.23, "learning_rate": 0.00011532916343728694, "loss": 0.013, "step": 474950 }, { "epoch": 1.23, "learning_rate": 0.00011532527522091549, "loss": 0.0104, "step": 474960 }, { "epoch": 1.23, "learning_rate": 0.00011532138700454401, "loss": 0.0126, "step": 474970 }, { "epoch": 1.23, "learning_rate": 0.00011531749878817256, "loss": 0.0139, "step": 474980 }, { "epoch": 1.23, "learning_rate": 0.00011531361057180108, "loss": 0.0101, "step": 474990 }, { "epoch": 1.23, "learning_rate": 0.00011530972235542963, "loss": 0.0109, "step": 475000 }, { "epoch": 1.23, "eval_cer": 0.8816914892276944, "eval_loss": 0.007072898093611002, "eval_runtime": 108.0529, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 475000 }, { "epoch": 1.23, "learning_rate": 0.00011530583413905815, "loss": 0.014, "step": 475010 }, { "epoch": 1.23, "learning_rate": 0.0001153019459226867, "loss": 0.0102, "step": 475020 }, { "epoch": 1.23, "learning_rate": 0.00011529805770631522, "loss": 0.0092, "step": 475030 }, { "epoch": 1.23, "learning_rate": 0.00011529416948994377, "loss": 0.0121, "step": 475040 }, { "epoch": 1.23, "learning_rate": 0.0001152902812735723, "loss": 0.0123, "step": 475050 }, { "epoch": 1.23, "learning_rate": 0.00011528639305720085, "loss": 0.0109, "step": 475060 }, { "epoch": 1.23, "learning_rate": 0.00011528250484082938, "loss": 0.0114, "step": 475070 }, { "epoch": 1.23, "learning_rate": 0.00011527861662445792, "loss": 0.0114, "step": 475080 }, { "epoch": 1.23, "learning_rate": 0.00011527472840808645, "loss": 0.0067, "step": 475090 }, { "epoch": 1.23, "learning_rate": 0.00011527084019171499, "loss": 0.0107, "step": 475100 }, { "epoch": 1.23, "learning_rate": 0.00011526695197534352, "loss": 0.0081, "step": 475110 }, { "epoch": 1.23, "learning_rate": 0.00011526306375897206, "loss": 0.0077, "step": 475120 }, { "epoch": 1.23, "learning_rate": 0.00011525917554260059, "loss": 0.0108, "step": 475130 }, { "epoch": 1.23, "learning_rate": 0.00011525528732622911, "loss": 0.008, "step": 475140 }, { "epoch": 1.23, "learning_rate": 0.00011525139910985766, "loss": 0.0101, "step": 475150 }, { "epoch": 1.23, "learning_rate": 0.00011524751089348618, "loss": 0.0099, "step": 475160 }, { "epoch": 1.23, "learning_rate": 0.00011524362267711473, "loss": 0.0098, "step": 475170 }, { "epoch": 1.23, "learning_rate": 0.00011523973446074325, "loss": 0.0111, "step": 475180 }, { "epoch": 1.23, "learning_rate": 0.0001152358462443718, "loss": 0.0099, "step": 475190 }, { "epoch": 1.23, "learning_rate": 0.00011523195802800032, "loss": 0.0146, "step": 475200 }, { "epoch": 1.23, "learning_rate": 0.00011522806981162886, "loss": 0.0124, "step": 475210 }, { "epoch": 1.23, "learning_rate": 0.00011522418159525739, "loss": 0.0111, "step": 475220 }, { "epoch": 1.23, "learning_rate": 0.00011522029337888595, "loss": 0.0095, "step": 475230 }, { "epoch": 1.23, "learning_rate": 0.00011521640516251446, "loss": 0.0122, "step": 475240 }, { "epoch": 1.23, "learning_rate": 0.00011521251694614302, "loss": 0.0115, "step": 475250 }, { "epoch": 1.23, "learning_rate": 0.00011520862872977155, "loss": 0.0129, "step": 475260 }, { "epoch": 1.23, "learning_rate": 0.00011520474051340009, "loss": 0.0098, "step": 475270 }, { "epoch": 1.23, "learning_rate": 0.00011520085229702862, "loss": 0.0118, "step": 475280 }, { "epoch": 1.23, "learning_rate": 0.00011519696408065716, "loss": 0.0193, "step": 475290 }, { "epoch": 1.23, "learning_rate": 0.00011519307586428569, "loss": 0.0095, "step": 475300 }, { "epoch": 1.23, "learning_rate": 0.00011518918764791423, "loss": 0.0088, "step": 475310 }, { "epoch": 1.23, "learning_rate": 0.00011518529943154275, "loss": 0.0086, "step": 475320 }, { "epoch": 1.23, "learning_rate": 0.0001151814112151713, "loss": 0.0096, "step": 475330 }, { "epoch": 1.23, "learning_rate": 0.00011517752299879982, "loss": 0.0117, "step": 475340 }, { "epoch": 1.23, "learning_rate": 0.00011517363478242837, "loss": 0.0108, "step": 475350 }, { "epoch": 1.23, "learning_rate": 0.0001151697465660569, "loss": 0.0103, "step": 475360 }, { "epoch": 1.23, "learning_rate": 0.00011516585834968544, "loss": 0.009, "step": 475370 }, { "epoch": 1.23, "learning_rate": 0.00011516197013331396, "loss": 0.0108, "step": 475380 }, { "epoch": 1.23, "learning_rate": 0.00011515808191694249, "loss": 0.0092, "step": 475390 }, { "epoch": 1.23, "learning_rate": 0.00011515419370057103, "loss": 0.01, "step": 475400 }, { "epoch": 1.23, "learning_rate": 0.00011515030548419956, "loss": 0.0103, "step": 475410 }, { "epoch": 1.23, "learning_rate": 0.00011514641726782812, "loss": 0.0125, "step": 475420 }, { "epoch": 1.23, "learning_rate": 0.00011514252905145665, "loss": 0.0091, "step": 475430 }, { "epoch": 1.23, "learning_rate": 0.00011513864083508519, "loss": 0.0124, "step": 475440 }, { "epoch": 1.23, "learning_rate": 0.00011513475261871371, "loss": 0.0124, "step": 475450 }, { "epoch": 1.23, "learning_rate": 0.00011513086440234226, "loss": 0.0133, "step": 475460 }, { "epoch": 1.23, "learning_rate": 0.00011512697618597078, "loss": 0.009, "step": 475470 }, { "epoch": 1.23, "learning_rate": 0.00011512308796959933, "loss": 0.0135, "step": 475480 }, { "epoch": 1.23, "learning_rate": 0.00011511919975322785, "loss": 0.0112, "step": 475490 }, { "epoch": 1.23, "learning_rate": 0.0001151153115368564, "loss": 0.0088, "step": 475500 }, { "epoch": 1.23, "learning_rate": 0.00011511142332048492, "loss": 0.0106, "step": 475510 }, { "epoch": 1.23, "learning_rate": 0.00011510753510411347, "loss": 0.0102, "step": 475520 }, { "epoch": 1.23, "learning_rate": 0.000115103646887742, "loss": 0.0089, "step": 475530 }, { "epoch": 1.23, "learning_rate": 0.00011509975867137054, "loss": 0.0106, "step": 475540 }, { "epoch": 1.23, "learning_rate": 0.00011509587045499906, "loss": 0.0087, "step": 475550 }, { "epoch": 1.23, "learning_rate": 0.0001150919822386276, "loss": 0.0109, "step": 475560 }, { "epoch": 1.23, "learning_rate": 0.00011508809402225613, "loss": 0.0122, "step": 475570 }, { "epoch": 1.23, "learning_rate": 0.00011508420580588469, "loss": 0.0129, "step": 475580 }, { "epoch": 1.23, "learning_rate": 0.00011508031758951322, "loss": 0.0093, "step": 475590 }, { "epoch": 1.23, "learning_rate": 0.00011507642937314176, "loss": 0.0142, "step": 475600 }, { "epoch": 1.23, "learning_rate": 0.00011507254115677029, "loss": 0.0115, "step": 475610 }, { "epoch": 1.23, "learning_rate": 0.00011506865294039883, "loss": 0.0131, "step": 475620 }, { "epoch": 1.23, "learning_rate": 0.00011506476472402736, "loss": 0.0108, "step": 475630 }, { "epoch": 1.23, "learning_rate": 0.00011506087650765588, "loss": 0.0095, "step": 475640 }, { "epoch": 1.23, "learning_rate": 0.00011505698829128443, "loss": 0.0121, "step": 475650 }, { "epoch": 1.23, "learning_rate": 0.00011505310007491295, "loss": 0.0118, "step": 475660 }, { "epoch": 1.23, "learning_rate": 0.0001150492118585415, "loss": 0.0087, "step": 475670 }, { "epoch": 1.23, "learning_rate": 0.00011504532364217002, "loss": 0.0083, "step": 475680 }, { "epoch": 1.23, "learning_rate": 0.00011504143542579857, "loss": 0.0071, "step": 475690 }, { "epoch": 1.23, "learning_rate": 0.0001150375472094271, "loss": 0.0115, "step": 475700 }, { "epoch": 1.23, "learning_rate": 0.00011503365899305563, "loss": 0.0115, "step": 475710 }, { "epoch": 1.23, "learning_rate": 0.00011502977077668416, "loss": 0.0108, "step": 475720 }, { "epoch": 1.23, "learning_rate": 0.0001150258825603127, "loss": 0.0104, "step": 475730 }, { "epoch": 1.23, "learning_rate": 0.00011502199434394123, "loss": 0.0111, "step": 475740 }, { "epoch": 1.23, "learning_rate": 0.00011501810612756979, "loss": 0.0124, "step": 475750 }, { "epoch": 1.23, "learning_rate": 0.0001150142179111983, "loss": 0.0102, "step": 475760 }, { "epoch": 1.23, "learning_rate": 0.00011501032969482686, "loss": 0.0111, "step": 475770 }, { "epoch": 1.23, "learning_rate": 0.00011500644147845539, "loss": 0.0077, "step": 475780 }, { "epoch": 1.23, "learning_rate": 0.00011500255326208393, "loss": 0.0096, "step": 475790 }, { "epoch": 1.23, "learning_rate": 0.00011499866504571246, "loss": 0.0141, "step": 475800 }, { "epoch": 1.23, "learning_rate": 0.000114994776829341, "loss": 0.0098, "step": 475810 }, { "epoch": 1.23, "learning_rate": 0.00011499088861296953, "loss": 0.0111, "step": 475820 }, { "epoch": 1.23, "learning_rate": 0.00011498700039659807, "loss": 0.012, "step": 475830 }, { "epoch": 1.23, "learning_rate": 0.0001149831121802266, "loss": 0.0097, "step": 475840 }, { "epoch": 1.23, "learning_rate": 0.00011497922396385514, "loss": 0.0093, "step": 475850 }, { "epoch": 1.23, "learning_rate": 0.00011497533574748366, "loss": 0.0128, "step": 475860 }, { "epoch": 1.23, "learning_rate": 0.00011497144753111219, "loss": 0.0113, "step": 475870 }, { "epoch": 1.23, "learning_rate": 0.00011496755931474073, "loss": 0.009, "step": 475880 }, { "epoch": 1.23, "learning_rate": 0.00011496367109836926, "loss": 0.0116, "step": 475890 }, { "epoch": 1.23, "learning_rate": 0.0001149597828819978, "loss": 0.0105, "step": 475900 }, { "epoch": 1.23, "learning_rate": 0.00011495589466562633, "loss": 0.0091, "step": 475910 }, { "epoch": 1.23, "learning_rate": 0.00011495200644925487, "loss": 0.0088, "step": 475920 }, { "epoch": 1.23, "learning_rate": 0.0001149481182328834, "loss": 0.0133, "step": 475930 }, { "epoch": 1.23, "learning_rate": 0.00011494423001651196, "loss": 0.0126, "step": 475940 }, { "epoch": 1.23, "learning_rate": 0.00011494034180014049, "loss": 0.0101, "step": 475950 }, { "epoch": 1.23, "learning_rate": 0.00011493645358376903, "loss": 0.01, "step": 475960 }, { "epoch": 1.23, "learning_rate": 0.00011493256536739755, "loss": 0.0104, "step": 475970 }, { "epoch": 1.23, "learning_rate": 0.0001149286771510261, "loss": 0.0124, "step": 475980 }, { "epoch": 1.23, "learning_rate": 0.00011492478893465462, "loss": 0.0081, "step": 475990 }, { "epoch": 1.23, "learning_rate": 0.00011492090071828317, "loss": 0.0087, "step": 476000 }, { "epoch": 1.23, "eval_cer": 0.8816690950367475, "eval_loss": 0.00715318787842989, "eval_runtime": 108.0552, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 476000 }, { "epoch": 1.23, "learning_rate": 0.0001149170125019117, "loss": 0.0087, "step": 476010 }, { "epoch": 1.23, "learning_rate": 0.00011491312428554024, "loss": 0.0087, "step": 476020 }, { "epoch": 1.23, "learning_rate": 0.00011490923606916876, "loss": 0.0108, "step": 476030 }, { "epoch": 1.23, "learning_rate": 0.0001149053478527973, "loss": 0.0096, "step": 476040 }, { "epoch": 1.23, "learning_rate": 0.00011490145963642583, "loss": 0.0109, "step": 476050 }, { "epoch": 1.23, "learning_rate": 0.00011489757142005438, "loss": 0.0089, "step": 476060 }, { "epoch": 1.23, "learning_rate": 0.0001148936832036829, "loss": 0.012, "step": 476070 }, { "epoch": 1.23, "learning_rate": 0.00011488979498731145, "loss": 0.0095, "step": 476080 }, { "epoch": 1.23, "learning_rate": 0.00011488590677093997, "loss": 0.0109, "step": 476090 }, { "epoch": 1.23, "learning_rate": 0.00011488201855456853, "loss": 0.0091, "step": 476100 }, { "epoch": 1.23, "learning_rate": 0.00011487813033819706, "loss": 0.0106, "step": 476110 }, { "epoch": 1.23, "learning_rate": 0.00011487424212182557, "loss": 0.0099, "step": 476120 }, { "epoch": 1.23, "learning_rate": 0.00011487035390545413, "loss": 0.0098, "step": 476130 }, { "epoch": 1.23, "learning_rate": 0.00011486646568908265, "loss": 0.0108, "step": 476140 }, { "epoch": 1.23, "learning_rate": 0.0001148625774727112, "loss": 0.0106, "step": 476150 }, { "epoch": 1.23, "learning_rate": 0.00011485868925633972, "loss": 0.0072, "step": 476160 }, { "epoch": 1.23, "learning_rate": 0.00011485480103996827, "loss": 0.0098, "step": 476170 }, { "epoch": 1.23, "learning_rate": 0.0001148509128235968, "loss": 0.009, "step": 476180 }, { "epoch": 1.23, "learning_rate": 0.00011484702460722534, "loss": 0.0102, "step": 476190 }, { "epoch": 1.23, "learning_rate": 0.00011484313639085386, "loss": 0.0103, "step": 476200 }, { "epoch": 1.23, "learning_rate": 0.0001148392481744824, "loss": 0.0118, "step": 476210 }, { "epoch": 1.23, "learning_rate": 0.00011483535995811093, "loss": 0.0093, "step": 476220 }, { "epoch": 1.23, "learning_rate": 0.00011483147174173947, "loss": 0.0108, "step": 476230 }, { "epoch": 1.23, "learning_rate": 0.000114827583525368, "loss": 0.0094, "step": 476240 }, { "epoch": 1.23, "learning_rate": 0.00011482369530899654, "loss": 0.011, "step": 476250 }, { "epoch": 1.23, "learning_rate": 0.00011481980709262507, "loss": 0.009, "step": 476260 }, { "epoch": 1.23, "learning_rate": 0.00011481591887625361, "loss": 0.0116, "step": 476270 }, { "epoch": 1.23, "learning_rate": 0.00011481203065988214, "loss": 0.0086, "step": 476280 }, { "epoch": 1.23, "learning_rate": 0.0001148081424435107, "loss": 0.0098, "step": 476290 }, { "epoch": 1.23, "learning_rate": 0.00011480425422713923, "loss": 0.0117, "step": 476300 }, { "epoch": 1.23, "learning_rate": 0.00011480036601076777, "loss": 0.0127, "step": 476310 }, { "epoch": 1.23, "learning_rate": 0.0001147964777943963, "loss": 0.0113, "step": 476320 }, { "epoch": 1.23, "learning_rate": 0.00011479258957802484, "loss": 0.0089, "step": 476330 }, { "epoch": 1.23, "learning_rate": 0.00011478870136165337, "loss": 0.011, "step": 476340 }, { "epoch": 1.23, "learning_rate": 0.0001147848131452819, "loss": 0.0114, "step": 476350 }, { "epoch": 1.23, "learning_rate": 0.00011478092492891043, "loss": 0.0089, "step": 476360 }, { "epoch": 1.23, "learning_rate": 0.00011477703671253896, "loss": 0.0093, "step": 476370 }, { "epoch": 1.23, "learning_rate": 0.0001147731484961675, "loss": 0.0128, "step": 476380 }, { "epoch": 1.23, "learning_rate": 0.00011476926027979603, "loss": 0.0188, "step": 476390 }, { "epoch": 1.23, "learning_rate": 0.00011476537206342457, "loss": 0.0083, "step": 476400 }, { "epoch": 1.23, "learning_rate": 0.0001147614838470531, "loss": 0.0077, "step": 476410 }, { "epoch": 1.23, "learning_rate": 0.00011475759563068164, "loss": 0.012, "step": 476420 }, { "epoch": 1.23, "learning_rate": 0.00011475370741431017, "loss": 0.009, "step": 476430 }, { "epoch": 1.24, "learning_rate": 0.00011474981919793871, "loss": 0.0103, "step": 476440 }, { "epoch": 1.24, "learning_rate": 0.00011474593098156724, "loss": 0.0114, "step": 476450 }, { "epoch": 1.24, "learning_rate": 0.0001147420427651958, "loss": 0.0106, "step": 476460 }, { "epoch": 1.24, "learning_rate": 0.00011473815454882431, "loss": 0.0108, "step": 476470 }, { "epoch": 1.24, "learning_rate": 0.00011473426633245287, "loss": 0.0089, "step": 476480 }, { "epoch": 1.24, "learning_rate": 0.0001147303781160814, "loss": 0.0108, "step": 476490 }, { "epoch": 1.24, "learning_rate": 0.00011472648989970994, "loss": 0.0084, "step": 476500 }, { "epoch": 1.24, "learning_rate": 0.00011472260168333846, "loss": 0.0145, "step": 476510 }, { "epoch": 1.24, "learning_rate": 0.000114718713466967, "loss": 0.0111, "step": 476520 }, { "epoch": 1.24, "learning_rate": 0.00011471482525059553, "loss": 0.0127, "step": 476530 }, { "epoch": 1.24, "learning_rate": 0.00011471093703422408, "loss": 0.0112, "step": 476540 }, { "epoch": 1.24, "learning_rate": 0.0001147070488178526, "loss": 0.009, "step": 476550 }, { "epoch": 1.24, "learning_rate": 0.00011470316060148115, "loss": 0.0098, "step": 476560 }, { "epoch": 1.24, "learning_rate": 0.00011469927238510967, "loss": 0.0104, "step": 476570 }, { "epoch": 1.24, "learning_rate": 0.00011469538416873822, "loss": 0.0118, "step": 476580 }, { "epoch": 1.24, "learning_rate": 0.00011469149595236674, "loss": 0.0087, "step": 476590 }, { "epoch": 1.24, "learning_rate": 0.00011468760773599529, "loss": 0.0103, "step": 476600 }, { "epoch": 1.24, "learning_rate": 0.00011468371951962381, "loss": 0.0117, "step": 476610 }, { "epoch": 1.24, "learning_rate": 0.00011467983130325234, "loss": 0.0114, "step": 476620 }, { "epoch": 1.24, "learning_rate": 0.00011467594308688088, "loss": 0.0108, "step": 476630 }, { "epoch": 1.24, "learning_rate": 0.00011467205487050941, "loss": 0.01, "step": 476640 }, { "epoch": 1.24, "learning_rate": 0.00011466816665413797, "loss": 0.0099, "step": 476650 }, { "epoch": 1.24, "learning_rate": 0.0001146642784377665, "loss": 0.009, "step": 476660 }, { "epoch": 1.24, "learning_rate": 0.00011466039022139504, "loss": 0.0103, "step": 476670 }, { "epoch": 1.24, "learning_rate": 0.00011465650200502356, "loss": 0.0101, "step": 476680 }, { "epoch": 1.24, "learning_rate": 0.0001146526137886521, "loss": 0.0093, "step": 476690 }, { "epoch": 1.24, "learning_rate": 0.00011464872557228063, "loss": 0.0082, "step": 476700 }, { "epoch": 1.24, "learning_rate": 0.00011464483735590918, "loss": 0.0089, "step": 476710 }, { "epoch": 1.24, "learning_rate": 0.0001146409491395377, "loss": 0.0106, "step": 476720 }, { "epoch": 1.24, "learning_rate": 0.00011463706092316624, "loss": 0.0096, "step": 476730 }, { "epoch": 1.24, "learning_rate": 0.00011463317270679477, "loss": 0.0097, "step": 476740 }, { "epoch": 1.24, "learning_rate": 0.00011462928449042331, "loss": 0.0106, "step": 476750 }, { "epoch": 1.24, "learning_rate": 0.00011462539627405184, "loss": 0.0119, "step": 476760 }, { "epoch": 1.24, "learning_rate": 0.00011462150805768038, "loss": 0.0095, "step": 476770 }, { "epoch": 1.24, "learning_rate": 0.00011461761984130891, "loss": 0.0102, "step": 476780 }, { "epoch": 1.24, "learning_rate": 0.00011461373162493745, "loss": 0.0132, "step": 476790 }, { "epoch": 1.24, "learning_rate": 0.00011460984340856598, "loss": 0.0113, "step": 476800 }, { "epoch": 1.24, "learning_rate": 0.00011460595519219454, "loss": 0.0127, "step": 476810 }, { "epoch": 1.24, "learning_rate": 0.00011460206697582307, "loss": 0.0115, "step": 476820 }, { "epoch": 1.24, "learning_rate": 0.00011459817875945161, "loss": 0.0087, "step": 476830 }, { "epoch": 1.24, "learning_rate": 0.00011459429054308014, "loss": 0.01, "step": 476840 }, { "epoch": 1.24, "learning_rate": 0.00011459040232670868, "loss": 0.0109, "step": 476850 }, { "epoch": 1.24, "learning_rate": 0.0001145865141103372, "loss": 0.0134, "step": 476860 }, { "epoch": 1.24, "learning_rate": 0.00011458262589396573, "loss": 0.0107, "step": 476870 }, { "epoch": 1.24, "learning_rate": 0.00011457873767759427, "loss": 0.0111, "step": 476880 }, { "epoch": 1.24, "learning_rate": 0.0001145748494612228, "loss": 0.0061, "step": 476890 }, { "epoch": 1.24, "learning_rate": 0.00011457096124485134, "loss": 0.0144, "step": 476900 }, { "epoch": 1.24, "learning_rate": 0.00011456707302847987, "loss": 0.0116, "step": 476910 }, { "epoch": 1.24, "learning_rate": 0.00011456318481210841, "loss": 0.0098, "step": 476920 }, { "epoch": 1.24, "learning_rate": 0.00011455929659573694, "loss": 0.0115, "step": 476930 }, { "epoch": 1.24, "learning_rate": 0.00011455540837936548, "loss": 0.0099, "step": 476940 }, { "epoch": 1.24, "learning_rate": 0.00011455152016299401, "loss": 0.0092, "step": 476950 }, { "epoch": 1.24, "learning_rate": 0.00011454763194662255, "loss": 0.011, "step": 476960 }, { "epoch": 1.24, "learning_rate": 0.00011454374373025108, "loss": 0.0089, "step": 476970 }, { "epoch": 1.24, "learning_rate": 0.00011453985551387964, "loss": 0.0083, "step": 476980 }, { "epoch": 1.24, "learning_rate": 0.00011453596729750815, "loss": 0.0089, "step": 476990 }, { "epoch": 1.24, "learning_rate": 0.0001145320790811367, "loss": 0.0112, "step": 477000 }, { "epoch": 1.24, "eval_cer": 0.8817054855970361, "eval_loss": 0.0070707546547055244, "eval_runtime": 108.0477, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.628, "step": 477000 }, { "epoch": 1.24, "learning_rate": 0.00011452819086476523, "loss": 0.011, "step": 477010 }, { "epoch": 1.24, "learning_rate": 0.00011452430264839378, "loss": 0.0081, "step": 477020 }, { "epoch": 1.24, "learning_rate": 0.0001145204144320223, "loss": 0.0096, "step": 477030 }, { "epoch": 1.24, "learning_rate": 0.00011451652621565085, "loss": 0.0095, "step": 477040 }, { "epoch": 1.24, "learning_rate": 0.00011451263799927937, "loss": 0.0121, "step": 477050 }, { "epoch": 1.24, "learning_rate": 0.00011450874978290792, "loss": 0.01, "step": 477060 }, { "epoch": 1.24, "learning_rate": 0.00011450486156653644, "loss": 0.0177, "step": 477070 }, { "epoch": 1.24, "learning_rate": 0.00011450097335016499, "loss": 0.0117, "step": 477080 }, { "epoch": 1.24, "learning_rate": 0.00011449708513379351, "loss": 0.0082, "step": 477090 }, { "epoch": 1.24, "learning_rate": 0.00011449319691742206, "loss": 0.013, "step": 477100 }, { "epoch": 1.24, "learning_rate": 0.00011448930870105058, "loss": 0.0111, "step": 477110 }, { "epoch": 1.24, "learning_rate": 0.00011448542048467911, "loss": 0.0115, "step": 477120 }, { "epoch": 1.24, "learning_rate": 0.00011448153226830765, "loss": 0.0104, "step": 477130 }, { "epoch": 1.24, "learning_rate": 0.00011447764405193618, "loss": 0.011, "step": 477140 }, { "epoch": 1.24, "learning_rate": 0.00011447375583556472, "loss": 0.0111, "step": 477150 }, { "epoch": 1.24, "learning_rate": 0.00011446986761919325, "loss": 0.0123, "step": 477160 }, { "epoch": 1.24, "learning_rate": 0.0001144659794028218, "loss": 0.0127, "step": 477170 }, { "epoch": 1.24, "learning_rate": 0.00011446209118645033, "loss": 0.0096, "step": 477180 }, { "epoch": 1.24, "learning_rate": 0.00011445820297007888, "loss": 0.0097, "step": 477190 }, { "epoch": 1.24, "learning_rate": 0.0001144543147537074, "loss": 0.0116, "step": 477200 }, { "epoch": 1.24, "learning_rate": 0.00011445042653733595, "loss": 0.0088, "step": 477210 }, { "epoch": 1.24, "learning_rate": 0.00011444653832096447, "loss": 0.0103, "step": 477220 }, { "epoch": 1.24, "learning_rate": 0.00011444265010459302, "loss": 0.0077, "step": 477230 }, { "epoch": 1.24, "learning_rate": 0.00011443876188822154, "loss": 0.0105, "step": 477240 }, { "epoch": 1.24, "learning_rate": 0.00011443487367185008, "loss": 0.01, "step": 477250 }, { "epoch": 1.24, "learning_rate": 0.00011443098545547861, "loss": 0.0099, "step": 477260 }, { "epoch": 1.24, "learning_rate": 0.00011442709723910715, "loss": 0.0104, "step": 477270 }, { "epoch": 1.24, "learning_rate": 0.00011442320902273568, "loss": 0.0116, "step": 477280 }, { "epoch": 1.24, "learning_rate": 0.00011441932080636422, "loss": 0.0105, "step": 477290 }, { "epoch": 1.24, "learning_rate": 0.00011441543258999275, "loss": 0.0113, "step": 477300 }, { "epoch": 1.24, "learning_rate": 0.0001144115443736213, "loss": 0.0123, "step": 477310 }, { "epoch": 1.24, "learning_rate": 0.00011440765615724982, "loss": 0.0129, "step": 477320 }, { "epoch": 1.24, "learning_rate": 0.00011440376794087838, "loss": 0.012, "step": 477330 }, { "epoch": 1.24, "learning_rate": 0.0001143998797245069, "loss": 0.0111, "step": 477340 }, { "epoch": 1.24, "learning_rate": 0.00011439599150813545, "loss": 0.0109, "step": 477350 }, { "epoch": 1.24, "learning_rate": 0.00011439210329176398, "loss": 0.0116, "step": 477360 }, { "epoch": 1.24, "learning_rate": 0.0001143882150753925, "loss": 0.008, "step": 477370 }, { "epoch": 1.24, "learning_rate": 0.00011438432685902104, "loss": 0.0074, "step": 477380 }, { "epoch": 1.24, "learning_rate": 0.00011438043864264957, "loss": 0.0083, "step": 477390 }, { "epoch": 1.24, "learning_rate": 0.00011437655042627811, "loss": 0.0105, "step": 477400 }, { "epoch": 1.24, "learning_rate": 0.00011437266220990664, "loss": 0.0125, "step": 477410 }, { "epoch": 1.24, "learning_rate": 0.00011436877399353518, "loss": 0.0092, "step": 477420 }, { "epoch": 1.24, "learning_rate": 0.00011436488577716371, "loss": 0.0085, "step": 477430 }, { "epoch": 1.24, "learning_rate": 0.00011436099756079225, "loss": 0.0079, "step": 477440 }, { "epoch": 1.24, "learning_rate": 0.00011435710934442078, "loss": 0.0097, "step": 477450 }, { "epoch": 1.24, "learning_rate": 0.00011435322112804932, "loss": 0.0088, "step": 477460 }, { "epoch": 1.24, "learning_rate": 0.00011434933291167785, "loss": 0.0119, "step": 477470 }, { "epoch": 1.24, "learning_rate": 0.0001143454446953064, "loss": 0.0099, "step": 477480 }, { "epoch": 1.24, "learning_rate": 0.00011434155647893492, "loss": 0.0106, "step": 477490 }, { "epoch": 1.24, "learning_rate": 0.00011433766826256346, "loss": 0.0105, "step": 477500 }, { "epoch": 1.24, "learning_rate": 0.00011433378004619199, "loss": 0.0131, "step": 477510 }, { "epoch": 1.24, "learning_rate": 0.00011432989182982055, "loss": 0.012, "step": 477520 }, { "epoch": 1.24, "learning_rate": 0.00011432600361344907, "loss": 0.0088, "step": 477530 }, { "epoch": 1.24, "learning_rate": 0.00011432211539707762, "loss": 0.0099, "step": 477540 }, { "epoch": 1.24, "learning_rate": 0.00011431822718070614, "loss": 0.0158, "step": 477550 }, { "epoch": 1.24, "learning_rate": 0.00011431433896433469, "loss": 0.013, "step": 477560 }, { "epoch": 1.24, "learning_rate": 0.00011431045074796321, "loss": 0.0102, "step": 477570 }, { "epoch": 1.24, "learning_rate": 0.00011430656253159176, "loss": 0.0115, "step": 477580 }, { "epoch": 1.24, "learning_rate": 0.00011430267431522028, "loss": 0.0094, "step": 477590 }, { "epoch": 1.24, "learning_rate": 0.00011429878609884883, "loss": 0.0127, "step": 477600 }, { "epoch": 1.24, "learning_rate": 0.00011429489788247735, "loss": 0.0114, "step": 477610 }, { "epoch": 1.24, "learning_rate": 0.00011429100966610588, "loss": 0.0103, "step": 477620 }, { "epoch": 1.24, "learning_rate": 0.00011428712144973442, "loss": 0.0083, "step": 477630 }, { "epoch": 1.24, "learning_rate": 0.00011428323323336295, "loss": 0.0093, "step": 477640 }, { "epoch": 1.24, "learning_rate": 0.00011427934501699149, "loss": 0.01, "step": 477650 }, { "epoch": 1.24, "learning_rate": 0.00011427545680062002, "loss": 0.0113, "step": 477660 }, { "epoch": 1.24, "learning_rate": 0.00011427156858424856, "loss": 0.0117, "step": 477670 }, { "epoch": 1.24, "learning_rate": 0.00011426768036787709, "loss": 0.0112, "step": 477680 }, { "epoch": 1.24, "learning_rate": 0.00011426379215150565, "loss": 0.0116, "step": 477690 }, { "epoch": 1.24, "learning_rate": 0.00011425990393513416, "loss": 0.0104, "step": 477700 }, { "epoch": 1.24, "learning_rate": 0.00011425601571876272, "loss": 0.0086, "step": 477710 }, { "epoch": 1.24, "learning_rate": 0.00011425212750239124, "loss": 0.0106, "step": 477720 }, { "epoch": 1.24, "learning_rate": 0.00011424823928601979, "loss": 0.0091, "step": 477730 }, { "epoch": 1.24, "learning_rate": 0.00011424435106964831, "loss": 0.0101, "step": 477740 }, { "epoch": 1.24, "learning_rate": 0.00011424046285327686, "loss": 0.0116, "step": 477750 }, { "epoch": 1.24, "learning_rate": 0.00011423657463690538, "loss": 0.0106, "step": 477760 }, { "epoch": 1.24, "learning_rate": 0.00011423268642053392, "loss": 0.0106, "step": 477770 }, { "epoch": 1.24, "learning_rate": 0.00011422879820416245, "loss": 0.0084, "step": 477780 }, { "epoch": 1.24, "learning_rate": 0.000114224909987791, "loss": 0.0129, "step": 477790 }, { "epoch": 1.24, "learning_rate": 0.00011422102177141952, "loss": 0.0096, "step": 477800 }, { "epoch": 1.24, "learning_rate": 0.00011421713355504806, "loss": 0.0088, "step": 477810 }, { "epoch": 1.24, "learning_rate": 0.00011421324533867659, "loss": 0.0092, "step": 477820 }, { "epoch": 1.24, "learning_rate": 0.00011420935712230513, "loss": 0.0096, "step": 477830 }, { "epoch": 1.24, "learning_rate": 0.00011420546890593366, "loss": 0.0086, "step": 477840 }, { "epoch": 1.24, "learning_rate": 0.00011420158068956222, "loss": 0.0099, "step": 477850 }, { "epoch": 1.24, "learning_rate": 0.00011419769247319073, "loss": 0.008, "step": 477860 }, { "epoch": 1.24, "learning_rate": 0.00011419380425681926, "loss": 0.01, "step": 477870 }, { "epoch": 1.24, "learning_rate": 0.00011418991604044782, "loss": 0.0094, "step": 477880 }, { "epoch": 1.24, "learning_rate": 0.00011418602782407634, "loss": 0.0139, "step": 477890 }, { "epoch": 1.24, "learning_rate": 0.00011418213960770488, "loss": 0.0148, "step": 477900 }, { "epoch": 1.24, "learning_rate": 0.00011417825139133341, "loss": 0.0126, "step": 477910 }, { "epoch": 1.24, "learning_rate": 0.00011417436317496195, "loss": 0.0111, "step": 477920 }, { "epoch": 1.24, "learning_rate": 0.00011417047495859048, "loss": 0.0116, "step": 477930 }, { "epoch": 1.24, "learning_rate": 0.00011416658674221902, "loss": 0.0103, "step": 477940 }, { "epoch": 1.24, "learning_rate": 0.00011416269852584755, "loss": 0.0118, "step": 477950 }, { "epoch": 1.24, "learning_rate": 0.0001141588103094761, "loss": 0.01, "step": 477960 }, { "epoch": 1.24, "learning_rate": 0.00011415492209310462, "loss": 0.0123, "step": 477970 }, { "epoch": 1.24, "learning_rate": 0.00011415103387673316, "loss": 0.0114, "step": 477980 }, { "epoch": 1.24, "learning_rate": 0.00011414714566036169, "loss": 0.0126, "step": 477990 }, { "epoch": 1.24, "learning_rate": 0.00011414325744399023, "loss": 0.0094, "step": 478000 }, { "epoch": 1.24, "eval_cer": 0.881688689953826, "eval_loss": 0.007163301110267639, "eval_runtime": 107.8483, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 478000 }, { "epoch": 1.24, "learning_rate": 0.00011413936922761876, "loss": 0.0111, "step": 478010 }, { "epoch": 1.24, "learning_rate": 0.0001141354810112473, "loss": 0.0131, "step": 478020 }, { "epoch": 1.24, "learning_rate": 0.00011413159279487583, "loss": 0.0115, "step": 478030 }, { "epoch": 1.24, "learning_rate": 0.00011412770457850439, "loss": 0.0126, "step": 478040 }, { "epoch": 1.24, "learning_rate": 0.00011412381636213291, "loss": 0.0079, "step": 478050 }, { "epoch": 1.24, "learning_rate": 0.00011411992814576146, "loss": 0.0113, "step": 478060 }, { "epoch": 1.24, "learning_rate": 0.00011411603992938998, "loss": 0.0117, "step": 478070 }, { "epoch": 1.24, "learning_rate": 0.00011411215171301853, "loss": 0.0086, "step": 478080 }, { "epoch": 1.24, "learning_rate": 0.00011410826349664705, "loss": 0.0129, "step": 478090 }, { "epoch": 1.24, "learning_rate": 0.0001141043752802756, "loss": 0.0121, "step": 478100 }, { "epoch": 1.24, "learning_rate": 0.00011410048706390412, "loss": 0.0105, "step": 478110 }, { "epoch": 1.24, "learning_rate": 0.00011409659884753265, "loss": 0.0125, "step": 478120 }, { "epoch": 1.24, "learning_rate": 0.0001140927106311612, "loss": 0.0103, "step": 478130 }, { "epoch": 1.24, "learning_rate": 0.00011408882241478972, "loss": 0.0083, "step": 478140 }, { "epoch": 1.24, "learning_rate": 0.00011408493419841826, "loss": 0.0119, "step": 478150 }, { "epoch": 1.24, "learning_rate": 0.00011408104598204679, "loss": 0.0082, "step": 478160 }, { "epoch": 1.24, "learning_rate": 0.00011407715776567533, "loss": 0.0087, "step": 478170 }, { "epoch": 1.24, "learning_rate": 0.00011407326954930386, "loss": 0.0109, "step": 478180 }, { "epoch": 1.24, "learning_rate": 0.0001140693813329324, "loss": 0.0182, "step": 478190 }, { "epoch": 1.24, "learning_rate": 0.00011406549311656093, "loss": 0.0094, "step": 478200 }, { "epoch": 1.24, "learning_rate": 0.00011406160490018949, "loss": 0.012, "step": 478210 }, { "epoch": 1.24, "learning_rate": 0.000114057716683818, "loss": 0.0096, "step": 478220 }, { "epoch": 1.24, "learning_rate": 0.00011405382846744656, "loss": 0.0097, "step": 478230 }, { "epoch": 1.24, "learning_rate": 0.00011404994025107508, "loss": 0.0109, "step": 478240 }, { "epoch": 1.24, "learning_rate": 0.00011404605203470363, "loss": 0.0112, "step": 478250 }, { "epoch": 1.24, "learning_rate": 0.00011404216381833215, "loss": 0.0136, "step": 478260 }, { "epoch": 1.24, "learning_rate": 0.0001140382756019607, "loss": 0.0095, "step": 478270 }, { "epoch": 1.24, "learning_rate": 0.00011403438738558922, "loss": 0.0098, "step": 478280 }, { "epoch": 1.24, "learning_rate": 0.00011403049916921776, "loss": 0.0105, "step": 478290 }, { "epoch": 1.24, "learning_rate": 0.00011402661095284629, "loss": 0.0133, "step": 478300 }, { "epoch": 1.24, "learning_rate": 0.00011402272273647483, "loss": 0.0102, "step": 478310 }, { "epoch": 1.24, "learning_rate": 0.00011401883452010336, "loss": 0.0083, "step": 478320 }, { "epoch": 1.24, "learning_rate": 0.0001140149463037319, "loss": 0.0112, "step": 478330 }, { "epoch": 1.24, "learning_rate": 0.00011401105808736043, "loss": 0.0128, "step": 478340 }, { "epoch": 1.24, "learning_rate": 0.00011400716987098896, "loss": 0.0095, "step": 478350 }, { "epoch": 1.24, "learning_rate": 0.0001140032816546175, "loss": 0.012, "step": 478360 }, { "epoch": 1.24, "learning_rate": 0.00011399939343824603, "loss": 0.0087, "step": 478370 }, { "epoch": 1.24, "learning_rate": 0.00011399550522187457, "loss": 0.0084, "step": 478380 }, { "epoch": 1.24, "learning_rate": 0.0001139916170055031, "loss": 0.0109, "step": 478390 }, { "epoch": 1.24, "learning_rate": 0.00011398772878913165, "loss": 0.0118, "step": 478400 }, { "epoch": 1.24, "learning_rate": 0.00011398384057276018, "loss": 0.0107, "step": 478410 }, { "epoch": 1.24, "learning_rate": 0.00011397995235638872, "loss": 0.0087, "step": 478420 }, { "epoch": 1.24, "learning_rate": 0.00011397606414001725, "loss": 0.0093, "step": 478430 }, { "epoch": 1.24, "learning_rate": 0.0001139721759236458, "loss": 0.0093, "step": 478440 }, { "epoch": 1.24, "learning_rate": 0.00011396828770727432, "loss": 0.0108, "step": 478450 }, { "epoch": 1.24, "learning_rate": 0.00011396439949090286, "loss": 0.009, "step": 478460 }, { "epoch": 1.24, "learning_rate": 0.00011396051127453139, "loss": 0.0126, "step": 478470 }, { "epoch": 1.24, "learning_rate": 0.00011395662305815993, "loss": 0.0118, "step": 478480 }, { "epoch": 1.24, "learning_rate": 0.00011395273484178846, "loss": 0.0105, "step": 478490 }, { "epoch": 1.24, "learning_rate": 0.000113948846625417, "loss": 0.0097, "step": 478500 }, { "epoch": 1.24, "learning_rate": 0.00011394495840904553, "loss": 0.0103, "step": 478510 }, { "epoch": 1.24, "learning_rate": 0.00011394107019267407, "loss": 0.0098, "step": 478520 }, { "epoch": 1.24, "learning_rate": 0.0001139371819763026, "loss": 0.0119, "step": 478530 }, { "epoch": 1.24, "learning_rate": 0.00011393329375993114, "loss": 0.0117, "step": 478540 }, { "epoch": 1.24, "learning_rate": 0.00011392940554355967, "loss": 0.0098, "step": 478550 }, { "epoch": 1.24, "learning_rate": 0.00011392551732718823, "loss": 0.0118, "step": 478560 }, { "epoch": 1.24, "learning_rate": 0.00011392162911081675, "loss": 0.0102, "step": 478570 }, { "epoch": 1.24, "learning_rate": 0.0001139177408944453, "loss": 0.0101, "step": 478580 }, { "epoch": 1.24, "learning_rate": 0.00011391385267807382, "loss": 0.0108, "step": 478590 }, { "epoch": 1.24, "learning_rate": 0.00011390996446170235, "loss": 0.0077, "step": 478600 }, { "epoch": 1.24, "learning_rate": 0.0001139060762453309, "loss": 0.0097, "step": 478610 }, { "epoch": 1.24, "learning_rate": 0.00011390218802895942, "loss": 0.0082, "step": 478620 }, { "epoch": 1.24, "learning_rate": 0.00011389829981258796, "loss": 0.01, "step": 478630 }, { "epoch": 1.24, "learning_rate": 0.00011389441159621649, "loss": 0.0085, "step": 478640 }, { "epoch": 1.24, "learning_rate": 0.00011389052337984503, "loss": 0.0094, "step": 478650 }, { "epoch": 1.24, "learning_rate": 0.00011388663516347356, "loss": 0.0127, "step": 478660 }, { "epoch": 1.24, "learning_rate": 0.0001138827469471021, "loss": 0.0082, "step": 478670 }, { "epoch": 1.24, "learning_rate": 0.00011387885873073063, "loss": 0.0118, "step": 478680 }, { "epoch": 1.24, "learning_rate": 0.00011387497051435917, "loss": 0.0077, "step": 478690 }, { "epoch": 1.24, "learning_rate": 0.0001138710822979877, "loss": 0.0095, "step": 478700 }, { "epoch": 1.24, "learning_rate": 0.00011386719408161624, "loss": 0.0103, "step": 478710 }, { "epoch": 1.24, "learning_rate": 0.00011386330586524477, "loss": 0.0082, "step": 478720 }, { "epoch": 1.24, "learning_rate": 0.00011385941764887333, "loss": 0.0093, "step": 478730 }, { "epoch": 1.24, "learning_rate": 0.00011385552943250184, "loss": 0.0074, "step": 478740 }, { "epoch": 1.24, "learning_rate": 0.0001138516412161304, "loss": 0.0087, "step": 478750 }, { "epoch": 1.24, "learning_rate": 0.00011384775299975892, "loss": 0.0098, "step": 478760 }, { "epoch": 1.24, "learning_rate": 0.00011384386478338747, "loss": 0.0082, "step": 478770 }, { "epoch": 1.24, "learning_rate": 0.000113839976567016, "loss": 0.0089, "step": 478780 }, { "epoch": 1.24, "learning_rate": 0.00011383608835064453, "loss": 0.0099, "step": 478790 }, { "epoch": 1.24, "learning_rate": 0.00011383220013427306, "loss": 0.0113, "step": 478800 }, { "epoch": 1.24, "learning_rate": 0.0001138283119179016, "loss": 0.0191, "step": 478810 }, { "epoch": 1.24, "learning_rate": 0.00011382442370153013, "loss": 0.0108, "step": 478820 }, { "epoch": 1.24, "learning_rate": 0.00011382053548515867, "loss": 0.0108, "step": 478830 }, { "epoch": 1.24, "learning_rate": 0.0001138166472687872, "loss": 0.0107, "step": 478840 }, { "epoch": 1.24, "learning_rate": 0.00011381275905241573, "loss": 0.0113, "step": 478850 }, { "epoch": 1.24, "learning_rate": 0.00011380887083604427, "loss": 0.0119, "step": 478860 }, { "epoch": 1.24, "learning_rate": 0.0001138049826196728, "loss": 0.0104, "step": 478870 }, { "epoch": 1.24, "learning_rate": 0.00011380109440330134, "loss": 0.0079, "step": 478880 }, { "epoch": 1.24, "learning_rate": 0.00011379720618692987, "loss": 0.013, "step": 478890 }, { "epoch": 1.24, "learning_rate": 0.00011379331797055841, "loss": 0.01, "step": 478900 }, { "epoch": 1.24, "learning_rate": 0.00011378942975418694, "loss": 0.0092, "step": 478910 }, { "epoch": 1.24, "learning_rate": 0.0001137855415378155, "loss": 0.0106, "step": 478920 }, { "epoch": 1.24, "learning_rate": 0.00011378165332144402, "loss": 0.0097, "step": 478930 }, { "epoch": 1.24, "learning_rate": 0.00011377776510507256, "loss": 0.011, "step": 478940 }, { "epoch": 1.24, "learning_rate": 0.00011377387688870109, "loss": 0.0092, "step": 478950 }, { "epoch": 1.24, "learning_rate": 0.00011376998867232963, "loss": 0.0109, "step": 478960 }, { "epoch": 1.24, "learning_rate": 0.00011376610045595816, "loss": 0.0111, "step": 478970 }, { "epoch": 1.24, "learning_rate": 0.0001137622122395867, "loss": 0.0119, "step": 478980 }, { "epoch": 1.24, "learning_rate": 0.00011375832402321523, "loss": 0.0116, "step": 478990 }, { "epoch": 1.24, "learning_rate": 0.00011375443580684377, "loss": 0.0129, "step": 479000 }, { "epoch": 1.24, "eval_cer": 0.88167329394755, "eval_loss": 0.006849655415862799, "eval_runtime": 107.8443, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 479000 }, { "epoch": 1.24, "learning_rate": 0.0001137505475904723, "loss": 0.0105, "step": 479010 }, { "epoch": 1.24, "learning_rate": 0.00011374665937410084, "loss": 0.0131, "step": 479020 }, { "epoch": 1.24, "learning_rate": 0.00011374277115772937, "loss": 0.0097, "step": 479030 }, { "epoch": 1.24, "learning_rate": 0.00011373888294135791, "loss": 0.0103, "step": 479040 }, { "epoch": 1.24, "learning_rate": 0.00011373499472498644, "loss": 0.0093, "step": 479050 }, { "epoch": 1.24, "learning_rate": 0.00011373110650861498, "loss": 0.0115, "step": 479060 }, { "epoch": 1.24, "learning_rate": 0.00011372721829224351, "loss": 0.0153, "step": 479070 }, { "epoch": 1.24, "learning_rate": 0.00011372333007587207, "loss": 0.0104, "step": 479080 }, { "epoch": 1.24, "learning_rate": 0.00011371944185950058, "loss": 0.0125, "step": 479090 }, { "epoch": 1.24, "learning_rate": 0.00011371555364312911, "loss": 0.013, "step": 479100 }, { "epoch": 1.24, "learning_rate": 0.00011371166542675766, "loss": 0.0094, "step": 479110 }, { "epoch": 1.24, "learning_rate": 0.00011370777721038619, "loss": 0.0137, "step": 479120 }, { "epoch": 1.24, "learning_rate": 0.00011370388899401473, "loss": 0.0106, "step": 479130 }, { "epoch": 1.24, "learning_rate": 0.00011370000077764326, "loss": 0.0121, "step": 479140 }, { "epoch": 1.24, "learning_rate": 0.0001136961125612718, "loss": 0.01, "step": 479150 }, { "epoch": 1.24, "learning_rate": 0.00011369222434490033, "loss": 0.0098, "step": 479160 }, { "epoch": 1.24, "learning_rate": 0.00011368833612852887, "loss": 0.0124, "step": 479170 }, { "epoch": 1.24, "learning_rate": 0.0001136844479121574, "loss": 0.0104, "step": 479180 }, { "epoch": 1.24, "learning_rate": 0.00011368055969578594, "loss": 0.0125, "step": 479190 }, { "epoch": 1.24, "learning_rate": 0.00011367667147941447, "loss": 0.0091, "step": 479200 }, { "epoch": 1.24, "learning_rate": 0.00011367278326304301, "loss": 0.0102, "step": 479210 }, { "epoch": 1.24, "learning_rate": 0.00011366889504667154, "loss": 0.0096, "step": 479220 }, { "epoch": 1.24, "learning_rate": 0.00011366500683030008, "loss": 0.0102, "step": 479230 }, { "epoch": 1.24, "learning_rate": 0.00011366111861392861, "loss": 0.0079, "step": 479240 }, { "epoch": 1.24, "learning_rate": 0.00011365723039755715, "loss": 0.0098, "step": 479250 }, { "epoch": 1.24, "learning_rate": 0.00011365334218118568, "loss": 0.0137, "step": 479260 }, { "epoch": 1.24, "learning_rate": 0.00011364945396481424, "loss": 0.0161, "step": 479270 }, { "epoch": 1.24, "learning_rate": 0.00011364556574844276, "loss": 0.0123, "step": 479280 }, { "epoch": 1.24, "learning_rate": 0.0001136416775320713, "loss": 0.0094, "step": 479290 }, { "epoch": 1.24, "learning_rate": 0.00011363778931569983, "loss": 0.0109, "step": 479300 }, { "epoch": 1.24, "learning_rate": 0.00011363390109932837, "loss": 0.0074, "step": 479310 }, { "epoch": 1.24, "learning_rate": 0.0001136300128829569, "loss": 0.0099, "step": 479320 }, { "epoch": 1.24, "learning_rate": 0.00011362612466658544, "loss": 0.0129, "step": 479330 }, { "epoch": 1.24, "learning_rate": 0.00011362223645021397, "loss": 0.0094, "step": 479340 }, { "epoch": 1.24, "learning_rate": 0.0001136183482338425, "loss": 0.0086, "step": 479350 }, { "epoch": 1.24, "learning_rate": 0.00011361446001747104, "loss": 0.0116, "step": 479360 }, { "epoch": 1.24, "learning_rate": 0.00011361057180109957, "loss": 0.0136, "step": 479370 }, { "epoch": 1.24, "learning_rate": 0.00011360668358472811, "loss": 0.012, "step": 479380 }, { "epoch": 1.24, "learning_rate": 0.00011360279536835664, "loss": 0.0069, "step": 479390 }, { "epoch": 1.24, "learning_rate": 0.00011359890715198518, "loss": 0.0095, "step": 479400 }, { "epoch": 1.24, "learning_rate": 0.00011359501893561371, "loss": 0.0105, "step": 479410 }, { "epoch": 1.24, "learning_rate": 0.00011359113071924225, "loss": 0.0103, "step": 479420 }, { "epoch": 1.24, "learning_rate": 0.00011358724250287078, "loss": 0.0143, "step": 479430 }, { "epoch": 1.24, "learning_rate": 0.00011358335428649933, "loss": 0.0097, "step": 479440 }, { "epoch": 1.24, "learning_rate": 0.00011357946607012785, "loss": 0.0103, "step": 479450 }, { "epoch": 1.24, "learning_rate": 0.0001135755778537564, "loss": 0.0092, "step": 479460 }, { "epoch": 1.24, "learning_rate": 0.00011357168963738493, "loss": 0.0112, "step": 479470 }, { "epoch": 1.24, "learning_rate": 0.00011356780142101347, "loss": 0.0117, "step": 479480 }, { "epoch": 1.24, "learning_rate": 0.000113563913204642, "loss": 0.0142, "step": 479490 }, { "epoch": 1.24, "learning_rate": 0.00011356002498827054, "loss": 0.0134, "step": 479500 }, { "epoch": 1.24, "learning_rate": 0.00011355613677189907, "loss": 0.01, "step": 479510 }, { "epoch": 1.24, "learning_rate": 0.00011355224855552761, "loss": 0.0133, "step": 479520 }, { "epoch": 1.24, "learning_rate": 0.00011354836033915614, "loss": 0.0085, "step": 479530 }, { "epoch": 1.24, "learning_rate": 0.00011354447212278468, "loss": 0.0116, "step": 479540 }, { "epoch": 1.24, "learning_rate": 0.00011354058390641321, "loss": 0.0149, "step": 479550 }, { "epoch": 1.24, "learning_rate": 0.00011353669569004175, "loss": 0.0098, "step": 479560 }, { "epoch": 1.24, "learning_rate": 0.00011353280747367028, "loss": 0.0112, "step": 479570 }, { "epoch": 1.24, "learning_rate": 0.00011352891925729882, "loss": 0.0115, "step": 479580 }, { "epoch": 1.24, "learning_rate": 0.00011352503104092735, "loss": 0.0081, "step": 479590 }, { "epoch": 1.24, "learning_rate": 0.00011352114282455588, "loss": 0.0114, "step": 479600 }, { "epoch": 1.24, "learning_rate": 0.00011351725460818442, "loss": 0.0088, "step": 479610 }, { "epoch": 1.24, "learning_rate": 0.00011351336639181295, "loss": 0.009, "step": 479620 }, { "epoch": 1.24, "learning_rate": 0.0001135094781754415, "loss": 0.0084, "step": 479630 }, { "epoch": 1.24, "learning_rate": 0.00011350558995907003, "loss": 0.0093, "step": 479640 }, { "epoch": 1.24, "learning_rate": 0.00011350170174269857, "loss": 0.0093, "step": 479650 }, { "epoch": 1.24, "learning_rate": 0.0001134978135263271, "loss": 0.0061, "step": 479660 }, { "epoch": 1.24, "learning_rate": 0.00011349392530995564, "loss": 0.0105, "step": 479670 }, { "epoch": 1.24, "learning_rate": 0.00011349003709358417, "loss": 0.013, "step": 479680 }, { "epoch": 1.24, "learning_rate": 0.00011348614887721271, "loss": 0.0126, "step": 479690 }, { "epoch": 1.24, "learning_rate": 0.00011348226066084124, "loss": 0.019, "step": 479700 }, { "epoch": 1.24, "learning_rate": 0.00011347837244446978, "loss": 0.0089, "step": 479710 }, { "epoch": 1.24, "learning_rate": 0.00011347448422809831, "loss": 0.0127, "step": 479720 }, { "epoch": 1.24, "learning_rate": 0.00011347059601172685, "loss": 0.01, "step": 479730 }, { "epoch": 1.24, "learning_rate": 0.00011346670779535538, "loss": 0.0106, "step": 479740 }, { "epoch": 1.24, "learning_rate": 0.00011346281957898392, "loss": 0.0091, "step": 479750 }, { "epoch": 1.24, "learning_rate": 0.00011345893136261245, "loss": 0.0167, "step": 479760 }, { "epoch": 1.24, "learning_rate": 0.00011345504314624099, "loss": 0.0074, "step": 479770 }, { "epoch": 1.24, "learning_rate": 0.00011345115492986952, "loss": 0.0075, "step": 479780 }, { "epoch": 1.24, "learning_rate": 0.00011344726671349808, "loss": 0.0131, "step": 479790 }, { "epoch": 1.24, "learning_rate": 0.0001134433784971266, "loss": 0.0173, "step": 479800 }, { "epoch": 1.24, "learning_rate": 0.00011343949028075514, "loss": 0.0098, "step": 479810 }, { "epoch": 1.24, "learning_rate": 0.00011343560206438367, "loss": 0.0154, "step": 479820 }, { "epoch": 1.24, "learning_rate": 0.00011343171384801221, "loss": 0.0086, "step": 479830 }, { "epoch": 1.24, "learning_rate": 0.00011342782563164074, "loss": 0.0107, "step": 479840 }, { "epoch": 1.24, "learning_rate": 0.00011342393741526927, "loss": 0.0091, "step": 479850 }, { "epoch": 1.24, "learning_rate": 0.00011342004919889781, "loss": 0.0096, "step": 479860 }, { "epoch": 1.24, "learning_rate": 0.00011341616098252634, "loss": 0.0121, "step": 479870 }, { "epoch": 1.24, "learning_rate": 0.00011341227276615488, "loss": 0.012, "step": 479880 }, { "epoch": 1.24, "learning_rate": 0.00011340838454978341, "loss": 0.0109, "step": 479890 }, { "epoch": 1.24, "learning_rate": 0.00011340449633341195, "loss": 0.0088, "step": 479900 }, { "epoch": 1.24, "learning_rate": 0.00011340060811704048, "loss": 0.0106, "step": 479910 }, { "epoch": 1.24, "learning_rate": 0.00011339671990066902, "loss": 0.012, "step": 479920 }, { "epoch": 1.24, "learning_rate": 0.00011339283168429755, "loss": 0.0112, "step": 479930 }, { "epoch": 1.24, "learning_rate": 0.00011338894346792609, "loss": 0.0077, "step": 479940 }, { "epoch": 1.24, "learning_rate": 0.00011338505525155462, "loss": 0.0136, "step": 479950 }, { "epoch": 1.24, "learning_rate": 0.00011338116703518317, "loss": 0.0107, "step": 479960 }, { "epoch": 1.24, "learning_rate": 0.00011337727881881169, "loss": 0.0087, "step": 479970 }, { "epoch": 1.24, "learning_rate": 0.00011337339060244024, "loss": 0.0121, "step": 479980 }, { "epoch": 1.24, "learning_rate": 0.00011336950238606877, "loss": 0.011, "step": 479990 }, { "epoch": 1.24, "learning_rate": 0.00011336561416969731, "loss": 0.0108, "step": 480000 }, { "epoch": 1.24, "eval_cer": 0.8816606972151424, "eval_loss": 0.0065583763644099236, "eval_runtime": 107.8502, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 480000 }, { "epoch": 1.24, "learning_rate": 0.00011336172595332584, "loss": 0.0118, "step": 480010 }, { "epoch": 1.24, "learning_rate": 0.00011335783773695438, "loss": 0.0136, "step": 480020 }, { "epoch": 1.24, "learning_rate": 0.00011335394952058291, "loss": 0.0105, "step": 480030 }, { "epoch": 1.24, "learning_rate": 0.00011335006130421145, "loss": 0.0116, "step": 480040 }, { "epoch": 1.24, "learning_rate": 0.00011334617308783998, "loss": 0.009, "step": 480050 }, { "epoch": 1.24, "learning_rate": 0.00011334228487146852, "loss": 0.0127, "step": 480060 }, { "epoch": 1.24, "learning_rate": 0.00011333839665509705, "loss": 0.0081, "step": 480070 }, { "epoch": 1.24, "learning_rate": 0.00011333450843872559, "loss": 0.0088, "step": 480080 }, { "epoch": 1.24, "learning_rate": 0.00011333062022235412, "loss": 0.0115, "step": 480090 }, { "epoch": 1.24, "learning_rate": 0.00011332673200598265, "loss": 0.0085, "step": 480100 }, { "epoch": 1.24, "learning_rate": 0.00011332284378961119, "loss": 0.0093, "step": 480110 }, { "epoch": 1.24, "learning_rate": 0.00011331895557323972, "loss": 0.0095, "step": 480120 }, { "epoch": 1.24, "learning_rate": 0.00011331506735686826, "loss": 0.0125, "step": 480130 }, { "epoch": 1.24, "learning_rate": 0.00011331117914049679, "loss": 0.0182, "step": 480140 }, { "epoch": 1.24, "learning_rate": 0.00011330729092412534, "loss": 0.0109, "step": 480150 }, { "epoch": 1.24, "learning_rate": 0.00011330340270775387, "loss": 0.0134, "step": 480160 }, { "epoch": 1.24, "learning_rate": 0.00011329951449138241, "loss": 0.007, "step": 480170 }, { "epoch": 1.24, "learning_rate": 0.00011329562627501094, "loss": 0.014, "step": 480180 }, { "epoch": 1.24, "learning_rate": 0.00011329173805863948, "loss": 0.0105, "step": 480190 }, { "epoch": 1.24, "learning_rate": 0.00011328784984226801, "loss": 0.0121, "step": 480200 }, { "epoch": 1.24, "learning_rate": 0.00011328396162589655, "loss": 0.0127, "step": 480210 }, { "epoch": 1.24, "learning_rate": 0.00011328007340952508, "loss": 0.0082, "step": 480220 }, { "epoch": 1.24, "learning_rate": 0.00011327618519315362, "loss": 0.0107, "step": 480230 }, { "epoch": 1.24, "learning_rate": 0.00011327229697678215, "loss": 0.0089, "step": 480240 }, { "epoch": 1.24, "learning_rate": 0.00011326840876041069, "loss": 0.0138, "step": 480250 }, { "epoch": 1.24, "learning_rate": 0.00011326452054403922, "loss": 0.01, "step": 480260 }, { "epoch": 1.24, "learning_rate": 0.00011326063232766776, "loss": 0.0108, "step": 480270 }, { "epoch": 1.24, "learning_rate": 0.00011325674411129629, "loss": 0.0122, "step": 480280 }, { "epoch": 1.24, "learning_rate": 0.00011325285589492483, "loss": 0.0105, "step": 480290 }, { "epoch": 1.25, "learning_rate": 0.00011324896767855336, "loss": 0.0093, "step": 480300 }, { "epoch": 1.25, "learning_rate": 0.00011324507946218192, "loss": 0.0076, "step": 480310 }, { "epoch": 1.25, "learning_rate": 0.00011324119124581044, "loss": 0.0098, "step": 480320 }, { "epoch": 1.25, "learning_rate": 0.00011323730302943898, "loss": 0.011, "step": 480330 }, { "epoch": 1.25, "learning_rate": 0.00011323341481306751, "loss": 0.0087, "step": 480340 }, { "epoch": 1.25, "learning_rate": 0.00011322952659669604, "loss": 0.0082, "step": 480350 }, { "epoch": 1.25, "learning_rate": 0.00011322563838032458, "loss": 0.0111, "step": 480360 }, { "epoch": 1.25, "learning_rate": 0.00011322175016395311, "loss": 0.0098, "step": 480370 }, { "epoch": 1.25, "learning_rate": 0.00011321786194758165, "loss": 0.0124, "step": 480380 }, { "epoch": 1.25, "learning_rate": 0.00011321397373121018, "loss": 0.0088, "step": 480390 }, { "epoch": 1.25, "learning_rate": 0.00011321008551483872, "loss": 0.012, "step": 480400 }, { "epoch": 1.25, "learning_rate": 0.00011320619729846725, "loss": 0.0115, "step": 480410 }, { "epoch": 1.25, "learning_rate": 0.00011320230908209579, "loss": 0.0092, "step": 480420 }, { "epoch": 1.25, "learning_rate": 0.00011319842086572432, "loss": 0.0099, "step": 480430 }, { "epoch": 1.25, "learning_rate": 0.00011319453264935286, "loss": 0.0112, "step": 480440 }, { "epoch": 1.25, "learning_rate": 0.00011319064443298139, "loss": 0.0081, "step": 480450 }, { "epoch": 1.25, "learning_rate": 0.00011318675621660993, "loss": 0.0105, "step": 480460 }, { "epoch": 1.25, "learning_rate": 0.00011318286800023846, "loss": 0.0132, "step": 480470 }, { "epoch": 1.25, "learning_rate": 0.000113178979783867, "loss": 0.0127, "step": 480480 }, { "epoch": 1.25, "learning_rate": 0.00011317509156749553, "loss": 0.0138, "step": 480490 }, { "epoch": 1.25, "learning_rate": 0.00011317120335112408, "loss": 0.0109, "step": 480500 }, { "epoch": 1.25, "learning_rate": 0.00011316731513475261, "loss": 0.0118, "step": 480510 }, { "epoch": 1.25, "learning_rate": 0.00011316342691838115, "loss": 0.0103, "step": 480520 }, { "epoch": 1.25, "learning_rate": 0.00011315953870200968, "loss": 0.0093, "step": 480530 }, { "epoch": 1.25, "learning_rate": 0.00011315565048563822, "loss": 0.0102, "step": 480540 }, { "epoch": 1.25, "learning_rate": 0.00011315176226926675, "loss": 0.0089, "step": 480550 }, { "epoch": 1.25, "learning_rate": 0.0001131478740528953, "loss": 0.0096, "step": 480560 }, { "epoch": 1.25, "learning_rate": 0.00011314398583652382, "loss": 0.0162, "step": 480570 }, { "epoch": 1.25, "learning_rate": 0.00011314009762015236, "loss": 0.0075, "step": 480580 }, { "epoch": 1.25, "learning_rate": 0.00011313620940378089, "loss": 0.0113, "step": 480590 }, { "epoch": 1.25, "learning_rate": 0.00011313232118740942, "loss": 0.0097, "step": 480600 }, { "epoch": 1.25, "learning_rate": 0.00011312843297103796, "loss": 0.0087, "step": 480610 }, { "epoch": 1.25, "learning_rate": 0.00011312454475466649, "loss": 0.0081, "step": 480620 }, { "epoch": 1.25, "learning_rate": 0.00011312065653829503, "loss": 0.0103, "step": 480630 }, { "epoch": 1.25, "learning_rate": 0.00011311676832192356, "loss": 0.0107, "step": 480640 }, { "epoch": 1.25, "learning_rate": 0.0001131128801055521, "loss": 0.0093, "step": 480650 }, { "epoch": 1.25, "learning_rate": 0.00011310899188918063, "loss": 0.0086, "step": 480660 }, { "epoch": 1.25, "learning_rate": 0.00011310510367280918, "loss": 0.0079, "step": 480670 }, { "epoch": 1.25, "learning_rate": 0.0001131012154564377, "loss": 0.0149, "step": 480680 }, { "epoch": 1.25, "learning_rate": 0.00011309732724006625, "loss": 0.0069, "step": 480690 }, { "epoch": 1.25, "learning_rate": 0.00011309343902369478, "loss": 0.0093, "step": 480700 }, { "epoch": 1.25, "learning_rate": 0.00011308955080732332, "loss": 0.0089, "step": 480710 }, { "epoch": 1.25, "learning_rate": 0.00011308566259095185, "loss": 0.0096, "step": 480720 }, { "epoch": 1.25, "learning_rate": 0.00011308177437458039, "loss": 0.0088, "step": 480730 }, { "epoch": 1.25, "learning_rate": 0.00011307788615820892, "loss": 0.01, "step": 480740 }, { "epoch": 1.25, "learning_rate": 0.00011307399794183746, "loss": 0.0134, "step": 480750 }, { "epoch": 1.25, "learning_rate": 0.00011307010972546599, "loss": 0.0105, "step": 480760 }, { "epoch": 1.25, "learning_rate": 0.00011306622150909453, "loss": 0.0092, "step": 480770 }, { "epoch": 1.25, "learning_rate": 0.00011306233329272306, "loss": 0.0129, "step": 480780 }, { "epoch": 1.25, "learning_rate": 0.0001130584450763516, "loss": 0.0135, "step": 480790 }, { "epoch": 1.25, "learning_rate": 0.00011305455685998013, "loss": 0.0089, "step": 480800 }, { "epoch": 1.25, "learning_rate": 0.00011305066864360867, "loss": 0.0095, "step": 480810 }, { "epoch": 1.25, "learning_rate": 0.0001130467804272372, "loss": 0.0134, "step": 480820 }, { "epoch": 1.25, "learning_rate": 0.00011304289221086576, "loss": 0.0093, "step": 480830 }, { "epoch": 1.25, "learning_rate": 0.00011303900399449427, "loss": 0.0124, "step": 480840 }, { "epoch": 1.25, "learning_rate": 0.0001130351157781228, "loss": 0.0124, "step": 480850 }, { "epoch": 1.25, "learning_rate": 0.00011303122756175135, "loss": 0.0081, "step": 480860 }, { "epoch": 1.25, "learning_rate": 0.00011302733934537988, "loss": 0.0068, "step": 480870 }, { "epoch": 1.25, "learning_rate": 0.00011302345112900842, "loss": 0.012, "step": 480880 }, { "epoch": 1.25, "learning_rate": 0.00011301956291263695, "loss": 0.0127, "step": 480890 }, { "epoch": 1.25, "learning_rate": 0.00011301567469626549, "loss": 0.0102, "step": 480900 }, { "epoch": 1.25, "learning_rate": 0.00011301178647989402, "loss": 0.0103, "step": 480910 }, { "epoch": 1.25, "learning_rate": 0.00011300789826352256, "loss": 0.0107, "step": 480920 }, { "epoch": 1.25, "learning_rate": 0.00011300401004715109, "loss": 0.0113, "step": 480930 }, { "epoch": 1.25, "learning_rate": 0.00011300012183077963, "loss": 0.0122, "step": 480940 }, { "epoch": 1.25, "learning_rate": 0.00011299623361440816, "loss": 0.011, "step": 480950 }, { "epoch": 1.25, "learning_rate": 0.0001129923453980367, "loss": 0.0103, "step": 480960 }, { "epoch": 1.25, "learning_rate": 0.00011298845718166523, "loss": 0.0138, "step": 480970 }, { "epoch": 1.25, "learning_rate": 0.00011298456896529377, "loss": 0.0079, "step": 480980 }, { "epoch": 1.25, "learning_rate": 0.0001129806807489223, "loss": 0.0094, "step": 480990 }, { "epoch": 1.25, "learning_rate": 0.00011297679253255084, "loss": 0.0123, "step": 481000 }, { "epoch": 1.25, "eval_cer": 0.8816774928583525, "eval_loss": 0.006680840160697699, "eval_runtime": 108.1021, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 481000 }, { "epoch": 1.25, "learning_rate": 0.00011297290431617937, "loss": 0.0169, "step": 481010 }, { "epoch": 1.25, "learning_rate": 0.00011296901609980792, "loss": 0.0127, "step": 481020 }, { "epoch": 1.25, "learning_rate": 0.00011296512788343645, "loss": 0.0091, "step": 481030 }, { "epoch": 1.25, "learning_rate": 0.000112961239667065, "loss": 0.0098, "step": 481040 }, { "epoch": 1.25, "learning_rate": 0.00011295735145069352, "loss": 0.0087, "step": 481050 }, { "epoch": 1.25, "learning_rate": 0.00011295346323432206, "loss": 0.0097, "step": 481060 }, { "epoch": 1.25, "learning_rate": 0.00011294957501795059, "loss": 0.0094, "step": 481070 }, { "epoch": 1.25, "learning_rate": 0.00011294568680157912, "loss": 0.0102, "step": 481080 }, { "epoch": 1.25, "learning_rate": 0.00011294179858520766, "loss": 0.0107, "step": 481090 }, { "epoch": 1.25, "learning_rate": 0.00011293791036883619, "loss": 0.0088, "step": 481100 }, { "epoch": 1.25, "learning_rate": 0.00011293402215246473, "loss": 0.0086, "step": 481110 }, { "epoch": 1.25, "learning_rate": 0.00011293013393609326, "loss": 0.0107, "step": 481120 }, { "epoch": 1.25, "learning_rate": 0.0001129262457197218, "loss": 0.0097, "step": 481130 }, { "epoch": 1.25, "learning_rate": 0.00011292235750335033, "loss": 0.0107, "step": 481140 }, { "epoch": 1.25, "learning_rate": 0.00011291846928697887, "loss": 0.0117, "step": 481150 }, { "epoch": 1.25, "learning_rate": 0.0001129145810706074, "loss": 0.0089, "step": 481160 }, { "epoch": 1.25, "learning_rate": 0.00011291069285423594, "loss": 0.0131, "step": 481170 }, { "epoch": 1.25, "learning_rate": 0.00011290680463786447, "loss": 0.0125, "step": 481180 }, { "epoch": 1.25, "learning_rate": 0.00011290291642149302, "loss": 0.0091, "step": 481190 }, { "epoch": 1.25, "learning_rate": 0.00011289902820512154, "loss": 0.0129, "step": 481200 }, { "epoch": 1.25, "learning_rate": 0.0001128951399887501, "loss": 0.0105, "step": 481210 }, { "epoch": 1.25, "learning_rate": 0.00011289125177237862, "loss": 0.0119, "step": 481220 }, { "epoch": 1.25, "learning_rate": 0.00011288736355600716, "loss": 0.0099, "step": 481230 }, { "epoch": 1.25, "learning_rate": 0.00011288347533963569, "loss": 0.0124, "step": 481240 }, { "epoch": 1.25, "learning_rate": 0.00011287958712326423, "loss": 0.0106, "step": 481250 }, { "epoch": 1.25, "learning_rate": 0.00011287569890689276, "loss": 0.0095, "step": 481260 }, { "epoch": 1.25, "learning_rate": 0.0001128718106905213, "loss": 0.0134, "step": 481270 }, { "epoch": 1.25, "learning_rate": 0.00011286792247414983, "loss": 0.0111, "step": 481280 }, { "epoch": 1.25, "learning_rate": 0.00011286403425777837, "loss": 0.0091, "step": 481290 }, { "epoch": 1.25, "learning_rate": 0.0001128601460414069, "loss": 0.0113, "step": 481300 }, { "epoch": 1.25, "learning_rate": 0.00011285625782503544, "loss": 0.0131, "step": 481310 }, { "epoch": 1.25, "learning_rate": 0.00011285236960866397, "loss": 0.0093, "step": 481320 }, { "epoch": 1.25, "learning_rate": 0.0001128484813922925, "loss": 0.0114, "step": 481330 }, { "epoch": 1.25, "learning_rate": 0.00011284459317592104, "loss": 0.0178, "step": 481340 }, { "epoch": 1.25, "learning_rate": 0.00011284070495954957, "loss": 0.0146, "step": 481350 }, { "epoch": 1.25, "learning_rate": 0.00011283681674317811, "loss": 0.0113, "step": 481360 }, { "epoch": 1.25, "learning_rate": 0.00011283292852680664, "loss": 0.0176, "step": 481370 }, { "epoch": 1.25, "learning_rate": 0.00011282904031043519, "loss": 0.0125, "step": 481380 }, { "epoch": 1.25, "learning_rate": 0.00011282515209406372, "loss": 0.0101, "step": 481390 }, { "epoch": 1.25, "learning_rate": 0.00011282126387769226, "loss": 0.0125, "step": 481400 }, { "epoch": 1.25, "learning_rate": 0.00011281737566132079, "loss": 0.0148, "step": 481410 }, { "epoch": 1.25, "learning_rate": 0.00011281348744494933, "loss": 0.0117, "step": 481420 }, { "epoch": 1.25, "learning_rate": 0.00011280959922857786, "loss": 0.009, "step": 481430 }, { "epoch": 1.25, "learning_rate": 0.0001128057110122064, "loss": 0.0101, "step": 481440 }, { "epoch": 1.25, "learning_rate": 0.00011280182279583493, "loss": 0.013, "step": 481450 }, { "epoch": 1.25, "learning_rate": 0.00011279793457946347, "loss": 0.0126, "step": 481460 }, { "epoch": 1.25, "learning_rate": 0.000112794046363092, "loss": 0.0087, "step": 481470 }, { "epoch": 1.25, "learning_rate": 0.00011279015814672054, "loss": 0.0135, "step": 481480 }, { "epoch": 1.25, "learning_rate": 0.00011278626993034907, "loss": 0.0088, "step": 481490 }, { "epoch": 1.25, "learning_rate": 0.00011278238171397761, "loss": 0.0082, "step": 481500 }, { "epoch": 1.25, "learning_rate": 0.00011277849349760614, "loss": 0.0083, "step": 481510 }, { "epoch": 1.25, "learning_rate": 0.00011277460528123468, "loss": 0.0075, "step": 481520 }, { "epoch": 1.25, "learning_rate": 0.00011277071706486321, "loss": 0.011, "step": 481530 }, { "epoch": 1.25, "learning_rate": 0.00011276682884849176, "loss": 0.0095, "step": 481540 }, { "epoch": 1.25, "learning_rate": 0.00011276294063212029, "loss": 0.0112, "step": 481550 }, { "epoch": 1.25, "learning_rate": 0.00011275905241574883, "loss": 0.0144, "step": 481560 }, { "epoch": 1.25, "learning_rate": 0.00011275516419937736, "loss": 0.0101, "step": 481570 }, { "epoch": 1.25, "learning_rate": 0.00011275127598300589, "loss": 0.0138, "step": 481580 }, { "epoch": 1.25, "learning_rate": 0.00011274738776663443, "loss": 0.0094, "step": 481590 }, { "epoch": 1.25, "learning_rate": 0.00011274349955026296, "loss": 0.0108, "step": 481600 }, { "epoch": 1.25, "learning_rate": 0.0001127396113338915, "loss": 0.0093, "step": 481610 }, { "epoch": 1.25, "learning_rate": 0.00011273572311752003, "loss": 0.009, "step": 481620 }, { "epoch": 1.25, "learning_rate": 0.00011273183490114857, "loss": 0.0094, "step": 481630 }, { "epoch": 1.25, "learning_rate": 0.0001127279466847771, "loss": 0.0111, "step": 481640 }, { "epoch": 1.25, "learning_rate": 0.00011272405846840564, "loss": 0.0092, "step": 481650 }, { "epoch": 1.25, "learning_rate": 0.00011272017025203417, "loss": 0.0106, "step": 481660 }, { "epoch": 1.25, "learning_rate": 0.00011271628203566271, "loss": 0.0104, "step": 481670 }, { "epoch": 1.25, "learning_rate": 0.00011271239381929124, "loss": 0.0087, "step": 481680 }, { "epoch": 1.25, "learning_rate": 0.00011270850560291978, "loss": 0.0081, "step": 481690 }, { "epoch": 1.25, "learning_rate": 0.00011270461738654831, "loss": 0.0123, "step": 481700 }, { "epoch": 1.25, "learning_rate": 0.00011270072917017685, "loss": 0.0107, "step": 481710 }, { "epoch": 1.25, "learning_rate": 0.00011269684095380538, "loss": 0.0099, "step": 481720 }, { "epoch": 1.25, "learning_rate": 0.00011269295273743393, "loss": 0.0099, "step": 481730 }, { "epoch": 1.25, "learning_rate": 0.00011268906452106246, "loss": 0.0088, "step": 481740 }, { "epoch": 1.25, "learning_rate": 0.000112685176304691, "loss": 0.0113, "step": 481750 }, { "epoch": 1.25, "learning_rate": 0.00011268128808831953, "loss": 0.0094, "step": 481760 }, { "epoch": 1.25, "learning_rate": 0.00011267739987194807, "loss": 0.0098, "step": 481770 }, { "epoch": 1.25, "learning_rate": 0.0001126735116555766, "loss": 0.0118, "step": 481780 }, { "epoch": 1.25, "learning_rate": 0.00011266962343920514, "loss": 0.0109, "step": 481790 }, { "epoch": 1.25, "learning_rate": 0.00011266573522283367, "loss": 0.0101, "step": 481800 }, { "epoch": 1.25, "learning_rate": 0.00011266184700646221, "loss": 0.012, "step": 481810 }, { "epoch": 1.25, "learning_rate": 0.00011265795879009074, "loss": 0.0092, "step": 481820 }, { "epoch": 1.25, "learning_rate": 0.00011265407057371927, "loss": 0.0098, "step": 481830 }, { "epoch": 1.25, "learning_rate": 0.00011265018235734781, "loss": 0.0141, "step": 481840 }, { "epoch": 1.25, "learning_rate": 0.00011264629414097634, "loss": 0.009, "step": 481850 }, { "epoch": 1.25, "learning_rate": 0.00011264240592460488, "loss": 0.0092, "step": 481860 }, { "epoch": 1.25, "learning_rate": 0.00011263851770823341, "loss": 0.0089, "step": 481870 }, { "epoch": 1.25, "learning_rate": 0.00011263462949186195, "loss": 0.0085, "step": 481880 }, { "epoch": 1.25, "learning_rate": 0.00011263074127549048, "loss": 0.0113, "step": 481890 }, { "epoch": 1.25, "learning_rate": 0.00011262685305911903, "loss": 0.0169, "step": 481900 }, { "epoch": 1.25, "learning_rate": 0.00011262296484274755, "loss": 0.0111, "step": 481910 }, { "epoch": 1.25, "learning_rate": 0.0001126190766263761, "loss": 0.0108, "step": 481920 }, { "epoch": 1.25, "learning_rate": 0.00011261518841000463, "loss": 0.0114, "step": 481930 }, { "epoch": 1.25, "learning_rate": 0.00011261130019363317, "loss": 0.0093, "step": 481940 }, { "epoch": 1.25, "learning_rate": 0.0001126074119772617, "loss": 0.0127, "step": 481950 }, { "epoch": 1.25, "learning_rate": 0.00011260352376089024, "loss": 0.0096, "step": 481960 }, { "epoch": 1.25, "learning_rate": 0.00011259963554451877, "loss": 0.0095, "step": 481970 }, { "epoch": 1.25, "learning_rate": 0.00011259574732814731, "loss": 0.0088, "step": 481980 }, { "epoch": 1.25, "learning_rate": 0.00011259185911177584, "loss": 0.0082, "step": 481990 }, { "epoch": 1.25, "learning_rate": 0.00011258797089540438, "loss": 0.0084, "step": 482000 }, { "epoch": 1.25, "eval_cer": 0.8817404765203906, "eval_loss": 0.0068023488856852055, "eval_runtime": 107.9256, "eval_samples_per_second": 18.531, "eval_steps_per_second": 4.633, "step": 482000 }, { "epoch": 1.25, "learning_rate": 0.00011258408267903291, "loss": 0.0117, "step": 482010 }, { "epoch": 1.25, "learning_rate": 0.00011258019446266145, "loss": 0.0093, "step": 482020 }, { "epoch": 1.25, "learning_rate": 0.00011257630624628998, "loss": 0.0091, "step": 482030 }, { "epoch": 1.25, "learning_rate": 0.00011257241802991852, "loss": 0.009, "step": 482040 }, { "epoch": 1.25, "learning_rate": 0.00011256852981354705, "loss": 0.0155, "step": 482050 }, { "epoch": 1.25, "learning_rate": 0.0001125646415971756, "loss": 0.0116, "step": 482060 }, { "epoch": 1.25, "learning_rate": 0.00011256075338080412, "loss": 0.0093, "step": 482070 }, { "epoch": 1.25, "learning_rate": 0.00011255686516443265, "loss": 0.0097, "step": 482080 }, { "epoch": 1.25, "learning_rate": 0.0001125529769480612, "loss": 0.0132, "step": 482090 }, { "epoch": 1.25, "learning_rate": 0.00011254908873168973, "loss": 0.0089, "step": 482100 }, { "epoch": 1.25, "learning_rate": 0.00011254520051531827, "loss": 0.0136, "step": 482110 }, { "epoch": 1.25, "learning_rate": 0.0001125413122989468, "loss": 0.0141, "step": 482120 }, { "epoch": 1.25, "learning_rate": 0.00011253742408257534, "loss": 0.0161, "step": 482130 }, { "epoch": 1.25, "learning_rate": 0.00011253353586620387, "loss": 0.0105, "step": 482140 }, { "epoch": 1.25, "learning_rate": 0.00011252964764983241, "loss": 0.0099, "step": 482150 }, { "epoch": 1.25, "learning_rate": 0.00011252575943346094, "loss": 0.0115, "step": 482160 }, { "epoch": 1.25, "learning_rate": 0.00011252187121708948, "loss": 0.0084, "step": 482170 }, { "epoch": 1.25, "learning_rate": 0.00011251798300071801, "loss": 0.0106, "step": 482180 }, { "epoch": 1.25, "learning_rate": 0.00011251409478434655, "loss": 0.012, "step": 482190 }, { "epoch": 1.25, "learning_rate": 0.00011251020656797508, "loss": 0.0149, "step": 482200 }, { "epoch": 1.25, "learning_rate": 0.00011250631835160362, "loss": 0.0098, "step": 482210 }, { "epoch": 1.25, "learning_rate": 0.00011250243013523215, "loss": 0.0108, "step": 482220 }, { "epoch": 1.25, "learning_rate": 0.00011249854191886069, "loss": 0.0081, "step": 482230 }, { "epoch": 1.25, "learning_rate": 0.00011249465370248922, "loss": 0.0149, "step": 482240 }, { "epoch": 1.25, "learning_rate": 0.00011249076548611777, "loss": 0.0159, "step": 482250 }, { "epoch": 1.25, "learning_rate": 0.0001124868772697463, "loss": 0.0126, "step": 482260 }, { "epoch": 1.25, "learning_rate": 0.00011248298905337484, "loss": 0.0106, "step": 482270 }, { "epoch": 1.25, "learning_rate": 0.00011247910083700337, "loss": 0.0092, "step": 482280 }, { "epoch": 1.25, "learning_rate": 0.00011247521262063191, "loss": 0.0133, "step": 482290 }, { "epoch": 1.25, "learning_rate": 0.00011247132440426044, "loss": 0.011, "step": 482300 }, { "epoch": 1.25, "learning_rate": 0.00011246743618788898, "loss": 0.0128, "step": 482310 }, { "epoch": 1.25, "learning_rate": 0.00011246354797151751, "loss": 0.0089, "step": 482320 }, { "epoch": 1.25, "learning_rate": 0.00011245965975514604, "loss": 0.0083, "step": 482330 }, { "epoch": 1.25, "learning_rate": 0.00011245577153877458, "loss": 0.0124, "step": 482340 }, { "epoch": 1.25, "learning_rate": 0.00011245188332240311, "loss": 0.0105, "step": 482350 }, { "epoch": 1.25, "learning_rate": 0.00011244799510603165, "loss": 0.0101, "step": 482360 }, { "epoch": 1.25, "learning_rate": 0.00011244410688966018, "loss": 0.0091, "step": 482370 }, { "epoch": 1.25, "learning_rate": 0.00011244021867328872, "loss": 0.0094, "step": 482380 }, { "epoch": 1.25, "learning_rate": 0.00011243633045691725, "loss": 0.0091, "step": 482390 }, { "epoch": 1.25, "learning_rate": 0.00011243244224054579, "loss": 0.0136, "step": 482400 }, { "epoch": 1.25, "learning_rate": 0.00011242855402417432, "loss": 0.0087, "step": 482410 }, { "epoch": 1.25, "learning_rate": 0.00011242466580780287, "loss": 0.0104, "step": 482420 }, { "epoch": 1.25, "learning_rate": 0.00011242077759143139, "loss": 0.0102, "step": 482430 }, { "epoch": 1.25, "learning_rate": 0.00011241688937505994, "loss": 0.0109, "step": 482440 }, { "epoch": 1.25, "learning_rate": 0.00011241300115868847, "loss": 0.0089, "step": 482450 }, { "epoch": 1.25, "learning_rate": 0.00011240911294231701, "loss": 0.0098, "step": 482460 }, { "epoch": 1.25, "learning_rate": 0.00011240522472594554, "loss": 0.0098, "step": 482470 }, { "epoch": 1.25, "learning_rate": 0.00011240133650957408, "loss": 0.0113, "step": 482480 }, { "epoch": 1.25, "learning_rate": 0.00011239744829320261, "loss": 0.0123, "step": 482490 }, { "epoch": 1.25, "learning_rate": 0.00011239356007683115, "loss": 0.0135, "step": 482500 }, { "epoch": 1.25, "learning_rate": 0.00011238967186045968, "loss": 0.0095, "step": 482510 }, { "epoch": 1.25, "learning_rate": 0.00011238578364408822, "loss": 0.0111, "step": 482520 }, { "epoch": 1.25, "learning_rate": 0.00011238189542771675, "loss": 0.0137, "step": 482530 }, { "epoch": 1.25, "learning_rate": 0.00011237800721134529, "loss": 0.0071, "step": 482540 }, { "epoch": 1.25, "learning_rate": 0.00011237411899497382, "loss": 0.0119, "step": 482550 }, { "epoch": 1.25, "learning_rate": 0.00011237023077860236, "loss": 0.0079, "step": 482560 }, { "epoch": 1.25, "learning_rate": 0.00011236634256223089, "loss": 0.0069, "step": 482570 }, { "epoch": 1.25, "learning_rate": 0.00011236245434585942, "loss": 0.009, "step": 482580 }, { "epoch": 1.25, "learning_rate": 0.00011235856612948796, "loss": 0.0109, "step": 482590 }, { "epoch": 1.25, "learning_rate": 0.00011235467791311649, "loss": 0.01, "step": 482600 }, { "epoch": 1.25, "learning_rate": 0.00011235078969674504, "loss": 0.0098, "step": 482610 }, { "epoch": 1.25, "learning_rate": 0.00011234690148037357, "loss": 0.0121, "step": 482620 }, { "epoch": 1.25, "learning_rate": 0.00011234301326400211, "loss": 0.0123, "step": 482630 }, { "epoch": 1.25, "learning_rate": 0.00011233912504763064, "loss": 0.0107, "step": 482640 }, { "epoch": 1.25, "learning_rate": 0.00011233523683125918, "loss": 0.0098, "step": 482650 }, { "epoch": 1.25, "learning_rate": 0.00011233134861488771, "loss": 0.012, "step": 482660 }, { "epoch": 1.25, "learning_rate": 0.00011232746039851625, "loss": 0.0102, "step": 482670 }, { "epoch": 1.25, "learning_rate": 0.00011232357218214478, "loss": 0.0106, "step": 482680 }, { "epoch": 1.25, "learning_rate": 0.00011231968396577332, "loss": 0.01, "step": 482690 }, { "epoch": 1.25, "learning_rate": 0.00011231579574940185, "loss": 0.0107, "step": 482700 }, { "epoch": 1.25, "learning_rate": 0.00011231190753303039, "loss": 0.0112, "step": 482710 }, { "epoch": 1.25, "learning_rate": 0.00011230801931665892, "loss": 0.0112, "step": 482720 }, { "epoch": 1.25, "learning_rate": 0.00011230413110028746, "loss": 0.0124, "step": 482730 }, { "epoch": 1.25, "learning_rate": 0.00011230024288391599, "loss": 0.0109, "step": 482740 }, { "epoch": 1.25, "learning_rate": 0.00011229635466754453, "loss": 0.0082, "step": 482750 }, { "epoch": 1.25, "learning_rate": 0.00011229246645117306, "loss": 0.0138, "step": 482760 }, { "epoch": 1.25, "learning_rate": 0.00011228857823480161, "loss": 0.0109, "step": 482770 }, { "epoch": 1.25, "learning_rate": 0.00011228469001843014, "loss": 0.01, "step": 482780 }, { "epoch": 1.25, "learning_rate": 0.00011228080180205868, "loss": 0.0095, "step": 482790 }, { "epoch": 1.25, "learning_rate": 0.00011227691358568721, "loss": 0.0139, "step": 482800 }, { "epoch": 1.25, "learning_rate": 0.00011227302536931575, "loss": 0.0134, "step": 482810 }, { "epoch": 1.25, "learning_rate": 0.00011226913715294428, "loss": 0.0159, "step": 482820 }, { "epoch": 1.25, "learning_rate": 0.00011226524893657281, "loss": 0.0097, "step": 482830 }, { "epoch": 1.25, "learning_rate": 0.00011226136072020135, "loss": 0.0149, "step": 482840 }, { "epoch": 1.25, "learning_rate": 0.00011225747250382988, "loss": 0.0092, "step": 482850 }, { "epoch": 1.25, "learning_rate": 0.00011225358428745842, "loss": 0.0106, "step": 482860 }, { "epoch": 1.25, "learning_rate": 0.00011224969607108695, "loss": 0.0128, "step": 482870 }, { "epoch": 1.25, "learning_rate": 0.00011224580785471549, "loss": 0.0114, "step": 482880 }, { "epoch": 1.25, "learning_rate": 0.00011224191963834402, "loss": 0.0074, "step": 482890 }, { "epoch": 1.25, "learning_rate": 0.00011223803142197256, "loss": 0.0113, "step": 482900 }, { "epoch": 1.25, "learning_rate": 0.00011223414320560109, "loss": 0.0105, "step": 482910 }, { "epoch": 1.25, "learning_rate": 0.00011223025498922963, "loss": 0.0127, "step": 482920 }, { "epoch": 1.25, "learning_rate": 0.00011222636677285816, "loss": 0.0138, "step": 482930 }, { "epoch": 1.25, "learning_rate": 0.00011222247855648671, "loss": 0.0109, "step": 482940 }, { "epoch": 1.25, "learning_rate": 0.00011221859034011523, "loss": 0.0128, "step": 482950 }, { "epoch": 1.25, "learning_rate": 0.00011221470212374378, "loss": 0.0094, "step": 482960 }, { "epoch": 1.25, "learning_rate": 0.00011221081390737231, "loss": 0.0131, "step": 482970 }, { "epoch": 1.25, "learning_rate": 0.00011220692569100085, "loss": 0.0131, "step": 482980 }, { "epoch": 1.25, "learning_rate": 0.00011220303747462938, "loss": 0.0117, "step": 482990 }, { "epoch": 1.25, "learning_rate": 0.00011219914925825792, "loss": 0.0086, "step": 483000 }, { "epoch": 1.25, "eval_cer": 0.8816788924952867, "eval_loss": 0.006821894086897373, "eval_runtime": 108.1122, "eval_samples_per_second": 18.499, "eval_steps_per_second": 4.625, "step": 483000 }, { "epoch": 1.25, "learning_rate": 0.00011219526104188645, "loss": 0.0116, "step": 483010 }, { "epoch": 1.25, "learning_rate": 0.00011219137282551499, "loss": 0.0119, "step": 483020 }, { "epoch": 1.25, "learning_rate": 0.00011218748460914352, "loss": 0.0102, "step": 483030 }, { "epoch": 1.25, "learning_rate": 0.00011218359639277206, "loss": 0.0115, "step": 483040 }, { "epoch": 1.25, "learning_rate": 0.00011217970817640059, "loss": 0.0167, "step": 483050 }, { "epoch": 1.25, "learning_rate": 0.00011217581996002913, "loss": 0.0088, "step": 483060 }, { "epoch": 1.25, "learning_rate": 0.00011217193174365766, "loss": 0.0074, "step": 483070 }, { "epoch": 1.25, "learning_rate": 0.00011216804352728619, "loss": 0.0087, "step": 483080 }, { "epoch": 1.25, "learning_rate": 0.00011216415531091473, "loss": 0.0137, "step": 483090 }, { "epoch": 1.25, "learning_rate": 0.00011216026709454326, "loss": 0.0126, "step": 483100 }, { "epoch": 1.25, "learning_rate": 0.0001121563788781718, "loss": 0.0093, "step": 483110 }, { "epoch": 1.25, "learning_rate": 0.00011215249066180033, "loss": 0.0106, "step": 483120 }, { "epoch": 1.25, "learning_rate": 0.00011214860244542888, "loss": 0.0124, "step": 483130 }, { "epoch": 1.25, "learning_rate": 0.00011214471422905741, "loss": 0.009, "step": 483140 }, { "epoch": 1.25, "learning_rate": 0.00011214082601268595, "loss": 0.0108, "step": 483150 }, { "epoch": 1.25, "learning_rate": 0.00011213693779631448, "loss": 0.0112, "step": 483160 }, { "epoch": 1.25, "learning_rate": 0.00011213304957994302, "loss": 0.0093, "step": 483170 }, { "epoch": 1.25, "learning_rate": 0.00011212916136357155, "loss": 0.0098, "step": 483180 }, { "epoch": 1.25, "learning_rate": 0.00011212527314720009, "loss": 0.0101, "step": 483190 }, { "epoch": 1.25, "learning_rate": 0.00011212138493082862, "loss": 0.0141, "step": 483200 }, { "epoch": 1.25, "learning_rate": 0.00011211749671445716, "loss": 0.0114, "step": 483210 }, { "epoch": 1.25, "learning_rate": 0.00011211360849808569, "loss": 0.0178, "step": 483220 }, { "epoch": 1.25, "learning_rate": 0.00011210972028171423, "loss": 0.01, "step": 483230 }, { "epoch": 1.25, "learning_rate": 0.00011210583206534276, "loss": 0.0098, "step": 483240 }, { "epoch": 1.25, "learning_rate": 0.0001121019438489713, "loss": 0.0075, "step": 483250 }, { "epoch": 1.25, "learning_rate": 0.00011209805563259983, "loss": 0.0121, "step": 483260 }, { "epoch": 1.25, "learning_rate": 0.00011209416741622837, "loss": 0.0113, "step": 483270 }, { "epoch": 1.25, "learning_rate": 0.0001120902791998569, "loss": 0.0106, "step": 483280 }, { "epoch": 1.25, "learning_rate": 0.00011208639098348545, "loss": 0.0082, "step": 483290 }, { "epoch": 1.25, "learning_rate": 0.00011208250276711397, "loss": 0.0065, "step": 483300 }, { "epoch": 1.25, "learning_rate": 0.00011207861455074252, "loss": 0.0135, "step": 483310 }, { "epoch": 1.25, "learning_rate": 0.00011207472633437105, "loss": 0.0109, "step": 483320 }, { "epoch": 1.25, "learning_rate": 0.00011207083811799958, "loss": 0.0103, "step": 483330 }, { "epoch": 1.25, "learning_rate": 0.00011206694990162812, "loss": 0.0088, "step": 483340 }, { "epoch": 1.25, "learning_rate": 0.00011206306168525665, "loss": 0.0115, "step": 483350 }, { "epoch": 1.25, "learning_rate": 0.00011205917346888519, "loss": 0.0078, "step": 483360 }, { "epoch": 1.25, "learning_rate": 0.00011205528525251372, "loss": 0.0103, "step": 483370 }, { "epoch": 1.25, "learning_rate": 0.00011205139703614226, "loss": 0.0113, "step": 483380 }, { "epoch": 1.25, "learning_rate": 0.00011204750881977079, "loss": 0.0135, "step": 483390 }, { "epoch": 1.25, "learning_rate": 0.00011204362060339933, "loss": 0.0099, "step": 483400 }, { "epoch": 1.25, "learning_rate": 0.00011203973238702786, "loss": 0.0099, "step": 483410 }, { "epoch": 1.25, "learning_rate": 0.0001120358441706564, "loss": 0.0093, "step": 483420 }, { "epoch": 1.25, "learning_rate": 0.00011203195595428493, "loss": 0.012, "step": 483430 }, { "epoch": 1.25, "learning_rate": 0.00011202806773791347, "loss": 0.0104, "step": 483440 }, { "epoch": 1.25, "learning_rate": 0.000112024179521542, "loss": 0.0102, "step": 483450 }, { "epoch": 1.25, "learning_rate": 0.00011202029130517054, "loss": 0.0105, "step": 483460 }, { "epoch": 1.25, "learning_rate": 0.00011201640308879907, "loss": 0.0118, "step": 483470 }, { "epoch": 1.25, "learning_rate": 0.00011201251487242762, "loss": 0.0102, "step": 483480 }, { "epoch": 1.25, "learning_rate": 0.00011200862665605615, "loss": 0.01, "step": 483490 }, { "epoch": 1.25, "learning_rate": 0.00011200473843968469, "loss": 0.0115, "step": 483500 }, { "epoch": 1.25, "learning_rate": 0.00011200085022331322, "loss": 0.0114, "step": 483510 }, { "epoch": 1.25, "learning_rate": 0.00011199696200694176, "loss": 0.0098, "step": 483520 }, { "epoch": 1.25, "learning_rate": 0.00011199307379057029, "loss": 0.0122, "step": 483530 }, { "epoch": 1.25, "learning_rate": 0.00011198918557419883, "loss": 0.0075, "step": 483540 }, { "epoch": 1.25, "learning_rate": 0.00011198529735782736, "loss": 0.0105, "step": 483550 }, { "epoch": 1.25, "learning_rate": 0.00011198140914145589, "loss": 0.0106, "step": 483560 }, { "epoch": 1.25, "learning_rate": 0.00011197752092508443, "loss": 0.0112, "step": 483570 }, { "epoch": 1.25, "learning_rate": 0.00011197363270871296, "loss": 0.013, "step": 483580 }, { "epoch": 1.25, "learning_rate": 0.0001119697444923415, "loss": 0.0128, "step": 483590 }, { "epoch": 1.25, "learning_rate": 0.00011196585627597003, "loss": 0.0134, "step": 483600 }, { "epoch": 1.25, "learning_rate": 0.00011196196805959857, "loss": 0.0152, "step": 483610 }, { "epoch": 1.25, "learning_rate": 0.0001119580798432271, "loss": 0.0071, "step": 483620 }, { "epoch": 1.25, "learning_rate": 0.00011195419162685564, "loss": 0.0101, "step": 483630 }, { "epoch": 1.25, "learning_rate": 0.00011195030341048417, "loss": 0.0149, "step": 483640 }, { "epoch": 1.25, "learning_rate": 0.00011194641519411272, "loss": 0.0089, "step": 483650 }, { "epoch": 1.25, "learning_rate": 0.00011194252697774124, "loss": 0.0098, "step": 483660 }, { "epoch": 1.25, "learning_rate": 0.00011193863876136979, "loss": 0.012, "step": 483670 }, { "epoch": 1.25, "learning_rate": 0.00011193475054499832, "loss": 0.0097, "step": 483680 }, { "epoch": 1.25, "learning_rate": 0.00011193086232862686, "loss": 0.0115, "step": 483690 }, { "epoch": 1.25, "learning_rate": 0.00011192697411225539, "loss": 0.0126, "step": 483700 }, { "epoch": 1.25, "learning_rate": 0.00011192308589588393, "loss": 0.0116, "step": 483710 }, { "epoch": 1.25, "learning_rate": 0.00011191919767951246, "loss": 0.0131, "step": 483720 }, { "epoch": 1.25, "learning_rate": 0.000111915309463141, "loss": 0.011, "step": 483730 }, { "epoch": 1.25, "learning_rate": 0.00011191142124676953, "loss": 0.0111, "step": 483740 }, { "epoch": 1.25, "learning_rate": 0.00011190753303039807, "loss": 0.0155, "step": 483750 }, { "epoch": 1.25, "learning_rate": 0.0001119036448140266, "loss": 0.0101, "step": 483760 }, { "epoch": 1.25, "learning_rate": 0.00011189975659765514, "loss": 0.011, "step": 483770 }, { "epoch": 1.25, "learning_rate": 0.00011189586838128367, "loss": 0.013, "step": 483780 }, { "epoch": 1.25, "learning_rate": 0.00011189198016491221, "loss": 0.0109, "step": 483790 }, { "epoch": 1.25, "learning_rate": 0.00011188809194854074, "loss": 0.011, "step": 483800 }, { "epoch": 1.25, "learning_rate": 0.00011188420373216927, "loss": 0.009, "step": 483810 }, { "epoch": 1.25, "learning_rate": 0.00011188031551579781, "loss": 0.0121, "step": 483820 }, { "epoch": 1.25, "learning_rate": 0.00011187642729942634, "loss": 0.0114, "step": 483830 }, { "epoch": 1.25, "learning_rate": 0.00011187253908305489, "loss": 0.0137, "step": 483840 }, { "epoch": 1.25, "learning_rate": 0.00011186865086668342, "loss": 0.0082, "step": 483850 }, { "epoch": 1.25, "learning_rate": 0.00011186476265031196, "loss": 0.0125, "step": 483860 }, { "epoch": 1.25, "learning_rate": 0.00011186087443394049, "loss": 0.0106, "step": 483870 }, { "epoch": 1.25, "learning_rate": 0.00011185698621756903, "loss": 0.0132, "step": 483880 }, { "epoch": 1.25, "learning_rate": 0.00011185309800119756, "loss": 0.01, "step": 483890 }, { "epoch": 1.25, "learning_rate": 0.0001118492097848261, "loss": 0.0093, "step": 483900 }, { "epoch": 1.25, "learning_rate": 0.00011184532156845463, "loss": 0.0088, "step": 483910 }, { "epoch": 1.25, "learning_rate": 0.00011184143335208317, "loss": 0.011, "step": 483920 }, { "epoch": 1.25, "learning_rate": 0.0001118375451357117, "loss": 0.0109, "step": 483930 }, { "epoch": 1.25, "learning_rate": 0.00011183365691934024, "loss": 0.0096, "step": 483940 }, { "epoch": 1.25, "learning_rate": 0.00011182976870296877, "loss": 0.0115, "step": 483950 }, { "epoch": 1.25, "learning_rate": 0.00011182588048659731, "loss": 0.0101, "step": 483960 }, { "epoch": 1.25, "learning_rate": 0.00011182199227022584, "loss": 0.0109, "step": 483970 }, { "epoch": 1.25, "learning_rate": 0.00011181810405385438, "loss": 0.0112, "step": 483980 }, { "epoch": 1.25, "learning_rate": 0.00011181421583748291, "loss": 0.0116, "step": 483990 }, { "epoch": 1.25, "learning_rate": 0.00011181032762111146, "loss": 0.0101, "step": 484000 }, { "epoch": 1.25, "eval_cer": 0.8816942885015627, "eval_loss": 0.0068328119814395905, "eval_runtime": 108.0595, "eval_samples_per_second": 18.508, "eval_steps_per_second": 4.627, "step": 484000 }, { "epoch": 1.25, "learning_rate": 0.00011180643940473999, "loss": 0.0086, "step": 484010 }, { "epoch": 1.25, "learning_rate": 0.00011180255118836853, "loss": 0.0102, "step": 484020 }, { "epoch": 1.25, "learning_rate": 0.00011179866297199706, "loss": 0.0113, "step": 484030 }, { "epoch": 1.25, "learning_rate": 0.0001117947747556256, "loss": 0.0096, "step": 484040 }, { "epoch": 1.25, "learning_rate": 0.00011179088653925413, "loss": 0.0107, "step": 484050 }, { "epoch": 1.25, "learning_rate": 0.00011178699832288266, "loss": 0.0091, "step": 484060 }, { "epoch": 1.25, "learning_rate": 0.0001117831101065112, "loss": 0.0125, "step": 484070 }, { "epoch": 1.25, "learning_rate": 0.00011177922189013973, "loss": 0.0098, "step": 484080 }, { "epoch": 1.25, "learning_rate": 0.00011177533367376827, "loss": 0.0119, "step": 484090 }, { "epoch": 1.25, "learning_rate": 0.0001117714454573968, "loss": 0.0104, "step": 484100 }, { "epoch": 1.25, "learning_rate": 0.00011176755724102534, "loss": 0.0085, "step": 484110 }, { "epoch": 1.25, "learning_rate": 0.00011176366902465387, "loss": 0.0104, "step": 484120 }, { "epoch": 1.25, "learning_rate": 0.00011175978080828241, "loss": 0.0097, "step": 484130 }, { "epoch": 1.25, "learning_rate": 0.00011175589259191094, "loss": 0.0102, "step": 484140 }, { "epoch": 1.25, "learning_rate": 0.00011175200437553948, "loss": 0.0092, "step": 484150 }, { "epoch": 1.26, "learning_rate": 0.000111748116159168, "loss": 0.0101, "step": 484160 }, { "epoch": 1.26, "learning_rate": 0.00011174422794279656, "loss": 0.0125, "step": 484170 }, { "epoch": 1.26, "learning_rate": 0.00011174033972642508, "loss": 0.0101, "step": 484180 }, { "epoch": 1.26, "learning_rate": 0.00011173645151005363, "loss": 0.0082, "step": 484190 }, { "epoch": 1.26, "learning_rate": 0.00011173256329368216, "loss": 0.0116, "step": 484200 }, { "epoch": 1.26, "learning_rate": 0.0001117286750773107, "loss": 0.0109, "step": 484210 }, { "epoch": 1.26, "learning_rate": 0.00011172478686093923, "loss": 0.01, "step": 484220 }, { "epoch": 1.26, "learning_rate": 0.00011172089864456777, "loss": 0.0093, "step": 484230 }, { "epoch": 1.26, "learning_rate": 0.0001117170104281963, "loss": 0.0096, "step": 484240 }, { "epoch": 1.26, "learning_rate": 0.00011171312221182484, "loss": 0.0096, "step": 484250 }, { "epoch": 1.26, "learning_rate": 0.00011170923399545337, "loss": 0.0102, "step": 484260 }, { "epoch": 1.26, "learning_rate": 0.00011170534577908191, "loss": 0.0083, "step": 484270 }, { "epoch": 1.26, "learning_rate": 0.00011170145756271044, "loss": 0.0111, "step": 484280 }, { "epoch": 1.26, "learning_rate": 0.00011169756934633898, "loss": 0.0115, "step": 484290 }, { "epoch": 1.26, "learning_rate": 0.00011169368112996751, "loss": 0.0094, "step": 484300 }, { "epoch": 1.26, "learning_rate": 0.00011168979291359604, "loss": 0.0114, "step": 484310 }, { "epoch": 1.26, "learning_rate": 0.00011168590469722458, "loss": 0.0126, "step": 484320 }, { "epoch": 1.26, "learning_rate": 0.0001116820164808531, "loss": 0.0106, "step": 484330 }, { "epoch": 1.26, "learning_rate": 0.00011167812826448165, "loss": 0.013, "step": 484340 }, { "epoch": 1.26, "learning_rate": 0.00011167424004811018, "loss": 0.0105, "step": 484350 }, { "epoch": 1.26, "learning_rate": 0.00011167035183173873, "loss": 0.0095, "step": 484360 }, { "epoch": 1.26, "learning_rate": 0.00011166646361536726, "loss": 0.009, "step": 484370 }, { "epoch": 1.26, "learning_rate": 0.0001116625753989958, "loss": 0.0101, "step": 484380 }, { "epoch": 1.26, "learning_rate": 0.00011165868718262433, "loss": 0.0145, "step": 484390 }, { "epoch": 1.26, "learning_rate": 0.00011165479896625287, "loss": 0.0094, "step": 484400 }, { "epoch": 1.26, "learning_rate": 0.0001116509107498814, "loss": 0.0152, "step": 484410 }, { "epoch": 1.26, "learning_rate": 0.00011164702253350994, "loss": 0.01, "step": 484420 }, { "epoch": 1.26, "learning_rate": 0.00011164313431713847, "loss": 0.0098, "step": 484430 }, { "epoch": 1.26, "learning_rate": 0.00011163924610076701, "loss": 0.0094, "step": 484440 }, { "epoch": 1.26, "learning_rate": 0.00011163535788439554, "loss": 0.0128, "step": 484450 }, { "epoch": 1.26, "learning_rate": 0.00011163146966802408, "loss": 0.0098, "step": 484460 }, { "epoch": 1.26, "learning_rate": 0.00011162758145165261, "loss": 0.0085, "step": 484470 }, { "epoch": 1.26, "learning_rate": 0.00011162369323528115, "loss": 0.0107, "step": 484480 }, { "epoch": 1.26, "learning_rate": 0.00011161980501890968, "loss": 0.0122, "step": 484490 }, { "epoch": 1.26, "learning_rate": 0.00011161591680253822, "loss": 0.0084, "step": 484500 }, { "epoch": 1.26, "learning_rate": 0.00011161202858616675, "loss": 0.0087, "step": 484510 }, { "epoch": 1.26, "learning_rate": 0.0001116081403697953, "loss": 0.0123, "step": 484520 }, { "epoch": 1.26, "learning_rate": 0.00011160425215342382, "loss": 0.0112, "step": 484530 }, { "epoch": 1.26, "learning_rate": 0.00011160036393705237, "loss": 0.0079, "step": 484540 }, { "epoch": 1.26, "learning_rate": 0.0001115964757206809, "loss": 0.0105, "step": 484550 }, { "epoch": 1.26, "learning_rate": 0.00011159258750430943, "loss": 0.0123, "step": 484560 }, { "epoch": 1.26, "learning_rate": 0.00011158869928793797, "loss": 0.0108, "step": 484570 }, { "epoch": 1.26, "learning_rate": 0.0001115848110715665, "loss": 0.0108, "step": 484580 }, { "epoch": 1.26, "learning_rate": 0.00011158092285519504, "loss": 0.0141, "step": 484590 }, { "epoch": 1.26, "learning_rate": 0.00011157703463882357, "loss": 0.0116, "step": 484600 }, { "epoch": 1.26, "learning_rate": 0.00011157314642245211, "loss": 0.0133, "step": 484610 }, { "epoch": 1.26, "learning_rate": 0.00011156925820608064, "loss": 0.0107, "step": 484620 }, { "epoch": 1.26, "learning_rate": 0.00011156536998970918, "loss": 0.009, "step": 484630 }, { "epoch": 1.26, "learning_rate": 0.0001115614817733377, "loss": 0.0121, "step": 484640 }, { "epoch": 1.26, "learning_rate": 0.00011155759355696625, "loss": 0.0115, "step": 484650 }, { "epoch": 1.26, "learning_rate": 0.00011155370534059478, "loss": 0.0084, "step": 484660 }, { "epoch": 1.26, "learning_rate": 0.00011154981712422332, "loss": 0.008, "step": 484670 }, { "epoch": 1.26, "learning_rate": 0.00011154592890785185, "loss": 0.0123, "step": 484680 }, { "epoch": 1.26, "learning_rate": 0.00011154204069148039, "loss": 0.0097, "step": 484690 }, { "epoch": 1.26, "learning_rate": 0.00011153815247510892, "loss": 0.0122, "step": 484700 }, { "epoch": 1.26, "learning_rate": 0.00011153426425873747, "loss": 0.0124, "step": 484710 }, { "epoch": 1.26, "learning_rate": 0.000111530376042366, "loss": 0.01, "step": 484720 }, { "epoch": 1.26, "learning_rate": 0.00011152648782599454, "loss": 0.0132, "step": 484730 }, { "epoch": 1.26, "learning_rate": 0.00011152259960962307, "loss": 0.0099, "step": 484740 }, { "epoch": 1.26, "learning_rate": 0.00011151871139325161, "loss": 0.0103, "step": 484750 }, { "epoch": 1.26, "learning_rate": 0.00011151482317688014, "loss": 0.0117, "step": 484760 }, { "epoch": 1.26, "learning_rate": 0.00011151093496050868, "loss": 0.0094, "step": 484770 }, { "epoch": 1.26, "learning_rate": 0.00011150704674413721, "loss": 0.0099, "step": 484780 }, { "epoch": 1.26, "learning_rate": 0.00011150315852776575, "loss": 0.0107, "step": 484790 }, { "epoch": 1.26, "learning_rate": 0.00011149927031139428, "loss": 0.0098, "step": 484800 }, { "epoch": 1.26, "learning_rate": 0.0001114953820950228, "loss": 0.0088, "step": 484810 }, { "epoch": 1.26, "learning_rate": 0.00011149149387865135, "loss": 0.0082, "step": 484820 }, { "epoch": 1.26, "learning_rate": 0.00011148760566227988, "loss": 0.0108, "step": 484830 }, { "epoch": 1.26, "learning_rate": 0.00011148371744590842, "loss": 0.0101, "step": 484840 }, { "epoch": 1.26, "learning_rate": 0.00011147982922953695, "loss": 0.0131, "step": 484850 }, { "epoch": 1.26, "learning_rate": 0.00011147594101316549, "loss": 0.0094, "step": 484860 }, { "epoch": 1.26, "learning_rate": 0.00011147205279679402, "loss": 0.0118, "step": 484870 }, { "epoch": 1.26, "learning_rate": 0.00011146816458042257, "loss": 0.0086, "step": 484880 }, { "epoch": 1.26, "learning_rate": 0.00011146427636405109, "loss": 0.0111, "step": 484890 }, { "epoch": 1.26, "learning_rate": 0.00011146038814767964, "loss": 0.01, "step": 484900 }, { "epoch": 1.26, "learning_rate": 0.00011145649993130817, "loss": 0.0089, "step": 484910 }, { "epoch": 1.26, "learning_rate": 0.00011145261171493671, "loss": 0.0155, "step": 484920 }, { "epoch": 1.26, "learning_rate": 0.00011144872349856524, "loss": 0.0098, "step": 484930 }, { "epoch": 1.26, "learning_rate": 0.00011144483528219378, "loss": 0.0091, "step": 484940 }, { "epoch": 1.26, "learning_rate": 0.00011144094706582231, "loss": 0.0107, "step": 484950 }, { "epoch": 1.26, "learning_rate": 0.00011143705884945085, "loss": 0.0082, "step": 484960 }, { "epoch": 1.26, "learning_rate": 0.00011143317063307938, "loss": 0.0144, "step": 484970 }, { "epoch": 1.26, "learning_rate": 0.00011142928241670792, "loss": 0.0134, "step": 484980 }, { "epoch": 1.26, "learning_rate": 0.00011142539420033645, "loss": 0.0102, "step": 484990 }, { "epoch": 1.26, "learning_rate": 0.00011142150598396499, "loss": 0.0097, "step": 485000 }, { "epoch": 1.26, "eval_cer": 0.8816858906799576, "eval_loss": 0.006655857898294926, "eval_runtime": 107.9871, "eval_samples_per_second": 18.521, "eval_steps_per_second": 4.63, "step": 485000 }, { "epoch": 1.26, "learning_rate": 0.00011141761776759352, "loss": 0.0088, "step": 485010 }, { "epoch": 1.26, "learning_rate": 0.00011141372955122206, "loss": 0.0101, "step": 485020 }, { "epoch": 1.26, "learning_rate": 0.00011140984133485059, "loss": 0.013, "step": 485030 }, { "epoch": 1.26, "learning_rate": 0.00011140595311847914, "loss": 0.0106, "step": 485040 }, { "epoch": 1.26, "learning_rate": 0.00011140206490210766, "loss": 0.0111, "step": 485050 }, { "epoch": 1.26, "learning_rate": 0.00011139817668573618, "loss": 0.0115, "step": 485060 }, { "epoch": 1.26, "learning_rate": 0.00011139428846936474, "loss": 0.0099, "step": 485070 }, { "epoch": 1.26, "learning_rate": 0.00011139040025299327, "loss": 0.0101, "step": 485080 }, { "epoch": 1.26, "learning_rate": 0.00011138651203662181, "loss": 0.0118, "step": 485090 }, { "epoch": 1.26, "learning_rate": 0.00011138262382025034, "loss": 0.0145, "step": 485100 }, { "epoch": 1.26, "learning_rate": 0.00011137873560387888, "loss": 0.0095, "step": 485110 }, { "epoch": 1.26, "learning_rate": 0.00011137484738750741, "loss": 0.0103, "step": 485120 }, { "epoch": 1.26, "learning_rate": 0.00011137095917113595, "loss": 0.0094, "step": 485130 }, { "epoch": 1.26, "learning_rate": 0.00011136707095476448, "loss": 0.0106, "step": 485140 }, { "epoch": 1.26, "learning_rate": 0.00011136318273839302, "loss": 0.0097, "step": 485150 }, { "epoch": 1.26, "learning_rate": 0.00011135929452202155, "loss": 0.0118, "step": 485160 }, { "epoch": 1.26, "learning_rate": 0.00011135540630565009, "loss": 0.0106, "step": 485170 }, { "epoch": 1.26, "learning_rate": 0.00011135151808927862, "loss": 0.0089, "step": 485180 }, { "epoch": 1.26, "learning_rate": 0.00011134762987290716, "loss": 0.0127, "step": 485190 }, { "epoch": 1.26, "learning_rate": 0.00011134374165653569, "loss": 0.0111, "step": 485200 }, { "epoch": 1.26, "learning_rate": 0.00011133985344016423, "loss": 0.0114, "step": 485210 }, { "epoch": 1.26, "learning_rate": 0.00011133596522379276, "loss": 0.0133, "step": 485220 }, { "epoch": 1.26, "learning_rate": 0.00011133207700742131, "loss": 0.0103, "step": 485230 }, { "epoch": 1.26, "learning_rate": 0.00011132818879104984, "loss": 0.0117, "step": 485240 }, { "epoch": 1.26, "learning_rate": 0.00011132430057467838, "loss": 0.0087, "step": 485250 }, { "epoch": 1.26, "learning_rate": 0.00011132041235830691, "loss": 0.0102, "step": 485260 }, { "epoch": 1.26, "learning_rate": 0.00011131652414193545, "loss": 0.0106, "step": 485270 }, { "epoch": 1.26, "learning_rate": 0.00011131263592556398, "loss": 0.0082, "step": 485280 }, { "epoch": 1.26, "learning_rate": 0.00011130874770919252, "loss": 0.0077, "step": 485290 }, { "epoch": 1.26, "learning_rate": 0.00011130485949282105, "loss": 0.0106, "step": 485300 }, { "epoch": 1.26, "learning_rate": 0.00011130097127644958, "loss": 0.0107, "step": 485310 }, { "epoch": 1.26, "learning_rate": 0.00011129708306007812, "loss": 0.0083, "step": 485320 }, { "epoch": 1.26, "learning_rate": 0.00011129319484370665, "loss": 0.01, "step": 485330 }, { "epoch": 1.26, "learning_rate": 0.00011128930662733519, "loss": 0.01, "step": 485340 }, { "epoch": 1.26, "learning_rate": 0.00011128541841096372, "loss": 0.0134, "step": 485350 }, { "epoch": 1.26, "learning_rate": 0.00011128153019459226, "loss": 0.0096, "step": 485360 }, { "epoch": 1.26, "learning_rate": 0.00011127764197822079, "loss": 0.012, "step": 485370 }, { "epoch": 1.26, "learning_rate": 0.00011127375376184933, "loss": 0.0075, "step": 485380 }, { "epoch": 1.26, "learning_rate": 0.00011126986554547786, "loss": 0.0094, "step": 485390 }, { "epoch": 1.26, "learning_rate": 0.00011126597732910641, "loss": 0.0102, "step": 485400 }, { "epoch": 1.26, "learning_rate": 0.00011126208911273492, "loss": 0.0103, "step": 485410 }, { "epoch": 1.26, "learning_rate": 0.00011125820089636348, "loss": 0.0114, "step": 485420 }, { "epoch": 1.26, "learning_rate": 0.00011125431267999201, "loss": 0.0104, "step": 485430 }, { "epoch": 1.26, "learning_rate": 0.00011125042446362055, "loss": 0.0092, "step": 485440 }, { "epoch": 1.26, "learning_rate": 0.00011124653624724908, "loss": 0.0098, "step": 485450 }, { "epoch": 1.26, "learning_rate": 0.00011124264803087762, "loss": 0.0093, "step": 485460 }, { "epoch": 1.26, "learning_rate": 0.00011123875981450615, "loss": 0.0136, "step": 485470 }, { "epoch": 1.26, "learning_rate": 0.00011123487159813469, "loss": 0.0102, "step": 485480 }, { "epoch": 1.26, "learning_rate": 0.00011123098338176322, "loss": 0.0102, "step": 485490 }, { "epoch": 1.26, "learning_rate": 0.00011122709516539176, "loss": 0.014, "step": 485500 }, { "epoch": 1.26, "learning_rate": 0.00011122320694902029, "loss": 0.0141, "step": 485510 }, { "epoch": 1.26, "learning_rate": 0.00011121931873264883, "loss": 0.0117, "step": 485520 }, { "epoch": 1.26, "learning_rate": 0.00011121543051627736, "loss": 0.0104, "step": 485530 }, { "epoch": 1.26, "learning_rate": 0.0001112115422999059, "loss": 0.0104, "step": 485540 }, { "epoch": 1.26, "learning_rate": 0.00011120765408353443, "loss": 0.0088, "step": 485550 }, { "epoch": 1.26, "learning_rate": 0.00011120376586716295, "loss": 0.0111, "step": 485560 }, { "epoch": 1.26, "learning_rate": 0.0001111998776507915, "loss": 0.009, "step": 485570 }, { "epoch": 1.26, "learning_rate": 0.00011119598943442002, "loss": 0.0089, "step": 485580 }, { "epoch": 1.26, "learning_rate": 0.00011119210121804858, "loss": 0.0075, "step": 485590 }, { "epoch": 1.26, "learning_rate": 0.00011118821300167711, "loss": 0.0108, "step": 485600 }, { "epoch": 1.26, "learning_rate": 0.00011118432478530565, "loss": 0.0092, "step": 485610 }, { "epoch": 1.26, "learning_rate": 0.00011118043656893418, "loss": 0.01, "step": 485620 }, { "epoch": 1.26, "learning_rate": 0.00011117654835256272, "loss": 0.0111, "step": 485630 }, { "epoch": 1.26, "learning_rate": 0.00011117266013619125, "loss": 0.0095, "step": 485640 }, { "epoch": 1.26, "learning_rate": 0.00011116877191981979, "loss": 0.0084, "step": 485650 }, { "epoch": 1.26, "learning_rate": 0.00011116488370344832, "loss": 0.0124, "step": 485660 }, { "epoch": 1.26, "learning_rate": 0.00011116099548707686, "loss": 0.0148, "step": 485670 }, { "epoch": 1.26, "learning_rate": 0.00011115710727070539, "loss": 0.016, "step": 485680 }, { "epoch": 1.26, "learning_rate": 0.00011115321905433393, "loss": 0.0112, "step": 485690 }, { "epoch": 1.26, "learning_rate": 0.00011114933083796246, "loss": 0.0103, "step": 485700 }, { "epoch": 1.26, "learning_rate": 0.000111145442621591, "loss": 0.01, "step": 485710 }, { "epoch": 1.26, "learning_rate": 0.00011114155440521953, "loss": 0.0105, "step": 485720 }, { "epoch": 1.26, "learning_rate": 0.00011113766618884807, "loss": 0.0109, "step": 485730 }, { "epoch": 1.26, "learning_rate": 0.0001111337779724766, "loss": 0.0098, "step": 485740 }, { "epoch": 1.26, "learning_rate": 0.00011112988975610515, "loss": 0.0088, "step": 485750 }, { "epoch": 1.26, "learning_rate": 0.00011112600153973368, "loss": 0.011, "step": 485760 }, { "epoch": 1.26, "learning_rate": 0.00011112211332336222, "loss": 0.0113, "step": 485770 }, { "epoch": 1.26, "learning_rate": 0.00011111822510699075, "loss": 0.0083, "step": 485780 }, { "epoch": 1.26, "learning_rate": 0.00011111433689061929, "loss": 0.012, "step": 485790 }, { "epoch": 1.26, "learning_rate": 0.00011111044867424782, "loss": 0.0116, "step": 485800 }, { "epoch": 1.26, "learning_rate": 0.00011110656045787635, "loss": 0.0116, "step": 485810 }, { "epoch": 1.26, "learning_rate": 0.00011110267224150489, "loss": 0.0145, "step": 485820 }, { "epoch": 1.26, "learning_rate": 0.00011109878402513342, "loss": 0.0087, "step": 485830 }, { "epoch": 1.26, "learning_rate": 0.00011109489580876196, "loss": 0.0094, "step": 485840 }, { "epoch": 1.26, "learning_rate": 0.00011109100759239049, "loss": 0.0116, "step": 485850 }, { "epoch": 1.26, "learning_rate": 0.00011108711937601903, "loss": 0.0131, "step": 485860 }, { "epoch": 1.26, "learning_rate": 0.00011108323115964756, "loss": 0.0091, "step": 485870 }, { "epoch": 1.26, "learning_rate": 0.0001110793429432761, "loss": 0.0105, "step": 485880 }, { "epoch": 1.26, "learning_rate": 0.00011107545472690463, "loss": 0.0075, "step": 485890 }, { "epoch": 1.26, "learning_rate": 0.00011107156651053317, "loss": 0.0099, "step": 485900 }, { "epoch": 1.26, "learning_rate": 0.0001110676782941617, "loss": 0.011, "step": 485910 }, { "epoch": 1.26, "learning_rate": 0.00011106379007779024, "loss": 0.0117, "step": 485920 }, { "epoch": 1.26, "learning_rate": 0.00011105990186141876, "loss": 0.0116, "step": 485930 }, { "epoch": 1.26, "learning_rate": 0.00011105601364504732, "loss": 0.0074, "step": 485940 }, { "epoch": 1.26, "learning_rate": 0.00011105212542867585, "loss": 0.0082, "step": 485950 }, { "epoch": 1.26, "learning_rate": 0.00011104823721230439, "loss": 0.0112, "step": 485960 }, { "epoch": 1.26, "learning_rate": 0.00011104434899593292, "loss": 0.0121, "step": 485970 }, { "epoch": 1.26, "learning_rate": 0.00011104046077956146, "loss": 0.0108, "step": 485980 }, { "epoch": 1.26, "learning_rate": 0.00011103657256318999, "loss": 0.0106, "step": 485990 }, { "epoch": 1.26, "learning_rate": 0.00011103268434681853, "loss": 0.012, "step": 486000 }, { "epoch": 1.26, "eval_cer": 0.8816550986674057, "eval_loss": 0.006589991506189108, "eval_runtime": 108.066, "eval_samples_per_second": 18.507, "eval_steps_per_second": 4.627, "step": 486000 }, { "epoch": 1.26, "learning_rate": 0.00011102879613044706, "loss": 0.0113, "step": 486010 }, { "epoch": 1.26, "learning_rate": 0.0001110249079140756, "loss": 0.0146, "step": 486020 }, { "epoch": 1.26, "learning_rate": 0.00011102101969770413, "loss": 0.0101, "step": 486030 }, { "epoch": 1.26, "learning_rate": 0.00011101713148133267, "loss": 0.0102, "step": 486040 }, { "epoch": 1.26, "learning_rate": 0.0001110132432649612, "loss": 0.0092, "step": 486050 }, { "epoch": 1.26, "learning_rate": 0.00011100935504858972, "loss": 0.0102, "step": 486060 }, { "epoch": 1.26, "learning_rate": 0.00011100546683221827, "loss": 0.0116, "step": 486070 }, { "epoch": 1.26, "learning_rate": 0.0001110015786158468, "loss": 0.0148, "step": 486080 }, { "epoch": 1.26, "learning_rate": 0.00011099769039947534, "loss": 0.0085, "step": 486090 }, { "epoch": 1.26, "learning_rate": 0.00011099380218310386, "loss": 0.0128, "step": 486100 }, { "epoch": 1.26, "learning_rate": 0.00011098991396673242, "loss": 0.0108, "step": 486110 }, { "epoch": 1.26, "learning_rate": 0.00011098602575036093, "loss": 0.01, "step": 486120 }, { "epoch": 1.26, "learning_rate": 0.00011098213753398949, "loss": 0.0099, "step": 486130 }, { "epoch": 1.26, "learning_rate": 0.00011097824931761802, "loss": 0.008, "step": 486140 }, { "epoch": 1.26, "learning_rate": 0.00011097436110124656, "loss": 0.011, "step": 486150 }, { "epoch": 1.26, "learning_rate": 0.00011097047288487509, "loss": 0.0106, "step": 486160 }, { "epoch": 1.26, "learning_rate": 0.00011096658466850363, "loss": 0.0091, "step": 486170 }, { "epoch": 1.26, "learning_rate": 0.00011096269645213216, "loss": 0.014, "step": 486180 }, { "epoch": 1.26, "learning_rate": 0.0001109588082357607, "loss": 0.0116, "step": 486190 }, { "epoch": 1.26, "learning_rate": 0.00011095492001938923, "loss": 0.0113, "step": 486200 }, { "epoch": 1.26, "learning_rate": 0.00011095103180301777, "loss": 0.0092, "step": 486210 }, { "epoch": 1.26, "learning_rate": 0.0001109471435866463, "loss": 0.011, "step": 486220 }, { "epoch": 1.26, "learning_rate": 0.00011094325537027484, "loss": 0.0103, "step": 486230 }, { "epoch": 1.26, "learning_rate": 0.00011093936715390337, "loss": 0.0101, "step": 486240 }, { "epoch": 1.26, "learning_rate": 0.00011093547893753191, "loss": 0.0117, "step": 486250 }, { "epoch": 1.26, "learning_rate": 0.00011093159072116044, "loss": 0.0081, "step": 486260 }, { "epoch": 1.26, "learning_rate": 0.00011092770250478899, "loss": 0.0098, "step": 486270 }, { "epoch": 1.26, "learning_rate": 0.0001109238142884175, "loss": 0.0096, "step": 486280 }, { "epoch": 1.26, "learning_rate": 0.00011091992607204603, "loss": 0.0091, "step": 486290 }, { "epoch": 1.26, "learning_rate": 0.00011091603785567459, "loss": 0.0095, "step": 486300 }, { "epoch": 1.26, "learning_rate": 0.00011091214963930312, "loss": 0.0097, "step": 486310 }, { "epoch": 1.26, "learning_rate": 0.00011090826142293166, "loss": 0.0123, "step": 486320 }, { "epoch": 1.26, "learning_rate": 0.00011090437320656019, "loss": 0.0085, "step": 486330 }, { "epoch": 1.26, "learning_rate": 0.00011090048499018873, "loss": 0.0097, "step": 486340 }, { "epoch": 1.26, "learning_rate": 0.00011089659677381726, "loss": 0.0098, "step": 486350 }, { "epoch": 1.26, "learning_rate": 0.0001108927085574458, "loss": 0.0092, "step": 486360 }, { "epoch": 1.26, "learning_rate": 0.00011088882034107433, "loss": 0.0096, "step": 486370 }, { "epoch": 1.26, "learning_rate": 0.00011088493212470287, "loss": 0.0074, "step": 486380 }, { "epoch": 1.26, "learning_rate": 0.0001108810439083314, "loss": 0.0082, "step": 486390 }, { "epoch": 1.26, "learning_rate": 0.00011087715569195994, "loss": 0.0095, "step": 486400 }, { "epoch": 1.26, "learning_rate": 0.00011087326747558847, "loss": 0.0128, "step": 486410 }, { "epoch": 1.26, "learning_rate": 0.00011086937925921701, "loss": 0.0123, "step": 486420 }, { "epoch": 1.26, "learning_rate": 0.00011086549104284553, "loss": 0.0106, "step": 486430 }, { "epoch": 1.26, "learning_rate": 0.00011086160282647408, "loss": 0.0105, "step": 486440 }, { "epoch": 1.26, "learning_rate": 0.0001108577146101026, "loss": 0.016, "step": 486450 }, { "epoch": 1.26, "learning_rate": 0.00011085382639373116, "loss": 0.0138, "step": 486460 }, { "epoch": 1.26, "learning_rate": 0.00011084993817735969, "loss": 0.0091, "step": 486470 }, { "epoch": 1.26, "learning_rate": 0.00011084604996098823, "loss": 0.0077, "step": 486480 }, { "epoch": 1.26, "learning_rate": 0.00011084216174461676, "loss": 0.0085, "step": 486490 }, { "epoch": 1.26, "learning_rate": 0.0001108382735282453, "loss": 0.0119, "step": 486500 }, { "epoch": 1.26, "learning_rate": 0.00011083438531187383, "loss": 0.0105, "step": 486510 }, { "epoch": 1.26, "learning_rate": 0.00011083049709550237, "loss": 0.0104, "step": 486520 }, { "epoch": 1.26, "learning_rate": 0.0001108266088791309, "loss": 0.0128, "step": 486530 }, { "epoch": 1.26, "learning_rate": 0.00011082272066275943, "loss": 0.0126, "step": 486540 }, { "epoch": 1.26, "learning_rate": 0.00011081883244638797, "loss": 0.01, "step": 486550 }, { "epoch": 1.26, "learning_rate": 0.0001108149442300165, "loss": 0.0121, "step": 486560 }, { "epoch": 1.26, "learning_rate": 0.00011081105601364504, "loss": 0.0084, "step": 486570 }, { "epoch": 1.26, "learning_rate": 0.00011080716779727356, "loss": 0.0126, "step": 486580 }, { "epoch": 1.26, "learning_rate": 0.0001108032795809021, "loss": 0.0099, "step": 486590 }, { "epoch": 1.26, "learning_rate": 0.00011079939136453063, "loss": 0.0098, "step": 486600 }, { "epoch": 1.26, "learning_rate": 0.00011079550314815918, "loss": 0.0104, "step": 486610 }, { "epoch": 1.26, "learning_rate": 0.0001107916149317877, "loss": 0.012, "step": 486620 }, { "epoch": 1.26, "learning_rate": 0.00011078772671541626, "loss": 0.0152, "step": 486630 }, { "epoch": 1.26, "learning_rate": 0.00011078383849904477, "loss": 0.0105, "step": 486640 }, { "epoch": 1.26, "learning_rate": 0.00011077995028267333, "loss": 0.0108, "step": 486650 }, { "epoch": 1.26, "learning_rate": 0.00011077606206630186, "loss": 0.012, "step": 486660 }, { "epoch": 1.26, "learning_rate": 0.0001107721738499304, "loss": 0.013, "step": 486670 }, { "epoch": 1.26, "learning_rate": 0.00011076828563355893, "loss": 0.0105, "step": 486680 }, { "epoch": 1.26, "learning_rate": 0.00011076439741718747, "loss": 0.01, "step": 486690 }, { "epoch": 1.26, "learning_rate": 0.000110760509200816, "loss": 0.0146, "step": 486700 }, { "epoch": 1.26, "learning_rate": 0.00011075662098444454, "loss": 0.0114, "step": 486710 }, { "epoch": 1.26, "learning_rate": 0.00011075273276807307, "loss": 0.0079, "step": 486720 }, { "epoch": 1.26, "learning_rate": 0.00011074884455170161, "loss": 0.0077, "step": 486730 }, { "epoch": 1.26, "learning_rate": 0.00011074495633533014, "loss": 0.0125, "step": 486740 }, { "epoch": 1.26, "learning_rate": 0.00011074106811895868, "loss": 0.0079, "step": 486750 }, { "epoch": 1.26, "learning_rate": 0.0001107371799025872, "loss": 0.012, "step": 486760 }, { "epoch": 1.26, "learning_rate": 0.00011073329168621575, "loss": 0.0095, "step": 486770 }, { "epoch": 1.26, "learning_rate": 0.00011072940346984428, "loss": 0.0148, "step": 486780 }, { "epoch": 1.26, "learning_rate": 0.0001107255152534728, "loss": 0.0133, "step": 486790 }, { "epoch": 1.26, "learning_rate": 0.00011072162703710135, "loss": 0.0094, "step": 486800 }, { "epoch": 1.26, "learning_rate": 0.00011071773882072987, "loss": 0.0101, "step": 486810 }, { "epoch": 1.26, "learning_rate": 0.00011071385060435843, "loss": 0.0111, "step": 486820 }, { "epoch": 1.26, "learning_rate": 0.00011070996238798696, "loss": 0.0121, "step": 486830 }, { "epoch": 1.26, "learning_rate": 0.0001107060741716155, "loss": 0.0132, "step": 486840 }, { "epoch": 1.26, "learning_rate": 0.00011070218595524403, "loss": 0.0116, "step": 486850 }, { "epoch": 1.26, "learning_rate": 0.00011069829773887257, "loss": 0.0119, "step": 486860 }, { "epoch": 1.26, "learning_rate": 0.0001106944095225011, "loss": 0.0089, "step": 486870 }, { "epoch": 1.26, "learning_rate": 0.00011069052130612964, "loss": 0.0144, "step": 486880 }, { "epoch": 1.26, "learning_rate": 0.00011068663308975817, "loss": 0.0073, "step": 486890 }, { "epoch": 1.26, "learning_rate": 0.00011068274487338671, "loss": 0.0131, "step": 486900 }, { "epoch": 1.26, "learning_rate": 0.00011067885665701524, "loss": 0.0091, "step": 486910 }, { "epoch": 1.26, "learning_rate": 0.00011067496844064378, "loss": 0.0093, "step": 486920 }, { "epoch": 1.26, "learning_rate": 0.0001106710802242723, "loss": 0.0105, "step": 486930 }, { "epoch": 1.26, "learning_rate": 0.00011066719200790085, "loss": 0.011, "step": 486940 }, { "epoch": 1.26, "learning_rate": 0.00011066330379152937, "loss": 0.0097, "step": 486950 }, { "epoch": 1.26, "learning_rate": 0.00011065941557515792, "loss": 0.0068, "step": 486960 }, { "epoch": 1.26, "learning_rate": 0.00011065552735878644, "loss": 0.0113, "step": 486970 }, { "epoch": 1.26, "learning_rate": 0.000110651639142415, "loss": 0.0103, "step": 486980 }, { "epoch": 1.26, "learning_rate": 0.00011064775092604353, "loss": 0.0088, "step": 486990 }, { "epoch": 1.26, "learning_rate": 0.00011064386270967207, "loss": 0.0107, "step": 487000 }, { "epoch": 1.26, "eval_cer": 0.8816690950367475, "eval_loss": 0.0066790650598704815, "eval_runtime": 108.1004, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 487000 }, { "epoch": 1.26, "learning_rate": 0.0001106399744933006, "loss": 0.0097, "step": 487010 }, { "epoch": 1.26, "learning_rate": 0.00011063608627692914, "loss": 0.0121, "step": 487020 }, { "epoch": 1.26, "learning_rate": 0.00011063219806055767, "loss": 0.0081, "step": 487030 }, { "epoch": 1.26, "learning_rate": 0.0001106283098441862, "loss": 0.0098, "step": 487040 }, { "epoch": 1.26, "learning_rate": 0.00011062442162781474, "loss": 0.0128, "step": 487050 }, { "epoch": 1.26, "learning_rate": 0.00011062053341144327, "loss": 0.0141, "step": 487060 }, { "epoch": 1.26, "learning_rate": 0.00011061664519507181, "loss": 0.0104, "step": 487070 }, { "epoch": 1.26, "learning_rate": 0.00011061275697870033, "loss": 0.0077, "step": 487080 }, { "epoch": 1.26, "learning_rate": 0.00011060886876232888, "loss": 0.0102, "step": 487090 }, { "epoch": 1.26, "learning_rate": 0.0001106049805459574, "loss": 0.0143, "step": 487100 }, { "epoch": 1.26, "learning_rate": 0.00011060109232958595, "loss": 0.0094, "step": 487110 }, { "epoch": 1.26, "learning_rate": 0.00011059720411321447, "loss": 0.0103, "step": 487120 }, { "epoch": 1.26, "learning_rate": 0.00011059331589684302, "loss": 0.011, "step": 487130 }, { "epoch": 1.26, "learning_rate": 0.00011058942768047154, "loss": 0.0092, "step": 487140 }, { "epoch": 1.26, "learning_rate": 0.0001105855394641001, "loss": 0.0095, "step": 487150 }, { "epoch": 1.26, "learning_rate": 0.00011058165124772861, "loss": 0.007, "step": 487160 }, { "epoch": 1.26, "learning_rate": 0.00011057776303135717, "loss": 0.0104, "step": 487170 }, { "epoch": 1.26, "learning_rate": 0.0001105738748149857, "loss": 0.0141, "step": 487180 }, { "epoch": 1.26, "learning_rate": 0.00011056998659861424, "loss": 0.0103, "step": 487190 }, { "epoch": 1.26, "learning_rate": 0.00011056609838224277, "loss": 0.0094, "step": 487200 }, { "epoch": 1.26, "learning_rate": 0.00011056221016587131, "loss": 0.0124, "step": 487210 }, { "epoch": 1.26, "learning_rate": 0.00011055832194949984, "loss": 0.0125, "step": 487220 }, { "epoch": 1.26, "learning_rate": 0.00011055443373312838, "loss": 0.0073, "step": 487230 }, { "epoch": 1.26, "learning_rate": 0.0001105505455167569, "loss": 0.0095, "step": 487240 }, { "epoch": 1.26, "learning_rate": 0.00011054665730038545, "loss": 0.0116, "step": 487250 }, { "epoch": 1.26, "learning_rate": 0.00011054276908401398, "loss": 0.0105, "step": 487260 }, { "epoch": 1.26, "learning_rate": 0.00011053888086764252, "loss": 0.0096, "step": 487270 }, { "epoch": 1.26, "learning_rate": 0.00011053499265127105, "loss": 0.0105, "step": 487280 }, { "epoch": 1.26, "learning_rate": 0.00011053110443489957, "loss": 0.0079, "step": 487290 }, { "epoch": 1.26, "learning_rate": 0.00011052721621852812, "loss": 0.0092, "step": 487300 }, { "epoch": 1.26, "learning_rate": 0.00011052332800215664, "loss": 0.0104, "step": 487310 }, { "epoch": 1.26, "learning_rate": 0.00011051943978578519, "loss": 0.0104, "step": 487320 }, { "epoch": 1.26, "learning_rate": 0.00011051555156941371, "loss": 0.0122, "step": 487330 }, { "epoch": 1.26, "learning_rate": 0.00011051166335304227, "loss": 0.0096, "step": 487340 }, { "epoch": 1.26, "learning_rate": 0.0001105077751366708, "loss": 0.0086, "step": 487350 }, { "epoch": 1.26, "learning_rate": 0.00011050388692029934, "loss": 0.0107, "step": 487360 }, { "epoch": 1.26, "learning_rate": 0.00011049999870392787, "loss": 0.0103, "step": 487370 }, { "epoch": 1.26, "learning_rate": 0.00011049611048755641, "loss": 0.011, "step": 487380 }, { "epoch": 1.26, "learning_rate": 0.00011049222227118494, "loss": 0.0092, "step": 487390 }, { "epoch": 1.26, "learning_rate": 0.00011048833405481348, "loss": 0.0115, "step": 487400 }, { "epoch": 1.26, "learning_rate": 0.000110484445838442, "loss": 0.0115, "step": 487410 }, { "epoch": 1.26, "learning_rate": 0.00011048055762207055, "loss": 0.0114, "step": 487420 }, { "epoch": 1.26, "learning_rate": 0.00011047666940569908, "loss": 0.0093, "step": 487430 }, { "epoch": 1.26, "learning_rate": 0.00011047278118932762, "loss": 0.0112, "step": 487440 }, { "epoch": 1.26, "learning_rate": 0.00011046889297295615, "loss": 0.0101, "step": 487450 }, { "epoch": 1.26, "learning_rate": 0.00011046500475658469, "loss": 0.0121, "step": 487460 }, { "epoch": 1.26, "learning_rate": 0.00011046111654021321, "loss": 0.0106, "step": 487470 }, { "epoch": 1.26, "learning_rate": 0.00011045722832384176, "loss": 0.0134, "step": 487480 }, { "epoch": 1.26, "learning_rate": 0.00011045334010747028, "loss": 0.0107, "step": 487490 }, { "epoch": 1.26, "learning_rate": 0.00011044945189109884, "loss": 0.0092, "step": 487500 }, { "epoch": 1.26, "learning_rate": 0.00011044556367472735, "loss": 0.0109, "step": 487510 }, { "epoch": 1.26, "learning_rate": 0.00011044167545835591, "loss": 0.0081, "step": 487520 }, { "epoch": 1.26, "learning_rate": 0.00011043778724198444, "loss": 0.0128, "step": 487530 }, { "epoch": 1.26, "learning_rate": 0.00011043389902561297, "loss": 0.0098, "step": 487540 }, { "epoch": 1.26, "learning_rate": 0.00011043001080924151, "loss": 0.0097, "step": 487550 }, { "epoch": 1.26, "learning_rate": 0.00011042612259287004, "loss": 0.009, "step": 487560 }, { "epoch": 1.26, "learning_rate": 0.00011042223437649858, "loss": 0.0144, "step": 487570 }, { "epoch": 1.26, "learning_rate": 0.0001104183461601271, "loss": 0.0088, "step": 487580 }, { "epoch": 1.26, "learning_rate": 0.00011041445794375565, "loss": 0.0102, "step": 487590 }, { "epoch": 1.26, "learning_rate": 0.00011041056972738417, "loss": 0.0122, "step": 487600 }, { "epoch": 1.26, "learning_rate": 0.00011040668151101272, "loss": 0.0108, "step": 487610 }, { "epoch": 1.26, "learning_rate": 0.00011040279329464124, "loss": 0.0142, "step": 487620 }, { "epoch": 1.26, "learning_rate": 0.00011039890507826979, "loss": 0.0112, "step": 487630 }, { "epoch": 1.26, "learning_rate": 0.00011039501686189831, "loss": 0.015, "step": 487640 }, { "epoch": 1.26, "learning_rate": 0.00011039112864552686, "loss": 0.0127, "step": 487650 }, { "epoch": 1.26, "learning_rate": 0.00011038724042915538, "loss": 0.0156, "step": 487660 }, { "epoch": 1.26, "learning_rate": 0.00011038335221278393, "loss": 0.0223, "step": 487670 }, { "epoch": 1.26, "learning_rate": 0.00011037946399641245, "loss": 0.008, "step": 487680 }, { "epoch": 1.26, "learning_rate": 0.00011037557578004101, "loss": 0.0095, "step": 487690 }, { "epoch": 1.26, "learning_rate": 0.00011037168756366954, "loss": 0.0083, "step": 487700 }, { "epoch": 1.26, "learning_rate": 0.00011036779934729808, "loss": 0.0178, "step": 487710 }, { "epoch": 1.26, "learning_rate": 0.0001103639111309266, "loss": 0.0099, "step": 487720 }, { "epoch": 1.26, "learning_rate": 0.00011036002291455515, "loss": 0.0109, "step": 487730 }, { "epoch": 1.26, "learning_rate": 0.00011035613469818368, "loss": 0.0129, "step": 487740 }, { "epoch": 1.26, "learning_rate": 0.00011035224648181222, "loss": 0.0105, "step": 487750 }, { "epoch": 1.26, "learning_rate": 0.00011034835826544075, "loss": 0.0093, "step": 487760 }, { "epoch": 1.26, "learning_rate": 0.00011034447004906929, "loss": 0.0117, "step": 487770 }, { "epoch": 1.26, "learning_rate": 0.00011034058183269782, "loss": 0.0077, "step": 487780 }, { "epoch": 1.26, "learning_rate": 0.00011033669361632634, "loss": 0.0117, "step": 487790 }, { "epoch": 1.26, "learning_rate": 0.00011033280539995489, "loss": 0.0124, "step": 487800 }, { "epoch": 1.26, "learning_rate": 0.00011032891718358341, "loss": 0.011, "step": 487810 }, { "epoch": 1.26, "learning_rate": 0.00011032502896721196, "loss": 0.0077, "step": 487820 }, { "epoch": 1.26, "learning_rate": 0.00011032114075084048, "loss": 0.0138, "step": 487830 }, { "epoch": 1.26, "learning_rate": 0.00011031725253446903, "loss": 0.0115, "step": 487840 }, { "epoch": 1.26, "learning_rate": 0.00011031336431809755, "loss": 0.0129, "step": 487850 }, { "epoch": 1.26, "learning_rate": 0.00011030947610172611, "loss": 0.0106, "step": 487860 }, { "epoch": 1.26, "learning_rate": 0.00011030558788535462, "loss": 0.0132, "step": 487870 }, { "epoch": 1.26, "learning_rate": 0.00011030169966898318, "loss": 0.013, "step": 487880 }, { "epoch": 1.26, "learning_rate": 0.0001102978114526117, "loss": 0.0101, "step": 487890 }, { "epoch": 1.26, "learning_rate": 0.00011029392323624025, "loss": 0.0091, "step": 487900 }, { "epoch": 1.26, "learning_rate": 0.00011029003501986878, "loss": 0.0095, "step": 487910 }, { "epoch": 1.26, "learning_rate": 0.00011028614680349732, "loss": 0.0118, "step": 487920 }, { "epoch": 1.26, "learning_rate": 0.00011028225858712585, "loss": 0.0134, "step": 487930 }, { "epoch": 1.26, "learning_rate": 0.00011027837037075439, "loss": 0.0135, "step": 487940 }, { "epoch": 1.26, "learning_rate": 0.00011027448215438292, "loss": 0.0111, "step": 487950 }, { "epoch": 1.26, "learning_rate": 0.00011027059393801146, "loss": 0.0097, "step": 487960 }, { "epoch": 1.26, "learning_rate": 0.00011026670572163998, "loss": 0.0122, "step": 487970 }, { "epoch": 1.26, "learning_rate": 0.00011026281750526853, "loss": 0.0113, "step": 487980 }, { "epoch": 1.26, "learning_rate": 0.00011025892928889705, "loss": 0.0112, "step": 487990 }, { "epoch": 1.26, "learning_rate": 0.0001102550410725256, "loss": 0.0118, "step": 488000 }, { "epoch": 1.26, "eval_cer": 0.8816662957628791, "eval_loss": 0.006483182776719332, "eval_runtime": 108.0759, "eval_samples_per_second": 18.506, "eval_steps_per_second": 4.626, "step": 488000 }, { "epoch": 1.26, "learning_rate": 0.00011025115285615412, "loss": 0.0104, "step": 488010 }, { "epoch": 1.27, "learning_rate": 0.00011024726463978268, "loss": 0.013, "step": 488020 }, { "epoch": 1.27, "learning_rate": 0.0001102433764234112, "loss": 0.0083, "step": 488030 }, { "epoch": 1.27, "learning_rate": 0.00011023948820703972, "loss": 0.0072, "step": 488040 }, { "epoch": 1.27, "learning_rate": 0.00011023559999066828, "loss": 0.0094, "step": 488050 }, { "epoch": 1.27, "learning_rate": 0.0001102317117742968, "loss": 0.0112, "step": 488060 }, { "epoch": 1.27, "learning_rate": 0.00011022782355792535, "loss": 0.0139, "step": 488070 }, { "epoch": 1.27, "learning_rate": 0.00011022393534155388, "loss": 0.014, "step": 488080 }, { "epoch": 1.27, "learning_rate": 0.00011022004712518242, "loss": 0.0125, "step": 488090 }, { "epoch": 1.27, "learning_rate": 0.00011021615890881094, "loss": 0.0078, "step": 488100 }, { "epoch": 1.27, "learning_rate": 0.00011021227069243949, "loss": 0.0101, "step": 488110 }, { "epoch": 1.27, "learning_rate": 0.00011020838247606801, "loss": 0.0135, "step": 488120 }, { "epoch": 1.27, "learning_rate": 0.00011020449425969656, "loss": 0.0105, "step": 488130 }, { "epoch": 1.27, "learning_rate": 0.00011020060604332508, "loss": 0.0073, "step": 488140 }, { "epoch": 1.27, "learning_rate": 0.00011019671782695363, "loss": 0.0117, "step": 488150 }, { "epoch": 1.27, "learning_rate": 0.00011019282961058215, "loss": 0.0126, "step": 488160 }, { "epoch": 1.27, "learning_rate": 0.0001101889413942107, "loss": 0.0092, "step": 488170 }, { "epoch": 1.27, "learning_rate": 0.00011018505317783922, "loss": 0.0125, "step": 488180 }, { "epoch": 1.27, "learning_rate": 0.00011018116496146777, "loss": 0.0103, "step": 488190 }, { "epoch": 1.27, "learning_rate": 0.0001101772767450963, "loss": 0.0096, "step": 488200 }, { "epoch": 1.27, "learning_rate": 0.00011017338852872485, "loss": 0.0085, "step": 488210 }, { "epoch": 1.27, "learning_rate": 0.00011016950031235338, "loss": 0.0116, "step": 488220 }, { "epoch": 1.27, "learning_rate": 0.00011016561209598192, "loss": 0.0085, "step": 488230 }, { "epoch": 1.27, "learning_rate": 0.00011016172387961045, "loss": 0.009, "step": 488240 }, { "epoch": 1.27, "learning_rate": 0.00011015783566323899, "loss": 0.0092, "step": 488250 }, { "epoch": 1.27, "learning_rate": 0.00011015394744686752, "loss": 0.0094, "step": 488260 }, { "epoch": 1.27, "learning_rate": 0.00011015005923049606, "loss": 0.0092, "step": 488270 }, { "epoch": 1.27, "learning_rate": 0.00011014617101412459, "loss": 0.0082, "step": 488280 }, { "epoch": 1.27, "learning_rate": 0.00011014228279775311, "loss": 0.0078, "step": 488290 }, { "epoch": 1.27, "learning_rate": 0.00011013839458138166, "loss": 0.0099, "step": 488300 }, { "epoch": 1.27, "learning_rate": 0.00011013450636501018, "loss": 0.0108, "step": 488310 }, { "epoch": 1.27, "learning_rate": 0.00011013061814863873, "loss": 0.0099, "step": 488320 }, { "epoch": 1.27, "learning_rate": 0.00011012672993226725, "loss": 0.0121, "step": 488330 }, { "epoch": 1.27, "learning_rate": 0.0001101228417158958, "loss": 0.0127, "step": 488340 }, { "epoch": 1.27, "learning_rate": 0.00011011895349952432, "loss": 0.0124, "step": 488350 }, { "epoch": 1.27, "learning_rate": 0.00011011506528315286, "loss": 0.0098, "step": 488360 }, { "epoch": 1.27, "learning_rate": 0.00011011117706678139, "loss": 0.0084, "step": 488370 }, { "epoch": 1.27, "learning_rate": 0.00011010728885040995, "loss": 0.0082, "step": 488380 }, { "epoch": 1.27, "learning_rate": 0.00011010340063403846, "loss": 0.0131, "step": 488390 }, { "epoch": 1.27, "learning_rate": 0.00011009951241766702, "loss": 0.0094, "step": 488400 }, { "epoch": 1.27, "learning_rate": 0.00011009562420129555, "loss": 0.0117, "step": 488410 }, { "epoch": 1.27, "learning_rate": 0.00011009173598492409, "loss": 0.0146, "step": 488420 }, { "epoch": 1.27, "learning_rate": 0.00011008784776855262, "loss": 0.0136, "step": 488430 }, { "epoch": 1.27, "learning_rate": 0.00011008395955218116, "loss": 0.0089, "step": 488440 }, { "epoch": 1.27, "learning_rate": 0.00011008007133580969, "loss": 0.0154, "step": 488450 }, { "epoch": 1.27, "learning_rate": 0.00011007618311943823, "loss": 0.0116, "step": 488460 }, { "epoch": 1.27, "learning_rate": 0.00011007229490306676, "loss": 0.0113, "step": 488470 }, { "epoch": 1.27, "learning_rate": 0.0001100684066866953, "loss": 0.0109, "step": 488480 }, { "epoch": 1.27, "learning_rate": 0.00011006451847032382, "loss": 0.009, "step": 488490 }, { "epoch": 1.27, "learning_rate": 0.00011006063025395237, "loss": 0.0091, "step": 488500 }, { "epoch": 1.27, "learning_rate": 0.0001100567420375809, "loss": 0.0092, "step": 488510 }, { "epoch": 1.27, "learning_rate": 0.00011005285382120944, "loss": 0.009, "step": 488520 }, { "epoch": 1.27, "learning_rate": 0.00011004896560483796, "loss": 0.0093, "step": 488530 }, { "epoch": 1.27, "learning_rate": 0.00011004507738846649, "loss": 0.0084, "step": 488540 }, { "epoch": 1.27, "learning_rate": 0.00011004118917209503, "loss": 0.0103, "step": 488550 }, { "epoch": 1.27, "learning_rate": 0.00011003730095572356, "loss": 0.0085, "step": 488560 }, { "epoch": 1.27, "learning_rate": 0.00011003341273935212, "loss": 0.0125, "step": 488570 }, { "epoch": 1.27, "learning_rate": 0.00011002952452298065, "loss": 0.0143, "step": 488580 }, { "epoch": 1.27, "learning_rate": 0.00011002563630660919, "loss": 0.0115, "step": 488590 }, { "epoch": 1.27, "learning_rate": 0.00011002174809023772, "loss": 0.0123, "step": 488600 }, { "epoch": 1.27, "learning_rate": 0.00011001785987386626, "loss": 0.0095, "step": 488610 }, { "epoch": 1.27, "learning_rate": 0.00011001397165749478, "loss": 0.013, "step": 488620 }, { "epoch": 1.27, "learning_rate": 0.00011001008344112333, "loss": 0.0084, "step": 488630 }, { "epoch": 1.27, "learning_rate": 0.00011000619522475185, "loss": 0.0128, "step": 488640 }, { "epoch": 1.27, "learning_rate": 0.0001100023070083804, "loss": 0.0126, "step": 488650 }, { "epoch": 1.27, "learning_rate": 0.00010999841879200892, "loss": 0.0136, "step": 488660 }, { "epoch": 1.27, "learning_rate": 0.00010999453057563747, "loss": 0.0143, "step": 488670 }, { "epoch": 1.27, "learning_rate": 0.000109990642359266, "loss": 0.0114, "step": 488680 }, { "epoch": 1.27, "learning_rate": 0.00010998675414289454, "loss": 0.01, "step": 488690 }, { "epoch": 1.27, "learning_rate": 0.00010998286592652306, "loss": 0.0098, "step": 488700 }, { "epoch": 1.27, "learning_rate": 0.0001099789777101516, "loss": 0.008, "step": 488710 }, { "epoch": 1.27, "learning_rate": 0.00010997508949378013, "loss": 0.0094, "step": 488720 }, { "epoch": 1.27, "learning_rate": 0.00010997120127740869, "loss": 0.0089, "step": 488730 }, { "epoch": 1.27, "learning_rate": 0.0001099673130610372, "loss": 0.0087, "step": 488740 }, { "epoch": 1.27, "learning_rate": 0.00010996342484466576, "loss": 0.009, "step": 488750 }, { "epoch": 1.27, "learning_rate": 0.00010995953662829429, "loss": 0.0094, "step": 488760 }, { "epoch": 1.27, "learning_rate": 0.00010995564841192283, "loss": 0.01, "step": 488770 }, { "epoch": 1.27, "learning_rate": 0.00010995176019555136, "loss": 0.0088, "step": 488780 }, { "epoch": 1.27, "learning_rate": 0.00010994787197917988, "loss": 0.0091, "step": 488790 }, { "epoch": 1.27, "learning_rate": 0.00010994398376280843, "loss": 0.0096, "step": 488800 }, { "epoch": 1.27, "learning_rate": 0.00010994009554643695, "loss": 0.0096, "step": 488810 }, { "epoch": 1.27, "learning_rate": 0.0001099362073300655, "loss": 0.012, "step": 488820 }, { "epoch": 1.27, "learning_rate": 0.00010993231911369402, "loss": 0.0132, "step": 488830 }, { "epoch": 1.27, "learning_rate": 0.00010992843089732257, "loss": 0.0092, "step": 488840 }, { "epoch": 1.27, "learning_rate": 0.0001099245426809511, "loss": 0.0118, "step": 488850 }, { "epoch": 1.27, "learning_rate": 0.00010992065446457964, "loss": 0.01, "step": 488860 }, { "epoch": 1.27, "learning_rate": 0.00010991676624820816, "loss": 0.0099, "step": 488870 }, { "epoch": 1.27, "learning_rate": 0.0001099128780318367, "loss": 0.0139, "step": 488880 }, { "epoch": 1.27, "learning_rate": 0.00010990898981546523, "loss": 0.0103, "step": 488890 }, { "epoch": 1.27, "learning_rate": 0.00010990510159909377, "loss": 0.011, "step": 488900 }, { "epoch": 1.27, "learning_rate": 0.0001099012133827223, "loss": 0.0131, "step": 488910 }, { "epoch": 1.27, "learning_rate": 0.00010989732516635086, "loss": 0.0073, "step": 488920 }, { "epoch": 1.27, "learning_rate": 0.00010989343694997939, "loss": 0.0094, "step": 488930 }, { "epoch": 1.27, "learning_rate": 0.00010988954873360793, "loss": 0.0109, "step": 488940 }, { "epoch": 1.27, "learning_rate": 0.00010988566051723646, "loss": 0.0098, "step": 488950 }, { "epoch": 1.27, "learning_rate": 0.000109881772300865, "loss": 0.0078, "step": 488960 }, { "epoch": 1.27, "learning_rate": 0.00010987788408449353, "loss": 0.011, "step": 488970 }, { "epoch": 1.27, "learning_rate": 0.00010987399586812207, "loss": 0.011, "step": 488980 }, { "epoch": 1.27, "learning_rate": 0.0001098701076517506, "loss": 0.0107, "step": 488990 }, { "epoch": 1.27, "learning_rate": 0.00010986621943537914, "loss": 0.0093, "step": 489000 }, { "epoch": 1.27, "eval_cer": 0.8816620968520765, "eval_loss": 0.0065433569252491, "eval_runtime": 108.073, "eval_samples_per_second": 18.506, "eval_steps_per_second": 4.627, "step": 489000 }, { "epoch": 1.27, "learning_rate": 0.00010986233121900766, "loss": 0.009, "step": 489010 }, { "epoch": 1.27, "learning_rate": 0.00010985844300263619, "loss": 0.0112, "step": 489020 }, { "epoch": 1.27, "learning_rate": 0.00010985455478626473, "loss": 0.0096, "step": 489030 }, { "epoch": 1.27, "learning_rate": 0.00010985066656989326, "loss": 0.0103, "step": 489040 }, { "epoch": 1.27, "learning_rate": 0.0001098467783535218, "loss": 0.0092, "step": 489050 }, { "epoch": 1.27, "learning_rate": 0.00010984289013715033, "loss": 0.0089, "step": 489060 }, { "epoch": 1.27, "learning_rate": 0.00010983900192077887, "loss": 0.0086, "step": 489070 }, { "epoch": 1.27, "learning_rate": 0.0001098351137044074, "loss": 0.0095, "step": 489080 }, { "epoch": 1.27, "learning_rate": 0.00010983122548803596, "loss": 0.0096, "step": 489090 }, { "epoch": 1.27, "learning_rate": 0.00010982733727166447, "loss": 0.0114, "step": 489100 }, { "epoch": 1.27, "learning_rate": 0.00010982344905529303, "loss": 0.0086, "step": 489110 }, { "epoch": 1.27, "learning_rate": 0.00010981956083892156, "loss": 0.0093, "step": 489120 }, { "epoch": 1.27, "learning_rate": 0.0001098156726225501, "loss": 0.0116, "step": 489130 }, { "epoch": 1.27, "learning_rate": 0.00010981178440617862, "loss": 0.0117, "step": 489140 }, { "epoch": 1.27, "learning_rate": 0.00010980789618980717, "loss": 0.0115, "step": 489150 }, { "epoch": 1.27, "learning_rate": 0.0001098040079734357, "loss": 0.0127, "step": 489160 }, { "epoch": 1.27, "learning_rate": 0.00010980011975706424, "loss": 0.0097, "step": 489170 }, { "epoch": 1.27, "learning_rate": 0.00010979623154069276, "loss": 0.0107, "step": 489180 }, { "epoch": 1.27, "learning_rate": 0.0001097923433243213, "loss": 0.0112, "step": 489190 }, { "epoch": 1.27, "learning_rate": 0.00010978845510794983, "loss": 0.012, "step": 489200 }, { "epoch": 1.27, "learning_rate": 0.00010978456689157838, "loss": 0.0072, "step": 489210 }, { "epoch": 1.27, "learning_rate": 0.0001097806786752069, "loss": 0.0117, "step": 489220 }, { "epoch": 1.27, "learning_rate": 0.00010977679045883545, "loss": 0.0091, "step": 489230 }, { "epoch": 1.27, "learning_rate": 0.00010977290224246397, "loss": 0.0102, "step": 489240 }, { "epoch": 1.27, "learning_rate": 0.00010976901402609253, "loss": 0.0114, "step": 489250 }, { "epoch": 1.27, "learning_rate": 0.00010976512580972104, "loss": 0.009, "step": 489260 }, { "epoch": 1.27, "learning_rate": 0.00010976123759334957, "loss": 0.0117, "step": 489270 }, { "epoch": 1.27, "learning_rate": 0.00010975734937697813, "loss": 0.012, "step": 489280 }, { "epoch": 1.27, "learning_rate": 0.00010975346116060665, "loss": 0.012, "step": 489290 }, { "epoch": 1.27, "learning_rate": 0.0001097495729442352, "loss": 0.0092, "step": 489300 }, { "epoch": 1.27, "learning_rate": 0.00010974568472786372, "loss": 0.0101, "step": 489310 }, { "epoch": 1.27, "learning_rate": 0.00010974179651149227, "loss": 0.0082, "step": 489320 }, { "epoch": 1.27, "learning_rate": 0.0001097379082951208, "loss": 0.0085, "step": 489330 }, { "epoch": 1.27, "learning_rate": 0.00010973402007874934, "loss": 0.0093, "step": 489340 }, { "epoch": 1.27, "learning_rate": 0.00010973013186237786, "loss": 0.0088, "step": 489350 }, { "epoch": 1.27, "learning_rate": 0.0001097262436460064, "loss": 0.0087, "step": 489360 }, { "epoch": 1.27, "learning_rate": 0.00010972235542963493, "loss": 0.009, "step": 489370 }, { "epoch": 1.27, "learning_rate": 0.00010971846721326347, "loss": 0.008, "step": 489380 }, { "epoch": 1.27, "learning_rate": 0.000109714578996892, "loss": 0.0088, "step": 489390 }, { "epoch": 1.27, "learning_rate": 0.00010971069078052054, "loss": 0.0111, "step": 489400 }, { "epoch": 1.27, "learning_rate": 0.00010970680256414907, "loss": 0.0154, "step": 489410 }, { "epoch": 1.27, "learning_rate": 0.00010970291434777761, "loss": 0.0122, "step": 489420 }, { "epoch": 1.27, "learning_rate": 0.00010969902613140614, "loss": 0.0102, "step": 489430 }, { "epoch": 1.27, "learning_rate": 0.0001096951379150347, "loss": 0.0141, "step": 489440 }, { "epoch": 1.27, "learning_rate": 0.00010969124969866323, "loss": 0.019, "step": 489450 }, { "epoch": 1.27, "learning_rate": 0.00010968736148229177, "loss": 0.0091, "step": 489460 }, { "epoch": 1.27, "learning_rate": 0.0001096834732659203, "loss": 0.0102, "step": 489470 }, { "epoch": 1.27, "learning_rate": 0.00010967958504954884, "loss": 0.01, "step": 489480 }, { "epoch": 1.27, "learning_rate": 0.00010967569683317737, "loss": 0.0081, "step": 489490 }, { "epoch": 1.27, "learning_rate": 0.00010967180861680591, "loss": 0.0092, "step": 489500 }, { "epoch": 1.27, "learning_rate": 0.00010966792040043443, "loss": 0.0084, "step": 489510 }, { "epoch": 1.27, "learning_rate": 0.00010966403218406296, "loss": 0.0107, "step": 489520 }, { "epoch": 1.27, "learning_rate": 0.0001096601439676915, "loss": 0.0102, "step": 489530 }, { "epoch": 1.27, "learning_rate": 0.00010965625575132003, "loss": 0.0109, "step": 489540 }, { "epoch": 1.27, "learning_rate": 0.00010965236753494857, "loss": 0.011, "step": 489550 }, { "epoch": 1.27, "learning_rate": 0.0001096484793185771, "loss": 0.0091, "step": 489560 }, { "epoch": 1.27, "learning_rate": 0.00010964459110220564, "loss": 0.0099, "step": 489570 }, { "epoch": 1.27, "learning_rate": 0.00010964070288583417, "loss": 0.0109, "step": 489580 }, { "epoch": 1.27, "learning_rate": 0.00010963681466946271, "loss": 0.0079, "step": 489590 }, { "epoch": 1.27, "learning_rate": 0.00010963292645309124, "loss": 0.0107, "step": 489600 }, { "epoch": 1.27, "learning_rate": 0.0001096290382367198, "loss": 0.011, "step": 489610 }, { "epoch": 1.27, "learning_rate": 0.00010962515002034831, "loss": 0.0091, "step": 489620 }, { "epoch": 1.27, "learning_rate": 0.00010962126180397687, "loss": 0.0089, "step": 489630 }, { "epoch": 1.27, "learning_rate": 0.0001096173735876054, "loss": 0.0098, "step": 489640 }, { "epoch": 1.27, "learning_rate": 0.00010961348537123394, "loss": 0.0096, "step": 489650 }, { "epoch": 1.27, "learning_rate": 0.00010960959715486246, "loss": 0.0092, "step": 489660 }, { "epoch": 1.27, "learning_rate": 0.000109605708938491, "loss": 0.0102, "step": 489670 }, { "epoch": 1.27, "learning_rate": 0.00010960182072211953, "loss": 0.0096, "step": 489680 }, { "epoch": 1.27, "learning_rate": 0.00010959793250574808, "loss": 0.0074, "step": 489690 }, { "epoch": 1.27, "learning_rate": 0.0001095940442893766, "loss": 0.0095, "step": 489700 }, { "epoch": 1.27, "learning_rate": 0.00010959015607300515, "loss": 0.0126, "step": 489710 }, { "epoch": 1.27, "learning_rate": 0.00010958626785663367, "loss": 0.0083, "step": 489720 }, { "epoch": 1.27, "learning_rate": 0.00010958237964026222, "loss": 0.0116, "step": 489730 }, { "epoch": 1.27, "learning_rate": 0.00010957849142389074, "loss": 0.0126, "step": 489740 }, { "epoch": 1.27, "learning_rate": 0.00010957460320751929, "loss": 0.0093, "step": 489750 }, { "epoch": 1.27, "learning_rate": 0.00010957071499114781, "loss": 0.0106, "step": 489760 }, { "epoch": 1.27, "learning_rate": 0.00010956682677477634, "loss": 0.0111, "step": 489770 }, { "epoch": 1.27, "learning_rate": 0.00010956293855840488, "loss": 0.0107, "step": 489780 }, { "epoch": 1.27, "learning_rate": 0.00010955905034203341, "loss": 0.009, "step": 489790 }, { "epoch": 1.27, "learning_rate": 0.00010955516212566197, "loss": 0.0101, "step": 489800 }, { "epoch": 1.27, "learning_rate": 0.0001095512739092905, "loss": 0.0123, "step": 489810 }, { "epoch": 1.27, "learning_rate": 0.00010954738569291904, "loss": 0.0083, "step": 489820 }, { "epoch": 1.27, "learning_rate": 0.00010954349747654756, "loss": 0.0087, "step": 489830 }, { "epoch": 1.27, "learning_rate": 0.0001095396092601761, "loss": 0.013, "step": 489840 }, { "epoch": 1.27, "learning_rate": 0.00010953572104380463, "loss": 0.0123, "step": 489850 }, { "epoch": 1.27, "learning_rate": 0.00010953183282743318, "loss": 0.0118, "step": 489860 }, { "epoch": 1.27, "learning_rate": 0.0001095279446110617, "loss": 0.0101, "step": 489870 }, { "epoch": 1.27, "learning_rate": 0.00010952405639469025, "loss": 0.0078, "step": 489880 }, { "epoch": 1.27, "learning_rate": 0.00010952016817831877, "loss": 0.0093, "step": 489890 }, { "epoch": 1.27, "learning_rate": 0.00010951627996194731, "loss": 0.008, "step": 489900 }, { "epoch": 1.27, "learning_rate": 0.00010951239174557584, "loss": 0.0142, "step": 489910 }, { "epoch": 1.27, "learning_rate": 0.00010950850352920438, "loss": 0.0092, "step": 489920 }, { "epoch": 1.27, "learning_rate": 0.00010950461531283291, "loss": 0.0106, "step": 489930 }, { "epoch": 1.27, "learning_rate": 0.00010950072709646145, "loss": 0.0092, "step": 489940 }, { "epoch": 1.27, "learning_rate": 0.00010949683888008998, "loss": 0.0081, "step": 489950 }, { "epoch": 1.27, "learning_rate": 0.00010949295066371854, "loss": 0.011, "step": 489960 }, { "epoch": 1.27, "learning_rate": 0.00010948906244734707, "loss": 0.0088, "step": 489970 }, { "epoch": 1.27, "learning_rate": 0.00010948517423097561, "loss": 0.0132, "step": 489980 }, { "epoch": 1.27, "learning_rate": 0.00010948128601460414, "loss": 0.0085, "step": 489990 }, { "epoch": 1.27, "learning_rate": 0.00010947739779823268, "loss": 0.008, "step": 490000 }, { "epoch": 1.27, "eval_cer": 0.8816690950367475, "eval_loss": 0.006557569373399019, "eval_runtime": 107.9754, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 490000 }, { "epoch": 1.27, "learning_rate": 0.0001094735095818612, "loss": 0.0084, "step": 490010 }, { "epoch": 1.27, "learning_rate": 0.00010946962136548973, "loss": 0.0097, "step": 490020 }, { "epoch": 1.27, "learning_rate": 0.00010946573314911827, "loss": 0.0102, "step": 490030 }, { "epoch": 1.27, "learning_rate": 0.0001094618449327468, "loss": 0.0091, "step": 490040 }, { "epoch": 1.27, "learning_rate": 0.00010945795671637534, "loss": 0.0095, "step": 490050 }, { "epoch": 1.27, "learning_rate": 0.00010945406850000387, "loss": 0.0085, "step": 490060 }, { "epoch": 1.27, "learning_rate": 0.00010945018028363241, "loss": 0.01, "step": 490070 }, { "epoch": 1.27, "learning_rate": 0.00010944629206726094, "loss": 0.0139, "step": 490080 }, { "epoch": 1.27, "learning_rate": 0.00010944240385088948, "loss": 0.0146, "step": 490090 }, { "epoch": 1.27, "learning_rate": 0.00010943851563451801, "loss": 0.0104, "step": 490100 }, { "epoch": 1.27, "learning_rate": 0.00010943462741814655, "loss": 0.0111, "step": 490110 }, { "epoch": 1.27, "learning_rate": 0.00010943073920177508, "loss": 0.0132, "step": 490120 }, { "epoch": 1.27, "learning_rate": 0.00010942685098540362, "loss": 0.0084, "step": 490130 }, { "epoch": 1.27, "learning_rate": 0.00010942296276903215, "loss": 0.0062, "step": 490140 }, { "epoch": 1.27, "learning_rate": 0.0001094190745526607, "loss": 0.0099, "step": 490150 }, { "epoch": 1.27, "learning_rate": 0.00010941518633628923, "loss": 0.0133, "step": 490160 }, { "epoch": 1.27, "learning_rate": 0.00010941129811991778, "loss": 0.0093, "step": 490170 }, { "epoch": 1.27, "learning_rate": 0.0001094074099035463, "loss": 0.0098, "step": 490180 }, { "epoch": 1.27, "learning_rate": 0.00010940352168717485, "loss": 0.0146, "step": 490190 }, { "epoch": 1.27, "learning_rate": 0.00010939963347080337, "loss": 0.0098, "step": 490200 }, { "epoch": 1.27, "learning_rate": 0.00010939574525443192, "loss": 0.0117, "step": 490210 }, { "epoch": 1.27, "learning_rate": 0.00010939185703806044, "loss": 0.0113, "step": 490220 }, { "epoch": 1.27, "learning_rate": 0.00010938796882168899, "loss": 0.0166, "step": 490230 }, { "epoch": 1.27, "learning_rate": 0.00010938408060531751, "loss": 0.0132, "step": 490240 }, { "epoch": 1.27, "learning_rate": 0.00010938019238894606, "loss": 0.0142, "step": 490250 }, { "epoch": 1.27, "learning_rate": 0.00010937630417257458, "loss": 0.0089, "step": 490260 }, { "epoch": 1.27, "learning_rate": 0.00010937241595620311, "loss": 0.0088, "step": 490270 }, { "epoch": 1.27, "learning_rate": 0.00010936852773983165, "loss": 0.0094, "step": 490280 }, { "epoch": 1.27, "learning_rate": 0.00010936463952346018, "loss": 0.0096, "step": 490290 }, { "epoch": 1.27, "learning_rate": 0.00010936075130708872, "loss": 0.0091, "step": 490300 }, { "epoch": 1.27, "learning_rate": 0.00010935686309071725, "loss": 0.0104, "step": 490310 }, { "epoch": 1.27, "learning_rate": 0.0001093529748743458, "loss": 0.0102, "step": 490320 }, { "epoch": 1.27, "learning_rate": 0.00010934908665797432, "loss": 0.0108, "step": 490330 }, { "epoch": 1.27, "learning_rate": 0.00010934519844160288, "loss": 0.0112, "step": 490340 }, { "epoch": 1.27, "learning_rate": 0.0001093413102252314, "loss": 0.0091, "step": 490350 }, { "epoch": 1.27, "learning_rate": 0.00010933742200885995, "loss": 0.011, "step": 490360 }, { "epoch": 1.27, "learning_rate": 0.00010933353379248847, "loss": 0.0107, "step": 490370 }, { "epoch": 1.27, "learning_rate": 0.00010932964557611702, "loss": 0.0121, "step": 490380 }, { "epoch": 1.27, "learning_rate": 0.00010932575735974554, "loss": 0.0151, "step": 490390 }, { "epoch": 1.27, "learning_rate": 0.00010932186914337409, "loss": 0.0122, "step": 490400 }, { "epoch": 1.27, "learning_rate": 0.00010931798092700261, "loss": 0.0086, "step": 490410 }, { "epoch": 1.27, "learning_rate": 0.00010931409271063115, "loss": 0.0099, "step": 490420 }, { "epoch": 1.27, "learning_rate": 0.00010931020449425968, "loss": 0.0099, "step": 490430 }, { "epoch": 1.27, "learning_rate": 0.00010930631627788822, "loss": 0.0119, "step": 490440 }, { "epoch": 1.27, "learning_rate": 0.00010930242806151675, "loss": 0.013, "step": 490450 }, { "epoch": 1.27, "learning_rate": 0.0001092985398451453, "loss": 0.0116, "step": 490460 }, { "epoch": 1.27, "learning_rate": 0.00010929465162877382, "loss": 0.0108, "step": 490470 }, { "epoch": 1.27, "learning_rate": 0.00010929076341240238, "loss": 0.0127, "step": 490480 }, { "epoch": 1.27, "learning_rate": 0.00010928687519603089, "loss": 0.0098, "step": 490490 }, { "epoch": 1.27, "learning_rate": 0.00010928298697965945, "loss": 0.0146, "step": 490500 }, { "epoch": 1.27, "learning_rate": 0.00010927909876328798, "loss": 0.0098, "step": 490510 }, { "epoch": 1.27, "learning_rate": 0.0001092752105469165, "loss": 0.009, "step": 490520 }, { "epoch": 1.27, "learning_rate": 0.00010927132233054505, "loss": 0.011, "step": 490530 }, { "epoch": 1.27, "learning_rate": 0.00010926743411417357, "loss": 0.0118, "step": 490540 }, { "epoch": 1.27, "learning_rate": 0.00010926354589780211, "loss": 0.0087, "step": 490550 }, { "epoch": 1.27, "learning_rate": 0.00010925965768143064, "loss": 0.0117, "step": 490560 }, { "epoch": 1.27, "learning_rate": 0.00010925576946505918, "loss": 0.0107, "step": 490570 }, { "epoch": 1.27, "learning_rate": 0.00010925188124868771, "loss": 0.0099, "step": 490580 }, { "epoch": 1.27, "learning_rate": 0.00010924799303231625, "loss": 0.0092, "step": 490590 }, { "epoch": 1.27, "learning_rate": 0.00010924410481594478, "loss": 0.0239, "step": 490600 }, { "epoch": 1.27, "learning_rate": 0.00010924021659957332, "loss": 0.0085, "step": 490610 }, { "epoch": 1.27, "learning_rate": 0.00010923632838320185, "loss": 0.0093, "step": 490620 }, { "epoch": 1.27, "learning_rate": 0.0001092324401668304, "loss": 0.0103, "step": 490630 }, { "epoch": 1.27, "learning_rate": 0.00010922855195045892, "loss": 0.0133, "step": 490640 }, { "epoch": 1.27, "learning_rate": 0.00010922466373408746, "loss": 0.0091, "step": 490650 }, { "epoch": 1.27, "learning_rate": 0.00010922077551771599, "loss": 0.0102, "step": 490660 }, { "epoch": 1.27, "learning_rate": 0.00010921688730134455, "loss": 0.0132, "step": 490670 }, { "epoch": 1.27, "learning_rate": 0.00010921299908497307, "loss": 0.0083, "step": 490680 }, { "epoch": 1.27, "learning_rate": 0.00010920911086860162, "loss": 0.0111, "step": 490690 }, { "epoch": 1.27, "learning_rate": 0.00010920522265223014, "loss": 0.011, "step": 490700 }, { "epoch": 1.27, "learning_rate": 0.00010920133443585869, "loss": 0.0082, "step": 490710 }, { "epoch": 1.27, "learning_rate": 0.00010919744621948721, "loss": 0.0091, "step": 490720 }, { "epoch": 1.27, "learning_rate": 0.00010919355800311576, "loss": 0.0122, "step": 490730 }, { "epoch": 1.27, "learning_rate": 0.00010918966978674428, "loss": 0.0105, "step": 490740 }, { "epoch": 1.27, "learning_rate": 0.00010918578157037283, "loss": 0.0063, "step": 490750 }, { "epoch": 1.27, "learning_rate": 0.00010918189335400135, "loss": 0.0099, "step": 490760 }, { "epoch": 1.27, "learning_rate": 0.00010917800513762988, "loss": 0.0106, "step": 490770 }, { "epoch": 1.27, "learning_rate": 0.00010917411692125842, "loss": 0.0114, "step": 490780 }, { "epoch": 1.27, "learning_rate": 0.00010917022870488695, "loss": 0.011, "step": 490790 }, { "epoch": 1.27, "learning_rate": 0.00010916634048851549, "loss": 0.0138, "step": 490800 }, { "epoch": 1.27, "learning_rate": 0.00010916245227214402, "loss": 0.0087, "step": 490810 }, { "epoch": 1.27, "learning_rate": 0.00010915856405577256, "loss": 0.0112, "step": 490820 }, { "epoch": 1.27, "learning_rate": 0.00010915467583940109, "loss": 0.0071, "step": 490830 }, { "epoch": 1.27, "learning_rate": 0.00010915078762302965, "loss": 0.0091, "step": 490840 }, { "epoch": 1.27, "learning_rate": 0.00010914689940665816, "loss": 0.0087, "step": 490850 }, { "epoch": 1.27, "learning_rate": 0.00010914301119028672, "loss": 0.0106, "step": 490860 }, { "epoch": 1.27, "learning_rate": 0.00010913912297391524, "loss": 0.0119, "step": 490870 }, { "epoch": 1.27, "learning_rate": 0.00010913523475754379, "loss": 0.0109, "step": 490880 }, { "epoch": 1.27, "learning_rate": 0.00010913134654117231, "loss": 0.0092, "step": 490890 }, { "epoch": 1.27, "learning_rate": 0.00010912745832480086, "loss": 0.0132, "step": 490900 }, { "epoch": 1.27, "learning_rate": 0.00010912357010842938, "loss": 0.0092, "step": 490910 }, { "epoch": 1.27, "learning_rate": 0.00010911968189205792, "loss": 0.0122, "step": 490920 }, { "epoch": 1.27, "learning_rate": 0.00010911579367568645, "loss": 0.01, "step": 490930 }, { "epoch": 1.27, "learning_rate": 0.000109111905459315, "loss": 0.0116, "step": 490940 }, { "epoch": 1.27, "learning_rate": 0.00010910801724294352, "loss": 0.0112, "step": 490950 }, { "epoch": 1.27, "learning_rate": 0.00010910412902657206, "loss": 0.0124, "step": 490960 }, { "epoch": 1.27, "learning_rate": 0.00010910024081020059, "loss": 0.0115, "step": 490970 }, { "epoch": 1.27, "learning_rate": 0.00010909635259382913, "loss": 0.0104, "step": 490980 }, { "epoch": 1.27, "learning_rate": 0.00010909246437745766, "loss": 0.0092, "step": 490990 }, { "epoch": 1.27, "learning_rate": 0.00010908857616108622, "loss": 0.0107, "step": 491000 }, { "epoch": 1.27, "eval_cer": 0.881688689953826, "eval_loss": 0.0065551563166081905, "eval_runtime": 108.1856, "eval_samples_per_second": 18.487, "eval_steps_per_second": 4.622, "step": 491000 }, { "epoch": 1.27, "learning_rate": 0.00010908468794471473, "loss": 0.0098, "step": 491010 }, { "epoch": 1.27, "learning_rate": 0.00010908079972834326, "loss": 0.012, "step": 491020 }, { "epoch": 1.27, "learning_rate": 0.00010907691151197182, "loss": 0.0071, "step": 491030 }, { "epoch": 1.27, "learning_rate": 0.00010907302329560034, "loss": 0.0105, "step": 491040 }, { "epoch": 1.27, "learning_rate": 0.00010906913507922888, "loss": 0.0105, "step": 491050 }, { "epoch": 1.27, "learning_rate": 0.00010906524686285741, "loss": 0.0105, "step": 491060 }, { "epoch": 1.27, "learning_rate": 0.00010906135864648595, "loss": 0.0108, "step": 491070 }, { "epoch": 1.27, "learning_rate": 0.00010905747043011448, "loss": 0.01, "step": 491080 }, { "epoch": 1.27, "learning_rate": 0.00010905358221374302, "loss": 0.012, "step": 491090 }, { "epoch": 1.27, "learning_rate": 0.00010904969399737155, "loss": 0.0113, "step": 491100 }, { "epoch": 1.27, "learning_rate": 0.0001090458057810001, "loss": 0.0099, "step": 491110 }, { "epoch": 1.27, "learning_rate": 0.00010904191756462862, "loss": 0.0106, "step": 491120 }, { "epoch": 1.27, "learning_rate": 0.00010903802934825716, "loss": 0.0084, "step": 491130 }, { "epoch": 1.27, "learning_rate": 0.00010903414113188569, "loss": 0.0151, "step": 491140 }, { "epoch": 1.27, "learning_rate": 0.00010903025291551423, "loss": 0.0129, "step": 491150 }, { "epoch": 1.27, "learning_rate": 0.00010902636469914276, "loss": 0.0115, "step": 491160 }, { "epoch": 1.27, "learning_rate": 0.0001090224764827713, "loss": 0.0089, "step": 491170 }, { "epoch": 1.27, "learning_rate": 0.00010901858826639983, "loss": 0.0119, "step": 491180 }, { "epoch": 1.27, "learning_rate": 0.00010901470005002839, "loss": 0.0122, "step": 491190 }, { "epoch": 1.27, "learning_rate": 0.00010901081183365691, "loss": 0.0085, "step": 491200 }, { "epoch": 1.27, "learning_rate": 0.00010900692361728546, "loss": 0.0139, "step": 491210 }, { "epoch": 1.27, "learning_rate": 0.00010900303540091398, "loss": 0.0117, "step": 491220 }, { "epoch": 1.27, "learning_rate": 0.00010899914718454253, "loss": 0.014, "step": 491230 }, { "epoch": 1.27, "learning_rate": 0.00010899525896817105, "loss": 0.0108, "step": 491240 }, { "epoch": 1.27, "learning_rate": 0.0001089913707517996, "loss": 0.0077, "step": 491250 }, { "epoch": 1.27, "learning_rate": 0.00010898748253542812, "loss": 0.0142, "step": 491260 }, { "epoch": 1.27, "learning_rate": 0.00010898359431905665, "loss": 0.0101, "step": 491270 }, { "epoch": 1.27, "learning_rate": 0.0001089797061026852, "loss": 0.013, "step": 491280 }, { "epoch": 1.27, "learning_rate": 0.00010897581788631372, "loss": 0.0086, "step": 491290 }, { "epoch": 1.27, "learning_rate": 0.00010897192966994226, "loss": 0.0127, "step": 491300 }, { "epoch": 1.27, "learning_rate": 0.00010896804145357079, "loss": 0.0085, "step": 491310 }, { "epoch": 1.27, "learning_rate": 0.00010896415323719933, "loss": 0.0094, "step": 491320 }, { "epoch": 1.27, "learning_rate": 0.00010896026502082786, "loss": 0.0106, "step": 491330 }, { "epoch": 1.27, "learning_rate": 0.0001089563768044564, "loss": 0.01, "step": 491340 }, { "epoch": 1.27, "learning_rate": 0.00010895248858808493, "loss": 0.0105, "step": 491350 }, { "epoch": 1.27, "learning_rate": 0.00010894860037171349, "loss": 0.0118, "step": 491360 }, { "epoch": 1.27, "learning_rate": 0.000108944712155342, "loss": 0.0167, "step": 491370 }, { "epoch": 1.27, "learning_rate": 0.00010894082393897056, "loss": 0.012, "step": 491380 }, { "epoch": 1.27, "learning_rate": 0.00010893693572259908, "loss": 0.0094, "step": 491390 }, { "epoch": 1.27, "learning_rate": 0.00010893304750622763, "loss": 0.0114, "step": 491400 }, { "epoch": 1.27, "learning_rate": 0.00010892915928985615, "loss": 0.0108, "step": 491410 }, { "epoch": 1.27, "learning_rate": 0.0001089252710734847, "loss": 0.0079, "step": 491420 }, { "epoch": 1.27, "learning_rate": 0.00010892138285711322, "loss": 0.0091, "step": 491430 }, { "epoch": 1.27, "learning_rate": 0.00010891749464074176, "loss": 0.0118, "step": 491440 }, { "epoch": 1.27, "learning_rate": 0.00010891360642437029, "loss": 0.0102, "step": 491450 }, { "epoch": 1.27, "learning_rate": 0.00010890971820799883, "loss": 0.0084, "step": 491460 }, { "epoch": 1.27, "learning_rate": 0.00010890582999162736, "loss": 0.0085, "step": 491470 }, { "epoch": 1.27, "learning_rate": 0.0001089019417752559, "loss": 0.0111, "step": 491480 }, { "epoch": 1.27, "learning_rate": 0.00010889805355888443, "loss": 0.0087, "step": 491490 }, { "epoch": 1.27, "learning_rate": 0.00010889416534251296, "loss": 0.0128, "step": 491500 }, { "epoch": 1.27, "learning_rate": 0.0001088902771261415, "loss": 0.0105, "step": 491510 }, { "epoch": 1.27, "learning_rate": 0.00010888638890977003, "loss": 0.01, "step": 491520 }, { "epoch": 1.27, "learning_rate": 0.00010888250069339857, "loss": 0.0089, "step": 491530 }, { "epoch": 1.27, "learning_rate": 0.0001088786124770271, "loss": 0.0122, "step": 491540 }, { "epoch": 1.27, "learning_rate": 0.00010887472426065566, "loss": 0.0119, "step": 491550 }, { "epoch": 1.27, "learning_rate": 0.00010887083604428418, "loss": 0.0105, "step": 491560 }, { "epoch": 1.27, "learning_rate": 0.00010886694782791272, "loss": 0.0089, "step": 491570 }, { "epoch": 1.27, "learning_rate": 0.00010886305961154125, "loss": 0.0103, "step": 491580 }, { "epoch": 1.27, "learning_rate": 0.0001088591713951698, "loss": 0.0123, "step": 491590 }, { "epoch": 1.27, "learning_rate": 0.00010885528317879832, "loss": 0.0108, "step": 491600 }, { "epoch": 1.27, "learning_rate": 0.00010885139496242686, "loss": 0.0095, "step": 491610 }, { "epoch": 1.27, "learning_rate": 0.00010884750674605539, "loss": 0.0141, "step": 491620 }, { "epoch": 1.27, "learning_rate": 0.00010884361852968393, "loss": 0.0106, "step": 491630 }, { "epoch": 1.27, "learning_rate": 0.00010883973031331246, "loss": 0.016, "step": 491640 }, { "epoch": 1.27, "learning_rate": 0.000108835842096941, "loss": 0.0118, "step": 491650 }, { "epoch": 1.27, "learning_rate": 0.00010883195388056953, "loss": 0.0128, "step": 491660 }, { "epoch": 1.27, "learning_rate": 0.00010882806566419807, "loss": 0.01, "step": 491670 }, { "epoch": 1.27, "learning_rate": 0.0001088241774478266, "loss": 0.0087, "step": 491680 }, { "epoch": 1.27, "learning_rate": 0.00010882028923145514, "loss": 0.0138, "step": 491690 }, { "epoch": 1.27, "learning_rate": 0.00010881640101508367, "loss": 0.0082, "step": 491700 }, { "epoch": 1.27, "learning_rate": 0.00010881251279871223, "loss": 0.0109, "step": 491710 }, { "epoch": 1.27, "learning_rate": 0.00010880862458234074, "loss": 0.0095, "step": 491720 }, { "epoch": 1.27, "learning_rate": 0.0001088047363659693, "loss": 0.0119, "step": 491730 }, { "epoch": 1.27, "learning_rate": 0.00010880084814959782, "loss": 0.0093, "step": 491740 }, { "epoch": 1.27, "learning_rate": 0.00010879695993322635, "loss": 0.0083, "step": 491750 }, { "epoch": 1.27, "learning_rate": 0.0001087930717168549, "loss": 0.008, "step": 491760 }, { "epoch": 1.27, "learning_rate": 0.00010878918350048342, "loss": 0.0147, "step": 491770 }, { "epoch": 1.27, "learning_rate": 0.00010878529528411196, "loss": 0.0082, "step": 491780 }, { "epoch": 1.27, "learning_rate": 0.00010878140706774049, "loss": 0.0161, "step": 491790 }, { "epoch": 1.27, "learning_rate": 0.00010877751885136903, "loss": 0.0102, "step": 491800 }, { "epoch": 1.27, "learning_rate": 0.00010877363063499756, "loss": 0.0142, "step": 491810 }, { "epoch": 1.27, "learning_rate": 0.0001087697424186261, "loss": 0.009, "step": 491820 }, { "epoch": 1.27, "learning_rate": 0.00010876585420225463, "loss": 0.0105, "step": 491830 }, { "epoch": 1.27, "learning_rate": 0.00010876196598588317, "loss": 0.0081, "step": 491840 }, { "epoch": 1.27, "learning_rate": 0.0001087580777695117, "loss": 0.0109, "step": 491850 }, { "epoch": 1.27, "learning_rate": 0.00010875418955314024, "loss": 0.0072, "step": 491860 }, { "epoch": 1.27, "learning_rate": 0.00010875030133676877, "loss": 0.0088, "step": 491870 }, { "epoch": 1.28, "learning_rate": 0.00010874641312039731, "loss": 0.0093, "step": 491880 }, { "epoch": 1.28, "learning_rate": 0.00010874252490402584, "loss": 0.0104, "step": 491890 }, { "epoch": 1.28, "learning_rate": 0.0001087386366876544, "loss": 0.0114, "step": 491900 }, { "epoch": 1.28, "learning_rate": 0.00010873474847128292, "loss": 0.0133, "step": 491910 }, { "epoch": 1.28, "learning_rate": 0.00010873086025491147, "loss": 0.0139, "step": 491920 }, { "epoch": 1.28, "learning_rate": 0.00010872697203854, "loss": 0.007, "step": 491930 }, { "epoch": 1.28, "learning_rate": 0.00010872308382216854, "loss": 0.0099, "step": 491940 }, { "epoch": 1.28, "learning_rate": 0.00010871919560579706, "loss": 0.0114, "step": 491950 }, { "epoch": 1.28, "learning_rate": 0.0001087153073894256, "loss": 0.0061, "step": 491960 }, { "epoch": 1.28, "learning_rate": 0.00010871141917305413, "loss": 0.0075, "step": 491970 }, { "epoch": 1.28, "learning_rate": 0.00010870753095668267, "loss": 0.0091, "step": 491980 }, { "epoch": 1.28, "learning_rate": 0.0001087036427403112, "loss": 0.009, "step": 491990 }, { "epoch": 1.28, "learning_rate": 0.00010869975452393973, "loss": 0.0135, "step": 492000 }, { "epoch": 1.28, "eval_cer": 0.8816453012088664, "eval_loss": 0.006531266961246729, "eval_runtime": 108.0198, "eval_samples_per_second": 18.515, "eval_steps_per_second": 4.629, "step": 492000 }, { "epoch": 1.28, "learning_rate": 0.00010869586630756827, "loss": 0.0092, "step": 492010 }, { "epoch": 1.28, "learning_rate": 0.0001086919780911968, "loss": 0.0085, "step": 492020 }, { "epoch": 1.28, "learning_rate": 0.00010868808987482534, "loss": 0.0098, "step": 492030 }, { "epoch": 1.28, "learning_rate": 0.00010868420165845387, "loss": 0.014, "step": 492040 }, { "epoch": 1.28, "learning_rate": 0.00010868031344208241, "loss": 0.0102, "step": 492050 }, { "epoch": 1.28, "learning_rate": 0.00010867642522571094, "loss": 0.0096, "step": 492060 }, { "epoch": 1.28, "learning_rate": 0.0001086725370093395, "loss": 0.0102, "step": 492070 }, { "epoch": 1.28, "learning_rate": 0.00010866864879296801, "loss": 0.0113, "step": 492080 }, { "epoch": 1.28, "learning_rate": 0.00010866476057659656, "loss": 0.0103, "step": 492090 }, { "epoch": 1.28, "learning_rate": 0.00010866087236022509, "loss": 0.0127, "step": 492100 }, { "epoch": 1.28, "learning_rate": 0.00010865698414385363, "loss": 0.0083, "step": 492110 }, { "epoch": 1.28, "learning_rate": 0.00010865309592748216, "loss": 0.0093, "step": 492120 }, { "epoch": 1.28, "learning_rate": 0.0001086492077111107, "loss": 0.0074, "step": 492130 }, { "epoch": 1.28, "learning_rate": 0.00010864531949473923, "loss": 0.0087, "step": 492140 }, { "epoch": 1.28, "learning_rate": 0.00010864143127836777, "loss": 0.0124, "step": 492150 }, { "epoch": 1.28, "learning_rate": 0.0001086375430619963, "loss": 0.0106, "step": 492160 }, { "epoch": 1.28, "learning_rate": 0.00010863365484562484, "loss": 0.0103, "step": 492170 }, { "epoch": 1.28, "learning_rate": 0.00010862976662925337, "loss": 0.0111, "step": 492180 }, { "epoch": 1.28, "learning_rate": 0.00010862587841288191, "loss": 0.0125, "step": 492190 }, { "epoch": 1.28, "learning_rate": 0.00010862199019651044, "loss": 0.0103, "step": 492200 }, { "epoch": 1.28, "learning_rate": 0.00010861810198013898, "loss": 0.0108, "step": 492210 }, { "epoch": 1.28, "learning_rate": 0.00010861421376376751, "loss": 0.0109, "step": 492220 }, { "epoch": 1.28, "learning_rate": 0.00010861032554739607, "loss": 0.01, "step": 492230 }, { "epoch": 1.28, "learning_rate": 0.00010860643733102458, "loss": 0.0089, "step": 492240 }, { "epoch": 1.28, "learning_rate": 0.00010860254911465311, "loss": 0.0096, "step": 492250 }, { "epoch": 1.28, "learning_rate": 0.00010859866089828166, "loss": 0.0131, "step": 492260 }, { "epoch": 1.28, "learning_rate": 0.00010859477268191019, "loss": 0.0119, "step": 492270 }, { "epoch": 1.28, "learning_rate": 0.00010859088446553873, "loss": 0.0091, "step": 492280 }, { "epoch": 1.28, "learning_rate": 0.00010858699624916726, "loss": 0.0076, "step": 492290 }, { "epoch": 1.28, "learning_rate": 0.0001085831080327958, "loss": 0.01, "step": 492300 }, { "epoch": 1.28, "learning_rate": 0.00010857921981642433, "loss": 0.0108, "step": 492310 }, { "epoch": 1.28, "learning_rate": 0.00010857533160005287, "loss": 0.0112, "step": 492320 }, { "epoch": 1.28, "learning_rate": 0.0001085714433836814, "loss": 0.0125, "step": 492330 }, { "epoch": 1.28, "learning_rate": 0.00010856755516730994, "loss": 0.0097, "step": 492340 }, { "epoch": 1.28, "learning_rate": 0.00010856366695093847, "loss": 0.0105, "step": 492350 }, { "epoch": 1.28, "learning_rate": 0.00010855977873456701, "loss": 0.0121, "step": 492360 }, { "epoch": 1.28, "learning_rate": 0.00010855589051819554, "loss": 0.0102, "step": 492370 }, { "epoch": 1.28, "learning_rate": 0.00010855200230182408, "loss": 0.0108, "step": 492380 }, { "epoch": 1.28, "learning_rate": 0.00010854811408545261, "loss": 0.0084, "step": 492390 }, { "epoch": 1.28, "learning_rate": 0.00010854422586908115, "loss": 0.0094, "step": 492400 }, { "epoch": 1.28, "learning_rate": 0.00010854033765270968, "loss": 0.0104, "step": 492410 }, { "epoch": 1.28, "learning_rate": 0.00010853644943633824, "loss": 0.0079, "step": 492420 }, { "epoch": 1.28, "learning_rate": 0.00010853256121996676, "loss": 0.0129, "step": 492430 }, { "epoch": 1.28, "learning_rate": 0.0001085286730035953, "loss": 0.0104, "step": 492440 }, { "epoch": 1.28, "learning_rate": 0.00010852478478722383, "loss": 0.0123, "step": 492450 }, { "epoch": 1.28, "learning_rate": 0.00010852089657085237, "loss": 0.0111, "step": 492460 }, { "epoch": 1.28, "learning_rate": 0.0001085170083544809, "loss": 0.0116, "step": 492470 }, { "epoch": 1.28, "learning_rate": 0.00010851312013810944, "loss": 0.0098, "step": 492480 }, { "epoch": 1.28, "learning_rate": 0.00010850923192173797, "loss": 0.0104, "step": 492490 }, { "epoch": 1.28, "learning_rate": 0.0001085053437053665, "loss": 0.0107, "step": 492500 }, { "epoch": 1.28, "learning_rate": 0.00010850145548899504, "loss": 0.0131, "step": 492510 }, { "epoch": 1.28, "learning_rate": 0.00010849756727262357, "loss": 0.0113, "step": 492520 }, { "epoch": 1.28, "learning_rate": 0.00010849367905625211, "loss": 0.0102, "step": 492530 }, { "epoch": 1.28, "learning_rate": 0.00010848979083988064, "loss": 0.0104, "step": 492540 }, { "epoch": 1.28, "learning_rate": 0.00010848590262350918, "loss": 0.0079, "step": 492550 }, { "epoch": 1.28, "learning_rate": 0.00010848201440713771, "loss": 0.0106, "step": 492560 }, { "epoch": 1.28, "learning_rate": 0.00010847812619076625, "loss": 0.0141, "step": 492570 }, { "epoch": 1.28, "learning_rate": 0.00010847423797439478, "loss": 0.0074, "step": 492580 }, { "epoch": 1.28, "learning_rate": 0.00010847034975802333, "loss": 0.0109, "step": 492590 }, { "epoch": 1.28, "learning_rate": 0.00010846646154165185, "loss": 0.0102, "step": 492600 }, { "epoch": 1.28, "learning_rate": 0.0001084625733252804, "loss": 0.0123, "step": 492610 }, { "epoch": 1.28, "learning_rate": 0.00010845868510890893, "loss": 0.0109, "step": 492620 }, { "epoch": 1.28, "learning_rate": 0.00010845479689253747, "loss": 0.0111, "step": 492630 }, { "epoch": 1.28, "learning_rate": 0.000108450908676166, "loss": 0.0102, "step": 492640 }, { "epoch": 1.28, "learning_rate": 0.00010844702045979454, "loss": 0.0093, "step": 492650 }, { "epoch": 1.28, "learning_rate": 0.00010844313224342307, "loss": 0.0136, "step": 492660 }, { "epoch": 1.28, "learning_rate": 0.00010843924402705161, "loss": 0.0103, "step": 492670 }, { "epoch": 1.28, "learning_rate": 0.00010843535581068014, "loss": 0.0098, "step": 492680 }, { "epoch": 1.28, "learning_rate": 0.00010843146759430868, "loss": 0.0106, "step": 492690 }, { "epoch": 1.28, "learning_rate": 0.00010842757937793721, "loss": 0.009, "step": 492700 }, { "epoch": 1.28, "learning_rate": 0.00010842369116156575, "loss": 0.0105, "step": 492710 }, { "epoch": 1.28, "learning_rate": 0.00010841980294519428, "loss": 0.0102, "step": 492720 }, { "epoch": 1.28, "learning_rate": 0.00010841591472882282, "loss": 0.0106, "step": 492730 }, { "epoch": 1.28, "learning_rate": 0.00010841202651245135, "loss": 0.0057, "step": 492740 }, { "epoch": 1.28, "learning_rate": 0.00010840813829607988, "loss": 0.0092, "step": 492750 }, { "epoch": 1.28, "learning_rate": 0.00010840425007970842, "loss": 0.0085, "step": 492760 }, { "epoch": 1.28, "learning_rate": 0.00010840036186333695, "loss": 0.0131, "step": 492770 }, { "epoch": 1.28, "learning_rate": 0.0001083964736469655, "loss": 0.0114, "step": 492780 }, { "epoch": 1.28, "learning_rate": 0.00010839258543059403, "loss": 0.0098, "step": 492790 }, { "epoch": 1.28, "learning_rate": 0.00010838869721422257, "loss": 0.0096, "step": 492800 }, { "epoch": 1.28, "learning_rate": 0.0001083848089978511, "loss": 0.0114, "step": 492810 }, { "epoch": 1.28, "learning_rate": 0.00010838092078147964, "loss": 0.0105, "step": 492820 }, { "epoch": 1.28, "learning_rate": 0.00010837703256510817, "loss": 0.01, "step": 492830 }, { "epoch": 1.28, "learning_rate": 0.00010837314434873671, "loss": 0.0104, "step": 492840 }, { "epoch": 1.28, "learning_rate": 0.00010836925613236524, "loss": 0.0147, "step": 492850 }, { "epoch": 1.28, "learning_rate": 0.00010836536791599378, "loss": 0.011, "step": 492860 }, { "epoch": 1.28, "learning_rate": 0.00010836147969962231, "loss": 0.0141, "step": 492870 }, { "epoch": 1.28, "learning_rate": 0.00010835759148325085, "loss": 0.0142, "step": 492880 }, { "epoch": 1.28, "learning_rate": 0.00010835370326687938, "loss": 0.012, "step": 492890 }, { "epoch": 1.28, "learning_rate": 0.00010834981505050792, "loss": 0.0092, "step": 492900 }, { "epoch": 1.28, "learning_rate": 0.00010834592683413645, "loss": 0.0144, "step": 492910 }, { "epoch": 1.28, "learning_rate": 0.00010834203861776499, "loss": 0.0133, "step": 492920 }, { "epoch": 1.28, "learning_rate": 0.00010833815040139352, "loss": 0.0113, "step": 492930 }, { "epoch": 1.28, "learning_rate": 0.00010833426218502208, "loss": 0.0066, "step": 492940 }, { "epoch": 1.28, "learning_rate": 0.00010833037396865059, "loss": 0.0123, "step": 492950 }, { "epoch": 1.28, "learning_rate": 0.00010832648575227915, "loss": 0.0134, "step": 492960 }, { "epoch": 1.28, "learning_rate": 0.00010832259753590767, "loss": 0.0112, "step": 492970 }, { "epoch": 1.28, "learning_rate": 0.00010831870931953621, "loss": 0.0103, "step": 492980 }, { "epoch": 1.28, "learning_rate": 0.00010831482110316474, "loss": 0.0117, "step": 492990 }, { "epoch": 1.28, "learning_rate": 0.00010831093288679327, "loss": 0.0076, "step": 493000 }, { "epoch": 1.28, "eval_cer": 0.8816564983043399, "eval_loss": 0.006680097430944443, "eval_runtime": 108.037, "eval_samples_per_second": 18.512, "eval_steps_per_second": 4.628, "step": 493000 }, { "epoch": 1.28, "learning_rate": 0.00010830704467042181, "loss": 0.0096, "step": 493010 }, { "epoch": 1.28, "learning_rate": 0.00010830315645405034, "loss": 0.0117, "step": 493020 }, { "epoch": 1.28, "learning_rate": 0.00010829926823767888, "loss": 0.0087, "step": 493030 }, { "epoch": 1.28, "learning_rate": 0.00010829538002130741, "loss": 0.008, "step": 493040 }, { "epoch": 1.28, "learning_rate": 0.00010829149180493595, "loss": 0.0101, "step": 493050 }, { "epoch": 1.28, "learning_rate": 0.00010828760358856448, "loss": 0.0079, "step": 493060 }, { "epoch": 1.28, "learning_rate": 0.00010828371537219302, "loss": 0.0122, "step": 493070 }, { "epoch": 1.28, "learning_rate": 0.00010827982715582155, "loss": 0.0109, "step": 493080 }, { "epoch": 1.28, "learning_rate": 0.00010827593893945009, "loss": 0.0112, "step": 493090 }, { "epoch": 1.28, "learning_rate": 0.00010827205072307862, "loss": 0.0115, "step": 493100 }, { "epoch": 1.28, "learning_rate": 0.00010826816250670716, "loss": 0.0114, "step": 493110 }, { "epoch": 1.28, "learning_rate": 0.00010826427429033569, "loss": 0.0081, "step": 493120 }, { "epoch": 1.28, "learning_rate": 0.00010826038607396424, "loss": 0.0095, "step": 493130 }, { "epoch": 1.28, "learning_rate": 0.00010825649785759277, "loss": 0.0097, "step": 493140 }, { "epoch": 1.28, "learning_rate": 0.00010825260964122131, "loss": 0.0108, "step": 493150 }, { "epoch": 1.28, "learning_rate": 0.00010824872142484984, "loss": 0.0094, "step": 493160 }, { "epoch": 1.28, "learning_rate": 0.00010824483320847838, "loss": 0.01, "step": 493170 }, { "epoch": 1.28, "learning_rate": 0.00010824094499210691, "loss": 0.0093, "step": 493180 }, { "epoch": 1.28, "learning_rate": 0.00010823705677573545, "loss": 0.0085, "step": 493190 }, { "epoch": 1.28, "learning_rate": 0.00010823316855936398, "loss": 0.0076, "step": 493200 }, { "epoch": 1.28, "learning_rate": 0.00010822928034299252, "loss": 0.0091, "step": 493210 }, { "epoch": 1.28, "learning_rate": 0.00010822539212662105, "loss": 0.0094, "step": 493220 }, { "epoch": 1.28, "learning_rate": 0.00010822150391024959, "loss": 0.0085, "step": 493230 }, { "epoch": 1.28, "learning_rate": 0.00010821761569387812, "loss": 0.0118, "step": 493240 }, { "epoch": 1.28, "learning_rate": 0.00010821372747750665, "loss": 0.0116, "step": 493250 }, { "epoch": 1.28, "learning_rate": 0.00010820983926113519, "loss": 0.014, "step": 493260 }, { "epoch": 1.28, "learning_rate": 0.00010820595104476372, "loss": 0.0081, "step": 493270 }, { "epoch": 1.28, "learning_rate": 0.00010820206282839226, "loss": 0.008, "step": 493280 }, { "epoch": 1.28, "learning_rate": 0.00010819817461202079, "loss": 0.0096, "step": 493290 }, { "epoch": 1.28, "learning_rate": 0.00010819428639564934, "loss": 0.0114, "step": 493300 }, { "epoch": 1.28, "learning_rate": 0.00010819039817927786, "loss": 0.0104, "step": 493310 }, { "epoch": 1.28, "learning_rate": 0.00010818650996290641, "loss": 0.0109, "step": 493320 }, { "epoch": 1.28, "learning_rate": 0.00010818262174653494, "loss": 0.0128, "step": 493330 }, { "epoch": 1.28, "learning_rate": 0.00010817873353016348, "loss": 0.0108, "step": 493340 }, { "epoch": 1.28, "learning_rate": 0.00010817484531379201, "loss": 0.0123, "step": 493350 }, { "epoch": 1.28, "learning_rate": 0.00010817095709742055, "loss": 0.0093, "step": 493360 }, { "epoch": 1.28, "learning_rate": 0.00010816706888104908, "loss": 0.0168, "step": 493370 }, { "epoch": 1.28, "learning_rate": 0.00010816318066467762, "loss": 0.0118, "step": 493380 }, { "epoch": 1.28, "learning_rate": 0.00010815929244830615, "loss": 0.0097, "step": 493390 }, { "epoch": 1.28, "learning_rate": 0.00010815540423193469, "loss": 0.0072, "step": 493400 }, { "epoch": 1.28, "learning_rate": 0.00010815151601556322, "loss": 0.0117, "step": 493410 }, { "epoch": 1.28, "learning_rate": 0.00010814762779919176, "loss": 0.0099, "step": 493420 }, { "epoch": 1.28, "learning_rate": 0.00010814373958282029, "loss": 0.0135, "step": 493430 }, { "epoch": 1.28, "learning_rate": 0.00010813985136644883, "loss": 0.0103, "step": 493440 }, { "epoch": 1.28, "learning_rate": 0.00010813596315007736, "loss": 0.0111, "step": 493450 }, { "epoch": 1.28, "learning_rate": 0.00010813207493370592, "loss": 0.0122, "step": 493460 }, { "epoch": 1.28, "learning_rate": 0.00010812818671733443, "loss": 0.0086, "step": 493470 }, { "epoch": 1.28, "learning_rate": 0.00010812429850096299, "loss": 0.0115, "step": 493480 }, { "epoch": 1.28, "learning_rate": 0.00010812041028459151, "loss": 0.0086, "step": 493490 }, { "epoch": 1.28, "learning_rate": 0.00010811652206822004, "loss": 0.0097, "step": 493500 }, { "epoch": 1.28, "learning_rate": 0.00010811263385184858, "loss": 0.0098, "step": 493510 }, { "epoch": 1.28, "learning_rate": 0.00010810874563547711, "loss": 0.008, "step": 493520 }, { "epoch": 1.28, "learning_rate": 0.00010810485741910565, "loss": 0.0091, "step": 493530 }, { "epoch": 1.28, "learning_rate": 0.00010810096920273418, "loss": 0.0098, "step": 493540 }, { "epoch": 1.28, "learning_rate": 0.00010809708098636272, "loss": 0.0086, "step": 493550 }, { "epoch": 1.28, "learning_rate": 0.00010809319276999125, "loss": 0.0081, "step": 493560 }, { "epoch": 1.28, "learning_rate": 0.00010808930455361979, "loss": 0.0085, "step": 493570 }, { "epoch": 1.28, "learning_rate": 0.00010808541633724832, "loss": 0.009, "step": 493580 }, { "epoch": 1.28, "learning_rate": 0.00010808152812087686, "loss": 0.0109, "step": 493590 }, { "epoch": 1.28, "learning_rate": 0.00010807763990450539, "loss": 0.0103, "step": 493600 }, { "epoch": 1.28, "learning_rate": 0.00010807375168813393, "loss": 0.0078, "step": 493610 }, { "epoch": 1.28, "learning_rate": 0.00010806986347176246, "loss": 0.0082, "step": 493620 }, { "epoch": 1.28, "learning_rate": 0.000108065975255391, "loss": 0.0101, "step": 493630 }, { "epoch": 1.28, "learning_rate": 0.00010806208703901953, "loss": 0.0092, "step": 493640 }, { "epoch": 1.28, "learning_rate": 0.00010805819882264808, "loss": 0.0116, "step": 493650 }, { "epoch": 1.28, "learning_rate": 0.00010805431060627661, "loss": 0.012, "step": 493660 }, { "epoch": 1.28, "learning_rate": 0.00010805042238990515, "loss": 0.0082, "step": 493670 }, { "epoch": 1.28, "learning_rate": 0.00010804653417353368, "loss": 0.0146, "step": 493680 }, { "epoch": 1.28, "learning_rate": 0.00010804264595716222, "loss": 0.0109, "step": 493690 }, { "epoch": 1.28, "learning_rate": 0.00010803875774079075, "loss": 0.0108, "step": 493700 }, { "epoch": 1.28, "learning_rate": 0.0001080348695244193, "loss": 0.0137, "step": 493710 }, { "epoch": 1.28, "learning_rate": 0.00010803098130804782, "loss": 0.011, "step": 493720 }, { "epoch": 1.28, "learning_rate": 0.00010802709309167636, "loss": 0.0073, "step": 493730 }, { "epoch": 1.28, "learning_rate": 0.00010802320487530489, "loss": 0.0096, "step": 493740 }, { "epoch": 1.28, "learning_rate": 0.00010801931665893342, "loss": 0.0104, "step": 493750 }, { "epoch": 1.28, "learning_rate": 0.00010801542844256196, "loss": 0.013, "step": 493760 }, { "epoch": 1.28, "learning_rate": 0.00010801154022619049, "loss": 0.01, "step": 493770 }, { "epoch": 1.28, "learning_rate": 0.00010800765200981903, "loss": 0.0115, "step": 493780 }, { "epoch": 1.28, "learning_rate": 0.00010800376379344756, "loss": 0.0109, "step": 493790 }, { "epoch": 1.28, "learning_rate": 0.0001079998755770761, "loss": 0.0077, "step": 493800 }, { "epoch": 1.28, "learning_rate": 0.00010799598736070463, "loss": 0.0107, "step": 493810 }, { "epoch": 1.28, "learning_rate": 0.00010799209914433318, "loss": 0.0069, "step": 493820 }, { "epoch": 1.28, "learning_rate": 0.0001079882109279617, "loss": 0.0101, "step": 493830 }, { "epoch": 1.28, "learning_rate": 0.00010798432271159025, "loss": 0.01, "step": 493840 }, { "epoch": 1.28, "learning_rate": 0.00010798043449521878, "loss": 0.0096, "step": 493850 }, { "epoch": 1.28, "learning_rate": 0.00010797654627884732, "loss": 0.0104, "step": 493860 }, { "epoch": 1.28, "learning_rate": 0.00010797265806247585, "loss": 0.009, "step": 493870 }, { "epoch": 1.28, "learning_rate": 0.00010796876984610439, "loss": 0.0083, "step": 493880 }, { "epoch": 1.28, "learning_rate": 0.00010796488162973292, "loss": 0.0104, "step": 493890 }, { "epoch": 1.28, "learning_rate": 0.00010796099341336146, "loss": 0.0081, "step": 493900 }, { "epoch": 1.28, "learning_rate": 0.00010795710519698999, "loss": 0.0093, "step": 493910 }, { "epoch": 1.28, "learning_rate": 0.00010795321698061853, "loss": 0.0082, "step": 493920 }, { "epoch": 1.28, "learning_rate": 0.00010794932876424706, "loss": 0.0086, "step": 493930 }, { "epoch": 1.28, "learning_rate": 0.0001079454405478756, "loss": 0.0103, "step": 493940 }, { "epoch": 1.28, "learning_rate": 0.00010794155233150413, "loss": 0.0098, "step": 493950 }, { "epoch": 1.28, "learning_rate": 0.00010793766411513267, "loss": 0.0116, "step": 493960 }, { "epoch": 1.28, "learning_rate": 0.0001079337758987612, "loss": 0.0096, "step": 493970 }, { "epoch": 1.28, "learning_rate": 0.00010792988768238976, "loss": 0.008, "step": 493980 }, { "epoch": 1.28, "learning_rate": 0.00010792599946601827, "loss": 0.0093, "step": 493990 }, { "epoch": 1.28, "learning_rate": 0.0001079221112496468, "loss": 0.01, "step": 494000 }, { "epoch": 1.28, "eval_cer": 0.88167329394755, "eval_loss": 0.006551279220730066, "eval_runtime": 107.9937, "eval_samples_per_second": 18.52, "eval_steps_per_second": 4.63, "step": 494000 }, { "epoch": 1.28, "learning_rate": 0.00010791822303327535, "loss": 0.0097, "step": 494010 }, { "epoch": 1.28, "learning_rate": 0.00010791433481690388, "loss": 0.0124, "step": 494020 }, { "epoch": 1.28, "learning_rate": 0.00010791044660053242, "loss": 0.0112, "step": 494030 }, { "epoch": 1.28, "learning_rate": 0.00010790655838416095, "loss": 0.0111, "step": 494040 }, { "epoch": 1.28, "learning_rate": 0.00010790267016778949, "loss": 0.0097, "step": 494050 }, { "epoch": 1.28, "learning_rate": 0.00010789878195141802, "loss": 0.0103, "step": 494060 }, { "epoch": 1.28, "learning_rate": 0.00010789489373504656, "loss": 0.0115, "step": 494070 }, { "epoch": 1.28, "learning_rate": 0.00010789100551867509, "loss": 0.0091, "step": 494080 }, { "epoch": 1.28, "learning_rate": 0.00010788711730230363, "loss": 0.0099, "step": 494090 }, { "epoch": 1.28, "learning_rate": 0.00010788322908593216, "loss": 0.0139, "step": 494100 }, { "epoch": 1.28, "learning_rate": 0.0001078793408695607, "loss": 0.0087, "step": 494110 }, { "epoch": 1.28, "learning_rate": 0.00010787545265318923, "loss": 0.0086, "step": 494120 }, { "epoch": 1.28, "learning_rate": 0.00010787156443681777, "loss": 0.0093, "step": 494130 }, { "epoch": 1.28, "learning_rate": 0.0001078676762204463, "loss": 0.0089, "step": 494140 }, { "epoch": 1.28, "learning_rate": 0.00010786378800407484, "loss": 0.0122, "step": 494150 }, { "epoch": 1.28, "learning_rate": 0.00010785989978770337, "loss": 0.0164, "step": 494160 }, { "epoch": 1.28, "learning_rate": 0.00010785601157133192, "loss": 0.0125, "step": 494170 }, { "epoch": 1.28, "learning_rate": 0.00010785212335496045, "loss": 0.0124, "step": 494180 }, { "epoch": 1.28, "learning_rate": 0.000107848235138589, "loss": 0.0105, "step": 494190 }, { "epoch": 1.28, "learning_rate": 0.00010784434692221752, "loss": 0.01, "step": 494200 }, { "epoch": 1.28, "learning_rate": 0.00010784045870584606, "loss": 0.0107, "step": 494210 }, { "epoch": 1.28, "learning_rate": 0.00010783657048947459, "loss": 0.0095, "step": 494220 }, { "epoch": 1.28, "learning_rate": 0.00010783268227310312, "loss": 0.0137, "step": 494230 }, { "epoch": 1.28, "learning_rate": 0.00010782879405673166, "loss": 0.0096, "step": 494240 }, { "epoch": 1.28, "learning_rate": 0.00010782490584036019, "loss": 0.0117, "step": 494250 }, { "epoch": 1.28, "learning_rate": 0.00010782101762398873, "loss": 0.0115, "step": 494260 }, { "epoch": 1.28, "learning_rate": 0.00010781712940761726, "loss": 0.0091, "step": 494270 }, { "epoch": 1.28, "learning_rate": 0.0001078132411912458, "loss": 0.0117, "step": 494280 }, { "epoch": 1.28, "learning_rate": 0.00010780935297487433, "loss": 0.0095, "step": 494290 }, { "epoch": 1.28, "learning_rate": 0.00010780546475850287, "loss": 0.0148, "step": 494300 }, { "epoch": 1.28, "learning_rate": 0.0001078015765421314, "loss": 0.0091, "step": 494310 }, { "epoch": 1.28, "learning_rate": 0.00010779768832575994, "loss": 0.0097, "step": 494320 }, { "epoch": 1.28, "learning_rate": 0.00010779380010938847, "loss": 0.009, "step": 494330 }, { "epoch": 1.28, "learning_rate": 0.00010778991189301701, "loss": 0.0124, "step": 494340 }, { "epoch": 1.28, "learning_rate": 0.00010778602367664554, "loss": 0.0123, "step": 494350 }, { "epoch": 1.28, "learning_rate": 0.0001077821354602741, "loss": 0.0111, "step": 494360 }, { "epoch": 1.28, "learning_rate": 0.00010777824724390262, "loss": 0.0104, "step": 494370 }, { "epoch": 1.28, "learning_rate": 0.00010777435902753116, "loss": 0.01, "step": 494380 }, { "epoch": 1.28, "learning_rate": 0.00010777047081115969, "loss": 0.0111, "step": 494390 }, { "epoch": 1.28, "learning_rate": 0.00010776658259478823, "loss": 0.0104, "step": 494400 }, { "epoch": 1.28, "learning_rate": 0.00010776269437841676, "loss": 0.0129, "step": 494410 }, { "epoch": 1.28, "learning_rate": 0.0001077588061620453, "loss": 0.0094, "step": 494420 }, { "epoch": 1.28, "learning_rate": 0.00010775491794567383, "loss": 0.0113, "step": 494430 }, { "epoch": 1.28, "learning_rate": 0.00010775102972930237, "loss": 0.0101, "step": 494440 }, { "epoch": 1.28, "learning_rate": 0.0001077471415129309, "loss": 0.0119, "step": 494450 }, { "epoch": 1.28, "learning_rate": 0.00010774325329655944, "loss": 0.0101, "step": 494460 }, { "epoch": 1.28, "learning_rate": 0.00010773936508018797, "loss": 0.0111, "step": 494470 }, { "epoch": 1.28, "learning_rate": 0.0001077354768638165, "loss": 0.0064, "step": 494480 }, { "epoch": 1.28, "learning_rate": 0.00010773158864744504, "loss": 0.0087, "step": 494490 }, { "epoch": 1.28, "learning_rate": 0.00010772770043107357, "loss": 0.0076, "step": 494500 }, { "epoch": 1.28, "learning_rate": 0.00010772381221470211, "loss": 0.0131, "step": 494510 }, { "epoch": 1.28, "learning_rate": 0.00010771992399833064, "loss": 0.0092, "step": 494520 }, { "epoch": 1.28, "learning_rate": 0.00010771603578195919, "loss": 0.0089, "step": 494530 }, { "epoch": 1.28, "learning_rate": 0.00010771214756558771, "loss": 0.008, "step": 494540 }, { "epoch": 1.28, "learning_rate": 0.00010770825934921626, "loss": 0.0106, "step": 494550 }, { "epoch": 1.28, "learning_rate": 0.00010770437113284479, "loss": 0.0095, "step": 494560 }, { "epoch": 1.28, "learning_rate": 0.00010770048291647333, "loss": 0.0074, "step": 494570 }, { "epoch": 1.28, "learning_rate": 0.00010769659470010186, "loss": 0.0081, "step": 494580 }, { "epoch": 1.28, "learning_rate": 0.0001076927064837304, "loss": 0.0077, "step": 494590 }, { "epoch": 1.28, "learning_rate": 0.00010768881826735893, "loss": 0.0075, "step": 494600 }, { "epoch": 1.28, "learning_rate": 0.00010768493005098747, "loss": 0.0107, "step": 494610 }, { "epoch": 1.28, "learning_rate": 0.000107681041834616, "loss": 0.0087, "step": 494620 }, { "epoch": 1.28, "learning_rate": 0.00010767715361824454, "loss": 0.0085, "step": 494630 }, { "epoch": 1.28, "learning_rate": 0.00010767326540187307, "loss": 0.0124, "step": 494640 }, { "epoch": 1.28, "learning_rate": 0.00010766937718550161, "loss": 0.0107, "step": 494650 }, { "epoch": 1.28, "learning_rate": 0.00010766548896913014, "loss": 0.0097, "step": 494660 }, { "epoch": 1.28, "learning_rate": 0.00010766160075275868, "loss": 0.0089, "step": 494670 }, { "epoch": 1.28, "learning_rate": 0.00010765771253638721, "loss": 0.011, "step": 494680 }, { "epoch": 1.28, "learning_rate": 0.00010765382432001576, "loss": 0.0099, "step": 494690 }, { "epoch": 1.28, "learning_rate": 0.00010764993610364428, "loss": 0.0092, "step": 494700 }, { "epoch": 1.28, "learning_rate": 0.00010764604788727283, "loss": 0.0106, "step": 494710 }, { "epoch": 1.28, "learning_rate": 0.00010764215967090136, "loss": 0.0087, "step": 494720 }, { "epoch": 1.28, "learning_rate": 0.00010763827145452989, "loss": 0.0082, "step": 494730 }, { "epoch": 1.28, "learning_rate": 0.00010763438323815843, "loss": 0.0084, "step": 494740 }, { "epoch": 1.28, "learning_rate": 0.00010763049502178696, "loss": 0.0099, "step": 494750 }, { "epoch": 1.28, "learning_rate": 0.0001076266068054155, "loss": 0.0092, "step": 494760 }, { "epoch": 1.28, "learning_rate": 0.00010762271858904403, "loss": 0.0197, "step": 494770 }, { "epoch": 1.28, "learning_rate": 0.00010761883037267257, "loss": 0.0097, "step": 494780 }, { "epoch": 1.28, "learning_rate": 0.0001076149421563011, "loss": 0.0088, "step": 494790 }, { "epoch": 1.28, "learning_rate": 0.00010761105393992964, "loss": 0.0119, "step": 494800 }, { "epoch": 1.28, "learning_rate": 0.00010760716572355817, "loss": 0.0114, "step": 494810 }, { "epoch": 1.28, "learning_rate": 0.00010760327750718671, "loss": 0.0111, "step": 494820 }, { "epoch": 1.28, "learning_rate": 0.00010759938929081524, "loss": 0.0129, "step": 494830 }, { "epoch": 1.28, "learning_rate": 0.00010759550107444378, "loss": 0.0085, "step": 494840 }, { "epoch": 1.28, "learning_rate": 0.00010759161285807231, "loss": 0.0108, "step": 494850 }, { "epoch": 1.28, "learning_rate": 0.00010758772464170085, "loss": 0.009, "step": 494860 }, { "epoch": 1.28, "learning_rate": 0.00010758383642532938, "loss": 0.0092, "step": 494870 }, { "epoch": 1.28, "learning_rate": 0.00010757994820895793, "loss": 0.0102, "step": 494880 }, { "epoch": 1.28, "learning_rate": 0.00010757605999258646, "loss": 0.0106, "step": 494890 }, { "epoch": 1.28, "learning_rate": 0.000107572171776215, "loss": 0.0135, "step": 494900 }, { "epoch": 1.28, "learning_rate": 0.00010756828355984353, "loss": 0.0169, "step": 494910 }, { "epoch": 1.28, "learning_rate": 0.00010756439534347207, "loss": 0.0116, "step": 494920 }, { "epoch": 1.28, "learning_rate": 0.0001075605071271006, "loss": 0.0101, "step": 494930 }, { "epoch": 1.28, "learning_rate": 0.00010755661891072914, "loss": 0.0085, "step": 494940 }, { "epoch": 1.28, "learning_rate": 0.00010755273069435767, "loss": 0.0112, "step": 494950 }, { "epoch": 1.28, "learning_rate": 0.00010754884247798621, "loss": 0.0095, "step": 494960 }, { "epoch": 1.28, "learning_rate": 0.00010754495426161474, "loss": 0.0103, "step": 494970 }, { "epoch": 1.28, "learning_rate": 0.00010754106604524327, "loss": 0.007, "step": 494980 }, { "epoch": 1.28, "learning_rate": 0.00010753717782887181, "loss": 0.0136, "step": 494990 }, { "epoch": 1.28, "learning_rate": 0.00010753328961250034, "loss": 0.0112, "step": 495000 }, { "epoch": 1.28, "eval_cer": 0.8816704946736816, "eval_loss": 0.006601433735340834, "eval_runtime": 108.0099, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 495000 }, { "epoch": 1.28, "learning_rate": 0.00010752940139612888, "loss": 0.0162, "step": 495010 }, { "epoch": 1.28, "learning_rate": 0.00010752551317975741, "loss": 0.0107, "step": 495020 }, { "epoch": 1.28, "learning_rate": 0.00010752162496338595, "loss": 0.0105, "step": 495030 }, { "epoch": 1.28, "learning_rate": 0.00010751773674701448, "loss": 0.0094, "step": 495040 }, { "epoch": 1.28, "learning_rate": 0.00010751384853064303, "loss": 0.0117, "step": 495050 }, { "epoch": 1.28, "learning_rate": 0.00010750996031427155, "loss": 0.0102, "step": 495060 }, { "epoch": 1.28, "learning_rate": 0.0001075060720979001, "loss": 0.0123, "step": 495070 }, { "epoch": 1.28, "learning_rate": 0.00010750218388152863, "loss": 0.0124, "step": 495080 }, { "epoch": 1.28, "learning_rate": 0.00010749829566515717, "loss": 0.0106, "step": 495090 }, { "epoch": 1.28, "learning_rate": 0.0001074944074487857, "loss": 0.0078, "step": 495100 }, { "epoch": 1.28, "learning_rate": 0.00010749051923241424, "loss": 0.0091, "step": 495110 }, { "epoch": 1.28, "learning_rate": 0.00010748663101604277, "loss": 0.0098, "step": 495120 }, { "epoch": 1.28, "learning_rate": 0.00010748274279967131, "loss": 0.011, "step": 495130 }, { "epoch": 1.28, "learning_rate": 0.00010747885458329984, "loss": 0.0107, "step": 495140 }, { "epoch": 1.28, "learning_rate": 0.00010747496636692838, "loss": 0.0094, "step": 495150 }, { "epoch": 1.28, "learning_rate": 0.00010747107815055691, "loss": 0.008, "step": 495160 }, { "epoch": 1.28, "learning_rate": 0.00010746718993418545, "loss": 0.0103, "step": 495170 }, { "epoch": 1.28, "learning_rate": 0.00010746330171781398, "loss": 0.0087, "step": 495180 }, { "epoch": 1.28, "learning_rate": 0.00010745941350144252, "loss": 0.012, "step": 495190 }, { "epoch": 1.28, "learning_rate": 0.00010745552528507105, "loss": 0.008, "step": 495200 }, { "epoch": 1.28, "learning_rate": 0.0001074516370686996, "loss": 0.0086, "step": 495210 }, { "epoch": 1.28, "learning_rate": 0.00010744774885232812, "loss": 0.0092, "step": 495220 }, { "epoch": 1.28, "learning_rate": 0.00010744386063595665, "loss": 0.0114, "step": 495230 }, { "epoch": 1.28, "learning_rate": 0.0001074399724195852, "loss": 0.0091, "step": 495240 }, { "epoch": 1.28, "learning_rate": 0.00010743608420321373, "loss": 0.0103, "step": 495250 }, { "epoch": 1.28, "learning_rate": 0.00010743219598684227, "loss": 0.0085, "step": 495260 }, { "epoch": 1.28, "learning_rate": 0.0001074283077704708, "loss": 0.0093, "step": 495270 }, { "epoch": 1.28, "learning_rate": 0.00010742441955409934, "loss": 0.0122, "step": 495280 }, { "epoch": 1.28, "learning_rate": 0.00010742053133772787, "loss": 0.0153, "step": 495290 }, { "epoch": 1.28, "learning_rate": 0.00010741664312135641, "loss": 0.0086, "step": 495300 }, { "epoch": 1.28, "learning_rate": 0.00010741275490498494, "loss": 0.0117, "step": 495310 }, { "epoch": 1.28, "learning_rate": 0.00010740886668861348, "loss": 0.0085, "step": 495320 }, { "epoch": 1.28, "learning_rate": 0.00010740497847224201, "loss": 0.0105, "step": 495330 }, { "epoch": 1.28, "learning_rate": 0.00010740109025587055, "loss": 0.0085, "step": 495340 }, { "epoch": 1.28, "learning_rate": 0.00010739720203949908, "loss": 0.0107, "step": 495350 }, { "epoch": 1.28, "learning_rate": 0.00010739331382312762, "loss": 0.0087, "step": 495360 }, { "epoch": 1.28, "learning_rate": 0.00010738942560675615, "loss": 0.009, "step": 495370 }, { "epoch": 1.28, "learning_rate": 0.00010738553739038469, "loss": 0.0093, "step": 495380 }, { "epoch": 1.28, "learning_rate": 0.00010738164917401322, "loss": 0.0095, "step": 495390 }, { "epoch": 1.28, "learning_rate": 0.00010737776095764177, "loss": 0.0169, "step": 495400 }, { "epoch": 1.28, "learning_rate": 0.0001073738727412703, "loss": 0.0092, "step": 495410 }, { "epoch": 1.28, "learning_rate": 0.00010736998452489884, "loss": 0.0122, "step": 495420 }, { "epoch": 1.28, "learning_rate": 0.00010736609630852737, "loss": 0.0087, "step": 495430 }, { "epoch": 1.28, "learning_rate": 0.00010736220809215591, "loss": 0.0078, "step": 495440 }, { "epoch": 1.28, "learning_rate": 0.00010735831987578444, "loss": 0.0091, "step": 495450 }, { "epoch": 1.28, "learning_rate": 0.00010735443165941298, "loss": 0.0102, "step": 495460 }, { "epoch": 1.28, "learning_rate": 0.00010735054344304151, "loss": 0.0084, "step": 495470 }, { "epoch": 1.28, "learning_rate": 0.00010734665522667004, "loss": 0.0078, "step": 495480 }, { "epoch": 1.28, "learning_rate": 0.00010734276701029858, "loss": 0.0092, "step": 495490 }, { "epoch": 1.28, "learning_rate": 0.00010733887879392711, "loss": 0.0099, "step": 495500 }, { "epoch": 1.28, "learning_rate": 0.00010733499057755565, "loss": 0.0082, "step": 495510 }, { "epoch": 1.28, "learning_rate": 0.00010733110236118418, "loss": 0.0118, "step": 495520 }, { "epoch": 1.28, "learning_rate": 0.00010732721414481272, "loss": 0.0091, "step": 495530 }, { "epoch": 1.28, "learning_rate": 0.00010732332592844125, "loss": 0.0106, "step": 495540 }, { "epoch": 1.28, "learning_rate": 0.00010731943771206979, "loss": 0.0077, "step": 495550 }, { "epoch": 1.28, "learning_rate": 0.00010731554949569832, "loss": 0.0123, "step": 495560 }, { "epoch": 1.28, "learning_rate": 0.00010731166127932686, "loss": 0.0086, "step": 495570 }, { "epoch": 1.28, "learning_rate": 0.00010730777306295539, "loss": 0.0101, "step": 495580 }, { "epoch": 1.28, "learning_rate": 0.00010730388484658394, "loss": 0.0121, "step": 495590 }, { "epoch": 1.28, "learning_rate": 0.00010729999663021247, "loss": 0.0114, "step": 495600 }, { "epoch": 1.28, "learning_rate": 0.00010729610841384101, "loss": 0.0099, "step": 495610 }, { "epoch": 1.28, "learning_rate": 0.00010729222019746954, "loss": 0.0106, "step": 495620 }, { "epoch": 1.28, "learning_rate": 0.00010728833198109808, "loss": 0.0101, "step": 495630 }, { "epoch": 1.28, "learning_rate": 0.00010728444376472661, "loss": 0.0119, "step": 495640 }, { "epoch": 1.28, "learning_rate": 0.00010728055554835515, "loss": 0.0122, "step": 495650 }, { "epoch": 1.28, "learning_rate": 0.00010727666733198368, "loss": 0.0145, "step": 495660 }, { "epoch": 1.28, "learning_rate": 0.00010727277911561222, "loss": 0.0088, "step": 495670 }, { "epoch": 1.28, "learning_rate": 0.00010726889089924075, "loss": 0.0093, "step": 495680 }, { "epoch": 1.28, "learning_rate": 0.00010726500268286929, "loss": 0.0104, "step": 495690 }, { "epoch": 1.28, "learning_rate": 0.00010726111446649782, "loss": 0.0111, "step": 495700 }, { "epoch": 1.28, "learning_rate": 0.00010725722625012636, "loss": 0.0111, "step": 495710 }, { "epoch": 1.28, "learning_rate": 0.00010725333803375489, "loss": 0.0097, "step": 495720 }, { "epoch": 1.29, "learning_rate": 0.00010724944981738342, "loss": 0.0108, "step": 495730 }, { "epoch": 1.29, "learning_rate": 0.00010724556160101196, "loss": 0.0108, "step": 495740 }, { "epoch": 1.29, "learning_rate": 0.00010724167338464049, "loss": 0.0105, "step": 495750 }, { "epoch": 1.29, "learning_rate": 0.00010723778516826904, "loss": 0.0145, "step": 495760 }, { "epoch": 1.29, "learning_rate": 0.00010723389695189757, "loss": 0.0082, "step": 495770 }, { "epoch": 1.29, "learning_rate": 0.00010723000873552611, "loss": 0.0109, "step": 495780 }, { "epoch": 1.29, "learning_rate": 0.00010722612051915464, "loss": 0.0108, "step": 495790 }, { "epoch": 1.29, "learning_rate": 0.00010722223230278318, "loss": 0.0104, "step": 495800 }, { "epoch": 1.29, "learning_rate": 0.00010721834408641171, "loss": 0.0078, "step": 495810 }, { "epoch": 1.29, "learning_rate": 0.00010721445587004025, "loss": 0.0085, "step": 495820 }, { "epoch": 1.29, "learning_rate": 0.00010721056765366878, "loss": 0.0082, "step": 495830 }, { "epoch": 1.29, "learning_rate": 0.00010720667943729732, "loss": 0.0093, "step": 495840 }, { "epoch": 1.29, "learning_rate": 0.00010720279122092585, "loss": 0.0099, "step": 495850 }, { "epoch": 1.29, "learning_rate": 0.00010719890300455439, "loss": 0.0122, "step": 495860 }, { "epoch": 1.29, "learning_rate": 0.00010719501478818292, "loss": 0.0092, "step": 495870 }, { "epoch": 1.29, "learning_rate": 0.00010719112657181146, "loss": 0.0109, "step": 495880 }, { "epoch": 1.29, "learning_rate": 0.00010718723835543999, "loss": 0.0101, "step": 495890 }, { "epoch": 1.29, "learning_rate": 0.00010718335013906853, "loss": 0.0135, "step": 495900 }, { "epoch": 1.29, "learning_rate": 0.00010717946192269706, "loss": 0.0102, "step": 495910 }, { "epoch": 1.29, "learning_rate": 0.00010717557370632561, "loss": 0.0068, "step": 495920 }, { "epoch": 1.29, "learning_rate": 0.00010717168548995413, "loss": 0.0115, "step": 495930 }, { "epoch": 1.29, "learning_rate": 0.00010716779727358268, "loss": 0.0155, "step": 495940 }, { "epoch": 1.29, "learning_rate": 0.00010716390905721121, "loss": 0.0086, "step": 495950 }, { "epoch": 1.29, "learning_rate": 0.00010716002084083975, "loss": 0.0116, "step": 495960 }, { "epoch": 1.29, "learning_rate": 0.00010715613262446828, "loss": 0.0096, "step": 495970 }, { "epoch": 1.29, "learning_rate": 0.00010715224440809681, "loss": 0.0116, "step": 495980 }, { "epoch": 1.29, "learning_rate": 0.00010714835619172535, "loss": 0.0115, "step": 495990 }, { "epoch": 1.29, "learning_rate": 0.00010714446797535388, "loss": 0.0088, "step": 496000 }, { "epoch": 1.29, "eval_cer": 0.8816648961259449, "eval_loss": 0.006738040130585432, "eval_runtime": 107.9676, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 496000 }, { "epoch": 1.29, "learning_rate": 0.00010714057975898242, "loss": 0.0116, "step": 496010 }, { "epoch": 1.29, "learning_rate": 0.00010713669154261095, "loss": 0.0111, "step": 496020 }, { "epoch": 1.29, "learning_rate": 0.00010713280332623949, "loss": 0.0107, "step": 496030 }, { "epoch": 1.29, "learning_rate": 0.00010712891510986802, "loss": 0.011, "step": 496040 }, { "epoch": 1.29, "learning_rate": 0.00010712502689349656, "loss": 0.0103, "step": 496050 }, { "epoch": 1.29, "learning_rate": 0.00010712113867712509, "loss": 0.0132, "step": 496060 }, { "epoch": 1.29, "learning_rate": 0.00010711725046075363, "loss": 0.0085, "step": 496070 }, { "epoch": 1.29, "learning_rate": 0.00010711336224438216, "loss": 0.0088, "step": 496080 }, { "epoch": 1.29, "learning_rate": 0.0001071094740280107, "loss": 0.0131, "step": 496090 }, { "epoch": 1.29, "learning_rate": 0.00010710558581163923, "loss": 0.0156, "step": 496100 }, { "epoch": 1.29, "learning_rate": 0.00010710169759526778, "loss": 0.0097, "step": 496110 }, { "epoch": 1.29, "learning_rate": 0.00010709780937889631, "loss": 0.0092, "step": 496120 }, { "epoch": 1.29, "learning_rate": 0.00010709392116252485, "loss": 0.0118, "step": 496130 }, { "epoch": 1.29, "learning_rate": 0.00010709003294615338, "loss": 0.0121, "step": 496140 }, { "epoch": 1.29, "learning_rate": 0.00010708614472978192, "loss": 0.0135, "step": 496150 }, { "epoch": 1.29, "learning_rate": 0.00010708225651341045, "loss": 0.0092, "step": 496160 }, { "epoch": 1.29, "learning_rate": 0.00010707836829703899, "loss": 0.0097, "step": 496170 }, { "epoch": 1.29, "learning_rate": 0.00010707448008066752, "loss": 0.0109, "step": 496180 }, { "epoch": 1.29, "learning_rate": 0.00010707059186429606, "loss": 0.0089, "step": 496190 }, { "epoch": 1.29, "learning_rate": 0.00010706670364792459, "loss": 0.0139, "step": 496200 }, { "epoch": 1.29, "learning_rate": 0.00010706281543155313, "loss": 0.011, "step": 496210 }, { "epoch": 1.29, "learning_rate": 0.00010705892721518166, "loss": 0.0124, "step": 496220 }, { "epoch": 1.29, "learning_rate": 0.00010705503899881019, "loss": 0.0108, "step": 496230 }, { "epoch": 1.29, "learning_rate": 0.00010705115078243873, "loss": 0.0127, "step": 496240 }, { "epoch": 1.29, "learning_rate": 0.00010704726256606726, "loss": 0.0099, "step": 496250 }, { "epoch": 1.29, "learning_rate": 0.0001070433743496958, "loss": 0.0101, "step": 496260 }, { "epoch": 1.29, "learning_rate": 0.00010703948613332433, "loss": 0.0122, "step": 496270 }, { "epoch": 1.29, "learning_rate": 0.00010703559791695288, "loss": 0.0091, "step": 496280 }, { "epoch": 1.29, "learning_rate": 0.0001070317097005814, "loss": 0.0109, "step": 496290 }, { "epoch": 1.29, "learning_rate": 0.00010702782148420995, "loss": 0.0103, "step": 496300 }, { "epoch": 1.29, "learning_rate": 0.00010702393326783848, "loss": 0.0081, "step": 496310 }, { "epoch": 1.29, "learning_rate": 0.00010702004505146702, "loss": 0.0093, "step": 496320 }, { "epoch": 1.29, "learning_rate": 0.00010701615683509555, "loss": 0.01, "step": 496330 }, { "epoch": 1.29, "learning_rate": 0.00010701226861872409, "loss": 0.0078, "step": 496340 }, { "epoch": 1.29, "learning_rate": 0.00010700838040235262, "loss": 0.0103, "step": 496350 }, { "epoch": 1.29, "learning_rate": 0.00010700449218598116, "loss": 0.008, "step": 496360 }, { "epoch": 1.29, "learning_rate": 0.00010700060396960969, "loss": 0.0079, "step": 496370 }, { "epoch": 1.29, "learning_rate": 0.00010699671575323823, "loss": 0.0134, "step": 496380 }, { "epoch": 1.29, "learning_rate": 0.00010699282753686676, "loss": 0.0094, "step": 496390 }, { "epoch": 1.29, "learning_rate": 0.0001069889393204953, "loss": 0.0101, "step": 496400 }, { "epoch": 1.29, "learning_rate": 0.00010698505110412383, "loss": 0.0126, "step": 496410 }, { "epoch": 1.29, "learning_rate": 0.00010698116288775237, "loss": 0.0115, "step": 496420 }, { "epoch": 1.29, "learning_rate": 0.0001069772746713809, "loss": 0.0108, "step": 496430 }, { "epoch": 1.29, "learning_rate": 0.00010697338645500945, "loss": 0.012, "step": 496440 }, { "epoch": 1.29, "learning_rate": 0.00010696949823863797, "loss": 0.0081, "step": 496450 }, { "epoch": 1.29, "learning_rate": 0.00010696561002226652, "loss": 0.013, "step": 496460 }, { "epoch": 1.29, "learning_rate": 0.00010696172180589505, "loss": 0.012, "step": 496470 }, { "epoch": 1.29, "learning_rate": 0.00010695783358952358, "loss": 0.012, "step": 496480 }, { "epoch": 1.29, "learning_rate": 0.00010695394537315212, "loss": 0.0088, "step": 496490 }, { "epoch": 1.29, "learning_rate": 0.00010695005715678065, "loss": 0.0107, "step": 496500 }, { "epoch": 1.29, "learning_rate": 0.00010694616894040919, "loss": 0.0118, "step": 496510 }, { "epoch": 1.29, "learning_rate": 0.00010694228072403772, "loss": 0.0155, "step": 496520 }, { "epoch": 1.29, "learning_rate": 0.00010693839250766626, "loss": 0.01, "step": 496530 }, { "epoch": 1.29, "learning_rate": 0.00010693450429129479, "loss": 0.0084, "step": 496540 }, { "epoch": 1.29, "learning_rate": 0.00010693061607492333, "loss": 0.0116, "step": 496550 }, { "epoch": 1.29, "learning_rate": 0.00010692672785855186, "loss": 0.0137, "step": 496560 }, { "epoch": 1.29, "learning_rate": 0.0001069228396421804, "loss": 0.0096, "step": 496570 }, { "epoch": 1.29, "learning_rate": 0.00010691895142580893, "loss": 0.0094, "step": 496580 }, { "epoch": 1.29, "learning_rate": 0.00010691506320943747, "loss": 0.0089, "step": 496590 }, { "epoch": 1.29, "learning_rate": 0.000106911174993066, "loss": 0.0083, "step": 496600 }, { "epoch": 1.29, "learning_rate": 0.00010690728677669454, "loss": 0.0116, "step": 496610 }, { "epoch": 1.29, "learning_rate": 0.00010690339856032307, "loss": 0.0115, "step": 496620 }, { "epoch": 1.29, "learning_rate": 0.00010689951034395162, "loss": 0.0113, "step": 496630 }, { "epoch": 1.29, "learning_rate": 0.00010689562212758015, "loss": 0.0094, "step": 496640 }, { "epoch": 1.29, "learning_rate": 0.00010689173391120869, "loss": 0.0097, "step": 496650 }, { "epoch": 1.29, "learning_rate": 0.00010688784569483722, "loss": 0.0098, "step": 496660 }, { "epoch": 1.29, "learning_rate": 0.00010688395747846576, "loss": 0.0095, "step": 496670 }, { "epoch": 1.29, "learning_rate": 0.00010688006926209429, "loss": 0.0087, "step": 496680 }, { "epoch": 1.29, "learning_rate": 0.00010687618104572283, "loss": 0.0123, "step": 496690 }, { "epoch": 1.29, "learning_rate": 0.00010687229282935136, "loss": 0.0117, "step": 496700 }, { "epoch": 1.29, "learning_rate": 0.00010686840461297989, "loss": 0.0094, "step": 496710 }, { "epoch": 1.29, "learning_rate": 0.00010686451639660843, "loss": 0.011, "step": 496720 }, { "epoch": 1.29, "learning_rate": 0.00010686062818023696, "loss": 0.0142, "step": 496730 }, { "epoch": 1.29, "learning_rate": 0.0001068567399638655, "loss": 0.0084, "step": 496740 }, { "epoch": 1.29, "learning_rate": 0.00010685285174749403, "loss": 0.0105, "step": 496750 }, { "epoch": 1.29, "learning_rate": 0.00010684896353112257, "loss": 0.012, "step": 496760 }, { "epoch": 1.29, "learning_rate": 0.0001068450753147511, "loss": 0.0099, "step": 496770 }, { "epoch": 1.29, "learning_rate": 0.00010684118709837964, "loss": 0.0086, "step": 496780 }, { "epoch": 1.29, "learning_rate": 0.00010683729888200817, "loss": 0.0152, "step": 496790 }, { "epoch": 1.29, "learning_rate": 0.00010683341066563672, "loss": 0.0131, "step": 496800 }, { "epoch": 1.29, "learning_rate": 0.00010682952244926524, "loss": 0.0103, "step": 496810 }, { "epoch": 1.29, "learning_rate": 0.00010682563423289379, "loss": 0.0128, "step": 496820 }, { "epoch": 1.29, "learning_rate": 0.00010682174601652232, "loss": 0.0106, "step": 496830 }, { "epoch": 1.29, "learning_rate": 0.00010681785780015086, "loss": 0.0084, "step": 496840 }, { "epoch": 1.29, "learning_rate": 0.00010681396958377939, "loss": 0.009, "step": 496850 }, { "epoch": 1.29, "learning_rate": 0.00010681008136740793, "loss": 0.0095, "step": 496860 }, { "epoch": 1.29, "learning_rate": 0.00010680619315103646, "loss": 0.0098, "step": 496870 }, { "epoch": 1.29, "learning_rate": 0.000106802304934665, "loss": 0.0098, "step": 496880 }, { "epoch": 1.29, "learning_rate": 0.00010679841671829353, "loss": 0.0075, "step": 496890 }, { "epoch": 1.29, "learning_rate": 0.00010679452850192207, "loss": 0.0086, "step": 496900 }, { "epoch": 1.29, "learning_rate": 0.0001067906402855506, "loss": 0.0099, "step": 496910 }, { "epoch": 1.29, "learning_rate": 0.00010678675206917914, "loss": 0.0096, "step": 496920 }, { "epoch": 1.29, "learning_rate": 0.00010678286385280767, "loss": 0.0104, "step": 496930 }, { "epoch": 1.29, "learning_rate": 0.00010677897563643621, "loss": 0.0099, "step": 496940 }, { "epoch": 1.29, "learning_rate": 0.00010677508742006474, "loss": 0.0124, "step": 496950 }, { "epoch": 1.29, "learning_rate": 0.00010677119920369327, "loss": 0.0116, "step": 496960 }, { "epoch": 1.29, "learning_rate": 0.00010676731098732181, "loss": 0.0104, "step": 496970 }, { "epoch": 1.29, "learning_rate": 0.00010676342277095034, "loss": 0.0131, "step": 496980 }, { "epoch": 1.29, "learning_rate": 0.00010675953455457889, "loss": 0.0099, "step": 496990 }, { "epoch": 1.29, "learning_rate": 0.00010675564633820742, "loss": 0.0082, "step": 497000 }, { "epoch": 1.29, "eval_cer": 0.881657897941274, "eval_loss": 0.006887293886393309, "eval_runtime": 108.0582, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 497000 }, { "epoch": 1.29, "learning_rate": 0.00010675175812183596, "loss": 0.0097, "step": 497010 }, { "epoch": 1.29, "learning_rate": 0.00010674786990546449, "loss": 0.0097, "step": 497020 }, { "epoch": 1.29, "learning_rate": 0.00010674398168909303, "loss": 0.01, "step": 497030 }, { "epoch": 1.29, "learning_rate": 0.00010674009347272156, "loss": 0.011, "step": 497040 }, { "epoch": 1.29, "learning_rate": 0.0001067362052563501, "loss": 0.0094, "step": 497050 }, { "epoch": 1.29, "learning_rate": 0.00010673231703997863, "loss": 0.0088, "step": 497060 }, { "epoch": 1.29, "learning_rate": 0.00010672842882360717, "loss": 0.0109, "step": 497070 }, { "epoch": 1.29, "learning_rate": 0.0001067245406072357, "loss": 0.0114, "step": 497080 }, { "epoch": 1.29, "learning_rate": 0.00010672065239086424, "loss": 0.0101, "step": 497090 }, { "epoch": 1.29, "learning_rate": 0.00010671676417449277, "loss": 0.011, "step": 497100 }, { "epoch": 1.29, "learning_rate": 0.00010671287595812131, "loss": 0.01, "step": 497110 }, { "epoch": 1.29, "learning_rate": 0.00010670898774174984, "loss": 0.024, "step": 497120 }, { "epoch": 1.29, "learning_rate": 0.00010670509952537838, "loss": 0.011, "step": 497130 }, { "epoch": 1.29, "learning_rate": 0.00010670121130900691, "loss": 0.0094, "step": 497140 }, { "epoch": 1.29, "learning_rate": 0.00010669732309263546, "loss": 0.0108, "step": 497150 }, { "epoch": 1.29, "learning_rate": 0.00010669343487626398, "loss": 0.0074, "step": 497160 }, { "epoch": 1.29, "learning_rate": 0.00010668954665989253, "loss": 0.0088, "step": 497170 }, { "epoch": 1.29, "learning_rate": 0.00010668565844352106, "loss": 0.0114, "step": 497180 }, { "epoch": 1.29, "learning_rate": 0.0001066817702271496, "loss": 0.0072, "step": 497190 }, { "epoch": 1.29, "learning_rate": 0.00010667788201077813, "loss": 0.0092, "step": 497200 }, { "epoch": 1.29, "learning_rate": 0.00010667399379440666, "loss": 0.0104, "step": 497210 }, { "epoch": 1.29, "learning_rate": 0.0001066701055780352, "loss": 0.0128, "step": 497220 }, { "epoch": 1.29, "learning_rate": 0.00010666621736166373, "loss": 0.0117, "step": 497230 }, { "epoch": 1.29, "learning_rate": 0.00010666232914529227, "loss": 0.0088, "step": 497240 }, { "epoch": 1.29, "learning_rate": 0.0001066584409289208, "loss": 0.0107, "step": 497250 }, { "epoch": 1.29, "learning_rate": 0.00010665455271254934, "loss": 0.0105, "step": 497260 }, { "epoch": 1.29, "learning_rate": 0.00010665066449617787, "loss": 0.0089, "step": 497270 }, { "epoch": 1.29, "learning_rate": 0.00010664677627980641, "loss": 0.0091, "step": 497280 }, { "epoch": 1.29, "learning_rate": 0.00010664288806343494, "loss": 0.0094, "step": 497290 }, { "epoch": 1.29, "learning_rate": 0.00010663899984706348, "loss": 0.0107, "step": 497300 }, { "epoch": 1.29, "learning_rate": 0.000106635111630692, "loss": 0.0105, "step": 497310 }, { "epoch": 1.29, "learning_rate": 0.00010663122341432055, "loss": 0.0134, "step": 497320 }, { "epoch": 1.29, "learning_rate": 0.00010662733519794908, "loss": 0.0085, "step": 497330 }, { "epoch": 1.29, "learning_rate": 0.00010662344698157763, "loss": 0.0091, "step": 497340 }, { "epoch": 1.29, "learning_rate": 0.00010661955876520616, "loss": 0.0109, "step": 497350 }, { "epoch": 1.29, "learning_rate": 0.0001066156705488347, "loss": 0.0122, "step": 497360 }, { "epoch": 1.29, "learning_rate": 0.00010661178233246323, "loss": 0.0096, "step": 497370 }, { "epoch": 1.29, "learning_rate": 0.00010660789411609177, "loss": 0.0124, "step": 497380 }, { "epoch": 1.29, "learning_rate": 0.0001066040058997203, "loss": 0.0126, "step": 497390 }, { "epoch": 1.29, "learning_rate": 0.00010660011768334884, "loss": 0.0088, "step": 497400 }, { "epoch": 1.29, "learning_rate": 0.00010659622946697737, "loss": 0.0094, "step": 497410 }, { "epoch": 1.29, "learning_rate": 0.00010659234125060591, "loss": 0.0132, "step": 497420 }, { "epoch": 1.29, "learning_rate": 0.00010658845303423444, "loss": 0.0093, "step": 497430 }, { "epoch": 1.29, "learning_rate": 0.00010658456481786298, "loss": 0.0119, "step": 497440 }, { "epoch": 1.29, "learning_rate": 0.00010658067660149151, "loss": 0.0106, "step": 497450 }, { "epoch": 1.29, "learning_rate": 0.00010657678838512004, "loss": 0.008, "step": 497460 }, { "epoch": 1.29, "learning_rate": 0.00010657290016874858, "loss": 0.0126, "step": 497470 }, { "epoch": 1.29, "learning_rate": 0.0001065690119523771, "loss": 0.0118, "step": 497480 }, { "epoch": 1.29, "learning_rate": 0.00010656512373600565, "loss": 0.0107, "step": 497490 }, { "epoch": 1.29, "learning_rate": 0.00010656123551963418, "loss": 0.0111, "step": 497500 }, { "epoch": 1.29, "learning_rate": 0.00010655734730326273, "loss": 0.0104, "step": 497510 }, { "epoch": 1.29, "learning_rate": 0.00010655345908689125, "loss": 0.0101, "step": 497520 }, { "epoch": 1.29, "learning_rate": 0.0001065495708705198, "loss": 0.0111, "step": 497530 }, { "epoch": 1.29, "learning_rate": 0.00010654568265414833, "loss": 0.0109, "step": 497540 }, { "epoch": 1.29, "learning_rate": 0.00010654179443777687, "loss": 0.0082, "step": 497550 }, { "epoch": 1.29, "learning_rate": 0.0001065379062214054, "loss": 0.0094, "step": 497560 }, { "epoch": 1.29, "learning_rate": 0.00010653401800503394, "loss": 0.0098, "step": 497570 }, { "epoch": 1.29, "learning_rate": 0.00010653012978866247, "loss": 0.0154, "step": 497580 }, { "epoch": 1.29, "learning_rate": 0.00010652624157229101, "loss": 0.0121, "step": 497590 }, { "epoch": 1.29, "learning_rate": 0.00010652235335591954, "loss": 0.0124, "step": 497600 }, { "epoch": 1.29, "learning_rate": 0.00010651846513954808, "loss": 0.0085, "step": 497610 }, { "epoch": 1.29, "learning_rate": 0.00010651457692317661, "loss": 0.0077, "step": 497620 }, { "epoch": 1.29, "learning_rate": 0.00010651068870680515, "loss": 0.0105, "step": 497630 }, { "epoch": 1.29, "learning_rate": 0.00010650680049043368, "loss": 0.0107, "step": 497640 }, { "epoch": 1.29, "learning_rate": 0.00010650291227406222, "loss": 0.0113, "step": 497650 }, { "epoch": 1.29, "learning_rate": 0.00010649902405769075, "loss": 0.0109, "step": 497660 }, { "epoch": 1.29, "learning_rate": 0.0001064951358413193, "loss": 0.0105, "step": 497670 }, { "epoch": 1.29, "learning_rate": 0.00010649124762494782, "loss": 0.0097, "step": 497680 }, { "epoch": 1.29, "learning_rate": 0.00010648735940857637, "loss": 0.0099, "step": 497690 }, { "epoch": 1.29, "learning_rate": 0.0001064834711922049, "loss": 0.0098, "step": 497700 }, { "epoch": 1.29, "learning_rate": 0.00010647958297583343, "loss": 0.0091, "step": 497710 }, { "epoch": 1.29, "learning_rate": 0.00010647569475946197, "loss": 0.0095, "step": 497720 }, { "epoch": 1.29, "learning_rate": 0.0001064718065430905, "loss": 0.0151, "step": 497730 }, { "epoch": 1.29, "learning_rate": 0.00010646791832671904, "loss": 0.0129, "step": 497740 }, { "epoch": 1.29, "learning_rate": 0.00010646403011034757, "loss": 0.0085, "step": 497750 }, { "epoch": 1.29, "learning_rate": 0.00010646014189397611, "loss": 0.0123, "step": 497760 }, { "epoch": 1.29, "learning_rate": 0.00010645625367760464, "loss": 0.0091, "step": 497770 }, { "epoch": 1.29, "learning_rate": 0.00010645236546123318, "loss": 0.0091, "step": 497780 }, { "epoch": 1.29, "learning_rate": 0.00010644847724486171, "loss": 0.0086, "step": 497790 }, { "epoch": 1.29, "learning_rate": 0.00010644458902849025, "loss": 0.008, "step": 497800 }, { "epoch": 1.29, "learning_rate": 0.00010644070081211878, "loss": 0.0093, "step": 497810 }, { "epoch": 1.29, "learning_rate": 0.00010643681259574732, "loss": 0.0064, "step": 497820 }, { "epoch": 1.29, "learning_rate": 0.00010643292437937585, "loss": 0.0117, "step": 497830 }, { "epoch": 1.29, "learning_rate": 0.00010642903616300439, "loss": 0.0109, "step": 497840 }, { "epoch": 1.29, "learning_rate": 0.00010642514794663292, "loss": 0.0098, "step": 497850 }, { "epoch": 1.29, "learning_rate": 0.00010642125973026147, "loss": 0.0084, "step": 497860 }, { "epoch": 1.29, "learning_rate": 0.00010641737151389, "loss": 0.0085, "step": 497870 }, { "epoch": 1.29, "learning_rate": 0.00010641348329751854, "loss": 0.0117, "step": 497880 }, { "epoch": 1.29, "learning_rate": 0.00010640959508114707, "loss": 0.0088, "step": 497890 }, { "epoch": 1.29, "learning_rate": 0.00010640570686477561, "loss": 0.0092, "step": 497900 }, { "epoch": 1.29, "learning_rate": 0.00010640181864840414, "loss": 0.0115, "step": 497910 }, { "epoch": 1.29, "learning_rate": 0.00010639793043203268, "loss": 0.0121, "step": 497920 }, { "epoch": 1.29, "learning_rate": 0.00010639404221566121, "loss": 0.0092, "step": 497930 }, { "epoch": 1.29, "learning_rate": 0.00010639015399928975, "loss": 0.0122, "step": 497940 }, { "epoch": 1.29, "learning_rate": 0.00010638626578291828, "loss": 0.0075, "step": 497950 }, { "epoch": 1.29, "learning_rate": 0.0001063823775665468, "loss": 0.0114, "step": 497960 }, { "epoch": 1.29, "learning_rate": 0.00010637848935017535, "loss": 0.0096, "step": 497970 }, { "epoch": 1.29, "learning_rate": 0.00010637460113380388, "loss": 0.0102, "step": 497980 }, { "epoch": 1.29, "learning_rate": 0.00010637071291743242, "loss": 0.0128, "step": 497990 }, { "epoch": 1.29, "learning_rate": 0.00010636682470106095, "loss": 0.0096, "step": 498000 }, { "epoch": 1.29, "eval_cer": 0.8816802921322209, "eval_loss": 0.0066691674292087555, "eval_runtime": 108.0801, "eval_samples_per_second": 18.505, "eval_steps_per_second": 4.626, "step": 498000 }, { "epoch": 1.29, "learning_rate": 0.00010636293648468949, "loss": 0.0116, "step": 498010 }, { "epoch": 1.29, "learning_rate": 0.00010635904826831802, "loss": 0.0074, "step": 498020 }, { "epoch": 1.29, "learning_rate": 0.00010635516005194657, "loss": 0.0088, "step": 498030 }, { "epoch": 1.29, "learning_rate": 0.00010635127183557509, "loss": 0.0076, "step": 498040 }, { "epoch": 1.29, "learning_rate": 0.00010634738361920364, "loss": 0.0083, "step": 498050 }, { "epoch": 1.29, "learning_rate": 0.00010634349540283217, "loss": 0.0153, "step": 498060 }, { "epoch": 1.29, "learning_rate": 0.00010633960718646071, "loss": 0.011, "step": 498070 }, { "epoch": 1.29, "learning_rate": 0.00010633571897008924, "loss": 0.0111, "step": 498080 }, { "epoch": 1.29, "learning_rate": 0.00010633183075371778, "loss": 0.0111, "step": 498090 }, { "epoch": 1.29, "learning_rate": 0.00010632794253734631, "loss": 0.0113, "step": 498100 }, { "epoch": 1.29, "learning_rate": 0.00010632405432097485, "loss": 0.0134, "step": 498110 }, { "epoch": 1.29, "learning_rate": 0.00010632016610460338, "loss": 0.016, "step": 498120 }, { "epoch": 1.29, "learning_rate": 0.00010631627788823192, "loss": 0.0103, "step": 498130 }, { "epoch": 1.29, "learning_rate": 0.00010631238967186045, "loss": 0.0112, "step": 498140 }, { "epoch": 1.29, "learning_rate": 0.00010630850145548899, "loss": 0.0106, "step": 498150 }, { "epoch": 1.29, "learning_rate": 0.00010630461323911752, "loss": 0.0065, "step": 498160 }, { "epoch": 1.29, "learning_rate": 0.00010630072502274606, "loss": 0.0101, "step": 498170 }, { "epoch": 1.29, "learning_rate": 0.00010629683680637459, "loss": 0.0105, "step": 498180 }, { "epoch": 1.29, "learning_rate": 0.00010629294859000314, "loss": 0.0108, "step": 498190 }, { "epoch": 1.29, "learning_rate": 0.00010628906037363166, "loss": 0.0082, "step": 498200 }, { "epoch": 1.29, "learning_rate": 0.00010628517215726018, "loss": 0.0092, "step": 498210 }, { "epoch": 1.29, "learning_rate": 0.00010628128394088874, "loss": 0.01, "step": 498220 }, { "epoch": 1.29, "learning_rate": 0.00010627739572451727, "loss": 0.0104, "step": 498230 }, { "epoch": 1.29, "learning_rate": 0.00010627350750814581, "loss": 0.0109, "step": 498240 }, { "epoch": 1.29, "learning_rate": 0.00010626961929177434, "loss": 0.0088, "step": 498250 }, { "epoch": 1.29, "learning_rate": 0.00010626573107540288, "loss": 0.0097, "step": 498260 }, { "epoch": 1.29, "learning_rate": 0.00010626184285903141, "loss": 0.0098, "step": 498270 }, { "epoch": 1.29, "learning_rate": 0.00010625795464265995, "loss": 0.0096, "step": 498280 }, { "epoch": 1.29, "learning_rate": 0.00010625406642628848, "loss": 0.0103, "step": 498290 }, { "epoch": 1.29, "learning_rate": 0.00010625017820991702, "loss": 0.012, "step": 498300 }, { "epoch": 1.29, "learning_rate": 0.00010624628999354555, "loss": 0.0104, "step": 498310 }, { "epoch": 1.29, "learning_rate": 0.00010624240177717409, "loss": 0.0114, "step": 498320 }, { "epoch": 1.29, "learning_rate": 0.00010623851356080262, "loss": 0.0084, "step": 498330 }, { "epoch": 1.29, "learning_rate": 0.00010623462534443116, "loss": 0.0129, "step": 498340 }, { "epoch": 1.29, "learning_rate": 0.00010623073712805969, "loss": 0.0117, "step": 498350 }, { "epoch": 1.29, "learning_rate": 0.00010622684891168823, "loss": 0.0112, "step": 498360 }, { "epoch": 1.29, "learning_rate": 0.00010622296069531676, "loss": 0.0125, "step": 498370 }, { "epoch": 1.29, "learning_rate": 0.00010621907247894531, "loss": 0.0104, "step": 498380 }, { "epoch": 1.29, "learning_rate": 0.00010621518426257384, "loss": 0.0122, "step": 498390 }, { "epoch": 1.29, "learning_rate": 0.00010621129604620238, "loss": 0.0116, "step": 498400 }, { "epoch": 1.29, "learning_rate": 0.00010620740782983091, "loss": 0.0092, "step": 498410 }, { "epoch": 1.29, "learning_rate": 0.00010620351961345945, "loss": 0.0103, "step": 498420 }, { "epoch": 1.29, "learning_rate": 0.00010619963139708798, "loss": 0.0108, "step": 498430 }, { "epoch": 1.29, "learning_rate": 0.00010619574318071652, "loss": 0.0083, "step": 498440 }, { "epoch": 1.29, "learning_rate": 0.00010619185496434505, "loss": 0.0107, "step": 498450 }, { "epoch": 1.29, "learning_rate": 0.00010618796674797358, "loss": 0.0098, "step": 498460 }, { "epoch": 1.29, "learning_rate": 0.00010618407853160212, "loss": 0.0102, "step": 498470 }, { "epoch": 1.29, "learning_rate": 0.00010618019031523065, "loss": 0.0091, "step": 498480 }, { "epoch": 1.29, "learning_rate": 0.00010617630209885919, "loss": 0.0104, "step": 498490 }, { "epoch": 1.29, "learning_rate": 0.00010617241388248772, "loss": 0.0105, "step": 498500 }, { "epoch": 1.29, "learning_rate": 0.00010616852566611626, "loss": 0.012, "step": 498510 }, { "epoch": 1.29, "learning_rate": 0.00010616463744974479, "loss": 0.0097, "step": 498520 }, { "epoch": 1.29, "learning_rate": 0.00010616074923337333, "loss": 0.0135, "step": 498530 }, { "epoch": 1.29, "learning_rate": 0.00010615686101700186, "loss": 0.0111, "step": 498540 }, { "epoch": 1.29, "learning_rate": 0.0001061529728006304, "loss": 0.0118, "step": 498550 }, { "epoch": 1.29, "learning_rate": 0.00010614908458425893, "loss": 0.0097, "step": 498560 }, { "epoch": 1.29, "learning_rate": 0.00010614519636788748, "loss": 0.0099, "step": 498570 }, { "epoch": 1.29, "learning_rate": 0.00010614130815151601, "loss": 0.0139, "step": 498580 }, { "epoch": 1.29, "learning_rate": 0.00010613741993514455, "loss": 0.0133, "step": 498590 }, { "epoch": 1.29, "learning_rate": 0.00010613353171877308, "loss": 0.0138, "step": 498600 }, { "epoch": 1.29, "learning_rate": 0.00010612964350240162, "loss": 0.0097, "step": 498610 }, { "epoch": 1.29, "learning_rate": 0.00010612575528603015, "loss": 0.0084, "step": 498620 }, { "epoch": 1.29, "learning_rate": 0.00010612186706965869, "loss": 0.0085, "step": 498630 }, { "epoch": 1.29, "learning_rate": 0.00010611797885328722, "loss": 0.0107, "step": 498640 }, { "epoch": 1.29, "learning_rate": 0.00010611409063691576, "loss": 0.0094, "step": 498650 }, { "epoch": 1.29, "learning_rate": 0.00010611020242054429, "loss": 0.0112, "step": 498660 }, { "epoch": 1.29, "learning_rate": 0.00010610631420417283, "loss": 0.009, "step": 498670 }, { "epoch": 1.29, "learning_rate": 0.00010610242598780136, "loss": 0.0077, "step": 498680 }, { "epoch": 1.29, "learning_rate": 0.0001060985377714299, "loss": 0.0099, "step": 498690 }, { "epoch": 1.29, "learning_rate": 0.00010609464955505843, "loss": 0.0135, "step": 498700 }, { "epoch": 1.29, "learning_rate": 0.00010609076133868695, "loss": 0.0118, "step": 498710 }, { "epoch": 1.29, "learning_rate": 0.0001060868731223155, "loss": 0.0094, "step": 498720 }, { "epoch": 1.29, "learning_rate": 0.00010608298490594402, "loss": 0.015, "step": 498730 }, { "epoch": 1.29, "learning_rate": 0.00010607909668957258, "loss": 0.01, "step": 498740 }, { "epoch": 1.29, "learning_rate": 0.0001060752084732011, "loss": 0.0088, "step": 498750 }, { "epoch": 1.29, "learning_rate": 0.00010607132025682965, "loss": 0.0102, "step": 498760 }, { "epoch": 1.29, "learning_rate": 0.00010606743204045818, "loss": 0.0114, "step": 498770 }, { "epoch": 1.29, "learning_rate": 0.00010606354382408672, "loss": 0.0105, "step": 498780 }, { "epoch": 1.29, "learning_rate": 0.00010605965560771525, "loss": 0.0139, "step": 498790 }, { "epoch": 1.29, "learning_rate": 0.00010605576739134379, "loss": 0.0105, "step": 498800 }, { "epoch": 1.29, "learning_rate": 0.00010605187917497232, "loss": 0.0109, "step": 498810 }, { "epoch": 1.29, "learning_rate": 0.00010604799095860086, "loss": 0.0125, "step": 498820 }, { "epoch": 1.29, "learning_rate": 0.00010604410274222939, "loss": 0.0097, "step": 498830 }, { "epoch": 1.29, "learning_rate": 0.00010604021452585793, "loss": 0.0115, "step": 498840 }, { "epoch": 1.29, "learning_rate": 0.00010603632630948646, "loss": 0.011, "step": 498850 }, { "epoch": 1.29, "learning_rate": 0.000106032438093115, "loss": 0.0103, "step": 498860 }, { "epoch": 1.29, "learning_rate": 0.00010602854987674353, "loss": 0.0106, "step": 498870 }, { "epoch": 1.29, "learning_rate": 0.00010602466166037207, "loss": 0.0089, "step": 498880 }, { "epoch": 1.29, "learning_rate": 0.0001060207734440006, "loss": 0.0096, "step": 498890 }, { "epoch": 1.29, "learning_rate": 0.00010601688522762915, "loss": 0.0126, "step": 498900 }, { "epoch": 1.29, "learning_rate": 0.00010601299701125767, "loss": 0.0119, "step": 498910 }, { "epoch": 1.29, "learning_rate": 0.00010600910879488622, "loss": 0.0086, "step": 498920 }, { "epoch": 1.29, "learning_rate": 0.00010600522057851475, "loss": 0.0106, "step": 498930 }, { "epoch": 1.29, "learning_rate": 0.00010600133236214329, "loss": 0.0085, "step": 498940 }, { "epoch": 1.29, "learning_rate": 0.00010599744414577182, "loss": 0.0095, "step": 498950 }, { "epoch": 1.29, "learning_rate": 0.00010599355592940035, "loss": 0.0088, "step": 498960 }, { "epoch": 1.29, "learning_rate": 0.00010598966771302889, "loss": 0.0081, "step": 498970 }, { "epoch": 1.29, "learning_rate": 0.00010598577949665742, "loss": 0.0107, "step": 498980 }, { "epoch": 1.29, "learning_rate": 0.00010598189128028596, "loss": 0.0129, "step": 498990 }, { "epoch": 1.29, "learning_rate": 0.00010597800306391449, "loss": 0.0127, "step": 499000 }, { "epoch": 1.29, "eval_cer": 0.8816467008458005, "eval_loss": 0.006797228939831257, "eval_runtime": 108.108, "eval_samples_per_second": 18.5, "eval_steps_per_second": 4.625, "step": 499000 }, { "epoch": 1.29, "learning_rate": 0.00010597411484754303, "loss": 0.011, "step": 499010 }, { "epoch": 1.29, "learning_rate": 0.00010597022663117156, "loss": 0.0117, "step": 499020 }, { "epoch": 1.29, "learning_rate": 0.0001059663384148001, "loss": 0.0096, "step": 499030 }, { "epoch": 1.29, "learning_rate": 0.00010596245019842863, "loss": 0.0089, "step": 499040 }, { "epoch": 1.29, "learning_rate": 0.00010595856198205717, "loss": 0.0096, "step": 499050 }, { "epoch": 1.29, "learning_rate": 0.0001059546737656857, "loss": 0.0102, "step": 499060 }, { "epoch": 1.29, "learning_rate": 0.00010595078554931424, "loss": 0.0096, "step": 499070 }, { "epoch": 1.29, "learning_rate": 0.00010594689733294276, "loss": 0.0119, "step": 499080 }, { "epoch": 1.29, "learning_rate": 0.00010594300911657132, "loss": 0.0077, "step": 499090 }, { "epoch": 1.29, "learning_rate": 0.00010593912090019985, "loss": 0.01, "step": 499100 }, { "epoch": 1.29, "learning_rate": 0.00010593523268382839, "loss": 0.0111, "step": 499110 }, { "epoch": 1.29, "learning_rate": 0.00010593134446745692, "loss": 0.0111, "step": 499120 }, { "epoch": 1.29, "learning_rate": 0.00010592745625108546, "loss": 0.0084, "step": 499130 }, { "epoch": 1.29, "learning_rate": 0.00010592356803471399, "loss": 0.0091, "step": 499140 }, { "epoch": 1.29, "learning_rate": 0.00010591967981834253, "loss": 0.0127, "step": 499150 }, { "epoch": 1.29, "learning_rate": 0.00010591579160197106, "loss": 0.0105, "step": 499160 }, { "epoch": 1.29, "learning_rate": 0.0001059119033855996, "loss": 0.0111, "step": 499170 }, { "epoch": 1.29, "learning_rate": 0.00010590801516922813, "loss": 0.0137, "step": 499180 }, { "epoch": 1.29, "learning_rate": 0.00010590412695285667, "loss": 0.0119, "step": 499190 }, { "epoch": 1.29, "learning_rate": 0.0001059002387364852, "loss": 0.0086, "step": 499200 }, { "epoch": 1.29, "learning_rate": 0.00010589635052011372, "loss": 0.0134, "step": 499210 }, { "epoch": 1.29, "learning_rate": 0.00010589246230374227, "loss": 0.0103, "step": 499220 }, { "epoch": 1.29, "learning_rate": 0.0001058885740873708, "loss": 0.0083, "step": 499230 }, { "epoch": 1.29, "learning_rate": 0.00010588468587099934, "loss": 0.0098, "step": 499240 }, { "epoch": 1.29, "learning_rate": 0.00010588079765462786, "loss": 0.0113, "step": 499250 }, { "epoch": 1.29, "learning_rate": 0.00010587690943825642, "loss": 0.0101, "step": 499260 }, { "epoch": 1.29, "learning_rate": 0.00010587302122188493, "loss": 0.0085, "step": 499270 }, { "epoch": 1.29, "learning_rate": 0.00010586913300551349, "loss": 0.0101, "step": 499280 }, { "epoch": 1.29, "learning_rate": 0.00010586524478914202, "loss": 0.0098, "step": 499290 }, { "epoch": 1.29, "learning_rate": 0.00010586135657277056, "loss": 0.0124, "step": 499300 }, { "epoch": 1.29, "learning_rate": 0.00010585746835639909, "loss": 0.01, "step": 499310 }, { "epoch": 1.29, "learning_rate": 0.00010585358014002763, "loss": 0.0095, "step": 499320 }, { "epoch": 1.29, "learning_rate": 0.00010584969192365616, "loss": 0.0089, "step": 499330 }, { "epoch": 1.29, "learning_rate": 0.0001058458037072847, "loss": 0.0095, "step": 499340 }, { "epoch": 1.29, "learning_rate": 0.00010584191549091323, "loss": 0.0089, "step": 499350 }, { "epoch": 1.29, "learning_rate": 0.00010583802727454177, "loss": 0.0083, "step": 499360 }, { "epoch": 1.29, "learning_rate": 0.0001058341390581703, "loss": 0.0085, "step": 499370 }, { "epoch": 1.29, "learning_rate": 0.00010583025084179884, "loss": 0.0094, "step": 499380 }, { "epoch": 1.29, "learning_rate": 0.00010582636262542737, "loss": 0.0106, "step": 499390 }, { "epoch": 1.29, "learning_rate": 0.00010582247440905591, "loss": 0.0128, "step": 499400 }, { "epoch": 1.29, "learning_rate": 0.00010581858619268444, "loss": 0.008, "step": 499410 }, { "epoch": 1.29, "learning_rate": 0.00010581469797631299, "loss": 0.0118, "step": 499420 }, { "epoch": 1.29, "learning_rate": 0.0001058108097599415, "loss": 0.0124, "step": 499430 }, { "epoch": 1.29, "learning_rate": 0.00010580692154357003, "loss": 0.0083, "step": 499440 }, { "epoch": 1.29, "learning_rate": 0.00010580303332719859, "loss": 0.0074, "step": 499450 }, { "epoch": 1.29, "learning_rate": 0.00010579914511082712, "loss": 0.009, "step": 499460 }, { "epoch": 1.29, "learning_rate": 0.00010579525689445566, "loss": 0.0092, "step": 499470 }, { "epoch": 1.29, "learning_rate": 0.00010579136867808419, "loss": 0.0126, "step": 499480 }, { "epoch": 1.29, "learning_rate": 0.00010578748046171273, "loss": 0.0093, "step": 499490 }, { "epoch": 1.29, "learning_rate": 0.00010578359224534126, "loss": 0.0138, "step": 499500 }, { "epoch": 1.29, "learning_rate": 0.0001057797040289698, "loss": 0.0097, "step": 499510 }, { "epoch": 1.29, "learning_rate": 0.00010577581581259833, "loss": 0.0082, "step": 499520 }, { "epoch": 1.29, "learning_rate": 0.00010577192759622687, "loss": 0.0108, "step": 499530 }, { "epoch": 1.29, "learning_rate": 0.0001057680393798554, "loss": 0.0114, "step": 499540 }, { "epoch": 1.29, "learning_rate": 0.00010576415116348394, "loss": 0.0112, "step": 499550 }, { "epoch": 1.29, "learning_rate": 0.00010576026294711247, "loss": 0.0108, "step": 499560 }, { "epoch": 1.29, "learning_rate": 0.00010575637473074101, "loss": 0.0093, "step": 499570 }, { "epoch": 1.29, "learning_rate": 0.00010575248651436954, "loss": 0.0093, "step": 499580 }, { "epoch": 1.3, "learning_rate": 0.00010574859829799808, "loss": 0.0094, "step": 499590 }, { "epoch": 1.3, "learning_rate": 0.0001057447100816266, "loss": 0.0101, "step": 499600 }, { "epoch": 1.3, "learning_rate": 0.00010574082186525516, "loss": 0.007, "step": 499610 }, { "epoch": 1.3, "learning_rate": 0.00010573693364888369, "loss": 0.0096, "step": 499620 }, { "epoch": 1.3, "learning_rate": 0.00010573304543251223, "loss": 0.0084, "step": 499630 }, { "epoch": 1.3, "learning_rate": 0.00010572915721614076, "loss": 0.0071, "step": 499640 }, { "epoch": 1.3, "learning_rate": 0.0001057252689997693, "loss": 0.0102, "step": 499650 }, { "epoch": 1.3, "learning_rate": 0.00010572138078339783, "loss": 0.0114, "step": 499660 }, { "epoch": 1.3, "learning_rate": 0.00010571749256702637, "loss": 0.0108, "step": 499670 }, { "epoch": 1.3, "learning_rate": 0.0001057136043506549, "loss": 0.0093, "step": 499680 }, { "epoch": 1.3, "learning_rate": 0.00010570971613428343, "loss": 0.0112, "step": 499690 }, { "epoch": 1.3, "learning_rate": 0.00010570582791791197, "loss": 0.0078, "step": 499700 }, { "epoch": 1.3, "learning_rate": 0.0001057019397015405, "loss": 0.0098, "step": 499710 }, { "epoch": 1.3, "learning_rate": 0.00010569805148516904, "loss": 0.0111, "step": 499720 }, { "epoch": 1.3, "learning_rate": 0.00010569416326879756, "loss": 0.0096, "step": 499730 }, { "epoch": 1.3, "learning_rate": 0.0001056902750524261, "loss": 0.0115, "step": 499740 }, { "epoch": 1.3, "learning_rate": 0.00010568638683605463, "loss": 0.0062, "step": 499750 }, { "epoch": 1.3, "learning_rate": 0.00010568249861968318, "loss": 0.0081, "step": 499760 }, { "epoch": 1.3, "learning_rate": 0.0001056786104033117, "loss": 0.0132, "step": 499770 }, { "epoch": 1.3, "learning_rate": 0.00010567472218694025, "loss": 0.013, "step": 499780 }, { "epoch": 1.3, "learning_rate": 0.00010567083397056877, "loss": 0.0087, "step": 499790 }, { "epoch": 1.3, "learning_rate": 0.00010566694575419733, "loss": 0.0095, "step": 499800 }, { "epoch": 1.3, "learning_rate": 0.00010566305753782586, "loss": 0.0075, "step": 499810 }, { "epoch": 1.3, "learning_rate": 0.0001056591693214544, "loss": 0.0078, "step": 499820 }, { "epoch": 1.3, "learning_rate": 0.00010565528110508293, "loss": 0.0104, "step": 499830 }, { "epoch": 1.3, "learning_rate": 0.00010565139288871147, "loss": 0.0121, "step": 499840 }, { "epoch": 1.3, "learning_rate": 0.00010564750467234, "loss": 0.0106, "step": 499850 }, { "epoch": 1.3, "learning_rate": 0.00010564361645596854, "loss": 0.0132, "step": 499860 }, { "epoch": 1.3, "learning_rate": 0.00010563972823959707, "loss": 0.0079, "step": 499870 }, { "epoch": 1.3, "learning_rate": 0.00010563584002322561, "loss": 0.0106, "step": 499880 }, { "epoch": 1.3, "learning_rate": 0.00010563195180685414, "loss": 0.0101, "step": 499890 }, { "epoch": 1.3, "learning_rate": 0.00010562806359048268, "loss": 0.0104, "step": 499900 }, { "epoch": 1.3, "learning_rate": 0.0001056241753741112, "loss": 0.0111, "step": 499910 }, { "epoch": 1.3, "learning_rate": 0.00010562028715773975, "loss": 0.0105, "step": 499920 }, { "epoch": 1.3, "learning_rate": 0.00010561639894136828, "loss": 0.0103, "step": 499930 }, { "epoch": 1.3, "learning_rate": 0.0001056125107249968, "loss": 0.0106, "step": 499940 }, { "epoch": 1.3, "learning_rate": 0.00010560862250862535, "loss": 0.0145, "step": 499950 }, { "epoch": 1.3, "learning_rate": 0.00010560473429225387, "loss": 0.0126, "step": 499960 }, { "epoch": 1.3, "learning_rate": 0.00010560084607588243, "loss": 0.0132, "step": 499970 }, { "epoch": 1.3, "learning_rate": 0.00010559695785951096, "loss": 0.0125, "step": 499980 }, { "epoch": 1.3, "learning_rate": 0.0001055930696431395, "loss": 0.0102, "step": 499990 }, { "epoch": 1.3, "learning_rate": 0.00010558918142676803, "loss": 0.0084, "step": 500000 }, { "epoch": 1.3, "eval_cer": 0.8816704946736816, "eval_loss": 0.006844638846814632, "eval_runtime": 107.9782, "eval_samples_per_second": 18.522, "eval_steps_per_second": 4.631, "step": 500000 }, { "epoch": 1.3, "learning_rate": 0.00010558529321039657, "loss": 0.0109, "step": 500010 }, { "epoch": 1.3, "learning_rate": 0.0001055814049940251, "loss": 0.0125, "step": 500020 }, { "epoch": 1.3, "learning_rate": 0.00010557751677765364, "loss": 0.0096, "step": 500030 }, { "epoch": 1.3, "learning_rate": 0.00010557362856128217, "loss": 0.0089, "step": 500040 }, { "epoch": 1.3, "learning_rate": 0.00010556974034491071, "loss": 0.0113, "step": 500050 }, { "epoch": 1.3, "learning_rate": 0.00010556585212853924, "loss": 0.0097, "step": 500060 }, { "epoch": 1.3, "learning_rate": 0.00010556196391216778, "loss": 0.0098, "step": 500070 }, { "epoch": 1.3, "learning_rate": 0.0001055580756957963, "loss": 0.0094, "step": 500080 }, { "epoch": 1.3, "learning_rate": 0.00010555418747942485, "loss": 0.0122, "step": 500090 }, { "epoch": 1.3, "learning_rate": 0.00010555029926305338, "loss": 0.0096, "step": 500100 }, { "epoch": 1.3, "learning_rate": 0.00010554641104668192, "loss": 0.0077, "step": 500110 }, { "epoch": 1.3, "learning_rate": 0.00010554252283031044, "loss": 0.0099, "step": 500120 }, { "epoch": 1.3, "learning_rate": 0.000105538634613939, "loss": 0.01, "step": 500130 }, { "epoch": 1.3, "learning_rate": 0.00010553474639756751, "loss": 0.0127, "step": 500140 }, { "epoch": 1.3, "learning_rate": 0.00010553085818119607, "loss": 0.01, "step": 500150 }, { "epoch": 1.3, "learning_rate": 0.0001055269699648246, "loss": 0.0094, "step": 500160 }, { "epoch": 1.3, "learning_rate": 0.00010552308174845314, "loss": 0.0077, "step": 500170 }, { "epoch": 1.3, "learning_rate": 0.00010551919353208167, "loss": 0.0128, "step": 500180 }, { "epoch": 1.3, "learning_rate": 0.0001055153053157102, "loss": 0.0099, "step": 500190 }, { "epoch": 1.3, "learning_rate": 0.00010551141709933874, "loss": 0.0079, "step": 500200 }, { "epoch": 1.3, "learning_rate": 0.00010550752888296727, "loss": 0.013, "step": 500210 }, { "epoch": 1.3, "learning_rate": 0.00010550364066659581, "loss": 0.011, "step": 500220 }, { "epoch": 1.3, "learning_rate": 0.00010549975245022434, "loss": 0.0083, "step": 500230 }, { "epoch": 1.3, "learning_rate": 0.00010549586423385288, "loss": 0.011, "step": 500240 }, { "epoch": 1.3, "learning_rate": 0.0001054919760174814, "loss": 0.0077, "step": 500250 }, { "epoch": 1.3, "learning_rate": 0.00010548808780110995, "loss": 0.0109, "step": 500260 }, { "epoch": 1.3, "learning_rate": 0.00010548419958473847, "loss": 0.0102, "step": 500270 }, { "epoch": 1.3, "learning_rate": 0.00010548031136836702, "loss": 0.0095, "step": 500280 }, { "epoch": 1.3, "learning_rate": 0.00010547642315199554, "loss": 0.0123, "step": 500290 }, { "epoch": 1.3, "learning_rate": 0.00010547253493562409, "loss": 0.011, "step": 500300 }, { "epoch": 1.3, "learning_rate": 0.00010546864671925261, "loss": 0.0111, "step": 500310 }, { "epoch": 1.3, "learning_rate": 0.00010546475850288117, "loss": 0.0099, "step": 500320 }, { "epoch": 1.3, "learning_rate": 0.0001054608702865097, "loss": 0.0086, "step": 500330 }, { "epoch": 1.3, "learning_rate": 0.00010545698207013824, "loss": 0.0092, "step": 500340 }, { "epoch": 1.3, "learning_rate": 0.00010545309385376677, "loss": 0.0095, "step": 500350 }, { "epoch": 1.3, "learning_rate": 0.00010544920563739531, "loss": 0.0098, "step": 500360 }, { "epoch": 1.3, "learning_rate": 0.00010544531742102384, "loss": 0.0108, "step": 500370 }, { "epoch": 1.3, "learning_rate": 0.00010544142920465238, "loss": 0.0105, "step": 500380 }, { "epoch": 1.3, "learning_rate": 0.0001054375409882809, "loss": 0.0136, "step": 500390 }, { "epoch": 1.3, "learning_rate": 0.00010543365277190945, "loss": 0.0123, "step": 500400 }, { "epoch": 1.3, "learning_rate": 0.00010542976455553798, "loss": 0.0067, "step": 500410 }, { "epoch": 1.3, "learning_rate": 0.00010542587633916652, "loss": 0.0099, "step": 500420 }, { "epoch": 1.3, "learning_rate": 0.00010542198812279505, "loss": 0.0106, "step": 500430 }, { "epoch": 1.3, "learning_rate": 0.00010541809990642357, "loss": 0.0099, "step": 500440 }, { "epoch": 1.3, "learning_rate": 0.00010541421169005212, "loss": 0.0127, "step": 500450 }, { "epoch": 1.3, "learning_rate": 0.00010541032347368064, "loss": 0.0116, "step": 500460 }, { "epoch": 1.3, "learning_rate": 0.00010540643525730919, "loss": 0.0116, "step": 500470 }, { "epoch": 1.3, "learning_rate": 0.00010540254704093771, "loss": 0.011, "step": 500480 }, { "epoch": 1.3, "learning_rate": 0.00010539865882456627, "loss": 0.0084, "step": 500490 }, { "epoch": 1.3, "learning_rate": 0.00010539477060819478, "loss": 0.0104, "step": 500500 }, { "epoch": 1.3, "learning_rate": 0.00010539088239182334, "loss": 0.0099, "step": 500510 }, { "epoch": 1.3, "learning_rate": 0.00010538699417545187, "loss": 0.0098, "step": 500520 }, { "epoch": 1.3, "learning_rate": 0.00010538310595908041, "loss": 0.0112, "step": 500530 }, { "epoch": 1.3, "learning_rate": 0.00010537921774270894, "loss": 0.0126, "step": 500540 }, { "epoch": 1.3, "learning_rate": 0.00010537532952633748, "loss": 0.0085, "step": 500550 }, { "epoch": 1.3, "learning_rate": 0.000105371441309966, "loss": 0.0126, "step": 500560 }, { "epoch": 1.3, "learning_rate": 0.00010536755309359455, "loss": 0.0088, "step": 500570 }, { "epoch": 1.3, "learning_rate": 0.00010536366487722308, "loss": 0.0141, "step": 500580 }, { "epoch": 1.3, "learning_rate": 0.00010535977666085162, "loss": 0.0113, "step": 500590 }, { "epoch": 1.3, "learning_rate": 0.00010535588844448015, "loss": 0.0109, "step": 500600 }, { "epoch": 1.3, "learning_rate": 0.00010535200022810869, "loss": 0.0133, "step": 500610 }, { "epoch": 1.3, "learning_rate": 0.00010534811201173721, "loss": 0.0102, "step": 500620 }, { "epoch": 1.3, "learning_rate": 0.00010534422379536576, "loss": 0.0086, "step": 500630 }, { "epoch": 1.3, "learning_rate": 0.00010534033557899428, "loss": 0.0124, "step": 500640 }, { "epoch": 1.3, "learning_rate": 0.00010533644736262284, "loss": 0.0112, "step": 500650 }, { "epoch": 1.3, "learning_rate": 0.00010533255914625135, "loss": 0.0096, "step": 500660 }, { "epoch": 1.3, "learning_rate": 0.00010532867092987991, "loss": 0.0114, "step": 500670 }, { "epoch": 1.3, "learning_rate": 0.00010532478271350844, "loss": 0.0112, "step": 500680 }, { "epoch": 1.3, "learning_rate": 0.00010532089449713697, "loss": 0.0105, "step": 500690 }, { "epoch": 1.3, "learning_rate": 0.00010531700628076551, "loss": 0.0094, "step": 500700 }, { "epoch": 1.3, "learning_rate": 0.00010531311806439404, "loss": 0.0086, "step": 500710 }, { "epoch": 1.3, "learning_rate": 0.00010530922984802258, "loss": 0.0118, "step": 500720 }, { "epoch": 1.3, "learning_rate": 0.0001053053416316511, "loss": 0.0108, "step": 500730 }, { "epoch": 1.3, "learning_rate": 0.00010530145341527965, "loss": 0.0118, "step": 500740 }, { "epoch": 1.3, "learning_rate": 0.00010529756519890817, "loss": 0.0084, "step": 500750 }, { "epoch": 1.3, "learning_rate": 0.00010529367698253672, "loss": 0.0105, "step": 500760 }, { "epoch": 1.3, "learning_rate": 0.00010528978876616524, "loss": 0.0104, "step": 500770 }, { "epoch": 1.3, "learning_rate": 0.00010528590054979379, "loss": 0.0124, "step": 500780 }, { "epoch": 1.3, "learning_rate": 0.00010528201233342231, "loss": 0.0106, "step": 500790 }, { "epoch": 1.3, "learning_rate": 0.00010527812411705086, "loss": 0.0108, "step": 500800 }, { "epoch": 1.3, "learning_rate": 0.00010527423590067938, "loss": 0.0101, "step": 500810 }, { "epoch": 1.3, "learning_rate": 0.00010527034768430793, "loss": 0.0156, "step": 500820 }, { "epoch": 1.3, "learning_rate": 0.00010526645946793645, "loss": 0.0085, "step": 500830 }, { "epoch": 1.3, "learning_rate": 0.00010526257125156501, "loss": 0.0102, "step": 500840 }, { "epoch": 1.3, "learning_rate": 0.00010525868303519354, "loss": 0.0099, "step": 500850 }, { "epoch": 1.3, "learning_rate": 0.00010525479481882208, "loss": 0.0102, "step": 500860 }, { "epoch": 1.3, "learning_rate": 0.00010525090660245061, "loss": 0.0096, "step": 500870 }, { "epoch": 1.3, "learning_rate": 0.00010524701838607915, "loss": 0.0093, "step": 500880 }, { "epoch": 1.3, "learning_rate": 0.00010524313016970768, "loss": 0.0103, "step": 500890 }, { "epoch": 1.3, "learning_rate": 0.00010523924195333622, "loss": 0.0117, "step": 500900 }, { "epoch": 1.3, "learning_rate": 0.00010523535373696475, "loss": 0.0115, "step": 500910 }, { "epoch": 1.3, "learning_rate": 0.00010523146552059329, "loss": 0.0101, "step": 500920 }, { "epoch": 1.3, "learning_rate": 0.00010522757730422182, "loss": 0.0117, "step": 500930 }, { "epoch": 1.3, "learning_rate": 0.00010522368908785034, "loss": 0.0111, "step": 500940 }, { "epoch": 1.3, "learning_rate": 0.00010521980087147889, "loss": 0.0111, "step": 500950 }, { "epoch": 1.3, "learning_rate": 0.00010521591265510741, "loss": 0.01, "step": 500960 }, { "epoch": 1.3, "learning_rate": 0.00010521202443873596, "loss": 0.0098, "step": 500970 }, { "epoch": 1.3, "learning_rate": 0.00010520813622236448, "loss": 0.0097, "step": 500980 }, { "epoch": 1.3, "learning_rate": 0.00010520424800599303, "loss": 0.0117, "step": 500990 }, { "epoch": 1.3, "learning_rate": 0.00010520035978962155, "loss": 0.0122, "step": 501000 }, { "epoch": 1.3, "eval_cer": 0.8816956881384969, "eval_loss": 0.0065152887254953384, "eval_runtime": 107.805, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 501000 }, { "epoch": 1.3, "learning_rate": 0.00010519647157325011, "loss": 0.0084, "step": 501010 }, { "epoch": 1.3, "learning_rate": 0.00010519258335687862, "loss": 0.0108, "step": 501020 }, { "epoch": 1.3, "learning_rate": 0.00010518869514050718, "loss": 0.01, "step": 501030 }, { "epoch": 1.3, "learning_rate": 0.0001051848069241357, "loss": 0.0146, "step": 501040 }, { "epoch": 1.3, "learning_rate": 0.00010518091870776425, "loss": 0.0115, "step": 501050 }, { "epoch": 1.3, "learning_rate": 0.00010517703049139278, "loss": 0.0106, "step": 501060 }, { "epoch": 1.3, "learning_rate": 0.00010517314227502132, "loss": 0.0098, "step": 501070 }, { "epoch": 1.3, "learning_rate": 0.00010516925405864985, "loss": 0.0124, "step": 501080 }, { "epoch": 1.3, "learning_rate": 0.00010516536584227839, "loss": 0.0086, "step": 501090 }, { "epoch": 1.3, "learning_rate": 0.00010516147762590692, "loss": 0.008, "step": 501100 }, { "epoch": 1.3, "learning_rate": 0.00010515758940953546, "loss": 0.0105, "step": 501110 }, { "epoch": 1.3, "learning_rate": 0.00010515370119316399, "loss": 0.0118, "step": 501120 }, { "epoch": 1.3, "learning_rate": 0.00010514981297679253, "loss": 0.0119, "step": 501130 }, { "epoch": 1.3, "learning_rate": 0.00010514592476042105, "loss": 0.0084, "step": 501140 }, { "epoch": 1.3, "learning_rate": 0.0001051420365440496, "loss": 0.0113, "step": 501150 }, { "epoch": 1.3, "learning_rate": 0.00010513814832767812, "loss": 0.0083, "step": 501160 }, { "epoch": 1.3, "learning_rate": 0.00010513426011130667, "loss": 0.0116, "step": 501170 }, { "epoch": 1.3, "learning_rate": 0.0001051303718949352, "loss": 0.0102, "step": 501180 }, { "epoch": 1.3, "learning_rate": 0.00010512648367856372, "loss": 0.011, "step": 501190 }, { "epoch": 1.3, "learning_rate": 0.00010512259546219228, "loss": 0.008, "step": 501200 }, { "epoch": 1.3, "learning_rate": 0.0001051187072458208, "loss": 0.0085, "step": 501210 }, { "epoch": 1.3, "learning_rate": 0.00010511481902944935, "loss": 0.0105, "step": 501220 }, { "epoch": 1.3, "learning_rate": 0.00010511093081307788, "loss": 0.0126, "step": 501230 }, { "epoch": 1.3, "learning_rate": 0.00010510704259670642, "loss": 0.0116, "step": 501240 }, { "epoch": 1.3, "learning_rate": 0.00010510315438033495, "loss": 0.0083, "step": 501250 }, { "epoch": 1.3, "learning_rate": 0.00010509926616396349, "loss": 0.0099, "step": 501260 }, { "epoch": 1.3, "learning_rate": 0.00010509537794759201, "loss": 0.0115, "step": 501270 }, { "epoch": 1.3, "learning_rate": 0.00010509148973122056, "loss": 0.0086, "step": 501280 }, { "epoch": 1.3, "learning_rate": 0.00010508760151484908, "loss": 0.0089, "step": 501290 }, { "epoch": 1.3, "learning_rate": 0.00010508371329847763, "loss": 0.0105, "step": 501300 }, { "epoch": 1.3, "learning_rate": 0.00010507982508210615, "loss": 0.009, "step": 501310 }, { "epoch": 1.3, "learning_rate": 0.0001050759368657347, "loss": 0.0099, "step": 501320 }, { "epoch": 1.3, "learning_rate": 0.00010507204864936322, "loss": 0.0118, "step": 501330 }, { "epoch": 1.3, "learning_rate": 0.00010506816043299177, "loss": 0.0126, "step": 501340 }, { "epoch": 1.3, "learning_rate": 0.0001050642722166203, "loss": 0.0077, "step": 501350 }, { "epoch": 1.3, "learning_rate": 0.00010506038400024885, "loss": 0.0099, "step": 501360 }, { "epoch": 1.3, "learning_rate": 0.00010505649578387736, "loss": 0.0088, "step": 501370 }, { "epoch": 1.3, "learning_rate": 0.00010505260756750592, "loss": 0.0087, "step": 501380 }, { "epoch": 1.3, "learning_rate": 0.00010504871935113445, "loss": 0.0088, "step": 501390 }, { "epoch": 1.3, "learning_rate": 0.00010504483113476299, "loss": 0.0084, "step": 501400 }, { "epoch": 1.3, "learning_rate": 0.00010504094291839152, "loss": 0.0068, "step": 501410 }, { "epoch": 1.3, "learning_rate": 0.00010503705470202006, "loss": 0.0103, "step": 501420 }, { "epoch": 1.3, "learning_rate": 0.00010503316648564859, "loss": 0.0088, "step": 501430 }, { "epoch": 1.3, "learning_rate": 0.00010502927826927711, "loss": 0.0127, "step": 501440 }, { "epoch": 1.3, "learning_rate": 0.00010502539005290566, "loss": 0.0101, "step": 501450 }, { "epoch": 1.3, "learning_rate": 0.00010502150183653418, "loss": 0.0135, "step": 501460 }, { "epoch": 1.3, "learning_rate": 0.00010501761362016273, "loss": 0.0108, "step": 501470 }, { "epoch": 1.3, "learning_rate": 0.00010501372540379125, "loss": 0.0091, "step": 501480 }, { "epoch": 1.3, "learning_rate": 0.0001050098371874198, "loss": 0.0091, "step": 501490 }, { "epoch": 1.3, "learning_rate": 0.00010500594897104832, "loss": 0.0094, "step": 501500 }, { "epoch": 1.3, "learning_rate": 0.00010500206075467687, "loss": 0.0084, "step": 501510 }, { "epoch": 1.3, "learning_rate": 0.00010499817253830539, "loss": 0.0117, "step": 501520 }, { "epoch": 1.3, "learning_rate": 0.00010499428432193393, "loss": 0.0085, "step": 501530 }, { "epoch": 1.3, "learning_rate": 0.00010499039610556246, "loss": 0.0105, "step": 501540 }, { "epoch": 1.3, "learning_rate": 0.00010498650788919102, "loss": 0.0085, "step": 501550 }, { "epoch": 1.3, "learning_rate": 0.00010498261967281955, "loss": 0.0085, "step": 501560 }, { "epoch": 1.3, "learning_rate": 0.00010497873145644809, "loss": 0.0097, "step": 501570 }, { "epoch": 1.3, "learning_rate": 0.00010497484324007662, "loss": 0.0085, "step": 501580 }, { "epoch": 1.3, "learning_rate": 0.00010497095502370516, "loss": 0.0126, "step": 501590 }, { "epoch": 1.3, "learning_rate": 0.00010496706680733369, "loss": 0.0092, "step": 501600 }, { "epoch": 1.3, "learning_rate": 0.00010496317859096223, "loss": 0.0085, "step": 501610 }, { "epoch": 1.3, "learning_rate": 0.00010495929037459076, "loss": 0.0077, "step": 501620 }, { "epoch": 1.3, "learning_rate": 0.0001049554021582193, "loss": 0.0108, "step": 501630 }, { "epoch": 1.3, "learning_rate": 0.00010495151394184783, "loss": 0.0121, "step": 501640 }, { "epoch": 1.3, "learning_rate": 0.00010494762572547637, "loss": 0.0107, "step": 501650 }, { "epoch": 1.3, "learning_rate": 0.0001049437375091049, "loss": 0.0123, "step": 501660 }, { "epoch": 1.3, "learning_rate": 0.00010493984929273344, "loss": 0.0105, "step": 501670 }, { "epoch": 1.3, "learning_rate": 0.00010493596107636196, "loss": 0.0099, "step": 501680 }, { "epoch": 1.3, "learning_rate": 0.00010493207285999049, "loss": 0.0125, "step": 501690 }, { "epoch": 1.3, "learning_rate": 0.00010492818464361903, "loss": 0.0102, "step": 501700 }, { "epoch": 1.3, "learning_rate": 0.00010492429642724756, "loss": 0.0081, "step": 501710 }, { "epoch": 1.3, "learning_rate": 0.00010492040821087612, "loss": 0.0108, "step": 501720 }, { "epoch": 1.3, "learning_rate": 0.00010491651999450463, "loss": 0.017, "step": 501730 }, { "epoch": 1.3, "learning_rate": 0.00010491263177813319, "loss": 0.0109, "step": 501740 }, { "epoch": 1.3, "learning_rate": 0.00010490874356176172, "loss": 0.0096, "step": 501750 }, { "epoch": 1.3, "learning_rate": 0.00010490485534539026, "loss": 0.0103, "step": 501760 }, { "epoch": 1.3, "learning_rate": 0.00010490096712901879, "loss": 0.0114, "step": 501770 }, { "epoch": 1.3, "learning_rate": 0.00010489707891264733, "loss": 0.0103, "step": 501780 }, { "epoch": 1.3, "learning_rate": 0.00010489319069627585, "loss": 0.0082, "step": 501790 }, { "epoch": 1.3, "learning_rate": 0.0001048893024799044, "loss": 0.0106, "step": 501800 }, { "epoch": 1.3, "learning_rate": 0.00010488541426353292, "loss": 0.0112, "step": 501810 }, { "epoch": 1.3, "learning_rate": 0.00010488152604716147, "loss": 0.0092, "step": 501820 }, { "epoch": 1.3, "learning_rate": 0.00010487763783079, "loss": 0.0093, "step": 501830 }, { "epoch": 1.3, "learning_rate": 0.00010487374961441854, "loss": 0.0091, "step": 501840 }, { "epoch": 1.3, "learning_rate": 0.00010486986139804706, "loss": 0.0118, "step": 501850 }, { "epoch": 1.3, "learning_rate": 0.0001048659731816756, "loss": 0.0078, "step": 501860 }, { "epoch": 1.3, "learning_rate": 0.00010486208496530413, "loss": 0.0066, "step": 501870 }, { "epoch": 1.3, "learning_rate": 0.00010485819674893269, "loss": 0.0106, "step": 501880 }, { "epoch": 1.3, "learning_rate": 0.0001048543085325612, "loss": 0.0109, "step": 501890 }, { "epoch": 1.3, "learning_rate": 0.00010485042031618976, "loss": 0.0121, "step": 501900 }, { "epoch": 1.3, "learning_rate": 0.00010484653209981829, "loss": 0.0088, "step": 501910 }, { "epoch": 1.3, "learning_rate": 0.00010484264388344681, "loss": 0.0098, "step": 501920 }, { "epoch": 1.3, "learning_rate": 0.00010483875566707536, "loss": 0.01, "step": 501930 }, { "epoch": 1.3, "learning_rate": 0.00010483486745070388, "loss": 0.0083, "step": 501940 }, { "epoch": 1.3, "learning_rate": 0.00010483097923433243, "loss": 0.011, "step": 501950 }, { "epoch": 1.3, "learning_rate": 0.00010482709101796095, "loss": 0.011, "step": 501960 }, { "epoch": 1.3, "learning_rate": 0.0001048232028015895, "loss": 0.0086, "step": 501970 }, { "epoch": 1.3, "learning_rate": 0.00010481931458521802, "loss": 0.0094, "step": 501980 }, { "epoch": 1.3, "learning_rate": 0.00010481542636884657, "loss": 0.0152, "step": 501990 }, { "epoch": 1.3, "learning_rate": 0.0001048115381524751, "loss": 0.0114, "step": 502000 }, { "epoch": 1.3, "eval_cer": 0.8816704946736816, "eval_loss": 0.006790985353291035, "eval_runtime": 107.9811, "eval_samples_per_second": 18.522, "eval_steps_per_second": 4.63, "step": 502000 }, { "epoch": 1.3, "learning_rate": 0.00010480764993610364, "loss": 0.0103, "step": 502010 }, { "epoch": 1.3, "learning_rate": 0.00010480376171973216, "loss": 0.0105, "step": 502020 }, { "epoch": 1.3, "learning_rate": 0.0001047998735033607, "loss": 0.0098, "step": 502030 }, { "epoch": 1.3, "learning_rate": 0.00010479598528698923, "loss": 0.0104, "step": 502040 }, { "epoch": 1.3, "learning_rate": 0.00010479209707061777, "loss": 0.009, "step": 502050 }, { "epoch": 1.3, "learning_rate": 0.0001047882088542463, "loss": 0.0087, "step": 502060 }, { "epoch": 1.3, "learning_rate": 0.00010478432063787486, "loss": 0.0098, "step": 502070 }, { "epoch": 1.3, "learning_rate": 0.00010478043242150339, "loss": 0.0089, "step": 502080 }, { "epoch": 1.3, "learning_rate": 0.00010477654420513193, "loss": 0.0086, "step": 502090 }, { "epoch": 1.3, "learning_rate": 0.00010477265598876046, "loss": 0.0145, "step": 502100 }, { "epoch": 1.3, "learning_rate": 0.000104768767772389, "loss": 0.0072, "step": 502110 }, { "epoch": 1.3, "learning_rate": 0.00010476487955601753, "loss": 0.009, "step": 502120 }, { "epoch": 1.3, "learning_rate": 0.00010476099133964607, "loss": 0.0082, "step": 502130 }, { "epoch": 1.3, "learning_rate": 0.0001047571031232746, "loss": 0.0123, "step": 502140 }, { "epoch": 1.3, "learning_rate": 0.00010475321490690314, "loss": 0.0098, "step": 502150 }, { "epoch": 1.3, "learning_rate": 0.00010474932669053166, "loss": 0.0107, "step": 502160 }, { "epoch": 1.3, "learning_rate": 0.00010474543847416019, "loss": 0.0101, "step": 502170 }, { "epoch": 1.3, "learning_rate": 0.00010474155025778873, "loss": 0.0104, "step": 502180 }, { "epoch": 1.3, "learning_rate": 0.00010473766204141726, "loss": 0.013, "step": 502190 }, { "epoch": 1.3, "learning_rate": 0.0001047337738250458, "loss": 0.0089, "step": 502200 }, { "epoch": 1.3, "learning_rate": 0.00010472988560867433, "loss": 0.0108, "step": 502210 }, { "epoch": 1.3, "learning_rate": 0.00010472599739230287, "loss": 0.0119, "step": 502220 }, { "epoch": 1.3, "learning_rate": 0.0001047221091759314, "loss": 0.009, "step": 502230 }, { "epoch": 1.3, "learning_rate": 0.00010471822095955996, "loss": 0.0118, "step": 502240 }, { "epoch": 1.3, "learning_rate": 0.00010471433274318847, "loss": 0.0121, "step": 502250 }, { "epoch": 1.3, "learning_rate": 0.00010471044452681703, "loss": 0.0085, "step": 502260 }, { "epoch": 1.3, "learning_rate": 0.00010470655631044556, "loss": 0.0124, "step": 502270 }, { "epoch": 1.3, "learning_rate": 0.0001047026680940741, "loss": 0.0105, "step": 502280 }, { "epoch": 1.3, "learning_rate": 0.00010469877987770262, "loss": 0.0106, "step": 502290 }, { "epoch": 1.3, "learning_rate": 0.00010469489166133117, "loss": 0.0119, "step": 502300 }, { "epoch": 1.3, "learning_rate": 0.0001046910034449597, "loss": 0.0099, "step": 502310 }, { "epoch": 1.3, "learning_rate": 0.00010468711522858824, "loss": 0.0085, "step": 502320 }, { "epoch": 1.3, "learning_rate": 0.00010468322701221676, "loss": 0.0082, "step": 502330 }, { "epoch": 1.3, "learning_rate": 0.0001046793387958453, "loss": 0.0123, "step": 502340 }, { "epoch": 1.3, "learning_rate": 0.00010467545057947383, "loss": 0.0113, "step": 502350 }, { "epoch": 1.3, "learning_rate": 0.00010467156236310238, "loss": 0.0102, "step": 502360 }, { "epoch": 1.3, "learning_rate": 0.0001046676741467309, "loss": 0.0111, "step": 502370 }, { "epoch": 1.3, "learning_rate": 0.00010466378593035945, "loss": 0.01, "step": 502380 }, { "epoch": 1.3, "learning_rate": 0.00010465989771398797, "loss": 0.0118, "step": 502390 }, { "epoch": 1.3, "learning_rate": 0.00010465600949761653, "loss": 0.0089, "step": 502400 }, { "epoch": 1.3, "learning_rate": 0.00010465212128124504, "loss": 0.011, "step": 502410 }, { "epoch": 1.3, "learning_rate": 0.00010464823306487357, "loss": 0.0096, "step": 502420 }, { "epoch": 1.3, "learning_rate": 0.00010464434484850213, "loss": 0.0119, "step": 502430 }, { "epoch": 1.3, "learning_rate": 0.00010464045663213065, "loss": 0.0087, "step": 502440 }, { "epoch": 1.3, "learning_rate": 0.0001046365684157592, "loss": 0.0103, "step": 502450 }, { "epoch": 1.3, "learning_rate": 0.00010463268019938772, "loss": 0.0089, "step": 502460 }, { "epoch": 1.3, "learning_rate": 0.00010462879198301627, "loss": 0.0117, "step": 502470 }, { "epoch": 1.3, "learning_rate": 0.0001046249037666448, "loss": 0.0089, "step": 502480 }, { "epoch": 1.3, "learning_rate": 0.00010462101555027334, "loss": 0.0109, "step": 502490 }, { "epoch": 1.3, "learning_rate": 0.00010461712733390186, "loss": 0.011, "step": 502500 }, { "epoch": 1.3, "learning_rate": 0.0001046132391175304, "loss": 0.0072, "step": 502510 }, { "epoch": 1.3, "learning_rate": 0.00010460935090115893, "loss": 0.0109, "step": 502520 }, { "epoch": 1.3, "learning_rate": 0.00010460546268478748, "loss": 0.0084, "step": 502530 }, { "epoch": 1.3, "learning_rate": 0.000104601574468416, "loss": 0.0152, "step": 502540 }, { "epoch": 1.3, "learning_rate": 0.00010459768625204454, "loss": 0.0097, "step": 502550 }, { "epoch": 1.3, "learning_rate": 0.00010459379803567307, "loss": 0.0092, "step": 502560 }, { "epoch": 1.3, "learning_rate": 0.00010458990981930161, "loss": 0.0122, "step": 502570 }, { "epoch": 1.3, "learning_rate": 0.00010458602160293014, "loss": 0.009, "step": 502580 }, { "epoch": 1.3, "learning_rate": 0.0001045821333865587, "loss": 0.0099, "step": 502590 }, { "epoch": 1.3, "learning_rate": 0.00010457824517018723, "loss": 0.0098, "step": 502600 }, { "epoch": 1.3, "learning_rate": 0.00010457435695381577, "loss": 0.0121, "step": 502610 }, { "epoch": 1.3, "learning_rate": 0.0001045704687374443, "loss": 0.0081, "step": 502620 }, { "epoch": 1.3, "learning_rate": 0.00010456658052107284, "loss": 0.0068, "step": 502630 }, { "epoch": 1.3, "learning_rate": 0.00010456269230470137, "loss": 0.0142, "step": 502640 }, { "epoch": 1.3, "learning_rate": 0.00010455880408832991, "loss": 0.012, "step": 502650 }, { "epoch": 1.3, "learning_rate": 0.00010455491587195844, "loss": 0.0098, "step": 502660 }, { "epoch": 1.3, "learning_rate": 0.00010455102765558696, "loss": 0.0092, "step": 502670 }, { "epoch": 1.3, "learning_rate": 0.0001045471394392155, "loss": 0.0089, "step": 502680 }, { "epoch": 1.3, "learning_rate": 0.00010454325122284403, "loss": 0.0108, "step": 502690 }, { "epoch": 1.3, "learning_rate": 0.00010453936300647257, "loss": 0.0111, "step": 502700 }, { "epoch": 1.3, "learning_rate": 0.0001045354747901011, "loss": 0.0105, "step": 502710 }, { "epoch": 1.3, "learning_rate": 0.00010453158657372964, "loss": 0.0118, "step": 502720 }, { "epoch": 1.3, "learning_rate": 0.00010452769835735817, "loss": 0.0106, "step": 502730 }, { "epoch": 1.3, "learning_rate": 0.00010452381014098671, "loss": 0.0108, "step": 502740 }, { "epoch": 1.3, "learning_rate": 0.00010451992192461524, "loss": 0.0102, "step": 502750 }, { "epoch": 1.3, "learning_rate": 0.00010451603370824378, "loss": 0.0103, "step": 502760 }, { "epoch": 1.3, "learning_rate": 0.00010451214549187231, "loss": 0.0169, "step": 502770 }, { "epoch": 1.3, "learning_rate": 0.00010450825727550087, "loss": 0.0117, "step": 502780 }, { "epoch": 1.3, "learning_rate": 0.0001045043690591294, "loss": 0.0157, "step": 502790 }, { "epoch": 1.3, "learning_rate": 0.00010450048084275794, "loss": 0.0121, "step": 502800 }, { "epoch": 1.3, "learning_rate": 0.00010449659262638646, "loss": 0.0102, "step": 502810 }, { "epoch": 1.3, "learning_rate": 0.000104492704410015, "loss": 0.0109, "step": 502820 }, { "epoch": 1.3, "learning_rate": 0.00010448881619364353, "loss": 0.0092, "step": 502830 }, { "epoch": 1.3, "learning_rate": 0.00010448492797727208, "loss": 0.0107, "step": 502840 }, { "epoch": 1.3, "learning_rate": 0.0001044810397609006, "loss": 0.0104, "step": 502850 }, { "epoch": 1.3, "learning_rate": 0.00010447715154452915, "loss": 0.0093, "step": 502860 }, { "epoch": 1.3, "learning_rate": 0.00010447326332815767, "loss": 0.0103, "step": 502870 }, { "epoch": 1.3, "learning_rate": 0.00010446937511178622, "loss": 0.0076, "step": 502880 }, { "epoch": 1.3, "learning_rate": 0.00010446548689541474, "loss": 0.0085, "step": 502890 }, { "epoch": 1.3, "learning_rate": 0.00010446159867904329, "loss": 0.0088, "step": 502900 }, { "epoch": 1.3, "learning_rate": 0.00010445771046267181, "loss": 0.0108, "step": 502910 }, { "epoch": 1.3, "learning_rate": 0.00010445382224630034, "loss": 0.0078, "step": 502920 }, { "epoch": 1.3, "learning_rate": 0.00010444993402992888, "loss": 0.0086, "step": 502930 }, { "epoch": 1.3, "learning_rate": 0.00010444604581355741, "loss": 0.0106, "step": 502940 }, { "epoch": 1.3, "learning_rate": 0.00010444215759718597, "loss": 0.0129, "step": 502950 }, { "epoch": 1.3, "learning_rate": 0.00010443826938081448, "loss": 0.0062, "step": 502960 }, { "epoch": 1.3, "learning_rate": 0.00010443438116444304, "loss": 0.0105, "step": 502970 }, { "epoch": 1.3, "learning_rate": 0.00010443049294807156, "loss": 0.0075, "step": 502980 }, { "epoch": 1.3, "learning_rate": 0.0001044266047317001, "loss": 0.0116, "step": 502990 }, { "epoch": 1.3, "learning_rate": 0.00010442271651532863, "loss": 0.0093, "step": 503000 }, { "epoch": 1.3, "eval_cer": 0.8816662957628791, "eval_loss": 0.006540039554238319, "eval_runtime": 108.0994, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 503000 }, { "epoch": 1.3, "learning_rate": 0.00010441882829895718, "loss": 0.0084, "step": 503010 }, { "epoch": 1.3, "learning_rate": 0.0001044149400825857, "loss": 0.014, "step": 503020 }, { "epoch": 1.3, "learning_rate": 0.00010441105186621425, "loss": 0.0129, "step": 503030 }, { "epoch": 1.3, "learning_rate": 0.00010440716364984277, "loss": 0.013, "step": 503040 }, { "epoch": 1.3, "learning_rate": 0.00010440327543347132, "loss": 0.0099, "step": 503050 }, { "epoch": 1.3, "learning_rate": 0.00010439938721709984, "loss": 0.0118, "step": 503060 }, { "epoch": 1.3, "learning_rate": 0.00010439549900072838, "loss": 0.0091, "step": 503070 }, { "epoch": 1.3, "learning_rate": 0.00010439161078435691, "loss": 0.0107, "step": 503080 }, { "epoch": 1.3, "learning_rate": 0.00010438772256798545, "loss": 0.0095, "step": 503090 }, { "epoch": 1.3, "learning_rate": 0.00010438383435161398, "loss": 0.0118, "step": 503100 }, { "epoch": 1.3, "learning_rate": 0.00010437994613524254, "loss": 0.0096, "step": 503110 }, { "epoch": 1.3, "learning_rate": 0.00010437605791887105, "loss": 0.0104, "step": 503120 }, { "epoch": 1.3, "learning_rate": 0.00010437216970249961, "loss": 0.0072, "step": 503130 }, { "epoch": 1.3, "learning_rate": 0.00010436828148612814, "loss": 0.008, "step": 503140 }, { "epoch": 1.3, "learning_rate": 0.00010436439326975668, "loss": 0.0105, "step": 503150 }, { "epoch": 1.3, "learning_rate": 0.0001043605050533852, "loss": 0.0106, "step": 503160 }, { "epoch": 1.3, "learning_rate": 0.00010435661683701373, "loss": 0.0093, "step": 503170 }, { "epoch": 1.3, "learning_rate": 0.00010435272862064228, "loss": 0.0108, "step": 503180 }, { "epoch": 1.3, "learning_rate": 0.0001043488404042708, "loss": 0.01, "step": 503190 }, { "epoch": 1.3, "learning_rate": 0.00010434495218789934, "loss": 0.01, "step": 503200 }, { "epoch": 1.3, "learning_rate": 0.00010434106397152787, "loss": 0.009, "step": 503210 }, { "epoch": 1.3, "learning_rate": 0.00010433717575515641, "loss": 0.0089, "step": 503220 }, { "epoch": 1.3, "learning_rate": 0.00010433328753878494, "loss": 0.0077, "step": 503230 }, { "epoch": 1.3, "learning_rate": 0.00010432939932241348, "loss": 0.0091, "step": 503240 }, { "epoch": 1.3, "learning_rate": 0.00010432551110604201, "loss": 0.0096, "step": 503250 }, { "epoch": 1.3, "learning_rate": 0.00010432162288967055, "loss": 0.0109, "step": 503260 }, { "epoch": 1.3, "learning_rate": 0.00010431773467329908, "loss": 0.0127, "step": 503270 }, { "epoch": 1.3, "learning_rate": 0.00010431384645692762, "loss": 0.0117, "step": 503280 }, { "epoch": 1.3, "learning_rate": 0.00010430995824055615, "loss": 0.0139, "step": 503290 }, { "epoch": 1.3, "learning_rate": 0.00010430607002418471, "loss": 0.009, "step": 503300 }, { "epoch": 1.3, "learning_rate": 0.00010430218180781324, "loss": 0.0119, "step": 503310 }, { "epoch": 1.3, "learning_rate": 0.00010429829359144178, "loss": 0.0098, "step": 503320 }, { "epoch": 1.3, "learning_rate": 0.0001042944053750703, "loss": 0.0106, "step": 503330 }, { "epoch": 1.3, "learning_rate": 0.00010429051715869885, "loss": 0.0118, "step": 503340 }, { "epoch": 1.3, "learning_rate": 0.00010428662894232737, "loss": 0.0087, "step": 503350 }, { "epoch": 1.3, "learning_rate": 0.00010428274072595592, "loss": 0.0106, "step": 503360 }, { "epoch": 1.3, "learning_rate": 0.00010427885250958444, "loss": 0.0094, "step": 503370 }, { "epoch": 1.3, "learning_rate": 0.00010427496429321299, "loss": 0.0093, "step": 503380 }, { "epoch": 1.3, "learning_rate": 0.00010427107607684151, "loss": 0.0098, "step": 503390 }, { "epoch": 1.3, "learning_rate": 0.00010426718786047006, "loss": 0.0106, "step": 503400 }, { "epoch": 1.3, "learning_rate": 0.00010426329964409858, "loss": 0.0119, "step": 503410 }, { "epoch": 1.3, "learning_rate": 0.00010425941142772711, "loss": 0.0104, "step": 503420 }, { "epoch": 1.3, "learning_rate": 0.00010425552321135565, "loss": 0.0101, "step": 503430 }, { "epoch": 1.3, "learning_rate": 0.00010425163499498418, "loss": 0.0091, "step": 503440 }, { "epoch": 1.31, "learning_rate": 0.00010424774677861272, "loss": 0.0103, "step": 503450 }, { "epoch": 1.31, "learning_rate": 0.00010424385856224125, "loss": 0.0096, "step": 503460 }, { "epoch": 1.31, "learning_rate": 0.0001042399703458698, "loss": 0.0093, "step": 503470 }, { "epoch": 1.31, "learning_rate": 0.00010423608212949832, "loss": 0.0107, "step": 503480 }, { "epoch": 1.31, "learning_rate": 0.00010423219391312688, "loss": 0.0198, "step": 503490 }, { "epoch": 1.31, "learning_rate": 0.0001042283056967554, "loss": 0.0073, "step": 503500 }, { "epoch": 1.31, "learning_rate": 0.00010422441748038395, "loss": 0.0135, "step": 503510 }, { "epoch": 1.31, "learning_rate": 0.00010422052926401247, "loss": 0.0092, "step": 503520 }, { "epoch": 1.31, "learning_rate": 0.00010421664104764102, "loss": 0.0102, "step": 503530 }, { "epoch": 1.31, "learning_rate": 0.00010421275283126954, "loss": 0.01, "step": 503540 }, { "epoch": 1.31, "learning_rate": 0.00010420886461489809, "loss": 0.0113, "step": 503550 }, { "epoch": 1.31, "learning_rate": 0.00010420497639852661, "loss": 0.0134, "step": 503560 }, { "epoch": 1.31, "learning_rate": 0.00010420108818215515, "loss": 0.015, "step": 503570 }, { "epoch": 1.31, "learning_rate": 0.00010419719996578368, "loss": 0.0077, "step": 503580 }, { "epoch": 1.31, "learning_rate": 0.00010419331174941222, "loss": 0.0106, "step": 503590 }, { "epoch": 1.31, "learning_rate": 0.00010418942353304075, "loss": 0.0094, "step": 503600 }, { "epoch": 1.31, "learning_rate": 0.0001041855353166693, "loss": 0.0093, "step": 503610 }, { "epoch": 1.31, "learning_rate": 0.00010418164710029782, "loss": 0.0089, "step": 503620 }, { "epoch": 1.31, "learning_rate": 0.00010417775888392638, "loss": 0.0146, "step": 503630 }, { "epoch": 1.31, "learning_rate": 0.00010417387066755489, "loss": 0.009, "step": 503640 }, { "epoch": 1.31, "learning_rate": 0.00010416998245118345, "loss": 0.0103, "step": 503650 }, { "epoch": 1.31, "learning_rate": 0.00010416609423481198, "loss": 0.0127, "step": 503660 }, { "epoch": 1.31, "learning_rate": 0.0001041622060184405, "loss": 0.0092, "step": 503670 }, { "epoch": 1.31, "learning_rate": 0.00010415831780206905, "loss": 0.0109, "step": 503680 }, { "epoch": 1.31, "learning_rate": 0.00010415442958569757, "loss": 0.0077, "step": 503690 }, { "epoch": 1.31, "learning_rate": 0.00010415054136932611, "loss": 0.0068, "step": 503700 }, { "epoch": 1.31, "learning_rate": 0.00010414665315295464, "loss": 0.0088, "step": 503710 }, { "epoch": 1.31, "learning_rate": 0.00010414276493658318, "loss": 0.01, "step": 503720 }, { "epoch": 1.31, "learning_rate": 0.00010413887672021171, "loss": 0.0068, "step": 503730 }, { "epoch": 1.31, "learning_rate": 0.00010413498850384025, "loss": 0.0071, "step": 503740 }, { "epoch": 1.31, "learning_rate": 0.00010413110028746878, "loss": 0.0094, "step": 503750 }, { "epoch": 1.31, "learning_rate": 0.00010412721207109732, "loss": 0.0104, "step": 503760 }, { "epoch": 1.31, "learning_rate": 0.00010412332385472585, "loss": 0.0105, "step": 503770 }, { "epoch": 1.31, "learning_rate": 0.0001041194356383544, "loss": 0.0077, "step": 503780 }, { "epoch": 1.31, "learning_rate": 0.00010411554742198292, "loss": 0.0097, "step": 503790 }, { "epoch": 1.31, "learning_rate": 0.00010411165920561146, "loss": 0.0101, "step": 503800 }, { "epoch": 1.31, "learning_rate": 0.00010410777098923999, "loss": 0.0104, "step": 503810 }, { "epoch": 1.31, "learning_rate": 0.00010410388277286855, "loss": 0.0122, "step": 503820 }, { "epoch": 1.31, "learning_rate": 0.00010409999455649707, "loss": 0.0079, "step": 503830 }, { "epoch": 1.31, "learning_rate": 0.00010409610634012562, "loss": 0.0099, "step": 503840 }, { "epoch": 1.31, "learning_rate": 0.00010409221812375414, "loss": 0.0102, "step": 503850 }, { "epoch": 1.31, "learning_rate": 0.00010408832990738269, "loss": 0.0086, "step": 503860 }, { "epoch": 1.31, "learning_rate": 0.00010408444169101121, "loss": 0.0092, "step": 503870 }, { "epoch": 1.31, "learning_rate": 0.00010408055347463976, "loss": 0.0126, "step": 503880 }, { "epoch": 1.31, "learning_rate": 0.00010407666525826828, "loss": 0.0101, "step": 503890 }, { "epoch": 1.31, "learning_rate": 0.00010407277704189683, "loss": 0.0088, "step": 503900 }, { "epoch": 1.31, "learning_rate": 0.00010406888882552535, "loss": 0.0079, "step": 503910 }, { "epoch": 1.31, "learning_rate": 0.00010406500060915388, "loss": 0.0109, "step": 503920 }, { "epoch": 1.31, "learning_rate": 0.00010406111239278242, "loss": 0.0072, "step": 503930 }, { "epoch": 1.31, "learning_rate": 0.00010405722417641095, "loss": 0.0098, "step": 503940 }, { "epoch": 1.31, "learning_rate": 0.0001040533359600395, "loss": 0.012, "step": 503950 }, { "epoch": 1.31, "learning_rate": 0.00010404944774366802, "loss": 0.0136, "step": 503960 }, { "epoch": 1.31, "learning_rate": 0.00010404555952729656, "loss": 0.0109, "step": 503970 }, { "epoch": 1.31, "learning_rate": 0.00010404167131092509, "loss": 0.01, "step": 503980 }, { "epoch": 1.31, "learning_rate": 0.00010403778309455363, "loss": 0.0102, "step": 503990 }, { "epoch": 1.31, "learning_rate": 0.00010403389487818216, "loss": 0.0122, "step": 504000 }, { "epoch": 1.31, "eval_cer": 0.8816956881384969, "eval_loss": 0.0066497717052698135, "eval_runtime": 108.0868, "eval_samples_per_second": 18.504, "eval_steps_per_second": 4.626, "step": 504000 }, { "epoch": 1.31, "learning_rate": 0.00010403000666181072, "loss": 0.0098, "step": 504010 }, { "epoch": 1.31, "learning_rate": 0.00010402611844543924, "loss": 0.0094, "step": 504020 }, { "epoch": 1.31, "learning_rate": 0.00010402223022906779, "loss": 0.0102, "step": 504030 }, { "epoch": 1.31, "learning_rate": 0.00010401834201269631, "loss": 0.0081, "step": 504040 }, { "epoch": 1.31, "learning_rate": 0.00010401445379632486, "loss": 0.009, "step": 504050 }, { "epoch": 1.31, "learning_rate": 0.00010401056557995338, "loss": 0.0144, "step": 504060 }, { "epoch": 1.31, "learning_rate": 0.00010400667736358193, "loss": 0.0088, "step": 504070 }, { "epoch": 1.31, "learning_rate": 0.00010400278914721045, "loss": 0.012, "step": 504080 }, { "epoch": 1.31, "learning_rate": 0.000103998900930839, "loss": 0.009, "step": 504090 }, { "epoch": 1.31, "learning_rate": 0.00010399501271446752, "loss": 0.0127, "step": 504100 }, { "epoch": 1.31, "learning_rate": 0.00010399112449809606, "loss": 0.0113, "step": 504110 }, { "epoch": 1.31, "learning_rate": 0.00010398723628172459, "loss": 0.0105, "step": 504120 }, { "epoch": 1.31, "learning_rate": 0.00010398334806535313, "loss": 0.0101, "step": 504130 }, { "epoch": 1.31, "learning_rate": 0.00010397945984898166, "loss": 0.0091, "step": 504140 }, { "epoch": 1.31, "learning_rate": 0.0001039755716326102, "loss": 0.0135, "step": 504150 }, { "epoch": 1.31, "learning_rate": 0.00010397168341623873, "loss": 0.0115, "step": 504160 }, { "epoch": 1.31, "learning_rate": 0.00010396779519986726, "loss": 0.0113, "step": 504170 }, { "epoch": 1.31, "learning_rate": 0.00010396390698349582, "loss": 0.01, "step": 504180 }, { "epoch": 1.31, "learning_rate": 0.00010396001876712434, "loss": 0.0119, "step": 504190 }, { "epoch": 1.31, "learning_rate": 0.00010395613055075289, "loss": 0.0146, "step": 504200 }, { "epoch": 1.31, "learning_rate": 0.00010395224233438141, "loss": 0.0106, "step": 504210 }, { "epoch": 1.31, "learning_rate": 0.00010394835411800995, "loss": 0.0094, "step": 504220 }, { "epoch": 1.31, "learning_rate": 0.00010394446590163848, "loss": 0.0126, "step": 504230 }, { "epoch": 1.31, "learning_rate": 0.00010394057768526702, "loss": 0.0092, "step": 504240 }, { "epoch": 1.31, "learning_rate": 0.00010393668946889555, "loss": 0.0068, "step": 504250 }, { "epoch": 1.31, "learning_rate": 0.0001039328012525241, "loss": 0.0129, "step": 504260 }, { "epoch": 1.31, "learning_rate": 0.00010392891303615262, "loss": 0.0098, "step": 504270 }, { "epoch": 1.31, "learning_rate": 0.00010392502481978116, "loss": 0.0096, "step": 504280 }, { "epoch": 1.31, "learning_rate": 0.00010392113660340969, "loss": 0.0095, "step": 504290 }, { "epoch": 1.31, "learning_rate": 0.00010391724838703823, "loss": 0.0078, "step": 504300 }, { "epoch": 1.31, "learning_rate": 0.00010391336017066676, "loss": 0.0079, "step": 504310 }, { "epoch": 1.31, "learning_rate": 0.0001039094719542953, "loss": 0.0117, "step": 504320 }, { "epoch": 1.31, "learning_rate": 0.00010390558373792383, "loss": 0.0098, "step": 504330 }, { "epoch": 1.31, "learning_rate": 0.00010390169552155239, "loss": 0.009, "step": 504340 }, { "epoch": 1.31, "learning_rate": 0.0001038978073051809, "loss": 0.0126, "step": 504350 }, { "epoch": 1.31, "learning_rate": 0.00010389391908880946, "loss": 0.0104, "step": 504360 }, { "epoch": 1.31, "learning_rate": 0.00010389003087243798, "loss": 0.0123, "step": 504370 }, { "epoch": 1.31, "learning_rate": 0.00010388614265606653, "loss": 0.0072, "step": 504380 }, { "epoch": 1.31, "learning_rate": 0.00010388225443969505, "loss": 0.0118, "step": 504390 }, { "epoch": 1.31, "learning_rate": 0.0001038783662233236, "loss": 0.0084, "step": 504400 }, { "epoch": 1.31, "learning_rate": 0.00010387447800695212, "loss": 0.0112, "step": 504410 }, { "epoch": 1.31, "learning_rate": 0.00010387058979058065, "loss": 0.0113, "step": 504420 }, { "epoch": 1.31, "learning_rate": 0.0001038667015742092, "loss": 0.0088, "step": 504430 }, { "epoch": 1.31, "learning_rate": 0.00010386281335783772, "loss": 0.0088, "step": 504440 }, { "epoch": 1.31, "learning_rate": 0.00010385892514146626, "loss": 0.0093, "step": 504450 }, { "epoch": 1.31, "learning_rate": 0.00010385503692509479, "loss": 0.0113, "step": 504460 }, { "epoch": 1.31, "learning_rate": 0.00010385114870872333, "loss": 0.013, "step": 504470 }, { "epoch": 1.31, "learning_rate": 0.00010384726049235186, "loss": 0.0138, "step": 504480 }, { "epoch": 1.31, "learning_rate": 0.0001038433722759804, "loss": 0.0097, "step": 504490 }, { "epoch": 1.31, "learning_rate": 0.00010383948405960893, "loss": 0.0323, "step": 504500 }, { "epoch": 1.31, "learning_rate": 0.00010383559584323747, "loss": 0.0113, "step": 504510 }, { "epoch": 1.31, "learning_rate": 0.000103831707626866, "loss": 0.0146, "step": 504520 }, { "epoch": 1.31, "learning_rate": 0.00010382781941049456, "loss": 0.0085, "step": 504530 }, { "epoch": 1.31, "learning_rate": 0.00010382393119412308, "loss": 0.0099, "step": 504540 }, { "epoch": 1.31, "learning_rate": 0.00010382004297775163, "loss": 0.0099, "step": 504550 }, { "epoch": 1.31, "learning_rate": 0.00010381615476138015, "loss": 0.0121, "step": 504560 }, { "epoch": 1.31, "learning_rate": 0.0001038122665450087, "loss": 0.0104, "step": 504570 }, { "epoch": 1.31, "learning_rate": 0.00010380837832863722, "loss": 0.0115, "step": 504580 }, { "epoch": 1.31, "learning_rate": 0.00010380449011226577, "loss": 0.0118, "step": 504590 }, { "epoch": 1.31, "learning_rate": 0.00010380060189589429, "loss": 0.0109, "step": 504600 }, { "epoch": 1.31, "learning_rate": 0.00010379671367952283, "loss": 0.0101, "step": 504610 }, { "epoch": 1.31, "learning_rate": 0.00010379282546315136, "loss": 0.0101, "step": 504620 }, { "epoch": 1.31, "learning_rate": 0.0001037889372467799, "loss": 0.0108, "step": 504630 }, { "epoch": 1.31, "learning_rate": 0.00010378504903040843, "loss": 0.012, "step": 504640 }, { "epoch": 1.31, "learning_rate": 0.00010378116081403696, "loss": 0.0145, "step": 504650 }, { "epoch": 1.31, "learning_rate": 0.0001037772725976655, "loss": 0.011, "step": 504660 }, { "epoch": 1.31, "learning_rate": 0.00010377338438129403, "loss": 0.0124, "step": 504670 }, { "epoch": 1.31, "learning_rate": 0.00010376949616492257, "loss": 0.0105, "step": 504680 }, { "epoch": 1.31, "learning_rate": 0.0001037656079485511, "loss": 0.0093, "step": 504690 }, { "epoch": 1.31, "learning_rate": 0.00010376171973217966, "loss": 0.0107, "step": 504700 }, { "epoch": 1.31, "learning_rate": 0.00010375783151580817, "loss": 0.0084, "step": 504710 }, { "epoch": 1.31, "learning_rate": 0.00010375394329943673, "loss": 0.0086, "step": 504720 }, { "epoch": 1.31, "learning_rate": 0.00010375005508306525, "loss": 0.008, "step": 504730 }, { "epoch": 1.31, "learning_rate": 0.0001037461668666938, "loss": 0.0106, "step": 504740 }, { "epoch": 1.31, "learning_rate": 0.00010374227865032232, "loss": 0.0101, "step": 504750 }, { "epoch": 1.31, "learning_rate": 0.00010373839043395086, "loss": 0.0081, "step": 504760 }, { "epoch": 1.31, "learning_rate": 0.00010373450221757939, "loss": 0.0085, "step": 504770 }, { "epoch": 1.31, "learning_rate": 0.00010373061400120793, "loss": 0.0113, "step": 504780 }, { "epoch": 1.31, "learning_rate": 0.00010372672578483646, "loss": 0.007, "step": 504790 }, { "epoch": 1.31, "learning_rate": 0.000103722837568465, "loss": 0.0074, "step": 504800 }, { "epoch": 1.31, "learning_rate": 0.00010371894935209353, "loss": 0.0118, "step": 504810 }, { "epoch": 1.31, "learning_rate": 0.00010371506113572207, "loss": 0.0105, "step": 504820 }, { "epoch": 1.31, "learning_rate": 0.0001037111729193506, "loss": 0.0141, "step": 504830 }, { "epoch": 1.31, "learning_rate": 0.00010370728470297914, "loss": 0.0104, "step": 504840 }, { "epoch": 1.31, "learning_rate": 0.00010370339648660767, "loss": 0.0091, "step": 504850 }, { "epoch": 1.31, "learning_rate": 0.00010369950827023623, "loss": 0.0099, "step": 504860 }, { "epoch": 1.31, "learning_rate": 0.00010369562005386474, "loss": 0.0105, "step": 504870 }, { "epoch": 1.31, "learning_rate": 0.0001036917318374933, "loss": 0.0123, "step": 504880 }, { "epoch": 1.31, "learning_rate": 0.00010368784362112182, "loss": 0.0104, "step": 504890 }, { "epoch": 1.31, "learning_rate": 0.00010368395540475035, "loss": 0.0127, "step": 504900 }, { "epoch": 1.31, "learning_rate": 0.0001036800671883789, "loss": 0.008, "step": 504910 }, { "epoch": 1.31, "learning_rate": 0.00010367617897200742, "loss": 0.0132, "step": 504920 }, { "epoch": 1.31, "learning_rate": 0.00010367229075563596, "loss": 0.0102, "step": 504930 }, { "epoch": 1.31, "learning_rate": 0.00010366840253926449, "loss": 0.012, "step": 504940 }, { "epoch": 1.31, "learning_rate": 0.00010366451432289303, "loss": 0.0088, "step": 504950 }, { "epoch": 1.31, "learning_rate": 0.00010366062610652156, "loss": 0.0094, "step": 504960 }, { "epoch": 1.31, "learning_rate": 0.0001036567378901501, "loss": 0.0099, "step": 504970 }, { "epoch": 1.31, "learning_rate": 0.00010365284967377863, "loss": 0.0112, "step": 504980 }, { "epoch": 1.31, "learning_rate": 0.00010364896145740717, "loss": 0.0099, "step": 504990 }, { "epoch": 1.31, "learning_rate": 0.0001036450732410357, "loss": 0.008, "step": 505000 }, { "epoch": 1.31, "eval_cer": 0.8817096845078387, "eval_loss": 0.006840614136308432, "eval_runtime": 108.1691, "eval_samples_per_second": 18.49, "eval_steps_per_second": 4.622, "step": 505000 }, { "epoch": 1.31, "learning_rate": 0.00010364118502466424, "loss": 0.0109, "step": 505010 }, { "epoch": 1.31, "learning_rate": 0.00010363729680829277, "loss": 0.0099, "step": 505020 }, { "epoch": 1.31, "learning_rate": 0.00010363340859192131, "loss": 0.0087, "step": 505030 }, { "epoch": 1.31, "learning_rate": 0.00010362952037554984, "loss": 0.0103, "step": 505040 }, { "epoch": 1.31, "learning_rate": 0.0001036256321591784, "loss": 0.0114, "step": 505050 }, { "epoch": 1.31, "learning_rate": 0.00010362174394280692, "loss": 0.0117, "step": 505060 }, { "epoch": 1.31, "learning_rate": 0.00010361785572643547, "loss": 0.0103, "step": 505070 }, { "epoch": 1.31, "learning_rate": 0.000103613967510064, "loss": 0.0093, "step": 505080 }, { "epoch": 1.31, "learning_rate": 0.00010361007929369254, "loss": 0.0106, "step": 505090 }, { "epoch": 1.31, "learning_rate": 0.00010360619107732106, "loss": 0.0129, "step": 505100 }, { "epoch": 1.31, "learning_rate": 0.0001036023028609496, "loss": 0.0094, "step": 505110 }, { "epoch": 1.31, "learning_rate": 0.00010359841464457813, "loss": 0.0089, "step": 505120 }, { "epoch": 1.31, "learning_rate": 0.00010359452642820667, "loss": 0.0126, "step": 505130 }, { "epoch": 1.31, "learning_rate": 0.0001035906382118352, "loss": 0.0099, "step": 505140 }, { "epoch": 1.31, "learning_rate": 0.00010358674999546373, "loss": 0.0106, "step": 505150 }, { "epoch": 1.31, "learning_rate": 0.00010358286177909227, "loss": 0.0085, "step": 505160 }, { "epoch": 1.31, "learning_rate": 0.0001035789735627208, "loss": 0.0079, "step": 505170 }, { "epoch": 1.31, "learning_rate": 0.00010357508534634934, "loss": 0.009, "step": 505180 }, { "epoch": 1.31, "learning_rate": 0.00010357119712997787, "loss": 0.0112, "step": 505190 }, { "epoch": 1.31, "learning_rate": 0.00010356730891360641, "loss": 0.0111, "step": 505200 }, { "epoch": 1.31, "learning_rate": 0.00010356342069723494, "loss": 0.0112, "step": 505210 }, { "epoch": 1.31, "learning_rate": 0.0001035595324808635, "loss": 0.0089, "step": 505220 }, { "epoch": 1.31, "learning_rate": 0.00010355564426449201, "loss": 0.0076, "step": 505230 }, { "epoch": 1.31, "learning_rate": 0.00010355175604812056, "loss": 0.01, "step": 505240 }, { "epoch": 1.31, "learning_rate": 0.00010354786783174909, "loss": 0.008, "step": 505250 }, { "epoch": 1.31, "learning_rate": 0.00010354397961537763, "loss": 0.0108, "step": 505260 }, { "epoch": 1.31, "learning_rate": 0.00010354009139900616, "loss": 0.0099, "step": 505270 }, { "epoch": 1.31, "learning_rate": 0.0001035362031826347, "loss": 0.0101, "step": 505280 }, { "epoch": 1.31, "learning_rate": 0.00010353231496626323, "loss": 0.0105, "step": 505290 }, { "epoch": 1.31, "learning_rate": 0.00010352842674989177, "loss": 0.0111, "step": 505300 }, { "epoch": 1.31, "learning_rate": 0.0001035245385335203, "loss": 0.0097, "step": 505310 }, { "epoch": 1.31, "learning_rate": 0.00010352065031714884, "loss": 0.008, "step": 505320 }, { "epoch": 1.31, "learning_rate": 0.00010351676210077737, "loss": 0.0128, "step": 505330 }, { "epoch": 1.31, "learning_rate": 0.00010351287388440591, "loss": 0.0082, "step": 505340 }, { "epoch": 1.31, "learning_rate": 0.00010350898566803444, "loss": 0.0097, "step": 505350 }, { "epoch": 1.31, "learning_rate": 0.00010350509745166298, "loss": 0.0092, "step": 505360 }, { "epoch": 1.31, "learning_rate": 0.00010350120923529151, "loss": 0.0125, "step": 505370 }, { "epoch": 1.31, "learning_rate": 0.00010349732101892005, "loss": 0.0108, "step": 505380 }, { "epoch": 1.31, "learning_rate": 0.00010349343280254858, "loss": 0.0115, "step": 505390 }, { "epoch": 1.31, "learning_rate": 0.00010348954458617711, "loss": 0.0112, "step": 505400 }, { "epoch": 1.31, "learning_rate": 0.00010348565636980566, "loss": 0.0101, "step": 505410 }, { "epoch": 1.31, "learning_rate": 0.00010348176815343419, "loss": 0.0087, "step": 505420 }, { "epoch": 1.31, "learning_rate": 0.00010347787993706273, "loss": 0.0111, "step": 505430 }, { "epoch": 1.31, "learning_rate": 0.00010347399172069126, "loss": 0.0107, "step": 505440 }, { "epoch": 1.31, "learning_rate": 0.0001034701035043198, "loss": 0.0095, "step": 505450 }, { "epoch": 1.31, "learning_rate": 0.00010346621528794833, "loss": 0.0112, "step": 505460 }, { "epoch": 1.31, "learning_rate": 0.00010346232707157687, "loss": 0.0107, "step": 505470 }, { "epoch": 1.31, "learning_rate": 0.0001034584388552054, "loss": 0.0092, "step": 505480 }, { "epoch": 1.31, "learning_rate": 0.00010345455063883394, "loss": 0.0093, "step": 505490 }, { "epoch": 1.31, "learning_rate": 0.00010345066242246247, "loss": 0.0117, "step": 505500 }, { "epoch": 1.31, "learning_rate": 0.00010344677420609101, "loss": 0.0075, "step": 505510 }, { "epoch": 1.31, "learning_rate": 0.00010344288598971954, "loss": 0.0107, "step": 505520 }, { "epoch": 1.31, "learning_rate": 0.00010343899777334808, "loss": 0.0118, "step": 505530 }, { "epoch": 1.31, "learning_rate": 0.00010343510955697661, "loss": 0.0152, "step": 505540 }, { "epoch": 1.31, "learning_rate": 0.00010343122134060515, "loss": 0.0088, "step": 505550 }, { "epoch": 1.31, "learning_rate": 0.00010342733312423368, "loss": 0.0092, "step": 505560 }, { "epoch": 1.31, "learning_rate": 0.00010342344490786224, "loss": 0.0101, "step": 505570 }, { "epoch": 1.31, "learning_rate": 0.00010341955669149075, "loss": 0.0115, "step": 505580 }, { "epoch": 1.31, "learning_rate": 0.0001034156684751193, "loss": 0.0099, "step": 505590 }, { "epoch": 1.31, "learning_rate": 0.00010341178025874783, "loss": 0.009, "step": 505600 }, { "epoch": 1.31, "learning_rate": 0.00010340789204237638, "loss": 0.0083, "step": 505610 }, { "epoch": 1.31, "learning_rate": 0.0001034040038260049, "loss": 0.0092, "step": 505620 }, { "epoch": 1.31, "learning_rate": 0.00010340011560963344, "loss": 0.0113, "step": 505630 }, { "epoch": 1.31, "learning_rate": 0.00010339622739326197, "loss": 0.0136, "step": 505640 }, { "epoch": 1.31, "learning_rate": 0.0001033923391768905, "loss": 0.0114, "step": 505650 }, { "epoch": 1.31, "learning_rate": 0.00010338845096051904, "loss": 0.0075, "step": 505660 }, { "epoch": 1.31, "learning_rate": 0.00010338456274414757, "loss": 0.0106, "step": 505670 }, { "epoch": 1.31, "learning_rate": 0.00010338067452777611, "loss": 0.0078, "step": 505680 }, { "epoch": 1.31, "learning_rate": 0.00010337678631140464, "loss": 0.014, "step": 505690 }, { "epoch": 1.31, "learning_rate": 0.00010337289809503318, "loss": 0.011, "step": 505700 }, { "epoch": 1.31, "learning_rate": 0.00010336900987866171, "loss": 0.009, "step": 505710 }, { "epoch": 1.31, "learning_rate": 0.00010336512166229025, "loss": 0.0089, "step": 505720 }, { "epoch": 1.31, "learning_rate": 0.00010336123344591878, "loss": 0.0094, "step": 505730 }, { "epoch": 1.31, "learning_rate": 0.00010335734522954732, "loss": 0.0091, "step": 505740 }, { "epoch": 1.31, "learning_rate": 0.00010335345701317585, "loss": 0.0117, "step": 505750 }, { "epoch": 1.31, "learning_rate": 0.0001033495687968044, "loss": 0.0069, "step": 505760 }, { "epoch": 1.31, "learning_rate": 0.00010334568058043293, "loss": 0.0102, "step": 505770 }, { "epoch": 1.31, "learning_rate": 0.00010334179236406147, "loss": 0.0114, "step": 505780 }, { "epoch": 1.31, "learning_rate": 0.00010333790414769, "loss": 0.0121, "step": 505790 }, { "epoch": 1.31, "learning_rate": 0.00010333401593131854, "loss": 0.0107, "step": 505800 }, { "epoch": 1.31, "learning_rate": 0.00010333012771494707, "loss": 0.0087, "step": 505810 }, { "epoch": 1.31, "learning_rate": 0.00010332623949857561, "loss": 0.0133, "step": 505820 }, { "epoch": 1.31, "learning_rate": 0.00010332235128220414, "loss": 0.0098, "step": 505830 }, { "epoch": 1.31, "learning_rate": 0.00010331846306583268, "loss": 0.0139, "step": 505840 }, { "epoch": 1.31, "learning_rate": 0.00010331457484946121, "loss": 0.0095, "step": 505850 }, { "epoch": 1.31, "learning_rate": 0.00010331068663308975, "loss": 0.0163, "step": 505860 }, { "epoch": 1.31, "learning_rate": 0.00010330679841671828, "loss": 0.0107, "step": 505870 }, { "epoch": 1.31, "learning_rate": 0.00010330291020034682, "loss": 0.0139, "step": 505880 }, { "epoch": 1.31, "learning_rate": 0.00010329902198397535, "loss": 0.0096, "step": 505890 }, { "epoch": 1.31, "learning_rate": 0.00010329513376760388, "loss": 0.0188, "step": 505900 }, { "epoch": 1.31, "learning_rate": 0.00010329124555123242, "loss": 0.0081, "step": 505910 }, { "epoch": 1.31, "learning_rate": 0.00010328735733486095, "loss": 0.0133, "step": 505920 }, { "epoch": 1.31, "learning_rate": 0.0001032834691184895, "loss": 0.0101, "step": 505930 }, { "epoch": 1.31, "learning_rate": 0.00010327958090211802, "loss": 0.0078, "step": 505940 }, { "epoch": 1.31, "learning_rate": 0.00010327569268574657, "loss": 0.0319, "step": 505950 }, { "epoch": 1.31, "learning_rate": 0.0001032718044693751, "loss": 0.0085, "step": 505960 }, { "epoch": 1.31, "learning_rate": 0.00010326791625300364, "loss": 0.0111, "step": 505970 }, { "epoch": 1.31, "learning_rate": 0.00010326402803663217, "loss": 0.0087, "step": 505980 }, { "epoch": 1.31, "learning_rate": 0.00010326013982026071, "loss": 0.0171, "step": 505990 }, { "epoch": 1.31, "learning_rate": 0.00010325625160388924, "loss": 0.0131, "step": 506000 }, { "epoch": 1.31, "eval_cer": 0.88167329394755, "eval_loss": 0.006615667603909969, "eval_runtime": 107.9151, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 506000 }, { "epoch": 1.31, "learning_rate": 0.00010325236338751778, "loss": 0.0095, "step": 506010 }, { "epoch": 1.31, "learning_rate": 0.00010324847517114631, "loss": 0.0094, "step": 506020 }, { "epoch": 1.31, "learning_rate": 0.00010324458695477485, "loss": 0.0105, "step": 506030 }, { "epoch": 1.31, "learning_rate": 0.00010324069873840338, "loss": 0.0091, "step": 506040 }, { "epoch": 1.31, "learning_rate": 0.00010323681052203192, "loss": 0.0147, "step": 506050 }, { "epoch": 1.31, "learning_rate": 0.00010323292230566045, "loss": 0.0101, "step": 506060 }, { "epoch": 1.31, "learning_rate": 0.00010322903408928899, "loss": 0.0099, "step": 506070 }, { "epoch": 1.31, "learning_rate": 0.00010322514587291752, "loss": 0.0073, "step": 506080 }, { "epoch": 1.31, "learning_rate": 0.00010322125765654608, "loss": 0.0114, "step": 506090 }, { "epoch": 1.31, "learning_rate": 0.00010321736944017459, "loss": 0.0113, "step": 506100 }, { "epoch": 1.31, "learning_rate": 0.00010321348122380315, "loss": 0.008, "step": 506110 }, { "epoch": 1.31, "learning_rate": 0.00010320959300743167, "loss": 0.0109, "step": 506120 }, { "epoch": 1.31, "learning_rate": 0.00010320570479106022, "loss": 0.0118, "step": 506130 }, { "epoch": 1.31, "learning_rate": 0.00010320181657468874, "loss": 0.0092, "step": 506140 }, { "epoch": 1.31, "learning_rate": 0.00010319792835831727, "loss": 0.0109, "step": 506150 }, { "epoch": 1.31, "learning_rate": 0.00010319404014194581, "loss": 0.008, "step": 506160 }, { "epoch": 1.31, "learning_rate": 0.00010319015192557434, "loss": 0.0103, "step": 506170 }, { "epoch": 1.31, "learning_rate": 0.00010318626370920288, "loss": 0.0104, "step": 506180 }, { "epoch": 1.31, "learning_rate": 0.00010318237549283141, "loss": 0.0117, "step": 506190 }, { "epoch": 1.31, "learning_rate": 0.00010317848727645995, "loss": 0.0101, "step": 506200 }, { "epoch": 1.31, "learning_rate": 0.00010317459906008848, "loss": 0.0112, "step": 506210 }, { "epoch": 1.31, "learning_rate": 0.00010317071084371702, "loss": 0.0082, "step": 506220 }, { "epoch": 1.31, "learning_rate": 0.00010316682262734555, "loss": 0.0109, "step": 506230 }, { "epoch": 1.31, "learning_rate": 0.00010316293441097409, "loss": 0.012, "step": 506240 }, { "epoch": 1.31, "learning_rate": 0.00010315904619460262, "loss": 0.0124, "step": 506250 }, { "epoch": 1.31, "learning_rate": 0.00010315515797823116, "loss": 0.0084, "step": 506260 }, { "epoch": 1.31, "learning_rate": 0.00010315126976185969, "loss": 0.0088, "step": 506270 }, { "epoch": 1.31, "learning_rate": 0.00010314738154548824, "loss": 0.011, "step": 506280 }, { "epoch": 1.31, "learning_rate": 0.00010314349332911677, "loss": 0.0085, "step": 506290 }, { "epoch": 1.31, "learning_rate": 0.00010313960511274531, "loss": 0.0095, "step": 506300 }, { "epoch": 1.31, "learning_rate": 0.00010313571689637384, "loss": 0.0118, "step": 506310 }, { "epoch": 1.31, "learning_rate": 0.00010313182868000238, "loss": 0.0108, "step": 506320 }, { "epoch": 1.31, "learning_rate": 0.00010312794046363091, "loss": 0.0096, "step": 506330 }, { "epoch": 1.31, "learning_rate": 0.00010312405224725945, "loss": 0.0118, "step": 506340 }, { "epoch": 1.31, "learning_rate": 0.00010312016403088798, "loss": 0.0117, "step": 506350 }, { "epoch": 1.31, "learning_rate": 0.00010311627581451652, "loss": 0.0068, "step": 506360 }, { "epoch": 1.31, "learning_rate": 0.00010311238759814505, "loss": 0.0096, "step": 506370 }, { "epoch": 1.31, "learning_rate": 0.0001031084993817736, "loss": 0.0096, "step": 506380 }, { "epoch": 1.31, "learning_rate": 0.00010310461116540212, "loss": 0.0128, "step": 506390 }, { "epoch": 1.31, "learning_rate": 0.00010310072294903065, "loss": 0.0107, "step": 506400 }, { "epoch": 1.31, "learning_rate": 0.00010309683473265919, "loss": 0.0134, "step": 506410 }, { "epoch": 1.31, "learning_rate": 0.00010309294651628772, "loss": 0.0135, "step": 506420 }, { "epoch": 1.31, "learning_rate": 0.00010308905829991626, "loss": 0.0081, "step": 506430 }, { "epoch": 1.31, "learning_rate": 0.00010308517008354479, "loss": 0.0075, "step": 506440 }, { "epoch": 1.31, "learning_rate": 0.00010308128186717334, "loss": 0.0105, "step": 506450 }, { "epoch": 1.31, "learning_rate": 0.00010307739365080186, "loss": 0.0085, "step": 506460 }, { "epoch": 1.31, "learning_rate": 0.00010307350543443041, "loss": 0.0123, "step": 506470 }, { "epoch": 1.31, "learning_rate": 0.00010306961721805894, "loss": 0.0062, "step": 506480 }, { "epoch": 1.31, "learning_rate": 0.00010306572900168748, "loss": 0.0072, "step": 506490 }, { "epoch": 1.31, "learning_rate": 0.00010306184078531601, "loss": 0.0129, "step": 506500 }, { "epoch": 1.31, "learning_rate": 0.00010305795256894455, "loss": 0.0119, "step": 506510 }, { "epoch": 1.31, "learning_rate": 0.00010305406435257308, "loss": 0.0088, "step": 506520 }, { "epoch": 1.31, "learning_rate": 0.00010305017613620162, "loss": 0.0121, "step": 506530 }, { "epoch": 1.31, "learning_rate": 0.00010304628791983015, "loss": 0.0119, "step": 506540 }, { "epoch": 1.31, "learning_rate": 0.00010304239970345869, "loss": 0.0093, "step": 506550 }, { "epoch": 1.31, "learning_rate": 0.00010303851148708722, "loss": 0.0095, "step": 506560 }, { "epoch": 1.31, "learning_rate": 0.00010303462327071576, "loss": 0.0117, "step": 506570 }, { "epoch": 1.31, "learning_rate": 0.00010303073505434429, "loss": 0.0087, "step": 506580 }, { "epoch": 1.31, "learning_rate": 0.00010302684683797283, "loss": 0.0076, "step": 506590 }, { "epoch": 1.31, "learning_rate": 0.00010302295862160136, "loss": 0.0117, "step": 506600 }, { "epoch": 1.31, "learning_rate": 0.00010301907040522992, "loss": 0.0082, "step": 506610 }, { "epoch": 1.31, "learning_rate": 0.00010301518218885843, "loss": 0.0115, "step": 506620 }, { "epoch": 1.31, "learning_rate": 0.00010301129397248699, "loss": 0.0091, "step": 506630 }, { "epoch": 1.31, "learning_rate": 0.00010300740575611551, "loss": 0.0105, "step": 506640 }, { "epoch": 1.31, "learning_rate": 0.00010300351753974404, "loss": 0.0147, "step": 506650 }, { "epoch": 1.31, "learning_rate": 0.00010299962932337258, "loss": 0.0101, "step": 506660 }, { "epoch": 1.31, "learning_rate": 0.00010299574110700111, "loss": 0.0088, "step": 506670 }, { "epoch": 1.31, "learning_rate": 0.00010299185289062965, "loss": 0.0084, "step": 506680 }, { "epoch": 1.31, "learning_rate": 0.00010298796467425818, "loss": 0.0113, "step": 506690 }, { "epoch": 1.31, "learning_rate": 0.00010298407645788672, "loss": 0.0089, "step": 506700 }, { "epoch": 1.31, "learning_rate": 0.00010298018824151525, "loss": 0.0145, "step": 506710 }, { "epoch": 1.31, "learning_rate": 0.00010297630002514379, "loss": 0.0107, "step": 506720 }, { "epoch": 1.31, "learning_rate": 0.00010297241180877232, "loss": 0.0127, "step": 506730 }, { "epoch": 1.31, "learning_rate": 0.00010296852359240086, "loss": 0.0122, "step": 506740 }, { "epoch": 1.31, "learning_rate": 0.00010296463537602939, "loss": 0.0133, "step": 506750 }, { "epoch": 1.31, "learning_rate": 0.00010296074715965793, "loss": 0.0111, "step": 506760 }, { "epoch": 1.31, "learning_rate": 0.00010295685894328646, "loss": 0.0113, "step": 506770 }, { "epoch": 1.31, "learning_rate": 0.000102952970726915, "loss": 0.0119, "step": 506780 }, { "epoch": 1.31, "learning_rate": 0.00010294908251054353, "loss": 0.008, "step": 506790 }, { "epoch": 1.31, "learning_rate": 0.00010294519429417208, "loss": 0.0104, "step": 506800 }, { "epoch": 1.31, "learning_rate": 0.00010294130607780061, "loss": 0.0115, "step": 506810 }, { "epoch": 1.31, "learning_rate": 0.00010293741786142915, "loss": 0.0123, "step": 506820 }, { "epoch": 1.31, "learning_rate": 0.00010293352964505768, "loss": 0.0106, "step": 506830 }, { "epoch": 1.31, "learning_rate": 0.00010292964142868622, "loss": 0.0097, "step": 506840 }, { "epoch": 1.31, "learning_rate": 0.00010292575321231475, "loss": 0.0112, "step": 506850 }, { "epoch": 1.31, "learning_rate": 0.0001029218649959433, "loss": 0.0095, "step": 506860 }, { "epoch": 1.31, "learning_rate": 0.00010291797677957182, "loss": 0.0082, "step": 506870 }, { "epoch": 1.31, "learning_rate": 0.00010291408856320036, "loss": 0.0136, "step": 506880 }, { "epoch": 1.31, "learning_rate": 0.00010291020034682889, "loss": 0.0074, "step": 506890 }, { "epoch": 1.31, "learning_rate": 0.00010290631213045742, "loss": 0.0113, "step": 506900 }, { "epoch": 1.31, "learning_rate": 0.00010290242391408596, "loss": 0.0081, "step": 506910 }, { "epoch": 1.31, "learning_rate": 0.00010289853569771449, "loss": 0.0103, "step": 506920 }, { "epoch": 1.31, "learning_rate": 0.00010289464748134303, "loss": 0.0099, "step": 506930 }, { "epoch": 1.31, "learning_rate": 0.00010289075926497156, "loss": 0.0118, "step": 506940 }, { "epoch": 1.31, "learning_rate": 0.0001028868710486001, "loss": 0.0102, "step": 506950 }, { "epoch": 1.31, "learning_rate": 0.00010288298283222863, "loss": 0.0095, "step": 506960 }, { "epoch": 1.31, "learning_rate": 0.00010287909461585717, "loss": 0.0099, "step": 506970 }, { "epoch": 1.31, "learning_rate": 0.0001028752063994857, "loss": 0.0116, "step": 506980 }, { "epoch": 1.31, "learning_rate": 0.00010287131818311425, "loss": 0.0101, "step": 506990 }, { "epoch": 1.31, "learning_rate": 0.00010286742996674278, "loss": 0.0111, "step": 507000 }, { "epoch": 1.31, "eval_cer": 0.8816592975782083, "eval_loss": 0.0065526701509952545, "eval_runtime": 108.0305, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 507000 }, { "epoch": 1.31, "learning_rate": 0.00010286354175037132, "loss": 0.0113, "step": 507010 }, { "epoch": 1.31, "learning_rate": 0.00010285965353399985, "loss": 0.0081, "step": 507020 }, { "epoch": 1.31, "learning_rate": 0.0001028557653176284, "loss": 0.0106, "step": 507030 }, { "epoch": 1.31, "learning_rate": 0.00010285187710125692, "loss": 0.0078, "step": 507040 }, { "epoch": 1.31, "learning_rate": 0.00010284798888488546, "loss": 0.0133, "step": 507050 }, { "epoch": 1.31, "learning_rate": 0.00010284410066851399, "loss": 0.0107, "step": 507060 }, { "epoch": 1.31, "learning_rate": 0.00010284021245214253, "loss": 0.0099, "step": 507070 }, { "epoch": 1.31, "learning_rate": 0.00010283632423577106, "loss": 0.0105, "step": 507080 }, { "epoch": 1.31, "learning_rate": 0.0001028324360193996, "loss": 0.0091, "step": 507090 }, { "epoch": 1.31, "learning_rate": 0.00010282854780302813, "loss": 0.0098, "step": 507100 }, { "epoch": 1.31, "learning_rate": 0.00010282465958665667, "loss": 0.0104, "step": 507110 }, { "epoch": 1.31, "learning_rate": 0.0001028207713702852, "loss": 0.0102, "step": 507120 }, { "epoch": 1.31, "learning_rate": 0.00010281688315391373, "loss": 0.0082, "step": 507130 }, { "epoch": 1.31, "learning_rate": 0.00010281299493754227, "loss": 0.0105, "step": 507140 }, { "epoch": 1.31, "learning_rate": 0.0001028091067211708, "loss": 0.0118, "step": 507150 }, { "epoch": 1.31, "learning_rate": 0.00010280521850479935, "loss": 0.0087, "step": 507160 }, { "epoch": 1.31, "learning_rate": 0.00010280133028842787, "loss": 0.011, "step": 507170 }, { "epoch": 1.31, "learning_rate": 0.00010279744207205642, "loss": 0.01, "step": 507180 }, { "epoch": 1.31, "learning_rate": 0.00010279355385568495, "loss": 0.011, "step": 507190 }, { "epoch": 1.31, "learning_rate": 0.00010278966563931349, "loss": 0.0096, "step": 507200 }, { "epoch": 1.31, "learning_rate": 0.00010278577742294202, "loss": 0.0118, "step": 507210 }, { "epoch": 1.31, "learning_rate": 0.00010278188920657056, "loss": 0.011, "step": 507220 }, { "epoch": 1.31, "learning_rate": 0.00010277800099019909, "loss": 0.01, "step": 507230 }, { "epoch": 1.31, "learning_rate": 0.00010277411277382763, "loss": 0.0129, "step": 507240 }, { "epoch": 1.31, "learning_rate": 0.00010277022455745616, "loss": 0.0097, "step": 507250 }, { "epoch": 1.31, "learning_rate": 0.0001027663363410847, "loss": 0.0095, "step": 507260 }, { "epoch": 1.31, "learning_rate": 0.00010276244812471323, "loss": 0.0086, "step": 507270 }, { "epoch": 1.31, "learning_rate": 0.00010275855990834177, "loss": 0.0114, "step": 507280 }, { "epoch": 1.31, "learning_rate": 0.0001027546716919703, "loss": 0.0094, "step": 507290 }, { "epoch": 1.31, "learning_rate": 0.00010275078347559884, "loss": 0.0123, "step": 507300 }, { "epoch": 1.32, "learning_rate": 0.00010274689525922737, "loss": 0.0096, "step": 507310 }, { "epoch": 1.32, "learning_rate": 0.00010274300704285592, "loss": 0.0097, "step": 507320 }, { "epoch": 1.32, "learning_rate": 0.00010273911882648444, "loss": 0.0122, "step": 507330 }, { "epoch": 1.32, "learning_rate": 0.000102735230610113, "loss": 0.0126, "step": 507340 }, { "epoch": 1.32, "learning_rate": 0.00010273134239374152, "loss": 0.0087, "step": 507350 }, { "epoch": 1.32, "learning_rate": 0.00010272745417737006, "loss": 0.0094, "step": 507360 }, { "epoch": 1.32, "learning_rate": 0.00010272356596099859, "loss": 0.0112, "step": 507370 }, { "epoch": 1.32, "learning_rate": 0.00010271967774462712, "loss": 0.0103, "step": 507380 }, { "epoch": 1.32, "learning_rate": 0.00010271578952825566, "loss": 0.0071, "step": 507390 }, { "epoch": 1.32, "learning_rate": 0.00010271190131188419, "loss": 0.0104, "step": 507400 }, { "epoch": 1.32, "learning_rate": 0.00010270801309551273, "loss": 0.0111, "step": 507410 }, { "epoch": 1.32, "learning_rate": 0.00010270412487914126, "loss": 0.0081, "step": 507420 }, { "epoch": 1.32, "learning_rate": 0.0001027002366627698, "loss": 0.0093, "step": 507430 }, { "epoch": 1.32, "learning_rate": 0.00010269634844639833, "loss": 0.0111, "step": 507440 }, { "epoch": 1.32, "learning_rate": 0.00010269246023002687, "loss": 0.0119, "step": 507450 }, { "epoch": 1.32, "learning_rate": 0.0001026885720136554, "loss": 0.0066, "step": 507460 }, { "epoch": 1.32, "learning_rate": 0.00010268468379728394, "loss": 0.0113, "step": 507470 }, { "epoch": 1.32, "learning_rate": 0.00010268079558091247, "loss": 0.0146, "step": 507480 }, { "epoch": 1.32, "learning_rate": 0.00010267690736454101, "loss": 0.0097, "step": 507490 }, { "epoch": 1.32, "learning_rate": 0.00010267301914816954, "loss": 0.0117, "step": 507500 }, { "epoch": 1.32, "learning_rate": 0.0001026691309317981, "loss": 0.0104, "step": 507510 }, { "epoch": 1.32, "learning_rate": 0.00010266524271542662, "loss": 0.0138, "step": 507520 }, { "epoch": 1.32, "learning_rate": 0.00010266135449905516, "loss": 0.009, "step": 507530 }, { "epoch": 1.32, "learning_rate": 0.00010265746628268369, "loss": 0.0087, "step": 507540 }, { "epoch": 1.32, "learning_rate": 0.00010265357806631223, "loss": 0.0107, "step": 507550 }, { "epoch": 1.32, "learning_rate": 0.00010264968984994076, "loss": 0.0136, "step": 507560 }, { "epoch": 1.32, "learning_rate": 0.0001026458016335693, "loss": 0.0107, "step": 507570 }, { "epoch": 1.32, "learning_rate": 0.00010264191341719783, "loss": 0.0115, "step": 507580 }, { "epoch": 1.32, "learning_rate": 0.00010263802520082637, "loss": 0.0085, "step": 507590 }, { "epoch": 1.32, "learning_rate": 0.0001026341369844549, "loss": 0.0094, "step": 507600 }, { "epoch": 1.32, "learning_rate": 0.00010263024876808344, "loss": 0.0081, "step": 507610 }, { "epoch": 1.32, "learning_rate": 0.00010262636055171197, "loss": 0.0103, "step": 507620 }, { "epoch": 1.32, "learning_rate": 0.0001026224723353405, "loss": 0.0097, "step": 507630 }, { "epoch": 1.32, "learning_rate": 0.00010261858411896904, "loss": 0.0103, "step": 507640 }, { "epoch": 1.32, "learning_rate": 0.00010261469590259757, "loss": 0.0082, "step": 507650 }, { "epoch": 1.32, "learning_rate": 0.00010261080768622611, "loss": 0.0103, "step": 507660 }, { "epoch": 1.32, "learning_rate": 0.00010260691946985464, "loss": 0.0112, "step": 507670 }, { "epoch": 1.32, "learning_rate": 0.00010260303125348319, "loss": 0.0108, "step": 507680 }, { "epoch": 1.32, "learning_rate": 0.00010259914303711171, "loss": 0.009, "step": 507690 }, { "epoch": 1.32, "learning_rate": 0.00010259525482074026, "loss": 0.0084, "step": 507700 }, { "epoch": 1.32, "learning_rate": 0.00010259136660436879, "loss": 0.0118, "step": 507710 }, { "epoch": 1.32, "learning_rate": 0.00010258747838799733, "loss": 0.0099, "step": 507720 }, { "epoch": 1.32, "learning_rate": 0.00010258359017162586, "loss": 0.0092, "step": 507730 }, { "epoch": 1.32, "learning_rate": 0.0001025797019552544, "loss": 0.0084, "step": 507740 }, { "epoch": 1.32, "learning_rate": 0.00010257581373888293, "loss": 0.0133, "step": 507750 }, { "epoch": 1.32, "learning_rate": 0.00010257192552251147, "loss": 0.0078, "step": 507760 }, { "epoch": 1.32, "learning_rate": 0.00010256803730614, "loss": 0.0095, "step": 507770 }, { "epoch": 1.32, "learning_rate": 0.00010256414908976854, "loss": 0.0146, "step": 507780 }, { "epoch": 1.32, "learning_rate": 0.00010256026087339707, "loss": 0.0119, "step": 507790 }, { "epoch": 1.32, "learning_rate": 0.00010255637265702561, "loss": 0.0095, "step": 507800 }, { "epoch": 1.32, "learning_rate": 0.00010255248444065414, "loss": 0.0086, "step": 507810 }, { "epoch": 1.32, "learning_rate": 0.00010254859622428268, "loss": 0.0091, "step": 507820 }, { "epoch": 1.32, "learning_rate": 0.00010254470800791121, "loss": 0.01, "step": 507830 }, { "epoch": 1.32, "learning_rate": 0.00010254081979153976, "loss": 0.0087, "step": 507840 }, { "epoch": 1.32, "learning_rate": 0.00010253693157516828, "loss": 0.0098, "step": 507850 }, { "epoch": 1.32, "learning_rate": 0.00010253304335879683, "loss": 0.0083, "step": 507860 }, { "epoch": 1.32, "learning_rate": 0.00010252915514242536, "loss": 0.0132, "step": 507870 }, { "epoch": 1.32, "learning_rate": 0.00010252526692605389, "loss": 0.0093, "step": 507880 }, { "epoch": 1.32, "learning_rate": 0.00010252137870968243, "loss": 0.0105, "step": 507890 }, { "epoch": 1.32, "learning_rate": 0.00010251749049331096, "loss": 0.0098, "step": 507900 }, { "epoch": 1.32, "learning_rate": 0.0001025136022769395, "loss": 0.0079, "step": 507910 }, { "epoch": 1.32, "learning_rate": 0.00010250971406056803, "loss": 0.0098, "step": 507920 }, { "epoch": 1.32, "learning_rate": 0.00010250582584419657, "loss": 0.0071, "step": 507930 }, { "epoch": 1.32, "learning_rate": 0.0001025019376278251, "loss": 0.0104, "step": 507940 }, { "epoch": 1.32, "learning_rate": 0.00010249804941145364, "loss": 0.0109, "step": 507950 }, { "epoch": 1.32, "learning_rate": 0.00010249416119508217, "loss": 0.0089, "step": 507960 }, { "epoch": 1.32, "learning_rate": 0.00010249027297871071, "loss": 0.0156, "step": 507970 }, { "epoch": 1.32, "learning_rate": 0.00010248638476233924, "loss": 0.0077, "step": 507980 }, { "epoch": 1.32, "learning_rate": 0.00010248249654596778, "loss": 0.0086, "step": 507990 }, { "epoch": 1.32, "learning_rate": 0.00010247860832959631, "loss": 0.01, "step": 508000 }, { "epoch": 1.32, "eval_cer": 0.8817026863231677, "eval_loss": 0.00661470415070653, "eval_runtime": 108.0315, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 508000 }, { "epoch": 1.32, "learning_rate": 0.00010247472011322485, "loss": 0.0111, "step": 508010 }, { "epoch": 1.32, "learning_rate": 0.00010247083189685338, "loss": 0.0104, "step": 508020 }, { "epoch": 1.32, "learning_rate": 0.00010246694368048193, "loss": 0.0098, "step": 508030 }, { "epoch": 1.32, "learning_rate": 0.00010246305546411046, "loss": 0.0123, "step": 508040 }, { "epoch": 1.32, "learning_rate": 0.000102459167247739, "loss": 0.0106, "step": 508050 }, { "epoch": 1.32, "learning_rate": 0.00010245527903136753, "loss": 0.0093, "step": 508060 }, { "epoch": 1.32, "learning_rate": 0.00010245139081499607, "loss": 0.02, "step": 508070 }, { "epoch": 1.32, "learning_rate": 0.0001024475025986246, "loss": 0.0108, "step": 508080 }, { "epoch": 1.32, "learning_rate": 0.00010244361438225314, "loss": 0.01, "step": 508090 }, { "epoch": 1.32, "learning_rate": 0.00010243972616588167, "loss": 0.0108, "step": 508100 }, { "epoch": 1.32, "learning_rate": 0.00010243583794951021, "loss": 0.009, "step": 508110 }, { "epoch": 1.32, "learning_rate": 0.00010243194973313874, "loss": 0.0104, "step": 508120 }, { "epoch": 1.32, "learning_rate": 0.00010242806151676727, "loss": 0.0081, "step": 508130 }, { "epoch": 1.32, "learning_rate": 0.00010242417330039581, "loss": 0.0085, "step": 508140 }, { "epoch": 1.32, "learning_rate": 0.00010242028508402434, "loss": 0.0101, "step": 508150 }, { "epoch": 1.32, "learning_rate": 0.00010241639686765288, "loss": 0.0112, "step": 508160 }, { "epoch": 1.32, "learning_rate": 0.00010241250865128141, "loss": 0.0088, "step": 508170 }, { "epoch": 1.32, "learning_rate": 0.00010240862043490995, "loss": 0.0105, "step": 508180 }, { "epoch": 1.32, "learning_rate": 0.00010240473221853848, "loss": 0.0097, "step": 508190 }, { "epoch": 1.32, "learning_rate": 0.00010240084400216702, "loss": 0.0105, "step": 508200 }, { "epoch": 1.32, "learning_rate": 0.00010239695578579555, "loss": 0.0072, "step": 508210 }, { "epoch": 1.32, "learning_rate": 0.0001023930675694241, "loss": 0.0109, "step": 508220 }, { "epoch": 1.32, "learning_rate": 0.00010238917935305263, "loss": 0.0092, "step": 508230 }, { "epoch": 1.32, "learning_rate": 0.00010238529113668117, "loss": 0.0119, "step": 508240 }, { "epoch": 1.32, "learning_rate": 0.0001023814029203097, "loss": 0.0078, "step": 508250 }, { "epoch": 1.32, "learning_rate": 0.00010237751470393824, "loss": 0.0118, "step": 508260 }, { "epoch": 1.32, "learning_rate": 0.00010237362648756677, "loss": 0.008, "step": 508270 }, { "epoch": 1.32, "learning_rate": 0.00010236973827119531, "loss": 0.0112, "step": 508280 }, { "epoch": 1.32, "learning_rate": 0.00010236585005482384, "loss": 0.0103, "step": 508290 }, { "epoch": 1.32, "learning_rate": 0.00010236196183845238, "loss": 0.0095, "step": 508300 }, { "epoch": 1.32, "learning_rate": 0.00010235807362208091, "loss": 0.0101, "step": 508310 }, { "epoch": 1.32, "learning_rate": 0.00010235418540570945, "loss": 0.0097, "step": 508320 }, { "epoch": 1.32, "learning_rate": 0.00010235029718933798, "loss": 0.0125, "step": 508330 }, { "epoch": 1.32, "learning_rate": 0.00010234640897296652, "loss": 0.011, "step": 508340 }, { "epoch": 1.32, "learning_rate": 0.00010234252075659505, "loss": 0.0084, "step": 508350 }, { "epoch": 1.32, "learning_rate": 0.00010233863254022359, "loss": 0.0075, "step": 508360 }, { "epoch": 1.32, "learning_rate": 0.00010233474432385212, "loss": 0.0101, "step": 508370 }, { "epoch": 1.32, "learning_rate": 0.00010233085610748065, "loss": 0.0067, "step": 508380 }, { "epoch": 1.32, "learning_rate": 0.0001023269678911092, "loss": 0.0075, "step": 508390 }, { "epoch": 1.32, "learning_rate": 0.00010232307967473773, "loss": 0.0101, "step": 508400 }, { "epoch": 1.32, "learning_rate": 0.00010231919145836627, "loss": 0.0092, "step": 508410 }, { "epoch": 1.32, "learning_rate": 0.0001023153032419948, "loss": 0.0115, "step": 508420 }, { "epoch": 1.32, "learning_rate": 0.00010231141502562334, "loss": 0.0095, "step": 508430 }, { "epoch": 1.32, "learning_rate": 0.00010230752680925187, "loss": 0.0098, "step": 508440 }, { "epoch": 1.32, "learning_rate": 0.00010230363859288041, "loss": 0.0128, "step": 508450 }, { "epoch": 1.32, "learning_rate": 0.00010229975037650894, "loss": 0.0108, "step": 508460 }, { "epoch": 1.32, "learning_rate": 0.00010229586216013748, "loss": 0.0128, "step": 508470 }, { "epoch": 1.32, "learning_rate": 0.00010229197394376601, "loss": 0.0101, "step": 508480 }, { "epoch": 1.32, "learning_rate": 0.00010228808572739455, "loss": 0.0079, "step": 508490 }, { "epoch": 1.32, "learning_rate": 0.00010228419751102308, "loss": 0.0083, "step": 508500 }, { "epoch": 1.32, "learning_rate": 0.00010228030929465162, "loss": 0.0075, "step": 508510 }, { "epoch": 1.32, "learning_rate": 0.00010227642107828015, "loss": 0.012, "step": 508520 }, { "epoch": 1.32, "learning_rate": 0.00010227253286190869, "loss": 0.0072, "step": 508530 }, { "epoch": 1.32, "learning_rate": 0.00010226864464553722, "loss": 0.0086, "step": 508540 }, { "epoch": 1.32, "learning_rate": 0.00010226475642916577, "loss": 0.0127, "step": 508550 }, { "epoch": 1.32, "learning_rate": 0.00010226086821279429, "loss": 0.0105, "step": 508560 }, { "epoch": 1.32, "learning_rate": 0.00010225697999642284, "loss": 0.0097, "step": 508570 }, { "epoch": 1.32, "learning_rate": 0.00010225309178005137, "loss": 0.0101, "step": 508580 }, { "epoch": 1.32, "learning_rate": 0.00010224920356367991, "loss": 0.014, "step": 508590 }, { "epoch": 1.32, "learning_rate": 0.00010224531534730844, "loss": 0.0113, "step": 508600 }, { "epoch": 1.32, "learning_rate": 0.00010224142713093698, "loss": 0.0103, "step": 508610 }, { "epoch": 1.32, "learning_rate": 0.00010223753891456551, "loss": 0.0091, "step": 508620 }, { "epoch": 1.32, "learning_rate": 0.00010223365069819404, "loss": 0.0134, "step": 508630 }, { "epoch": 1.32, "learning_rate": 0.00010222976248182258, "loss": 0.011, "step": 508640 }, { "epoch": 1.32, "learning_rate": 0.00010222587426545111, "loss": 0.0101, "step": 508650 }, { "epoch": 1.32, "learning_rate": 0.00010222198604907965, "loss": 0.0092, "step": 508660 }, { "epoch": 1.32, "learning_rate": 0.00010221809783270818, "loss": 0.0126, "step": 508670 }, { "epoch": 1.32, "learning_rate": 0.00010221420961633672, "loss": 0.0121, "step": 508680 }, { "epoch": 1.32, "learning_rate": 0.00010221032139996525, "loss": 0.0102, "step": 508690 }, { "epoch": 1.32, "learning_rate": 0.00010220643318359379, "loss": 0.0117, "step": 508700 }, { "epoch": 1.32, "learning_rate": 0.00010220254496722232, "loss": 0.0095, "step": 508710 }, { "epoch": 1.32, "learning_rate": 0.00010219865675085086, "loss": 0.0097, "step": 508720 }, { "epoch": 1.32, "learning_rate": 0.00010219476853447939, "loss": 0.0094, "step": 508730 }, { "epoch": 1.32, "learning_rate": 0.00010219088031810794, "loss": 0.0088, "step": 508740 }, { "epoch": 1.32, "learning_rate": 0.00010218699210173647, "loss": 0.0113, "step": 508750 }, { "epoch": 1.32, "learning_rate": 0.00010218310388536501, "loss": 0.0099, "step": 508760 }, { "epoch": 1.32, "learning_rate": 0.00010217921566899354, "loss": 0.0097, "step": 508770 }, { "epoch": 1.32, "learning_rate": 0.00010217532745262208, "loss": 0.0111, "step": 508780 }, { "epoch": 1.32, "learning_rate": 0.00010217143923625061, "loss": 0.0096, "step": 508790 }, { "epoch": 1.32, "learning_rate": 0.00010216755101987915, "loss": 0.0146, "step": 508800 }, { "epoch": 1.32, "learning_rate": 0.00010216366280350768, "loss": 0.0095, "step": 508810 }, { "epoch": 1.32, "learning_rate": 0.00010215977458713622, "loss": 0.0138, "step": 508820 }, { "epoch": 1.32, "learning_rate": 0.00010215588637076475, "loss": 0.0082, "step": 508830 }, { "epoch": 1.32, "learning_rate": 0.00010215199815439329, "loss": 0.0095, "step": 508840 }, { "epoch": 1.32, "learning_rate": 0.00010214810993802182, "loss": 0.0136, "step": 508850 }, { "epoch": 1.32, "learning_rate": 0.00010214422172165036, "loss": 0.0117, "step": 508860 }, { "epoch": 1.32, "learning_rate": 0.00010214033350527889, "loss": 0.0127, "step": 508870 }, { "epoch": 1.32, "learning_rate": 0.00010213644528890742, "loss": 0.0138, "step": 508880 }, { "epoch": 1.32, "learning_rate": 0.00010213255707253596, "loss": 0.0138, "step": 508890 }, { "epoch": 1.32, "learning_rate": 0.00010212866885616449, "loss": 0.0083, "step": 508900 }, { "epoch": 1.32, "learning_rate": 0.00010212478063979304, "loss": 0.0101, "step": 508910 }, { "epoch": 1.32, "learning_rate": 0.00010212089242342156, "loss": 0.0108, "step": 508920 }, { "epoch": 1.32, "learning_rate": 0.00010211700420705011, "loss": 0.0079, "step": 508930 }, { "epoch": 1.32, "learning_rate": 0.00010211311599067864, "loss": 0.0097, "step": 508940 }, { "epoch": 1.32, "learning_rate": 0.00010210922777430718, "loss": 0.0077, "step": 508950 }, { "epoch": 1.32, "learning_rate": 0.00010210533955793571, "loss": 0.0094, "step": 508960 }, { "epoch": 1.32, "learning_rate": 0.00010210145134156425, "loss": 0.011, "step": 508970 }, { "epoch": 1.32, "learning_rate": 0.00010209756312519278, "loss": 0.0117, "step": 508980 }, { "epoch": 1.32, "learning_rate": 0.00010209367490882132, "loss": 0.0131, "step": 508990 }, { "epoch": 1.32, "learning_rate": 0.00010208978669244985, "loss": 0.011, "step": 509000 }, { "epoch": 1.32, "eval_cer": 0.881704085960102, "eval_loss": 0.0064851148054003716, "eval_runtime": 108.0593, "eval_samples_per_second": 18.508, "eval_steps_per_second": 4.627, "step": 509000 }, { "epoch": 1.32, "learning_rate": 0.00010208589847607839, "loss": 0.0097, "step": 509010 }, { "epoch": 1.32, "learning_rate": 0.00010208201025970692, "loss": 0.0071, "step": 509020 }, { "epoch": 1.32, "learning_rate": 0.00010207812204333546, "loss": 0.0133, "step": 509030 }, { "epoch": 1.32, "learning_rate": 0.00010207423382696399, "loss": 0.008, "step": 509040 }, { "epoch": 1.32, "learning_rate": 0.00010207034561059253, "loss": 0.0089, "step": 509050 }, { "epoch": 1.32, "learning_rate": 0.00010206645739422106, "loss": 0.0088, "step": 509060 }, { "epoch": 1.32, "learning_rate": 0.00010206256917784961, "loss": 0.0088, "step": 509070 }, { "epoch": 1.32, "learning_rate": 0.00010205868096147813, "loss": 0.0147, "step": 509080 }, { "epoch": 1.32, "learning_rate": 0.00010205479274510668, "loss": 0.0114, "step": 509090 }, { "epoch": 1.32, "learning_rate": 0.00010205090452873521, "loss": 0.0107, "step": 509100 }, { "epoch": 1.32, "learning_rate": 0.00010204701631236375, "loss": 0.0133, "step": 509110 }, { "epoch": 1.32, "learning_rate": 0.00010204312809599228, "loss": 0.0117, "step": 509120 }, { "epoch": 1.32, "learning_rate": 0.00010203923987962081, "loss": 0.0091, "step": 509130 }, { "epoch": 1.32, "learning_rate": 0.00010203535166324935, "loss": 0.0075, "step": 509140 }, { "epoch": 1.32, "learning_rate": 0.00010203146344687788, "loss": 0.0121, "step": 509150 }, { "epoch": 1.32, "learning_rate": 0.00010202757523050642, "loss": 0.0076, "step": 509160 }, { "epoch": 1.32, "learning_rate": 0.00010202368701413495, "loss": 0.0083, "step": 509170 }, { "epoch": 1.32, "learning_rate": 0.00010201979879776349, "loss": 0.0116, "step": 509180 }, { "epoch": 1.32, "learning_rate": 0.00010201591058139202, "loss": 0.0097, "step": 509190 }, { "epoch": 1.32, "learning_rate": 0.00010201202236502056, "loss": 0.0145, "step": 509200 }, { "epoch": 1.32, "learning_rate": 0.00010200813414864909, "loss": 0.0108, "step": 509210 }, { "epoch": 1.32, "learning_rate": 0.00010200424593227763, "loss": 0.0109, "step": 509220 }, { "epoch": 1.32, "learning_rate": 0.00010200035771590616, "loss": 0.0102, "step": 509230 }, { "epoch": 1.32, "learning_rate": 0.0001019964694995347, "loss": 0.0156, "step": 509240 }, { "epoch": 1.32, "learning_rate": 0.00010199258128316323, "loss": 0.0098, "step": 509250 }, { "epoch": 1.32, "learning_rate": 0.00010198869306679178, "loss": 0.0095, "step": 509260 }, { "epoch": 1.32, "learning_rate": 0.00010198480485042031, "loss": 0.0118, "step": 509270 }, { "epoch": 1.32, "learning_rate": 0.00010198091663404885, "loss": 0.0102, "step": 509280 }, { "epoch": 1.32, "learning_rate": 0.00010197702841767738, "loss": 0.0112, "step": 509290 }, { "epoch": 1.32, "learning_rate": 0.00010197314020130592, "loss": 0.0097, "step": 509300 }, { "epoch": 1.32, "learning_rate": 0.00010196925198493445, "loss": 0.0066, "step": 509310 }, { "epoch": 1.32, "learning_rate": 0.00010196536376856299, "loss": 0.0083, "step": 509320 }, { "epoch": 1.32, "learning_rate": 0.00010196147555219152, "loss": 0.0084, "step": 509330 }, { "epoch": 1.32, "learning_rate": 0.00010195758733582006, "loss": 0.0095, "step": 509340 }, { "epoch": 1.32, "learning_rate": 0.00010195369911944859, "loss": 0.0111, "step": 509350 }, { "epoch": 1.32, "learning_rate": 0.00010194981090307713, "loss": 0.0085, "step": 509360 }, { "epoch": 1.32, "learning_rate": 0.00010194592268670566, "loss": 0.0157, "step": 509370 }, { "epoch": 1.32, "learning_rate": 0.00010194203447033419, "loss": 0.01, "step": 509380 }, { "epoch": 1.32, "learning_rate": 0.00010193814625396273, "loss": 0.0121, "step": 509390 }, { "epoch": 1.32, "learning_rate": 0.00010193425803759126, "loss": 0.0112, "step": 509400 }, { "epoch": 1.32, "learning_rate": 0.0001019303698212198, "loss": 0.0099, "step": 509410 }, { "epoch": 1.32, "learning_rate": 0.00010192648160484833, "loss": 0.0115, "step": 509420 }, { "epoch": 1.32, "learning_rate": 0.00010192259338847688, "loss": 0.009, "step": 509430 }, { "epoch": 1.32, "learning_rate": 0.0001019187051721054, "loss": 0.0107, "step": 509440 }, { "epoch": 1.32, "learning_rate": 0.00010191481695573395, "loss": 0.0128, "step": 509450 }, { "epoch": 1.32, "learning_rate": 0.00010191092873936248, "loss": 0.0093, "step": 509460 }, { "epoch": 1.32, "learning_rate": 0.00010190704052299102, "loss": 0.0123, "step": 509470 }, { "epoch": 1.32, "learning_rate": 0.00010190315230661955, "loss": 0.0077, "step": 509480 }, { "epoch": 1.32, "learning_rate": 0.00010189926409024809, "loss": 0.0124, "step": 509490 }, { "epoch": 1.32, "learning_rate": 0.00010189537587387662, "loss": 0.0079, "step": 509500 }, { "epoch": 1.32, "learning_rate": 0.00010189148765750516, "loss": 0.0127, "step": 509510 }, { "epoch": 1.32, "learning_rate": 0.00010188759944113369, "loss": 0.0099, "step": 509520 }, { "epoch": 1.32, "learning_rate": 0.00010188371122476223, "loss": 0.0136, "step": 509530 }, { "epoch": 1.32, "learning_rate": 0.00010187982300839076, "loss": 0.0086, "step": 509540 }, { "epoch": 1.32, "learning_rate": 0.0001018759347920193, "loss": 0.0134, "step": 509550 }, { "epoch": 1.32, "learning_rate": 0.00010187204657564783, "loss": 0.0091, "step": 509560 }, { "epoch": 1.32, "learning_rate": 0.00010186815835927637, "loss": 0.0099, "step": 509570 }, { "epoch": 1.32, "learning_rate": 0.0001018642701429049, "loss": 0.0088, "step": 509580 }, { "epoch": 1.32, "learning_rate": 0.00010186038192653344, "loss": 0.011, "step": 509590 }, { "epoch": 1.32, "learning_rate": 0.00010185649371016197, "loss": 0.0153, "step": 509600 }, { "epoch": 1.32, "learning_rate": 0.00010185260549379052, "loss": 0.0126, "step": 509610 }, { "epoch": 1.32, "learning_rate": 0.00010184871727741905, "loss": 0.0134, "step": 509620 }, { "epoch": 1.32, "learning_rate": 0.00010184482906104758, "loss": 0.009, "step": 509630 }, { "epoch": 1.32, "learning_rate": 0.00010184094084467612, "loss": 0.01, "step": 509640 }, { "epoch": 1.32, "learning_rate": 0.00010183705262830465, "loss": 0.0109, "step": 509650 }, { "epoch": 1.32, "learning_rate": 0.00010183316441193319, "loss": 0.0094, "step": 509660 }, { "epoch": 1.32, "learning_rate": 0.00010182927619556172, "loss": 0.008, "step": 509670 }, { "epoch": 1.32, "learning_rate": 0.00010182538797919026, "loss": 0.0113, "step": 509680 }, { "epoch": 1.32, "learning_rate": 0.00010182149976281879, "loss": 0.0091, "step": 509690 }, { "epoch": 1.32, "learning_rate": 0.00010181761154644733, "loss": 0.0119, "step": 509700 }, { "epoch": 1.32, "learning_rate": 0.00010181372333007586, "loss": 0.0114, "step": 509710 }, { "epoch": 1.32, "learning_rate": 0.0001018098351137044, "loss": 0.0099, "step": 509720 }, { "epoch": 1.32, "learning_rate": 0.00010180594689733293, "loss": 0.0072, "step": 509730 }, { "epoch": 1.32, "learning_rate": 0.00010180205868096147, "loss": 0.0105, "step": 509740 }, { "epoch": 1.32, "learning_rate": 0.00010179817046459, "loss": 0.0098, "step": 509750 }, { "epoch": 1.32, "learning_rate": 0.00010179428224821854, "loss": 0.0098, "step": 509760 }, { "epoch": 1.32, "learning_rate": 0.00010179039403184707, "loss": 0.0115, "step": 509770 }, { "epoch": 1.32, "learning_rate": 0.00010178650581547562, "loss": 0.0106, "step": 509780 }, { "epoch": 1.32, "learning_rate": 0.00010178261759910414, "loss": 0.0125, "step": 509790 }, { "epoch": 1.32, "learning_rate": 0.00010177872938273269, "loss": 0.0077, "step": 509800 }, { "epoch": 1.32, "learning_rate": 0.00010177484116636122, "loss": 0.0112, "step": 509810 }, { "epoch": 1.32, "learning_rate": 0.00010177095294998976, "loss": 0.0111, "step": 509820 }, { "epoch": 1.32, "learning_rate": 0.00010176706473361829, "loss": 0.0108, "step": 509830 }, { "epoch": 1.32, "learning_rate": 0.00010176317651724683, "loss": 0.01, "step": 509840 }, { "epoch": 1.32, "learning_rate": 0.00010175928830087536, "loss": 0.0093, "step": 509850 }, { "epoch": 1.32, "learning_rate": 0.00010175540008450389, "loss": 0.0108, "step": 509860 }, { "epoch": 1.32, "learning_rate": 0.00010175151186813243, "loss": 0.008, "step": 509870 }, { "epoch": 1.32, "learning_rate": 0.00010174762365176096, "loss": 0.0091, "step": 509880 }, { "epoch": 1.32, "learning_rate": 0.0001017437354353895, "loss": 0.0088, "step": 509890 }, { "epoch": 1.32, "learning_rate": 0.00010173984721901803, "loss": 0.0099, "step": 509900 }, { "epoch": 1.32, "learning_rate": 0.00010173595900264657, "loss": 0.0082, "step": 509910 }, { "epoch": 1.32, "learning_rate": 0.0001017320707862751, "loss": 0.0112, "step": 509920 }, { "epoch": 1.32, "learning_rate": 0.00010172818256990364, "loss": 0.0098, "step": 509930 }, { "epoch": 1.32, "learning_rate": 0.00010172429435353217, "loss": 0.0122, "step": 509940 }, { "epoch": 1.32, "learning_rate": 0.00010172040613716071, "loss": 0.0102, "step": 509950 }, { "epoch": 1.32, "learning_rate": 0.00010171651792078924, "loss": 0.0131, "step": 509960 }, { "epoch": 1.32, "learning_rate": 0.00010171262970441779, "loss": 0.0095, "step": 509970 }, { "epoch": 1.32, "learning_rate": 0.00010170874148804632, "loss": 0.012, "step": 509980 }, { "epoch": 1.32, "learning_rate": 0.00010170485327167486, "loss": 0.0123, "step": 509990 }, { "epoch": 1.32, "learning_rate": 0.00010170096505530339, "loss": 0.0113, "step": 510000 }, { "epoch": 1.32, "eval_cer": 0.8816984874123652, "eval_loss": 0.0066459812223911285, "eval_runtime": 108.1498, "eval_samples_per_second": 18.493, "eval_steps_per_second": 4.623, "step": 510000 }, { "epoch": 1.32, "learning_rate": 0.00010169707683893193, "loss": 0.0081, "step": 510010 }, { "epoch": 1.32, "learning_rate": 0.00010169318862256046, "loss": 0.0139, "step": 510020 }, { "epoch": 1.32, "learning_rate": 0.000101689300406189, "loss": 0.0092, "step": 510030 }, { "epoch": 1.32, "learning_rate": 0.00010168541218981753, "loss": 0.0157, "step": 510040 }, { "epoch": 1.32, "learning_rate": 0.00010168152397344607, "loss": 0.0113, "step": 510050 }, { "epoch": 1.32, "learning_rate": 0.0001016776357570746, "loss": 0.0098, "step": 510060 }, { "epoch": 1.32, "learning_rate": 0.00010167374754070314, "loss": 0.0112, "step": 510070 }, { "epoch": 1.32, "learning_rate": 0.00010166985932433167, "loss": 0.0099, "step": 510080 }, { "epoch": 1.32, "learning_rate": 0.00010166597110796021, "loss": 0.0089, "step": 510090 }, { "epoch": 1.32, "learning_rate": 0.00010166208289158874, "loss": 0.0095, "step": 510100 }, { "epoch": 1.32, "learning_rate": 0.00010165819467521727, "loss": 0.012, "step": 510110 }, { "epoch": 1.32, "learning_rate": 0.00010165430645884581, "loss": 0.0119, "step": 510120 }, { "epoch": 1.32, "learning_rate": 0.00010165041824247434, "loss": 0.0095, "step": 510130 }, { "epoch": 1.32, "learning_rate": 0.00010164653002610289, "loss": 0.01, "step": 510140 }, { "epoch": 1.32, "learning_rate": 0.0001016426418097314, "loss": 0.0099, "step": 510150 }, { "epoch": 1.32, "learning_rate": 0.00010163875359335996, "loss": 0.0103, "step": 510160 }, { "epoch": 1.32, "learning_rate": 0.00010163486537698849, "loss": 0.0109, "step": 510170 }, { "epoch": 1.32, "learning_rate": 0.00010163097716061703, "loss": 0.01, "step": 510180 }, { "epoch": 1.32, "learning_rate": 0.00010162708894424556, "loss": 0.0099, "step": 510190 }, { "epoch": 1.32, "learning_rate": 0.0001016232007278741, "loss": 0.0088, "step": 510200 }, { "epoch": 1.32, "learning_rate": 0.00010161931251150263, "loss": 0.0101, "step": 510210 }, { "epoch": 1.32, "learning_rate": 0.00010161542429513117, "loss": 0.0103, "step": 510220 }, { "epoch": 1.32, "learning_rate": 0.0001016115360787597, "loss": 0.0086, "step": 510230 }, { "epoch": 1.32, "learning_rate": 0.00010160764786238824, "loss": 0.0095, "step": 510240 }, { "epoch": 1.32, "learning_rate": 0.00010160375964601677, "loss": 0.0087, "step": 510250 }, { "epoch": 1.32, "learning_rate": 0.00010159987142964531, "loss": 0.0098, "step": 510260 }, { "epoch": 1.32, "learning_rate": 0.00010159598321327384, "loss": 0.0087, "step": 510270 }, { "epoch": 1.32, "learning_rate": 0.00010159209499690238, "loss": 0.0093, "step": 510280 }, { "epoch": 1.32, "learning_rate": 0.00010158820678053091, "loss": 0.0108, "step": 510290 }, { "epoch": 1.32, "learning_rate": 0.00010158431856415946, "loss": 0.0124, "step": 510300 }, { "epoch": 1.32, "learning_rate": 0.00010158043034778798, "loss": 0.0109, "step": 510310 }, { "epoch": 1.32, "learning_rate": 0.00010157654213141653, "loss": 0.0107, "step": 510320 }, { "epoch": 1.32, "learning_rate": 0.00010157265391504506, "loss": 0.0085, "step": 510330 }, { "epoch": 1.32, "learning_rate": 0.0001015687656986736, "loss": 0.0138, "step": 510340 }, { "epoch": 1.32, "learning_rate": 0.00010156487748230213, "loss": 0.0098, "step": 510350 }, { "epoch": 1.32, "learning_rate": 0.00010156098926593066, "loss": 0.0125, "step": 510360 }, { "epoch": 1.32, "learning_rate": 0.0001015571010495592, "loss": 0.0093, "step": 510370 }, { "epoch": 1.32, "learning_rate": 0.00010155321283318773, "loss": 0.0112, "step": 510380 }, { "epoch": 1.32, "learning_rate": 0.00010154932461681627, "loss": 0.0112, "step": 510390 }, { "epoch": 1.32, "learning_rate": 0.0001015454364004448, "loss": 0.0112, "step": 510400 }, { "epoch": 1.32, "learning_rate": 0.00010154154818407334, "loss": 0.0093, "step": 510410 }, { "epoch": 1.32, "learning_rate": 0.00010153765996770187, "loss": 0.0088, "step": 510420 }, { "epoch": 1.32, "learning_rate": 0.00010153377175133041, "loss": 0.0078, "step": 510430 }, { "epoch": 1.32, "learning_rate": 0.00010152988353495894, "loss": 0.0142, "step": 510440 }, { "epoch": 1.32, "learning_rate": 0.00010152599531858748, "loss": 0.0083, "step": 510450 }, { "epoch": 1.32, "learning_rate": 0.000101522107102216, "loss": 0.0068, "step": 510460 }, { "epoch": 1.32, "learning_rate": 0.00010151821888584455, "loss": 0.009, "step": 510470 }, { "epoch": 1.32, "learning_rate": 0.00010151433066947308, "loss": 0.01, "step": 510480 }, { "epoch": 1.32, "learning_rate": 0.00010151044245310163, "loss": 0.012, "step": 510490 }, { "epoch": 1.32, "learning_rate": 0.00010150655423673016, "loss": 0.0136, "step": 510500 }, { "epoch": 1.32, "learning_rate": 0.0001015026660203587, "loss": 0.0116, "step": 510510 }, { "epoch": 1.32, "learning_rate": 0.00010149877780398723, "loss": 0.0106, "step": 510520 }, { "epoch": 1.32, "learning_rate": 0.00010149488958761577, "loss": 0.0087, "step": 510530 }, { "epoch": 1.32, "learning_rate": 0.0001014910013712443, "loss": 0.0095, "step": 510540 }, { "epoch": 1.32, "learning_rate": 0.00010148711315487284, "loss": 0.0104, "step": 510550 }, { "epoch": 1.32, "learning_rate": 0.00010148322493850137, "loss": 0.0112, "step": 510560 }, { "epoch": 1.32, "learning_rate": 0.00010147933672212991, "loss": 0.0083, "step": 510570 }, { "epoch": 1.32, "learning_rate": 0.00010147544850575844, "loss": 0.0139, "step": 510580 }, { "epoch": 1.32, "learning_rate": 0.00010147156028938698, "loss": 0.0104, "step": 510590 }, { "epoch": 1.32, "learning_rate": 0.00010146767207301551, "loss": 0.0083, "step": 510600 }, { "epoch": 1.32, "learning_rate": 0.00010146378385664404, "loss": 0.0088, "step": 510610 }, { "epoch": 1.32, "learning_rate": 0.00010145989564027258, "loss": 0.0105, "step": 510620 }, { "epoch": 1.32, "learning_rate": 0.0001014560074239011, "loss": 0.0097, "step": 510630 }, { "epoch": 1.32, "learning_rate": 0.00010145211920752965, "loss": 0.0092, "step": 510640 }, { "epoch": 1.32, "learning_rate": 0.00010144823099115818, "loss": 0.0102, "step": 510650 }, { "epoch": 1.32, "learning_rate": 0.00010144434277478673, "loss": 0.0071, "step": 510660 }, { "epoch": 1.32, "learning_rate": 0.00010144045455841525, "loss": 0.0065, "step": 510670 }, { "epoch": 1.32, "learning_rate": 0.0001014365663420438, "loss": 0.0105, "step": 510680 }, { "epoch": 1.32, "learning_rate": 0.00010143267812567233, "loss": 0.0108, "step": 510690 }, { "epoch": 1.32, "learning_rate": 0.00010142878990930087, "loss": 0.0118, "step": 510700 }, { "epoch": 1.32, "learning_rate": 0.0001014249016929294, "loss": 0.0136, "step": 510710 }, { "epoch": 1.32, "learning_rate": 0.00010142101347655794, "loss": 0.0086, "step": 510720 }, { "epoch": 1.32, "learning_rate": 0.00010141712526018647, "loss": 0.0111, "step": 510730 }, { "epoch": 1.32, "learning_rate": 0.00010141323704381501, "loss": 0.0093, "step": 510740 }, { "epoch": 1.32, "learning_rate": 0.00010140934882744354, "loss": 0.0079, "step": 510750 }, { "epoch": 1.32, "learning_rate": 0.00010140546061107208, "loss": 0.0087, "step": 510760 }, { "epoch": 1.32, "learning_rate": 0.00010140157239470061, "loss": 0.0088, "step": 510770 }, { "epoch": 1.32, "learning_rate": 0.00010139768417832915, "loss": 0.0089, "step": 510780 }, { "epoch": 1.32, "learning_rate": 0.00010139379596195768, "loss": 0.008, "step": 510790 }, { "epoch": 1.32, "learning_rate": 0.00010138990774558622, "loss": 0.0116, "step": 510800 }, { "epoch": 1.32, "learning_rate": 0.00010138601952921475, "loss": 0.0084, "step": 510810 }, { "epoch": 1.32, "learning_rate": 0.00010138213131284329, "loss": 0.0101, "step": 510820 }, { "epoch": 1.32, "learning_rate": 0.00010137824309647182, "loss": 0.0097, "step": 510830 }, { "epoch": 1.32, "learning_rate": 0.00010137435488010037, "loss": 0.0072, "step": 510840 }, { "epoch": 1.32, "learning_rate": 0.0001013704666637289, "loss": 0.0081, "step": 510850 }, { "epoch": 1.32, "learning_rate": 0.00010136657844735743, "loss": 0.0102, "step": 510860 }, { "epoch": 1.32, "learning_rate": 0.00010136269023098597, "loss": 0.0088, "step": 510870 }, { "epoch": 1.32, "learning_rate": 0.0001013588020146145, "loss": 0.0085, "step": 510880 }, { "epoch": 1.32, "learning_rate": 0.00010135491379824304, "loss": 0.0118, "step": 510890 }, { "epoch": 1.32, "learning_rate": 0.00010135102558187157, "loss": 0.0093, "step": 510900 }, { "epoch": 1.32, "learning_rate": 0.00010134713736550011, "loss": 0.0102, "step": 510910 }, { "epoch": 1.32, "learning_rate": 0.00010134324914912864, "loss": 0.0122, "step": 510920 }, { "epoch": 1.32, "learning_rate": 0.00010133936093275718, "loss": 0.0073, "step": 510930 }, { "epoch": 1.32, "learning_rate": 0.00010133547271638571, "loss": 0.0121, "step": 510940 }, { "epoch": 1.32, "learning_rate": 0.00010133158450001425, "loss": 0.0112, "step": 510950 }, { "epoch": 1.32, "learning_rate": 0.00010132769628364278, "loss": 0.0092, "step": 510960 }, { "epoch": 1.32, "learning_rate": 0.00010132380806727132, "loss": 0.0131, "step": 510970 }, { "epoch": 1.32, "learning_rate": 0.00010131991985089985, "loss": 0.0083, "step": 510980 }, { "epoch": 1.32, "learning_rate": 0.00010131603163452839, "loss": 0.0109, "step": 510990 }, { "epoch": 1.32, "learning_rate": 0.00010131214341815692, "loss": 0.0086, "step": 511000 }, { "epoch": 1.32, "eval_cer": 0.8816564983043399, "eval_loss": 0.006579502020031214, "eval_runtime": 107.825, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 511000 }, { "epoch": 1.32, "learning_rate": 0.00010130825520178547, "loss": 0.0117, "step": 511010 }, { "epoch": 1.32, "learning_rate": 0.000101304366985414, "loss": 0.0068, "step": 511020 }, { "epoch": 1.32, "learning_rate": 0.00010130047876904254, "loss": 0.0092, "step": 511030 }, { "epoch": 1.32, "learning_rate": 0.00010129659055267107, "loss": 0.0089, "step": 511040 }, { "epoch": 1.32, "learning_rate": 0.00010129270233629961, "loss": 0.0089, "step": 511050 }, { "epoch": 1.32, "learning_rate": 0.00010128881411992814, "loss": 0.0108, "step": 511060 }, { "epoch": 1.32, "learning_rate": 0.00010128492590355668, "loss": 0.0105, "step": 511070 }, { "epoch": 1.32, "learning_rate": 0.00010128103768718521, "loss": 0.0119, "step": 511080 }, { "epoch": 1.32, "learning_rate": 0.00010127714947081375, "loss": 0.009, "step": 511090 }, { "epoch": 1.32, "learning_rate": 0.00010127326125444228, "loss": 0.0121, "step": 511100 }, { "epoch": 1.32, "learning_rate": 0.0001012693730380708, "loss": 0.016, "step": 511110 }, { "epoch": 1.32, "learning_rate": 0.00010126548482169935, "loss": 0.0099, "step": 511120 }, { "epoch": 1.32, "learning_rate": 0.00010126159660532788, "loss": 0.0123, "step": 511130 }, { "epoch": 1.32, "learning_rate": 0.00010125770838895642, "loss": 0.01, "step": 511140 }, { "epoch": 1.32, "learning_rate": 0.00010125382017258495, "loss": 0.0107, "step": 511150 }, { "epoch": 1.32, "learning_rate": 0.00010124993195621349, "loss": 0.0103, "step": 511160 }, { "epoch": 1.33, "learning_rate": 0.00010124604373984202, "loss": 0.0095, "step": 511170 }, { "epoch": 1.33, "learning_rate": 0.00010124215552347056, "loss": 0.0119, "step": 511180 }, { "epoch": 1.33, "learning_rate": 0.00010123826730709909, "loss": 0.0077, "step": 511190 }, { "epoch": 1.33, "learning_rate": 0.00010123437909072764, "loss": 0.0115, "step": 511200 }, { "epoch": 1.33, "learning_rate": 0.00010123049087435617, "loss": 0.0112, "step": 511210 }, { "epoch": 1.33, "learning_rate": 0.00010122660265798471, "loss": 0.0094, "step": 511220 }, { "epoch": 1.33, "learning_rate": 0.00010122271444161324, "loss": 0.013, "step": 511230 }, { "epoch": 1.33, "learning_rate": 0.00010121882622524178, "loss": 0.0091, "step": 511240 }, { "epoch": 1.33, "learning_rate": 0.00010121493800887031, "loss": 0.0112, "step": 511250 }, { "epoch": 1.33, "learning_rate": 0.00010121104979249885, "loss": 0.0095, "step": 511260 }, { "epoch": 1.33, "learning_rate": 0.00010120716157612738, "loss": 0.0111, "step": 511270 }, { "epoch": 1.33, "learning_rate": 0.00010120327335975592, "loss": 0.0108, "step": 511280 }, { "epoch": 1.33, "learning_rate": 0.00010119938514338445, "loss": 0.0101, "step": 511290 }, { "epoch": 1.33, "learning_rate": 0.00010119549692701299, "loss": 0.0155, "step": 511300 }, { "epoch": 1.33, "learning_rate": 0.00010119160871064152, "loss": 0.0113, "step": 511310 }, { "epoch": 1.33, "learning_rate": 0.00010118772049427006, "loss": 0.0103, "step": 511320 }, { "epoch": 1.33, "learning_rate": 0.00010118383227789859, "loss": 0.0067, "step": 511330 }, { "epoch": 1.33, "learning_rate": 0.00010117994406152713, "loss": 0.0094, "step": 511340 }, { "epoch": 1.33, "learning_rate": 0.00010117605584515566, "loss": 0.0103, "step": 511350 }, { "epoch": 1.33, "learning_rate": 0.00010117216762878418, "loss": 0.0087, "step": 511360 }, { "epoch": 1.33, "learning_rate": 0.00010116827941241274, "loss": 0.0106, "step": 511370 }, { "epoch": 1.33, "learning_rate": 0.00010116439119604125, "loss": 0.007, "step": 511380 }, { "epoch": 1.33, "learning_rate": 0.00010116050297966981, "loss": 0.0144, "step": 511390 }, { "epoch": 1.33, "learning_rate": 0.00010115661476329834, "loss": 0.013, "step": 511400 }, { "epoch": 1.33, "learning_rate": 0.00010115272654692688, "loss": 0.0129, "step": 511410 }, { "epoch": 1.33, "learning_rate": 0.00010114883833055541, "loss": 0.0117, "step": 511420 }, { "epoch": 1.33, "learning_rate": 0.00010114495011418395, "loss": 0.0104, "step": 511430 }, { "epoch": 1.33, "learning_rate": 0.00010114106189781248, "loss": 0.012, "step": 511440 }, { "epoch": 1.33, "learning_rate": 0.00010113717368144102, "loss": 0.0101, "step": 511450 }, { "epoch": 1.33, "learning_rate": 0.00010113328546506955, "loss": 0.0114, "step": 511460 }, { "epoch": 1.33, "learning_rate": 0.00010112939724869809, "loss": 0.0073, "step": 511470 }, { "epoch": 1.33, "learning_rate": 0.00010112550903232662, "loss": 0.0113, "step": 511480 }, { "epoch": 1.33, "learning_rate": 0.00010112162081595516, "loss": 0.0096, "step": 511490 }, { "epoch": 1.33, "learning_rate": 0.00010111773259958369, "loss": 0.0096, "step": 511500 }, { "epoch": 1.33, "learning_rate": 0.00010111384438321223, "loss": 0.0077, "step": 511510 }, { "epoch": 1.33, "learning_rate": 0.00010110995616684076, "loss": 0.0096, "step": 511520 }, { "epoch": 1.33, "learning_rate": 0.00010110606795046931, "loss": 0.013, "step": 511530 }, { "epoch": 1.33, "learning_rate": 0.00010110217973409783, "loss": 0.0109, "step": 511540 }, { "epoch": 1.33, "learning_rate": 0.00010109829151772638, "loss": 0.009, "step": 511550 }, { "epoch": 1.33, "learning_rate": 0.00010109440330135491, "loss": 0.0092, "step": 511560 }, { "epoch": 1.33, "learning_rate": 0.00010109051508498345, "loss": 0.0099, "step": 511570 }, { "epoch": 1.33, "learning_rate": 0.00010108662686861198, "loss": 0.0105, "step": 511580 }, { "epoch": 1.33, "learning_rate": 0.00010108273865224052, "loss": 0.0113, "step": 511590 }, { "epoch": 1.33, "learning_rate": 0.00010107885043586905, "loss": 0.0095, "step": 511600 }, { "epoch": 1.33, "learning_rate": 0.00010107496221949758, "loss": 0.0075, "step": 511610 }, { "epoch": 1.33, "learning_rate": 0.00010107107400312612, "loss": 0.0096, "step": 511620 }, { "epoch": 1.33, "learning_rate": 0.00010106718578675465, "loss": 0.0089, "step": 511630 }, { "epoch": 1.33, "learning_rate": 0.00010106329757038319, "loss": 0.0073, "step": 511640 }, { "epoch": 1.33, "learning_rate": 0.00010105940935401172, "loss": 0.0096, "step": 511650 }, { "epoch": 1.33, "learning_rate": 0.00010105552113764026, "loss": 0.0097, "step": 511660 }, { "epoch": 1.33, "learning_rate": 0.00010105163292126879, "loss": 0.0102, "step": 511670 }, { "epoch": 1.33, "learning_rate": 0.00010104774470489733, "loss": 0.0115, "step": 511680 }, { "epoch": 1.33, "learning_rate": 0.00010104385648852586, "loss": 0.0097, "step": 511690 }, { "epoch": 1.33, "learning_rate": 0.0001010399682721544, "loss": 0.0078, "step": 511700 }, { "epoch": 1.33, "learning_rate": 0.00010103608005578293, "loss": 0.0063, "step": 511710 }, { "epoch": 1.33, "learning_rate": 0.00010103219183941148, "loss": 0.009, "step": 511720 }, { "epoch": 1.33, "learning_rate": 0.00010102830362304001, "loss": 0.0121, "step": 511730 }, { "epoch": 1.33, "learning_rate": 0.00010102441540666855, "loss": 0.0118, "step": 511740 }, { "epoch": 1.33, "learning_rate": 0.00010102052719029708, "loss": 0.0126, "step": 511750 }, { "epoch": 1.33, "learning_rate": 0.00010101663897392562, "loss": 0.0085, "step": 511760 }, { "epoch": 1.33, "learning_rate": 0.00010101275075755415, "loss": 0.0078, "step": 511770 }, { "epoch": 1.33, "learning_rate": 0.00010100886254118269, "loss": 0.0079, "step": 511780 }, { "epoch": 1.33, "learning_rate": 0.00010100497432481122, "loss": 0.0097, "step": 511790 }, { "epoch": 1.33, "learning_rate": 0.00010100108610843976, "loss": 0.0071, "step": 511800 }, { "epoch": 1.33, "learning_rate": 0.00010099719789206829, "loss": 0.0099, "step": 511810 }, { "epoch": 1.33, "learning_rate": 0.00010099330967569683, "loss": 0.0085, "step": 511820 }, { "epoch": 1.33, "learning_rate": 0.00010098942145932536, "loss": 0.0104, "step": 511830 }, { "epoch": 1.33, "learning_rate": 0.0001009855332429539, "loss": 0.0091, "step": 511840 }, { "epoch": 1.33, "learning_rate": 0.00010098164502658243, "loss": 0.0085, "step": 511850 }, { "epoch": 1.33, "learning_rate": 0.00010097775681021095, "loss": 0.0083, "step": 511860 }, { "epoch": 1.33, "learning_rate": 0.0001009738685938395, "loss": 0.012, "step": 511870 }, { "epoch": 1.33, "learning_rate": 0.00010096998037746802, "loss": 0.0105, "step": 511880 }, { "epoch": 1.33, "learning_rate": 0.00010096609216109658, "loss": 0.0101, "step": 511890 }, { "epoch": 1.33, "learning_rate": 0.0001009622039447251, "loss": 0.0127, "step": 511900 }, { "epoch": 1.33, "learning_rate": 0.00010095831572835365, "loss": 0.0128, "step": 511910 }, { "epoch": 1.33, "learning_rate": 0.00010095442751198218, "loss": 0.0071, "step": 511920 }, { "epoch": 1.33, "learning_rate": 0.00010095053929561072, "loss": 0.0078, "step": 511930 }, { "epoch": 1.33, "learning_rate": 0.00010094665107923925, "loss": 0.0088, "step": 511940 }, { "epoch": 1.33, "learning_rate": 0.00010094276286286779, "loss": 0.0091, "step": 511950 }, { "epoch": 1.33, "learning_rate": 0.00010093887464649632, "loss": 0.0081, "step": 511960 }, { "epoch": 1.33, "learning_rate": 0.00010093498643012486, "loss": 0.0087, "step": 511970 }, { "epoch": 1.33, "learning_rate": 0.00010093109821375339, "loss": 0.0112, "step": 511980 }, { "epoch": 1.33, "learning_rate": 0.00010092720999738193, "loss": 0.0113, "step": 511990 }, { "epoch": 1.33, "learning_rate": 0.00010092332178101046, "loss": 0.0088, "step": 512000 }, { "epoch": 1.33, "eval_cer": 0.8816984874123652, "eval_loss": 0.006633738521486521, "eval_runtime": 107.8155, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.638, "step": 512000 }, { "epoch": 1.33, "learning_rate": 0.000100919433564639, "loss": 0.0103, "step": 512010 }, { "epoch": 1.33, "learning_rate": 0.00010091554534826753, "loss": 0.0086, "step": 512020 }, { "epoch": 1.33, "learning_rate": 0.00010091165713189607, "loss": 0.0127, "step": 512030 }, { "epoch": 1.33, "learning_rate": 0.0001009077689155246, "loss": 0.0105, "step": 512040 }, { "epoch": 1.33, "learning_rate": 0.00010090388069915315, "loss": 0.0104, "step": 512050 }, { "epoch": 1.33, "learning_rate": 0.00010089999248278167, "loss": 0.014, "step": 512060 }, { "epoch": 1.33, "learning_rate": 0.00010089610426641022, "loss": 0.008, "step": 512070 }, { "epoch": 1.33, "learning_rate": 0.00010089221605003875, "loss": 0.0077, "step": 512080 }, { "epoch": 1.33, "learning_rate": 0.00010088832783366729, "loss": 0.0124, "step": 512090 }, { "epoch": 1.33, "learning_rate": 0.00010088443961729582, "loss": 0.0103, "step": 512100 }, { "epoch": 1.33, "learning_rate": 0.00010088055140092435, "loss": 0.0091, "step": 512110 }, { "epoch": 1.33, "learning_rate": 0.00010087666318455289, "loss": 0.0108, "step": 512120 }, { "epoch": 1.33, "learning_rate": 0.00010087277496818142, "loss": 0.0104, "step": 512130 }, { "epoch": 1.33, "learning_rate": 0.00010086888675180996, "loss": 0.0095, "step": 512140 }, { "epoch": 1.33, "learning_rate": 0.00010086499853543849, "loss": 0.0101, "step": 512150 }, { "epoch": 1.33, "learning_rate": 0.00010086111031906703, "loss": 0.0113, "step": 512160 }, { "epoch": 1.33, "learning_rate": 0.00010085722210269556, "loss": 0.0069, "step": 512170 }, { "epoch": 1.33, "learning_rate": 0.0001008533338863241, "loss": 0.0085, "step": 512180 }, { "epoch": 1.33, "learning_rate": 0.00010084944566995263, "loss": 0.0093, "step": 512190 }, { "epoch": 1.33, "learning_rate": 0.00010084555745358117, "loss": 0.0097, "step": 512200 }, { "epoch": 1.33, "learning_rate": 0.0001008416692372097, "loss": 0.0104, "step": 512210 }, { "epoch": 1.33, "learning_rate": 0.00010083778102083824, "loss": 0.0088, "step": 512220 }, { "epoch": 1.33, "learning_rate": 0.00010083389280446677, "loss": 0.0106, "step": 512230 }, { "epoch": 1.33, "learning_rate": 0.00010083000458809532, "loss": 0.0125, "step": 512240 }, { "epoch": 1.33, "learning_rate": 0.00010082611637172385, "loss": 0.0114, "step": 512250 }, { "epoch": 1.33, "learning_rate": 0.00010082222815535239, "loss": 0.0094, "step": 512260 }, { "epoch": 1.33, "learning_rate": 0.00010081833993898092, "loss": 0.0106, "step": 512270 }, { "epoch": 1.33, "learning_rate": 0.00010081445172260946, "loss": 0.01, "step": 512280 }, { "epoch": 1.33, "learning_rate": 0.00010081056350623799, "loss": 0.0117, "step": 512290 }, { "epoch": 1.33, "learning_rate": 0.00010080667528986653, "loss": 0.009, "step": 512300 }, { "epoch": 1.33, "learning_rate": 0.00010080278707349506, "loss": 0.0104, "step": 512310 }, { "epoch": 1.33, "learning_rate": 0.0001007988988571236, "loss": 0.0103, "step": 512320 }, { "epoch": 1.33, "learning_rate": 0.00010079501064075213, "loss": 0.0101, "step": 512330 }, { "epoch": 1.33, "learning_rate": 0.00010079112242438067, "loss": 0.0112, "step": 512340 }, { "epoch": 1.33, "learning_rate": 0.0001007872342080092, "loss": 0.0109, "step": 512350 }, { "epoch": 1.33, "learning_rate": 0.00010078334599163773, "loss": 0.0093, "step": 512360 }, { "epoch": 1.33, "learning_rate": 0.00010077945777526627, "loss": 0.008, "step": 512370 }, { "epoch": 1.33, "learning_rate": 0.0001007755695588948, "loss": 0.0114, "step": 512380 }, { "epoch": 1.33, "learning_rate": 0.00010077168134252334, "loss": 0.0107, "step": 512390 }, { "epoch": 1.33, "learning_rate": 0.00010076779312615186, "loss": 0.0146, "step": 512400 }, { "epoch": 1.33, "learning_rate": 0.0001007639049097804, "loss": 0.0136, "step": 512410 }, { "epoch": 1.33, "learning_rate": 0.00010076001669340893, "loss": 0.0106, "step": 512420 }, { "epoch": 1.33, "learning_rate": 0.00010075612847703749, "loss": 0.0083, "step": 512430 }, { "epoch": 1.33, "learning_rate": 0.00010075224026066602, "loss": 0.0152, "step": 512440 }, { "epoch": 1.33, "learning_rate": 0.00010074835204429456, "loss": 0.0113, "step": 512450 }, { "epoch": 1.33, "learning_rate": 0.00010074446382792309, "loss": 0.0097, "step": 512460 }, { "epoch": 1.33, "learning_rate": 0.00010074057561155163, "loss": 0.0099, "step": 512470 }, { "epoch": 1.33, "learning_rate": 0.00010073668739518016, "loss": 0.0143, "step": 512480 }, { "epoch": 1.33, "learning_rate": 0.0001007327991788087, "loss": 0.009, "step": 512490 }, { "epoch": 1.33, "learning_rate": 0.00010072891096243723, "loss": 0.0085, "step": 512500 }, { "epoch": 1.33, "learning_rate": 0.00010072502274606577, "loss": 0.0093, "step": 512510 }, { "epoch": 1.33, "learning_rate": 0.0001007211345296943, "loss": 0.0094, "step": 512520 }, { "epoch": 1.33, "learning_rate": 0.00010071724631332284, "loss": 0.0115, "step": 512530 }, { "epoch": 1.33, "learning_rate": 0.00010071335809695137, "loss": 0.0085, "step": 512540 }, { "epoch": 1.33, "learning_rate": 0.00010070946988057991, "loss": 0.0068, "step": 512550 }, { "epoch": 1.33, "learning_rate": 0.00010070558166420844, "loss": 0.0084, "step": 512560 }, { "epoch": 1.33, "learning_rate": 0.00010070169344783698, "loss": 0.0106, "step": 512570 }, { "epoch": 1.33, "learning_rate": 0.0001006978052314655, "loss": 0.0098, "step": 512580 }, { "epoch": 1.33, "learning_rate": 0.00010069391701509403, "loss": 0.0113, "step": 512590 }, { "epoch": 1.33, "learning_rate": 0.00010069002879872259, "loss": 0.0095, "step": 512600 }, { "epoch": 1.33, "learning_rate": 0.00010068614058235112, "loss": 0.0089, "step": 512610 }, { "epoch": 1.33, "learning_rate": 0.00010068225236597966, "loss": 0.0113, "step": 512620 }, { "epoch": 1.33, "learning_rate": 0.00010067836414960819, "loss": 0.0094, "step": 512630 }, { "epoch": 1.33, "learning_rate": 0.00010067447593323673, "loss": 0.0104, "step": 512640 }, { "epoch": 1.33, "learning_rate": 0.00010067058771686526, "loss": 0.012, "step": 512650 }, { "epoch": 1.33, "learning_rate": 0.0001006666995004938, "loss": 0.0107, "step": 512660 }, { "epoch": 1.33, "learning_rate": 0.00010066281128412233, "loss": 0.0096, "step": 512670 }, { "epoch": 1.33, "learning_rate": 0.00010065892306775087, "loss": 0.0094, "step": 512680 }, { "epoch": 1.33, "learning_rate": 0.0001006550348513794, "loss": 0.0089, "step": 512690 }, { "epoch": 1.33, "learning_rate": 0.00010065114663500794, "loss": 0.0074, "step": 512700 }, { "epoch": 1.33, "learning_rate": 0.00010064725841863647, "loss": 0.0108, "step": 512710 }, { "epoch": 1.33, "learning_rate": 0.00010064337020226501, "loss": 0.0089, "step": 512720 }, { "epoch": 1.33, "learning_rate": 0.00010063948198589354, "loss": 0.0086, "step": 512730 }, { "epoch": 1.33, "learning_rate": 0.00010063559376952208, "loss": 0.0104, "step": 512740 }, { "epoch": 1.33, "learning_rate": 0.0001006317055531506, "loss": 0.0116, "step": 512750 }, { "epoch": 1.33, "learning_rate": 0.00010062781733677916, "loss": 0.0105, "step": 512760 }, { "epoch": 1.33, "learning_rate": 0.00010062392912040767, "loss": 0.011, "step": 512770 }, { "epoch": 1.33, "learning_rate": 0.00010062004090403623, "loss": 0.0109, "step": 512780 }, { "epoch": 1.33, "learning_rate": 0.00010061615268766476, "loss": 0.0085, "step": 512790 }, { "epoch": 1.33, "learning_rate": 0.0001006122644712933, "loss": 0.0093, "step": 512800 }, { "epoch": 1.33, "learning_rate": 0.00010060837625492183, "loss": 0.0131, "step": 512810 }, { "epoch": 1.33, "learning_rate": 0.00010060448803855037, "loss": 0.0095, "step": 512820 }, { "epoch": 1.33, "learning_rate": 0.0001006005998221789, "loss": 0.0135, "step": 512830 }, { "epoch": 1.33, "learning_rate": 0.00010059671160580743, "loss": 0.0106, "step": 512840 }, { "epoch": 1.33, "learning_rate": 0.00010059282338943597, "loss": 0.0117, "step": 512850 }, { "epoch": 1.33, "learning_rate": 0.0001005889351730645, "loss": 0.0116, "step": 512860 }, { "epoch": 1.33, "learning_rate": 0.00010058504695669304, "loss": 0.0085, "step": 512870 }, { "epoch": 1.33, "learning_rate": 0.00010058115874032157, "loss": 0.0093, "step": 512880 }, { "epoch": 1.33, "learning_rate": 0.0001005772705239501, "loss": 0.0132, "step": 512890 }, { "epoch": 1.33, "learning_rate": 0.00010057338230757863, "loss": 0.0111, "step": 512900 }, { "epoch": 1.33, "learning_rate": 0.00010056949409120718, "loss": 0.0092, "step": 512910 }, { "epoch": 1.33, "learning_rate": 0.0001005656058748357, "loss": 0.0093, "step": 512920 }, { "epoch": 1.33, "learning_rate": 0.00010056171765846425, "loss": 0.0095, "step": 512930 }, { "epoch": 1.33, "learning_rate": 0.00010055782944209277, "loss": 0.0097, "step": 512940 }, { "epoch": 1.33, "learning_rate": 0.00010055394122572133, "loss": 0.0105, "step": 512950 }, { "epoch": 1.33, "learning_rate": 0.00010055005300934986, "loss": 0.0117, "step": 512960 }, { "epoch": 1.33, "learning_rate": 0.0001005461647929784, "loss": 0.0083, "step": 512970 }, { "epoch": 1.33, "learning_rate": 0.00010054227657660693, "loss": 0.0115, "step": 512980 }, { "epoch": 1.33, "learning_rate": 0.00010053838836023547, "loss": 0.0069, "step": 512990 }, { "epoch": 1.33, "learning_rate": 0.000100534500143864, "loss": 0.0112, "step": 513000 }, { "epoch": 1.33, "eval_cer": 0.8816942885015627, "eval_loss": 0.006440384313464165, "eval_runtime": 107.8594, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 513000 }, { "epoch": 1.33, "learning_rate": 0.00010053061192749254, "loss": 0.0088, "step": 513010 }, { "epoch": 1.33, "learning_rate": 0.00010052672371112107, "loss": 0.0093, "step": 513020 }, { "epoch": 1.33, "learning_rate": 0.00010052283549474961, "loss": 0.0079, "step": 513030 }, { "epoch": 1.33, "learning_rate": 0.00010051894727837814, "loss": 0.0106, "step": 513040 }, { "epoch": 1.33, "learning_rate": 0.00010051505906200668, "loss": 0.0099, "step": 513050 }, { "epoch": 1.33, "learning_rate": 0.0001005111708456352, "loss": 0.0101, "step": 513060 }, { "epoch": 1.33, "learning_rate": 0.00010050728262926375, "loss": 0.0102, "step": 513070 }, { "epoch": 1.33, "learning_rate": 0.00010050339441289228, "loss": 0.0119, "step": 513080 }, { "epoch": 1.33, "learning_rate": 0.0001004995061965208, "loss": 0.008, "step": 513090 }, { "epoch": 1.33, "learning_rate": 0.00010049561798014935, "loss": 0.0078, "step": 513100 }, { "epoch": 1.33, "learning_rate": 0.00010049172976377787, "loss": 0.0088, "step": 513110 }, { "epoch": 1.33, "learning_rate": 0.00010048784154740643, "loss": 0.0111, "step": 513120 }, { "epoch": 1.33, "learning_rate": 0.00010048395333103494, "loss": 0.0094, "step": 513130 }, { "epoch": 1.33, "learning_rate": 0.0001004800651146635, "loss": 0.0081, "step": 513140 }, { "epoch": 1.33, "learning_rate": 0.00010047617689829203, "loss": 0.0089, "step": 513150 }, { "epoch": 1.33, "learning_rate": 0.00010047228868192057, "loss": 0.0086, "step": 513160 }, { "epoch": 1.33, "learning_rate": 0.0001004684004655491, "loss": 0.0107, "step": 513170 }, { "epoch": 1.33, "learning_rate": 0.00010046451224917764, "loss": 0.0119, "step": 513180 }, { "epoch": 1.33, "learning_rate": 0.00010046062403280617, "loss": 0.009, "step": 513190 }, { "epoch": 1.33, "learning_rate": 0.00010045673581643471, "loss": 0.0099, "step": 513200 }, { "epoch": 1.33, "learning_rate": 0.00010045284760006324, "loss": 0.0093, "step": 513210 }, { "epoch": 1.33, "learning_rate": 0.00010044895938369178, "loss": 0.0095, "step": 513220 }, { "epoch": 1.33, "learning_rate": 0.0001004450711673203, "loss": 0.0104, "step": 513230 }, { "epoch": 1.33, "learning_rate": 0.00010044118295094885, "loss": 0.0096, "step": 513240 }, { "epoch": 1.33, "learning_rate": 0.00010043729473457738, "loss": 0.0149, "step": 513250 }, { "epoch": 1.33, "learning_rate": 0.00010043340651820592, "loss": 0.0108, "step": 513260 }, { "epoch": 1.33, "learning_rate": 0.00010042951830183444, "loss": 0.0092, "step": 513270 }, { "epoch": 1.33, "learning_rate": 0.000100425630085463, "loss": 0.0102, "step": 513280 }, { "epoch": 1.33, "learning_rate": 0.00010042174186909151, "loss": 0.0091, "step": 513290 }, { "epoch": 1.33, "learning_rate": 0.00010041785365272007, "loss": 0.0078, "step": 513300 }, { "epoch": 1.33, "learning_rate": 0.0001004139654363486, "loss": 0.0153, "step": 513310 }, { "epoch": 1.33, "learning_rate": 0.00010041007721997714, "loss": 0.0092, "step": 513320 }, { "epoch": 1.33, "learning_rate": 0.00010040618900360567, "loss": 0.0107, "step": 513330 }, { "epoch": 1.33, "learning_rate": 0.0001004023007872342, "loss": 0.009, "step": 513340 }, { "epoch": 1.33, "learning_rate": 0.00010039841257086274, "loss": 0.0123, "step": 513350 }, { "epoch": 1.33, "learning_rate": 0.00010039452435449127, "loss": 0.0099, "step": 513360 }, { "epoch": 1.33, "learning_rate": 0.00010039063613811981, "loss": 0.012, "step": 513370 }, { "epoch": 1.33, "learning_rate": 0.00010038674792174834, "loss": 0.0087, "step": 513380 }, { "epoch": 1.33, "learning_rate": 0.00010038285970537688, "loss": 0.0079, "step": 513390 }, { "epoch": 1.33, "learning_rate": 0.0001003789714890054, "loss": 0.009, "step": 513400 }, { "epoch": 1.33, "learning_rate": 0.00010037508327263395, "loss": 0.0102, "step": 513410 }, { "epoch": 1.33, "learning_rate": 0.00010037119505626247, "loss": 0.0093, "step": 513420 }, { "epoch": 1.33, "learning_rate": 0.00010036730683989102, "loss": 0.0097, "step": 513430 }, { "epoch": 1.33, "learning_rate": 0.00010036341862351954, "loss": 0.01, "step": 513440 }, { "epoch": 1.33, "learning_rate": 0.00010035953040714809, "loss": 0.009, "step": 513450 }, { "epoch": 1.33, "learning_rate": 0.00010035564219077661, "loss": 0.0104, "step": 513460 }, { "epoch": 1.33, "learning_rate": 0.00010035175397440517, "loss": 0.0091, "step": 513470 }, { "epoch": 1.33, "learning_rate": 0.0001003478657580337, "loss": 0.0083, "step": 513480 }, { "epoch": 1.33, "learning_rate": 0.00010034397754166224, "loss": 0.0095, "step": 513490 }, { "epoch": 1.33, "learning_rate": 0.00010034008932529077, "loss": 0.0102, "step": 513500 }, { "epoch": 1.33, "learning_rate": 0.00010033620110891931, "loss": 0.0089, "step": 513510 }, { "epoch": 1.33, "learning_rate": 0.00010033231289254784, "loss": 0.0101, "step": 513520 }, { "epoch": 1.33, "learning_rate": 0.00010032842467617638, "loss": 0.0102, "step": 513530 }, { "epoch": 1.33, "learning_rate": 0.0001003245364598049, "loss": 0.0099, "step": 513540 }, { "epoch": 1.33, "learning_rate": 0.00010032064824343345, "loss": 0.0097, "step": 513550 }, { "epoch": 1.33, "learning_rate": 0.00010031676002706198, "loss": 0.0082, "step": 513560 }, { "epoch": 1.33, "learning_rate": 0.00010031287181069052, "loss": 0.0106, "step": 513570 }, { "epoch": 1.33, "learning_rate": 0.00010030898359431905, "loss": 0.0073, "step": 513580 }, { "epoch": 1.33, "learning_rate": 0.00010030509537794757, "loss": 0.0103, "step": 513590 }, { "epoch": 1.33, "learning_rate": 0.00010030120716157612, "loss": 0.0113, "step": 513600 }, { "epoch": 1.33, "learning_rate": 0.00010029731894520464, "loss": 0.0103, "step": 513610 }, { "epoch": 1.33, "learning_rate": 0.00010029343072883319, "loss": 0.0159, "step": 513620 }, { "epoch": 1.33, "learning_rate": 0.00010028954251246171, "loss": 0.0107, "step": 513630 }, { "epoch": 1.33, "learning_rate": 0.00010028565429609027, "loss": 0.0083, "step": 513640 }, { "epoch": 1.33, "learning_rate": 0.00010028176607971878, "loss": 0.0091, "step": 513650 }, { "epoch": 1.33, "learning_rate": 0.00010027787786334734, "loss": 0.0108, "step": 513660 }, { "epoch": 1.33, "learning_rate": 0.00010027398964697587, "loss": 0.0076, "step": 513670 }, { "epoch": 1.33, "learning_rate": 0.00010027010143060441, "loss": 0.0119, "step": 513680 }, { "epoch": 1.33, "learning_rate": 0.00010026621321423294, "loss": 0.0079, "step": 513690 }, { "epoch": 1.33, "learning_rate": 0.00010026232499786148, "loss": 0.0087, "step": 513700 }, { "epoch": 1.33, "learning_rate": 0.00010025843678149, "loss": 0.0138, "step": 513710 }, { "epoch": 1.33, "learning_rate": 0.00010025454856511855, "loss": 0.0131, "step": 513720 }, { "epoch": 1.33, "learning_rate": 0.00010025066034874708, "loss": 0.0083, "step": 513730 }, { "epoch": 1.33, "learning_rate": 0.00010024677213237562, "loss": 0.0082, "step": 513740 }, { "epoch": 1.33, "learning_rate": 0.00010024288391600415, "loss": 0.0115, "step": 513750 }, { "epoch": 1.33, "learning_rate": 0.00010023899569963269, "loss": 0.0077, "step": 513760 }, { "epoch": 1.33, "learning_rate": 0.00010023510748326122, "loss": 0.0109, "step": 513770 }, { "epoch": 1.33, "learning_rate": 0.00010023121926688976, "loss": 0.0131, "step": 513780 }, { "epoch": 1.33, "learning_rate": 0.00010022733105051828, "loss": 0.0099, "step": 513790 }, { "epoch": 1.33, "learning_rate": 0.00010022344283414683, "loss": 0.0111, "step": 513800 }, { "epoch": 1.33, "learning_rate": 0.00010021955461777535, "loss": 0.0129, "step": 513810 }, { "epoch": 1.33, "learning_rate": 0.00010021566640140391, "loss": 0.0068, "step": 513820 }, { "epoch": 1.33, "learning_rate": 0.00010021177818503244, "loss": 0.0108, "step": 513830 }, { "epoch": 1.33, "learning_rate": 0.00010020788996866097, "loss": 0.0122, "step": 513840 }, { "epoch": 1.33, "learning_rate": 0.00010020400175228951, "loss": 0.0117, "step": 513850 }, { "epoch": 1.33, "learning_rate": 0.00010020011353591804, "loss": 0.0095, "step": 513860 }, { "epoch": 1.33, "learning_rate": 0.00010019622531954658, "loss": 0.0122, "step": 513870 }, { "epoch": 1.33, "learning_rate": 0.0001001923371031751, "loss": 0.009, "step": 513880 }, { "epoch": 1.33, "learning_rate": 0.00010018844888680365, "loss": 0.0084, "step": 513890 }, { "epoch": 1.33, "learning_rate": 0.00010018456067043218, "loss": 0.0121, "step": 513900 }, { "epoch": 1.33, "learning_rate": 0.00010018067245406072, "loss": 0.0095, "step": 513910 }, { "epoch": 1.33, "learning_rate": 0.00010017678423768924, "loss": 0.0073, "step": 513920 }, { "epoch": 1.33, "learning_rate": 0.00010017289602131779, "loss": 0.0062, "step": 513930 }, { "epoch": 1.33, "learning_rate": 0.00010016900780494631, "loss": 0.0145, "step": 513940 }, { "epoch": 1.33, "learning_rate": 0.00010016511958857486, "loss": 0.0087, "step": 513950 }, { "epoch": 1.33, "learning_rate": 0.00010016123137220338, "loss": 0.0095, "step": 513960 }, { "epoch": 1.33, "learning_rate": 0.00010015734315583193, "loss": 0.0132, "step": 513970 }, { "epoch": 1.33, "learning_rate": 0.00010015345493946045, "loss": 0.0082, "step": 513980 }, { "epoch": 1.33, "learning_rate": 0.00010014956672308901, "loss": 0.0084, "step": 513990 }, { "epoch": 1.33, "learning_rate": 0.00010014567850671752, "loss": 0.0073, "step": 514000 }, { "epoch": 1.33, "eval_cer": 0.8816956881384969, "eval_loss": 0.006481009069830179, "eval_runtime": 108.0446, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 514000 }, { "epoch": 1.33, "learning_rate": 0.00010014179029034608, "loss": 0.0106, "step": 514010 }, { "epoch": 1.33, "learning_rate": 0.00010013790207397461, "loss": 0.0117, "step": 514020 }, { "epoch": 1.33, "learning_rate": 0.00010013401385760315, "loss": 0.0088, "step": 514030 }, { "epoch": 1.33, "learning_rate": 0.00010013012564123168, "loss": 0.0116, "step": 514040 }, { "epoch": 1.33, "learning_rate": 0.00010012623742486022, "loss": 0.0089, "step": 514050 }, { "epoch": 1.33, "learning_rate": 0.00010012234920848875, "loss": 0.011, "step": 514060 }, { "epoch": 1.33, "learning_rate": 0.00010011846099211729, "loss": 0.0108, "step": 514070 }, { "epoch": 1.33, "learning_rate": 0.00010011457277574582, "loss": 0.0091, "step": 514080 }, { "epoch": 1.33, "learning_rate": 0.00010011068455937434, "loss": 0.0139, "step": 514090 }, { "epoch": 1.33, "learning_rate": 0.00010010679634300289, "loss": 0.0082, "step": 514100 }, { "epoch": 1.33, "learning_rate": 0.00010010290812663141, "loss": 0.0092, "step": 514110 }, { "epoch": 1.33, "learning_rate": 0.00010009901991025996, "loss": 0.0145, "step": 514120 }, { "epoch": 1.33, "learning_rate": 0.00010009513169388848, "loss": 0.0119, "step": 514130 }, { "epoch": 1.33, "learning_rate": 0.00010009124347751703, "loss": 0.0082, "step": 514140 }, { "epoch": 1.33, "learning_rate": 0.00010008735526114555, "loss": 0.0131, "step": 514150 }, { "epoch": 1.33, "learning_rate": 0.0001000834670447741, "loss": 0.0093, "step": 514160 }, { "epoch": 1.33, "learning_rate": 0.00010007957882840262, "loss": 0.0117, "step": 514170 }, { "epoch": 1.33, "learning_rate": 0.00010007569061203118, "loss": 0.0087, "step": 514180 }, { "epoch": 1.33, "learning_rate": 0.0001000718023956597, "loss": 0.01, "step": 514190 }, { "epoch": 1.33, "learning_rate": 0.00010006791417928825, "loss": 0.0099, "step": 514200 }, { "epoch": 1.33, "learning_rate": 0.00010006402596291678, "loss": 0.0084, "step": 514210 }, { "epoch": 1.33, "learning_rate": 0.00010006013774654532, "loss": 0.0127, "step": 514220 }, { "epoch": 1.33, "learning_rate": 0.00010005624953017385, "loss": 0.0101, "step": 514230 }, { "epoch": 1.33, "learning_rate": 0.00010005236131380239, "loss": 0.0113, "step": 514240 }, { "epoch": 1.33, "learning_rate": 0.00010004847309743092, "loss": 0.0091, "step": 514250 }, { "epoch": 1.33, "learning_rate": 0.00010004458488105946, "loss": 0.0114, "step": 514260 }, { "epoch": 1.33, "learning_rate": 0.00010004069666468799, "loss": 0.012, "step": 514270 }, { "epoch": 1.33, "learning_rate": 0.00010003680844831653, "loss": 0.0088, "step": 514280 }, { "epoch": 1.33, "learning_rate": 0.00010003292023194506, "loss": 0.0101, "step": 514290 }, { "epoch": 1.33, "learning_rate": 0.0001000290320155736, "loss": 0.0091, "step": 514300 }, { "epoch": 1.33, "learning_rate": 0.00010002514379920212, "loss": 0.0119, "step": 514310 }, { "epoch": 1.33, "learning_rate": 0.00010002125558283067, "loss": 0.0095, "step": 514320 }, { "epoch": 1.33, "learning_rate": 0.0001000173673664592, "loss": 0.0088, "step": 514330 }, { "epoch": 1.33, "learning_rate": 0.00010001347915008772, "loss": 0.0077, "step": 514340 }, { "epoch": 1.33, "learning_rate": 0.00010000959093371628, "loss": 0.0128, "step": 514350 }, { "epoch": 1.33, "learning_rate": 0.00010000570271734479, "loss": 0.009, "step": 514360 }, { "epoch": 1.33, "learning_rate": 0.00010000181450097335, "loss": 0.0083, "step": 514370 }, { "epoch": 1.33, "learning_rate": 9.999792628460188e-05, "loss": 0.0085, "step": 514380 }, { "epoch": 1.33, "learning_rate": 9.999403806823042e-05, "loss": 0.01, "step": 514390 }, { "epoch": 1.33, "learning_rate": 9.999014985185895e-05, "loss": 0.0146, "step": 514400 }, { "epoch": 1.33, "learning_rate": 9.998626163548749e-05, "loss": 0.0117, "step": 514410 }, { "epoch": 1.33, "learning_rate": 9.998237341911602e-05, "loss": 0.0086, "step": 514420 }, { "epoch": 1.33, "learning_rate": 9.997848520274456e-05, "loss": 0.0091, "step": 514430 }, { "epoch": 1.33, "learning_rate": 9.997459698637308e-05, "loss": 0.0085, "step": 514440 }, { "epoch": 1.33, "learning_rate": 9.997070877000163e-05, "loss": 0.0095, "step": 514450 }, { "epoch": 1.33, "learning_rate": 9.996682055363015e-05, "loss": 0.0084, "step": 514460 }, { "epoch": 1.33, "learning_rate": 9.99629323372587e-05, "loss": 0.011, "step": 514470 }, { "epoch": 1.33, "learning_rate": 9.995904412088722e-05, "loss": 0.0088, "step": 514480 }, { "epoch": 1.33, "learning_rate": 9.995515590451577e-05, "loss": 0.0073, "step": 514490 }, { "epoch": 1.33, "learning_rate": 9.99512676881443e-05, "loss": 0.0141, "step": 514500 }, { "epoch": 1.33, "learning_rate": 9.994737947177285e-05, "loss": 0.0099, "step": 514510 }, { "epoch": 1.33, "learning_rate": 9.994349125540136e-05, "loss": 0.0088, "step": 514520 }, { "epoch": 1.33, "learning_rate": 9.993960303902992e-05, "loss": 0.0095, "step": 514530 }, { "epoch": 1.33, "learning_rate": 9.993571482265845e-05, "loss": 0.0107, "step": 514540 }, { "epoch": 1.33, "learning_rate": 9.993182660628699e-05, "loss": 0.0089, "step": 514550 }, { "epoch": 1.33, "learning_rate": 9.992793838991552e-05, "loss": 0.009, "step": 514560 }, { "epoch": 1.33, "learning_rate": 9.992405017354406e-05, "loss": 0.0085, "step": 514570 }, { "epoch": 1.33, "learning_rate": 9.992016195717259e-05, "loss": 0.0123, "step": 514580 }, { "epoch": 1.33, "learning_rate": 9.991627374080111e-05, "loss": 0.0112, "step": 514590 }, { "epoch": 1.33, "learning_rate": 9.991238552442966e-05, "loss": 0.0125, "step": 514600 }, { "epoch": 1.33, "learning_rate": 9.990849730805818e-05, "loss": 0.0116, "step": 514610 }, { "epoch": 1.33, "learning_rate": 9.990460909168673e-05, "loss": 0.0122, "step": 514620 }, { "epoch": 1.33, "learning_rate": 9.990072087531525e-05, "loss": 0.0084, "step": 514630 }, { "epoch": 1.33, "learning_rate": 9.98968326589438e-05, "loss": 0.0125, "step": 514640 }, { "epoch": 1.33, "learning_rate": 9.989294444257232e-05, "loss": 0.0069, "step": 514650 }, { "epoch": 1.33, "learning_rate": 9.988905622620087e-05, "loss": 0.0087, "step": 514660 }, { "epoch": 1.33, "learning_rate": 9.98851680098294e-05, "loss": 0.0083, "step": 514670 }, { "epoch": 1.33, "learning_rate": 9.988127979345793e-05, "loss": 0.0098, "step": 514680 }, { "epoch": 1.33, "learning_rate": 9.987739157708646e-05, "loss": 0.0121, "step": 514690 }, { "epoch": 1.33, "learning_rate": 9.987350336071502e-05, "loss": 0.0078, "step": 514700 }, { "epoch": 1.33, "learning_rate": 9.986961514434355e-05, "loss": 0.0084, "step": 514710 }, { "epoch": 1.33, "learning_rate": 9.986572692797209e-05, "loss": 0.0199, "step": 514720 }, { "epoch": 1.33, "learning_rate": 9.986183871160062e-05, "loss": 0.0079, "step": 514730 }, { "epoch": 1.33, "learning_rate": 9.985795049522916e-05, "loss": 0.0089, "step": 514740 }, { "epoch": 1.33, "learning_rate": 9.985406227885769e-05, "loss": 0.0096, "step": 514750 }, { "epoch": 1.33, "learning_rate": 9.985017406248623e-05, "loss": 0.0108, "step": 514760 }, { "epoch": 1.33, "learning_rate": 9.984628584611476e-05, "loss": 0.0096, "step": 514770 }, { "epoch": 1.33, "learning_rate": 9.98423976297433e-05, "loss": 0.0193, "step": 514780 }, { "epoch": 1.33, "learning_rate": 9.983850941337183e-05, "loss": 0.01, "step": 514790 }, { "epoch": 1.33, "learning_rate": 9.983462119700037e-05, "loss": 0.0115, "step": 514800 }, { "epoch": 1.33, "learning_rate": 9.98307329806289e-05, "loss": 0.0099, "step": 514810 }, { "epoch": 1.33, "learning_rate": 9.982684476425744e-05, "loss": 0.0085, "step": 514820 }, { "epoch": 1.33, "learning_rate": 9.982295654788596e-05, "loss": 0.0066, "step": 514830 }, { "epoch": 1.33, "learning_rate": 9.981906833151449e-05, "loss": 0.0123, "step": 514840 }, { "epoch": 1.33, "learning_rate": 9.981518011514303e-05, "loss": 0.0103, "step": 514850 }, { "epoch": 1.33, "learning_rate": 9.981129189877156e-05, "loss": 0.0122, "step": 514860 }, { "epoch": 1.33, "learning_rate": 9.980740368240012e-05, "loss": 0.0093, "step": 514870 }, { "epoch": 1.33, "learning_rate": 9.980351546602863e-05, "loss": 0.0073, "step": 514880 }, { "epoch": 1.33, "learning_rate": 9.979962724965719e-05, "loss": 0.0087, "step": 514890 }, { "epoch": 1.33, "learning_rate": 9.979573903328572e-05, "loss": 0.0101, "step": 514900 }, { "epoch": 1.33, "learning_rate": 9.979185081691426e-05, "loss": 0.0091, "step": 514910 }, { "epoch": 1.33, "learning_rate": 9.978796260054279e-05, "loss": 0.0075, "step": 514920 }, { "epoch": 1.33, "learning_rate": 9.978407438417133e-05, "loss": 0.011, "step": 514930 }, { "epoch": 1.33, "learning_rate": 9.978018616779985e-05, "loss": 0.0107, "step": 514940 }, { "epoch": 1.33, "learning_rate": 9.97762979514284e-05, "loss": 0.0083, "step": 514950 }, { "epoch": 1.33, "learning_rate": 9.977240973505692e-05, "loss": 0.0106, "step": 514960 }, { "epoch": 1.33, "learning_rate": 9.976852151868547e-05, "loss": 0.0083, "step": 514970 }, { "epoch": 1.33, "learning_rate": 9.9764633302314e-05, "loss": 0.0093, "step": 514980 }, { "epoch": 1.33, "learning_rate": 9.976074508594254e-05, "loss": 0.0101, "step": 514990 }, { "epoch": 1.33, "learning_rate": 9.975685686957106e-05, "loss": 0.0079, "step": 515000 }, { "epoch": 1.33, "eval_cer": 0.8816872903168917, "eval_loss": 0.006493269931524992, "eval_runtime": 108.0338, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 515000 }, { "epoch": 1.33, "learning_rate": 9.97529686531996e-05, "loss": 0.0072, "step": 515010 }, { "epoch": 1.34, "learning_rate": 9.974908043682813e-05, "loss": 0.0088, "step": 515020 }, { "epoch": 1.34, "learning_rate": 9.974519222045668e-05, "loss": 0.0101, "step": 515030 }, { "epoch": 1.34, "learning_rate": 9.97413040040852e-05, "loss": 0.0084, "step": 515040 }, { "epoch": 1.34, "learning_rate": 9.973741578771376e-05, "loss": 0.0128, "step": 515050 }, { "epoch": 1.34, "learning_rate": 9.973352757134229e-05, "loss": 0.0101, "step": 515060 }, { "epoch": 1.34, "learning_rate": 9.972963935497081e-05, "loss": 0.0098, "step": 515070 }, { "epoch": 1.34, "learning_rate": 9.972575113859936e-05, "loss": 0.0117, "step": 515080 }, { "epoch": 1.34, "learning_rate": 9.972186292222788e-05, "loss": 0.0095, "step": 515090 }, { "epoch": 1.34, "learning_rate": 9.971797470585643e-05, "loss": 0.0107, "step": 515100 }, { "epoch": 1.34, "learning_rate": 9.971408648948495e-05, "loss": 0.0095, "step": 515110 }, { "epoch": 1.34, "learning_rate": 9.97101982731135e-05, "loss": 0.0098, "step": 515120 }, { "epoch": 1.34, "learning_rate": 9.970631005674202e-05, "loss": 0.0099, "step": 515130 }, { "epoch": 1.34, "learning_rate": 9.970242184037057e-05, "loss": 0.0095, "step": 515140 }, { "epoch": 1.34, "learning_rate": 9.96985336239991e-05, "loss": 0.0125, "step": 515150 }, { "epoch": 1.34, "learning_rate": 9.969464540762764e-05, "loss": 0.0086, "step": 515160 }, { "epoch": 1.34, "learning_rate": 9.969075719125616e-05, "loss": 0.0108, "step": 515170 }, { "epoch": 1.34, "learning_rate": 9.96868689748847e-05, "loss": 0.0097, "step": 515180 }, { "epoch": 1.34, "learning_rate": 9.968298075851323e-05, "loss": 0.0081, "step": 515190 }, { "epoch": 1.34, "learning_rate": 9.967909254214177e-05, "loss": 0.0082, "step": 515200 }, { "epoch": 1.34, "learning_rate": 9.96752043257703e-05, "loss": 0.0071, "step": 515210 }, { "epoch": 1.34, "learning_rate": 9.967131610939886e-05, "loss": 0.0125, "step": 515220 }, { "epoch": 1.34, "learning_rate": 9.966742789302739e-05, "loss": 0.0108, "step": 515230 }, { "epoch": 1.34, "learning_rate": 9.966353967665593e-05, "loss": 0.0087, "step": 515240 }, { "epoch": 1.34, "learning_rate": 9.965965146028446e-05, "loss": 0.0091, "step": 515250 }, { "epoch": 1.34, "learning_rate": 9.9655763243913e-05, "loss": 0.0109, "step": 515260 }, { "epoch": 1.34, "learning_rate": 9.965187502754153e-05, "loss": 0.0087, "step": 515270 }, { "epoch": 1.34, "learning_rate": 9.964798681117007e-05, "loss": 0.0104, "step": 515280 }, { "epoch": 1.34, "learning_rate": 9.96440985947986e-05, "loss": 0.0103, "step": 515290 }, { "epoch": 1.34, "learning_rate": 9.964021037842714e-05, "loss": 0.0086, "step": 515300 }, { "epoch": 1.34, "learning_rate": 9.963632216205567e-05, "loss": 0.0107, "step": 515310 }, { "epoch": 1.34, "learning_rate": 9.96324339456842e-05, "loss": 0.0107, "step": 515320 }, { "epoch": 1.34, "learning_rate": 9.962854572931273e-05, "loss": 0.0074, "step": 515330 }, { "epoch": 1.34, "learning_rate": 9.962465751294126e-05, "loss": 0.015, "step": 515340 }, { "epoch": 1.34, "learning_rate": 9.96207692965698e-05, "loss": 0.0123, "step": 515350 }, { "epoch": 1.34, "learning_rate": 9.961688108019833e-05, "loss": 0.0099, "step": 515360 }, { "epoch": 1.34, "learning_rate": 9.961299286382687e-05, "loss": 0.012, "step": 515370 }, { "epoch": 1.34, "learning_rate": 9.96091046474554e-05, "loss": 0.0089, "step": 515380 }, { "epoch": 1.34, "learning_rate": 9.960521643108394e-05, "loss": 0.0128, "step": 515390 }, { "epoch": 1.34, "learning_rate": 9.960132821471247e-05, "loss": 0.0116, "step": 515400 }, { "epoch": 1.34, "learning_rate": 9.959743999834103e-05, "loss": 0.0083, "step": 515410 }, { "epoch": 1.34, "learning_rate": 9.959355178196956e-05, "loss": 0.0078, "step": 515420 }, { "epoch": 1.34, "learning_rate": 9.95896635655981e-05, "loss": 0.0117, "step": 515430 }, { "epoch": 1.34, "learning_rate": 9.958577534922663e-05, "loss": 0.0086, "step": 515440 }, { "epoch": 1.34, "learning_rate": 9.958188713285517e-05, "loss": 0.0091, "step": 515450 }, { "epoch": 1.34, "learning_rate": 9.95779989164837e-05, "loss": 0.0097, "step": 515460 }, { "epoch": 1.34, "learning_rate": 9.957411070011224e-05, "loss": 0.0079, "step": 515470 }, { "epoch": 1.34, "learning_rate": 9.957022248374076e-05, "loss": 0.007, "step": 515480 }, { "epoch": 1.34, "learning_rate": 9.95663342673693e-05, "loss": 0.0109, "step": 515490 }, { "epoch": 1.34, "learning_rate": 9.956244605099783e-05, "loss": 0.011, "step": 515500 }, { "epoch": 1.34, "learning_rate": 9.955855783462638e-05, "loss": 0.013, "step": 515510 }, { "epoch": 1.34, "learning_rate": 9.95546696182549e-05, "loss": 0.0085, "step": 515520 }, { "epoch": 1.34, "learning_rate": 9.955078140188345e-05, "loss": 0.0121, "step": 515530 }, { "epoch": 1.34, "learning_rate": 9.954689318551197e-05, "loss": 0.0123, "step": 515540 }, { "epoch": 1.34, "learning_rate": 9.954300496914052e-05, "loss": 0.0133, "step": 515550 }, { "epoch": 1.34, "learning_rate": 9.953911675276904e-05, "loss": 0.0102, "step": 515560 }, { "epoch": 1.34, "learning_rate": 9.953522853639757e-05, "loss": 0.0084, "step": 515570 }, { "epoch": 1.34, "learning_rate": 9.953134032002613e-05, "loss": 0.0121, "step": 515580 }, { "epoch": 1.34, "learning_rate": 9.952745210365464e-05, "loss": 0.0122, "step": 515590 }, { "epoch": 1.34, "learning_rate": 9.95235638872832e-05, "loss": 0.0109, "step": 515600 }, { "epoch": 1.34, "learning_rate": 9.951967567091172e-05, "loss": 0.0092, "step": 515610 }, { "epoch": 1.34, "learning_rate": 9.951578745454027e-05, "loss": 0.0113, "step": 515620 }, { "epoch": 1.34, "learning_rate": 9.95118992381688e-05, "loss": 0.0086, "step": 515630 }, { "epoch": 1.34, "learning_rate": 9.950801102179734e-05, "loss": 0.0109, "step": 515640 }, { "epoch": 1.34, "learning_rate": 9.950412280542586e-05, "loss": 0.0101, "step": 515650 }, { "epoch": 1.34, "learning_rate": 9.95002345890544e-05, "loss": 0.0099, "step": 515660 }, { "epoch": 1.34, "learning_rate": 9.949634637268293e-05, "loss": 0.0082, "step": 515670 }, { "epoch": 1.34, "learning_rate": 9.949245815631148e-05, "loss": 0.0115, "step": 515680 }, { "epoch": 1.34, "learning_rate": 9.948856993994e-05, "loss": 0.0132, "step": 515690 }, { "epoch": 1.34, "learning_rate": 9.948468172356855e-05, "loss": 0.0085, "step": 515700 }, { "epoch": 1.34, "learning_rate": 9.948079350719707e-05, "loss": 0.0093, "step": 515710 }, { "epoch": 1.34, "learning_rate": 9.947690529082561e-05, "loss": 0.0104, "step": 515720 }, { "epoch": 1.34, "learning_rate": 9.947301707445414e-05, "loss": 0.0094, "step": 515730 }, { "epoch": 1.34, "learning_rate": 9.94691288580827e-05, "loss": 0.0085, "step": 515740 }, { "epoch": 1.34, "learning_rate": 9.946524064171121e-05, "loss": 0.0111, "step": 515750 }, { "epoch": 1.34, "learning_rate": 9.946135242533977e-05, "loss": 0.0118, "step": 515760 }, { "epoch": 1.34, "learning_rate": 9.94574642089683e-05, "loss": 0.0115, "step": 515770 }, { "epoch": 1.34, "learning_rate": 9.945357599259684e-05, "loss": 0.0082, "step": 515780 }, { "epoch": 1.34, "learning_rate": 9.944968777622537e-05, "loss": 0.0081, "step": 515790 }, { "epoch": 1.34, "learning_rate": 9.944579955985391e-05, "loss": 0.0084, "step": 515800 }, { "epoch": 1.34, "learning_rate": 9.944191134348244e-05, "loss": 0.009, "step": 515810 }, { "epoch": 1.34, "learning_rate": 9.943802312711096e-05, "loss": 0.0092, "step": 515820 }, { "epoch": 1.34, "learning_rate": 9.94341349107395e-05, "loss": 0.01, "step": 515830 }, { "epoch": 1.34, "learning_rate": 9.943024669436803e-05, "loss": 0.0082, "step": 515840 }, { "epoch": 1.34, "learning_rate": 9.942635847799657e-05, "loss": 0.0077, "step": 515850 }, { "epoch": 1.34, "learning_rate": 9.94224702616251e-05, "loss": 0.0132, "step": 515860 }, { "epoch": 1.34, "learning_rate": 9.941858204525364e-05, "loss": 0.012, "step": 515870 }, { "epoch": 1.34, "learning_rate": 9.941469382888217e-05, "loss": 0.0112, "step": 515880 }, { "epoch": 1.34, "learning_rate": 9.941080561251071e-05, "loss": 0.0101, "step": 515890 }, { "epoch": 1.34, "learning_rate": 9.940691739613924e-05, "loss": 0.0073, "step": 515900 }, { "epoch": 1.34, "learning_rate": 9.940302917976778e-05, "loss": 0.0103, "step": 515910 }, { "epoch": 1.34, "learning_rate": 9.939914096339631e-05, "loss": 0.0092, "step": 515920 }, { "epoch": 1.34, "learning_rate": 9.939525274702487e-05, "loss": 0.0105, "step": 515930 }, { "epoch": 1.34, "learning_rate": 9.93913645306534e-05, "loss": 0.0093, "step": 515940 }, { "epoch": 1.34, "learning_rate": 9.938747631428194e-05, "loss": 0.0088, "step": 515950 }, { "epoch": 1.34, "learning_rate": 9.938358809791047e-05, "loss": 0.0099, "step": 515960 }, { "epoch": 1.34, "learning_rate": 9.9379699881539e-05, "loss": 0.0111, "step": 515970 }, { "epoch": 1.34, "learning_rate": 9.937581166516753e-05, "loss": 0.0086, "step": 515980 }, { "epoch": 1.34, "learning_rate": 9.937192344879608e-05, "loss": 0.01, "step": 515990 }, { "epoch": 1.34, "learning_rate": 9.93680352324246e-05, "loss": 0.0092, "step": 516000 }, { "epoch": 1.34, "eval_cer": 0.8816900895907601, "eval_loss": 0.006371052470058203, "eval_runtime": 107.8941, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 516000 }, { "epoch": 1.34, "learning_rate": 9.936414701605315e-05, "loss": 0.0107, "step": 516010 }, { "epoch": 1.34, "learning_rate": 9.936025879968167e-05, "loss": 0.0106, "step": 516020 }, { "epoch": 1.34, "learning_rate": 9.935637058331022e-05, "loss": 0.009, "step": 516030 }, { "epoch": 1.34, "learning_rate": 9.935248236693874e-05, "loss": 0.0084, "step": 516040 }, { "epoch": 1.34, "learning_rate": 9.934859415056729e-05, "loss": 0.0073, "step": 516050 }, { "epoch": 1.34, "learning_rate": 9.934470593419581e-05, "loss": 0.0123, "step": 516060 }, { "epoch": 1.34, "learning_rate": 9.934081771782434e-05, "loss": 0.0102, "step": 516070 }, { "epoch": 1.34, "learning_rate": 9.933692950145288e-05, "loss": 0.0109, "step": 516080 }, { "epoch": 1.34, "learning_rate": 9.933304128508141e-05, "loss": 0.009, "step": 516090 }, { "epoch": 1.34, "learning_rate": 9.932915306870997e-05, "loss": 0.0074, "step": 516100 }, { "epoch": 1.34, "learning_rate": 9.932526485233848e-05, "loss": 0.0088, "step": 516110 }, { "epoch": 1.34, "learning_rate": 9.932137663596704e-05, "loss": 0.0091, "step": 516120 }, { "epoch": 1.34, "learning_rate": 9.931748841959556e-05, "loss": 0.0107, "step": 516130 }, { "epoch": 1.34, "learning_rate": 9.93136002032241e-05, "loss": 0.0151, "step": 516140 }, { "epoch": 1.34, "learning_rate": 9.930971198685263e-05, "loss": 0.012, "step": 516150 }, { "epoch": 1.34, "learning_rate": 9.930582377048118e-05, "loss": 0.0078, "step": 516160 }, { "epoch": 1.34, "learning_rate": 9.93019355541097e-05, "loss": 0.0081, "step": 516170 }, { "epoch": 1.34, "learning_rate": 9.929804733773825e-05, "loss": 0.012, "step": 516180 }, { "epoch": 1.34, "learning_rate": 9.929415912136677e-05, "loss": 0.0099, "step": 516190 }, { "epoch": 1.34, "learning_rate": 9.929027090499532e-05, "loss": 0.011, "step": 516200 }, { "epoch": 1.34, "learning_rate": 9.928638268862384e-05, "loss": 0.0103, "step": 516210 }, { "epoch": 1.34, "learning_rate": 9.928249447225238e-05, "loss": 0.0079, "step": 516220 }, { "epoch": 1.34, "learning_rate": 9.927860625588091e-05, "loss": 0.0084, "step": 516230 }, { "epoch": 1.34, "learning_rate": 9.927471803950945e-05, "loss": 0.0093, "step": 516240 }, { "epoch": 1.34, "learning_rate": 9.927082982313798e-05, "loss": 0.0087, "step": 516250 }, { "epoch": 1.34, "learning_rate": 9.926694160676654e-05, "loss": 0.0084, "step": 516260 }, { "epoch": 1.34, "learning_rate": 9.926305339039505e-05, "loss": 0.0082, "step": 516270 }, { "epoch": 1.34, "learning_rate": 9.925916517402361e-05, "loss": 0.0102, "step": 516280 }, { "epoch": 1.34, "learning_rate": 9.925527695765214e-05, "loss": 0.0113, "step": 516290 }, { "epoch": 1.34, "learning_rate": 9.925138874128068e-05, "loss": 0.0119, "step": 516300 }, { "epoch": 1.34, "learning_rate": 9.92475005249092e-05, "loss": 0.0074, "step": 516310 }, { "epoch": 1.34, "learning_rate": 9.924361230853773e-05, "loss": 0.012, "step": 516320 }, { "epoch": 1.34, "learning_rate": 9.923972409216628e-05, "loss": 0.0116, "step": 516330 }, { "epoch": 1.34, "learning_rate": 9.92358358757948e-05, "loss": 0.0101, "step": 516340 }, { "epoch": 1.34, "learning_rate": 9.923194765942334e-05, "loss": 0.0097, "step": 516350 }, { "epoch": 1.34, "learning_rate": 9.922805944305187e-05, "loss": 0.011, "step": 516360 }, { "epoch": 1.34, "learning_rate": 9.922417122668041e-05, "loss": 0.0092, "step": 516370 }, { "epoch": 1.34, "learning_rate": 9.922028301030894e-05, "loss": 0.0098, "step": 516380 }, { "epoch": 1.34, "learning_rate": 9.921639479393748e-05, "loss": 0.0081, "step": 516390 }, { "epoch": 1.34, "learning_rate": 9.921250657756601e-05, "loss": 0.0095, "step": 516400 }, { "epoch": 1.34, "learning_rate": 9.920861836119455e-05, "loss": 0.0108, "step": 516410 }, { "epoch": 1.34, "learning_rate": 9.920473014482308e-05, "loss": 0.0113, "step": 516420 }, { "epoch": 1.34, "learning_rate": 9.920084192845162e-05, "loss": 0.0104, "step": 516430 }, { "epoch": 1.34, "learning_rate": 9.919695371208015e-05, "loss": 0.0093, "step": 516440 }, { "epoch": 1.34, "learning_rate": 9.919306549570871e-05, "loss": 0.0079, "step": 516450 }, { "epoch": 1.34, "learning_rate": 9.918917727933724e-05, "loss": 0.0091, "step": 516460 }, { "epoch": 1.34, "learning_rate": 9.918528906296578e-05, "loss": 0.0089, "step": 516470 }, { "epoch": 1.34, "learning_rate": 9.91814008465943e-05, "loss": 0.0089, "step": 516480 }, { "epoch": 1.34, "learning_rate": 9.917751263022285e-05, "loss": 0.0085, "step": 516490 }, { "epoch": 1.34, "learning_rate": 9.917362441385137e-05, "loss": 0.0083, "step": 516500 }, { "epoch": 1.34, "learning_rate": 9.916973619747992e-05, "loss": 0.0102, "step": 516510 }, { "epoch": 1.34, "learning_rate": 9.916584798110844e-05, "loss": 0.0133, "step": 516520 }, { "epoch": 1.34, "learning_rate": 9.916195976473699e-05, "loss": 0.0127, "step": 516530 }, { "epoch": 1.34, "learning_rate": 9.915807154836551e-05, "loss": 0.0097, "step": 516540 }, { "epoch": 1.34, "learning_rate": 9.915418333199406e-05, "loss": 0.0107, "step": 516550 }, { "epoch": 1.34, "learning_rate": 9.915029511562258e-05, "loss": 0.0125, "step": 516560 }, { "epoch": 1.34, "learning_rate": 9.914640689925111e-05, "loss": 0.0094, "step": 516570 }, { "epoch": 1.34, "learning_rate": 9.914251868287965e-05, "loss": 0.0101, "step": 516580 }, { "epoch": 1.34, "learning_rate": 9.913863046650818e-05, "loss": 0.0109, "step": 516590 }, { "epoch": 1.34, "learning_rate": 9.913474225013672e-05, "loss": 0.0113, "step": 516600 }, { "epoch": 1.34, "learning_rate": 9.913085403376525e-05, "loss": 0.0081, "step": 516610 }, { "epoch": 1.34, "learning_rate": 9.912696581739379e-05, "loss": 0.0083, "step": 516620 }, { "epoch": 1.34, "learning_rate": 9.912307760102232e-05, "loss": 0.0078, "step": 516630 }, { "epoch": 1.34, "learning_rate": 9.911918938465088e-05, "loss": 0.0094, "step": 516640 }, { "epoch": 1.34, "learning_rate": 9.91153011682794e-05, "loss": 0.0107, "step": 516650 }, { "epoch": 1.34, "learning_rate": 9.911141295190795e-05, "loss": 0.0122, "step": 516660 }, { "epoch": 1.34, "learning_rate": 9.910752473553647e-05, "loss": 0.0142, "step": 516670 }, { "epoch": 1.34, "learning_rate": 9.910363651916502e-05, "loss": 0.0088, "step": 516680 }, { "epoch": 1.34, "learning_rate": 9.909974830279354e-05, "loss": 0.0089, "step": 516690 }, { "epoch": 1.34, "learning_rate": 9.909586008642209e-05, "loss": 0.0082, "step": 516700 }, { "epoch": 1.34, "learning_rate": 9.909197187005061e-05, "loss": 0.0089, "step": 516710 }, { "epoch": 1.34, "learning_rate": 9.908808365367916e-05, "loss": 0.007, "step": 516720 }, { "epoch": 1.34, "learning_rate": 9.908419543730768e-05, "loss": 0.0096, "step": 516730 }, { "epoch": 1.34, "learning_rate": 9.908030722093622e-05, "loss": 0.0093, "step": 516740 }, { "epoch": 1.34, "learning_rate": 9.907641900456475e-05, "loss": 0.01, "step": 516750 }, { "epoch": 1.34, "learning_rate": 9.90725307881933e-05, "loss": 0.0065, "step": 516760 }, { "epoch": 1.34, "learning_rate": 9.906864257182182e-05, "loss": 0.0105, "step": 516770 }, { "epoch": 1.34, "learning_rate": 9.906475435545036e-05, "loss": 0.0076, "step": 516780 }, { "epoch": 1.34, "learning_rate": 9.906086613907889e-05, "loss": 0.0095, "step": 516790 }, { "epoch": 1.34, "learning_rate": 9.905697792270745e-05, "loss": 0.0088, "step": 516800 }, { "epoch": 1.34, "learning_rate": 9.905308970633598e-05, "loss": 0.0087, "step": 516810 }, { "epoch": 1.34, "learning_rate": 9.90492014899645e-05, "loss": 0.0101, "step": 516820 }, { "epoch": 1.34, "learning_rate": 9.904531327359305e-05, "loss": 0.0089, "step": 516830 }, { "epoch": 1.34, "learning_rate": 9.904142505722157e-05, "loss": 0.0082, "step": 516840 }, { "epoch": 1.34, "learning_rate": 9.903753684085012e-05, "loss": 0.0069, "step": 516850 }, { "epoch": 1.34, "learning_rate": 9.903364862447864e-05, "loss": 0.0097, "step": 516860 }, { "epoch": 1.34, "learning_rate": 9.902976040810718e-05, "loss": 0.0096, "step": 516870 }, { "epoch": 1.34, "learning_rate": 9.902587219173571e-05, "loss": 0.0108, "step": 516880 }, { "epoch": 1.34, "learning_rate": 9.902198397536425e-05, "loss": 0.0103, "step": 516890 }, { "epoch": 1.34, "learning_rate": 9.901809575899278e-05, "loss": 0.0116, "step": 516900 }, { "epoch": 1.34, "learning_rate": 9.901420754262132e-05, "loss": 0.0091, "step": 516910 }, { "epoch": 1.34, "learning_rate": 9.901031932624985e-05, "loss": 0.0104, "step": 516920 }, { "epoch": 1.34, "learning_rate": 9.90064311098784e-05, "loss": 0.0092, "step": 516930 }, { "epoch": 1.34, "learning_rate": 9.900254289350692e-05, "loss": 0.0089, "step": 516940 }, { "epoch": 1.34, "learning_rate": 9.899865467713546e-05, "loss": 0.0127, "step": 516950 }, { "epoch": 1.34, "learning_rate": 9.899476646076399e-05, "loss": 0.0077, "step": 516960 }, { "epoch": 1.34, "learning_rate": 9.899087824439255e-05, "loss": 0.0112, "step": 516970 }, { "epoch": 1.34, "learning_rate": 9.898699002802106e-05, "loss": 0.0102, "step": 516980 }, { "epoch": 1.34, "learning_rate": 9.898310181164962e-05, "loss": 0.0115, "step": 516990 }, { "epoch": 1.34, "learning_rate": 9.897921359527814e-05, "loss": 0.0112, "step": 517000 }, { "epoch": 1.34, "eval_cer": 0.8816984874123652, "eval_loss": 0.006507012993097305, "eval_runtime": 107.881, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 517000 }, { "epoch": 1.34, "learning_rate": 9.897532537890669e-05, "loss": 0.0128, "step": 517010 }, { "epoch": 1.34, "learning_rate": 9.897143716253521e-05, "loss": 0.0128, "step": 517020 }, { "epoch": 1.34, "learning_rate": 9.896754894616376e-05, "loss": 0.0094, "step": 517030 }, { "epoch": 1.34, "learning_rate": 9.896366072979228e-05, "loss": 0.0101, "step": 517040 }, { "epoch": 1.34, "learning_rate": 9.895977251342083e-05, "loss": 0.012, "step": 517050 }, { "epoch": 1.34, "learning_rate": 9.895588429704935e-05, "loss": 0.0129, "step": 517060 }, { "epoch": 1.34, "learning_rate": 9.895199608067788e-05, "loss": 0.0094, "step": 517070 }, { "epoch": 1.34, "learning_rate": 9.894810786430642e-05, "loss": 0.0082, "step": 517080 }, { "epoch": 1.34, "learning_rate": 9.894421964793495e-05, "loss": 0.0092, "step": 517090 }, { "epoch": 1.34, "learning_rate": 9.89403314315635e-05, "loss": 0.008, "step": 517100 }, { "epoch": 1.34, "learning_rate": 9.893644321519202e-05, "loss": 0.0096, "step": 517110 }, { "epoch": 1.34, "learning_rate": 9.893255499882056e-05, "loss": 0.01, "step": 517120 }, { "epoch": 1.34, "learning_rate": 9.892866678244909e-05, "loss": 0.0107, "step": 517130 }, { "epoch": 1.34, "learning_rate": 9.892477856607763e-05, "loss": 0.0095, "step": 517140 }, { "epoch": 1.34, "learning_rate": 9.892089034970616e-05, "loss": 0.0099, "step": 517150 }, { "epoch": 1.34, "learning_rate": 9.891700213333472e-05, "loss": 0.0084, "step": 517160 }, { "epoch": 1.34, "learning_rate": 9.891311391696324e-05, "loss": 0.008, "step": 517170 }, { "epoch": 1.34, "learning_rate": 9.890922570059179e-05, "loss": 0.0104, "step": 517180 }, { "epoch": 1.34, "learning_rate": 9.890533748422031e-05, "loss": 0.0093, "step": 517190 }, { "epoch": 1.34, "learning_rate": 9.890144926784886e-05, "loss": 0.0114, "step": 517200 }, { "epoch": 1.34, "learning_rate": 9.889756105147738e-05, "loss": 0.0093, "step": 517210 }, { "epoch": 1.34, "learning_rate": 9.889367283510593e-05, "loss": 0.0124, "step": 517220 }, { "epoch": 1.34, "learning_rate": 9.888978461873445e-05, "loss": 0.0117, "step": 517230 }, { "epoch": 1.34, "learning_rate": 9.8885896402363e-05, "loss": 0.0087, "step": 517240 }, { "epoch": 1.34, "learning_rate": 9.888200818599152e-05, "loss": 0.0076, "step": 517250 }, { "epoch": 1.34, "learning_rate": 9.887811996962006e-05, "loss": 0.0118, "step": 517260 }, { "epoch": 1.34, "learning_rate": 9.887423175324859e-05, "loss": 0.007, "step": 517270 }, { "epoch": 1.34, "learning_rate": 9.887034353687713e-05, "loss": 0.01, "step": 517280 }, { "epoch": 1.34, "learning_rate": 9.886645532050566e-05, "loss": 0.0082, "step": 517290 }, { "epoch": 1.34, "learning_rate": 9.88625671041342e-05, "loss": 0.0095, "step": 517300 }, { "epoch": 1.34, "learning_rate": 9.885867888776273e-05, "loss": 0.0114, "step": 517310 }, { "epoch": 1.34, "learning_rate": 9.885479067139126e-05, "loss": 0.0107, "step": 517320 }, { "epoch": 1.34, "learning_rate": 9.885090245501982e-05, "loss": 0.0066, "step": 517330 }, { "epoch": 1.34, "learning_rate": 9.884701423864833e-05, "loss": 0.0081, "step": 517340 }, { "epoch": 1.34, "learning_rate": 9.884312602227689e-05, "loss": 0.0115, "step": 517350 }, { "epoch": 1.34, "learning_rate": 9.883923780590541e-05, "loss": 0.0106, "step": 517360 }, { "epoch": 1.34, "learning_rate": 9.883534958953396e-05, "loss": 0.0076, "step": 517370 }, { "epoch": 1.34, "learning_rate": 9.883146137316248e-05, "loss": 0.0121, "step": 517380 }, { "epoch": 1.34, "learning_rate": 9.882757315679102e-05, "loss": 0.0072, "step": 517390 }, { "epoch": 1.34, "learning_rate": 9.882368494041955e-05, "loss": 0.0079, "step": 517400 }, { "epoch": 1.34, "learning_rate": 9.88197967240481e-05, "loss": 0.0096, "step": 517410 }, { "epoch": 1.34, "learning_rate": 9.881590850767662e-05, "loss": 0.0124, "step": 517420 }, { "epoch": 1.34, "learning_rate": 9.881202029130516e-05, "loss": 0.0102, "step": 517430 }, { "epoch": 1.34, "learning_rate": 9.880813207493369e-05, "loss": 0.0091, "step": 517440 }, { "epoch": 1.34, "learning_rate": 9.880424385856223e-05, "loss": 0.0138, "step": 517450 }, { "epoch": 1.34, "learning_rate": 9.880035564219076e-05, "loss": 0.0085, "step": 517460 }, { "epoch": 1.34, "learning_rate": 9.87964674258193e-05, "loss": 0.0147, "step": 517470 }, { "epoch": 1.34, "learning_rate": 9.879257920944783e-05, "loss": 0.0095, "step": 517480 }, { "epoch": 1.34, "learning_rate": 9.878869099307639e-05, "loss": 0.0118, "step": 517490 }, { "epoch": 1.34, "learning_rate": 9.87848027767049e-05, "loss": 0.0103, "step": 517500 }, { "epoch": 1.34, "learning_rate": 9.878091456033346e-05, "loss": 0.0098, "step": 517510 }, { "epoch": 1.34, "learning_rate": 9.877702634396198e-05, "loss": 0.0099, "step": 517520 }, { "epoch": 1.34, "learning_rate": 9.877313812759053e-05, "loss": 0.0074, "step": 517530 }, { "epoch": 1.34, "learning_rate": 9.876924991121905e-05, "loss": 0.0108, "step": 517540 }, { "epoch": 1.34, "learning_rate": 9.87653616948476e-05, "loss": 0.0108, "step": 517550 }, { "epoch": 1.34, "learning_rate": 9.876147347847612e-05, "loss": 0.0116, "step": 517560 }, { "epoch": 1.34, "learning_rate": 9.875758526210465e-05, "loss": 0.0127, "step": 517570 }, { "epoch": 1.34, "learning_rate": 9.87536970457332e-05, "loss": 0.0108, "step": 517580 }, { "epoch": 1.34, "learning_rate": 9.874980882936172e-05, "loss": 0.0078, "step": 517590 }, { "epoch": 1.34, "learning_rate": 9.874592061299026e-05, "loss": 0.0098, "step": 517600 }, { "epoch": 1.34, "learning_rate": 9.874203239661879e-05, "loss": 0.0096, "step": 517610 }, { "epoch": 1.34, "learning_rate": 9.873814418024733e-05, "loss": 0.0107, "step": 517620 }, { "epoch": 1.34, "learning_rate": 9.873425596387586e-05, "loss": 0.0099, "step": 517630 }, { "epoch": 1.34, "learning_rate": 9.87303677475044e-05, "loss": 0.0103, "step": 517640 }, { "epoch": 1.34, "learning_rate": 9.872647953113293e-05, "loss": 0.0084, "step": 517650 }, { "epoch": 1.34, "learning_rate": 9.872259131476147e-05, "loss": 0.0122, "step": 517660 }, { "epoch": 1.34, "learning_rate": 9.871870309839e-05, "loss": 0.0086, "step": 517670 }, { "epoch": 1.34, "learning_rate": 9.871481488201856e-05, "loss": 0.0117, "step": 517680 }, { "epoch": 1.34, "learning_rate": 9.871092666564708e-05, "loss": 0.0126, "step": 517690 }, { "epoch": 1.34, "learning_rate": 9.870703844927563e-05, "loss": 0.012, "step": 517700 }, { "epoch": 1.34, "learning_rate": 9.870315023290415e-05, "loss": 0.0079, "step": 517710 }, { "epoch": 1.34, "learning_rate": 9.86992620165327e-05, "loss": 0.0092, "step": 517720 }, { "epoch": 1.34, "learning_rate": 9.869537380016122e-05, "loss": 0.0164, "step": 517730 }, { "epoch": 1.34, "learning_rate": 9.869148558378977e-05, "loss": 0.0112, "step": 517740 }, { "epoch": 1.34, "learning_rate": 9.86875973674183e-05, "loss": 0.0116, "step": 517750 }, { "epoch": 1.34, "learning_rate": 9.868370915104683e-05, "loss": 0.0131, "step": 517760 }, { "epoch": 1.34, "learning_rate": 9.867982093467536e-05, "loss": 0.0122, "step": 517770 }, { "epoch": 1.34, "learning_rate": 9.86759327183039e-05, "loss": 0.01, "step": 517780 }, { "epoch": 1.34, "learning_rate": 9.867204450193243e-05, "loss": 0.0109, "step": 517790 }, { "epoch": 1.34, "learning_rate": 9.866815628556096e-05, "loss": 0.0118, "step": 517800 }, { "epoch": 1.34, "learning_rate": 9.86642680691895e-05, "loss": 0.01, "step": 517810 }, { "epoch": 1.34, "learning_rate": 9.866037985281803e-05, "loss": 0.0111, "step": 517820 }, { "epoch": 1.34, "learning_rate": 9.865649163644657e-05, "loss": 0.009, "step": 517830 }, { "epoch": 1.34, "learning_rate": 9.86526034200751e-05, "loss": 0.0122, "step": 517840 }, { "epoch": 1.34, "learning_rate": 9.864871520370366e-05, "loss": 0.0102, "step": 517850 }, { "epoch": 1.34, "learning_rate": 9.864482698733217e-05, "loss": 0.0106, "step": 517860 }, { "epoch": 1.34, "learning_rate": 9.864093877096073e-05, "loss": 0.0078, "step": 517870 }, { "epoch": 1.34, "learning_rate": 9.863705055458925e-05, "loss": 0.0088, "step": 517880 }, { "epoch": 1.34, "learning_rate": 9.86331623382178e-05, "loss": 0.009, "step": 517890 }, { "epoch": 1.34, "learning_rate": 9.862927412184632e-05, "loss": 0.0094, "step": 517900 }, { "epoch": 1.34, "learning_rate": 9.862538590547486e-05, "loss": 0.0099, "step": 517910 }, { "epoch": 1.34, "learning_rate": 9.862149768910339e-05, "loss": 0.012, "step": 517920 }, { "epoch": 1.34, "learning_rate": 9.861760947273193e-05, "loss": 0.0073, "step": 517930 }, { "epoch": 1.34, "learning_rate": 9.861372125636046e-05, "loss": 0.0121, "step": 517940 }, { "epoch": 1.34, "learning_rate": 9.8609833039989e-05, "loss": 0.008, "step": 517950 }, { "epoch": 1.34, "learning_rate": 9.860594482361753e-05, "loss": 0.0097, "step": 517960 }, { "epoch": 1.34, "learning_rate": 9.860205660724607e-05, "loss": 0.0108, "step": 517970 }, { "epoch": 1.34, "learning_rate": 9.85981683908746e-05, "loss": 0.0088, "step": 517980 }, { "epoch": 1.34, "learning_rate": 9.859428017450314e-05, "loss": 0.0128, "step": 517990 }, { "epoch": 1.34, "learning_rate": 9.859039195813167e-05, "loss": 0.0113, "step": 518000 }, { "epoch": 1.34, "eval_cer": 0.8816536990304715, "eval_loss": 0.006467238999903202, "eval_runtime": 107.9416, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 518000 }, { "epoch": 1.34, "learning_rate": 9.858650374176021e-05, "loss": 0.0113, "step": 518010 }, { "epoch": 1.34, "learning_rate": 9.858261552538874e-05, "loss": 0.0135, "step": 518020 }, { "epoch": 1.34, "learning_rate": 9.85787273090173e-05, "loss": 0.0081, "step": 518030 }, { "epoch": 1.34, "learning_rate": 9.857483909264582e-05, "loss": 0.0122, "step": 518040 }, { "epoch": 1.34, "learning_rate": 9.857095087627435e-05, "loss": 0.011, "step": 518050 }, { "epoch": 1.34, "learning_rate": 9.85670626599029e-05, "loss": 0.0107, "step": 518060 }, { "epoch": 1.34, "learning_rate": 9.856317444353142e-05, "loss": 0.0103, "step": 518070 }, { "epoch": 1.34, "learning_rate": 9.855928622715996e-05, "loss": 0.0098, "step": 518080 }, { "epoch": 1.34, "learning_rate": 9.855539801078849e-05, "loss": 0.0121, "step": 518090 }, { "epoch": 1.34, "learning_rate": 9.855150979441703e-05, "loss": 0.0102, "step": 518100 }, { "epoch": 1.34, "learning_rate": 9.854762157804556e-05, "loss": 0.0097, "step": 518110 }, { "epoch": 1.34, "learning_rate": 9.85437333616741e-05, "loss": 0.0106, "step": 518120 }, { "epoch": 1.34, "learning_rate": 9.853984514530263e-05, "loss": 0.0102, "step": 518130 }, { "epoch": 1.34, "learning_rate": 9.853595692893117e-05, "loss": 0.0129, "step": 518140 }, { "epoch": 1.34, "learning_rate": 9.85320687125597e-05, "loss": 0.0076, "step": 518150 }, { "epoch": 1.34, "learning_rate": 9.852818049618824e-05, "loss": 0.0158, "step": 518160 }, { "epoch": 1.34, "learning_rate": 9.852429227981677e-05, "loss": 0.0094, "step": 518170 }, { "epoch": 1.34, "learning_rate": 9.852040406344531e-05, "loss": 0.0085, "step": 518180 }, { "epoch": 1.34, "learning_rate": 9.851651584707384e-05, "loss": 0.0121, "step": 518190 }, { "epoch": 1.34, "learning_rate": 9.85126276307024e-05, "loss": 0.0089, "step": 518200 }, { "epoch": 1.34, "learning_rate": 9.850873941433091e-05, "loss": 0.0101, "step": 518210 }, { "epoch": 1.34, "learning_rate": 9.850485119795947e-05, "loss": 0.0095, "step": 518220 }, { "epoch": 1.34, "learning_rate": 9.8500962981588e-05, "loss": 0.01, "step": 518230 }, { "epoch": 1.34, "learning_rate": 9.849707476521654e-05, "loss": 0.0103, "step": 518240 }, { "epoch": 1.34, "learning_rate": 9.849318654884506e-05, "loss": 0.008, "step": 518250 }, { "epoch": 1.34, "learning_rate": 9.84892983324736e-05, "loss": 0.0095, "step": 518260 }, { "epoch": 1.34, "learning_rate": 9.848541011610213e-05, "loss": 0.0078, "step": 518270 }, { "epoch": 1.34, "learning_rate": 9.848152189973067e-05, "loss": 0.0094, "step": 518280 }, { "epoch": 1.34, "learning_rate": 9.84776336833592e-05, "loss": 0.0123, "step": 518290 }, { "epoch": 1.34, "learning_rate": 9.847374546698773e-05, "loss": 0.0104, "step": 518300 }, { "epoch": 1.34, "learning_rate": 9.846985725061627e-05, "loss": 0.0092, "step": 518310 }, { "epoch": 1.34, "learning_rate": 9.84659690342448e-05, "loss": 0.0086, "step": 518320 }, { "epoch": 1.34, "learning_rate": 9.846208081787334e-05, "loss": 0.0101, "step": 518330 }, { "epoch": 1.34, "learning_rate": 9.845819260150187e-05, "loss": 0.0088, "step": 518340 }, { "epoch": 1.34, "learning_rate": 9.845430438513041e-05, "loss": 0.0089, "step": 518350 }, { "epoch": 1.34, "learning_rate": 9.845041616875894e-05, "loss": 0.0108, "step": 518360 }, { "epoch": 1.34, "learning_rate": 9.844652795238748e-05, "loss": 0.0078, "step": 518370 }, { "epoch": 1.34, "learning_rate": 9.844263973601601e-05, "loss": 0.008, "step": 518380 }, { "epoch": 1.34, "learning_rate": 9.843875151964457e-05, "loss": 0.0106, "step": 518390 }, { "epoch": 1.34, "learning_rate": 9.843486330327309e-05, "loss": 0.0109, "step": 518400 }, { "epoch": 1.34, "learning_rate": 9.843097508690163e-05, "loss": 0.0098, "step": 518410 }, { "epoch": 1.34, "learning_rate": 9.842708687053016e-05, "loss": 0.0114, "step": 518420 }, { "epoch": 1.34, "learning_rate": 9.84231986541587e-05, "loss": 0.0116, "step": 518430 }, { "epoch": 1.34, "learning_rate": 9.841931043778723e-05, "loss": 0.0081, "step": 518440 }, { "epoch": 1.34, "learning_rate": 9.841542222141577e-05, "loss": 0.0111, "step": 518450 }, { "epoch": 1.34, "learning_rate": 9.84115340050443e-05, "loss": 0.0094, "step": 518460 }, { "epoch": 1.34, "learning_rate": 9.840764578867284e-05, "loss": 0.0109, "step": 518470 }, { "epoch": 1.34, "learning_rate": 9.840375757230137e-05, "loss": 0.0078, "step": 518480 }, { "epoch": 1.34, "learning_rate": 9.839986935592991e-05, "loss": 0.0104, "step": 518490 }, { "epoch": 1.34, "learning_rate": 9.839598113955844e-05, "loss": 0.0109, "step": 518500 }, { "epoch": 1.34, "learning_rate": 9.839209292318698e-05, "loss": 0.0106, "step": 518510 }, { "epoch": 1.34, "learning_rate": 9.838820470681551e-05, "loss": 0.0135, "step": 518520 }, { "epoch": 1.34, "learning_rate": 9.838431649044405e-05, "loss": 0.0077, "step": 518530 }, { "epoch": 1.34, "learning_rate": 9.838042827407258e-05, "loss": 0.0082, "step": 518540 }, { "epoch": 1.34, "learning_rate": 9.837654005770111e-05, "loss": 0.0086, "step": 518550 }, { "epoch": 1.34, "learning_rate": 9.837265184132966e-05, "loss": 0.0115, "step": 518560 }, { "epoch": 1.34, "learning_rate": 9.836876362495818e-05, "loss": 0.0111, "step": 518570 }, { "epoch": 1.34, "learning_rate": 9.836487540858673e-05, "loss": 0.0096, "step": 518580 }, { "epoch": 1.34, "learning_rate": 9.836098719221526e-05, "loss": 0.011, "step": 518590 }, { "epoch": 1.34, "learning_rate": 9.83570989758438e-05, "loss": 0.01, "step": 518600 }, { "epoch": 1.34, "learning_rate": 9.835321075947233e-05, "loss": 0.0119, "step": 518610 }, { "epoch": 1.34, "learning_rate": 9.834932254310087e-05, "loss": 0.0109, "step": 518620 }, { "epoch": 1.34, "learning_rate": 9.83454343267294e-05, "loss": 0.0103, "step": 518630 }, { "epoch": 1.34, "learning_rate": 9.834154611035794e-05, "loss": 0.0084, "step": 518640 }, { "epoch": 1.34, "learning_rate": 9.833765789398647e-05, "loss": 0.0097, "step": 518650 }, { "epoch": 1.34, "learning_rate": 9.833376967761501e-05, "loss": 0.0097, "step": 518660 }, { "epoch": 1.34, "learning_rate": 9.832988146124354e-05, "loss": 0.0106, "step": 518670 }, { "epoch": 1.34, "learning_rate": 9.832599324487208e-05, "loss": 0.0089, "step": 518680 }, { "epoch": 1.34, "learning_rate": 9.832210502850061e-05, "loss": 0.0067, "step": 518690 }, { "epoch": 1.34, "learning_rate": 9.831821681212915e-05, "loss": 0.0171, "step": 518700 }, { "epoch": 1.34, "learning_rate": 9.831432859575768e-05, "loss": 0.009, "step": 518710 }, { "epoch": 1.34, "learning_rate": 9.831044037938624e-05, "loss": 0.0085, "step": 518720 }, { "epoch": 1.34, "learning_rate": 9.830655216301475e-05, "loss": 0.008, "step": 518730 }, { "epoch": 1.34, "learning_rate": 9.83026639466433e-05, "loss": 0.0117, "step": 518740 }, { "epoch": 1.34, "learning_rate": 9.829877573027183e-05, "loss": 0.009, "step": 518750 }, { "epoch": 1.34, "learning_rate": 9.829488751390038e-05, "loss": 0.0096, "step": 518760 }, { "epoch": 1.34, "learning_rate": 9.82909992975289e-05, "loss": 0.0096, "step": 518770 }, { "epoch": 1.34, "learning_rate": 9.828711108115745e-05, "loss": 0.0144, "step": 518780 }, { "epoch": 1.34, "learning_rate": 9.828322286478597e-05, "loss": 0.0083, "step": 518790 }, { "epoch": 1.34, "learning_rate": 9.82793346484145e-05, "loss": 0.0094, "step": 518800 }, { "epoch": 1.34, "learning_rate": 9.827544643204304e-05, "loss": 0.0092, "step": 518810 }, { "epoch": 1.34, "learning_rate": 9.827155821567157e-05, "loss": 0.0111, "step": 518820 }, { "epoch": 1.34, "learning_rate": 9.826766999930011e-05, "loss": 0.0095, "step": 518830 }, { "epoch": 1.34, "learning_rate": 9.826378178292864e-05, "loss": 0.0103, "step": 518840 }, { "epoch": 1.34, "learning_rate": 9.825989356655718e-05, "loss": 0.0122, "step": 518850 }, { "epoch": 1.34, "learning_rate": 9.825600535018571e-05, "loss": 0.0109, "step": 518860 }, { "epoch": 1.34, "learning_rate": 9.825211713381425e-05, "loss": 0.0092, "step": 518870 }, { "epoch": 1.35, "learning_rate": 9.824822891744278e-05, "loss": 0.0108, "step": 518880 }, { "epoch": 1.35, "learning_rate": 9.824434070107132e-05, "loss": 0.0084, "step": 518890 }, { "epoch": 1.35, "learning_rate": 9.824045248469985e-05, "loss": 0.0088, "step": 518900 }, { "epoch": 1.35, "learning_rate": 9.82365642683284e-05, "loss": 0.008, "step": 518910 }, { "epoch": 1.35, "learning_rate": 9.823267605195693e-05, "loss": 0.0096, "step": 518920 }, { "epoch": 1.35, "learning_rate": 9.822878783558547e-05, "loss": 0.0074, "step": 518930 }, { "epoch": 1.35, "learning_rate": 9.8224899619214e-05, "loss": 0.0094, "step": 518940 }, { "epoch": 1.35, "learning_rate": 9.822101140284254e-05, "loss": 0.0101, "step": 518950 }, { "epoch": 1.35, "learning_rate": 9.821712318647107e-05, "loss": 0.007, "step": 518960 }, { "epoch": 1.35, "learning_rate": 9.821323497009961e-05, "loss": 0.0115, "step": 518970 }, { "epoch": 1.35, "learning_rate": 9.820934675372814e-05, "loss": 0.0089, "step": 518980 }, { "epoch": 1.35, "learning_rate": 9.820545853735668e-05, "loss": 0.0079, "step": 518990 }, { "epoch": 1.35, "learning_rate": 9.820157032098521e-05, "loss": 0.0079, "step": 519000 }, { "epoch": 1.35, "eval_cer": 0.8816928888646285, "eval_loss": 0.006426098756492138, "eval_runtime": 107.8933, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 519000 }, { "epoch": 1.35, "learning_rate": 9.819768210461375e-05, "loss": 0.0138, "step": 519010 }, { "epoch": 1.35, "learning_rate": 9.819379388824228e-05, "loss": 0.009, "step": 519020 }, { "epoch": 1.35, "learning_rate": 9.818990567187082e-05, "loss": 0.0089, "step": 519030 }, { "epoch": 1.35, "learning_rate": 9.818601745549935e-05, "loss": 0.0121, "step": 519040 }, { "epoch": 1.35, "learning_rate": 9.818212923912788e-05, "loss": 0.0104, "step": 519050 }, { "epoch": 1.35, "learning_rate": 9.817824102275642e-05, "loss": 0.011, "step": 519060 }, { "epoch": 1.35, "learning_rate": 9.817435280638495e-05, "loss": 0.0119, "step": 519070 }, { "epoch": 1.35, "learning_rate": 9.81704645900135e-05, "loss": 0.0111, "step": 519080 }, { "epoch": 1.35, "learning_rate": 9.816657637364202e-05, "loss": 0.011, "step": 519090 }, { "epoch": 1.35, "learning_rate": 9.816268815727057e-05, "loss": 0.0089, "step": 519100 }, { "epoch": 1.35, "learning_rate": 9.81587999408991e-05, "loss": 0.0106, "step": 519110 }, { "epoch": 1.35, "learning_rate": 9.815491172452764e-05, "loss": 0.0093, "step": 519120 }, { "epoch": 1.35, "learning_rate": 9.815102350815617e-05, "loss": 0.009, "step": 519130 }, { "epoch": 1.35, "learning_rate": 9.814713529178471e-05, "loss": 0.012, "step": 519140 }, { "epoch": 1.35, "learning_rate": 9.814324707541324e-05, "loss": 0.009, "step": 519150 }, { "epoch": 1.35, "learning_rate": 9.813935885904178e-05, "loss": 0.0102, "step": 519160 }, { "epoch": 1.35, "learning_rate": 9.813547064267031e-05, "loss": 0.0091, "step": 519170 }, { "epoch": 1.35, "learning_rate": 9.813158242629885e-05, "loss": 0.0075, "step": 519180 }, { "epoch": 1.35, "learning_rate": 9.812769420992738e-05, "loss": 0.0093, "step": 519190 }, { "epoch": 1.35, "learning_rate": 9.812380599355592e-05, "loss": 0.007, "step": 519200 }, { "epoch": 1.35, "learning_rate": 9.811991777718445e-05, "loss": 0.0117, "step": 519210 }, { "epoch": 1.35, "learning_rate": 9.811602956081299e-05, "loss": 0.0102, "step": 519220 }, { "epoch": 1.35, "learning_rate": 9.811214134444152e-05, "loss": 0.0105, "step": 519230 }, { "epoch": 1.35, "learning_rate": 9.810825312807006e-05, "loss": 0.0101, "step": 519240 }, { "epoch": 1.35, "learning_rate": 9.810436491169859e-05, "loss": 0.0098, "step": 519250 }, { "epoch": 1.35, "learning_rate": 9.810047669532715e-05, "loss": 0.008, "step": 519260 }, { "epoch": 1.35, "learning_rate": 9.809658847895567e-05, "loss": 0.0105, "step": 519270 }, { "epoch": 1.35, "learning_rate": 9.809270026258422e-05, "loss": 0.0168, "step": 519280 }, { "epoch": 1.35, "learning_rate": 9.808881204621274e-05, "loss": 0.0081, "step": 519290 }, { "epoch": 1.35, "learning_rate": 9.808492382984127e-05, "loss": 0.0077, "step": 519300 }, { "epoch": 1.35, "learning_rate": 9.808103561346981e-05, "loss": 0.0102, "step": 519310 }, { "epoch": 1.35, "learning_rate": 9.807714739709834e-05, "loss": 0.0109, "step": 519320 }, { "epoch": 1.35, "learning_rate": 9.807325918072688e-05, "loss": 0.0129, "step": 519330 }, { "epoch": 1.35, "learning_rate": 9.806937096435541e-05, "loss": 0.0086, "step": 519340 }, { "epoch": 1.35, "learning_rate": 9.806548274798395e-05, "loss": 0.0082, "step": 519350 }, { "epoch": 1.35, "learning_rate": 9.806159453161248e-05, "loss": 0.0153, "step": 519360 }, { "epoch": 1.35, "learning_rate": 9.805770631524102e-05, "loss": 0.0123, "step": 519370 }, { "epoch": 1.35, "learning_rate": 9.805381809886955e-05, "loss": 0.0121, "step": 519380 }, { "epoch": 1.35, "learning_rate": 9.804992988249809e-05, "loss": 0.0096, "step": 519390 }, { "epoch": 1.35, "learning_rate": 9.804604166612662e-05, "loss": 0.0172, "step": 519400 }, { "epoch": 1.35, "learning_rate": 9.804215344975516e-05, "loss": 0.0087, "step": 519410 }, { "epoch": 1.35, "learning_rate": 9.803826523338369e-05, "loss": 0.008, "step": 519420 }, { "epoch": 1.35, "learning_rate": 9.803437701701224e-05, "loss": 0.0106, "step": 519430 }, { "epoch": 1.35, "learning_rate": 9.803048880064077e-05, "loss": 0.0098, "step": 519440 }, { "epoch": 1.35, "learning_rate": 9.802660058426931e-05, "loss": 0.0085, "step": 519450 }, { "epoch": 1.35, "learning_rate": 9.802271236789784e-05, "loss": 0.0095, "step": 519460 }, { "epoch": 1.35, "learning_rate": 9.801882415152638e-05, "loss": 0.0082, "step": 519470 }, { "epoch": 1.35, "learning_rate": 9.801493593515491e-05, "loss": 0.0106, "step": 519480 }, { "epoch": 1.35, "learning_rate": 9.801104771878345e-05, "loss": 0.0109, "step": 519490 }, { "epoch": 1.35, "learning_rate": 9.800715950241198e-05, "loss": 0.0091, "step": 519500 }, { "epoch": 1.35, "learning_rate": 9.800327128604052e-05, "loss": 0.011, "step": 519510 }, { "epoch": 1.35, "learning_rate": 9.799938306966905e-05, "loss": 0.0092, "step": 519520 }, { "epoch": 1.35, "learning_rate": 9.79954948532976e-05, "loss": 0.0105, "step": 519530 }, { "epoch": 1.35, "learning_rate": 9.799160663692612e-05, "loss": 0.009, "step": 519540 }, { "epoch": 1.35, "learning_rate": 9.798771842055465e-05, "loss": 0.0091, "step": 519550 }, { "epoch": 1.35, "learning_rate": 9.798383020418319e-05, "loss": 0.0098, "step": 519560 }, { "epoch": 1.35, "learning_rate": 9.797994198781172e-05, "loss": 0.0095, "step": 519570 }, { "epoch": 1.35, "learning_rate": 9.797605377144026e-05, "loss": 0.0077, "step": 519580 }, { "epoch": 1.35, "learning_rate": 9.797216555506879e-05, "loss": 0.0119, "step": 519590 }, { "epoch": 1.35, "learning_rate": 9.796827733869733e-05, "loss": 0.0092, "step": 519600 }, { "epoch": 1.35, "learning_rate": 9.796438912232586e-05, "loss": 0.0095, "step": 519610 }, { "epoch": 1.35, "learning_rate": 9.796050090595441e-05, "loss": 0.0101, "step": 519620 }, { "epoch": 1.35, "learning_rate": 9.795661268958294e-05, "loss": 0.0078, "step": 519630 }, { "epoch": 1.35, "learning_rate": 9.795272447321148e-05, "loss": 0.0092, "step": 519640 }, { "epoch": 1.35, "learning_rate": 9.794883625684001e-05, "loss": 0.0116, "step": 519650 }, { "epoch": 1.35, "learning_rate": 9.794494804046855e-05, "loss": 0.0084, "step": 519660 }, { "epoch": 1.35, "learning_rate": 9.794105982409708e-05, "loss": 0.0109, "step": 519670 }, { "epoch": 1.35, "learning_rate": 9.793717160772562e-05, "loss": 0.0109, "step": 519680 }, { "epoch": 1.35, "learning_rate": 9.793328339135415e-05, "loss": 0.0097, "step": 519690 }, { "epoch": 1.35, "learning_rate": 9.792939517498269e-05, "loss": 0.0077, "step": 519700 }, { "epoch": 1.35, "learning_rate": 9.792550695861122e-05, "loss": 0.0069, "step": 519710 }, { "epoch": 1.35, "learning_rate": 9.792161874223976e-05, "loss": 0.0086, "step": 519720 }, { "epoch": 1.35, "learning_rate": 9.791773052586829e-05, "loss": 0.0081, "step": 519730 }, { "epoch": 1.35, "learning_rate": 9.791384230949683e-05, "loss": 0.0088, "step": 519740 }, { "epoch": 1.35, "learning_rate": 9.790995409312536e-05, "loss": 0.0141, "step": 519750 }, { "epoch": 1.35, "learning_rate": 9.79060658767539e-05, "loss": 0.012, "step": 519760 }, { "epoch": 1.35, "learning_rate": 9.790217766038243e-05, "loss": 0.0116, "step": 519770 }, { "epoch": 1.35, "learning_rate": 9.789828944401099e-05, "loss": 0.0154, "step": 519780 }, { "epoch": 1.35, "learning_rate": 9.789440122763951e-05, "loss": 0.0173, "step": 519790 }, { "epoch": 1.35, "learning_rate": 9.789051301126803e-05, "loss": 0.007, "step": 519800 }, { "epoch": 1.35, "learning_rate": 9.788662479489658e-05, "loss": 0.0111, "step": 519810 }, { "epoch": 1.35, "learning_rate": 9.788273657852511e-05, "loss": 0.0131, "step": 519820 }, { "epoch": 1.35, "learning_rate": 9.787884836215365e-05, "loss": 0.0147, "step": 519830 }, { "epoch": 1.35, "learning_rate": 9.787496014578218e-05, "loss": 0.0087, "step": 519840 }, { "epoch": 1.35, "learning_rate": 9.787107192941072e-05, "loss": 0.0107, "step": 519850 }, { "epoch": 1.35, "learning_rate": 9.786718371303925e-05, "loss": 0.011, "step": 519860 }, { "epoch": 1.35, "learning_rate": 9.786329549666779e-05, "loss": 0.0113, "step": 519870 }, { "epoch": 1.35, "learning_rate": 9.785940728029632e-05, "loss": 0.0097, "step": 519880 }, { "epoch": 1.35, "learning_rate": 9.785551906392486e-05, "loss": 0.0094, "step": 519890 }, { "epoch": 1.35, "learning_rate": 9.785163084755339e-05, "loss": 0.0147, "step": 519900 }, { "epoch": 1.35, "learning_rate": 9.784774263118193e-05, "loss": 0.0102, "step": 519910 }, { "epoch": 1.35, "learning_rate": 9.784385441481046e-05, "loss": 0.0115, "step": 519920 }, { "epoch": 1.35, "learning_rate": 9.7839966198439e-05, "loss": 0.0086, "step": 519930 }, { "epoch": 1.35, "learning_rate": 9.783607798206753e-05, "loss": 0.0102, "step": 519940 }, { "epoch": 1.35, "learning_rate": 9.783218976569608e-05, "loss": 0.009, "step": 519950 }, { "epoch": 1.35, "learning_rate": 9.78283015493246e-05, "loss": 0.0099, "step": 519960 }, { "epoch": 1.35, "learning_rate": 9.782441333295315e-05, "loss": 0.0102, "step": 519970 }, { "epoch": 1.35, "learning_rate": 9.782052511658168e-05, "loss": 0.0092, "step": 519980 }, { "epoch": 1.35, "learning_rate": 9.781663690021022e-05, "loss": 0.0107, "step": 519990 }, { "epoch": 1.35, "learning_rate": 9.781274868383875e-05, "loss": 0.0105, "step": 520000 }, { "epoch": 1.35, "eval_cer": 0.8816956881384969, "eval_loss": 0.006626142654567957, "eval_runtime": 107.8646, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 520000 }, { "epoch": 1.35, "learning_rate": 9.78088604674673e-05, "loss": 0.0113, "step": 520010 }, { "epoch": 1.35, "learning_rate": 9.780497225109582e-05, "loss": 0.0097, "step": 520020 }, { "epoch": 1.35, "learning_rate": 9.780108403472436e-05, "loss": 0.0088, "step": 520030 }, { "epoch": 1.35, "learning_rate": 9.779719581835289e-05, "loss": 0.0105, "step": 520040 }, { "epoch": 1.35, "learning_rate": 9.779330760198142e-05, "loss": 0.0097, "step": 520050 }, { "epoch": 1.35, "learning_rate": 9.778941938560996e-05, "loss": 0.0105, "step": 520060 }, { "epoch": 1.35, "learning_rate": 9.778553116923849e-05, "loss": 0.0084, "step": 520070 }, { "epoch": 1.35, "learning_rate": 9.778164295286703e-05, "loss": 0.0079, "step": 520080 }, { "epoch": 1.35, "learning_rate": 9.777775473649556e-05, "loss": 0.0233, "step": 520090 }, { "epoch": 1.35, "learning_rate": 9.77738665201241e-05, "loss": 0.0116, "step": 520100 }, { "epoch": 1.35, "learning_rate": 9.776997830375263e-05, "loss": 0.0131, "step": 520110 }, { "epoch": 1.35, "learning_rate": 9.776609008738117e-05, "loss": 0.0085, "step": 520120 }, { "epoch": 1.35, "learning_rate": 9.77622018710097e-05, "loss": 0.0087, "step": 520130 }, { "epoch": 1.35, "learning_rate": 9.775831365463825e-05, "loss": 0.0073, "step": 520140 }, { "epoch": 1.35, "learning_rate": 9.775442543826678e-05, "loss": 0.0085, "step": 520150 }, { "epoch": 1.35, "learning_rate": 9.775053722189532e-05, "loss": 0.016, "step": 520160 }, { "epoch": 1.35, "learning_rate": 9.774664900552385e-05, "loss": 0.012, "step": 520170 }, { "epoch": 1.35, "learning_rate": 9.77427607891524e-05, "loss": 0.0075, "step": 520180 }, { "epoch": 1.35, "learning_rate": 9.773887257278092e-05, "loss": 0.0087, "step": 520190 }, { "epoch": 1.35, "learning_rate": 9.773498435640946e-05, "loss": 0.0081, "step": 520200 }, { "epoch": 1.35, "learning_rate": 9.773109614003799e-05, "loss": 0.0134, "step": 520210 }, { "epoch": 1.35, "learning_rate": 9.772720792366653e-05, "loss": 0.0082, "step": 520220 }, { "epoch": 1.35, "learning_rate": 9.772331970729506e-05, "loss": 0.01, "step": 520230 }, { "epoch": 1.35, "learning_rate": 9.77194314909236e-05, "loss": 0.0081, "step": 520240 }, { "epoch": 1.35, "learning_rate": 9.771554327455213e-05, "loss": 0.0082, "step": 520250 }, { "epoch": 1.35, "learning_rate": 9.771165505818067e-05, "loss": 0.0094, "step": 520260 }, { "epoch": 1.35, "learning_rate": 9.77077668418092e-05, "loss": 0.0078, "step": 520270 }, { "epoch": 1.35, "learning_rate": 9.770387862543773e-05, "loss": 0.0093, "step": 520280 }, { "epoch": 1.35, "learning_rate": 9.769999040906627e-05, "loss": 0.0085, "step": 520290 }, { "epoch": 1.35, "learning_rate": 9.76961021926948e-05, "loss": 0.0098, "step": 520300 }, { "epoch": 1.35, "learning_rate": 9.769221397632335e-05, "loss": 0.011, "step": 520310 }, { "epoch": 1.35, "learning_rate": 9.768832575995187e-05, "loss": 0.0107, "step": 520320 }, { "epoch": 1.35, "learning_rate": 9.768443754358042e-05, "loss": 0.0149, "step": 520330 }, { "epoch": 1.35, "learning_rate": 9.768054932720895e-05, "loss": 0.0095, "step": 520340 }, { "epoch": 1.35, "learning_rate": 9.767666111083749e-05, "loss": 0.0086, "step": 520350 }, { "epoch": 1.35, "learning_rate": 9.767277289446602e-05, "loss": 0.009, "step": 520360 }, { "epoch": 1.35, "learning_rate": 9.766888467809456e-05, "loss": 0.0134, "step": 520370 }, { "epoch": 1.35, "learning_rate": 9.766499646172309e-05, "loss": 0.0107, "step": 520380 }, { "epoch": 1.35, "learning_rate": 9.766110824535163e-05, "loss": 0.0092, "step": 520390 }, { "epoch": 1.35, "learning_rate": 9.765722002898016e-05, "loss": 0.0109, "step": 520400 }, { "epoch": 1.35, "learning_rate": 9.76533318126087e-05, "loss": 0.0115, "step": 520410 }, { "epoch": 1.35, "learning_rate": 9.764944359623723e-05, "loss": 0.0089, "step": 520420 }, { "epoch": 1.35, "learning_rate": 9.764555537986577e-05, "loss": 0.0105, "step": 520430 }, { "epoch": 1.35, "learning_rate": 9.76416671634943e-05, "loss": 0.0088, "step": 520440 }, { "epoch": 1.35, "learning_rate": 9.763777894712284e-05, "loss": 0.0114, "step": 520450 }, { "epoch": 1.35, "learning_rate": 9.763389073075137e-05, "loss": 0.0069, "step": 520460 }, { "epoch": 1.35, "learning_rate": 9.763000251437992e-05, "loss": 0.0097, "step": 520470 }, { "epoch": 1.35, "learning_rate": 9.762611429800844e-05, "loss": 0.0117, "step": 520480 }, { "epoch": 1.35, "learning_rate": 9.7622226081637e-05, "loss": 0.0105, "step": 520490 }, { "epoch": 1.35, "learning_rate": 9.761833786526552e-05, "loss": 0.01, "step": 520500 }, { "epoch": 1.35, "learning_rate": 9.761444964889406e-05, "loss": 0.0134, "step": 520510 }, { "epoch": 1.35, "learning_rate": 9.761056143252259e-05, "loss": 0.0114, "step": 520520 }, { "epoch": 1.35, "learning_rate": 9.760667321615112e-05, "loss": 0.011, "step": 520530 }, { "epoch": 1.35, "learning_rate": 9.760278499977966e-05, "loss": 0.0104, "step": 520540 }, { "epoch": 1.35, "learning_rate": 9.759889678340819e-05, "loss": 0.0083, "step": 520550 }, { "epoch": 1.35, "learning_rate": 9.759500856703673e-05, "loss": 0.0083, "step": 520560 }, { "epoch": 1.35, "learning_rate": 9.759112035066526e-05, "loss": 0.01, "step": 520570 }, { "epoch": 1.35, "learning_rate": 9.75872321342938e-05, "loss": 0.0151, "step": 520580 }, { "epoch": 1.35, "learning_rate": 9.758334391792233e-05, "loss": 0.011, "step": 520590 }, { "epoch": 1.35, "learning_rate": 9.757945570155087e-05, "loss": 0.0098, "step": 520600 }, { "epoch": 1.35, "learning_rate": 9.75755674851794e-05, "loss": 0.0078, "step": 520610 }, { "epoch": 1.35, "learning_rate": 9.757167926880794e-05, "loss": 0.0146, "step": 520620 }, { "epoch": 1.35, "learning_rate": 9.756779105243647e-05, "loss": 0.0071, "step": 520630 }, { "epoch": 1.35, "learning_rate": 9.756390283606501e-05, "loss": 0.0117, "step": 520640 }, { "epoch": 1.35, "learning_rate": 9.756001461969354e-05, "loss": 0.0101, "step": 520650 }, { "epoch": 1.35, "learning_rate": 9.75561264033221e-05, "loss": 0.01, "step": 520660 }, { "epoch": 1.35, "learning_rate": 9.755223818695062e-05, "loss": 0.0113, "step": 520670 }, { "epoch": 1.35, "learning_rate": 9.754834997057916e-05, "loss": 0.0098, "step": 520680 }, { "epoch": 1.35, "learning_rate": 9.754446175420769e-05, "loss": 0.0101, "step": 520690 }, { "epoch": 1.35, "learning_rate": 9.754057353783623e-05, "loss": 0.0088, "step": 520700 }, { "epoch": 1.35, "learning_rate": 9.753668532146476e-05, "loss": 0.0086, "step": 520710 }, { "epoch": 1.35, "learning_rate": 9.75327971050933e-05, "loss": 0.0113, "step": 520720 }, { "epoch": 1.35, "learning_rate": 9.752890888872183e-05, "loss": 0.0109, "step": 520730 }, { "epoch": 1.35, "learning_rate": 9.752502067235037e-05, "loss": 0.0082, "step": 520740 }, { "epoch": 1.35, "learning_rate": 9.75211324559789e-05, "loss": 0.0104, "step": 520750 }, { "epoch": 1.35, "learning_rate": 9.751724423960744e-05, "loss": 0.013, "step": 520760 }, { "epoch": 1.35, "learning_rate": 9.751335602323597e-05, "loss": 0.0079, "step": 520770 }, { "epoch": 1.35, "learning_rate": 9.75094678068645e-05, "loss": 0.0104, "step": 520780 }, { "epoch": 1.35, "learning_rate": 9.750557959049304e-05, "loss": 0.0085, "step": 520790 }, { "epoch": 1.35, "learning_rate": 9.750169137412157e-05, "loss": 0.0112, "step": 520800 }, { "epoch": 1.35, "learning_rate": 9.749780315775011e-05, "loss": 0.0111, "step": 520810 }, { "epoch": 1.35, "learning_rate": 9.749391494137864e-05, "loss": 0.0086, "step": 520820 }, { "epoch": 1.35, "learning_rate": 9.749002672500718e-05, "loss": 0.0092, "step": 520830 }, { "epoch": 1.35, "learning_rate": 9.748613850863571e-05, "loss": 0.0102, "step": 520840 }, { "epoch": 1.35, "learning_rate": 9.748225029226426e-05, "loss": 0.01, "step": 520850 }, { "epoch": 1.35, "learning_rate": 9.747836207589279e-05, "loss": 0.0089, "step": 520860 }, { "epoch": 1.35, "learning_rate": 9.747447385952133e-05, "loss": 0.0083, "step": 520870 }, { "epoch": 1.35, "learning_rate": 9.747058564314986e-05, "loss": 0.0122, "step": 520880 }, { "epoch": 1.35, "learning_rate": 9.74666974267784e-05, "loss": 0.012, "step": 520890 }, { "epoch": 1.35, "learning_rate": 9.746280921040693e-05, "loss": 0.0106, "step": 520900 }, { "epoch": 1.35, "learning_rate": 9.745892099403547e-05, "loss": 0.0097, "step": 520910 }, { "epoch": 1.35, "learning_rate": 9.7455032777664e-05, "loss": 0.0097, "step": 520920 }, { "epoch": 1.35, "learning_rate": 9.745114456129254e-05, "loss": 0.0074, "step": 520930 }, { "epoch": 1.35, "learning_rate": 9.744725634492107e-05, "loss": 0.0113, "step": 520940 }, { "epoch": 1.35, "learning_rate": 9.744336812854961e-05, "loss": 0.0122, "step": 520950 }, { "epoch": 1.35, "learning_rate": 9.743947991217814e-05, "loss": 0.0129, "step": 520960 }, { "epoch": 1.35, "learning_rate": 9.743559169580668e-05, "loss": 0.014, "step": 520970 }, { "epoch": 1.35, "learning_rate": 9.743170347943521e-05, "loss": 0.0108, "step": 520980 }, { "epoch": 1.35, "learning_rate": 9.742781526306375e-05, "loss": 0.0142, "step": 520990 }, { "epoch": 1.35, "learning_rate": 9.742392704669228e-05, "loss": 0.0098, "step": 521000 }, { "epoch": 1.35, "eval_cer": 0.8816872903168917, "eval_loss": 0.006592988967895508, "eval_runtime": 107.9088, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.634, "step": 521000 }, { "epoch": 1.35, "learning_rate": 9.742003883032083e-05, "loss": 0.011, "step": 521010 }, { "epoch": 1.35, "learning_rate": 9.741615061394936e-05, "loss": 0.0093, "step": 521020 }, { "epoch": 1.35, "learning_rate": 9.741226239757788e-05, "loss": 0.009, "step": 521030 }, { "epoch": 1.35, "learning_rate": 9.740837418120643e-05, "loss": 0.0084, "step": 521040 }, { "epoch": 1.35, "learning_rate": 9.740448596483496e-05, "loss": 0.0088, "step": 521050 }, { "epoch": 1.35, "learning_rate": 9.74005977484635e-05, "loss": 0.01, "step": 521060 }, { "epoch": 1.35, "learning_rate": 9.739670953209203e-05, "loss": 0.0094, "step": 521070 }, { "epoch": 1.35, "learning_rate": 9.739282131572057e-05, "loss": 0.0098, "step": 521080 }, { "epoch": 1.35, "learning_rate": 9.73889330993491e-05, "loss": 0.0091, "step": 521090 }, { "epoch": 1.35, "learning_rate": 9.738504488297764e-05, "loss": 0.0104, "step": 521100 }, { "epoch": 1.35, "learning_rate": 9.738115666660617e-05, "loss": 0.0084, "step": 521110 }, { "epoch": 1.35, "learning_rate": 9.737726845023471e-05, "loss": 0.0104, "step": 521120 }, { "epoch": 1.35, "learning_rate": 9.737338023386324e-05, "loss": 0.0097, "step": 521130 }, { "epoch": 1.35, "learning_rate": 9.736949201749178e-05, "loss": 0.0088, "step": 521140 }, { "epoch": 1.35, "learning_rate": 9.736560380112031e-05, "loss": 0.0076, "step": 521150 }, { "epoch": 1.35, "learning_rate": 9.736171558474885e-05, "loss": 0.0118, "step": 521160 }, { "epoch": 1.35, "learning_rate": 9.735782736837738e-05, "loss": 0.0083, "step": 521170 }, { "epoch": 1.35, "learning_rate": 9.735393915200593e-05, "loss": 0.0124, "step": 521180 }, { "epoch": 1.35, "learning_rate": 9.735005093563445e-05, "loss": 0.0082, "step": 521190 }, { "epoch": 1.35, "learning_rate": 9.7346162719263e-05, "loss": 0.0118, "step": 521200 }, { "epoch": 1.35, "learning_rate": 9.734227450289153e-05, "loss": 0.0076, "step": 521210 }, { "epoch": 1.35, "learning_rate": 9.733838628652007e-05, "loss": 0.0093, "step": 521220 }, { "epoch": 1.35, "learning_rate": 9.73344980701486e-05, "loss": 0.0106, "step": 521230 }, { "epoch": 1.35, "learning_rate": 9.733060985377714e-05, "loss": 0.0092, "step": 521240 }, { "epoch": 1.35, "learning_rate": 9.732672163740567e-05, "loss": 0.0103, "step": 521250 }, { "epoch": 1.35, "learning_rate": 9.732283342103421e-05, "loss": 0.0097, "step": 521260 }, { "epoch": 1.35, "learning_rate": 9.731894520466274e-05, "loss": 0.0114, "step": 521270 }, { "epoch": 1.35, "learning_rate": 9.731505698829127e-05, "loss": 0.0129, "step": 521280 }, { "epoch": 1.35, "learning_rate": 9.731116877191981e-05, "loss": 0.0118, "step": 521290 }, { "epoch": 1.35, "learning_rate": 9.730728055554834e-05, "loss": 0.0115, "step": 521300 }, { "epoch": 1.35, "learning_rate": 9.730339233917688e-05, "loss": 0.0097, "step": 521310 }, { "epoch": 1.35, "learning_rate": 9.729950412280541e-05, "loss": 0.0122, "step": 521320 }, { "epoch": 1.35, "learning_rate": 9.729561590643395e-05, "loss": 0.0071, "step": 521330 }, { "epoch": 1.35, "learning_rate": 9.729172769006248e-05, "loss": 0.0091, "step": 521340 }, { "epoch": 1.35, "learning_rate": 9.728783947369102e-05, "loss": 0.0205, "step": 521350 }, { "epoch": 1.35, "learning_rate": 9.728395125731955e-05, "loss": 0.0123, "step": 521360 }, { "epoch": 1.35, "learning_rate": 9.72800630409481e-05, "loss": 0.011, "step": 521370 }, { "epoch": 1.35, "learning_rate": 9.727617482457663e-05, "loss": 0.0095, "step": 521380 }, { "epoch": 1.35, "learning_rate": 9.727228660820517e-05, "loss": 0.0114, "step": 521390 }, { "epoch": 1.35, "learning_rate": 9.72683983918337e-05, "loss": 0.011, "step": 521400 }, { "epoch": 1.35, "learning_rate": 9.726451017546224e-05, "loss": 0.0107, "step": 521410 }, { "epoch": 1.35, "learning_rate": 9.726062195909077e-05, "loss": 0.0172, "step": 521420 }, { "epoch": 1.35, "learning_rate": 9.725673374271931e-05, "loss": 0.0119, "step": 521430 }, { "epoch": 1.35, "learning_rate": 9.725284552634784e-05, "loss": 0.009, "step": 521440 }, { "epoch": 1.35, "learning_rate": 9.724895730997638e-05, "loss": 0.0105, "step": 521450 }, { "epoch": 1.35, "learning_rate": 9.724506909360491e-05, "loss": 0.0095, "step": 521460 }, { "epoch": 1.35, "learning_rate": 9.724118087723345e-05, "loss": 0.0088, "step": 521470 }, { "epoch": 1.35, "learning_rate": 9.723729266086198e-05, "loss": 0.0103, "step": 521480 }, { "epoch": 1.35, "learning_rate": 9.723340444449052e-05, "loss": 0.011, "step": 521490 }, { "epoch": 1.35, "learning_rate": 9.722951622811905e-05, "loss": 0.0097, "step": 521500 }, { "epoch": 1.35, "learning_rate": 9.722562801174759e-05, "loss": 0.0086, "step": 521510 }, { "epoch": 1.35, "learning_rate": 9.722173979537612e-05, "loss": 0.0082, "step": 521520 }, { "epoch": 1.35, "learning_rate": 9.721785157900465e-05, "loss": 0.0108, "step": 521530 }, { "epoch": 1.35, "learning_rate": 9.72139633626332e-05, "loss": 0.0075, "step": 521540 }, { "epoch": 1.35, "learning_rate": 9.721007514626172e-05, "loss": 0.009, "step": 521550 }, { "epoch": 1.35, "learning_rate": 9.720618692989027e-05, "loss": 0.0071, "step": 521560 }, { "epoch": 1.35, "learning_rate": 9.72022987135188e-05, "loss": 0.0079, "step": 521570 }, { "epoch": 1.35, "learning_rate": 9.719841049714734e-05, "loss": 0.0106, "step": 521580 }, { "epoch": 1.35, "learning_rate": 9.719452228077587e-05, "loss": 0.0153, "step": 521590 }, { "epoch": 1.35, "learning_rate": 9.719063406440441e-05, "loss": 0.0068, "step": 521600 }, { "epoch": 1.35, "learning_rate": 9.718674584803294e-05, "loss": 0.0091, "step": 521610 }, { "epoch": 1.35, "learning_rate": 9.718285763166148e-05, "loss": 0.0097, "step": 521620 }, { "epoch": 1.35, "learning_rate": 9.717896941529001e-05, "loss": 0.0103, "step": 521630 }, { "epoch": 1.35, "learning_rate": 9.717508119891855e-05, "loss": 0.0068, "step": 521640 }, { "epoch": 1.35, "learning_rate": 9.717119298254708e-05, "loss": 0.0068, "step": 521650 }, { "epoch": 1.35, "learning_rate": 9.716730476617562e-05, "loss": 0.0088, "step": 521660 }, { "epoch": 1.35, "learning_rate": 9.716341654980415e-05, "loss": 0.0081, "step": 521670 }, { "epoch": 1.35, "learning_rate": 9.715952833343269e-05, "loss": 0.0101, "step": 521680 }, { "epoch": 1.35, "learning_rate": 9.715564011706122e-05, "loss": 0.0094, "step": 521690 }, { "epoch": 1.35, "learning_rate": 9.715175190068977e-05, "loss": 0.009, "step": 521700 }, { "epoch": 1.35, "learning_rate": 9.714786368431829e-05, "loss": 0.0112, "step": 521710 }, { "epoch": 1.35, "learning_rate": 9.714397546794684e-05, "loss": 0.0091, "step": 521720 }, { "epoch": 1.35, "learning_rate": 9.714008725157537e-05, "loss": 0.0108, "step": 521730 }, { "epoch": 1.35, "learning_rate": 9.713619903520391e-05, "loss": 0.0077, "step": 521740 }, { "epoch": 1.35, "learning_rate": 9.713231081883244e-05, "loss": 0.0105, "step": 521750 }, { "epoch": 1.35, "learning_rate": 9.712842260246098e-05, "loss": 0.0076, "step": 521760 }, { "epoch": 1.35, "learning_rate": 9.712453438608951e-05, "loss": 0.0109, "step": 521770 }, { "epoch": 1.35, "learning_rate": 9.712064616971804e-05, "loss": 0.0098, "step": 521780 }, { "epoch": 1.35, "learning_rate": 9.711675795334658e-05, "loss": 0.0116, "step": 521790 }, { "epoch": 1.35, "learning_rate": 9.711286973697511e-05, "loss": 0.0121, "step": 521800 }, { "epoch": 1.35, "learning_rate": 9.710898152060365e-05, "loss": 0.0142, "step": 521810 }, { "epoch": 1.35, "learning_rate": 9.710509330423218e-05, "loss": 0.0079, "step": 521820 }, { "epoch": 1.35, "learning_rate": 9.710120508786072e-05, "loss": 0.011, "step": 521830 }, { "epoch": 1.35, "learning_rate": 9.709731687148925e-05, "loss": 0.0097, "step": 521840 }, { "epoch": 1.35, "learning_rate": 9.709342865511779e-05, "loss": 0.0096, "step": 521850 }, { "epoch": 1.35, "learning_rate": 9.708954043874632e-05, "loss": 0.0071, "step": 521860 }, { "epoch": 1.35, "learning_rate": 9.708565222237486e-05, "loss": 0.0101, "step": 521870 }, { "epoch": 1.35, "learning_rate": 9.708176400600339e-05, "loss": 0.0116, "step": 521880 }, { "epoch": 1.35, "learning_rate": 9.707787578963194e-05, "loss": 0.0069, "step": 521890 }, { "epoch": 1.35, "learning_rate": 9.707398757326047e-05, "loss": 0.0127, "step": 521900 }, { "epoch": 1.35, "learning_rate": 9.707009935688901e-05, "loss": 0.0117, "step": 521910 }, { "epoch": 1.35, "learning_rate": 9.706621114051754e-05, "loss": 0.01, "step": 521920 }, { "epoch": 1.35, "learning_rate": 9.706232292414608e-05, "loss": 0.0101, "step": 521930 }, { "epoch": 1.35, "learning_rate": 9.705843470777461e-05, "loss": 0.008, "step": 521940 }, { "epoch": 1.35, "learning_rate": 9.705454649140315e-05, "loss": 0.0098, "step": 521950 }, { "epoch": 1.35, "learning_rate": 9.705065827503168e-05, "loss": 0.0132, "step": 521960 }, { "epoch": 1.35, "learning_rate": 9.704677005866022e-05, "loss": 0.0102, "step": 521970 }, { "epoch": 1.35, "learning_rate": 9.704288184228875e-05, "loss": 0.0072, "step": 521980 }, { "epoch": 1.35, "learning_rate": 9.703899362591729e-05, "loss": 0.0073, "step": 521990 }, { "epoch": 1.35, "learning_rate": 9.703510540954582e-05, "loss": 0.0131, "step": 522000 }, { "epoch": 1.35, "eval_cer": 0.8816802921322209, "eval_loss": 0.006435697432607412, "eval_runtime": 107.8203, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 522000 }, { "epoch": 1.35, "learning_rate": 9.703121719317436e-05, "loss": 0.0104, "step": 522010 }, { "epoch": 1.35, "learning_rate": 9.702732897680289e-05, "loss": 0.0084, "step": 522020 }, { "epoch": 1.35, "learning_rate": 9.702344076043142e-05, "loss": 0.009, "step": 522030 }, { "epoch": 1.35, "learning_rate": 9.701955254405996e-05, "loss": 0.0069, "step": 522040 }, { "epoch": 1.35, "learning_rate": 9.701566432768849e-05, "loss": 0.0133, "step": 522050 }, { "epoch": 1.35, "learning_rate": 9.701177611131704e-05, "loss": 0.0086, "step": 522060 }, { "epoch": 1.35, "learning_rate": 9.700788789494556e-05, "loss": 0.0083, "step": 522070 }, { "epoch": 1.35, "learning_rate": 9.700399967857411e-05, "loss": 0.0104, "step": 522080 }, { "epoch": 1.35, "learning_rate": 9.700011146220264e-05, "loss": 0.0108, "step": 522090 }, { "epoch": 1.35, "learning_rate": 9.699622324583118e-05, "loss": 0.0075, "step": 522100 }, { "epoch": 1.35, "learning_rate": 9.699233502945971e-05, "loss": 0.0093, "step": 522110 }, { "epoch": 1.35, "learning_rate": 9.698844681308825e-05, "loss": 0.0097, "step": 522120 }, { "epoch": 1.35, "learning_rate": 9.698455859671678e-05, "loss": 0.0105, "step": 522130 }, { "epoch": 1.35, "learning_rate": 9.698067038034532e-05, "loss": 0.0093, "step": 522140 }, { "epoch": 1.35, "learning_rate": 9.697678216397385e-05, "loss": 0.0078, "step": 522150 }, { "epoch": 1.35, "learning_rate": 9.697289394760239e-05, "loss": 0.0077, "step": 522160 }, { "epoch": 1.35, "learning_rate": 9.696900573123092e-05, "loss": 0.0109, "step": 522170 }, { "epoch": 1.35, "learning_rate": 9.696511751485946e-05, "loss": 0.0103, "step": 522180 }, { "epoch": 1.35, "learning_rate": 9.696122929848799e-05, "loss": 0.0117, "step": 522190 }, { "epoch": 1.35, "learning_rate": 9.695734108211653e-05, "loss": 0.01, "step": 522200 }, { "epoch": 1.35, "learning_rate": 9.695345286574506e-05, "loss": 0.0087, "step": 522210 }, { "epoch": 1.35, "learning_rate": 9.69495646493736e-05, "loss": 0.0115, "step": 522220 }, { "epoch": 1.35, "learning_rate": 9.694567643300213e-05, "loss": 0.0106, "step": 522230 }, { "epoch": 1.35, "learning_rate": 9.694178821663068e-05, "loss": 0.0112, "step": 522240 }, { "epoch": 1.35, "learning_rate": 9.693790000025921e-05, "loss": 0.0063, "step": 522250 }, { "epoch": 1.35, "learning_rate": 9.693401178388775e-05, "loss": 0.0083, "step": 522260 }, { "epoch": 1.35, "learning_rate": 9.693012356751628e-05, "loss": 0.0091, "step": 522270 }, { "epoch": 1.35, "learning_rate": 9.692623535114481e-05, "loss": 0.0096, "step": 522280 }, { "epoch": 1.35, "learning_rate": 9.692234713477335e-05, "loss": 0.0089, "step": 522290 }, { "epoch": 1.35, "learning_rate": 9.691845891840188e-05, "loss": 0.01, "step": 522300 }, { "epoch": 1.35, "learning_rate": 9.691457070203042e-05, "loss": 0.0073, "step": 522310 }, { "epoch": 1.35, "learning_rate": 9.691068248565895e-05, "loss": 0.0053, "step": 522320 }, { "epoch": 1.35, "learning_rate": 9.690679426928749e-05, "loss": 0.0082, "step": 522330 }, { "epoch": 1.35, "learning_rate": 9.690290605291602e-05, "loss": 0.0102, "step": 522340 }, { "epoch": 1.35, "learning_rate": 9.689901783654456e-05, "loss": 0.0134, "step": 522350 }, { "epoch": 1.35, "learning_rate": 9.689512962017309e-05, "loss": 0.0118, "step": 522360 }, { "epoch": 1.35, "learning_rate": 9.689124140380163e-05, "loss": 0.0093, "step": 522370 }, { "epoch": 1.35, "learning_rate": 9.688735318743016e-05, "loss": 0.01, "step": 522380 }, { "epoch": 1.35, "learning_rate": 9.68834649710587e-05, "loss": 0.0085, "step": 522390 }, { "epoch": 1.35, "learning_rate": 9.687957675468723e-05, "loss": 0.01, "step": 522400 }, { "epoch": 1.35, "learning_rate": 9.687568853831578e-05, "loss": 0.0094, "step": 522410 }, { "epoch": 1.35, "learning_rate": 9.68718003219443e-05, "loss": 0.009, "step": 522420 }, { "epoch": 1.35, "learning_rate": 9.686791210557285e-05, "loss": 0.0066, "step": 522430 }, { "epoch": 1.35, "learning_rate": 9.686402388920138e-05, "loss": 0.0101, "step": 522440 }, { "epoch": 1.35, "learning_rate": 9.686013567282992e-05, "loss": 0.0088, "step": 522450 }, { "epoch": 1.35, "learning_rate": 9.685624745645845e-05, "loss": 0.0103, "step": 522460 }, { "epoch": 1.35, "learning_rate": 9.685235924008699e-05, "loss": 0.0266, "step": 522470 }, { "epoch": 1.35, "learning_rate": 9.684847102371552e-05, "loss": 0.0144, "step": 522480 }, { "epoch": 1.35, "learning_rate": 9.684458280734406e-05, "loss": 0.0119, "step": 522490 }, { "epoch": 1.35, "learning_rate": 9.684069459097259e-05, "loss": 0.0092, "step": 522500 }, { "epoch": 1.35, "learning_rate": 9.683680637460113e-05, "loss": 0.0078, "step": 522510 }, { "epoch": 1.35, "learning_rate": 9.683291815822966e-05, "loss": 0.011, "step": 522520 }, { "epoch": 1.35, "learning_rate": 9.682902994185819e-05, "loss": 0.0127, "step": 522530 }, { "epoch": 1.35, "learning_rate": 9.682514172548673e-05, "loss": 0.0075, "step": 522540 }, { "epoch": 1.35, "learning_rate": 9.682125350911526e-05, "loss": 0.0143, "step": 522550 }, { "epoch": 1.35, "learning_rate": 9.68173652927438e-05, "loss": 0.0121, "step": 522560 }, { "epoch": 1.35, "learning_rate": 9.681347707637233e-05, "loss": 0.0098, "step": 522570 }, { "epoch": 1.35, "learning_rate": 9.680958886000087e-05, "loss": 0.0083, "step": 522580 }, { "epoch": 1.35, "learning_rate": 9.68057006436294e-05, "loss": 0.0073, "step": 522590 }, { "epoch": 1.35, "learning_rate": 9.680181242725795e-05, "loss": 0.0106, "step": 522600 }, { "epoch": 1.35, "learning_rate": 9.679792421088648e-05, "loss": 0.0103, "step": 522610 }, { "epoch": 1.35, "learning_rate": 9.679403599451502e-05, "loss": 0.0085, "step": 522620 }, { "epoch": 1.35, "learning_rate": 9.679014777814355e-05, "loss": 0.0098, "step": 522630 }, { "epoch": 1.35, "learning_rate": 9.678625956177209e-05, "loss": 0.0152, "step": 522640 }, { "epoch": 1.35, "learning_rate": 9.678237134540062e-05, "loss": 0.0093, "step": 522650 }, { "epoch": 1.35, "learning_rate": 9.677848312902916e-05, "loss": 0.0079, "step": 522660 }, { "epoch": 1.35, "learning_rate": 9.677459491265769e-05, "loss": 0.0101, "step": 522670 }, { "epoch": 1.35, "learning_rate": 9.677070669628623e-05, "loss": 0.0082, "step": 522680 }, { "epoch": 1.35, "learning_rate": 9.676681847991476e-05, "loss": 0.0097, "step": 522690 }, { "epoch": 1.35, "learning_rate": 9.67629302635433e-05, "loss": 0.0105, "step": 522700 }, { "epoch": 1.35, "learning_rate": 9.675904204717183e-05, "loss": 0.0104, "step": 522710 }, { "epoch": 1.35, "learning_rate": 9.675515383080037e-05, "loss": 0.0088, "step": 522720 }, { "epoch": 1.35, "learning_rate": 9.67512656144289e-05, "loss": 0.0078, "step": 522730 }, { "epoch": 1.36, "learning_rate": 9.674737739805744e-05, "loss": 0.0102, "step": 522740 }, { "epoch": 1.36, "learning_rate": 9.674348918168597e-05, "loss": 0.0129, "step": 522750 }, { "epoch": 1.36, "learning_rate": 9.673960096531452e-05, "loss": 0.0078, "step": 522760 }, { "epoch": 1.36, "learning_rate": 9.673571274894305e-05, "loss": 0.0123, "step": 522770 }, { "epoch": 1.36, "learning_rate": 9.673182453257157e-05, "loss": 0.0092, "step": 522780 }, { "epoch": 1.36, "learning_rate": 9.672793631620012e-05, "loss": 0.0127, "step": 522790 }, { "epoch": 1.36, "learning_rate": 9.672404809982865e-05, "loss": 0.01, "step": 522800 }, { "epoch": 1.36, "learning_rate": 9.672015988345719e-05, "loss": 0.0097, "step": 522810 }, { "epoch": 1.36, "learning_rate": 9.671627166708572e-05, "loss": 0.0124, "step": 522820 }, { "epoch": 1.36, "learning_rate": 9.671238345071426e-05, "loss": 0.0067, "step": 522830 }, { "epoch": 1.36, "learning_rate": 9.670849523434279e-05, "loss": 0.0118, "step": 522840 }, { "epoch": 1.36, "learning_rate": 9.670460701797133e-05, "loss": 0.0085, "step": 522850 }, { "epoch": 1.36, "learning_rate": 9.670071880159986e-05, "loss": 0.0124, "step": 522860 }, { "epoch": 1.36, "learning_rate": 9.66968305852284e-05, "loss": 0.0081, "step": 522870 }, { "epoch": 1.36, "learning_rate": 9.669294236885693e-05, "loss": 0.0085, "step": 522880 }, { "epoch": 1.36, "learning_rate": 9.668905415248547e-05, "loss": 0.0082, "step": 522890 }, { "epoch": 1.36, "learning_rate": 9.6685165936114e-05, "loss": 0.01, "step": 522900 }, { "epoch": 1.36, "learning_rate": 9.668127771974254e-05, "loss": 0.0108, "step": 522910 }, { "epoch": 1.36, "learning_rate": 9.667738950337107e-05, "loss": 0.009, "step": 522920 }, { "epoch": 1.36, "learning_rate": 9.667350128699962e-05, "loss": 0.01, "step": 522930 }, { "epoch": 1.36, "learning_rate": 9.666961307062814e-05, "loss": 0.0084, "step": 522940 }, { "epoch": 1.36, "learning_rate": 9.666572485425669e-05, "loss": 0.0079, "step": 522950 }, { "epoch": 1.36, "learning_rate": 9.666183663788522e-05, "loss": 0.011, "step": 522960 }, { "epoch": 1.36, "learning_rate": 9.665794842151376e-05, "loss": 0.0094, "step": 522970 }, { "epoch": 1.36, "learning_rate": 9.665406020514229e-05, "loss": 0.0061, "step": 522980 }, { "epoch": 1.36, "learning_rate": 9.665017198877083e-05, "loss": 0.0097, "step": 522990 }, { "epoch": 1.36, "learning_rate": 9.664628377239936e-05, "loss": 0.01, "step": 523000 }, { "epoch": 1.36, "eval_cer": 0.8816718943106159, "eval_loss": 0.006541228387504816, "eval_runtime": 107.8789, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 523000 }, { "epoch": 1.36, "learning_rate": 9.664239555602789e-05, "loss": 0.0105, "step": 523010 }, { "epoch": 1.36, "learning_rate": 9.663850733965643e-05, "loss": 0.0105, "step": 523020 }, { "epoch": 1.36, "learning_rate": 9.663461912328496e-05, "loss": 0.0089, "step": 523030 }, { "epoch": 1.36, "learning_rate": 9.66307309069135e-05, "loss": 0.0093, "step": 523040 }, { "epoch": 1.36, "learning_rate": 9.662684269054203e-05, "loss": 0.0104, "step": 523050 }, { "epoch": 1.36, "learning_rate": 9.662295447417057e-05, "loss": 0.0094, "step": 523060 }, { "epoch": 1.36, "learning_rate": 9.66190662577991e-05, "loss": 0.0118, "step": 523070 }, { "epoch": 1.36, "learning_rate": 9.661517804142764e-05, "loss": 0.0118, "step": 523080 }, { "epoch": 1.36, "learning_rate": 9.661128982505617e-05, "loss": 0.0102, "step": 523090 }, { "epoch": 1.36, "learning_rate": 9.660740160868471e-05, "loss": 0.0069, "step": 523100 }, { "epoch": 1.36, "learning_rate": 9.660351339231324e-05, "loss": 0.0075, "step": 523110 }, { "epoch": 1.36, "learning_rate": 9.659962517594179e-05, "loss": 0.0137, "step": 523120 }, { "epoch": 1.36, "learning_rate": 9.659573695957032e-05, "loss": 0.014, "step": 523130 }, { "epoch": 1.36, "learning_rate": 9.659184874319886e-05, "loss": 0.0105, "step": 523140 }, { "epoch": 1.36, "learning_rate": 9.658796052682739e-05, "loss": 0.0079, "step": 523150 }, { "epoch": 1.36, "learning_rate": 9.658407231045593e-05, "loss": 0.009, "step": 523160 }, { "epoch": 1.36, "learning_rate": 9.658018409408446e-05, "loss": 0.0095, "step": 523170 }, { "epoch": 1.36, "learning_rate": 9.6576295877713e-05, "loss": 0.0085, "step": 523180 }, { "epoch": 1.36, "learning_rate": 9.657240766134153e-05, "loss": 0.0144, "step": 523190 }, { "epoch": 1.36, "learning_rate": 9.656851944497007e-05, "loss": 0.0118, "step": 523200 }, { "epoch": 1.36, "learning_rate": 9.65646312285986e-05, "loss": 0.0084, "step": 523210 }, { "epoch": 1.36, "learning_rate": 9.656074301222714e-05, "loss": 0.0104, "step": 523220 }, { "epoch": 1.36, "learning_rate": 9.655685479585567e-05, "loss": 0.0079, "step": 523230 }, { "epoch": 1.36, "learning_rate": 9.655296657948421e-05, "loss": 0.0082, "step": 523240 }, { "epoch": 1.36, "learning_rate": 9.654907836311274e-05, "loss": 0.01, "step": 523250 }, { "epoch": 1.36, "learning_rate": 9.654519014674127e-05, "loss": 0.0106, "step": 523260 }, { "epoch": 1.36, "learning_rate": 9.654130193036981e-05, "loss": 0.0118, "step": 523270 }, { "epoch": 1.36, "learning_rate": 9.653741371399834e-05, "loss": 0.0119, "step": 523280 }, { "epoch": 1.36, "learning_rate": 9.653352549762689e-05, "loss": 0.0075, "step": 523290 }, { "epoch": 1.36, "learning_rate": 9.65296372812554e-05, "loss": 0.0086, "step": 523300 }, { "epoch": 1.36, "learning_rate": 9.652574906488396e-05, "loss": 0.0113, "step": 523310 }, { "epoch": 1.36, "learning_rate": 9.652186084851249e-05, "loss": 0.0095, "step": 523320 }, { "epoch": 1.36, "learning_rate": 9.651797263214103e-05, "loss": 0.0079, "step": 523330 }, { "epoch": 1.36, "learning_rate": 9.651408441576956e-05, "loss": 0.0111, "step": 523340 }, { "epoch": 1.36, "learning_rate": 9.65101961993981e-05, "loss": 0.0094, "step": 523350 }, { "epoch": 1.36, "learning_rate": 9.650630798302663e-05, "loss": 0.0082, "step": 523360 }, { "epoch": 1.36, "learning_rate": 9.650241976665517e-05, "loss": 0.0089, "step": 523370 }, { "epoch": 1.36, "learning_rate": 9.64985315502837e-05, "loss": 0.0089, "step": 523380 }, { "epoch": 1.36, "learning_rate": 9.649464333391224e-05, "loss": 0.01, "step": 523390 }, { "epoch": 1.36, "learning_rate": 9.649075511754077e-05, "loss": 0.0098, "step": 523400 }, { "epoch": 1.36, "learning_rate": 9.648686690116931e-05, "loss": 0.0101, "step": 523410 }, { "epoch": 1.36, "learning_rate": 9.648297868479784e-05, "loss": 0.0098, "step": 523420 }, { "epoch": 1.36, "learning_rate": 9.647909046842638e-05, "loss": 0.0124, "step": 523430 }, { "epoch": 1.36, "learning_rate": 9.647520225205491e-05, "loss": 0.0118, "step": 523440 }, { "epoch": 1.36, "learning_rate": 9.647131403568345e-05, "loss": 0.0112, "step": 523450 }, { "epoch": 1.36, "learning_rate": 9.646742581931198e-05, "loss": 0.0107, "step": 523460 }, { "epoch": 1.36, "learning_rate": 9.646353760294053e-05, "loss": 0.0103, "step": 523470 }, { "epoch": 1.36, "learning_rate": 9.645964938656906e-05, "loss": 0.0084, "step": 523480 }, { "epoch": 1.36, "learning_rate": 9.64557611701976e-05, "loss": 0.0133, "step": 523490 }, { "epoch": 1.36, "learning_rate": 9.645187295382613e-05, "loss": 0.0104, "step": 523500 }, { "epoch": 1.36, "learning_rate": 9.644798473745466e-05, "loss": 0.0092, "step": 523510 }, { "epoch": 1.36, "learning_rate": 9.64440965210832e-05, "loss": 0.0106, "step": 523520 }, { "epoch": 1.36, "learning_rate": 9.644020830471173e-05, "loss": 0.01, "step": 523530 }, { "epoch": 1.36, "learning_rate": 9.643632008834027e-05, "loss": 0.009, "step": 523540 }, { "epoch": 1.36, "learning_rate": 9.64324318719688e-05, "loss": 0.0137, "step": 523550 }, { "epoch": 1.36, "learning_rate": 9.642854365559734e-05, "loss": 0.0076, "step": 523560 }, { "epoch": 1.36, "learning_rate": 9.642465543922587e-05, "loss": 0.0084, "step": 523570 }, { "epoch": 1.36, "learning_rate": 9.642076722285441e-05, "loss": 0.0126, "step": 523580 }, { "epoch": 1.36, "learning_rate": 9.641687900648294e-05, "loss": 0.0102, "step": 523590 }, { "epoch": 1.36, "learning_rate": 9.641299079011148e-05, "loss": 0.0083, "step": 523600 }, { "epoch": 1.36, "learning_rate": 9.640910257374001e-05, "loss": 0.0084, "step": 523610 }, { "epoch": 1.36, "learning_rate": 9.640521435736855e-05, "loss": 0.0107, "step": 523620 }, { "epoch": 1.36, "learning_rate": 9.640132614099708e-05, "loss": 0.0083, "step": 523630 }, { "epoch": 1.36, "learning_rate": 9.639743792462563e-05, "loss": 0.0115, "step": 523640 }, { "epoch": 1.36, "learning_rate": 9.639354970825416e-05, "loss": 0.0115, "step": 523650 }, { "epoch": 1.36, "learning_rate": 9.63896614918827e-05, "loss": 0.0108, "step": 523660 }, { "epoch": 1.36, "learning_rate": 9.638577327551123e-05, "loss": 0.0084, "step": 523670 }, { "epoch": 1.36, "learning_rate": 9.638188505913977e-05, "loss": 0.0083, "step": 523680 }, { "epoch": 1.36, "learning_rate": 9.63779968427683e-05, "loss": 0.0123, "step": 523690 }, { "epoch": 1.36, "learning_rate": 9.637410862639684e-05, "loss": 0.0095, "step": 523700 }, { "epoch": 1.36, "learning_rate": 9.637022041002537e-05, "loss": 0.0083, "step": 523710 }, { "epoch": 1.36, "learning_rate": 9.636633219365391e-05, "loss": 0.0109, "step": 523720 }, { "epoch": 1.36, "learning_rate": 9.636244397728244e-05, "loss": 0.0115, "step": 523730 }, { "epoch": 1.36, "learning_rate": 9.635855576091098e-05, "loss": 0.0106, "step": 523740 }, { "epoch": 1.36, "learning_rate": 9.635466754453951e-05, "loss": 0.0089, "step": 523750 }, { "epoch": 1.36, "learning_rate": 9.635077932816804e-05, "loss": 0.015, "step": 523760 }, { "epoch": 1.36, "learning_rate": 9.634689111179658e-05, "loss": 0.0094, "step": 523770 }, { "epoch": 1.36, "learning_rate": 9.63430028954251e-05, "loss": 0.01, "step": 523780 }, { "epoch": 1.36, "learning_rate": 9.633911467905365e-05, "loss": 0.0069, "step": 523790 }, { "epoch": 1.36, "learning_rate": 9.633522646268218e-05, "loss": 0.0089, "step": 523800 }, { "epoch": 1.36, "learning_rate": 9.633133824631072e-05, "loss": 0.0095, "step": 523810 }, { "epoch": 1.36, "learning_rate": 9.632745002993925e-05, "loss": 0.009, "step": 523820 }, { "epoch": 1.36, "learning_rate": 9.63235618135678e-05, "loss": 0.0146, "step": 523830 }, { "epoch": 1.36, "learning_rate": 9.631967359719633e-05, "loss": 0.0115, "step": 523840 }, { "epoch": 1.36, "learning_rate": 9.631578538082487e-05, "loss": 0.0079, "step": 523850 }, { "epoch": 1.36, "learning_rate": 9.63118971644534e-05, "loss": 0.01, "step": 523860 }, { "epoch": 1.36, "learning_rate": 9.630800894808194e-05, "loss": 0.0111, "step": 523870 }, { "epoch": 1.36, "learning_rate": 9.630412073171047e-05, "loss": 0.0169, "step": 523880 }, { "epoch": 1.36, "learning_rate": 9.630023251533901e-05, "loss": 0.0085, "step": 523890 }, { "epoch": 1.36, "learning_rate": 9.629634429896754e-05, "loss": 0.0101, "step": 523900 }, { "epoch": 1.36, "learning_rate": 9.629245608259608e-05, "loss": 0.0102, "step": 523910 }, { "epoch": 1.36, "learning_rate": 9.628856786622461e-05, "loss": 0.011, "step": 523920 }, { "epoch": 1.36, "learning_rate": 9.628467964985315e-05, "loss": 0.0115, "step": 523930 }, { "epoch": 1.36, "learning_rate": 9.628079143348168e-05, "loss": 0.0114, "step": 523940 }, { "epoch": 1.36, "learning_rate": 9.627690321711022e-05, "loss": 0.0097, "step": 523950 }, { "epoch": 1.36, "learning_rate": 9.627301500073875e-05, "loss": 0.0102, "step": 523960 }, { "epoch": 1.36, "learning_rate": 9.626912678436729e-05, "loss": 0.0087, "step": 523970 }, { "epoch": 1.36, "learning_rate": 9.626523856799582e-05, "loss": 0.0099, "step": 523980 }, { "epoch": 1.36, "learning_rate": 9.626135035162437e-05, "loss": 0.009, "step": 523990 }, { "epoch": 1.36, "learning_rate": 9.62574621352529e-05, "loss": 0.0124, "step": 524000 }, { "epoch": 1.36, "eval_cer": 0.8816788924952867, "eval_loss": 0.0065029398538172245, "eval_runtime": 107.8132, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 524000 }, { "epoch": 1.36, "learning_rate": 9.625357391888141e-05, "loss": 0.008, "step": 524010 }, { "epoch": 1.36, "learning_rate": 9.624968570250997e-05, "loss": 0.0115, "step": 524020 }, { "epoch": 1.36, "learning_rate": 9.62457974861385e-05, "loss": 0.011, "step": 524030 }, { "epoch": 1.36, "learning_rate": 9.624190926976704e-05, "loss": 0.0105, "step": 524040 }, { "epoch": 1.36, "learning_rate": 9.623802105339557e-05, "loss": 0.0124, "step": 524050 }, { "epoch": 1.36, "learning_rate": 9.623413283702411e-05, "loss": 0.0074, "step": 524060 }, { "epoch": 1.36, "learning_rate": 9.623024462065264e-05, "loss": 0.0106, "step": 524070 }, { "epoch": 1.36, "learning_rate": 9.622635640428118e-05, "loss": 0.0089, "step": 524080 }, { "epoch": 1.36, "learning_rate": 9.622246818790971e-05, "loss": 0.0102, "step": 524090 }, { "epoch": 1.36, "learning_rate": 9.621857997153825e-05, "loss": 0.0116, "step": 524100 }, { "epoch": 1.36, "learning_rate": 9.621469175516678e-05, "loss": 0.0088, "step": 524110 }, { "epoch": 1.36, "learning_rate": 9.621080353879532e-05, "loss": 0.0091, "step": 524120 }, { "epoch": 1.36, "learning_rate": 9.620691532242385e-05, "loss": 0.0087, "step": 524130 }, { "epoch": 1.36, "learning_rate": 9.620302710605239e-05, "loss": 0.0092, "step": 524140 }, { "epoch": 1.36, "learning_rate": 9.619913888968092e-05, "loss": 0.009, "step": 524150 }, { "epoch": 1.36, "learning_rate": 9.619525067330947e-05, "loss": 0.0112, "step": 524160 }, { "epoch": 1.36, "learning_rate": 9.619136245693799e-05, "loss": 0.0094, "step": 524170 }, { "epoch": 1.36, "learning_rate": 9.618747424056654e-05, "loss": 0.0166, "step": 524180 }, { "epoch": 1.36, "learning_rate": 9.618358602419507e-05, "loss": 0.0093, "step": 524190 }, { "epoch": 1.36, "learning_rate": 9.617969780782361e-05, "loss": 0.0117, "step": 524200 }, { "epoch": 1.36, "learning_rate": 9.617580959145214e-05, "loss": 0.009, "step": 524210 }, { "epoch": 1.36, "learning_rate": 9.617192137508068e-05, "loss": 0.008, "step": 524220 }, { "epoch": 1.36, "learning_rate": 9.616803315870921e-05, "loss": 0.0106, "step": 524230 }, { "epoch": 1.36, "learning_rate": 9.616414494233775e-05, "loss": 0.009, "step": 524240 }, { "epoch": 1.36, "learning_rate": 9.616025672596628e-05, "loss": 0.0082, "step": 524250 }, { "epoch": 1.36, "learning_rate": 9.61563685095948e-05, "loss": 0.0084, "step": 524260 }, { "epoch": 1.36, "learning_rate": 9.615248029322335e-05, "loss": 0.0099, "step": 524270 }, { "epoch": 1.36, "learning_rate": 9.614859207685188e-05, "loss": 0.0094, "step": 524280 }, { "epoch": 1.36, "learning_rate": 9.614470386048042e-05, "loss": 0.0128, "step": 524290 }, { "epoch": 1.36, "learning_rate": 9.614081564410895e-05, "loss": 0.0093, "step": 524300 }, { "epoch": 1.36, "learning_rate": 9.613692742773749e-05, "loss": 0.0134, "step": 524310 }, { "epoch": 1.36, "learning_rate": 9.613303921136602e-05, "loss": 0.0103, "step": 524320 }, { "epoch": 1.36, "learning_rate": 9.612915099499456e-05, "loss": 0.0085, "step": 524330 }, { "epoch": 1.36, "learning_rate": 9.612526277862309e-05, "loss": 0.0076, "step": 524340 }, { "epoch": 1.36, "learning_rate": 9.612137456225164e-05, "loss": 0.0085, "step": 524350 }, { "epoch": 1.36, "learning_rate": 9.611748634588017e-05, "loss": 0.0083, "step": 524360 }, { "epoch": 1.36, "learning_rate": 9.611359812950871e-05, "loss": 0.0131, "step": 524370 }, { "epoch": 1.36, "learning_rate": 9.610970991313724e-05, "loss": 0.0116, "step": 524380 }, { "epoch": 1.36, "learning_rate": 9.610582169676578e-05, "loss": 0.0094, "step": 524390 }, { "epoch": 1.36, "learning_rate": 9.610193348039431e-05, "loss": 0.0072, "step": 524400 }, { "epoch": 1.36, "learning_rate": 9.609804526402285e-05, "loss": 0.0103, "step": 524410 }, { "epoch": 1.36, "learning_rate": 9.609415704765138e-05, "loss": 0.0112, "step": 524420 }, { "epoch": 1.36, "learning_rate": 9.609026883127992e-05, "loss": 0.0097, "step": 524430 }, { "epoch": 1.36, "learning_rate": 9.608638061490845e-05, "loss": 0.0097, "step": 524440 }, { "epoch": 1.36, "learning_rate": 9.608249239853699e-05, "loss": 0.0116, "step": 524450 }, { "epoch": 1.36, "learning_rate": 9.607860418216552e-05, "loss": 0.0088, "step": 524460 }, { "epoch": 1.36, "learning_rate": 9.607471596579406e-05, "loss": 0.0081, "step": 524470 }, { "epoch": 1.36, "learning_rate": 9.607082774942259e-05, "loss": 0.0115, "step": 524480 }, { "epoch": 1.36, "learning_rate": 9.606693953305113e-05, "loss": 0.0081, "step": 524490 }, { "epoch": 1.36, "learning_rate": 9.606305131667966e-05, "loss": 0.0107, "step": 524500 }, { "epoch": 1.36, "learning_rate": 9.605916310030818e-05, "loss": 0.0095, "step": 524510 }, { "epoch": 1.36, "learning_rate": 9.605527488393674e-05, "loss": 0.0092, "step": 524520 }, { "epoch": 1.36, "learning_rate": 9.605138666756525e-05, "loss": 0.0081, "step": 524530 }, { "epoch": 1.36, "learning_rate": 9.604749845119381e-05, "loss": 0.009, "step": 524540 }, { "epoch": 1.36, "learning_rate": 9.604361023482234e-05, "loss": 0.0101, "step": 524550 }, { "epoch": 1.36, "learning_rate": 9.603972201845088e-05, "loss": 0.0078, "step": 524560 }, { "epoch": 1.36, "learning_rate": 9.603583380207941e-05, "loss": 0.0097, "step": 524570 }, { "epoch": 1.36, "learning_rate": 9.603194558570795e-05, "loss": 0.0085, "step": 524580 }, { "epoch": 1.36, "learning_rate": 9.602805736933648e-05, "loss": 0.0094, "step": 524590 }, { "epoch": 1.36, "learning_rate": 9.602416915296502e-05, "loss": 0.0092, "step": 524600 }, { "epoch": 1.36, "learning_rate": 9.602028093659355e-05, "loss": 0.0077, "step": 524610 }, { "epoch": 1.36, "learning_rate": 9.601639272022209e-05, "loss": 0.0094, "step": 524620 }, { "epoch": 1.36, "learning_rate": 9.601250450385062e-05, "loss": 0.0106, "step": 524630 }, { "epoch": 1.36, "learning_rate": 9.600861628747916e-05, "loss": 0.0088, "step": 524640 }, { "epoch": 1.36, "learning_rate": 9.600472807110769e-05, "loss": 0.0105, "step": 524650 }, { "epoch": 1.36, "learning_rate": 9.600083985473623e-05, "loss": 0.0263, "step": 524660 }, { "epoch": 1.36, "learning_rate": 9.599695163836476e-05, "loss": 0.0128, "step": 524670 }, { "epoch": 1.36, "learning_rate": 9.599306342199331e-05, "loss": 0.0088, "step": 524680 }, { "epoch": 1.36, "learning_rate": 9.598917520562183e-05, "loss": 0.0117, "step": 524690 }, { "epoch": 1.36, "learning_rate": 9.598528698925038e-05, "loss": 0.0122, "step": 524700 }, { "epoch": 1.36, "learning_rate": 9.598139877287891e-05, "loss": 0.0097, "step": 524710 }, { "epoch": 1.36, "learning_rate": 9.597751055650745e-05, "loss": 0.0121, "step": 524720 }, { "epoch": 1.36, "learning_rate": 9.597362234013598e-05, "loss": 0.0101, "step": 524730 }, { "epoch": 1.36, "learning_rate": 9.596973412376452e-05, "loss": 0.0099, "step": 524740 }, { "epoch": 1.36, "learning_rate": 9.596584590739305e-05, "loss": 0.0097, "step": 524750 }, { "epoch": 1.36, "learning_rate": 9.596195769102158e-05, "loss": 0.0072, "step": 524760 }, { "epoch": 1.36, "learning_rate": 9.595806947465012e-05, "loss": 0.0074, "step": 524770 }, { "epoch": 1.36, "learning_rate": 9.595418125827865e-05, "loss": 0.01, "step": 524780 }, { "epoch": 1.36, "learning_rate": 9.595029304190719e-05, "loss": 0.0087, "step": 524790 }, { "epoch": 1.36, "learning_rate": 9.594640482553572e-05, "loss": 0.0099, "step": 524800 }, { "epoch": 1.36, "learning_rate": 9.594251660916426e-05, "loss": 0.0094, "step": 524810 }, { "epoch": 1.36, "learning_rate": 9.593862839279279e-05, "loss": 0.0104, "step": 524820 }, { "epoch": 1.36, "learning_rate": 9.593474017642133e-05, "loss": 0.0111, "step": 524830 }, { "epoch": 1.36, "learning_rate": 9.593085196004986e-05, "loss": 0.014, "step": 524840 }, { "epoch": 1.36, "learning_rate": 9.59269637436784e-05, "loss": 0.0079, "step": 524850 }, { "epoch": 1.36, "learning_rate": 9.592307552730693e-05, "loss": 0.0124, "step": 524860 }, { "epoch": 1.36, "learning_rate": 9.591918731093548e-05, "loss": 0.0084, "step": 524870 }, { "epoch": 1.36, "learning_rate": 9.591529909456401e-05, "loss": 0.0076, "step": 524880 }, { "epoch": 1.36, "learning_rate": 9.591141087819255e-05, "loss": 0.0081, "step": 524890 }, { "epoch": 1.36, "learning_rate": 9.590752266182108e-05, "loss": 0.0091, "step": 524900 }, { "epoch": 1.36, "learning_rate": 9.590363444544962e-05, "loss": 0.0108, "step": 524910 }, { "epoch": 1.36, "learning_rate": 9.589974622907815e-05, "loss": 0.0093, "step": 524920 }, { "epoch": 1.36, "learning_rate": 9.589585801270669e-05, "loss": 0.0114, "step": 524930 }, { "epoch": 1.36, "learning_rate": 9.589196979633522e-05, "loss": 0.0095, "step": 524940 }, { "epoch": 1.36, "learning_rate": 9.588808157996376e-05, "loss": 0.0115, "step": 524950 }, { "epoch": 1.36, "learning_rate": 9.588419336359229e-05, "loss": 0.0082, "step": 524960 }, { "epoch": 1.36, "learning_rate": 9.588030514722083e-05, "loss": 0.0116, "step": 524970 }, { "epoch": 1.36, "learning_rate": 9.587641693084936e-05, "loss": 0.009, "step": 524980 }, { "epoch": 1.36, "learning_rate": 9.58725287144779e-05, "loss": 0.0093, "step": 524990 }, { "epoch": 1.36, "learning_rate": 9.586864049810643e-05, "loss": 0.0099, "step": 525000 }, { "epoch": 1.36, "eval_cer": 0.8816900895907601, "eval_loss": 0.006309923715889454, "eval_runtime": 107.932, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 525000 }, { "epoch": 1.36, "learning_rate": 9.586475228173496e-05, "loss": 0.0128, "step": 525010 }, { "epoch": 1.36, "learning_rate": 9.58608640653635e-05, "loss": 0.0118, "step": 525020 }, { "epoch": 1.36, "learning_rate": 9.585697584899202e-05, "loss": 0.0076, "step": 525030 }, { "epoch": 1.36, "learning_rate": 9.585308763262057e-05, "loss": 0.0097, "step": 525040 }, { "epoch": 1.36, "learning_rate": 9.58491994162491e-05, "loss": 0.0079, "step": 525050 }, { "epoch": 1.36, "learning_rate": 9.584531119987765e-05, "loss": 0.0098, "step": 525060 }, { "epoch": 1.36, "learning_rate": 9.584142298350618e-05, "loss": 0.0138, "step": 525070 }, { "epoch": 1.36, "learning_rate": 9.583753476713472e-05, "loss": 0.009, "step": 525080 }, { "epoch": 1.36, "learning_rate": 9.583364655076325e-05, "loss": 0.0115, "step": 525090 }, { "epoch": 1.36, "learning_rate": 9.582975833439179e-05, "loss": 0.0106, "step": 525100 }, { "epoch": 1.36, "learning_rate": 9.582587011802032e-05, "loss": 0.0104, "step": 525110 }, { "epoch": 1.36, "learning_rate": 9.582198190164886e-05, "loss": 0.0082, "step": 525120 }, { "epoch": 1.36, "learning_rate": 9.581809368527739e-05, "loss": 0.01, "step": 525130 }, { "epoch": 1.36, "learning_rate": 9.581420546890593e-05, "loss": 0.0075, "step": 525140 }, { "epoch": 1.36, "learning_rate": 9.581031725253446e-05, "loss": 0.009, "step": 525150 }, { "epoch": 1.36, "learning_rate": 9.5806429036163e-05, "loss": 0.0097, "step": 525160 }, { "epoch": 1.36, "learning_rate": 9.580254081979153e-05, "loss": 0.0118, "step": 525170 }, { "epoch": 1.36, "learning_rate": 9.579865260342007e-05, "loss": 0.0112, "step": 525180 }, { "epoch": 1.36, "learning_rate": 9.57947643870486e-05, "loss": 0.0092, "step": 525190 }, { "epoch": 1.36, "learning_rate": 9.579087617067714e-05, "loss": 0.0077, "step": 525200 }, { "epoch": 1.36, "learning_rate": 9.578698795430567e-05, "loss": 0.0088, "step": 525210 }, { "epoch": 1.36, "learning_rate": 9.578309973793422e-05, "loss": 0.0094, "step": 525220 }, { "epoch": 1.36, "learning_rate": 9.577921152156275e-05, "loss": 0.0113, "step": 525230 }, { "epoch": 1.36, "learning_rate": 9.577532330519129e-05, "loss": 0.0096, "step": 525240 }, { "epoch": 1.36, "learning_rate": 9.577143508881982e-05, "loss": 0.0087, "step": 525250 }, { "epoch": 1.36, "learning_rate": 9.576754687244835e-05, "loss": 0.012, "step": 525260 }, { "epoch": 1.36, "learning_rate": 9.576365865607689e-05, "loss": 0.0097, "step": 525270 }, { "epoch": 1.36, "learning_rate": 9.575977043970542e-05, "loss": 0.0148, "step": 525280 }, { "epoch": 1.36, "learning_rate": 9.575588222333396e-05, "loss": 0.0098, "step": 525290 }, { "epoch": 1.36, "learning_rate": 9.575199400696249e-05, "loss": 0.0113, "step": 525300 }, { "epoch": 1.36, "learning_rate": 9.574810579059103e-05, "loss": 0.0109, "step": 525310 }, { "epoch": 1.36, "learning_rate": 9.574421757421956e-05, "loss": 0.0079, "step": 525320 }, { "epoch": 1.36, "learning_rate": 9.57403293578481e-05, "loss": 0.0103, "step": 525330 }, { "epoch": 1.36, "learning_rate": 9.573644114147663e-05, "loss": 0.0094, "step": 525340 }, { "epoch": 1.36, "learning_rate": 9.573255292510517e-05, "loss": 0.0074, "step": 525350 }, { "epoch": 1.36, "learning_rate": 9.57286647087337e-05, "loss": 0.0089, "step": 525360 }, { "epoch": 1.36, "learning_rate": 9.572477649236224e-05, "loss": 0.0118, "step": 525370 }, { "epoch": 1.36, "learning_rate": 9.572088827599077e-05, "loss": 0.0101, "step": 525380 }, { "epoch": 1.36, "learning_rate": 9.571700005961932e-05, "loss": 0.0127, "step": 525390 }, { "epoch": 1.36, "learning_rate": 9.571311184324784e-05, "loss": 0.0091, "step": 525400 }, { "epoch": 1.36, "learning_rate": 9.570922362687639e-05, "loss": 0.0113, "step": 525410 }, { "epoch": 1.36, "learning_rate": 9.570533541050492e-05, "loss": 0.0085, "step": 525420 }, { "epoch": 1.36, "learning_rate": 9.570144719413346e-05, "loss": 0.0119, "step": 525430 }, { "epoch": 1.36, "learning_rate": 9.569755897776199e-05, "loss": 0.0109, "step": 525440 }, { "epoch": 1.36, "learning_rate": 9.569367076139053e-05, "loss": 0.0139, "step": 525450 }, { "epoch": 1.36, "learning_rate": 9.568978254501906e-05, "loss": 0.0092, "step": 525460 }, { "epoch": 1.36, "learning_rate": 9.56858943286476e-05, "loss": 0.02, "step": 525470 }, { "epoch": 1.36, "learning_rate": 9.568200611227613e-05, "loss": 0.009, "step": 525480 }, { "epoch": 1.36, "learning_rate": 9.567811789590466e-05, "loss": 0.0084, "step": 525490 }, { "epoch": 1.36, "learning_rate": 9.56742296795332e-05, "loss": 0.0091, "step": 525500 }, { "epoch": 1.36, "learning_rate": 9.567034146316173e-05, "loss": 0.0091, "step": 525510 }, { "epoch": 1.36, "learning_rate": 9.566645324679027e-05, "loss": 0.0119, "step": 525520 }, { "epoch": 1.36, "learning_rate": 9.56625650304188e-05, "loss": 0.0087, "step": 525530 }, { "epoch": 1.36, "learning_rate": 9.565867681404734e-05, "loss": 0.0089, "step": 525540 }, { "epoch": 1.36, "learning_rate": 9.565478859767586e-05, "loss": 0.0093, "step": 525550 }, { "epoch": 1.36, "learning_rate": 9.56509003813044e-05, "loss": 0.0095, "step": 525560 }, { "epoch": 1.36, "learning_rate": 9.564701216493293e-05, "loss": 0.0107, "step": 525570 }, { "epoch": 1.36, "learning_rate": 9.564312394856149e-05, "loss": 0.0092, "step": 525580 }, { "epoch": 1.36, "learning_rate": 9.563923573219002e-05, "loss": 0.0075, "step": 525590 }, { "epoch": 1.36, "learning_rate": 9.563534751581856e-05, "loss": 0.014, "step": 525600 }, { "epoch": 1.36, "learning_rate": 9.563145929944709e-05, "loss": 0.008, "step": 525610 }, { "epoch": 1.36, "learning_rate": 9.562757108307563e-05, "loss": 0.0108, "step": 525620 }, { "epoch": 1.36, "learning_rate": 9.562368286670416e-05, "loss": 0.009, "step": 525630 }, { "epoch": 1.36, "learning_rate": 9.56197946503327e-05, "loss": 0.0085, "step": 525640 }, { "epoch": 1.36, "learning_rate": 9.561590643396123e-05, "loss": 0.0103, "step": 525650 }, { "epoch": 1.36, "learning_rate": 9.561201821758977e-05, "loss": 0.0078, "step": 525660 }, { "epoch": 1.36, "learning_rate": 9.56081300012183e-05, "loss": 0.0079, "step": 525670 }, { "epoch": 1.36, "learning_rate": 9.560424178484684e-05, "loss": 0.0106, "step": 525680 }, { "epoch": 1.36, "learning_rate": 9.560035356847537e-05, "loss": 0.0093, "step": 525690 }, { "epoch": 1.36, "learning_rate": 9.559646535210391e-05, "loss": 0.0115, "step": 525700 }, { "epoch": 1.36, "learning_rate": 9.559257713573244e-05, "loss": 0.0092, "step": 525710 }, { "epoch": 1.36, "learning_rate": 9.558868891936098e-05, "loss": 0.008, "step": 525720 }, { "epoch": 1.36, "learning_rate": 9.55848007029895e-05, "loss": 0.0146, "step": 525730 }, { "epoch": 1.36, "learning_rate": 9.558091248661803e-05, "loss": 0.0095, "step": 525740 }, { "epoch": 1.36, "learning_rate": 9.557702427024659e-05, "loss": 0.0099, "step": 525750 }, { "epoch": 1.36, "learning_rate": 9.55731360538751e-05, "loss": 0.0096, "step": 525760 }, { "epoch": 1.36, "learning_rate": 9.556924783750366e-05, "loss": 0.0122, "step": 525770 }, { "epoch": 1.36, "learning_rate": 9.556535962113219e-05, "loss": 0.0081, "step": 525780 }, { "epoch": 1.36, "learning_rate": 9.556147140476073e-05, "loss": 0.0084, "step": 525790 }, { "epoch": 1.36, "learning_rate": 9.555758318838926e-05, "loss": 0.0092, "step": 525800 }, { "epoch": 1.36, "learning_rate": 9.55536949720178e-05, "loss": 0.0084, "step": 525810 }, { "epoch": 1.36, "learning_rate": 9.554980675564633e-05, "loss": 0.0071, "step": 525820 }, { "epoch": 1.36, "learning_rate": 9.554591853927487e-05, "loss": 0.0168, "step": 525830 }, { "epoch": 1.36, "learning_rate": 9.55420303229034e-05, "loss": 0.0083, "step": 525840 }, { "epoch": 1.36, "learning_rate": 9.553814210653194e-05, "loss": 0.0093, "step": 525850 }, { "epoch": 1.36, "learning_rate": 9.553425389016047e-05, "loss": 0.0076, "step": 525860 }, { "epoch": 1.36, "learning_rate": 9.553036567378901e-05, "loss": 0.0087, "step": 525870 }, { "epoch": 1.36, "learning_rate": 9.552647745741754e-05, "loss": 0.0095, "step": 525880 }, { "epoch": 1.36, "learning_rate": 9.552258924104608e-05, "loss": 0.0127, "step": 525890 }, { "epoch": 1.36, "learning_rate": 9.55187010246746e-05, "loss": 0.0108, "step": 525900 }, { "epoch": 1.36, "learning_rate": 9.551481280830316e-05, "loss": 0.0089, "step": 525910 }, { "epoch": 1.36, "learning_rate": 9.551092459193167e-05, "loss": 0.0096, "step": 525920 }, { "epoch": 1.36, "learning_rate": 9.550703637556023e-05, "loss": 0.0079, "step": 525930 }, { "epoch": 1.36, "learning_rate": 9.550314815918876e-05, "loss": 0.0096, "step": 525940 }, { "epoch": 1.36, "learning_rate": 9.54992599428173e-05, "loss": 0.0101, "step": 525950 }, { "epoch": 1.36, "learning_rate": 9.549537172644583e-05, "loss": 0.0097, "step": 525960 }, { "epoch": 1.36, "learning_rate": 9.549148351007437e-05, "loss": 0.0079, "step": 525970 }, { "epoch": 1.36, "learning_rate": 9.54875952937029e-05, "loss": 0.0092, "step": 525980 }, { "epoch": 1.36, "learning_rate": 9.548370707733143e-05, "loss": 0.0075, "step": 525990 }, { "epoch": 1.36, "learning_rate": 9.547981886095997e-05, "loss": 0.0104, "step": 526000 }, { "epoch": 1.36, "eval_cer": 0.8816620968520765, "eval_loss": 0.006388062611222267, "eval_runtime": 107.8148, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.638, "step": 526000 }, { "epoch": 1.36, "learning_rate": 9.54759306445885e-05, "loss": 0.0081, "step": 526010 }, { "epoch": 1.36, "learning_rate": 9.547204242821704e-05, "loss": 0.009, "step": 526020 }, { "epoch": 1.36, "learning_rate": 9.546815421184557e-05, "loss": 0.0082, "step": 526030 }, { "epoch": 1.36, "learning_rate": 9.546426599547411e-05, "loss": 0.0087, "step": 526040 }, { "epoch": 1.36, "learning_rate": 9.546037777910263e-05, "loss": 0.0113, "step": 526050 }, { "epoch": 1.36, "learning_rate": 9.545648956273118e-05, "loss": 0.0105, "step": 526060 }, { "epoch": 1.36, "learning_rate": 9.54526013463597e-05, "loss": 0.0082, "step": 526070 }, { "epoch": 1.36, "learning_rate": 9.544871312998825e-05, "loss": 0.0066, "step": 526080 }, { "epoch": 1.36, "learning_rate": 9.544482491361677e-05, "loss": 0.0095, "step": 526090 }, { "epoch": 1.36, "learning_rate": 9.544093669724533e-05, "loss": 0.0118, "step": 526100 }, { "epoch": 1.36, "learning_rate": 9.543704848087386e-05, "loss": 0.0121, "step": 526110 }, { "epoch": 1.36, "learning_rate": 9.54331602645024e-05, "loss": 0.0086, "step": 526120 }, { "epoch": 1.36, "learning_rate": 9.542927204813093e-05, "loss": 0.0105, "step": 526130 }, { "epoch": 1.36, "learning_rate": 9.542538383175947e-05, "loss": 0.0095, "step": 526140 }, { "epoch": 1.36, "learning_rate": 9.5421495615388e-05, "loss": 0.0111, "step": 526150 }, { "epoch": 1.36, "learning_rate": 9.541760739901654e-05, "loss": 0.0116, "step": 526160 }, { "epoch": 1.36, "learning_rate": 9.541371918264507e-05, "loss": 0.0102, "step": 526170 }, { "epoch": 1.36, "learning_rate": 9.540983096627361e-05, "loss": 0.0121, "step": 526180 }, { "epoch": 1.36, "learning_rate": 9.540594274990214e-05, "loss": 0.0125, "step": 526190 }, { "epoch": 1.36, "learning_rate": 9.540205453353068e-05, "loss": 0.0096, "step": 526200 }, { "epoch": 1.36, "learning_rate": 9.53981663171592e-05, "loss": 0.0093, "step": 526210 }, { "epoch": 1.36, "learning_rate": 9.539427810078775e-05, "loss": 0.0086, "step": 526220 }, { "epoch": 1.36, "learning_rate": 9.539038988441628e-05, "loss": 0.0089, "step": 526230 }, { "epoch": 1.36, "learning_rate": 9.53865016680448e-05, "loss": 0.0118, "step": 526240 }, { "epoch": 1.36, "learning_rate": 9.538261345167335e-05, "loss": 0.0124, "step": 526250 }, { "epoch": 1.36, "learning_rate": 9.537872523530187e-05, "loss": 0.0074, "step": 526260 }, { "epoch": 1.36, "learning_rate": 9.537483701893043e-05, "loss": 0.0082, "step": 526270 }, { "epoch": 1.36, "learning_rate": 9.537094880255894e-05, "loss": 0.0077, "step": 526280 }, { "epoch": 1.36, "learning_rate": 9.53670605861875e-05, "loss": 0.0068, "step": 526290 }, { "epoch": 1.36, "learning_rate": 9.536317236981603e-05, "loss": 0.0079, "step": 526300 }, { "epoch": 1.36, "learning_rate": 9.535928415344457e-05, "loss": 0.0095, "step": 526310 }, { "epoch": 1.36, "learning_rate": 9.53553959370731e-05, "loss": 0.0082, "step": 526320 }, { "epoch": 1.36, "learning_rate": 9.535150772070164e-05, "loss": 0.0101, "step": 526330 }, { "epoch": 1.36, "learning_rate": 9.534761950433017e-05, "loss": 0.0093, "step": 526340 }, { "epoch": 1.36, "learning_rate": 9.534373128795871e-05, "loss": 0.0114, "step": 526350 }, { "epoch": 1.36, "learning_rate": 9.533984307158724e-05, "loss": 0.0131, "step": 526360 }, { "epoch": 1.36, "learning_rate": 9.533595485521578e-05, "loss": 0.0092, "step": 526370 }, { "epoch": 1.36, "learning_rate": 9.53320666388443e-05, "loss": 0.0098, "step": 526380 }, { "epoch": 1.36, "learning_rate": 9.532817842247285e-05, "loss": 0.0081, "step": 526390 }, { "epoch": 1.36, "learning_rate": 9.532429020610138e-05, "loss": 0.0105, "step": 526400 }, { "epoch": 1.36, "learning_rate": 9.532040198972992e-05, "loss": 0.0106, "step": 526410 }, { "epoch": 1.36, "learning_rate": 9.531651377335845e-05, "loss": 0.013, "step": 526420 }, { "epoch": 1.36, "learning_rate": 9.531262555698699e-05, "loss": 0.0071, "step": 526430 }, { "epoch": 1.36, "learning_rate": 9.530873734061551e-05, "loss": 0.008, "step": 526440 }, { "epoch": 1.36, "learning_rate": 9.530484912424407e-05, "loss": 0.0064, "step": 526450 }, { "epoch": 1.36, "learning_rate": 9.53009609078726e-05, "loss": 0.0119, "step": 526460 }, { "epoch": 1.36, "learning_rate": 9.529707269150114e-05, "loss": 0.0142, "step": 526470 }, { "epoch": 1.36, "learning_rate": 9.529318447512967e-05, "loss": 0.0112, "step": 526480 }, { "epoch": 1.36, "learning_rate": 9.52892962587582e-05, "loss": 0.0096, "step": 526490 }, { "epoch": 1.36, "learning_rate": 9.528540804238674e-05, "loss": 0.0108, "step": 526500 }, { "epoch": 1.36, "learning_rate": 9.528151982601527e-05, "loss": 0.009, "step": 526510 }, { "epoch": 1.36, "learning_rate": 9.527763160964381e-05, "loss": 0.0115, "step": 526520 }, { "epoch": 1.36, "learning_rate": 9.527374339327234e-05, "loss": 0.0099, "step": 526530 }, { "epoch": 1.36, "learning_rate": 9.526985517690088e-05, "loss": 0.0087, "step": 526540 }, { "epoch": 1.36, "learning_rate": 9.52659669605294e-05, "loss": 0.0097, "step": 526550 }, { "epoch": 1.36, "learning_rate": 9.526207874415795e-05, "loss": 0.0114, "step": 526560 }, { "epoch": 1.36, "learning_rate": 9.525819052778647e-05, "loss": 0.0099, "step": 526570 }, { "epoch": 1.36, "learning_rate": 9.525430231141502e-05, "loss": 0.0098, "step": 526580 }, { "epoch": 1.36, "learning_rate": 9.525041409504354e-05, "loss": 0.0104, "step": 526590 }, { "epoch": 1.37, "learning_rate": 9.524652587867209e-05, "loss": 0.0086, "step": 526600 }, { "epoch": 1.37, "learning_rate": 9.524263766230061e-05, "loss": 0.0085, "step": 526610 }, { "epoch": 1.37, "learning_rate": 9.523874944592917e-05, "loss": 0.0092, "step": 526620 }, { "epoch": 1.37, "learning_rate": 9.523486122955768e-05, "loss": 0.01, "step": 526630 }, { "epoch": 1.37, "learning_rate": 9.523097301318624e-05, "loss": 0.0107, "step": 526640 }, { "epoch": 1.37, "learning_rate": 9.522708479681477e-05, "loss": 0.0101, "step": 526650 }, { "epoch": 1.37, "learning_rate": 9.522319658044331e-05, "loss": 0.0062, "step": 526660 }, { "epoch": 1.37, "learning_rate": 9.521930836407184e-05, "loss": 0.0072, "step": 526670 }, { "epoch": 1.37, "learning_rate": 9.521542014770038e-05, "loss": 0.0093, "step": 526680 }, { "epoch": 1.37, "learning_rate": 9.52115319313289e-05, "loss": 0.0078, "step": 526690 }, { "epoch": 1.37, "learning_rate": 9.520764371495745e-05, "loss": 0.0101, "step": 526700 }, { "epoch": 1.37, "learning_rate": 9.520375549858598e-05, "loss": 0.0097, "step": 526710 }, { "epoch": 1.37, "learning_rate": 9.519986728221452e-05, "loss": 0.0097, "step": 526720 }, { "epoch": 1.37, "learning_rate": 9.519597906584305e-05, "loss": 0.0082, "step": 526730 }, { "epoch": 1.37, "learning_rate": 9.519209084947157e-05, "loss": 0.0124, "step": 526740 }, { "epoch": 1.37, "learning_rate": 9.518820263310012e-05, "loss": 0.0104, "step": 526750 }, { "epoch": 1.37, "learning_rate": 9.518431441672864e-05, "loss": 0.0093, "step": 526760 }, { "epoch": 1.37, "learning_rate": 9.518042620035719e-05, "loss": 0.0113, "step": 526770 }, { "epoch": 1.37, "learning_rate": 9.517653798398571e-05, "loss": 0.0098, "step": 526780 }, { "epoch": 1.37, "learning_rate": 9.517264976761426e-05, "loss": 0.0099, "step": 526790 }, { "epoch": 1.37, "learning_rate": 9.516876155124278e-05, "loss": 0.0111, "step": 526800 }, { "epoch": 1.37, "learning_rate": 9.516487333487134e-05, "loss": 0.0102, "step": 526810 }, { "epoch": 1.37, "learning_rate": 9.516098511849987e-05, "loss": 0.0077, "step": 526820 }, { "epoch": 1.37, "learning_rate": 9.515709690212841e-05, "loss": 0.0098, "step": 526830 }, { "epoch": 1.37, "learning_rate": 9.515320868575694e-05, "loss": 0.0125, "step": 526840 }, { "epoch": 1.37, "learning_rate": 9.514932046938548e-05, "loss": 0.0081, "step": 526850 }, { "epoch": 1.37, "learning_rate": 9.5145432253014e-05, "loss": 0.0095, "step": 526860 }, { "epoch": 1.37, "learning_rate": 9.514154403664255e-05, "loss": 0.0098, "step": 526870 }, { "epoch": 1.37, "learning_rate": 9.513765582027108e-05, "loss": 0.0078, "step": 526880 }, { "epoch": 1.37, "learning_rate": 9.513376760389962e-05, "loss": 0.0105, "step": 526890 }, { "epoch": 1.37, "learning_rate": 9.512987938752815e-05, "loss": 0.0104, "step": 526900 }, { "epoch": 1.37, "learning_rate": 9.512599117115669e-05, "loss": 0.0092, "step": 526910 }, { "epoch": 1.37, "learning_rate": 9.512210295478522e-05, "loss": 0.0068, "step": 526920 }, { "epoch": 1.37, "learning_rate": 9.511821473841376e-05, "loss": 0.0085, "step": 526930 }, { "epoch": 1.37, "learning_rate": 9.511432652204229e-05, "loss": 0.01, "step": 526940 }, { "epoch": 1.37, "learning_rate": 9.511043830567083e-05, "loss": 0.0095, "step": 526950 }, { "epoch": 1.37, "learning_rate": 9.510655008929935e-05, "loss": 0.0105, "step": 526960 }, { "epoch": 1.37, "learning_rate": 9.510266187292791e-05, "loss": 0.0123, "step": 526970 }, { "epoch": 1.37, "learning_rate": 9.509877365655644e-05, "loss": 0.0092, "step": 526980 }, { "epoch": 1.37, "learning_rate": 9.509488544018495e-05, "loss": 0.0066, "step": 526990 }, { "epoch": 1.37, "learning_rate": 9.509099722381351e-05, "loss": 0.0091, "step": 527000 }, { "epoch": 1.37, "eval_cer": 0.8816634964890108, "eval_loss": 0.006512734107673168, "eval_runtime": 108.0004, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.63, "step": 527000 }, { "epoch": 1.37, "learning_rate": 9.508710900744204e-05, "loss": 0.011, "step": 527010 }, { "epoch": 1.37, "learning_rate": 9.508322079107058e-05, "loss": 0.0086, "step": 527020 }, { "epoch": 1.37, "learning_rate": 9.50793325746991e-05, "loss": 0.0087, "step": 527030 }, { "epoch": 1.37, "learning_rate": 9.507544435832765e-05, "loss": 0.0106, "step": 527040 }, { "epoch": 1.37, "learning_rate": 9.507155614195618e-05, "loss": 0.0102, "step": 527050 }, { "epoch": 1.37, "learning_rate": 9.506766792558472e-05, "loss": 0.0098, "step": 527060 }, { "epoch": 1.37, "learning_rate": 9.506377970921325e-05, "loss": 0.0095, "step": 527070 }, { "epoch": 1.37, "learning_rate": 9.505989149284179e-05, "loss": 0.0102, "step": 527080 }, { "epoch": 1.37, "learning_rate": 9.505600327647031e-05, "loss": 0.0102, "step": 527090 }, { "epoch": 1.37, "learning_rate": 9.505211506009886e-05, "loss": 0.008, "step": 527100 }, { "epoch": 1.37, "learning_rate": 9.504822684372738e-05, "loss": 0.0108, "step": 527110 }, { "epoch": 1.37, "learning_rate": 9.504433862735593e-05, "loss": 0.0094, "step": 527120 }, { "epoch": 1.37, "learning_rate": 9.504045041098445e-05, "loss": 0.0128, "step": 527130 }, { "epoch": 1.37, "learning_rate": 9.503656219461301e-05, "loss": 0.0097, "step": 527140 }, { "epoch": 1.37, "learning_rate": 9.503267397824152e-05, "loss": 0.009, "step": 527150 }, { "epoch": 1.37, "learning_rate": 9.502878576187008e-05, "loss": 0.0104, "step": 527160 }, { "epoch": 1.37, "learning_rate": 9.502489754549861e-05, "loss": 0.0093, "step": 527170 }, { "epoch": 1.37, "learning_rate": 9.502100932912715e-05, "loss": 0.0102, "step": 527180 }, { "epoch": 1.37, "learning_rate": 9.501712111275568e-05, "loss": 0.0087, "step": 527190 }, { "epoch": 1.37, "learning_rate": 9.501323289638422e-05, "loss": 0.0111, "step": 527200 }, { "epoch": 1.37, "learning_rate": 9.500934468001275e-05, "loss": 0.008, "step": 527210 }, { "epoch": 1.37, "learning_rate": 9.500545646364129e-05, "loss": 0.0094, "step": 527220 }, { "epoch": 1.37, "learning_rate": 9.500156824726982e-05, "loss": 0.016, "step": 527230 }, { "epoch": 1.37, "learning_rate": 9.499768003089834e-05, "loss": 0.0098, "step": 527240 }, { "epoch": 1.37, "learning_rate": 9.499379181452689e-05, "loss": 0.0098, "step": 527250 }, { "epoch": 1.37, "learning_rate": 9.498990359815541e-05, "loss": 0.0074, "step": 527260 }, { "epoch": 1.37, "learning_rate": 9.498601538178396e-05, "loss": 0.0076, "step": 527270 }, { "epoch": 1.37, "learning_rate": 9.498212716541248e-05, "loss": 0.0096, "step": 527280 }, { "epoch": 1.37, "learning_rate": 9.497823894904103e-05, "loss": 0.0103, "step": 527290 }, { "epoch": 1.37, "learning_rate": 9.497435073266955e-05, "loss": 0.0071, "step": 527300 }, { "epoch": 1.37, "learning_rate": 9.49704625162981e-05, "loss": 0.0095, "step": 527310 }, { "epoch": 1.37, "learning_rate": 9.496657429992662e-05, "loss": 0.0135, "step": 527320 }, { "epoch": 1.37, "learning_rate": 9.496268608355518e-05, "loss": 0.0079, "step": 527330 }, { "epoch": 1.37, "learning_rate": 9.49587978671837e-05, "loss": 0.0075, "step": 527340 }, { "epoch": 1.37, "learning_rate": 9.495490965081225e-05, "loss": 0.011, "step": 527350 }, { "epoch": 1.37, "learning_rate": 9.495102143444078e-05, "loss": 0.0084, "step": 527360 }, { "epoch": 1.37, "learning_rate": 9.494713321806932e-05, "loss": 0.009, "step": 527370 }, { "epoch": 1.37, "learning_rate": 9.494324500169785e-05, "loss": 0.0134, "step": 527380 }, { "epoch": 1.37, "learning_rate": 9.493935678532639e-05, "loss": 0.0125, "step": 527390 }, { "epoch": 1.37, "learning_rate": 9.493546856895492e-05, "loss": 0.0089, "step": 527400 }, { "epoch": 1.37, "learning_rate": 9.493158035258346e-05, "loss": 0.0094, "step": 527410 }, { "epoch": 1.37, "learning_rate": 9.492769213621199e-05, "loss": 0.0127, "step": 527420 }, { "epoch": 1.37, "learning_rate": 9.492380391984053e-05, "loss": 0.0083, "step": 527430 }, { "epoch": 1.37, "learning_rate": 9.491991570346906e-05, "loss": 0.0104, "step": 527440 }, { "epoch": 1.37, "learning_rate": 9.49160274870976e-05, "loss": 0.0114, "step": 527450 }, { "epoch": 1.37, "learning_rate": 9.491213927072612e-05, "loss": 0.0107, "step": 527460 }, { "epoch": 1.37, "learning_rate": 9.490825105435467e-05, "loss": 0.0094, "step": 527470 }, { "epoch": 1.37, "learning_rate": 9.49043628379832e-05, "loss": 0.0081, "step": 527480 }, { "epoch": 1.37, "learning_rate": 9.490047462161172e-05, "loss": 0.0094, "step": 527490 }, { "epoch": 1.37, "learning_rate": 9.489658640524028e-05, "loss": 0.0087, "step": 527500 }, { "epoch": 1.37, "learning_rate": 9.489269818886879e-05, "loss": 0.0139, "step": 527510 }, { "epoch": 1.37, "learning_rate": 9.488880997249735e-05, "loss": 0.0086, "step": 527520 }, { "epoch": 1.37, "learning_rate": 9.488492175612588e-05, "loss": 0.0096, "step": 527530 }, { "epoch": 1.37, "learning_rate": 9.488103353975442e-05, "loss": 0.0074, "step": 527540 }, { "epoch": 1.37, "learning_rate": 9.487714532338295e-05, "loss": 0.0086, "step": 527550 }, { "epoch": 1.37, "learning_rate": 9.487325710701149e-05, "loss": 0.0101, "step": 527560 }, { "epoch": 1.37, "learning_rate": 9.486936889064002e-05, "loss": 0.0071, "step": 527570 }, { "epoch": 1.37, "learning_rate": 9.486548067426856e-05, "loss": 0.0102, "step": 527580 }, { "epoch": 1.37, "learning_rate": 9.486159245789708e-05, "loss": 0.0074, "step": 527590 }, { "epoch": 1.37, "learning_rate": 9.485770424152563e-05, "loss": 0.0094, "step": 527600 }, { "epoch": 1.37, "learning_rate": 9.485381602515415e-05, "loss": 0.0102, "step": 527610 }, { "epoch": 1.37, "learning_rate": 9.48499278087827e-05, "loss": 0.0071, "step": 527620 }, { "epoch": 1.37, "learning_rate": 9.484603959241122e-05, "loss": 0.0122, "step": 527630 }, { "epoch": 1.37, "learning_rate": 9.484215137603977e-05, "loss": 0.0094, "step": 527640 }, { "epoch": 1.37, "learning_rate": 9.48382631596683e-05, "loss": 0.011, "step": 527650 }, { "epoch": 1.37, "learning_rate": 9.483437494329684e-05, "loss": 0.009, "step": 527660 }, { "epoch": 1.37, "learning_rate": 9.483048672692536e-05, "loss": 0.011, "step": 527670 }, { "epoch": 1.37, "learning_rate": 9.482659851055392e-05, "loss": 0.0083, "step": 527680 }, { "epoch": 1.37, "learning_rate": 9.482271029418245e-05, "loss": 0.0122, "step": 527690 }, { "epoch": 1.37, "learning_rate": 9.481882207781099e-05, "loss": 0.0107, "step": 527700 }, { "epoch": 1.37, "learning_rate": 9.481493386143952e-05, "loss": 0.0087, "step": 527710 }, { "epoch": 1.37, "learning_rate": 9.481104564506806e-05, "loss": 0.0088, "step": 527720 }, { "epoch": 1.37, "learning_rate": 9.480715742869659e-05, "loss": 0.0113, "step": 527730 }, { "epoch": 1.37, "learning_rate": 9.480326921232511e-05, "loss": 0.0088, "step": 527740 }, { "epoch": 1.37, "learning_rate": 9.479938099595366e-05, "loss": 0.0082, "step": 527750 }, { "epoch": 1.37, "learning_rate": 9.479549277958218e-05, "loss": 0.0072, "step": 527760 }, { "epoch": 1.37, "learning_rate": 9.479160456321073e-05, "loss": 0.0117, "step": 527770 }, { "epoch": 1.37, "learning_rate": 9.478771634683925e-05, "loss": 0.0128, "step": 527780 }, { "epoch": 1.37, "learning_rate": 9.47838281304678e-05, "loss": 0.0107, "step": 527790 }, { "epoch": 1.37, "learning_rate": 9.477993991409632e-05, "loss": 0.012, "step": 527800 }, { "epoch": 1.37, "learning_rate": 9.477605169772487e-05, "loss": 0.0083, "step": 527810 }, { "epoch": 1.37, "learning_rate": 9.47721634813534e-05, "loss": 0.0102, "step": 527820 }, { "epoch": 1.37, "learning_rate": 9.476827526498194e-05, "loss": 0.0088, "step": 527830 }, { "epoch": 1.37, "learning_rate": 9.476438704861046e-05, "loss": 0.0135, "step": 527840 }, { "epoch": 1.37, "learning_rate": 9.476049883223902e-05, "loss": 0.0117, "step": 527850 }, { "epoch": 1.37, "learning_rate": 9.475661061586755e-05, "loss": 0.0096, "step": 527860 }, { "epoch": 1.37, "learning_rate": 9.475272239949609e-05, "loss": 0.0087, "step": 527870 }, { "epoch": 1.37, "learning_rate": 9.474883418312462e-05, "loss": 0.008, "step": 527880 }, { "epoch": 1.37, "learning_rate": 9.474494596675316e-05, "loss": 0.0082, "step": 527890 }, { "epoch": 1.37, "learning_rate": 9.474105775038169e-05, "loss": 0.008, "step": 527900 }, { "epoch": 1.37, "learning_rate": 9.473716953401023e-05, "loss": 0.0091, "step": 527910 }, { "epoch": 1.37, "learning_rate": 9.473328131763876e-05, "loss": 0.0125, "step": 527920 }, { "epoch": 1.37, "learning_rate": 9.47293931012673e-05, "loss": 0.0082, "step": 527930 }, { "epoch": 1.37, "learning_rate": 9.472550488489583e-05, "loss": 0.0126, "step": 527940 }, { "epoch": 1.37, "learning_rate": 9.472161666852437e-05, "loss": 0.0092, "step": 527950 }, { "epoch": 1.37, "learning_rate": 9.47177284521529e-05, "loss": 0.0094, "step": 527960 }, { "epoch": 1.37, "learning_rate": 9.471384023578144e-05, "loss": 0.0078, "step": 527970 }, { "epoch": 1.37, "learning_rate": 9.470995201940996e-05, "loss": 0.0116, "step": 527980 }, { "epoch": 1.37, "learning_rate": 9.470606380303849e-05, "loss": 0.008, "step": 527990 }, { "epoch": 1.37, "learning_rate": 9.470217558666703e-05, "loss": 0.0101, "step": 528000 }, { "epoch": 1.37, "eval_cer": 0.8816676953998133, "eval_loss": 0.006410685367882252, "eval_runtime": 108.0197, "eval_samples_per_second": 18.515, "eval_steps_per_second": 4.629, "step": 528000 }, { "epoch": 1.37, "learning_rate": 9.469828737029556e-05, "loss": 0.009, "step": 528010 }, { "epoch": 1.37, "learning_rate": 9.46943991539241e-05, "loss": 0.009, "step": 528020 }, { "epoch": 1.37, "learning_rate": 9.469051093755263e-05, "loss": 0.0081, "step": 528030 }, { "epoch": 1.37, "learning_rate": 9.468662272118119e-05, "loss": 0.0097, "step": 528040 }, { "epoch": 1.37, "learning_rate": 9.468273450480972e-05, "loss": 0.009, "step": 528050 }, { "epoch": 1.37, "learning_rate": 9.467884628843826e-05, "loss": 0.0121, "step": 528060 }, { "epoch": 1.37, "learning_rate": 9.467495807206679e-05, "loss": 0.0086, "step": 528070 }, { "epoch": 1.37, "learning_rate": 9.467106985569533e-05, "loss": 0.0085, "step": 528080 }, { "epoch": 1.37, "learning_rate": 9.466718163932386e-05, "loss": 0.0104, "step": 528090 }, { "epoch": 1.37, "learning_rate": 9.46632934229524e-05, "loss": 0.011, "step": 528100 }, { "epoch": 1.37, "learning_rate": 9.465940520658092e-05, "loss": 0.0101, "step": 528110 }, { "epoch": 1.37, "learning_rate": 9.465551699020947e-05, "loss": 0.011, "step": 528120 }, { "epoch": 1.37, "learning_rate": 9.4651628773838e-05, "loss": 0.012, "step": 528130 }, { "epoch": 1.37, "learning_rate": 9.464774055746654e-05, "loss": 0.0115, "step": 528140 }, { "epoch": 1.37, "learning_rate": 9.464385234109506e-05, "loss": 0.0126, "step": 528150 }, { "epoch": 1.37, "learning_rate": 9.46399641247236e-05, "loss": 0.008, "step": 528160 }, { "epoch": 1.37, "learning_rate": 9.463607590835213e-05, "loss": 0.0117, "step": 528170 }, { "epoch": 1.37, "learning_rate": 9.463218769198068e-05, "loss": 0.0084, "step": 528180 }, { "epoch": 1.37, "learning_rate": 9.46282994756092e-05, "loss": 0.0121, "step": 528190 }, { "epoch": 1.37, "learning_rate": 9.462441125923776e-05, "loss": 0.0089, "step": 528200 }, { "epoch": 1.37, "learning_rate": 9.462052304286629e-05, "loss": 0.0103, "step": 528210 }, { "epoch": 1.37, "learning_rate": 9.46166348264948e-05, "loss": 0.0094, "step": 528220 }, { "epoch": 1.37, "learning_rate": 9.461274661012336e-05, "loss": 0.0113, "step": 528230 }, { "epoch": 1.37, "learning_rate": 9.460885839375188e-05, "loss": 0.0106, "step": 528240 }, { "epoch": 1.37, "learning_rate": 9.460497017738043e-05, "loss": 0.0112, "step": 528250 }, { "epoch": 1.37, "learning_rate": 9.460108196100895e-05, "loss": 0.012, "step": 528260 }, { "epoch": 1.37, "learning_rate": 9.45971937446375e-05, "loss": 0.0087, "step": 528270 }, { "epoch": 1.37, "learning_rate": 9.459330552826602e-05, "loss": 0.0084, "step": 528280 }, { "epoch": 1.37, "learning_rate": 9.458941731189457e-05, "loss": 0.0091, "step": 528290 }, { "epoch": 1.37, "learning_rate": 9.45855290955231e-05, "loss": 0.0111, "step": 528300 }, { "epoch": 1.37, "learning_rate": 9.458164087915164e-05, "loss": 0.0135, "step": 528310 }, { "epoch": 1.37, "learning_rate": 9.457775266278016e-05, "loss": 0.012, "step": 528320 }, { "epoch": 1.37, "learning_rate": 9.45738644464087e-05, "loss": 0.0093, "step": 528330 }, { "epoch": 1.37, "learning_rate": 9.456997623003723e-05, "loss": 0.0076, "step": 528340 }, { "epoch": 1.37, "learning_rate": 9.456608801366578e-05, "loss": 0.0066, "step": 528350 }, { "epoch": 1.37, "learning_rate": 9.45621997972943e-05, "loss": 0.0113, "step": 528360 }, { "epoch": 1.37, "learning_rate": 9.455831158092286e-05, "loss": 0.0087, "step": 528370 }, { "epoch": 1.37, "learning_rate": 9.455442336455137e-05, "loss": 0.0086, "step": 528380 }, { "epoch": 1.37, "learning_rate": 9.455053514817993e-05, "loss": 0.0142, "step": 528390 }, { "epoch": 1.37, "learning_rate": 9.454664693180846e-05, "loss": 0.0118, "step": 528400 }, { "epoch": 1.37, "learning_rate": 9.4542758715437e-05, "loss": 0.0101, "step": 528410 }, { "epoch": 1.37, "learning_rate": 9.453887049906553e-05, "loss": 0.0101, "step": 528420 }, { "epoch": 1.37, "learning_rate": 9.453498228269407e-05, "loss": 0.0121, "step": 528430 }, { "epoch": 1.37, "learning_rate": 9.45310940663226e-05, "loss": 0.0121, "step": 528440 }, { "epoch": 1.37, "learning_rate": 9.452720584995114e-05, "loss": 0.0098, "step": 528450 }, { "epoch": 1.37, "learning_rate": 9.452331763357967e-05, "loss": 0.0075, "step": 528460 }, { "epoch": 1.37, "learning_rate": 9.45194294172082e-05, "loss": 0.0118, "step": 528470 }, { "epoch": 1.37, "learning_rate": 9.451554120083674e-05, "loss": 0.0121, "step": 528480 }, { "epoch": 1.37, "learning_rate": 9.451165298446526e-05, "loss": 0.0093, "step": 528490 }, { "epoch": 1.37, "learning_rate": 9.45077647680938e-05, "loss": 0.0107, "step": 528500 }, { "epoch": 1.37, "learning_rate": 9.450387655172233e-05, "loss": 0.0113, "step": 528510 }, { "epoch": 1.37, "learning_rate": 9.449998833535087e-05, "loss": 0.0091, "step": 528520 }, { "epoch": 1.37, "learning_rate": 9.44961001189794e-05, "loss": 0.0116, "step": 528530 }, { "epoch": 1.37, "learning_rate": 9.449221190260794e-05, "loss": 0.0094, "step": 528540 }, { "epoch": 1.37, "learning_rate": 9.448832368623647e-05, "loss": 0.0096, "step": 528550 }, { "epoch": 1.37, "learning_rate": 9.448443546986503e-05, "loss": 0.0105, "step": 528560 }, { "epoch": 1.37, "learning_rate": 9.448054725349356e-05, "loss": 0.0077, "step": 528570 }, { "epoch": 1.37, "learning_rate": 9.44766590371221e-05, "loss": 0.0085, "step": 528580 }, { "epoch": 1.37, "learning_rate": 9.447277082075063e-05, "loss": 0.0085, "step": 528590 }, { "epoch": 1.37, "learning_rate": 9.446888260437917e-05, "loss": 0.0113, "step": 528600 }, { "epoch": 1.37, "learning_rate": 9.44649943880077e-05, "loss": 0.0109, "step": 528610 }, { "epoch": 1.37, "learning_rate": 9.446110617163624e-05, "loss": 0.0135, "step": 528620 }, { "epoch": 1.37, "learning_rate": 9.445721795526476e-05, "loss": 0.0094, "step": 528630 }, { "epoch": 1.37, "learning_rate": 9.44533297388933e-05, "loss": 0.0098, "step": 528640 }, { "epoch": 1.37, "learning_rate": 9.444944152252183e-05, "loss": 0.0111, "step": 528650 }, { "epoch": 1.37, "learning_rate": 9.444555330615038e-05, "loss": 0.0092, "step": 528660 }, { "epoch": 1.37, "learning_rate": 9.44416650897789e-05, "loss": 0.0096, "step": 528670 }, { "epoch": 1.37, "learning_rate": 9.443777687340745e-05, "loss": 0.0109, "step": 528680 }, { "epoch": 1.37, "learning_rate": 9.443388865703597e-05, "loss": 0.0089, "step": 528690 }, { "epoch": 1.37, "learning_rate": 9.443000044066452e-05, "loss": 0.0097, "step": 528700 }, { "epoch": 1.37, "learning_rate": 9.442611222429304e-05, "loss": 0.0078, "step": 528710 }, { "epoch": 1.37, "learning_rate": 9.442222400792157e-05, "loss": 0.0107, "step": 528720 }, { "epoch": 1.37, "learning_rate": 9.441833579155013e-05, "loss": 0.0074, "step": 528730 }, { "epoch": 1.37, "learning_rate": 9.441444757517864e-05, "loss": 0.0095, "step": 528740 }, { "epoch": 1.37, "learning_rate": 9.44105593588072e-05, "loss": 0.0112, "step": 528750 }, { "epoch": 1.37, "learning_rate": 9.440667114243572e-05, "loss": 0.0094, "step": 528760 }, { "epoch": 1.37, "learning_rate": 9.440278292606427e-05, "loss": 0.0125, "step": 528770 }, { "epoch": 1.37, "learning_rate": 9.43988947096928e-05, "loss": 0.0099, "step": 528780 }, { "epoch": 1.37, "learning_rate": 9.439500649332134e-05, "loss": 0.0111, "step": 528790 }, { "epoch": 1.37, "learning_rate": 9.439111827694986e-05, "loss": 0.0087, "step": 528800 }, { "epoch": 1.37, "learning_rate": 9.43872300605784e-05, "loss": 0.0087, "step": 528810 }, { "epoch": 1.37, "learning_rate": 9.438334184420693e-05, "loss": 0.0128, "step": 528820 }, { "epoch": 1.37, "learning_rate": 9.437945362783548e-05, "loss": 0.0096, "step": 528830 }, { "epoch": 1.37, "learning_rate": 9.4375565411464e-05, "loss": 0.0097, "step": 528840 }, { "epoch": 1.37, "learning_rate": 9.437167719509255e-05, "loss": 0.0119, "step": 528850 }, { "epoch": 1.37, "learning_rate": 9.436778897872107e-05, "loss": 0.0119, "step": 528860 }, { "epoch": 1.37, "learning_rate": 9.436390076234961e-05, "loss": 0.0118, "step": 528870 }, { "epoch": 1.37, "learning_rate": 9.436001254597814e-05, "loss": 0.01, "step": 528880 }, { "epoch": 1.37, "learning_rate": 9.43561243296067e-05, "loss": 0.0081, "step": 528890 }, { "epoch": 1.37, "learning_rate": 9.435223611323521e-05, "loss": 0.0124, "step": 528900 }, { "epoch": 1.37, "learning_rate": 9.434834789686377e-05, "loss": 0.0114, "step": 528910 }, { "epoch": 1.37, "learning_rate": 9.43444596804923e-05, "loss": 0.0099, "step": 528920 }, { "epoch": 1.37, "learning_rate": 9.434057146412084e-05, "loss": 0.0074, "step": 528930 }, { "epoch": 1.37, "learning_rate": 9.433668324774937e-05, "loss": 0.0084, "step": 528940 }, { "epoch": 1.37, "learning_rate": 9.433279503137791e-05, "loss": 0.009, "step": 528950 }, { "epoch": 1.37, "learning_rate": 9.432890681500644e-05, "loss": 0.0098, "step": 528960 }, { "epoch": 1.37, "learning_rate": 9.432501859863496e-05, "loss": 0.0105, "step": 528970 }, { "epoch": 1.37, "learning_rate": 9.43211303822635e-05, "loss": 0.0095, "step": 528980 }, { "epoch": 1.37, "learning_rate": 9.431724216589203e-05, "loss": 0.0076, "step": 528990 }, { "epoch": 1.37, "learning_rate": 9.431335394952057e-05, "loss": 0.0091, "step": 529000 }, { "epoch": 1.37, "eval_cer": 0.8816816917691551, "eval_loss": 0.006558180321007967, "eval_runtime": 107.9692, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 529000 }, { "epoch": 1.37, "learning_rate": 9.43094657331491e-05, "loss": 0.0104, "step": 529010 }, { "epoch": 1.37, "learning_rate": 9.430557751677764e-05, "loss": 0.0106, "step": 529020 }, { "epoch": 1.37, "learning_rate": 9.430168930040617e-05, "loss": 0.0078, "step": 529030 }, { "epoch": 1.37, "learning_rate": 9.429780108403471e-05, "loss": 0.0066, "step": 529040 }, { "epoch": 1.37, "learning_rate": 9.429391286766324e-05, "loss": 0.0099, "step": 529050 }, { "epoch": 1.37, "learning_rate": 9.429002465129178e-05, "loss": 0.0115, "step": 529060 }, { "epoch": 1.37, "learning_rate": 9.428613643492031e-05, "loss": 0.0097, "step": 529070 }, { "epoch": 1.37, "learning_rate": 9.428224821854887e-05, "loss": 0.012, "step": 529080 }, { "epoch": 1.37, "learning_rate": 9.42783600021774e-05, "loss": 0.0087, "step": 529090 }, { "epoch": 1.37, "learning_rate": 9.427447178580594e-05, "loss": 0.0115, "step": 529100 }, { "epoch": 1.37, "learning_rate": 9.427058356943447e-05, "loss": 0.0087, "step": 529110 }, { "epoch": 1.37, "learning_rate": 9.426669535306301e-05, "loss": 0.0101, "step": 529120 }, { "epoch": 1.37, "learning_rate": 9.426280713669153e-05, "loss": 0.0109, "step": 529130 }, { "epoch": 1.37, "learning_rate": 9.425891892032008e-05, "loss": 0.0082, "step": 529140 }, { "epoch": 1.37, "learning_rate": 9.42550307039486e-05, "loss": 0.0087, "step": 529150 }, { "epoch": 1.37, "learning_rate": 9.425114248757715e-05, "loss": 0.0083, "step": 529160 }, { "epoch": 1.37, "learning_rate": 9.424725427120567e-05, "loss": 0.008, "step": 529170 }, { "epoch": 1.37, "learning_rate": 9.424336605483422e-05, "loss": 0.0094, "step": 529180 }, { "epoch": 1.37, "learning_rate": 9.423947783846274e-05, "loss": 0.0096, "step": 529190 }, { "epoch": 1.37, "learning_rate": 9.423558962209129e-05, "loss": 0.0086, "step": 529200 }, { "epoch": 1.37, "learning_rate": 9.423170140571981e-05, "loss": 0.0126, "step": 529210 }, { "epoch": 1.37, "learning_rate": 9.422781318934834e-05, "loss": 0.0105, "step": 529220 }, { "epoch": 1.37, "learning_rate": 9.422392497297688e-05, "loss": 0.0079, "step": 529230 }, { "epoch": 1.37, "learning_rate": 9.422003675660541e-05, "loss": 0.0068, "step": 529240 }, { "epoch": 1.37, "learning_rate": 9.421614854023395e-05, "loss": 0.009, "step": 529250 }, { "epoch": 1.37, "learning_rate": 9.421226032386248e-05, "loss": 0.0068, "step": 529260 }, { "epoch": 1.37, "learning_rate": 9.420837210749104e-05, "loss": 0.0085, "step": 529270 }, { "epoch": 1.37, "learning_rate": 9.420448389111956e-05, "loss": 0.0132, "step": 529280 }, { "epoch": 1.37, "learning_rate": 9.42005956747481e-05, "loss": 0.009, "step": 529290 }, { "epoch": 1.37, "learning_rate": 9.419670745837663e-05, "loss": 0.0116, "step": 529300 }, { "epoch": 1.37, "learning_rate": 9.419281924200518e-05, "loss": 0.0135, "step": 529310 }, { "epoch": 1.37, "learning_rate": 9.41889310256337e-05, "loss": 0.0082, "step": 529320 }, { "epoch": 1.37, "learning_rate": 9.418504280926225e-05, "loss": 0.0114, "step": 529330 }, { "epoch": 1.37, "learning_rate": 9.418115459289077e-05, "loss": 0.0071, "step": 529340 }, { "epoch": 1.37, "learning_rate": 9.417726637651932e-05, "loss": 0.0112, "step": 529350 }, { "epoch": 1.37, "learning_rate": 9.417337816014784e-05, "loss": 0.0096, "step": 529360 }, { "epoch": 1.37, "learning_rate": 9.416948994377639e-05, "loss": 0.0103, "step": 529370 }, { "epoch": 1.37, "learning_rate": 9.416560172740491e-05, "loss": 0.0107, "step": 529380 }, { "epoch": 1.37, "learning_rate": 9.416171351103345e-05, "loss": 0.0093, "step": 529390 }, { "epoch": 1.37, "learning_rate": 9.415782529466198e-05, "loss": 0.0132, "step": 529400 }, { "epoch": 1.37, "learning_rate": 9.415393707829052e-05, "loss": 0.011, "step": 529410 }, { "epoch": 1.37, "learning_rate": 9.415004886191905e-05, "loss": 0.0119, "step": 529420 }, { "epoch": 1.37, "learning_rate": 9.414616064554761e-05, "loss": 0.0108, "step": 529430 }, { "epoch": 1.37, "learning_rate": 9.414227242917614e-05, "loss": 0.0106, "step": 529440 }, { "epoch": 1.37, "learning_rate": 9.413838421280468e-05, "loss": 0.0096, "step": 529450 }, { "epoch": 1.37, "learning_rate": 9.41344959964332e-05, "loss": 0.0096, "step": 529460 }, { "epoch": 1.37, "learning_rate": 9.413060778006173e-05, "loss": 0.0089, "step": 529470 }, { "epoch": 1.37, "learning_rate": 9.412671956369028e-05, "loss": 0.0087, "step": 529480 }, { "epoch": 1.37, "learning_rate": 9.41228313473188e-05, "loss": 0.0111, "step": 529490 }, { "epoch": 1.37, "learning_rate": 9.411894313094735e-05, "loss": 0.0072, "step": 529500 }, { "epoch": 1.37, "learning_rate": 9.411505491457587e-05, "loss": 0.0126, "step": 529510 }, { "epoch": 1.37, "learning_rate": 9.411116669820441e-05, "loss": 0.0082, "step": 529520 }, { "epoch": 1.37, "learning_rate": 9.410727848183294e-05, "loss": 0.0139, "step": 529530 }, { "epoch": 1.37, "learning_rate": 9.410339026546148e-05, "loss": 0.0105, "step": 529540 }, { "epoch": 1.37, "learning_rate": 9.409950204909001e-05, "loss": 0.0087, "step": 529550 }, { "epoch": 1.37, "learning_rate": 9.409561383271855e-05, "loss": 0.0106, "step": 529560 }, { "epoch": 1.37, "learning_rate": 9.409172561634708e-05, "loss": 0.0095, "step": 529570 }, { "epoch": 1.37, "learning_rate": 9.408783739997562e-05, "loss": 0.0095, "step": 529580 }, { "epoch": 1.37, "learning_rate": 9.408394918360415e-05, "loss": 0.0094, "step": 529590 }, { "epoch": 1.37, "learning_rate": 9.408006096723271e-05, "loss": 0.0093, "step": 529600 }, { "epoch": 1.37, "learning_rate": 9.407617275086122e-05, "loss": 0.0063, "step": 529610 }, { "epoch": 1.37, "learning_rate": 9.407228453448978e-05, "loss": 0.0092, "step": 529620 }, { "epoch": 1.37, "learning_rate": 9.40683963181183e-05, "loss": 0.0119, "step": 529630 }, { "epoch": 1.37, "learning_rate": 9.406450810174685e-05, "loss": 0.0101, "step": 529640 }, { "epoch": 1.37, "learning_rate": 9.406061988537537e-05, "loss": 0.011, "step": 529650 }, { "epoch": 1.37, "learning_rate": 9.405673166900392e-05, "loss": 0.0117, "step": 529660 }, { "epoch": 1.37, "learning_rate": 9.405284345263244e-05, "loss": 0.013, "step": 529670 }, { "epoch": 1.37, "learning_rate": 9.404895523626099e-05, "loss": 0.0111, "step": 529680 }, { "epoch": 1.37, "learning_rate": 9.404506701988951e-05, "loss": 0.0086, "step": 529690 }, { "epoch": 1.37, "learning_rate": 9.404117880351806e-05, "loss": 0.0123, "step": 529700 }, { "epoch": 1.37, "learning_rate": 9.403729058714658e-05, "loss": 0.0078, "step": 529710 }, { "epoch": 1.37, "learning_rate": 9.403340237077511e-05, "loss": 0.0072, "step": 529720 }, { "epoch": 1.37, "learning_rate": 9.402951415440365e-05, "loss": 0.0097, "step": 529730 }, { "epoch": 1.37, "learning_rate": 9.402562593803218e-05, "loss": 0.0087, "step": 529740 }, { "epoch": 1.37, "learning_rate": 9.402173772166072e-05, "loss": 0.0077, "step": 529750 }, { "epoch": 1.37, "learning_rate": 9.401784950528925e-05, "loss": 0.0077, "step": 529760 }, { "epoch": 1.37, "learning_rate": 9.401396128891779e-05, "loss": 0.0101, "step": 529770 }, { "epoch": 1.37, "learning_rate": 9.401007307254632e-05, "loss": 0.0097, "step": 529780 }, { "epoch": 1.37, "learning_rate": 9.400618485617488e-05, "loss": 0.0096, "step": 529790 }, { "epoch": 1.37, "learning_rate": 9.40022966398034e-05, "loss": 0.0108, "step": 529800 }, { "epoch": 1.37, "learning_rate": 9.399840842343195e-05, "loss": 0.0094, "step": 529810 }, { "epoch": 1.37, "learning_rate": 9.399452020706047e-05, "loss": 0.0112, "step": 529820 }, { "epoch": 1.37, "learning_rate": 9.399063199068902e-05, "loss": 0.0085, "step": 529830 }, { "epoch": 1.37, "learning_rate": 9.398674377431754e-05, "loss": 0.0081, "step": 529840 }, { "epoch": 1.37, "learning_rate": 9.398285555794609e-05, "loss": 0.0106, "step": 529850 }, { "epoch": 1.37, "learning_rate": 9.397896734157461e-05, "loss": 0.0107, "step": 529860 }, { "epoch": 1.37, "learning_rate": 9.397507912520316e-05, "loss": 0.0097, "step": 529870 }, { "epoch": 1.37, "learning_rate": 9.397119090883168e-05, "loss": 0.0101, "step": 529880 }, { "epoch": 1.37, "learning_rate": 9.396730269246023e-05, "loss": 0.0137, "step": 529890 }, { "epoch": 1.37, "learning_rate": 9.396341447608875e-05, "loss": 0.0101, "step": 529900 }, { "epoch": 1.37, "learning_rate": 9.39595262597173e-05, "loss": 0.0133, "step": 529910 }, { "epoch": 1.37, "learning_rate": 9.395563804334582e-05, "loss": 0.0097, "step": 529920 }, { "epoch": 1.37, "learning_rate": 9.395174982697436e-05, "loss": 0.0115, "step": 529930 }, { "epoch": 1.37, "learning_rate": 9.394786161060289e-05, "loss": 0.0092, "step": 529940 }, { "epoch": 1.37, "learning_rate": 9.394397339423145e-05, "loss": 0.0095, "step": 529950 }, { "epoch": 1.37, "learning_rate": 9.394008517785998e-05, "loss": 0.009, "step": 529960 }, { "epoch": 1.37, "learning_rate": 9.393619696148849e-05, "loss": 0.0113, "step": 529970 }, { "epoch": 1.37, "learning_rate": 9.393230874511705e-05, "loss": 0.0078, "step": 529980 }, { "epoch": 1.37, "learning_rate": 9.392842052874557e-05, "loss": 0.0088, "step": 529990 }, { "epoch": 1.37, "learning_rate": 9.392453231237412e-05, "loss": 0.0123, "step": 530000 }, { "epoch": 1.37, "eval_cer": 0.8816858906799576, "eval_loss": 0.0064879064448177814, "eval_runtime": 107.9436, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 530000 }, { "epoch": 1.37, "learning_rate": 9.392064409600264e-05, "loss": 0.0073, "step": 530010 }, { "epoch": 1.37, "learning_rate": 9.391675587963119e-05, "loss": 0.009, "step": 530020 }, { "epoch": 1.37, "learning_rate": 9.391286766325971e-05, "loss": 0.0111, "step": 530030 }, { "epoch": 1.37, "learning_rate": 9.390897944688825e-05, "loss": 0.0094, "step": 530040 }, { "epoch": 1.37, "learning_rate": 9.390509123051678e-05, "loss": 0.0087, "step": 530050 }, { "epoch": 1.37, "learning_rate": 9.390120301414532e-05, "loss": 0.0112, "step": 530060 }, { "epoch": 1.37, "learning_rate": 9.389731479777385e-05, "loss": 0.0121, "step": 530070 }, { "epoch": 1.37, "learning_rate": 9.38934265814024e-05, "loss": 0.0092, "step": 530080 }, { "epoch": 1.37, "learning_rate": 9.388953836503092e-05, "loss": 0.0122, "step": 530090 }, { "epoch": 1.37, "learning_rate": 9.388565014865946e-05, "loss": 0.0135, "step": 530100 }, { "epoch": 1.37, "learning_rate": 9.388176193228799e-05, "loss": 0.0086, "step": 530110 }, { "epoch": 1.37, "learning_rate": 9.387787371591655e-05, "loss": 0.0175, "step": 530120 }, { "epoch": 1.37, "learning_rate": 9.387398549954506e-05, "loss": 0.0096, "step": 530130 }, { "epoch": 1.37, "learning_rate": 9.387009728317362e-05, "loss": 0.0089, "step": 530140 }, { "epoch": 1.37, "learning_rate": 9.386620906680215e-05, "loss": 0.0082, "step": 530150 }, { "epoch": 1.37, "learning_rate": 9.386232085043069e-05, "loss": 0.0092, "step": 530160 }, { "epoch": 1.37, "learning_rate": 9.385843263405921e-05, "loss": 0.0098, "step": 530170 }, { "epoch": 1.37, "learning_rate": 9.385454441768776e-05, "loss": 0.0092, "step": 530180 }, { "epoch": 1.37, "learning_rate": 9.385065620131628e-05, "loss": 0.0077, "step": 530190 }, { "epoch": 1.37, "learning_rate": 9.384676798494483e-05, "loss": 0.0191, "step": 530200 }, { "epoch": 1.37, "learning_rate": 9.384287976857335e-05, "loss": 0.0118, "step": 530210 }, { "epoch": 1.37, "learning_rate": 9.383899155220188e-05, "loss": 0.0122, "step": 530220 }, { "epoch": 1.37, "learning_rate": 9.383510333583042e-05, "loss": 0.009, "step": 530230 }, { "epoch": 1.37, "learning_rate": 9.383121511945895e-05, "loss": 0.0086, "step": 530240 }, { "epoch": 1.37, "learning_rate": 9.38273269030875e-05, "loss": 0.0098, "step": 530250 }, { "epoch": 1.37, "learning_rate": 9.382343868671602e-05, "loss": 0.0128, "step": 530260 }, { "epoch": 1.37, "learning_rate": 9.381955047034456e-05, "loss": 0.0089, "step": 530270 }, { "epoch": 1.37, "learning_rate": 9.381566225397309e-05, "loss": 0.008, "step": 530280 }, { "epoch": 1.37, "learning_rate": 9.381177403760163e-05, "loss": 0.0069, "step": 530290 }, { "epoch": 1.37, "learning_rate": 9.380788582123016e-05, "loss": 0.0118, "step": 530300 }, { "epoch": 1.37, "learning_rate": 9.380399760485872e-05, "loss": 0.0079, "step": 530310 }, { "epoch": 1.37, "learning_rate": 9.380010938848724e-05, "loss": 0.0075, "step": 530320 }, { "epoch": 1.37, "learning_rate": 9.379622117211579e-05, "loss": 0.0079, "step": 530330 }, { "epoch": 1.37, "learning_rate": 9.379233295574431e-05, "loss": 0.0109, "step": 530340 }, { "epoch": 1.37, "learning_rate": 9.378844473937286e-05, "loss": 0.0093, "step": 530350 }, { "epoch": 1.37, "learning_rate": 9.378455652300138e-05, "loss": 0.0089, "step": 530360 }, { "epoch": 1.37, "learning_rate": 9.378066830662993e-05, "loss": 0.0103, "step": 530370 }, { "epoch": 1.37, "learning_rate": 9.377678009025845e-05, "loss": 0.0112, "step": 530380 }, { "epoch": 1.37, "learning_rate": 9.3772891873887e-05, "loss": 0.0119, "step": 530390 }, { "epoch": 1.37, "learning_rate": 9.376900365751552e-05, "loss": 0.0091, "step": 530400 }, { "epoch": 1.37, "learning_rate": 9.376511544114406e-05, "loss": 0.0076, "step": 530410 }, { "epoch": 1.37, "learning_rate": 9.376122722477259e-05, "loss": 0.0088, "step": 530420 }, { "epoch": 1.37, "learning_rate": 9.375733900840113e-05, "loss": 0.009, "step": 530430 }, { "epoch": 1.37, "learning_rate": 9.375345079202966e-05, "loss": 0.0084, "step": 530440 }, { "epoch": 1.38, "learning_rate": 9.37495625756582e-05, "loss": 0.0099, "step": 530450 }, { "epoch": 1.38, "learning_rate": 9.374567435928673e-05, "loss": 0.0085, "step": 530460 }, { "epoch": 1.38, "learning_rate": 9.374178614291526e-05, "loss": 0.0088, "step": 530470 }, { "epoch": 1.38, "learning_rate": 9.373789792654382e-05, "loss": 0.0092, "step": 530480 }, { "epoch": 1.38, "learning_rate": 9.373400971017233e-05, "loss": 0.0115, "step": 530490 }, { "epoch": 1.38, "learning_rate": 9.373012149380089e-05, "loss": 0.0103, "step": 530500 }, { "epoch": 1.38, "learning_rate": 9.372623327742941e-05, "loss": 0.0087, "step": 530510 }, { "epoch": 1.38, "learning_rate": 9.372234506105796e-05, "loss": 0.0078, "step": 530520 }, { "epoch": 1.38, "learning_rate": 9.371845684468648e-05, "loss": 0.0091, "step": 530530 }, { "epoch": 1.38, "learning_rate": 9.371456862831502e-05, "loss": 0.0112, "step": 530540 }, { "epoch": 1.38, "learning_rate": 9.371068041194355e-05, "loss": 0.0108, "step": 530550 }, { "epoch": 1.38, "learning_rate": 9.37067921955721e-05, "loss": 0.012, "step": 530560 }, { "epoch": 1.38, "learning_rate": 9.370290397920062e-05, "loss": 0.009, "step": 530570 }, { "epoch": 1.38, "learning_rate": 9.369901576282916e-05, "loss": 0.009, "step": 530580 }, { "epoch": 1.38, "learning_rate": 9.369512754645769e-05, "loss": 0.0144, "step": 530590 }, { "epoch": 1.38, "learning_rate": 9.369123933008623e-05, "loss": 0.0092, "step": 530600 }, { "epoch": 1.38, "learning_rate": 9.368735111371476e-05, "loss": 0.0102, "step": 530610 }, { "epoch": 1.38, "learning_rate": 9.36834628973433e-05, "loss": 0.0101, "step": 530620 }, { "epoch": 1.38, "learning_rate": 9.367957468097183e-05, "loss": 0.012, "step": 530630 }, { "epoch": 1.38, "learning_rate": 9.367568646460037e-05, "loss": 0.0109, "step": 530640 }, { "epoch": 1.38, "learning_rate": 9.36717982482289e-05, "loss": 0.0145, "step": 530650 }, { "epoch": 1.38, "learning_rate": 9.366791003185746e-05, "loss": 0.0065, "step": 530660 }, { "epoch": 1.38, "learning_rate": 9.366402181548598e-05, "loss": 0.0106, "step": 530670 }, { "epoch": 1.38, "learning_rate": 9.366013359911453e-05, "loss": 0.0089, "step": 530680 }, { "epoch": 1.38, "learning_rate": 9.365624538274305e-05, "loss": 0.0087, "step": 530690 }, { "epoch": 1.38, "learning_rate": 9.36523571663716e-05, "loss": 0.0078, "step": 530700 }, { "epoch": 1.38, "learning_rate": 9.364846895000012e-05, "loss": 0.0107, "step": 530710 }, { "epoch": 1.38, "learning_rate": 9.364458073362865e-05, "loss": 0.008, "step": 530720 }, { "epoch": 1.38, "learning_rate": 9.36406925172572e-05, "loss": 0.0113, "step": 530730 }, { "epoch": 1.38, "learning_rate": 9.363680430088572e-05, "loss": 0.0156, "step": 530740 }, { "epoch": 1.38, "learning_rate": 9.363291608451426e-05, "loss": 0.0102, "step": 530750 }, { "epoch": 1.38, "learning_rate": 9.362902786814279e-05, "loss": 0.0115, "step": 530760 }, { "epoch": 1.38, "learning_rate": 9.362513965177133e-05, "loss": 0.0185, "step": 530770 }, { "epoch": 1.38, "learning_rate": 9.362125143539986e-05, "loss": 0.0083, "step": 530780 }, { "epoch": 1.38, "learning_rate": 9.36173632190284e-05, "loss": 0.0081, "step": 530790 }, { "epoch": 1.38, "learning_rate": 9.361347500265693e-05, "loss": 0.01, "step": 530800 }, { "epoch": 1.38, "learning_rate": 9.360958678628547e-05, "loss": 0.0103, "step": 530810 }, { "epoch": 1.38, "learning_rate": 9.3605698569914e-05, "loss": 0.0115, "step": 530820 }, { "epoch": 1.38, "learning_rate": 9.360181035354256e-05, "loss": 0.0119, "step": 530830 }, { "epoch": 1.38, "learning_rate": 9.359792213717107e-05, "loss": 0.0077, "step": 530840 }, { "epoch": 1.38, "learning_rate": 9.359403392079963e-05, "loss": 0.0094, "step": 530850 }, { "epoch": 1.38, "learning_rate": 9.359014570442815e-05, "loss": 0.0115, "step": 530860 }, { "epoch": 1.38, "learning_rate": 9.35862574880567e-05, "loss": 0.0099, "step": 530870 }, { "epoch": 1.38, "learning_rate": 9.358236927168522e-05, "loss": 0.011, "step": 530880 }, { "epoch": 1.38, "learning_rate": 9.357848105531377e-05, "loss": 0.0081, "step": 530890 }, { "epoch": 1.38, "learning_rate": 9.35745928389423e-05, "loss": 0.0105, "step": 530900 }, { "epoch": 1.38, "learning_rate": 9.357070462257084e-05, "loss": 0.0094, "step": 530910 }, { "epoch": 1.38, "learning_rate": 9.356681640619936e-05, "loss": 0.0077, "step": 530920 }, { "epoch": 1.38, "learning_rate": 9.35629281898279e-05, "loss": 0.0103, "step": 530930 }, { "epoch": 1.38, "learning_rate": 9.355903997345643e-05, "loss": 0.0092, "step": 530940 }, { "epoch": 1.38, "learning_rate": 9.355515175708496e-05, "loss": 0.0088, "step": 530950 }, { "epoch": 1.38, "learning_rate": 9.35512635407135e-05, "loss": 0.0105, "step": 530960 }, { "epoch": 1.38, "learning_rate": 9.354737532434203e-05, "loss": 0.0122, "step": 530970 }, { "epoch": 1.38, "learning_rate": 9.354348710797057e-05, "loss": 0.0102, "step": 530980 }, { "epoch": 1.38, "learning_rate": 9.35395988915991e-05, "loss": 0.0093, "step": 530990 }, { "epoch": 1.38, "learning_rate": 9.353571067522764e-05, "loss": 0.0123, "step": 531000 }, { "epoch": 1.38, "eval_cer": 0.8816676953998133, "eval_loss": 0.006338402628898621, "eval_runtime": 107.8828, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 531000 }, { "epoch": 1.38, "learning_rate": 9.353182245885617e-05, "loss": 0.0096, "step": 531010 }, { "epoch": 1.38, "learning_rate": 9.352793424248473e-05, "loss": 0.0123, "step": 531020 }, { "epoch": 1.38, "learning_rate": 9.352404602611325e-05, "loss": 0.0192, "step": 531030 }, { "epoch": 1.38, "learning_rate": 9.35201578097418e-05, "loss": 0.0083, "step": 531040 }, { "epoch": 1.38, "learning_rate": 9.351626959337032e-05, "loss": 0.01, "step": 531050 }, { "epoch": 1.38, "learning_rate": 9.351238137699886e-05, "loss": 0.0099, "step": 531060 }, { "epoch": 1.38, "learning_rate": 9.350849316062739e-05, "loss": 0.0096, "step": 531070 }, { "epoch": 1.38, "learning_rate": 9.350460494425593e-05, "loss": 0.0089, "step": 531080 }, { "epoch": 1.38, "learning_rate": 9.350071672788446e-05, "loss": 0.0084, "step": 531090 }, { "epoch": 1.38, "learning_rate": 9.3496828511513e-05, "loss": 0.0112, "step": 531100 }, { "epoch": 1.38, "learning_rate": 9.349294029514153e-05, "loss": 0.0114, "step": 531110 }, { "epoch": 1.38, "learning_rate": 9.348905207877007e-05, "loss": 0.0074, "step": 531120 }, { "epoch": 1.38, "learning_rate": 9.34851638623986e-05, "loss": 0.009, "step": 531130 }, { "epoch": 1.38, "learning_rate": 9.348127564602714e-05, "loss": 0.0074, "step": 531140 }, { "epoch": 1.38, "learning_rate": 9.347738742965567e-05, "loss": 0.0094, "step": 531150 }, { "epoch": 1.38, "learning_rate": 9.347349921328421e-05, "loss": 0.0117, "step": 531160 }, { "epoch": 1.38, "learning_rate": 9.346961099691274e-05, "loss": 0.008, "step": 531170 }, { "epoch": 1.38, "learning_rate": 9.34657227805413e-05, "loss": 0.0097, "step": 531180 }, { "epoch": 1.38, "learning_rate": 9.346183456416982e-05, "loss": 0.0093, "step": 531190 }, { "epoch": 1.38, "learning_rate": 9.345794634779834e-05, "loss": 0.01, "step": 531200 }, { "epoch": 1.38, "learning_rate": 9.34540581314269e-05, "loss": 0.0093, "step": 531210 }, { "epoch": 1.38, "learning_rate": 9.345016991505542e-05, "loss": 0.0086, "step": 531220 }, { "epoch": 1.38, "learning_rate": 9.344628169868396e-05, "loss": 0.011, "step": 531230 }, { "epoch": 1.38, "learning_rate": 9.344239348231249e-05, "loss": 0.0086, "step": 531240 }, { "epoch": 1.38, "learning_rate": 9.343850526594103e-05, "loss": 0.0105, "step": 531250 }, { "epoch": 1.38, "learning_rate": 9.343461704956956e-05, "loss": 0.008, "step": 531260 }, { "epoch": 1.38, "learning_rate": 9.34307288331981e-05, "loss": 0.0102, "step": 531270 }, { "epoch": 1.38, "learning_rate": 9.342684061682663e-05, "loss": 0.0087, "step": 531280 }, { "epoch": 1.38, "learning_rate": 9.342295240045517e-05, "loss": 0.0116, "step": 531290 }, { "epoch": 1.38, "learning_rate": 9.34190641840837e-05, "loss": 0.0089, "step": 531300 }, { "epoch": 1.38, "learning_rate": 9.341517596771224e-05, "loss": 0.0077, "step": 531310 }, { "epoch": 1.38, "learning_rate": 9.341128775134077e-05, "loss": 0.0083, "step": 531320 }, { "epoch": 1.38, "learning_rate": 9.340739953496931e-05, "loss": 0.0089, "step": 531330 }, { "epoch": 1.38, "learning_rate": 9.340351131859784e-05, "loss": 0.01, "step": 531340 }, { "epoch": 1.38, "learning_rate": 9.33996231022264e-05, "loss": 0.0081, "step": 531350 }, { "epoch": 1.38, "learning_rate": 9.339573488585491e-05, "loss": 0.0095, "step": 531360 }, { "epoch": 1.38, "learning_rate": 9.339184666948347e-05, "loss": 0.0078, "step": 531370 }, { "epoch": 1.38, "learning_rate": 9.3387958453112e-05, "loss": 0.0077, "step": 531380 }, { "epoch": 1.38, "learning_rate": 9.338407023674054e-05, "loss": 0.0108, "step": 531390 }, { "epoch": 1.38, "learning_rate": 9.338018202036906e-05, "loss": 0.0094, "step": 531400 }, { "epoch": 1.38, "learning_rate": 9.33762938039976e-05, "loss": 0.0102, "step": 531410 }, { "epoch": 1.38, "learning_rate": 9.337240558762613e-05, "loss": 0.0084, "step": 531420 }, { "epoch": 1.38, "learning_rate": 9.336851737125468e-05, "loss": 0.0095, "step": 531430 }, { "epoch": 1.38, "learning_rate": 9.33646291548832e-05, "loss": 0.0103, "step": 531440 }, { "epoch": 1.38, "learning_rate": 9.336074093851173e-05, "loss": 0.0109, "step": 531450 }, { "epoch": 1.38, "learning_rate": 9.335685272214027e-05, "loss": 0.0088, "step": 531460 }, { "epoch": 1.38, "learning_rate": 9.33529645057688e-05, "loss": 0.0091, "step": 531470 }, { "epoch": 1.38, "learning_rate": 9.334907628939734e-05, "loss": 0.0088, "step": 531480 }, { "epoch": 1.38, "learning_rate": 9.334518807302587e-05, "loss": 0.0095, "step": 531490 }, { "epoch": 1.38, "learning_rate": 9.334129985665441e-05, "loss": 0.0102, "step": 531500 }, { "epoch": 1.38, "learning_rate": 9.333741164028294e-05, "loss": 0.0106, "step": 531510 }, { "epoch": 1.38, "learning_rate": 9.333352342391148e-05, "loss": 0.0091, "step": 531520 }, { "epoch": 1.38, "learning_rate": 9.332963520754001e-05, "loss": 0.0077, "step": 531530 }, { "epoch": 1.38, "learning_rate": 9.332574699116857e-05, "loss": 0.0114, "step": 531540 }, { "epoch": 1.38, "learning_rate": 9.33218587747971e-05, "loss": 0.0127, "step": 531550 }, { "epoch": 1.38, "learning_rate": 9.331797055842564e-05, "loss": 0.0088, "step": 531560 }, { "epoch": 1.38, "learning_rate": 9.331408234205416e-05, "loss": 0.0107, "step": 531570 }, { "epoch": 1.38, "learning_rate": 9.33101941256827e-05, "loss": 0.0103, "step": 531580 }, { "epoch": 1.38, "learning_rate": 9.330630590931123e-05, "loss": 0.0093, "step": 531590 }, { "epoch": 1.38, "learning_rate": 9.330241769293977e-05, "loss": 0.0081, "step": 531600 }, { "epoch": 1.38, "learning_rate": 9.32985294765683e-05, "loss": 0.0089, "step": 531610 }, { "epoch": 1.38, "learning_rate": 9.329464126019684e-05, "loss": 0.008, "step": 531620 }, { "epoch": 1.38, "learning_rate": 9.329075304382537e-05, "loss": 0.0091, "step": 531630 }, { "epoch": 1.38, "learning_rate": 9.328686482745391e-05, "loss": 0.011, "step": 531640 }, { "epoch": 1.38, "learning_rate": 9.328297661108244e-05, "loss": 0.0132, "step": 531650 }, { "epoch": 1.38, "learning_rate": 9.327908839471098e-05, "loss": 0.0093, "step": 531660 }, { "epoch": 1.38, "learning_rate": 9.327520017833951e-05, "loss": 0.0076, "step": 531670 }, { "epoch": 1.38, "learning_rate": 9.327131196196805e-05, "loss": 0.0112, "step": 531680 }, { "epoch": 1.38, "learning_rate": 9.326742374559658e-05, "loss": 0.0152, "step": 531690 }, { "epoch": 1.38, "learning_rate": 9.326353552922511e-05, "loss": 0.0104, "step": 531700 }, { "epoch": 1.38, "learning_rate": 9.325964731285366e-05, "loss": 0.0093, "step": 531710 }, { "epoch": 1.38, "learning_rate": 9.325575909648218e-05, "loss": 0.0111, "step": 531720 }, { "epoch": 1.38, "learning_rate": 9.325187088011073e-05, "loss": 0.0075, "step": 531730 }, { "epoch": 1.38, "learning_rate": 9.324798266373926e-05, "loss": 0.007, "step": 531740 }, { "epoch": 1.38, "learning_rate": 9.32440944473678e-05, "loss": 0.0114, "step": 531750 }, { "epoch": 1.38, "learning_rate": 9.324020623099633e-05, "loss": 0.0088, "step": 531760 }, { "epoch": 1.38, "learning_rate": 9.323631801462487e-05, "loss": 0.0086, "step": 531770 }, { "epoch": 1.38, "learning_rate": 9.32324297982534e-05, "loss": 0.0091, "step": 531780 }, { "epoch": 1.38, "learning_rate": 9.322854158188194e-05, "loss": 0.0105, "step": 531790 }, { "epoch": 1.38, "learning_rate": 9.322465336551047e-05, "loss": 0.0098, "step": 531800 }, { "epoch": 1.38, "learning_rate": 9.322076514913901e-05, "loss": 0.0093, "step": 531810 }, { "epoch": 1.38, "learning_rate": 9.321687693276754e-05, "loss": 0.0101, "step": 531820 }, { "epoch": 1.38, "learning_rate": 9.321298871639608e-05, "loss": 0.0068, "step": 531830 }, { "epoch": 1.38, "learning_rate": 9.320910050002461e-05, "loss": 0.0081, "step": 531840 }, { "epoch": 1.38, "learning_rate": 9.320521228365315e-05, "loss": 0.0114, "step": 531850 }, { "epoch": 1.38, "learning_rate": 9.320132406728168e-05, "loss": 0.0113, "step": 531860 }, { "epoch": 1.38, "learning_rate": 9.319743585091022e-05, "loss": 0.0092, "step": 531870 }, { "epoch": 1.38, "learning_rate": 9.319354763453875e-05, "loss": 0.0083, "step": 531880 }, { "epoch": 1.38, "learning_rate": 9.31896594181673e-05, "loss": 0.0088, "step": 531890 }, { "epoch": 1.38, "learning_rate": 9.318577120179583e-05, "loss": 0.0106, "step": 531900 }, { "epoch": 1.38, "learning_rate": 9.318188298542438e-05, "loss": 0.0104, "step": 531910 }, { "epoch": 1.38, "learning_rate": 9.31779947690529e-05, "loss": 0.0117, "step": 531920 }, { "epoch": 1.38, "learning_rate": 9.317410655268145e-05, "loss": 0.0125, "step": 531930 }, { "epoch": 1.38, "learning_rate": 9.317021833630997e-05, "loss": 0.011, "step": 531940 }, { "epoch": 1.38, "learning_rate": 9.31663301199385e-05, "loss": 0.0088, "step": 531950 }, { "epoch": 1.38, "learning_rate": 9.316244190356704e-05, "loss": 0.0088, "step": 531960 }, { "epoch": 1.38, "learning_rate": 9.315855368719557e-05, "loss": 0.0078, "step": 531970 }, { "epoch": 1.38, "learning_rate": 9.315466547082411e-05, "loss": 0.0075, "step": 531980 }, { "epoch": 1.38, "learning_rate": 9.315077725445264e-05, "loss": 0.0095, "step": 531990 }, { "epoch": 1.38, "learning_rate": 9.314688903808118e-05, "loss": 0.0085, "step": 532000 }, { "epoch": 1.38, "eval_cer": 0.8816690950367475, "eval_loss": 0.0063028521835803986, "eval_runtime": 108.1012, "eval_samples_per_second": 18.501, "eval_steps_per_second": 4.625, "step": 532000 }, { "epoch": 1.38, "learning_rate": 9.314300082170971e-05, "loss": 0.006, "step": 532010 }, { "epoch": 1.38, "learning_rate": 9.313911260533825e-05, "loss": 0.0104, "step": 532020 }, { "epoch": 1.38, "learning_rate": 9.313522438896678e-05, "loss": 0.0101, "step": 532030 }, { "epoch": 1.38, "learning_rate": 9.313133617259532e-05, "loss": 0.0079, "step": 532040 }, { "epoch": 1.38, "learning_rate": 9.312744795622385e-05, "loss": 0.012, "step": 532050 }, { "epoch": 1.38, "learning_rate": 9.31235597398524e-05, "loss": 0.0101, "step": 532060 }, { "epoch": 1.38, "learning_rate": 9.311967152348093e-05, "loss": 0.0085, "step": 532070 }, { "epoch": 1.38, "learning_rate": 9.311578330710947e-05, "loss": 0.0106, "step": 532080 }, { "epoch": 1.38, "learning_rate": 9.3111895090738e-05, "loss": 0.0092, "step": 532090 }, { "epoch": 1.38, "learning_rate": 9.310800687436654e-05, "loss": 0.0094, "step": 532100 }, { "epoch": 1.38, "learning_rate": 9.310411865799507e-05, "loss": 0.0074, "step": 532110 }, { "epoch": 1.38, "learning_rate": 9.310023044162361e-05, "loss": 0.0072, "step": 532120 }, { "epoch": 1.38, "learning_rate": 9.309634222525214e-05, "loss": 0.0132, "step": 532130 }, { "epoch": 1.38, "learning_rate": 9.309245400888068e-05, "loss": 0.0091, "step": 532140 }, { "epoch": 1.38, "learning_rate": 9.308856579250921e-05, "loss": 0.0105, "step": 532150 }, { "epoch": 1.38, "learning_rate": 9.308467757613775e-05, "loss": 0.0105, "step": 532160 }, { "epoch": 1.38, "learning_rate": 9.308078935976628e-05, "loss": 0.0111, "step": 532170 }, { "epoch": 1.38, "learning_rate": 9.307690114339482e-05, "loss": 0.0106, "step": 532180 }, { "epoch": 1.38, "learning_rate": 9.307301292702335e-05, "loss": 0.0111, "step": 532190 }, { "epoch": 1.38, "learning_rate": 9.306912471065188e-05, "loss": 0.0079, "step": 532200 }, { "epoch": 1.38, "learning_rate": 9.306523649428042e-05, "loss": 0.0081, "step": 532210 }, { "epoch": 1.38, "learning_rate": 9.306134827790895e-05, "loss": 0.0102, "step": 532220 }, { "epoch": 1.38, "learning_rate": 9.305746006153749e-05, "loss": 0.0115, "step": 532230 }, { "epoch": 1.38, "learning_rate": 9.305357184516602e-05, "loss": 0.0118, "step": 532240 }, { "epoch": 1.38, "learning_rate": 9.304968362879457e-05, "loss": 0.0117, "step": 532250 }, { "epoch": 1.38, "learning_rate": 9.30457954124231e-05, "loss": 0.011, "step": 532260 }, { "epoch": 1.38, "learning_rate": 9.304190719605164e-05, "loss": 0.0129, "step": 532270 }, { "epoch": 1.38, "learning_rate": 9.303801897968017e-05, "loss": 0.0127, "step": 532280 }, { "epoch": 1.38, "learning_rate": 9.303413076330871e-05, "loss": 0.0085, "step": 532290 }, { "epoch": 1.38, "learning_rate": 9.303024254693724e-05, "loss": 0.011, "step": 532300 }, { "epoch": 1.38, "learning_rate": 9.302635433056578e-05, "loss": 0.0074, "step": 532310 }, { "epoch": 1.38, "learning_rate": 9.302246611419431e-05, "loss": 0.0145, "step": 532320 }, { "epoch": 1.38, "learning_rate": 9.301857789782285e-05, "loss": 0.0108, "step": 532330 }, { "epoch": 1.38, "learning_rate": 9.301468968145138e-05, "loss": 0.0083, "step": 532340 }, { "epoch": 1.38, "learning_rate": 9.301080146507992e-05, "loss": 0.0097, "step": 532350 }, { "epoch": 1.38, "learning_rate": 9.300691324870845e-05, "loss": 0.011, "step": 532360 }, { "epoch": 1.38, "learning_rate": 9.300302503233699e-05, "loss": 0.0083, "step": 532370 }, { "epoch": 1.38, "learning_rate": 9.299913681596552e-05, "loss": 0.0111, "step": 532380 }, { "epoch": 1.38, "learning_rate": 9.299524859959406e-05, "loss": 0.0095, "step": 532390 }, { "epoch": 1.38, "learning_rate": 9.299136038322259e-05, "loss": 0.0108, "step": 532400 }, { "epoch": 1.38, "learning_rate": 9.298747216685115e-05, "loss": 0.009, "step": 532410 }, { "epoch": 1.38, "learning_rate": 9.298358395047967e-05, "loss": 0.008, "step": 532420 }, { "epoch": 1.38, "learning_rate": 9.297969573410822e-05, "loss": 0.0058, "step": 532430 }, { "epoch": 1.38, "learning_rate": 9.297580751773674e-05, "loss": 0.0092, "step": 532440 }, { "epoch": 1.38, "learning_rate": 9.297191930136527e-05, "loss": 0.0077, "step": 532450 }, { "epoch": 1.38, "learning_rate": 9.296803108499381e-05, "loss": 0.0096, "step": 532460 }, { "epoch": 1.38, "learning_rate": 9.296414286862234e-05, "loss": 0.0114, "step": 532470 }, { "epoch": 1.38, "learning_rate": 9.296025465225088e-05, "loss": 0.0076, "step": 532480 }, { "epoch": 1.38, "learning_rate": 9.295636643587941e-05, "loss": 0.0116, "step": 532490 }, { "epoch": 1.38, "learning_rate": 9.295247821950795e-05, "loss": 0.0108, "step": 532500 }, { "epoch": 1.38, "learning_rate": 9.294859000313648e-05, "loss": 0.0096, "step": 532510 }, { "epoch": 1.38, "learning_rate": 9.294470178676502e-05, "loss": 0.0098, "step": 532520 }, { "epoch": 1.38, "learning_rate": 9.294081357039355e-05, "loss": 0.008, "step": 532530 }, { "epoch": 1.38, "learning_rate": 9.293692535402209e-05, "loss": 0.0093, "step": 532540 }, { "epoch": 1.38, "learning_rate": 9.293303713765062e-05, "loss": 0.0084, "step": 532550 }, { "epoch": 1.38, "learning_rate": 9.292914892127916e-05, "loss": 0.0092, "step": 532560 }, { "epoch": 1.38, "learning_rate": 9.292526070490769e-05, "loss": 0.0079, "step": 532570 }, { "epoch": 1.38, "learning_rate": 9.292137248853625e-05, "loss": 0.0101, "step": 532580 }, { "epoch": 1.38, "learning_rate": 9.291748427216476e-05, "loss": 0.0093, "step": 532590 }, { "epoch": 1.38, "learning_rate": 9.291359605579331e-05, "loss": 0.011, "step": 532600 }, { "epoch": 1.38, "learning_rate": 9.290970783942184e-05, "loss": 0.0108, "step": 532610 }, { "epoch": 1.38, "learning_rate": 9.290581962305038e-05, "loss": 0.0093, "step": 532620 }, { "epoch": 1.38, "learning_rate": 9.290193140667891e-05, "loss": 0.0091, "step": 532630 }, { "epoch": 1.38, "learning_rate": 9.289804319030745e-05, "loss": 0.0087, "step": 532640 }, { "epoch": 1.38, "learning_rate": 9.289415497393598e-05, "loss": 0.0098, "step": 532650 }, { "epoch": 1.38, "learning_rate": 9.289026675756452e-05, "loss": 0.0072, "step": 532660 }, { "epoch": 1.38, "learning_rate": 9.288637854119305e-05, "loss": 0.0109, "step": 532670 }, { "epoch": 1.38, "learning_rate": 9.28824903248216e-05, "loss": 0.0113, "step": 532680 }, { "epoch": 1.38, "learning_rate": 9.287860210845012e-05, "loss": 0.0136, "step": 532690 }, { "epoch": 1.38, "learning_rate": 9.287471389207865e-05, "loss": 0.0101, "step": 532700 }, { "epoch": 1.38, "learning_rate": 9.287082567570719e-05, "loss": 0.0073, "step": 532710 }, { "epoch": 1.38, "learning_rate": 9.286693745933572e-05, "loss": 0.0101, "step": 532720 }, { "epoch": 1.38, "learning_rate": 9.286304924296426e-05, "loss": 0.0206, "step": 532730 }, { "epoch": 1.38, "learning_rate": 9.285916102659279e-05, "loss": 0.0087, "step": 532740 }, { "epoch": 1.38, "learning_rate": 9.285527281022133e-05, "loss": 0.0091, "step": 532750 }, { "epoch": 1.38, "learning_rate": 9.285138459384986e-05, "loss": 0.0085, "step": 532760 }, { "epoch": 1.38, "learning_rate": 9.284749637747841e-05, "loss": 0.01, "step": 532770 }, { "epoch": 1.38, "learning_rate": 9.284360816110694e-05, "loss": 0.0097, "step": 532780 }, { "epoch": 1.38, "learning_rate": 9.283971994473548e-05, "loss": 0.009, "step": 532790 }, { "epoch": 1.38, "learning_rate": 9.283583172836401e-05, "loss": 0.0101, "step": 532800 }, { "epoch": 1.38, "learning_rate": 9.283194351199255e-05, "loss": 0.0114, "step": 532810 }, { "epoch": 1.38, "learning_rate": 9.282805529562108e-05, "loss": 0.0086, "step": 532820 }, { "epoch": 1.38, "learning_rate": 9.282416707924962e-05, "loss": 0.0148, "step": 532830 }, { "epoch": 1.38, "learning_rate": 9.282027886287815e-05, "loss": 0.0085, "step": 532840 }, { "epoch": 1.38, "learning_rate": 9.281639064650669e-05, "loss": 0.0074, "step": 532850 }, { "epoch": 1.38, "learning_rate": 9.281250243013522e-05, "loss": 0.0102, "step": 532860 }, { "epoch": 1.38, "learning_rate": 9.280861421376376e-05, "loss": 0.012, "step": 532870 }, { "epoch": 1.38, "learning_rate": 9.280472599739229e-05, "loss": 0.0076, "step": 532880 }, { "epoch": 1.38, "learning_rate": 9.280083778102083e-05, "loss": 0.0132, "step": 532890 }, { "epoch": 1.38, "learning_rate": 9.279694956464936e-05, "loss": 0.0095, "step": 532900 }, { "epoch": 1.38, "learning_rate": 9.27930613482779e-05, "loss": 0.0084, "step": 532910 }, { "epoch": 1.38, "learning_rate": 9.278917313190643e-05, "loss": 0.0101, "step": 532920 }, { "epoch": 1.38, "learning_rate": 9.278528491553499e-05, "loss": 0.0089, "step": 532930 }, { "epoch": 1.38, "learning_rate": 9.278139669916351e-05, "loss": 0.0083, "step": 532940 }, { "epoch": 1.38, "learning_rate": 9.277750848279203e-05, "loss": 0.0087, "step": 532950 }, { "epoch": 1.38, "learning_rate": 9.277362026642058e-05, "loss": 0.011, "step": 532960 }, { "epoch": 1.38, "learning_rate": 9.276973205004911e-05, "loss": 0.009, "step": 532970 }, { "epoch": 1.38, "learning_rate": 9.276584383367765e-05, "loss": 0.014, "step": 532980 }, { "epoch": 1.38, "learning_rate": 9.276195561730618e-05, "loss": 0.0064, "step": 532990 }, { "epoch": 1.38, "learning_rate": 9.275806740093472e-05, "loss": 0.0092, "step": 533000 }, { "epoch": 1.38, "eval_cer": 0.8816914892276944, "eval_loss": 0.006268115248531103, "eval_runtime": 107.8458, "eval_samples_per_second": 18.545, "eval_steps_per_second": 4.636, "step": 533000 }, { "epoch": 1.38, "learning_rate": 9.275417918456325e-05, "loss": 0.0076, "step": 533010 }, { "epoch": 1.38, "learning_rate": 9.275029096819179e-05, "loss": 0.0086, "step": 533020 }, { "epoch": 1.38, "learning_rate": 9.274640275182032e-05, "loss": 0.0094, "step": 533030 }, { "epoch": 1.38, "learning_rate": 9.274251453544886e-05, "loss": 0.0094, "step": 533040 }, { "epoch": 1.38, "learning_rate": 9.273862631907739e-05, "loss": 0.0104, "step": 533050 }, { "epoch": 1.38, "learning_rate": 9.273473810270593e-05, "loss": 0.0095, "step": 533060 }, { "epoch": 1.38, "learning_rate": 9.273084988633446e-05, "loss": 0.0086, "step": 533070 }, { "epoch": 1.38, "learning_rate": 9.2726961669963e-05, "loss": 0.0093, "step": 533080 }, { "epoch": 1.38, "learning_rate": 9.272307345359153e-05, "loss": 0.0094, "step": 533090 }, { "epoch": 1.38, "learning_rate": 9.271918523722009e-05, "loss": 0.0094, "step": 533100 }, { "epoch": 1.38, "learning_rate": 9.27152970208486e-05, "loss": 0.0106, "step": 533110 }, { "epoch": 1.38, "learning_rate": 9.271140880447715e-05, "loss": 0.0081, "step": 533120 }, { "epoch": 1.38, "learning_rate": 9.270752058810568e-05, "loss": 0.0092, "step": 533130 }, { "epoch": 1.38, "learning_rate": 9.270363237173422e-05, "loss": 0.0116, "step": 533140 }, { "epoch": 1.38, "learning_rate": 9.269974415536275e-05, "loss": 0.0119, "step": 533150 }, { "epoch": 1.38, "learning_rate": 9.26958559389913e-05, "loss": 0.0085, "step": 533160 }, { "epoch": 1.38, "learning_rate": 9.269196772261982e-05, "loss": 0.011, "step": 533170 }, { "epoch": 1.38, "learning_rate": 9.268807950624836e-05, "loss": 0.0108, "step": 533180 }, { "epoch": 1.38, "learning_rate": 9.268419128987689e-05, "loss": 0.0092, "step": 533190 }, { "epoch": 1.38, "learning_rate": 9.268030307350542e-05, "loss": 0.014, "step": 533200 }, { "epoch": 1.38, "learning_rate": 9.267641485713396e-05, "loss": 0.0085, "step": 533210 }, { "epoch": 1.38, "learning_rate": 9.267252664076249e-05, "loss": 0.0106, "step": 533220 }, { "epoch": 1.38, "learning_rate": 9.266863842439103e-05, "loss": 0.0084, "step": 533230 }, { "epoch": 1.38, "learning_rate": 9.266475020801956e-05, "loss": 0.0089, "step": 533240 }, { "epoch": 1.38, "learning_rate": 9.26608619916481e-05, "loss": 0.009, "step": 533250 }, { "epoch": 1.38, "learning_rate": 9.265697377527663e-05, "loss": 0.0107, "step": 533260 }, { "epoch": 1.38, "learning_rate": 9.265308555890517e-05, "loss": 0.0143, "step": 533270 }, { "epoch": 1.38, "learning_rate": 9.26491973425337e-05, "loss": 0.0078, "step": 533280 }, { "epoch": 1.38, "learning_rate": 9.264530912616225e-05, "loss": 0.0093, "step": 533290 }, { "epoch": 1.38, "learning_rate": 9.264142090979078e-05, "loss": 0.0078, "step": 533300 }, { "epoch": 1.38, "learning_rate": 9.263753269341932e-05, "loss": 0.0093, "step": 533310 }, { "epoch": 1.38, "learning_rate": 9.263364447704785e-05, "loss": 0.0084, "step": 533320 }, { "epoch": 1.38, "learning_rate": 9.26297562606764e-05, "loss": 0.0101, "step": 533330 }, { "epoch": 1.38, "learning_rate": 9.262586804430492e-05, "loss": 0.0075, "step": 533340 }, { "epoch": 1.38, "learning_rate": 9.262197982793346e-05, "loss": 0.0135, "step": 533350 }, { "epoch": 1.38, "learning_rate": 9.261809161156199e-05, "loss": 0.009, "step": 533360 }, { "epoch": 1.38, "learning_rate": 9.261420339519053e-05, "loss": 0.0109, "step": 533370 }, { "epoch": 1.38, "learning_rate": 9.261031517881906e-05, "loss": 0.0121, "step": 533380 }, { "epoch": 1.38, "learning_rate": 9.26064269624476e-05, "loss": 0.0133, "step": 533390 }, { "epoch": 1.38, "learning_rate": 9.260253874607613e-05, "loss": 0.0094, "step": 533400 }, { "epoch": 1.38, "learning_rate": 9.259865052970467e-05, "loss": 0.0137, "step": 533410 }, { "epoch": 1.38, "learning_rate": 9.25947623133332e-05, "loss": 0.0117, "step": 533420 }, { "epoch": 1.38, "learning_rate": 9.259087409696173e-05, "loss": 0.0082, "step": 533430 }, { "epoch": 1.38, "learning_rate": 9.258698588059027e-05, "loss": 0.0085, "step": 533440 }, { "epoch": 1.38, "learning_rate": 9.25830976642188e-05, "loss": 0.0074, "step": 533450 }, { "epoch": 1.38, "learning_rate": 9.257920944784734e-05, "loss": 0.01, "step": 533460 }, { "epoch": 1.38, "learning_rate": 9.257532123147587e-05, "loss": 0.01, "step": 533470 }, { "epoch": 1.38, "learning_rate": 9.257143301510442e-05, "loss": 0.0123, "step": 533480 }, { "epoch": 1.38, "learning_rate": 9.256754479873295e-05, "loss": 0.0103, "step": 533490 }, { "epoch": 1.38, "learning_rate": 9.256365658236149e-05, "loss": 0.0074, "step": 533500 }, { "epoch": 1.38, "learning_rate": 9.255976836599002e-05, "loss": 0.0099, "step": 533510 }, { "epoch": 1.38, "learning_rate": 9.255588014961856e-05, "loss": 0.0085, "step": 533520 }, { "epoch": 1.38, "learning_rate": 9.255199193324709e-05, "loss": 0.0115, "step": 533530 }, { "epoch": 1.38, "learning_rate": 9.254810371687563e-05, "loss": 0.0148, "step": 533540 }, { "epoch": 1.38, "learning_rate": 9.254421550050416e-05, "loss": 0.0114, "step": 533550 }, { "epoch": 1.38, "learning_rate": 9.25403272841327e-05, "loss": 0.011, "step": 533560 }, { "epoch": 1.38, "learning_rate": 9.253643906776123e-05, "loss": 0.0094, "step": 533570 }, { "epoch": 1.38, "learning_rate": 9.253255085138977e-05, "loss": 0.0086, "step": 533580 }, { "epoch": 1.38, "learning_rate": 9.25286626350183e-05, "loss": 0.0078, "step": 533590 }, { "epoch": 1.38, "learning_rate": 9.252477441864684e-05, "loss": 0.0126, "step": 533600 }, { "epoch": 1.38, "learning_rate": 9.252088620227537e-05, "loss": 0.0116, "step": 533610 }, { "epoch": 1.38, "learning_rate": 9.251699798590391e-05, "loss": 0.0099, "step": 533620 }, { "epoch": 1.38, "learning_rate": 9.251310976953244e-05, "loss": 0.0118, "step": 533630 }, { "epoch": 1.38, "learning_rate": 9.2509221553161e-05, "loss": 0.01, "step": 533640 }, { "epoch": 1.38, "learning_rate": 9.250533333678952e-05, "loss": 0.0082, "step": 533650 }, { "epoch": 1.38, "learning_rate": 9.250144512041806e-05, "loss": 0.0125, "step": 533660 }, { "epoch": 1.38, "learning_rate": 9.249755690404659e-05, "loss": 0.0112, "step": 533670 }, { "epoch": 1.38, "learning_rate": 9.249366868767512e-05, "loss": 0.0077, "step": 533680 }, { "epoch": 1.38, "learning_rate": 9.248978047130366e-05, "loss": 0.0098, "step": 533690 }, { "epoch": 1.38, "learning_rate": 9.248589225493219e-05, "loss": 0.009, "step": 533700 }, { "epoch": 1.38, "learning_rate": 9.248200403856073e-05, "loss": 0.0109, "step": 533710 }, { "epoch": 1.38, "learning_rate": 9.247811582218926e-05, "loss": 0.009, "step": 533720 }, { "epoch": 1.38, "learning_rate": 9.24742276058178e-05, "loss": 0.0104, "step": 533730 }, { "epoch": 1.38, "learning_rate": 9.247033938944633e-05, "loss": 0.0071, "step": 533740 }, { "epoch": 1.38, "learning_rate": 9.246645117307487e-05, "loss": 0.0093, "step": 533750 }, { "epoch": 1.38, "learning_rate": 9.24625629567034e-05, "loss": 0.0079, "step": 533760 }, { "epoch": 1.38, "learning_rate": 9.245867474033194e-05, "loss": 0.0093, "step": 533770 }, { "epoch": 1.38, "learning_rate": 9.245478652396047e-05, "loss": 0.0087, "step": 533780 }, { "epoch": 1.38, "learning_rate": 9.245089830758901e-05, "loss": 0.0095, "step": 533790 }, { "epoch": 1.38, "learning_rate": 9.244701009121754e-05, "loss": 0.008, "step": 533800 }, { "epoch": 1.38, "learning_rate": 9.24431218748461e-05, "loss": 0.0139, "step": 533810 }, { "epoch": 1.38, "learning_rate": 9.243923365847461e-05, "loss": 0.0108, "step": 533820 }, { "epoch": 1.38, "learning_rate": 9.243534544210316e-05, "loss": 0.0082, "step": 533830 }, { "epoch": 1.38, "learning_rate": 9.243145722573169e-05, "loss": 0.0123, "step": 533840 }, { "epoch": 1.38, "learning_rate": 9.242756900936023e-05, "loss": 0.0107, "step": 533850 }, { "epoch": 1.38, "learning_rate": 9.242368079298876e-05, "loss": 0.0084, "step": 533860 }, { "epoch": 1.38, "learning_rate": 9.24197925766173e-05, "loss": 0.0119, "step": 533870 }, { "epoch": 1.38, "learning_rate": 9.241590436024583e-05, "loss": 0.0095, "step": 533880 }, { "epoch": 1.38, "learning_rate": 9.241201614387437e-05, "loss": 0.0094, "step": 533890 }, { "epoch": 1.38, "learning_rate": 9.24081279275029e-05, "loss": 0.0086, "step": 533900 }, { "epoch": 1.38, "learning_rate": 9.240423971113144e-05, "loss": 0.0082, "step": 533910 }, { "epoch": 1.38, "learning_rate": 9.240035149475997e-05, "loss": 0.0087, "step": 533920 }, { "epoch": 1.38, "learning_rate": 9.23964632783885e-05, "loss": 0.0102, "step": 533930 }, { "epoch": 1.38, "learning_rate": 9.239257506201704e-05, "loss": 0.0103, "step": 533940 }, { "epoch": 1.38, "learning_rate": 9.238868684564557e-05, "loss": 0.0096, "step": 533950 }, { "epoch": 1.38, "learning_rate": 9.238479862927411e-05, "loss": 0.0093, "step": 533960 }, { "epoch": 1.38, "learning_rate": 9.238091041290264e-05, "loss": 0.0111, "step": 533970 }, { "epoch": 1.38, "learning_rate": 9.237702219653118e-05, "loss": 0.0109, "step": 533980 }, { "epoch": 1.38, "learning_rate": 9.237313398015971e-05, "loss": 0.0128, "step": 533990 }, { "epoch": 1.38, "learning_rate": 9.236924576378826e-05, "loss": 0.0091, "step": 534000 }, { "epoch": 1.38, "eval_cer": 0.8816900895907601, "eval_loss": 0.0059846206568181515, "eval_runtime": 107.6906, "eval_samples_per_second": 18.572, "eval_steps_per_second": 4.643, "step": 534000 }, { "epoch": 1.38, "learning_rate": 9.236535754741679e-05, "loss": 0.0112, "step": 534010 }, { "epoch": 1.38, "learning_rate": 9.236146933104533e-05, "loss": 0.0117, "step": 534020 }, { "epoch": 1.38, "learning_rate": 9.235758111467386e-05, "loss": 0.0094, "step": 534030 }, { "epoch": 1.38, "learning_rate": 9.23536928983024e-05, "loss": 0.0092, "step": 534040 }, { "epoch": 1.38, "learning_rate": 9.234980468193093e-05, "loss": 0.0064, "step": 534050 }, { "epoch": 1.38, "learning_rate": 9.234591646555947e-05, "loss": 0.0108, "step": 534060 }, { "epoch": 1.38, "learning_rate": 9.2342028249188e-05, "loss": 0.008, "step": 534070 }, { "epoch": 1.38, "learning_rate": 9.233814003281654e-05, "loss": 0.0117, "step": 534080 }, { "epoch": 1.38, "learning_rate": 9.233425181644507e-05, "loss": 0.0069, "step": 534090 }, { "epoch": 1.38, "learning_rate": 9.233036360007361e-05, "loss": 0.0096, "step": 534100 }, { "epoch": 1.38, "learning_rate": 9.232647538370214e-05, "loss": 0.0091, "step": 534110 }, { "epoch": 1.38, "learning_rate": 9.232258716733068e-05, "loss": 0.0097, "step": 534120 }, { "epoch": 1.38, "learning_rate": 9.231869895095921e-05, "loss": 0.0107, "step": 534130 }, { "epoch": 1.38, "learning_rate": 9.231481073458775e-05, "loss": 0.0108, "step": 534140 }, { "epoch": 1.38, "learning_rate": 9.231092251821628e-05, "loss": 0.0099, "step": 534150 }, { "epoch": 1.38, "learning_rate": 9.230703430184483e-05, "loss": 0.0106, "step": 534160 }, { "epoch": 1.38, "learning_rate": 9.230314608547336e-05, "loss": 0.0092, "step": 534170 }, { "epoch": 1.38, "learning_rate": 9.229925786910188e-05, "loss": 0.0139, "step": 534180 }, { "epoch": 1.38, "learning_rate": 9.229536965273043e-05, "loss": 0.0089, "step": 534190 }, { "epoch": 1.38, "learning_rate": 9.229148143635896e-05, "loss": 0.0088, "step": 534200 }, { "epoch": 1.38, "learning_rate": 9.22875932199875e-05, "loss": 0.0105, "step": 534210 }, { "epoch": 1.38, "learning_rate": 9.228370500361603e-05, "loss": 0.0095, "step": 534220 }, { "epoch": 1.38, "learning_rate": 9.227981678724457e-05, "loss": 0.0093, "step": 534230 }, { "epoch": 1.38, "learning_rate": 9.22759285708731e-05, "loss": 0.0088, "step": 534240 }, { "epoch": 1.38, "learning_rate": 9.227204035450164e-05, "loss": 0.0094, "step": 534250 }, { "epoch": 1.38, "learning_rate": 9.226815213813017e-05, "loss": 0.0102, "step": 534260 }, { "epoch": 1.38, "learning_rate": 9.226426392175871e-05, "loss": 0.0117, "step": 534270 }, { "epoch": 1.38, "learning_rate": 9.226037570538724e-05, "loss": 0.0081, "step": 534280 }, { "epoch": 1.38, "learning_rate": 9.225648748901578e-05, "loss": 0.0098, "step": 534290 }, { "epoch": 1.38, "learning_rate": 9.225259927264431e-05, "loss": 0.0076, "step": 534300 }, { "epoch": 1.39, "learning_rate": 9.224871105627285e-05, "loss": 0.0084, "step": 534310 }, { "epoch": 1.39, "learning_rate": 9.224482283990138e-05, "loss": 0.0114, "step": 534320 }, { "epoch": 1.39, "learning_rate": 9.224093462352993e-05, "loss": 0.0081, "step": 534330 }, { "epoch": 1.39, "learning_rate": 9.223704640715845e-05, "loss": 0.0102, "step": 534340 }, { "epoch": 1.39, "learning_rate": 9.2233158190787e-05, "loss": 0.0085, "step": 534350 }, { "epoch": 1.39, "learning_rate": 9.222926997441553e-05, "loss": 0.0099, "step": 534360 }, { "epoch": 1.39, "learning_rate": 9.222538175804407e-05, "loss": 0.0081, "step": 534370 }, { "epoch": 1.39, "learning_rate": 9.22214935416726e-05, "loss": 0.0111, "step": 534380 }, { "epoch": 1.39, "learning_rate": 9.221760532530114e-05, "loss": 0.0101, "step": 534390 }, { "epoch": 1.39, "learning_rate": 9.221371710892967e-05, "loss": 0.0121, "step": 534400 }, { "epoch": 1.39, "learning_rate": 9.220982889255821e-05, "loss": 0.01, "step": 534410 }, { "epoch": 1.39, "learning_rate": 9.220594067618674e-05, "loss": 0.0126, "step": 534420 }, { "epoch": 1.39, "learning_rate": 9.220205245981527e-05, "loss": 0.0106, "step": 534430 }, { "epoch": 1.39, "learning_rate": 9.219816424344381e-05, "loss": 0.0082, "step": 534440 }, { "epoch": 1.39, "learning_rate": 9.219427602707234e-05, "loss": 0.0093, "step": 534450 }, { "epoch": 1.39, "learning_rate": 9.219038781070088e-05, "loss": 0.0099, "step": 534460 }, { "epoch": 1.39, "learning_rate": 9.218649959432941e-05, "loss": 0.0075, "step": 534470 }, { "epoch": 1.39, "learning_rate": 9.218261137795795e-05, "loss": 0.0102, "step": 534480 }, { "epoch": 1.39, "learning_rate": 9.217872316158648e-05, "loss": 0.0101, "step": 534490 }, { "epoch": 1.39, "learning_rate": 9.217483494521502e-05, "loss": 0.0102, "step": 534500 }, { "epoch": 1.39, "learning_rate": 9.217094672884355e-05, "loss": 0.0082, "step": 534510 }, { "epoch": 1.39, "learning_rate": 9.21670585124721e-05, "loss": 0.0091, "step": 534520 }, { "epoch": 1.39, "learning_rate": 9.216317029610063e-05, "loss": 0.0092, "step": 534530 }, { "epoch": 1.39, "learning_rate": 9.215928207972917e-05, "loss": 0.0092, "step": 534540 }, { "epoch": 1.39, "learning_rate": 9.21553938633577e-05, "loss": 0.0093, "step": 534550 }, { "epoch": 1.39, "learning_rate": 9.215150564698624e-05, "loss": 0.0106, "step": 534560 }, { "epoch": 1.39, "learning_rate": 9.214761743061477e-05, "loss": 0.0079, "step": 534570 }, { "epoch": 1.39, "learning_rate": 9.214372921424331e-05, "loss": 0.0084, "step": 534580 }, { "epoch": 1.39, "learning_rate": 9.213984099787184e-05, "loss": 0.0096, "step": 534590 }, { "epoch": 1.39, "learning_rate": 9.213595278150038e-05, "loss": 0.0096, "step": 534600 }, { "epoch": 1.39, "learning_rate": 9.213206456512891e-05, "loss": 0.0108, "step": 534610 }, { "epoch": 1.39, "learning_rate": 9.212817634875745e-05, "loss": 0.0099, "step": 534620 }, { "epoch": 1.39, "learning_rate": 9.212428813238598e-05, "loss": 0.0093, "step": 534630 }, { "epoch": 1.39, "learning_rate": 9.212039991601452e-05, "loss": 0.008, "step": 534640 }, { "epoch": 1.39, "learning_rate": 9.211651169964305e-05, "loss": 0.01, "step": 534650 }, { "epoch": 1.39, "learning_rate": 9.211262348327159e-05, "loss": 0.0155, "step": 534660 }, { "epoch": 1.39, "learning_rate": 9.210873526690012e-05, "loss": 0.0094, "step": 534670 }, { "epoch": 1.39, "learning_rate": 9.210484705052865e-05, "loss": 0.0075, "step": 534680 }, { "epoch": 1.39, "learning_rate": 9.21009588341572e-05, "loss": 0.0093, "step": 534690 }, { "epoch": 1.39, "learning_rate": 9.209707061778572e-05, "loss": 0.0075, "step": 534700 }, { "epoch": 1.39, "learning_rate": 9.209318240141427e-05, "loss": 0.0086, "step": 534710 }, { "epoch": 1.39, "learning_rate": 9.20892941850428e-05, "loss": 0.0081, "step": 534720 }, { "epoch": 1.39, "learning_rate": 9.208540596867134e-05, "loss": 0.0078, "step": 534730 }, { "epoch": 1.39, "learning_rate": 9.208151775229987e-05, "loss": 0.0074, "step": 534740 }, { "epoch": 1.39, "learning_rate": 9.207762953592841e-05, "loss": 0.0091, "step": 534750 }, { "epoch": 1.39, "learning_rate": 9.207374131955694e-05, "loss": 0.0095, "step": 534760 }, { "epoch": 1.39, "learning_rate": 9.206985310318548e-05, "loss": 0.0082, "step": 534770 }, { "epoch": 1.39, "learning_rate": 9.206596488681401e-05, "loss": 0.0093, "step": 534780 }, { "epoch": 1.39, "learning_rate": 9.206207667044255e-05, "loss": 0.0079, "step": 534790 }, { "epoch": 1.39, "learning_rate": 9.205818845407108e-05, "loss": 0.0079, "step": 534800 }, { "epoch": 1.39, "learning_rate": 9.205430023769962e-05, "loss": 0.0095, "step": 534810 }, { "epoch": 1.39, "learning_rate": 9.205041202132815e-05, "loss": 0.0106, "step": 534820 }, { "epoch": 1.39, "learning_rate": 9.204652380495669e-05, "loss": 0.0077, "step": 534830 }, { "epoch": 1.39, "learning_rate": 9.204263558858522e-05, "loss": 0.0071, "step": 534840 }, { "epoch": 1.39, "learning_rate": 9.203874737221376e-05, "loss": 0.0108, "step": 534850 }, { "epoch": 1.39, "learning_rate": 9.203485915584229e-05, "loss": 0.0074, "step": 534860 }, { "epoch": 1.39, "learning_rate": 9.203097093947084e-05, "loss": 0.0084, "step": 534870 }, { "epoch": 1.39, "learning_rate": 9.202708272309937e-05, "loss": 0.0087, "step": 534880 }, { "epoch": 1.39, "learning_rate": 9.202319450672791e-05, "loss": 0.0098, "step": 534890 }, { "epoch": 1.39, "learning_rate": 9.201930629035644e-05, "loss": 0.0083, "step": 534900 }, { "epoch": 1.39, "learning_rate": 9.201541807398498e-05, "loss": 0.0075, "step": 534910 }, { "epoch": 1.39, "learning_rate": 9.201152985761351e-05, "loss": 0.0088, "step": 534920 }, { "epoch": 1.39, "learning_rate": 9.200764164124204e-05, "loss": 0.0122, "step": 534930 }, { "epoch": 1.39, "learning_rate": 9.200375342487058e-05, "loss": 0.0083, "step": 534940 }, { "epoch": 1.39, "learning_rate": 9.199986520849911e-05, "loss": 0.01, "step": 534950 }, { "epoch": 1.39, "learning_rate": 9.199597699212765e-05, "loss": 0.0097, "step": 534960 }, { "epoch": 1.39, "learning_rate": 9.199208877575618e-05, "loss": 0.0122, "step": 534970 }, { "epoch": 1.39, "learning_rate": 9.198820055938472e-05, "loss": 0.0076, "step": 534980 }, { "epoch": 1.39, "learning_rate": 9.198431234301325e-05, "loss": 0.009, "step": 534990 }, { "epoch": 1.39, "learning_rate": 9.198042412664179e-05, "loss": 0.0105, "step": 535000 }, { "epoch": 1.39, "eval_cer": 0.8816802921322209, "eval_loss": 0.0063683707267045975, "eval_runtime": 107.8309, "eval_samples_per_second": 18.548, "eval_steps_per_second": 4.637, "step": 535000 }, { "epoch": 1.39, "learning_rate": 9.197653591027032e-05, "loss": 0.0114, "step": 535010 }, { "epoch": 1.39, "learning_rate": 9.197264769389886e-05, "loss": 0.0086, "step": 535020 }, { "epoch": 1.39, "learning_rate": 9.196875947752739e-05, "loss": 0.0101, "step": 535030 }, { "epoch": 1.39, "learning_rate": 9.196487126115594e-05, "loss": 0.0121, "step": 535040 }, { "epoch": 1.39, "learning_rate": 9.196098304478446e-05, "loss": 0.0115, "step": 535050 }, { "epoch": 1.39, "learning_rate": 9.195709482841301e-05, "loss": 0.0124, "step": 535060 }, { "epoch": 1.39, "learning_rate": 9.195320661204154e-05, "loss": 0.0079, "step": 535070 }, { "epoch": 1.39, "learning_rate": 9.194931839567008e-05, "loss": 0.012, "step": 535080 }, { "epoch": 1.39, "learning_rate": 9.194543017929861e-05, "loss": 0.0095, "step": 535090 }, { "epoch": 1.39, "learning_rate": 9.194154196292715e-05, "loss": 0.0083, "step": 535100 }, { "epoch": 1.39, "learning_rate": 9.193765374655568e-05, "loss": 0.0091, "step": 535110 }, { "epoch": 1.39, "learning_rate": 9.193376553018422e-05, "loss": 0.0097, "step": 535120 }, { "epoch": 1.39, "learning_rate": 9.192987731381275e-05, "loss": 0.0109, "step": 535130 }, { "epoch": 1.39, "learning_rate": 9.192598909744129e-05, "loss": 0.0109, "step": 535140 }, { "epoch": 1.39, "learning_rate": 9.192210088106982e-05, "loss": 0.0107, "step": 535150 }, { "epoch": 1.39, "learning_rate": 9.191821266469836e-05, "loss": 0.009, "step": 535160 }, { "epoch": 1.39, "learning_rate": 9.191432444832689e-05, "loss": 0.0101, "step": 535170 }, { "epoch": 1.39, "learning_rate": 9.191043623195542e-05, "loss": 0.0101, "step": 535180 }, { "epoch": 1.39, "learning_rate": 9.190654801558396e-05, "loss": 0.0095, "step": 535190 }, { "epoch": 1.39, "learning_rate": 9.190265979921249e-05, "loss": 0.0143, "step": 535200 }, { "epoch": 1.39, "learning_rate": 9.189877158284103e-05, "loss": 0.0089, "step": 535210 }, { "epoch": 1.39, "learning_rate": 9.189488336646956e-05, "loss": 0.0076, "step": 535220 }, { "epoch": 1.39, "learning_rate": 9.189099515009811e-05, "loss": 0.0103, "step": 535230 }, { "epoch": 1.39, "learning_rate": 9.188710693372664e-05, "loss": 0.0117, "step": 535240 }, { "epoch": 1.39, "learning_rate": 9.188321871735518e-05, "loss": 0.0087, "step": 535250 }, { "epoch": 1.39, "learning_rate": 9.187933050098371e-05, "loss": 0.0093, "step": 535260 }, { "epoch": 1.39, "learning_rate": 9.187544228461225e-05, "loss": 0.01, "step": 535270 }, { "epoch": 1.39, "learning_rate": 9.187155406824078e-05, "loss": 0.0105, "step": 535280 }, { "epoch": 1.39, "learning_rate": 9.186766585186932e-05, "loss": 0.0098, "step": 535290 }, { "epoch": 1.39, "learning_rate": 9.186377763549785e-05, "loss": 0.0091, "step": 535300 }, { "epoch": 1.39, "learning_rate": 9.185988941912639e-05, "loss": 0.0092, "step": 535310 }, { "epoch": 1.39, "learning_rate": 9.185600120275492e-05, "loss": 0.0097, "step": 535320 }, { "epoch": 1.39, "learning_rate": 9.185211298638346e-05, "loss": 0.0096, "step": 535330 }, { "epoch": 1.39, "learning_rate": 9.184822477001199e-05, "loss": 0.0073, "step": 535340 }, { "epoch": 1.39, "learning_rate": 9.184433655364053e-05, "loss": 0.0103, "step": 535350 }, { "epoch": 1.39, "learning_rate": 9.184044833726906e-05, "loss": 0.0071, "step": 535360 }, { "epoch": 1.39, "learning_rate": 9.18365601208976e-05, "loss": 0.0065, "step": 535370 }, { "epoch": 1.39, "learning_rate": 9.183267190452613e-05, "loss": 0.0108, "step": 535380 }, { "epoch": 1.39, "learning_rate": 9.182878368815468e-05, "loss": 0.0087, "step": 535390 }, { "epoch": 1.39, "learning_rate": 9.182489547178321e-05, "loss": 0.0089, "step": 535400 }, { "epoch": 1.39, "learning_rate": 9.182100725541175e-05, "loss": 0.0103, "step": 535410 }, { "epoch": 1.39, "learning_rate": 9.181711903904028e-05, "loss": 0.0118, "step": 535420 }, { "epoch": 1.39, "learning_rate": 9.181323082266881e-05, "loss": 0.0114, "step": 535430 }, { "epoch": 1.39, "learning_rate": 9.180934260629735e-05, "loss": 0.009, "step": 535440 }, { "epoch": 1.39, "learning_rate": 9.180545438992588e-05, "loss": 0.0067, "step": 535450 }, { "epoch": 1.39, "learning_rate": 9.180156617355442e-05, "loss": 0.0108, "step": 535460 }, { "epoch": 1.39, "learning_rate": 9.179767795718295e-05, "loss": 0.0091, "step": 535470 }, { "epoch": 1.39, "learning_rate": 9.179378974081149e-05, "loss": 0.0079, "step": 535480 }, { "epoch": 1.39, "learning_rate": 9.178990152444002e-05, "loss": 0.0121, "step": 535490 }, { "epoch": 1.39, "learning_rate": 9.178601330806856e-05, "loss": 0.0109, "step": 535500 }, { "epoch": 1.39, "learning_rate": 9.178212509169709e-05, "loss": 0.0069, "step": 535510 }, { "epoch": 1.39, "learning_rate": 9.177823687532563e-05, "loss": 0.0095, "step": 535520 }, { "epoch": 1.39, "learning_rate": 9.177434865895416e-05, "loss": 0.0075, "step": 535530 }, { "epoch": 1.39, "learning_rate": 9.17704604425827e-05, "loss": 0.0101, "step": 535540 }, { "epoch": 1.39, "learning_rate": 9.176657222621123e-05, "loss": 0.0088, "step": 535550 }, { "epoch": 1.39, "learning_rate": 9.176268400983978e-05, "loss": 0.0051, "step": 535560 }, { "epoch": 1.39, "learning_rate": 9.17587957934683e-05, "loss": 0.0108, "step": 535570 }, { "epoch": 1.39, "learning_rate": 9.175490757709685e-05, "loss": 0.0064, "step": 535580 }, { "epoch": 1.39, "learning_rate": 9.175101936072538e-05, "loss": 0.0097, "step": 535590 }, { "epoch": 1.39, "learning_rate": 9.174713114435392e-05, "loss": 0.0134, "step": 535600 }, { "epoch": 1.39, "learning_rate": 9.174324292798245e-05, "loss": 0.0092, "step": 535610 }, { "epoch": 1.39, "learning_rate": 9.173935471161099e-05, "loss": 0.0087, "step": 535620 }, { "epoch": 1.39, "learning_rate": 9.173546649523952e-05, "loss": 0.0083, "step": 535630 }, { "epoch": 1.39, "learning_rate": 9.173157827886806e-05, "loss": 0.0114, "step": 535640 }, { "epoch": 1.39, "learning_rate": 9.172769006249659e-05, "loss": 0.0092, "step": 535650 }, { "epoch": 1.39, "learning_rate": 9.172380184612513e-05, "loss": 0.0078, "step": 535660 }, { "epoch": 1.39, "learning_rate": 9.171991362975366e-05, "loss": 0.0088, "step": 535670 }, { "epoch": 1.39, "learning_rate": 9.171602541338219e-05, "loss": 0.0112, "step": 535680 }, { "epoch": 1.39, "learning_rate": 9.171213719701073e-05, "loss": 0.0096, "step": 535690 }, { "epoch": 1.39, "learning_rate": 9.170824898063926e-05, "loss": 0.01, "step": 535700 }, { "epoch": 1.39, "learning_rate": 9.17043607642678e-05, "loss": 0.0083, "step": 535710 }, { "epoch": 1.39, "learning_rate": 9.170047254789633e-05, "loss": 0.0098, "step": 535720 }, { "epoch": 1.39, "learning_rate": 9.169658433152487e-05, "loss": 0.01, "step": 535730 }, { "epoch": 1.39, "learning_rate": 9.16926961151534e-05, "loss": 0.0207, "step": 535740 }, { "epoch": 1.39, "learning_rate": 9.168880789878195e-05, "loss": 0.0081, "step": 535750 }, { "epoch": 1.39, "learning_rate": 9.168491968241048e-05, "loss": 0.0102, "step": 535760 }, { "epoch": 1.39, "learning_rate": 9.168103146603902e-05, "loss": 0.0088, "step": 535770 }, { "epoch": 1.39, "learning_rate": 9.167714324966755e-05, "loss": 0.0101, "step": 535780 }, { "epoch": 1.39, "learning_rate": 9.167325503329609e-05, "loss": 0.0075, "step": 535790 }, { "epoch": 1.39, "learning_rate": 9.166936681692462e-05, "loss": 0.0143, "step": 535800 }, { "epoch": 1.39, "learning_rate": 9.166547860055316e-05, "loss": 0.0101, "step": 535810 }, { "epoch": 1.39, "learning_rate": 9.166159038418169e-05, "loss": 0.0113, "step": 535820 }, { "epoch": 1.39, "learning_rate": 9.165770216781023e-05, "loss": 0.01, "step": 535830 }, { "epoch": 1.39, "learning_rate": 9.165381395143876e-05, "loss": 0.009, "step": 535840 }, { "epoch": 1.39, "learning_rate": 9.16499257350673e-05, "loss": 0.0109, "step": 535850 }, { "epoch": 1.39, "learning_rate": 9.164603751869583e-05, "loss": 0.0088, "step": 535860 }, { "epoch": 1.39, "learning_rate": 9.164214930232437e-05, "loss": 0.0095, "step": 535870 }, { "epoch": 1.39, "learning_rate": 9.16382610859529e-05, "loss": 0.0099, "step": 535880 }, { "epoch": 1.39, "learning_rate": 9.163437286958144e-05, "loss": 0.011, "step": 535890 }, { "epoch": 1.39, "learning_rate": 9.163048465320997e-05, "loss": 0.01, "step": 535900 }, { "epoch": 1.39, "learning_rate": 9.162659643683852e-05, "loss": 0.0104, "step": 535910 }, { "epoch": 1.39, "learning_rate": 9.162270822046705e-05, "loss": 0.0116, "step": 535920 }, { "epoch": 1.39, "learning_rate": 9.161882000409557e-05, "loss": 0.0074, "step": 535930 }, { "epoch": 1.39, "learning_rate": 9.161493178772412e-05, "loss": 0.0121, "step": 535940 }, { "epoch": 1.39, "learning_rate": 9.161104357135265e-05, "loss": 0.011, "step": 535950 }, { "epoch": 1.39, "learning_rate": 9.160715535498119e-05, "loss": 0.0113, "step": 535960 }, { "epoch": 1.39, "learning_rate": 9.160326713860972e-05, "loss": 0.0101, "step": 535970 }, { "epoch": 1.39, "learning_rate": 9.159937892223826e-05, "loss": 0.0097, "step": 535980 }, { "epoch": 1.39, "learning_rate": 9.159549070586679e-05, "loss": 0.0083, "step": 535990 }, { "epoch": 1.39, "learning_rate": 9.159160248949533e-05, "loss": 0.0079, "step": 536000 }, { "epoch": 1.39, "eval_cer": 0.8816760932214184, "eval_loss": 0.006177127361297607, "eval_runtime": 107.7114, "eval_samples_per_second": 18.568, "eval_steps_per_second": 4.642, "step": 536000 }, { "epoch": 1.39, "learning_rate": 9.158771427312386e-05, "loss": 0.0102, "step": 536010 }, { "epoch": 1.39, "learning_rate": 9.15838260567524e-05, "loss": 0.0093, "step": 536020 }, { "epoch": 1.39, "learning_rate": 9.157993784038093e-05, "loss": 0.0102, "step": 536030 }, { "epoch": 1.39, "learning_rate": 9.157604962400947e-05, "loss": 0.0107, "step": 536040 }, { "epoch": 1.39, "learning_rate": 9.1572161407638e-05, "loss": 0.0125, "step": 536050 }, { "epoch": 1.39, "learning_rate": 9.156827319126654e-05, "loss": 0.0101, "step": 536060 }, { "epoch": 1.39, "learning_rate": 9.156438497489507e-05, "loss": 0.0091, "step": 536070 }, { "epoch": 1.39, "learning_rate": 9.156049675852361e-05, "loss": 0.0107, "step": 536080 }, { "epoch": 1.39, "learning_rate": 9.155660854215214e-05, "loss": 0.0079, "step": 536090 }, { "epoch": 1.39, "learning_rate": 9.155272032578069e-05, "loss": 0.0098, "step": 536100 }, { "epoch": 1.39, "learning_rate": 9.154883210940922e-05, "loss": 0.0092, "step": 536110 }, { "epoch": 1.39, "learning_rate": 9.154494389303776e-05, "loss": 0.0096, "step": 536120 }, { "epoch": 1.39, "learning_rate": 9.154105567666629e-05, "loss": 0.0079, "step": 536130 }, { "epoch": 1.39, "learning_rate": 9.153716746029483e-05, "loss": 0.0095, "step": 536140 }, { "epoch": 1.39, "learning_rate": 9.153327924392336e-05, "loss": 0.0087, "step": 536150 }, { "epoch": 1.39, "learning_rate": 9.152939102755189e-05, "loss": 0.0093, "step": 536160 }, { "epoch": 1.39, "learning_rate": 9.152550281118043e-05, "loss": 0.0089, "step": 536170 }, { "epoch": 1.39, "learning_rate": 9.152161459480896e-05, "loss": 0.0078, "step": 536180 }, { "epoch": 1.39, "learning_rate": 9.15177263784375e-05, "loss": 0.0098, "step": 536190 }, { "epoch": 1.39, "learning_rate": 9.151383816206603e-05, "loss": 0.011, "step": 536200 }, { "epoch": 1.39, "learning_rate": 9.150994994569457e-05, "loss": 0.0074, "step": 536210 }, { "epoch": 1.39, "learning_rate": 9.15060617293231e-05, "loss": 0.0097, "step": 536220 }, { "epoch": 1.39, "learning_rate": 9.150217351295164e-05, "loss": 0.011, "step": 536230 }, { "epoch": 1.39, "learning_rate": 9.149828529658017e-05, "loss": 0.0084, "step": 536240 }, { "epoch": 1.39, "learning_rate": 9.149439708020871e-05, "loss": 0.0102, "step": 536250 }, { "epoch": 1.39, "learning_rate": 9.149050886383724e-05, "loss": 0.0096, "step": 536260 }, { "epoch": 1.39, "learning_rate": 9.148662064746579e-05, "loss": 0.0077, "step": 536270 }, { "epoch": 1.39, "learning_rate": 9.14827324310943e-05, "loss": 0.0088, "step": 536280 }, { "epoch": 1.39, "learning_rate": 9.147884421472286e-05, "loss": 0.0083, "step": 536290 }, { "epoch": 1.39, "learning_rate": 9.147495599835139e-05, "loss": 0.0096, "step": 536300 }, { "epoch": 1.39, "learning_rate": 9.147106778197993e-05, "loss": 0.01, "step": 536310 }, { "epoch": 1.39, "learning_rate": 9.146717956560846e-05, "loss": 0.0084, "step": 536320 }, { "epoch": 1.39, "learning_rate": 9.1463291349237e-05, "loss": 0.0087, "step": 536330 }, { "epoch": 1.39, "learning_rate": 9.145940313286553e-05, "loss": 0.0112, "step": 536340 }, { "epoch": 1.39, "learning_rate": 9.145551491649407e-05, "loss": 0.0066, "step": 536350 }, { "epoch": 1.39, "learning_rate": 9.14516267001226e-05, "loss": 0.0096, "step": 536360 }, { "epoch": 1.39, "learning_rate": 9.144773848375114e-05, "loss": 0.0074, "step": 536370 }, { "epoch": 1.39, "learning_rate": 9.144385026737967e-05, "loss": 0.0073, "step": 536380 }, { "epoch": 1.39, "learning_rate": 9.143996205100821e-05, "loss": 0.0082, "step": 536390 }, { "epoch": 1.39, "learning_rate": 9.143607383463674e-05, "loss": 0.0093, "step": 536400 }, { "epoch": 1.39, "learning_rate": 9.143218561826527e-05, "loss": 0.0109, "step": 536410 }, { "epoch": 1.39, "learning_rate": 9.142829740189381e-05, "loss": 0.0119, "step": 536420 }, { "epoch": 1.39, "learning_rate": 9.142440918552234e-05, "loss": 0.0081, "step": 536430 }, { "epoch": 1.39, "learning_rate": 9.142052096915088e-05, "loss": 0.0079, "step": 536440 }, { "epoch": 1.39, "learning_rate": 9.14166327527794e-05, "loss": 0.0069, "step": 536450 }, { "epoch": 1.39, "learning_rate": 9.141274453640796e-05, "loss": 0.0075, "step": 536460 }, { "epoch": 1.39, "learning_rate": 9.140885632003649e-05, "loss": 0.0091, "step": 536470 }, { "epoch": 1.39, "learning_rate": 9.140496810366503e-05, "loss": 0.0092, "step": 536480 }, { "epoch": 1.39, "learning_rate": 9.140107988729356e-05, "loss": 0.0087, "step": 536490 }, { "epoch": 1.39, "learning_rate": 9.13971916709221e-05, "loss": 0.0077, "step": 536500 }, { "epoch": 1.39, "learning_rate": 9.139330345455063e-05, "loss": 0.0066, "step": 536510 }, { "epoch": 1.39, "learning_rate": 9.138941523817917e-05, "loss": 0.0093, "step": 536520 }, { "epoch": 1.39, "learning_rate": 9.13855270218077e-05, "loss": 0.0106, "step": 536530 }, { "epoch": 1.39, "learning_rate": 9.138163880543624e-05, "loss": 0.0129, "step": 536540 }, { "epoch": 1.39, "learning_rate": 9.137775058906477e-05, "loss": 0.0105, "step": 536550 }, { "epoch": 1.39, "learning_rate": 9.137386237269331e-05, "loss": 0.0129, "step": 536560 }, { "epoch": 1.39, "learning_rate": 9.136997415632184e-05, "loss": 0.0091, "step": 536570 }, { "epoch": 1.39, "learning_rate": 9.136608593995038e-05, "loss": 0.0104, "step": 536580 }, { "epoch": 1.39, "learning_rate": 9.136219772357891e-05, "loss": 0.0086, "step": 536590 }, { "epoch": 1.39, "learning_rate": 9.135830950720745e-05, "loss": 0.0092, "step": 536600 }, { "epoch": 1.39, "learning_rate": 9.135442129083598e-05, "loss": 0.0098, "step": 536610 }, { "epoch": 1.39, "learning_rate": 9.135053307446453e-05, "loss": 0.0094, "step": 536620 }, { "epoch": 1.39, "learning_rate": 9.134664485809306e-05, "loss": 0.0116, "step": 536630 }, { "epoch": 1.39, "learning_rate": 9.13427566417216e-05, "loss": 0.0129, "step": 536640 }, { "epoch": 1.39, "learning_rate": 9.133886842535013e-05, "loss": 0.0079, "step": 536650 }, { "epoch": 1.39, "learning_rate": 9.133498020897866e-05, "loss": 0.009, "step": 536660 }, { "epoch": 1.39, "learning_rate": 9.13310919926072e-05, "loss": 0.0074, "step": 536670 }, { "epoch": 1.39, "learning_rate": 9.132720377623573e-05, "loss": 0.0088, "step": 536680 }, { "epoch": 1.39, "learning_rate": 9.132331555986427e-05, "loss": 0.0066, "step": 536690 }, { "epoch": 1.39, "learning_rate": 9.13194273434928e-05, "loss": 0.0125, "step": 536700 }, { "epoch": 1.39, "learning_rate": 9.131553912712134e-05, "loss": 0.0099, "step": 536710 }, { "epoch": 1.39, "learning_rate": 9.131165091074987e-05, "loss": 0.0099, "step": 536720 }, { "epoch": 1.39, "learning_rate": 9.130776269437841e-05, "loss": 0.0087, "step": 536730 }, { "epoch": 1.39, "learning_rate": 9.130387447800694e-05, "loss": 0.0119, "step": 536740 }, { "epoch": 1.39, "learning_rate": 9.129998626163548e-05, "loss": 0.0099, "step": 536750 }, { "epoch": 1.39, "learning_rate": 9.129609804526401e-05, "loss": 0.0086, "step": 536760 }, { "epoch": 1.39, "learning_rate": 9.129220982889255e-05, "loss": 0.0079, "step": 536770 }, { "epoch": 1.39, "learning_rate": 9.128832161252108e-05, "loss": 0.0089, "step": 536780 }, { "epoch": 1.39, "learning_rate": 9.128443339614963e-05, "loss": 0.0113, "step": 536790 }, { "epoch": 1.39, "learning_rate": 9.128054517977815e-05, "loss": 0.009, "step": 536800 }, { "epoch": 1.39, "learning_rate": 9.12766569634067e-05, "loss": 0.0099, "step": 536810 }, { "epoch": 1.39, "learning_rate": 9.127276874703523e-05, "loss": 0.0107, "step": 536820 }, { "epoch": 1.39, "learning_rate": 9.126888053066377e-05, "loss": 0.009, "step": 536830 }, { "epoch": 1.39, "learning_rate": 9.12649923142923e-05, "loss": 0.0083, "step": 536840 }, { "epoch": 1.39, "learning_rate": 9.126110409792084e-05, "loss": 0.0108, "step": 536850 }, { "epoch": 1.39, "learning_rate": 9.125721588154937e-05, "loss": 0.0089, "step": 536860 }, { "epoch": 1.39, "learning_rate": 9.125332766517791e-05, "loss": 0.0073, "step": 536870 }, { "epoch": 1.39, "learning_rate": 9.124943944880644e-05, "loss": 0.009, "step": 536880 }, { "epoch": 1.39, "learning_rate": 9.124555123243498e-05, "loss": 0.0092, "step": 536890 }, { "epoch": 1.39, "learning_rate": 9.124166301606351e-05, "loss": 0.0079, "step": 536900 }, { "epoch": 1.39, "learning_rate": 9.123777479969204e-05, "loss": 0.0125, "step": 536910 }, { "epoch": 1.39, "learning_rate": 9.123388658332058e-05, "loss": 0.0079, "step": 536920 }, { "epoch": 1.39, "learning_rate": 9.12299983669491e-05, "loss": 0.0078, "step": 536930 }, { "epoch": 1.39, "learning_rate": 9.122611015057765e-05, "loss": 0.0059, "step": 536940 }, { "epoch": 1.39, "learning_rate": 9.122222193420618e-05, "loss": 0.0086, "step": 536950 }, { "epoch": 1.39, "learning_rate": 9.121833371783472e-05, "loss": 0.0104, "step": 536960 }, { "epoch": 1.39, "learning_rate": 9.121444550146325e-05, "loss": 0.0094, "step": 536970 }, { "epoch": 1.39, "learning_rate": 9.12105572850918e-05, "loss": 0.01, "step": 536980 }, { "epoch": 1.39, "learning_rate": 9.120666906872033e-05, "loss": 0.011, "step": 536990 }, { "epoch": 1.39, "learning_rate": 9.120278085234887e-05, "loss": 0.01, "step": 537000 }, { "epoch": 1.39, "eval_cer": 0.8816676953998133, "eval_loss": 0.006287885829806328, "eval_runtime": 107.8496, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 537000 }, { "epoch": 1.39, "learning_rate": 9.11988926359774e-05, "loss": 0.0101, "step": 537010 }, { "epoch": 1.39, "learning_rate": 9.119500441960594e-05, "loss": 0.0075, "step": 537020 }, { "epoch": 1.39, "learning_rate": 9.119111620323447e-05, "loss": 0.0102, "step": 537030 }, { "epoch": 1.39, "learning_rate": 9.118722798686301e-05, "loss": 0.0087, "step": 537040 }, { "epoch": 1.39, "learning_rate": 9.118333977049154e-05, "loss": 0.0124, "step": 537050 }, { "epoch": 1.39, "learning_rate": 9.117945155412008e-05, "loss": 0.0104, "step": 537060 }, { "epoch": 1.39, "learning_rate": 9.117556333774861e-05, "loss": 0.0086, "step": 537070 }, { "epoch": 1.39, "learning_rate": 9.117167512137715e-05, "loss": 0.0089, "step": 537080 }, { "epoch": 1.39, "learning_rate": 9.116778690500568e-05, "loss": 0.0104, "step": 537090 }, { "epoch": 1.39, "learning_rate": 9.116389868863422e-05, "loss": 0.0103, "step": 537100 }, { "epoch": 1.39, "learning_rate": 9.116001047226275e-05, "loss": 0.0075, "step": 537110 }, { "epoch": 1.39, "learning_rate": 9.115612225589129e-05, "loss": 0.0096, "step": 537120 }, { "epoch": 1.39, "learning_rate": 9.115223403951982e-05, "loss": 0.0089, "step": 537130 }, { "epoch": 1.39, "learning_rate": 9.114834582314837e-05, "loss": 0.0092, "step": 537140 }, { "epoch": 1.39, "learning_rate": 9.11444576067769e-05, "loss": 0.0125, "step": 537150 }, { "epoch": 1.39, "learning_rate": 9.114056939040541e-05, "loss": 0.0091, "step": 537160 }, { "epoch": 1.39, "learning_rate": 9.113668117403397e-05, "loss": 0.0112, "step": 537170 }, { "epoch": 1.39, "learning_rate": 9.11327929576625e-05, "loss": 0.0099, "step": 537180 }, { "epoch": 1.39, "learning_rate": 9.112890474129104e-05, "loss": 0.0099, "step": 537190 }, { "epoch": 1.39, "learning_rate": 9.112501652491957e-05, "loss": 0.0093, "step": 537200 }, { "epoch": 1.39, "learning_rate": 9.112112830854811e-05, "loss": 0.0099, "step": 537210 }, { "epoch": 1.39, "learning_rate": 9.111724009217664e-05, "loss": 0.0108, "step": 537220 }, { "epoch": 1.39, "learning_rate": 9.111335187580518e-05, "loss": 0.0091, "step": 537230 }, { "epoch": 1.39, "learning_rate": 9.110946365943371e-05, "loss": 0.0097, "step": 537240 }, { "epoch": 1.39, "learning_rate": 9.110557544306225e-05, "loss": 0.0113, "step": 537250 }, { "epoch": 1.39, "learning_rate": 9.110168722669078e-05, "loss": 0.0105, "step": 537260 }, { "epoch": 1.39, "learning_rate": 9.109779901031932e-05, "loss": 0.0084, "step": 537270 }, { "epoch": 1.39, "learning_rate": 9.109391079394785e-05, "loss": 0.0105, "step": 537280 }, { "epoch": 1.39, "learning_rate": 9.109002257757639e-05, "loss": 0.0075, "step": 537290 }, { "epoch": 1.39, "learning_rate": 9.108613436120492e-05, "loss": 0.0118, "step": 537300 }, { "epoch": 1.39, "learning_rate": 9.108224614483347e-05, "loss": 0.0079, "step": 537310 }, { "epoch": 1.39, "learning_rate": 9.107835792846199e-05, "loss": 0.0086, "step": 537320 }, { "epoch": 1.39, "learning_rate": 9.107446971209054e-05, "loss": 0.0095, "step": 537330 }, { "epoch": 1.39, "learning_rate": 9.107058149571907e-05, "loss": 0.0103, "step": 537340 }, { "epoch": 1.39, "learning_rate": 9.106669327934761e-05, "loss": 0.0077, "step": 537350 }, { "epoch": 1.39, "learning_rate": 9.106280506297614e-05, "loss": 0.0106, "step": 537360 }, { "epoch": 1.39, "learning_rate": 9.105891684660468e-05, "loss": 0.0118, "step": 537370 }, { "epoch": 1.39, "learning_rate": 9.105502863023321e-05, "loss": 0.0088, "step": 537380 }, { "epoch": 1.39, "learning_rate": 9.105114041386175e-05, "loss": 0.0091, "step": 537390 }, { "epoch": 1.39, "learning_rate": 9.104725219749028e-05, "loss": 0.0101, "step": 537400 }, { "epoch": 1.39, "learning_rate": 9.104336398111881e-05, "loss": 0.0104, "step": 537410 }, { "epoch": 1.39, "learning_rate": 9.103947576474735e-05, "loss": 0.0074, "step": 537420 }, { "epoch": 1.39, "learning_rate": 9.103558754837588e-05, "loss": 0.0102, "step": 537430 }, { "epoch": 1.39, "learning_rate": 9.103169933200442e-05, "loss": 0.0112, "step": 537440 }, { "epoch": 1.39, "learning_rate": 9.102781111563295e-05, "loss": 0.0104, "step": 537450 }, { "epoch": 1.39, "learning_rate": 9.102392289926149e-05, "loss": 0.0101, "step": 537460 }, { "epoch": 1.39, "learning_rate": 9.102003468289002e-05, "loss": 0.0091, "step": 537470 }, { "epoch": 1.39, "learning_rate": 9.101614646651856e-05, "loss": 0.008, "step": 537480 }, { "epoch": 1.39, "learning_rate": 9.101225825014709e-05, "loss": 0.0103, "step": 537490 }, { "epoch": 1.39, "learning_rate": 9.100837003377564e-05, "loss": 0.0126, "step": 537500 }, { "epoch": 1.39, "learning_rate": 9.100448181740417e-05, "loss": 0.0104, "step": 537510 }, { "epoch": 1.39, "learning_rate": 9.100059360103271e-05, "loss": 0.0099, "step": 537520 }, { "epoch": 1.39, "learning_rate": 9.099670538466124e-05, "loss": 0.0128, "step": 537530 }, { "epoch": 1.39, "learning_rate": 9.099281716828978e-05, "loss": 0.0103, "step": 537540 }, { "epoch": 1.39, "learning_rate": 9.098892895191831e-05, "loss": 0.0088, "step": 537550 }, { "epoch": 1.39, "learning_rate": 9.098504073554685e-05, "loss": 0.0118, "step": 537560 }, { "epoch": 1.39, "learning_rate": 9.098115251917538e-05, "loss": 0.0105, "step": 537570 }, { "epoch": 1.39, "learning_rate": 9.097726430280392e-05, "loss": 0.0088, "step": 537580 }, { "epoch": 1.39, "learning_rate": 9.097337608643245e-05, "loss": 0.0091, "step": 537590 }, { "epoch": 1.39, "learning_rate": 9.096948787006099e-05, "loss": 0.008, "step": 537600 }, { "epoch": 1.39, "learning_rate": 9.096559965368952e-05, "loss": 0.0154, "step": 537610 }, { "epoch": 1.39, "learning_rate": 9.096171143731806e-05, "loss": 0.0085, "step": 537620 }, { "epoch": 1.39, "learning_rate": 9.095782322094659e-05, "loss": 0.007, "step": 537630 }, { "epoch": 1.39, "learning_rate": 9.095393500457513e-05, "loss": 0.0101, "step": 537640 }, { "epoch": 1.39, "learning_rate": 9.095004678820366e-05, "loss": 0.0106, "step": 537650 }, { "epoch": 1.39, "learning_rate": 9.094615857183219e-05, "loss": 0.0089, "step": 537660 }, { "epoch": 1.39, "learning_rate": 9.094227035546073e-05, "loss": 0.0082, "step": 537670 }, { "epoch": 1.39, "learning_rate": 9.093838213908925e-05, "loss": 0.0069, "step": 537680 }, { "epoch": 1.39, "learning_rate": 9.093449392271781e-05, "loss": 0.0114, "step": 537690 }, { "epoch": 1.39, "learning_rate": 9.093060570634634e-05, "loss": 0.0128, "step": 537700 }, { "epoch": 1.39, "learning_rate": 9.092671748997488e-05, "loss": 0.0094, "step": 537710 }, { "epoch": 1.39, "learning_rate": 9.092282927360341e-05, "loss": 0.009, "step": 537720 }, { "epoch": 1.39, "learning_rate": 9.091894105723195e-05, "loss": 0.0088, "step": 537730 }, { "epoch": 1.39, "learning_rate": 9.091505284086048e-05, "loss": 0.0105, "step": 537740 }, { "epoch": 1.39, "learning_rate": 9.091116462448902e-05, "loss": 0.0077, "step": 537750 }, { "epoch": 1.39, "learning_rate": 9.090727640811755e-05, "loss": 0.0151, "step": 537760 }, { "epoch": 1.39, "learning_rate": 9.090338819174609e-05, "loss": 0.0075, "step": 537770 }, { "epoch": 1.39, "learning_rate": 9.089949997537462e-05, "loss": 0.0096, "step": 537780 }, { "epoch": 1.39, "learning_rate": 9.089561175900316e-05, "loss": 0.0103, "step": 537790 }, { "epoch": 1.39, "learning_rate": 9.089172354263169e-05, "loss": 0.0092, "step": 537800 }, { "epoch": 1.39, "learning_rate": 9.088783532626023e-05, "loss": 0.0099, "step": 537810 }, { "epoch": 1.39, "learning_rate": 9.088394710988876e-05, "loss": 0.0083, "step": 537820 }, { "epoch": 1.39, "learning_rate": 9.08800588935173e-05, "loss": 0.0096, "step": 537830 }, { "epoch": 1.39, "learning_rate": 9.087617067714583e-05, "loss": 0.0081, "step": 537840 }, { "epoch": 1.39, "learning_rate": 9.087228246077438e-05, "loss": 0.0118, "step": 537850 }, { "epoch": 1.39, "learning_rate": 9.086839424440291e-05, "loss": 0.0107, "step": 537860 }, { "epoch": 1.39, "learning_rate": 9.086450602803145e-05, "loss": 0.0099, "step": 537870 }, { "epoch": 1.39, "learning_rate": 9.086061781165998e-05, "loss": 0.0079, "step": 537880 }, { "epoch": 1.39, "learning_rate": 9.085672959528852e-05, "loss": 0.0089, "step": 537890 }, { "epoch": 1.39, "learning_rate": 9.085284137891705e-05, "loss": 0.0117, "step": 537900 }, { "epoch": 1.39, "learning_rate": 9.084895316254558e-05, "loss": 0.0091, "step": 537910 }, { "epoch": 1.39, "learning_rate": 9.084506494617412e-05, "loss": 0.0085, "step": 537920 }, { "epoch": 1.39, "learning_rate": 9.084117672980265e-05, "loss": 0.0097, "step": 537930 }, { "epoch": 1.39, "learning_rate": 9.083728851343119e-05, "loss": 0.0103, "step": 537940 }, { "epoch": 1.39, "learning_rate": 9.083340029705972e-05, "loss": 0.0097, "step": 537950 }, { "epoch": 1.39, "learning_rate": 9.082951208068826e-05, "loss": 0.0065, "step": 537960 }, { "epoch": 1.39, "learning_rate": 9.082562386431679e-05, "loss": 0.0105, "step": 537970 }, { "epoch": 1.39, "learning_rate": 9.082173564794533e-05, "loss": 0.0107, "step": 537980 }, { "epoch": 1.39, "learning_rate": 9.081784743157386e-05, "loss": 0.0082, "step": 537990 }, { "epoch": 1.39, "learning_rate": 9.08139592152024e-05, "loss": 0.0126, "step": 538000 }, { "epoch": 1.39, "eval_cer": 0.8816522993935373, "eval_loss": 0.006265460047870874, "eval_runtime": 107.8561, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 538000 }, { "epoch": 1.39, "learning_rate": 9.081007099883093e-05, "loss": 0.0092, "step": 538010 }, { "epoch": 1.39, "learning_rate": 9.080618278245948e-05, "loss": 0.0089, "step": 538020 }, { "epoch": 1.39, "learning_rate": 9.0802294566088e-05, "loss": 0.0136, "step": 538030 }, { "epoch": 1.39, "learning_rate": 9.079840634971655e-05, "loss": 0.0128, "step": 538040 }, { "epoch": 1.39, "learning_rate": 9.079451813334508e-05, "loss": 0.011, "step": 538050 }, { "epoch": 1.39, "learning_rate": 9.079062991697362e-05, "loss": 0.0102, "step": 538060 }, { "epoch": 1.39, "learning_rate": 9.078674170060215e-05, "loss": 0.0084, "step": 538070 }, { "epoch": 1.39, "learning_rate": 9.078285348423069e-05, "loss": 0.0117, "step": 538080 }, { "epoch": 1.39, "learning_rate": 9.077896526785922e-05, "loss": 0.012, "step": 538090 }, { "epoch": 1.39, "learning_rate": 9.077507705148776e-05, "loss": 0.0074, "step": 538100 }, { "epoch": 1.39, "learning_rate": 9.077118883511629e-05, "loss": 0.0108, "step": 538110 }, { "epoch": 1.39, "learning_rate": 9.076730061874483e-05, "loss": 0.0122, "step": 538120 }, { "epoch": 1.39, "learning_rate": 9.076341240237336e-05, "loss": 0.0099, "step": 538130 }, { "epoch": 1.39, "learning_rate": 9.07595241860019e-05, "loss": 0.0073, "step": 538140 }, { "epoch": 1.39, "learning_rate": 9.075563596963043e-05, "loss": 0.0138, "step": 538150 }, { "epoch": 1.39, "learning_rate": 9.075174775325896e-05, "loss": 0.0083, "step": 538160 }, { "epoch": 1.4, "learning_rate": 9.07478595368875e-05, "loss": 0.0133, "step": 538170 }, { "epoch": 1.4, "learning_rate": 9.074397132051603e-05, "loss": 0.0073, "step": 538180 }, { "epoch": 1.4, "learning_rate": 9.074008310414457e-05, "loss": 0.0087, "step": 538190 }, { "epoch": 1.4, "learning_rate": 9.07361948877731e-05, "loss": 0.0075, "step": 538200 }, { "epoch": 1.4, "learning_rate": 9.073230667140165e-05, "loss": 0.0082, "step": 538210 }, { "epoch": 1.4, "learning_rate": 9.072841845503018e-05, "loss": 0.0109, "step": 538220 }, { "epoch": 1.4, "learning_rate": 9.072453023865872e-05, "loss": 0.0065, "step": 538230 }, { "epoch": 1.4, "learning_rate": 9.072064202228725e-05, "loss": 0.0102, "step": 538240 }, { "epoch": 1.4, "learning_rate": 9.071675380591579e-05, "loss": 0.0087, "step": 538250 }, { "epoch": 1.4, "learning_rate": 9.071286558954432e-05, "loss": 0.0085, "step": 538260 }, { "epoch": 1.4, "learning_rate": 9.070897737317286e-05, "loss": 0.012, "step": 538270 }, { "epoch": 1.4, "learning_rate": 9.070508915680139e-05, "loss": 0.0087, "step": 538280 }, { "epoch": 1.4, "learning_rate": 9.070120094042993e-05, "loss": 0.0065, "step": 538290 }, { "epoch": 1.4, "learning_rate": 9.069731272405846e-05, "loss": 0.0214, "step": 538300 }, { "epoch": 1.4, "learning_rate": 9.0693424507687e-05, "loss": 0.0093, "step": 538310 }, { "epoch": 1.4, "learning_rate": 9.068953629131553e-05, "loss": 0.0111, "step": 538320 }, { "epoch": 1.4, "learning_rate": 9.068564807494407e-05, "loss": 0.0102, "step": 538330 }, { "epoch": 1.4, "learning_rate": 9.06817598585726e-05, "loss": 0.0086, "step": 538340 }, { "epoch": 1.4, "learning_rate": 9.067787164220114e-05, "loss": 0.009, "step": 538350 }, { "epoch": 1.4, "learning_rate": 9.067398342582967e-05, "loss": 0.01, "step": 538360 }, { "epoch": 1.4, "learning_rate": 9.067009520945822e-05, "loss": 0.009, "step": 538370 }, { "epoch": 1.4, "learning_rate": 9.066620699308675e-05, "loss": 0.011, "step": 538380 }, { "epoch": 1.4, "learning_rate": 9.066231877671529e-05, "loss": 0.0084, "step": 538390 }, { "epoch": 1.4, "learning_rate": 9.065843056034382e-05, "loss": 0.0069, "step": 538400 }, { "epoch": 1.4, "learning_rate": 9.065454234397235e-05, "loss": 0.0083, "step": 538410 }, { "epoch": 1.4, "learning_rate": 9.065065412760089e-05, "loss": 0.0084, "step": 538420 }, { "epoch": 1.4, "learning_rate": 9.064676591122942e-05, "loss": 0.0097, "step": 538430 }, { "epoch": 1.4, "learning_rate": 9.064287769485796e-05, "loss": 0.0085, "step": 538440 }, { "epoch": 1.4, "learning_rate": 9.063898947848649e-05, "loss": 0.0114, "step": 538450 }, { "epoch": 1.4, "learning_rate": 9.063510126211503e-05, "loss": 0.0083, "step": 538460 }, { "epoch": 1.4, "learning_rate": 9.063121304574356e-05, "loss": 0.0095, "step": 538470 }, { "epoch": 1.4, "learning_rate": 9.06273248293721e-05, "loss": 0.0107, "step": 538480 }, { "epoch": 1.4, "learning_rate": 9.062343661300063e-05, "loss": 0.0087, "step": 538490 }, { "epoch": 1.4, "learning_rate": 9.061954839662917e-05, "loss": 0.0105, "step": 538500 }, { "epoch": 1.4, "learning_rate": 9.06156601802577e-05, "loss": 0.0096, "step": 538510 }, { "epoch": 1.4, "learning_rate": 9.061177196388624e-05, "loss": 0.0108, "step": 538520 }, { "epoch": 1.4, "learning_rate": 9.060788374751477e-05, "loss": 0.0087, "step": 538530 }, { "epoch": 1.4, "learning_rate": 9.060399553114332e-05, "loss": 0.0087, "step": 538540 }, { "epoch": 1.4, "learning_rate": 9.060010731477184e-05, "loss": 0.0125, "step": 538550 }, { "epoch": 1.4, "learning_rate": 9.059621909840039e-05, "loss": 0.0105, "step": 538560 }, { "epoch": 1.4, "learning_rate": 9.059233088202892e-05, "loss": 0.0078, "step": 538570 }, { "epoch": 1.4, "learning_rate": 9.058844266565746e-05, "loss": 0.0078, "step": 538580 }, { "epoch": 1.4, "learning_rate": 9.058455444928599e-05, "loss": 0.008, "step": 538590 }, { "epoch": 1.4, "learning_rate": 9.058066623291453e-05, "loss": 0.0104, "step": 538600 }, { "epoch": 1.4, "learning_rate": 9.057677801654306e-05, "loss": 0.0087, "step": 538610 }, { "epoch": 1.4, "learning_rate": 9.05728898001716e-05, "loss": 0.0078, "step": 538620 }, { "epoch": 1.4, "learning_rate": 9.056900158380013e-05, "loss": 0.0076, "step": 538630 }, { "epoch": 1.4, "learning_rate": 9.056511336742866e-05, "loss": 0.0078, "step": 538640 }, { "epoch": 1.4, "learning_rate": 9.05612251510572e-05, "loss": 0.0097, "step": 538650 }, { "epoch": 1.4, "learning_rate": 9.055733693468573e-05, "loss": 0.009, "step": 538660 }, { "epoch": 1.4, "learning_rate": 9.055344871831427e-05, "loss": 0.0089, "step": 538670 }, { "epoch": 1.4, "learning_rate": 9.05495605019428e-05, "loss": 0.0096, "step": 538680 }, { "epoch": 1.4, "learning_rate": 9.054567228557134e-05, "loss": 0.0143, "step": 538690 }, { "epoch": 1.4, "learning_rate": 9.054178406919986e-05, "loss": 0.0086, "step": 538700 }, { "epoch": 1.4, "learning_rate": 9.05378958528284e-05, "loss": 0.0083, "step": 538710 }, { "epoch": 1.4, "learning_rate": 9.053400763645693e-05, "loss": 0.0081, "step": 538720 }, { "epoch": 1.4, "learning_rate": 9.053011942008549e-05, "loss": 0.0104, "step": 538730 }, { "epoch": 1.4, "learning_rate": 9.052623120371402e-05, "loss": 0.0086, "step": 538740 }, { "epoch": 1.4, "learning_rate": 9.052234298734256e-05, "loss": 0.0083, "step": 538750 }, { "epoch": 1.4, "learning_rate": 9.051845477097109e-05, "loss": 0.007, "step": 538760 }, { "epoch": 1.4, "learning_rate": 9.051456655459963e-05, "loss": 0.0065, "step": 538770 }, { "epoch": 1.4, "learning_rate": 9.051067833822816e-05, "loss": 0.0082, "step": 538780 }, { "epoch": 1.4, "learning_rate": 9.05067901218567e-05, "loss": 0.0097, "step": 538790 }, { "epoch": 1.4, "learning_rate": 9.050290190548523e-05, "loss": 0.0102, "step": 538800 }, { "epoch": 1.4, "learning_rate": 9.049901368911377e-05, "loss": 0.0085, "step": 538810 }, { "epoch": 1.4, "learning_rate": 9.04951254727423e-05, "loss": 0.0087, "step": 538820 }, { "epoch": 1.4, "learning_rate": 9.049123725637084e-05, "loss": 0.0075, "step": 538830 }, { "epoch": 1.4, "learning_rate": 9.048734903999937e-05, "loss": 0.008, "step": 538840 }, { "epoch": 1.4, "learning_rate": 9.048346082362791e-05, "loss": 0.0091, "step": 538850 }, { "epoch": 1.4, "learning_rate": 9.047957260725644e-05, "loss": 0.0118, "step": 538860 }, { "epoch": 1.4, "learning_rate": 9.047568439088498e-05, "loss": 0.0084, "step": 538870 }, { "epoch": 1.4, "learning_rate": 9.04717961745135e-05, "loss": 0.0081, "step": 538880 }, { "epoch": 1.4, "learning_rate": 9.046790795814203e-05, "loss": 0.0099, "step": 538890 }, { "epoch": 1.4, "learning_rate": 9.046401974177059e-05, "loss": 0.0079, "step": 538900 }, { "epoch": 1.4, "learning_rate": 9.04601315253991e-05, "loss": 0.0091, "step": 538910 }, { "epoch": 1.4, "learning_rate": 9.045624330902766e-05, "loss": 0.01, "step": 538920 }, { "epoch": 1.4, "learning_rate": 9.045235509265619e-05, "loss": 0.0082, "step": 538930 }, { "epoch": 1.4, "learning_rate": 9.044846687628473e-05, "loss": 0.0079, "step": 538940 }, { "epoch": 1.4, "learning_rate": 9.044457865991326e-05, "loss": 0.0119, "step": 538950 }, { "epoch": 1.4, "learning_rate": 9.04406904435418e-05, "loss": 0.0086, "step": 538960 }, { "epoch": 1.4, "learning_rate": 9.043680222717033e-05, "loss": 0.009, "step": 538970 }, { "epoch": 1.4, "learning_rate": 9.043291401079887e-05, "loss": 0.012, "step": 538980 }, { "epoch": 1.4, "learning_rate": 9.04290257944274e-05, "loss": 0.0085, "step": 538990 }, { "epoch": 1.4, "learning_rate": 9.042513757805594e-05, "loss": 0.0103, "step": 539000 }, { "epoch": 1.4, "eval_cer": 0.8816746935844841, "eval_loss": 0.006161821540445089, "eval_runtime": 107.9304, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 539000 }, { "epoch": 1.4, "learning_rate": 9.042124936168447e-05, "loss": 0.0105, "step": 539010 }, { "epoch": 1.4, "learning_rate": 9.041736114531301e-05, "loss": 0.0132, "step": 539020 }, { "epoch": 1.4, "learning_rate": 9.041347292894154e-05, "loss": 0.0101, "step": 539030 }, { "epoch": 1.4, "learning_rate": 9.040958471257008e-05, "loss": 0.0095, "step": 539040 }, { "epoch": 1.4, "learning_rate": 9.04056964961986e-05, "loss": 0.0071, "step": 539050 }, { "epoch": 1.4, "learning_rate": 9.040180827982715e-05, "loss": 0.0112, "step": 539060 }, { "epoch": 1.4, "learning_rate": 9.039792006345568e-05, "loss": 0.009, "step": 539070 }, { "epoch": 1.4, "learning_rate": 9.039403184708423e-05, "loss": 0.0141, "step": 539080 }, { "epoch": 1.4, "learning_rate": 9.039014363071276e-05, "loss": 0.0119, "step": 539090 }, { "epoch": 1.4, "learning_rate": 9.03862554143413e-05, "loss": 0.0117, "step": 539100 }, { "epoch": 1.4, "learning_rate": 9.038236719796983e-05, "loss": 0.012, "step": 539110 }, { "epoch": 1.4, "learning_rate": 9.037847898159837e-05, "loss": 0.0107, "step": 539120 }, { "epoch": 1.4, "learning_rate": 9.03745907652269e-05, "loss": 0.0083, "step": 539130 }, { "epoch": 1.4, "learning_rate": 9.037070254885543e-05, "loss": 0.0106, "step": 539140 }, { "epoch": 1.4, "learning_rate": 9.036681433248397e-05, "loss": 0.0102, "step": 539150 }, { "epoch": 1.4, "learning_rate": 9.03629261161125e-05, "loss": 0.0113, "step": 539160 }, { "epoch": 1.4, "learning_rate": 9.035903789974104e-05, "loss": 0.0099, "step": 539170 }, { "epoch": 1.4, "learning_rate": 9.035514968336957e-05, "loss": 0.0089, "step": 539180 }, { "epoch": 1.4, "learning_rate": 9.035126146699811e-05, "loss": 0.01, "step": 539190 }, { "epoch": 1.4, "learning_rate": 9.034737325062664e-05, "loss": 0.0099, "step": 539200 }, { "epoch": 1.4, "learning_rate": 9.034348503425518e-05, "loss": 0.0084, "step": 539210 }, { "epoch": 1.4, "learning_rate": 9.03395968178837e-05, "loss": 0.0118, "step": 539220 }, { "epoch": 1.4, "learning_rate": 9.033570860151225e-05, "loss": 0.008, "step": 539230 }, { "epoch": 1.4, "learning_rate": 9.033182038514077e-05, "loss": 0.0096, "step": 539240 }, { "epoch": 1.4, "learning_rate": 9.032793216876933e-05, "loss": 0.0117, "step": 539250 }, { "epoch": 1.4, "learning_rate": 9.032404395239784e-05, "loss": 0.008, "step": 539260 }, { "epoch": 1.4, "learning_rate": 9.03201557360264e-05, "loss": 0.0102, "step": 539270 }, { "epoch": 1.4, "learning_rate": 9.031626751965493e-05, "loss": 0.0127, "step": 539280 }, { "epoch": 1.4, "learning_rate": 9.031237930328347e-05, "loss": 0.0101, "step": 539290 }, { "epoch": 1.4, "learning_rate": 9.0308491086912e-05, "loss": 0.0087, "step": 539300 }, { "epoch": 1.4, "learning_rate": 9.030460287054054e-05, "loss": 0.009, "step": 539310 }, { "epoch": 1.4, "learning_rate": 9.030071465416907e-05, "loss": 0.0067, "step": 539320 }, { "epoch": 1.4, "learning_rate": 9.029682643779761e-05, "loss": 0.0085, "step": 539330 }, { "epoch": 1.4, "learning_rate": 9.029293822142614e-05, "loss": 0.007, "step": 539340 }, { "epoch": 1.4, "learning_rate": 9.028905000505468e-05, "loss": 0.0101, "step": 539350 }, { "epoch": 1.4, "learning_rate": 9.02851617886832e-05, "loss": 0.0078, "step": 539360 }, { "epoch": 1.4, "learning_rate": 9.028127357231175e-05, "loss": 0.0094, "step": 539370 }, { "epoch": 1.4, "learning_rate": 9.027738535594028e-05, "loss": 0.0061, "step": 539380 }, { "epoch": 1.4, "learning_rate": 9.02734971395688e-05, "loss": 0.0088, "step": 539390 }, { "epoch": 1.4, "learning_rate": 9.026960892319735e-05, "loss": 0.0084, "step": 539400 }, { "epoch": 1.4, "learning_rate": 9.026572070682587e-05, "loss": 0.0112, "step": 539410 }, { "epoch": 1.4, "learning_rate": 9.026183249045442e-05, "loss": 0.0093, "step": 539420 }, { "epoch": 1.4, "learning_rate": 9.025794427408294e-05, "loss": 0.0066, "step": 539430 }, { "epoch": 1.4, "learning_rate": 9.02540560577115e-05, "loss": 0.0089, "step": 539440 }, { "epoch": 1.4, "learning_rate": 9.025016784134003e-05, "loss": 0.0085, "step": 539450 }, { "epoch": 1.4, "learning_rate": 9.024627962496857e-05, "loss": 0.0104, "step": 539460 }, { "epoch": 1.4, "learning_rate": 9.02423914085971e-05, "loss": 0.0106, "step": 539470 }, { "epoch": 1.4, "learning_rate": 9.023850319222564e-05, "loss": 0.014, "step": 539480 }, { "epoch": 1.4, "learning_rate": 9.023461497585417e-05, "loss": 0.0112, "step": 539490 }, { "epoch": 1.4, "learning_rate": 9.023072675948271e-05, "loss": 0.0082, "step": 539500 }, { "epoch": 1.4, "learning_rate": 9.022683854311124e-05, "loss": 0.0116, "step": 539510 }, { "epoch": 1.4, "learning_rate": 9.022295032673978e-05, "loss": 0.0082, "step": 539520 }, { "epoch": 1.4, "learning_rate": 9.02190621103683e-05, "loss": 0.0146, "step": 539530 }, { "epoch": 1.4, "learning_rate": 9.021517389399685e-05, "loss": 0.0098, "step": 539540 }, { "epoch": 1.4, "learning_rate": 9.021128567762538e-05, "loss": 0.0098, "step": 539550 }, { "epoch": 1.4, "learning_rate": 9.020739746125392e-05, "loss": 0.0077, "step": 539560 }, { "epoch": 1.4, "learning_rate": 9.020350924488245e-05, "loss": 0.0092, "step": 539570 }, { "epoch": 1.4, "learning_rate": 9.019962102851099e-05, "loss": 0.008, "step": 539580 }, { "epoch": 1.4, "learning_rate": 9.019573281213952e-05, "loss": 0.0062, "step": 539590 }, { "epoch": 1.4, "learning_rate": 9.019184459576807e-05, "loss": 0.0092, "step": 539600 }, { "epoch": 1.4, "learning_rate": 9.01879563793966e-05, "loss": 0.0099, "step": 539610 }, { "epoch": 1.4, "learning_rate": 9.018406816302514e-05, "loss": 0.0073, "step": 539620 }, { "epoch": 1.4, "learning_rate": 9.018017994665367e-05, "loss": 0.0108, "step": 539630 }, { "epoch": 1.4, "learning_rate": 9.01762917302822e-05, "loss": 0.0097, "step": 539640 }, { "epoch": 1.4, "learning_rate": 9.017240351391074e-05, "loss": 0.0079, "step": 539650 }, { "epoch": 1.4, "learning_rate": 9.016851529753927e-05, "loss": 0.0068, "step": 539660 }, { "epoch": 1.4, "learning_rate": 9.016462708116781e-05, "loss": 0.0105, "step": 539670 }, { "epoch": 1.4, "learning_rate": 9.016073886479634e-05, "loss": 0.0115, "step": 539680 }, { "epoch": 1.4, "learning_rate": 9.015685064842488e-05, "loss": 0.0097, "step": 539690 }, { "epoch": 1.4, "learning_rate": 9.01529624320534e-05, "loss": 0.0111, "step": 539700 }, { "epoch": 1.4, "learning_rate": 9.014907421568195e-05, "loss": 0.01, "step": 539710 }, { "epoch": 1.4, "learning_rate": 9.014518599931048e-05, "loss": 0.0073, "step": 539720 }, { "epoch": 1.4, "learning_rate": 9.014129778293902e-05, "loss": 0.012, "step": 539730 }, { "epoch": 1.4, "learning_rate": 9.013740956656754e-05, "loss": 0.009, "step": 539740 }, { "epoch": 1.4, "learning_rate": 9.013352135019609e-05, "loss": 0.0089, "step": 539750 }, { "epoch": 1.4, "learning_rate": 9.012963313382461e-05, "loss": 0.0096, "step": 539760 }, { "epoch": 1.4, "learning_rate": 9.012574491745317e-05, "loss": 0.01, "step": 539770 }, { "epoch": 1.4, "learning_rate": 9.012185670108168e-05, "loss": 0.0099, "step": 539780 }, { "epoch": 1.4, "learning_rate": 9.011796848471024e-05, "loss": 0.0101, "step": 539790 }, { "epoch": 1.4, "learning_rate": 9.011408026833877e-05, "loss": 0.0108, "step": 539800 }, { "epoch": 1.4, "learning_rate": 9.011019205196731e-05, "loss": 0.0121, "step": 539810 }, { "epoch": 1.4, "learning_rate": 9.010630383559584e-05, "loss": 0.0104, "step": 539820 }, { "epoch": 1.4, "learning_rate": 9.010241561922438e-05, "loss": 0.0076, "step": 539830 }, { "epoch": 1.4, "learning_rate": 9.009852740285291e-05, "loss": 0.0087, "step": 539840 }, { "epoch": 1.4, "learning_rate": 9.009463918648145e-05, "loss": 0.0082, "step": 539850 }, { "epoch": 1.4, "learning_rate": 9.009075097010998e-05, "loss": 0.0094, "step": 539860 }, { "epoch": 1.4, "learning_rate": 9.008686275373852e-05, "loss": 0.0115, "step": 539870 }, { "epoch": 1.4, "learning_rate": 9.008297453736705e-05, "loss": 0.0072, "step": 539880 }, { "epoch": 1.4, "learning_rate": 9.007908632099557e-05, "loss": 0.0091, "step": 539890 }, { "epoch": 1.4, "learning_rate": 9.007519810462412e-05, "loss": 0.0086, "step": 539900 }, { "epoch": 1.4, "learning_rate": 9.007130988825264e-05, "loss": 0.0079, "step": 539910 }, { "epoch": 1.4, "learning_rate": 9.006742167188119e-05, "loss": 0.0077, "step": 539920 }, { "epoch": 1.4, "learning_rate": 9.006353345550971e-05, "loss": 0.0106, "step": 539930 }, { "epoch": 1.4, "learning_rate": 9.005964523913826e-05, "loss": 0.0082, "step": 539940 }, { "epoch": 1.4, "learning_rate": 9.005575702276678e-05, "loss": 0.0098, "step": 539950 }, { "epoch": 1.4, "learning_rate": 9.005186880639534e-05, "loss": 0.0075, "step": 539960 }, { "epoch": 1.4, "learning_rate": 9.004798059002387e-05, "loss": 0.011, "step": 539970 }, { "epoch": 1.4, "learning_rate": 9.004409237365241e-05, "loss": 0.0096, "step": 539980 }, { "epoch": 1.4, "learning_rate": 9.004020415728094e-05, "loss": 0.0085, "step": 539990 }, { "epoch": 1.4, "learning_rate": 9.003631594090948e-05, "loss": 0.0109, "step": 540000 }, { "epoch": 1.4, "eval_cer": 0.8816704946736816, "eval_loss": 0.006191324442625046, "eval_runtime": 107.7847, "eval_samples_per_second": 18.556, "eval_steps_per_second": 4.639, "step": 540000 }, { "epoch": 1.4, "learning_rate": 9.0032427724538e-05, "loss": 0.013, "step": 540010 }, { "epoch": 1.4, "learning_rate": 9.002853950816655e-05, "loss": 0.0101, "step": 540020 }, { "epoch": 1.4, "learning_rate": 9.002465129179508e-05, "loss": 0.0075, "step": 540030 }, { "epoch": 1.4, "learning_rate": 9.002076307542362e-05, "loss": 0.0117, "step": 540040 }, { "epoch": 1.4, "learning_rate": 9.001687485905215e-05, "loss": 0.0109, "step": 540050 }, { "epoch": 1.4, "learning_rate": 9.001298664268069e-05, "loss": 0.0096, "step": 540060 }, { "epoch": 1.4, "learning_rate": 9.000909842630922e-05, "loss": 0.0093, "step": 540070 }, { "epoch": 1.4, "learning_rate": 9.000521020993776e-05, "loss": 0.0088, "step": 540080 }, { "epoch": 1.4, "learning_rate": 9.000132199356629e-05, "loss": 0.0104, "step": 540090 }, { "epoch": 1.4, "learning_rate": 8.999743377719483e-05, "loss": 0.008, "step": 540100 }, { "epoch": 1.4, "learning_rate": 8.999354556082335e-05, "loss": 0.0109, "step": 540110 }, { "epoch": 1.4, "learning_rate": 8.998965734445191e-05, "loss": 0.0129, "step": 540120 }, { "epoch": 1.4, "learning_rate": 8.998576912808044e-05, "loss": 0.0095, "step": 540130 }, { "epoch": 1.4, "learning_rate": 8.998188091170895e-05, "loss": 0.0102, "step": 540140 }, { "epoch": 1.4, "learning_rate": 8.997799269533751e-05, "loss": 0.0073, "step": 540150 }, { "epoch": 1.4, "learning_rate": 8.997410447896604e-05, "loss": 0.008, "step": 540160 }, { "epoch": 1.4, "learning_rate": 8.997021626259458e-05, "loss": 0.0112, "step": 540170 }, { "epoch": 1.4, "learning_rate": 8.99663280462231e-05, "loss": 0.008, "step": 540180 }, { "epoch": 1.4, "learning_rate": 8.996243982985165e-05, "loss": 0.0099, "step": 540190 }, { "epoch": 1.4, "learning_rate": 8.995855161348018e-05, "loss": 0.0084, "step": 540200 }, { "epoch": 1.4, "learning_rate": 8.995466339710872e-05, "loss": 0.0106, "step": 540210 }, { "epoch": 1.4, "learning_rate": 8.995077518073725e-05, "loss": 0.0081, "step": 540220 }, { "epoch": 1.4, "learning_rate": 8.994688696436579e-05, "loss": 0.0081, "step": 540230 }, { "epoch": 1.4, "learning_rate": 8.994299874799431e-05, "loss": 0.0089, "step": 540240 }, { "epoch": 1.4, "learning_rate": 8.993911053162286e-05, "loss": 0.0073, "step": 540250 }, { "epoch": 1.4, "learning_rate": 8.993522231525138e-05, "loss": 0.0143, "step": 540260 }, { "epoch": 1.4, "learning_rate": 8.993133409887993e-05, "loss": 0.0091, "step": 540270 }, { "epoch": 1.4, "learning_rate": 8.992744588250845e-05, "loss": 0.0097, "step": 540280 }, { "epoch": 1.4, "learning_rate": 8.9923557666137e-05, "loss": 0.0098, "step": 540290 }, { "epoch": 1.4, "learning_rate": 8.991966944976552e-05, "loss": 0.0098, "step": 540300 }, { "epoch": 1.4, "learning_rate": 8.991578123339408e-05, "loss": 0.0096, "step": 540310 }, { "epoch": 1.4, "learning_rate": 8.991189301702261e-05, "loss": 0.0088, "step": 540320 }, { "epoch": 1.4, "learning_rate": 8.990800480065115e-05, "loss": 0.0077, "step": 540330 }, { "epoch": 1.4, "learning_rate": 8.990411658427968e-05, "loss": 0.0089, "step": 540340 }, { "epoch": 1.4, "learning_rate": 8.990022836790822e-05, "loss": 0.0084, "step": 540350 }, { "epoch": 1.4, "learning_rate": 8.989634015153675e-05, "loss": 0.0083, "step": 540360 }, { "epoch": 1.4, "learning_rate": 8.989245193516529e-05, "loss": 0.0085, "step": 540370 }, { "epoch": 1.4, "learning_rate": 8.988856371879382e-05, "loss": 0.009, "step": 540380 }, { "epoch": 1.4, "learning_rate": 8.988467550242234e-05, "loss": 0.0067, "step": 540390 }, { "epoch": 1.4, "learning_rate": 8.988078728605089e-05, "loss": 0.0082, "step": 540400 }, { "epoch": 1.4, "learning_rate": 8.987689906967941e-05, "loss": 0.0108, "step": 540410 }, { "epoch": 1.4, "learning_rate": 8.987301085330796e-05, "loss": 0.0091, "step": 540420 }, { "epoch": 1.4, "learning_rate": 8.986912263693648e-05, "loss": 0.0105, "step": 540430 }, { "epoch": 1.4, "learning_rate": 8.986523442056503e-05, "loss": 0.0114, "step": 540440 }, { "epoch": 1.4, "learning_rate": 8.986134620419355e-05, "loss": 0.0073, "step": 540450 }, { "epoch": 1.4, "learning_rate": 8.98574579878221e-05, "loss": 0.0093, "step": 540460 }, { "epoch": 1.4, "learning_rate": 8.985356977145062e-05, "loss": 0.0097, "step": 540470 }, { "epoch": 1.4, "learning_rate": 8.984968155507918e-05, "loss": 0.0104, "step": 540480 }, { "epoch": 1.4, "learning_rate": 8.98457933387077e-05, "loss": 0.0103, "step": 540490 }, { "epoch": 1.4, "learning_rate": 8.984190512233625e-05, "loss": 0.0111, "step": 540500 }, { "epoch": 1.4, "learning_rate": 8.983801690596478e-05, "loss": 0.0095, "step": 540510 }, { "epoch": 1.4, "learning_rate": 8.983412868959332e-05, "loss": 0.0111, "step": 540520 }, { "epoch": 1.4, "learning_rate": 8.983024047322185e-05, "loss": 0.0118, "step": 540530 }, { "epoch": 1.4, "learning_rate": 8.982635225685039e-05, "loss": 0.0091, "step": 540540 }, { "epoch": 1.4, "learning_rate": 8.982246404047892e-05, "loss": 0.009, "step": 540550 }, { "epoch": 1.4, "learning_rate": 8.981857582410746e-05, "loss": 0.0085, "step": 540560 }, { "epoch": 1.4, "learning_rate": 8.981468760773599e-05, "loss": 0.0095, "step": 540570 }, { "epoch": 1.4, "learning_rate": 8.981079939136453e-05, "loss": 0.0114, "step": 540580 }, { "epoch": 1.4, "learning_rate": 8.980691117499306e-05, "loss": 0.0118, "step": 540590 }, { "epoch": 1.4, "learning_rate": 8.98030229586216e-05, "loss": 0.0076, "step": 540600 }, { "epoch": 1.4, "learning_rate": 8.979913474225013e-05, "loss": 0.0096, "step": 540610 }, { "epoch": 1.4, "learning_rate": 8.979524652587867e-05, "loss": 0.01, "step": 540620 }, { "epoch": 1.4, "learning_rate": 8.97913583095072e-05, "loss": 0.0098, "step": 540630 }, { "epoch": 1.4, "learning_rate": 8.978747009313572e-05, "loss": 0.009, "step": 540640 }, { "epoch": 1.4, "learning_rate": 8.978358187676426e-05, "loss": 0.0108, "step": 540650 }, { "epoch": 1.4, "learning_rate": 8.977969366039279e-05, "loss": 0.0126, "step": 540660 }, { "epoch": 1.4, "learning_rate": 8.977580544402135e-05, "loss": 0.0081, "step": 540670 }, { "epoch": 1.4, "learning_rate": 8.977191722764988e-05, "loss": 0.0118, "step": 540680 }, { "epoch": 1.4, "learning_rate": 8.976802901127842e-05, "loss": 0.0076, "step": 540690 }, { "epoch": 1.4, "learning_rate": 8.976414079490695e-05, "loss": 0.0115, "step": 540700 }, { "epoch": 1.4, "learning_rate": 8.976025257853549e-05, "loss": 0.0083, "step": 540710 }, { "epoch": 1.4, "learning_rate": 8.975636436216402e-05, "loss": 0.0091, "step": 540720 }, { "epoch": 1.4, "learning_rate": 8.975247614579256e-05, "loss": 0.0089, "step": 540730 }, { "epoch": 1.4, "learning_rate": 8.974858792942109e-05, "loss": 0.0091, "step": 540740 }, { "epoch": 1.4, "learning_rate": 8.974469971304963e-05, "loss": 0.0109, "step": 540750 }, { "epoch": 1.4, "learning_rate": 8.974081149667815e-05, "loss": 0.0131, "step": 540760 }, { "epoch": 1.4, "learning_rate": 8.97369232803067e-05, "loss": 0.0098, "step": 540770 }, { "epoch": 1.4, "learning_rate": 8.973303506393522e-05, "loss": 0.0098, "step": 540780 }, { "epoch": 1.4, "learning_rate": 8.972914684756377e-05, "loss": 0.0086, "step": 540790 }, { "epoch": 1.4, "learning_rate": 8.97252586311923e-05, "loss": 0.01, "step": 540800 }, { "epoch": 1.4, "learning_rate": 8.972137041482084e-05, "loss": 0.0088, "step": 540810 }, { "epoch": 1.4, "learning_rate": 8.971748219844936e-05, "loss": 0.0088, "step": 540820 }, { "epoch": 1.4, "learning_rate": 8.971359398207792e-05, "loss": 0.0081, "step": 540830 }, { "epoch": 1.4, "learning_rate": 8.970970576570645e-05, "loss": 0.0078, "step": 540840 }, { "epoch": 1.4, "learning_rate": 8.970581754933499e-05, "loss": 0.0118, "step": 540850 }, { "epoch": 1.4, "learning_rate": 8.970192933296352e-05, "loss": 0.0081, "step": 540860 }, { "epoch": 1.4, "learning_rate": 8.969804111659206e-05, "loss": 0.0085, "step": 540870 }, { "epoch": 1.4, "learning_rate": 8.969415290022059e-05, "loss": 0.0103, "step": 540880 }, { "epoch": 1.4, "learning_rate": 8.969026468384911e-05, "loss": 0.0081, "step": 540890 }, { "epoch": 1.4, "learning_rate": 8.968637646747766e-05, "loss": 0.0108, "step": 540900 }, { "epoch": 1.4, "learning_rate": 8.968248825110618e-05, "loss": 0.0084, "step": 540910 }, { "epoch": 1.4, "learning_rate": 8.967860003473473e-05, "loss": 0.0092, "step": 540920 }, { "epoch": 1.4, "learning_rate": 8.967471181836325e-05, "loss": 0.0093, "step": 540930 }, { "epoch": 1.4, "learning_rate": 8.96708236019918e-05, "loss": 0.0094, "step": 540940 }, { "epoch": 1.4, "learning_rate": 8.966693538562032e-05, "loss": 0.0089, "step": 540950 }, { "epoch": 1.4, "learning_rate": 8.966304716924887e-05, "loss": 0.0079, "step": 540960 }, { "epoch": 1.4, "learning_rate": 8.96591589528774e-05, "loss": 0.0108, "step": 540970 }, { "epoch": 1.4, "learning_rate": 8.965527073650594e-05, "loss": 0.0109, "step": 540980 }, { "epoch": 1.4, "learning_rate": 8.965138252013446e-05, "loss": 0.0085, "step": 540990 }, { "epoch": 1.4, "learning_rate": 8.964749430376302e-05, "loss": 0.0108, "step": 541000 }, { "epoch": 1.4, "eval_cer": 0.8816956881384969, "eval_loss": 0.006157417315989733, "eval_runtime": 107.7568, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 541000 }, { "epoch": 1.4, "learning_rate": 8.964360608739153e-05, "loss": 0.0082, "step": 541010 }, { "epoch": 1.4, "learning_rate": 8.963971787102009e-05, "loss": 0.0103, "step": 541020 }, { "epoch": 1.4, "learning_rate": 8.963582965464862e-05, "loss": 0.0087, "step": 541030 }, { "epoch": 1.4, "learning_rate": 8.963194143827716e-05, "loss": 0.0075, "step": 541040 }, { "epoch": 1.4, "learning_rate": 8.962805322190569e-05, "loss": 0.0114, "step": 541050 }, { "epoch": 1.4, "learning_rate": 8.962416500553423e-05, "loss": 0.0093, "step": 541060 }, { "epoch": 1.4, "learning_rate": 8.962027678916276e-05, "loss": 0.0103, "step": 541070 }, { "epoch": 1.4, "learning_rate": 8.96163885727913e-05, "loss": 0.0078, "step": 541080 }, { "epoch": 1.4, "learning_rate": 8.961250035641983e-05, "loss": 0.0108, "step": 541090 }, { "epoch": 1.4, "learning_rate": 8.960861214004837e-05, "loss": 0.0068, "step": 541100 }, { "epoch": 1.4, "learning_rate": 8.96047239236769e-05, "loss": 0.0094, "step": 541110 }, { "epoch": 1.4, "learning_rate": 8.960083570730544e-05, "loss": 0.0121, "step": 541120 }, { "epoch": 1.4, "learning_rate": 8.959694749093397e-05, "loss": 0.0082, "step": 541130 }, { "epoch": 1.4, "learning_rate": 8.959305927456249e-05, "loss": 0.0086, "step": 541140 }, { "epoch": 1.4, "learning_rate": 8.958917105819103e-05, "loss": 0.0074, "step": 541150 }, { "epoch": 1.4, "learning_rate": 8.958528284181956e-05, "loss": 0.0101, "step": 541160 }, { "epoch": 1.4, "learning_rate": 8.95813946254481e-05, "loss": 0.0094, "step": 541170 }, { "epoch": 1.4, "learning_rate": 8.957750640907663e-05, "loss": 0.0086, "step": 541180 }, { "epoch": 1.4, "learning_rate": 8.957361819270519e-05, "loss": 0.0078, "step": 541190 }, { "epoch": 1.4, "learning_rate": 8.956972997633372e-05, "loss": 0.0116, "step": 541200 }, { "epoch": 1.4, "learning_rate": 8.956584175996226e-05, "loss": 0.0075, "step": 541210 }, { "epoch": 1.4, "learning_rate": 8.956195354359079e-05, "loss": 0.0137, "step": 541220 }, { "epoch": 1.4, "learning_rate": 8.955806532721933e-05, "loss": 0.0082, "step": 541230 }, { "epoch": 1.4, "learning_rate": 8.955417711084786e-05, "loss": 0.018, "step": 541240 }, { "epoch": 1.4, "learning_rate": 8.95502888944764e-05, "loss": 0.0147, "step": 541250 }, { "epoch": 1.4, "learning_rate": 8.954640067810493e-05, "loss": 0.0104, "step": 541260 }, { "epoch": 1.4, "learning_rate": 8.954251246173347e-05, "loss": 0.0082, "step": 541270 }, { "epoch": 1.4, "learning_rate": 8.9538624245362e-05, "loss": 0.012, "step": 541280 }, { "epoch": 1.4, "learning_rate": 8.953473602899054e-05, "loss": 0.0104, "step": 541290 }, { "epoch": 1.4, "learning_rate": 8.953084781261906e-05, "loss": 0.0093, "step": 541300 }, { "epoch": 1.4, "learning_rate": 8.95269595962476e-05, "loss": 0.008, "step": 541310 }, { "epoch": 1.4, "learning_rate": 8.952307137987613e-05, "loss": 0.0116, "step": 541320 }, { "epoch": 1.4, "learning_rate": 8.951918316350468e-05, "loss": 0.0109, "step": 541330 }, { "epoch": 1.4, "learning_rate": 8.95152949471332e-05, "loss": 0.0104, "step": 541340 }, { "epoch": 1.4, "learning_rate": 8.951140673076176e-05, "loss": 0.0091, "step": 541350 }, { "epoch": 1.4, "learning_rate": 8.950751851439029e-05, "loss": 0.0116, "step": 541360 }, { "epoch": 1.4, "learning_rate": 8.95036302980188e-05, "loss": 0.009, "step": 541370 }, { "epoch": 1.4, "learning_rate": 8.949974208164736e-05, "loss": 0.0092, "step": 541380 }, { "epoch": 1.4, "learning_rate": 8.949585386527589e-05, "loss": 0.0061, "step": 541390 }, { "epoch": 1.4, "learning_rate": 8.949196564890443e-05, "loss": 0.009, "step": 541400 }, { "epoch": 1.4, "learning_rate": 8.948807743253295e-05, "loss": 0.0083, "step": 541410 }, { "epoch": 1.4, "learning_rate": 8.94841892161615e-05, "loss": 0.0079, "step": 541420 }, { "epoch": 1.4, "learning_rate": 8.948030099979002e-05, "loss": 0.0167, "step": 541430 }, { "epoch": 1.4, "learning_rate": 8.947641278341857e-05, "loss": 0.0109, "step": 541440 }, { "epoch": 1.4, "learning_rate": 8.94725245670471e-05, "loss": 0.0125, "step": 541450 }, { "epoch": 1.4, "learning_rate": 8.946863635067564e-05, "loss": 0.0091, "step": 541460 }, { "epoch": 1.4, "learning_rate": 8.946474813430416e-05, "loss": 0.0093, "step": 541470 }, { "epoch": 1.4, "learning_rate": 8.94608599179327e-05, "loss": 0.0107, "step": 541480 }, { "epoch": 1.4, "learning_rate": 8.945697170156123e-05, "loss": 0.0089, "step": 541490 }, { "epoch": 1.4, "learning_rate": 8.945308348518978e-05, "loss": 0.0097, "step": 541500 }, { "epoch": 1.4, "learning_rate": 8.94491952688183e-05, "loss": 0.0122, "step": 541510 }, { "epoch": 1.4, "learning_rate": 8.944530705244686e-05, "loss": 0.0088, "step": 541520 }, { "epoch": 1.4, "learning_rate": 8.944141883607537e-05, "loss": 0.0097, "step": 541530 }, { "epoch": 1.4, "learning_rate": 8.943753061970393e-05, "loss": 0.0087, "step": 541540 }, { "epoch": 1.4, "learning_rate": 8.943364240333246e-05, "loss": 0.0111, "step": 541550 }, { "epoch": 1.4, "learning_rate": 8.9429754186961e-05, "loss": 0.0102, "step": 541560 }, { "epoch": 1.4, "learning_rate": 8.942586597058953e-05, "loss": 0.0098, "step": 541570 }, { "epoch": 1.4, "learning_rate": 8.942197775421807e-05, "loss": 0.0111, "step": 541580 }, { "epoch": 1.4, "learning_rate": 8.94180895378466e-05, "loss": 0.0132, "step": 541590 }, { "epoch": 1.4, "learning_rate": 8.941420132147514e-05, "loss": 0.0101, "step": 541600 }, { "epoch": 1.4, "learning_rate": 8.941031310510367e-05, "loss": 0.0105, "step": 541610 }, { "epoch": 1.4, "learning_rate": 8.94064248887322e-05, "loss": 0.01, "step": 541620 }, { "epoch": 1.4, "learning_rate": 8.940253667236074e-05, "loss": 0.0087, "step": 541630 }, { "epoch": 1.4, "learning_rate": 8.939864845598926e-05, "loss": 0.0128, "step": 541640 }, { "epoch": 1.4, "learning_rate": 8.93947602396178e-05, "loss": 0.0134, "step": 541650 }, { "epoch": 1.4, "learning_rate": 8.939087202324633e-05, "loss": 0.0098, "step": 541660 }, { "epoch": 1.4, "learning_rate": 8.938698380687487e-05, "loss": 0.0099, "step": 541670 }, { "epoch": 1.4, "learning_rate": 8.93830955905034e-05, "loss": 0.0105, "step": 541680 }, { "epoch": 1.4, "learning_rate": 8.937920737413194e-05, "loss": 0.0077, "step": 541690 }, { "epoch": 1.4, "learning_rate": 8.937531915776047e-05, "loss": 0.0087, "step": 541700 }, { "epoch": 1.4, "learning_rate": 8.937143094138903e-05, "loss": 0.0111, "step": 541710 }, { "epoch": 1.4, "learning_rate": 8.936754272501756e-05, "loss": 0.008, "step": 541720 }, { "epoch": 1.4, "learning_rate": 8.93636545086461e-05, "loss": 0.0109, "step": 541730 }, { "epoch": 1.4, "learning_rate": 8.935976629227463e-05, "loss": 0.0095, "step": 541740 }, { "epoch": 1.4, "learning_rate": 8.935587807590317e-05, "loss": 0.0148, "step": 541750 }, { "epoch": 1.4, "learning_rate": 8.93519898595317e-05, "loss": 0.0101, "step": 541760 }, { "epoch": 1.4, "learning_rate": 8.934810164316024e-05, "loss": 0.0107, "step": 541770 }, { "epoch": 1.4, "learning_rate": 8.934421342678876e-05, "loss": 0.0088, "step": 541780 }, { "epoch": 1.4, "learning_rate": 8.93403252104173e-05, "loss": 0.0122, "step": 541790 }, { "epoch": 1.4, "learning_rate": 8.933643699404583e-05, "loss": 0.0094, "step": 541800 }, { "epoch": 1.4, "learning_rate": 8.933254877767438e-05, "loss": 0.0091, "step": 541810 }, { "epoch": 1.4, "learning_rate": 8.93286605613029e-05, "loss": 0.0091, "step": 541820 }, { "epoch": 1.4, "learning_rate": 8.932477234493145e-05, "loss": 0.009, "step": 541830 }, { "epoch": 1.4, "learning_rate": 8.932088412855997e-05, "loss": 0.0083, "step": 541840 }, { "epoch": 1.4, "learning_rate": 8.931699591218852e-05, "loss": 0.0084, "step": 541850 }, { "epoch": 1.4, "learning_rate": 8.931310769581704e-05, "loss": 0.0099, "step": 541860 }, { "epoch": 1.4, "learning_rate": 8.930921947944557e-05, "loss": 0.0092, "step": 541870 }, { "epoch": 1.4, "learning_rate": 8.930533126307411e-05, "loss": 0.0108, "step": 541880 }, { "epoch": 1.4, "learning_rate": 8.930144304670264e-05, "loss": 0.0082, "step": 541890 }, { "epoch": 1.4, "learning_rate": 8.92975548303312e-05, "loss": 0.0112, "step": 541900 }, { "epoch": 1.4, "learning_rate": 8.929366661395972e-05, "loss": 0.0095, "step": 541910 }, { "epoch": 1.4, "learning_rate": 8.928977839758827e-05, "loss": 0.0078, "step": 541920 }, { "epoch": 1.4, "learning_rate": 8.92858901812168e-05, "loss": 0.0087, "step": 541930 }, { "epoch": 1.4, "learning_rate": 8.928200196484534e-05, "loss": 0.009, "step": 541940 }, { "epoch": 1.4, "learning_rate": 8.927811374847386e-05, "loss": 0.0099, "step": 541950 }, { "epoch": 1.4, "learning_rate": 8.92742255321024e-05, "loss": 0.0113, "step": 541960 }, { "epoch": 1.4, "learning_rate": 8.927033731573093e-05, "loss": 0.0099, "step": 541970 }, { "epoch": 1.4, "learning_rate": 8.926644909935948e-05, "loss": 0.0086, "step": 541980 }, { "epoch": 1.4, "learning_rate": 8.9262560882988e-05, "loss": 0.0098, "step": 541990 }, { "epoch": 1.4, "learning_rate": 8.925867266661655e-05, "loss": 0.0122, "step": 542000 }, { "epoch": 1.4, "eval_cer": 0.8816928888646285, "eval_loss": 0.005949368700385094, "eval_runtime": 107.8552, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 542000 }, { "epoch": 1.4, "learning_rate": 8.925478445024507e-05, "loss": 0.0109, "step": 542010 }, { "epoch": 1.4, "learning_rate": 8.925089623387362e-05, "loss": 0.009, "step": 542020 }, { "epoch": 1.41, "learning_rate": 8.924700801750214e-05, "loss": 0.0094, "step": 542030 }, { "epoch": 1.41, "learning_rate": 8.924311980113068e-05, "loss": 0.0126, "step": 542040 }, { "epoch": 1.41, "learning_rate": 8.923923158475921e-05, "loss": 0.0084, "step": 542050 }, { "epoch": 1.41, "learning_rate": 8.923534336838777e-05, "loss": 0.0109, "step": 542060 }, { "epoch": 1.41, "learning_rate": 8.92314551520163e-05, "loss": 0.013, "step": 542070 }, { "epoch": 1.41, "learning_rate": 8.922756693564484e-05, "loss": 0.0098, "step": 542080 }, { "epoch": 1.41, "learning_rate": 8.922367871927337e-05, "loss": 0.0101, "step": 542090 }, { "epoch": 1.41, "learning_rate": 8.921979050290191e-05, "loss": 0.0134, "step": 542100 }, { "epoch": 1.41, "learning_rate": 8.921590228653044e-05, "loss": 0.01, "step": 542110 }, { "epoch": 1.41, "learning_rate": 8.921201407015896e-05, "loss": 0.0118, "step": 542120 }, { "epoch": 1.41, "learning_rate": 8.92081258537875e-05, "loss": 0.0106, "step": 542130 }, { "epoch": 1.41, "learning_rate": 8.920423763741603e-05, "loss": 0.0119, "step": 542140 }, { "epoch": 1.41, "learning_rate": 8.920034942104458e-05, "loss": 0.0083, "step": 542150 }, { "epoch": 1.41, "learning_rate": 8.91964612046731e-05, "loss": 0.0127, "step": 542160 }, { "epoch": 1.41, "learning_rate": 8.919257298830164e-05, "loss": 0.0089, "step": 542170 }, { "epoch": 1.41, "learning_rate": 8.918868477193017e-05, "loss": 0.0086, "step": 542180 }, { "epoch": 1.41, "learning_rate": 8.918479655555871e-05, "loss": 0.0098, "step": 542190 }, { "epoch": 1.41, "learning_rate": 8.918090833918724e-05, "loss": 0.0112, "step": 542200 }, { "epoch": 1.41, "learning_rate": 8.917702012281578e-05, "loss": 0.0075, "step": 542210 }, { "epoch": 1.41, "learning_rate": 8.917313190644431e-05, "loss": 0.0105, "step": 542220 }, { "epoch": 1.41, "learning_rate": 8.916924369007287e-05, "loss": 0.0096, "step": 542230 }, { "epoch": 1.41, "learning_rate": 8.916535547370138e-05, "loss": 0.0095, "step": 542240 }, { "epoch": 1.41, "learning_rate": 8.916146725732994e-05, "loss": 0.0096, "step": 542250 }, { "epoch": 1.41, "learning_rate": 8.915757904095847e-05, "loss": 0.0077, "step": 542260 }, { "epoch": 1.41, "learning_rate": 8.915369082458701e-05, "loss": 0.0101, "step": 542270 }, { "epoch": 1.41, "learning_rate": 8.914980260821554e-05, "loss": 0.014, "step": 542280 }, { "epoch": 1.41, "learning_rate": 8.914591439184408e-05, "loss": 0.0102, "step": 542290 }, { "epoch": 1.41, "learning_rate": 8.91420261754726e-05, "loss": 0.0096, "step": 542300 }, { "epoch": 1.41, "learning_rate": 8.913813795910115e-05, "loss": 0.0073, "step": 542310 }, { "epoch": 1.41, "learning_rate": 8.913424974272967e-05, "loss": 0.0074, "step": 542320 }, { "epoch": 1.41, "learning_rate": 8.913036152635822e-05, "loss": 0.0111, "step": 542330 }, { "epoch": 1.41, "learning_rate": 8.912647330998674e-05, "loss": 0.0094, "step": 542340 }, { "epoch": 1.41, "learning_rate": 8.912258509361529e-05, "loss": 0.0122, "step": 542350 }, { "epoch": 1.41, "learning_rate": 8.911869687724381e-05, "loss": 0.0094, "step": 542360 }, { "epoch": 1.41, "learning_rate": 8.911480866087234e-05, "loss": 0.009, "step": 542370 }, { "epoch": 1.41, "learning_rate": 8.911092044450088e-05, "loss": 0.0107, "step": 542380 }, { "epoch": 1.41, "learning_rate": 8.910703222812941e-05, "loss": 0.007, "step": 542390 }, { "epoch": 1.41, "learning_rate": 8.910314401175795e-05, "loss": 0.0094, "step": 542400 }, { "epoch": 1.41, "learning_rate": 8.909925579538648e-05, "loss": 0.0085, "step": 542410 }, { "epoch": 1.41, "learning_rate": 8.909536757901504e-05, "loss": 0.0077, "step": 542420 }, { "epoch": 1.41, "learning_rate": 8.909147936264356e-05, "loss": 0.0136, "step": 542430 }, { "epoch": 1.41, "learning_rate": 8.90875911462721e-05, "loss": 0.0098, "step": 542440 }, { "epoch": 1.41, "learning_rate": 8.908370292990063e-05, "loss": 0.0077, "step": 542450 }, { "epoch": 1.41, "learning_rate": 8.907981471352918e-05, "loss": 0.0094, "step": 542460 }, { "epoch": 1.41, "learning_rate": 8.90759264971577e-05, "loss": 0.0092, "step": 542470 }, { "epoch": 1.41, "learning_rate": 8.907203828078625e-05, "loss": 0.0072, "step": 542480 }, { "epoch": 1.41, "learning_rate": 8.906815006441477e-05, "loss": 0.0084, "step": 542490 }, { "epoch": 1.41, "learning_rate": 8.906426184804332e-05, "loss": 0.0097, "step": 542500 }, { "epoch": 1.41, "learning_rate": 8.906037363167184e-05, "loss": 0.0122, "step": 542510 }, { "epoch": 1.41, "learning_rate": 8.905648541530039e-05, "loss": 0.0118, "step": 542520 }, { "epoch": 1.41, "learning_rate": 8.905259719892891e-05, "loss": 0.0087, "step": 542530 }, { "epoch": 1.41, "learning_rate": 8.904870898255746e-05, "loss": 0.0091, "step": 542540 }, { "epoch": 1.41, "learning_rate": 8.904482076618598e-05, "loss": 0.0095, "step": 542550 }, { "epoch": 1.41, "learning_rate": 8.904093254981452e-05, "loss": 0.0114, "step": 542560 }, { "epoch": 1.41, "learning_rate": 8.903704433344305e-05, "loss": 0.0103, "step": 542570 }, { "epoch": 1.41, "learning_rate": 8.903315611707161e-05, "loss": 0.0104, "step": 542580 }, { "epoch": 1.41, "learning_rate": 8.902926790070014e-05, "loss": 0.0089, "step": 542590 }, { "epoch": 1.41, "learning_rate": 8.902537968432868e-05, "loss": 0.0109, "step": 542600 }, { "epoch": 1.41, "learning_rate": 8.90214914679572e-05, "loss": 0.0106, "step": 542610 }, { "epoch": 1.41, "learning_rate": 8.901760325158573e-05, "loss": 0.0066, "step": 542620 }, { "epoch": 1.41, "learning_rate": 8.901371503521428e-05, "loss": 0.0098, "step": 542630 }, { "epoch": 1.41, "learning_rate": 8.90098268188428e-05, "loss": 0.008, "step": 542640 }, { "epoch": 1.41, "learning_rate": 8.900593860247135e-05, "loss": 0.0087, "step": 542650 }, { "epoch": 1.41, "learning_rate": 8.900205038609987e-05, "loss": 0.0079, "step": 542660 }, { "epoch": 1.41, "learning_rate": 8.899816216972842e-05, "loss": 0.0102, "step": 542670 }, { "epoch": 1.41, "learning_rate": 8.899427395335694e-05, "loss": 0.0166, "step": 542680 }, { "epoch": 1.41, "learning_rate": 8.899038573698548e-05, "loss": 0.0154, "step": 542690 }, { "epoch": 1.41, "learning_rate": 8.898649752061401e-05, "loss": 0.0135, "step": 542700 }, { "epoch": 1.41, "learning_rate": 8.898260930424255e-05, "loss": 0.0088, "step": 542710 }, { "epoch": 1.41, "learning_rate": 8.897872108787108e-05, "loss": 0.0126, "step": 542720 }, { "epoch": 1.41, "learning_rate": 8.897483287149962e-05, "loss": 0.0098, "step": 542730 }, { "epoch": 1.41, "learning_rate": 8.897094465512815e-05, "loss": 0.0077, "step": 542740 }, { "epoch": 1.41, "learning_rate": 8.896705643875671e-05, "loss": 0.0104, "step": 542750 }, { "epoch": 1.41, "learning_rate": 8.896316822238522e-05, "loss": 0.0098, "step": 542760 }, { "epoch": 1.41, "learning_rate": 8.895928000601378e-05, "loss": 0.0102, "step": 542770 }, { "epoch": 1.41, "learning_rate": 8.89553917896423e-05, "loss": 0.0104, "step": 542780 }, { "epoch": 1.41, "learning_rate": 8.895150357327085e-05, "loss": 0.008, "step": 542790 }, { "epoch": 1.41, "learning_rate": 8.894761535689938e-05, "loss": 0.0075, "step": 542800 }, { "epoch": 1.41, "learning_rate": 8.894372714052792e-05, "loss": 0.0088, "step": 542810 }, { "epoch": 1.41, "learning_rate": 8.893983892415644e-05, "loss": 0.0119, "step": 542820 }, { "epoch": 1.41, "learning_rate": 8.893595070778499e-05, "loss": 0.0133, "step": 542830 }, { "epoch": 1.41, "learning_rate": 8.893206249141351e-05, "loss": 0.0114, "step": 542840 }, { "epoch": 1.41, "learning_rate": 8.892817427504206e-05, "loss": 0.0069, "step": 542850 }, { "epoch": 1.41, "learning_rate": 8.892428605867058e-05, "loss": 0.0083, "step": 542860 }, { "epoch": 1.41, "learning_rate": 8.892039784229911e-05, "loss": 0.0094, "step": 542870 }, { "epoch": 1.41, "learning_rate": 8.891650962592765e-05, "loss": 0.0107, "step": 542880 }, { "epoch": 1.41, "learning_rate": 8.891262140955618e-05, "loss": 0.0098, "step": 542890 }, { "epoch": 1.41, "learning_rate": 8.890873319318472e-05, "loss": 0.0084, "step": 542900 }, { "epoch": 1.41, "learning_rate": 8.890484497681325e-05, "loss": 0.008, "step": 542910 }, { "epoch": 1.41, "learning_rate": 8.89009567604418e-05, "loss": 0.0093, "step": 542920 }, { "epoch": 1.41, "learning_rate": 8.889706854407032e-05, "loss": 0.0087, "step": 542930 }, { "epoch": 1.41, "learning_rate": 8.889318032769888e-05, "loss": 0.0092, "step": 542940 }, { "epoch": 1.41, "learning_rate": 8.88892921113274e-05, "loss": 0.0086, "step": 542950 }, { "epoch": 1.41, "learning_rate": 8.888540389495595e-05, "loss": 0.0107, "step": 542960 }, { "epoch": 1.41, "learning_rate": 8.888151567858447e-05, "loss": 0.0066, "step": 542970 }, { "epoch": 1.41, "learning_rate": 8.887762746221302e-05, "loss": 0.01, "step": 542980 }, { "epoch": 1.41, "learning_rate": 8.887373924584154e-05, "loss": 0.0121, "step": 542990 }, { "epoch": 1.41, "learning_rate": 8.886985102947009e-05, "loss": 0.0093, "step": 543000 }, { "epoch": 1.41, "eval_cer": 0.8816900895907601, "eval_loss": 0.006007141899317503, "eval_runtime": 107.8179, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.637, "step": 543000 }, { "epoch": 1.41, "learning_rate": 8.886596281309861e-05, "loss": 0.0093, "step": 543010 }, { "epoch": 1.41, "learning_rate": 8.886207459672716e-05, "loss": 0.0089, "step": 543020 }, { "epoch": 1.41, "learning_rate": 8.885818638035568e-05, "loss": 0.0076, "step": 543030 }, { "epoch": 1.41, "learning_rate": 8.885429816398423e-05, "loss": 0.0086, "step": 543040 }, { "epoch": 1.41, "learning_rate": 8.885040994761275e-05, "loss": 0.0094, "step": 543050 }, { "epoch": 1.41, "learning_rate": 8.88465217312413e-05, "loss": 0.0076, "step": 543060 }, { "epoch": 1.41, "learning_rate": 8.884263351486982e-05, "loss": 0.0086, "step": 543070 }, { "epoch": 1.41, "learning_rate": 8.883874529849836e-05, "loss": 0.0094, "step": 543080 }, { "epoch": 1.41, "learning_rate": 8.883485708212689e-05, "loss": 0.0089, "step": 543090 }, { "epoch": 1.41, "learning_rate": 8.883096886575545e-05, "loss": 0.0075, "step": 543100 }, { "epoch": 1.41, "learning_rate": 8.882708064938398e-05, "loss": 0.0088, "step": 543110 }, { "epoch": 1.41, "learning_rate": 8.882319243301249e-05, "loss": 0.0107, "step": 543120 }, { "epoch": 1.41, "learning_rate": 8.881930421664105e-05, "loss": 0.0101, "step": 543130 }, { "epoch": 1.41, "learning_rate": 8.881541600026957e-05, "loss": 0.0067, "step": 543140 }, { "epoch": 1.41, "learning_rate": 8.881152778389812e-05, "loss": 0.0082, "step": 543150 }, { "epoch": 1.41, "learning_rate": 8.880763956752664e-05, "loss": 0.0075, "step": 543160 }, { "epoch": 1.41, "learning_rate": 8.880375135115519e-05, "loss": 0.0098, "step": 543170 }, { "epoch": 1.41, "learning_rate": 8.879986313478371e-05, "loss": 0.0081, "step": 543180 }, { "epoch": 1.41, "learning_rate": 8.879597491841225e-05, "loss": 0.0106, "step": 543190 }, { "epoch": 1.41, "learning_rate": 8.879208670204078e-05, "loss": 0.009, "step": 543200 }, { "epoch": 1.41, "learning_rate": 8.878819848566932e-05, "loss": 0.0121, "step": 543210 }, { "epoch": 1.41, "learning_rate": 8.878431026929785e-05, "loss": 0.0061, "step": 543220 }, { "epoch": 1.41, "learning_rate": 8.87804220529264e-05, "loss": 0.0088, "step": 543230 }, { "epoch": 1.41, "learning_rate": 8.877653383655492e-05, "loss": 0.0088, "step": 543240 }, { "epoch": 1.41, "learning_rate": 8.877264562018346e-05, "loss": 0.0064, "step": 543250 }, { "epoch": 1.41, "learning_rate": 8.876875740381199e-05, "loss": 0.0092, "step": 543260 }, { "epoch": 1.41, "learning_rate": 8.876486918744053e-05, "loss": 0.0117, "step": 543270 }, { "epoch": 1.41, "learning_rate": 8.876098097106906e-05, "loss": 0.0075, "step": 543280 }, { "epoch": 1.41, "learning_rate": 8.875709275469762e-05, "loss": 0.0107, "step": 543290 }, { "epoch": 1.41, "learning_rate": 8.875320453832615e-05, "loss": 0.0166, "step": 543300 }, { "epoch": 1.41, "learning_rate": 8.874931632195469e-05, "loss": 0.0088, "step": 543310 }, { "epoch": 1.41, "learning_rate": 8.874542810558321e-05, "loss": 0.0123, "step": 543320 }, { "epoch": 1.41, "learning_rate": 8.874153988921176e-05, "loss": 0.008, "step": 543330 }, { "epoch": 1.41, "learning_rate": 8.873765167284028e-05, "loss": 0.0114, "step": 543340 }, { "epoch": 1.41, "learning_rate": 8.873376345646883e-05, "loss": 0.0095, "step": 543350 }, { "epoch": 1.41, "learning_rate": 8.872987524009735e-05, "loss": 0.0123, "step": 543360 }, { "epoch": 1.41, "learning_rate": 8.872598702372588e-05, "loss": 0.0085, "step": 543370 }, { "epoch": 1.41, "learning_rate": 8.872209880735442e-05, "loss": 0.0079, "step": 543380 }, { "epoch": 1.41, "learning_rate": 8.871821059098295e-05, "loss": 0.0086, "step": 543390 }, { "epoch": 1.41, "learning_rate": 8.87143223746115e-05, "loss": 0.0114, "step": 543400 }, { "epoch": 1.41, "learning_rate": 8.871043415824002e-05, "loss": 0.0102, "step": 543410 }, { "epoch": 1.41, "learning_rate": 8.870654594186856e-05, "loss": 0.0097, "step": 543420 }, { "epoch": 1.41, "learning_rate": 8.870265772549709e-05, "loss": 0.0133, "step": 543430 }, { "epoch": 1.41, "learning_rate": 8.869876950912563e-05, "loss": 0.0112, "step": 543440 }, { "epoch": 1.41, "learning_rate": 8.869488129275416e-05, "loss": 0.0156, "step": 543450 }, { "epoch": 1.41, "learning_rate": 8.869099307638272e-05, "loss": 0.0084, "step": 543460 }, { "epoch": 1.41, "learning_rate": 8.868710486001123e-05, "loss": 0.0101, "step": 543470 }, { "epoch": 1.41, "learning_rate": 8.868321664363979e-05, "loss": 0.0103, "step": 543480 }, { "epoch": 1.41, "learning_rate": 8.867932842726831e-05, "loss": 0.0095, "step": 543490 }, { "epoch": 1.41, "learning_rate": 8.867544021089686e-05, "loss": 0.0059, "step": 543500 }, { "epoch": 1.41, "learning_rate": 8.867155199452538e-05, "loss": 0.011, "step": 543510 }, { "epoch": 1.41, "learning_rate": 8.866766377815393e-05, "loss": 0.0098, "step": 543520 }, { "epoch": 1.41, "learning_rate": 8.866377556178245e-05, "loss": 0.0105, "step": 543530 }, { "epoch": 1.41, "learning_rate": 8.8659887345411e-05, "loss": 0.009, "step": 543540 }, { "epoch": 1.41, "learning_rate": 8.865599912903952e-05, "loss": 0.0112, "step": 543550 }, { "epoch": 1.41, "learning_rate": 8.865211091266807e-05, "loss": 0.0108, "step": 543560 }, { "epoch": 1.41, "learning_rate": 8.86482226962966e-05, "loss": 0.0087, "step": 543570 }, { "epoch": 1.41, "learning_rate": 8.864433447992513e-05, "loss": 0.0095, "step": 543580 }, { "epoch": 1.41, "learning_rate": 8.864044626355366e-05, "loss": 0.0085, "step": 543590 }, { "epoch": 1.41, "learning_rate": 8.86365580471822e-05, "loss": 0.0104, "step": 543600 }, { "epoch": 1.41, "learning_rate": 8.863266983081073e-05, "loss": 0.0123, "step": 543610 }, { "epoch": 1.41, "learning_rate": 8.862878161443926e-05, "loss": 0.0099, "step": 543620 }, { "epoch": 1.41, "learning_rate": 8.86248933980678e-05, "loss": 0.0119, "step": 543630 }, { "epoch": 1.41, "learning_rate": 8.862100518169633e-05, "loss": 0.0097, "step": 543640 }, { "epoch": 1.41, "learning_rate": 8.861711696532489e-05, "loss": 0.0132, "step": 543650 }, { "epoch": 1.41, "learning_rate": 8.861322874895341e-05, "loss": 0.0087, "step": 543660 }, { "epoch": 1.41, "learning_rate": 8.860934053258196e-05, "loss": 0.0108, "step": 543670 }, { "epoch": 1.41, "learning_rate": 8.860545231621048e-05, "loss": 0.0107, "step": 543680 }, { "epoch": 1.41, "learning_rate": 8.860156409983903e-05, "loss": 0.01, "step": 543690 }, { "epoch": 1.41, "learning_rate": 8.859767588346755e-05, "loss": 0.0108, "step": 543700 }, { "epoch": 1.41, "learning_rate": 8.85937876670961e-05, "loss": 0.0083, "step": 543710 }, { "epoch": 1.41, "learning_rate": 8.858989945072462e-05, "loss": 0.0083, "step": 543720 }, { "epoch": 1.41, "learning_rate": 8.858601123435316e-05, "loss": 0.0119, "step": 543730 }, { "epoch": 1.41, "learning_rate": 8.858212301798169e-05, "loss": 0.0075, "step": 543740 }, { "epoch": 1.41, "learning_rate": 8.857823480161023e-05, "loss": 0.0137, "step": 543750 }, { "epoch": 1.41, "learning_rate": 8.857434658523876e-05, "loss": 0.0087, "step": 543760 }, { "epoch": 1.41, "learning_rate": 8.85704583688673e-05, "loss": 0.009, "step": 543770 }, { "epoch": 1.41, "learning_rate": 8.856657015249583e-05, "loss": 0.0091, "step": 543780 }, { "epoch": 1.41, "learning_rate": 8.856268193612437e-05, "loss": 0.0079, "step": 543790 }, { "epoch": 1.41, "learning_rate": 8.85587937197529e-05, "loss": 0.0091, "step": 543800 }, { "epoch": 1.41, "learning_rate": 8.855490550338146e-05, "loss": 0.0089, "step": 543810 }, { "epoch": 1.41, "learning_rate": 8.855101728700999e-05, "loss": 0.0093, "step": 543820 }, { "epoch": 1.41, "learning_rate": 8.854712907063853e-05, "loss": 0.011, "step": 543830 }, { "epoch": 1.41, "learning_rate": 8.854324085426705e-05, "loss": 0.0096, "step": 543840 }, { "epoch": 1.41, "learning_rate": 8.853935263789558e-05, "loss": 0.0088, "step": 543850 }, { "epoch": 1.41, "learning_rate": 8.853546442152412e-05, "loss": 0.011, "step": 543860 }, { "epoch": 1.41, "learning_rate": 8.853157620515265e-05, "loss": 0.0107, "step": 543870 }, { "epoch": 1.41, "learning_rate": 8.85276879887812e-05, "loss": 0.0111, "step": 543880 }, { "epoch": 1.41, "learning_rate": 8.852379977240972e-05, "loss": 0.011, "step": 543890 }, { "epoch": 1.41, "learning_rate": 8.851991155603826e-05, "loss": 0.0126, "step": 543900 }, { "epoch": 1.41, "learning_rate": 8.851602333966679e-05, "loss": 0.0087, "step": 543910 }, { "epoch": 1.41, "learning_rate": 8.851213512329533e-05, "loss": 0.0116, "step": 543920 }, { "epoch": 1.41, "learning_rate": 8.850824690692386e-05, "loss": 0.0102, "step": 543930 }, { "epoch": 1.41, "learning_rate": 8.85043586905524e-05, "loss": 0.0142, "step": 543940 }, { "epoch": 1.41, "learning_rate": 8.850047047418093e-05, "loss": 0.009, "step": 543950 }, { "epoch": 1.41, "learning_rate": 8.849658225780947e-05, "loss": 0.0105, "step": 543960 }, { "epoch": 1.41, "learning_rate": 8.8492694041438e-05, "loss": 0.0069, "step": 543970 }, { "epoch": 1.41, "learning_rate": 8.848880582506656e-05, "loss": 0.0078, "step": 543980 }, { "epoch": 1.41, "learning_rate": 8.848491760869507e-05, "loss": 0.009, "step": 543990 }, { "epoch": 1.41, "learning_rate": 8.848102939232363e-05, "loss": 0.0133, "step": 544000 }, { "epoch": 1.41, "eval_cer": 0.8816760932214184, "eval_loss": 0.006026812829077244, "eval_runtime": 107.9103, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.633, "step": 544000 }, { "epoch": 1.41, "learning_rate": 8.847714117595215e-05, "loss": 0.0129, "step": 544010 }, { "epoch": 1.41, "learning_rate": 8.84732529595807e-05, "loss": 0.0113, "step": 544020 }, { "epoch": 1.41, "learning_rate": 8.846936474320922e-05, "loss": 0.0088, "step": 544030 }, { "epoch": 1.41, "learning_rate": 8.846547652683777e-05, "loss": 0.0132, "step": 544040 }, { "epoch": 1.41, "learning_rate": 8.84615883104663e-05, "loss": 0.0107, "step": 544050 }, { "epoch": 1.41, "learning_rate": 8.845770009409484e-05, "loss": 0.0091, "step": 544060 }, { "epoch": 1.41, "learning_rate": 8.845381187772336e-05, "loss": 0.0086, "step": 544070 }, { "epoch": 1.41, "learning_rate": 8.84499236613519e-05, "loss": 0.0097, "step": 544080 }, { "epoch": 1.41, "learning_rate": 8.844603544498043e-05, "loss": 0.0117, "step": 544090 }, { "epoch": 1.41, "learning_rate": 8.844214722860896e-05, "loss": 0.0078, "step": 544100 }, { "epoch": 1.41, "learning_rate": 8.84382590122375e-05, "loss": 0.0091, "step": 544110 }, { "epoch": 1.41, "learning_rate": 8.843437079586603e-05, "loss": 0.0097, "step": 544120 }, { "epoch": 1.41, "learning_rate": 8.843048257949457e-05, "loss": 0.0092, "step": 544130 }, { "epoch": 1.41, "learning_rate": 8.84265943631231e-05, "loss": 0.006, "step": 544140 }, { "epoch": 1.41, "learning_rate": 8.842270614675164e-05, "loss": 0.0097, "step": 544150 }, { "epoch": 1.41, "learning_rate": 8.841881793038017e-05, "loss": 0.0133, "step": 544160 }, { "epoch": 1.41, "learning_rate": 8.841492971400873e-05, "loss": 0.0093, "step": 544170 }, { "epoch": 1.41, "learning_rate": 8.841104149763725e-05, "loss": 0.0069, "step": 544180 }, { "epoch": 1.41, "learning_rate": 8.84071532812658e-05, "loss": 0.0125, "step": 544190 }, { "epoch": 1.41, "learning_rate": 8.840326506489432e-05, "loss": 0.0081, "step": 544200 }, { "epoch": 1.41, "learning_rate": 8.839937684852287e-05, "loss": 0.0092, "step": 544210 }, { "epoch": 1.41, "learning_rate": 8.839548863215139e-05, "loss": 0.0082, "step": 544220 }, { "epoch": 1.41, "learning_rate": 8.839160041577993e-05, "loss": 0.0109, "step": 544230 }, { "epoch": 1.41, "learning_rate": 8.838771219940846e-05, "loss": 0.0101, "step": 544240 }, { "epoch": 1.41, "learning_rate": 8.8383823983037e-05, "loss": 0.0117, "step": 544250 }, { "epoch": 1.41, "learning_rate": 8.837993576666553e-05, "loss": 0.0067, "step": 544260 }, { "epoch": 1.41, "learning_rate": 8.837604755029407e-05, "loss": 0.009, "step": 544270 }, { "epoch": 1.41, "learning_rate": 8.83721593339226e-05, "loss": 0.0065, "step": 544280 }, { "epoch": 1.41, "learning_rate": 8.836827111755114e-05, "loss": 0.0095, "step": 544290 }, { "epoch": 1.41, "learning_rate": 8.836438290117967e-05, "loss": 0.008, "step": 544300 }, { "epoch": 1.41, "learning_rate": 8.836049468480821e-05, "loss": 0.0059, "step": 544310 }, { "epoch": 1.41, "learning_rate": 8.835660646843674e-05, "loss": 0.0107, "step": 544320 }, { "epoch": 1.41, "learning_rate": 8.83527182520653e-05, "loss": 0.0106, "step": 544330 }, { "epoch": 1.41, "learning_rate": 8.834883003569383e-05, "loss": 0.0092, "step": 544340 }, { "epoch": 1.41, "learning_rate": 8.834494181932234e-05, "loss": 0.0093, "step": 544350 }, { "epoch": 1.41, "learning_rate": 8.83410536029509e-05, "loss": 0.0089, "step": 544360 }, { "epoch": 1.41, "learning_rate": 8.833716538657942e-05, "loss": 0.0088, "step": 544370 }, { "epoch": 1.41, "learning_rate": 8.833327717020796e-05, "loss": 0.0083, "step": 544380 }, { "epoch": 1.41, "learning_rate": 8.832938895383649e-05, "loss": 0.0074, "step": 544390 }, { "epoch": 1.41, "learning_rate": 8.832550073746503e-05, "loss": 0.0117, "step": 544400 }, { "epoch": 1.41, "learning_rate": 8.832161252109356e-05, "loss": 0.0087, "step": 544410 }, { "epoch": 1.41, "learning_rate": 8.83177243047221e-05, "loss": 0.0057, "step": 544420 }, { "epoch": 1.41, "learning_rate": 8.831383608835063e-05, "loss": 0.0101, "step": 544430 }, { "epoch": 1.41, "learning_rate": 8.830994787197917e-05, "loss": 0.0084, "step": 544440 }, { "epoch": 1.41, "learning_rate": 8.83060596556077e-05, "loss": 0.0094, "step": 544450 }, { "epoch": 1.41, "learning_rate": 8.830217143923624e-05, "loss": 0.0127, "step": 544460 }, { "epoch": 1.41, "learning_rate": 8.829828322286477e-05, "loss": 0.0101, "step": 544470 }, { "epoch": 1.41, "learning_rate": 8.829439500649331e-05, "loss": 0.01, "step": 544480 }, { "epoch": 1.41, "learning_rate": 8.829050679012184e-05, "loss": 0.0083, "step": 544490 }, { "epoch": 1.41, "learning_rate": 8.828661857375038e-05, "loss": 0.0081, "step": 544500 }, { "epoch": 1.41, "learning_rate": 8.828273035737891e-05, "loss": 0.0087, "step": 544510 }, { "epoch": 1.41, "learning_rate": 8.827884214100747e-05, "loss": 0.0108, "step": 544520 }, { "epoch": 1.41, "learning_rate": 8.8274953924636e-05, "loss": 0.009, "step": 544530 }, { "epoch": 1.41, "learning_rate": 8.827106570826454e-05, "loss": 0.0104, "step": 544540 }, { "epoch": 1.41, "learning_rate": 8.826717749189306e-05, "loss": 0.0086, "step": 544550 }, { "epoch": 1.41, "learning_rate": 8.82632892755216e-05, "loss": 0.0092, "step": 544560 }, { "epoch": 1.41, "learning_rate": 8.825940105915013e-05, "loss": 0.009, "step": 544570 }, { "epoch": 1.41, "learning_rate": 8.825551284277868e-05, "loss": 0.0128, "step": 544580 }, { "epoch": 1.41, "learning_rate": 8.82516246264072e-05, "loss": 0.0095, "step": 544590 }, { "epoch": 1.41, "learning_rate": 8.824773641003573e-05, "loss": 0.0097, "step": 544600 }, { "epoch": 1.41, "learning_rate": 8.824384819366427e-05, "loss": 0.0101, "step": 544610 }, { "epoch": 1.41, "learning_rate": 8.82399599772928e-05, "loss": 0.0117, "step": 544620 }, { "epoch": 1.41, "learning_rate": 8.823607176092134e-05, "loss": 0.0097, "step": 544630 }, { "epoch": 1.41, "learning_rate": 8.823218354454987e-05, "loss": 0.0117, "step": 544640 }, { "epoch": 1.41, "learning_rate": 8.822829532817841e-05, "loss": 0.0131, "step": 544650 }, { "epoch": 1.41, "learning_rate": 8.822440711180694e-05, "loss": 0.01, "step": 544660 }, { "epoch": 1.41, "learning_rate": 8.822051889543548e-05, "loss": 0.0081, "step": 544670 }, { "epoch": 1.41, "learning_rate": 8.821663067906401e-05, "loss": 0.0081, "step": 544680 }, { "epoch": 1.41, "learning_rate": 8.821274246269257e-05, "loss": 0.007, "step": 544690 }, { "epoch": 1.41, "learning_rate": 8.820885424632108e-05, "loss": 0.0173, "step": 544700 }, { "epoch": 1.41, "learning_rate": 8.820496602994964e-05, "loss": 0.0086, "step": 544710 }, { "epoch": 1.41, "learning_rate": 8.820107781357816e-05, "loss": 0.0105, "step": 544720 }, { "epoch": 1.41, "learning_rate": 8.81971895972067e-05, "loss": 0.0109, "step": 544730 }, { "epoch": 1.41, "learning_rate": 8.819330138083523e-05, "loss": 0.0118, "step": 544740 }, { "epoch": 1.41, "learning_rate": 8.818941316446377e-05, "loss": 0.0121, "step": 544750 }, { "epoch": 1.41, "learning_rate": 8.81855249480923e-05, "loss": 0.0107, "step": 544760 }, { "epoch": 1.41, "learning_rate": 8.818163673172084e-05, "loss": 0.0096, "step": 544770 }, { "epoch": 1.41, "learning_rate": 8.817774851534937e-05, "loss": 0.0076, "step": 544780 }, { "epoch": 1.41, "learning_rate": 8.817386029897791e-05, "loss": 0.0101, "step": 544790 }, { "epoch": 1.41, "learning_rate": 8.816997208260644e-05, "loss": 0.0099, "step": 544800 }, { "epoch": 1.41, "learning_rate": 8.816608386623498e-05, "loss": 0.0064, "step": 544810 }, { "epoch": 1.41, "learning_rate": 8.816219564986351e-05, "loss": 0.0121, "step": 544820 }, { "epoch": 1.41, "learning_rate": 8.815830743349205e-05, "loss": 0.0097, "step": 544830 }, { "epoch": 1.41, "learning_rate": 8.815441921712058e-05, "loss": 0.0105, "step": 544840 }, { "epoch": 1.41, "learning_rate": 8.815053100074911e-05, "loss": 0.0071, "step": 544850 }, { "epoch": 1.41, "learning_rate": 8.814664278437765e-05, "loss": 0.0074, "step": 544860 }, { "epoch": 1.41, "learning_rate": 8.814275456800618e-05, "loss": 0.0098, "step": 544870 }, { "epoch": 1.41, "learning_rate": 8.813886635163473e-05, "loss": 0.0099, "step": 544880 }, { "epoch": 1.41, "learning_rate": 8.813497813526326e-05, "loss": 0.01, "step": 544890 }, { "epoch": 1.41, "learning_rate": 8.81310899188918e-05, "loss": 0.0084, "step": 544900 }, { "epoch": 1.41, "learning_rate": 8.812720170252033e-05, "loss": 0.0091, "step": 544910 }, { "epoch": 1.41, "learning_rate": 8.812331348614887e-05, "loss": 0.008, "step": 544920 }, { "epoch": 1.41, "learning_rate": 8.81194252697774e-05, "loss": 0.0087, "step": 544930 }, { "epoch": 1.41, "learning_rate": 8.811553705340594e-05, "loss": 0.0105, "step": 544940 }, { "epoch": 1.41, "learning_rate": 8.811164883703447e-05, "loss": 0.0087, "step": 544950 }, { "epoch": 1.41, "learning_rate": 8.810776062066301e-05, "loss": 0.0102, "step": 544960 }, { "epoch": 1.41, "learning_rate": 8.810387240429154e-05, "loss": 0.0073, "step": 544970 }, { "epoch": 1.41, "learning_rate": 8.809998418792008e-05, "loss": 0.0095, "step": 544980 }, { "epoch": 1.41, "learning_rate": 8.809609597154861e-05, "loss": 0.0086, "step": 544990 }, { "epoch": 1.41, "learning_rate": 8.809220775517715e-05, "loss": 0.0092, "step": 545000 }, { "epoch": 1.41, "eval_cer": 0.8816816917691551, "eval_loss": 0.0062423269264400005, "eval_runtime": 107.912, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.633, "step": 545000 }, { "epoch": 1.41, "learning_rate": 8.808831953880568e-05, "loss": 0.0121, "step": 545010 }, { "epoch": 1.41, "learning_rate": 8.808443132243422e-05, "loss": 0.0095, "step": 545020 }, { "epoch": 1.41, "learning_rate": 8.808054310606275e-05, "loss": 0.0098, "step": 545030 }, { "epoch": 1.41, "learning_rate": 8.80766548896913e-05, "loss": 0.0109, "step": 545040 }, { "epoch": 1.41, "learning_rate": 8.807276667331983e-05, "loss": 0.009, "step": 545050 }, { "epoch": 1.41, "learning_rate": 8.806887845694838e-05, "loss": 0.0078, "step": 545060 }, { "epoch": 1.41, "learning_rate": 8.80649902405769e-05, "loss": 0.011, "step": 545070 }, { "epoch": 1.41, "learning_rate": 8.806110202420545e-05, "loss": 0.0093, "step": 545080 }, { "epoch": 1.41, "learning_rate": 8.805721380783397e-05, "loss": 0.0072, "step": 545090 }, { "epoch": 1.41, "learning_rate": 8.80533255914625e-05, "loss": 0.0099, "step": 545100 }, { "epoch": 1.41, "learning_rate": 8.804943737509104e-05, "loss": 0.0104, "step": 545110 }, { "epoch": 1.41, "learning_rate": 8.804554915871957e-05, "loss": 0.0086, "step": 545120 }, { "epoch": 1.41, "learning_rate": 8.804166094234811e-05, "loss": 0.0084, "step": 545130 }, { "epoch": 1.41, "learning_rate": 8.803777272597664e-05, "loss": 0.0085, "step": 545140 }, { "epoch": 1.41, "learning_rate": 8.803388450960518e-05, "loss": 0.0093, "step": 545150 }, { "epoch": 1.41, "learning_rate": 8.802999629323371e-05, "loss": 0.0091, "step": 545160 }, { "epoch": 1.41, "learning_rate": 8.802610807686225e-05, "loss": 0.0095, "step": 545170 }, { "epoch": 1.41, "learning_rate": 8.802221986049078e-05, "loss": 0.0079, "step": 545180 }, { "epoch": 1.41, "learning_rate": 8.801833164411932e-05, "loss": 0.0087, "step": 545190 }, { "epoch": 1.41, "learning_rate": 8.801444342774785e-05, "loss": 0.0106, "step": 545200 }, { "epoch": 1.41, "learning_rate": 8.80105552113764e-05, "loss": 0.0084, "step": 545210 }, { "epoch": 1.41, "learning_rate": 8.800666699500492e-05, "loss": 0.0102, "step": 545220 }, { "epoch": 1.41, "learning_rate": 8.800277877863348e-05, "loss": 0.0119, "step": 545230 }, { "epoch": 1.41, "learning_rate": 8.7998890562262e-05, "loss": 0.0093, "step": 545240 }, { "epoch": 1.41, "learning_rate": 8.799500234589054e-05, "loss": 0.0111, "step": 545250 }, { "epoch": 1.41, "learning_rate": 8.799111412951907e-05, "loss": 0.0094, "step": 545260 }, { "epoch": 1.41, "learning_rate": 8.798722591314761e-05, "loss": 0.008, "step": 545270 }, { "epoch": 1.41, "learning_rate": 8.798333769677614e-05, "loss": 0.01, "step": 545280 }, { "epoch": 1.41, "learning_rate": 8.797944948040468e-05, "loss": 0.0107, "step": 545290 }, { "epoch": 1.41, "learning_rate": 8.797556126403321e-05, "loss": 0.0089, "step": 545300 }, { "epoch": 1.41, "learning_rate": 8.797167304766175e-05, "loss": 0.0082, "step": 545310 }, { "epoch": 1.41, "learning_rate": 8.796778483129028e-05, "loss": 0.0137, "step": 545320 }, { "epoch": 1.41, "learning_rate": 8.796389661491882e-05, "loss": 0.0085, "step": 545330 }, { "epoch": 1.41, "learning_rate": 8.796000839854735e-05, "loss": 0.0117, "step": 545340 }, { "epoch": 1.41, "learning_rate": 8.795612018217588e-05, "loss": 0.0121, "step": 545350 }, { "epoch": 1.41, "learning_rate": 8.795223196580442e-05, "loss": 0.0091, "step": 545360 }, { "epoch": 1.41, "learning_rate": 8.794834374943295e-05, "loss": 0.0109, "step": 545370 }, { "epoch": 1.41, "learning_rate": 8.794445553306149e-05, "loss": 0.0104, "step": 545380 }, { "epoch": 1.41, "learning_rate": 8.794056731669002e-05, "loss": 0.0087, "step": 545390 }, { "epoch": 1.41, "learning_rate": 8.793667910031857e-05, "loss": 0.0096, "step": 545400 }, { "epoch": 1.41, "learning_rate": 8.79327908839471e-05, "loss": 0.0085, "step": 545410 }, { "epoch": 1.41, "learning_rate": 8.792890266757564e-05, "loss": 0.0067, "step": 545420 }, { "epoch": 1.41, "learning_rate": 8.792501445120417e-05, "loss": 0.0086, "step": 545430 }, { "epoch": 1.41, "learning_rate": 8.792112623483271e-05, "loss": 0.0092, "step": 545440 }, { "epoch": 1.41, "learning_rate": 8.791723801846124e-05, "loss": 0.0086, "step": 545450 }, { "epoch": 1.41, "learning_rate": 8.791334980208978e-05, "loss": 0.0087, "step": 545460 }, { "epoch": 1.41, "learning_rate": 8.790946158571831e-05, "loss": 0.0082, "step": 545470 }, { "epoch": 1.41, "learning_rate": 8.790557336934685e-05, "loss": 0.0099, "step": 545480 }, { "epoch": 1.41, "learning_rate": 8.790168515297538e-05, "loss": 0.0092, "step": 545490 }, { "epoch": 1.41, "learning_rate": 8.789779693660392e-05, "loss": 0.009, "step": 545500 }, { "epoch": 1.41, "learning_rate": 8.789390872023245e-05, "loss": 0.011, "step": 545510 }, { "epoch": 1.41, "learning_rate": 8.789002050386099e-05, "loss": 0.0088, "step": 545520 }, { "epoch": 1.41, "learning_rate": 8.788613228748952e-05, "loss": 0.0108, "step": 545530 }, { "epoch": 1.41, "learning_rate": 8.788224407111806e-05, "loss": 0.0118, "step": 545540 }, { "epoch": 1.41, "learning_rate": 8.787835585474659e-05, "loss": 0.0091, "step": 545550 }, { "epoch": 1.41, "learning_rate": 8.787446763837515e-05, "loss": 0.008, "step": 545560 }, { "epoch": 1.41, "learning_rate": 8.787057942200367e-05, "loss": 0.0119, "step": 545570 }, { "epoch": 1.41, "learning_rate": 8.786669120563222e-05, "loss": 0.0104, "step": 545580 }, { "epoch": 1.41, "learning_rate": 8.786280298926074e-05, "loss": 0.0102, "step": 545590 }, { "epoch": 1.41, "learning_rate": 8.785891477288927e-05, "loss": 0.0268, "step": 545600 }, { "epoch": 1.41, "learning_rate": 8.785502655651781e-05, "loss": 0.0087, "step": 545610 }, { "epoch": 1.41, "learning_rate": 8.785113834014634e-05, "loss": 0.0102, "step": 545620 }, { "epoch": 1.41, "learning_rate": 8.784725012377488e-05, "loss": 0.0087, "step": 545630 }, { "epoch": 1.41, "learning_rate": 8.784336190740341e-05, "loss": 0.0119, "step": 545640 }, { "epoch": 1.41, "learning_rate": 8.783947369103195e-05, "loss": 0.0097, "step": 545650 }, { "epoch": 1.41, "learning_rate": 8.783558547466048e-05, "loss": 0.0083, "step": 545660 }, { "epoch": 1.41, "learning_rate": 8.783169725828902e-05, "loss": 0.0101, "step": 545670 }, { "epoch": 1.41, "learning_rate": 8.782780904191755e-05, "loss": 0.0115, "step": 545680 }, { "epoch": 1.41, "learning_rate": 8.782392082554609e-05, "loss": 0.0086, "step": 545690 }, { "epoch": 1.41, "learning_rate": 8.782003260917462e-05, "loss": 0.0068, "step": 545700 }, { "epoch": 1.41, "learning_rate": 8.781614439280316e-05, "loss": 0.0078, "step": 545710 }, { "epoch": 1.41, "learning_rate": 8.781225617643169e-05, "loss": 0.0127, "step": 545720 }, { "epoch": 1.41, "learning_rate": 8.780836796006025e-05, "loss": 0.0123, "step": 545730 }, { "epoch": 1.41, "learning_rate": 8.780447974368876e-05, "loss": 0.0111, "step": 545740 }, { "epoch": 1.41, "learning_rate": 8.780059152731732e-05, "loss": 0.0104, "step": 545750 }, { "epoch": 1.41, "learning_rate": 8.779670331094584e-05, "loss": 0.0102, "step": 545760 }, { "epoch": 1.41, "learning_rate": 8.779281509457438e-05, "loss": 0.0095, "step": 545770 }, { "epoch": 1.41, "learning_rate": 8.778892687820291e-05, "loss": 0.0085, "step": 545780 }, { "epoch": 1.41, "learning_rate": 8.778503866183145e-05, "loss": 0.007, "step": 545790 }, { "epoch": 1.41, "learning_rate": 8.778115044545998e-05, "loss": 0.0091, "step": 545800 }, { "epoch": 1.41, "learning_rate": 8.777726222908852e-05, "loss": 0.0095, "step": 545810 }, { "epoch": 1.41, "learning_rate": 8.777337401271705e-05, "loss": 0.0078, "step": 545820 }, { "epoch": 1.41, "learning_rate": 8.77694857963456e-05, "loss": 0.0097, "step": 545830 }, { "epoch": 1.41, "learning_rate": 8.776559757997412e-05, "loss": 0.0088, "step": 545840 }, { "epoch": 1.41, "learning_rate": 8.776170936360265e-05, "loss": 0.0093, "step": 545850 }, { "epoch": 1.41, "learning_rate": 8.775782114723119e-05, "loss": 0.0107, "step": 545860 }, { "epoch": 1.41, "learning_rate": 8.775393293085972e-05, "loss": 0.0086, "step": 545870 }, { "epoch": 1.41, "learning_rate": 8.775004471448826e-05, "loss": 0.0095, "step": 545880 }, { "epoch": 1.42, "learning_rate": 8.774615649811679e-05, "loss": 0.0107, "step": 545890 }, { "epoch": 1.42, "learning_rate": 8.774226828174533e-05, "loss": 0.0106, "step": 545900 }, { "epoch": 1.42, "learning_rate": 8.773838006537386e-05, "loss": 0.0117, "step": 545910 }, { "epoch": 1.42, "learning_rate": 8.773449184900241e-05, "loss": 0.0093, "step": 545920 }, { "epoch": 1.42, "learning_rate": 8.773060363263094e-05, "loss": 0.008, "step": 545930 }, { "epoch": 1.42, "learning_rate": 8.772671541625948e-05, "loss": 0.009, "step": 545940 }, { "epoch": 1.42, "learning_rate": 8.772282719988801e-05, "loss": 0.0123, "step": 545950 }, { "epoch": 1.42, "learning_rate": 8.771893898351655e-05, "loss": 0.0151, "step": 545960 }, { "epoch": 1.42, "learning_rate": 8.771505076714508e-05, "loss": 0.0092, "step": 545970 }, { "epoch": 1.42, "learning_rate": 8.771116255077362e-05, "loss": 0.0125, "step": 545980 }, { "epoch": 1.42, "learning_rate": 8.770727433440215e-05, "loss": 0.0104, "step": 545990 }, { "epoch": 1.42, "learning_rate": 8.77033861180307e-05, "loss": 0.0106, "step": 546000 }, { "epoch": 1.42, "eval_cer": 0.8816634964890108, "eval_loss": 0.0062417564913630486, "eval_runtime": 107.9696, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 546000 }, { "epoch": 1.42, "learning_rate": 8.769949790165922e-05, "loss": 0.0111, "step": 546010 }, { "epoch": 1.42, "learning_rate": 8.769560968528776e-05, "loss": 0.011, "step": 546020 }, { "epoch": 1.42, "learning_rate": 8.769172146891629e-05, "loss": 0.0107, "step": 546030 }, { "epoch": 1.42, "learning_rate": 8.768783325254483e-05, "loss": 0.009, "step": 546040 }, { "epoch": 1.42, "learning_rate": 8.768394503617336e-05, "loss": 0.0074, "step": 546050 }, { "epoch": 1.42, "learning_rate": 8.76800568198019e-05, "loss": 0.011, "step": 546060 }, { "epoch": 1.42, "learning_rate": 8.767616860343043e-05, "loss": 0.0083, "step": 546070 }, { "epoch": 1.42, "learning_rate": 8.767228038705899e-05, "loss": 0.0102, "step": 546080 }, { "epoch": 1.42, "learning_rate": 8.76683921706875e-05, "loss": 0.0097, "step": 546090 }, { "epoch": 1.42, "learning_rate": 8.766450395431603e-05, "loss": 0.0088, "step": 546100 }, { "epoch": 1.42, "learning_rate": 8.766061573794458e-05, "loss": 0.0098, "step": 546110 }, { "epoch": 1.42, "learning_rate": 8.765672752157311e-05, "loss": 0.0142, "step": 546120 }, { "epoch": 1.42, "learning_rate": 8.765283930520165e-05, "loss": 0.0082, "step": 546130 }, { "epoch": 1.42, "learning_rate": 8.764895108883018e-05, "loss": 0.0083, "step": 546140 }, { "epoch": 1.42, "learning_rate": 8.764506287245872e-05, "loss": 0.0102, "step": 546150 }, { "epoch": 1.42, "learning_rate": 8.764117465608725e-05, "loss": 0.0119, "step": 546160 }, { "epoch": 1.42, "learning_rate": 8.763728643971579e-05, "loss": 0.0089, "step": 546170 }, { "epoch": 1.42, "learning_rate": 8.763339822334432e-05, "loss": 0.0088, "step": 546180 }, { "epoch": 1.42, "learning_rate": 8.762951000697286e-05, "loss": 0.0191, "step": 546190 }, { "epoch": 1.42, "learning_rate": 8.762562179060139e-05, "loss": 0.0122, "step": 546200 }, { "epoch": 1.42, "learning_rate": 8.762173357422993e-05, "loss": 0.0108, "step": 546210 }, { "epoch": 1.42, "learning_rate": 8.761784535785846e-05, "loss": 0.0089, "step": 546220 }, { "epoch": 1.42, "learning_rate": 8.7613957141487e-05, "loss": 0.0103, "step": 546230 }, { "epoch": 1.42, "learning_rate": 8.761006892511553e-05, "loss": 0.0117, "step": 546240 }, { "epoch": 1.42, "learning_rate": 8.760618070874407e-05, "loss": 0.0081, "step": 546250 }, { "epoch": 1.42, "learning_rate": 8.76022924923726e-05, "loss": 0.0086, "step": 546260 }, { "epoch": 1.42, "learning_rate": 8.759840427600115e-05, "loss": 0.0092, "step": 546270 }, { "epoch": 1.42, "learning_rate": 8.759451605962968e-05, "loss": 0.0086, "step": 546280 }, { "epoch": 1.42, "learning_rate": 8.759062784325822e-05, "loss": 0.0114, "step": 546290 }, { "epoch": 1.42, "learning_rate": 8.758673962688675e-05, "loss": 0.0112, "step": 546300 }, { "epoch": 1.42, "learning_rate": 8.75828514105153e-05, "loss": 0.0085, "step": 546310 }, { "epoch": 1.42, "learning_rate": 8.757896319414382e-05, "loss": 0.0122, "step": 546320 }, { "epoch": 1.42, "learning_rate": 8.757507497777236e-05, "loss": 0.0078, "step": 546330 }, { "epoch": 1.42, "learning_rate": 8.757118676140089e-05, "loss": 0.0103, "step": 546340 }, { "epoch": 1.42, "learning_rate": 8.756729854502942e-05, "loss": 0.0081, "step": 546350 }, { "epoch": 1.42, "learning_rate": 8.756341032865796e-05, "loss": 0.01, "step": 546360 }, { "epoch": 1.42, "learning_rate": 8.755952211228649e-05, "loss": 0.0113, "step": 546370 }, { "epoch": 1.42, "learning_rate": 8.755563389591503e-05, "loss": 0.0077, "step": 546380 }, { "epoch": 1.42, "learning_rate": 8.755174567954356e-05, "loss": 0.0085, "step": 546390 }, { "epoch": 1.42, "learning_rate": 8.75478574631721e-05, "loss": 0.0131, "step": 546400 }, { "epoch": 1.42, "learning_rate": 8.754396924680063e-05, "loss": 0.0116, "step": 546410 }, { "epoch": 1.42, "learning_rate": 8.754008103042917e-05, "loss": 0.0089, "step": 546420 }, { "epoch": 1.42, "learning_rate": 8.75361928140577e-05, "loss": 0.0098, "step": 546430 }, { "epoch": 1.42, "learning_rate": 8.753230459768625e-05, "loss": 0.0065, "step": 546440 }, { "epoch": 1.42, "learning_rate": 8.752841638131477e-05, "loss": 0.009, "step": 546450 }, { "epoch": 1.42, "learning_rate": 8.752452816494332e-05, "loss": 0.009, "step": 546460 }, { "epoch": 1.42, "learning_rate": 8.752063994857185e-05, "loss": 0.0101, "step": 546470 }, { "epoch": 1.42, "learning_rate": 8.75167517322004e-05, "loss": 0.0093, "step": 546480 }, { "epoch": 1.42, "learning_rate": 8.751286351582892e-05, "loss": 0.0085, "step": 546490 }, { "epoch": 1.42, "learning_rate": 8.750897529945746e-05, "loss": 0.0088, "step": 546500 }, { "epoch": 1.42, "learning_rate": 8.750508708308599e-05, "loss": 0.0091, "step": 546510 }, { "epoch": 1.42, "learning_rate": 8.750119886671453e-05, "loss": 0.0082, "step": 546520 }, { "epoch": 1.42, "learning_rate": 8.749731065034306e-05, "loss": 0.0102, "step": 546530 }, { "epoch": 1.42, "learning_rate": 8.74934224339716e-05, "loss": 0.0089, "step": 546540 }, { "epoch": 1.42, "learning_rate": 8.748953421760013e-05, "loss": 0.0094, "step": 546550 }, { "epoch": 1.42, "learning_rate": 8.748564600122867e-05, "loss": 0.0071, "step": 546560 }, { "epoch": 1.42, "learning_rate": 8.74817577848572e-05, "loss": 0.0082, "step": 546570 }, { "epoch": 1.42, "learning_rate": 8.747786956848573e-05, "loss": 0.0095, "step": 546580 }, { "epoch": 1.42, "learning_rate": 8.747398135211427e-05, "loss": 0.008, "step": 546590 }, { "epoch": 1.42, "learning_rate": 8.74700931357428e-05, "loss": 0.0088, "step": 546600 }, { "epoch": 1.42, "learning_rate": 8.746620491937134e-05, "loss": 0.0109, "step": 546610 }, { "epoch": 1.42, "learning_rate": 8.746231670299987e-05, "loss": 0.0116, "step": 546620 }, { "epoch": 1.42, "learning_rate": 8.745842848662842e-05, "loss": 0.0105, "step": 546630 }, { "epoch": 1.42, "learning_rate": 8.745454027025695e-05, "loss": 0.0088, "step": 546640 }, { "epoch": 1.42, "learning_rate": 8.745065205388549e-05, "loss": 0.0091, "step": 546650 }, { "epoch": 1.42, "learning_rate": 8.744676383751402e-05, "loss": 0.0087, "step": 546660 }, { "epoch": 1.42, "learning_rate": 8.744287562114256e-05, "loss": 0.0093, "step": 546670 }, { "epoch": 1.42, "learning_rate": 8.743898740477109e-05, "loss": 0.014, "step": 546680 }, { "epoch": 1.42, "learning_rate": 8.743509918839963e-05, "loss": 0.0103, "step": 546690 }, { "epoch": 1.42, "learning_rate": 8.743121097202816e-05, "loss": 0.0106, "step": 546700 }, { "epoch": 1.42, "learning_rate": 8.74273227556567e-05, "loss": 0.0077, "step": 546710 }, { "epoch": 1.42, "learning_rate": 8.742343453928523e-05, "loss": 0.0134, "step": 546720 }, { "epoch": 1.42, "learning_rate": 8.741954632291377e-05, "loss": 0.0115, "step": 546730 }, { "epoch": 1.42, "learning_rate": 8.74156581065423e-05, "loss": 0.0125, "step": 546740 }, { "epoch": 1.42, "learning_rate": 8.741176989017084e-05, "loss": 0.0092, "step": 546750 }, { "epoch": 1.42, "learning_rate": 8.740788167379937e-05, "loss": 0.0131, "step": 546760 }, { "epoch": 1.42, "learning_rate": 8.740399345742791e-05, "loss": 0.0104, "step": 546770 }, { "epoch": 1.42, "learning_rate": 8.740010524105644e-05, "loss": 0.0199, "step": 546780 }, { "epoch": 1.42, "learning_rate": 8.7396217024685e-05, "loss": 0.0087, "step": 546790 }, { "epoch": 1.42, "learning_rate": 8.739232880831352e-05, "loss": 0.0074, "step": 546800 }, { "epoch": 1.42, "learning_rate": 8.738844059194206e-05, "loss": 0.009, "step": 546810 }, { "epoch": 1.42, "learning_rate": 8.738455237557059e-05, "loss": 0.0096, "step": 546820 }, { "epoch": 1.42, "learning_rate": 8.738066415919912e-05, "loss": 0.0109, "step": 546830 }, { "epoch": 1.42, "learning_rate": 8.737677594282766e-05, "loss": 0.0083, "step": 546840 }, { "epoch": 1.42, "learning_rate": 8.737288772645619e-05, "loss": 0.0079, "step": 546850 }, { "epoch": 1.42, "learning_rate": 8.736899951008473e-05, "loss": 0.0125, "step": 546860 }, { "epoch": 1.42, "learning_rate": 8.736511129371326e-05, "loss": 0.0096, "step": 546870 }, { "epoch": 1.42, "learning_rate": 8.73612230773418e-05, "loss": 0.0077, "step": 546880 }, { "epoch": 1.42, "learning_rate": 8.735733486097033e-05, "loss": 0.0087, "step": 546890 }, { "epoch": 1.42, "learning_rate": 8.735344664459887e-05, "loss": 0.0093, "step": 546900 }, { "epoch": 1.42, "learning_rate": 8.73495584282274e-05, "loss": 0.0107, "step": 546910 }, { "epoch": 1.42, "learning_rate": 8.734567021185594e-05, "loss": 0.0095, "step": 546920 }, { "epoch": 1.42, "learning_rate": 8.734178199548447e-05, "loss": 0.0086, "step": 546930 }, { "epoch": 1.42, "learning_rate": 8.733789377911301e-05, "loss": 0.01, "step": 546940 }, { "epoch": 1.42, "learning_rate": 8.733400556274154e-05, "loss": 0.0103, "step": 546950 }, { "epoch": 1.42, "learning_rate": 8.73301173463701e-05, "loss": 0.0094, "step": 546960 }, { "epoch": 1.42, "learning_rate": 8.732622912999861e-05, "loss": 0.0065, "step": 546970 }, { "epoch": 1.42, "learning_rate": 8.732234091362716e-05, "loss": 0.0097, "step": 546980 }, { "epoch": 1.42, "learning_rate": 8.731845269725569e-05, "loss": 0.0063, "step": 546990 }, { "epoch": 1.42, "learning_rate": 8.731456448088423e-05, "loss": 0.0099, "step": 547000 }, { "epoch": 1.42, "eval_cer": 0.8817166826925096, "eval_loss": 0.006214640568941832, "eval_runtime": 107.961, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 547000 }, { "epoch": 1.42, "learning_rate": 8.731067626451276e-05, "loss": 0.0073, "step": 547010 }, { "epoch": 1.42, "learning_rate": 8.73067880481413e-05, "loss": 0.0112, "step": 547020 }, { "epoch": 1.42, "learning_rate": 8.730289983176983e-05, "loss": 0.0091, "step": 547030 }, { "epoch": 1.42, "learning_rate": 8.729901161539837e-05, "loss": 0.0102, "step": 547040 }, { "epoch": 1.42, "learning_rate": 8.72951233990269e-05, "loss": 0.0082, "step": 547050 }, { "epoch": 1.42, "learning_rate": 8.729123518265544e-05, "loss": 0.013, "step": 547060 }, { "epoch": 1.42, "learning_rate": 8.728734696628397e-05, "loss": 0.0079, "step": 547070 }, { "epoch": 1.42, "learning_rate": 8.72834587499125e-05, "loss": 0.0089, "step": 547080 }, { "epoch": 1.42, "learning_rate": 8.727957053354104e-05, "loss": 0.0096, "step": 547090 }, { "epoch": 1.42, "learning_rate": 8.727568231716957e-05, "loss": 0.0118, "step": 547100 }, { "epoch": 1.42, "learning_rate": 8.727179410079811e-05, "loss": 0.0097, "step": 547110 }, { "epoch": 1.42, "learning_rate": 8.726790588442664e-05, "loss": 0.0093, "step": 547120 }, { "epoch": 1.42, "learning_rate": 8.726401766805518e-05, "loss": 0.009, "step": 547130 }, { "epoch": 1.42, "learning_rate": 8.726012945168371e-05, "loss": 0.0083, "step": 547140 }, { "epoch": 1.42, "learning_rate": 8.725624123531226e-05, "loss": 0.0072, "step": 547150 }, { "epoch": 1.42, "learning_rate": 8.725235301894079e-05, "loss": 0.0117, "step": 547160 }, { "epoch": 1.42, "learning_rate": 8.724846480256933e-05, "loss": 0.0124, "step": 547170 }, { "epoch": 1.42, "learning_rate": 8.724457658619786e-05, "loss": 0.008, "step": 547180 }, { "epoch": 1.42, "learning_rate": 8.72406883698264e-05, "loss": 0.0119, "step": 547190 }, { "epoch": 1.42, "learning_rate": 8.723680015345493e-05, "loss": 0.0103, "step": 547200 }, { "epoch": 1.42, "learning_rate": 8.723291193708347e-05, "loss": 0.0113, "step": 547210 }, { "epoch": 1.42, "learning_rate": 8.7229023720712e-05, "loss": 0.0114, "step": 547220 }, { "epoch": 1.42, "learning_rate": 8.722513550434054e-05, "loss": 0.0084, "step": 547230 }, { "epoch": 1.42, "learning_rate": 8.722124728796907e-05, "loss": 0.0082, "step": 547240 }, { "epoch": 1.42, "learning_rate": 8.721735907159761e-05, "loss": 0.0086, "step": 547250 }, { "epoch": 1.42, "learning_rate": 8.721347085522614e-05, "loss": 0.0113, "step": 547260 }, { "epoch": 1.42, "learning_rate": 8.720958263885468e-05, "loss": 0.0079, "step": 547270 }, { "epoch": 1.42, "learning_rate": 8.720569442248321e-05, "loss": 0.0095, "step": 547280 }, { "epoch": 1.42, "learning_rate": 8.720180620611175e-05, "loss": 0.0095, "step": 547290 }, { "epoch": 1.42, "learning_rate": 8.719791798974028e-05, "loss": 0.0106, "step": 547300 }, { "epoch": 1.42, "learning_rate": 8.719402977336883e-05, "loss": 0.0101, "step": 547310 }, { "epoch": 1.42, "learning_rate": 8.719014155699736e-05, "loss": 0.008, "step": 547320 }, { "epoch": 1.42, "learning_rate": 8.718625334062588e-05, "loss": 0.0106, "step": 547330 }, { "epoch": 1.42, "learning_rate": 8.718236512425443e-05, "loss": 0.0096, "step": 547340 }, { "epoch": 1.42, "learning_rate": 8.717847690788296e-05, "loss": 0.0083, "step": 547350 }, { "epoch": 1.42, "learning_rate": 8.71745886915115e-05, "loss": 0.0095, "step": 547360 }, { "epoch": 1.42, "learning_rate": 8.717070047514003e-05, "loss": 0.0098, "step": 547370 }, { "epoch": 1.42, "learning_rate": 8.716681225876857e-05, "loss": 0.0094, "step": 547380 }, { "epoch": 1.42, "learning_rate": 8.71629240423971e-05, "loss": 0.0106, "step": 547390 }, { "epoch": 1.42, "learning_rate": 8.715903582602564e-05, "loss": 0.01, "step": 547400 }, { "epoch": 1.42, "learning_rate": 8.715514760965417e-05, "loss": 0.012, "step": 547410 }, { "epoch": 1.42, "learning_rate": 8.715125939328271e-05, "loss": 0.0087, "step": 547420 }, { "epoch": 1.42, "learning_rate": 8.714737117691124e-05, "loss": 0.0088, "step": 547430 }, { "epoch": 1.42, "learning_rate": 8.714348296053978e-05, "loss": 0.0103, "step": 547440 }, { "epoch": 1.42, "learning_rate": 8.713959474416831e-05, "loss": 0.0084, "step": 547450 }, { "epoch": 1.42, "learning_rate": 8.713570652779685e-05, "loss": 0.0096, "step": 547460 }, { "epoch": 1.42, "learning_rate": 8.713181831142538e-05, "loss": 0.0077, "step": 547470 }, { "epoch": 1.42, "learning_rate": 8.712793009505392e-05, "loss": 0.0113, "step": 547480 }, { "epoch": 1.42, "learning_rate": 8.712404187868245e-05, "loss": 0.0078, "step": 547490 }, { "epoch": 1.42, "learning_rate": 8.7120153662311e-05, "loss": 0.0079, "step": 547500 }, { "epoch": 1.42, "learning_rate": 8.711626544593953e-05, "loss": 0.0087, "step": 547510 }, { "epoch": 1.42, "learning_rate": 8.711237722956807e-05, "loss": 0.0079, "step": 547520 }, { "epoch": 1.42, "learning_rate": 8.71084890131966e-05, "loss": 0.0136, "step": 547530 }, { "epoch": 1.42, "learning_rate": 8.710460079682514e-05, "loss": 0.0091, "step": 547540 }, { "epoch": 1.42, "learning_rate": 8.710071258045367e-05, "loss": 0.0109, "step": 547550 }, { "epoch": 1.42, "learning_rate": 8.709682436408221e-05, "loss": 0.0087, "step": 547560 }, { "epoch": 1.42, "learning_rate": 8.709293614771074e-05, "loss": 0.0109, "step": 547570 }, { "epoch": 1.42, "learning_rate": 8.708904793133927e-05, "loss": 0.0072, "step": 547580 }, { "epoch": 1.42, "learning_rate": 8.708515971496781e-05, "loss": 0.0115, "step": 547590 }, { "epoch": 1.42, "learning_rate": 8.708127149859634e-05, "loss": 0.0096, "step": 547600 }, { "epoch": 1.42, "learning_rate": 8.707738328222488e-05, "loss": 0.009, "step": 547610 }, { "epoch": 1.42, "learning_rate": 8.707349506585341e-05, "loss": 0.0084, "step": 547620 }, { "epoch": 1.42, "learning_rate": 8.706960684948195e-05, "loss": 0.0081, "step": 547630 }, { "epoch": 1.42, "learning_rate": 8.706571863311048e-05, "loss": 0.0095, "step": 547640 }, { "epoch": 1.42, "learning_rate": 8.706183041673902e-05, "loss": 0.0066, "step": 547650 }, { "epoch": 1.42, "learning_rate": 8.705794220036755e-05, "loss": 0.0114, "step": 547660 }, { "epoch": 1.42, "learning_rate": 8.70540539839961e-05, "loss": 0.0077, "step": 547670 }, { "epoch": 1.42, "learning_rate": 8.705016576762462e-05, "loss": 0.0103, "step": 547680 }, { "epoch": 1.42, "learning_rate": 8.704627755125317e-05, "loss": 0.0098, "step": 547690 }, { "epoch": 1.42, "learning_rate": 8.70423893348817e-05, "loss": 0.0104, "step": 547700 }, { "epoch": 1.42, "learning_rate": 8.703850111851024e-05, "loss": 0.0083, "step": 547710 }, { "epoch": 1.42, "learning_rate": 8.703461290213877e-05, "loss": 0.01, "step": 547720 }, { "epoch": 1.42, "learning_rate": 8.703072468576731e-05, "loss": 0.0084, "step": 547730 }, { "epoch": 1.42, "learning_rate": 8.702683646939584e-05, "loss": 0.0098, "step": 547740 }, { "epoch": 1.42, "learning_rate": 8.702294825302438e-05, "loss": 0.0096, "step": 547750 }, { "epoch": 1.42, "learning_rate": 8.701906003665291e-05, "loss": 0.0101, "step": 547760 }, { "epoch": 1.42, "learning_rate": 8.701517182028145e-05, "loss": 0.012, "step": 547770 }, { "epoch": 1.42, "learning_rate": 8.701128360390998e-05, "loss": 0.0075, "step": 547780 }, { "epoch": 1.42, "learning_rate": 8.700739538753852e-05, "loss": 0.0079, "step": 547790 }, { "epoch": 1.42, "learning_rate": 8.700350717116705e-05, "loss": 0.0074, "step": 547800 }, { "epoch": 1.42, "learning_rate": 8.699961895479559e-05, "loss": 0.0106, "step": 547810 }, { "epoch": 1.42, "learning_rate": 8.699573073842412e-05, "loss": 0.009, "step": 547820 }, { "epoch": 1.42, "learning_rate": 8.699184252205265e-05, "loss": 0.0073, "step": 547830 }, { "epoch": 1.42, "learning_rate": 8.698795430568119e-05, "loss": 0.0093, "step": 547840 }, { "epoch": 1.42, "learning_rate": 8.698406608930972e-05, "loss": 0.0103, "step": 547850 }, { "epoch": 1.42, "learning_rate": 8.698017787293827e-05, "loss": 0.0104, "step": 547860 }, { "epoch": 1.42, "learning_rate": 8.69762896565668e-05, "loss": 0.0068, "step": 547870 }, { "epoch": 1.42, "learning_rate": 8.697240144019534e-05, "loss": 0.0095, "step": 547880 }, { "epoch": 1.42, "learning_rate": 8.696851322382387e-05, "loss": 0.0102, "step": 547890 }, { "epoch": 1.42, "learning_rate": 8.696462500745241e-05, "loss": 0.0087, "step": 547900 }, { "epoch": 1.42, "learning_rate": 8.696073679108094e-05, "loss": 0.0109, "step": 547910 }, { "epoch": 1.42, "learning_rate": 8.695684857470948e-05, "loss": 0.0085, "step": 547920 }, { "epoch": 1.42, "learning_rate": 8.695296035833801e-05, "loss": 0.0107, "step": 547930 }, { "epoch": 1.42, "learning_rate": 8.694907214196655e-05, "loss": 0.0088, "step": 547940 }, { "epoch": 1.42, "learning_rate": 8.694518392559508e-05, "loss": 0.0098, "step": 547950 }, { "epoch": 1.42, "learning_rate": 8.694129570922362e-05, "loss": 0.0084, "step": 547960 }, { "epoch": 1.42, "learning_rate": 8.693740749285215e-05, "loss": 0.0078, "step": 547970 }, { "epoch": 1.42, "learning_rate": 8.693351927648069e-05, "loss": 0.0102, "step": 547980 }, { "epoch": 1.42, "learning_rate": 8.692963106010922e-05, "loss": 0.0094, "step": 547990 }, { "epoch": 1.42, "learning_rate": 8.692574284373776e-05, "loss": 0.0095, "step": 548000 }, { "epoch": 1.42, "eval_cer": 0.8816802921322209, "eval_loss": 0.006283493246883154, "eval_runtime": 107.9445, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 548000 }, { "epoch": 1.42, "learning_rate": 8.692185462736629e-05, "loss": 0.0106, "step": 548010 }, { "epoch": 1.42, "learning_rate": 8.691796641099484e-05, "loss": 0.0085, "step": 548020 }, { "epoch": 1.42, "learning_rate": 8.691407819462337e-05, "loss": 0.01, "step": 548030 }, { "epoch": 1.42, "learning_rate": 8.691018997825191e-05, "loss": 0.0101, "step": 548040 }, { "epoch": 1.42, "learning_rate": 8.690630176188044e-05, "loss": 0.0127, "step": 548050 }, { "epoch": 1.42, "learning_rate": 8.690241354550898e-05, "loss": 0.0071, "step": 548060 }, { "epoch": 1.42, "learning_rate": 8.689852532913751e-05, "loss": 0.0091, "step": 548070 }, { "epoch": 1.42, "learning_rate": 8.689463711276604e-05, "loss": 0.0113, "step": 548080 }, { "epoch": 1.42, "learning_rate": 8.689074889639458e-05, "loss": 0.0084, "step": 548090 }, { "epoch": 1.42, "learning_rate": 8.688686068002311e-05, "loss": 0.0104, "step": 548100 }, { "epoch": 1.42, "learning_rate": 8.688297246365165e-05, "loss": 0.01, "step": 548110 }, { "epoch": 1.42, "learning_rate": 8.687908424728018e-05, "loss": 0.0078, "step": 548120 }, { "epoch": 1.42, "learning_rate": 8.687519603090872e-05, "loss": 0.0088, "step": 548130 }, { "epoch": 1.42, "learning_rate": 8.687130781453725e-05, "loss": 0.0099, "step": 548140 }, { "epoch": 1.42, "learning_rate": 8.686741959816579e-05, "loss": 0.0079, "step": 548150 }, { "epoch": 1.42, "learning_rate": 8.686353138179432e-05, "loss": 0.0109, "step": 548160 }, { "epoch": 1.42, "learning_rate": 8.685964316542286e-05, "loss": 0.0098, "step": 548170 }, { "epoch": 1.42, "learning_rate": 8.685575494905139e-05, "loss": 0.0072, "step": 548180 }, { "epoch": 1.42, "learning_rate": 8.685186673267994e-05, "loss": 0.0092, "step": 548190 }, { "epoch": 1.42, "learning_rate": 8.684797851630846e-05, "loss": 0.0096, "step": 548200 }, { "epoch": 1.42, "learning_rate": 8.684409029993701e-05, "loss": 0.0092, "step": 548210 }, { "epoch": 1.42, "learning_rate": 8.684020208356554e-05, "loss": 0.0115, "step": 548220 }, { "epoch": 1.42, "learning_rate": 8.683631386719408e-05, "loss": 0.0107, "step": 548230 }, { "epoch": 1.42, "learning_rate": 8.683242565082261e-05, "loss": 0.0109, "step": 548240 }, { "epoch": 1.42, "learning_rate": 8.682853743445115e-05, "loss": 0.0086, "step": 548250 }, { "epoch": 1.42, "learning_rate": 8.682464921807968e-05, "loss": 0.0096, "step": 548260 }, { "epoch": 1.42, "learning_rate": 8.682076100170822e-05, "loss": 0.0074, "step": 548270 }, { "epoch": 1.42, "learning_rate": 8.681687278533675e-05, "loss": 0.0073, "step": 548280 }, { "epoch": 1.42, "learning_rate": 8.681298456896529e-05, "loss": 0.0077, "step": 548290 }, { "epoch": 1.42, "learning_rate": 8.680909635259382e-05, "loss": 0.0116, "step": 548300 }, { "epoch": 1.42, "learning_rate": 8.680520813622236e-05, "loss": 0.01, "step": 548310 }, { "epoch": 1.42, "learning_rate": 8.680131991985089e-05, "loss": 0.0115, "step": 548320 }, { "epoch": 1.42, "learning_rate": 8.679743170347942e-05, "loss": 0.0081, "step": 548330 }, { "epoch": 1.42, "learning_rate": 8.679354348710796e-05, "loss": 0.0078, "step": 548340 }, { "epoch": 1.42, "learning_rate": 8.678965527073649e-05, "loss": 0.0105, "step": 548350 }, { "epoch": 1.42, "learning_rate": 8.678576705436503e-05, "loss": 0.008, "step": 548360 }, { "epoch": 1.42, "learning_rate": 8.678187883799356e-05, "loss": 0.0089, "step": 548370 }, { "epoch": 1.42, "learning_rate": 8.677799062162211e-05, "loss": 0.0094, "step": 548380 }, { "epoch": 1.42, "learning_rate": 8.677410240525064e-05, "loss": 0.0071, "step": 548390 }, { "epoch": 1.42, "learning_rate": 8.677021418887918e-05, "loss": 0.0116, "step": 548400 }, { "epoch": 1.42, "learning_rate": 8.676632597250771e-05, "loss": 0.0132, "step": 548410 }, { "epoch": 1.42, "learning_rate": 8.676243775613625e-05, "loss": 0.0079, "step": 548420 }, { "epoch": 1.42, "learning_rate": 8.675854953976478e-05, "loss": 0.0092, "step": 548430 }, { "epoch": 1.42, "learning_rate": 8.675466132339332e-05, "loss": 0.0102, "step": 548440 }, { "epoch": 1.42, "learning_rate": 8.675077310702185e-05, "loss": 0.0074, "step": 548450 }, { "epoch": 1.42, "learning_rate": 8.674688489065039e-05, "loss": 0.0074, "step": 548460 }, { "epoch": 1.42, "learning_rate": 8.674299667427892e-05, "loss": 0.0066, "step": 548470 }, { "epoch": 1.42, "learning_rate": 8.673910845790746e-05, "loss": 0.0122, "step": 548480 }, { "epoch": 1.42, "learning_rate": 8.673522024153599e-05, "loss": 0.0116, "step": 548490 }, { "epoch": 1.42, "learning_rate": 8.673133202516453e-05, "loss": 0.0089, "step": 548500 }, { "epoch": 1.42, "learning_rate": 8.672744380879306e-05, "loss": 0.0077, "step": 548510 }, { "epoch": 1.42, "learning_rate": 8.67235555924216e-05, "loss": 0.0091, "step": 548520 }, { "epoch": 1.42, "learning_rate": 8.671966737605013e-05, "loss": 0.0092, "step": 548530 }, { "epoch": 1.42, "learning_rate": 8.671577915967868e-05, "loss": 0.0119, "step": 548540 }, { "epoch": 1.42, "learning_rate": 8.671189094330721e-05, "loss": 0.0109, "step": 548550 }, { "epoch": 1.42, "learning_rate": 8.670800272693575e-05, "loss": 0.0082, "step": 548560 }, { "epoch": 1.42, "learning_rate": 8.670411451056428e-05, "loss": 0.0091, "step": 548570 }, { "epoch": 1.42, "learning_rate": 8.670022629419281e-05, "loss": 0.0094, "step": 548580 }, { "epoch": 1.42, "learning_rate": 8.669633807782135e-05, "loss": 0.0062, "step": 548590 }, { "epoch": 1.42, "learning_rate": 8.669244986144988e-05, "loss": 0.0109, "step": 548600 }, { "epoch": 1.42, "learning_rate": 8.668856164507842e-05, "loss": 0.0097, "step": 548610 }, { "epoch": 1.42, "learning_rate": 8.668467342870695e-05, "loss": 0.0133, "step": 548620 }, { "epoch": 1.42, "learning_rate": 8.668078521233549e-05, "loss": 0.0092, "step": 548630 }, { "epoch": 1.42, "learning_rate": 8.667689699596402e-05, "loss": 0.0089, "step": 548640 }, { "epoch": 1.42, "learning_rate": 8.667300877959256e-05, "loss": 0.0121, "step": 548650 }, { "epoch": 1.42, "learning_rate": 8.666912056322109e-05, "loss": 0.0088, "step": 548660 }, { "epoch": 1.42, "learning_rate": 8.666523234684963e-05, "loss": 0.0084, "step": 548670 }, { "epoch": 1.42, "learning_rate": 8.666134413047816e-05, "loss": 0.009, "step": 548680 }, { "epoch": 1.42, "learning_rate": 8.66574559141067e-05, "loss": 0.01, "step": 548690 }, { "epoch": 1.42, "learning_rate": 8.665356769773523e-05, "loss": 0.008, "step": 548700 }, { "epoch": 1.42, "learning_rate": 8.664967948136377e-05, "loss": 0.0084, "step": 548710 }, { "epoch": 1.42, "learning_rate": 8.66457912649923e-05, "loss": 0.0077, "step": 548720 }, { "epoch": 1.42, "learning_rate": 8.664190304862085e-05, "loss": 0.0092, "step": 548730 }, { "epoch": 1.42, "learning_rate": 8.663801483224938e-05, "loss": 0.0097, "step": 548740 }, { "epoch": 1.42, "learning_rate": 8.663412661587792e-05, "loss": 0.0091, "step": 548750 }, { "epoch": 1.42, "learning_rate": 8.663023839950645e-05, "loss": 0.0098, "step": 548760 }, { "epoch": 1.42, "learning_rate": 8.662635018313499e-05, "loss": 0.011, "step": 548770 }, { "epoch": 1.42, "learning_rate": 8.662246196676352e-05, "loss": 0.0097, "step": 548780 }, { "epoch": 1.42, "learning_rate": 8.661857375039206e-05, "loss": 0.0137, "step": 548790 }, { "epoch": 1.42, "learning_rate": 8.661468553402059e-05, "loss": 0.0141, "step": 548800 }, { "epoch": 1.42, "learning_rate": 8.661079731764913e-05, "loss": 0.0101, "step": 548810 }, { "epoch": 1.42, "learning_rate": 8.660690910127766e-05, "loss": 0.0089, "step": 548820 }, { "epoch": 1.42, "learning_rate": 8.660302088490619e-05, "loss": 0.0088, "step": 548830 }, { "epoch": 1.42, "learning_rate": 8.659913266853473e-05, "loss": 0.0147, "step": 548840 }, { "epoch": 1.42, "learning_rate": 8.659524445216326e-05, "loss": 0.0114, "step": 548850 }, { "epoch": 1.42, "learning_rate": 8.65913562357918e-05, "loss": 0.0115, "step": 548860 }, { "epoch": 1.42, "learning_rate": 8.658746801942033e-05, "loss": 0.0089, "step": 548870 }, { "epoch": 1.42, "learning_rate": 8.658357980304887e-05, "loss": 0.0095, "step": 548880 }, { "epoch": 1.42, "learning_rate": 8.65796915866774e-05, "loss": 0.0076, "step": 548890 }, { "epoch": 1.42, "learning_rate": 8.657580337030595e-05, "loss": 0.0099, "step": 548900 }, { "epoch": 1.42, "learning_rate": 8.657191515393447e-05, "loss": 0.0092, "step": 548910 }, { "epoch": 1.42, "learning_rate": 8.656802693756302e-05, "loss": 0.0074, "step": 548920 }, { "epoch": 1.42, "learning_rate": 8.656413872119155e-05, "loss": 0.0106, "step": 548930 }, { "epoch": 1.42, "learning_rate": 8.656025050482009e-05, "loss": 0.0095, "step": 548940 }, { "epoch": 1.42, "learning_rate": 8.655636228844862e-05, "loss": 0.0092, "step": 548950 }, { "epoch": 1.42, "learning_rate": 8.655247407207716e-05, "loss": 0.0107, "step": 548960 }, { "epoch": 1.42, "learning_rate": 8.654858585570569e-05, "loss": 0.0085, "step": 548970 }, { "epoch": 1.42, "learning_rate": 8.654469763933423e-05, "loss": 0.0097, "step": 548980 }, { "epoch": 1.42, "learning_rate": 8.654080942296276e-05, "loss": 0.0099, "step": 548990 }, { "epoch": 1.42, "learning_rate": 8.65369212065913e-05, "loss": 0.0107, "step": 549000 }, { "epoch": 1.42, "eval_cer": 0.8816914892276944, "eval_loss": 0.006188477389514446, "eval_runtime": 107.8567, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 549000 }, { "epoch": 1.42, "learning_rate": 8.653303299021983e-05, "loss": 0.01, "step": 549010 }, { "epoch": 1.42, "learning_rate": 8.652914477384837e-05, "loss": 0.0084, "step": 549020 }, { "epoch": 1.42, "learning_rate": 8.65252565574769e-05, "loss": 0.01, "step": 549030 }, { "epoch": 1.42, "learning_rate": 8.652136834110544e-05, "loss": 0.0112, "step": 549040 }, { "epoch": 1.42, "learning_rate": 8.651748012473397e-05, "loss": 0.01, "step": 549050 }, { "epoch": 1.42, "learning_rate": 8.65135919083625e-05, "loss": 0.0092, "step": 549060 }, { "epoch": 1.42, "learning_rate": 8.650970369199104e-05, "loss": 0.0103, "step": 549070 }, { "epoch": 1.42, "learning_rate": 8.650581547561957e-05, "loss": 0.0098, "step": 549080 }, { "epoch": 1.42, "learning_rate": 8.650192725924812e-05, "loss": 0.0072, "step": 549090 }, { "epoch": 1.42, "learning_rate": 8.649803904287665e-05, "loss": 0.0089, "step": 549100 }, { "epoch": 1.42, "learning_rate": 8.649415082650519e-05, "loss": 0.0096, "step": 549110 }, { "epoch": 1.42, "learning_rate": 8.649026261013372e-05, "loss": 0.01, "step": 549120 }, { "epoch": 1.42, "learning_rate": 8.648637439376226e-05, "loss": 0.009, "step": 549130 }, { "epoch": 1.42, "learning_rate": 8.648248617739079e-05, "loss": 0.0091, "step": 549140 }, { "epoch": 1.42, "learning_rate": 8.647859796101933e-05, "loss": 0.0089, "step": 549150 }, { "epoch": 1.42, "learning_rate": 8.647470974464786e-05, "loss": 0.0098, "step": 549160 }, { "epoch": 1.42, "learning_rate": 8.64708215282764e-05, "loss": 0.0068, "step": 549170 }, { "epoch": 1.42, "learning_rate": 8.646693331190493e-05, "loss": 0.0085, "step": 549180 }, { "epoch": 1.42, "learning_rate": 8.646304509553347e-05, "loss": 0.0084, "step": 549190 }, { "epoch": 1.42, "learning_rate": 8.6459156879162e-05, "loss": 0.0089, "step": 549200 }, { "epoch": 1.42, "learning_rate": 8.645526866279054e-05, "loss": 0.0091, "step": 549210 }, { "epoch": 1.42, "learning_rate": 8.645138044641907e-05, "loss": 0.0113, "step": 549220 }, { "epoch": 1.42, "learning_rate": 8.644749223004761e-05, "loss": 0.0084, "step": 549230 }, { "epoch": 1.42, "learning_rate": 8.644360401367614e-05, "loss": 0.0075, "step": 549240 }, { "epoch": 1.42, "learning_rate": 8.643971579730469e-05, "loss": 0.0079, "step": 549250 }, { "epoch": 1.42, "learning_rate": 8.643582758093322e-05, "loss": 0.0107, "step": 549260 }, { "epoch": 1.42, "learning_rate": 8.643193936456176e-05, "loss": 0.0081, "step": 549270 }, { "epoch": 1.42, "learning_rate": 8.642805114819029e-05, "loss": 0.0092, "step": 549280 }, { "epoch": 1.42, "learning_rate": 8.642416293181883e-05, "loss": 0.0089, "step": 549290 }, { "epoch": 1.42, "learning_rate": 8.642027471544736e-05, "loss": 0.0129, "step": 549300 }, { "epoch": 1.42, "learning_rate": 8.641638649907589e-05, "loss": 0.0065, "step": 549310 }, { "epoch": 1.42, "learning_rate": 8.641249828270443e-05, "loss": 0.0107, "step": 549320 }, { "epoch": 1.42, "learning_rate": 8.640861006633296e-05, "loss": 0.0113, "step": 549330 }, { "epoch": 1.42, "learning_rate": 8.64047218499615e-05, "loss": 0.0096, "step": 549340 }, { "epoch": 1.42, "learning_rate": 8.640083363359003e-05, "loss": 0.0103, "step": 549350 }, { "epoch": 1.42, "learning_rate": 8.639694541721857e-05, "loss": 0.0069, "step": 549360 }, { "epoch": 1.42, "learning_rate": 8.63930572008471e-05, "loss": 0.0117, "step": 549370 }, { "epoch": 1.42, "learning_rate": 8.638916898447564e-05, "loss": 0.0109, "step": 549380 }, { "epoch": 1.42, "learning_rate": 8.638528076810417e-05, "loss": 0.0093, "step": 549390 }, { "epoch": 1.42, "learning_rate": 8.638139255173271e-05, "loss": 0.0075, "step": 549400 }, { "epoch": 1.42, "learning_rate": 8.637750433536124e-05, "loss": 0.0101, "step": 549410 }, { "epoch": 1.42, "learning_rate": 8.637361611898979e-05, "loss": 0.0102, "step": 549420 }, { "epoch": 1.42, "learning_rate": 8.63697279026183e-05, "loss": 0.01, "step": 549430 }, { "epoch": 1.42, "learning_rate": 8.636583968624686e-05, "loss": 0.0107, "step": 549440 }, { "epoch": 1.42, "learning_rate": 8.636195146987539e-05, "loss": 0.009, "step": 549450 }, { "epoch": 1.42, "learning_rate": 8.635806325350393e-05, "loss": 0.0103, "step": 549460 }, { "epoch": 1.42, "learning_rate": 8.635417503713246e-05, "loss": 0.0105, "step": 549470 }, { "epoch": 1.42, "learning_rate": 8.6350286820761e-05, "loss": 0.0093, "step": 549480 }, { "epoch": 1.42, "learning_rate": 8.634639860438953e-05, "loss": 0.0101, "step": 549490 }, { "epoch": 1.42, "learning_rate": 8.634251038801807e-05, "loss": 0.0072, "step": 549500 }, { "epoch": 1.42, "learning_rate": 8.63386221716466e-05, "loss": 0.009, "step": 549510 }, { "epoch": 1.42, "learning_rate": 8.633473395527514e-05, "loss": 0.0081, "step": 549520 }, { "epoch": 1.42, "learning_rate": 8.633084573890367e-05, "loss": 0.0098, "step": 549530 }, { "epoch": 1.42, "learning_rate": 8.632695752253221e-05, "loss": 0.0086, "step": 549540 }, { "epoch": 1.42, "learning_rate": 8.632306930616074e-05, "loss": 0.0108, "step": 549550 }, { "epoch": 1.42, "learning_rate": 8.631918108978927e-05, "loss": 0.0096, "step": 549560 }, { "epoch": 1.42, "learning_rate": 8.631529287341781e-05, "loss": 0.0087, "step": 549570 }, { "epoch": 1.42, "learning_rate": 8.631140465704634e-05, "loss": 0.0107, "step": 549580 }, { "epoch": 1.42, "learning_rate": 8.630751644067488e-05, "loss": 0.008, "step": 549590 }, { "epoch": 1.42, "learning_rate": 8.63036282243034e-05, "loss": 0.0087, "step": 549600 }, { "epoch": 1.42, "learning_rate": 8.629974000793196e-05, "loss": 0.0087, "step": 549610 }, { "epoch": 1.42, "learning_rate": 8.629585179156049e-05, "loss": 0.0119, "step": 549620 }, { "epoch": 1.42, "learning_rate": 8.629196357518903e-05, "loss": 0.0106, "step": 549630 }, { "epoch": 1.42, "learning_rate": 8.628807535881756e-05, "loss": 0.0084, "step": 549640 }, { "epoch": 1.42, "learning_rate": 8.62841871424461e-05, "loss": 0.0105, "step": 549650 }, { "epoch": 1.42, "learning_rate": 8.628029892607463e-05, "loss": 0.0084, "step": 549660 }, { "epoch": 1.42, "learning_rate": 8.627641070970317e-05, "loss": 0.007, "step": 549670 }, { "epoch": 1.42, "learning_rate": 8.62725224933317e-05, "loss": 0.0119, "step": 549680 }, { "epoch": 1.42, "learning_rate": 8.626863427696024e-05, "loss": 0.0085, "step": 549690 }, { "epoch": 1.42, "learning_rate": 8.626474606058877e-05, "loss": 0.0094, "step": 549700 }, { "epoch": 1.42, "learning_rate": 8.626085784421731e-05, "loss": 0.0094, "step": 549710 }, { "epoch": 1.42, "learning_rate": 8.625696962784584e-05, "loss": 0.0106, "step": 549720 }, { "epoch": 1.42, "learning_rate": 8.625308141147438e-05, "loss": 0.0103, "step": 549730 }, { "epoch": 1.43, "learning_rate": 8.624919319510291e-05, "loss": 0.0082, "step": 549740 }, { "epoch": 1.43, "learning_rate": 8.624530497873145e-05, "loss": 0.0085, "step": 549750 }, { "epoch": 1.43, "learning_rate": 8.624141676235998e-05, "loss": 0.0079, "step": 549760 }, { "epoch": 1.43, "learning_rate": 8.623752854598853e-05, "loss": 0.0105, "step": 549770 }, { "epoch": 1.43, "learning_rate": 8.623364032961706e-05, "loss": 0.0106, "step": 549780 }, { "epoch": 1.43, "learning_rate": 8.62297521132456e-05, "loss": 0.0078, "step": 549790 }, { "epoch": 1.43, "learning_rate": 8.622586389687413e-05, "loss": 0.0094, "step": 549800 }, { "epoch": 1.43, "learning_rate": 8.622197568050266e-05, "loss": 0.0099, "step": 549810 }, { "epoch": 1.43, "learning_rate": 8.62180874641312e-05, "loss": 0.011, "step": 549820 }, { "epoch": 1.43, "learning_rate": 8.621419924775973e-05, "loss": 0.0088, "step": 549830 }, { "epoch": 1.43, "learning_rate": 8.621031103138827e-05, "loss": 0.0129, "step": 549840 }, { "epoch": 1.43, "learning_rate": 8.62064228150168e-05, "loss": 0.0104, "step": 549850 }, { "epoch": 1.43, "learning_rate": 8.620253459864534e-05, "loss": 0.009, "step": 549860 }, { "epoch": 1.43, "learning_rate": 8.619864638227387e-05, "loss": 0.0105, "step": 549870 }, { "epoch": 1.43, "learning_rate": 8.619475816590241e-05, "loss": 0.01, "step": 549880 }, { "epoch": 1.43, "learning_rate": 8.619086994953094e-05, "loss": 0.009, "step": 549890 }, { "epoch": 1.43, "learning_rate": 8.618698173315948e-05, "loss": 0.008, "step": 549900 }, { "epoch": 1.43, "learning_rate": 8.618309351678801e-05, "loss": 0.0088, "step": 549910 }, { "epoch": 1.43, "learning_rate": 8.617920530041655e-05, "loss": 0.0083, "step": 549920 }, { "epoch": 1.43, "learning_rate": 8.617531708404508e-05, "loss": 0.0108, "step": 549930 }, { "epoch": 1.43, "learning_rate": 8.617142886767363e-05, "loss": 0.0085, "step": 549940 }, { "epoch": 1.43, "learning_rate": 8.616754065130215e-05, "loss": 0.0064, "step": 549950 }, { "epoch": 1.43, "learning_rate": 8.61636524349307e-05, "loss": 0.0099, "step": 549960 }, { "epoch": 1.43, "learning_rate": 8.615976421855923e-05, "loss": 0.0114, "step": 549970 }, { "epoch": 1.43, "learning_rate": 8.615587600218777e-05, "loss": 0.011, "step": 549980 }, { "epoch": 1.43, "learning_rate": 8.61519877858163e-05, "loss": 0.0096, "step": 549990 }, { "epoch": 1.43, "learning_rate": 8.614809956944484e-05, "loss": 0.0107, "step": 550000 }, { "epoch": 1.43, "eval_cer": 0.8816774928583525, "eval_loss": 0.006080552935600281, "eval_runtime": 107.8759, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 550000 }, { "epoch": 1.43, "learning_rate": 8.614421135307337e-05, "loss": 0.0092, "step": 550010 }, { "epoch": 1.43, "learning_rate": 8.614032313670191e-05, "loss": 0.0097, "step": 550020 }, { "epoch": 1.43, "learning_rate": 8.613643492033044e-05, "loss": 0.0081, "step": 550030 }, { "epoch": 1.43, "learning_rate": 8.613254670395898e-05, "loss": 0.01, "step": 550040 }, { "epoch": 1.43, "learning_rate": 8.612865848758751e-05, "loss": 0.0077, "step": 550050 }, { "epoch": 1.43, "learning_rate": 8.612477027121604e-05, "loss": 0.0074, "step": 550060 }, { "epoch": 1.43, "learning_rate": 8.612088205484458e-05, "loss": 0.0066, "step": 550070 }, { "epoch": 1.43, "learning_rate": 8.61169938384731e-05, "loss": 0.0104, "step": 550080 }, { "epoch": 1.43, "learning_rate": 8.611310562210165e-05, "loss": 0.0104, "step": 550090 }, { "epoch": 1.43, "learning_rate": 8.610921740573018e-05, "loss": 0.0126, "step": 550100 }, { "epoch": 1.43, "learning_rate": 8.610532918935872e-05, "loss": 0.0092, "step": 550110 }, { "epoch": 1.43, "learning_rate": 8.610144097298725e-05, "loss": 0.0122, "step": 550120 }, { "epoch": 1.43, "learning_rate": 8.60975527566158e-05, "loss": 0.01, "step": 550130 }, { "epoch": 1.43, "learning_rate": 8.609366454024433e-05, "loss": 0.0125, "step": 550140 }, { "epoch": 1.43, "learning_rate": 8.608977632387287e-05, "loss": 0.0071, "step": 550150 }, { "epoch": 1.43, "learning_rate": 8.60858881075014e-05, "loss": 0.0104, "step": 550160 }, { "epoch": 1.43, "learning_rate": 8.608199989112994e-05, "loss": 0.0079, "step": 550170 }, { "epoch": 1.43, "learning_rate": 8.607811167475847e-05, "loss": 0.0089, "step": 550180 }, { "epoch": 1.43, "learning_rate": 8.607422345838701e-05, "loss": 0.0082, "step": 550190 }, { "epoch": 1.43, "learning_rate": 8.607033524201554e-05, "loss": 0.0075, "step": 550200 }, { "epoch": 1.43, "learning_rate": 8.606644702564408e-05, "loss": 0.0083, "step": 550210 }, { "epoch": 1.43, "learning_rate": 8.606255880927261e-05, "loss": 0.0084, "step": 550220 }, { "epoch": 1.43, "learning_rate": 8.605867059290115e-05, "loss": 0.0073, "step": 550230 }, { "epoch": 1.43, "learning_rate": 8.605478237652968e-05, "loss": 0.0103, "step": 550240 }, { "epoch": 1.43, "learning_rate": 8.605089416015822e-05, "loss": 0.0108, "step": 550250 }, { "epoch": 1.43, "learning_rate": 8.604700594378675e-05, "loss": 0.0094, "step": 550260 }, { "epoch": 1.43, "learning_rate": 8.604311772741529e-05, "loss": 0.0099, "step": 550270 }, { "epoch": 1.43, "learning_rate": 8.603922951104382e-05, "loss": 0.007, "step": 550280 }, { "epoch": 1.43, "learning_rate": 8.603534129467237e-05, "loss": 0.0087, "step": 550290 }, { "epoch": 1.43, "learning_rate": 8.603145307830089e-05, "loss": 0.0073, "step": 550300 }, { "epoch": 1.43, "learning_rate": 8.602756486192942e-05, "loss": 0.0073, "step": 550310 }, { "epoch": 1.43, "learning_rate": 8.602367664555797e-05, "loss": 0.0101, "step": 550320 }, { "epoch": 1.43, "learning_rate": 8.60197884291865e-05, "loss": 0.0083, "step": 550330 }, { "epoch": 1.43, "learning_rate": 8.601590021281504e-05, "loss": 0.0076, "step": 550340 }, { "epoch": 1.43, "learning_rate": 8.601201199644357e-05, "loss": 0.011, "step": 550350 }, { "epoch": 1.43, "learning_rate": 8.600812378007211e-05, "loss": 0.0082, "step": 550360 }, { "epoch": 1.43, "learning_rate": 8.600423556370064e-05, "loss": 0.0117, "step": 550370 }, { "epoch": 1.43, "learning_rate": 8.600034734732918e-05, "loss": 0.0103, "step": 550380 }, { "epoch": 1.43, "learning_rate": 8.599645913095771e-05, "loss": 0.0079, "step": 550390 }, { "epoch": 1.43, "learning_rate": 8.599257091458625e-05, "loss": 0.0072, "step": 550400 }, { "epoch": 1.43, "learning_rate": 8.598868269821478e-05, "loss": 0.0097, "step": 550410 }, { "epoch": 1.43, "learning_rate": 8.598479448184332e-05, "loss": 0.006, "step": 550420 }, { "epoch": 1.43, "learning_rate": 8.598090626547185e-05, "loss": 0.0073, "step": 550430 }, { "epoch": 1.43, "learning_rate": 8.597701804910039e-05, "loss": 0.0084, "step": 550440 }, { "epoch": 1.43, "learning_rate": 8.597312983272892e-05, "loss": 0.0093, "step": 550450 }, { "epoch": 1.43, "learning_rate": 8.596924161635746e-05, "loss": 0.0092, "step": 550460 }, { "epoch": 1.43, "learning_rate": 8.596535339998599e-05, "loss": 0.0116, "step": 550470 }, { "epoch": 1.43, "learning_rate": 8.596146518361454e-05, "loss": 0.0112, "step": 550480 }, { "epoch": 1.43, "learning_rate": 8.595757696724307e-05, "loss": 0.0084, "step": 550490 }, { "epoch": 1.43, "learning_rate": 8.595368875087161e-05, "loss": 0.0118, "step": 550500 }, { "epoch": 1.43, "learning_rate": 8.594980053450014e-05, "loss": 0.0093, "step": 550510 }, { "epoch": 1.43, "learning_rate": 8.594591231812868e-05, "loss": 0.0094, "step": 550520 }, { "epoch": 1.43, "learning_rate": 8.594202410175721e-05, "loss": 0.0123, "step": 550530 }, { "epoch": 1.43, "learning_rate": 8.593813588538575e-05, "loss": 0.0058, "step": 550540 }, { "epoch": 1.43, "learning_rate": 8.593424766901428e-05, "loss": 0.0087, "step": 550550 }, { "epoch": 1.43, "learning_rate": 8.593035945264281e-05, "loss": 0.0087, "step": 550560 }, { "epoch": 1.43, "learning_rate": 8.592647123627135e-05, "loss": 0.0088, "step": 550570 }, { "epoch": 1.43, "learning_rate": 8.592258301989988e-05, "loss": 0.0112, "step": 550580 }, { "epoch": 1.43, "learning_rate": 8.591869480352842e-05, "loss": 0.0118, "step": 550590 }, { "epoch": 1.43, "learning_rate": 8.591480658715695e-05, "loss": 0.0126, "step": 550600 }, { "epoch": 1.43, "learning_rate": 8.591091837078549e-05, "loss": 0.012, "step": 550610 }, { "epoch": 1.43, "learning_rate": 8.590703015441402e-05, "loss": 0.0113, "step": 550620 }, { "epoch": 1.43, "learning_rate": 8.590314193804256e-05, "loss": 0.01, "step": 550630 }, { "epoch": 1.43, "learning_rate": 8.589925372167109e-05, "loss": 0.0106, "step": 550640 }, { "epoch": 1.43, "learning_rate": 8.589536550529964e-05, "loss": 0.0055, "step": 550650 }, { "epoch": 1.43, "learning_rate": 8.589147728892816e-05, "loss": 0.0084, "step": 550660 }, { "epoch": 1.43, "learning_rate": 8.588758907255671e-05, "loss": 0.0084, "step": 550670 }, { "epoch": 1.43, "learning_rate": 8.588370085618524e-05, "loss": 0.0134, "step": 550680 }, { "epoch": 1.43, "learning_rate": 8.587981263981378e-05, "loss": 0.0107, "step": 550690 }, { "epoch": 1.43, "learning_rate": 8.587592442344231e-05, "loss": 0.0105, "step": 550700 }, { "epoch": 1.43, "learning_rate": 8.587203620707085e-05, "loss": 0.0089, "step": 550710 }, { "epoch": 1.43, "learning_rate": 8.586814799069938e-05, "loss": 0.007, "step": 550720 }, { "epoch": 1.43, "learning_rate": 8.586425977432792e-05, "loss": 0.0061, "step": 550730 }, { "epoch": 1.43, "learning_rate": 8.586037155795645e-05, "loss": 0.0105, "step": 550740 }, { "epoch": 1.43, "learning_rate": 8.585648334158499e-05, "loss": 0.0089, "step": 550750 }, { "epoch": 1.43, "learning_rate": 8.585259512521352e-05, "loss": 0.0076, "step": 550760 }, { "epoch": 1.43, "learning_rate": 8.584870690884206e-05, "loss": 0.01, "step": 550770 }, { "epoch": 1.43, "learning_rate": 8.584481869247059e-05, "loss": 0.0103, "step": 550780 }, { "epoch": 1.43, "learning_rate": 8.584093047609913e-05, "loss": 0.008, "step": 550790 }, { "epoch": 1.43, "learning_rate": 8.583704225972766e-05, "loss": 0.0085, "step": 550800 }, { "epoch": 1.43, "learning_rate": 8.583315404335619e-05, "loss": 0.0095, "step": 550810 }, { "epoch": 1.43, "learning_rate": 8.582926582698473e-05, "loss": 0.0122, "step": 550820 }, { "epoch": 1.43, "learning_rate": 8.582537761061326e-05, "loss": 0.0093, "step": 550830 }, { "epoch": 1.43, "learning_rate": 8.582148939424181e-05, "loss": 0.0105, "step": 550840 }, { "epoch": 1.43, "learning_rate": 8.581760117787034e-05, "loss": 0.0056, "step": 550850 }, { "epoch": 1.43, "learning_rate": 8.581371296149888e-05, "loss": 0.0076, "step": 550860 }, { "epoch": 1.43, "learning_rate": 8.580982474512741e-05, "loss": 0.0085, "step": 550870 }, { "epoch": 1.43, "learning_rate": 8.580593652875595e-05, "loss": 0.013, "step": 550880 }, { "epoch": 1.43, "learning_rate": 8.580204831238448e-05, "loss": 0.0103, "step": 550890 }, { "epoch": 1.43, "learning_rate": 8.579816009601302e-05, "loss": 0.0073, "step": 550900 }, { "epoch": 1.43, "learning_rate": 8.579427187964155e-05, "loss": 0.0085, "step": 550910 }, { "epoch": 1.43, "learning_rate": 8.579038366327009e-05, "loss": 0.0095, "step": 550920 }, { "epoch": 1.43, "learning_rate": 8.578649544689862e-05, "loss": 0.0129, "step": 550930 }, { "epoch": 1.43, "learning_rate": 8.578260723052716e-05, "loss": 0.0097, "step": 550940 }, { "epoch": 1.43, "learning_rate": 8.577871901415569e-05, "loss": 0.0073, "step": 550950 }, { "epoch": 1.43, "learning_rate": 8.577483079778423e-05, "loss": 0.0117, "step": 550960 }, { "epoch": 1.43, "learning_rate": 8.577094258141276e-05, "loss": 0.0109, "step": 550970 }, { "epoch": 1.43, "learning_rate": 8.57670543650413e-05, "loss": 0.0121, "step": 550980 }, { "epoch": 1.43, "learning_rate": 8.576316614866983e-05, "loss": 0.0117, "step": 550990 }, { "epoch": 1.43, "learning_rate": 8.575927793229838e-05, "loss": 0.0086, "step": 551000 }, { "epoch": 1.43, "eval_cer": 0.8816760932214184, "eval_loss": 0.006159137934446335, "eval_runtime": 107.439, "eval_samples_per_second": 18.615, "eval_steps_per_second": 4.654, "step": 551000 }, { "epoch": 1.43, "learning_rate": 8.575538971592691e-05, "loss": 0.0098, "step": 551010 }, { "epoch": 1.43, "learning_rate": 8.575150149955545e-05, "loss": 0.0115, "step": 551020 }, { "epoch": 1.43, "learning_rate": 8.574761328318398e-05, "loss": 0.0077, "step": 551030 }, { "epoch": 1.43, "learning_rate": 8.574372506681252e-05, "loss": 0.0074, "step": 551040 }, { "epoch": 1.43, "learning_rate": 8.573983685044105e-05, "loss": 0.0077, "step": 551050 }, { "epoch": 1.43, "learning_rate": 8.573594863406958e-05, "loss": 0.0096, "step": 551060 }, { "epoch": 1.43, "learning_rate": 8.573206041769812e-05, "loss": 0.0116, "step": 551070 }, { "epoch": 1.43, "learning_rate": 8.572817220132665e-05, "loss": 0.0065, "step": 551080 }, { "epoch": 1.43, "learning_rate": 8.572428398495519e-05, "loss": 0.0093, "step": 551090 }, { "epoch": 1.43, "learning_rate": 8.572039576858372e-05, "loss": 0.0123, "step": 551100 }, { "epoch": 1.43, "learning_rate": 8.571650755221226e-05, "loss": 0.0085, "step": 551110 }, { "epoch": 1.43, "learning_rate": 8.571261933584079e-05, "loss": 0.008, "step": 551120 }, { "epoch": 1.43, "learning_rate": 8.570873111946933e-05, "loss": 0.0094, "step": 551130 }, { "epoch": 1.43, "learning_rate": 8.570484290309786e-05, "loss": 0.009, "step": 551140 }, { "epoch": 1.43, "learning_rate": 8.57009546867264e-05, "loss": 0.0069, "step": 551150 }, { "epoch": 1.43, "learning_rate": 8.569706647035493e-05, "loss": 0.0088, "step": 551160 }, { "epoch": 1.43, "learning_rate": 8.569317825398348e-05, "loss": 0.0082, "step": 551170 }, { "epoch": 1.43, "learning_rate": 8.5689290037612e-05, "loss": 0.0089, "step": 551180 }, { "epoch": 1.43, "learning_rate": 8.568540182124055e-05, "loss": 0.0118, "step": 551190 }, { "epoch": 1.43, "learning_rate": 8.568151360486908e-05, "loss": 0.0077, "step": 551200 }, { "epoch": 1.43, "learning_rate": 8.567762538849762e-05, "loss": 0.0094, "step": 551210 }, { "epoch": 1.43, "learning_rate": 8.567373717212615e-05, "loss": 0.0096, "step": 551220 }, { "epoch": 1.43, "learning_rate": 8.566984895575469e-05, "loss": 0.0132, "step": 551230 }, { "epoch": 1.43, "learning_rate": 8.566596073938322e-05, "loss": 0.0083, "step": 551240 }, { "epoch": 1.43, "learning_rate": 8.566207252301176e-05, "loss": 0.0113, "step": 551250 }, { "epoch": 1.43, "learning_rate": 8.565818430664029e-05, "loss": 0.0099, "step": 551260 }, { "epoch": 1.43, "learning_rate": 8.565429609026883e-05, "loss": 0.0111, "step": 551270 }, { "epoch": 1.43, "learning_rate": 8.565040787389736e-05, "loss": 0.0107, "step": 551280 }, { "epoch": 1.43, "learning_rate": 8.56465196575259e-05, "loss": 0.011, "step": 551290 }, { "epoch": 1.43, "learning_rate": 8.564263144115443e-05, "loss": 0.0091, "step": 551300 }, { "epoch": 1.43, "learning_rate": 8.563874322478296e-05, "loss": 0.0091, "step": 551310 }, { "epoch": 1.43, "learning_rate": 8.56348550084115e-05, "loss": 0.0114, "step": 551320 }, { "epoch": 1.43, "learning_rate": 8.563096679204003e-05, "loss": 0.0093, "step": 551330 }, { "epoch": 1.43, "learning_rate": 8.562707857566857e-05, "loss": 0.0113, "step": 551340 }, { "epoch": 1.43, "learning_rate": 8.56231903592971e-05, "loss": 0.0089, "step": 551350 }, { "epoch": 1.43, "learning_rate": 8.561930214292565e-05, "loss": 0.0104, "step": 551360 }, { "epoch": 1.43, "learning_rate": 8.561541392655418e-05, "loss": 0.01, "step": 551370 }, { "epoch": 1.43, "learning_rate": 8.561152571018272e-05, "loss": 0.0102, "step": 551380 }, { "epoch": 1.43, "learning_rate": 8.560763749381125e-05, "loss": 0.0133, "step": 551390 }, { "epoch": 1.43, "learning_rate": 8.560374927743979e-05, "loss": 0.0073, "step": 551400 }, { "epoch": 1.43, "learning_rate": 8.559986106106832e-05, "loss": 0.0101, "step": 551410 }, { "epoch": 1.43, "learning_rate": 8.559597284469686e-05, "loss": 0.0102, "step": 551420 }, { "epoch": 1.43, "learning_rate": 8.559208462832539e-05, "loss": 0.0098, "step": 551430 }, { "epoch": 1.43, "learning_rate": 8.558819641195393e-05, "loss": 0.0095, "step": 551440 }, { "epoch": 1.43, "learning_rate": 8.558430819558246e-05, "loss": 0.0076, "step": 551450 }, { "epoch": 1.43, "learning_rate": 8.5580419979211e-05, "loss": 0.0118, "step": 551460 }, { "epoch": 1.43, "learning_rate": 8.557653176283953e-05, "loss": 0.012, "step": 551470 }, { "epoch": 1.43, "learning_rate": 8.557264354646807e-05, "loss": 0.0097, "step": 551480 }, { "epoch": 1.43, "learning_rate": 8.55687553300966e-05, "loss": 0.0108, "step": 551490 }, { "epoch": 1.43, "learning_rate": 8.556486711372514e-05, "loss": 0.0082, "step": 551500 }, { "epoch": 1.43, "learning_rate": 8.556097889735367e-05, "loss": 0.011, "step": 551510 }, { "epoch": 1.43, "learning_rate": 8.555709068098222e-05, "loss": 0.0082, "step": 551520 }, { "epoch": 1.43, "learning_rate": 8.555320246461074e-05, "loss": 0.0105, "step": 551530 }, { "epoch": 1.43, "learning_rate": 8.554931424823929e-05, "loss": 0.0134, "step": 551540 }, { "epoch": 1.43, "learning_rate": 8.554542603186782e-05, "loss": 0.0073, "step": 551550 }, { "epoch": 1.43, "learning_rate": 8.554153781549635e-05, "loss": 0.0097, "step": 551560 }, { "epoch": 1.43, "learning_rate": 8.553764959912489e-05, "loss": 0.0087, "step": 551570 }, { "epoch": 1.43, "learning_rate": 8.553376138275342e-05, "loss": 0.0105, "step": 551580 }, { "epoch": 1.43, "learning_rate": 8.552987316638196e-05, "loss": 0.01, "step": 551590 }, { "epoch": 1.43, "learning_rate": 8.552598495001049e-05, "loss": 0.0086, "step": 551600 }, { "epoch": 1.43, "learning_rate": 8.552209673363903e-05, "loss": 0.0121, "step": 551610 }, { "epoch": 1.43, "learning_rate": 8.551820851726756e-05, "loss": 0.0089, "step": 551620 }, { "epoch": 1.43, "learning_rate": 8.55143203008961e-05, "loss": 0.0115, "step": 551630 }, { "epoch": 1.43, "learning_rate": 8.551043208452463e-05, "loss": 0.0092, "step": 551640 }, { "epoch": 1.43, "learning_rate": 8.550654386815317e-05, "loss": 0.0106, "step": 551650 }, { "epoch": 1.43, "learning_rate": 8.55026556517817e-05, "loss": 0.008, "step": 551660 }, { "epoch": 1.43, "learning_rate": 8.549876743541024e-05, "loss": 0.0084, "step": 551670 }, { "epoch": 1.43, "learning_rate": 8.549487921903877e-05, "loss": 0.0095, "step": 551680 }, { "epoch": 1.43, "learning_rate": 8.549099100266731e-05, "loss": 0.0096, "step": 551690 }, { "epoch": 1.43, "learning_rate": 8.548710278629584e-05, "loss": 0.0135, "step": 551700 }, { "epoch": 1.43, "learning_rate": 8.548321456992439e-05, "loss": 0.0066, "step": 551710 }, { "epoch": 1.43, "learning_rate": 8.547932635355292e-05, "loss": 0.0073, "step": 551720 }, { "epoch": 1.43, "learning_rate": 8.547543813718146e-05, "loss": 0.0078, "step": 551730 }, { "epoch": 1.43, "learning_rate": 8.547154992080999e-05, "loss": 0.0091, "step": 551740 }, { "epoch": 1.43, "learning_rate": 8.546766170443853e-05, "loss": 0.0143, "step": 551750 }, { "epoch": 1.43, "learning_rate": 8.546377348806706e-05, "loss": 0.0084, "step": 551760 }, { "epoch": 1.43, "learning_rate": 8.54598852716956e-05, "loss": 0.0093, "step": 551770 }, { "epoch": 1.43, "learning_rate": 8.545599705532413e-05, "loss": 0.0104, "step": 551780 }, { "epoch": 1.43, "learning_rate": 8.545210883895266e-05, "loss": 0.0096, "step": 551790 }, { "epoch": 1.43, "learning_rate": 8.54482206225812e-05, "loss": 0.0079, "step": 551800 }, { "epoch": 1.43, "learning_rate": 8.544433240620973e-05, "loss": 0.0104, "step": 551810 }, { "epoch": 1.43, "learning_rate": 8.544044418983827e-05, "loss": 0.0107, "step": 551820 }, { "epoch": 1.43, "learning_rate": 8.54365559734668e-05, "loss": 0.0087, "step": 551830 }, { "epoch": 1.43, "learning_rate": 8.543266775709534e-05, "loss": 0.0112, "step": 551840 }, { "epoch": 1.43, "learning_rate": 8.542877954072387e-05, "loss": 0.0118, "step": 551850 }, { "epoch": 1.43, "learning_rate": 8.542489132435241e-05, "loss": 0.0101, "step": 551860 }, { "epoch": 1.43, "learning_rate": 8.542100310798093e-05, "loss": 0.0114, "step": 551870 }, { "epoch": 1.43, "learning_rate": 8.541711489160949e-05, "loss": 0.0094, "step": 551880 }, { "epoch": 1.43, "learning_rate": 8.5413226675238e-05, "loss": 0.007, "step": 551890 }, { "epoch": 1.43, "learning_rate": 8.540933845886656e-05, "loss": 0.0085, "step": 551900 }, { "epoch": 1.43, "learning_rate": 8.540545024249509e-05, "loss": 0.01, "step": 551910 }, { "epoch": 1.43, "learning_rate": 8.540156202612363e-05, "loss": 0.0112, "step": 551920 }, { "epoch": 1.43, "learning_rate": 8.539767380975216e-05, "loss": 0.0116, "step": 551930 }, { "epoch": 1.43, "learning_rate": 8.53937855933807e-05, "loss": 0.008, "step": 551940 }, { "epoch": 1.43, "learning_rate": 8.538989737700923e-05, "loss": 0.0062, "step": 551950 }, { "epoch": 1.43, "learning_rate": 8.538600916063777e-05, "loss": 0.0082, "step": 551960 }, { "epoch": 1.43, "learning_rate": 8.53821209442663e-05, "loss": 0.0083, "step": 551970 }, { "epoch": 1.43, "learning_rate": 8.537823272789484e-05, "loss": 0.0083, "step": 551980 }, { "epoch": 1.43, "learning_rate": 8.537434451152337e-05, "loss": 0.0107, "step": 551990 }, { "epoch": 1.43, "learning_rate": 8.537045629515191e-05, "loss": 0.0107, "step": 552000 }, { "epoch": 1.43, "eval_cer": 0.8816746935844841, "eval_loss": 0.006157498341053724, "eval_runtime": 107.7718, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.639, "step": 552000 }, { "epoch": 1.43, "learning_rate": 8.536656807878044e-05, "loss": 0.0084, "step": 552010 }, { "epoch": 1.43, "learning_rate": 8.536267986240898e-05, "loss": 0.0105, "step": 552020 }, { "epoch": 1.43, "learning_rate": 8.53587916460375e-05, "loss": 0.0117, "step": 552030 }, { "epoch": 1.43, "learning_rate": 8.535490342966603e-05, "loss": 0.0115, "step": 552040 }, { "epoch": 1.43, "learning_rate": 8.535101521329458e-05, "loss": 0.0103, "step": 552050 }, { "epoch": 1.43, "learning_rate": 8.53471269969231e-05, "loss": 0.0089, "step": 552060 }, { "epoch": 1.43, "learning_rate": 8.534323878055166e-05, "loss": 0.0092, "step": 552070 }, { "epoch": 1.43, "learning_rate": 8.533935056418019e-05, "loss": 0.0088, "step": 552080 }, { "epoch": 1.43, "learning_rate": 8.533546234780873e-05, "loss": 0.0092, "step": 552090 }, { "epoch": 1.43, "learning_rate": 8.533157413143726e-05, "loss": 0.0091, "step": 552100 }, { "epoch": 1.43, "learning_rate": 8.53276859150658e-05, "loss": 0.0094, "step": 552110 }, { "epoch": 1.43, "learning_rate": 8.532379769869433e-05, "loss": 0.011, "step": 552120 }, { "epoch": 1.43, "learning_rate": 8.531990948232287e-05, "loss": 0.0109, "step": 552130 }, { "epoch": 1.43, "learning_rate": 8.53160212659514e-05, "loss": 0.0068, "step": 552140 }, { "epoch": 1.43, "learning_rate": 8.531213304957994e-05, "loss": 0.0161, "step": 552150 }, { "epoch": 1.43, "learning_rate": 8.530824483320847e-05, "loss": 0.0082, "step": 552160 }, { "epoch": 1.43, "learning_rate": 8.530435661683701e-05, "loss": 0.0102, "step": 552170 }, { "epoch": 1.43, "learning_rate": 8.530046840046554e-05, "loss": 0.0074, "step": 552180 }, { "epoch": 1.43, "learning_rate": 8.529658018409408e-05, "loss": 0.0088, "step": 552190 }, { "epoch": 1.43, "learning_rate": 8.52926919677226e-05, "loss": 0.0137, "step": 552200 }, { "epoch": 1.43, "learning_rate": 8.528880375135115e-05, "loss": 0.0107, "step": 552210 }, { "epoch": 1.43, "learning_rate": 8.528491553497968e-05, "loss": 0.0127, "step": 552220 }, { "epoch": 1.43, "learning_rate": 8.528102731860823e-05, "loss": 0.0092, "step": 552230 }, { "epoch": 1.43, "learning_rate": 8.527713910223676e-05, "loss": 0.0086, "step": 552240 }, { "epoch": 1.43, "learning_rate": 8.52732508858653e-05, "loss": 0.008, "step": 552250 }, { "epoch": 1.43, "learning_rate": 8.526936266949383e-05, "loss": 0.014, "step": 552260 }, { "epoch": 1.43, "learning_rate": 8.526547445312237e-05, "loss": 0.0088, "step": 552270 }, { "epoch": 1.43, "learning_rate": 8.52615862367509e-05, "loss": 0.0113, "step": 552280 }, { "epoch": 1.43, "learning_rate": 8.525769802037943e-05, "loss": 0.0079, "step": 552290 }, { "epoch": 1.43, "learning_rate": 8.525380980400797e-05, "loss": 0.0077, "step": 552300 }, { "epoch": 1.43, "learning_rate": 8.52499215876365e-05, "loss": 0.011, "step": 552310 }, { "epoch": 1.43, "learning_rate": 8.524603337126504e-05, "loss": 0.0127, "step": 552320 }, { "epoch": 1.43, "learning_rate": 8.524214515489357e-05, "loss": 0.0081, "step": 552330 }, { "epoch": 1.43, "learning_rate": 8.523825693852211e-05, "loss": 0.0118, "step": 552340 }, { "epoch": 1.43, "learning_rate": 8.523436872215064e-05, "loss": 0.0105, "step": 552350 }, { "epoch": 1.43, "learning_rate": 8.523048050577918e-05, "loss": 0.0139, "step": 552360 }, { "epoch": 1.43, "learning_rate": 8.52265922894077e-05, "loss": 0.0094, "step": 552370 }, { "epoch": 1.43, "learning_rate": 8.522270407303625e-05, "loss": 0.0091, "step": 552380 }, { "epoch": 1.43, "learning_rate": 8.521881585666477e-05, "loss": 0.0087, "step": 552390 }, { "epoch": 1.43, "learning_rate": 8.521492764029333e-05, "loss": 0.01, "step": 552400 }, { "epoch": 1.43, "learning_rate": 8.521103942392184e-05, "loss": 0.0089, "step": 552410 }, { "epoch": 1.43, "learning_rate": 8.52071512075504e-05, "loss": 0.0095, "step": 552420 }, { "epoch": 1.43, "learning_rate": 8.520326299117893e-05, "loss": 0.0085, "step": 552430 }, { "epoch": 1.43, "learning_rate": 8.519937477480747e-05, "loss": 0.0072, "step": 552440 }, { "epoch": 1.43, "learning_rate": 8.5195486558436e-05, "loss": 0.0071, "step": 552450 }, { "epoch": 1.43, "learning_rate": 8.519159834206454e-05, "loss": 0.0099, "step": 552460 }, { "epoch": 1.43, "learning_rate": 8.518771012569307e-05, "loss": 0.0091, "step": 552470 }, { "epoch": 1.43, "learning_rate": 8.518382190932161e-05, "loss": 0.0091, "step": 552480 }, { "epoch": 1.43, "learning_rate": 8.517993369295014e-05, "loss": 0.0112, "step": 552490 }, { "epoch": 1.43, "learning_rate": 8.517604547657868e-05, "loss": 0.008, "step": 552500 }, { "epoch": 1.43, "learning_rate": 8.51721572602072e-05, "loss": 0.0092, "step": 552510 }, { "epoch": 1.43, "learning_rate": 8.516826904383575e-05, "loss": 0.0075, "step": 552520 }, { "epoch": 1.43, "learning_rate": 8.516438082746428e-05, "loss": 0.0079, "step": 552530 }, { "epoch": 1.43, "learning_rate": 8.51604926110928e-05, "loss": 0.0104, "step": 552540 }, { "epoch": 1.43, "learning_rate": 8.515660439472135e-05, "loss": 0.0069, "step": 552550 }, { "epoch": 1.43, "learning_rate": 8.515271617834987e-05, "loss": 0.0069, "step": 552560 }, { "epoch": 1.43, "learning_rate": 8.514882796197842e-05, "loss": 0.0077, "step": 552570 }, { "epoch": 1.43, "learning_rate": 8.514493974560694e-05, "loss": 0.0099, "step": 552580 }, { "epoch": 1.43, "learning_rate": 8.51410515292355e-05, "loss": 0.0107, "step": 552590 }, { "epoch": 1.43, "learning_rate": 8.513716331286403e-05, "loss": 0.0077, "step": 552600 }, { "epoch": 1.43, "learning_rate": 8.513327509649257e-05, "loss": 0.0085, "step": 552610 }, { "epoch": 1.43, "learning_rate": 8.51293868801211e-05, "loss": 0.0097, "step": 552620 }, { "epoch": 1.43, "learning_rate": 8.512549866374964e-05, "loss": 0.0085, "step": 552630 }, { "epoch": 1.43, "learning_rate": 8.512161044737817e-05, "loss": 0.007, "step": 552640 }, { "epoch": 1.43, "learning_rate": 8.511772223100671e-05, "loss": 0.0083, "step": 552650 }, { "epoch": 1.43, "learning_rate": 8.511383401463524e-05, "loss": 0.0076, "step": 552660 }, { "epoch": 1.43, "learning_rate": 8.510994579826378e-05, "loss": 0.0087, "step": 552670 }, { "epoch": 1.43, "learning_rate": 8.51060575818923e-05, "loss": 0.0086, "step": 552680 }, { "epoch": 1.43, "learning_rate": 8.510216936552085e-05, "loss": 0.0099, "step": 552690 }, { "epoch": 1.43, "learning_rate": 8.509828114914938e-05, "loss": 0.0098, "step": 552700 }, { "epoch": 1.43, "learning_rate": 8.509439293277792e-05, "loss": 0.012, "step": 552710 }, { "epoch": 1.43, "learning_rate": 8.509050471640645e-05, "loss": 0.0128, "step": 552720 }, { "epoch": 1.43, "learning_rate": 8.508661650003499e-05, "loss": 0.0134, "step": 552730 }, { "epoch": 1.43, "learning_rate": 8.508272828366352e-05, "loss": 0.0088, "step": 552740 }, { "epoch": 1.43, "learning_rate": 8.507884006729207e-05, "loss": 0.0073, "step": 552750 }, { "epoch": 1.43, "learning_rate": 8.50749518509206e-05, "loss": 0.0116, "step": 552760 }, { "epoch": 1.43, "learning_rate": 8.507106363454914e-05, "loss": 0.0082, "step": 552770 }, { "epoch": 1.43, "learning_rate": 8.506717541817767e-05, "loss": 0.0089, "step": 552780 }, { "epoch": 1.43, "learning_rate": 8.50632872018062e-05, "loss": 0.0072, "step": 552790 }, { "epoch": 1.43, "learning_rate": 8.505939898543474e-05, "loss": 0.009, "step": 552800 }, { "epoch": 1.43, "learning_rate": 8.505551076906327e-05, "loss": 0.0109, "step": 552810 }, { "epoch": 1.43, "learning_rate": 8.505162255269181e-05, "loss": 0.0078, "step": 552820 }, { "epoch": 1.43, "learning_rate": 8.504773433632034e-05, "loss": 0.0077, "step": 552830 }, { "epoch": 1.43, "learning_rate": 8.504384611994888e-05, "loss": 0.0097, "step": 552840 }, { "epoch": 1.43, "learning_rate": 8.50399579035774e-05, "loss": 0.0114, "step": 552850 }, { "epoch": 1.43, "learning_rate": 8.503606968720595e-05, "loss": 0.0127, "step": 552860 }, { "epoch": 1.43, "learning_rate": 8.503218147083448e-05, "loss": 0.0114, "step": 552870 }, { "epoch": 1.43, "learning_rate": 8.502829325446302e-05, "loss": 0.0103, "step": 552880 }, { "epoch": 1.43, "learning_rate": 8.502440503809154e-05, "loss": 0.0145, "step": 552890 }, { "epoch": 1.43, "learning_rate": 8.502051682172009e-05, "loss": 0.0074, "step": 552900 }, { "epoch": 1.43, "learning_rate": 8.501662860534861e-05, "loss": 0.0068, "step": 552910 }, { "epoch": 1.43, "learning_rate": 8.501274038897716e-05, "loss": 0.0097, "step": 552920 }, { "epoch": 1.43, "learning_rate": 8.500885217260568e-05, "loss": 0.0064, "step": 552930 }, { "epoch": 1.43, "learning_rate": 8.500496395623424e-05, "loss": 0.0119, "step": 552940 }, { "epoch": 1.43, "learning_rate": 8.500107573986277e-05, "loss": 0.0086, "step": 552950 }, { "epoch": 1.43, "learning_rate": 8.499718752349131e-05, "loss": 0.0087, "step": 552960 }, { "epoch": 1.43, "learning_rate": 8.499329930711984e-05, "loss": 0.0083, "step": 552970 }, { "epoch": 1.43, "learning_rate": 8.498941109074838e-05, "loss": 0.0068, "step": 552980 }, { "epoch": 1.43, "learning_rate": 8.498552287437691e-05, "loss": 0.0104, "step": 552990 }, { "epoch": 1.43, "learning_rate": 8.498163465800545e-05, "loss": 0.0112, "step": 553000 }, { "epoch": 1.43, "eval_cer": 0.8816984874123652, "eval_loss": 0.006217279937118292, "eval_runtime": 107.8256, "eval_samples_per_second": 18.548, "eval_steps_per_second": 4.637, "step": 553000 }, { "epoch": 1.43, "learning_rate": 8.497774644163398e-05, "loss": 0.0072, "step": 553010 }, { "epoch": 1.43, "learning_rate": 8.497385822526252e-05, "loss": 0.0102, "step": 553020 }, { "epoch": 1.43, "learning_rate": 8.496997000889105e-05, "loss": 0.008, "step": 553030 }, { "epoch": 1.43, "learning_rate": 8.496608179251957e-05, "loss": 0.0135, "step": 553040 }, { "epoch": 1.43, "learning_rate": 8.496219357614812e-05, "loss": 0.0089, "step": 553050 }, { "epoch": 1.43, "learning_rate": 8.495830535977664e-05, "loss": 0.0102, "step": 553060 }, { "epoch": 1.43, "learning_rate": 8.495441714340519e-05, "loss": 0.0104, "step": 553070 }, { "epoch": 1.43, "learning_rate": 8.495052892703371e-05, "loss": 0.0102, "step": 553080 }, { "epoch": 1.43, "learning_rate": 8.494664071066226e-05, "loss": 0.0101, "step": 553090 }, { "epoch": 1.43, "learning_rate": 8.494275249429078e-05, "loss": 0.0108, "step": 553100 }, { "epoch": 1.43, "learning_rate": 8.493886427791934e-05, "loss": 0.0096, "step": 553110 }, { "epoch": 1.43, "learning_rate": 8.493497606154785e-05, "loss": 0.0088, "step": 553120 }, { "epoch": 1.43, "learning_rate": 8.493108784517641e-05, "loss": 0.0089, "step": 553130 }, { "epoch": 1.43, "learning_rate": 8.492719962880494e-05, "loss": 0.0075, "step": 553140 }, { "epoch": 1.43, "learning_rate": 8.492331141243348e-05, "loss": 0.0105, "step": 553150 }, { "epoch": 1.43, "learning_rate": 8.4919423196062e-05, "loss": 0.0084, "step": 553160 }, { "epoch": 1.43, "learning_rate": 8.491553497969055e-05, "loss": 0.0097, "step": 553170 }, { "epoch": 1.43, "learning_rate": 8.491164676331908e-05, "loss": 0.0108, "step": 553180 }, { "epoch": 1.43, "learning_rate": 8.490775854694762e-05, "loss": 0.0079, "step": 553190 }, { "epoch": 1.43, "learning_rate": 8.490387033057615e-05, "loss": 0.0092, "step": 553200 }, { "epoch": 1.43, "learning_rate": 8.489998211420469e-05, "loss": 0.0116, "step": 553210 }, { "epoch": 1.43, "learning_rate": 8.489609389783322e-05, "loss": 0.01, "step": 553220 }, { "epoch": 1.43, "learning_rate": 8.489220568146176e-05, "loss": 0.0093, "step": 553230 }, { "epoch": 1.43, "learning_rate": 8.488831746509029e-05, "loss": 0.0078, "step": 553240 }, { "epoch": 1.43, "learning_rate": 8.488442924871883e-05, "loss": 0.0085, "step": 553250 }, { "epoch": 1.43, "learning_rate": 8.488054103234736e-05, "loss": 0.0092, "step": 553260 }, { "epoch": 1.43, "learning_rate": 8.487665281597591e-05, "loss": 0.0097, "step": 553270 }, { "epoch": 1.43, "learning_rate": 8.487276459960442e-05, "loss": 0.0109, "step": 553280 }, { "epoch": 1.43, "learning_rate": 8.486887638323295e-05, "loss": 0.0125, "step": 553290 }, { "epoch": 1.43, "learning_rate": 8.486498816686151e-05, "loss": 0.0098, "step": 553300 }, { "epoch": 1.43, "learning_rate": 8.486109995049004e-05, "loss": 0.007, "step": 553310 }, { "epoch": 1.43, "learning_rate": 8.485721173411858e-05, "loss": 0.0086, "step": 553320 }, { "epoch": 1.43, "learning_rate": 8.48533235177471e-05, "loss": 0.0084, "step": 553330 }, { "epoch": 1.43, "learning_rate": 8.484943530137565e-05, "loss": 0.0099, "step": 553340 }, { "epoch": 1.43, "learning_rate": 8.484554708500418e-05, "loss": 0.0097, "step": 553350 }, { "epoch": 1.43, "learning_rate": 8.484165886863272e-05, "loss": 0.0079, "step": 553360 }, { "epoch": 1.43, "learning_rate": 8.483777065226125e-05, "loss": 0.0071, "step": 553370 }, { "epoch": 1.43, "learning_rate": 8.483388243588979e-05, "loss": 0.0095, "step": 553380 }, { "epoch": 1.43, "learning_rate": 8.482999421951832e-05, "loss": 0.0104, "step": 553390 }, { "epoch": 1.43, "learning_rate": 8.482610600314686e-05, "loss": 0.0103, "step": 553400 }, { "epoch": 1.43, "learning_rate": 8.482221778677538e-05, "loss": 0.0107, "step": 553410 }, { "epoch": 1.43, "learning_rate": 8.481832957040393e-05, "loss": 0.009, "step": 553420 }, { "epoch": 1.43, "learning_rate": 8.481444135403245e-05, "loss": 0.0108, "step": 553430 }, { "epoch": 1.43, "learning_rate": 8.4810553137661e-05, "loss": 0.0112, "step": 553440 }, { "epoch": 1.43, "learning_rate": 8.480666492128952e-05, "loss": 0.0101, "step": 553450 }, { "epoch": 1.43, "learning_rate": 8.480277670491808e-05, "loss": 0.0092, "step": 553460 }, { "epoch": 1.43, "learning_rate": 8.479888848854661e-05, "loss": 0.0114, "step": 553470 }, { "epoch": 1.43, "learning_rate": 8.479500027217515e-05, "loss": 0.0121, "step": 553480 }, { "epoch": 1.43, "learning_rate": 8.479111205580368e-05, "loss": 0.0097, "step": 553490 }, { "epoch": 1.43, "learning_rate": 8.478722383943222e-05, "loss": 0.0099, "step": 553500 }, { "epoch": 1.43, "learning_rate": 8.478333562306075e-05, "loss": 0.0102, "step": 553510 }, { "epoch": 1.43, "learning_rate": 8.477944740668929e-05, "loss": 0.0098, "step": 553520 }, { "epoch": 1.43, "learning_rate": 8.477555919031782e-05, "loss": 0.0091, "step": 553530 }, { "epoch": 1.43, "learning_rate": 8.477167097394634e-05, "loss": 0.0121, "step": 553540 }, { "epoch": 1.43, "learning_rate": 8.476778275757489e-05, "loss": 0.0102, "step": 553550 }, { "epoch": 1.43, "learning_rate": 8.476389454120341e-05, "loss": 0.0106, "step": 553560 }, { "epoch": 1.43, "learning_rate": 8.476000632483196e-05, "loss": 0.0115, "step": 553570 }, { "epoch": 1.43, "learning_rate": 8.475611810846048e-05, "loss": 0.0096, "step": 553580 }, { "epoch": 1.43, "learning_rate": 8.475222989208903e-05, "loss": 0.0148, "step": 553590 }, { "epoch": 1.44, "learning_rate": 8.474834167571755e-05, "loss": 0.0072, "step": 553600 }, { "epoch": 1.44, "learning_rate": 8.47444534593461e-05, "loss": 0.0096, "step": 553610 }, { "epoch": 1.44, "learning_rate": 8.474056524297462e-05, "loss": 0.0088, "step": 553620 }, { "epoch": 1.44, "learning_rate": 8.473667702660318e-05, "loss": 0.01, "step": 553630 }, { "epoch": 1.44, "learning_rate": 8.47327888102317e-05, "loss": 0.0087, "step": 553640 }, { "epoch": 1.44, "learning_rate": 8.472890059386025e-05, "loss": 0.0096, "step": 553650 }, { "epoch": 1.44, "learning_rate": 8.472501237748878e-05, "loss": 0.0083, "step": 553660 }, { "epoch": 1.44, "learning_rate": 8.472112416111732e-05, "loss": 0.0094, "step": 553670 }, { "epoch": 1.44, "learning_rate": 8.471723594474585e-05, "loss": 0.0085, "step": 553680 }, { "epoch": 1.44, "learning_rate": 8.471334772837439e-05, "loss": 0.0074, "step": 553690 }, { "epoch": 1.44, "learning_rate": 8.470945951200292e-05, "loss": 0.0126, "step": 553700 }, { "epoch": 1.44, "learning_rate": 8.470557129563146e-05, "loss": 0.0105, "step": 553710 }, { "epoch": 1.44, "learning_rate": 8.470168307925999e-05, "loss": 0.009, "step": 553720 }, { "epoch": 1.44, "learning_rate": 8.469779486288853e-05, "loss": 0.0111, "step": 553730 }, { "epoch": 1.44, "learning_rate": 8.469390664651706e-05, "loss": 0.0104, "step": 553740 }, { "epoch": 1.44, "learning_rate": 8.46900184301456e-05, "loss": 0.0107, "step": 553750 }, { "epoch": 1.44, "learning_rate": 8.468613021377413e-05, "loss": 0.0089, "step": 553760 }, { "epoch": 1.44, "learning_rate": 8.468224199740267e-05, "loss": 0.009, "step": 553770 }, { "epoch": 1.44, "learning_rate": 8.46783537810312e-05, "loss": 0.0103, "step": 553780 }, { "epoch": 1.44, "learning_rate": 8.467446556465972e-05, "loss": 0.0089, "step": 553790 }, { "epoch": 1.44, "learning_rate": 8.467057734828826e-05, "loss": 0.009, "step": 553800 }, { "epoch": 1.44, "learning_rate": 8.466668913191679e-05, "loss": 0.0089, "step": 553810 }, { "epoch": 1.44, "learning_rate": 8.466280091554535e-05, "loss": 0.0089, "step": 553820 }, { "epoch": 1.44, "learning_rate": 8.465891269917388e-05, "loss": 0.0117, "step": 553830 }, { "epoch": 1.44, "learning_rate": 8.465502448280242e-05, "loss": 0.0086, "step": 553840 }, { "epoch": 1.44, "learning_rate": 8.465113626643095e-05, "loss": 0.0087, "step": 553850 }, { "epoch": 1.44, "learning_rate": 8.464724805005949e-05, "loss": 0.0104, "step": 553860 }, { "epoch": 1.44, "learning_rate": 8.464335983368802e-05, "loss": 0.0138, "step": 553870 }, { "epoch": 1.44, "learning_rate": 8.463947161731656e-05, "loss": 0.0101, "step": 553880 }, { "epoch": 1.44, "learning_rate": 8.463558340094509e-05, "loss": 0.0096, "step": 553890 }, { "epoch": 1.44, "learning_rate": 8.463169518457363e-05, "loss": 0.0092, "step": 553900 }, { "epoch": 1.44, "learning_rate": 8.462780696820216e-05, "loss": 0.0113, "step": 553910 }, { "epoch": 1.44, "learning_rate": 8.46239187518307e-05, "loss": 0.0074, "step": 553920 }, { "epoch": 1.44, "learning_rate": 8.462003053545922e-05, "loss": 0.0103, "step": 553930 }, { "epoch": 1.44, "learning_rate": 8.461614231908777e-05, "loss": 0.0106, "step": 553940 }, { "epoch": 1.44, "learning_rate": 8.46122541027163e-05, "loss": 0.0083, "step": 553950 }, { "epoch": 1.44, "learning_rate": 8.460836588634484e-05, "loss": 0.0103, "step": 553960 }, { "epoch": 1.44, "learning_rate": 8.460447766997336e-05, "loss": 0.0074, "step": 553970 }, { "epoch": 1.44, "learning_rate": 8.460058945360192e-05, "loss": 0.0092, "step": 553980 }, { "epoch": 1.44, "learning_rate": 8.459670123723045e-05, "loss": 0.0113, "step": 553990 }, { "epoch": 1.44, "learning_rate": 8.459281302085899e-05, "loss": 0.008, "step": 554000 }, { "epoch": 1.44, "eval_cer": 0.8816774928583525, "eval_loss": 0.006148200016468763, "eval_runtime": 107.8579, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 554000 }, { "epoch": 1.44, "learning_rate": 8.458892480448752e-05, "loss": 0.0101, "step": 554010 }, { "epoch": 1.44, "learning_rate": 8.458503658811606e-05, "loss": 0.0082, "step": 554020 }, { "epoch": 1.44, "learning_rate": 8.458114837174459e-05, "loss": 0.009, "step": 554030 }, { "epoch": 1.44, "learning_rate": 8.457726015537312e-05, "loss": 0.0089, "step": 554040 }, { "epoch": 1.44, "learning_rate": 8.457337193900166e-05, "loss": 0.0101, "step": 554050 }, { "epoch": 1.44, "learning_rate": 8.456948372263018e-05, "loss": 0.0108, "step": 554060 }, { "epoch": 1.44, "learning_rate": 8.456559550625873e-05, "loss": 0.0082, "step": 554070 }, { "epoch": 1.44, "learning_rate": 8.456170728988725e-05, "loss": 0.0076, "step": 554080 }, { "epoch": 1.44, "learning_rate": 8.45578190735158e-05, "loss": 0.0096, "step": 554090 }, { "epoch": 1.44, "learning_rate": 8.455393085714432e-05, "loss": 0.0115, "step": 554100 }, { "epoch": 1.44, "learning_rate": 8.455004264077287e-05, "loss": 0.0086, "step": 554110 }, { "epoch": 1.44, "learning_rate": 8.45461544244014e-05, "loss": 0.009, "step": 554120 }, { "epoch": 1.44, "learning_rate": 8.454226620802994e-05, "loss": 0.007, "step": 554130 }, { "epoch": 1.44, "learning_rate": 8.453837799165846e-05, "loss": 0.0082, "step": 554140 }, { "epoch": 1.44, "learning_rate": 8.453448977528702e-05, "loss": 0.0113, "step": 554150 }, { "epoch": 1.44, "learning_rate": 8.453060155891553e-05, "loss": 0.0081, "step": 554160 }, { "epoch": 1.44, "learning_rate": 8.452671334254409e-05, "loss": 0.0098, "step": 554170 }, { "epoch": 1.44, "learning_rate": 8.452282512617262e-05, "loss": 0.0081, "step": 554180 }, { "epoch": 1.44, "learning_rate": 8.451893690980116e-05, "loss": 0.0109, "step": 554190 }, { "epoch": 1.44, "learning_rate": 8.451504869342969e-05, "loss": 0.0084, "step": 554200 }, { "epoch": 1.44, "learning_rate": 8.451116047705823e-05, "loss": 0.0123, "step": 554210 }, { "epoch": 1.44, "learning_rate": 8.450727226068676e-05, "loss": 0.0092, "step": 554220 }, { "epoch": 1.44, "learning_rate": 8.45033840443153e-05, "loss": 0.0094, "step": 554230 }, { "epoch": 1.44, "learning_rate": 8.449949582794383e-05, "loss": 0.011, "step": 554240 }, { "epoch": 1.44, "learning_rate": 8.449560761157237e-05, "loss": 0.0086, "step": 554250 }, { "epoch": 1.44, "learning_rate": 8.44917193952009e-05, "loss": 0.0087, "step": 554260 }, { "epoch": 1.44, "learning_rate": 8.448783117882944e-05, "loss": 0.0094, "step": 554270 }, { "epoch": 1.44, "learning_rate": 8.448394296245797e-05, "loss": 0.0079, "step": 554280 }, { "epoch": 1.44, "learning_rate": 8.44800547460865e-05, "loss": 0.009, "step": 554290 }, { "epoch": 1.44, "learning_rate": 8.447616652971503e-05, "loss": 0.0109, "step": 554300 }, { "epoch": 1.44, "learning_rate": 8.447227831334356e-05, "loss": 0.01, "step": 554310 }, { "epoch": 1.44, "learning_rate": 8.44683900969721e-05, "loss": 0.0101, "step": 554320 }, { "epoch": 1.44, "learning_rate": 8.446450188060063e-05, "loss": 0.0095, "step": 554330 }, { "epoch": 1.44, "learning_rate": 8.446061366422919e-05, "loss": 0.0103, "step": 554340 }, { "epoch": 1.44, "learning_rate": 8.445672544785772e-05, "loss": 0.0084, "step": 554350 }, { "epoch": 1.44, "learning_rate": 8.445283723148626e-05, "loss": 0.0102, "step": 554360 }, { "epoch": 1.44, "learning_rate": 8.444894901511479e-05, "loss": 0.0097, "step": 554370 }, { "epoch": 1.44, "learning_rate": 8.444506079874333e-05, "loss": 0.0096, "step": 554380 }, { "epoch": 1.44, "learning_rate": 8.444117258237186e-05, "loss": 0.0125, "step": 554390 }, { "epoch": 1.44, "learning_rate": 8.44372843660004e-05, "loss": 0.0109, "step": 554400 }, { "epoch": 1.44, "learning_rate": 8.443339614962893e-05, "loss": 0.0104, "step": 554410 }, { "epoch": 1.44, "learning_rate": 8.442950793325747e-05, "loss": 0.009, "step": 554420 }, { "epoch": 1.44, "learning_rate": 8.4425619716886e-05, "loss": 0.0105, "step": 554430 }, { "epoch": 1.44, "learning_rate": 8.442173150051454e-05, "loss": 0.011, "step": 554440 }, { "epoch": 1.44, "learning_rate": 8.441784328414306e-05, "loss": 0.0111, "step": 554450 }, { "epoch": 1.44, "learning_rate": 8.44139550677716e-05, "loss": 0.0103, "step": 554460 }, { "epoch": 1.44, "learning_rate": 8.441006685140013e-05, "loss": 0.0111, "step": 554470 }, { "epoch": 1.44, "learning_rate": 8.440617863502868e-05, "loss": 0.0122, "step": 554480 }, { "epoch": 1.44, "learning_rate": 8.44022904186572e-05, "loss": 0.0091, "step": 554490 }, { "epoch": 1.44, "learning_rate": 8.439840220228576e-05, "loss": 0.0061, "step": 554500 }, { "epoch": 1.44, "learning_rate": 8.439451398591427e-05, "loss": 0.0129, "step": 554510 }, { "epoch": 1.44, "learning_rate": 8.43906257695428e-05, "loss": 0.0093, "step": 554520 }, { "epoch": 1.44, "learning_rate": 8.438673755317136e-05, "loss": 0.0074, "step": 554530 }, { "epoch": 1.44, "learning_rate": 8.438284933679989e-05, "loss": 0.0105, "step": 554540 }, { "epoch": 1.44, "learning_rate": 8.437896112042843e-05, "loss": 0.0089, "step": 554550 }, { "epoch": 1.44, "learning_rate": 8.437507290405695e-05, "loss": 0.0063, "step": 554560 }, { "epoch": 1.44, "learning_rate": 8.43711846876855e-05, "loss": 0.0091, "step": 554570 }, { "epoch": 1.44, "learning_rate": 8.436729647131402e-05, "loss": 0.0089, "step": 554580 }, { "epoch": 1.44, "learning_rate": 8.436340825494257e-05, "loss": 0.0076, "step": 554590 }, { "epoch": 1.44, "learning_rate": 8.43595200385711e-05, "loss": 0.01, "step": 554600 }, { "epoch": 1.44, "learning_rate": 8.435563182219964e-05, "loss": 0.0064, "step": 554610 }, { "epoch": 1.44, "learning_rate": 8.435174360582816e-05, "loss": 0.0103, "step": 554620 }, { "epoch": 1.44, "learning_rate": 8.43478553894567e-05, "loss": 0.0088, "step": 554630 }, { "epoch": 1.44, "learning_rate": 8.434396717308523e-05, "loss": 0.0097, "step": 554640 }, { "epoch": 1.44, "learning_rate": 8.434007895671378e-05, "loss": 0.0093, "step": 554650 }, { "epoch": 1.44, "learning_rate": 8.43361907403423e-05, "loss": 0.007, "step": 554660 }, { "epoch": 1.44, "learning_rate": 8.433230252397085e-05, "loss": 0.0083, "step": 554670 }, { "epoch": 1.44, "learning_rate": 8.432841430759937e-05, "loss": 0.0093, "step": 554680 }, { "epoch": 1.44, "learning_rate": 8.432452609122793e-05, "loss": 0.012, "step": 554690 }, { "epoch": 1.44, "learning_rate": 8.432063787485646e-05, "loss": 0.01, "step": 554700 }, { "epoch": 1.44, "learning_rate": 8.4316749658485e-05, "loss": 0.011, "step": 554710 }, { "epoch": 1.44, "learning_rate": 8.431286144211353e-05, "loss": 0.0109, "step": 554720 }, { "epoch": 1.44, "learning_rate": 8.430897322574207e-05, "loss": 0.009, "step": 554730 }, { "epoch": 1.44, "learning_rate": 8.43050850093706e-05, "loss": 0.0118, "step": 554740 }, { "epoch": 1.44, "learning_rate": 8.430119679299914e-05, "loss": 0.0063, "step": 554750 }, { "epoch": 1.44, "learning_rate": 8.429730857662767e-05, "loss": 0.0122, "step": 554760 }, { "epoch": 1.44, "learning_rate": 8.42934203602562e-05, "loss": 0.0116, "step": 554770 }, { "epoch": 1.44, "learning_rate": 8.428953214388474e-05, "loss": 0.0104, "step": 554780 }, { "epoch": 1.44, "learning_rate": 8.428564392751326e-05, "loss": 0.0091, "step": 554790 }, { "epoch": 1.44, "learning_rate": 8.42817557111418e-05, "loss": 0.0117, "step": 554800 }, { "epoch": 1.44, "learning_rate": 8.427786749477033e-05, "loss": 0.0087, "step": 554810 }, { "epoch": 1.44, "learning_rate": 8.427397927839887e-05, "loss": 0.0077, "step": 554820 }, { "epoch": 1.44, "learning_rate": 8.42700910620274e-05, "loss": 0.0111, "step": 554830 }, { "epoch": 1.44, "learning_rate": 8.426620284565594e-05, "loss": 0.0117, "step": 554840 }, { "epoch": 1.44, "learning_rate": 8.426231462928447e-05, "loss": 0.0087, "step": 554850 }, { "epoch": 1.44, "learning_rate": 8.425842641291303e-05, "loss": 0.0081, "step": 554860 }, { "epoch": 1.44, "learning_rate": 8.425453819654154e-05, "loss": 0.0069, "step": 554870 }, { "epoch": 1.44, "learning_rate": 8.42506499801701e-05, "loss": 0.01, "step": 554880 }, { "epoch": 1.44, "learning_rate": 8.424676176379863e-05, "loss": 0.009, "step": 554890 }, { "epoch": 1.44, "learning_rate": 8.424287354742717e-05, "loss": 0.0087, "step": 554900 }, { "epoch": 1.44, "learning_rate": 8.42389853310557e-05, "loss": 0.0118, "step": 554910 }, { "epoch": 1.44, "learning_rate": 8.423509711468424e-05, "loss": 0.012, "step": 554920 }, { "epoch": 1.44, "learning_rate": 8.423120889831277e-05, "loss": 0.0122, "step": 554930 }, { "epoch": 1.44, "learning_rate": 8.42273206819413e-05, "loss": 0.0089, "step": 554940 }, { "epoch": 1.44, "learning_rate": 8.422343246556983e-05, "loss": 0.0081, "step": 554950 }, { "epoch": 1.44, "learning_rate": 8.421954424919838e-05, "loss": 0.0078, "step": 554960 }, { "epoch": 1.44, "learning_rate": 8.42156560328269e-05, "loss": 0.0088, "step": 554970 }, { "epoch": 1.44, "learning_rate": 8.421176781645545e-05, "loss": 0.0098, "step": 554980 }, { "epoch": 1.44, "learning_rate": 8.420787960008397e-05, "loss": 0.0105, "step": 554990 }, { "epoch": 1.44, "learning_rate": 8.420399138371252e-05, "loss": 0.0111, "step": 555000 }, { "epoch": 1.44, "eval_cer": 0.8816760932214184, "eval_loss": 0.006103316321969032, "eval_runtime": 107.9114, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.633, "step": 555000 }, { "epoch": 1.44, "learning_rate": 8.420010316734104e-05, "loss": 0.0099, "step": 555010 }, { "epoch": 1.44, "learning_rate": 8.419621495096957e-05, "loss": 0.0141, "step": 555020 }, { "epoch": 1.44, "learning_rate": 8.419232673459811e-05, "loss": 0.0099, "step": 555030 }, { "epoch": 1.44, "learning_rate": 8.418843851822664e-05, "loss": 0.011, "step": 555040 }, { "epoch": 1.44, "learning_rate": 8.41845503018552e-05, "loss": 0.0092, "step": 555050 }, { "epoch": 1.44, "learning_rate": 8.418066208548373e-05, "loss": 0.0115, "step": 555060 }, { "epoch": 1.44, "learning_rate": 8.417677386911227e-05, "loss": 0.0072, "step": 555070 }, { "epoch": 1.44, "learning_rate": 8.41728856527408e-05, "loss": 0.0097, "step": 555080 }, { "epoch": 1.44, "learning_rate": 8.416899743636934e-05, "loss": 0.0147, "step": 555090 }, { "epoch": 1.44, "learning_rate": 8.416510921999786e-05, "loss": 0.0098, "step": 555100 }, { "epoch": 1.44, "learning_rate": 8.41612210036264e-05, "loss": 0.0087, "step": 555110 }, { "epoch": 1.44, "learning_rate": 8.415733278725493e-05, "loss": 0.0123, "step": 555120 }, { "epoch": 1.44, "learning_rate": 8.415344457088348e-05, "loss": 0.0105, "step": 555130 }, { "epoch": 1.44, "learning_rate": 8.4149556354512e-05, "loss": 0.0105, "step": 555140 }, { "epoch": 1.44, "learning_rate": 8.414566813814055e-05, "loss": 0.0064, "step": 555150 }, { "epoch": 1.44, "learning_rate": 8.414177992176907e-05, "loss": 0.0102, "step": 555160 }, { "epoch": 1.44, "learning_rate": 8.413789170539762e-05, "loss": 0.0081, "step": 555170 }, { "epoch": 1.44, "learning_rate": 8.413400348902614e-05, "loss": 0.0089, "step": 555180 }, { "epoch": 1.44, "learning_rate": 8.413011527265469e-05, "loss": 0.0073, "step": 555190 }, { "epoch": 1.44, "learning_rate": 8.412622705628321e-05, "loss": 0.0066, "step": 555200 }, { "epoch": 1.44, "learning_rate": 8.412233883991177e-05, "loss": 0.0083, "step": 555210 }, { "epoch": 1.44, "learning_rate": 8.41184506235403e-05, "loss": 0.0089, "step": 555220 }, { "epoch": 1.44, "learning_rate": 8.411456240716884e-05, "loss": 0.0106, "step": 555230 }, { "epoch": 1.44, "learning_rate": 8.411067419079737e-05, "loss": 0.0096, "step": 555240 }, { "epoch": 1.44, "learning_rate": 8.410678597442591e-05, "loss": 0.0117, "step": 555250 }, { "epoch": 1.44, "learning_rate": 8.410289775805444e-05, "loss": 0.0155, "step": 555260 }, { "epoch": 1.44, "learning_rate": 8.409900954168296e-05, "loss": 0.0076, "step": 555270 }, { "epoch": 1.44, "learning_rate": 8.40951213253115e-05, "loss": 0.0089, "step": 555280 }, { "epoch": 1.44, "learning_rate": 8.409123310894003e-05, "loss": 0.0072, "step": 555290 }, { "epoch": 1.44, "learning_rate": 8.408734489256858e-05, "loss": 0.0129, "step": 555300 }, { "epoch": 1.44, "learning_rate": 8.40834566761971e-05, "loss": 0.0083, "step": 555310 }, { "epoch": 1.44, "learning_rate": 8.407956845982565e-05, "loss": 0.0095, "step": 555320 }, { "epoch": 1.44, "learning_rate": 8.407568024345417e-05, "loss": 0.0082, "step": 555330 }, { "epoch": 1.44, "learning_rate": 8.407179202708271e-05, "loss": 0.0083, "step": 555340 }, { "epoch": 1.44, "learning_rate": 8.406790381071124e-05, "loss": 0.0091, "step": 555350 }, { "epoch": 1.44, "learning_rate": 8.406401559433978e-05, "loss": 0.0088, "step": 555360 }, { "epoch": 1.44, "learning_rate": 8.406012737796831e-05, "loss": 0.0086, "step": 555370 }, { "epoch": 1.44, "learning_rate": 8.405623916159687e-05, "loss": 0.0105, "step": 555380 }, { "epoch": 1.44, "learning_rate": 8.405235094522538e-05, "loss": 0.012, "step": 555390 }, { "epoch": 1.44, "learning_rate": 8.404846272885394e-05, "loss": 0.0166, "step": 555400 }, { "epoch": 1.44, "learning_rate": 8.404457451248247e-05, "loss": 0.0108, "step": 555410 }, { "epoch": 1.44, "learning_rate": 8.404068629611101e-05, "loss": 0.0075, "step": 555420 }, { "epoch": 1.44, "learning_rate": 8.403679807973954e-05, "loss": 0.0113, "step": 555430 }, { "epoch": 1.44, "learning_rate": 8.403290986336808e-05, "loss": 0.0094, "step": 555440 }, { "epoch": 1.44, "learning_rate": 8.40290216469966e-05, "loss": 0.0097, "step": 555450 }, { "epoch": 1.44, "learning_rate": 8.402513343062515e-05, "loss": 0.0091, "step": 555460 }, { "epoch": 1.44, "learning_rate": 8.402124521425367e-05, "loss": 0.0143, "step": 555470 }, { "epoch": 1.44, "learning_rate": 8.401735699788222e-05, "loss": 0.0082, "step": 555480 }, { "epoch": 1.44, "learning_rate": 8.401346878151074e-05, "loss": 0.0075, "step": 555490 }, { "epoch": 1.44, "learning_rate": 8.400958056513929e-05, "loss": 0.0086, "step": 555500 }, { "epoch": 1.44, "learning_rate": 8.400569234876781e-05, "loss": 0.0095, "step": 555510 }, { "epoch": 1.44, "learning_rate": 8.400180413239634e-05, "loss": 0.0074, "step": 555520 }, { "epoch": 1.44, "learning_rate": 8.399791591602488e-05, "loss": 0.0109, "step": 555530 }, { "epoch": 1.44, "learning_rate": 8.399402769965341e-05, "loss": 0.0109, "step": 555540 }, { "epoch": 1.44, "learning_rate": 8.399013948328195e-05, "loss": 0.0107, "step": 555550 }, { "epoch": 1.44, "learning_rate": 8.398625126691048e-05, "loss": 0.0125, "step": 555560 }, { "epoch": 1.44, "learning_rate": 8.398236305053904e-05, "loss": 0.0089, "step": 555570 }, { "epoch": 1.44, "learning_rate": 8.397847483416756e-05, "loss": 0.0114, "step": 555580 }, { "epoch": 1.44, "learning_rate": 8.39745866177961e-05, "loss": 0.011, "step": 555590 }, { "epoch": 1.44, "learning_rate": 8.397069840142463e-05, "loss": 0.0101, "step": 555600 }, { "epoch": 1.44, "learning_rate": 8.396681018505318e-05, "loss": 0.0087, "step": 555610 }, { "epoch": 1.44, "learning_rate": 8.39629219686817e-05, "loss": 0.0086, "step": 555620 }, { "epoch": 1.44, "learning_rate": 8.395903375231025e-05, "loss": 0.0099, "step": 555630 }, { "epoch": 1.44, "learning_rate": 8.395514553593877e-05, "loss": 0.0092, "step": 555640 }, { "epoch": 1.44, "learning_rate": 8.395125731956732e-05, "loss": 0.0079, "step": 555650 }, { "epoch": 1.44, "learning_rate": 8.394736910319584e-05, "loss": 0.0073, "step": 555660 }, { "epoch": 1.44, "learning_rate": 8.394348088682439e-05, "loss": 0.0096, "step": 555670 }, { "epoch": 1.44, "learning_rate": 8.393959267045291e-05, "loss": 0.0091, "step": 555680 }, { "epoch": 1.44, "learning_rate": 8.393570445408146e-05, "loss": 0.0088, "step": 555690 }, { "epoch": 1.44, "learning_rate": 8.393181623770998e-05, "loss": 0.0103, "step": 555700 }, { "epoch": 1.44, "learning_rate": 8.392792802133852e-05, "loss": 0.01, "step": 555710 }, { "epoch": 1.44, "learning_rate": 8.392403980496705e-05, "loss": 0.0086, "step": 555720 }, { "epoch": 1.44, "learning_rate": 8.392015158859561e-05, "loss": 0.0089, "step": 555730 }, { "epoch": 1.44, "learning_rate": 8.391626337222412e-05, "loss": 0.0134, "step": 555740 }, { "epoch": 1.44, "learning_rate": 8.391237515585268e-05, "loss": 0.007, "step": 555750 }, { "epoch": 1.44, "learning_rate": 8.39084869394812e-05, "loss": 0.0079, "step": 555760 }, { "epoch": 1.44, "learning_rate": 8.390459872310973e-05, "loss": 0.0144, "step": 555770 }, { "epoch": 1.44, "learning_rate": 8.390071050673828e-05, "loss": 0.0109, "step": 555780 }, { "epoch": 1.44, "learning_rate": 8.38968222903668e-05, "loss": 0.0087, "step": 555790 }, { "epoch": 1.44, "learning_rate": 8.389293407399535e-05, "loss": 0.0106, "step": 555800 }, { "epoch": 1.44, "learning_rate": 8.388904585762387e-05, "loss": 0.0087, "step": 555810 }, { "epoch": 1.44, "learning_rate": 8.388515764125242e-05, "loss": 0.0101, "step": 555820 }, { "epoch": 1.44, "learning_rate": 8.388126942488094e-05, "loss": 0.0077, "step": 555830 }, { "epoch": 1.44, "learning_rate": 8.387738120850948e-05, "loss": 0.0102, "step": 555840 }, { "epoch": 1.44, "learning_rate": 8.387349299213801e-05, "loss": 0.0105, "step": 555850 }, { "epoch": 1.44, "learning_rate": 8.386960477576655e-05, "loss": 0.01, "step": 555860 }, { "epoch": 1.44, "learning_rate": 8.386571655939508e-05, "loss": 0.0098, "step": 555870 }, { "epoch": 1.44, "learning_rate": 8.386182834302362e-05, "loss": 0.0077, "step": 555880 }, { "epoch": 1.44, "learning_rate": 8.385794012665215e-05, "loss": 0.0093, "step": 555890 }, { "epoch": 1.44, "learning_rate": 8.38540519102807e-05, "loss": 0.0091, "step": 555900 }, { "epoch": 1.44, "learning_rate": 8.385016369390922e-05, "loss": 0.0122, "step": 555910 }, { "epoch": 1.44, "learning_rate": 8.384627547753778e-05, "loss": 0.0119, "step": 555920 }, { "epoch": 1.44, "learning_rate": 8.38423872611663e-05, "loss": 0.0102, "step": 555930 }, { "epoch": 1.44, "learning_rate": 8.383849904479485e-05, "loss": 0.009, "step": 555940 }, { "epoch": 1.44, "learning_rate": 8.383461082842338e-05, "loss": 0.0084, "step": 555950 }, { "epoch": 1.44, "learning_rate": 8.383072261205192e-05, "loss": 0.0097, "step": 555960 }, { "epoch": 1.44, "learning_rate": 8.382683439568044e-05, "loss": 0.0112, "step": 555970 }, { "epoch": 1.44, "learning_rate": 8.382294617930899e-05, "loss": 0.0072, "step": 555980 }, { "epoch": 1.44, "learning_rate": 8.381905796293751e-05, "loss": 0.0102, "step": 555990 }, { "epoch": 1.44, "learning_rate": 8.381516974656606e-05, "loss": 0.0118, "step": 556000 }, { "epoch": 1.44, "eval_cer": 0.88167329394755, "eval_loss": 0.0062253098003566265, "eval_runtime": 107.7174, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 556000 }, { "epoch": 1.44, "learning_rate": 8.381128153019458e-05, "loss": 0.0078, "step": 556010 }, { "epoch": 1.44, "learning_rate": 8.380739331382311e-05, "loss": 0.0055, "step": 556020 }, { "epoch": 1.44, "learning_rate": 8.380350509745165e-05, "loss": 0.0091, "step": 556030 }, { "epoch": 1.44, "learning_rate": 8.379961688108018e-05, "loss": 0.0083, "step": 556040 }, { "epoch": 1.44, "learning_rate": 8.379572866470872e-05, "loss": 0.0068, "step": 556050 }, { "epoch": 1.44, "learning_rate": 8.379184044833725e-05, "loss": 0.0079, "step": 556060 }, { "epoch": 1.44, "learning_rate": 8.37879522319658e-05, "loss": 0.01, "step": 556070 }, { "epoch": 1.44, "learning_rate": 8.378406401559432e-05, "loss": 0.0096, "step": 556080 }, { "epoch": 1.44, "learning_rate": 8.378017579922288e-05, "loss": 0.01, "step": 556090 }, { "epoch": 1.44, "learning_rate": 8.377628758285139e-05, "loss": 0.0123, "step": 556100 }, { "epoch": 1.44, "learning_rate": 8.377239936647995e-05, "loss": 0.0085, "step": 556110 }, { "epoch": 1.44, "learning_rate": 8.376851115010847e-05, "loss": 0.0123, "step": 556120 }, { "epoch": 1.44, "learning_rate": 8.376462293373702e-05, "loss": 0.0097, "step": 556130 }, { "epoch": 1.44, "learning_rate": 8.376073471736554e-05, "loss": 0.0081, "step": 556140 }, { "epoch": 1.44, "learning_rate": 8.375684650099409e-05, "loss": 0.0073, "step": 556150 }, { "epoch": 1.44, "learning_rate": 8.375295828462261e-05, "loss": 0.0097, "step": 556160 }, { "epoch": 1.44, "learning_rate": 8.374907006825116e-05, "loss": 0.0079, "step": 556170 }, { "epoch": 1.44, "learning_rate": 8.374518185187968e-05, "loss": 0.0108, "step": 556180 }, { "epoch": 1.44, "learning_rate": 8.374129363550823e-05, "loss": 0.0098, "step": 556190 }, { "epoch": 1.44, "learning_rate": 8.373740541913675e-05, "loss": 0.0088, "step": 556200 }, { "epoch": 1.44, "learning_rate": 8.37335172027653e-05, "loss": 0.0077, "step": 556210 }, { "epoch": 1.44, "learning_rate": 8.372962898639382e-05, "loss": 0.0088, "step": 556220 }, { "epoch": 1.44, "learning_rate": 8.372574077002236e-05, "loss": 0.0108, "step": 556230 }, { "epoch": 1.44, "learning_rate": 8.372185255365089e-05, "loss": 0.0081, "step": 556240 }, { "epoch": 1.44, "learning_rate": 8.371796433727945e-05, "loss": 0.0083, "step": 556250 }, { "epoch": 1.44, "learning_rate": 8.371407612090796e-05, "loss": 0.0091, "step": 556260 }, { "epoch": 1.44, "learning_rate": 8.371018790453649e-05, "loss": 0.01, "step": 556270 }, { "epoch": 1.44, "learning_rate": 8.370629968816505e-05, "loss": 0.0072, "step": 556280 }, { "epoch": 1.44, "learning_rate": 8.370241147179357e-05, "loss": 0.0139, "step": 556290 }, { "epoch": 1.44, "learning_rate": 8.369852325542212e-05, "loss": 0.0077, "step": 556300 }, { "epoch": 1.44, "learning_rate": 8.369463503905064e-05, "loss": 0.0113, "step": 556310 }, { "epoch": 1.44, "learning_rate": 8.369074682267919e-05, "loss": 0.0094, "step": 556320 }, { "epoch": 1.44, "learning_rate": 8.368685860630771e-05, "loss": 0.0087, "step": 556330 }, { "epoch": 1.44, "learning_rate": 8.368297038993626e-05, "loss": 0.0104, "step": 556340 }, { "epoch": 1.44, "learning_rate": 8.367908217356478e-05, "loss": 0.0107, "step": 556350 }, { "epoch": 1.44, "learning_rate": 8.367519395719332e-05, "loss": 0.0109, "step": 556360 }, { "epoch": 1.44, "learning_rate": 8.367130574082185e-05, "loss": 0.009, "step": 556370 }, { "epoch": 1.44, "learning_rate": 8.36674175244504e-05, "loss": 0.0089, "step": 556380 }, { "epoch": 1.44, "learning_rate": 8.366352930807892e-05, "loss": 0.0084, "step": 556390 }, { "epoch": 1.44, "learning_rate": 8.365964109170746e-05, "loss": 0.0092, "step": 556400 }, { "epoch": 1.44, "learning_rate": 8.365575287533599e-05, "loss": 0.0105, "step": 556410 }, { "epoch": 1.44, "learning_rate": 8.365186465896453e-05, "loss": 0.0082, "step": 556420 }, { "epoch": 1.44, "learning_rate": 8.364797644259306e-05, "loss": 0.0098, "step": 556430 }, { "epoch": 1.44, "learning_rate": 8.364408822622162e-05, "loss": 0.0083, "step": 556440 }, { "epoch": 1.44, "learning_rate": 8.364020000985015e-05, "loss": 0.0075, "step": 556450 }, { "epoch": 1.44, "learning_rate": 8.363631179347869e-05, "loss": 0.0085, "step": 556460 }, { "epoch": 1.44, "learning_rate": 8.363242357710722e-05, "loss": 0.0076, "step": 556470 }, { "epoch": 1.44, "learning_rate": 8.362853536073576e-05, "loss": 0.0094, "step": 556480 }, { "epoch": 1.44, "learning_rate": 8.362464714436428e-05, "loss": 0.0087, "step": 556490 }, { "epoch": 1.44, "learning_rate": 8.362075892799283e-05, "loss": 0.0119, "step": 556500 }, { "epoch": 1.44, "learning_rate": 8.361687071162135e-05, "loss": 0.008, "step": 556510 }, { "epoch": 1.44, "learning_rate": 8.361298249524988e-05, "loss": 0.01, "step": 556520 }, { "epoch": 1.44, "learning_rate": 8.360909427887842e-05, "loss": 0.0096, "step": 556530 }, { "epoch": 1.44, "learning_rate": 8.360520606250695e-05, "loss": 0.0083, "step": 556540 }, { "epoch": 1.44, "learning_rate": 8.36013178461355e-05, "loss": 0.0079, "step": 556550 }, { "epoch": 1.44, "learning_rate": 8.359742962976402e-05, "loss": 0.0091, "step": 556560 }, { "epoch": 1.44, "learning_rate": 8.359354141339256e-05, "loss": 0.0119, "step": 556570 }, { "epoch": 1.44, "learning_rate": 8.358965319702109e-05, "loss": 0.0155, "step": 556580 }, { "epoch": 1.44, "learning_rate": 8.358576498064963e-05, "loss": 0.0092, "step": 556590 }, { "epoch": 1.44, "learning_rate": 8.358187676427816e-05, "loss": 0.0094, "step": 556600 }, { "epoch": 1.44, "learning_rate": 8.357798854790672e-05, "loss": 0.0074, "step": 556610 }, { "epoch": 1.44, "learning_rate": 8.357410033153523e-05, "loss": 0.0097, "step": 556620 }, { "epoch": 1.44, "learning_rate": 8.357021211516379e-05, "loss": 0.0102, "step": 556630 }, { "epoch": 1.44, "learning_rate": 8.356632389879231e-05, "loss": 0.0088, "step": 556640 }, { "epoch": 1.44, "learning_rate": 8.356243568242086e-05, "loss": 0.0113, "step": 556650 }, { "epoch": 1.44, "learning_rate": 8.355854746604938e-05, "loss": 0.0083, "step": 556660 }, { "epoch": 1.44, "learning_rate": 8.355465924967793e-05, "loss": 0.0098, "step": 556670 }, { "epoch": 1.44, "learning_rate": 8.355077103330645e-05, "loss": 0.0105, "step": 556680 }, { "epoch": 1.44, "learning_rate": 8.3546882816935e-05, "loss": 0.0083, "step": 556690 }, { "epoch": 1.44, "learning_rate": 8.354299460056352e-05, "loss": 0.0092, "step": 556700 }, { "epoch": 1.44, "learning_rate": 8.353910638419207e-05, "loss": 0.0078, "step": 556710 }, { "epoch": 1.44, "learning_rate": 8.35352181678206e-05, "loss": 0.0102, "step": 556720 }, { "epoch": 1.44, "learning_rate": 8.353132995144914e-05, "loss": 0.0081, "step": 556730 }, { "epoch": 1.44, "learning_rate": 8.352744173507766e-05, "loss": 0.0096, "step": 556740 }, { "epoch": 1.44, "learning_rate": 8.35235535187062e-05, "loss": 0.0093, "step": 556750 }, { "epoch": 1.44, "learning_rate": 8.351966530233473e-05, "loss": 0.0084, "step": 556760 }, { "epoch": 1.44, "learning_rate": 8.351577708596326e-05, "loss": 0.0073, "step": 556770 }, { "epoch": 1.44, "learning_rate": 8.35118888695918e-05, "loss": 0.0107, "step": 556780 }, { "epoch": 1.44, "learning_rate": 8.350800065322033e-05, "loss": 0.0096, "step": 556790 }, { "epoch": 1.44, "learning_rate": 8.350411243684889e-05, "loss": 0.0098, "step": 556800 }, { "epoch": 1.44, "learning_rate": 8.350022422047741e-05, "loss": 0.0102, "step": 556810 }, { "epoch": 1.44, "learning_rate": 8.349633600410596e-05, "loss": 0.0101, "step": 556820 }, { "epoch": 1.44, "learning_rate": 8.349244778773448e-05, "loss": 0.0079, "step": 556830 }, { "epoch": 1.44, "learning_rate": 8.348855957136303e-05, "loss": 0.0076, "step": 556840 }, { "epoch": 1.44, "learning_rate": 8.348467135499155e-05, "loss": 0.009, "step": 556850 }, { "epoch": 1.44, "learning_rate": 8.34807831386201e-05, "loss": 0.0105, "step": 556860 }, { "epoch": 1.44, "learning_rate": 8.347689492224862e-05, "loss": 0.013, "step": 556870 }, { "epoch": 1.44, "learning_rate": 8.347300670587716e-05, "loss": 0.0076, "step": 556880 }, { "epoch": 1.44, "learning_rate": 8.346911848950569e-05, "loss": 0.0093, "step": 556890 }, { "epoch": 1.44, "learning_rate": 8.346523027313423e-05, "loss": 0.0136, "step": 556900 }, { "epoch": 1.44, "learning_rate": 8.346134205676276e-05, "loss": 0.0113, "step": 556910 }, { "epoch": 1.44, "learning_rate": 8.34574538403913e-05, "loss": 0.0062, "step": 556920 }, { "epoch": 1.44, "learning_rate": 8.345356562401983e-05, "loss": 0.0086, "step": 556930 }, { "epoch": 1.44, "learning_rate": 8.344967740764837e-05, "loss": 0.0096, "step": 556940 }, { "epoch": 1.44, "learning_rate": 8.34457891912769e-05, "loss": 0.0085, "step": 556950 }, { "epoch": 1.44, "learning_rate": 8.344190097490546e-05, "loss": 0.0095, "step": 556960 }, { "epoch": 1.44, "learning_rate": 8.343801275853399e-05, "loss": 0.0108, "step": 556970 }, { "epoch": 1.44, "learning_rate": 8.343412454216253e-05, "loss": 0.0101, "step": 556980 }, { "epoch": 1.44, "learning_rate": 8.343023632579106e-05, "loss": 0.0076, "step": 556990 }, { "epoch": 1.44, "learning_rate": 8.342634810941958e-05, "loss": 0.0101, "step": 557000 }, { "epoch": 1.44, "eval_cer": 0.8816872903168917, "eval_loss": 0.006132596172392368, "eval_runtime": 107.8337, "eval_samples_per_second": 18.547, "eval_steps_per_second": 4.637, "step": 557000 }, { "epoch": 1.44, "learning_rate": 8.342245989304812e-05, "loss": 0.0092, "step": 557010 }, { "epoch": 1.44, "learning_rate": 8.341857167667665e-05, "loss": 0.0075, "step": 557020 }, { "epoch": 1.44, "learning_rate": 8.34146834603052e-05, "loss": 0.0099, "step": 557030 }, { "epoch": 1.44, "learning_rate": 8.341079524393372e-05, "loss": 0.0092, "step": 557040 }, { "epoch": 1.44, "learning_rate": 8.340690702756226e-05, "loss": 0.0095, "step": 557050 }, { "epoch": 1.44, "learning_rate": 8.340301881119079e-05, "loss": 0.0092, "step": 557060 }, { "epoch": 1.44, "learning_rate": 8.339913059481933e-05, "loss": 0.0088, "step": 557070 }, { "epoch": 1.44, "learning_rate": 8.339524237844786e-05, "loss": 0.0068, "step": 557080 }, { "epoch": 1.44, "learning_rate": 8.33913541620764e-05, "loss": 0.0115, "step": 557090 }, { "epoch": 1.44, "learning_rate": 8.338746594570493e-05, "loss": 0.0072, "step": 557100 }, { "epoch": 1.44, "learning_rate": 8.338357772933347e-05, "loss": 0.009, "step": 557110 }, { "epoch": 1.44, "learning_rate": 8.3379689512962e-05, "loss": 0.0086, "step": 557120 }, { "epoch": 1.44, "learning_rate": 8.337580129659054e-05, "loss": 0.0078, "step": 557130 }, { "epoch": 1.44, "learning_rate": 8.337191308021907e-05, "loss": 0.0104, "step": 557140 }, { "epoch": 1.44, "learning_rate": 8.336802486384763e-05, "loss": 0.0111, "step": 557150 }, { "epoch": 1.44, "learning_rate": 8.336413664747615e-05, "loss": 0.0061, "step": 557160 }, { "epoch": 1.44, "learning_rate": 8.33602484311047e-05, "loss": 0.0096, "step": 557170 }, { "epoch": 1.44, "learning_rate": 8.335636021473322e-05, "loss": 0.01, "step": 557180 }, { "epoch": 1.44, "learning_rate": 8.335247199836177e-05, "loss": 0.009, "step": 557190 }, { "epoch": 1.44, "learning_rate": 8.33485837819903e-05, "loss": 0.0111, "step": 557200 }, { "epoch": 1.44, "learning_rate": 8.334469556561884e-05, "loss": 0.0092, "step": 557210 }, { "epoch": 1.44, "learning_rate": 8.334080734924736e-05, "loss": 0.009, "step": 557220 }, { "epoch": 1.44, "learning_rate": 8.33369191328759e-05, "loss": 0.0078, "step": 557230 }, { "epoch": 1.44, "learning_rate": 8.333303091650443e-05, "loss": 0.0087, "step": 557240 }, { "epoch": 1.44, "learning_rate": 8.332914270013296e-05, "loss": 0.0118, "step": 557250 }, { "epoch": 1.44, "learning_rate": 8.33252544837615e-05, "loss": 0.0081, "step": 557260 }, { "epoch": 1.44, "learning_rate": 8.332136626739003e-05, "loss": 0.0064, "step": 557270 }, { "epoch": 1.44, "learning_rate": 8.331747805101857e-05, "loss": 0.011, "step": 557280 }, { "epoch": 1.44, "learning_rate": 8.33135898346471e-05, "loss": 0.0068, "step": 557290 }, { "epoch": 1.44, "learning_rate": 8.330970161827564e-05, "loss": 0.0099, "step": 557300 }, { "epoch": 1.44, "learning_rate": 8.330581340190417e-05, "loss": 0.0126, "step": 557310 }, { "epoch": 1.44, "learning_rate": 8.330192518553273e-05, "loss": 0.009, "step": 557320 }, { "epoch": 1.44, "learning_rate": 8.329803696916124e-05, "loss": 0.0112, "step": 557330 }, { "epoch": 1.44, "learning_rate": 8.32941487527898e-05, "loss": 0.0103, "step": 557340 }, { "epoch": 1.44, "learning_rate": 8.329026053641832e-05, "loss": 0.0117, "step": 557350 }, { "epoch": 1.44, "learning_rate": 8.328637232004687e-05, "loss": 0.0131, "step": 557360 }, { "epoch": 1.44, "learning_rate": 8.32824841036754e-05, "loss": 0.0095, "step": 557370 }, { "epoch": 1.44, "learning_rate": 8.327859588730393e-05, "loss": 0.0081, "step": 557380 }, { "epoch": 1.44, "learning_rate": 8.327470767093246e-05, "loss": 0.0101, "step": 557390 }, { "epoch": 1.44, "learning_rate": 8.3270819454561e-05, "loss": 0.0103, "step": 557400 }, { "epoch": 1.44, "learning_rate": 8.326693123818953e-05, "loss": 0.0085, "step": 557410 }, { "epoch": 1.44, "learning_rate": 8.326304302181807e-05, "loss": 0.0099, "step": 557420 }, { "epoch": 1.44, "learning_rate": 8.32591548054466e-05, "loss": 0.008, "step": 557430 }, { "epoch": 1.44, "learning_rate": 8.325526658907514e-05, "loss": 0.0101, "step": 557440 }, { "epoch": 1.44, "learning_rate": 8.325137837270367e-05, "loss": 0.0071, "step": 557450 }, { "epoch": 1.45, "learning_rate": 8.324749015633221e-05, "loss": 0.0099, "step": 557460 }, { "epoch": 1.45, "learning_rate": 8.324360193996074e-05, "loss": 0.0099, "step": 557470 }, { "epoch": 1.45, "learning_rate": 8.32397137235893e-05, "loss": 0.0108, "step": 557480 }, { "epoch": 1.45, "learning_rate": 8.323582550721781e-05, "loss": 0.0101, "step": 557490 }, { "epoch": 1.45, "learning_rate": 8.323193729084634e-05, "loss": 0.0096, "step": 557500 }, { "epoch": 1.45, "learning_rate": 8.32280490744749e-05, "loss": 0.0115, "step": 557510 }, { "epoch": 1.45, "learning_rate": 8.322416085810342e-05, "loss": 0.0097, "step": 557520 }, { "epoch": 1.45, "learning_rate": 8.322027264173196e-05, "loss": 0.0095, "step": 557530 }, { "epoch": 1.45, "learning_rate": 8.321638442536049e-05, "loss": 0.012, "step": 557540 }, { "epoch": 1.45, "learning_rate": 8.321249620898903e-05, "loss": 0.0119, "step": 557550 }, { "epoch": 1.45, "learning_rate": 8.320860799261756e-05, "loss": 0.0097, "step": 557560 }, { "epoch": 1.45, "learning_rate": 8.32047197762461e-05, "loss": 0.0075, "step": 557570 }, { "epoch": 1.45, "learning_rate": 8.320083155987463e-05, "loss": 0.0097, "step": 557580 }, { "epoch": 1.45, "learning_rate": 8.319694334350317e-05, "loss": 0.0074, "step": 557590 }, { "epoch": 1.45, "learning_rate": 8.31930551271317e-05, "loss": 0.0066, "step": 557600 }, { "epoch": 1.45, "learning_rate": 8.318916691076024e-05, "loss": 0.0068, "step": 557610 }, { "epoch": 1.45, "learning_rate": 8.318527869438877e-05, "loss": 0.0091, "step": 557620 }, { "epoch": 1.45, "learning_rate": 8.318139047801731e-05, "loss": 0.0115, "step": 557630 }, { "epoch": 1.45, "learning_rate": 8.317750226164584e-05, "loss": 0.0086, "step": 557640 }, { "epoch": 1.45, "learning_rate": 8.317361404527438e-05, "loss": 0.0106, "step": 557650 }, { "epoch": 1.45, "learning_rate": 8.316972582890291e-05, "loss": 0.0115, "step": 557660 }, { "epoch": 1.45, "learning_rate": 8.316583761253147e-05, "loss": 0.0067, "step": 557670 }, { "epoch": 1.45, "learning_rate": 8.316194939616e-05, "loss": 0.0105, "step": 557680 }, { "epoch": 1.45, "learning_rate": 8.315806117978854e-05, "loss": 0.0085, "step": 557690 }, { "epoch": 1.45, "learning_rate": 8.315417296341706e-05, "loss": 0.0094, "step": 557700 }, { "epoch": 1.45, "learning_rate": 8.31502847470456e-05, "loss": 0.0076, "step": 557710 }, { "epoch": 1.45, "learning_rate": 8.314639653067413e-05, "loss": 0.012, "step": 557720 }, { "epoch": 1.45, "learning_rate": 8.314250831430268e-05, "loss": 0.0073, "step": 557730 }, { "epoch": 1.45, "learning_rate": 8.31386200979312e-05, "loss": 0.0103, "step": 557740 }, { "epoch": 1.45, "learning_rate": 8.313473188155973e-05, "loss": 0.0106, "step": 557750 }, { "epoch": 1.45, "learning_rate": 8.313084366518827e-05, "loss": 0.0101, "step": 557760 }, { "epoch": 1.45, "learning_rate": 8.31269554488168e-05, "loss": 0.013, "step": 557770 }, { "epoch": 1.45, "learning_rate": 8.312306723244534e-05, "loss": 0.0082, "step": 557780 }, { "epoch": 1.45, "learning_rate": 8.311917901607387e-05, "loss": 0.0079, "step": 557790 }, { "epoch": 1.45, "learning_rate": 8.311529079970241e-05, "loss": 0.0086, "step": 557800 }, { "epoch": 1.45, "learning_rate": 8.311140258333094e-05, "loss": 0.0084, "step": 557810 }, { "epoch": 1.45, "learning_rate": 8.310751436695948e-05, "loss": 0.0107, "step": 557820 }, { "epoch": 1.45, "learning_rate": 8.310362615058801e-05, "loss": 0.0082, "step": 557830 }, { "epoch": 1.45, "learning_rate": 8.309973793421657e-05, "loss": 0.0156, "step": 557840 }, { "epoch": 1.45, "learning_rate": 8.309584971784508e-05, "loss": 0.0092, "step": 557850 }, { "epoch": 1.45, "learning_rate": 8.309196150147364e-05, "loss": 0.0103, "step": 557860 }, { "epoch": 1.45, "learning_rate": 8.308807328510216e-05, "loss": 0.0105, "step": 557870 }, { "epoch": 1.45, "learning_rate": 8.30841850687307e-05, "loss": 0.0112, "step": 557880 }, { "epoch": 1.45, "learning_rate": 8.308029685235923e-05, "loss": 0.0107, "step": 557890 }, { "epoch": 1.45, "learning_rate": 8.307640863598777e-05, "loss": 0.0095, "step": 557900 }, { "epoch": 1.45, "learning_rate": 8.30725204196163e-05, "loss": 0.0071, "step": 557910 }, { "epoch": 1.45, "learning_rate": 8.306863220324484e-05, "loss": 0.0109, "step": 557920 }, { "epoch": 1.45, "learning_rate": 8.306474398687337e-05, "loss": 0.0087, "step": 557930 }, { "epoch": 1.45, "learning_rate": 8.306085577050191e-05, "loss": 0.0073, "step": 557940 }, { "epoch": 1.45, "learning_rate": 8.305696755413044e-05, "loss": 0.011, "step": 557950 }, { "epoch": 1.45, "learning_rate": 8.305307933775898e-05, "loss": 0.0084, "step": 557960 }, { "epoch": 1.45, "learning_rate": 8.304919112138751e-05, "loss": 0.0083, "step": 557970 }, { "epoch": 1.45, "learning_rate": 8.304530290501605e-05, "loss": 0.0092, "step": 557980 }, { "epoch": 1.45, "learning_rate": 8.304141468864458e-05, "loss": 0.0091, "step": 557990 }, { "epoch": 1.45, "learning_rate": 8.303752647227311e-05, "loss": 0.0111, "step": 558000 }, { "epoch": 1.45, "eval_cer": 0.8816942885015627, "eval_loss": 0.006029914598912001, "eval_runtime": 108.0298, "eval_samples_per_second": 18.513, "eval_steps_per_second": 4.628, "step": 558000 }, { "epoch": 1.45, "learning_rate": 8.303363825590165e-05, "loss": 0.01, "step": 558010 }, { "epoch": 1.45, "learning_rate": 8.302975003953018e-05, "loss": 0.0076, "step": 558020 }, { "epoch": 1.45, "learning_rate": 8.302586182315873e-05, "loss": 0.0064, "step": 558030 }, { "epoch": 1.45, "learning_rate": 8.302197360678726e-05, "loss": 0.0121, "step": 558040 }, { "epoch": 1.45, "learning_rate": 8.30180853904158e-05, "loss": 0.0096, "step": 558050 }, { "epoch": 1.45, "learning_rate": 8.301419717404433e-05, "loss": 0.0103, "step": 558060 }, { "epoch": 1.45, "learning_rate": 8.301030895767287e-05, "loss": 0.0098, "step": 558070 }, { "epoch": 1.45, "learning_rate": 8.30064207413014e-05, "loss": 0.0102, "step": 558080 }, { "epoch": 1.45, "learning_rate": 8.300253252492994e-05, "loss": 0.0133, "step": 558090 }, { "epoch": 1.45, "learning_rate": 8.299864430855847e-05, "loss": 0.0112, "step": 558100 }, { "epoch": 1.45, "learning_rate": 8.299475609218701e-05, "loss": 0.0096, "step": 558110 }, { "epoch": 1.45, "learning_rate": 8.299086787581554e-05, "loss": 0.008, "step": 558120 }, { "epoch": 1.45, "learning_rate": 8.298697965944408e-05, "loss": 0.01, "step": 558130 }, { "epoch": 1.45, "learning_rate": 8.298309144307261e-05, "loss": 0.0092, "step": 558140 }, { "epoch": 1.45, "learning_rate": 8.297920322670115e-05, "loss": 0.0093, "step": 558150 }, { "epoch": 1.45, "learning_rate": 8.297531501032968e-05, "loss": 0.0071, "step": 558160 }, { "epoch": 1.45, "learning_rate": 8.297142679395822e-05, "loss": 0.0106, "step": 558170 }, { "epoch": 1.45, "learning_rate": 8.296753857758675e-05, "loss": 0.0068, "step": 558180 }, { "epoch": 1.45, "learning_rate": 8.29636503612153e-05, "loss": 0.0115, "step": 558190 }, { "epoch": 1.45, "learning_rate": 8.295976214484383e-05, "loss": 0.0092, "step": 558200 }, { "epoch": 1.45, "learning_rate": 8.295587392847238e-05, "loss": 0.0094, "step": 558210 }, { "epoch": 1.45, "learning_rate": 8.29519857121009e-05, "loss": 0.0079, "step": 558220 }, { "epoch": 1.45, "learning_rate": 8.294809749572945e-05, "loss": 0.0088, "step": 558230 }, { "epoch": 1.45, "learning_rate": 8.294420927935797e-05, "loss": 0.013, "step": 558240 }, { "epoch": 1.45, "learning_rate": 8.29403210629865e-05, "loss": 0.0098, "step": 558250 }, { "epoch": 1.45, "learning_rate": 8.293643284661504e-05, "loss": 0.0075, "step": 558260 }, { "epoch": 1.45, "learning_rate": 8.293254463024357e-05, "loss": 0.0122, "step": 558270 }, { "epoch": 1.45, "learning_rate": 8.292865641387211e-05, "loss": 0.0093, "step": 558280 }, { "epoch": 1.45, "learning_rate": 8.292476819750064e-05, "loss": 0.0093, "step": 558290 }, { "epoch": 1.45, "learning_rate": 8.292087998112918e-05, "loss": 0.0091, "step": 558300 }, { "epoch": 1.45, "learning_rate": 8.291699176475771e-05, "loss": 0.0084, "step": 558310 }, { "epoch": 1.45, "learning_rate": 8.291310354838625e-05, "loss": 0.0096, "step": 558320 }, { "epoch": 1.45, "learning_rate": 8.290921533201478e-05, "loss": 0.0103, "step": 558330 }, { "epoch": 1.45, "learning_rate": 8.290532711564332e-05, "loss": 0.0057, "step": 558340 }, { "epoch": 1.45, "learning_rate": 8.290143889927185e-05, "loss": 0.0087, "step": 558350 }, { "epoch": 1.45, "learning_rate": 8.28975506829004e-05, "loss": 0.0076, "step": 558360 }, { "epoch": 1.45, "learning_rate": 8.289366246652892e-05, "loss": 0.0091, "step": 558370 }, { "epoch": 1.45, "learning_rate": 8.288977425015748e-05, "loss": 0.0064, "step": 558380 }, { "epoch": 1.45, "learning_rate": 8.2885886033786e-05, "loss": 0.009, "step": 558390 }, { "epoch": 1.45, "learning_rate": 8.288199781741455e-05, "loss": 0.0085, "step": 558400 }, { "epoch": 1.45, "learning_rate": 8.287810960104307e-05, "loss": 0.0108, "step": 558410 }, { "epoch": 1.45, "learning_rate": 8.287422138467161e-05, "loss": 0.0071, "step": 558420 }, { "epoch": 1.45, "learning_rate": 8.287033316830014e-05, "loss": 0.0119, "step": 558430 }, { "epoch": 1.45, "learning_rate": 8.286644495192868e-05, "loss": 0.0081, "step": 558440 }, { "epoch": 1.45, "learning_rate": 8.286255673555721e-05, "loss": 0.0101, "step": 558450 }, { "epoch": 1.45, "learning_rate": 8.285866851918575e-05, "loss": 0.0087, "step": 558460 }, { "epoch": 1.45, "learning_rate": 8.285478030281428e-05, "loss": 0.0136, "step": 558470 }, { "epoch": 1.45, "learning_rate": 8.285089208644282e-05, "loss": 0.0079, "step": 558480 }, { "epoch": 1.45, "learning_rate": 8.284700387007135e-05, "loss": 0.0074, "step": 558490 }, { "epoch": 1.45, "learning_rate": 8.284311565369988e-05, "loss": 0.0068, "step": 558500 }, { "epoch": 1.45, "learning_rate": 8.283922743732842e-05, "loss": 0.0126, "step": 558510 }, { "epoch": 1.45, "learning_rate": 8.283533922095695e-05, "loss": 0.0102, "step": 558520 }, { "epoch": 1.45, "learning_rate": 8.283145100458549e-05, "loss": 0.0128, "step": 558530 }, { "epoch": 1.45, "learning_rate": 8.282756278821402e-05, "loss": 0.01, "step": 558540 }, { "epoch": 1.45, "learning_rate": 8.282367457184257e-05, "loss": 0.0097, "step": 558550 }, { "epoch": 1.45, "learning_rate": 8.28197863554711e-05, "loss": 0.0096, "step": 558560 }, { "epoch": 1.45, "learning_rate": 8.281589813909964e-05, "loss": 0.0105, "step": 558570 }, { "epoch": 1.45, "learning_rate": 8.281200992272817e-05, "loss": 0.0103, "step": 558580 }, { "epoch": 1.45, "learning_rate": 8.280812170635671e-05, "loss": 0.0084, "step": 558590 }, { "epoch": 1.45, "learning_rate": 8.280423348998524e-05, "loss": 0.0076, "step": 558600 }, { "epoch": 1.45, "learning_rate": 8.280034527361378e-05, "loss": 0.0093, "step": 558610 }, { "epoch": 1.45, "learning_rate": 8.279645705724231e-05, "loss": 0.0091, "step": 558620 }, { "epoch": 1.45, "learning_rate": 8.279256884087085e-05, "loss": 0.0119, "step": 558630 }, { "epoch": 1.45, "learning_rate": 8.278868062449938e-05, "loss": 0.0114, "step": 558640 }, { "epoch": 1.45, "learning_rate": 8.278479240812792e-05, "loss": 0.0065, "step": 558650 }, { "epoch": 1.45, "learning_rate": 8.278090419175645e-05, "loss": 0.0089, "step": 558660 }, { "epoch": 1.45, "learning_rate": 8.277701597538499e-05, "loss": 0.0094, "step": 558670 }, { "epoch": 1.45, "learning_rate": 8.277312775901352e-05, "loss": 0.0107, "step": 558680 }, { "epoch": 1.45, "learning_rate": 8.276923954264206e-05, "loss": 0.0071, "step": 558690 }, { "epoch": 1.45, "learning_rate": 8.276535132627059e-05, "loss": 0.0097, "step": 558700 }, { "epoch": 1.45, "learning_rate": 8.276146310989915e-05, "loss": 0.0112, "step": 558710 }, { "epoch": 1.45, "learning_rate": 8.275757489352766e-05, "loss": 0.0107, "step": 558720 }, { "epoch": 1.45, "learning_rate": 8.275368667715622e-05, "loss": 0.0093, "step": 558730 }, { "epoch": 1.45, "learning_rate": 8.274979846078474e-05, "loss": 0.0088, "step": 558740 }, { "epoch": 1.45, "learning_rate": 8.274591024441327e-05, "loss": 0.0094, "step": 558750 }, { "epoch": 1.45, "learning_rate": 8.274202202804181e-05, "loss": 0.0097, "step": 558760 }, { "epoch": 1.45, "learning_rate": 8.273813381167034e-05, "loss": 0.0103, "step": 558770 }, { "epoch": 1.45, "learning_rate": 8.273424559529888e-05, "loss": 0.0086, "step": 558780 }, { "epoch": 1.45, "learning_rate": 8.273035737892741e-05, "loss": 0.0085, "step": 558790 }, { "epoch": 1.45, "learning_rate": 8.272646916255595e-05, "loss": 0.0096, "step": 558800 }, { "epoch": 1.45, "learning_rate": 8.272258094618448e-05, "loss": 0.01, "step": 558810 }, { "epoch": 1.45, "learning_rate": 8.271869272981302e-05, "loss": 0.0118, "step": 558820 }, { "epoch": 1.45, "learning_rate": 8.271480451344155e-05, "loss": 0.0089, "step": 558830 }, { "epoch": 1.45, "learning_rate": 8.271091629707009e-05, "loss": 0.0094, "step": 558840 }, { "epoch": 1.45, "learning_rate": 8.270702808069862e-05, "loss": 0.0073, "step": 558850 }, { "epoch": 1.45, "learning_rate": 8.270313986432716e-05, "loss": 0.0099, "step": 558860 }, { "epoch": 1.45, "learning_rate": 8.269925164795569e-05, "loss": 0.0074, "step": 558870 }, { "epoch": 1.45, "learning_rate": 8.269536343158423e-05, "loss": 0.0088, "step": 558880 }, { "epoch": 1.45, "learning_rate": 8.269147521521276e-05, "loss": 0.0118, "step": 558890 }, { "epoch": 1.45, "learning_rate": 8.268758699884132e-05, "loss": 0.0107, "step": 558900 }, { "epoch": 1.45, "learning_rate": 8.268369878246984e-05, "loss": 0.0125, "step": 558910 }, { "epoch": 1.45, "learning_rate": 8.267981056609838e-05, "loss": 0.0083, "step": 558920 }, { "epoch": 1.45, "learning_rate": 8.267592234972691e-05, "loss": 0.0097, "step": 558930 }, { "epoch": 1.45, "learning_rate": 8.267203413335545e-05, "loss": 0.0075, "step": 558940 }, { "epoch": 1.45, "learning_rate": 8.266814591698398e-05, "loss": 0.0075, "step": 558950 }, { "epoch": 1.45, "learning_rate": 8.266425770061252e-05, "loss": 0.0088, "step": 558960 }, { "epoch": 1.45, "learning_rate": 8.266036948424105e-05, "loss": 0.0107, "step": 558970 }, { "epoch": 1.45, "learning_rate": 8.26564812678696e-05, "loss": 0.0105, "step": 558980 }, { "epoch": 1.45, "learning_rate": 8.265259305149812e-05, "loss": 0.0092, "step": 558990 }, { "epoch": 1.45, "learning_rate": 8.264870483512665e-05, "loss": 0.0097, "step": 559000 }, { "epoch": 1.45, "eval_cer": 0.8817138834186412, "eval_loss": 0.005990092176944017, "eval_runtime": 107.8601, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 559000 }, { "epoch": 1.45, "learning_rate": 8.264481661875519e-05, "loss": 0.0109, "step": 559010 }, { "epoch": 1.45, "learning_rate": 8.264092840238372e-05, "loss": 0.009, "step": 559020 }, { "epoch": 1.45, "learning_rate": 8.263704018601226e-05, "loss": 0.0098, "step": 559030 }, { "epoch": 1.45, "learning_rate": 8.263315196964079e-05, "loss": 0.0119, "step": 559040 }, { "epoch": 1.45, "learning_rate": 8.262926375326933e-05, "loss": 0.0159, "step": 559050 }, { "epoch": 1.45, "learning_rate": 8.262537553689786e-05, "loss": 0.0093, "step": 559060 }, { "epoch": 1.45, "learning_rate": 8.262148732052641e-05, "loss": 0.0106, "step": 559070 }, { "epoch": 1.45, "learning_rate": 8.261759910415493e-05, "loss": 0.0107, "step": 559080 }, { "epoch": 1.45, "learning_rate": 8.261371088778348e-05, "loss": 0.0071, "step": 559090 }, { "epoch": 1.45, "learning_rate": 8.260982267141201e-05, "loss": 0.0106, "step": 559100 }, { "epoch": 1.45, "learning_rate": 8.260593445504055e-05, "loss": 0.0113, "step": 559110 }, { "epoch": 1.45, "learning_rate": 8.260204623866908e-05, "loss": 0.0095, "step": 559120 }, { "epoch": 1.45, "learning_rate": 8.259815802229762e-05, "loss": 0.0113, "step": 559130 }, { "epoch": 1.45, "learning_rate": 8.259426980592615e-05, "loss": 0.0076, "step": 559140 }, { "epoch": 1.45, "learning_rate": 8.25903815895547e-05, "loss": 0.008, "step": 559150 }, { "epoch": 1.45, "learning_rate": 8.258649337318322e-05, "loss": 0.0144, "step": 559160 }, { "epoch": 1.45, "learning_rate": 8.258260515681176e-05, "loss": 0.0069, "step": 559170 }, { "epoch": 1.45, "learning_rate": 8.257871694044029e-05, "loss": 0.0134, "step": 559180 }, { "epoch": 1.45, "learning_rate": 8.257482872406883e-05, "loss": 0.0075, "step": 559190 }, { "epoch": 1.45, "learning_rate": 8.257094050769736e-05, "loss": 0.0177, "step": 559200 }, { "epoch": 1.45, "learning_rate": 8.25670522913259e-05, "loss": 0.0109, "step": 559210 }, { "epoch": 1.45, "learning_rate": 8.256316407495443e-05, "loss": 0.0099, "step": 559220 }, { "epoch": 1.45, "learning_rate": 8.255927585858299e-05, "loss": 0.0108, "step": 559230 }, { "epoch": 1.45, "learning_rate": 8.25553876422115e-05, "loss": 0.0128, "step": 559240 }, { "epoch": 1.45, "learning_rate": 8.255149942584003e-05, "loss": 0.0115, "step": 559250 }, { "epoch": 1.45, "learning_rate": 8.254761120946858e-05, "loss": 0.0088, "step": 559260 }, { "epoch": 1.45, "learning_rate": 8.254372299309711e-05, "loss": 0.0087, "step": 559270 }, { "epoch": 1.45, "learning_rate": 8.253983477672565e-05, "loss": 0.0082, "step": 559280 }, { "epoch": 1.45, "learning_rate": 8.253594656035418e-05, "loss": 0.0082, "step": 559290 }, { "epoch": 1.45, "learning_rate": 8.253205834398272e-05, "loss": 0.0085, "step": 559300 }, { "epoch": 1.45, "learning_rate": 8.252817012761125e-05, "loss": 0.0066, "step": 559310 }, { "epoch": 1.45, "learning_rate": 8.252428191123979e-05, "loss": 0.0076, "step": 559320 }, { "epoch": 1.45, "learning_rate": 8.252039369486832e-05, "loss": 0.0104, "step": 559330 }, { "epoch": 1.45, "learning_rate": 8.251650547849686e-05, "loss": 0.0077, "step": 559340 }, { "epoch": 1.45, "learning_rate": 8.251261726212539e-05, "loss": 0.0102, "step": 559350 }, { "epoch": 1.45, "learning_rate": 8.250872904575393e-05, "loss": 0.0128, "step": 559360 }, { "epoch": 1.45, "learning_rate": 8.250484082938246e-05, "loss": 0.0078, "step": 559370 }, { "epoch": 1.45, "learning_rate": 8.2500952613011e-05, "loss": 0.0086, "step": 559380 }, { "epoch": 1.45, "learning_rate": 8.249706439663953e-05, "loss": 0.0079, "step": 559390 }, { "epoch": 1.45, "learning_rate": 8.249317618026807e-05, "loss": 0.008, "step": 559400 }, { "epoch": 1.45, "learning_rate": 8.24892879638966e-05, "loss": 0.0116, "step": 559410 }, { "epoch": 1.45, "learning_rate": 8.248539974752516e-05, "loss": 0.0104, "step": 559420 }, { "epoch": 1.45, "learning_rate": 8.248151153115368e-05, "loss": 0.0084, "step": 559430 }, { "epoch": 1.45, "learning_rate": 8.247762331478222e-05, "loss": 0.0124, "step": 559440 }, { "epoch": 1.45, "learning_rate": 8.247373509841075e-05, "loss": 0.0099, "step": 559450 }, { "epoch": 1.45, "learning_rate": 8.24698468820393e-05, "loss": 0.0088, "step": 559460 }, { "epoch": 1.45, "learning_rate": 8.246595866566782e-05, "loss": 0.0088, "step": 559470 }, { "epoch": 1.45, "learning_rate": 8.246207044929636e-05, "loss": 0.0095, "step": 559480 }, { "epoch": 1.45, "learning_rate": 8.245818223292489e-05, "loss": 0.0086, "step": 559490 }, { "epoch": 1.45, "learning_rate": 8.245429401655342e-05, "loss": 0.0097, "step": 559500 }, { "epoch": 1.45, "learning_rate": 8.245040580018196e-05, "loss": 0.009, "step": 559510 }, { "epoch": 1.45, "learning_rate": 8.244651758381049e-05, "loss": 0.0099, "step": 559520 }, { "epoch": 1.45, "learning_rate": 8.244262936743903e-05, "loss": 0.0089, "step": 559530 }, { "epoch": 1.45, "learning_rate": 8.243874115106756e-05, "loss": 0.0107, "step": 559540 }, { "epoch": 1.45, "learning_rate": 8.24348529346961e-05, "loss": 0.0093, "step": 559550 }, { "epoch": 1.45, "learning_rate": 8.243096471832463e-05, "loss": 0.0132, "step": 559560 }, { "epoch": 1.45, "learning_rate": 8.242707650195317e-05, "loss": 0.009, "step": 559570 }, { "epoch": 1.45, "learning_rate": 8.24231882855817e-05, "loss": 0.0111, "step": 559580 }, { "epoch": 1.45, "learning_rate": 8.241930006921025e-05, "loss": 0.009, "step": 559590 }, { "epoch": 1.45, "learning_rate": 8.241541185283877e-05, "loss": 0.0088, "step": 559600 }, { "epoch": 1.45, "learning_rate": 8.241152363646732e-05, "loss": 0.0089, "step": 559610 }, { "epoch": 1.45, "learning_rate": 8.240763542009585e-05, "loss": 0.0088, "step": 559620 }, { "epoch": 1.45, "learning_rate": 8.24037472037244e-05, "loss": 0.011, "step": 559630 }, { "epoch": 1.45, "learning_rate": 8.239985898735292e-05, "loss": 0.011, "step": 559640 }, { "epoch": 1.45, "learning_rate": 8.239597077098146e-05, "loss": 0.0095, "step": 559650 }, { "epoch": 1.45, "learning_rate": 8.239208255460999e-05, "loss": 0.0096, "step": 559660 }, { "epoch": 1.45, "learning_rate": 8.238819433823853e-05, "loss": 0.0095, "step": 559670 }, { "epoch": 1.45, "learning_rate": 8.238430612186706e-05, "loss": 0.0077, "step": 559680 }, { "epoch": 1.45, "learning_rate": 8.23804179054956e-05, "loss": 0.0078, "step": 559690 }, { "epoch": 1.45, "learning_rate": 8.237652968912413e-05, "loss": 0.0113, "step": 559700 }, { "epoch": 1.45, "learning_rate": 8.237264147275267e-05, "loss": 0.0083, "step": 559710 }, { "epoch": 1.45, "learning_rate": 8.23687532563812e-05, "loss": 0.0088, "step": 559720 }, { "epoch": 1.45, "learning_rate": 8.236486504000973e-05, "loss": 0.0079, "step": 559730 }, { "epoch": 1.45, "learning_rate": 8.236097682363827e-05, "loss": 0.0086, "step": 559740 }, { "epoch": 1.45, "learning_rate": 8.23570886072668e-05, "loss": 0.0098, "step": 559750 }, { "epoch": 1.45, "learning_rate": 8.235320039089534e-05, "loss": 0.0072, "step": 559760 }, { "epoch": 1.45, "learning_rate": 8.234931217452387e-05, "loss": 0.0094, "step": 559770 }, { "epoch": 1.45, "learning_rate": 8.234542395815242e-05, "loss": 0.0079, "step": 559780 }, { "epoch": 1.45, "learning_rate": 8.234153574178095e-05, "loss": 0.0108, "step": 559790 }, { "epoch": 1.45, "learning_rate": 8.23376475254095e-05, "loss": 0.0085, "step": 559800 }, { "epoch": 1.45, "learning_rate": 8.233375930903802e-05, "loss": 0.0108, "step": 559810 }, { "epoch": 1.45, "learning_rate": 8.232987109266656e-05, "loss": 0.0079, "step": 559820 }, { "epoch": 1.45, "learning_rate": 8.232598287629509e-05, "loss": 0.0085, "step": 559830 }, { "epoch": 1.45, "learning_rate": 8.232209465992363e-05, "loss": 0.0118, "step": 559840 }, { "epoch": 1.45, "learning_rate": 8.231820644355216e-05, "loss": 0.01, "step": 559850 }, { "epoch": 1.45, "learning_rate": 8.23143182271807e-05, "loss": 0.0128, "step": 559860 }, { "epoch": 1.45, "learning_rate": 8.231043001080923e-05, "loss": 0.0101, "step": 559870 }, { "epoch": 1.45, "learning_rate": 8.230654179443777e-05, "loss": 0.0094, "step": 559880 }, { "epoch": 1.45, "learning_rate": 8.23026535780663e-05, "loss": 0.0089, "step": 559890 }, { "epoch": 1.45, "learning_rate": 8.229876536169484e-05, "loss": 0.0091, "step": 559900 }, { "epoch": 1.45, "learning_rate": 8.229487714532337e-05, "loss": 0.0098, "step": 559910 }, { "epoch": 1.45, "learning_rate": 8.229098892895191e-05, "loss": 0.0104, "step": 559920 }, { "epoch": 1.45, "learning_rate": 8.228710071258044e-05, "loss": 0.0096, "step": 559930 }, { "epoch": 1.45, "learning_rate": 8.2283212496209e-05, "loss": 0.0087, "step": 559940 }, { "epoch": 1.45, "learning_rate": 8.227932427983751e-05, "loss": 0.0107, "step": 559950 }, { "epoch": 1.45, "learning_rate": 8.227543606346606e-05, "loss": 0.0071, "step": 559960 }, { "epoch": 1.45, "learning_rate": 8.227154784709459e-05, "loss": 0.009, "step": 559970 }, { "epoch": 1.45, "learning_rate": 8.226765963072312e-05, "loss": 0.0095, "step": 559980 }, { "epoch": 1.45, "learning_rate": 8.226377141435166e-05, "loss": 0.0098, "step": 559990 }, { "epoch": 1.45, "learning_rate": 8.225988319798019e-05, "loss": 0.0105, "step": 560000 }, { "epoch": 1.45, "eval_cer": 0.881688689953826, "eval_loss": 0.00610503600910306, "eval_runtime": 108.0797, "eval_samples_per_second": 18.505, "eval_steps_per_second": 4.626, "step": 560000 }, { "epoch": 1.45, "learning_rate": 8.225599498160873e-05, "loss": 0.0116, "step": 560010 }, { "epoch": 1.45, "learning_rate": 8.225210676523726e-05, "loss": 0.0078, "step": 560020 }, { "epoch": 1.45, "learning_rate": 8.22482185488658e-05, "loss": 0.0082, "step": 560030 }, { "epoch": 1.45, "learning_rate": 8.224433033249433e-05, "loss": 0.0109, "step": 560040 }, { "epoch": 1.45, "learning_rate": 8.224044211612287e-05, "loss": 0.0103, "step": 560050 }, { "epoch": 1.45, "learning_rate": 8.22365538997514e-05, "loss": 0.0057, "step": 560060 }, { "epoch": 1.45, "learning_rate": 8.223266568337994e-05, "loss": 0.0099, "step": 560070 }, { "epoch": 1.45, "learning_rate": 8.222877746700847e-05, "loss": 0.0079, "step": 560080 }, { "epoch": 1.45, "learning_rate": 8.222488925063701e-05, "loss": 0.0088, "step": 560090 }, { "epoch": 1.45, "learning_rate": 8.222100103426554e-05, "loss": 0.0078, "step": 560100 }, { "epoch": 1.45, "learning_rate": 8.221711281789408e-05, "loss": 0.0098, "step": 560110 }, { "epoch": 1.45, "learning_rate": 8.221322460152261e-05, "loss": 0.0107, "step": 560120 }, { "epoch": 1.45, "learning_rate": 8.220933638515116e-05, "loss": 0.0105, "step": 560130 }, { "epoch": 1.45, "learning_rate": 8.220544816877969e-05, "loss": 0.0106, "step": 560140 }, { "epoch": 1.45, "learning_rate": 8.220155995240823e-05, "loss": 0.0103, "step": 560150 }, { "epoch": 1.45, "learning_rate": 8.219767173603676e-05, "loss": 0.0081, "step": 560160 }, { "epoch": 1.45, "learning_rate": 8.21937835196653e-05, "loss": 0.009, "step": 560170 }, { "epoch": 1.45, "learning_rate": 8.218989530329383e-05, "loss": 0.0063, "step": 560180 }, { "epoch": 1.45, "learning_rate": 8.218600708692237e-05, "loss": 0.0121, "step": 560190 }, { "epoch": 1.45, "learning_rate": 8.21821188705509e-05, "loss": 0.0086, "step": 560200 }, { "epoch": 1.45, "learning_rate": 8.217823065417944e-05, "loss": 0.0115, "step": 560210 }, { "epoch": 1.45, "learning_rate": 8.217434243780797e-05, "loss": 0.0084, "step": 560220 }, { "epoch": 1.45, "learning_rate": 8.21704542214365e-05, "loss": 0.009, "step": 560230 }, { "epoch": 1.45, "learning_rate": 8.216656600506504e-05, "loss": 0.0128, "step": 560240 }, { "epoch": 1.45, "learning_rate": 8.216267778869357e-05, "loss": 0.0099, "step": 560250 }, { "epoch": 1.45, "learning_rate": 8.215878957232211e-05, "loss": 0.0088, "step": 560260 }, { "epoch": 1.45, "learning_rate": 8.215490135595064e-05, "loss": 0.0101, "step": 560270 }, { "epoch": 1.45, "learning_rate": 8.215101313957918e-05, "loss": 0.0115, "step": 560280 }, { "epoch": 1.45, "learning_rate": 8.214712492320771e-05, "loss": 0.0094, "step": 560290 }, { "epoch": 1.45, "learning_rate": 8.214323670683626e-05, "loss": 0.0092, "step": 560300 }, { "epoch": 1.45, "learning_rate": 8.213934849046478e-05, "loss": 0.0084, "step": 560310 }, { "epoch": 1.45, "learning_rate": 8.213546027409333e-05, "loss": 0.0128, "step": 560320 }, { "epoch": 1.45, "learning_rate": 8.213157205772186e-05, "loss": 0.0086, "step": 560330 }, { "epoch": 1.45, "learning_rate": 8.21276838413504e-05, "loss": 0.0118, "step": 560340 }, { "epoch": 1.45, "learning_rate": 8.212379562497893e-05, "loss": 0.0113, "step": 560350 }, { "epoch": 1.45, "learning_rate": 8.211990740860747e-05, "loss": 0.0081, "step": 560360 }, { "epoch": 1.45, "learning_rate": 8.2116019192236e-05, "loss": 0.0072, "step": 560370 }, { "epoch": 1.45, "learning_rate": 8.211213097586454e-05, "loss": 0.0073, "step": 560380 }, { "epoch": 1.45, "learning_rate": 8.210824275949307e-05, "loss": 0.0091, "step": 560390 }, { "epoch": 1.45, "learning_rate": 8.210435454312161e-05, "loss": 0.0081, "step": 560400 }, { "epoch": 1.45, "learning_rate": 8.210046632675014e-05, "loss": 0.0091, "step": 560410 }, { "epoch": 1.45, "learning_rate": 8.209657811037868e-05, "loss": 0.0082, "step": 560420 }, { "epoch": 1.45, "learning_rate": 8.209268989400721e-05, "loss": 0.0076, "step": 560430 }, { "epoch": 1.45, "learning_rate": 8.208880167763575e-05, "loss": 0.0092, "step": 560440 }, { "epoch": 1.45, "learning_rate": 8.208491346126428e-05, "loss": 0.0078, "step": 560450 }, { "epoch": 1.45, "learning_rate": 8.208102524489283e-05, "loss": 0.0094, "step": 560460 }, { "epoch": 1.45, "learning_rate": 8.207713702852135e-05, "loss": 0.0074, "step": 560470 }, { "epoch": 1.45, "learning_rate": 8.207324881214988e-05, "loss": 0.0075, "step": 560480 }, { "epoch": 1.45, "learning_rate": 8.206936059577843e-05, "loss": 0.0066, "step": 560490 }, { "epoch": 1.45, "learning_rate": 8.206547237940696e-05, "loss": 0.0115, "step": 560500 }, { "epoch": 1.45, "learning_rate": 8.20615841630355e-05, "loss": 0.0102, "step": 560510 }, { "epoch": 1.45, "learning_rate": 8.205769594666403e-05, "loss": 0.0096, "step": 560520 }, { "epoch": 1.45, "learning_rate": 8.205380773029257e-05, "loss": 0.0088, "step": 560530 }, { "epoch": 1.45, "learning_rate": 8.20499195139211e-05, "loss": 0.0093, "step": 560540 }, { "epoch": 1.45, "learning_rate": 8.204603129754964e-05, "loss": 0.0091, "step": 560550 }, { "epoch": 1.45, "learning_rate": 8.204214308117817e-05, "loss": 0.0073, "step": 560560 }, { "epoch": 1.45, "learning_rate": 8.203825486480671e-05, "loss": 0.0084, "step": 560570 }, { "epoch": 1.45, "learning_rate": 8.203436664843524e-05, "loss": 0.0087, "step": 560580 }, { "epoch": 1.45, "learning_rate": 8.203047843206378e-05, "loss": 0.0111, "step": 560590 }, { "epoch": 1.45, "learning_rate": 8.202659021569231e-05, "loss": 0.0097, "step": 560600 }, { "epoch": 1.45, "learning_rate": 8.202270199932085e-05, "loss": 0.0114, "step": 560610 }, { "epoch": 1.45, "learning_rate": 8.201881378294938e-05, "loss": 0.0099, "step": 560620 }, { "epoch": 1.45, "learning_rate": 8.201492556657792e-05, "loss": 0.009, "step": 560630 }, { "epoch": 1.45, "learning_rate": 8.201103735020645e-05, "loss": 0.0083, "step": 560640 }, { "epoch": 1.45, "learning_rate": 8.2007149133835e-05, "loss": 0.0115, "step": 560650 }, { "epoch": 1.45, "learning_rate": 8.200326091746353e-05, "loss": 0.0107, "step": 560660 }, { "epoch": 1.45, "learning_rate": 8.199937270109207e-05, "loss": 0.0104, "step": 560670 }, { "epoch": 1.45, "learning_rate": 8.19954844847206e-05, "loss": 0.0107, "step": 560680 }, { "epoch": 1.45, "learning_rate": 8.199159626834914e-05, "loss": 0.0084, "step": 560690 }, { "epoch": 1.45, "learning_rate": 8.198770805197767e-05, "loss": 0.0106, "step": 560700 }, { "epoch": 1.45, "learning_rate": 8.198381983560621e-05, "loss": 0.0081, "step": 560710 }, { "epoch": 1.45, "learning_rate": 8.197993161923474e-05, "loss": 0.0105, "step": 560720 }, { "epoch": 1.45, "learning_rate": 8.197604340286327e-05, "loss": 0.0095, "step": 560730 }, { "epoch": 1.45, "learning_rate": 8.197215518649181e-05, "loss": 0.0093, "step": 560740 }, { "epoch": 1.45, "learning_rate": 8.196826697012034e-05, "loss": 0.0103, "step": 560750 }, { "epoch": 1.45, "learning_rate": 8.196437875374888e-05, "loss": 0.011, "step": 560760 }, { "epoch": 1.45, "learning_rate": 8.196049053737741e-05, "loss": 0.0069, "step": 560770 }, { "epoch": 1.45, "learning_rate": 8.195660232100595e-05, "loss": 0.008, "step": 560780 }, { "epoch": 1.45, "learning_rate": 8.195271410463448e-05, "loss": 0.0103, "step": 560790 }, { "epoch": 1.45, "learning_rate": 8.194882588826302e-05, "loss": 0.0089, "step": 560800 }, { "epoch": 1.45, "learning_rate": 8.194493767189155e-05, "loss": 0.0082, "step": 560810 }, { "epoch": 1.45, "learning_rate": 8.19410494555201e-05, "loss": 0.0094, "step": 560820 }, { "epoch": 1.45, "learning_rate": 8.193716123914862e-05, "loss": 0.0105, "step": 560830 }, { "epoch": 1.45, "learning_rate": 8.193327302277717e-05, "loss": 0.0094, "step": 560840 }, { "epoch": 1.45, "learning_rate": 8.19293848064057e-05, "loss": 0.0083, "step": 560850 }, { "epoch": 1.45, "learning_rate": 8.192549659003424e-05, "loss": 0.0086, "step": 560860 }, { "epoch": 1.45, "learning_rate": 8.192160837366277e-05, "loss": 0.0074, "step": 560870 }, { "epoch": 1.45, "learning_rate": 8.191772015729131e-05, "loss": 0.0088, "step": 560880 }, { "epoch": 1.45, "learning_rate": 8.191383194091984e-05, "loss": 0.0111, "step": 560890 }, { "epoch": 1.45, "learning_rate": 8.190994372454838e-05, "loss": 0.0079, "step": 560900 }, { "epoch": 1.45, "learning_rate": 8.190605550817691e-05, "loss": 0.0077, "step": 560910 }, { "epoch": 1.45, "learning_rate": 8.190216729180545e-05, "loss": 0.0104, "step": 560920 }, { "epoch": 1.45, "learning_rate": 8.189827907543398e-05, "loss": 0.0107, "step": 560930 }, { "epoch": 1.45, "learning_rate": 8.189439085906252e-05, "loss": 0.0076, "step": 560940 }, { "epoch": 1.45, "learning_rate": 8.189050264269105e-05, "loss": 0.0085, "step": 560950 }, { "epoch": 1.45, "learning_rate": 8.188661442631959e-05, "loss": 0.009, "step": 560960 }, { "epoch": 1.45, "learning_rate": 8.188272620994812e-05, "loss": 0.0067, "step": 560970 }, { "epoch": 1.45, "learning_rate": 8.187883799357665e-05, "loss": 0.0079, "step": 560980 }, { "epoch": 1.45, "learning_rate": 8.187494977720519e-05, "loss": 0.0074, "step": 560990 }, { "epoch": 1.45, "learning_rate": 8.187106156083372e-05, "loss": 0.0194, "step": 561000 }, { "epoch": 1.45, "eval_cer": 0.8816984874123652, "eval_loss": 0.00594002241268754, "eval_runtime": 107.9686, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 561000 }, { "epoch": 1.45, "learning_rate": 8.186717334446227e-05, "loss": 0.0074, "step": 561010 }, { "epoch": 1.45, "learning_rate": 8.18632851280908e-05, "loss": 0.0106, "step": 561020 }, { "epoch": 1.45, "learning_rate": 8.185939691171934e-05, "loss": 0.0109, "step": 561030 }, { "epoch": 1.45, "learning_rate": 8.185550869534787e-05, "loss": 0.0063, "step": 561040 }, { "epoch": 1.45, "learning_rate": 8.185162047897641e-05, "loss": 0.008, "step": 561050 }, { "epoch": 1.45, "learning_rate": 8.184773226260494e-05, "loss": 0.0083, "step": 561060 }, { "epoch": 1.45, "learning_rate": 8.184384404623348e-05, "loss": 0.0096, "step": 561070 }, { "epoch": 1.45, "learning_rate": 8.183995582986201e-05, "loss": 0.0106, "step": 561080 }, { "epoch": 1.45, "learning_rate": 8.183606761349055e-05, "loss": 0.0096, "step": 561090 }, { "epoch": 1.45, "learning_rate": 8.183217939711908e-05, "loss": 0.0086, "step": 561100 }, { "epoch": 1.45, "learning_rate": 8.182829118074762e-05, "loss": 0.0075, "step": 561110 }, { "epoch": 1.45, "learning_rate": 8.182440296437615e-05, "loss": 0.0101, "step": 561120 }, { "epoch": 1.45, "learning_rate": 8.182051474800469e-05, "loss": 0.0092, "step": 561130 }, { "epoch": 1.45, "learning_rate": 8.181662653163322e-05, "loss": 0.012, "step": 561140 }, { "epoch": 1.45, "learning_rate": 8.181273831526176e-05, "loss": 0.008, "step": 561150 }, { "epoch": 1.45, "learning_rate": 8.180885009889029e-05, "loss": 0.0093, "step": 561160 }, { "epoch": 1.45, "learning_rate": 8.180496188251884e-05, "loss": 0.0136, "step": 561170 }, { "epoch": 1.45, "learning_rate": 8.180107366614737e-05, "loss": 0.0093, "step": 561180 }, { "epoch": 1.45, "learning_rate": 8.179718544977591e-05, "loss": 0.0114, "step": 561190 }, { "epoch": 1.45, "learning_rate": 8.179329723340444e-05, "loss": 0.0107, "step": 561200 }, { "epoch": 1.45, "learning_rate": 8.178940901703298e-05, "loss": 0.0112, "step": 561210 }, { "epoch": 1.45, "learning_rate": 8.178552080066151e-05, "loss": 0.0106, "step": 561220 }, { "epoch": 1.45, "learning_rate": 8.178163258429004e-05, "loss": 0.0086, "step": 561230 }, { "epoch": 1.45, "learning_rate": 8.177774436791858e-05, "loss": 0.0062, "step": 561240 }, { "epoch": 1.45, "learning_rate": 8.177385615154711e-05, "loss": 0.0086, "step": 561250 }, { "epoch": 1.45, "learning_rate": 8.176996793517565e-05, "loss": 0.0074, "step": 561260 }, { "epoch": 1.45, "learning_rate": 8.176607971880418e-05, "loss": 0.0098, "step": 561270 }, { "epoch": 1.45, "learning_rate": 8.176219150243272e-05, "loss": 0.0074, "step": 561280 }, { "epoch": 1.45, "learning_rate": 8.175830328606125e-05, "loss": 0.0121, "step": 561290 }, { "epoch": 1.45, "learning_rate": 8.175441506968979e-05, "loss": 0.0135, "step": 561300 }, { "epoch": 1.45, "learning_rate": 8.175052685331832e-05, "loss": 0.0101, "step": 561310 }, { "epoch": 1.46, "learning_rate": 8.174663863694686e-05, "loss": 0.0126, "step": 561320 }, { "epoch": 1.46, "learning_rate": 8.174275042057539e-05, "loss": 0.0063, "step": 561330 }, { "epoch": 1.46, "learning_rate": 8.173886220420393e-05, "loss": 0.0092, "step": 561340 }, { "epoch": 1.46, "learning_rate": 8.173497398783246e-05, "loss": 0.0087, "step": 561350 }, { "epoch": 1.46, "learning_rate": 8.173108577146101e-05, "loss": 0.0073, "step": 561360 }, { "epoch": 1.46, "learning_rate": 8.172719755508954e-05, "loss": 0.0085, "step": 561370 }, { "epoch": 1.46, "learning_rate": 8.172330933871808e-05, "loss": 0.0089, "step": 561380 }, { "epoch": 1.46, "learning_rate": 8.171942112234661e-05, "loss": 0.0107, "step": 561390 }, { "epoch": 1.46, "learning_rate": 8.171553290597515e-05, "loss": 0.0146, "step": 561400 }, { "epoch": 1.46, "learning_rate": 8.171164468960368e-05, "loss": 0.0086, "step": 561410 }, { "epoch": 1.46, "learning_rate": 8.170775647323222e-05, "loss": 0.0075, "step": 561420 }, { "epoch": 1.46, "learning_rate": 8.170386825686075e-05, "loss": 0.0081, "step": 561430 }, { "epoch": 1.46, "learning_rate": 8.169998004048929e-05, "loss": 0.0096, "step": 561440 }, { "epoch": 1.46, "learning_rate": 8.169609182411782e-05, "loss": 0.0075, "step": 561450 }, { "epoch": 1.46, "learning_rate": 8.169220360774636e-05, "loss": 0.0101, "step": 561460 }, { "epoch": 1.46, "learning_rate": 8.168831539137489e-05, "loss": 0.0119, "step": 561470 }, { "epoch": 1.46, "learning_rate": 8.168442717500342e-05, "loss": 0.0105, "step": 561480 }, { "epoch": 1.46, "learning_rate": 8.168053895863196e-05, "loss": 0.0104, "step": 561490 }, { "epoch": 1.46, "learning_rate": 8.167665074226049e-05, "loss": 0.008, "step": 561500 }, { "epoch": 1.46, "learning_rate": 8.167276252588903e-05, "loss": 0.0084, "step": 561510 }, { "epoch": 1.46, "learning_rate": 8.166887430951756e-05, "loss": 0.0099, "step": 561520 }, { "epoch": 1.46, "learning_rate": 8.166498609314611e-05, "loss": 0.0104, "step": 561530 }, { "epoch": 1.46, "learning_rate": 8.166109787677463e-05, "loss": 0.0078, "step": 561540 }, { "epoch": 1.46, "learning_rate": 8.165720966040318e-05, "loss": 0.011, "step": 561550 }, { "epoch": 1.46, "learning_rate": 8.165332144403171e-05, "loss": 0.0093, "step": 561560 }, { "epoch": 1.46, "learning_rate": 8.164943322766025e-05, "loss": 0.0068, "step": 561570 }, { "epoch": 1.46, "learning_rate": 8.164554501128878e-05, "loss": 0.0086, "step": 561580 }, { "epoch": 1.46, "learning_rate": 8.164165679491732e-05, "loss": 0.0099, "step": 561590 }, { "epoch": 1.46, "learning_rate": 8.163776857854585e-05, "loss": 0.0109, "step": 561600 }, { "epoch": 1.46, "learning_rate": 8.163388036217439e-05, "loss": 0.0092, "step": 561610 }, { "epoch": 1.46, "learning_rate": 8.162999214580292e-05, "loss": 0.008, "step": 561620 }, { "epoch": 1.46, "learning_rate": 8.162610392943146e-05, "loss": 0.0091, "step": 561630 }, { "epoch": 1.46, "learning_rate": 8.162221571305999e-05, "loss": 0.0093, "step": 561640 }, { "epoch": 1.46, "learning_rate": 8.161832749668853e-05, "loss": 0.0085, "step": 561650 }, { "epoch": 1.46, "learning_rate": 8.161443928031706e-05, "loss": 0.0091, "step": 561660 }, { "epoch": 1.46, "learning_rate": 8.16105510639456e-05, "loss": 0.0098, "step": 561670 }, { "epoch": 1.46, "learning_rate": 8.160666284757413e-05, "loss": 0.0097, "step": 561680 }, { "epoch": 1.46, "learning_rate": 8.160277463120268e-05, "loss": 0.0097, "step": 561690 }, { "epoch": 1.46, "learning_rate": 8.15988864148312e-05, "loss": 0.0083, "step": 561700 }, { "epoch": 1.46, "learning_rate": 8.159499819845975e-05, "loss": 0.0099, "step": 561710 }, { "epoch": 1.46, "learning_rate": 8.159110998208828e-05, "loss": 0.0057, "step": 561720 }, { "epoch": 1.46, "learning_rate": 8.158722176571681e-05, "loss": 0.0095, "step": 561730 }, { "epoch": 1.46, "learning_rate": 8.158333354934535e-05, "loss": 0.0082, "step": 561740 }, { "epoch": 1.46, "learning_rate": 8.157944533297388e-05, "loss": 0.0157, "step": 561750 }, { "epoch": 1.46, "learning_rate": 8.157555711660242e-05, "loss": 0.0084, "step": 561760 }, { "epoch": 1.46, "learning_rate": 8.157166890023095e-05, "loss": 0.0089, "step": 561770 }, { "epoch": 1.46, "learning_rate": 8.156778068385949e-05, "loss": 0.0119, "step": 561780 }, { "epoch": 1.46, "learning_rate": 8.156389246748802e-05, "loss": 0.0085, "step": 561790 }, { "epoch": 1.46, "learning_rate": 8.156000425111656e-05, "loss": 0.0094, "step": 561800 }, { "epoch": 1.46, "learning_rate": 8.155611603474509e-05, "loss": 0.01, "step": 561810 }, { "epoch": 1.46, "learning_rate": 8.155222781837363e-05, "loss": 0.0145, "step": 561820 }, { "epoch": 1.46, "learning_rate": 8.154833960200216e-05, "loss": 0.0123, "step": 561830 }, { "epoch": 1.46, "learning_rate": 8.15444513856307e-05, "loss": 0.0089, "step": 561840 }, { "epoch": 1.46, "learning_rate": 8.154056316925923e-05, "loss": 0.0079, "step": 561850 }, { "epoch": 1.46, "learning_rate": 8.153667495288777e-05, "loss": 0.0124, "step": 561860 }, { "epoch": 1.46, "learning_rate": 8.15327867365163e-05, "loss": 0.0088, "step": 561870 }, { "epoch": 1.46, "learning_rate": 8.152889852014485e-05, "loss": 0.0089, "step": 561880 }, { "epoch": 1.46, "learning_rate": 8.152501030377338e-05, "loss": 0.01, "step": 561890 }, { "epoch": 1.46, "learning_rate": 8.152112208740192e-05, "loss": 0.0096, "step": 561900 }, { "epoch": 1.46, "learning_rate": 8.151723387103045e-05, "loss": 0.0091, "step": 561910 }, { "epoch": 1.46, "learning_rate": 8.151334565465899e-05, "loss": 0.0087, "step": 561920 }, { "epoch": 1.46, "learning_rate": 8.150945743828752e-05, "loss": 0.0078, "step": 561930 }, { "epoch": 1.46, "learning_rate": 8.150556922191606e-05, "loss": 0.0103, "step": 561940 }, { "epoch": 1.46, "learning_rate": 8.150168100554459e-05, "loss": 0.0097, "step": 561950 }, { "epoch": 1.46, "learning_rate": 8.149779278917313e-05, "loss": 0.0097, "step": 561960 }, { "epoch": 1.46, "learning_rate": 8.149390457280166e-05, "loss": 0.0135, "step": 561970 }, { "epoch": 1.46, "learning_rate": 8.149001635643019e-05, "loss": 0.0073, "step": 561980 }, { "epoch": 1.46, "learning_rate": 8.148612814005873e-05, "loss": 0.0124, "step": 561990 }, { "epoch": 1.46, "learning_rate": 8.148223992368726e-05, "loss": 0.0098, "step": 562000 }, { "epoch": 1.46, "eval_cer": 0.8816942885015627, "eval_loss": 0.006133432034403086, "eval_runtime": 107.8225, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 562000 }, { "epoch": 1.46, "learning_rate": 8.14783517073158e-05, "loss": 0.0069, "step": 562010 }, { "epoch": 1.46, "learning_rate": 8.147446349094433e-05, "loss": 0.0077, "step": 562020 }, { "epoch": 1.46, "learning_rate": 8.147057527457287e-05, "loss": 0.0082, "step": 562030 }, { "epoch": 1.46, "learning_rate": 8.14666870582014e-05, "loss": 0.0091, "step": 562040 }, { "epoch": 1.46, "learning_rate": 8.146279884182995e-05, "loss": 0.0094, "step": 562050 }, { "epoch": 1.46, "learning_rate": 8.145891062545847e-05, "loss": 0.0081, "step": 562060 }, { "epoch": 1.46, "learning_rate": 8.145502240908702e-05, "loss": 0.0108, "step": 562070 }, { "epoch": 1.46, "learning_rate": 8.145113419271555e-05, "loss": 0.0109, "step": 562080 }, { "epoch": 1.46, "learning_rate": 8.144724597634409e-05, "loss": 0.0117, "step": 562090 }, { "epoch": 1.46, "learning_rate": 8.144335775997262e-05, "loss": 0.0124, "step": 562100 }, { "epoch": 1.46, "learning_rate": 8.143946954360116e-05, "loss": 0.0103, "step": 562110 }, { "epoch": 1.46, "learning_rate": 8.143558132722969e-05, "loss": 0.0073, "step": 562120 }, { "epoch": 1.46, "learning_rate": 8.143169311085823e-05, "loss": 0.0107, "step": 562130 }, { "epoch": 1.46, "learning_rate": 8.142780489448676e-05, "loss": 0.0068, "step": 562140 }, { "epoch": 1.46, "learning_rate": 8.14239166781153e-05, "loss": 0.0067, "step": 562150 }, { "epoch": 1.46, "learning_rate": 8.142002846174383e-05, "loss": 0.0098, "step": 562160 }, { "epoch": 1.46, "learning_rate": 8.141614024537237e-05, "loss": 0.0101, "step": 562170 }, { "epoch": 1.46, "learning_rate": 8.14122520290009e-05, "loss": 0.0093, "step": 562180 }, { "epoch": 1.46, "learning_rate": 8.140836381262944e-05, "loss": 0.011, "step": 562190 }, { "epoch": 1.46, "learning_rate": 8.140447559625797e-05, "loss": 0.0113, "step": 562200 }, { "epoch": 1.46, "learning_rate": 8.14005873798865e-05, "loss": 0.0089, "step": 562210 }, { "epoch": 1.46, "learning_rate": 8.139669916351504e-05, "loss": 0.0093, "step": 562220 }, { "epoch": 1.46, "learning_rate": 8.139281094714357e-05, "loss": 0.0103, "step": 562230 }, { "epoch": 1.46, "learning_rate": 8.138892273077212e-05, "loss": 0.013, "step": 562240 }, { "epoch": 1.46, "learning_rate": 8.138503451440065e-05, "loss": 0.0077, "step": 562250 }, { "epoch": 1.46, "learning_rate": 8.138114629802919e-05, "loss": 0.0087, "step": 562260 }, { "epoch": 1.46, "learning_rate": 8.137725808165772e-05, "loss": 0.0092, "step": 562270 }, { "epoch": 1.46, "learning_rate": 8.137336986528626e-05, "loss": 0.0077, "step": 562280 }, { "epoch": 1.46, "learning_rate": 8.136948164891479e-05, "loss": 0.0088, "step": 562290 }, { "epoch": 1.46, "learning_rate": 8.136559343254333e-05, "loss": 0.0083, "step": 562300 }, { "epoch": 1.46, "learning_rate": 8.136170521617186e-05, "loss": 0.0078, "step": 562310 }, { "epoch": 1.46, "learning_rate": 8.13578169998004e-05, "loss": 0.0097, "step": 562320 }, { "epoch": 1.46, "learning_rate": 8.135392878342893e-05, "loss": 0.0107, "step": 562330 }, { "epoch": 1.46, "learning_rate": 8.135004056705747e-05, "loss": 0.0074, "step": 562340 }, { "epoch": 1.46, "learning_rate": 8.1346152350686e-05, "loss": 0.011, "step": 562350 }, { "epoch": 1.46, "learning_rate": 8.134226413431454e-05, "loss": 0.0067, "step": 562360 }, { "epoch": 1.46, "learning_rate": 8.133837591794307e-05, "loss": 0.0102, "step": 562370 }, { "epoch": 1.46, "learning_rate": 8.133448770157161e-05, "loss": 0.0095, "step": 562380 }, { "epoch": 1.46, "learning_rate": 8.133059948520014e-05, "loss": 0.0129, "step": 562390 }, { "epoch": 1.46, "learning_rate": 8.132671126882869e-05, "loss": 0.008, "step": 562400 }, { "epoch": 1.46, "learning_rate": 8.132282305245722e-05, "loss": 0.0094, "step": 562410 }, { "epoch": 1.46, "learning_rate": 8.131893483608576e-05, "loss": 0.0097, "step": 562420 }, { "epoch": 1.46, "learning_rate": 8.131504661971429e-05, "loss": 0.0136, "step": 562430 }, { "epoch": 1.46, "learning_rate": 8.131115840334283e-05, "loss": 0.0121, "step": 562440 }, { "epoch": 1.46, "learning_rate": 8.130727018697136e-05, "loss": 0.0137, "step": 562450 }, { "epoch": 1.46, "learning_rate": 8.130338197059989e-05, "loss": 0.0098, "step": 562460 }, { "epoch": 1.46, "learning_rate": 8.129949375422843e-05, "loss": 0.0108, "step": 562470 }, { "epoch": 1.46, "learning_rate": 8.129560553785696e-05, "loss": 0.0141, "step": 562480 }, { "epoch": 1.46, "learning_rate": 8.12917173214855e-05, "loss": 0.009, "step": 562490 }, { "epoch": 1.46, "learning_rate": 8.128782910511403e-05, "loss": 0.0071, "step": 562500 }, { "epoch": 1.46, "learning_rate": 8.128394088874257e-05, "loss": 0.0076, "step": 562510 }, { "epoch": 1.46, "learning_rate": 8.12800526723711e-05, "loss": 0.0105, "step": 562520 }, { "epoch": 1.46, "learning_rate": 8.127616445599964e-05, "loss": 0.0068, "step": 562530 }, { "epoch": 1.46, "learning_rate": 8.127227623962817e-05, "loss": 0.0122, "step": 562540 }, { "epoch": 1.46, "learning_rate": 8.126838802325671e-05, "loss": 0.0077, "step": 562550 }, { "epoch": 1.46, "learning_rate": 8.126449980688524e-05, "loss": 0.009, "step": 562560 }, { "epoch": 1.46, "learning_rate": 8.126061159051379e-05, "loss": 0.0085, "step": 562570 }, { "epoch": 1.46, "learning_rate": 8.125672337414231e-05, "loss": 0.0091, "step": 562580 }, { "epoch": 1.46, "learning_rate": 8.125283515777086e-05, "loss": 0.0097, "step": 562590 }, { "epoch": 1.46, "learning_rate": 8.124894694139939e-05, "loss": 0.0098, "step": 562600 }, { "epoch": 1.46, "learning_rate": 8.124505872502793e-05, "loss": 0.0096, "step": 562610 }, { "epoch": 1.46, "learning_rate": 8.124117050865646e-05, "loss": 0.0118, "step": 562620 }, { "epoch": 1.46, "learning_rate": 8.1237282292285e-05, "loss": 0.0098, "step": 562630 }, { "epoch": 1.46, "learning_rate": 8.123339407591353e-05, "loss": 0.0098, "step": 562640 }, { "epoch": 1.46, "learning_rate": 8.122950585954207e-05, "loss": 0.0089, "step": 562650 }, { "epoch": 1.46, "learning_rate": 8.12256176431706e-05, "loss": 0.0087, "step": 562660 }, { "epoch": 1.46, "learning_rate": 8.122172942679914e-05, "loss": 0.0076, "step": 562670 }, { "epoch": 1.46, "learning_rate": 8.121784121042767e-05, "loss": 0.0134, "step": 562680 }, { "epoch": 1.46, "learning_rate": 8.121395299405621e-05, "loss": 0.0098, "step": 562690 }, { "epoch": 1.46, "learning_rate": 8.121006477768474e-05, "loss": 0.009, "step": 562700 }, { "epoch": 1.46, "learning_rate": 8.120617656131327e-05, "loss": 0.0064, "step": 562710 }, { "epoch": 1.46, "learning_rate": 8.120228834494181e-05, "loss": 0.0101, "step": 562720 }, { "epoch": 1.46, "learning_rate": 8.119840012857034e-05, "loss": 0.0161, "step": 562730 }, { "epoch": 1.46, "learning_rate": 8.119451191219888e-05, "loss": 0.0088, "step": 562740 }, { "epoch": 1.46, "learning_rate": 8.11906236958274e-05, "loss": 0.0076, "step": 562750 }, { "epoch": 1.46, "learning_rate": 8.118673547945596e-05, "loss": 0.008, "step": 562760 }, { "epoch": 1.46, "learning_rate": 8.118284726308449e-05, "loss": 0.0068, "step": 562770 }, { "epoch": 1.46, "learning_rate": 8.117895904671303e-05, "loss": 0.0068, "step": 562780 }, { "epoch": 1.46, "learning_rate": 8.117507083034156e-05, "loss": 0.0067, "step": 562790 }, { "epoch": 1.46, "learning_rate": 8.11711826139701e-05, "loss": 0.0074, "step": 562800 }, { "epoch": 1.46, "learning_rate": 8.116729439759863e-05, "loss": 0.0109, "step": 562810 }, { "epoch": 1.46, "learning_rate": 8.116340618122717e-05, "loss": 0.0074, "step": 562820 }, { "epoch": 1.46, "learning_rate": 8.11595179648557e-05, "loss": 0.0101, "step": 562830 }, { "epoch": 1.46, "learning_rate": 8.115562974848424e-05, "loss": 0.007, "step": 562840 }, { "epoch": 1.46, "learning_rate": 8.115174153211277e-05, "loss": 0.0071, "step": 562850 }, { "epoch": 1.46, "learning_rate": 8.114785331574131e-05, "loss": 0.008, "step": 562860 }, { "epoch": 1.46, "learning_rate": 8.114396509936984e-05, "loss": 0.0129, "step": 562870 }, { "epoch": 1.46, "learning_rate": 8.114007688299838e-05, "loss": 0.0087, "step": 562880 }, { "epoch": 1.46, "learning_rate": 8.113618866662691e-05, "loss": 0.008, "step": 562890 }, { "epoch": 1.46, "learning_rate": 8.113230045025545e-05, "loss": 0.0126, "step": 562900 }, { "epoch": 1.46, "learning_rate": 8.112841223388398e-05, "loss": 0.0109, "step": 562910 }, { "epoch": 1.46, "learning_rate": 8.112452401751253e-05, "loss": 0.0058, "step": 562920 }, { "epoch": 1.46, "learning_rate": 8.112063580114105e-05, "loss": 0.0081, "step": 562930 }, { "epoch": 1.46, "learning_rate": 8.11167475847696e-05, "loss": 0.0088, "step": 562940 }, { "epoch": 1.46, "learning_rate": 8.111285936839813e-05, "loss": 0.0087, "step": 562950 }, { "epoch": 1.46, "learning_rate": 8.110897115202666e-05, "loss": 0.0079, "step": 562960 }, { "epoch": 1.46, "learning_rate": 8.11050829356552e-05, "loss": 0.0119, "step": 562970 }, { "epoch": 1.46, "learning_rate": 8.110119471928373e-05, "loss": 0.0105, "step": 562980 }, { "epoch": 1.46, "learning_rate": 8.109730650291227e-05, "loss": 0.0067, "step": 562990 }, { "epoch": 1.46, "learning_rate": 8.10934182865408e-05, "loss": 0.009, "step": 563000 }, { "epoch": 1.46, "eval_cer": 0.8816942885015627, "eval_loss": 0.0060217659920454025, "eval_runtime": 108.0142, "eval_samples_per_second": 18.516, "eval_steps_per_second": 4.629, "step": 563000 }, { "epoch": 1.46, "learning_rate": 8.108953007016934e-05, "loss": 0.0124, "step": 563010 }, { "epoch": 1.46, "learning_rate": 8.108564185379787e-05, "loss": 0.008, "step": 563020 }, { "epoch": 1.46, "learning_rate": 8.108175363742641e-05, "loss": 0.0089, "step": 563030 }, { "epoch": 1.46, "learning_rate": 8.107786542105494e-05, "loss": 0.0234, "step": 563040 }, { "epoch": 1.46, "learning_rate": 8.107397720468348e-05, "loss": 0.0133, "step": 563050 }, { "epoch": 1.46, "learning_rate": 8.107008898831201e-05, "loss": 0.01, "step": 563060 }, { "epoch": 1.46, "learning_rate": 8.106620077194055e-05, "loss": 0.0093, "step": 563070 }, { "epoch": 1.46, "learning_rate": 8.106231255556908e-05, "loss": 0.0098, "step": 563080 }, { "epoch": 1.46, "learning_rate": 8.105842433919762e-05, "loss": 0.0113, "step": 563090 }, { "epoch": 1.46, "learning_rate": 8.105453612282615e-05, "loss": 0.0078, "step": 563100 }, { "epoch": 1.46, "learning_rate": 8.10506479064547e-05, "loss": 0.0089, "step": 563110 }, { "epoch": 1.46, "learning_rate": 8.104675969008323e-05, "loss": 0.0078, "step": 563120 }, { "epoch": 1.46, "learning_rate": 8.104287147371177e-05, "loss": 0.0093, "step": 563130 }, { "epoch": 1.46, "learning_rate": 8.10389832573403e-05, "loss": 0.0079, "step": 563140 }, { "epoch": 1.46, "learning_rate": 8.103509504096884e-05, "loss": 0.0096, "step": 563150 }, { "epoch": 1.46, "learning_rate": 8.103120682459737e-05, "loss": 0.0066, "step": 563160 }, { "epoch": 1.46, "learning_rate": 8.102731860822591e-05, "loss": 0.0116, "step": 563170 }, { "epoch": 1.46, "learning_rate": 8.102343039185444e-05, "loss": 0.0098, "step": 563180 }, { "epoch": 1.46, "learning_rate": 8.101954217548298e-05, "loss": 0.0069, "step": 563190 }, { "epoch": 1.46, "learning_rate": 8.101565395911151e-05, "loss": 0.0133, "step": 563200 }, { "epoch": 1.46, "learning_rate": 8.101176574274004e-05, "loss": 0.0088, "step": 563210 }, { "epoch": 1.46, "learning_rate": 8.100787752636858e-05, "loss": 0.0077, "step": 563220 }, { "epoch": 1.46, "learning_rate": 8.10039893099971e-05, "loss": 0.0091, "step": 563230 }, { "epoch": 1.46, "learning_rate": 8.100010109362565e-05, "loss": 0.0065, "step": 563240 }, { "epoch": 1.46, "learning_rate": 8.099621287725418e-05, "loss": 0.0144, "step": 563250 }, { "epoch": 1.46, "learning_rate": 8.099232466088272e-05, "loss": 0.0108, "step": 563260 }, { "epoch": 1.46, "learning_rate": 8.098843644451125e-05, "loss": 0.007, "step": 563270 }, { "epoch": 1.46, "learning_rate": 8.09845482281398e-05, "loss": 0.0107, "step": 563280 }, { "epoch": 1.46, "learning_rate": 8.098066001176832e-05, "loss": 0.0101, "step": 563290 }, { "epoch": 1.46, "learning_rate": 8.097677179539687e-05, "loss": 0.0063, "step": 563300 }, { "epoch": 1.46, "learning_rate": 8.09728835790254e-05, "loss": 0.0142, "step": 563310 }, { "epoch": 1.46, "learning_rate": 8.096899536265394e-05, "loss": 0.0101, "step": 563320 }, { "epoch": 1.46, "learning_rate": 8.096510714628247e-05, "loss": 0.0114, "step": 563330 }, { "epoch": 1.46, "learning_rate": 8.096121892991101e-05, "loss": 0.0107, "step": 563340 }, { "epoch": 1.46, "learning_rate": 8.095733071353954e-05, "loss": 0.0084, "step": 563350 }, { "epoch": 1.46, "learning_rate": 8.095344249716808e-05, "loss": 0.0093, "step": 563360 }, { "epoch": 1.46, "learning_rate": 8.094955428079661e-05, "loss": 0.0092, "step": 563370 }, { "epoch": 1.46, "learning_rate": 8.094566606442515e-05, "loss": 0.0108, "step": 563380 }, { "epoch": 1.46, "learning_rate": 8.094177784805368e-05, "loss": 0.0098, "step": 563390 }, { "epoch": 1.46, "learning_rate": 8.093788963168222e-05, "loss": 0.0116, "step": 563400 }, { "epoch": 1.46, "learning_rate": 8.093400141531075e-05, "loss": 0.0093, "step": 563410 }, { "epoch": 1.46, "learning_rate": 8.093011319893929e-05, "loss": 0.0089, "step": 563420 }, { "epoch": 1.46, "learning_rate": 8.092622498256782e-05, "loss": 0.0131, "step": 563430 }, { "epoch": 1.46, "learning_rate": 8.092233676619637e-05, "loss": 0.0067, "step": 563440 }, { "epoch": 1.46, "learning_rate": 8.091844854982489e-05, "loss": 0.0089, "step": 563450 }, { "epoch": 1.46, "learning_rate": 8.091456033345342e-05, "loss": 0.0084, "step": 563460 }, { "epoch": 1.46, "learning_rate": 8.091067211708197e-05, "loss": 0.0086, "step": 563470 }, { "epoch": 1.46, "learning_rate": 8.09067839007105e-05, "loss": 0.0082, "step": 563480 }, { "epoch": 1.46, "learning_rate": 8.090289568433904e-05, "loss": 0.0071, "step": 563490 }, { "epoch": 1.46, "learning_rate": 8.089900746796757e-05, "loss": 0.0102, "step": 563500 }, { "epoch": 1.46, "learning_rate": 8.089511925159611e-05, "loss": 0.0121, "step": 563510 }, { "epoch": 1.46, "learning_rate": 8.089123103522464e-05, "loss": 0.0097, "step": 563520 }, { "epoch": 1.46, "learning_rate": 8.088734281885318e-05, "loss": 0.0089, "step": 563530 }, { "epoch": 1.46, "learning_rate": 8.088345460248171e-05, "loss": 0.0103, "step": 563540 }, { "epoch": 1.46, "learning_rate": 8.087956638611025e-05, "loss": 0.0088, "step": 563550 }, { "epoch": 1.46, "learning_rate": 8.087567816973878e-05, "loss": 0.0162, "step": 563560 }, { "epoch": 1.46, "learning_rate": 8.087178995336732e-05, "loss": 0.0101, "step": 563570 }, { "epoch": 1.46, "learning_rate": 8.086790173699585e-05, "loss": 0.0097, "step": 563580 }, { "epoch": 1.46, "learning_rate": 8.086401352062439e-05, "loss": 0.011, "step": 563590 }, { "epoch": 1.46, "learning_rate": 8.086012530425292e-05, "loss": 0.0092, "step": 563600 }, { "epoch": 1.46, "learning_rate": 8.085623708788146e-05, "loss": 0.0093, "step": 563610 }, { "epoch": 1.46, "learning_rate": 8.085234887150999e-05, "loss": 0.0094, "step": 563620 }, { "epoch": 1.46, "learning_rate": 8.084846065513854e-05, "loss": 0.0098, "step": 563630 }, { "epoch": 1.46, "learning_rate": 8.084457243876707e-05, "loss": 0.0108, "step": 563640 }, { "epoch": 1.46, "learning_rate": 8.084068422239561e-05, "loss": 0.0088, "step": 563650 }, { "epoch": 1.46, "learning_rate": 8.083679600602414e-05, "loss": 0.0093, "step": 563660 }, { "epoch": 1.46, "learning_rate": 8.083290778965268e-05, "loss": 0.0124, "step": 563670 }, { "epoch": 1.46, "learning_rate": 8.082901957328121e-05, "loss": 0.0074, "step": 563680 }, { "epoch": 1.46, "learning_rate": 8.082513135690975e-05, "loss": 0.0084, "step": 563690 }, { "epoch": 1.46, "learning_rate": 8.082124314053828e-05, "loss": 0.0104, "step": 563700 }, { "epoch": 1.46, "learning_rate": 8.081735492416681e-05, "loss": 0.0157, "step": 563710 }, { "epoch": 1.46, "learning_rate": 8.081346670779535e-05, "loss": 0.0086, "step": 563720 }, { "epoch": 1.46, "learning_rate": 8.080957849142388e-05, "loss": 0.01, "step": 563730 }, { "epoch": 1.46, "learning_rate": 8.080569027505242e-05, "loss": 0.0095, "step": 563740 }, { "epoch": 1.46, "learning_rate": 8.080180205868095e-05, "loss": 0.0079, "step": 563750 }, { "epoch": 1.46, "learning_rate": 8.079791384230949e-05, "loss": 0.0101, "step": 563760 }, { "epoch": 1.46, "learning_rate": 8.079402562593802e-05, "loss": 0.0098, "step": 563770 }, { "epoch": 1.46, "learning_rate": 8.079013740956656e-05, "loss": 0.0103, "step": 563780 }, { "epoch": 1.46, "learning_rate": 8.078624919319509e-05, "loss": 0.0107, "step": 563790 }, { "epoch": 1.46, "learning_rate": 8.078236097682364e-05, "loss": 0.0101, "step": 563800 }, { "epoch": 1.46, "learning_rate": 8.077847276045216e-05, "loss": 0.0088, "step": 563810 }, { "epoch": 1.46, "learning_rate": 8.077458454408071e-05, "loss": 0.0071, "step": 563820 }, { "epoch": 1.46, "learning_rate": 8.077069632770924e-05, "loss": 0.008, "step": 563830 }, { "epoch": 1.46, "learning_rate": 8.076680811133778e-05, "loss": 0.0118, "step": 563840 }, { "epoch": 1.46, "learning_rate": 8.076291989496631e-05, "loss": 0.0074, "step": 563850 }, { "epoch": 1.46, "learning_rate": 8.075903167859485e-05, "loss": 0.0092, "step": 563860 }, { "epoch": 1.46, "learning_rate": 8.075514346222338e-05, "loss": 0.01, "step": 563870 }, { "epoch": 1.46, "learning_rate": 8.075125524585192e-05, "loss": 0.0095, "step": 563880 }, { "epoch": 1.46, "learning_rate": 8.074736702948045e-05, "loss": 0.0062, "step": 563890 }, { "epoch": 1.46, "learning_rate": 8.074347881310899e-05, "loss": 0.0095, "step": 563900 }, { "epoch": 1.46, "learning_rate": 8.073959059673752e-05, "loss": 0.0093, "step": 563910 }, { "epoch": 1.46, "learning_rate": 8.073570238036606e-05, "loss": 0.0094, "step": 563920 }, { "epoch": 1.46, "learning_rate": 8.073181416399459e-05, "loss": 0.0103, "step": 563930 }, { "epoch": 1.46, "learning_rate": 8.072792594762313e-05, "loss": 0.0082, "step": 563940 }, { "epoch": 1.46, "learning_rate": 8.072403773125166e-05, "loss": 0.0081, "step": 563950 }, { "epoch": 1.46, "learning_rate": 8.072014951488019e-05, "loss": 0.0075, "step": 563960 }, { "epoch": 1.46, "learning_rate": 8.071626129850873e-05, "loss": 0.0085, "step": 563970 }, { "epoch": 1.46, "learning_rate": 8.071237308213726e-05, "loss": 0.0071, "step": 563980 }, { "epoch": 1.46, "learning_rate": 8.070848486576581e-05, "loss": 0.008, "step": 563990 }, { "epoch": 1.46, "learning_rate": 8.070459664939434e-05, "loss": 0.007, "step": 564000 }, { "epoch": 1.46, "eval_cer": 0.8816844910430235, "eval_loss": 0.006286456249654293, "eval_runtime": 107.8864, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.635, "step": 564000 }, { "epoch": 1.46, "learning_rate": 8.070070843302288e-05, "loss": 0.0086, "step": 564010 }, { "epoch": 1.46, "learning_rate": 8.069682021665141e-05, "loss": 0.0081, "step": 564020 }, { "epoch": 1.46, "learning_rate": 8.069293200027995e-05, "loss": 0.011, "step": 564030 }, { "epoch": 1.46, "learning_rate": 8.068904378390848e-05, "loss": 0.0104, "step": 564040 }, { "epoch": 1.46, "learning_rate": 8.068515556753702e-05, "loss": 0.0084, "step": 564050 }, { "epoch": 1.46, "learning_rate": 8.068126735116555e-05, "loss": 0.0081, "step": 564060 }, { "epoch": 1.46, "learning_rate": 8.067737913479409e-05, "loss": 0.0079, "step": 564070 }, { "epoch": 1.46, "learning_rate": 8.067349091842262e-05, "loss": 0.0101, "step": 564080 }, { "epoch": 1.46, "learning_rate": 8.066960270205116e-05, "loss": 0.007, "step": 564090 }, { "epoch": 1.46, "learning_rate": 8.066571448567969e-05, "loss": 0.0084, "step": 564100 }, { "epoch": 1.46, "learning_rate": 8.066182626930823e-05, "loss": 0.0093, "step": 564110 }, { "epoch": 1.46, "learning_rate": 8.065793805293676e-05, "loss": 0.012, "step": 564120 }, { "epoch": 1.46, "learning_rate": 8.06540498365653e-05, "loss": 0.0105, "step": 564130 }, { "epoch": 1.46, "learning_rate": 8.065016162019383e-05, "loss": 0.0132, "step": 564140 }, { "epoch": 1.46, "learning_rate": 8.064627340382238e-05, "loss": 0.0092, "step": 564150 }, { "epoch": 1.46, "learning_rate": 8.06423851874509e-05, "loss": 0.0096, "step": 564160 }, { "epoch": 1.46, "learning_rate": 8.063849697107945e-05, "loss": 0.0112, "step": 564170 }, { "epoch": 1.46, "learning_rate": 8.063460875470798e-05, "loss": 0.0126, "step": 564180 }, { "epoch": 1.46, "learning_rate": 8.063072053833652e-05, "loss": 0.0096, "step": 564190 }, { "epoch": 1.46, "learning_rate": 8.062683232196505e-05, "loss": 0.0102, "step": 564200 }, { "epoch": 1.46, "learning_rate": 8.062294410559358e-05, "loss": 0.0076, "step": 564210 }, { "epoch": 1.46, "learning_rate": 8.061905588922212e-05, "loss": 0.0092, "step": 564220 }, { "epoch": 1.46, "learning_rate": 8.061516767285065e-05, "loss": 0.0098, "step": 564230 }, { "epoch": 1.46, "learning_rate": 8.061127945647919e-05, "loss": 0.01, "step": 564240 }, { "epoch": 1.46, "learning_rate": 8.060739124010772e-05, "loss": 0.0068, "step": 564250 }, { "epoch": 1.46, "learning_rate": 8.060350302373626e-05, "loss": 0.0084, "step": 564260 }, { "epoch": 1.46, "learning_rate": 8.059961480736479e-05, "loss": 0.0074, "step": 564270 }, { "epoch": 1.46, "learning_rate": 8.059572659099333e-05, "loss": 0.0091, "step": 564280 }, { "epoch": 1.46, "learning_rate": 8.059183837462186e-05, "loss": 0.0109, "step": 564290 }, { "epoch": 1.46, "learning_rate": 8.05879501582504e-05, "loss": 0.01, "step": 564300 }, { "epoch": 1.46, "learning_rate": 8.058406194187893e-05, "loss": 0.0086, "step": 564310 }, { "epoch": 1.46, "learning_rate": 8.058017372550747e-05, "loss": 0.0108, "step": 564320 }, { "epoch": 1.46, "learning_rate": 8.0576285509136e-05, "loss": 0.0087, "step": 564330 }, { "epoch": 1.46, "learning_rate": 8.057239729276455e-05, "loss": 0.0078, "step": 564340 }, { "epoch": 1.46, "learning_rate": 8.056850907639308e-05, "loss": 0.0091, "step": 564350 }, { "epoch": 1.46, "learning_rate": 8.056462086002162e-05, "loss": 0.0077, "step": 564360 }, { "epoch": 1.46, "learning_rate": 8.056073264365015e-05, "loss": 0.0081, "step": 564370 }, { "epoch": 1.46, "learning_rate": 8.055684442727869e-05, "loss": 0.0106, "step": 564380 }, { "epoch": 1.46, "learning_rate": 8.055295621090722e-05, "loss": 0.011, "step": 564390 }, { "epoch": 1.46, "learning_rate": 8.054906799453576e-05, "loss": 0.0091, "step": 564400 }, { "epoch": 1.46, "learning_rate": 8.054517977816429e-05, "loss": 0.0089, "step": 564410 }, { "epoch": 1.46, "learning_rate": 8.054129156179283e-05, "loss": 0.0087, "step": 564420 }, { "epoch": 1.46, "learning_rate": 8.053740334542136e-05, "loss": 0.0088, "step": 564430 }, { "epoch": 1.46, "learning_rate": 8.05335151290499e-05, "loss": 0.008, "step": 564440 }, { "epoch": 1.46, "learning_rate": 8.052962691267843e-05, "loss": 0.0096, "step": 564450 }, { "epoch": 1.46, "learning_rate": 8.052573869630696e-05, "loss": 0.0255, "step": 564460 }, { "epoch": 1.46, "learning_rate": 8.05218504799355e-05, "loss": 0.0087, "step": 564470 }, { "epoch": 1.46, "learning_rate": 8.051796226356403e-05, "loss": 0.0086, "step": 564480 }, { "epoch": 1.46, "learning_rate": 8.051407404719257e-05, "loss": 0.009, "step": 564490 }, { "epoch": 1.46, "learning_rate": 8.05101858308211e-05, "loss": 0.0122, "step": 564500 }, { "epoch": 1.46, "learning_rate": 8.050629761444965e-05, "loss": 0.0061, "step": 564510 }, { "epoch": 1.46, "learning_rate": 8.050240939807816e-05, "loss": 0.008, "step": 564520 }, { "epoch": 1.46, "learning_rate": 8.049852118170672e-05, "loss": 0.0089, "step": 564530 }, { "epoch": 1.46, "learning_rate": 8.049463296533525e-05, "loss": 0.0114, "step": 564540 }, { "epoch": 1.46, "learning_rate": 8.049074474896379e-05, "loss": 0.0078, "step": 564550 }, { "epoch": 1.46, "learning_rate": 8.048685653259232e-05, "loss": 0.0142, "step": 564560 }, { "epoch": 1.46, "learning_rate": 8.048296831622086e-05, "loss": 0.0136, "step": 564570 }, { "epoch": 1.46, "learning_rate": 8.047908009984939e-05, "loss": 0.0092, "step": 564580 }, { "epoch": 1.46, "learning_rate": 8.047519188347793e-05, "loss": 0.0085, "step": 564590 }, { "epoch": 1.46, "learning_rate": 8.047130366710646e-05, "loss": 0.0119, "step": 564600 }, { "epoch": 1.46, "learning_rate": 8.0467415450735e-05, "loss": 0.0089, "step": 564610 }, { "epoch": 1.46, "learning_rate": 8.046352723436353e-05, "loss": 0.0085, "step": 564620 }, { "epoch": 1.46, "learning_rate": 8.045963901799207e-05, "loss": 0.0116, "step": 564630 }, { "epoch": 1.46, "learning_rate": 8.04557508016206e-05, "loss": 0.0074, "step": 564640 }, { "epoch": 1.46, "learning_rate": 8.045186258524914e-05, "loss": 0.0089, "step": 564650 }, { "epoch": 1.46, "learning_rate": 8.044797436887767e-05, "loss": 0.0104, "step": 564660 }, { "epoch": 1.46, "learning_rate": 8.044408615250622e-05, "loss": 0.0127, "step": 564670 }, { "epoch": 1.46, "learning_rate": 8.044019793613474e-05, "loss": 0.0066, "step": 564680 }, { "epoch": 1.46, "learning_rate": 8.043630971976329e-05, "loss": 0.0093, "step": 564690 }, { "epoch": 1.46, "learning_rate": 8.043242150339182e-05, "loss": 0.0102, "step": 564700 }, { "epoch": 1.46, "learning_rate": 8.042853328702035e-05, "loss": 0.0116, "step": 564710 }, { "epoch": 1.46, "learning_rate": 8.042464507064889e-05, "loss": 0.0096, "step": 564720 }, { "epoch": 1.46, "learning_rate": 8.042075685427742e-05, "loss": 0.0097, "step": 564730 }, { "epoch": 1.46, "learning_rate": 8.041686863790596e-05, "loss": 0.0097, "step": 564740 }, { "epoch": 1.46, "learning_rate": 8.041298042153449e-05, "loss": 0.0117, "step": 564750 }, { "epoch": 1.46, "learning_rate": 8.040909220516303e-05, "loss": 0.0089, "step": 564760 }, { "epoch": 1.46, "learning_rate": 8.040520398879156e-05, "loss": 0.0073, "step": 564770 }, { "epoch": 1.46, "learning_rate": 8.04013157724201e-05, "loss": 0.0084, "step": 564780 }, { "epoch": 1.46, "learning_rate": 8.039742755604863e-05, "loss": 0.011, "step": 564790 }, { "epoch": 1.46, "learning_rate": 8.039353933967717e-05, "loss": 0.0105, "step": 564800 }, { "epoch": 1.46, "learning_rate": 8.03896511233057e-05, "loss": 0.0101, "step": 564810 }, { "epoch": 1.46, "learning_rate": 8.038576290693424e-05, "loss": 0.0083, "step": 564820 }, { "epoch": 1.46, "learning_rate": 8.038187469056277e-05, "loss": 0.0068, "step": 564830 }, { "epoch": 1.46, "learning_rate": 8.037798647419131e-05, "loss": 0.0085, "step": 564840 }, { "epoch": 1.46, "learning_rate": 8.037409825781984e-05, "loss": 0.0108, "step": 564850 }, { "epoch": 1.46, "learning_rate": 8.037021004144839e-05, "loss": 0.0075, "step": 564860 }, { "epoch": 1.46, "learning_rate": 8.036632182507692e-05, "loss": 0.0075, "step": 564870 }, { "epoch": 1.46, "learning_rate": 8.036243360870546e-05, "loss": 0.0117, "step": 564880 }, { "epoch": 1.46, "learning_rate": 8.035854539233399e-05, "loss": 0.0097, "step": 564890 }, { "epoch": 1.46, "learning_rate": 8.035465717596253e-05, "loss": 0.0113, "step": 564900 }, { "epoch": 1.46, "learning_rate": 8.035076895959106e-05, "loss": 0.0063, "step": 564910 }, { "epoch": 1.46, "learning_rate": 8.03468807432196e-05, "loss": 0.0097, "step": 564920 }, { "epoch": 1.46, "learning_rate": 8.034299252684813e-05, "loss": 0.0088, "step": 564930 }, { "epoch": 1.46, "learning_rate": 8.033910431047666e-05, "loss": 0.0087, "step": 564940 }, { "epoch": 1.46, "learning_rate": 8.03352160941052e-05, "loss": 0.0112, "step": 564950 }, { "epoch": 1.46, "learning_rate": 8.033132787773373e-05, "loss": 0.0096, "step": 564960 }, { "epoch": 1.46, "learning_rate": 8.032743966136227e-05, "loss": 0.0142, "step": 564970 }, { "epoch": 1.46, "learning_rate": 8.03235514449908e-05, "loss": 0.0092, "step": 564980 }, { "epoch": 1.46, "learning_rate": 8.031966322861934e-05, "loss": 0.0106, "step": 564990 }, { "epoch": 1.46, "learning_rate": 8.031577501224787e-05, "loss": 0.0112, "step": 565000 }, { "epoch": 1.46, "eval_cer": 0.8816704946736816, "eval_loss": 0.006258940789848566, "eval_runtime": 107.7505, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 565000 }, { "epoch": 1.46, "learning_rate": 8.031188679587641e-05, "loss": 0.0104, "step": 565010 }, { "epoch": 1.46, "learning_rate": 8.030799857950494e-05, "loss": 0.0068, "step": 565020 }, { "epoch": 1.46, "learning_rate": 8.030411036313349e-05, "loss": 0.0082, "step": 565030 }, { "epoch": 1.46, "learning_rate": 8.0300222146762e-05, "loss": 0.008, "step": 565040 }, { "epoch": 1.46, "learning_rate": 8.029633393039056e-05, "loss": 0.0085, "step": 565050 }, { "epoch": 1.46, "learning_rate": 8.029244571401909e-05, "loss": 0.011, "step": 565060 }, { "epoch": 1.46, "learning_rate": 8.028855749764763e-05, "loss": 0.0096, "step": 565070 }, { "epoch": 1.46, "learning_rate": 8.028466928127616e-05, "loss": 0.0076, "step": 565080 }, { "epoch": 1.46, "learning_rate": 8.02807810649047e-05, "loss": 0.0087, "step": 565090 }, { "epoch": 1.46, "learning_rate": 8.027689284853323e-05, "loss": 0.0111, "step": 565100 }, { "epoch": 1.46, "learning_rate": 8.027300463216177e-05, "loss": 0.0093, "step": 565110 }, { "epoch": 1.46, "learning_rate": 8.02691164157903e-05, "loss": 0.0122, "step": 565120 }, { "epoch": 1.46, "learning_rate": 8.026522819941884e-05, "loss": 0.0081, "step": 565130 }, { "epoch": 1.46, "learning_rate": 8.026133998304737e-05, "loss": 0.0103, "step": 565140 }, { "epoch": 1.46, "learning_rate": 8.025745176667591e-05, "loss": 0.0084, "step": 565150 }, { "epoch": 1.46, "learning_rate": 8.025356355030444e-05, "loss": 0.0153, "step": 565160 }, { "epoch": 1.47, "learning_rate": 8.024967533393298e-05, "loss": 0.0073, "step": 565170 }, { "epoch": 1.47, "learning_rate": 8.02457871175615e-05, "loss": 0.0101, "step": 565180 }, { "epoch": 1.47, "learning_rate": 8.024189890119003e-05, "loss": 0.009, "step": 565190 }, { "epoch": 1.47, "learning_rate": 8.023801068481858e-05, "loss": 0.0152, "step": 565200 }, { "epoch": 1.47, "learning_rate": 8.02341224684471e-05, "loss": 0.0114, "step": 565210 }, { "epoch": 1.47, "learning_rate": 8.023023425207566e-05, "loss": 0.0083, "step": 565220 }, { "epoch": 1.47, "learning_rate": 8.022634603570419e-05, "loss": 0.0077, "step": 565230 }, { "epoch": 1.47, "learning_rate": 8.022245781933273e-05, "loss": 0.0106, "step": 565240 }, { "epoch": 1.47, "learning_rate": 8.021856960296126e-05, "loss": 0.008, "step": 565250 }, { "epoch": 1.47, "learning_rate": 8.02146813865898e-05, "loss": 0.007, "step": 565260 }, { "epoch": 1.47, "learning_rate": 8.021079317021833e-05, "loss": 0.0068, "step": 565270 }, { "epoch": 1.47, "learning_rate": 8.020690495384687e-05, "loss": 0.0083, "step": 565280 }, { "epoch": 1.47, "learning_rate": 8.02030167374754e-05, "loss": 0.0093, "step": 565290 }, { "epoch": 1.47, "learning_rate": 8.019912852110394e-05, "loss": 0.008, "step": 565300 }, { "epoch": 1.47, "learning_rate": 8.019524030473247e-05, "loss": 0.009, "step": 565310 }, { "epoch": 1.47, "learning_rate": 8.019135208836101e-05, "loss": 0.0085, "step": 565320 }, { "epoch": 1.47, "learning_rate": 8.018746387198954e-05, "loss": 0.0077, "step": 565330 }, { "epoch": 1.47, "learning_rate": 8.018357565561808e-05, "loss": 0.0104, "step": 565340 }, { "epoch": 1.47, "learning_rate": 8.01796874392466e-05, "loss": 0.0061, "step": 565350 }, { "epoch": 1.47, "learning_rate": 8.017579922287515e-05, "loss": 0.0109, "step": 565360 }, { "epoch": 1.47, "learning_rate": 8.017191100650368e-05, "loss": 0.0083, "step": 565370 }, { "epoch": 1.47, "learning_rate": 8.016802279013223e-05, "loss": 0.0099, "step": 565380 }, { "epoch": 1.47, "learning_rate": 8.016413457376076e-05, "loss": 0.0071, "step": 565390 }, { "epoch": 1.47, "learning_rate": 8.01602463573893e-05, "loss": 0.008, "step": 565400 }, { "epoch": 1.47, "learning_rate": 8.015635814101783e-05, "loss": 0.0085, "step": 565410 }, { "epoch": 1.47, "learning_rate": 8.015246992464637e-05, "loss": 0.0092, "step": 565420 }, { "epoch": 1.47, "learning_rate": 8.01485817082749e-05, "loss": 0.0117, "step": 565430 }, { "epoch": 1.47, "learning_rate": 8.014469349190343e-05, "loss": 0.0099, "step": 565440 }, { "epoch": 1.47, "learning_rate": 8.014080527553197e-05, "loss": 0.0082, "step": 565450 }, { "epoch": 1.47, "learning_rate": 8.01369170591605e-05, "loss": 0.0097, "step": 565460 }, { "epoch": 1.47, "learning_rate": 8.013302884278904e-05, "loss": 0.0074, "step": 565470 }, { "epoch": 1.47, "learning_rate": 8.012914062641757e-05, "loss": 0.0077, "step": 565480 }, { "epoch": 1.47, "learning_rate": 8.012525241004611e-05, "loss": 0.0092, "step": 565490 }, { "epoch": 1.47, "learning_rate": 8.012136419367464e-05, "loss": 0.0119, "step": 565500 }, { "epoch": 1.47, "learning_rate": 8.011747597730318e-05, "loss": 0.0094, "step": 565510 }, { "epoch": 1.47, "learning_rate": 8.01135877609317e-05, "loss": 0.0076, "step": 565520 }, { "epoch": 1.47, "learning_rate": 8.010969954456025e-05, "loss": 0.008, "step": 565530 }, { "epoch": 1.47, "learning_rate": 8.010581132818877e-05, "loss": 0.008, "step": 565540 }, { "epoch": 1.47, "learning_rate": 8.010192311181732e-05, "loss": 0.0112, "step": 565550 }, { "epoch": 1.47, "learning_rate": 8.009803489544584e-05, "loss": 0.0133, "step": 565560 }, { "epoch": 1.47, "learning_rate": 8.00941466790744e-05, "loss": 0.0081, "step": 565570 }, { "epoch": 1.47, "learning_rate": 8.009025846270293e-05, "loss": 0.0092, "step": 565580 }, { "epoch": 1.47, "learning_rate": 8.008637024633147e-05, "loss": 0.0108, "step": 565590 }, { "epoch": 1.47, "learning_rate": 8.008248202996e-05, "loss": 0.0103, "step": 565600 }, { "epoch": 1.47, "learning_rate": 8.007859381358854e-05, "loss": 0.0133, "step": 565610 }, { "epoch": 1.47, "learning_rate": 8.007470559721707e-05, "loss": 0.0082, "step": 565620 }, { "epoch": 1.47, "learning_rate": 8.007081738084561e-05, "loss": 0.0064, "step": 565630 }, { "epoch": 1.47, "learning_rate": 8.006692916447414e-05, "loss": 0.0075, "step": 565640 }, { "epoch": 1.47, "learning_rate": 8.006304094810268e-05, "loss": 0.0125, "step": 565650 }, { "epoch": 1.47, "learning_rate": 8.005915273173121e-05, "loss": 0.0075, "step": 565660 }, { "epoch": 1.47, "learning_rate": 8.005526451535975e-05, "loss": 0.0095, "step": 565670 }, { "epoch": 1.47, "learning_rate": 8.005137629898828e-05, "loss": 0.0083, "step": 565680 }, { "epoch": 1.47, "learning_rate": 8.00474880826168e-05, "loss": 0.0075, "step": 565690 }, { "epoch": 1.47, "learning_rate": 8.004359986624535e-05, "loss": 0.0109, "step": 565700 }, { "epoch": 1.47, "learning_rate": 8.003971164987387e-05, "loss": 0.0073, "step": 565710 }, { "epoch": 1.47, "learning_rate": 8.003582343350242e-05, "loss": 0.0091, "step": 565720 }, { "epoch": 1.47, "learning_rate": 8.003193521713094e-05, "loss": 0.0086, "step": 565730 }, { "epoch": 1.47, "learning_rate": 8.00280470007595e-05, "loss": 0.0072, "step": 565740 }, { "epoch": 1.47, "learning_rate": 8.002415878438801e-05, "loss": 0.0096, "step": 565750 }, { "epoch": 1.47, "learning_rate": 8.002027056801657e-05, "loss": 0.0085, "step": 565760 }, { "epoch": 1.47, "learning_rate": 8.00163823516451e-05, "loss": 0.0151, "step": 565770 }, { "epoch": 1.47, "learning_rate": 8.001249413527364e-05, "loss": 0.008, "step": 565780 }, { "epoch": 1.47, "learning_rate": 8.000860591890217e-05, "loss": 0.0119, "step": 565790 }, { "epoch": 1.47, "learning_rate": 8.000471770253071e-05, "loss": 0.0069, "step": 565800 }, { "epoch": 1.47, "learning_rate": 8.000082948615924e-05, "loss": 0.0072, "step": 565810 }, { "epoch": 1.47, "learning_rate": 7.999694126978778e-05, "loss": 0.0115, "step": 565820 }, { "epoch": 1.47, "learning_rate": 7.99930530534163e-05, "loss": 0.0112, "step": 565830 }, { "epoch": 1.47, "learning_rate": 7.998916483704485e-05, "loss": 0.0102, "step": 565840 }, { "epoch": 1.47, "learning_rate": 7.998527662067338e-05, "loss": 0.0099, "step": 565850 }, { "epoch": 1.47, "learning_rate": 7.998138840430192e-05, "loss": 0.0109, "step": 565860 }, { "epoch": 1.47, "learning_rate": 7.997750018793045e-05, "loss": 0.009, "step": 565870 }, { "epoch": 1.47, "learning_rate": 7.997361197155899e-05, "loss": 0.0073, "step": 565880 }, { "epoch": 1.47, "learning_rate": 7.996972375518752e-05, "loss": 0.0078, "step": 565890 }, { "epoch": 1.47, "learning_rate": 7.996583553881607e-05, "loss": 0.0094, "step": 565900 }, { "epoch": 1.47, "learning_rate": 7.996194732244459e-05, "loss": 0.01, "step": 565910 }, { "epoch": 1.47, "learning_rate": 7.995805910607314e-05, "loss": 0.008, "step": 565920 }, { "epoch": 1.47, "learning_rate": 7.995417088970167e-05, "loss": 0.0089, "step": 565930 }, { "epoch": 1.47, "learning_rate": 7.99502826733302e-05, "loss": 0.0096, "step": 565940 }, { "epoch": 1.47, "learning_rate": 7.994639445695874e-05, "loss": 0.0066, "step": 565950 }, { "epoch": 1.47, "learning_rate": 7.994250624058727e-05, "loss": 0.0091, "step": 565960 }, { "epoch": 1.47, "learning_rate": 7.993861802421581e-05, "loss": 0.0095, "step": 565970 }, { "epoch": 1.47, "learning_rate": 7.993472980784434e-05, "loss": 0.0118, "step": 565980 }, { "epoch": 1.47, "learning_rate": 7.993084159147288e-05, "loss": 0.0074, "step": 565990 }, { "epoch": 1.47, "learning_rate": 7.99269533751014e-05, "loss": 0.0098, "step": 566000 }, { "epoch": 1.47, "eval_cer": 0.8817180823294437, "eval_loss": 0.0061110155656933784, "eval_runtime": 107.9972, "eval_samples_per_second": 18.519, "eval_steps_per_second": 4.63, "step": 566000 }, { "epoch": 1.47, "learning_rate": 7.992306515872995e-05, "loss": 0.0099, "step": 566010 }, { "epoch": 1.47, "learning_rate": 7.991917694235848e-05, "loss": 0.0087, "step": 566020 }, { "epoch": 1.47, "learning_rate": 7.991528872598702e-05, "loss": 0.0073, "step": 566030 }, { "epoch": 1.47, "learning_rate": 7.991140050961555e-05, "loss": 0.009, "step": 566040 }, { "epoch": 1.47, "learning_rate": 7.990751229324409e-05, "loss": 0.0072, "step": 566050 }, { "epoch": 1.47, "learning_rate": 7.990362407687261e-05, "loss": 0.0093, "step": 566060 }, { "epoch": 1.47, "learning_rate": 7.989973586050116e-05, "loss": 0.0075, "step": 566070 }, { "epoch": 1.47, "learning_rate": 7.989584764412968e-05, "loss": 0.0098, "step": 566080 }, { "epoch": 1.47, "learning_rate": 7.989195942775824e-05, "loss": 0.0078, "step": 566090 }, { "epoch": 1.47, "learning_rate": 7.988807121138677e-05, "loss": 0.0097, "step": 566100 }, { "epoch": 1.47, "learning_rate": 7.988418299501531e-05, "loss": 0.0089, "step": 566110 }, { "epoch": 1.47, "learning_rate": 7.988029477864384e-05, "loss": 0.0073, "step": 566120 }, { "epoch": 1.47, "learning_rate": 7.987640656227238e-05, "loss": 0.0061, "step": 566130 }, { "epoch": 1.47, "learning_rate": 7.987251834590091e-05, "loss": 0.0097, "step": 566140 }, { "epoch": 1.47, "learning_rate": 7.986863012952945e-05, "loss": 0.0092, "step": 566150 }, { "epoch": 1.47, "learning_rate": 7.986474191315798e-05, "loss": 0.0067, "step": 566160 }, { "epoch": 1.47, "learning_rate": 7.986085369678652e-05, "loss": 0.0098, "step": 566170 }, { "epoch": 1.47, "learning_rate": 7.985696548041505e-05, "loss": 0.0082, "step": 566180 }, { "epoch": 1.47, "learning_rate": 7.985307726404357e-05, "loss": 0.01, "step": 566190 }, { "epoch": 1.47, "learning_rate": 7.984918904767212e-05, "loss": 0.0097, "step": 566200 }, { "epoch": 1.47, "learning_rate": 7.984530083130064e-05, "loss": 0.0085, "step": 566210 }, { "epoch": 1.47, "learning_rate": 7.984141261492919e-05, "loss": 0.0087, "step": 566220 }, { "epoch": 1.47, "learning_rate": 7.983752439855771e-05, "loss": 0.0092, "step": 566230 }, { "epoch": 1.47, "learning_rate": 7.983363618218626e-05, "loss": 0.013, "step": 566240 }, { "epoch": 1.47, "learning_rate": 7.982974796581478e-05, "loss": 0.0089, "step": 566250 }, { "epoch": 1.47, "learning_rate": 7.982585974944334e-05, "loss": 0.0085, "step": 566260 }, { "epoch": 1.47, "learning_rate": 7.982197153307185e-05, "loss": 0.0096, "step": 566270 }, { "epoch": 1.47, "learning_rate": 7.981808331670041e-05, "loss": 0.0068, "step": 566280 }, { "epoch": 1.47, "learning_rate": 7.981419510032894e-05, "loss": 0.0123, "step": 566290 }, { "epoch": 1.47, "learning_rate": 7.981030688395748e-05, "loss": 0.0109, "step": 566300 }, { "epoch": 1.47, "learning_rate": 7.9806418667586e-05, "loss": 0.0105, "step": 566310 }, { "epoch": 1.47, "learning_rate": 7.980253045121455e-05, "loss": 0.0084, "step": 566320 }, { "epoch": 1.47, "learning_rate": 7.979864223484308e-05, "loss": 0.0099, "step": 566330 }, { "epoch": 1.47, "learning_rate": 7.979475401847162e-05, "loss": 0.0105, "step": 566340 }, { "epoch": 1.47, "learning_rate": 7.979086580210015e-05, "loss": 0.0093, "step": 566350 }, { "epoch": 1.47, "learning_rate": 7.978697758572869e-05, "loss": 0.0115, "step": 566360 }, { "epoch": 1.47, "learning_rate": 7.978308936935722e-05, "loss": 0.0128, "step": 566370 }, { "epoch": 1.47, "learning_rate": 7.977920115298576e-05, "loss": 0.0139, "step": 566380 }, { "epoch": 1.47, "learning_rate": 7.977531293661429e-05, "loss": 0.0115, "step": 566390 }, { "epoch": 1.47, "learning_rate": 7.977142472024283e-05, "loss": 0.0091, "step": 566400 }, { "epoch": 1.47, "learning_rate": 7.976753650387136e-05, "loss": 0.0077, "step": 566410 }, { "epoch": 1.47, "learning_rate": 7.976364828749991e-05, "loss": 0.0091, "step": 566420 }, { "epoch": 1.47, "learning_rate": 7.975976007112843e-05, "loss": 0.0091, "step": 566430 }, { "epoch": 1.47, "learning_rate": 7.975587185475695e-05, "loss": 0.0078, "step": 566440 }, { "epoch": 1.47, "learning_rate": 7.975198363838551e-05, "loss": 0.0107, "step": 566450 }, { "epoch": 1.47, "learning_rate": 7.974809542201404e-05, "loss": 0.0077, "step": 566460 }, { "epoch": 1.47, "learning_rate": 7.974420720564258e-05, "loss": 0.0064, "step": 566470 }, { "epoch": 1.47, "learning_rate": 7.97403189892711e-05, "loss": 0.01, "step": 566480 }, { "epoch": 1.47, "learning_rate": 7.973643077289965e-05, "loss": 0.0094, "step": 566490 }, { "epoch": 1.47, "learning_rate": 7.973254255652818e-05, "loss": 0.0075, "step": 566500 }, { "epoch": 1.47, "learning_rate": 7.972865434015672e-05, "loss": 0.0101, "step": 566510 }, { "epoch": 1.47, "learning_rate": 7.972476612378525e-05, "loss": 0.0072, "step": 566520 }, { "epoch": 1.47, "learning_rate": 7.972087790741379e-05, "loss": 0.011, "step": 566530 }, { "epoch": 1.47, "learning_rate": 7.971698969104232e-05, "loss": 0.0093, "step": 566540 }, { "epoch": 1.47, "learning_rate": 7.971310147467086e-05, "loss": 0.0103, "step": 566550 }, { "epoch": 1.47, "learning_rate": 7.970921325829939e-05, "loss": 0.0093, "step": 566560 }, { "epoch": 1.47, "learning_rate": 7.970532504192793e-05, "loss": 0.0095, "step": 566570 }, { "epoch": 1.47, "learning_rate": 7.970143682555645e-05, "loss": 0.0073, "step": 566580 }, { "epoch": 1.47, "learning_rate": 7.9697548609185e-05, "loss": 0.0077, "step": 566590 }, { "epoch": 1.47, "learning_rate": 7.969366039281352e-05, "loss": 0.0074, "step": 566600 }, { "epoch": 1.47, "learning_rate": 7.968977217644208e-05, "loss": 0.0099, "step": 566610 }, { "epoch": 1.47, "learning_rate": 7.968588396007061e-05, "loss": 0.0109, "step": 566620 }, { "epoch": 1.47, "learning_rate": 7.968199574369915e-05, "loss": 0.0112, "step": 566630 }, { "epoch": 1.47, "learning_rate": 7.967810752732768e-05, "loss": 0.0076, "step": 566640 }, { "epoch": 1.47, "learning_rate": 7.967421931095622e-05, "loss": 0.0104, "step": 566650 }, { "epoch": 1.47, "learning_rate": 7.967033109458475e-05, "loss": 0.0079, "step": 566660 }, { "epoch": 1.47, "learning_rate": 7.966644287821329e-05, "loss": 0.0092, "step": 566670 }, { "epoch": 1.47, "learning_rate": 7.966255466184182e-05, "loss": 0.0098, "step": 566680 }, { "epoch": 1.47, "learning_rate": 7.965866644547035e-05, "loss": 0.0097, "step": 566690 }, { "epoch": 1.47, "learning_rate": 7.965477822909889e-05, "loss": 0.0073, "step": 566700 }, { "epoch": 1.47, "learning_rate": 7.965089001272741e-05, "loss": 0.0079, "step": 566710 }, { "epoch": 1.47, "learning_rate": 7.964700179635596e-05, "loss": 0.0096, "step": 566720 }, { "epoch": 1.47, "learning_rate": 7.964311357998448e-05, "loss": 0.0112, "step": 566730 }, { "epoch": 1.47, "learning_rate": 7.963922536361303e-05, "loss": 0.0059, "step": 566740 }, { "epoch": 1.47, "learning_rate": 7.963533714724155e-05, "loss": 0.0072, "step": 566750 }, { "epoch": 1.47, "learning_rate": 7.96314489308701e-05, "loss": 0.0109, "step": 566760 }, { "epoch": 1.47, "learning_rate": 7.962756071449862e-05, "loss": 0.0119, "step": 566770 }, { "epoch": 1.47, "learning_rate": 7.962367249812717e-05, "loss": 0.0085, "step": 566780 }, { "epoch": 1.47, "learning_rate": 7.96197842817557e-05, "loss": 0.0096, "step": 566790 }, { "epoch": 1.47, "learning_rate": 7.961589606538425e-05, "loss": 0.0105, "step": 566800 }, { "epoch": 1.47, "learning_rate": 7.961200784901278e-05, "loss": 0.0085, "step": 566810 }, { "epoch": 1.47, "learning_rate": 7.960811963264132e-05, "loss": 0.0102, "step": 566820 }, { "epoch": 1.47, "learning_rate": 7.960423141626985e-05, "loss": 0.0068, "step": 566830 }, { "epoch": 1.47, "learning_rate": 7.960034319989839e-05, "loss": 0.007, "step": 566840 }, { "epoch": 1.47, "learning_rate": 7.959645498352692e-05, "loss": 0.0095, "step": 566850 }, { "epoch": 1.47, "learning_rate": 7.959256676715546e-05, "loss": 0.0087, "step": 566860 }, { "epoch": 1.47, "learning_rate": 7.958867855078399e-05, "loss": 0.0071, "step": 566870 }, { "epoch": 1.47, "learning_rate": 7.958479033441253e-05, "loss": 0.0062, "step": 566880 }, { "epoch": 1.47, "learning_rate": 7.958090211804106e-05, "loss": 0.008, "step": 566890 }, { "epoch": 1.47, "learning_rate": 7.95770139016696e-05, "loss": 0.0088, "step": 566900 }, { "epoch": 1.47, "learning_rate": 7.957312568529813e-05, "loss": 0.0076, "step": 566910 }, { "epoch": 1.47, "learning_rate": 7.956923746892667e-05, "loss": 0.009, "step": 566920 }, { "epoch": 1.47, "learning_rate": 7.95653492525552e-05, "loss": 0.0105, "step": 566930 }, { "epoch": 1.47, "learning_rate": 7.956146103618372e-05, "loss": 0.01, "step": 566940 }, { "epoch": 1.47, "learning_rate": 7.955757281981226e-05, "loss": 0.0122, "step": 566950 }, { "epoch": 1.47, "learning_rate": 7.955368460344079e-05, "loss": 0.009, "step": 566960 }, { "epoch": 1.47, "learning_rate": 7.954979638706935e-05, "loss": 0.01, "step": 566970 }, { "epoch": 1.47, "learning_rate": 7.954590817069788e-05, "loss": 0.0123, "step": 566980 }, { "epoch": 1.47, "learning_rate": 7.954201995432642e-05, "loss": 0.01, "step": 566990 }, { "epoch": 1.47, "learning_rate": 7.953813173795495e-05, "loss": 0.0095, "step": 567000 }, { "epoch": 1.47, "eval_cer": 0.88167329394755, "eval_loss": 0.006201473996043205, "eval_runtime": 108.0039, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.629, "step": 567000 }, { "epoch": 1.47, "learning_rate": 7.953424352158349e-05, "loss": 0.0078, "step": 567010 }, { "epoch": 1.47, "learning_rate": 7.953035530521202e-05, "loss": 0.0085, "step": 567020 }, { "epoch": 1.47, "learning_rate": 7.952646708884056e-05, "loss": 0.0086, "step": 567030 }, { "epoch": 1.47, "learning_rate": 7.952257887246909e-05, "loss": 0.0086, "step": 567040 }, { "epoch": 1.47, "learning_rate": 7.951869065609763e-05, "loss": 0.0078, "step": 567050 }, { "epoch": 1.47, "learning_rate": 7.951480243972616e-05, "loss": 0.0105, "step": 567060 }, { "epoch": 1.47, "learning_rate": 7.95109142233547e-05, "loss": 0.0082, "step": 567070 }, { "epoch": 1.47, "learning_rate": 7.950702600698322e-05, "loss": 0.0089, "step": 567080 }, { "epoch": 1.47, "learning_rate": 7.950313779061177e-05, "loss": 0.0104, "step": 567090 }, { "epoch": 1.47, "learning_rate": 7.94992495742403e-05, "loss": 0.0099, "step": 567100 }, { "epoch": 1.47, "learning_rate": 7.949536135786884e-05, "loss": 0.0161, "step": 567110 }, { "epoch": 1.47, "learning_rate": 7.949147314149736e-05, "loss": 0.0083, "step": 567120 }, { "epoch": 1.47, "learning_rate": 7.948758492512592e-05, "loss": 0.0114, "step": 567130 }, { "epoch": 1.47, "learning_rate": 7.948369670875443e-05, "loss": 0.0086, "step": 567140 }, { "epoch": 1.47, "learning_rate": 7.947980849238299e-05, "loss": 0.0095, "step": 567150 }, { "epoch": 1.47, "learning_rate": 7.947592027601152e-05, "loss": 0.0089, "step": 567160 }, { "epoch": 1.47, "learning_rate": 7.947203205964006e-05, "loss": 0.0128, "step": 567170 }, { "epoch": 1.47, "learning_rate": 7.946814384326859e-05, "loss": 0.009, "step": 567180 }, { "epoch": 1.47, "learning_rate": 7.946425562689712e-05, "loss": 0.013, "step": 567190 }, { "epoch": 1.47, "learning_rate": 7.946036741052566e-05, "loss": 0.0078, "step": 567200 }, { "epoch": 1.47, "learning_rate": 7.945647919415418e-05, "loss": 0.009, "step": 567210 }, { "epoch": 1.47, "learning_rate": 7.945259097778273e-05, "loss": 0.0096, "step": 567220 }, { "epoch": 1.47, "learning_rate": 7.944870276141125e-05, "loss": 0.0089, "step": 567230 }, { "epoch": 1.47, "learning_rate": 7.94448145450398e-05, "loss": 0.0103, "step": 567240 }, { "epoch": 1.47, "learning_rate": 7.944092632866832e-05, "loss": 0.0094, "step": 567250 }, { "epoch": 1.47, "learning_rate": 7.943703811229687e-05, "loss": 0.0093, "step": 567260 }, { "epoch": 1.47, "learning_rate": 7.94331498959254e-05, "loss": 0.008, "step": 567270 }, { "epoch": 1.47, "learning_rate": 7.942926167955394e-05, "loss": 0.0095, "step": 567280 }, { "epoch": 1.47, "learning_rate": 7.942537346318246e-05, "loss": 0.0096, "step": 567290 }, { "epoch": 1.47, "learning_rate": 7.9421485246811e-05, "loss": 0.0083, "step": 567300 }, { "epoch": 1.47, "learning_rate": 7.941759703043953e-05, "loss": 0.01, "step": 567310 }, { "epoch": 1.47, "learning_rate": 7.941370881406809e-05, "loss": 0.0095, "step": 567320 }, { "epoch": 1.47, "learning_rate": 7.940982059769662e-05, "loss": 0.0078, "step": 567330 }, { "epoch": 1.47, "learning_rate": 7.940593238132516e-05, "loss": 0.0113, "step": 567340 }, { "epoch": 1.47, "learning_rate": 7.940204416495369e-05, "loss": 0.0099, "step": 567350 }, { "epoch": 1.47, "learning_rate": 7.939815594858223e-05, "loss": 0.0095, "step": 567360 }, { "epoch": 1.47, "learning_rate": 7.939426773221076e-05, "loss": 0.0119, "step": 567370 }, { "epoch": 1.47, "learning_rate": 7.93903795158393e-05, "loss": 0.01, "step": 567380 }, { "epoch": 1.47, "learning_rate": 7.938649129946783e-05, "loss": 0.0097, "step": 567390 }, { "epoch": 1.47, "learning_rate": 7.938260308309637e-05, "loss": 0.0111, "step": 567400 }, { "epoch": 1.47, "learning_rate": 7.93787148667249e-05, "loss": 0.0089, "step": 567410 }, { "epoch": 1.47, "learning_rate": 7.937482665035342e-05, "loss": 0.0105, "step": 567420 }, { "epoch": 1.47, "learning_rate": 7.937093843398197e-05, "loss": 0.0085, "step": 567430 }, { "epoch": 1.47, "learning_rate": 7.93670502176105e-05, "loss": 0.0106, "step": 567440 }, { "epoch": 1.47, "learning_rate": 7.936316200123904e-05, "loss": 0.0121, "step": 567450 }, { "epoch": 1.47, "learning_rate": 7.935927378486756e-05, "loss": 0.0103, "step": 567460 }, { "epoch": 1.47, "learning_rate": 7.93553855684961e-05, "loss": 0.0115, "step": 567470 }, { "epoch": 1.47, "learning_rate": 7.935149735212463e-05, "loss": 0.0093, "step": 567480 }, { "epoch": 1.47, "learning_rate": 7.934760913575319e-05, "loss": 0.0082, "step": 567490 }, { "epoch": 1.47, "learning_rate": 7.93437209193817e-05, "loss": 0.012, "step": 567500 }, { "epoch": 1.47, "learning_rate": 7.933983270301026e-05, "loss": 0.0072, "step": 567510 }, { "epoch": 1.47, "learning_rate": 7.933594448663879e-05, "loss": 0.0072, "step": 567520 }, { "epoch": 1.47, "learning_rate": 7.933205627026733e-05, "loss": 0.0082, "step": 567530 }, { "epoch": 1.47, "learning_rate": 7.932816805389586e-05, "loss": 0.0089, "step": 567540 }, { "epoch": 1.47, "learning_rate": 7.93242798375244e-05, "loss": 0.0104, "step": 567550 }, { "epoch": 1.47, "learning_rate": 7.932039162115293e-05, "loss": 0.009, "step": 567560 }, { "epoch": 1.47, "learning_rate": 7.931650340478147e-05, "loss": 0.01, "step": 567570 }, { "epoch": 1.47, "learning_rate": 7.931261518841e-05, "loss": 0.0069, "step": 567580 }, { "epoch": 1.47, "learning_rate": 7.930872697203854e-05, "loss": 0.0093, "step": 567590 }, { "epoch": 1.47, "learning_rate": 7.930483875566706e-05, "loss": 0.0075, "step": 567600 }, { "epoch": 1.47, "learning_rate": 7.93009505392956e-05, "loss": 0.0081, "step": 567610 }, { "epoch": 1.47, "learning_rate": 7.929706232292413e-05, "loss": 0.0091, "step": 567620 }, { "epoch": 1.47, "learning_rate": 7.929317410655268e-05, "loss": 0.0089, "step": 567630 }, { "epoch": 1.47, "learning_rate": 7.92892858901812e-05, "loss": 0.0081, "step": 567640 }, { "epoch": 1.47, "learning_rate": 7.928539767380976e-05, "loss": 0.0093, "step": 567650 }, { "epoch": 1.47, "learning_rate": 7.928150945743827e-05, "loss": 0.0105, "step": 567660 }, { "epoch": 1.47, "learning_rate": 7.92776212410668e-05, "loss": 0.0104, "step": 567670 }, { "epoch": 1.47, "learning_rate": 7.927373302469536e-05, "loss": 0.0091, "step": 567680 }, { "epoch": 1.47, "learning_rate": 7.926984480832389e-05, "loss": 0.0073, "step": 567690 }, { "epoch": 1.47, "learning_rate": 7.926595659195243e-05, "loss": 0.011, "step": 567700 }, { "epoch": 1.47, "learning_rate": 7.926206837558096e-05, "loss": 0.0114, "step": 567710 }, { "epoch": 1.47, "learning_rate": 7.92581801592095e-05, "loss": 0.0082, "step": 567720 }, { "epoch": 1.47, "learning_rate": 7.925429194283802e-05, "loss": 0.0086, "step": 567730 }, { "epoch": 1.47, "learning_rate": 7.925040372646657e-05, "loss": 0.0101, "step": 567740 }, { "epoch": 1.47, "learning_rate": 7.92465155100951e-05, "loss": 0.0079, "step": 567750 }, { "epoch": 1.47, "learning_rate": 7.924262729372364e-05, "loss": 0.008, "step": 567760 }, { "epoch": 1.47, "learning_rate": 7.923873907735216e-05, "loss": 0.009, "step": 567770 }, { "epoch": 1.47, "learning_rate": 7.92348508609807e-05, "loss": 0.0076, "step": 567780 }, { "epoch": 1.47, "learning_rate": 7.923096264460923e-05, "loss": 0.0098, "step": 567790 }, { "epoch": 1.47, "learning_rate": 7.922707442823778e-05, "loss": 0.0096, "step": 567800 }, { "epoch": 1.47, "learning_rate": 7.92231862118663e-05, "loss": 0.0085, "step": 567810 }, { "epoch": 1.47, "learning_rate": 7.921929799549485e-05, "loss": 0.01, "step": 567820 }, { "epoch": 1.47, "learning_rate": 7.921540977912337e-05, "loss": 0.0091, "step": 567830 }, { "epoch": 1.47, "learning_rate": 7.921152156275193e-05, "loss": 0.0091, "step": 567840 }, { "epoch": 1.47, "learning_rate": 7.920763334638046e-05, "loss": 0.0065, "step": 567850 }, { "epoch": 1.47, "learning_rate": 7.9203745130009e-05, "loss": 0.0121, "step": 567860 }, { "epoch": 1.47, "learning_rate": 7.919985691363753e-05, "loss": 0.0118, "step": 567870 }, { "epoch": 1.47, "learning_rate": 7.919596869726607e-05, "loss": 0.0093, "step": 567880 }, { "epoch": 1.47, "learning_rate": 7.91920804808946e-05, "loss": 0.0082, "step": 567890 }, { "epoch": 1.47, "learning_rate": 7.918819226452314e-05, "loss": 0.0106, "step": 567900 }, { "epoch": 1.47, "learning_rate": 7.918430404815167e-05, "loss": 0.0122, "step": 567910 }, { "epoch": 1.47, "learning_rate": 7.91804158317802e-05, "loss": 0.0091, "step": 567920 }, { "epoch": 1.47, "learning_rate": 7.917652761540874e-05, "loss": 0.0086, "step": 567930 }, { "epoch": 1.47, "learning_rate": 7.917263939903726e-05, "loss": 0.0093, "step": 567940 }, { "epoch": 1.47, "learning_rate": 7.91687511826658e-05, "loss": 0.0095, "step": 567950 }, { "epoch": 1.47, "learning_rate": 7.916486296629433e-05, "loss": 0.0099, "step": 567960 }, { "epoch": 1.47, "learning_rate": 7.916097474992288e-05, "loss": 0.0093, "step": 567970 }, { "epoch": 1.47, "learning_rate": 7.91570865335514e-05, "loss": 0.0104, "step": 567980 }, { "epoch": 1.47, "learning_rate": 7.915319831717994e-05, "loss": 0.0097, "step": 567990 }, { "epoch": 1.47, "learning_rate": 7.914931010080847e-05, "loss": 0.0078, "step": 568000 }, { "epoch": 1.47, "eval_cer": 0.8817166826925096, "eval_loss": 0.00597924692556262, "eval_runtime": 108.0502, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.627, "step": 568000 }, { "epoch": 1.47, "learning_rate": 7.914542188443703e-05, "loss": 0.0069, "step": 568010 }, { "epoch": 1.47, "learning_rate": 7.914153366806554e-05, "loss": 0.0116, "step": 568020 }, { "epoch": 1.47, "learning_rate": 7.91376454516941e-05, "loss": 0.0092, "step": 568030 }, { "epoch": 1.47, "learning_rate": 7.913375723532263e-05, "loss": 0.008, "step": 568040 }, { "epoch": 1.47, "learning_rate": 7.912986901895117e-05, "loss": 0.0079, "step": 568050 }, { "epoch": 1.47, "learning_rate": 7.91259808025797e-05, "loss": 0.0103, "step": 568060 }, { "epoch": 1.47, "learning_rate": 7.912209258620824e-05, "loss": 0.0118, "step": 568070 }, { "epoch": 1.47, "learning_rate": 7.911820436983677e-05, "loss": 0.0117, "step": 568080 }, { "epoch": 1.47, "learning_rate": 7.911431615346531e-05, "loss": 0.01, "step": 568090 }, { "epoch": 1.47, "learning_rate": 7.911042793709384e-05, "loss": 0.0088, "step": 568100 }, { "epoch": 1.47, "learning_rate": 7.910653972072238e-05, "loss": 0.0087, "step": 568110 }, { "epoch": 1.47, "learning_rate": 7.91026515043509e-05, "loss": 0.0118, "step": 568120 }, { "epoch": 1.47, "learning_rate": 7.909876328797945e-05, "loss": 0.01, "step": 568130 }, { "epoch": 1.47, "learning_rate": 7.909487507160797e-05, "loss": 0.0072, "step": 568140 }, { "epoch": 1.47, "learning_rate": 7.909098685523652e-05, "loss": 0.0112, "step": 568150 }, { "epoch": 1.47, "learning_rate": 7.908709863886504e-05, "loss": 0.0071, "step": 568160 }, { "epoch": 1.47, "learning_rate": 7.908321042249357e-05, "loss": 0.0095, "step": 568170 }, { "epoch": 1.47, "learning_rate": 7.907932220612211e-05, "loss": 0.0101, "step": 568180 }, { "epoch": 1.47, "learning_rate": 7.907543398975064e-05, "loss": 0.0118, "step": 568190 }, { "epoch": 1.47, "learning_rate": 7.90715457733792e-05, "loss": 0.008, "step": 568200 }, { "epoch": 1.47, "learning_rate": 7.906765755700773e-05, "loss": 0.0128, "step": 568210 }, { "epoch": 1.47, "learning_rate": 7.906376934063627e-05, "loss": 0.0096, "step": 568220 }, { "epoch": 1.47, "learning_rate": 7.90598811242648e-05, "loss": 0.0088, "step": 568230 }, { "epoch": 1.47, "learning_rate": 7.905599290789334e-05, "loss": 0.0123, "step": 568240 }, { "epoch": 1.47, "learning_rate": 7.905210469152186e-05, "loss": 0.0081, "step": 568250 }, { "epoch": 1.47, "learning_rate": 7.90482164751504e-05, "loss": 0.0117, "step": 568260 }, { "epoch": 1.47, "learning_rate": 7.904432825877893e-05, "loss": 0.0101, "step": 568270 }, { "epoch": 1.47, "learning_rate": 7.904044004240748e-05, "loss": 0.0088, "step": 568280 }, { "epoch": 1.47, "learning_rate": 7.9036551826036e-05, "loss": 0.0107, "step": 568290 }, { "epoch": 1.47, "learning_rate": 7.903266360966455e-05, "loss": 0.0065, "step": 568300 }, { "epoch": 1.47, "learning_rate": 7.902877539329307e-05, "loss": 0.0075, "step": 568310 }, { "epoch": 1.47, "learning_rate": 7.902488717692162e-05, "loss": 0.0075, "step": 568320 }, { "epoch": 1.47, "learning_rate": 7.902099896055014e-05, "loss": 0.01, "step": 568330 }, { "epoch": 1.47, "learning_rate": 7.901711074417869e-05, "loss": 0.0106, "step": 568340 }, { "epoch": 1.47, "learning_rate": 7.901322252780721e-05, "loss": 0.0072, "step": 568350 }, { "epoch": 1.47, "learning_rate": 7.900933431143577e-05, "loss": 0.0117, "step": 568360 }, { "epoch": 1.47, "learning_rate": 7.900544609506428e-05, "loss": 0.0087, "step": 568370 }, { "epoch": 1.47, "learning_rate": 7.900155787869284e-05, "loss": 0.0088, "step": 568380 }, { "epoch": 1.47, "learning_rate": 7.899766966232137e-05, "loss": 0.0103, "step": 568390 }, { "epoch": 1.47, "learning_rate": 7.899378144594991e-05, "loss": 0.0093, "step": 568400 }, { "epoch": 1.47, "learning_rate": 7.898989322957844e-05, "loss": 0.0096, "step": 568410 }, { "epoch": 1.47, "learning_rate": 7.898600501320696e-05, "loss": 0.0109, "step": 568420 }, { "epoch": 1.47, "learning_rate": 7.89821167968355e-05, "loss": 0.0158, "step": 568430 }, { "epoch": 1.47, "learning_rate": 7.897822858046403e-05, "loss": 0.0086, "step": 568440 }, { "epoch": 1.47, "learning_rate": 7.897434036409258e-05, "loss": 0.009, "step": 568450 }, { "epoch": 1.47, "learning_rate": 7.89704521477211e-05, "loss": 0.0079, "step": 568460 }, { "epoch": 1.47, "learning_rate": 7.896656393134965e-05, "loss": 0.0116, "step": 568470 }, { "epoch": 1.47, "learning_rate": 7.896267571497817e-05, "loss": 0.0095, "step": 568480 }, { "epoch": 1.47, "learning_rate": 7.895878749860671e-05, "loss": 0.0085, "step": 568490 }, { "epoch": 1.47, "learning_rate": 7.895489928223524e-05, "loss": 0.0096, "step": 568500 }, { "epoch": 1.47, "learning_rate": 7.895101106586378e-05, "loss": 0.0153, "step": 568510 }, { "epoch": 1.47, "learning_rate": 7.894712284949231e-05, "loss": 0.0092, "step": 568520 }, { "epoch": 1.47, "learning_rate": 7.894323463312085e-05, "loss": 0.0089, "step": 568530 }, { "epoch": 1.47, "learning_rate": 7.893934641674938e-05, "loss": 0.0098, "step": 568540 }, { "epoch": 1.47, "learning_rate": 7.893545820037794e-05, "loss": 0.0081, "step": 568550 }, { "epoch": 1.47, "learning_rate": 7.893156998400647e-05, "loss": 0.0156, "step": 568560 }, { "epoch": 1.47, "learning_rate": 7.892768176763501e-05, "loss": 0.0088, "step": 568570 }, { "epoch": 1.47, "learning_rate": 7.892379355126354e-05, "loss": 0.0101, "step": 568580 }, { "epoch": 1.47, "learning_rate": 7.891990533489208e-05, "loss": 0.0109, "step": 568590 }, { "epoch": 1.47, "learning_rate": 7.89160171185206e-05, "loss": 0.0112, "step": 568600 }, { "epoch": 1.47, "learning_rate": 7.891212890214915e-05, "loss": 0.0104, "step": 568610 }, { "epoch": 1.47, "learning_rate": 7.890824068577767e-05, "loss": 0.0118, "step": 568620 }, { "epoch": 1.47, "learning_rate": 7.890435246940622e-05, "loss": 0.0127, "step": 568630 }, { "epoch": 1.47, "learning_rate": 7.890046425303474e-05, "loss": 0.0087, "step": 568640 }, { "epoch": 1.47, "learning_rate": 7.889657603666329e-05, "loss": 0.0093, "step": 568650 }, { "epoch": 1.47, "learning_rate": 7.889268782029181e-05, "loss": 0.0078, "step": 568660 }, { "epoch": 1.47, "learning_rate": 7.888879960392034e-05, "loss": 0.0068, "step": 568670 }, { "epoch": 1.47, "learning_rate": 7.888491138754888e-05, "loss": 0.0093, "step": 568680 }, { "epoch": 1.47, "learning_rate": 7.888102317117741e-05, "loss": 0.009, "step": 568690 }, { "epoch": 1.47, "learning_rate": 7.887713495480595e-05, "loss": 0.0089, "step": 568700 }, { "epoch": 1.47, "learning_rate": 7.887324673843448e-05, "loss": 0.0117, "step": 568710 }, { "epoch": 1.47, "learning_rate": 7.886935852206304e-05, "loss": 0.0078, "step": 568720 }, { "epoch": 1.47, "learning_rate": 7.886547030569155e-05, "loss": 0.0112, "step": 568730 }, { "epoch": 1.47, "learning_rate": 7.886158208932011e-05, "loss": 0.0084, "step": 568740 }, { "epoch": 1.47, "learning_rate": 7.885769387294863e-05, "loss": 0.0072, "step": 568750 }, { "epoch": 1.47, "learning_rate": 7.885380565657718e-05, "loss": 0.0104, "step": 568760 }, { "epoch": 1.47, "learning_rate": 7.88499174402057e-05, "loss": 0.0088, "step": 568770 }, { "epoch": 1.47, "learning_rate": 7.884602922383425e-05, "loss": 0.0064, "step": 568780 }, { "epoch": 1.47, "learning_rate": 7.884214100746277e-05, "loss": 0.0078, "step": 568790 }, { "epoch": 1.47, "learning_rate": 7.883825279109132e-05, "loss": 0.011, "step": 568800 }, { "epoch": 1.47, "learning_rate": 7.883436457471984e-05, "loss": 0.0109, "step": 568810 }, { "epoch": 1.47, "learning_rate": 7.883047635834839e-05, "loss": 0.0111, "step": 568820 }, { "epoch": 1.47, "learning_rate": 7.882658814197691e-05, "loss": 0.0079, "step": 568830 }, { "epoch": 1.47, "learning_rate": 7.882269992560546e-05, "loss": 0.0079, "step": 568840 }, { "epoch": 1.47, "learning_rate": 7.881881170923398e-05, "loss": 0.0076, "step": 568850 }, { "epoch": 1.47, "learning_rate": 7.881492349286253e-05, "loss": 0.0084, "step": 568860 }, { "epoch": 1.47, "learning_rate": 7.881103527649105e-05, "loss": 0.0067, "step": 568870 }, { "epoch": 1.47, "learning_rate": 7.880714706011961e-05, "loss": 0.0101, "step": 568880 }, { "epoch": 1.47, "learning_rate": 7.880325884374812e-05, "loss": 0.0073, "step": 568890 }, { "epoch": 1.47, "learning_rate": 7.879937062737668e-05, "loss": 0.0087, "step": 568900 }, { "epoch": 1.47, "learning_rate": 7.87954824110052e-05, "loss": 0.0105, "step": 568910 }, { "epoch": 1.47, "learning_rate": 7.879159419463373e-05, "loss": 0.0071, "step": 568920 }, { "epoch": 1.47, "learning_rate": 7.878770597826228e-05, "loss": 0.0065, "step": 568930 }, { "epoch": 1.47, "learning_rate": 7.87838177618908e-05, "loss": 0.0073, "step": 568940 }, { "epoch": 1.47, "learning_rate": 7.877992954551935e-05, "loss": 0.0064, "step": 568950 }, { "epoch": 1.47, "learning_rate": 7.877604132914787e-05, "loss": 0.0083, "step": 568960 }, { "epoch": 1.47, "learning_rate": 7.877215311277642e-05, "loss": 0.0085, "step": 568970 }, { "epoch": 1.47, "learning_rate": 7.876826489640494e-05, "loss": 0.0077, "step": 568980 }, { "epoch": 1.47, "learning_rate": 7.876437668003349e-05, "loss": 0.0102, "step": 568990 }, { "epoch": 1.47, "learning_rate": 7.876048846366201e-05, "loss": 0.0089, "step": 569000 }, { "epoch": 1.47, "eval_cer": 0.8816956881384969, "eval_loss": 0.006051726173609495, "eval_runtime": 107.8929, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 569000 }, { "epoch": 1.47, "learning_rate": 7.875660024729055e-05, "loss": 0.0087, "step": 569010 }, { "epoch": 1.47, "learning_rate": 7.875271203091908e-05, "loss": 0.0106, "step": 569020 }, { "epoch": 1.48, "learning_rate": 7.874882381454762e-05, "loss": 0.0075, "step": 569030 }, { "epoch": 1.48, "learning_rate": 7.874493559817615e-05, "loss": 0.0093, "step": 569040 }, { "epoch": 1.48, "learning_rate": 7.87410473818047e-05, "loss": 0.0096, "step": 569050 }, { "epoch": 1.48, "learning_rate": 7.873715916543322e-05, "loss": 0.0087, "step": 569060 }, { "epoch": 1.48, "learning_rate": 7.873327094906178e-05, "loss": 0.0067, "step": 569070 }, { "epoch": 1.48, "learning_rate": 7.87293827326903e-05, "loss": 0.01, "step": 569080 }, { "epoch": 1.48, "learning_rate": 7.872549451631885e-05, "loss": 0.0074, "step": 569090 }, { "epoch": 1.48, "learning_rate": 7.872160629994738e-05, "loss": 0.0089, "step": 569100 }, { "epoch": 1.48, "learning_rate": 7.871771808357592e-05, "loss": 0.0098, "step": 569110 }, { "epoch": 1.48, "learning_rate": 7.871382986720445e-05, "loss": 0.0114, "step": 569120 }, { "epoch": 1.48, "learning_rate": 7.870994165083299e-05, "loss": 0.0083, "step": 569130 }, { "epoch": 1.48, "learning_rate": 7.870605343446151e-05, "loss": 0.008, "step": 569140 }, { "epoch": 1.48, "learning_rate": 7.870216521809006e-05, "loss": 0.0102, "step": 569150 }, { "epoch": 1.48, "learning_rate": 7.869827700171858e-05, "loss": 0.0074, "step": 569160 }, { "epoch": 1.48, "learning_rate": 7.869438878534711e-05, "loss": 0.0081, "step": 569170 }, { "epoch": 1.48, "learning_rate": 7.869050056897565e-05, "loss": 0.0106, "step": 569180 }, { "epoch": 1.48, "learning_rate": 7.868661235260418e-05, "loss": 0.0079, "step": 569190 }, { "epoch": 1.48, "learning_rate": 7.868272413623272e-05, "loss": 0.0111, "step": 569200 }, { "epoch": 1.48, "learning_rate": 7.867883591986125e-05, "loss": 0.01, "step": 569210 }, { "epoch": 1.48, "learning_rate": 7.86749477034898e-05, "loss": 0.01, "step": 569220 }, { "epoch": 1.48, "learning_rate": 7.867105948711832e-05, "loss": 0.0107, "step": 569230 }, { "epoch": 1.48, "learning_rate": 7.866717127074688e-05, "loss": 0.0092, "step": 569240 }, { "epoch": 1.48, "learning_rate": 7.866328305437539e-05, "loss": 0.0094, "step": 569250 }, { "epoch": 1.48, "learning_rate": 7.865939483800395e-05, "loss": 0.0126, "step": 569260 }, { "epoch": 1.48, "learning_rate": 7.865550662163247e-05, "loss": 0.0083, "step": 569270 }, { "epoch": 1.48, "learning_rate": 7.865161840526102e-05, "loss": 0.0115, "step": 569280 }, { "epoch": 1.48, "learning_rate": 7.864773018888954e-05, "loss": 0.0093, "step": 569290 }, { "epoch": 1.48, "learning_rate": 7.864384197251809e-05, "loss": 0.0082, "step": 569300 }, { "epoch": 1.48, "learning_rate": 7.863995375614661e-05, "loss": 0.0078, "step": 569310 }, { "epoch": 1.48, "learning_rate": 7.863606553977516e-05, "loss": 0.0093, "step": 569320 }, { "epoch": 1.48, "learning_rate": 7.863217732340368e-05, "loss": 0.0075, "step": 569330 }, { "epoch": 1.48, "learning_rate": 7.862828910703223e-05, "loss": 0.0101, "step": 569340 }, { "epoch": 1.48, "learning_rate": 7.862440089066075e-05, "loss": 0.0082, "step": 569350 }, { "epoch": 1.48, "learning_rate": 7.86205126742893e-05, "loss": 0.0072, "step": 569360 }, { "epoch": 1.48, "learning_rate": 7.861662445791782e-05, "loss": 0.0085, "step": 569370 }, { "epoch": 1.48, "learning_rate": 7.861273624154637e-05, "loss": 0.0109, "step": 569380 }, { "epoch": 1.48, "learning_rate": 7.860884802517489e-05, "loss": 0.0112, "step": 569390 }, { "epoch": 1.48, "learning_rate": 7.860495980880345e-05, "loss": 0.009, "step": 569400 }, { "epoch": 1.48, "learning_rate": 7.860107159243196e-05, "loss": 0.0109, "step": 569410 }, { "epoch": 1.48, "learning_rate": 7.859718337606049e-05, "loss": 0.0117, "step": 569420 }, { "epoch": 1.48, "learning_rate": 7.859329515968905e-05, "loss": 0.0089, "step": 569430 }, { "epoch": 1.48, "learning_rate": 7.858940694331757e-05, "loss": 0.0084, "step": 569440 }, { "epoch": 1.48, "learning_rate": 7.858551872694612e-05, "loss": 0.0086, "step": 569450 }, { "epoch": 1.48, "learning_rate": 7.858163051057464e-05, "loss": 0.0087, "step": 569460 }, { "epoch": 1.48, "learning_rate": 7.857774229420319e-05, "loss": 0.0109, "step": 569470 }, { "epoch": 1.48, "learning_rate": 7.857385407783171e-05, "loss": 0.0078, "step": 569480 }, { "epoch": 1.48, "learning_rate": 7.856996586146026e-05, "loss": 0.0077, "step": 569490 }, { "epoch": 1.48, "learning_rate": 7.856607764508878e-05, "loss": 0.0065, "step": 569500 }, { "epoch": 1.48, "learning_rate": 7.856218942871733e-05, "loss": 0.0102, "step": 569510 }, { "epoch": 1.48, "learning_rate": 7.855830121234585e-05, "loss": 0.0093, "step": 569520 }, { "epoch": 1.48, "learning_rate": 7.85544129959744e-05, "loss": 0.0098, "step": 569530 }, { "epoch": 1.48, "learning_rate": 7.855052477960292e-05, "loss": 0.0083, "step": 569540 }, { "epoch": 1.48, "learning_rate": 7.854663656323146e-05, "loss": 0.0073, "step": 569550 }, { "epoch": 1.48, "learning_rate": 7.854274834685999e-05, "loss": 0.0117, "step": 569560 }, { "epoch": 1.48, "learning_rate": 7.853886013048853e-05, "loss": 0.007, "step": 569570 }, { "epoch": 1.48, "learning_rate": 7.853497191411706e-05, "loss": 0.0083, "step": 569580 }, { "epoch": 1.48, "learning_rate": 7.853108369774562e-05, "loss": 0.0076, "step": 569590 }, { "epoch": 1.48, "learning_rate": 7.852719548137415e-05, "loss": 0.0102, "step": 569600 }, { "epoch": 1.48, "learning_rate": 7.852330726500269e-05, "loss": 0.009, "step": 569610 }, { "epoch": 1.48, "learning_rate": 7.851941904863122e-05, "loss": 0.0093, "step": 569620 }, { "epoch": 1.48, "learning_rate": 7.851553083225976e-05, "loss": 0.0087, "step": 569630 }, { "epoch": 1.48, "learning_rate": 7.851164261588829e-05, "loss": 0.0111, "step": 569640 }, { "epoch": 1.48, "learning_rate": 7.850775439951683e-05, "loss": 0.0095, "step": 569650 }, { "epoch": 1.48, "learning_rate": 7.850386618314535e-05, "loss": 0.0085, "step": 569660 }, { "epoch": 1.48, "learning_rate": 7.849997796677388e-05, "loss": 0.0101, "step": 569670 }, { "epoch": 1.48, "learning_rate": 7.849608975040242e-05, "loss": 0.0085, "step": 569680 }, { "epoch": 1.48, "learning_rate": 7.849220153403095e-05, "loss": 0.0108, "step": 569690 }, { "epoch": 1.48, "learning_rate": 7.84883133176595e-05, "loss": 0.0072, "step": 569700 }, { "epoch": 1.48, "learning_rate": 7.848442510128802e-05, "loss": 0.0086, "step": 569710 }, { "epoch": 1.48, "learning_rate": 7.848053688491656e-05, "loss": 0.008, "step": 569720 }, { "epoch": 1.48, "learning_rate": 7.847664866854509e-05, "loss": 0.0074, "step": 569730 }, { "epoch": 1.48, "learning_rate": 7.847276045217363e-05, "loss": 0.0079, "step": 569740 }, { "epoch": 1.48, "learning_rate": 7.846887223580216e-05, "loss": 0.0128, "step": 569750 }, { "epoch": 1.48, "learning_rate": 7.84649840194307e-05, "loss": 0.0089, "step": 569760 }, { "epoch": 1.48, "learning_rate": 7.846109580305923e-05, "loss": 0.0123, "step": 569770 }, { "epoch": 1.48, "learning_rate": 7.845720758668779e-05, "loss": 0.0082, "step": 569780 }, { "epoch": 1.48, "learning_rate": 7.845331937031631e-05, "loss": 0.0071, "step": 569790 }, { "epoch": 1.48, "learning_rate": 7.844943115394486e-05, "loss": 0.0084, "step": 569800 }, { "epoch": 1.48, "learning_rate": 7.844554293757338e-05, "loss": 0.0109, "step": 569810 }, { "epoch": 1.48, "learning_rate": 7.844165472120193e-05, "loss": 0.009, "step": 569820 }, { "epoch": 1.48, "learning_rate": 7.843776650483045e-05, "loss": 0.0101, "step": 569830 }, { "epoch": 1.48, "learning_rate": 7.8433878288459e-05, "loss": 0.0076, "step": 569840 }, { "epoch": 1.48, "learning_rate": 7.842999007208752e-05, "loss": 0.0137, "step": 569850 }, { "epoch": 1.48, "learning_rate": 7.842610185571607e-05, "loss": 0.0097, "step": 569860 }, { "epoch": 1.48, "learning_rate": 7.84222136393446e-05, "loss": 0.0088, "step": 569870 }, { "epoch": 1.48, "learning_rate": 7.841832542297314e-05, "loss": 0.0079, "step": 569880 }, { "epoch": 1.48, "learning_rate": 7.841443720660166e-05, "loss": 0.0112, "step": 569890 }, { "epoch": 1.48, "learning_rate": 7.84105489902302e-05, "loss": 0.0108, "step": 569900 }, { "epoch": 1.48, "learning_rate": 7.840666077385873e-05, "loss": 0.0071, "step": 569910 }, { "epoch": 1.48, "learning_rate": 7.840277255748726e-05, "loss": 0.0103, "step": 569920 }, { "epoch": 1.48, "learning_rate": 7.83988843411158e-05, "loss": 0.0089, "step": 569930 }, { "epoch": 1.48, "learning_rate": 7.839499612474433e-05, "loss": 0.0106, "step": 569940 }, { "epoch": 1.48, "learning_rate": 7.839110790837289e-05, "loss": 0.0091, "step": 569950 }, { "epoch": 1.48, "learning_rate": 7.83872196920014e-05, "loss": 0.01, "step": 569960 }, { "epoch": 1.48, "learning_rate": 7.838333147562996e-05, "loss": 0.0099, "step": 569970 }, { "epoch": 1.48, "learning_rate": 7.837944325925848e-05, "loss": 0.008, "step": 569980 }, { "epoch": 1.48, "learning_rate": 7.837555504288703e-05, "loss": 0.0091, "step": 569990 }, { "epoch": 1.48, "learning_rate": 7.837166682651555e-05, "loss": 0.009, "step": 570000 }, { "epoch": 1.48, "eval_cer": 0.8817082848709045, "eval_loss": 0.006050651427358389, "eval_runtime": 107.8737, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 570000 }, { "epoch": 1.48, "learning_rate": 7.83677786101441e-05, "loss": 0.0104, "step": 570010 }, { "epoch": 1.48, "learning_rate": 7.836389039377262e-05, "loss": 0.0105, "step": 570020 }, { "epoch": 1.48, "learning_rate": 7.836000217740116e-05, "loss": 0.0102, "step": 570030 }, { "epoch": 1.48, "learning_rate": 7.835611396102969e-05, "loss": 0.0104, "step": 570040 }, { "epoch": 1.48, "learning_rate": 7.835222574465823e-05, "loss": 0.0061, "step": 570050 }, { "epoch": 1.48, "learning_rate": 7.834833752828676e-05, "loss": 0.013, "step": 570060 }, { "epoch": 1.48, "learning_rate": 7.83444493119153e-05, "loss": 0.0066, "step": 570070 }, { "epoch": 1.48, "learning_rate": 7.834056109554383e-05, "loss": 0.0128, "step": 570080 }, { "epoch": 1.48, "learning_rate": 7.833667287917237e-05, "loss": 0.011, "step": 570090 }, { "epoch": 1.48, "learning_rate": 7.83327846628009e-05, "loss": 0.0109, "step": 570100 }, { "epoch": 1.48, "learning_rate": 7.832889644642946e-05, "loss": 0.0106, "step": 570110 }, { "epoch": 1.48, "learning_rate": 7.832500823005797e-05, "loss": 0.0059, "step": 570120 }, { "epoch": 1.48, "learning_rate": 7.832112001368653e-05, "loss": 0.0074, "step": 570130 }, { "epoch": 1.48, "learning_rate": 7.831723179731506e-05, "loss": 0.0123, "step": 570140 }, { "epoch": 1.48, "learning_rate": 7.831334358094358e-05, "loss": 0.0145, "step": 570150 }, { "epoch": 1.48, "learning_rate": 7.830945536457212e-05, "loss": 0.0084, "step": 570160 }, { "epoch": 1.48, "learning_rate": 7.830556714820065e-05, "loss": 0.0082, "step": 570170 }, { "epoch": 1.48, "learning_rate": 7.83016789318292e-05, "loss": 0.01, "step": 570180 }, { "epoch": 1.48, "learning_rate": 7.829779071545772e-05, "loss": 0.0111, "step": 570190 }, { "epoch": 1.48, "learning_rate": 7.829390249908626e-05, "loss": 0.0093, "step": 570200 }, { "epoch": 1.48, "learning_rate": 7.829001428271479e-05, "loss": 0.0084, "step": 570210 }, { "epoch": 1.48, "learning_rate": 7.828612606634333e-05, "loss": 0.0111, "step": 570220 }, { "epoch": 1.48, "learning_rate": 7.828223784997186e-05, "loss": 0.0096, "step": 570230 }, { "epoch": 1.48, "learning_rate": 7.82783496336004e-05, "loss": 0.0079, "step": 570240 }, { "epoch": 1.48, "learning_rate": 7.827446141722893e-05, "loss": 0.0085, "step": 570250 }, { "epoch": 1.48, "learning_rate": 7.827057320085747e-05, "loss": 0.0086, "step": 570260 }, { "epoch": 1.48, "learning_rate": 7.8266684984486e-05, "loss": 0.0063, "step": 570270 }, { "epoch": 1.48, "learning_rate": 7.826279676811454e-05, "loss": 0.0118, "step": 570280 }, { "epoch": 1.48, "learning_rate": 7.825890855174307e-05, "loss": 0.0081, "step": 570290 }, { "epoch": 1.48, "learning_rate": 7.825502033537163e-05, "loss": 0.0079, "step": 570300 }, { "epoch": 1.48, "learning_rate": 7.825113211900015e-05, "loss": 0.0094, "step": 570310 }, { "epoch": 1.48, "learning_rate": 7.82472439026287e-05, "loss": 0.0075, "step": 570320 }, { "epoch": 1.48, "learning_rate": 7.824335568625722e-05, "loss": 0.0141, "step": 570330 }, { "epoch": 1.48, "learning_rate": 7.823946746988577e-05, "loss": 0.011, "step": 570340 }, { "epoch": 1.48, "learning_rate": 7.82355792535143e-05, "loss": 0.009, "step": 570350 }, { "epoch": 1.48, "learning_rate": 7.823169103714284e-05, "loss": 0.0106, "step": 570360 }, { "epoch": 1.48, "learning_rate": 7.822780282077136e-05, "loss": 0.0083, "step": 570370 }, { "epoch": 1.48, "learning_rate": 7.82239146043999e-05, "loss": 0.0077, "step": 570380 }, { "epoch": 1.48, "learning_rate": 7.822002638802843e-05, "loss": 0.0083, "step": 570390 }, { "epoch": 1.48, "learning_rate": 7.821613817165696e-05, "loss": 0.0104, "step": 570400 }, { "epoch": 1.48, "learning_rate": 7.82122499552855e-05, "loss": 0.0152, "step": 570410 }, { "epoch": 1.48, "learning_rate": 7.820836173891403e-05, "loss": 0.0085, "step": 570420 }, { "epoch": 1.48, "learning_rate": 7.820447352254257e-05, "loss": 0.0074, "step": 570430 }, { "epoch": 1.48, "learning_rate": 7.82005853061711e-05, "loss": 0.0083, "step": 570440 }, { "epoch": 1.48, "learning_rate": 7.819669708979964e-05, "loss": 0.0116, "step": 570450 }, { "epoch": 1.48, "learning_rate": 7.819280887342817e-05, "loss": 0.0067, "step": 570460 }, { "epoch": 1.48, "learning_rate": 7.818892065705673e-05, "loss": 0.0104, "step": 570470 }, { "epoch": 1.48, "learning_rate": 7.818503244068524e-05, "loss": 0.0082, "step": 570480 }, { "epoch": 1.48, "learning_rate": 7.81811442243138e-05, "loss": 0.0201, "step": 570490 }, { "epoch": 1.48, "learning_rate": 7.817725600794232e-05, "loss": 0.009, "step": 570500 }, { "epoch": 1.48, "learning_rate": 7.817336779157087e-05, "loss": 0.011, "step": 570510 }, { "epoch": 1.48, "learning_rate": 7.81694795751994e-05, "loss": 0.0107, "step": 570520 }, { "epoch": 1.48, "learning_rate": 7.816559135882794e-05, "loss": 0.0103, "step": 570530 }, { "epoch": 1.48, "learning_rate": 7.816170314245646e-05, "loss": 0.0084, "step": 570540 }, { "epoch": 1.48, "learning_rate": 7.8157814926085e-05, "loss": 0.0079, "step": 570550 }, { "epoch": 1.48, "learning_rate": 7.815392670971353e-05, "loss": 0.0093, "step": 570560 }, { "epoch": 1.48, "learning_rate": 7.815003849334207e-05, "loss": 0.0069, "step": 570570 }, { "epoch": 1.48, "learning_rate": 7.81461502769706e-05, "loss": 0.0109, "step": 570580 }, { "epoch": 1.48, "learning_rate": 7.814226206059914e-05, "loss": 0.0079, "step": 570590 }, { "epoch": 1.48, "learning_rate": 7.813837384422767e-05, "loss": 0.0079, "step": 570600 }, { "epoch": 1.48, "learning_rate": 7.813448562785621e-05, "loss": 0.0115, "step": 570610 }, { "epoch": 1.48, "learning_rate": 7.813059741148474e-05, "loss": 0.0099, "step": 570620 }, { "epoch": 1.48, "learning_rate": 7.81267091951133e-05, "loss": 0.0102, "step": 570630 }, { "epoch": 1.48, "learning_rate": 7.812282097874181e-05, "loss": 0.0087, "step": 570640 }, { "epoch": 1.48, "learning_rate": 7.811893276237034e-05, "loss": 0.0072, "step": 570650 }, { "epoch": 1.48, "learning_rate": 7.81150445459989e-05, "loss": 0.0109, "step": 570660 }, { "epoch": 1.48, "learning_rate": 7.811115632962742e-05, "loss": 0.0069, "step": 570670 }, { "epoch": 1.48, "learning_rate": 7.810726811325596e-05, "loss": 0.0084, "step": 570680 }, { "epoch": 1.48, "learning_rate": 7.810337989688449e-05, "loss": 0.0102, "step": 570690 }, { "epoch": 1.48, "learning_rate": 7.809949168051303e-05, "loss": 0.0088, "step": 570700 }, { "epoch": 1.48, "learning_rate": 7.809560346414156e-05, "loss": 0.0084, "step": 570710 }, { "epoch": 1.48, "learning_rate": 7.80917152477701e-05, "loss": 0.0093, "step": 570720 }, { "epoch": 1.48, "learning_rate": 7.808782703139863e-05, "loss": 0.0099, "step": 570730 }, { "epoch": 1.48, "learning_rate": 7.808393881502717e-05, "loss": 0.0069, "step": 570740 }, { "epoch": 1.48, "learning_rate": 7.80800505986557e-05, "loss": 0.0086, "step": 570750 }, { "epoch": 1.48, "learning_rate": 7.807616238228424e-05, "loss": 0.0118, "step": 570760 }, { "epoch": 1.48, "learning_rate": 7.807227416591277e-05, "loss": 0.0089, "step": 570770 }, { "epoch": 1.48, "learning_rate": 7.806838594954131e-05, "loss": 0.0109, "step": 570780 }, { "epoch": 1.48, "learning_rate": 7.806449773316984e-05, "loss": 0.0107, "step": 570790 }, { "epoch": 1.48, "learning_rate": 7.806060951679838e-05, "loss": 0.0075, "step": 570800 }, { "epoch": 1.48, "learning_rate": 7.805672130042691e-05, "loss": 0.0079, "step": 570810 }, { "epoch": 1.48, "learning_rate": 7.805283308405547e-05, "loss": 0.0081, "step": 570820 }, { "epoch": 1.48, "learning_rate": 7.8048944867684e-05, "loss": 0.0103, "step": 570830 }, { "epoch": 1.48, "learning_rate": 7.804505665131254e-05, "loss": 0.0102, "step": 570840 }, { "epoch": 1.48, "learning_rate": 7.804116843494106e-05, "loss": 0.0076, "step": 570850 }, { "epoch": 1.48, "learning_rate": 7.80372802185696e-05, "loss": 0.0072, "step": 570860 }, { "epoch": 1.48, "learning_rate": 7.803339200219813e-05, "loss": 0.0099, "step": 570870 }, { "epoch": 1.48, "learning_rate": 7.802950378582668e-05, "loss": 0.008, "step": 570880 }, { "epoch": 1.48, "learning_rate": 7.80256155694552e-05, "loss": 0.0068, "step": 570890 }, { "epoch": 1.48, "learning_rate": 7.802172735308373e-05, "loss": 0.0111, "step": 570900 }, { "epoch": 1.48, "learning_rate": 7.801783913671227e-05, "loss": 0.0098, "step": 570910 }, { "epoch": 1.48, "learning_rate": 7.80139509203408e-05, "loss": 0.008, "step": 570920 }, { "epoch": 1.48, "learning_rate": 7.801006270396934e-05, "loss": 0.0091, "step": 570930 }, { "epoch": 1.48, "learning_rate": 7.800617448759787e-05, "loss": 0.0108, "step": 570940 }, { "epoch": 1.48, "learning_rate": 7.800228627122641e-05, "loss": 0.0078, "step": 570950 }, { "epoch": 1.48, "learning_rate": 7.799839805485494e-05, "loss": 0.0094, "step": 570960 }, { "epoch": 1.48, "learning_rate": 7.799450983848348e-05, "loss": 0.0079, "step": 570970 }, { "epoch": 1.48, "learning_rate": 7.799062162211201e-05, "loss": 0.0099, "step": 570980 }, { "epoch": 1.48, "learning_rate": 7.798673340574055e-05, "loss": 0.0118, "step": 570990 }, { "epoch": 1.48, "learning_rate": 7.798284518936908e-05, "loss": 0.0062, "step": 571000 }, { "epoch": 1.48, "eval_cer": 0.8816746935844841, "eval_loss": 0.006170371081680059, "eval_runtime": 108.0088, "eval_samples_per_second": 18.517, "eval_steps_per_second": 4.629, "step": 571000 }, { "epoch": 1.48, "learning_rate": 7.797895697299764e-05, "loss": 0.0086, "step": 571010 }, { "epoch": 1.48, "learning_rate": 7.797506875662616e-05, "loss": 0.0093, "step": 571020 }, { "epoch": 1.48, "learning_rate": 7.79711805402547e-05, "loss": 0.0103, "step": 571030 }, { "epoch": 1.48, "learning_rate": 7.796729232388323e-05, "loss": 0.0106, "step": 571040 }, { "epoch": 1.48, "learning_rate": 7.796340410751178e-05, "loss": 0.008, "step": 571050 }, { "epoch": 1.48, "learning_rate": 7.79595158911403e-05, "loss": 0.0081, "step": 571060 }, { "epoch": 1.48, "learning_rate": 7.795562767476884e-05, "loss": 0.0086, "step": 571070 }, { "epoch": 1.48, "learning_rate": 7.795173945839737e-05, "loss": 0.0071, "step": 571080 }, { "epoch": 1.48, "learning_rate": 7.794785124202591e-05, "loss": 0.0102, "step": 571090 }, { "epoch": 1.48, "learning_rate": 7.794396302565444e-05, "loss": 0.0121, "step": 571100 }, { "epoch": 1.48, "learning_rate": 7.794007480928298e-05, "loss": 0.0103, "step": 571110 }, { "epoch": 1.48, "learning_rate": 7.793618659291151e-05, "loss": 0.0094, "step": 571120 }, { "epoch": 1.48, "learning_rate": 7.793229837654005e-05, "loss": 0.0084, "step": 571130 }, { "epoch": 1.48, "learning_rate": 7.792841016016858e-05, "loss": 0.008, "step": 571140 }, { "epoch": 1.48, "learning_rate": 7.792452194379711e-05, "loss": 0.0111, "step": 571150 }, { "epoch": 1.48, "learning_rate": 7.792063372742565e-05, "loss": 0.0077, "step": 571160 }, { "epoch": 1.48, "learning_rate": 7.791674551105418e-05, "loss": 0.0098, "step": 571170 }, { "epoch": 1.48, "learning_rate": 7.791285729468273e-05, "loss": 0.0077, "step": 571180 }, { "epoch": 1.48, "learning_rate": 7.790896907831126e-05, "loss": 0.0133, "step": 571190 }, { "epoch": 1.48, "learning_rate": 7.79050808619398e-05, "loss": 0.0125, "step": 571200 }, { "epoch": 1.48, "learning_rate": 7.790119264556833e-05, "loss": 0.0082, "step": 571210 }, { "epoch": 1.48, "learning_rate": 7.789730442919687e-05, "loss": 0.0096, "step": 571220 }, { "epoch": 1.48, "learning_rate": 7.78934162128254e-05, "loss": 0.0092, "step": 571230 }, { "epoch": 1.48, "learning_rate": 7.788952799645394e-05, "loss": 0.0121, "step": 571240 }, { "epoch": 1.48, "learning_rate": 7.788563978008247e-05, "loss": 0.008, "step": 571250 }, { "epoch": 1.48, "learning_rate": 7.788175156371101e-05, "loss": 0.0068, "step": 571260 }, { "epoch": 1.48, "learning_rate": 7.787786334733954e-05, "loss": 0.0108, "step": 571270 }, { "epoch": 1.48, "learning_rate": 7.787397513096808e-05, "loss": 0.0093, "step": 571280 }, { "epoch": 1.48, "learning_rate": 7.787008691459661e-05, "loss": 0.0066, "step": 571290 }, { "epoch": 1.48, "learning_rate": 7.786619869822515e-05, "loss": 0.0087, "step": 571300 }, { "epoch": 1.48, "learning_rate": 7.786231048185368e-05, "loss": 0.0087, "step": 571310 }, { "epoch": 1.48, "learning_rate": 7.785842226548222e-05, "loss": 0.0131, "step": 571320 }, { "epoch": 1.48, "learning_rate": 7.785453404911075e-05, "loss": 0.0083, "step": 571330 }, { "epoch": 1.48, "learning_rate": 7.78506458327393e-05, "loss": 0.0093, "step": 571340 }, { "epoch": 1.48, "learning_rate": 7.784675761636782e-05, "loss": 0.0095, "step": 571350 }, { "epoch": 1.48, "learning_rate": 7.784286939999638e-05, "loss": 0.0102, "step": 571360 }, { "epoch": 1.48, "learning_rate": 7.78389811836249e-05, "loss": 0.0107, "step": 571370 }, { "epoch": 1.48, "learning_rate": 7.783509296725345e-05, "loss": 0.0123, "step": 571380 }, { "epoch": 1.48, "learning_rate": 7.783120475088197e-05, "loss": 0.0084, "step": 571390 }, { "epoch": 1.48, "learning_rate": 7.78273165345105e-05, "loss": 0.0082, "step": 571400 }, { "epoch": 1.48, "learning_rate": 7.782342831813904e-05, "loss": 0.0182, "step": 571410 }, { "epoch": 1.48, "learning_rate": 7.781954010176757e-05, "loss": 0.0076, "step": 571420 }, { "epoch": 1.48, "learning_rate": 7.781565188539611e-05, "loss": 0.0089, "step": 571430 }, { "epoch": 1.48, "learning_rate": 7.781176366902464e-05, "loss": 0.0125, "step": 571440 }, { "epoch": 1.48, "learning_rate": 7.780787545265318e-05, "loss": 0.0086, "step": 571450 }, { "epoch": 1.48, "learning_rate": 7.780398723628171e-05, "loss": 0.0097, "step": 571460 }, { "epoch": 1.48, "learning_rate": 7.780009901991025e-05, "loss": 0.0092, "step": 571470 }, { "epoch": 1.48, "learning_rate": 7.779621080353878e-05, "loss": 0.0082, "step": 571480 }, { "epoch": 1.48, "learning_rate": 7.779232258716732e-05, "loss": 0.0075, "step": 571490 }, { "epoch": 1.48, "learning_rate": 7.778843437079585e-05, "loss": 0.0092, "step": 571500 }, { "epoch": 1.48, "learning_rate": 7.778454615442439e-05, "loss": 0.0111, "step": 571510 }, { "epoch": 1.48, "learning_rate": 7.778065793805292e-05, "loss": 0.0129, "step": 571520 }, { "epoch": 1.48, "learning_rate": 7.777676972168148e-05, "loss": 0.0083, "step": 571530 }, { "epoch": 1.48, "learning_rate": 7.777288150531e-05, "loss": 0.0084, "step": 571540 }, { "epoch": 1.48, "learning_rate": 7.776899328893855e-05, "loss": 0.0083, "step": 571550 }, { "epoch": 1.48, "learning_rate": 7.776510507256707e-05, "loss": 0.0067, "step": 571560 }, { "epoch": 1.48, "learning_rate": 7.776121685619561e-05, "loss": 0.0096, "step": 571570 }, { "epoch": 1.48, "learning_rate": 7.775732863982414e-05, "loss": 0.0113, "step": 571580 }, { "epoch": 1.48, "learning_rate": 7.775344042345268e-05, "loss": 0.0091, "step": 571590 }, { "epoch": 1.48, "learning_rate": 7.774955220708121e-05, "loss": 0.0108, "step": 571600 }, { "epoch": 1.48, "learning_rate": 7.774566399070975e-05, "loss": 0.0081, "step": 571610 }, { "epoch": 1.48, "learning_rate": 7.774177577433828e-05, "loss": 0.0122, "step": 571620 }, { "epoch": 1.48, "learning_rate": 7.773788755796682e-05, "loss": 0.0089, "step": 571630 }, { "epoch": 1.48, "learning_rate": 7.773399934159535e-05, "loss": 0.0104, "step": 571640 }, { "epoch": 1.48, "learning_rate": 7.773011112522388e-05, "loss": 0.008, "step": 571650 }, { "epoch": 1.48, "learning_rate": 7.772622290885242e-05, "loss": 0.0086, "step": 571660 }, { "epoch": 1.48, "learning_rate": 7.772233469248095e-05, "loss": 0.0128, "step": 571670 }, { "epoch": 1.48, "learning_rate": 7.771844647610949e-05, "loss": 0.0093, "step": 571680 }, { "epoch": 1.48, "learning_rate": 7.771455825973802e-05, "loss": 0.0087, "step": 571690 }, { "epoch": 1.48, "learning_rate": 7.771067004336657e-05, "loss": 0.0089, "step": 571700 }, { "epoch": 1.48, "learning_rate": 7.770678182699509e-05, "loss": 0.0089, "step": 571710 }, { "epoch": 1.48, "learning_rate": 7.770289361062364e-05, "loss": 0.0084, "step": 571720 }, { "epoch": 1.48, "learning_rate": 7.769900539425217e-05, "loss": 0.0068, "step": 571730 }, { "epoch": 1.48, "learning_rate": 7.769511717788071e-05, "loss": 0.0096, "step": 571740 }, { "epoch": 1.48, "learning_rate": 7.769122896150924e-05, "loss": 0.0157, "step": 571750 }, { "epoch": 1.48, "learning_rate": 7.768734074513778e-05, "loss": 0.0083, "step": 571760 }, { "epoch": 1.48, "learning_rate": 7.768345252876631e-05, "loss": 0.0109, "step": 571770 }, { "epoch": 1.48, "learning_rate": 7.767956431239485e-05, "loss": 0.0095, "step": 571780 }, { "epoch": 1.48, "learning_rate": 7.767567609602338e-05, "loss": 0.0117, "step": 571790 }, { "epoch": 1.48, "learning_rate": 7.767178787965192e-05, "loss": 0.0115, "step": 571800 }, { "epoch": 1.48, "learning_rate": 7.766789966328045e-05, "loss": 0.0079, "step": 571810 }, { "epoch": 1.48, "learning_rate": 7.7664011446909e-05, "loss": 0.011, "step": 571820 }, { "epoch": 1.48, "learning_rate": 7.766012323053752e-05, "loss": 0.0088, "step": 571830 }, { "epoch": 1.48, "learning_rate": 7.765623501416606e-05, "loss": 0.0117, "step": 571840 }, { "epoch": 1.48, "learning_rate": 7.765234679779459e-05, "loss": 0.0091, "step": 571850 }, { "epoch": 1.48, "learning_rate": 7.764845858142315e-05, "loss": 0.0103, "step": 571860 }, { "epoch": 1.48, "learning_rate": 7.764457036505166e-05, "loss": 0.0096, "step": 571870 }, { "epoch": 1.48, "learning_rate": 7.764068214868022e-05, "loss": 0.0082, "step": 571880 }, { "epoch": 1.48, "learning_rate": 7.763679393230874e-05, "loss": 0.0098, "step": 571890 }, { "epoch": 1.48, "learning_rate": 7.763290571593727e-05, "loss": 0.0096, "step": 571900 }, { "epoch": 1.48, "learning_rate": 7.762901749956581e-05, "loss": 0.0112, "step": 571910 }, { "epoch": 1.48, "learning_rate": 7.762512928319434e-05, "loss": 0.0132, "step": 571920 }, { "epoch": 1.48, "learning_rate": 7.762124106682288e-05, "loss": 0.0104, "step": 571930 }, { "epoch": 1.48, "learning_rate": 7.761735285045141e-05, "loss": 0.0088, "step": 571940 }, { "epoch": 1.48, "learning_rate": 7.761346463407995e-05, "loss": 0.012, "step": 571950 }, { "epoch": 1.48, "learning_rate": 7.760957641770848e-05, "loss": 0.0097, "step": 571960 }, { "epoch": 1.48, "learning_rate": 7.760568820133702e-05, "loss": 0.0098, "step": 571970 }, { "epoch": 1.48, "learning_rate": 7.760179998496555e-05, "loss": 0.0113, "step": 571980 }, { "epoch": 1.48, "learning_rate": 7.759791176859409e-05, "loss": 0.0097, "step": 571990 }, { "epoch": 1.48, "learning_rate": 7.759402355222262e-05, "loss": 0.0086, "step": 572000 }, { "epoch": 1.48, "eval_cer": 0.8817110841447728, "eval_loss": 0.006190904416143894, "eval_runtime": 107.9681, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 572000 }, { "epoch": 1.48, "learning_rate": 7.759013533585116e-05, "loss": 0.0098, "step": 572010 }, { "epoch": 1.48, "learning_rate": 7.758624711947969e-05, "loss": 0.0122, "step": 572020 }, { "epoch": 1.48, "learning_rate": 7.758235890310823e-05, "loss": 0.0079, "step": 572030 }, { "epoch": 1.48, "learning_rate": 7.757847068673676e-05, "loss": 0.0092, "step": 572040 }, { "epoch": 1.48, "learning_rate": 7.757458247036532e-05, "loss": 0.0119, "step": 572050 }, { "epoch": 1.48, "learning_rate": 7.757069425399384e-05, "loss": 0.0092, "step": 572060 }, { "epoch": 1.48, "learning_rate": 7.756680603762239e-05, "loss": 0.0084, "step": 572070 }, { "epoch": 1.48, "learning_rate": 7.756291782125091e-05, "loss": 0.0123, "step": 572080 }, { "epoch": 1.48, "learning_rate": 7.755902960487945e-05, "loss": 0.0094, "step": 572090 }, { "epoch": 1.48, "learning_rate": 7.755514138850798e-05, "loss": 0.0118, "step": 572100 }, { "epoch": 1.48, "learning_rate": 7.755125317213652e-05, "loss": 0.0094, "step": 572110 }, { "epoch": 1.48, "learning_rate": 7.754736495576505e-05, "loss": 0.0081, "step": 572120 }, { "epoch": 1.48, "learning_rate": 7.75434767393936e-05, "loss": 0.0109, "step": 572130 }, { "epoch": 1.48, "learning_rate": 7.753958852302212e-05, "loss": 0.0091, "step": 572140 }, { "epoch": 1.48, "learning_rate": 7.753570030665065e-05, "loss": 0.0082, "step": 572150 }, { "epoch": 1.48, "learning_rate": 7.753181209027919e-05, "loss": 0.0111, "step": 572160 }, { "epoch": 1.48, "learning_rate": 7.752792387390772e-05, "loss": 0.0088, "step": 572170 }, { "epoch": 1.48, "learning_rate": 7.752403565753626e-05, "loss": 0.0069, "step": 572180 }, { "epoch": 1.48, "learning_rate": 7.752014744116479e-05, "loss": 0.0127, "step": 572190 }, { "epoch": 1.48, "learning_rate": 7.751625922479333e-05, "loss": 0.0099, "step": 572200 }, { "epoch": 1.48, "learning_rate": 7.751237100842186e-05, "loss": 0.0099, "step": 572210 }, { "epoch": 1.48, "learning_rate": 7.750848279205041e-05, "loss": 0.0074, "step": 572220 }, { "epoch": 1.48, "learning_rate": 7.750459457567893e-05, "loss": 0.0089, "step": 572230 }, { "epoch": 1.48, "learning_rate": 7.750070635930748e-05, "loss": 0.0078, "step": 572240 }, { "epoch": 1.48, "learning_rate": 7.749681814293601e-05, "loss": 0.0085, "step": 572250 }, { "epoch": 1.48, "learning_rate": 7.749292992656455e-05, "loss": 0.0083, "step": 572260 }, { "epoch": 1.48, "learning_rate": 7.748904171019308e-05, "loss": 0.0133, "step": 572270 }, { "epoch": 1.48, "learning_rate": 7.748515349382162e-05, "loss": 0.0107, "step": 572280 }, { "epoch": 1.48, "learning_rate": 7.748126527745015e-05, "loss": 0.0078, "step": 572290 }, { "epoch": 1.48, "learning_rate": 7.74773770610787e-05, "loss": 0.011, "step": 572300 }, { "epoch": 1.48, "learning_rate": 7.747348884470722e-05, "loss": 0.0093, "step": 572310 }, { "epoch": 1.48, "learning_rate": 7.746960062833576e-05, "loss": 0.0106, "step": 572320 }, { "epoch": 1.48, "learning_rate": 7.746571241196429e-05, "loss": 0.0079, "step": 572330 }, { "epoch": 1.48, "learning_rate": 7.746182419559283e-05, "loss": 0.0088, "step": 572340 }, { "epoch": 1.48, "learning_rate": 7.745793597922136e-05, "loss": 0.0088, "step": 572350 }, { "epoch": 1.48, "learning_rate": 7.74540477628499e-05, "loss": 0.0098, "step": 572360 }, { "epoch": 1.48, "learning_rate": 7.745015954647843e-05, "loss": 0.0074, "step": 572370 }, { "epoch": 1.48, "learning_rate": 7.744627133010697e-05, "loss": 0.011, "step": 572380 }, { "epoch": 1.48, "learning_rate": 7.74423831137355e-05, "loss": 0.012, "step": 572390 }, { "epoch": 1.48, "learning_rate": 7.743849489736403e-05, "loss": 0.0093, "step": 572400 }, { "epoch": 1.48, "learning_rate": 7.743460668099258e-05, "loss": 0.0084, "step": 572410 }, { "epoch": 1.48, "learning_rate": 7.743071846462111e-05, "loss": 0.0099, "step": 572420 }, { "epoch": 1.48, "learning_rate": 7.742683024824965e-05, "loss": 0.0094, "step": 572430 }, { "epoch": 1.48, "learning_rate": 7.742294203187818e-05, "loss": 0.0078, "step": 572440 }, { "epoch": 1.48, "learning_rate": 7.741905381550672e-05, "loss": 0.0091, "step": 572450 }, { "epoch": 1.48, "learning_rate": 7.741516559913525e-05, "loss": 0.0075, "step": 572460 }, { "epoch": 1.48, "learning_rate": 7.741127738276379e-05, "loss": 0.0081, "step": 572470 }, { "epoch": 1.48, "learning_rate": 7.740738916639232e-05, "loss": 0.0073, "step": 572480 }, { "epoch": 1.48, "learning_rate": 7.740350095002086e-05, "loss": 0.0093, "step": 572490 }, { "epoch": 1.48, "learning_rate": 7.739961273364939e-05, "loss": 0.0072, "step": 572500 }, { "epoch": 1.48, "learning_rate": 7.739572451727793e-05, "loss": 0.0115, "step": 572510 }, { "epoch": 1.48, "learning_rate": 7.739183630090646e-05, "loss": 0.0118, "step": 572520 }, { "epoch": 1.48, "learning_rate": 7.7387948084535e-05, "loss": 0.011, "step": 572530 }, { "epoch": 1.48, "learning_rate": 7.738405986816353e-05, "loss": 0.011, "step": 572540 }, { "epoch": 1.48, "learning_rate": 7.738017165179207e-05, "loss": 0.0104, "step": 572550 }, { "epoch": 1.48, "learning_rate": 7.73762834354206e-05, "loss": 0.0073, "step": 572560 }, { "epoch": 1.48, "learning_rate": 7.737239521904916e-05, "loss": 0.0079, "step": 572570 }, { "epoch": 1.48, "learning_rate": 7.736850700267767e-05, "loss": 0.0115, "step": 572580 }, { "epoch": 1.48, "learning_rate": 7.736461878630623e-05, "loss": 0.0093, "step": 572590 }, { "epoch": 1.48, "learning_rate": 7.736073056993475e-05, "loss": 0.0083, "step": 572600 }, { "epoch": 1.48, "learning_rate": 7.73568423535633e-05, "loss": 0.0087, "step": 572610 }, { "epoch": 1.48, "learning_rate": 7.735295413719182e-05, "loss": 0.0068, "step": 572620 }, { "epoch": 1.48, "learning_rate": 7.734906592082036e-05, "loss": 0.0107, "step": 572630 }, { "epoch": 1.48, "learning_rate": 7.734517770444889e-05, "loss": 0.0076, "step": 572640 }, { "epoch": 1.48, "learning_rate": 7.734128948807742e-05, "loss": 0.0082, "step": 572650 }, { "epoch": 1.48, "learning_rate": 7.733740127170596e-05, "loss": 0.013, "step": 572660 }, { "epoch": 1.48, "learning_rate": 7.733351305533449e-05, "loss": 0.01, "step": 572670 }, { "epoch": 1.48, "learning_rate": 7.732962483896303e-05, "loss": 0.0097, "step": 572680 }, { "epoch": 1.48, "learning_rate": 7.732573662259156e-05, "loss": 0.0093, "step": 572690 }, { "epoch": 1.48, "learning_rate": 7.73218484062201e-05, "loss": 0.0099, "step": 572700 }, { "epoch": 1.48, "learning_rate": 7.731796018984863e-05, "loss": 0.01, "step": 572710 }, { "epoch": 1.48, "learning_rate": 7.731407197347717e-05, "loss": 0.0119, "step": 572720 }, { "epoch": 1.48, "learning_rate": 7.73101837571057e-05, "loss": 0.0094, "step": 572730 }, { "epoch": 1.48, "learning_rate": 7.730629554073424e-05, "loss": 0.0101, "step": 572740 }, { "epoch": 1.48, "learning_rate": 7.730240732436277e-05, "loss": 0.0097, "step": 572750 }, { "epoch": 1.48, "learning_rate": 7.729851910799132e-05, "loss": 0.0078, "step": 572760 }, { "epoch": 1.48, "learning_rate": 7.729463089161985e-05, "loss": 0.0097, "step": 572770 }, { "epoch": 1.48, "learning_rate": 7.72907426752484e-05, "loss": 0.007, "step": 572780 }, { "epoch": 1.48, "learning_rate": 7.728685445887692e-05, "loss": 0.0091, "step": 572790 }, { "epoch": 1.48, "learning_rate": 7.728296624250546e-05, "loss": 0.0088, "step": 572800 }, { "epoch": 1.48, "learning_rate": 7.727907802613399e-05, "loss": 0.0071, "step": 572810 }, { "epoch": 1.48, "learning_rate": 7.727518980976253e-05, "loss": 0.0098, "step": 572820 }, { "epoch": 1.48, "learning_rate": 7.727130159339106e-05, "loss": 0.0067, "step": 572830 }, { "epoch": 1.48, "learning_rate": 7.72674133770196e-05, "loss": 0.008, "step": 572840 }, { "epoch": 1.48, "learning_rate": 7.726352516064813e-05, "loss": 0.0089, "step": 572850 }, { "epoch": 1.48, "learning_rate": 7.725963694427667e-05, "loss": 0.0088, "step": 572860 }, { "epoch": 1.48, "learning_rate": 7.72557487279052e-05, "loss": 0.0081, "step": 572870 }, { "epoch": 1.48, "learning_rate": 7.725186051153373e-05, "loss": 0.0098, "step": 572880 }, { "epoch": 1.49, "learning_rate": 7.724797229516227e-05, "loss": 0.0083, "step": 572890 }, { "epoch": 1.49, "learning_rate": 7.72440840787908e-05, "loss": 0.009, "step": 572900 }, { "epoch": 1.49, "learning_rate": 7.724019586241934e-05, "loss": 0.01, "step": 572910 }, { "epoch": 1.49, "learning_rate": 7.723630764604787e-05, "loss": 0.0096, "step": 572920 }, { "epoch": 1.49, "learning_rate": 7.723241942967642e-05, "loss": 0.0087, "step": 572930 }, { "epoch": 1.49, "learning_rate": 7.722853121330494e-05, "loss": 0.0075, "step": 572940 }, { "epoch": 1.49, "learning_rate": 7.72246429969335e-05, "loss": 0.0104, "step": 572950 }, { "epoch": 1.49, "learning_rate": 7.722075478056202e-05, "loss": 0.0134, "step": 572960 }, { "epoch": 1.49, "learning_rate": 7.721686656419056e-05, "loss": 0.0076, "step": 572970 }, { "epoch": 1.49, "learning_rate": 7.721297834781909e-05, "loss": 0.0069, "step": 572980 }, { "epoch": 1.49, "learning_rate": 7.720909013144763e-05, "loss": 0.0108, "step": 572990 }, { "epoch": 1.49, "learning_rate": 7.720520191507616e-05, "loss": 0.0096, "step": 573000 }, { "epoch": 1.49, "eval_cer": 0.8817026863231677, "eval_loss": 0.006154380738735199, "eval_runtime": 107.6789, "eval_samples_per_second": 18.574, "eval_steps_per_second": 4.643, "step": 573000 }, { "epoch": 1.49, "learning_rate": 7.72013136987047e-05, "loss": 0.0111, "step": 573010 }, { "epoch": 1.49, "learning_rate": 7.719742548233323e-05, "loss": 0.0092, "step": 573020 }, { "epoch": 1.49, "learning_rate": 7.719353726596177e-05, "loss": 0.0075, "step": 573030 }, { "epoch": 1.49, "learning_rate": 7.71896490495903e-05, "loss": 0.0079, "step": 573040 }, { "epoch": 1.49, "learning_rate": 7.718576083321884e-05, "loss": 0.0084, "step": 573050 }, { "epoch": 1.49, "learning_rate": 7.718187261684737e-05, "loss": 0.0106, "step": 573060 }, { "epoch": 1.49, "learning_rate": 7.717798440047591e-05, "loss": 0.0095, "step": 573070 }, { "epoch": 1.49, "learning_rate": 7.717409618410444e-05, "loss": 0.0066, "step": 573080 }, { "epoch": 1.49, "learning_rate": 7.7170207967733e-05, "loss": 0.0108, "step": 573090 }, { "epoch": 1.49, "learning_rate": 7.716631975136151e-05, "loss": 0.0115, "step": 573100 }, { "epoch": 1.49, "learning_rate": 7.716243153499006e-05, "loss": 0.0089, "step": 573110 }, { "epoch": 1.49, "learning_rate": 7.715854331861859e-05, "loss": 0.0093, "step": 573120 }, { "epoch": 1.49, "learning_rate": 7.715465510224712e-05, "loss": 0.0098, "step": 573130 }, { "epoch": 1.49, "learning_rate": 7.715076688587566e-05, "loss": 0.0074, "step": 573140 }, { "epoch": 1.49, "learning_rate": 7.714687866950419e-05, "loss": 0.008, "step": 573150 }, { "epoch": 1.49, "learning_rate": 7.714299045313273e-05, "loss": 0.0079, "step": 573160 }, { "epoch": 1.49, "learning_rate": 7.713910223676126e-05, "loss": 0.0088, "step": 573170 }, { "epoch": 1.49, "learning_rate": 7.71352140203898e-05, "loss": 0.0081, "step": 573180 }, { "epoch": 1.49, "learning_rate": 7.713132580401833e-05, "loss": 0.0081, "step": 573190 }, { "epoch": 1.49, "learning_rate": 7.712743758764687e-05, "loss": 0.0088, "step": 573200 }, { "epoch": 1.49, "learning_rate": 7.71235493712754e-05, "loss": 0.0074, "step": 573210 }, { "epoch": 1.49, "learning_rate": 7.711966115490394e-05, "loss": 0.0102, "step": 573220 }, { "epoch": 1.49, "learning_rate": 7.711577293853247e-05, "loss": 0.0108, "step": 573230 }, { "epoch": 1.49, "learning_rate": 7.711188472216101e-05, "loss": 0.0089, "step": 573240 }, { "epoch": 1.49, "learning_rate": 7.710799650578954e-05, "loss": 0.0084, "step": 573250 }, { "epoch": 1.49, "learning_rate": 7.710410828941808e-05, "loss": 0.0082, "step": 573260 }, { "epoch": 1.49, "learning_rate": 7.710022007304661e-05, "loss": 0.0136, "step": 573270 }, { "epoch": 1.49, "learning_rate": 7.709633185667516e-05, "loss": 0.0063, "step": 573280 }, { "epoch": 1.49, "learning_rate": 7.709244364030369e-05, "loss": 0.0096, "step": 573290 }, { "epoch": 1.49, "learning_rate": 7.708855542393223e-05, "loss": 0.0096, "step": 573300 }, { "epoch": 1.49, "learning_rate": 7.708466720756076e-05, "loss": 0.0083, "step": 573310 }, { "epoch": 1.49, "learning_rate": 7.70807789911893e-05, "loss": 0.0124, "step": 573320 }, { "epoch": 1.49, "learning_rate": 7.707689077481783e-05, "loss": 0.0119, "step": 573330 }, { "epoch": 1.49, "learning_rate": 7.707300255844637e-05, "loss": 0.0095, "step": 573340 }, { "epoch": 1.49, "learning_rate": 7.70691143420749e-05, "loss": 0.0088, "step": 573350 }, { "epoch": 1.49, "learning_rate": 7.706522612570344e-05, "loss": 0.0073, "step": 573360 }, { "epoch": 1.49, "learning_rate": 7.706133790933197e-05, "loss": 0.0094, "step": 573370 }, { "epoch": 1.49, "learning_rate": 7.70574496929605e-05, "loss": 0.0073, "step": 573380 }, { "epoch": 1.49, "learning_rate": 7.705356147658904e-05, "loss": 0.0089, "step": 573390 }, { "epoch": 1.49, "learning_rate": 7.704967326021757e-05, "loss": 0.01, "step": 573400 }, { "epoch": 1.49, "learning_rate": 7.704578504384611e-05, "loss": 0.0111, "step": 573410 }, { "epoch": 1.49, "learning_rate": 7.704189682747464e-05, "loss": 0.0099, "step": 573420 }, { "epoch": 1.49, "learning_rate": 7.703800861110318e-05, "loss": 0.0121, "step": 573430 }, { "epoch": 1.49, "learning_rate": 7.703412039473171e-05, "loss": 0.0108, "step": 573440 }, { "epoch": 1.49, "learning_rate": 7.703023217836026e-05, "loss": 0.0075, "step": 573450 }, { "epoch": 1.49, "learning_rate": 7.702634396198878e-05, "loss": 0.0115, "step": 573460 }, { "epoch": 1.49, "learning_rate": 7.702245574561733e-05, "loss": 0.0105, "step": 573470 }, { "epoch": 1.49, "learning_rate": 7.701856752924586e-05, "loss": 0.0081, "step": 573480 }, { "epoch": 1.49, "learning_rate": 7.70146793128744e-05, "loss": 0.009, "step": 573490 }, { "epoch": 1.49, "learning_rate": 7.701079109650293e-05, "loss": 0.0075, "step": 573500 }, { "epoch": 1.49, "learning_rate": 7.700690288013147e-05, "loss": 0.0102, "step": 573510 }, { "epoch": 1.49, "learning_rate": 7.700301466376e-05, "loss": 0.0097, "step": 573520 }, { "epoch": 1.49, "learning_rate": 7.699912644738854e-05, "loss": 0.008, "step": 573530 }, { "epoch": 1.49, "learning_rate": 7.699523823101707e-05, "loss": 0.0091, "step": 573540 }, { "epoch": 1.49, "learning_rate": 7.699135001464561e-05, "loss": 0.01, "step": 573550 }, { "epoch": 1.49, "learning_rate": 7.698746179827414e-05, "loss": 0.0097, "step": 573560 }, { "epoch": 1.49, "learning_rate": 7.698357358190268e-05, "loss": 0.0105, "step": 573570 }, { "epoch": 1.49, "learning_rate": 7.697968536553121e-05, "loss": 0.0066, "step": 573580 }, { "epoch": 1.49, "learning_rate": 7.697579714915975e-05, "loss": 0.0099, "step": 573590 }, { "epoch": 1.49, "learning_rate": 7.697190893278828e-05, "loss": 0.0085, "step": 573600 }, { "epoch": 1.49, "learning_rate": 7.696802071641684e-05, "loss": 0.01, "step": 573610 }, { "epoch": 1.49, "learning_rate": 7.696413250004535e-05, "loss": 0.0075, "step": 573620 }, { "epoch": 1.49, "learning_rate": 7.696024428367388e-05, "loss": 0.0119, "step": 573630 }, { "epoch": 1.49, "learning_rate": 7.695635606730243e-05, "loss": 0.0091, "step": 573640 }, { "epoch": 1.49, "learning_rate": 7.695246785093096e-05, "loss": 0.0105, "step": 573650 }, { "epoch": 1.49, "learning_rate": 7.69485796345595e-05, "loss": 0.0093, "step": 573660 }, { "epoch": 1.49, "learning_rate": 7.694469141818803e-05, "loss": 0.0097, "step": 573670 }, { "epoch": 1.49, "learning_rate": 7.694080320181657e-05, "loss": 0.0098, "step": 573680 }, { "epoch": 1.49, "learning_rate": 7.69369149854451e-05, "loss": 0.0124, "step": 573690 }, { "epoch": 1.49, "learning_rate": 7.693302676907364e-05, "loss": 0.008, "step": 573700 }, { "epoch": 1.49, "learning_rate": 7.692913855270217e-05, "loss": 0.0118, "step": 573710 }, { "epoch": 1.49, "learning_rate": 7.692525033633071e-05, "loss": 0.0085, "step": 573720 }, { "epoch": 1.49, "learning_rate": 7.692136211995924e-05, "loss": 0.0097, "step": 573730 }, { "epoch": 1.49, "learning_rate": 7.691747390358778e-05, "loss": 0.0106, "step": 573740 }, { "epoch": 1.49, "learning_rate": 7.691358568721631e-05, "loss": 0.0095, "step": 573750 }, { "epoch": 1.49, "learning_rate": 7.690969747084485e-05, "loss": 0.0084, "step": 573760 }, { "epoch": 1.49, "learning_rate": 7.690580925447338e-05, "loss": 0.008, "step": 573770 }, { "epoch": 1.49, "learning_rate": 7.690192103810192e-05, "loss": 0.0091, "step": 573780 }, { "epoch": 1.49, "learning_rate": 7.689803282173045e-05, "loss": 0.0094, "step": 573790 }, { "epoch": 1.49, "learning_rate": 7.6894144605359e-05, "loss": 0.0104, "step": 573800 }, { "epoch": 1.49, "learning_rate": 7.689025638898753e-05, "loss": 0.0078, "step": 573810 }, { "epoch": 1.49, "learning_rate": 7.688636817261607e-05, "loss": 0.0084, "step": 573820 }, { "epoch": 1.49, "learning_rate": 7.68824799562446e-05, "loss": 0.0086, "step": 573830 }, { "epoch": 1.49, "learning_rate": 7.687859173987314e-05, "loss": 0.0089, "step": 573840 }, { "epoch": 1.49, "learning_rate": 7.687470352350167e-05, "loss": 0.0101, "step": 573850 }, { "epoch": 1.49, "learning_rate": 7.687081530713021e-05, "loss": 0.0128, "step": 573860 }, { "epoch": 1.49, "learning_rate": 7.686692709075874e-05, "loss": 0.0106, "step": 573870 }, { "epoch": 1.49, "learning_rate": 7.686303887438727e-05, "loss": 0.0091, "step": 573880 }, { "epoch": 1.49, "learning_rate": 7.685915065801581e-05, "loss": 0.0067, "step": 573890 }, { "epoch": 1.49, "learning_rate": 7.685526244164434e-05, "loss": 0.0092, "step": 573900 }, { "epoch": 1.49, "learning_rate": 7.685137422527288e-05, "loss": 0.007, "step": 573910 }, { "epoch": 1.49, "learning_rate": 7.684748600890141e-05, "loss": 0.0135, "step": 573920 }, { "epoch": 1.49, "learning_rate": 7.684359779252995e-05, "loss": 0.0087, "step": 573930 }, { "epoch": 1.49, "learning_rate": 7.683970957615848e-05, "loss": 0.0076, "step": 573940 }, { "epoch": 1.49, "learning_rate": 7.683582135978702e-05, "loss": 0.0073, "step": 573950 }, { "epoch": 1.49, "learning_rate": 7.683193314341555e-05, "loss": 0.0088, "step": 573960 }, { "epoch": 1.49, "learning_rate": 7.682804492704409e-05, "loss": 0.0077, "step": 573970 }, { "epoch": 1.49, "learning_rate": 7.682415671067262e-05, "loss": 0.01, "step": 573980 }, { "epoch": 1.49, "learning_rate": 7.682026849430117e-05, "loss": 0.01, "step": 573990 }, { "epoch": 1.49, "learning_rate": 7.68163802779297e-05, "loss": 0.0116, "step": 574000 }, { "epoch": 1.49, "eval_cer": 0.8816858906799576, "eval_loss": 0.0060965148732066154, "eval_runtime": 107.9458, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 574000 }, { "epoch": 1.49, "learning_rate": 7.681249206155824e-05, "loss": 0.0106, "step": 574010 }, { "epoch": 1.49, "learning_rate": 7.680860384518677e-05, "loss": 0.0094, "step": 574020 }, { "epoch": 1.49, "learning_rate": 7.680471562881531e-05, "loss": 0.0074, "step": 574030 }, { "epoch": 1.49, "learning_rate": 7.680082741244384e-05, "loss": 0.0092, "step": 574040 }, { "epoch": 1.49, "learning_rate": 7.679693919607238e-05, "loss": 0.0076, "step": 574050 }, { "epoch": 1.49, "learning_rate": 7.679305097970091e-05, "loss": 0.0072, "step": 574060 }, { "epoch": 1.49, "learning_rate": 7.678916276332945e-05, "loss": 0.0082, "step": 574070 }, { "epoch": 1.49, "learning_rate": 7.678527454695798e-05, "loss": 0.0073, "step": 574080 }, { "epoch": 1.49, "learning_rate": 7.678138633058652e-05, "loss": 0.0082, "step": 574090 }, { "epoch": 1.49, "learning_rate": 7.677749811421505e-05, "loss": 0.0091, "step": 574100 }, { "epoch": 1.49, "learning_rate": 7.677360989784359e-05, "loss": 0.0078, "step": 574110 }, { "epoch": 1.49, "learning_rate": 7.676972168147212e-05, "loss": 0.0093, "step": 574120 }, { "epoch": 1.49, "learning_rate": 7.676583346510065e-05, "loss": 0.007, "step": 574130 }, { "epoch": 1.49, "learning_rate": 7.676194524872919e-05, "loss": 0.0058, "step": 574140 }, { "epoch": 1.49, "learning_rate": 7.675805703235772e-05, "loss": 0.0073, "step": 574150 }, { "epoch": 1.49, "learning_rate": 7.675416881598627e-05, "loss": 0.0054, "step": 574160 }, { "epoch": 1.49, "learning_rate": 7.675028059961479e-05, "loss": 0.008, "step": 574170 }, { "epoch": 1.49, "learning_rate": 7.674639238324334e-05, "loss": 0.0153, "step": 574180 }, { "epoch": 1.49, "learning_rate": 7.674250416687187e-05, "loss": 0.0084, "step": 574190 }, { "epoch": 1.49, "learning_rate": 7.673861595050041e-05, "loss": 0.0071, "step": 574200 }, { "epoch": 1.49, "learning_rate": 7.673472773412894e-05, "loss": 0.0113, "step": 574210 }, { "epoch": 1.49, "learning_rate": 7.673083951775748e-05, "loss": 0.0104, "step": 574220 }, { "epoch": 1.49, "learning_rate": 7.672695130138601e-05, "loss": 0.0096, "step": 574230 }, { "epoch": 1.49, "learning_rate": 7.672306308501455e-05, "loss": 0.0068, "step": 574240 }, { "epoch": 1.49, "learning_rate": 7.671917486864308e-05, "loss": 0.0104, "step": 574250 }, { "epoch": 1.49, "learning_rate": 7.671528665227162e-05, "loss": 0.008, "step": 574260 }, { "epoch": 1.49, "learning_rate": 7.671139843590015e-05, "loss": 0.0077, "step": 574270 }, { "epoch": 1.49, "learning_rate": 7.670751021952869e-05, "loss": 0.0083, "step": 574280 }, { "epoch": 1.49, "learning_rate": 7.670362200315722e-05, "loss": 0.0087, "step": 574290 }, { "epoch": 1.49, "learning_rate": 7.669973378678576e-05, "loss": 0.0081, "step": 574300 }, { "epoch": 1.49, "learning_rate": 7.669584557041429e-05, "loss": 0.0085, "step": 574310 }, { "epoch": 1.49, "learning_rate": 7.669195735404284e-05, "loss": 0.01, "step": 574320 }, { "epoch": 1.49, "learning_rate": 7.668806913767136e-05, "loss": 0.0098, "step": 574330 }, { "epoch": 1.49, "learning_rate": 7.668418092129991e-05, "loss": 0.0098, "step": 574340 }, { "epoch": 1.49, "learning_rate": 7.668029270492844e-05, "loss": 0.0118, "step": 574350 }, { "epoch": 1.49, "learning_rate": 7.667640448855698e-05, "loss": 0.0106, "step": 574360 }, { "epoch": 1.49, "learning_rate": 7.667251627218551e-05, "loss": 0.011, "step": 574370 }, { "epoch": 1.49, "learning_rate": 7.666862805581404e-05, "loss": 0.009, "step": 574380 }, { "epoch": 1.49, "learning_rate": 7.666473983944258e-05, "loss": 0.0081, "step": 574390 }, { "epoch": 1.49, "learning_rate": 7.666085162307111e-05, "loss": 0.0092, "step": 574400 }, { "epoch": 1.49, "learning_rate": 7.665696340669965e-05, "loss": 0.0084, "step": 574410 }, { "epoch": 1.49, "learning_rate": 7.665307519032818e-05, "loss": 0.0078, "step": 574420 }, { "epoch": 1.49, "learning_rate": 7.664918697395672e-05, "loss": 0.0145, "step": 574430 }, { "epoch": 1.49, "learning_rate": 7.664529875758525e-05, "loss": 0.0096, "step": 574440 }, { "epoch": 1.49, "learning_rate": 7.664141054121379e-05, "loss": 0.0086, "step": 574450 }, { "epoch": 1.49, "learning_rate": 7.663752232484232e-05, "loss": 0.0142, "step": 574460 }, { "epoch": 1.49, "learning_rate": 7.663363410847086e-05, "loss": 0.0045, "step": 574470 }, { "epoch": 1.49, "learning_rate": 7.662974589209939e-05, "loss": 0.0107, "step": 574480 }, { "epoch": 1.49, "learning_rate": 7.662585767572793e-05, "loss": 0.007, "step": 574490 }, { "epoch": 1.49, "learning_rate": 7.662196945935646e-05, "loss": 0.0082, "step": 574500 }, { "epoch": 1.49, "learning_rate": 7.661808124298501e-05, "loss": 0.0123, "step": 574510 }, { "epoch": 1.49, "learning_rate": 7.661419302661354e-05, "loss": 0.0106, "step": 574520 }, { "epoch": 1.49, "learning_rate": 7.661030481024208e-05, "loss": 0.0081, "step": 574530 }, { "epoch": 1.49, "learning_rate": 7.660641659387061e-05, "loss": 0.013, "step": 574540 }, { "epoch": 1.49, "learning_rate": 7.660252837749915e-05, "loss": 0.0089, "step": 574550 }, { "epoch": 1.49, "learning_rate": 7.659864016112768e-05, "loss": 0.0091, "step": 574560 }, { "epoch": 1.49, "learning_rate": 7.659475194475622e-05, "loss": 0.0083, "step": 574570 }, { "epoch": 1.49, "learning_rate": 7.659086372838475e-05, "loss": 0.0131, "step": 574580 }, { "epoch": 1.49, "learning_rate": 7.658697551201329e-05, "loss": 0.0108, "step": 574590 }, { "epoch": 1.49, "learning_rate": 7.658308729564182e-05, "loss": 0.0123, "step": 574600 }, { "epoch": 1.49, "learning_rate": 7.657919907927036e-05, "loss": 0.0085, "step": 574610 }, { "epoch": 1.49, "learning_rate": 7.657531086289889e-05, "loss": 0.0112, "step": 574620 }, { "epoch": 1.49, "learning_rate": 7.657142264652742e-05, "loss": 0.0077, "step": 574630 }, { "epoch": 1.49, "learning_rate": 7.656753443015596e-05, "loss": 0.0083, "step": 574640 }, { "epoch": 1.49, "learning_rate": 7.656364621378449e-05, "loss": 0.0137, "step": 574650 }, { "epoch": 1.49, "learning_rate": 7.655975799741303e-05, "loss": 0.009, "step": 574660 }, { "epoch": 1.49, "learning_rate": 7.655586978104156e-05, "loss": 0.0095, "step": 574670 }, { "epoch": 1.49, "learning_rate": 7.655198156467011e-05, "loss": 0.01, "step": 574680 }, { "epoch": 1.49, "learning_rate": 7.654809334829863e-05, "loss": 0.0079, "step": 574690 }, { "epoch": 1.49, "learning_rate": 7.654420513192718e-05, "loss": 0.0066, "step": 574700 }, { "epoch": 1.49, "learning_rate": 7.654031691555571e-05, "loss": 0.0099, "step": 574710 }, { "epoch": 1.49, "learning_rate": 7.653642869918425e-05, "loss": 0.0107, "step": 574720 }, { "epoch": 1.49, "learning_rate": 7.653254048281278e-05, "loss": 0.01, "step": 574730 }, { "epoch": 1.49, "learning_rate": 7.652865226644132e-05, "loss": 0.0086, "step": 574740 }, { "epoch": 1.49, "learning_rate": 7.652476405006985e-05, "loss": 0.0104, "step": 574750 }, { "epoch": 1.49, "learning_rate": 7.652087583369839e-05, "loss": 0.0082, "step": 574760 }, { "epoch": 1.49, "learning_rate": 7.651698761732692e-05, "loss": 0.0101, "step": 574770 }, { "epoch": 1.49, "learning_rate": 7.651309940095546e-05, "loss": 0.0083, "step": 574780 }, { "epoch": 1.49, "learning_rate": 7.650921118458399e-05, "loss": 0.0078, "step": 574790 }, { "epoch": 1.49, "learning_rate": 7.650532296821253e-05, "loss": 0.0118, "step": 574800 }, { "epoch": 1.49, "learning_rate": 7.650143475184106e-05, "loss": 0.0078, "step": 574810 }, { "epoch": 1.49, "learning_rate": 7.64975465354696e-05, "loss": 0.01, "step": 574820 }, { "epoch": 1.49, "learning_rate": 7.649365831909813e-05, "loss": 0.0104, "step": 574830 }, { "epoch": 1.49, "learning_rate": 7.648977010272668e-05, "loss": 0.0073, "step": 574840 }, { "epoch": 1.49, "learning_rate": 7.64858818863552e-05, "loss": 0.0106, "step": 574850 }, { "epoch": 1.49, "learning_rate": 7.648199366998375e-05, "loss": 0.01, "step": 574860 }, { "epoch": 1.49, "learning_rate": 7.647810545361228e-05, "loss": 0.0098, "step": 574870 }, { "epoch": 1.49, "learning_rate": 7.647421723724081e-05, "loss": 0.012, "step": 574880 }, { "epoch": 1.49, "learning_rate": 7.647032902086935e-05, "loss": 0.008, "step": 574890 }, { "epoch": 1.49, "learning_rate": 7.646644080449788e-05, "loss": 0.0121, "step": 574900 }, { "epoch": 1.49, "learning_rate": 7.646255258812642e-05, "loss": 0.0113, "step": 574910 }, { "epoch": 1.49, "learning_rate": 7.645866437175495e-05, "loss": 0.0097, "step": 574920 }, { "epoch": 1.49, "learning_rate": 7.645477615538349e-05, "loss": 0.0106, "step": 574930 }, { "epoch": 1.49, "learning_rate": 7.645088793901202e-05, "loss": 0.0126, "step": 574940 }, { "epoch": 1.49, "learning_rate": 7.644699972264056e-05, "loss": 0.0104, "step": 574950 }, { "epoch": 1.49, "learning_rate": 7.644311150626909e-05, "loss": 0.0105, "step": 574960 }, { "epoch": 1.49, "learning_rate": 7.643922328989763e-05, "loss": 0.0085, "step": 574970 }, { "epoch": 1.49, "learning_rate": 7.643533507352616e-05, "loss": 0.0092, "step": 574980 }, { "epoch": 1.49, "learning_rate": 7.64314468571547e-05, "loss": 0.0085, "step": 574990 }, { "epoch": 1.49, "learning_rate": 7.642755864078323e-05, "loss": 0.0095, "step": 575000 }, { "epoch": 1.49, "eval_cer": 0.8817166826925096, "eval_loss": 0.006032513454556465, "eval_runtime": 107.7203, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 575000 }, { "epoch": 1.49, "learning_rate": 7.642367042441177e-05, "loss": 0.0083, "step": 575010 }, { "epoch": 1.49, "learning_rate": 7.64197822080403e-05, "loss": 0.0082, "step": 575020 }, { "epoch": 1.49, "learning_rate": 7.641589399166885e-05, "loss": 0.0099, "step": 575030 }, { "epoch": 1.49, "learning_rate": 7.641200577529738e-05, "loss": 0.0103, "step": 575040 }, { "epoch": 1.49, "learning_rate": 7.640811755892592e-05, "loss": 0.0105, "step": 575050 }, { "epoch": 1.49, "learning_rate": 7.640422934255445e-05, "loss": 0.0097, "step": 575060 }, { "epoch": 1.49, "learning_rate": 7.640034112618299e-05, "loss": 0.0081, "step": 575070 }, { "epoch": 1.49, "learning_rate": 7.639645290981152e-05, "loss": 0.0081, "step": 575080 }, { "epoch": 1.49, "learning_rate": 7.639256469344006e-05, "loss": 0.0082, "step": 575090 }, { "epoch": 1.49, "learning_rate": 7.638867647706859e-05, "loss": 0.0112, "step": 575100 }, { "epoch": 1.49, "learning_rate": 7.638478826069713e-05, "loss": 0.008, "step": 575110 }, { "epoch": 1.49, "learning_rate": 7.638090004432566e-05, "loss": 0.0096, "step": 575120 }, { "epoch": 1.49, "learning_rate": 7.637701182795419e-05, "loss": 0.0087, "step": 575130 }, { "epoch": 1.49, "learning_rate": 7.637312361158273e-05, "loss": 0.0122, "step": 575140 }, { "epoch": 1.49, "learning_rate": 7.636923539521126e-05, "loss": 0.0079, "step": 575150 }, { "epoch": 1.49, "learning_rate": 7.63653471788398e-05, "loss": 0.0107, "step": 575160 }, { "epoch": 1.49, "learning_rate": 7.636145896246833e-05, "loss": 0.0146, "step": 575170 }, { "epoch": 1.49, "learning_rate": 7.635757074609687e-05, "loss": 0.0076, "step": 575180 }, { "epoch": 1.49, "learning_rate": 7.63536825297254e-05, "loss": 0.0082, "step": 575190 }, { "epoch": 1.49, "learning_rate": 7.634979431335394e-05, "loss": 0.0097, "step": 575200 }, { "epoch": 1.49, "learning_rate": 7.634590609698247e-05, "loss": 0.0078, "step": 575210 }, { "epoch": 1.49, "learning_rate": 7.634201788061102e-05, "loss": 0.0093, "step": 575220 }, { "epoch": 1.49, "learning_rate": 7.633812966423955e-05, "loss": 0.0114, "step": 575230 }, { "epoch": 1.49, "learning_rate": 7.633424144786809e-05, "loss": 0.0107, "step": 575240 }, { "epoch": 1.49, "learning_rate": 7.633035323149662e-05, "loss": 0.0094, "step": 575250 }, { "epoch": 1.49, "learning_rate": 7.632646501512516e-05, "loss": 0.0067, "step": 575260 }, { "epoch": 1.49, "learning_rate": 7.632257679875369e-05, "loss": 0.0105, "step": 575270 }, { "epoch": 1.49, "learning_rate": 7.631868858238223e-05, "loss": 0.0098, "step": 575280 }, { "epoch": 1.49, "learning_rate": 7.631480036601076e-05, "loss": 0.009, "step": 575290 }, { "epoch": 1.49, "learning_rate": 7.63109121496393e-05, "loss": 0.0113, "step": 575300 }, { "epoch": 1.49, "learning_rate": 7.630702393326783e-05, "loss": 0.0103, "step": 575310 }, { "epoch": 1.49, "learning_rate": 7.630313571689637e-05, "loss": 0.0175, "step": 575320 }, { "epoch": 1.49, "learning_rate": 7.62992475005249e-05, "loss": 0.01, "step": 575330 }, { "epoch": 1.49, "learning_rate": 7.629535928415344e-05, "loss": 0.0078, "step": 575340 }, { "epoch": 1.49, "learning_rate": 7.629147106778197e-05, "loss": 0.008, "step": 575350 }, { "epoch": 1.49, "learning_rate": 7.62875828514105e-05, "loss": 0.0066, "step": 575360 }, { "epoch": 1.49, "learning_rate": 7.628369463503904e-05, "loss": 0.0091, "step": 575370 }, { "epoch": 1.49, "learning_rate": 7.627980641866757e-05, "loss": 0.0104, "step": 575380 }, { "epoch": 1.49, "learning_rate": 7.627591820229612e-05, "loss": 0.0115, "step": 575390 }, { "epoch": 1.49, "learning_rate": 7.627202998592465e-05, "loss": 0.0073, "step": 575400 }, { "epoch": 1.49, "learning_rate": 7.626814176955319e-05, "loss": 0.0084, "step": 575410 }, { "epoch": 1.49, "learning_rate": 7.626425355318172e-05, "loss": 0.0079, "step": 575420 }, { "epoch": 1.49, "learning_rate": 7.626036533681026e-05, "loss": 0.0067, "step": 575430 }, { "epoch": 1.49, "learning_rate": 7.625647712043879e-05, "loss": 0.007, "step": 575440 }, { "epoch": 1.49, "learning_rate": 7.625258890406733e-05, "loss": 0.0086, "step": 575450 }, { "epoch": 1.49, "learning_rate": 7.624870068769586e-05, "loss": 0.0087, "step": 575460 }, { "epoch": 1.49, "learning_rate": 7.62448124713244e-05, "loss": 0.0099, "step": 575470 }, { "epoch": 1.49, "learning_rate": 7.624092425495293e-05, "loss": 0.0072, "step": 575480 }, { "epoch": 1.49, "learning_rate": 7.623703603858147e-05, "loss": 0.0098, "step": 575490 }, { "epoch": 1.49, "learning_rate": 7.623314782221e-05, "loss": 0.0077, "step": 575500 }, { "epoch": 1.49, "learning_rate": 7.622925960583854e-05, "loss": 0.0083, "step": 575510 }, { "epoch": 1.49, "learning_rate": 7.622537138946707e-05, "loss": 0.0082, "step": 575520 }, { "epoch": 1.49, "learning_rate": 7.622148317309561e-05, "loss": 0.0083, "step": 575530 }, { "epoch": 1.49, "learning_rate": 7.621759495672414e-05, "loss": 0.0094, "step": 575540 }, { "epoch": 1.49, "learning_rate": 7.621370674035269e-05, "loss": 0.0084, "step": 575550 }, { "epoch": 1.49, "learning_rate": 7.620981852398121e-05, "loss": 0.0087, "step": 575560 }, { "epoch": 1.49, "learning_rate": 7.620593030760976e-05, "loss": 0.0089, "step": 575570 }, { "epoch": 1.49, "learning_rate": 7.620204209123829e-05, "loss": 0.0104, "step": 575580 }, { "epoch": 1.49, "learning_rate": 7.619815387486683e-05, "loss": 0.0085, "step": 575590 }, { "epoch": 1.49, "learning_rate": 7.619426565849536e-05, "loss": 0.0093, "step": 575600 }, { "epoch": 1.49, "learning_rate": 7.619037744212389e-05, "loss": 0.0168, "step": 575610 }, { "epoch": 1.49, "learning_rate": 7.618648922575243e-05, "loss": 0.0113, "step": 575620 }, { "epoch": 1.49, "learning_rate": 7.618260100938096e-05, "loss": 0.0076, "step": 575630 }, { "epoch": 1.49, "learning_rate": 7.61787127930095e-05, "loss": 0.0087, "step": 575640 }, { "epoch": 1.49, "learning_rate": 7.617482457663803e-05, "loss": 0.01, "step": 575650 }, { "epoch": 1.49, "learning_rate": 7.617093636026657e-05, "loss": 0.0105, "step": 575660 }, { "epoch": 1.49, "learning_rate": 7.61670481438951e-05, "loss": 0.0082, "step": 575670 }, { "epoch": 1.49, "learning_rate": 7.616315992752364e-05, "loss": 0.0078, "step": 575680 }, { "epoch": 1.49, "learning_rate": 7.615927171115217e-05, "loss": 0.0081, "step": 575690 }, { "epoch": 1.49, "learning_rate": 7.615538349478071e-05, "loss": 0.0055, "step": 575700 }, { "epoch": 1.49, "learning_rate": 7.615149527840924e-05, "loss": 0.0082, "step": 575710 }, { "epoch": 1.49, "learning_rate": 7.614760706203778e-05, "loss": 0.0071, "step": 575720 }, { "epoch": 1.49, "learning_rate": 7.614371884566631e-05, "loss": 0.0088, "step": 575730 }, { "epoch": 1.49, "learning_rate": 7.613983062929486e-05, "loss": 0.0089, "step": 575740 }, { "epoch": 1.49, "learning_rate": 7.613594241292339e-05, "loss": 0.01, "step": 575750 }, { "epoch": 1.49, "learning_rate": 7.613205419655193e-05, "loss": 0.0225, "step": 575760 }, { "epoch": 1.49, "learning_rate": 7.612816598018046e-05, "loss": 0.0091, "step": 575770 }, { "epoch": 1.49, "learning_rate": 7.6124277763809e-05, "loss": 0.0123, "step": 575780 }, { "epoch": 1.49, "learning_rate": 7.612038954743753e-05, "loss": 0.0094, "step": 575790 }, { "epoch": 1.49, "learning_rate": 7.611650133106607e-05, "loss": 0.0098, "step": 575800 }, { "epoch": 1.49, "learning_rate": 7.61126131146946e-05, "loss": 0.0072, "step": 575810 }, { "epoch": 1.49, "learning_rate": 7.610872489832314e-05, "loss": 0.0094, "step": 575820 }, { "epoch": 1.49, "learning_rate": 7.610483668195167e-05, "loss": 0.0077, "step": 575830 }, { "epoch": 1.49, "learning_rate": 7.610094846558021e-05, "loss": 0.0086, "step": 575840 }, { "epoch": 1.49, "learning_rate": 7.609706024920874e-05, "loss": 0.008, "step": 575850 }, { "epoch": 1.49, "learning_rate": 7.609317203283727e-05, "loss": 0.0081, "step": 575860 }, { "epoch": 1.49, "learning_rate": 7.608928381646581e-05, "loss": 0.0065, "step": 575870 }, { "epoch": 1.49, "learning_rate": 7.608539560009434e-05, "loss": 0.0099, "step": 575880 }, { "epoch": 1.49, "learning_rate": 7.608150738372288e-05, "loss": 0.0095, "step": 575890 }, { "epoch": 1.49, "learning_rate": 7.60776191673514e-05, "loss": 0.0117, "step": 575900 }, { "epoch": 1.49, "learning_rate": 7.607373095097996e-05, "loss": 0.0103, "step": 575910 }, { "epoch": 1.49, "learning_rate": 7.606984273460848e-05, "loss": 0.0124, "step": 575920 }, { "epoch": 1.49, "learning_rate": 7.606595451823703e-05, "loss": 0.0111, "step": 575930 }, { "epoch": 1.49, "learning_rate": 7.606206630186556e-05, "loss": 0.0116, "step": 575940 }, { "epoch": 1.49, "learning_rate": 7.60581780854941e-05, "loss": 0.0093, "step": 575950 }, { "epoch": 1.49, "learning_rate": 7.605428986912263e-05, "loss": 0.0079, "step": 575960 }, { "epoch": 1.49, "learning_rate": 7.605040165275117e-05, "loss": 0.0063, "step": 575970 }, { "epoch": 1.49, "learning_rate": 7.60465134363797e-05, "loss": 0.0094, "step": 575980 }, { "epoch": 1.49, "learning_rate": 7.604262522000824e-05, "loss": 0.01, "step": 575990 }, { "epoch": 1.49, "learning_rate": 7.603873700363677e-05, "loss": 0.0092, "step": 576000 }, { "epoch": 1.49, "eval_cer": 0.8817124837817071, "eval_loss": 0.006118689198046923, "eval_runtime": 107.8667, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 576000 }, { "epoch": 1.49, "learning_rate": 7.603484878726531e-05, "loss": 0.0081, "step": 576010 }, { "epoch": 1.49, "learning_rate": 7.603096057089384e-05, "loss": 0.012, "step": 576020 }, { "epoch": 1.49, "learning_rate": 7.602707235452238e-05, "loss": 0.0107, "step": 576030 }, { "epoch": 1.49, "learning_rate": 7.602318413815091e-05, "loss": 0.0091, "step": 576040 }, { "epoch": 1.49, "learning_rate": 7.601929592177945e-05, "loss": 0.0082, "step": 576050 }, { "epoch": 1.49, "learning_rate": 7.601540770540798e-05, "loss": 0.0099, "step": 576060 }, { "epoch": 1.49, "learning_rate": 7.601151948903653e-05, "loss": 0.0087, "step": 576070 }, { "epoch": 1.49, "learning_rate": 7.600763127266505e-05, "loss": 0.0082, "step": 576080 }, { "epoch": 1.49, "learning_rate": 7.60037430562936e-05, "loss": 0.0099, "step": 576090 }, { "epoch": 1.49, "learning_rate": 7.599985483992213e-05, "loss": 0.008, "step": 576100 }, { "epoch": 1.49, "learning_rate": 7.599596662355066e-05, "loss": 0.0109, "step": 576110 }, { "epoch": 1.49, "learning_rate": 7.59920784071792e-05, "loss": 0.0103, "step": 576120 }, { "epoch": 1.49, "learning_rate": 7.598819019080773e-05, "loss": 0.0084, "step": 576130 }, { "epoch": 1.49, "learning_rate": 7.598430197443627e-05, "loss": 0.0095, "step": 576140 }, { "epoch": 1.49, "learning_rate": 7.59804137580648e-05, "loss": 0.015, "step": 576150 }, { "epoch": 1.49, "learning_rate": 7.597652554169334e-05, "loss": 0.0118, "step": 576160 }, { "epoch": 1.49, "learning_rate": 7.597263732532187e-05, "loss": 0.0106, "step": 576170 }, { "epoch": 1.49, "learning_rate": 7.596874910895041e-05, "loss": 0.0074, "step": 576180 }, { "epoch": 1.49, "learning_rate": 7.596486089257894e-05, "loss": 0.0069, "step": 576190 }, { "epoch": 1.49, "learning_rate": 7.596097267620748e-05, "loss": 0.0083, "step": 576200 }, { "epoch": 1.49, "learning_rate": 7.595708445983601e-05, "loss": 0.0112, "step": 576210 }, { "epoch": 1.49, "learning_rate": 7.595319624346455e-05, "loss": 0.0083, "step": 576220 }, { "epoch": 1.49, "learning_rate": 7.594930802709308e-05, "loss": 0.0099, "step": 576230 }, { "epoch": 1.49, "learning_rate": 7.594541981072162e-05, "loss": 0.0106, "step": 576240 }, { "epoch": 1.49, "learning_rate": 7.594153159435015e-05, "loss": 0.0072, "step": 576250 }, { "epoch": 1.49, "learning_rate": 7.59376433779787e-05, "loss": 0.0093, "step": 576260 }, { "epoch": 1.49, "learning_rate": 7.593375516160723e-05, "loss": 0.0081, "step": 576270 }, { "epoch": 1.49, "learning_rate": 7.592986694523577e-05, "loss": 0.0089, "step": 576280 }, { "epoch": 1.49, "learning_rate": 7.59259787288643e-05, "loss": 0.0102, "step": 576290 }, { "epoch": 1.49, "learning_rate": 7.592209051249284e-05, "loss": 0.008, "step": 576300 }, { "epoch": 1.49, "learning_rate": 7.591820229612137e-05, "loss": 0.0117, "step": 576310 }, { "epoch": 1.49, "learning_rate": 7.591431407974991e-05, "loss": 0.0074, "step": 576320 }, { "epoch": 1.49, "learning_rate": 7.591042586337844e-05, "loss": 0.0096, "step": 576330 }, { "epoch": 1.49, "learning_rate": 7.590653764700698e-05, "loss": 0.009, "step": 576340 }, { "epoch": 1.49, "learning_rate": 7.590264943063551e-05, "loss": 0.0086, "step": 576350 }, { "epoch": 1.49, "learning_rate": 7.589876121426404e-05, "loss": 0.0097, "step": 576360 }, { "epoch": 1.49, "learning_rate": 7.589487299789258e-05, "loss": 0.0137, "step": 576370 }, { "epoch": 1.49, "learning_rate": 7.589098478152111e-05, "loss": 0.0084, "step": 576380 }, { "epoch": 1.49, "learning_rate": 7.588709656514965e-05, "loss": 0.0094, "step": 576390 }, { "epoch": 1.49, "learning_rate": 7.588320834877818e-05, "loss": 0.0106, "step": 576400 }, { "epoch": 1.49, "learning_rate": 7.587932013240672e-05, "loss": 0.0079, "step": 576410 }, { "epoch": 1.49, "learning_rate": 7.587543191603525e-05, "loss": 0.0081, "step": 576420 }, { "epoch": 1.49, "learning_rate": 7.58715436996638e-05, "loss": 0.0075, "step": 576430 }, { "epoch": 1.49, "learning_rate": 7.586765548329232e-05, "loss": 0.0127, "step": 576440 }, { "epoch": 1.49, "learning_rate": 7.586376726692087e-05, "loss": 0.0078, "step": 576450 }, { "epoch": 1.49, "learning_rate": 7.58598790505494e-05, "loss": 0.0111, "step": 576460 }, { "epoch": 1.49, "learning_rate": 7.585599083417794e-05, "loss": 0.0146, "step": 576470 }, { "epoch": 1.49, "learning_rate": 7.585210261780647e-05, "loss": 0.0079, "step": 576480 }, { "epoch": 1.49, "learning_rate": 7.584821440143501e-05, "loss": 0.0104, "step": 576490 }, { "epoch": 1.49, "learning_rate": 7.584432618506354e-05, "loss": 0.0077, "step": 576500 }, { "epoch": 1.49, "learning_rate": 7.584043796869208e-05, "loss": 0.0091, "step": 576510 }, { "epoch": 1.49, "learning_rate": 7.583654975232061e-05, "loss": 0.0104, "step": 576520 }, { "epoch": 1.49, "learning_rate": 7.583266153594915e-05, "loss": 0.0086, "step": 576530 }, { "epoch": 1.49, "learning_rate": 7.582877331957768e-05, "loss": 0.0085, "step": 576540 }, { "epoch": 1.49, "learning_rate": 7.582488510320622e-05, "loss": 0.0093, "step": 576550 }, { "epoch": 1.49, "learning_rate": 7.582099688683475e-05, "loss": 0.0097, "step": 576560 }, { "epoch": 1.49, "learning_rate": 7.581710867046329e-05, "loss": 0.0063, "step": 576570 }, { "epoch": 1.49, "learning_rate": 7.581322045409182e-05, "loss": 0.0067, "step": 576580 }, { "epoch": 1.49, "learning_rate": 7.580933223772036e-05, "loss": 0.0166, "step": 576590 }, { "epoch": 1.49, "learning_rate": 7.580544402134889e-05, "loss": 0.0083, "step": 576600 }, { "epoch": 1.49, "learning_rate": 7.580155580497742e-05, "loss": 0.0073, "step": 576610 }, { "epoch": 1.49, "learning_rate": 7.579766758860597e-05, "loss": 0.0068, "step": 576620 }, { "epoch": 1.49, "learning_rate": 7.57937793722345e-05, "loss": 0.0076, "step": 576630 }, { "epoch": 1.49, "learning_rate": 7.578989115586304e-05, "loss": 0.0097, "step": 576640 }, { "epoch": 1.49, "learning_rate": 7.578600293949157e-05, "loss": 0.0098, "step": 576650 }, { "epoch": 1.49, "learning_rate": 7.578211472312011e-05, "loss": 0.0097, "step": 576660 }, { "epoch": 1.49, "learning_rate": 7.577822650674864e-05, "loss": 0.0091, "step": 576670 }, { "epoch": 1.49, "learning_rate": 7.577433829037718e-05, "loss": 0.0092, "step": 576680 }, { "epoch": 1.49, "learning_rate": 7.577045007400571e-05, "loss": 0.0087, "step": 576690 }, { "epoch": 1.49, "learning_rate": 7.576656185763425e-05, "loss": 0.0115, "step": 576700 }, { "epoch": 1.49, "learning_rate": 7.576267364126278e-05, "loss": 0.0093, "step": 576710 }, { "epoch": 1.49, "learning_rate": 7.575878542489132e-05, "loss": 0.0079, "step": 576720 }, { "epoch": 1.49, "learning_rate": 7.575489720851985e-05, "loss": 0.0087, "step": 576730 }, { "epoch": 1.49, "learning_rate": 7.575100899214839e-05, "loss": 0.0088, "step": 576740 }, { "epoch": 1.5, "learning_rate": 7.574712077577692e-05, "loss": 0.0105, "step": 576750 }, { "epoch": 1.5, "learning_rate": 7.574323255940546e-05, "loss": 0.0109, "step": 576760 }, { "epoch": 1.5, "learning_rate": 7.573934434303399e-05, "loss": 0.0063, "step": 576770 }, { "epoch": 1.5, "learning_rate": 7.573545612666254e-05, "loss": 0.0092, "step": 576780 }, { "epoch": 1.5, "learning_rate": 7.573156791029106e-05, "loss": 0.006, "step": 576790 }, { "epoch": 1.5, "learning_rate": 7.572767969391961e-05, "loss": 0.0077, "step": 576800 }, { "epoch": 1.5, "learning_rate": 7.572379147754814e-05, "loss": 0.0072, "step": 576810 }, { "epoch": 1.5, "learning_rate": 7.571990326117668e-05, "loss": 0.0111, "step": 576820 }, { "epoch": 1.5, "learning_rate": 7.571601504480521e-05, "loss": 0.0079, "step": 576830 }, { "epoch": 1.5, "learning_rate": 7.571212682843375e-05, "loss": 0.0112, "step": 576840 }, { "epoch": 1.5, "learning_rate": 7.570823861206228e-05, "loss": 0.0097, "step": 576850 }, { "epoch": 1.5, "learning_rate": 7.570435039569081e-05, "loss": 0.0095, "step": 576860 }, { "epoch": 1.5, "learning_rate": 7.570046217931935e-05, "loss": 0.009, "step": 576870 }, { "epoch": 1.5, "learning_rate": 7.569657396294788e-05, "loss": 0.0086, "step": 576880 }, { "epoch": 1.5, "learning_rate": 7.569268574657642e-05, "loss": 0.0092, "step": 576890 }, { "epoch": 1.5, "learning_rate": 7.568879753020495e-05, "loss": 0.006, "step": 576900 }, { "epoch": 1.5, "learning_rate": 7.568490931383349e-05, "loss": 0.0078, "step": 576910 }, { "epoch": 1.5, "learning_rate": 7.568102109746202e-05, "loss": 0.0079, "step": 576920 }, { "epoch": 1.5, "learning_rate": 7.567713288109056e-05, "loss": 0.0094, "step": 576930 }, { "epoch": 1.5, "learning_rate": 7.567324466471909e-05, "loss": 0.0076, "step": 576940 }, { "epoch": 1.5, "learning_rate": 7.566935644834763e-05, "loss": 0.011, "step": 576950 }, { "epoch": 1.5, "learning_rate": 7.566546823197616e-05, "loss": 0.0092, "step": 576960 }, { "epoch": 1.5, "learning_rate": 7.566158001560471e-05, "loss": 0.0076, "step": 576970 }, { "epoch": 1.5, "learning_rate": 7.565769179923324e-05, "loss": 0.0097, "step": 576980 }, { "epoch": 1.5, "learning_rate": 7.565380358286178e-05, "loss": 0.0102, "step": 576990 }, { "epoch": 1.5, "learning_rate": 7.564991536649031e-05, "loss": 0.0079, "step": 577000 }, { "epoch": 1.5, "eval_cer": 0.8817180823294437, "eval_loss": 0.006126715801656246, "eval_runtime": 107.6241, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 577000 }, { "epoch": 1.5, "learning_rate": 7.564602715011885e-05, "loss": 0.0096, "step": 577010 }, { "epoch": 1.5, "learning_rate": 7.564213893374738e-05, "loss": 0.0107, "step": 577020 }, { "epoch": 1.5, "learning_rate": 7.563825071737592e-05, "loss": 0.0106, "step": 577030 }, { "epoch": 1.5, "learning_rate": 7.563436250100445e-05, "loss": 0.0128, "step": 577040 }, { "epoch": 1.5, "learning_rate": 7.563047428463299e-05, "loss": 0.0089, "step": 577050 }, { "epoch": 1.5, "learning_rate": 7.562658606826152e-05, "loss": 0.0097, "step": 577060 }, { "epoch": 1.5, "learning_rate": 7.562269785189006e-05, "loss": 0.0099, "step": 577070 }, { "epoch": 1.5, "learning_rate": 7.561880963551859e-05, "loss": 0.0077, "step": 577080 }, { "epoch": 1.5, "learning_rate": 7.561492141914713e-05, "loss": 0.0076, "step": 577090 }, { "epoch": 1.5, "learning_rate": 7.561103320277566e-05, "loss": 0.0075, "step": 577100 }, { "epoch": 1.5, "learning_rate": 7.560714498640419e-05, "loss": 0.0074, "step": 577110 }, { "epoch": 1.5, "learning_rate": 7.560325677003273e-05, "loss": 0.0083, "step": 577120 }, { "epoch": 1.5, "learning_rate": 7.559936855366126e-05, "loss": 0.0102, "step": 577130 }, { "epoch": 1.5, "learning_rate": 7.559548033728981e-05, "loss": 0.0106, "step": 577140 }, { "epoch": 1.5, "learning_rate": 7.559159212091833e-05, "loss": 0.0082, "step": 577150 }, { "epoch": 1.5, "learning_rate": 7.558770390454688e-05, "loss": 0.0078, "step": 577160 }, { "epoch": 1.5, "learning_rate": 7.558381568817541e-05, "loss": 0.0097, "step": 577170 }, { "epoch": 1.5, "learning_rate": 7.557992747180395e-05, "loss": 0.0086, "step": 577180 }, { "epoch": 1.5, "learning_rate": 7.557603925543248e-05, "loss": 0.0122, "step": 577190 }, { "epoch": 1.5, "learning_rate": 7.557215103906102e-05, "loss": 0.0085, "step": 577200 }, { "epoch": 1.5, "learning_rate": 7.556826282268955e-05, "loss": 0.0099, "step": 577210 }, { "epoch": 1.5, "learning_rate": 7.556437460631809e-05, "loss": 0.0092, "step": 577220 }, { "epoch": 1.5, "learning_rate": 7.556048638994662e-05, "loss": 0.007, "step": 577230 }, { "epoch": 1.5, "learning_rate": 7.555659817357516e-05, "loss": 0.0101, "step": 577240 }, { "epoch": 1.5, "learning_rate": 7.555270995720369e-05, "loss": 0.0094, "step": 577250 }, { "epoch": 1.5, "learning_rate": 7.554882174083223e-05, "loss": 0.0087, "step": 577260 }, { "epoch": 1.5, "learning_rate": 7.554493352446076e-05, "loss": 0.0076, "step": 577270 }, { "epoch": 1.5, "learning_rate": 7.55410453080893e-05, "loss": 0.0099, "step": 577280 }, { "epoch": 1.5, "learning_rate": 7.553715709171783e-05, "loss": 0.0126, "step": 577290 }, { "epoch": 1.5, "learning_rate": 7.553326887534638e-05, "loss": 0.0104, "step": 577300 }, { "epoch": 1.5, "learning_rate": 7.55293806589749e-05, "loss": 0.011, "step": 577310 }, { "epoch": 1.5, "learning_rate": 7.552549244260345e-05, "loss": 0.0067, "step": 577320 }, { "epoch": 1.5, "learning_rate": 7.552160422623198e-05, "loss": 0.0155, "step": 577330 }, { "epoch": 1.5, "learning_rate": 7.551771600986052e-05, "loss": 0.0092, "step": 577340 }, { "epoch": 1.5, "learning_rate": 7.551382779348905e-05, "loss": 0.0098, "step": 577350 }, { "epoch": 1.5, "learning_rate": 7.550993957711758e-05, "loss": 0.0089, "step": 577360 }, { "epoch": 1.5, "learning_rate": 7.550605136074612e-05, "loss": 0.0124, "step": 577370 }, { "epoch": 1.5, "learning_rate": 7.550216314437465e-05, "loss": 0.0058, "step": 577380 }, { "epoch": 1.5, "learning_rate": 7.549827492800319e-05, "loss": 0.0097, "step": 577390 }, { "epoch": 1.5, "learning_rate": 7.549438671163172e-05, "loss": 0.0072, "step": 577400 }, { "epoch": 1.5, "learning_rate": 7.549049849526026e-05, "loss": 0.0094, "step": 577410 }, { "epoch": 1.5, "learning_rate": 7.548661027888879e-05, "loss": 0.0113, "step": 577420 }, { "epoch": 1.5, "learning_rate": 7.548272206251733e-05, "loss": 0.0091, "step": 577430 }, { "epoch": 1.5, "learning_rate": 7.547883384614586e-05, "loss": 0.0076, "step": 577440 }, { "epoch": 1.5, "learning_rate": 7.54749456297744e-05, "loss": 0.0062, "step": 577450 }, { "epoch": 1.5, "learning_rate": 7.547105741340293e-05, "loss": 0.0103, "step": 577460 }, { "epoch": 1.5, "learning_rate": 7.546716919703147e-05, "loss": 0.0118, "step": 577470 }, { "epoch": 1.5, "learning_rate": 7.546328098066e-05, "loss": 0.0081, "step": 577480 }, { "epoch": 1.5, "learning_rate": 7.545939276428855e-05, "loss": 0.01, "step": 577490 }, { "epoch": 1.5, "learning_rate": 7.545550454791708e-05, "loss": 0.0127, "step": 577500 }, { "epoch": 1.5, "learning_rate": 7.545161633154562e-05, "loss": 0.0081, "step": 577510 }, { "epoch": 1.5, "learning_rate": 7.544772811517415e-05, "loss": 0.01, "step": 577520 }, { "epoch": 1.5, "learning_rate": 7.544383989880269e-05, "loss": 0.008, "step": 577530 }, { "epoch": 1.5, "learning_rate": 7.543995168243122e-05, "loss": 0.0093, "step": 577540 }, { "epoch": 1.5, "learning_rate": 7.543606346605976e-05, "loss": 0.0064, "step": 577550 }, { "epoch": 1.5, "learning_rate": 7.543217524968829e-05, "loss": 0.0089, "step": 577560 }, { "epoch": 1.5, "learning_rate": 7.542828703331683e-05, "loss": 0.0075, "step": 577570 }, { "epoch": 1.5, "learning_rate": 7.542439881694536e-05, "loss": 0.007, "step": 577580 }, { "epoch": 1.5, "learning_rate": 7.54205106005739e-05, "loss": 0.0085, "step": 577590 }, { "epoch": 1.5, "learning_rate": 7.541662238420243e-05, "loss": 0.0108, "step": 577600 }, { "epoch": 1.5, "learning_rate": 7.541273416783096e-05, "loss": 0.0096, "step": 577610 }, { "epoch": 1.5, "learning_rate": 7.54088459514595e-05, "loss": 0.0083, "step": 577620 }, { "epoch": 1.5, "learning_rate": 7.540495773508803e-05, "loss": 0.0103, "step": 577630 }, { "epoch": 1.5, "learning_rate": 7.540106951871657e-05, "loss": 0.0088, "step": 577640 }, { "epoch": 1.5, "learning_rate": 7.53971813023451e-05, "loss": 0.0081, "step": 577650 }, { "epoch": 1.5, "learning_rate": 7.539329308597365e-05, "loss": 0.0091, "step": 577660 }, { "epoch": 1.5, "learning_rate": 7.538940486960217e-05, "loss": 0.0067, "step": 577670 }, { "epoch": 1.5, "learning_rate": 7.538551665323072e-05, "loss": 0.0053, "step": 577680 }, { "epoch": 1.5, "learning_rate": 7.538162843685925e-05, "loss": 0.0083, "step": 577690 }, { "epoch": 1.5, "learning_rate": 7.537774022048779e-05, "loss": 0.0112, "step": 577700 }, { "epoch": 1.5, "learning_rate": 7.537385200411632e-05, "loss": 0.0101, "step": 577710 }, { "epoch": 1.5, "learning_rate": 7.536996378774486e-05, "loss": 0.007, "step": 577720 }, { "epoch": 1.5, "learning_rate": 7.536607557137339e-05, "loss": 0.0101, "step": 577730 }, { "epoch": 1.5, "learning_rate": 7.536218735500193e-05, "loss": 0.0093, "step": 577740 }, { "epoch": 1.5, "learning_rate": 7.535829913863046e-05, "loss": 0.0074, "step": 577750 }, { "epoch": 1.5, "learning_rate": 7.5354410922259e-05, "loss": 0.0102, "step": 577760 }, { "epoch": 1.5, "learning_rate": 7.535052270588753e-05, "loss": 0.011, "step": 577770 }, { "epoch": 1.5, "learning_rate": 7.534663448951607e-05, "loss": 0.0068, "step": 577780 }, { "epoch": 1.5, "learning_rate": 7.53427462731446e-05, "loss": 0.0099, "step": 577790 }, { "epoch": 1.5, "learning_rate": 7.533885805677314e-05, "loss": 0.0074, "step": 577800 }, { "epoch": 1.5, "learning_rate": 7.533496984040167e-05, "loss": 0.0098, "step": 577810 }, { "epoch": 1.5, "learning_rate": 7.533108162403022e-05, "loss": 0.0105, "step": 577820 }, { "epoch": 1.5, "learning_rate": 7.532719340765874e-05, "loss": 0.0082, "step": 577830 }, { "epoch": 1.5, "learning_rate": 7.532330519128729e-05, "loss": 0.0083, "step": 577840 }, { "epoch": 1.5, "learning_rate": 7.531941697491582e-05, "loss": 0.0087, "step": 577850 }, { "epoch": 1.5, "learning_rate": 7.531552875854435e-05, "loss": 0.0074, "step": 577860 }, { "epoch": 1.5, "learning_rate": 7.531164054217289e-05, "loss": 0.0102, "step": 577870 }, { "epoch": 1.5, "learning_rate": 7.530775232580142e-05, "loss": 0.0104, "step": 577880 }, { "epoch": 1.5, "learning_rate": 7.530386410942996e-05, "loss": 0.0098, "step": 577890 }, { "epoch": 1.5, "learning_rate": 7.529997589305849e-05, "loss": 0.0124, "step": 577900 }, { "epoch": 1.5, "learning_rate": 7.529608767668703e-05, "loss": 0.0099, "step": 577910 }, { "epoch": 1.5, "learning_rate": 7.529219946031556e-05, "loss": 0.0104, "step": 577920 }, { "epoch": 1.5, "learning_rate": 7.52883112439441e-05, "loss": 0.0076, "step": 577930 }, { "epoch": 1.5, "learning_rate": 7.528442302757263e-05, "loss": 0.0065, "step": 577940 }, { "epoch": 1.5, "learning_rate": 7.528053481120117e-05, "loss": 0.0067, "step": 577950 }, { "epoch": 1.5, "learning_rate": 7.52766465948297e-05, "loss": 0.0064, "step": 577960 }, { "epoch": 1.5, "learning_rate": 7.527275837845824e-05, "loss": 0.0084, "step": 577970 }, { "epoch": 1.5, "learning_rate": 7.526887016208677e-05, "loss": 0.0079, "step": 577980 }, { "epoch": 1.5, "learning_rate": 7.526498194571531e-05, "loss": 0.0101, "step": 577990 }, { "epoch": 1.5, "learning_rate": 7.526109372934384e-05, "loss": 0.0082, "step": 578000 }, { "epoch": 1.5, "eval_cer": 0.8817096845078387, "eval_loss": 0.0061296941712498665, "eval_runtime": 107.7949, "eval_samples_per_second": 18.554, "eval_steps_per_second": 4.638, "step": 578000 }, { "epoch": 1.5, "learning_rate": 7.525720551297239e-05, "loss": 0.0082, "step": 578010 }, { "epoch": 1.5, "learning_rate": 7.525331729660092e-05, "loss": 0.0083, "step": 578020 }, { "epoch": 1.5, "learning_rate": 7.524942908022946e-05, "loss": 0.0107, "step": 578030 }, { "epoch": 1.5, "learning_rate": 7.524554086385799e-05, "loss": 0.0096, "step": 578040 }, { "epoch": 1.5, "learning_rate": 7.524165264748653e-05, "loss": 0.0094, "step": 578050 }, { "epoch": 1.5, "learning_rate": 7.523776443111506e-05, "loss": 0.0067, "step": 578060 }, { "epoch": 1.5, "learning_rate": 7.52338762147436e-05, "loss": 0.0082, "step": 578070 }, { "epoch": 1.5, "learning_rate": 7.522998799837213e-05, "loss": 0.0116, "step": 578080 }, { "epoch": 1.5, "learning_rate": 7.522609978200066e-05, "loss": 0.0129, "step": 578090 }, { "epoch": 1.5, "learning_rate": 7.52222115656292e-05, "loss": 0.0099, "step": 578100 }, { "epoch": 1.5, "learning_rate": 7.521832334925773e-05, "loss": 0.0093, "step": 578110 }, { "epoch": 1.5, "learning_rate": 7.521443513288627e-05, "loss": 0.0102, "step": 578120 }, { "epoch": 1.5, "learning_rate": 7.52105469165148e-05, "loss": 0.0098, "step": 578130 }, { "epoch": 1.5, "learning_rate": 7.520665870014334e-05, "loss": 0.0078, "step": 578140 }, { "epoch": 1.5, "learning_rate": 7.520277048377187e-05, "loss": 0.0089, "step": 578150 }, { "epoch": 1.5, "learning_rate": 7.519888226740041e-05, "loss": 0.0081, "step": 578160 }, { "epoch": 1.5, "learning_rate": 7.519499405102894e-05, "loss": 0.0107, "step": 578170 }, { "epoch": 1.5, "learning_rate": 7.519110583465748e-05, "loss": 0.0104, "step": 578180 }, { "epoch": 1.5, "learning_rate": 7.5187217618286e-05, "loss": 0.0084, "step": 578190 }, { "epoch": 1.5, "learning_rate": 7.518332940191456e-05, "loss": 0.0098, "step": 578200 }, { "epoch": 1.5, "learning_rate": 7.517944118554309e-05, "loss": 0.0102, "step": 578210 }, { "epoch": 1.5, "learning_rate": 7.517555296917163e-05, "loss": 0.0077, "step": 578220 }, { "epoch": 1.5, "learning_rate": 7.517166475280016e-05, "loss": 0.0103, "step": 578230 }, { "epoch": 1.5, "learning_rate": 7.51677765364287e-05, "loss": 0.0106, "step": 578240 }, { "epoch": 1.5, "learning_rate": 7.516388832005723e-05, "loss": 0.0095, "step": 578250 }, { "epoch": 1.5, "learning_rate": 7.516000010368577e-05, "loss": 0.009, "step": 578260 }, { "epoch": 1.5, "learning_rate": 7.51561118873143e-05, "loss": 0.0061, "step": 578270 }, { "epoch": 1.5, "learning_rate": 7.515222367094284e-05, "loss": 0.0081, "step": 578280 }, { "epoch": 1.5, "learning_rate": 7.514833545457137e-05, "loss": 0.0132, "step": 578290 }, { "epoch": 1.5, "learning_rate": 7.514444723819991e-05, "loss": 0.0053, "step": 578300 }, { "epoch": 1.5, "learning_rate": 7.514055902182844e-05, "loss": 0.0113, "step": 578310 }, { "epoch": 1.5, "learning_rate": 7.513667080545698e-05, "loss": 0.0084, "step": 578320 }, { "epoch": 1.5, "learning_rate": 7.51327825890855e-05, "loss": 0.0112, "step": 578330 }, { "epoch": 1.5, "learning_rate": 7.512889437271403e-05, "loss": 0.0074, "step": 578340 }, { "epoch": 1.5, "learning_rate": 7.512500615634258e-05, "loss": 0.0129, "step": 578350 }, { "epoch": 1.5, "learning_rate": 7.51211179399711e-05, "loss": 0.0101, "step": 578360 }, { "epoch": 1.5, "learning_rate": 7.511722972359966e-05, "loss": 0.0143, "step": 578370 }, { "epoch": 1.5, "learning_rate": 7.511334150722817e-05, "loss": 0.0086, "step": 578380 }, { "epoch": 1.5, "learning_rate": 7.510945329085673e-05, "loss": 0.0103, "step": 578390 }, { "epoch": 1.5, "learning_rate": 7.510556507448526e-05, "loss": 0.0076, "step": 578400 }, { "epoch": 1.5, "learning_rate": 7.51016768581138e-05, "loss": 0.01, "step": 578410 }, { "epoch": 1.5, "learning_rate": 7.509778864174233e-05, "loss": 0.0125, "step": 578420 }, { "epoch": 1.5, "learning_rate": 7.509390042537087e-05, "loss": 0.0099, "step": 578430 }, { "epoch": 1.5, "learning_rate": 7.50900122089994e-05, "loss": 0.0115, "step": 578440 }, { "epoch": 1.5, "learning_rate": 7.508612399262794e-05, "loss": 0.0089, "step": 578450 }, { "epoch": 1.5, "learning_rate": 7.508223577625647e-05, "loss": 0.0071, "step": 578460 }, { "epoch": 1.5, "learning_rate": 7.507834755988501e-05, "loss": 0.0103, "step": 578470 }, { "epoch": 1.5, "learning_rate": 7.507445934351354e-05, "loss": 0.011, "step": 578480 }, { "epoch": 1.5, "learning_rate": 7.507057112714208e-05, "loss": 0.0139, "step": 578490 }, { "epoch": 1.5, "learning_rate": 7.50666829107706e-05, "loss": 0.0116, "step": 578500 }, { "epoch": 1.5, "learning_rate": 7.506279469439915e-05, "loss": 0.0096, "step": 578510 }, { "epoch": 1.5, "learning_rate": 7.505890647802768e-05, "loss": 0.0083, "step": 578520 }, { "epoch": 1.5, "learning_rate": 7.505501826165623e-05, "loss": 0.0096, "step": 578530 }, { "epoch": 1.5, "learning_rate": 7.505113004528475e-05, "loss": 0.0069, "step": 578540 }, { "epoch": 1.5, "learning_rate": 7.50472418289133e-05, "loss": 0.0074, "step": 578550 }, { "epoch": 1.5, "learning_rate": 7.504335361254183e-05, "loss": 0.0079, "step": 578560 }, { "epoch": 1.5, "learning_rate": 7.503946539617037e-05, "loss": 0.0103, "step": 578570 }, { "epoch": 1.5, "learning_rate": 7.50355771797989e-05, "loss": 0.0107, "step": 578580 }, { "epoch": 1.5, "learning_rate": 7.503168896342743e-05, "loss": 0.0101, "step": 578590 }, { "epoch": 1.5, "learning_rate": 7.502780074705597e-05, "loss": 0.0047, "step": 578600 }, { "epoch": 1.5, "learning_rate": 7.50239125306845e-05, "loss": 0.0092, "step": 578610 }, { "epoch": 1.5, "learning_rate": 7.502002431431304e-05, "loss": 0.0104, "step": 578620 }, { "epoch": 1.5, "learning_rate": 7.501613609794157e-05, "loss": 0.0112, "step": 578630 }, { "epoch": 1.5, "learning_rate": 7.501224788157011e-05, "loss": 0.0071, "step": 578640 }, { "epoch": 1.5, "learning_rate": 7.500835966519864e-05, "loss": 0.0122, "step": 578650 }, { "epoch": 1.5, "learning_rate": 7.500447144882718e-05, "loss": 0.0084, "step": 578660 }, { "epoch": 1.5, "learning_rate": 7.50005832324557e-05, "loss": 0.0098, "step": 578670 }, { "epoch": 1.5, "learning_rate": 7.499669501608425e-05, "loss": 0.008, "step": 578680 }, { "epoch": 1.5, "learning_rate": 7.499280679971279e-05, "loss": 0.008, "step": 578690 }, { "epoch": 1.5, "learning_rate": 7.498891858334132e-05, "loss": 0.0078, "step": 578700 }, { "epoch": 1.5, "learning_rate": 7.498503036696984e-05, "loss": 0.0128, "step": 578710 }, { "epoch": 1.5, "learning_rate": 7.498114215059839e-05, "loss": 0.008, "step": 578720 }, { "epoch": 1.5, "learning_rate": 7.497725393422693e-05, "loss": 0.0081, "step": 578730 }, { "epoch": 1.5, "learning_rate": 7.497336571785546e-05, "loss": 0.0087, "step": 578740 }, { "epoch": 1.5, "learning_rate": 7.4969477501484e-05, "loss": 0.0097, "step": 578750 }, { "epoch": 1.5, "learning_rate": 7.496558928511253e-05, "loss": 0.0129, "step": 578760 }, { "epoch": 1.5, "learning_rate": 7.496170106874107e-05, "loss": 0.0094, "step": 578770 }, { "epoch": 1.5, "learning_rate": 7.49578128523696e-05, "loss": 0.0072, "step": 578780 }, { "epoch": 1.5, "learning_rate": 7.495392463599814e-05, "loss": 0.0078, "step": 578790 }, { "epoch": 1.5, "learning_rate": 7.495003641962667e-05, "loss": 0.0112, "step": 578800 }, { "epoch": 1.5, "learning_rate": 7.494614820325521e-05, "loss": 0.0107, "step": 578810 }, { "epoch": 1.5, "learning_rate": 7.494225998688375e-05, "loss": 0.0084, "step": 578820 }, { "epoch": 1.5, "learning_rate": 7.493837177051228e-05, "loss": 0.0091, "step": 578830 }, { "epoch": 1.5, "learning_rate": 7.493448355414082e-05, "loss": 0.0074, "step": 578840 }, { "epoch": 1.5, "learning_rate": 7.493059533776935e-05, "loss": 0.0096, "step": 578850 }, { "epoch": 1.5, "learning_rate": 7.492670712139789e-05, "loss": 0.0082, "step": 578860 }, { "epoch": 1.5, "learning_rate": 7.492281890502642e-05, "loss": 0.0077, "step": 578870 }, { "epoch": 1.5, "learning_rate": 7.491893068865496e-05, "loss": 0.0072, "step": 578880 }, { "epoch": 1.5, "learning_rate": 7.49150424722835e-05, "loss": 0.0128, "step": 578890 }, { "epoch": 1.5, "learning_rate": 7.491115425591203e-05, "loss": 0.0079, "step": 578900 }, { "epoch": 1.5, "learning_rate": 7.490726603954057e-05, "loss": 0.0068, "step": 578910 }, { "epoch": 1.5, "learning_rate": 7.49033778231691e-05, "loss": 0.0074, "step": 578920 }, { "epoch": 1.5, "learning_rate": 7.489948960679764e-05, "loss": 0.007, "step": 578930 }, { "epoch": 1.5, "learning_rate": 7.489560139042617e-05, "loss": 0.0067, "step": 578940 }, { "epoch": 1.5, "learning_rate": 7.489171317405471e-05, "loss": 0.0077, "step": 578950 }, { "epoch": 1.5, "learning_rate": 7.488782495768324e-05, "loss": 0.0074, "step": 578960 }, { "epoch": 1.5, "learning_rate": 7.488393674131176e-05, "loss": 0.0073, "step": 578970 }, { "epoch": 1.5, "learning_rate": 7.48800485249403e-05, "loss": 0.0092, "step": 578980 }, { "epoch": 1.5, "learning_rate": 7.487616030856885e-05, "loss": 0.0082, "step": 578990 }, { "epoch": 1.5, "learning_rate": 7.487227209219738e-05, "loss": 0.0089, "step": 579000 }, { "epoch": 1.5, "eval_cer": 0.8816774928583525, "eval_loss": 0.006176051218062639, "eval_runtime": 107.8782, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 579000 }, { "epoch": 1.5, "learning_rate": 7.486838387582592e-05, "loss": 0.0083, "step": 579010 }, { "epoch": 1.5, "learning_rate": 7.486449565945445e-05, "loss": 0.0091, "step": 579020 }, { "epoch": 1.5, "learning_rate": 7.486060744308299e-05, "loss": 0.0065, "step": 579030 }, { "epoch": 1.5, "learning_rate": 7.485671922671152e-05, "loss": 0.0124, "step": 579040 }, { "epoch": 1.5, "learning_rate": 7.485283101034006e-05, "loss": 0.0071, "step": 579050 }, { "epoch": 1.5, "learning_rate": 7.484894279396859e-05, "loss": 0.0072, "step": 579060 }, { "epoch": 1.5, "learning_rate": 7.484505457759713e-05, "loss": 0.0085, "step": 579070 }, { "epoch": 1.5, "learning_rate": 7.484116636122567e-05, "loss": 0.0092, "step": 579080 }, { "epoch": 1.5, "learning_rate": 7.48372781448542e-05, "loss": 0.0072, "step": 579090 }, { "epoch": 1.5, "learning_rate": 7.483338992848274e-05, "loss": 0.0103, "step": 579100 }, { "epoch": 1.5, "learning_rate": 7.482950171211127e-05, "loss": 0.0097, "step": 579110 }, { "epoch": 1.5, "learning_rate": 7.482561349573981e-05, "loss": 0.0084, "step": 579120 }, { "epoch": 1.5, "learning_rate": 7.482172527936834e-05, "loss": 0.0086, "step": 579130 }, { "epoch": 1.5, "learning_rate": 7.481783706299688e-05, "loss": 0.0075, "step": 579140 }, { "epoch": 1.5, "learning_rate": 7.481394884662542e-05, "loss": 0.0078, "step": 579150 }, { "epoch": 1.5, "learning_rate": 7.481006063025395e-05, "loss": 0.0096, "step": 579160 }, { "epoch": 1.5, "learning_rate": 7.480617241388249e-05, "loss": 0.0086, "step": 579170 }, { "epoch": 1.5, "learning_rate": 7.480228419751102e-05, "loss": 0.0086, "step": 579180 }, { "epoch": 1.5, "learning_rate": 7.479839598113956e-05, "loss": 0.0108, "step": 579190 }, { "epoch": 1.5, "learning_rate": 7.479450776476809e-05, "loss": 0.0085, "step": 579200 }, { "epoch": 1.5, "learning_rate": 7.479061954839662e-05, "loss": 0.0086, "step": 579210 }, { "epoch": 1.5, "learning_rate": 7.478673133202516e-05, "loss": 0.0112, "step": 579220 }, { "epoch": 1.5, "learning_rate": 7.478284311565368e-05, "loss": 0.0112, "step": 579230 }, { "epoch": 1.5, "learning_rate": 7.477895489928223e-05, "loss": 0.0087, "step": 579240 }, { "epoch": 1.5, "learning_rate": 7.477506668291077e-05, "loss": 0.0075, "step": 579250 }, { "epoch": 1.5, "learning_rate": 7.47711784665393e-05, "loss": 0.0083, "step": 579260 }, { "epoch": 1.5, "learning_rate": 7.476729025016784e-05, "loss": 0.0081, "step": 579270 }, { "epoch": 1.5, "learning_rate": 7.476340203379637e-05, "loss": 0.009, "step": 579280 }, { "epoch": 1.5, "learning_rate": 7.475951381742491e-05, "loss": 0.0097, "step": 579290 }, { "epoch": 1.5, "learning_rate": 7.475562560105344e-05, "loss": 0.0104, "step": 579300 }, { "epoch": 1.5, "learning_rate": 7.475173738468198e-05, "loss": 0.0105, "step": 579310 }, { "epoch": 1.5, "learning_rate": 7.47478491683105e-05, "loss": 0.0089, "step": 579320 }, { "epoch": 1.5, "learning_rate": 7.474396095193905e-05, "loss": 0.017, "step": 579330 }, { "epoch": 1.5, "learning_rate": 7.474007273556759e-05, "loss": 0.0089, "step": 579340 }, { "epoch": 1.5, "learning_rate": 7.473618451919612e-05, "loss": 0.0118, "step": 579350 }, { "epoch": 1.5, "learning_rate": 7.473229630282466e-05, "loss": 0.012, "step": 579360 }, { "epoch": 1.5, "learning_rate": 7.472840808645319e-05, "loss": 0.0076, "step": 579370 }, { "epoch": 1.5, "learning_rate": 7.472451987008173e-05, "loss": 0.0078, "step": 579380 }, { "epoch": 1.5, "learning_rate": 7.472063165371026e-05, "loss": 0.009, "step": 579390 }, { "epoch": 1.5, "learning_rate": 7.47167434373388e-05, "loss": 0.0079, "step": 579400 }, { "epoch": 1.5, "learning_rate": 7.471285522096733e-05, "loss": 0.0083, "step": 579410 }, { "epoch": 1.5, "learning_rate": 7.470896700459587e-05, "loss": 0.0079, "step": 579420 }, { "epoch": 1.5, "learning_rate": 7.470507878822441e-05, "loss": 0.0077, "step": 579430 }, { "epoch": 1.5, "learning_rate": 7.470119057185294e-05, "loss": 0.007, "step": 579440 }, { "epoch": 1.5, "learning_rate": 7.469730235548148e-05, "loss": 0.01, "step": 579450 }, { "epoch": 1.5, "learning_rate": 7.469341413911001e-05, "loss": 0.0088, "step": 579460 }, { "epoch": 1.5, "learning_rate": 7.468952592273853e-05, "loss": 0.0099, "step": 579470 }, { "epoch": 1.5, "learning_rate": 7.468563770636708e-05, "loss": 0.0082, "step": 579480 }, { "epoch": 1.5, "learning_rate": 7.46817494899956e-05, "loss": 0.0084, "step": 579490 }, { "epoch": 1.5, "learning_rate": 7.467786127362415e-05, "loss": 0.0125, "step": 579500 }, { "epoch": 1.5, "learning_rate": 7.467397305725267e-05, "loss": 0.01, "step": 579510 }, { "epoch": 1.5, "learning_rate": 7.467008484088122e-05, "loss": 0.0089, "step": 579520 }, { "epoch": 1.5, "learning_rate": 7.466619662450976e-05, "loss": 0.0093, "step": 579530 }, { "epoch": 1.5, "learning_rate": 7.466230840813829e-05, "loss": 0.0106, "step": 579540 }, { "epoch": 1.5, "learning_rate": 7.465842019176683e-05, "loss": 0.0106, "step": 579550 }, { "epoch": 1.5, "learning_rate": 7.465453197539536e-05, "loss": 0.0071, "step": 579560 }, { "epoch": 1.5, "learning_rate": 7.46506437590239e-05, "loss": 0.0081, "step": 579570 }, { "epoch": 1.5, "learning_rate": 7.464675554265243e-05, "loss": 0.0103, "step": 579580 }, { "epoch": 1.5, "learning_rate": 7.464286732628097e-05, "loss": 0.0089, "step": 579590 }, { "epoch": 1.5, "learning_rate": 7.463897910990951e-05, "loss": 0.0102, "step": 579600 }, { "epoch": 1.5, "learning_rate": 7.463509089353804e-05, "loss": 0.009, "step": 579610 }, { "epoch": 1.5, "learning_rate": 7.463120267716658e-05, "loss": 0.0097, "step": 579620 }, { "epoch": 1.5, "learning_rate": 7.46273144607951e-05, "loss": 0.0155, "step": 579630 }, { "epoch": 1.5, "learning_rate": 7.462342624442365e-05, "loss": 0.0081, "step": 579640 }, { "epoch": 1.5, "learning_rate": 7.461953802805218e-05, "loss": 0.0084, "step": 579650 }, { "epoch": 1.5, "learning_rate": 7.461564981168072e-05, "loss": 0.0107, "step": 579660 }, { "epoch": 1.5, "learning_rate": 7.461176159530925e-05, "loss": 0.008, "step": 579670 }, { "epoch": 1.5, "learning_rate": 7.460787337893779e-05, "loss": 0.0082, "step": 579680 }, { "epoch": 1.5, "learning_rate": 7.460398516256633e-05, "loss": 0.0089, "step": 579690 }, { "epoch": 1.5, "learning_rate": 7.460009694619486e-05, "loss": 0.0089, "step": 579700 }, { "epoch": 1.5, "learning_rate": 7.459620872982339e-05, "loss": 0.0079, "step": 579710 }, { "epoch": 1.5, "learning_rate": 7.459232051345193e-05, "loss": 0.0093, "step": 579720 }, { "epoch": 1.5, "learning_rate": 7.458843229708045e-05, "loss": 0.0082, "step": 579730 }, { "epoch": 1.5, "learning_rate": 7.4584544080709e-05, "loss": 0.0078, "step": 579740 }, { "epoch": 1.5, "learning_rate": 7.458065586433752e-05, "loss": 0.0098, "step": 579750 }, { "epoch": 1.5, "learning_rate": 7.457676764796607e-05, "loss": 0.0076, "step": 579760 }, { "epoch": 1.5, "learning_rate": 7.45728794315946e-05, "loss": 0.0108, "step": 579770 }, { "epoch": 1.5, "learning_rate": 7.456899121522314e-05, "loss": 0.0098, "step": 579780 }, { "epoch": 1.5, "learning_rate": 7.456510299885168e-05, "loss": 0.0086, "step": 579790 }, { "epoch": 1.5, "learning_rate": 7.45612147824802e-05, "loss": 0.0079, "step": 579800 }, { "epoch": 1.5, "learning_rate": 7.455732656610875e-05, "loss": 0.0088, "step": 579810 }, { "epoch": 1.5, "learning_rate": 7.455343834973728e-05, "loss": 0.0101, "step": 579820 }, { "epoch": 1.5, "learning_rate": 7.454955013336582e-05, "loss": 0.0095, "step": 579830 }, { "epoch": 1.5, "learning_rate": 7.454566191699435e-05, "loss": 0.0106, "step": 579840 }, { "epoch": 1.5, "learning_rate": 7.454177370062289e-05, "loss": 0.0086, "step": 579850 }, { "epoch": 1.5, "learning_rate": 7.453788548425143e-05, "loss": 0.0087, "step": 579860 }, { "epoch": 1.5, "learning_rate": 7.453399726787996e-05, "loss": 0.0099, "step": 579870 }, { "epoch": 1.5, "learning_rate": 7.45301090515085e-05, "loss": 0.0082, "step": 579880 }, { "epoch": 1.5, "learning_rate": 7.452622083513703e-05, "loss": 0.0096, "step": 579890 }, { "epoch": 1.5, "learning_rate": 7.452233261876557e-05, "loss": 0.0077, "step": 579900 }, { "epoch": 1.5, "learning_rate": 7.45184444023941e-05, "loss": 0.0092, "step": 579910 }, { "epoch": 1.5, "learning_rate": 7.451455618602264e-05, "loss": 0.0078, "step": 579920 }, { "epoch": 1.5, "learning_rate": 7.451066796965117e-05, "loss": 0.0096, "step": 579930 }, { "epoch": 1.5, "learning_rate": 7.450677975327971e-05, "loss": 0.0094, "step": 579940 }, { "epoch": 1.5, "learning_rate": 7.450289153690824e-05, "loss": 0.0129, "step": 579950 }, { "epoch": 1.5, "learning_rate": 7.449900332053678e-05, "loss": 0.0084, "step": 579960 }, { "epoch": 1.5, "learning_rate": 7.44951151041653e-05, "loss": 0.0095, "step": 579970 }, { "epoch": 1.5, "learning_rate": 7.449122688779385e-05, "loss": 0.0089, "step": 579980 }, { "epoch": 1.5, "learning_rate": 7.448733867142237e-05, "loss": 0.0093, "step": 579990 }, { "epoch": 1.5, "learning_rate": 7.448345045505092e-05, "loss": 0.0111, "step": 580000 }, { "epoch": 1.5, "eval_cer": 0.8816928888646285, "eval_loss": 0.006042073480784893, "eval_runtime": 107.9383, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 580000 }, { "epoch": 1.5, "learning_rate": 7.447956223867944e-05, "loss": 0.0091, "step": 580010 }, { "epoch": 1.5, "learning_rate": 7.447567402230799e-05, "loss": 0.0067, "step": 580020 }, { "epoch": 1.5, "learning_rate": 7.447178580593651e-05, "loss": 0.0122, "step": 580030 }, { "epoch": 1.5, "learning_rate": 7.446789758956506e-05, "loss": 0.0111, "step": 580040 }, { "epoch": 1.5, "learning_rate": 7.44640093731936e-05, "loss": 0.0079, "step": 580050 }, { "epoch": 1.5, "learning_rate": 7.446012115682213e-05, "loss": 0.0108, "step": 580060 }, { "epoch": 1.5, "learning_rate": 7.445623294045067e-05, "loss": 0.0101, "step": 580070 }, { "epoch": 1.5, "learning_rate": 7.44523447240792e-05, "loss": 0.0072, "step": 580080 }, { "epoch": 1.5, "learning_rate": 7.444845650770774e-05, "loss": 0.0108, "step": 580090 }, { "epoch": 1.5, "learning_rate": 7.444456829133627e-05, "loss": 0.0085, "step": 580100 }, { "epoch": 1.5, "learning_rate": 7.444068007496481e-05, "loss": 0.0094, "step": 580110 }, { "epoch": 1.5, "learning_rate": 7.443679185859335e-05, "loss": 0.0098, "step": 580120 }, { "epoch": 1.5, "learning_rate": 7.443290364222188e-05, "loss": 0.0118, "step": 580130 }, { "epoch": 1.5, "learning_rate": 7.442901542585042e-05, "loss": 0.0103, "step": 580140 }, { "epoch": 1.5, "learning_rate": 7.442512720947895e-05, "loss": 0.0059, "step": 580150 }, { "epoch": 1.5, "learning_rate": 7.442123899310749e-05, "loss": 0.0095, "step": 580160 }, { "epoch": 1.5, "learning_rate": 7.441735077673602e-05, "loss": 0.0103, "step": 580170 }, { "epoch": 1.5, "learning_rate": 7.441346256036456e-05, "loss": 0.009, "step": 580180 }, { "epoch": 1.5, "learning_rate": 7.440957434399309e-05, "loss": 0.0072, "step": 580190 }, { "epoch": 1.5, "learning_rate": 7.440568612762161e-05, "loss": 0.0067, "step": 580200 }, { "epoch": 1.5, "learning_rate": 7.440179791125016e-05, "loss": 0.0069, "step": 580210 }, { "epoch": 1.5, "learning_rate": 7.43979096948787e-05, "loss": 0.0085, "step": 580220 }, { "epoch": 1.5, "learning_rate": 7.439402147850723e-05, "loss": 0.0114, "step": 580230 }, { "epoch": 1.5, "learning_rate": 7.439013326213577e-05, "loss": 0.0084, "step": 580240 }, { "epoch": 1.5, "learning_rate": 7.43862450457643e-05, "loss": 0.0084, "step": 580250 }, { "epoch": 1.5, "learning_rate": 7.438235682939284e-05, "loss": 0.011, "step": 580260 }, { "epoch": 1.5, "learning_rate": 7.437846861302136e-05, "loss": 0.0135, "step": 580270 }, { "epoch": 1.5, "learning_rate": 7.43745803966499e-05, "loss": 0.0093, "step": 580280 }, { "epoch": 1.5, "learning_rate": 7.437069218027843e-05, "loss": 0.0082, "step": 580290 }, { "epoch": 1.5, "learning_rate": 7.436680396390698e-05, "loss": 0.0083, "step": 580300 }, { "epoch": 1.5, "learning_rate": 7.436291574753552e-05, "loss": 0.009, "step": 580310 }, { "epoch": 1.5, "learning_rate": 7.435902753116405e-05, "loss": 0.0115, "step": 580320 }, { "epoch": 1.5, "learning_rate": 7.435513931479259e-05, "loss": 0.0088, "step": 580330 }, { "epoch": 1.5, "learning_rate": 7.435125109842112e-05, "loss": 0.0093, "step": 580340 }, { "epoch": 1.5, "learning_rate": 7.434736288204966e-05, "loss": 0.0084, "step": 580350 }, { "epoch": 1.5, "learning_rate": 7.434347466567819e-05, "loss": 0.0124, "step": 580360 }, { "epoch": 1.5, "learning_rate": 7.433958644930673e-05, "loss": 0.0078, "step": 580370 }, { "epoch": 1.5, "learning_rate": 7.433569823293527e-05, "loss": 0.0063, "step": 580380 }, { "epoch": 1.5, "learning_rate": 7.43318100165638e-05, "loss": 0.0073, "step": 580390 }, { "epoch": 1.5, "learning_rate": 7.432792180019234e-05, "loss": 0.0091, "step": 580400 }, { "epoch": 1.5, "learning_rate": 7.432403358382087e-05, "loss": 0.0141, "step": 580410 }, { "epoch": 1.5, "learning_rate": 7.432014536744941e-05, "loss": 0.0065, "step": 580420 }, { "epoch": 1.5, "learning_rate": 7.431625715107794e-05, "loss": 0.0084, "step": 580430 }, { "epoch": 1.5, "learning_rate": 7.431236893470648e-05, "loss": 0.0106, "step": 580440 }, { "epoch": 1.5, "learning_rate": 7.4308480718335e-05, "loss": 0.0084, "step": 580450 }, { "epoch": 1.5, "learning_rate": 7.430459250196353e-05, "loss": 0.0089, "step": 580460 }, { "epoch": 1.5, "learning_rate": 7.430070428559208e-05, "loss": 0.0065, "step": 580470 }, { "epoch": 1.5, "learning_rate": 7.429681606922062e-05, "loss": 0.0083, "step": 580480 }, { "epoch": 1.5, "learning_rate": 7.429292785284915e-05, "loss": 0.0095, "step": 580490 }, { "epoch": 1.5, "learning_rate": 7.428903963647769e-05, "loss": 0.007, "step": 580500 }, { "epoch": 1.5, "learning_rate": 7.428515142010621e-05, "loss": 0.012, "step": 580510 }, { "epoch": 1.5, "learning_rate": 7.428126320373476e-05, "loss": 0.0097, "step": 580520 }, { "epoch": 1.5, "learning_rate": 7.427737498736328e-05, "loss": 0.0121, "step": 580530 }, { "epoch": 1.5, "learning_rate": 7.427348677099183e-05, "loss": 0.0061, "step": 580540 }, { "epoch": 1.5, "learning_rate": 7.426959855462035e-05, "loss": 0.0087, "step": 580550 }, { "epoch": 1.5, "learning_rate": 7.42657103382489e-05, "loss": 0.0079, "step": 580560 }, { "epoch": 1.5, "learning_rate": 7.426182212187744e-05, "loss": 0.0084, "step": 580570 }, { "epoch": 1.5, "learning_rate": 7.425793390550597e-05, "loss": 0.0093, "step": 580580 }, { "epoch": 1.5, "learning_rate": 7.425404568913451e-05, "loss": 0.0064, "step": 580590 }, { "epoch": 1.5, "learning_rate": 7.425015747276304e-05, "loss": 0.0079, "step": 580600 }, { "epoch": 1.51, "learning_rate": 7.424626925639158e-05, "loss": 0.0112, "step": 580610 }, { "epoch": 1.51, "learning_rate": 7.42423810400201e-05, "loss": 0.0089, "step": 580620 }, { "epoch": 1.51, "learning_rate": 7.423849282364865e-05, "loss": 0.007, "step": 580630 }, { "epoch": 1.51, "learning_rate": 7.423460460727719e-05, "loss": 0.0126, "step": 580640 }, { "epoch": 1.51, "learning_rate": 7.423071639090572e-05, "loss": 0.0095, "step": 580650 }, { "epoch": 1.51, "learning_rate": 7.422682817453426e-05, "loss": 0.0099, "step": 580660 }, { "epoch": 1.51, "learning_rate": 7.422293995816279e-05, "loss": 0.009, "step": 580670 }, { "epoch": 1.51, "learning_rate": 7.421905174179133e-05, "loss": 0.0124, "step": 580680 }, { "epoch": 1.51, "learning_rate": 7.421516352541986e-05, "loss": 0.0077, "step": 580690 }, { "epoch": 1.51, "learning_rate": 7.421127530904838e-05, "loss": 0.0082, "step": 580700 }, { "epoch": 1.51, "learning_rate": 7.420738709267693e-05, "loss": 0.009, "step": 580710 }, { "epoch": 1.51, "learning_rate": 7.420349887630545e-05, "loss": 0.0066, "step": 580720 }, { "epoch": 1.51, "learning_rate": 7.4199610659934e-05, "loss": 0.0089, "step": 580730 }, { "epoch": 1.51, "learning_rate": 7.419572244356254e-05, "loss": 0.0088, "step": 580740 }, { "epoch": 1.51, "learning_rate": 7.419183422719107e-05, "loss": 0.0072, "step": 580750 }, { "epoch": 1.51, "learning_rate": 7.41879460108196e-05, "loss": 0.0067, "step": 580760 }, { "epoch": 1.51, "learning_rate": 7.418405779444813e-05, "loss": 0.016, "step": 580770 }, { "epoch": 1.51, "learning_rate": 7.418016957807668e-05, "loss": 0.0096, "step": 580780 }, { "epoch": 1.51, "learning_rate": 7.41762813617052e-05, "loss": 0.0072, "step": 580790 }, { "epoch": 1.51, "learning_rate": 7.417239314533375e-05, "loss": 0.0068, "step": 580800 }, { "epoch": 1.51, "learning_rate": 7.416850492896227e-05, "loss": 0.009, "step": 580810 }, { "epoch": 1.51, "learning_rate": 7.416461671259082e-05, "loss": 0.0072, "step": 580820 }, { "epoch": 1.51, "learning_rate": 7.416072849621936e-05, "loss": 0.007, "step": 580830 }, { "epoch": 1.51, "learning_rate": 7.415684027984789e-05, "loss": 0.0064, "step": 580840 }, { "epoch": 1.51, "learning_rate": 7.415295206347643e-05, "loss": 0.0076, "step": 580850 }, { "epoch": 1.51, "learning_rate": 7.414906384710496e-05, "loss": 0.0074, "step": 580860 }, { "epoch": 1.51, "learning_rate": 7.41451756307335e-05, "loss": 0.0077, "step": 580870 }, { "epoch": 1.51, "learning_rate": 7.414128741436202e-05, "loss": 0.008, "step": 580880 }, { "epoch": 1.51, "learning_rate": 7.413739919799057e-05, "loss": 0.0118, "step": 580890 }, { "epoch": 1.51, "learning_rate": 7.41335109816191e-05, "loss": 0.0074, "step": 580900 }, { "epoch": 1.51, "learning_rate": 7.412962276524764e-05, "loss": 0.0087, "step": 580910 }, { "epoch": 1.51, "learning_rate": 7.412573454887618e-05, "loss": 0.0089, "step": 580920 }, { "epoch": 1.51, "learning_rate": 7.41218463325047e-05, "loss": 0.0067, "step": 580930 }, { "epoch": 1.51, "learning_rate": 7.411795811613325e-05, "loss": 0.0078, "step": 580940 }, { "epoch": 1.51, "learning_rate": 7.411406989976178e-05, "loss": 0.012, "step": 580950 }, { "epoch": 1.51, "learning_rate": 7.41101816833903e-05, "loss": 0.0102, "step": 580960 }, { "epoch": 1.51, "learning_rate": 7.410629346701885e-05, "loss": 0.0107, "step": 580970 }, { "epoch": 1.51, "learning_rate": 7.410240525064737e-05, "loss": 0.0096, "step": 580980 }, { "epoch": 1.51, "learning_rate": 7.409851703427592e-05, "loss": 0.0086, "step": 580990 }, { "epoch": 1.51, "learning_rate": 7.409462881790444e-05, "loss": 0.0095, "step": 581000 }, { "epoch": 1.51, "eval_cer": 0.8816984874123652, "eval_loss": 0.006130463909357786, "eval_runtime": 107.9133, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 581000 }, { "epoch": 1.51, "learning_rate": 7.409074060153298e-05, "loss": 0.0092, "step": 581010 }, { "epoch": 1.51, "learning_rate": 7.408685238516153e-05, "loss": 0.0081, "step": 581020 }, { "epoch": 1.51, "learning_rate": 7.408296416879005e-05, "loss": 0.0084, "step": 581030 }, { "epoch": 1.51, "learning_rate": 7.40790759524186e-05, "loss": 0.0077, "step": 581040 }, { "epoch": 1.51, "learning_rate": 7.407518773604712e-05, "loss": 0.0099, "step": 581050 }, { "epoch": 1.51, "learning_rate": 7.407129951967567e-05, "loss": 0.0105, "step": 581060 }, { "epoch": 1.51, "learning_rate": 7.40674113033042e-05, "loss": 0.0101, "step": 581070 }, { "epoch": 1.51, "learning_rate": 7.406352308693274e-05, "loss": 0.0085, "step": 581080 }, { "epoch": 1.51, "learning_rate": 7.405963487056128e-05, "loss": 0.007, "step": 581090 }, { "epoch": 1.51, "learning_rate": 7.40557466541898e-05, "loss": 0.0099, "step": 581100 }, { "epoch": 1.51, "learning_rate": 7.405185843781835e-05, "loss": 0.0115, "step": 581110 }, { "epoch": 1.51, "learning_rate": 7.404797022144688e-05, "loss": 0.0129, "step": 581120 }, { "epoch": 1.51, "learning_rate": 7.404408200507542e-05, "loss": 0.01, "step": 581130 }, { "epoch": 1.51, "learning_rate": 7.404019378870394e-05, "loss": 0.0075, "step": 581140 }, { "epoch": 1.51, "learning_rate": 7.403630557233249e-05, "loss": 0.0096, "step": 581150 }, { "epoch": 1.51, "learning_rate": 7.403241735596101e-05, "loss": 0.0088, "step": 581160 }, { "epoch": 1.51, "learning_rate": 7.402852913958956e-05, "loss": 0.0075, "step": 581170 }, { "epoch": 1.51, "learning_rate": 7.40246409232181e-05, "loss": 0.0079, "step": 581180 }, { "epoch": 1.51, "learning_rate": 7.402075270684663e-05, "loss": 0.0056, "step": 581190 }, { "epoch": 1.51, "learning_rate": 7.401686449047515e-05, "loss": 0.0067, "step": 581200 }, { "epoch": 1.51, "learning_rate": 7.40129762741037e-05, "loss": 0.0081, "step": 581210 }, { "epoch": 1.51, "learning_rate": 7.400908805773222e-05, "loss": 0.0089, "step": 581220 }, { "epoch": 1.51, "learning_rate": 7.400519984136077e-05, "loss": 0.008, "step": 581230 }, { "epoch": 1.51, "learning_rate": 7.40013116249893e-05, "loss": 0.0093, "step": 581240 }, { "epoch": 1.51, "learning_rate": 7.399742340861784e-05, "loss": 0.0111, "step": 581250 }, { "epoch": 1.51, "learning_rate": 7.399353519224636e-05, "loss": 0.0082, "step": 581260 }, { "epoch": 1.51, "learning_rate": 7.39896469758749e-05, "loss": 0.011, "step": 581270 }, { "epoch": 1.51, "learning_rate": 7.398575875950345e-05, "loss": 0.0084, "step": 581280 }, { "epoch": 1.51, "learning_rate": 7.398187054313197e-05, "loss": 0.0079, "step": 581290 }, { "epoch": 1.51, "learning_rate": 7.397798232676052e-05, "loss": 0.0071, "step": 581300 }, { "epoch": 1.51, "learning_rate": 7.397409411038904e-05, "loss": 0.008, "step": 581310 }, { "epoch": 1.51, "learning_rate": 7.397020589401759e-05, "loss": 0.0105, "step": 581320 }, { "epoch": 1.51, "learning_rate": 7.396631767764611e-05, "loss": 0.0103, "step": 581330 }, { "epoch": 1.51, "learning_rate": 7.396242946127466e-05, "loss": 0.0086, "step": 581340 }, { "epoch": 1.51, "learning_rate": 7.39585412449032e-05, "loss": 0.013, "step": 581350 }, { "epoch": 1.51, "learning_rate": 7.395465302853173e-05, "loss": 0.0053, "step": 581360 }, { "epoch": 1.51, "learning_rate": 7.395076481216027e-05, "loss": 0.01, "step": 581370 }, { "epoch": 1.51, "learning_rate": 7.39468765957888e-05, "loss": 0.0086, "step": 581380 }, { "epoch": 1.51, "learning_rate": 7.394298837941734e-05, "loss": 0.0096, "step": 581390 }, { "epoch": 1.51, "learning_rate": 7.393910016304586e-05, "loss": 0.0101, "step": 581400 }, { "epoch": 1.51, "learning_rate": 7.39352119466744e-05, "loss": 0.0098, "step": 581410 }, { "epoch": 1.51, "learning_rate": 7.393132373030293e-05, "loss": 0.009, "step": 581420 }, { "epoch": 1.51, "learning_rate": 7.392743551393148e-05, "loss": 0.0098, "step": 581430 }, { "epoch": 1.51, "learning_rate": 7.392354729756e-05, "loss": 0.0072, "step": 581440 }, { "epoch": 1.51, "learning_rate": 7.391965908118855e-05, "loss": 0.0113, "step": 581450 }, { "epoch": 1.51, "learning_rate": 7.391577086481707e-05, "loss": 0.0097, "step": 581460 }, { "epoch": 1.51, "learning_rate": 7.391188264844562e-05, "loss": 0.0079, "step": 581470 }, { "epoch": 1.51, "learning_rate": 7.390799443207414e-05, "loss": 0.0105, "step": 581480 }, { "epoch": 1.51, "learning_rate": 7.390410621570269e-05, "loss": 0.0078, "step": 581490 }, { "epoch": 1.51, "learning_rate": 7.390021799933121e-05, "loss": 0.0101, "step": 581500 }, { "epoch": 1.51, "learning_rate": 7.389632978295976e-05, "loss": 0.0097, "step": 581510 }, { "epoch": 1.51, "learning_rate": 7.389244156658828e-05, "loss": 0.0103, "step": 581520 }, { "epoch": 1.51, "learning_rate": 7.388855335021682e-05, "loss": 0.0088, "step": 581530 }, { "epoch": 1.51, "learning_rate": 7.388466513384537e-05, "loss": 0.0114, "step": 581540 }, { "epoch": 1.51, "learning_rate": 7.38807769174739e-05, "loss": 0.0116, "step": 581550 }, { "epoch": 1.51, "learning_rate": 7.387688870110244e-05, "loss": 0.0072, "step": 581560 }, { "epoch": 1.51, "learning_rate": 7.387300048473096e-05, "loss": 0.0072, "step": 581570 }, { "epoch": 1.51, "learning_rate": 7.38691122683595e-05, "loss": 0.0083, "step": 581580 }, { "epoch": 1.51, "learning_rate": 7.386522405198803e-05, "loss": 0.0087, "step": 581590 }, { "epoch": 1.51, "learning_rate": 7.386133583561658e-05, "loss": 0.0081, "step": 581600 }, { "epoch": 1.51, "learning_rate": 7.385744761924512e-05, "loss": 0.0075, "step": 581610 }, { "epoch": 1.51, "learning_rate": 7.385355940287365e-05, "loss": 0.0087, "step": 581620 }, { "epoch": 1.51, "learning_rate": 7.384967118650219e-05, "loss": 0.0077, "step": 581630 }, { "epoch": 1.51, "learning_rate": 7.384578297013072e-05, "loss": 0.0077, "step": 581640 }, { "epoch": 1.51, "learning_rate": 7.384189475375926e-05, "loss": 0.0125, "step": 581650 }, { "epoch": 1.51, "learning_rate": 7.383800653738778e-05, "loss": 0.009, "step": 581660 }, { "epoch": 1.51, "learning_rate": 7.383411832101633e-05, "loss": 0.0082, "step": 581670 }, { "epoch": 1.51, "learning_rate": 7.383023010464485e-05, "loss": 0.0092, "step": 581680 }, { "epoch": 1.51, "learning_rate": 7.382634188827338e-05, "loss": 0.0087, "step": 581690 }, { "epoch": 1.51, "learning_rate": 7.382245367190192e-05, "loss": 0.0087, "step": 581700 }, { "epoch": 1.51, "learning_rate": 7.381856545553047e-05, "loss": 0.0099, "step": 581710 }, { "epoch": 1.51, "learning_rate": 7.3814677239159e-05, "loss": 0.0077, "step": 581720 }, { "epoch": 1.51, "learning_rate": 7.381078902278754e-05, "loss": 0.0096, "step": 581730 }, { "epoch": 1.51, "learning_rate": 7.380690080641606e-05, "loss": 0.0149, "step": 581740 }, { "epoch": 1.51, "learning_rate": 7.38030125900446e-05, "loss": 0.0088, "step": 581750 }, { "epoch": 1.51, "learning_rate": 7.379912437367313e-05, "loss": 0.0083, "step": 581760 }, { "epoch": 1.51, "learning_rate": 7.379523615730168e-05, "loss": 0.0085, "step": 581770 }, { "epoch": 1.51, "learning_rate": 7.37913479409302e-05, "loss": 0.0088, "step": 581780 }, { "epoch": 1.51, "learning_rate": 7.378745972455874e-05, "loss": 0.0077, "step": 581790 }, { "epoch": 1.51, "learning_rate": 7.378357150818729e-05, "loss": 0.0076, "step": 581800 }, { "epoch": 1.51, "learning_rate": 7.377968329181581e-05, "loss": 0.0089, "step": 581810 }, { "epoch": 1.51, "learning_rate": 7.377579507544436e-05, "loss": 0.01, "step": 581820 }, { "epoch": 1.51, "learning_rate": 7.377190685907288e-05, "loss": 0.0105, "step": 581830 }, { "epoch": 1.51, "learning_rate": 7.376801864270143e-05, "loss": 0.009, "step": 581840 }, { "epoch": 1.51, "learning_rate": 7.376413042632995e-05, "loss": 0.0093, "step": 581850 }, { "epoch": 1.51, "learning_rate": 7.37602422099585e-05, "loss": 0.0082, "step": 581860 }, { "epoch": 1.51, "learning_rate": 7.375635399358704e-05, "loss": 0.0081, "step": 581870 }, { "epoch": 1.51, "learning_rate": 7.375246577721557e-05, "loss": 0.0127, "step": 581880 }, { "epoch": 1.51, "learning_rate": 7.374857756084411e-05, "loss": 0.0079, "step": 581890 }, { "epoch": 1.51, "learning_rate": 7.374468934447264e-05, "loss": 0.0075, "step": 581900 }, { "epoch": 1.51, "learning_rate": 7.374080112810118e-05, "loss": 0.0081, "step": 581910 }, { "epoch": 1.51, "learning_rate": 7.37369129117297e-05, "loss": 0.0109, "step": 581920 }, { "epoch": 1.51, "learning_rate": 7.373302469535825e-05, "loss": 0.0111, "step": 581930 }, { "epoch": 1.51, "learning_rate": 7.372913647898677e-05, "loss": 0.0075, "step": 581940 }, { "epoch": 1.51, "learning_rate": 7.37252482626153e-05, "loss": 0.0059, "step": 581950 }, { "epoch": 1.51, "learning_rate": 7.372136004624384e-05, "loss": 0.0086, "step": 581960 }, { "epoch": 1.51, "learning_rate": 7.371747182987239e-05, "loss": 0.0079, "step": 581970 }, { "epoch": 1.51, "learning_rate": 7.371358361350091e-05, "loss": 0.0095, "step": 581980 }, { "epoch": 1.51, "learning_rate": 7.370969539712946e-05, "loss": 0.0096, "step": 581990 }, { "epoch": 1.51, "learning_rate": 7.370580718075798e-05, "loss": 0.0091, "step": 582000 }, { "epoch": 1.51, "eval_cer": 0.8816984874123652, "eval_loss": 0.005966072902083397, "eval_runtime": 107.7983, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 582000 }, { "epoch": 1.51, "learning_rate": 7.370191896438653e-05, "loss": 0.0067, "step": 582010 }, { "epoch": 1.51, "learning_rate": 7.369803074801505e-05, "loss": 0.0095, "step": 582020 }, { "epoch": 1.51, "learning_rate": 7.36941425316436e-05, "loss": 0.0106, "step": 582030 }, { "epoch": 1.51, "learning_rate": 7.369025431527212e-05, "loss": 0.0067, "step": 582040 }, { "epoch": 1.51, "learning_rate": 7.368636609890066e-05, "loss": 0.0088, "step": 582050 }, { "epoch": 1.51, "learning_rate": 7.36824778825292e-05, "loss": 0.0091, "step": 582060 }, { "epoch": 1.51, "learning_rate": 7.367858966615773e-05, "loss": 0.007, "step": 582070 }, { "epoch": 1.51, "learning_rate": 7.367470144978628e-05, "loss": 0.0081, "step": 582080 }, { "epoch": 1.51, "learning_rate": 7.36708132334148e-05, "loss": 0.009, "step": 582090 }, { "epoch": 1.51, "learning_rate": 7.366692501704335e-05, "loss": 0.0081, "step": 582100 }, { "epoch": 1.51, "learning_rate": 7.366303680067187e-05, "loss": 0.0117, "step": 582110 }, { "epoch": 1.51, "learning_rate": 7.365914858430042e-05, "loss": 0.0154, "step": 582120 }, { "epoch": 1.51, "learning_rate": 7.365526036792896e-05, "loss": 0.0077, "step": 582130 }, { "epoch": 1.51, "learning_rate": 7.365137215155749e-05, "loss": 0.0125, "step": 582140 }, { "epoch": 1.51, "learning_rate": 7.364748393518603e-05, "loss": 0.0095, "step": 582150 }, { "epoch": 1.51, "learning_rate": 7.364359571881456e-05, "loss": 0.0084, "step": 582160 }, { "epoch": 1.51, "learning_rate": 7.36397075024431e-05, "loss": 0.0114, "step": 582170 }, { "epoch": 1.51, "learning_rate": 7.363581928607162e-05, "loss": 0.0091, "step": 582180 }, { "epoch": 1.51, "learning_rate": 7.363193106970015e-05, "loss": 0.0094, "step": 582190 }, { "epoch": 1.51, "learning_rate": 7.36280428533287e-05, "loss": 0.0084, "step": 582200 }, { "epoch": 1.51, "learning_rate": 7.362415463695722e-05, "loss": 0.0077, "step": 582210 }, { "epoch": 1.51, "learning_rate": 7.362026642058576e-05, "loss": 0.0115, "step": 582220 }, { "epoch": 1.51, "learning_rate": 7.36163782042143e-05, "loss": 0.0077, "step": 582230 }, { "epoch": 1.51, "learning_rate": 7.361248998784283e-05, "loss": 0.0084, "step": 582240 }, { "epoch": 1.51, "learning_rate": 7.360860177147138e-05, "loss": 0.0096, "step": 582250 }, { "epoch": 1.51, "learning_rate": 7.36047135550999e-05, "loss": 0.0094, "step": 582260 }, { "epoch": 1.51, "learning_rate": 7.360082533872845e-05, "loss": 0.0094, "step": 582270 }, { "epoch": 1.51, "learning_rate": 7.359693712235697e-05, "loss": 0.0102, "step": 582280 }, { "epoch": 1.51, "learning_rate": 7.359304890598552e-05, "loss": 0.009, "step": 582290 }, { "epoch": 1.51, "learning_rate": 7.358916068961404e-05, "loss": 0.0085, "step": 582300 }, { "epoch": 1.51, "learning_rate": 7.358527247324258e-05, "loss": 0.0082, "step": 582310 }, { "epoch": 1.51, "learning_rate": 7.358138425687113e-05, "loss": 0.0071, "step": 582320 }, { "epoch": 1.51, "learning_rate": 7.357749604049965e-05, "loss": 0.0092, "step": 582330 }, { "epoch": 1.51, "learning_rate": 7.35736078241282e-05, "loss": 0.008, "step": 582340 }, { "epoch": 1.51, "learning_rate": 7.356971960775672e-05, "loss": 0.0087, "step": 582350 }, { "epoch": 1.51, "learning_rate": 7.356583139138527e-05, "loss": 0.0098, "step": 582360 }, { "epoch": 1.51, "learning_rate": 7.35619431750138e-05, "loss": 0.014, "step": 582370 }, { "epoch": 1.51, "learning_rate": 7.355805495864234e-05, "loss": 0.0084, "step": 582380 }, { "epoch": 1.51, "learning_rate": 7.355416674227086e-05, "loss": 0.0109, "step": 582390 }, { "epoch": 1.51, "learning_rate": 7.35502785258994e-05, "loss": 0.0088, "step": 582400 }, { "epoch": 1.51, "learning_rate": 7.354639030952795e-05, "loss": 0.0062, "step": 582410 }, { "epoch": 1.51, "learning_rate": 7.354250209315647e-05, "loss": 0.0123, "step": 582420 }, { "epoch": 1.51, "learning_rate": 7.353861387678502e-05, "loss": 0.0072, "step": 582430 }, { "epoch": 1.51, "learning_rate": 7.353472566041354e-05, "loss": 0.0082, "step": 582440 }, { "epoch": 1.51, "learning_rate": 7.353083744404207e-05, "loss": 0.0096, "step": 582450 }, { "epoch": 1.51, "learning_rate": 7.352694922767061e-05, "loss": 0.0072, "step": 582460 }, { "epoch": 1.51, "learning_rate": 7.352306101129914e-05, "loss": 0.0103, "step": 582470 }, { "epoch": 1.51, "learning_rate": 7.351917279492768e-05, "loss": 0.0074, "step": 582480 }, { "epoch": 1.51, "learning_rate": 7.351528457855621e-05, "loss": 0.0107, "step": 582490 }, { "epoch": 1.51, "learning_rate": 7.351139636218475e-05, "loss": 0.0102, "step": 582500 }, { "epoch": 1.51, "learning_rate": 7.35075081458133e-05, "loss": 0.0119, "step": 582510 }, { "epoch": 1.51, "learning_rate": 7.350361992944182e-05, "loss": 0.0106, "step": 582520 }, { "epoch": 1.51, "learning_rate": 7.349973171307037e-05, "loss": 0.0122, "step": 582530 }, { "epoch": 1.51, "learning_rate": 7.34958434966989e-05, "loss": 0.0079, "step": 582540 }, { "epoch": 1.51, "learning_rate": 7.349195528032743e-05, "loss": 0.0105, "step": 582550 }, { "epoch": 1.51, "learning_rate": 7.348806706395596e-05, "loss": 0.0077, "step": 582560 }, { "epoch": 1.51, "learning_rate": 7.34841788475845e-05, "loss": 0.0088, "step": 582570 }, { "epoch": 1.51, "learning_rate": 7.348029063121305e-05, "loss": 0.0125, "step": 582580 }, { "epoch": 1.51, "learning_rate": 7.347640241484157e-05, "loss": 0.0098, "step": 582590 }, { "epoch": 1.51, "learning_rate": 7.347251419847012e-05, "loss": 0.009, "step": 582600 }, { "epoch": 1.51, "learning_rate": 7.346862598209864e-05, "loss": 0.0103, "step": 582610 }, { "epoch": 1.51, "learning_rate": 7.346473776572719e-05, "loss": 0.0095, "step": 582620 }, { "epoch": 1.51, "learning_rate": 7.346084954935571e-05, "loss": 0.0131, "step": 582630 }, { "epoch": 1.51, "learning_rate": 7.345696133298426e-05, "loss": 0.0091, "step": 582640 }, { "epoch": 1.51, "learning_rate": 7.345307311661278e-05, "loss": 0.0085, "step": 582650 }, { "epoch": 1.51, "learning_rate": 7.344918490024133e-05, "loss": 0.0118, "step": 582660 }, { "epoch": 1.51, "learning_rate": 7.344529668386987e-05, "loss": 0.0108, "step": 582670 }, { "epoch": 1.51, "learning_rate": 7.34414084674984e-05, "loss": 0.0072, "step": 582680 }, { "epoch": 1.51, "learning_rate": 7.343752025112692e-05, "loss": 0.0091, "step": 582690 }, { "epoch": 1.51, "learning_rate": 7.343363203475546e-05, "loss": 0.0092, "step": 582700 }, { "epoch": 1.51, "learning_rate": 7.342974381838399e-05, "loss": 0.0089, "step": 582710 }, { "epoch": 1.51, "learning_rate": 7.342585560201253e-05, "loss": 0.0125, "step": 582720 }, { "epoch": 1.51, "learning_rate": 7.342196738564106e-05, "loss": 0.0094, "step": 582730 }, { "epoch": 1.51, "learning_rate": 7.34180791692696e-05, "loss": 0.0111, "step": 582740 }, { "epoch": 1.51, "learning_rate": 7.341419095289813e-05, "loss": 0.0087, "step": 582750 }, { "epoch": 1.51, "learning_rate": 7.341030273652667e-05, "loss": 0.0098, "step": 582760 }, { "epoch": 1.51, "learning_rate": 7.340641452015522e-05, "loss": 0.0096, "step": 582770 }, { "epoch": 1.51, "learning_rate": 7.340252630378374e-05, "loss": 0.0106, "step": 582780 }, { "epoch": 1.51, "learning_rate": 7.339863808741229e-05, "loss": 0.0088, "step": 582790 }, { "epoch": 1.51, "learning_rate": 7.339474987104081e-05, "loss": 0.0092, "step": 582800 }, { "epoch": 1.51, "learning_rate": 7.339086165466935e-05, "loss": 0.0123, "step": 582810 }, { "epoch": 1.51, "learning_rate": 7.338697343829788e-05, "loss": 0.0087, "step": 582820 }, { "epoch": 1.51, "learning_rate": 7.338308522192642e-05, "loss": 0.0084, "step": 582830 }, { "epoch": 1.51, "learning_rate": 7.337919700555497e-05, "loss": 0.01, "step": 582840 }, { "epoch": 1.51, "learning_rate": 7.33753087891835e-05, "loss": 0.0109, "step": 582850 }, { "epoch": 1.51, "learning_rate": 7.337142057281204e-05, "loss": 0.0096, "step": 582860 }, { "epoch": 1.51, "learning_rate": 7.336753235644056e-05, "loss": 0.0089, "step": 582870 }, { "epoch": 1.51, "learning_rate": 7.33636441400691e-05, "loss": 0.0084, "step": 582880 }, { "epoch": 1.51, "learning_rate": 7.335975592369763e-05, "loss": 0.0099, "step": 582890 }, { "epoch": 1.51, "learning_rate": 7.335586770732618e-05, "loss": 0.0097, "step": 582900 }, { "epoch": 1.51, "learning_rate": 7.33519794909547e-05, "loss": 0.0125, "step": 582910 }, { "epoch": 1.51, "learning_rate": 7.334809127458325e-05, "loss": 0.0141, "step": 582920 }, { "epoch": 1.51, "learning_rate": 7.334420305821177e-05, "loss": 0.0101, "step": 582930 }, { "epoch": 1.51, "learning_rate": 7.334031484184031e-05, "loss": 0.0112, "step": 582940 }, { "epoch": 1.51, "learning_rate": 7.333642662546884e-05, "loss": 0.0087, "step": 582950 }, { "epoch": 1.51, "learning_rate": 7.333253840909738e-05, "loss": 0.0066, "step": 582960 }, { "epoch": 1.51, "learning_rate": 7.332865019272591e-05, "loss": 0.0103, "step": 582970 }, { "epoch": 1.51, "learning_rate": 7.332476197635445e-05, "loss": 0.0082, "step": 582980 }, { "epoch": 1.51, "learning_rate": 7.332087375998298e-05, "loss": 0.0098, "step": 582990 }, { "epoch": 1.51, "learning_rate": 7.331698554361152e-05, "loss": 0.0098, "step": 583000 }, { "epoch": 1.51, "eval_cer": 0.8817138834186412, "eval_loss": 0.006150657311081886, "eval_runtime": 107.9428, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 583000 }, { "epoch": 1.51, "learning_rate": 7.331309732724005e-05, "loss": 0.0065, "step": 583010 }, { "epoch": 1.51, "learning_rate": 7.33092091108686e-05, "loss": 0.008, "step": 583020 }, { "epoch": 1.51, "learning_rate": 7.330532089449714e-05, "loss": 0.0059, "step": 583030 }, { "epoch": 1.51, "learning_rate": 7.330143267812566e-05, "loss": 0.0095, "step": 583040 }, { "epoch": 1.51, "learning_rate": 7.32975444617542e-05, "loss": 0.0068, "step": 583050 }, { "epoch": 1.51, "learning_rate": 7.329365624538273e-05, "loss": 0.0082, "step": 583060 }, { "epoch": 1.51, "learning_rate": 7.328976802901127e-05, "loss": 0.0079, "step": 583070 }, { "epoch": 1.51, "learning_rate": 7.32858798126398e-05, "loss": 0.0099, "step": 583080 }, { "epoch": 1.51, "learning_rate": 7.328199159626834e-05, "loss": 0.007, "step": 583090 }, { "epoch": 1.51, "learning_rate": 7.327810337989689e-05, "loss": 0.0097, "step": 583100 }, { "epoch": 1.51, "learning_rate": 7.327421516352541e-05, "loss": 0.0099, "step": 583110 }, { "epoch": 1.51, "learning_rate": 7.327032694715396e-05, "loss": 0.0077, "step": 583120 }, { "epoch": 1.51, "learning_rate": 7.326643873078248e-05, "loss": 0.0092, "step": 583130 }, { "epoch": 1.51, "learning_rate": 7.326255051441103e-05, "loss": 0.0084, "step": 583140 }, { "epoch": 1.51, "learning_rate": 7.325866229803955e-05, "loss": 0.0085, "step": 583150 }, { "epoch": 1.51, "learning_rate": 7.32547740816681e-05, "loss": 0.0082, "step": 583160 }, { "epoch": 1.51, "learning_rate": 7.325088586529662e-05, "loss": 0.0101, "step": 583170 }, { "epoch": 1.51, "learning_rate": 7.324699764892515e-05, "loss": 0.0075, "step": 583180 }, { "epoch": 1.51, "learning_rate": 7.324310943255369e-05, "loss": 0.0116, "step": 583190 }, { "epoch": 1.51, "learning_rate": 7.323922121618223e-05, "loss": 0.009, "step": 583200 }, { "epoch": 1.51, "learning_rate": 7.323533299981076e-05, "loss": 0.0056, "step": 583210 }, { "epoch": 1.51, "learning_rate": 7.32314447834393e-05, "loss": 0.0114, "step": 583220 }, { "epoch": 1.51, "learning_rate": 7.322755656706783e-05, "loss": 0.0083, "step": 583230 }, { "epoch": 1.51, "learning_rate": 7.322366835069637e-05, "loss": 0.0115, "step": 583240 }, { "epoch": 1.51, "learning_rate": 7.32197801343249e-05, "loss": 0.0096, "step": 583250 }, { "epoch": 1.51, "learning_rate": 7.321589191795344e-05, "loss": 0.008, "step": 583260 }, { "epoch": 1.51, "learning_rate": 7.321200370158197e-05, "loss": 0.0084, "step": 583270 }, { "epoch": 1.51, "learning_rate": 7.320811548521051e-05, "loss": 0.0067, "step": 583280 }, { "epoch": 1.51, "learning_rate": 7.320422726883906e-05, "loss": 0.0091, "step": 583290 }, { "epoch": 1.51, "learning_rate": 7.320033905246758e-05, "loss": 0.008, "step": 583300 }, { "epoch": 1.51, "learning_rate": 7.319645083609613e-05, "loss": 0.0098, "step": 583310 }, { "epoch": 1.51, "learning_rate": 7.319256261972465e-05, "loss": 0.0079, "step": 583320 }, { "epoch": 1.51, "learning_rate": 7.31886744033532e-05, "loss": 0.0084, "step": 583330 }, { "epoch": 1.51, "learning_rate": 7.318478618698172e-05, "loss": 0.008, "step": 583340 }, { "epoch": 1.51, "learning_rate": 7.318089797061026e-05, "loss": 0.0083, "step": 583350 }, { "epoch": 1.51, "learning_rate": 7.31770097542388e-05, "loss": 0.0106, "step": 583360 }, { "epoch": 1.51, "learning_rate": 7.317312153786733e-05, "loss": 0.0087, "step": 583370 }, { "epoch": 1.51, "learning_rate": 7.316923332149588e-05, "loss": 0.0115, "step": 583380 }, { "epoch": 1.51, "learning_rate": 7.31653451051244e-05, "loss": 0.0094, "step": 583390 }, { "epoch": 1.51, "learning_rate": 7.316145688875295e-05, "loss": 0.008, "step": 583400 }, { "epoch": 1.51, "learning_rate": 7.315756867238147e-05, "loss": 0.0083, "step": 583410 }, { "epoch": 1.51, "learning_rate": 7.315368045601002e-05, "loss": 0.0093, "step": 583420 }, { "epoch": 1.51, "learning_rate": 7.314979223963854e-05, "loss": 0.0099, "step": 583430 }, { "epoch": 1.51, "learning_rate": 7.314590402326707e-05, "loss": 0.0085, "step": 583440 }, { "epoch": 1.51, "learning_rate": 7.314201580689561e-05, "loss": 0.007, "step": 583450 }, { "epoch": 1.51, "learning_rate": 7.313812759052415e-05, "loss": 0.0091, "step": 583460 }, { "epoch": 1.51, "learning_rate": 7.313423937415268e-05, "loss": 0.0107, "step": 583470 }, { "epoch": 1.51, "learning_rate": 7.313035115778122e-05, "loss": 0.0088, "step": 583480 }, { "epoch": 1.51, "learning_rate": 7.312646294140975e-05, "loss": 0.0084, "step": 583490 }, { "epoch": 1.51, "learning_rate": 7.31225747250383e-05, "loss": 0.0106, "step": 583500 }, { "epoch": 1.51, "learning_rate": 7.311868650866682e-05, "loss": 0.0073, "step": 583510 }, { "epoch": 1.51, "learning_rate": 7.311479829229536e-05, "loss": 0.0107, "step": 583520 }, { "epoch": 1.51, "learning_rate": 7.311091007592389e-05, "loss": 0.0141, "step": 583530 }, { "epoch": 1.51, "learning_rate": 7.310702185955243e-05, "loss": 0.0075, "step": 583540 }, { "epoch": 1.51, "learning_rate": 7.310313364318098e-05, "loss": 0.0106, "step": 583550 }, { "epoch": 1.51, "learning_rate": 7.30992454268095e-05, "loss": 0.0068, "step": 583560 }, { "epoch": 1.51, "learning_rate": 7.309535721043805e-05, "loss": 0.0123, "step": 583570 }, { "epoch": 1.51, "learning_rate": 7.309146899406657e-05, "loss": 0.0105, "step": 583580 }, { "epoch": 1.51, "learning_rate": 7.308758077769511e-05, "loss": 0.011, "step": 583590 }, { "epoch": 1.51, "learning_rate": 7.308369256132364e-05, "loss": 0.0063, "step": 583600 }, { "epoch": 1.51, "learning_rate": 7.307980434495218e-05, "loss": 0.0071, "step": 583610 }, { "epoch": 1.51, "learning_rate": 7.307591612858071e-05, "loss": 0.0108, "step": 583620 }, { "epoch": 1.51, "learning_rate": 7.307202791220925e-05, "loss": 0.0079, "step": 583630 }, { "epoch": 1.51, "learning_rate": 7.30681396958378e-05, "loss": 0.0087, "step": 583640 }, { "epoch": 1.51, "learning_rate": 7.306425147946632e-05, "loss": 0.0081, "step": 583650 }, { "epoch": 1.51, "learning_rate": 7.306036326309487e-05, "loss": 0.0069, "step": 583660 }, { "epoch": 1.51, "learning_rate": 7.30564750467234e-05, "loss": 0.0091, "step": 583670 }, { "epoch": 1.51, "learning_rate": 7.305258683035192e-05, "loss": 0.0091, "step": 583680 }, { "epoch": 1.51, "learning_rate": 7.304869861398046e-05, "loss": 0.0055, "step": 583690 }, { "epoch": 1.51, "learning_rate": 7.304481039760899e-05, "loss": 0.0112, "step": 583700 }, { "epoch": 1.51, "learning_rate": 7.304092218123753e-05, "loss": 0.0117, "step": 583710 }, { "epoch": 1.51, "learning_rate": 7.303703396486606e-05, "loss": 0.0099, "step": 583720 }, { "epoch": 1.51, "learning_rate": 7.30331457484946e-05, "loss": 0.0086, "step": 583730 }, { "epoch": 1.51, "learning_rate": 7.302925753212314e-05, "loss": 0.0101, "step": 583740 }, { "epoch": 1.51, "learning_rate": 7.302536931575167e-05, "loss": 0.0081, "step": 583750 }, { "epoch": 1.51, "learning_rate": 7.302148109938021e-05, "loss": 0.009, "step": 583760 }, { "epoch": 1.51, "learning_rate": 7.301759288300874e-05, "loss": 0.0091, "step": 583770 }, { "epoch": 1.51, "learning_rate": 7.301370466663728e-05, "loss": 0.0079, "step": 583780 }, { "epoch": 1.51, "learning_rate": 7.300981645026581e-05, "loss": 0.013, "step": 583790 }, { "epoch": 1.51, "learning_rate": 7.300592823389435e-05, "loss": 0.0082, "step": 583800 }, { "epoch": 1.51, "learning_rate": 7.30020400175229e-05, "loss": 0.0085, "step": 583810 }, { "epoch": 1.51, "learning_rate": 7.299815180115142e-05, "loss": 0.0085, "step": 583820 }, { "epoch": 1.51, "learning_rate": 7.299426358477996e-05, "loss": 0.0095, "step": 583830 }, { "epoch": 1.51, "learning_rate": 7.299037536840849e-05, "loss": 0.0101, "step": 583840 }, { "epoch": 1.51, "learning_rate": 7.298648715203703e-05, "loss": 0.0078, "step": 583850 }, { "epoch": 1.51, "learning_rate": 7.298259893566556e-05, "loss": 0.0068, "step": 583860 }, { "epoch": 1.51, "learning_rate": 7.29787107192941e-05, "loss": 0.0076, "step": 583870 }, { "epoch": 1.51, "learning_rate": 7.297482250292263e-05, "loss": 0.0088, "step": 583880 }, { "epoch": 1.51, "learning_rate": 7.297093428655117e-05, "loss": 0.0085, "step": 583890 }, { "epoch": 1.51, "learning_rate": 7.296704607017972e-05, "loss": 0.0099, "step": 583900 }, { "epoch": 1.51, "learning_rate": 7.296315785380824e-05, "loss": 0.008, "step": 583910 }, { "epoch": 1.51, "learning_rate": 7.295926963743677e-05, "loss": 0.0084, "step": 583920 }, { "epoch": 1.51, "learning_rate": 7.295538142106531e-05, "loss": 0.0087, "step": 583930 }, { "epoch": 1.51, "learning_rate": 7.295149320469384e-05, "loss": 0.0108, "step": 583940 }, { "epoch": 1.51, "learning_rate": 7.294760498832238e-05, "loss": 0.0093, "step": 583950 }, { "epoch": 1.51, "learning_rate": 7.294371677195091e-05, "loss": 0.0062, "step": 583960 }, { "epoch": 1.51, "learning_rate": 7.293982855557945e-05, "loss": 0.0097, "step": 583970 }, { "epoch": 1.51, "learning_rate": 7.293594033920798e-05, "loss": 0.0104, "step": 583980 }, { "epoch": 1.51, "learning_rate": 7.293205212283652e-05, "loss": 0.0079, "step": 583990 }, { "epoch": 1.51, "learning_rate": 7.292816390646506e-05, "loss": 0.0078, "step": 584000 }, { "epoch": 1.51, "eval_cer": 0.8816970877754311, "eval_loss": 0.005978405941277742, "eval_runtime": 107.7544, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 584000 }, { "epoch": 1.51, "learning_rate": 7.292427569009359e-05, "loss": 0.0067, "step": 584010 }, { "epoch": 1.51, "learning_rate": 7.292038747372213e-05, "loss": 0.0088, "step": 584020 }, { "epoch": 1.51, "learning_rate": 7.291649925735066e-05, "loss": 0.0101, "step": 584030 }, { "epoch": 1.51, "learning_rate": 7.29126110409792e-05, "loss": 0.0079, "step": 584040 }, { "epoch": 1.51, "learning_rate": 7.290872282460773e-05, "loss": 0.006, "step": 584050 }, { "epoch": 1.51, "learning_rate": 7.290483460823627e-05, "loss": 0.0091, "step": 584060 }, { "epoch": 1.51, "learning_rate": 7.290094639186482e-05, "loss": 0.0114, "step": 584070 }, { "epoch": 1.51, "learning_rate": 7.289705817549334e-05, "loss": 0.0074, "step": 584080 }, { "epoch": 1.51, "learning_rate": 7.289316995912188e-05, "loss": 0.0103, "step": 584090 }, { "epoch": 1.51, "learning_rate": 7.288928174275041e-05, "loss": 0.0088, "step": 584100 }, { "epoch": 1.51, "learning_rate": 7.288539352637895e-05, "loss": 0.0098, "step": 584110 }, { "epoch": 1.51, "learning_rate": 7.288150531000748e-05, "loss": 0.0108, "step": 584120 }, { "epoch": 1.51, "learning_rate": 7.287761709363602e-05, "loss": 0.0087, "step": 584130 }, { "epoch": 1.51, "learning_rate": 7.287372887726455e-05, "loss": 0.0097, "step": 584140 }, { "epoch": 1.51, "learning_rate": 7.28698406608931e-05, "loss": 0.0136, "step": 584150 }, { "epoch": 1.51, "learning_rate": 7.286595244452164e-05, "loss": 0.0118, "step": 584160 }, { "epoch": 1.51, "learning_rate": 7.286206422815016e-05, "loss": 0.0105, "step": 584170 }, { "epoch": 1.51, "learning_rate": 7.285817601177869e-05, "loss": 0.0099, "step": 584180 }, { "epoch": 1.51, "learning_rate": 7.285428779540723e-05, "loss": 0.0084, "step": 584190 }, { "epoch": 1.51, "learning_rate": 7.285039957903576e-05, "loss": 0.0097, "step": 584200 }, { "epoch": 1.51, "learning_rate": 7.28465113626643e-05, "loss": 0.0071, "step": 584210 }, { "epoch": 1.51, "learning_rate": 7.284262314629283e-05, "loss": 0.009, "step": 584220 }, { "epoch": 1.51, "learning_rate": 7.283873492992137e-05, "loss": 0.0107, "step": 584230 }, { "epoch": 1.51, "learning_rate": 7.28348467135499e-05, "loss": 0.0072, "step": 584240 }, { "epoch": 1.51, "learning_rate": 7.283095849717844e-05, "loss": 0.0063, "step": 584250 }, { "epoch": 1.51, "learning_rate": 7.282707028080698e-05, "loss": 0.0077, "step": 584260 }, { "epoch": 1.51, "learning_rate": 7.282318206443551e-05, "loss": 0.0104, "step": 584270 }, { "epoch": 1.51, "learning_rate": 7.281929384806405e-05, "loss": 0.0063, "step": 584280 }, { "epoch": 1.51, "learning_rate": 7.281540563169258e-05, "loss": 0.0085, "step": 584290 }, { "epoch": 1.51, "learning_rate": 7.281151741532112e-05, "loss": 0.0079, "step": 584300 }, { "epoch": 1.51, "learning_rate": 7.280762919894965e-05, "loss": 0.0105, "step": 584310 }, { "epoch": 1.51, "learning_rate": 7.28037409825782e-05, "loss": 0.0098, "step": 584320 }, { "epoch": 1.51, "learning_rate": 7.279985276620674e-05, "loss": 0.0069, "step": 584330 }, { "epoch": 1.51, "learning_rate": 7.279596454983526e-05, "loss": 0.0097, "step": 584340 }, { "epoch": 1.51, "learning_rate": 7.27920763334638e-05, "loss": 0.0106, "step": 584350 }, { "epoch": 1.51, "learning_rate": 7.278818811709233e-05, "loss": 0.011, "step": 584360 }, { "epoch": 1.51, "learning_rate": 7.278429990072087e-05, "loss": 0.0084, "step": 584370 }, { "epoch": 1.51, "learning_rate": 7.27804116843494e-05, "loss": 0.0147, "step": 584380 }, { "epoch": 1.51, "learning_rate": 7.277652346797794e-05, "loss": 0.0115, "step": 584390 }, { "epoch": 1.51, "learning_rate": 7.277263525160647e-05, "loss": 0.0066, "step": 584400 }, { "epoch": 1.51, "learning_rate": 7.276874703523501e-05, "loss": 0.0099, "step": 584410 }, { "epoch": 1.51, "learning_rate": 7.276485881886354e-05, "loss": 0.0098, "step": 584420 }, { "epoch": 1.51, "learning_rate": 7.276097060249208e-05, "loss": 0.0096, "step": 584430 }, { "epoch": 1.51, "learning_rate": 7.275708238612061e-05, "loss": 0.0122, "step": 584440 }, { "epoch": 1.51, "learning_rate": 7.275319416974915e-05, "loss": 0.0071, "step": 584450 }, { "epoch": 1.52, "learning_rate": 7.274930595337768e-05, "loss": 0.0097, "step": 584460 }, { "epoch": 1.52, "learning_rate": 7.274541773700622e-05, "loss": 0.0084, "step": 584470 }, { "epoch": 1.52, "learning_rate": 7.274152952063475e-05, "loss": 0.007, "step": 584480 }, { "epoch": 1.52, "learning_rate": 7.273764130426329e-05, "loss": 0.0108, "step": 584490 }, { "epoch": 1.52, "learning_rate": 7.273375308789182e-05, "loss": 0.0087, "step": 584500 }, { "epoch": 1.52, "learning_rate": 7.272986487152036e-05, "loss": 0.0084, "step": 584510 }, { "epoch": 1.52, "learning_rate": 7.27259766551489e-05, "loss": 0.0094, "step": 584520 }, { "epoch": 1.52, "learning_rate": 7.272208843877743e-05, "loss": 0.0076, "step": 584530 }, { "epoch": 1.52, "learning_rate": 7.271820022240597e-05, "loss": 0.0103, "step": 584540 }, { "epoch": 1.52, "learning_rate": 7.27143120060345e-05, "loss": 0.0062, "step": 584550 }, { "epoch": 1.52, "learning_rate": 7.271042378966304e-05, "loss": 0.0115, "step": 584560 }, { "epoch": 1.52, "learning_rate": 7.270653557329157e-05, "loss": 0.0091, "step": 584570 }, { "epoch": 1.52, "learning_rate": 7.270264735692011e-05, "loss": 0.008, "step": 584580 }, { "epoch": 1.52, "learning_rate": 7.269875914054866e-05, "loss": 0.008, "step": 584590 }, { "epoch": 1.52, "learning_rate": 7.269487092417718e-05, "loss": 0.0107, "step": 584600 }, { "epoch": 1.52, "learning_rate": 7.269098270780572e-05, "loss": 0.0069, "step": 584610 }, { "epoch": 1.52, "learning_rate": 7.268709449143425e-05, "loss": 0.008, "step": 584620 }, { "epoch": 1.52, "learning_rate": 7.26832062750628e-05, "loss": 0.0088, "step": 584630 }, { "epoch": 1.52, "learning_rate": 7.267931805869132e-05, "loss": 0.0081, "step": 584640 }, { "epoch": 1.52, "learning_rate": 7.267542984231986e-05, "loss": 0.0096, "step": 584650 }, { "epoch": 1.52, "learning_rate": 7.267154162594839e-05, "loss": 0.0083, "step": 584660 }, { "epoch": 1.52, "learning_rate": 7.266765340957692e-05, "loss": 0.0074, "step": 584670 }, { "epoch": 1.52, "learning_rate": 7.266376519320546e-05, "loss": 0.0108, "step": 584680 }, { "epoch": 1.52, "learning_rate": 7.2659876976834e-05, "loss": 0.0108, "step": 584690 }, { "epoch": 1.52, "learning_rate": 7.265598876046253e-05, "loss": 0.008, "step": 584700 }, { "epoch": 1.52, "learning_rate": 7.265210054409107e-05, "loss": 0.0072, "step": 584710 }, { "epoch": 1.52, "learning_rate": 7.26482123277196e-05, "loss": 0.0087, "step": 584720 }, { "epoch": 1.52, "learning_rate": 7.264432411134814e-05, "loss": 0.009, "step": 584730 }, { "epoch": 1.52, "learning_rate": 7.264043589497667e-05, "loss": 0.0101, "step": 584740 }, { "epoch": 1.52, "learning_rate": 7.263654767860521e-05, "loss": 0.0107, "step": 584750 }, { "epoch": 1.52, "learning_rate": 7.263265946223374e-05, "loss": 0.0085, "step": 584760 }, { "epoch": 1.52, "learning_rate": 7.262877124586228e-05, "loss": 0.0083, "step": 584770 }, { "epoch": 1.52, "learning_rate": 7.262488302949082e-05, "loss": 0.0076, "step": 584780 }, { "epoch": 1.52, "learning_rate": 7.262099481311935e-05, "loss": 0.0098, "step": 584790 }, { "epoch": 1.52, "learning_rate": 7.26171065967479e-05, "loss": 0.01, "step": 584800 }, { "epoch": 1.52, "learning_rate": 7.261321838037642e-05, "loss": 0.0114, "step": 584810 }, { "epoch": 1.52, "learning_rate": 7.260933016400496e-05, "loss": 0.0107, "step": 584820 }, { "epoch": 1.52, "learning_rate": 7.260544194763349e-05, "loss": 0.0069, "step": 584830 }, { "epoch": 1.52, "learning_rate": 7.260155373126203e-05, "loss": 0.0089, "step": 584840 }, { "epoch": 1.52, "learning_rate": 7.259766551489058e-05, "loss": 0.0081, "step": 584850 }, { "epoch": 1.52, "learning_rate": 7.25937772985191e-05, "loss": 0.0084, "step": 584860 }, { "epoch": 1.52, "learning_rate": 7.258988908214764e-05, "loss": 0.0066, "step": 584870 }, { "epoch": 1.52, "learning_rate": 7.258600086577617e-05, "loss": 0.0095, "step": 584880 }, { "epoch": 1.52, "learning_rate": 7.258211264940471e-05, "loss": 0.0082, "step": 584890 }, { "epoch": 1.52, "learning_rate": 7.257822443303324e-05, "loss": 0.0075, "step": 584900 }, { "epoch": 1.52, "learning_rate": 7.257433621666178e-05, "loss": 0.0085, "step": 584910 }, { "epoch": 1.52, "learning_rate": 7.257044800029031e-05, "loss": 0.0103, "step": 584920 }, { "epoch": 1.52, "learning_rate": 7.256655978391884e-05, "loss": 0.0093, "step": 584930 }, { "epoch": 1.52, "learning_rate": 7.256267156754738e-05, "loss": 0.0077, "step": 584940 }, { "epoch": 1.52, "learning_rate": 7.255878335117592e-05, "loss": 0.0093, "step": 584950 }, { "epoch": 1.52, "learning_rate": 7.255489513480445e-05, "loss": 0.0099, "step": 584960 }, { "epoch": 1.52, "learning_rate": 7.2551006918433e-05, "loss": 0.0077, "step": 584970 }, { "epoch": 1.52, "learning_rate": 7.254711870206152e-05, "loss": 0.0113, "step": 584980 }, { "epoch": 1.52, "learning_rate": 7.254323048569006e-05, "loss": 0.0101, "step": 584990 }, { "epoch": 1.52, "learning_rate": 7.253934226931859e-05, "loss": 0.0061, "step": 585000 }, { "epoch": 1.52, "eval_cer": 0.8816746935844841, "eval_loss": 0.005952306557446718, "eval_runtime": 107.7504, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 585000 }, { "epoch": 1.52, "learning_rate": 7.253545405294713e-05, "loss": 0.0096, "step": 585010 }, { "epoch": 1.52, "learning_rate": 7.253156583657566e-05, "loss": 0.0086, "step": 585020 }, { "epoch": 1.52, "learning_rate": 7.25276776202042e-05, "loss": 0.0089, "step": 585030 }, { "epoch": 1.52, "learning_rate": 7.252378940383274e-05, "loss": 0.0108, "step": 585040 }, { "epoch": 1.52, "learning_rate": 7.251990118746127e-05, "loss": 0.0072, "step": 585050 }, { "epoch": 1.52, "learning_rate": 7.251601297108981e-05, "loss": 0.0099, "step": 585060 }, { "epoch": 1.52, "learning_rate": 7.251212475471834e-05, "loss": 0.0077, "step": 585070 }, { "epoch": 1.52, "learning_rate": 7.250823653834688e-05, "loss": 0.0095, "step": 585080 }, { "epoch": 1.52, "learning_rate": 7.250434832197541e-05, "loss": 0.0149, "step": 585090 }, { "epoch": 1.52, "learning_rate": 7.250046010560395e-05, "loss": 0.0096, "step": 585100 }, { "epoch": 1.52, "learning_rate": 7.249657188923248e-05, "loss": 0.0089, "step": 585110 }, { "epoch": 1.52, "learning_rate": 7.249268367286102e-05, "loss": 0.0077, "step": 585120 }, { "epoch": 1.52, "learning_rate": 7.248879545648956e-05, "loss": 0.0105, "step": 585130 }, { "epoch": 1.52, "learning_rate": 7.248490724011809e-05, "loss": 0.0066, "step": 585140 }, { "epoch": 1.52, "learning_rate": 7.248101902374663e-05, "loss": 0.0102, "step": 585150 }, { "epoch": 1.52, "learning_rate": 7.247713080737516e-05, "loss": 0.0099, "step": 585160 }, { "epoch": 1.52, "learning_rate": 7.247324259100369e-05, "loss": 0.0085, "step": 585170 }, { "epoch": 1.52, "learning_rate": 7.246935437463223e-05, "loss": 0.0082, "step": 585180 }, { "epoch": 1.52, "learning_rate": 7.246546615826076e-05, "loss": 0.0094, "step": 585190 }, { "epoch": 1.52, "learning_rate": 7.24615779418893e-05, "loss": 0.0105, "step": 585200 }, { "epoch": 1.52, "learning_rate": 7.245768972551783e-05, "loss": 0.0089, "step": 585210 }, { "epoch": 1.52, "learning_rate": 7.245380150914637e-05, "loss": 0.0086, "step": 585220 }, { "epoch": 1.52, "learning_rate": 7.244991329277491e-05, "loss": 0.0088, "step": 585230 }, { "epoch": 1.52, "learning_rate": 7.244602507640344e-05, "loss": 0.0082, "step": 585240 }, { "epoch": 1.52, "learning_rate": 7.244213686003198e-05, "loss": 0.0081, "step": 585250 }, { "epoch": 1.52, "learning_rate": 7.243824864366051e-05, "loss": 0.0092, "step": 585260 }, { "epoch": 1.52, "learning_rate": 7.243436042728905e-05, "loss": 0.0097, "step": 585270 }, { "epoch": 1.52, "learning_rate": 7.243047221091758e-05, "loss": 0.0089, "step": 585280 }, { "epoch": 1.52, "learning_rate": 7.242658399454612e-05, "loss": 0.0067, "step": 585290 }, { "epoch": 1.52, "learning_rate": 7.242269577817466e-05, "loss": 0.0098, "step": 585300 }, { "epoch": 1.52, "learning_rate": 7.241880756180319e-05, "loss": 0.0077, "step": 585310 }, { "epoch": 1.52, "learning_rate": 7.241491934543173e-05, "loss": 0.0077, "step": 585320 }, { "epoch": 1.52, "learning_rate": 7.241103112906026e-05, "loss": 0.0072, "step": 585330 }, { "epoch": 1.52, "learning_rate": 7.24071429126888e-05, "loss": 0.0103, "step": 585340 }, { "epoch": 1.52, "learning_rate": 7.240325469631733e-05, "loss": 0.0079, "step": 585350 }, { "epoch": 1.52, "learning_rate": 7.239936647994587e-05, "loss": 0.0108, "step": 585360 }, { "epoch": 1.52, "learning_rate": 7.23954782635744e-05, "loss": 0.0086, "step": 585370 }, { "epoch": 1.52, "learning_rate": 7.239159004720294e-05, "loss": 0.0102, "step": 585380 }, { "epoch": 1.52, "learning_rate": 7.238770183083148e-05, "loss": 0.0098, "step": 585390 }, { "epoch": 1.52, "learning_rate": 7.238381361446001e-05, "loss": 0.0084, "step": 585400 }, { "epoch": 1.52, "learning_rate": 7.237992539808854e-05, "loss": 0.0104, "step": 585410 }, { "epoch": 1.52, "learning_rate": 7.237603718171708e-05, "loss": 0.0109, "step": 585420 }, { "epoch": 1.52, "learning_rate": 7.237214896534561e-05, "loss": 0.0096, "step": 585430 }, { "epoch": 1.52, "learning_rate": 7.236826074897415e-05, "loss": 0.009, "step": 585440 }, { "epoch": 1.52, "learning_rate": 7.236437253260268e-05, "loss": 0.0111, "step": 585450 }, { "epoch": 1.52, "learning_rate": 7.236048431623122e-05, "loss": 0.0096, "step": 585460 }, { "epoch": 1.52, "learning_rate": 7.235659609985975e-05, "loss": 0.0097, "step": 585470 }, { "epoch": 1.52, "learning_rate": 7.235270788348829e-05, "loss": 0.0084, "step": 585480 }, { "epoch": 1.52, "learning_rate": 7.234881966711683e-05, "loss": 0.0084, "step": 585490 }, { "epoch": 1.52, "learning_rate": 7.234493145074536e-05, "loss": 0.0095, "step": 585500 }, { "epoch": 1.52, "learning_rate": 7.23410432343739e-05, "loss": 0.0088, "step": 585510 }, { "epoch": 1.52, "learning_rate": 7.233715501800243e-05, "loss": 0.0137, "step": 585520 }, { "epoch": 1.52, "learning_rate": 7.233326680163097e-05, "loss": 0.0078, "step": 585530 }, { "epoch": 1.52, "learning_rate": 7.23293785852595e-05, "loss": 0.0075, "step": 585540 }, { "epoch": 1.52, "learning_rate": 7.232549036888804e-05, "loss": 0.0079, "step": 585550 }, { "epoch": 1.52, "learning_rate": 7.232160215251658e-05, "loss": 0.0106, "step": 585560 }, { "epoch": 1.52, "learning_rate": 7.231771393614511e-05, "loss": 0.0071, "step": 585570 }, { "epoch": 1.52, "learning_rate": 7.231382571977365e-05, "loss": 0.0087, "step": 585580 }, { "epoch": 1.52, "learning_rate": 7.230993750340218e-05, "loss": 0.0087, "step": 585590 }, { "epoch": 1.52, "learning_rate": 7.230604928703072e-05, "loss": 0.0079, "step": 585600 }, { "epoch": 1.52, "learning_rate": 7.230216107065925e-05, "loss": 0.0116, "step": 585610 }, { "epoch": 1.52, "learning_rate": 7.22982728542878e-05, "loss": 0.0077, "step": 585620 }, { "epoch": 1.52, "learning_rate": 7.229438463791632e-05, "loss": 0.0097, "step": 585630 }, { "epoch": 1.52, "learning_rate": 7.229049642154486e-05, "loss": 0.011, "step": 585640 }, { "epoch": 1.52, "learning_rate": 7.22866082051734e-05, "loss": 0.0067, "step": 585650 }, { "epoch": 1.52, "learning_rate": 7.228271998880193e-05, "loss": 0.0138, "step": 585660 }, { "epoch": 1.52, "learning_rate": 7.227883177243046e-05, "loss": 0.0072, "step": 585670 }, { "epoch": 1.52, "learning_rate": 7.2274943556059e-05, "loss": 0.0081, "step": 585680 }, { "epoch": 1.52, "learning_rate": 7.227105533968753e-05, "loss": 0.01, "step": 585690 }, { "epoch": 1.52, "learning_rate": 7.226716712331607e-05, "loss": 0.0085, "step": 585700 }, { "epoch": 1.52, "learning_rate": 7.22632789069446e-05, "loss": 0.0078, "step": 585710 }, { "epoch": 1.52, "learning_rate": 7.225939069057314e-05, "loss": 0.0088, "step": 585720 }, { "epoch": 1.52, "learning_rate": 7.225550247420167e-05, "loss": 0.0093, "step": 585730 }, { "epoch": 1.52, "learning_rate": 7.225161425783021e-05, "loss": 0.0094, "step": 585740 }, { "epoch": 1.52, "learning_rate": 7.224772604145875e-05, "loss": 0.0071, "step": 585750 }, { "epoch": 1.52, "learning_rate": 7.224383782508728e-05, "loss": 0.0073, "step": 585760 }, { "epoch": 1.52, "learning_rate": 7.223994960871582e-05, "loss": 0.0066, "step": 585770 }, { "epoch": 1.52, "learning_rate": 7.223606139234435e-05, "loss": 0.0104, "step": 585780 }, { "epoch": 1.52, "learning_rate": 7.223217317597289e-05, "loss": 0.0094, "step": 585790 }, { "epoch": 1.52, "learning_rate": 7.222828495960142e-05, "loss": 0.0119, "step": 585800 }, { "epoch": 1.52, "learning_rate": 7.222439674322996e-05, "loss": 0.0117, "step": 585810 }, { "epoch": 1.52, "learning_rate": 7.22205085268585e-05, "loss": 0.0064, "step": 585820 }, { "epoch": 1.52, "learning_rate": 7.221662031048703e-05, "loss": 0.0093, "step": 585830 }, { "epoch": 1.52, "learning_rate": 7.221273209411557e-05, "loss": 0.0088, "step": 585840 }, { "epoch": 1.52, "learning_rate": 7.22088438777441e-05, "loss": 0.0079, "step": 585850 }, { "epoch": 1.52, "learning_rate": 7.220495566137264e-05, "loss": 0.0099, "step": 585860 }, { "epoch": 1.52, "learning_rate": 7.220106744500117e-05, "loss": 0.013, "step": 585870 }, { "epoch": 1.52, "learning_rate": 7.219717922862971e-05, "loss": 0.0079, "step": 585880 }, { "epoch": 1.52, "learning_rate": 7.219329101225824e-05, "loss": 0.0071, "step": 585890 }, { "epoch": 1.52, "learning_rate": 7.218940279588678e-05, "loss": 0.0066, "step": 585900 }, { "epoch": 1.52, "learning_rate": 7.218551457951531e-05, "loss": 0.0099, "step": 585910 }, { "epoch": 1.52, "learning_rate": 7.218162636314385e-05, "loss": 0.0086, "step": 585920 }, { "epoch": 1.52, "learning_rate": 7.217773814677238e-05, "loss": 0.0111, "step": 585930 }, { "epoch": 1.52, "learning_rate": 7.217384993040092e-05, "loss": 0.0096, "step": 585940 }, { "epoch": 1.52, "learning_rate": 7.216996171402945e-05, "loss": 0.0075, "step": 585950 }, { "epoch": 1.52, "learning_rate": 7.216607349765799e-05, "loss": 0.0094, "step": 585960 }, { "epoch": 1.52, "learning_rate": 7.216218528128652e-05, "loss": 0.0109, "step": 585970 }, { "epoch": 1.52, "learning_rate": 7.215829706491506e-05, "loss": 0.0094, "step": 585980 }, { "epoch": 1.52, "learning_rate": 7.215440884854359e-05, "loss": 0.0109, "step": 585990 }, { "epoch": 1.52, "learning_rate": 7.215052063217213e-05, "loss": 0.0127, "step": 586000 }, { "epoch": 1.52, "eval_cer": 0.8816900895907601, "eval_loss": 0.00595942372456193, "eval_runtime": 107.8725, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 586000 }, { "epoch": 1.52, "learning_rate": 7.214663241580067e-05, "loss": 0.012, "step": 586010 }, { "epoch": 1.52, "learning_rate": 7.21427441994292e-05, "loss": 0.0105, "step": 586020 }, { "epoch": 1.52, "learning_rate": 7.213885598305774e-05, "loss": 0.0072, "step": 586030 }, { "epoch": 1.52, "learning_rate": 7.213496776668627e-05, "loss": 0.0095, "step": 586040 }, { "epoch": 1.52, "learning_rate": 7.213107955031481e-05, "loss": 0.0085, "step": 586050 }, { "epoch": 1.52, "learning_rate": 7.212719133394334e-05, "loss": 0.0105, "step": 586060 }, { "epoch": 1.52, "learning_rate": 7.212330311757188e-05, "loss": 0.0073, "step": 586070 }, { "epoch": 1.52, "learning_rate": 7.211941490120042e-05, "loss": 0.0124, "step": 586080 }, { "epoch": 1.52, "learning_rate": 7.211552668482895e-05, "loss": 0.0099, "step": 586090 }, { "epoch": 1.52, "learning_rate": 7.21116384684575e-05, "loss": 0.01, "step": 586100 }, { "epoch": 1.52, "learning_rate": 7.210775025208602e-05, "loss": 0.0098, "step": 586110 }, { "epoch": 1.52, "learning_rate": 7.210386203571456e-05, "loss": 0.0087, "step": 586120 }, { "epoch": 1.52, "learning_rate": 7.209997381934309e-05, "loss": 0.0084, "step": 586130 }, { "epoch": 1.52, "learning_rate": 7.209608560297163e-05, "loss": 0.009, "step": 586140 }, { "epoch": 1.52, "learning_rate": 7.209219738660016e-05, "loss": 0.0082, "step": 586150 }, { "epoch": 1.52, "learning_rate": 7.208830917022869e-05, "loss": 0.0079, "step": 586160 }, { "epoch": 1.52, "learning_rate": 7.208442095385723e-05, "loss": 0.0081, "step": 586170 }, { "epoch": 1.52, "learning_rate": 7.208053273748577e-05, "loss": 0.0109, "step": 586180 }, { "epoch": 1.52, "learning_rate": 7.20766445211143e-05, "loss": 0.0092, "step": 586190 }, { "epoch": 1.52, "learning_rate": 7.207275630474284e-05, "loss": 0.0087, "step": 586200 }, { "epoch": 1.52, "learning_rate": 7.206886808837137e-05, "loss": 0.0111, "step": 586210 }, { "epoch": 1.52, "learning_rate": 7.206497987199991e-05, "loss": 0.008, "step": 586220 }, { "epoch": 1.52, "learning_rate": 7.206109165562844e-05, "loss": 0.0098, "step": 586230 }, { "epoch": 1.52, "learning_rate": 7.205720343925698e-05, "loss": 0.0104, "step": 586240 }, { "epoch": 1.52, "learning_rate": 7.205331522288551e-05, "loss": 0.0077, "step": 586250 }, { "epoch": 1.52, "learning_rate": 7.204942700651405e-05, "loss": 0.007, "step": 586260 }, { "epoch": 1.52, "learning_rate": 7.204553879014259e-05, "loss": 0.0084, "step": 586270 }, { "epoch": 1.52, "learning_rate": 7.204165057377112e-05, "loss": 0.0119, "step": 586280 }, { "epoch": 1.52, "learning_rate": 7.203776235739966e-05, "loss": 0.0086, "step": 586290 }, { "epoch": 1.52, "learning_rate": 7.203387414102819e-05, "loss": 0.0082, "step": 586300 }, { "epoch": 1.52, "learning_rate": 7.202998592465673e-05, "loss": 0.0094, "step": 586310 }, { "epoch": 1.52, "learning_rate": 7.202609770828526e-05, "loss": 0.0083, "step": 586320 }, { "epoch": 1.52, "learning_rate": 7.20222094919138e-05, "loss": 0.0079, "step": 586330 }, { "epoch": 1.52, "learning_rate": 7.201832127554234e-05, "loss": 0.009, "step": 586340 }, { "epoch": 1.52, "learning_rate": 7.201443305917087e-05, "loss": 0.0097, "step": 586350 }, { "epoch": 1.52, "learning_rate": 7.201054484279941e-05, "loss": 0.011, "step": 586360 }, { "epoch": 1.52, "learning_rate": 7.200665662642794e-05, "loss": 0.0077, "step": 586370 }, { "epoch": 1.52, "learning_rate": 7.200276841005648e-05, "loss": 0.011, "step": 586380 }, { "epoch": 1.52, "learning_rate": 7.199888019368501e-05, "loss": 0.0123, "step": 586390 }, { "epoch": 1.52, "learning_rate": 7.199499197731355e-05, "loss": 0.0103, "step": 586400 }, { "epoch": 1.52, "learning_rate": 7.199110376094208e-05, "loss": 0.0101, "step": 586410 }, { "epoch": 1.52, "learning_rate": 7.198721554457061e-05, "loss": 0.0076, "step": 586420 }, { "epoch": 1.52, "learning_rate": 7.198332732819915e-05, "loss": 0.0074, "step": 586430 }, { "epoch": 1.52, "learning_rate": 7.197943911182769e-05, "loss": 0.0091, "step": 586440 }, { "epoch": 1.52, "learning_rate": 7.197555089545622e-05, "loss": 0.0105, "step": 586450 }, { "epoch": 1.52, "learning_rate": 7.197166267908476e-05, "loss": 0.0084, "step": 586460 }, { "epoch": 1.52, "learning_rate": 7.196777446271329e-05, "loss": 0.011, "step": 586470 }, { "epoch": 1.52, "learning_rate": 7.196388624634183e-05, "loss": 0.0094, "step": 586480 }, { "epoch": 1.52, "learning_rate": 7.195999802997036e-05, "loss": 0.0099, "step": 586490 }, { "epoch": 1.52, "learning_rate": 7.19561098135989e-05, "loss": 0.0069, "step": 586500 }, { "epoch": 1.52, "learning_rate": 7.195222159722743e-05, "loss": 0.0051, "step": 586510 }, { "epoch": 1.52, "learning_rate": 7.194833338085597e-05, "loss": 0.0112, "step": 586520 }, { "epoch": 1.52, "learning_rate": 7.194444516448451e-05, "loss": 0.0072, "step": 586530 }, { "epoch": 1.52, "learning_rate": 7.194055694811304e-05, "loss": 0.0081, "step": 586540 }, { "epoch": 1.52, "learning_rate": 7.193666873174158e-05, "loss": 0.009, "step": 586550 }, { "epoch": 1.52, "learning_rate": 7.193278051537011e-05, "loss": 0.0067, "step": 586560 }, { "epoch": 1.52, "learning_rate": 7.192889229899865e-05, "loss": 0.0102, "step": 586570 }, { "epoch": 1.52, "learning_rate": 7.192500408262718e-05, "loss": 0.0101, "step": 586580 }, { "epoch": 1.52, "learning_rate": 7.192111586625572e-05, "loss": 0.0109, "step": 586590 }, { "epoch": 1.52, "learning_rate": 7.191722764988425e-05, "loss": 0.0105, "step": 586600 }, { "epoch": 1.52, "learning_rate": 7.191333943351279e-05, "loss": 0.008, "step": 586610 }, { "epoch": 1.52, "learning_rate": 7.190945121714133e-05, "loss": 0.0091, "step": 586620 }, { "epoch": 1.52, "learning_rate": 7.190556300076986e-05, "loss": 0.0071, "step": 586630 }, { "epoch": 1.52, "learning_rate": 7.19016747843984e-05, "loss": 0.0107, "step": 586640 }, { "epoch": 1.52, "learning_rate": 7.189778656802693e-05, "loss": 0.0094, "step": 586650 }, { "epoch": 1.52, "learning_rate": 7.189389835165546e-05, "loss": 0.0085, "step": 586660 }, { "epoch": 1.52, "learning_rate": 7.1890010135284e-05, "loss": 0.0076, "step": 586670 }, { "epoch": 1.52, "learning_rate": 7.188612191891253e-05, "loss": 0.0056, "step": 586680 }, { "epoch": 1.52, "learning_rate": 7.188223370254107e-05, "loss": 0.0087, "step": 586690 }, { "epoch": 1.52, "learning_rate": 7.18783454861696e-05, "loss": 0.0075, "step": 586700 }, { "epoch": 1.52, "learning_rate": 7.187445726979814e-05, "loss": 0.0092, "step": 586710 }, { "epoch": 1.52, "learning_rate": 7.187056905342668e-05, "loss": 0.0088, "step": 586720 }, { "epoch": 1.52, "learning_rate": 7.186668083705521e-05, "loss": 0.0088, "step": 586730 }, { "epoch": 1.52, "learning_rate": 7.186279262068375e-05, "loss": 0.0113, "step": 586740 }, { "epoch": 1.52, "learning_rate": 7.185890440431228e-05, "loss": 0.0084, "step": 586750 }, { "epoch": 1.52, "learning_rate": 7.185501618794082e-05, "loss": 0.0093, "step": 586760 }, { "epoch": 1.52, "learning_rate": 7.185112797156935e-05, "loss": 0.0122, "step": 586770 }, { "epoch": 1.52, "learning_rate": 7.184723975519789e-05, "loss": 0.0075, "step": 586780 }, { "epoch": 1.52, "learning_rate": 7.184335153882643e-05, "loss": 0.0109, "step": 586790 }, { "epoch": 1.52, "learning_rate": 7.183946332245496e-05, "loss": 0.0095, "step": 586800 }, { "epoch": 1.52, "learning_rate": 7.18355751060835e-05, "loss": 0.0073, "step": 586810 }, { "epoch": 1.52, "learning_rate": 7.183168688971203e-05, "loss": 0.0073, "step": 586820 }, { "epoch": 1.52, "learning_rate": 7.182779867334057e-05, "loss": 0.0086, "step": 586830 }, { "epoch": 1.52, "learning_rate": 7.18239104569691e-05, "loss": 0.0108, "step": 586840 }, { "epoch": 1.52, "learning_rate": 7.182002224059764e-05, "loss": 0.0095, "step": 586850 }, { "epoch": 1.52, "learning_rate": 7.181613402422617e-05, "loss": 0.0105, "step": 586860 }, { "epoch": 1.52, "learning_rate": 7.181224580785471e-05, "loss": 0.0088, "step": 586870 }, { "epoch": 1.52, "learning_rate": 7.180835759148325e-05, "loss": 0.0072, "step": 586880 }, { "epoch": 1.52, "learning_rate": 7.180446937511178e-05, "loss": 0.0083, "step": 586890 }, { "epoch": 1.52, "learning_rate": 7.180058115874031e-05, "loss": 0.0062, "step": 586900 }, { "epoch": 1.52, "learning_rate": 7.179669294236885e-05, "loss": 0.008, "step": 586910 }, { "epoch": 1.52, "learning_rate": 7.179280472599738e-05, "loss": 0.0079, "step": 586920 }, { "epoch": 1.52, "learning_rate": 7.178891650962592e-05, "loss": 0.0082, "step": 586930 }, { "epoch": 1.52, "learning_rate": 7.178502829325445e-05, "loss": 0.0083, "step": 586940 }, { "epoch": 1.52, "learning_rate": 7.178114007688299e-05, "loss": 0.0106, "step": 586950 }, { "epoch": 1.52, "learning_rate": 7.177725186051152e-05, "loss": 0.0068, "step": 586960 }, { "epoch": 1.52, "learning_rate": 7.177336364414006e-05, "loss": 0.0101, "step": 586970 }, { "epoch": 1.52, "learning_rate": 7.17694754277686e-05, "loss": 0.0086, "step": 586980 }, { "epoch": 1.52, "learning_rate": 7.176558721139713e-05, "loss": 0.0077, "step": 586990 }, { "epoch": 1.52, "learning_rate": 7.176169899502567e-05, "loss": 0.0087, "step": 587000 }, { "epoch": 1.52, "eval_cer": 0.8816956881384969, "eval_loss": 0.005926743149757385, "eval_runtime": 107.8399, "eval_samples_per_second": 18.546, "eval_steps_per_second": 4.637, "step": 587000 }, { "epoch": 1.52, "learning_rate": 7.17578107786542e-05, "loss": 0.0067, "step": 587010 }, { "epoch": 1.52, "learning_rate": 7.175392256228274e-05, "loss": 0.0066, "step": 587020 }, { "epoch": 1.52, "learning_rate": 7.175003434591127e-05, "loss": 0.0083, "step": 587030 }, { "epoch": 1.52, "learning_rate": 7.174614612953981e-05, "loss": 0.0089, "step": 587040 }, { "epoch": 1.52, "learning_rate": 7.174225791316835e-05, "loss": 0.0086, "step": 587050 }, { "epoch": 1.52, "learning_rate": 7.173836969679688e-05, "loss": 0.0098, "step": 587060 }, { "epoch": 1.52, "learning_rate": 7.173448148042542e-05, "loss": 0.0083, "step": 587070 }, { "epoch": 1.52, "learning_rate": 7.173059326405395e-05, "loss": 0.0081, "step": 587080 }, { "epoch": 1.52, "learning_rate": 7.172670504768249e-05, "loss": 0.0077, "step": 587090 }, { "epoch": 1.52, "learning_rate": 7.172281683131102e-05, "loss": 0.0076, "step": 587100 }, { "epoch": 1.52, "learning_rate": 7.171892861493956e-05, "loss": 0.0078, "step": 587110 }, { "epoch": 1.52, "learning_rate": 7.171504039856809e-05, "loss": 0.0098, "step": 587120 }, { "epoch": 1.52, "learning_rate": 7.171115218219663e-05, "loss": 0.0099, "step": 587130 }, { "epoch": 1.52, "learning_rate": 7.170726396582517e-05, "loss": 0.0083, "step": 587140 }, { "epoch": 1.52, "learning_rate": 7.17033757494537e-05, "loss": 0.0122, "step": 587150 }, { "epoch": 1.52, "learning_rate": 7.169948753308223e-05, "loss": 0.0062, "step": 587160 }, { "epoch": 1.52, "learning_rate": 7.169559931671077e-05, "loss": 0.0128, "step": 587170 }, { "epoch": 1.52, "learning_rate": 7.16917111003393e-05, "loss": 0.0076, "step": 587180 }, { "epoch": 1.52, "learning_rate": 7.168782288396784e-05, "loss": 0.009, "step": 587190 }, { "epoch": 1.52, "learning_rate": 7.168393466759637e-05, "loss": 0.0081, "step": 587200 }, { "epoch": 1.52, "learning_rate": 7.168004645122491e-05, "loss": 0.0068, "step": 587210 }, { "epoch": 1.52, "learning_rate": 7.167615823485344e-05, "loss": 0.0053, "step": 587220 }, { "epoch": 1.52, "learning_rate": 7.167227001848198e-05, "loss": 0.0084, "step": 587230 }, { "epoch": 1.52, "learning_rate": 7.166838180211052e-05, "loss": 0.0099, "step": 587240 }, { "epoch": 1.52, "learning_rate": 7.166449358573905e-05, "loss": 0.0076, "step": 587250 }, { "epoch": 1.52, "learning_rate": 7.166060536936759e-05, "loss": 0.0056, "step": 587260 }, { "epoch": 1.52, "learning_rate": 7.165671715299612e-05, "loss": 0.01, "step": 587270 }, { "epoch": 1.52, "learning_rate": 7.165282893662466e-05, "loss": 0.0085, "step": 587280 }, { "epoch": 1.52, "learning_rate": 7.164894072025319e-05, "loss": 0.0107, "step": 587290 }, { "epoch": 1.52, "learning_rate": 7.164505250388173e-05, "loss": 0.0087, "step": 587300 }, { "epoch": 1.52, "learning_rate": 7.164116428751027e-05, "loss": 0.0093, "step": 587310 }, { "epoch": 1.52, "learning_rate": 7.16372760711388e-05, "loss": 0.0106, "step": 587320 }, { "epoch": 1.52, "learning_rate": 7.163338785476734e-05, "loss": 0.0064, "step": 587330 }, { "epoch": 1.52, "learning_rate": 7.162949963839587e-05, "loss": 0.006, "step": 587340 }, { "epoch": 1.52, "learning_rate": 7.162561142202441e-05, "loss": 0.0085, "step": 587350 }, { "epoch": 1.52, "learning_rate": 7.162172320565294e-05, "loss": 0.0097, "step": 587360 }, { "epoch": 1.52, "learning_rate": 7.161783498928148e-05, "loss": 0.0076, "step": 587370 }, { "epoch": 1.52, "learning_rate": 7.161394677291001e-05, "loss": 0.0073, "step": 587380 }, { "epoch": 1.52, "learning_rate": 7.161005855653855e-05, "loss": 0.008, "step": 587390 }, { "epoch": 1.52, "learning_rate": 7.160617034016708e-05, "loss": 0.0081, "step": 587400 }, { "epoch": 1.52, "learning_rate": 7.160228212379562e-05, "loss": 0.0074, "step": 587410 }, { "epoch": 1.52, "learning_rate": 7.159839390742415e-05, "loss": 0.0083, "step": 587420 }, { "epoch": 1.52, "learning_rate": 7.159450569105269e-05, "loss": 0.007, "step": 587430 }, { "epoch": 1.52, "learning_rate": 7.159061747468122e-05, "loss": 0.0093, "step": 587440 }, { "epoch": 1.52, "learning_rate": 7.158672925830976e-05, "loss": 0.0098, "step": 587450 }, { "epoch": 1.52, "learning_rate": 7.158284104193829e-05, "loss": 0.0112, "step": 587460 }, { "epoch": 1.52, "learning_rate": 7.157895282556683e-05, "loss": 0.0095, "step": 587470 }, { "epoch": 1.52, "learning_rate": 7.157506460919536e-05, "loss": 0.0111, "step": 587480 }, { "epoch": 1.52, "learning_rate": 7.15711763928239e-05, "loss": 0.008, "step": 587490 }, { "epoch": 1.52, "learning_rate": 7.156728817645244e-05, "loss": 0.0089, "step": 587500 }, { "epoch": 1.52, "learning_rate": 7.156339996008097e-05, "loss": 0.014, "step": 587510 }, { "epoch": 1.52, "learning_rate": 7.155951174370951e-05, "loss": 0.0091, "step": 587520 }, { "epoch": 1.52, "learning_rate": 7.155562352733804e-05, "loss": 0.0098, "step": 587530 }, { "epoch": 1.52, "learning_rate": 7.155173531096658e-05, "loss": 0.0089, "step": 587540 }, { "epoch": 1.52, "learning_rate": 7.154784709459511e-05, "loss": 0.0064, "step": 587550 }, { "epoch": 1.52, "learning_rate": 7.154395887822365e-05, "loss": 0.0088, "step": 587560 }, { "epoch": 1.52, "learning_rate": 7.154007066185219e-05, "loss": 0.01, "step": 587570 }, { "epoch": 1.52, "learning_rate": 7.153618244548072e-05, "loss": 0.0077, "step": 587580 }, { "epoch": 1.52, "learning_rate": 7.153229422910926e-05, "loss": 0.0119, "step": 587590 }, { "epoch": 1.52, "learning_rate": 7.152840601273779e-05, "loss": 0.0074, "step": 587600 }, { "epoch": 1.52, "learning_rate": 7.152451779636633e-05, "loss": 0.011, "step": 587610 }, { "epoch": 1.52, "learning_rate": 7.152062957999486e-05, "loss": 0.0099, "step": 587620 }, { "epoch": 1.52, "learning_rate": 7.15167413636234e-05, "loss": 0.0106, "step": 587630 }, { "epoch": 1.52, "learning_rate": 7.151285314725193e-05, "loss": 0.0051, "step": 587640 }, { "epoch": 1.52, "learning_rate": 7.150896493088046e-05, "loss": 0.008, "step": 587650 }, { "epoch": 1.52, "learning_rate": 7.1505076714509e-05, "loss": 0.0082, "step": 587660 }, { "epoch": 1.52, "learning_rate": 7.150118849813754e-05, "loss": 0.0077, "step": 587670 }, { "epoch": 1.52, "learning_rate": 7.149730028176607e-05, "loss": 0.0085, "step": 587680 }, { "epoch": 1.52, "learning_rate": 7.149341206539461e-05, "loss": 0.0106, "step": 587690 }, { "epoch": 1.52, "learning_rate": 7.148952384902314e-05, "loss": 0.0093, "step": 587700 }, { "epoch": 1.52, "learning_rate": 7.148563563265168e-05, "loss": 0.0095, "step": 587710 }, { "epoch": 1.52, "learning_rate": 7.148174741628021e-05, "loss": 0.0083, "step": 587720 }, { "epoch": 1.52, "learning_rate": 7.147785919990875e-05, "loss": 0.0107, "step": 587730 }, { "epoch": 1.52, "learning_rate": 7.147397098353728e-05, "loss": 0.0107, "step": 587740 }, { "epoch": 1.52, "learning_rate": 7.147008276716582e-05, "loss": 0.0074, "step": 587750 }, { "epoch": 1.52, "learning_rate": 7.146619455079436e-05, "loss": 0.0099, "step": 587760 }, { "epoch": 1.52, "learning_rate": 7.146230633442289e-05, "loss": 0.0085, "step": 587770 }, { "epoch": 1.52, "learning_rate": 7.145841811805143e-05, "loss": 0.0082, "step": 587780 }, { "epoch": 1.52, "learning_rate": 7.145452990167996e-05, "loss": 0.0057, "step": 587790 }, { "epoch": 1.52, "learning_rate": 7.14506416853085e-05, "loss": 0.0094, "step": 587800 }, { "epoch": 1.52, "learning_rate": 7.144675346893703e-05, "loss": 0.0097, "step": 587810 }, { "epoch": 1.52, "learning_rate": 7.144286525256557e-05, "loss": 0.0097, "step": 587820 }, { "epoch": 1.52, "learning_rate": 7.14389770361941e-05, "loss": 0.0082, "step": 587830 }, { "epoch": 1.52, "learning_rate": 7.143508881982264e-05, "loss": 0.0084, "step": 587840 }, { "epoch": 1.52, "learning_rate": 7.143120060345118e-05, "loss": 0.0083, "step": 587850 }, { "epoch": 1.52, "learning_rate": 7.142731238707971e-05, "loss": 0.011, "step": 587860 }, { "epoch": 1.52, "learning_rate": 7.142342417070825e-05, "loss": 0.0067, "step": 587870 }, { "epoch": 1.52, "learning_rate": 7.141953595433678e-05, "loss": 0.0086, "step": 587880 }, { "epoch": 1.52, "learning_rate": 7.141564773796531e-05, "loss": 0.0069, "step": 587890 }, { "epoch": 1.52, "learning_rate": 7.141175952159385e-05, "loss": 0.0067, "step": 587900 }, { "epoch": 1.52, "learning_rate": 7.140787130522238e-05, "loss": 0.0092, "step": 587910 }, { "epoch": 1.52, "learning_rate": 7.140398308885092e-05, "loss": 0.0094, "step": 587920 }, { "epoch": 1.52, "learning_rate": 7.140009487247945e-05, "loss": 0.0091, "step": 587930 }, { "epoch": 1.52, "learning_rate": 7.139620665610799e-05, "loss": 0.0113, "step": 587940 }, { "epoch": 1.52, "learning_rate": 7.139231843973653e-05, "loss": 0.0109, "step": 587950 }, { "epoch": 1.52, "learning_rate": 7.138843022336506e-05, "loss": 0.0082, "step": 587960 }, { "epoch": 1.52, "learning_rate": 7.13845420069936e-05, "loss": 0.0096, "step": 587970 }, { "epoch": 1.52, "learning_rate": 7.138065379062213e-05, "loss": 0.0102, "step": 587980 }, { "epoch": 1.52, "learning_rate": 7.137676557425067e-05, "loss": 0.0073, "step": 587990 }, { "epoch": 1.52, "learning_rate": 7.13728773578792e-05, "loss": 0.0072, "step": 588000 }, { "epoch": 1.52, "eval_cer": 0.8816900895907601, "eval_loss": 0.005772036034613848, "eval_runtime": 107.6593, "eval_samples_per_second": 18.577, "eval_steps_per_second": 4.644, "step": 588000 }, { "epoch": 1.52, "learning_rate": 7.136898914150774e-05, "loss": 0.0073, "step": 588010 }, { "epoch": 1.52, "learning_rate": 7.136510092513628e-05, "loss": 0.0102, "step": 588020 }, { "epoch": 1.52, "learning_rate": 7.136121270876481e-05, "loss": 0.01, "step": 588030 }, { "epoch": 1.52, "learning_rate": 7.135732449239335e-05, "loss": 0.0083, "step": 588040 }, { "epoch": 1.52, "learning_rate": 7.135343627602188e-05, "loss": 0.0085, "step": 588050 }, { "epoch": 1.52, "learning_rate": 7.134954805965042e-05, "loss": 0.0091, "step": 588060 }, { "epoch": 1.52, "learning_rate": 7.134565984327895e-05, "loss": 0.0075, "step": 588070 }, { "epoch": 1.52, "learning_rate": 7.134177162690749e-05, "loss": 0.012, "step": 588080 }, { "epoch": 1.52, "learning_rate": 7.133788341053602e-05, "loss": 0.0109, "step": 588090 }, { "epoch": 1.52, "learning_rate": 7.133399519416456e-05, "loss": 0.008, "step": 588100 }, { "epoch": 1.52, "learning_rate": 7.13301069777931e-05, "loss": 0.0073, "step": 588110 }, { "epoch": 1.52, "learning_rate": 7.132621876142163e-05, "loss": 0.0095, "step": 588120 }, { "epoch": 1.52, "learning_rate": 7.132233054505017e-05, "loss": 0.0098, "step": 588130 }, { "epoch": 1.52, "learning_rate": 7.13184423286787e-05, "loss": 0.0066, "step": 588140 }, { "epoch": 1.52, "learning_rate": 7.131455411230723e-05, "loss": 0.0087, "step": 588150 }, { "epoch": 1.52, "learning_rate": 7.131066589593577e-05, "loss": 0.0102, "step": 588160 }, { "epoch": 1.52, "learning_rate": 7.13067776795643e-05, "loss": 0.009, "step": 588170 }, { "epoch": 1.52, "learning_rate": 7.130288946319284e-05, "loss": 0.009, "step": 588180 }, { "epoch": 1.52, "learning_rate": 7.129900124682137e-05, "loss": 0.0106, "step": 588190 }, { "epoch": 1.52, "learning_rate": 7.129511303044991e-05, "loss": 0.0092, "step": 588200 }, { "epoch": 1.52, "learning_rate": 7.129122481407845e-05, "loss": 0.0107, "step": 588210 }, { "epoch": 1.52, "learning_rate": 7.128733659770698e-05, "loss": 0.0101, "step": 588220 }, { "epoch": 1.52, "learning_rate": 7.128344838133552e-05, "loss": 0.0085, "step": 588230 }, { "epoch": 1.52, "learning_rate": 7.127956016496405e-05, "loss": 0.0088, "step": 588240 }, { "epoch": 1.52, "learning_rate": 7.127567194859259e-05, "loss": 0.0109, "step": 588250 }, { "epoch": 1.52, "learning_rate": 7.127178373222112e-05, "loss": 0.0128, "step": 588260 }, { "epoch": 1.52, "learning_rate": 7.126789551584966e-05, "loss": 0.0127, "step": 588270 }, { "epoch": 1.52, "learning_rate": 7.12640072994782e-05, "loss": 0.01, "step": 588280 }, { "epoch": 1.52, "learning_rate": 7.126011908310673e-05, "loss": 0.0104, "step": 588290 }, { "epoch": 1.52, "learning_rate": 7.125623086673527e-05, "loss": 0.0087, "step": 588300 }, { "epoch": 1.52, "learning_rate": 7.12523426503638e-05, "loss": 0.0088, "step": 588310 }, { "epoch": 1.53, "learning_rate": 7.124845443399234e-05, "loss": 0.0105, "step": 588320 }, { "epoch": 1.53, "learning_rate": 7.124456621762087e-05, "loss": 0.0089, "step": 588330 }, { "epoch": 1.53, "learning_rate": 7.124067800124941e-05, "loss": 0.0115, "step": 588340 }, { "epoch": 1.53, "learning_rate": 7.123678978487794e-05, "loss": 0.0087, "step": 588350 }, { "epoch": 1.53, "learning_rate": 7.123290156850648e-05, "loss": 0.0081, "step": 588360 }, { "epoch": 1.53, "learning_rate": 7.122901335213502e-05, "loss": 0.0085, "step": 588370 }, { "epoch": 1.53, "learning_rate": 7.122512513576355e-05, "loss": 0.0085, "step": 588380 }, { "epoch": 1.53, "learning_rate": 7.122123691939208e-05, "loss": 0.009, "step": 588390 }, { "epoch": 1.53, "learning_rate": 7.121734870302062e-05, "loss": 0.0114, "step": 588400 }, { "epoch": 1.53, "learning_rate": 7.121346048664915e-05, "loss": 0.0095, "step": 588410 }, { "epoch": 1.53, "learning_rate": 7.120957227027769e-05, "loss": 0.01, "step": 588420 }, { "epoch": 1.53, "learning_rate": 7.120568405390622e-05, "loss": 0.0076, "step": 588430 }, { "epoch": 1.53, "learning_rate": 7.120179583753476e-05, "loss": 0.0082, "step": 588440 }, { "epoch": 1.53, "learning_rate": 7.119790762116329e-05, "loss": 0.0108, "step": 588450 }, { "epoch": 1.53, "learning_rate": 7.119401940479183e-05, "loss": 0.0098, "step": 588460 }, { "epoch": 1.53, "learning_rate": 7.119013118842037e-05, "loss": 0.0084, "step": 588470 }, { "epoch": 1.53, "learning_rate": 7.11862429720489e-05, "loss": 0.0099, "step": 588480 }, { "epoch": 1.53, "learning_rate": 7.118235475567744e-05, "loss": 0.01, "step": 588490 }, { "epoch": 1.53, "learning_rate": 7.117846653930597e-05, "loss": 0.0101, "step": 588500 }, { "epoch": 1.53, "learning_rate": 7.117457832293451e-05, "loss": 0.0079, "step": 588510 }, { "epoch": 1.53, "learning_rate": 7.117069010656304e-05, "loss": 0.0058, "step": 588520 }, { "epoch": 1.53, "learning_rate": 7.116680189019158e-05, "loss": 0.0134, "step": 588530 }, { "epoch": 1.53, "learning_rate": 7.116291367382012e-05, "loss": 0.0091, "step": 588540 }, { "epoch": 1.53, "learning_rate": 7.115902545744865e-05, "loss": 0.0085, "step": 588550 }, { "epoch": 1.53, "learning_rate": 7.115513724107719e-05, "loss": 0.0084, "step": 588560 }, { "epoch": 1.53, "learning_rate": 7.115124902470572e-05, "loss": 0.0075, "step": 588570 }, { "epoch": 1.53, "learning_rate": 7.114736080833426e-05, "loss": 0.0078, "step": 588580 }, { "epoch": 1.53, "learning_rate": 7.114347259196279e-05, "loss": 0.0089, "step": 588590 }, { "epoch": 1.53, "learning_rate": 7.113958437559133e-05, "loss": 0.0082, "step": 588600 }, { "epoch": 1.53, "learning_rate": 7.113569615921986e-05, "loss": 0.0069, "step": 588610 }, { "epoch": 1.53, "learning_rate": 7.11318079428484e-05, "loss": 0.0094, "step": 588620 }, { "epoch": 1.53, "learning_rate": 7.112791972647694e-05, "loss": 0.0062, "step": 588630 }, { "epoch": 1.53, "learning_rate": 7.112403151010547e-05, "loss": 0.0082, "step": 588640 }, { "epoch": 1.53, "learning_rate": 7.1120143293734e-05, "loss": 0.0076, "step": 588650 }, { "epoch": 1.53, "learning_rate": 7.111625507736254e-05, "loss": 0.0116, "step": 588660 }, { "epoch": 1.53, "learning_rate": 7.111236686099107e-05, "loss": 0.0103, "step": 588670 }, { "epoch": 1.53, "learning_rate": 7.110847864461961e-05, "loss": 0.0076, "step": 588680 }, { "epoch": 1.53, "learning_rate": 7.110459042824814e-05, "loss": 0.009, "step": 588690 }, { "epoch": 1.53, "learning_rate": 7.110070221187668e-05, "loss": 0.0096, "step": 588700 }, { "epoch": 1.53, "learning_rate": 7.109681399550521e-05, "loss": 0.0142, "step": 588710 }, { "epoch": 1.53, "learning_rate": 7.109292577913375e-05, "loss": 0.0097, "step": 588720 }, { "epoch": 1.53, "learning_rate": 7.108903756276229e-05, "loss": 0.0092, "step": 588730 }, { "epoch": 1.53, "learning_rate": 7.108514934639082e-05, "loss": 0.0084, "step": 588740 }, { "epoch": 1.53, "learning_rate": 7.108126113001936e-05, "loss": 0.01, "step": 588750 }, { "epoch": 1.53, "learning_rate": 7.107737291364789e-05, "loss": 0.0096, "step": 588760 }, { "epoch": 1.53, "learning_rate": 7.107348469727643e-05, "loss": 0.012, "step": 588770 }, { "epoch": 1.53, "learning_rate": 7.106959648090496e-05, "loss": 0.0073, "step": 588780 }, { "epoch": 1.53, "learning_rate": 7.10657082645335e-05, "loss": 0.0054, "step": 588790 }, { "epoch": 1.53, "learning_rate": 7.106182004816204e-05, "loss": 0.0073, "step": 588800 }, { "epoch": 1.53, "learning_rate": 7.105793183179057e-05, "loss": 0.006, "step": 588810 }, { "epoch": 1.53, "learning_rate": 7.105404361541911e-05, "loss": 0.0078, "step": 588820 }, { "epoch": 1.53, "learning_rate": 7.105015539904764e-05, "loss": 0.0078, "step": 588830 }, { "epoch": 1.53, "learning_rate": 7.104626718267618e-05, "loss": 0.0106, "step": 588840 }, { "epoch": 1.53, "learning_rate": 7.104237896630471e-05, "loss": 0.0063, "step": 588850 }, { "epoch": 1.53, "learning_rate": 7.103849074993325e-05, "loss": 0.0089, "step": 588860 }, { "epoch": 1.53, "learning_rate": 7.103460253356178e-05, "loss": 0.0072, "step": 588870 }, { "epoch": 1.53, "learning_rate": 7.103071431719032e-05, "loss": 0.0077, "step": 588880 }, { "epoch": 1.53, "learning_rate": 7.102682610081885e-05, "loss": 0.0099, "step": 588890 }, { "epoch": 1.53, "learning_rate": 7.102293788444739e-05, "loss": 0.0113, "step": 588900 }, { "epoch": 1.53, "learning_rate": 7.101904966807592e-05, "loss": 0.0072, "step": 588910 }, { "epoch": 1.53, "learning_rate": 7.101516145170446e-05, "loss": 0.0084, "step": 588920 }, { "epoch": 1.53, "learning_rate": 7.101127323533299e-05, "loss": 0.0075, "step": 588930 }, { "epoch": 1.53, "learning_rate": 7.100738501896153e-05, "loss": 0.0065, "step": 588940 }, { "epoch": 1.53, "learning_rate": 7.100349680259006e-05, "loss": 0.0094, "step": 588950 }, { "epoch": 1.53, "learning_rate": 7.09996085862186e-05, "loss": 0.0102, "step": 588960 }, { "epoch": 1.53, "learning_rate": 7.099572036984713e-05, "loss": 0.0079, "step": 588970 }, { "epoch": 1.53, "learning_rate": 7.099183215347567e-05, "loss": 0.0096, "step": 588980 }, { "epoch": 1.53, "learning_rate": 7.098794393710421e-05, "loss": 0.0073, "step": 588990 }, { "epoch": 1.53, "learning_rate": 7.098405572073274e-05, "loss": 0.0068, "step": 589000 }, { "epoch": 1.53, "eval_cer": 0.8816788924952867, "eval_loss": 0.005820184480398893, "eval_runtime": 107.9961, "eval_samples_per_second": 18.519, "eval_steps_per_second": 4.63, "step": 589000 }, { "epoch": 1.53, "learning_rate": 7.098016750436128e-05, "loss": 0.0064, "step": 589010 }, { "epoch": 1.53, "learning_rate": 7.097627928798981e-05, "loss": 0.0086, "step": 589020 }, { "epoch": 1.53, "learning_rate": 7.097239107161835e-05, "loss": 0.008, "step": 589030 }, { "epoch": 1.53, "learning_rate": 7.096850285524688e-05, "loss": 0.0094, "step": 589040 }, { "epoch": 1.53, "learning_rate": 7.096461463887542e-05, "loss": 0.0073, "step": 589050 }, { "epoch": 1.53, "learning_rate": 7.096072642250396e-05, "loss": 0.0142, "step": 589060 }, { "epoch": 1.53, "learning_rate": 7.095683820613249e-05, "loss": 0.0084, "step": 589070 }, { "epoch": 1.53, "learning_rate": 7.095294998976103e-05, "loss": 0.0076, "step": 589080 }, { "epoch": 1.53, "learning_rate": 7.094906177338956e-05, "loss": 0.0078, "step": 589090 }, { "epoch": 1.53, "learning_rate": 7.09451735570181e-05, "loss": 0.0094, "step": 589100 }, { "epoch": 1.53, "learning_rate": 7.094128534064663e-05, "loss": 0.0074, "step": 589110 }, { "epoch": 1.53, "learning_rate": 7.093739712427517e-05, "loss": 0.0142, "step": 589120 }, { "epoch": 1.53, "learning_rate": 7.09335089079037e-05, "loss": 0.0066, "step": 589130 }, { "epoch": 1.53, "learning_rate": 7.092962069153223e-05, "loss": 0.0106, "step": 589140 }, { "epoch": 1.53, "learning_rate": 7.092573247516077e-05, "loss": 0.0081, "step": 589150 }, { "epoch": 1.53, "learning_rate": 7.092184425878931e-05, "loss": 0.0085, "step": 589160 }, { "epoch": 1.53, "learning_rate": 7.091795604241784e-05, "loss": 0.0114, "step": 589170 }, { "epoch": 1.53, "learning_rate": 7.091406782604638e-05, "loss": 0.0101, "step": 589180 }, { "epoch": 1.53, "learning_rate": 7.091017960967491e-05, "loss": 0.0094, "step": 589190 }, { "epoch": 1.53, "learning_rate": 7.090629139330345e-05, "loss": 0.009, "step": 589200 }, { "epoch": 1.53, "learning_rate": 7.090240317693198e-05, "loss": 0.0079, "step": 589210 }, { "epoch": 1.53, "learning_rate": 7.089851496056052e-05, "loss": 0.009, "step": 589220 }, { "epoch": 1.53, "learning_rate": 7.089462674418905e-05, "loss": 0.0084, "step": 589230 }, { "epoch": 1.53, "learning_rate": 7.089073852781759e-05, "loss": 0.007, "step": 589240 }, { "epoch": 1.53, "learning_rate": 7.088685031144613e-05, "loss": 0.0106, "step": 589250 }, { "epoch": 1.53, "learning_rate": 7.088296209507466e-05, "loss": 0.0076, "step": 589260 }, { "epoch": 1.53, "learning_rate": 7.08790738787032e-05, "loss": 0.0071, "step": 589270 }, { "epoch": 1.53, "learning_rate": 7.087518566233173e-05, "loss": 0.0111, "step": 589280 }, { "epoch": 1.53, "learning_rate": 7.087129744596027e-05, "loss": 0.0084, "step": 589290 }, { "epoch": 1.53, "learning_rate": 7.08674092295888e-05, "loss": 0.0091, "step": 589300 }, { "epoch": 1.53, "learning_rate": 7.086352101321734e-05, "loss": 0.0081, "step": 589310 }, { "epoch": 1.53, "learning_rate": 7.085963279684587e-05, "loss": 0.0078, "step": 589320 }, { "epoch": 1.53, "learning_rate": 7.085574458047441e-05, "loss": 0.0081, "step": 589330 }, { "epoch": 1.53, "learning_rate": 7.085185636410295e-05, "loss": 0.0079, "step": 589340 }, { "epoch": 1.53, "learning_rate": 7.084796814773148e-05, "loss": 0.01, "step": 589350 }, { "epoch": 1.53, "learning_rate": 7.084407993136002e-05, "loss": 0.01, "step": 589360 }, { "epoch": 1.53, "learning_rate": 7.084019171498855e-05, "loss": 0.0074, "step": 589370 }, { "epoch": 1.53, "learning_rate": 7.083630349861708e-05, "loss": 0.0079, "step": 589380 }, { "epoch": 1.53, "learning_rate": 7.083241528224562e-05, "loss": 0.0068, "step": 589390 }, { "epoch": 1.53, "learning_rate": 7.082852706587415e-05, "loss": 0.0089, "step": 589400 }, { "epoch": 1.53, "learning_rate": 7.082463884950269e-05, "loss": 0.0104, "step": 589410 }, { "epoch": 1.53, "learning_rate": 7.082075063313122e-05, "loss": 0.0091, "step": 589420 }, { "epoch": 1.53, "learning_rate": 7.081686241675976e-05, "loss": 0.0103, "step": 589430 }, { "epoch": 1.53, "learning_rate": 7.08129742003883e-05, "loss": 0.0067, "step": 589440 }, { "epoch": 1.53, "learning_rate": 7.080908598401683e-05, "loss": 0.0116, "step": 589450 }, { "epoch": 1.53, "learning_rate": 7.080519776764537e-05, "loss": 0.0074, "step": 589460 }, { "epoch": 1.53, "learning_rate": 7.08013095512739e-05, "loss": 0.0109, "step": 589470 }, { "epoch": 1.53, "learning_rate": 7.079742133490244e-05, "loss": 0.0071, "step": 589480 }, { "epoch": 1.53, "learning_rate": 7.079353311853097e-05, "loss": 0.007, "step": 589490 }, { "epoch": 1.53, "learning_rate": 7.078964490215951e-05, "loss": 0.0106, "step": 589500 }, { "epoch": 1.53, "learning_rate": 7.078575668578805e-05, "loss": 0.0099, "step": 589510 }, { "epoch": 1.53, "learning_rate": 7.078186846941658e-05, "loss": 0.0084, "step": 589520 }, { "epoch": 1.53, "learning_rate": 7.077798025304512e-05, "loss": 0.0093, "step": 589530 }, { "epoch": 1.53, "learning_rate": 7.077409203667365e-05, "loss": 0.0095, "step": 589540 }, { "epoch": 1.53, "learning_rate": 7.077020382030219e-05, "loss": 0.0108, "step": 589550 }, { "epoch": 1.53, "learning_rate": 7.076631560393072e-05, "loss": 0.007, "step": 589560 }, { "epoch": 1.53, "learning_rate": 7.076242738755926e-05, "loss": 0.0076, "step": 589570 }, { "epoch": 1.53, "learning_rate": 7.075853917118779e-05, "loss": 0.0095, "step": 589580 }, { "epoch": 1.53, "learning_rate": 7.075465095481633e-05, "loss": 0.0085, "step": 589590 }, { "epoch": 1.53, "learning_rate": 7.075076273844487e-05, "loss": 0.0077, "step": 589600 }, { "epoch": 1.53, "learning_rate": 7.07468745220734e-05, "loss": 0.0069, "step": 589610 }, { "epoch": 1.53, "learning_rate": 7.074298630570194e-05, "loss": 0.0112, "step": 589620 }, { "epoch": 1.53, "learning_rate": 7.073909808933047e-05, "loss": 0.0063, "step": 589630 }, { "epoch": 1.53, "learning_rate": 7.0735209872959e-05, "loss": 0.0073, "step": 589640 }, { "epoch": 1.53, "learning_rate": 7.073132165658754e-05, "loss": 0.0102, "step": 589650 }, { "epoch": 1.53, "learning_rate": 7.072743344021607e-05, "loss": 0.009, "step": 589660 }, { "epoch": 1.53, "learning_rate": 7.072354522384461e-05, "loss": 0.0111, "step": 589670 }, { "epoch": 1.53, "learning_rate": 7.071965700747314e-05, "loss": 0.0068, "step": 589680 }, { "epoch": 1.53, "learning_rate": 7.071576879110168e-05, "loss": 0.011, "step": 589690 }, { "epoch": 1.53, "learning_rate": 7.071188057473022e-05, "loss": 0.0068, "step": 589700 }, { "epoch": 1.53, "learning_rate": 7.070799235835875e-05, "loss": 0.0071, "step": 589710 }, { "epoch": 1.53, "learning_rate": 7.070410414198729e-05, "loss": 0.0061, "step": 589720 }, { "epoch": 1.53, "learning_rate": 7.070021592561582e-05, "loss": 0.0073, "step": 589730 }, { "epoch": 1.53, "learning_rate": 7.069632770924436e-05, "loss": 0.0095, "step": 589740 }, { "epoch": 1.53, "learning_rate": 7.069243949287289e-05, "loss": 0.007, "step": 589750 }, { "epoch": 1.53, "learning_rate": 7.068855127650143e-05, "loss": 0.0069, "step": 589760 }, { "epoch": 1.53, "learning_rate": 7.068466306012997e-05, "loss": 0.0078, "step": 589770 }, { "epoch": 1.53, "learning_rate": 7.06807748437585e-05, "loss": 0.0086, "step": 589780 }, { "epoch": 1.53, "learning_rate": 7.067688662738704e-05, "loss": 0.0077, "step": 589790 }, { "epoch": 1.53, "learning_rate": 7.067299841101557e-05, "loss": 0.0092, "step": 589800 }, { "epoch": 1.53, "learning_rate": 7.066911019464411e-05, "loss": 0.0073, "step": 589810 }, { "epoch": 1.53, "learning_rate": 7.066522197827264e-05, "loss": 0.0069, "step": 589820 }, { "epoch": 1.53, "learning_rate": 7.066133376190118e-05, "loss": 0.0099, "step": 589830 }, { "epoch": 1.53, "learning_rate": 7.065744554552971e-05, "loss": 0.0104, "step": 589840 }, { "epoch": 1.53, "learning_rate": 7.065355732915825e-05, "loss": 0.0075, "step": 589850 }, { "epoch": 1.53, "learning_rate": 7.064966911278679e-05, "loss": 0.0094, "step": 589860 }, { "epoch": 1.53, "learning_rate": 7.064578089641532e-05, "loss": 0.0102, "step": 589870 }, { "epoch": 1.53, "learning_rate": 7.064189268004385e-05, "loss": 0.0118, "step": 589880 }, { "epoch": 1.53, "learning_rate": 7.063800446367239e-05, "loss": 0.0098, "step": 589890 }, { "epoch": 1.53, "learning_rate": 7.063411624730092e-05, "loss": 0.0099, "step": 589900 }, { "epoch": 1.53, "learning_rate": 7.063022803092946e-05, "loss": 0.0079, "step": 589910 }, { "epoch": 1.53, "learning_rate": 7.062633981455799e-05, "loss": 0.0091, "step": 589920 }, { "epoch": 1.53, "learning_rate": 7.062245159818653e-05, "loss": 0.0128, "step": 589930 }, { "epoch": 1.53, "learning_rate": 7.061856338181506e-05, "loss": 0.0097, "step": 589940 }, { "epoch": 1.53, "learning_rate": 7.06146751654436e-05, "loss": 0.0087, "step": 589950 }, { "epoch": 1.53, "learning_rate": 7.061078694907214e-05, "loss": 0.0097, "step": 589960 }, { "epoch": 1.53, "learning_rate": 7.060689873270067e-05, "loss": 0.0106, "step": 589970 }, { "epoch": 1.53, "learning_rate": 7.060301051632921e-05, "loss": 0.0069, "step": 589980 }, { "epoch": 1.53, "learning_rate": 7.059912229995774e-05, "loss": 0.0085, "step": 589990 }, { "epoch": 1.53, "learning_rate": 7.059523408358628e-05, "loss": 0.0081, "step": 590000 }, { "epoch": 1.53, "eval_cer": 0.8816830914060892, "eval_loss": 0.00574450334534049, "eval_runtime": 108.0014, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.63, "step": 590000 }, { "epoch": 1.53, "learning_rate": 7.059134586721481e-05, "loss": 0.0084, "step": 590010 }, { "epoch": 1.53, "learning_rate": 7.058745765084335e-05, "loss": 0.01, "step": 590020 }, { "epoch": 1.53, "learning_rate": 7.058356943447189e-05, "loss": 0.0102, "step": 590030 }, { "epoch": 1.53, "learning_rate": 7.057968121810042e-05, "loss": 0.0081, "step": 590040 }, { "epoch": 1.53, "learning_rate": 7.057579300172896e-05, "loss": 0.0124, "step": 590050 }, { "epoch": 1.53, "learning_rate": 7.057190478535749e-05, "loss": 0.0137, "step": 590060 }, { "epoch": 1.53, "learning_rate": 7.056801656898603e-05, "loss": 0.009, "step": 590070 }, { "epoch": 1.53, "learning_rate": 7.056412835261456e-05, "loss": 0.0064, "step": 590080 }, { "epoch": 1.53, "learning_rate": 7.05602401362431e-05, "loss": 0.0078, "step": 590090 }, { "epoch": 1.53, "learning_rate": 7.055635191987163e-05, "loss": 0.0068, "step": 590100 }, { "epoch": 1.53, "learning_rate": 7.055246370350017e-05, "loss": 0.0091, "step": 590110 }, { "epoch": 1.53, "learning_rate": 7.054857548712871e-05, "loss": 0.008, "step": 590120 }, { "epoch": 1.53, "learning_rate": 7.054468727075724e-05, "loss": 0.0081, "step": 590130 }, { "epoch": 1.53, "learning_rate": 7.054079905438577e-05, "loss": 0.0121, "step": 590140 }, { "epoch": 1.53, "learning_rate": 7.053691083801431e-05, "loss": 0.0103, "step": 590150 }, { "epoch": 1.53, "learning_rate": 7.053302262164284e-05, "loss": 0.0079, "step": 590160 }, { "epoch": 1.53, "learning_rate": 7.052913440527138e-05, "loss": 0.0068, "step": 590170 }, { "epoch": 1.53, "learning_rate": 7.052524618889991e-05, "loss": 0.0065, "step": 590180 }, { "epoch": 1.53, "learning_rate": 7.052135797252845e-05, "loss": 0.0063, "step": 590190 }, { "epoch": 1.53, "learning_rate": 7.051746975615698e-05, "loss": 0.0056, "step": 590200 }, { "epoch": 1.53, "learning_rate": 7.051358153978552e-05, "loss": 0.0091, "step": 590210 }, { "epoch": 1.53, "learning_rate": 7.050969332341406e-05, "loss": 0.0107, "step": 590220 }, { "epoch": 1.53, "learning_rate": 7.050580510704259e-05, "loss": 0.008, "step": 590230 }, { "epoch": 1.53, "learning_rate": 7.050191689067113e-05, "loss": 0.0095, "step": 590240 }, { "epoch": 1.53, "learning_rate": 7.049802867429966e-05, "loss": 0.0084, "step": 590250 }, { "epoch": 1.53, "learning_rate": 7.04941404579282e-05, "loss": 0.006, "step": 590260 }, { "epoch": 1.53, "learning_rate": 7.049025224155673e-05, "loss": 0.0099, "step": 590270 }, { "epoch": 1.53, "learning_rate": 7.048636402518527e-05, "loss": 0.008, "step": 590280 }, { "epoch": 1.53, "learning_rate": 7.048247580881381e-05, "loss": 0.0084, "step": 590290 }, { "epoch": 1.53, "learning_rate": 7.047858759244234e-05, "loss": 0.0076, "step": 590300 }, { "epoch": 1.53, "learning_rate": 7.047469937607088e-05, "loss": 0.007, "step": 590310 }, { "epoch": 1.53, "learning_rate": 7.047081115969941e-05, "loss": 0.0108, "step": 590320 }, { "epoch": 1.53, "learning_rate": 7.046692294332795e-05, "loss": 0.008, "step": 590330 }, { "epoch": 1.53, "learning_rate": 7.046303472695648e-05, "loss": 0.0091, "step": 590340 }, { "epoch": 1.53, "learning_rate": 7.045914651058502e-05, "loss": 0.011, "step": 590350 }, { "epoch": 1.53, "learning_rate": 7.045525829421355e-05, "loss": 0.0078, "step": 590360 }, { "epoch": 1.53, "learning_rate": 7.045137007784208e-05, "loss": 0.0079, "step": 590370 }, { "epoch": 1.53, "learning_rate": 7.044748186147062e-05, "loss": 0.0069, "step": 590380 }, { "epoch": 1.53, "learning_rate": 7.044359364509916e-05, "loss": 0.0089, "step": 590390 }, { "epoch": 1.53, "learning_rate": 7.043970542872769e-05, "loss": 0.0075, "step": 590400 }, { "epoch": 1.53, "learning_rate": 7.043581721235623e-05, "loss": 0.0084, "step": 590410 }, { "epoch": 1.53, "learning_rate": 7.043192899598476e-05, "loss": 0.0068, "step": 590420 }, { "epoch": 1.53, "learning_rate": 7.04280407796133e-05, "loss": 0.0082, "step": 590430 }, { "epoch": 1.53, "learning_rate": 7.042415256324183e-05, "loss": 0.0078, "step": 590440 }, { "epoch": 1.53, "learning_rate": 7.042026434687037e-05, "loss": 0.007, "step": 590450 }, { "epoch": 1.53, "learning_rate": 7.04163761304989e-05, "loss": 0.0081, "step": 590460 }, { "epoch": 1.53, "learning_rate": 7.041248791412744e-05, "loss": 0.0079, "step": 590470 }, { "epoch": 1.53, "learning_rate": 7.040859969775598e-05, "loss": 0.0104, "step": 590480 }, { "epoch": 1.53, "learning_rate": 7.040471148138451e-05, "loss": 0.0084, "step": 590490 }, { "epoch": 1.53, "learning_rate": 7.040082326501305e-05, "loss": 0.0087, "step": 590500 }, { "epoch": 1.53, "learning_rate": 7.039693504864158e-05, "loss": 0.01, "step": 590510 }, { "epoch": 1.53, "learning_rate": 7.039304683227012e-05, "loss": 0.0123, "step": 590520 }, { "epoch": 1.53, "learning_rate": 7.038915861589865e-05, "loss": 0.0095, "step": 590530 }, { "epoch": 1.53, "learning_rate": 7.038527039952719e-05, "loss": 0.0092, "step": 590540 }, { "epoch": 1.53, "learning_rate": 7.038138218315573e-05, "loss": 0.01, "step": 590550 }, { "epoch": 1.53, "learning_rate": 7.037749396678426e-05, "loss": 0.0068, "step": 590560 }, { "epoch": 1.53, "learning_rate": 7.03736057504128e-05, "loss": 0.0077, "step": 590570 }, { "epoch": 1.53, "learning_rate": 7.036971753404133e-05, "loss": 0.0074, "step": 590580 }, { "epoch": 1.53, "learning_rate": 7.036582931766987e-05, "loss": 0.0154, "step": 590590 }, { "epoch": 1.53, "learning_rate": 7.03619411012984e-05, "loss": 0.008, "step": 590600 }, { "epoch": 1.53, "learning_rate": 7.035805288492694e-05, "loss": 0.0092, "step": 590610 }, { "epoch": 1.53, "learning_rate": 7.035416466855547e-05, "loss": 0.0089, "step": 590620 }, { "epoch": 1.53, "learning_rate": 7.0350276452184e-05, "loss": 0.0087, "step": 590630 }, { "epoch": 1.53, "learning_rate": 7.034638823581254e-05, "loss": 0.0074, "step": 590640 }, { "epoch": 1.53, "learning_rate": 7.034250001944108e-05, "loss": 0.007, "step": 590650 }, { "epoch": 1.53, "learning_rate": 7.033861180306961e-05, "loss": 0.0087, "step": 590660 }, { "epoch": 1.53, "learning_rate": 7.033472358669815e-05, "loss": 0.0099, "step": 590670 }, { "epoch": 1.53, "learning_rate": 7.033083537032668e-05, "loss": 0.0096, "step": 590680 }, { "epoch": 1.53, "learning_rate": 7.032694715395522e-05, "loss": 0.0073, "step": 590690 }, { "epoch": 1.53, "learning_rate": 7.032305893758375e-05, "loss": 0.0076, "step": 590700 }, { "epoch": 1.53, "learning_rate": 7.031917072121229e-05, "loss": 0.0084, "step": 590710 }, { "epoch": 1.53, "learning_rate": 7.031528250484082e-05, "loss": 0.0101, "step": 590720 }, { "epoch": 1.53, "learning_rate": 7.031139428846936e-05, "loss": 0.0082, "step": 590730 }, { "epoch": 1.53, "learning_rate": 7.03075060720979e-05, "loss": 0.0093, "step": 590740 }, { "epoch": 1.53, "learning_rate": 7.030361785572643e-05, "loss": 0.0078, "step": 590750 }, { "epoch": 1.53, "learning_rate": 7.029972963935497e-05, "loss": 0.0095, "step": 590760 }, { "epoch": 1.53, "learning_rate": 7.02958414229835e-05, "loss": 0.0076, "step": 590770 }, { "epoch": 1.53, "learning_rate": 7.029195320661204e-05, "loss": 0.0093, "step": 590780 }, { "epoch": 1.53, "learning_rate": 7.028806499024057e-05, "loss": 0.0082, "step": 590790 }, { "epoch": 1.53, "learning_rate": 7.028417677386911e-05, "loss": 0.008, "step": 590800 }, { "epoch": 1.53, "learning_rate": 7.028028855749764e-05, "loss": 0.0083, "step": 590810 }, { "epoch": 1.53, "learning_rate": 7.027640034112618e-05, "loss": 0.0088, "step": 590820 }, { "epoch": 1.53, "learning_rate": 7.027251212475472e-05, "loss": 0.0083, "step": 590830 }, { "epoch": 1.53, "learning_rate": 7.026862390838325e-05, "loss": 0.0076, "step": 590840 }, { "epoch": 1.53, "learning_rate": 7.026473569201179e-05, "loss": 0.0143, "step": 590850 }, { "epoch": 1.53, "learning_rate": 7.026084747564032e-05, "loss": 0.0069, "step": 590860 }, { "epoch": 1.53, "learning_rate": 7.025695925926885e-05, "loss": 0.0093, "step": 590870 }, { "epoch": 1.53, "learning_rate": 7.025307104289739e-05, "loss": 0.0114, "step": 590880 }, { "epoch": 1.53, "learning_rate": 7.024918282652592e-05, "loss": 0.0079, "step": 590890 }, { "epoch": 1.53, "learning_rate": 7.024529461015446e-05, "loss": 0.0087, "step": 590900 }, { "epoch": 1.53, "learning_rate": 7.024140639378299e-05, "loss": 0.0063, "step": 590910 }, { "epoch": 1.53, "learning_rate": 7.023751817741153e-05, "loss": 0.01, "step": 590920 }, { "epoch": 1.53, "learning_rate": 7.023362996104007e-05, "loss": 0.0136, "step": 590930 }, { "epoch": 1.53, "learning_rate": 7.02297417446686e-05, "loss": 0.0104, "step": 590940 }, { "epoch": 1.53, "learning_rate": 7.022585352829714e-05, "loss": 0.0082, "step": 590950 }, { "epoch": 1.53, "learning_rate": 7.022196531192567e-05, "loss": 0.0086, "step": 590960 }, { "epoch": 1.53, "learning_rate": 7.021807709555421e-05, "loss": 0.0063, "step": 590970 }, { "epoch": 1.53, "learning_rate": 7.021418887918274e-05, "loss": 0.0106, "step": 590980 }, { "epoch": 1.53, "learning_rate": 7.021030066281128e-05, "loss": 0.0096, "step": 590990 }, { "epoch": 1.53, "learning_rate": 7.020641244643982e-05, "loss": 0.01, "step": 591000 }, { "epoch": 1.53, "eval_cer": 0.8816858906799576, "eval_loss": 0.005933051463216543, "eval_runtime": 107.84, "eval_samples_per_second": 18.546, "eval_steps_per_second": 4.636, "step": 591000 }, { "epoch": 1.53, "learning_rate": 7.020252423006835e-05, "loss": 0.0103, "step": 591010 }, { "epoch": 1.53, "learning_rate": 7.019863601369689e-05, "loss": 0.0126, "step": 591020 }, { "epoch": 1.53, "learning_rate": 7.019474779732542e-05, "loss": 0.0116, "step": 591030 }, { "epoch": 1.53, "learning_rate": 7.019085958095396e-05, "loss": 0.0085, "step": 591040 }, { "epoch": 1.53, "learning_rate": 7.018697136458249e-05, "loss": 0.0079, "step": 591050 }, { "epoch": 1.53, "learning_rate": 7.018308314821103e-05, "loss": 0.0072, "step": 591060 }, { "epoch": 1.53, "learning_rate": 7.017919493183956e-05, "loss": 0.0087, "step": 591070 }, { "epoch": 1.53, "learning_rate": 7.01753067154681e-05, "loss": 0.0087, "step": 591080 }, { "epoch": 1.53, "learning_rate": 7.017141849909664e-05, "loss": 0.01, "step": 591090 }, { "epoch": 1.53, "learning_rate": 7.016753028272517e-05, "loss": 0.006, "step": 591100 }, { "epoch": 1.53, "learning_rate": 7.016364206635371e-05, "loss": 0.0097, "step": 591110 }, { "epoch": 1.53, "learning_rate": 7.015975384998224e-05, "loss": 0.0086, "step": 591120 }, { "epoch": 1.53, "learning_rate": 7.015586563361077e-05, "loss": 0.0075, "step": 591130 }, { "epoch": 1.53, "learning_rate": 7.015197741723931e-05, "loss": 0.0086, "step": 591140 }, { "epoch": 1.53, "learning_rate": 7.014808920086784e-05, "loss": 0.0095, "step": 591150 }, { "epoch": 1.53, "learning_rate": 7.014420098449638e-05, "loss": 0.0101, "step": 591160 }, { "epoch": 1.53, "learning_rate": 7.01403127681249e-05, "loss": 0.0116, "step": 591170 }, { "epoch": 1.53, "learning_rate": 7.013642455175345e-05, "loss": 0.0065, "step": 591180 }, { "epoch": 1.53, "learning_rate": 7.013253633538199e-05, "loss": 0.0086, "step": 591190 }, { "epoch": 1.53, "learning_rate": 7.012864811901052e-05, "loss": 0.0135, "step": 591200 }, { "epoch": 1.53, "learning_rate": 7.012475990263906e-05, "loss": 0.0086, "step": 591210 }, { "epoch": 1.53, "learning_rate": 7.012087168626759e-05, "loss": 0.0079, "step": 591220 }, { "epoch": 1.53, "learning_rate": 7.011698346989613e-05, "loss": 0.0099, "step": 591230 }, { "epoch": 1.53, "learning_rate": 7.011309525352466e-05, "loss": 0.0096, "step": 591240 }, { "epoch": 1.53, "learning_rate": 7.01092070371532e-05, "loss": 0.011, "step": 591250 }, { "epoch": 1.53, "learning_rate": 7.010531882078174e-05, "loss": 0.0095, "step": 591260 }, { "epoch": 1.53, "learning_rate": 7.010143060441027e-05, "loss": 0.0082, "step": 591270 }, { "epoch": 1.53, "learning_rate": 7.009754238803881e-05, "loss": 0.0078, "step": 591280 }, { "epoch": 1.53, "learning_rate": 7.009365417166734e-05, "loss": 0.0068, "step": 591290 }, { "epoch": 1.53, "learning_rate": 7.008976595529588e-05, "loss": 0.0073, "step": 591300 }, { "epoch": 1.53, "learning_rate": 7.008587773892441e-05, "loss": 0.0083, "step": 591310 }, { "epoch": 1.53, "learning_rate": 7.008198952255295e-05, "loss": 0.0121, "step": 591320 }, { "epoch": 1.53, "learning_rate": 7.007810130618148e-05, "loss": 0.0091, "step": 591330 }, { "epoch": 1.53, "learning_rate": 7.007421308981002e-05, "loss": 0.008, "step": 591340 }, { "epoch": 1.53, "learning_rate": 7.007032487343856e-05, "loss": 0.008, "step": 591350 }, { "epoch": 1.53, "learning_rate": 7.006643665706709e-05, "loss": 0.0081, "step": 591360 }, { "epoch": 1.53, "learning_rate": 7.006254844069562e-05, "loss": 0.0063, "step": 591370 }, { "epoch": 1.53, "learning_rate": 7.005866022432416e-05, "loss": 0.0093, "step": 591380 }, { "epoch": 1.53, "learning_rate": 7.005477200795269e-05, "loss": 0.0091, "step": 591390 }, { "epoch": 1.53, "learning_rate": 7.005088379158123e-05, "loss": 0.0063, "step": 591400 }, { "epoch": 1.53, "learning_rate": 7.004699557520976e-05, "loss": 0.0089, "step": 591410 }, { "epoch": 1.53, "learning_rate": 7.00431073588383e-05, "loss": 0.0077, "step": 591420 }, { "epoch": 1.53, "learning_rate": 7.003921914246683e-05, "loss": 0.0092, "step": 591430 }, { "epoch": 1.53, "learning_rate": 7.003533092609537e-05, "loss": 0.009, "step": 591440 }, { "epoch": 1.53, "learning_rate": 7.003144270972391e-05, "loss": 0.0084, "step": 591450 }, { "epoch": 1.53, "learning_rate": 7.002755449335244e-05, "loss": 0.0064, "step": 591460 }, { "epoch": 1.53, "learning_rate": 7.002366627698098e-05, "loss": 0.011, "step": 591470 }, { "epoch": 1.53, "learning_rate": 7.00197780606095e-05, "loss": 0.01, "step": 591480 }, { "epoch": 1.53, "learning_rate": 7.001588984423805e-05, "loss": 0.0081, "step": 591490 }, { "epoch": 1.53, "learning_rate": 7.001200162786658e-05, "loss": 0.0131, "step": 591500 }, { "epoch": 1.53, "learning_rate": 7.000811341149512e-05, "loss": 0.0087, "step": 591510 }, { "epoch": 1.53, "learning_rate": 7.000422519512366e-05, "loss": 0.0075, "step": 591520 }, { "epoch": 1.53, "learning_rate": 7.000033697875219e-05, "loss": 0.0076, "step": 591530 }, { "epoch": 1.53, "learning_rate": 6.999644876238073e-05, "loss": 0.0092, "step": 591540 }, { "epoch": 1.53, "learning_rate": 6.999256054600926e-05, "loss": 0.0091, "step": 591550 }, { "epoch": 1.53, "learning_rate": 6.99886723296378e-05, "loss": 0.0088, "step": 591560 }, { "epoch": 1.53, "learning_rate": 6.998478411326633e-05, "loss": 0.0106, "step": 591570 }, { "epoch": 1.53, "learning_rate": 6.998089589689487e-05, "loss": 0.0076, "step": 591580 }, { "epoch": 1.53, "learning_rate": 6.99770076805234e-05, "loss": 0.0085, "step": 591590 }, { "epoch": 1.53, "learning_rate": 6.997311946415194e-05, "loss": 0.0096, "step": 591600 }, { "epoch": 1.53, "learning_rate": 6.996923124778048e-05, "loss": 0.0083, "step": 591610 }, { "epoch": 1.53, "learning_rate": 6.996534303140901e-05, "loss": 0.0087, "step": 591620 }, { "epoch": 1.53, "learning_rate": 6.996145481503754e-05, "loss": 0.0091, "step": 591630 }, { "epoch": 1.53, "learning_rate": 6.995756659866608e-05, "loss": 0.0078, "step": 591640 }, { "epoch": 1.53, "learning_rate": 6.99536783822946e-05, "loss": 0.0072, "step": 591650 }, { "epoch": 1.53, "learning_rate": 6.994979016592315e-05, "loss": 0.0107, "step": 591660 }, { "epoch": 1.53, "learning_rate": 6.994590194955168e-05, "loss": 0.0097, "step": 591670 }, { "epoch": 1.53, "learning_rate": 6.994201373318022e-05, "loss": 0.0069, "step": 591680 }, { "epoch": 1.53, "learning_rate": 6.993812551680875e-05, "loss": 0.0095, "step": 591690 }, { "epoch": 1.53, "learning_rate": 6.993423730043729e-05, "loss": 0.0084, "step": 591700 }, { "epoch": 1.53, "learning_rate": 6.993034908406583e-05, "loss": 0.0085, "step": 591710 }, { "epoch": 1.53, "learning_rate": 6.992646086769436e-05, "loss": 0.0102, "step": 591720 }, { "epoch": 1.53, "learning_rate": 6.99225726513229e-05, "loss": 0.0085, "step": 591730 }, { "epoch": 1.53, "learning_rate": 6.991868443495143e-05, "loss": 0.0144, "step": 591740 }, { "epoch": 1.53, "learning_rate": 6.991479621857997e-05, "loss": 0.0082, "step": 591750 }, { "epoch": 1.53, "learning_rate": 6.99109080022085e-05, "loss": 0.0079, "step": 591760 }, { "epoch": 1.53, "learning_rate": 6.990701978583704e-05, "loss": 0.0098, "step": 591770 }, { "epoch": 1.53, "learning_rate": 6.990313156946558e-05, "loss": 0.0086, "step": 591780 }, { "epoch": 1.53, "learning_rate": 6.989924335309411e-05, "loss": 0.007, "step": 591790 }, { "epoch": 1.53, "learning_rate": 6.989535513672265e-05, "loss": 0.0078, "step": 591800 }, { "epoch": 1.53, "learning_rate": 6.989146692035118e-05, "loss": 0.0091, "step": 591810 }, { "epoch": 1.53, "learning_rate": 6.988757870397972e-05, "loss": 0.0099, "step": 591820 }, { "epoch": 1.53, "learning_rate": 6.988369048760825e-05, "loss": 0.009, "step": 591830 }, { "epoch": 1.53, "learning_rate": 6.987980227123679e-05, "loss": 0.0097, "step": 591840 }, { "epoch": 1.53, "learning_rate": 6.987591405486532e-05, "loss": 0.0064, "step": 591850 }, { "epoch": 1.53, "learning_rate": 6.987202583849385e-05, "loss": 0.0081, "step": 591860 }, { "epoch": 1.53, "learning_rate": 6.986813762212239e-05, "loss": 0.0092, "step": 591870 }, { "epoch": 1.53, "learning_rate": 6.986424940575093e-05, "loss": 0.0082, "step": 591880 }, { "epoch": 1.53, "learning_rate": 6.986036118937946e-05, "loss": 0.0058, "step": 591890 }, { "epoch": 1.53, "learning_rate": 6.9856472973008e-05, "loss": 0.0081, "step": 591900 }, { "epoch": 1.53, "learning_rate": 6.985258475663653e-05, "loss": 0.0086, "step": 591910 }, { "epoch": 1.53, "learning_rate": 6.984869654026507e-05, "loss": 0.0119, "step": 591920 }, { "epoch": 1.53, "learning_rate": 6.98448083238936e-05, "loss": 0.0073, "step": 591930 }, { "epoch": 1.53, "learning_rate": 6.984092010752214e-05, "loss": 0.0086, "step": 591940 }, { "epoch": 1.53, "learning_rate": 6.983703189115067e-05, "loss": 0.0077, "step": 591950 }, { "epoch": 1.53, "learning_rate": 6.983314367477921e-05, "loss": 0.0094, "step": 591960 }, { "epoch": 1.53, "learning_rate": 6.982925545840775e-05, "loss": 0.0079, "step": 591970 }, { "epoch": 1.53, "learning_rate": 6.982536724203628e-05, "loss": 0.0083, "step": 591980 }, { "epoch": 1.53, "learning_rate": 6.982147902566482e-05, "loss": 0.0066, "step": 591990 }, { "epoch": 1.53, "learning_rate": 6.981759080929335e-05, "loss": 0.0081, "step": 592000 }, { "epoch": 1.53, "eval_cer": 0.8816816917691551, "eval_loss": 0.005928897298872471, "eval_runtime": 107.9324, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 592000 }, { "epoch": 1.53, "learning_rate": 6.981370259292189e-05, "loss": 0.0095, "step": 592010 }, { "epoch": 1.53, "learning_rate": 6.980981437655042e-05, "loss": 0.0064, "step": 592020 }, { "epoch": 1.53, "learning_rate": 6.980592616017896e-05, "loss": 0.0112, "step": 592030 }, { "epoch": 1.53, "learning_rate": 6.980203794380749e-05, "loss": 0.0104, "step": 592040 }, { "epoch": 1.53, "learning_rate": 6.979814972743603e-05, "loss": 0.0116, "step": 592050 }, { "epoch": 1.53, "learning_rate": 6.979426151106457e-05, "loss": 0.0121, "step": 592060 }, { "epoch": 1.53, "learning_rate": 6.97903732946931e-05, "loss": 0.0094, "step": 592070 }, { "epoch": 1.53, "learning_rate": 6.978648507832164e-05, "loss": 0.0101, "step": 592080 }, { "epoch": 1.53, "learning_rate": 6.978259686195017e-05, "loss": 0.01, "step": 592090 }, { "epoch": 1.53, "learning_rate": 6.977870864557871e-05, "loss": 0.0109, "step": 592100 }, { "epoch": 1.53, "learning_rate": 6.977482042920724e-05, "loss": 0.0072, "step": 592110 }, { "epoch": 1.53, "learning_rate": 6.977093221283576e-05, "loss": 0.0096, "step": 592120 }, { "epoch": 1.53, "learning_rate": 6.97670439964643e-05, "loss": 0.0061, "step": 592130 }, { "epoch": 1.53, "learning_rate": 6.976315578009283e-05, "loss": 0.0069, "step": 592140 }, { "epoch": 1.53, "learning_rate": 6.975926756372138e-05, "loss": 0.0105, "step": 592150 }, { "epoch": 1.53, "learning_rate": 6.975537934734992e-05, "loss": 0.0084, "step": 592160 }, { "epoch": 1.53, "learning_rate": 6.975149113097845e-05, "loss": 0.0093, "step": 592170 }, { "epoch": 1.54, "learning_rate": 6.974760291460699e-05, "loss": 0.012, "step": 592180 }, { "epoch": 1.54, "learning_rate": 6.974371469823552e-05, "loss": 0.0095, "step": 592190 }, { "epoch": 1.54, "learning_rate": 6.973982648186406e-05, "loss": 0.0072, "step": 592200 }, { "epoch": 1.54, "learning_rate": 6.973593826549259e-05, "loss": 0.0086, "step": 592210 }, { "epoch": 1.54, "learning_rate": 6.973205004912113e-05, "loss": 0.0076, "step": 592220 }, { "epoch": 1.54, "learning_rate": 6.972816183274967e-05, "loss": 0.0077, "step": 592230 }, { "epoch": 1.54, "learning_rate": 6.97242736163782e-05, "loss": 0.0083, "step": 592240 }, { "epoch": 1.54, "learning_rate": 6.972038540000674e-05, "loss": 0.0066, "step": 592250 }, { "epoch": 1.54, "learning_rate": 6.971649718363527e-05, "loss": 0.0124, "step": 592260 }, { "epoch": 1.54, "learning_rate": 6.971260896726381e-05, "loss": 0.0065, "step": 592270 }, { "epoch": 1.54, "learning_rate": 6.970872075089234e-05, "loss": 0.0107, "step": 592280 }, { "epoch": 1.54, "learning_rate": 6.970483253452088e-05, "loss": 0.0088, "step": 592290 }, { "epoch": 1.54, "learning_rate": 6.97009443181494e-05, "loss": 0.0082, "step": 592300 }, { "epoch": 1.54, "learning_rate": 6.969705610177795e-05, "loss": 0.0063, "step": 592310 }, { "epoch": 1.54, "learning_rate": 6.969316788540649e-05, "loss": 0.0105, "step": 592320 }, { "epoch": 1.54, "learning_rate": 6.968927966903502e-05, "loss": 0.0101, "step": 592330 }, { "epoch": 1.54, "learning_rate": 6.968539145266356e-05, "loss": 0.0093, "step": 592340 }, { "epoch": 1.54, "learning_rate": 6.968150323629209e-05, "loss": 0.0088, "step": 592350 }, { "epoch": 1.54, "learning_rate": 6.967761501992062e-05, "loss": 0.0084, "step": 592360 }, { "epoch": 1.54, "learning_rate": 6.967372680354916e-05, "loss": 0.0081, "step": 592370 }, { "epoch": 1.54, "learning_rate": 6.966983858717768e-05, "loss": 0.0081, "step": 592380 }, { "epoch": 1.54, "learning_rate": 6.966595037080623e-05, "loss": 0.0095, "step": 592390 }, { "epoch": 1.54, "learning_rate": 6.966206215443475e-05, "loss": 0.009, "step": 592400 }, { "epoch": 1.54, "learning_rate": 6.96581739380633e-05, "loss": 0.0082, "step": 592410 }, { "epoch": 1.54, "learning_rate": 6.965428572169184e-05, "loss": 0.0089, "step": 592420 }, { "epoch": 1.54, "learning_rate": 6.965039750532037e-05, "loss": 0.0102, "step": 592430 }, { "epoch": 1.54, "learning_rate": 6.964650928894891e-05, "loss": 0.0099, "step": 592440 }, { "epoch": 1.54, "learning_rate": 6.964262107257744e-05, "loss": 0.0073, "step": 592450 }, { "epoch": 1.54, "learning_rate": 6.963873285620598e-05, "loss": 0.0073, "step": 592460 }, { "epoch": 1.54, "learning_rate": 6.96348446398345e-05, "loss": 0.0102, "step": 592470 }, { "epoch": 1.54, "learning_rate": 6.963095642346305e-05, "loss": 0.0074, "step": 592480 }, { "epoch": 1.54, "learning_rate": 6.962706820709159e-05, "loss": 0.0111, "step": 592490 }, { "epoch": 1.54, "learning_rate": 6.962317999072012e-05, "loss": 0.0092, "step": 592500 }, { "epoch": 1.54, "learning_rate": 6.961929177434866e-05, "loss": 0.0087, "step": 592510 }, { "epoch": 1.54, "learning_rate": 6.961540355797719e-05, "loss": 0.0086, "step": 592520 }, { "epoch": 1.54, "learning_rate": 6.961151534160573e-05, "loss": 0.0115, "step": 592530 }, { "epoch": 1.54, "learning_rate": 6.960762712523426e-05, "loss": 0.0103, "step": 592540 }, { "epoch": 1.54, "learning_rate": 6.96037389088628e-05, "loss": 0.0085, "step": 592550 }, { "epoch": 1.54, "learning_rate": 6.959985069249133e-05, "loss": 0.0094, "step": 592560 }, { "epoch": 1.54, "learning_rate": 6.959596247611987e-05, "loss": 0.0092, "step": 592570 }, { "epoch": 1.54, "learning_rate": 6.959207425974841e-05, "loss": 0.0086, "step": 592580 }, { "epoch": 1.54, "learning_rate": 6.958818604337694e-05, "loss": 0.0081, "step": 592590 }, { "epoch": 1.54, "learning_rate": 6.958429782700548e-05, "loss": 0.0073, "step": 592600 }, { "epoch": 1.54, "learning_rate": 6.958040961063401e-05, "loss": 0.0089, "step": 592610 }, { "epoch": 1.54, "learning_rate": 6.957652139426254e-05, "loss": 0.0095, "step": 592620 }, { "epoch": 1.54, "learning_rate": 6.957263317789108e-05, "loss": 0.0122, "step": 592630 }, { "epoch": 1.54, "learning_rate": 6.95687449615196e-05, "loss": 0.0066, "step": 592640 }, { "epoch": 1.54, "learning_rate": 6.956485674514815e-05, "loss": 0.0066, "step": 592650 }, { "epoch": 1.54, "learning_rate": 6.956096852877667e-05, "loss": 0.008, "step": 592660 }, { "epoch": 1.54, "learning_rate": 6.955708031240522e-05, "loss": 0.0091, "step": 592670 }, { "epoch": 1.54, "learning_rate": 6.955319209603376e-05, "loss": 0.0131, "step": 592680 }, { "epoch": 1.54, "learning_rate": 6.954930387966229e-05, "loss": 0.0122, "step": 592690 }, { "epoch": 1.54, "learning_rate": 6.954541566329083e-05, "loss": 0.0087, "step": 592700 }, { "epoch": 1.54, "learning_rate": 6.954152744691936e-05, "loss": 0.0077, "step": 592710 }, { "epoch": 1.54, "learning_rate": 6.95376392305479e-05, "loss": 0.0089, "step": 592720 }, { "epoch": 1.54, "learning_rate": 6.953375101417643e-05, "loss": 0.0119, "step": 592730 }, { "epoch": 1.54, "learning_rate": 6.952986279780497e-05, "loss": 0.0085, "step": 592740 }, { "epoch": 1.54, "learning_rate": 6.952597458143351e-05, "loss": 0.0106, "step": 592750 }, { "epoch": 1.54, "learning_rate": 6.952208636506204e-05, "loss": 0.0112, "step": 592760 }, { "epoch": 1.54, "learning_rate": 6.951819814869058e-05, "loss": 0.0101, "step": 592770 }, { "epoch": 1.54, "learning_rate": 6.95143099323191e-05, "loss": 0.0065, "step": 592780 }, { "epoch": 1.54, "learning_rate": 6.951042171594765e-05, "loss": 0.0111, "step": 592790 }, { "epoch": 1.54, "learning_rate": 6.950653349957618e-05, "loss": 0.0096, "step": 592800 }, { "epoch": 1.54, "learning_rate": 6.950264528320472e-05, "loss": 0.0102, "step": 592810 }, { "epoch": 1.54, "learning_rate": 6.949875706683325e-05, "loss": 0.0092, "step": 592820 }, { "epoch": 1.54, "learning_rate": 6.949486885046179e-05, "loss": 0.0087, "step": 592830 }, { "epoch": 1.54, "learning_rate": 6.949098063409033e-05, "loss": 0.0071, "step": 592840 }, { "epoch": 1.54, "learning_rate": 6.948709241771886e-05, "loss": 0.0097, "step": 592850 }, { "epoch": 1.54, "learning_rate": 6.948320420134739e-05, "loss": 0.0092, "step": 592860 }, { "epoch": 1.54, "learning_rate": 6.947931598497593e-05, "loss": 0.0072, "step": 592870 }, { "epoch": 1.54, "learning_rate": 6.947542776860446e-05, "loss": 0.01, "step": 592880 }, { "epoch": 1.54, "learning_rate": 6.9471539552233e-05, "loss": 0.0086, "step": 592890 }, { "epoch": 1.54, "learning_rate": 6.946765133586152e-05, "loss": 0.0111, "step": 592900 }, { "epoch": 1.54, "learning_rate": 6.946376311949007e-05, "loss": 0.0086, "step": 592910 }, { "epoch": 1.54, "learning_rate": 6.94598749031186e-05, "loss": 0.0079, "step": 592920 }, { "epoch": 1.54, "learning_rate": 6.945598668674714e-05, "loss": 0.0092, "step": 592930 }, { "epoch": 1.54, "learning_rate": 6.945209847037568e-05, "loss": 0.0083, "step": 592940 }, { "epoch": 1.54, "learning_rate": 6.94482102540042e-05, "loss": 0.007, "step": 592950 }, { "epoch": 1.54, "learning_rate": 6.944432203763275e-05, "loss": 0.0095, "step": 592960 }, { "epoch": 1.54, "learning_rate": 6.944043382126128e-05, "loss": 0.0082, "step": 592970 }, { "epoch": 1.54, "learning_rate": 6.943654560488982e-05, "loss": 0.0108, "step": 592980 }, { "epoch": 1.54, "learning_rate": 6.943265738851835e-05, "loss": 0.0056, "step": 592990 }, { "epoch": 1.54, "learning_rate": 6.942876917214689e-05, "loss": 0.0097, "step": 593000 }, { "epoch": 1.54, "eval_cer": 0.8816872903168917, "eval_loss": 0.005945616401731968, "eval_runtime": 107.8905, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 593000 }, { "epoch": 1.54, "learning_rate": 6.942488095577543e-05, "loss": 0.0064, "step": 593010 }, { "epoch": 1.54, "learning_rate": 6.942099273940396e-05, "loss": 0.0081, "step": 593020 }, { "epoch": 1.54, "learning_rate": 6.94171045230325e-05, "loss": 0.0092, "step": 593030 }, { "epoch": 1.54, "learning_rate": 6.941321630666103e-05, "loss": 0.0071, "step": 593040 }, { "epoch": 1.54, "learning_rate": 6.940932809028957e-05, "loss": 0.0106, "step": 593050 }, { "epoch": 1.54, "learning_rate": 6.94054398739181e-05, "loss": 0.0057, "step": 593060 }, { "epoch": 1.54, "learning_rate": 6.940155165754664e-05, "loss": 0.0082, "step": 593070 }, { "epoch": 1.54, "learning_rate": 6.939766344117517e-05, "loss": 0.0079, "step": 593080 }, { "epoch": 1.54, "learning_rate": 6.939377522480371e-05, "loss": 0.0103, "step": 593090 }, { "epoch": 1.54, "learning_rate": 6.938988700843224e-05, "loss": 0.0127, "step": 593100 }, { "epoch": 1.54, "learning_rate": 6.938599879206078e-05, "loss": 0.0101, "step": 593110 }, { "epoch": 1.54, "learning_rate": 6.93821105756893e-05, "loss": 0.0083, "step": 593120 }, { "epoch": 1.54, "learning_rate": 6.937822235931785e-05, "loss": 0.01, "step": 593130 }, { "epoch": 1.54, "learning_rate": 6.937433414294638e-05, "loss": 0.0094, "step": 593140 }, { "epoch": 1.54, "learning_rate": 6.937044592657492e-05, "loss": 0.0083, "step": 593150 }, { "epoch": 1.54, "learning_rate": 6.936655771020344e-05, "loss": 0.0083, "step": 593160 }, { "epoch": 1.54, "learning_rate": 6.936266949383199e-05, "loss": 0.0082, "step": 593170 }, { "epoch": 1.54, "learning_rate": 6.935878127746051e-05, "loss": 0.0111, "step": 593180 }, { "epoch": 1.54, "learning_rate": 6.935489306108906e-05, "loss": 0.0075, "step": 593190 }, { "epoch": 1.54, "learning_rate": 6.93510048447176e-05, "loss": 0.0087, "step": 593200 }, { "epoch": 1.54, "learning_rate": 6.934711662834613e-05, "loss": 0.0093, "step": 593210 }, { "epoch": 1.54, "learning_rate": 6.934322841197467e-05, "loss": 0.0092, "step": 593220 }, { "epoch": 1.54, "learning_rate": 6.93393401956032e-05, "loss": 0.0109, "step": 593230 }, { "epoch": 1.54, "learning_rate": 6.933545197923174e-05, "loss": 0.0087, "step": 593240 }, { "epoch": 1.54, "learning_rate": 6.933156376286027e-05, "loss": 0.0133, "step": 593250 }, { "epoch": 1.54, "learning_rate": 6.932767554648881e-05, "loss": 0.0086, "step": 593260 }, { "epoch": 1.54, "learning_rate": 6.932378733011735e-05, "loss": 0.0096, "step": 593270 }, { "epoch": 1.54, "learning_rate": 6.931989911374588e-05, "loss": 0.0121, "step": 593280 }, { "epoch": 1.54, "learning_rate": 6.931601089737442e-05, "loss": 0.0064, "step": 593290 }, { "epoch": 1.54, "learning_rate": 6.931212268100295e-05, "loss": 0.0093, "step": 593300 }, { "epoch": 1.54, "learning_rate": 6.930823446463149e-05, "loss": 0.0101, "step": 593310 }, { "epoch": 1.54, "learning_rate": 6.930434624826002e-05, "loss": 0.0074, "step": 593320 }, { "epoch": 1.54, "learning_rate": 6.930045803188856e-05, "loss": 0.0088, "step": 593330 }, { "epoch": 1.54, "learning_rate": 6.929656981551709e-05, "loss": 0.0114, "step": 593340 }, { "epoch": 1.54, "learning_rate": 6.929268159914561e-05, "loss": 0.0087, "step": 593350 }, { "epoch": 1.54, "learning_rate": 6.928879338277416e-05, "loss": 0.0106, "step": 593360 }, { "epoch": 1.54, "learning_rate": 6.92849051664027e-05, "loss": 0.0085, "step": 593370 }, { "epoch": 1.54, "learning_rate": 6.928101695003123e-05, "loss": 0.008, "step": 593380 }, { "epoch": 1.54, "learning_rate": 6.927712873365977e-05, "loss": 0.0099, "step": 593390 }, { "epoch": 1.54, "learning_rate": 6.92732405172883e-05, "loss": 0.0051, "step": 593400 }, { "epoch": 1.54, "learning_rate": 6.926935230091684e-05, "loss": 0.0081, "step": 593410 }, { "epoch": 1.54, "learning_rate": 6.926546408454536e-05, "loss": 0.0094, "step": 593420 }, { "epoch": 1.54, "learning_rate": 6.92615758681739e-05, "loss": 0.0084, "step": 593430 }, { "epoch": 1.54, "learning_rate": 6.925768765180243e-05, "loss": 0.0081, "step": 593440 }, { "epoch": 1.54, "learning_rate": 6.925379943543098e-05, "loss": 0.0124, "step": 593450 }, { "epoch": 1.54, "learning_rate": 6.924991121905952e-05, "loss": 0.0123, "step": 593460 }, { "epoch": 1.54, "learning_rate": 6.924602300268805e-05, "loss": 0.0086, "step": 593470 }, { "epoch": 1.54, "learning_rate": 6.924213478631659e-05, "loss": 0.0087, "step": 593480 }, { "epoch": 1.54, "learning_rate": 6.923824656994512e-05, "loss": 0.0085, "step": 593490 }, { "epoch": 1.54, "learning_rate": 6.923435835357366e-05, "loss": 0.0096, "step": 593500 }, { "epoch": 1.54, "learning_rate": 6.923047013720219e-05, "loss": 0.0092, "step": 593510 }, { "epoch": 1.54, "learning_rate": 6.922658192083073e-05, "loss": 0.0075, "step": 593520 }, { "epoch": 1.54, "learning_rate": 6.922269370445925e-05, "loss": 0.0164, "step": 593530 }, { "epoch": 1.54, "learning_rate": 6.92188054880878e-05, "loss": 0.0095, "step": 593540 }, { "epoch": 1.54, "learning_rate": 6.921491727171634e-05, "loss": 0.0092, "step": 593550 }, { "epoch": 1.54, "learning_rate": 6.921102905534487e-05, "loss": 0.0093, "step": 593560 }, { "epoch": 1.54, "learning_rate": 6.920714083897341e-05, "loss": 0.0098, "step": 593570 }, { "epoch": 1.54, "learning_rate": 6.920325262260194e-05, "loss": 0.0083, "step": 593580 }, { "epoch": 1.54, "learning_rate": 6.919936440623048e-05, "loss": 0.0093, "step": 593590 }, { "epoch": 1.54, "learning_rate": 6.9195476189859e-05, "loss": 0.0077, "step": 593600 }, { "epoch": 1.54, "learning_rate": 6.919158797348753e-05, "loss": 0.0072, "step": 593610 }, { "epoch": 1.54, "learning_rate": 6.918769975711608e-05, "loss": 0.0059, "step": 593620 }, { "epoch": 1.54, "learning_rate": 6.91838115407446e-05, "loss": 0.0083, "step": 593630 }, { "epoch": 1.54, "learning_rate": 6.917992332437315e-05, "loss": 0.0089, "step": 593640 }, { "epoch": 1.54, "learning_rate": 6.917603510800169e-05, "loss": 0.0134, "step": 593650 }, { "epoch": 1.54, "learning_rate": 6.917214689163021e-05, "loss": 0.0103, "step": 593660 }, { "epoch": 1.54, "learning_rate": 6.916825867525876e-05, "loss": 0.0091, "step": 593670 }, { "epoch": 1.54, "learning_rate": 6.916437045888728e-05, "loss": 0.009, "step": 593680 }, { "epoch": 1.54, "learning_rate": 6.916048224251583e-05, "loss": 0.0152, "step": 593690 }, { "epoch": 1.54, "learning_rate": 6.915659402614435e-05, "loss": 0.0065, "step": 593700 }, { "epoch": 1.54, "learning_rate": 6.91527058097729e-05, "loss": 0.0097, "step": 593710 }, { "epoch": 1.54, "learning_rate": 6.914881759340144e-05, "loss": 0.0055, "step": 593720 }, { "epoch": 1.54, "learning_rate": 6.914492937702997e-05, "loss": 0.0092, "step": 593730 }, { "epoch": 1.54, "learning_rate": 6.914104116065851e-05, "loss": 0.0078, "step": 593740 }, { "epoch": 1.54, "learning_rate": 6.913715294428704e-05, "loss": 0.0104, "step": 593750 }, { "epoch": 1.54, "learning_rate": 6.913326472791558e-05, "loss": 0.0102, "step": 593760 }, { "epoch": 1.54, "learning_rate": 6.91293765115441e-05, "loss": 0.01, "step": 593770 }, { "epoch": 1.54, "learning_rate": 6.912548829517265e-05, "loss": 0.0116, "step": 593780 }, { "epoch": 1.54, "learning_rate": 6.912160007880117e-05, "loss": 0.0076, "step": 593790 }, { "epoch": 1.54, "learning_rate": 6.911771186242972e-05, "loss": 0.0088, "step": 593800 }, { "epoch": 1.54, "learning_rate": 6.911382364605826e-05, "loss": 0.0087, "step": 593810 }, { "epoch": 1.54, "learning_rate": 6.910993542968679e-05, "loss": 0.0101, "step": 593820 }, { "epoch": 1.54, "learning_rate": 6.910604721331533e-05, "loss": 0.0073, "step": 593830 }, { "epoch": 1.54, "learning_rate": 6.910215899694386e-05, "loss": 0.0077, "step": 593840 }, { "epoch": 1.54, "learning_rate": 6.909827078057238e-05, "loss": 0.0114, "step": 593850 }, { "epoch": 1.54, "learning_rate": 6.909438256420093e-05, "loss": 0.0112, "step": 593860 }, { "epoch": 1.54, "learning_rate": 6.909049434782945e-05, "loss": 0.0084, "step": 593870 }, { "epoch": 1.54, "learning_rate": 6.9086606131458e-05, "loss": 0.0097, "step": 593880 }, { "epoch": 1.54, "learning_rate": 6.908271791508652e-05, "loss": 0.0084, "step": 593890 }, { "epoch": 1.54, "learning_rate": 6.907882969871507e-05, "loss": 0.0096, "step": 593900 }, { "epoch": 1.54, "learning_rate": 6.907494148234361e-05, "loss": 0.0086, "step": 593910 }, { "epoch": 1.54, "learning_rate": 6.907105326597213e-05, "loss": 0.0095, "step": 593920 }, { "epoch": 1.54, "learning_rate": 6.906716504960068e-05, "loss": 0.0108, "step": 593930 }, { "epoch": 1.54, "learning_rate": 6.90632768332292e-05, "loss": 0.0118, "step": 593940 }, { "epoch": 1.54, "learning_rate": 6.905938861685775e-05, "loss": 0.0102, "step": 593950 }, { "epoch": 1.54, "learning_rate": 6.905550040048627e-05, "loss": 0.0088, "step": 593960 }, { "epoch": 1.54, "learning_rate": 6.905161218411482e-05, "loss": 0.01, "step": 593970 }, { "epoch": 1.54, "learning_rate": 6.904772396774336e-05, "loss": 0.0103, "step": 593980 }, { "epoch": 1.54, "learning_rate": 6.904383575137189e-05, "loss": 0.0097, "step": 593990 }, { "epoch": 1.54, "learning_rate": 6.903994753500043e-05, "loss": 0.0116, "step": 594000 }, { "epoch": 1.54, "eval_cer": 0.8816998870492994, "eval_loss": 0.005914547014981508, "eval_runtime": 107.9749, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 594000 }, { "epoch": 1.54, "learning_rate": 6.903605931862896e-05, "loss": 0.0106, "step": 594010 }, { "epoch": 1.54, "learning_rate": 6.90321711022575e-05, "loss": 0.0092, "step": 594020 }, { "epoch": 1.54, "learning_rate": 6.902828288588603e-05, "loss": 0.0096, "step": 594030 }, { "epoch": 1.54, "learning_rate": 6.902439466951457e-05, "loss": 0.0105, "step": 594040 }, { "epoch": 1.54, "learning_rate": 6.90205064531431e-05, "loss": 0.007, "step": 594050 }, { "epoch": 1.54, "learning_rate": 6.901661823677164e-05, "loss": 0.0112, "step": 594060 }, { "epoch": 1.54, "learning_rate": 6.901273002040018e-05, "loss": 0.0127, "step": 594070 }, { "epoch": 1.54, "learning_rate": 6.90088418040287e-05, "loss": 0.0065, "step": 594080 }, { "epoch": 1.54, "learning_rate": 6.900495358765725e-05, "loss": 0.0097, "step": 594090 }, { "epoch": 1.54, "learning_rate": 6.900106537128578e-05, "loss": 0.0066, "step": 594100 }, { "epoch": 1.54, "learning_rate": 6.89971771549143e-05, "loss": 0.0091, "step": 594110 }, { "epoch": 1.54, "learning_rate": 6.899328893854285e-05, "loss": 0.0085, "step": 594120 }, { "epoch": 1.54, "learning_rate": 6.898940072217137e-05, "loss": 0.0102, "step": 594130 }, { "epoch": 1.54, "learning_rate": 6.898551250579992e-05, "loss": 0.0107, "step": 594140 }, { "epoch": 1.54, "learning_rate": 6.898162428942844e-05, "loss": 0.0077, "step": 594150 }, { "epoch": 1.54, "learning_rate": 6.897773607305699e-05, "loss": 0.0098, "step": 594160 }, { "epoch": 1.54, "learning_rate": 6.897384785668553e-05, "loss": 0.008, "step": 594170 }, { "epoch": 1.54, "learning_rate": 6.896995964031405e-05, "loss": 0.0097, "step": 594180 }, { "epoch": 1.54, "learning_rate": 6.89660714239426e-05, "loss": 0.0102, "step": 594190 }, { "epoch": 1.54, "learning_rate": 6.896218320757112e-05, "loss": 0.0081, "step": 594200 }, { "epoch": 1.54, "learning_rate": 6.895829499119967e-05, "loss": 0.0085, "step": 594210 }, { "epoch": 1.54, "learning_rate": 6.89544067748282e-05, "loss": 0.0092, "step": 594220 }, { "epoch": 1.54, "learning_rate": 6.895051855845674e-05, "loss": 0.0117, "step": 594230 }, { "epoch": 1.54, "learning_rate": 6.894663034208528e-05, "loss": 0.0099, "step": 594240 }, { "epoch": 1.54, "learning_rate": 6.89427421257138e-05, "loss": 0.0089, "step": 594250 }, { "epoch": 1.54, "learning_rate": 6.893885390934235e-05, "loss": 0.0103, "step": 594260 }, { "epoch": 1.54, "learning_rate": 6.893496569297088e-05, "loss": 0.0095, "step": 594270 }, { "epoch": 1.54, "learning_rate": 6.893107747659942e-05, "loss": 0.0085, "step": 594280 }, { "epoch": 1.54, "learning_rate": 6.892718926022795e-05, "loss": 0.009, "step": 594290 }, { "epoch": 1.54, "learning_rate": 6.892330104385649e-05, "loss": 0.0076, "step": 594300 }, { "epoch": 1.54, "learning_rate": 6.891941282748501e-05, "loss": 0.0089, "step": 594310 }, { "epoch": 1.54, "learning_rate": 6.891552461111356e-05, "loss": 0.0081, "step": 594320 }, { "epoch": 1.54, "learning_rate": 6.89116363947421e-05, "loss": 0.008, "step": 594330 }, { "epoch": 1.54, "learning_rate": 6.890774817837063e-05, "loss": 0.0087, "step": 594340 }, { "epoch": 1.54, "learning_rate": 6.890385996199915e-05, "loss": 0.0076, "step": 594350 }, { "epoch": 1.54, "learning_rate": 6.88999717456277e-05, "loss": 0.0084, "step": 594360 }, { "epoch": 1.54, "learning_rate": 6.889608352925622e-05, "loss": 0.0066, "step": 594370 }, { "epoch": 1.54, "learning_rate": 6.889219531288477e-05, "loss": 0.0069, "step": 594380 }, { "epoch": 1.54, "learning_rate": 6.88883070965133e-05, "loss": 0.0095, "step": 594390 }, { "epoch": 1.54, "learning_rate": 6.888441888014184e-05, "loss": 0.011, "step": 594400 }, { "epoch": 1.54, "learning_rate": 6.888053066377036e-05, "loss": 0.0088, "step": 594410 }, { "epoch": 1.54, "learning_rate": 6.88766424473989e-05, "loss": 0.0075, "step": 594420 }, { "epoch": 1.54, "learning_rate": 6.887275423102745e-05, "loss": 0.0104, "step": 594430 }, { "epoch": 1.54, "learning_rate": 6.886886601465597e-05, "loss": 0.0104, "step": 594440 }, { "epoch": 1.54, "learning_rate": 6.886497779828452e-05, "loss": 0.0115, "step": 594450 }, { "epoch": 1.54, "learning_rate": 6.886108958191304e-05, "loss": 0.0064, "step": 594460 }, { "epoch": 1.54, "learning_rate": 6.885720136554159e-05, "loss": 0.0068, "step": 594470 }, { "epoch": 1.54, "learning_rate": 6.885331314917011e-05, "loss": 0.0101, "step": 594480 }, { "epoch": 1.54, "learning_rate": 6.884942493279866e-05, "loss": 0.0094, "step": 594490 }, { "epoch": 1.54, "learning_rate": 6.88455367164272e-05, "loss": 0.0076, "step": 594500 }, { "epoch": 1.54, "learning_rate": 6.884164850005573e-05, "loss": 0.0081, "step": 594510 }, { "epoch": 1.54, "learning_rate": 6.883776028368427e-05, "loss": 0.0069, "step": 594520 }, { "epoch": 1.54, "learning_rate": 6.88338720673128e-05, "loss": 0.0085, "step": 594530 }, { "epoch": 1.54, "learning_rate": 6.882998385094134e-05, "loss": 0.0106, "step": 594540 }, { "epoch": 1.54, "learning_rate": 6.882609563456987e-05, "loss": 0.0061, "step": 594550 }, { "epoch": 1.54, "learning_rate": 6.88222074181984e-05, "loss": 0.007, "step": 594560 }, { "epoch": 1.54, "learning_rate": 6.881831920182693e-05, "loss": 0.007, "step": 594570 }, { "epoch": 1.54, "learning_rate": 6.881443098545548e-05, "loss": 0.0069, "step": 594580 }, { "epoch": 1.54, "learning_rate": 6.8810542769084e-05, "loss": 0.0089, "step": 594590 }, { "epoch": 1.54, "learning_rate": 6.880665455271255e-05, "loss": 0.0087, "step": 594600 }, { "epoch": 1.54, "learning_rate": 6.880276633634107e-05, "loss": 0.0068, "step": 594610 }, { "epoch": 1.54, "learning_rate": 6.879887811996962e-05, "loss": 0.0087, "step": 594620 }, { "epoch": 1.54, "learning_rate": 6.879498990359814e-05, "loss": 0.0076, "step": 594630 }, { "epoch": 1.54, "learning_rate": 6.879110168722669e-05, "loss": 0.0127, "step": 594640 }, { "epoch": 1.54, "learning_rate": 6.878721347085521e-05, "loss": 0.0077, "step": 594650 }, { "epoch": 1.54, "learning_rate": 6.878332525448376e-05, "loss": 0.0098, "step": 594660 }, { "epoch": 1.54, "learning_rate": 6.877943703811228e-05, "loss": 0.0108, "step": 594670 }, { "epoch": 1.54, "learning_rate": 6.877554882174083e-05, "loss": 0.0116, "step": 594680 }, { "epoch": 1.54, "learning_rate": 6.877166060536937e-05, "loss": 0.008, "step": 594690 }, { "epoch": 1.54, "learning_rate": 6.87677723889979e-05, "loss": 0.008, "step": 594700 }, { "epoch": 1.54, "learning_rate": 6.876388417262644e-05, "loss": 0.0081, "step": 594710 }, { "epoch": 1.54, "learning_rate": 6.875999595625496e-05, "loss": 0.008, "step": 594720 }, { "epoch": 1.54, "learning_rate": 6.87561077398835e-05, "loss": 0.0114, "step": 594730 }, { "epoch": 1.54, "learning_rate": 6.875221952351203e-05, "loss": 0.013, "step": 594740 }, { "epoch": 1.54, "learning_rate": 6.874833130714058e-05, "loss": 0.0096, "step": 594750 }, { "epoch": 1.54, "learning_rate": 6.87444430907691e-05, "loss": 0.0097, "step": 594760 }, { "epoch": 1.54, "learning_rate": 6.874055487439765e-05, "loss": 0.009, "step": 594770 }, { "epoch": 1.54, "learning_rate": 6.873666665802619e-05, "loss": 0.0091, "step": 594780 }, { "epoch": 1.54, "learning_rate": 6.873277844165472e-05, "loss": 0.0112, "step": 594790 }, { "epoch": 1.54, "learning_rate": 6.872889022528326e-05, "loss": 0.0087, "step": 594800 }, { "epoch": 1.54, "learning_rate": 6.872500200891179e-05, "loss": 0.0097, "step": 594810 }, { "epoch": 1.54, "learning_rate": 6.872111379254033e-05, "loss": 0.0074, "step": 594820 }, { "epoch": 1.54, "learning_rate": 6.871722557616885e-05, "loss": 0.0073, "step": 594830 }, { "epoch": 1.54, "learning_rate": 6.871333735979738e-05, "loss": 0.0084, "step": 594840 }, { "epoch": 1.54, "learning_rate": 6.870944914342592e-05, "loss": 0.0092, "step": 594850 }, { "epoch": 1.54, "learning_rate": 6.870556092705447e-05, "loss": 0.0085, "step": 594860 }, { "epoch": 1.54, "learning_rate": 6.8701672710683e-05, "loss": 0.0087, "step": 594870 }, { "epoch": 1.54, "learning_rate": 6.869778449431154e-05, "loss": 0.0081, "step": 594880 }, { "epoch": 1.54, "learning_rate": 6.869389627794006e-05, "loss": 0.0125, "step": 594890 }, { "epoch": 1.54, "learning_rate": 6.86900080615686e-05, "loss": 0.0067, "step": 594900 }, { "epoch": 1.54, "learning_rate": 6.868611984519713e-05, "loss": 0.0081, "step": 594910 }, { "epoch": 1.54, "learning_rate": 6.868223162882568e-05, "loss": 0.0075, "step": 594920 }, { "epoch": 1.54, "learning_rate": 6.86783434124542e-05, "loss": 0.0082, "step": 594930 }, { "epoch": 1.54, "learning_rate": 6.867445519608275e-05, "loss": 0.0108, "step": 594940 }, { "epoch": 1.54, "learning_rate": 6.867056697971129e-05, "loss": 0.01, "step": 594950 }, { "epoch": 1.54, "learning_rate": 6.866667876333981e-05, "loss": 0.008, "step": 594960 }, { "epoch": 1.54, "learning_rate": 6.866279054696836e-05, "loss": 0.0106, "step": 594970 }, { "epoch": 1.54, "learning_rate": 6.865890233059688e-05, "loss": 0.0073, "step": 594980 }, { "epoch": 1.54, "learning_rate": 6.865501411422543e-05, "loss": 0.0084, "step": 594990 }, { "epoch": 1.54, "learning_rate": 6.865112589785395e-05, "loss": 0.0088, "step": 595000 }, { "epoch": 1.54, "eval_cer": 0.8817082848709045, "eval_loss": 0.00575125589966774, "eval_runtime": 107.7066, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 595000 }, { "epoch": 1.54, "learning_rate": 6.86472376814825e-05, "loss": 0.0097, "step": 595010 }, { "epoch": 1.54, "learning_rate": 6.864334946511102e-05, "loss": 0.0103, "step": 595020 }, { "epoch": 1.54, "learning_rate": 6.863946124873957e-05, "loss": 0.0075, "step": 595030 }, { "epoch": 1.54, "learning_rate": 6.863557303236811e-05, "loss": 0.0106, "step": 595040 }, { "epoch": 1.54, "learning_rate": 6.863168481599664e-05, "loss": 0.0073, "step": 595050 }, { "epoch": 1.54, "learning_rate": 6.862779659962518e-05, "loss": 0.0096, "step": 595060 }, { "epoch": 1.54, "learning_rate": 6.86239083832537e-05, "loss": 0.0079, "step": 595070 }, { "epoch": 1.54, "learning_rate": 6.862002016688225e-05, "loss": 0.0099, "step": 595080 }, { "epoch": 1.54, "learning_rate": 6.861613195051077e-05, "loss": 0.0102, "step": 595090 }, { "epoch": 1.54, "learning_rate": 6.86122437341393e-05, "loss": 0.0099, "step": 595100 }, { "epoch": 1.54, "learning_rate": 6.860835551776784e-05, "loss": 0.0104, "step": 595110 }, { "epoch": 1.54, "learning_rate": 6.860446730139637e-05, "loss": 0.0082, "step": 595120 }, { "epoch": 1.54, "learning_rate": 6.860057908502491e-05, "loss": 0.0119, "step": 595130 }, { "epoch": 1.54, "learning_rate": 6.859669086865346e-05, "loss": 0.0094, "step": 595140 }, { "epoch": 1.54, "learning_rate": 6.859280265228198e-05, "loss": 0.0089, "step": 595150 }, { "epoch": 1.54, "learning_rate": 6.858891443591053e-05, "loss": 0.0084, "step": 595160 }, { "epoch": 1.54, "learning_rate": 6.858502621953905e-05, "loss": 0.0074, "step": 595170 }, { "epoch": 1.54, "learning_rate": 6.85811380031676e-05, "loss": 0.0075, "step": 595180 }, { "epoch": 1.54, "learning_rate": 6.857724978679612e-05, "loss": 0.0088, "step": 595190 }, { "epoch": 1.54, "learning_rate": 6.857336157042466e-05, "loss": 0.0099, "step": 595200 }, { "epoch": 1.54, "learning_rate": 6.85694733540532e-05, "loss": 0.0072, "step": 595210 }, { "epoch": 1.54, "learning_rate": 6.856558513768173e-05, "loss": 0.0102, "step": 595220 }, { "epoch": 1.54, "learning_rate": 6.856169692131028e-05, "loss": 0.0087, "step": 595230 }, { "epoch": 1.54, "learning_rate": 6.85578087049388e-05, "loss": 0.0096, "step": 595240 }, { "epoch": 1.54, "learning_rate": 6.855392048856735e-05, "loss": 0.0062, "step": 595250 }, { "epoch": 1.54, "learning_rate": 6.855003227219587e-05, "loss": 0.0071, "step": 595260 }, { "epoch": 1.54, "learning_rate": 6.854614405582442e-05, "loss": 0.0102, "step": 595270 }, { "epoch": 1.54, "learning_rate": 6.854225583945294e-05, "loss": 0.0072, "step": 595280 }, { "epoch": 1.54, "learning_rate": 6.853836762308149e-05, "loss": 0.0109, "step": 595290 }, { "epoch": 1.54, "learning_rate": 6.853447940671003e-05, "loss": 0.0068, "step": 595300 }, { "epoch": 1.54, "learning_rate": 6.853059119033856e-05, "loss": 0.0086, "step": 595310 }, { "epoch": 1.54, "learning_rate": 6.85267029739671e-05, "loss": 0.0069, "step": 595320 }, { "epoch": 1.54, "learning_rate": 6.852281475759562e-05, "loss": 0.009, "step": 595330 }, { "epoch": 1.54, "learning_rate": 6.851892654122415e-05, "loss": 0.0105, "step": 595340 }, { "epoch": 1.54, "learning_rate": 6.85150383248527e-05, "loss": 0.0125, "step": 595350 }, { "epoch": 1.54, "learning_rate": 6.851115010848122e-05, "loss": 0.0134, "step": 595360 }, { "epoch": 1.54, "learning_rate": 6.850726189210976e-05, "loss": 0.0078, "step": 595370 }, { "epoch": 1.54, "learning_rate": 6.850337367573829e-05, "loss": 0.0073, "step": 595380 }, { "epoch": 1.54, "learning_rate": 6.849948545936683e-05, "loss": 0.0107, "step": 595390 }, { "epoch": 1.54, "learning_rate": 6.849559724299538e-05, "loss": 0.0077, "step": 595400 }, { "epoch": 1.54, "learning_rate": 6.84917090266239e-05, "loss": 0.0087, "step": 595410 }, { "epoch": 1.54, "learning_rate": 6.848782081025245e-05, "loss": 0.0123, "step": 595420 }, { "epoch": 1.54, "learning_rate": 6.848393259388097e-05, "loss": 0.0123, "step": 595430 }, { "epoch": 1.54, "learning_rate": 6.848004437750952e-05, "loss": 0.009, "step": 595440 }, { "epoch": 1.54, "learning_rate": 6.847615616113804e-05, "loss": 0.0078, "step": 595450 }, { "epoch": 1.54, "learning_rate": 6.847226794476658e-05, "loss": 0.0102, "step": 595460 }, { "epoch": 1.54, "learning_rate": 6.846837972839513e-05, "loss": 0.0129, "step": 595470 }, { "epoch": 1.54, "learning_rate": 6.846449151202365e-05, "loss": 0.0089, "step": 595480 }, { "epoch": 1.54, "learning_rate": 6.84606032956522e-05, "loss": 0.0082, "step": 595490 }, { "epoch": 1.54, "learning_rate": 6.845671507928072e-05, "loss": 0.0076, "step": 595500 }, { "epoch": 1.54, "learning_rate": 6.845282686290927e-05, "loss": 0.0088, "step": 595510 }, { "epoch": 1.54, "learning_rate": 6.84489386465378e-05, "loss": 0.0066, "step": 595520 }, { "epoch": 1.54, "learning_rate": 6.844505043016634e-05, "loss": 0.0121, "step": 595530 }, { "epoch": 1.54, "learning_rate": 6.844116221379486e-05, "loss": 0.0085, "step": 595540 }, { "epoch": 1.54, "learning_rate": 6.84372739974234e-05, "loss": 0.0081, "step": 595550 }, { "epoch": 1.54, "learning_rate": 6.843338578105195e-05, "loss": 0.0086, "step": 595560 }, { "epoch": 1.54, "learning_rate": 6.842949756468048e-05, "loss": 0.0086, "step": 595570 }, { "epoch": 1.54, "learning_rate": 6.8425609348309e-05, "loss": 0.0074, "step": 595580 }, { "epoch": 1.54, "learning_rate": 6.842172113193754e-05, "loss": 0.0114, "step": 595590 }, { "epoch": 1.54, "learning_rate": 6.841783291556607e-05, "loss": 0.0068, "step": 595600 }, { "epoch": 1.54, "learning_rate": 6.841394469919461e-05, "loss": 0.0085, "step": 595610 }, { "epoch": 1.54, "learning_rate": 6.841005648282314e-05, "loss": 0.0113, "step": 595620 }, { "epoch": 1.54, "learning_rate": 6.840616826645168e-05, "loss": 0.0079, "step": 595630 }, { "epoch": 1.54, "learning_rate": 6.840228005008021e-05, "loss": 0.0092, "step": 595640 }, { "epoch": 1.54, "learning_rate": 6.839839183370875e-05, "loss": 0.0084, "step": 595650 }, { "epoch": 1.54, "learning_rate": 6.83945036173373e-05, "loss": 0.0102, "step": 595660 }, { "epoch": 1.54, "learning_rate": 6.839061540096582e-05, "loss": 0.0078, "step": 595670 }, { "epoch": 1.54, "learning_rate": 6.838672718459437e-05, "loss": 0.0094, "step": 595680 }, { "epoch": 1.54, "learning_rate": 6.83828389682229e-05, "loss": 0.0067, "step": 595690 }, { "epoch": 1.54, "learning_rate": 6.837895075185144e-05, "loss": 0.0102, "step": 595700 }, { "epoch": 1.54, "learning_rate": 6.837506253547996e-05, "loss": 0.0094, "step": 595710 }, { "epoch": 1.54, "learning_rate": 6.83711743191085e-05, "loss": 0.0121, "step": 595720 }, { "epoch": 1.54, "learning_rate": 6.836728610273705e-05, "loss": 0.0079, "step": 595730 }, { "epoch": 1.54, "learning_rate": 6.836339788636557e-05, "loss": 0.0098, "step": 595740 }, { "epoch": 1.54, "learning_rate": 6.835950966999412e-05, "loss": 0.0081, "step": 595750 }, { "epoch": 1.54, "learning_rate": 6.835562145362264e-05, "loss": 0.0089, "step": 595760 }, { "epoch": 1.54, "learning_rate": 6.835173323725119e-05, "loss": 0.008, "step": 595770 }, { "epoch": 1.54, "learning_rate": 6.834784502087971e-05, "loss": 0.0113, "step": 595780 }, { "epoch": 1.54, "learning_rate": 6.834395680450826e-05, "loss": 0.0076, "step": 595790 }, { "epoch": 1.54, "learning_rate": 6.834006858813678e-05, "loss": 0.0111, "step": 595800 }, { "epoch": 1.54, "learning_rate": 6.833618037176533e-05, "loss": 0.0098, "step": 595810 }, { "epoch": 1.54, "learning_rate": 6.833229215539387e-05, "loss": 0.0073, "step": 595820 }, { "epoch": 1.54, "learning_rate": 6.83284039390224e-05, "loss": 0.0106, "step": 595830 }, { "epoch": 1.54, "learning_rate": 6.832451572265092e-05, "loss": 0.0079, "step": 595840 }, { "epoch": 1.54, "learning_rate": 6.832062750627946e-05, "loss": 0.0094, "step": 595850 }, { "epoch": 1.54, "learning_rate": 6.831673928990799e-05, "loss": 0.008, "step": 595860 }, { "epoch": 1.54, "learning_rate": 6.831285107353653e-05, "loss": 0.0096, "step": 595870 }, { "epoch": 1.54, "learning_rate": 6.830896285716506e-05, "loss": 0.0088, "step": 595880 }, { "epoch": 1.54, "learning_rate": 6.83050746407936e-05, "loss": 0.0074, "step": 595890 }, { "epoch": 1.54, "learning_rate": 6.830118642442213e-05, "loss": 0.0089, "step": 595900 }, { "epoch": 1.54, "learning_rate": 6.829729820805067e-05, "loss": 0.0083, "step": 595910 }, { "epoch": 1.54, "learning_rate": 6.829340999167922e-05, "loss": 0.0075, "step": 595920 }, { "epoch": 1.54, "learning_rate": 6.828952177530774e-05, "loss": 0.0122, "step": 595930 }, { "epoch": 1.54, "learning_rate": 6.828563355893629e-05, "loss": 0.0076, "step": 595940 }, { "epoch": 1.54, "learning_rate": 6.828174534256481e-05, "loss": 0.0128, "step": 595950 }, { "epoch": 1.54, "learning_rate": 6.827785712619336e-05, "loss": 0.0115, "step": 595960 }, { "epoch": 1.54, "learning_rate": 6.827396890982188e-05, "loss": 0.0104, "step": 595970 }, { "epoch": 1.54, "learning_rate": 6.827008069345042e-05, "loss": 0.0097, "step": 595980 }, { "epoch": 1.54, "learning_rate": 6.826619247707897e-05, "loss": 0.0117, "step": 595990 }, { "epoch": 1.54, "learning_rate": 6.82623042607075e-05, "loss": 0.0064, "step": 596000 }, { "epoch": 1.54, "eval_cer": 0.8816928888646285, "eval_loss": 0.006005590315908194, "eval_runtime": 107.81, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 596000 }, { "epoch": 1.54, "learning_rate": 6.825841604433604e-05, "loss": 0.0122, "step": 596010 }, { "epoch": 1.54, "learning_rate": 6.825452782796456e-05, "loss": 0.0077, "step": 596020 }, { "epoch": 1.54, "learning_rate": 6.82506396115931e-05, "loss": 0.0084, "step": 596030 }, { "epoch": 1.55, "learning_rate": 6.824675139522163e-05, "loss": 0.0092, "step": 596040 }, { "epoch": 1.55, "learning_rate": 6.824286317885018e-05, "loss": 0.0072, "step": 596050 }, { "epoch": 1.55, "learning_rate": 6.82389749624787e-05, "loss": 0.0078, "step": 596060 }, { "epoch": 1.55, "learning_rate": 6.823508674610725e-05, "loss": 0.0072, "step": 596070 }, { "epoch": 1.55, "learning_rate": 6.823119852973577e-05, "loss": 0.0068, "step": 596080 }, { "epoch": 1.55, "learning_rate": 6.822731031336432e-05, "loss": 0.0079, "step": 596090 }, { "epoch": 1.55, "learning_rate": 6.822342209699284e-05, "loss": 0.0055, "step": 596100 }, { "epoch": 1.55, "learning_rate": 6.821953388062138e-05, "loss": 0.0095, "step": 596110 }, { "epoch": 1.55, "learning_rate": 6.821564566424991e-05, "loss": 0.0084, "step": 596120 }, { "epoch": 1.55, "learning_rate": 6.821175744787845e-05, "loss": 0.009, "step": 596130 }, { "epoch": 1.55, "learning_rate": 6.820786923150698e-05, "loss": 0.0127, "step": 596140 }, { "epoch": 1.55, "learning_rate": 6.820398101513552e-05, "loss": 0.0086, "step": 596150 }, { "epoch": 1.55, "learning_rate": 6.820009279876405e-05, "loss": 0.0088, "step": 596160 }, { "epoch": 1.55, "learning_rate": 6.81962045823926e-05, "loss": 0.0083, "step": 596170 }, { "epoch": 1.55, "learning_rate": 6.819231636602114e-05, "loss": 0.0101, "step": 596180 }, { "epoch": 1.55, "learning_rate": 6.818842814964966e-05, "loss": 0.0065, "step": 596190 }, { "epoch": 1.55, "learning_rate": 6.81845399332782e-05, "loss": 0.0073, "step": 596200 }, { "epoch": 1.55, "learning_rate": 6.818065171690673e-05, "loss": 0.0064, "step": 596210 }, { "epoch": 1.55, "learning_rate": 6.817676350053528e-05, "loss": 0.0075, "step": 596220 }, { "epoch": 1.55, "learning_rate": 6.81728752841638e-05, "loss": 0.0079, "step": 596230 }, { "epoch": 1.55, "learning_rate": 6.816898706779234e-05, "loss": 0.0119, "step": 596240 }, { "epoch": 1.55, "learning_rate": 6.816509885142087e-05, "loss": 0.0071, "step": 596250 }, { "epoch": 1.55, "learning_rate": 6.816121063504941e-05, "loss": 0.0103, "step": 596260 }, { "epoch": 1.55, "learning_rate": 6.815732241867796e-05, "loss": 0.0089, "step": 596270 }, { "epoch": 1.55, "learning_rate": 6.815343420230648e-05, "loss": 0.0074, "step": 596280 }, { "epoch": 1.55, "learning_rate": 6.814954598593503e-05, "loss": 0.0081, "step": 596290 }, { "epoch": 1.55, "learning_rate": 6.814565776956355e-05, "loss": 0.0096, "step": 596300 }, { "epoch": 1.55, "learning_rate": 6.81417695531921e-05, "loss": 0.009, "step": 596310 }, { "epoch": 1.55, "learning_rate": 6.813788133682062e-05, "loss": 0.0083, "step": 596320 }, { "epoch": 1.55, "learning_rate": 6.813399312044915e-05, "loss": 0.0118, "step": 596330 }, { "epoch": 1.55, "learning_rate": 6.81301049040777e-05, "loss": 0.0116, "step": 596340 }, { "epoch": 1.55, "learning_rate": 6.812621668770622e-05, "loss": 0.0097, "step": 596350 }, { "epoch": 1.55, "learning_rate": 6.812232847133476e-05, "loss": 0.0096, "step": 596360 }, { "epoch": 1.55, "learning_rate": 6.81184402549633e-05, "loss": 0.0092, "step": 596370 }, { "epoch": 1.55, "learning_rate": 6.811455203859183e-05, "loss": 0.0074, "step": 596380 }, { "epoch": 1.55, "learning_rate": 6.811066382222037e-05, "loss": 0.0068, "step": 596390 }, { "epoch": 1.55, "learning_rate": 6.81067756058489e-05, "loss": 0.0078, "step": 596400 }, { "epoch": 1.55, "learning_rate": 6.810288738947744e-05, "loss": 0.0087, "step": 596410 }, { "epoch": 1.55, "learning_rate": 6.809899917310597e-05, "loss": 0.0071, "step": 596420 }, { "epoch": 1.55, "learning_rate": 6.809511095673451e-05, "loss": 0.0092, "step": 596430 }, { "epoch": 1.55, "learning_rate": 6.809122274036306e-05, "loss": 0.0062, "step": 596440 }, { "epoch": 1.55, "learning_rate": 6.808733452399158e-05, "loss": 0.0075, "step": 596450 }, { "epoch": 1.55, "learning_rate": 6.808344630762013e-05, "loss": 0.0094, "step": 596460 }, { "epoch": 1.55, "learning_rate": 6.807955809124865e-05, "loss": 0.0073, "step": 596470 }, { "epoch": 1.55, "learning_rate": 6.80756698748772e-05, "loss": 0.0089, "step": 596480 }, { "epoch": 1.55, "learning_rate": 6.807178165850572e-05, "loss": 0.0089, "step": 596490 }, { "epoch": 1.55, "learning_rate": 6.806789344213426e-05, "loss": 0.0103, "step": 596500 }, { "epoch": 1.55, "learning_rate": 6.806400522576279e-05, "loss": 0.0103, "step": 596510 }, { "epoch": 1.55, "learning_rate": 6.806011700939133e-05, "loss": 0.0122, "step": 596520 }, { "epoch": 1.55, "learning_rate": 6.805622879301988e-05, "loss": 0.0083, "step": 596530 }, { "epoch": 1.55, "learning_rate": 6.80523405766484e-05, "loss": 0.0087, "step": 596540 }, { "epoch": 1.55, "learning_rate": 6.804845236027695e-05, "loss": 0.0068, "step": 596550 }, { "epoch": 1.55, "learning_rate": 6.804456414390547e-05, "loss": 0.0097, "step": 596560 }, { "epoch": 1.55, "learning_rate": 6.804067592753402e-05, "loss": 0.008, "step": 596570 }, { "epoch": 1.55, "learning_rate": 6.803678771116254e-05, "loss": 0.0071, "step": 596580 }, { "epoch": 1.55, "learning_rate": 6.803289949479107e-05, "loss": 0.0068, "step": 596590 }, { "epoch": 1.55, "learning_rate": 6.802901127841961e-05, "loss": 0.0121, "step": 596600 }, { "epoch": 1.55, "learning_rate": 6.802512306204814e-05, "loss": 0.0076, "step": 596610 }, { "epoch": 1.55, "learning_rate": 6.802123484567668e-05, "loss": 0.006, "step": 596620 }, { "epoch": 1.55, "learning_rate": 6.801734662930522e-05, "loss": 0.0086, "step": 596630 }, { "epoch": 1.55, "learning_rate": 6.801345841293375e-05, "loss": 0.0087, "step": 596640 }, { "epoch": 1.55, "learning_rate": 6.80095701965623e-05, "loss": 0.0073, "step": 596650 }, { "epoch": 1.55, "learning_rate": 6.800568198019082e-05, "loss": 0.0113, "step": 596660 }, { "epoch": 1.55, "learning_rate": 6.800179376381936e-05, "loss": 0.0076, "step": 596670 }, { "epoch": 1.55, "learning_rate": 6.799790554744789e-05, "loss": 0.009, "step": 596680 }, { "epoch": 1.55, "learning_rate": 6.799401733107643e-05, "loss": 0.0094, "step": 596690 }, { "epoch": 1.55, "learning_rate": 6.799012911470498e-05, "loss": 0.0085, "step": 596700 }, { "epoch": 1.55, "learning_rate": 6.79862408983335e-05, "loss": 0.0098, "step": 596710 }, { "epoch": 1.55, "learning_rate": 6.798235268196205e-05, "loss": 0.0095, "step": 596720 }, { "epoch": 1.55, "learning_rate": 6.797846446559057e-05, "loss": 0.0095, "step": 596730 }, { "epoch": 1.55, "learning_rate": 6.797457624921911e-05, "loss": 0.0083, "step": 596740 }, { "epoch": 1.55, "learning_rate": 6.797068803284764e-05, "loss": 0.0062, "step": 596750 }, { "epoch": 1.55, "learning_rate": 6.796679981647618e-05, "loss": 0.0091, "step": 596760 }, { "epoch": 1.55, "learning_rate": 6.796291160010471e-05, "loss": 0.0069, "step": 596770 }, { "epoch": 1.55, "learning_rate": 6.795902338373325e-05, "loss": 0.0094, "step": 596780 }, { "epoch": 1.55, "learning_rate": 6.79551351673618e-05, "loss": 0.0081, "step": 596790 }, { "epoch": 1.55, "learning_rate": 6.795124695099032e-05, "loss": 0.009, "step": 596800 }, { "epoch": 1.55, "learning_rate": 6.794735873461887e-05, "loss": 0.0093, "step": 596810 }, { "epoch": 1.55, "learning_rate": 6.79434705182474e-05, "loss": 0.0067, "step": 596820 }, { "epoch": 1.55, "learning_rate": 6.793958230187592e-05, "loss": 0.0082, "step": 596830 }, { "epoch": 1.55, "learning_rate": 6.793569408550446e-05, "loss": 0.0103, "step": 596840 }, { "epoch": 1.55, "learning_rate": 6.793180586913299e-05, "loss": 0.0093, "step": 596850 }, { "epoch": 1.55, "learning_rate": 6.792791765276153e-05, "loss": 0.0096, "step": 596860 }, { "epoch": 1.55, "learning_rate": 6.792402943639006e-05, "loss": 0.0091, "step": 596870 }, { "epoch": 1.55, "learning_rate": 6.79201412200186e-05, "loss": 0.0125, "step": 596880 }, { "epoch": 1.55, "learning_rate": 6.791625300364714e-05, "loss": 0.0071, "step": 596890 }, { "epoch": 1.55, "learning_rate": 6.791236478727567e-05, "loss": 0.0081, "step": 596900 }, { "epoch": 1.55, "learning_rate": 6.790847657090421e-05, "loss": 0.0102, "step": 596910 }, { "epoch": 1.55, "learning_rate": 6.790458835453274e-05, "loss": 0.0071, "step": 596920 }, { "epoch": 1.55, "learning_rate": 6.790070013816128e-05, "loss": 0.0104, "step": 596930 }, { "epoch": 1.55, "learning_rate": 6.789681192178981e-05, "loss": 0.0085, "step": 596940 }, { "epoch": 1.55, "learning_rate": 6.789292370541835e-05, "loss": 0.0073, "step": 596950 }, { "epoch": 1.55, "learning_rate": 6.78890354890469e-05, "loss": 0.0075, "step": 596960 }, { "epoch": 1.55, "learning_rate": 6.788514727267542e-05, "loss": 0.0075, "step": 596970 }, { "epoch": 1.55, "learning_rate": 6.788125905630397e-05, "loss": 0.0116, "step": 596980 }, { "epoch": 1.55, "learning_rate": 6.78773708399325e-05, "loss": 0.0095, "step": 596990 }, { "epoch": 1.55, "learning_rate": 6.787348262356103e-05, "loss": 0.0082, "step": 597000 }, { "epoch": 1.55, "eval_cer": 0.8817082848709045, "eval_loss": 0.005668503697961569, "eval_runtime": 107.8595, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 597000 }, { "epoch": 1.55, "learning_rate": 6.786959440718956e-05, "loss": 0.0091, "step": 597010 }, { "epoch": 1.55, "learning_rate": 6.78657061908181e-05, "loss": 0.0097, "step": 597020 }, { "epoch": 1.55, "learning_rate": 6.786181797444663e-05, "loss": 0.0084, "step": 597030 }, { "epoch": 1.55, "learning_rate": 6.785792975807517e-05, "loss": 0.008, "step": 597040 }, { "epoch": 1.55, "learning_rate": 6.785404154170372e-05, "loss": 0.0099, "step": 597050 }, { "epoch": 1.55, "learning_rate": 6.785015332533224e-05, "loss": 0.01, "step": 597060 }, { "epoch": 1.55, "learning_rate": 6.784626510896077e-05, "loss": 0.0072, "step": 597070 }, { "epoch": 1.55, "learning_rate": 6.784237689258931e-05, "loss": 0.005, "step": 597080 }, { "epoch": 1.55, "learning_rate": 6.783848867621784e-05, "loss": 0.0111, "step": 597090 }, { "epoch": 1.55, "learning_rate": 6.783460045984638e-05, "loss": 0.0082, "step": 597100 }, { "epoch": 1.55, "learning_rate": 6.783071224347491e-05, "loss": 0.0086, "step": 597110 }, { "epoch": 1.55, "learning_rate": 6.782682402710345e-05, "loss": 0.0094, "step": 597120 }, { "epoch": 1.55, "learning_rate": 6.782293581073198e-05, "loss": 0.0088, "step": 597130 }, { "epoch": 1.55, "learning_rate": 6.781904759436052e-05, "loss": 0.016, "step": 597140 }, { "epoch": 1.55, "learning_rate": 6.781515937798906e-05, "loss": 0.009, "step": 597150 }, { "epoch": 1.55, "learning_rate": 6.781127116161759e-05, "loss": 0.0077, "step": 597160 }, { "epoch": 1.55, "learning_rate": 6.780738294524613e-05, "loss": 0.0085, "step": 597170 }, { "epoch": 1.55, "learning_rate": 6.780349472887466e-05, "loss": 0.0093, "step": 597180 }, { "epoch": 1.55, "learning_rate": 6.77996065125032e-05, "loss": 0.0097, "step": 597190 }, { "epoch": 1.55, "learning_rate": 6.779571829613173e-05, "loss": 0.0094, "step": 597200 }, { "epoch": 1.55, "learning_rate": 6.779183007976027e-05, "loss": 0.0069, "step": 597210 }, { "epoch": 1.55, "learning_rate": 6.778794186338882e-05, "loss": 0.0129, "step": 597220 }, { "epoch": 1.55, "learning_rate": 6.778405364701734e-05, "loss": 0.0085, "step": 597230 }, { "epoch": 1.55, "learning_rate": 6.778016543064589e-05, "loss": 0.008, "step": 597240 }, { "epoch": 1.55, "learning_rate": 6.777627721427441e-05, "loss": 0.0093, "step": 597250 }, { "epoch": 1.55, "learning_rate": 6.777238899790295e-05, "loss": 0.0085, "step": 597260 }, { "epoch": 1.55, "learning_rate": 6.776850078153148e-05, "loss": 0.0115, "step": 597270 }, { "epoch": 1.55, "learning_rate": 6.776461256516002e-05, "loss": 0.0093, "step": 597280 }, { "epoch": 1.55, "learning_rate": 6.776072434878855e-05, "loss": 0.0075, "step": 597290 }, { "epoch": 1.55, "learning_rate": 6.77568361324171e-05, "loss": 0.0121, "step": 597300 }, { "epoch": 1.55, "learning_rate": 6.775294791604564e-05, "loss": 0.0109, "step": 597310 }, { "epoch": 1.55, "learning_rate": 6.774905969967416e-05, "loss": 0.0087, "step": 597320 }, { "epoch": 1.55, "learning_rate": 6.774517148330269e-05, "loss": 0.0115, "step": 597330 }, { "epoch": 1.55, "learning_rate": 6.774128326693123e-05, "loss": 0.0103, "step": 597340 }, { "epoch": 1.55, "learning_rate": 6.773739505055976e-05, "loss": 0.0075, "step": 597350 }, { "epoch": 1.55, "learning_rate": 6.77335068341883e-05, "loss": 0.0076, "step": 597360 }, { "epoch": 1.55, "learning_rate": 6.772961861781683e-05, "loss": 0.0096, "step": 597370 }, { "epoch": 1.55, "learning_rate": 6.772573040144537e-05, "loss": 0.0091, "step": 597380 }, { "epoch": 1.55, "learning_rate": 6.77218421850739e-05, "loss": 0.0077, "step": 597390 }, { "epoch": 1.55, "learning_rate": 6.771795396870244e-05, "loss": 0.0099, "step": 597400 }, { "epoch": 1.55, "learning_rate": 6.771406575233098e-05, "loss": 0.0102, "step": 597410 }, { "epoch": 1.55, "learning_rate": 6.771017753595951e-05, "loss": 0.0094, "step": 597420 }, { "epoch": 1.55, "learning_rate": 6.770628931958805e-05, "loss": 0.0089, "step": 597430 }, { "epoch": 1.55, "learning_rate": 6.770240110321658e-05, "loss": 0.0107, "step": 597440 }, { "epoch": 1.55, "learning_rate": 6.769851288684512e-05, "loss": 0.0089, "step": 597450 }, { "epoch": 1.55, "learning_rate": 6.769462467047365e-05, "loss": 0.0108, "step": 597460 }, { "epoch": 1.55, "learning_rate": 6.76907364541022e-05, "loss": 0.0104, "step": 597470 }, { "epoch": 1.55, "learning_rate": 6.768684823773074e-05, "loss": 0.0071, "step": 597480 }, { "epoch": 1.55, "learning_rate": 6.768296002135926e-05, "loss": 0.0083, "step": 597490 }, { "epoch": 1.55, "learning_rate": 6.76790718049878e-05, "loss": 0.0103, "step": 597500 }, { "epoch": 1.55, "learning_rate": 6.767518358861633e-05, "loss": 0.0076, "step": 597510 }, { "epoch": 1.55, "learning_rate": 6.767129537224487e-05, "loss": 0.009, "step": 597520 }, { "epoch": 1.55, "learning_rate": 6.76674071558734e-05, "loss": 0.0076, "step": 597530 }, { "epoch": 1.55, "learning_rate": 6.766351893950194e-05, "loss": 0.0077, "step": 597540 }, { "epoch": 1.55, "learning_rate": 6.765963072313047e-05, "loss": 0.0115, "step": 597550 }, { "epoch": 1.55, "learning_rate": 6.765574250675901e-05, "loss": 0.007, "step": 597560 }, { "epoch": 1.55, "learning_rate": 6.765185429038754e-05, "loss": 0.0071, "step": 597570 }, { "epoch": 1.55, "learning_rate": 6.764796607401608e-05, "loss": 0.0104, "step": 597580 }, { "epoch": 1.55, "learning_rate": 6.764407785764461e-05, "loss": 0.0079, "step": 597590 }, { "epoch": 1.55, "learning_rate": 6.764018964127315e-05, "loss": 0.0083, "step": 597600 }, { "epoch": 1.55, "learning_rate": 6.763630142490168e-05, "loss": 0.0088, "step": 597610 }, { "epoch": 1.55, "learning_rate": 6.763241320853022e-05, "loss": 0.0072, "step": 597620 }, { "epoch": 1.55, "learning_rate": 6.762852499215875e-05, "loss": 0.0077, "step": 597630 }, { "epoch": 1.55, "learning_rate": 6.762463677578729e-05, "loss": 0.0093, "step": 597640 }, { "epoch": 1.55, "learning_rate": 6.762074855941582e-05, "loss": 0.0071, "step": 597650 }, { "epoch": 1.55, "learning_rate": 6.761686034304436e-05, "loss": 0.0099, "step": 597660 }, { "epoch": 1.55, "learning_rate": 6.76129721266729e-05, "loss": 0.0099, "step": 597670 }, { "epoch": 1.55, "learning_rate": 6.760908391030143e-05, "loss": 0.0137, "step": 597680 }, { "epoch": 1.55, "learning_rate": 6.760519569392997e-05, "loss": 0.0099, "step": 597690 }, { "epoch": 1.55, "learning_rate": 6.76013074775585e-05, "loss": 0.0097, "step": 597700 }, { "epoch": 1.55, "learning_rate": 6.759741926118704e-05, "loss": 0.0085, "step": 597710 }, { "epoch": 1.55, "learning_rate": 6.759353104481557e-05, "loss": 0.0075, "step": 597720 }, { "epoch": 1.55, "learning_rate": 6.758964282844411e-05, "loss": 0.0085, "step": 597730 }, { "epoch": 1.55, "learning_rate": 6.758575461207264e-05, "loss": 0.0082, "step": 597740 }, { "epoch": 1.55, "learning_rate": 6.758186639570118e-05, "loss": 0.009, "step": 597750 }, { "epoch": 1.55, "learning_rate": 6.757797817932973e-05, "loss": 0.0088, "step": 597760 }, { "epoch": 1.55, "learning_rate": 6.757408996295825e-05, "loss": 0.0091, "step": 597770 }, { "epoch": 1.55, "learning_rate": 6.75702017465868e-05, "loss": 0.0074, "step": 597780 }, { "epoch": 1.55, "learning_rate": 6.756631353021532e-05, "loss": 0.0085, "step": 597790 }, { "epoch": 1.55, "learning_rate": 6.756242531384386e-05, "loss": 0.0077, "step": 597800 }, { "epoch": 1.55, "learning_rate": 6.755853709747239e-05, "loss": 0.0087, "step": 597810 }, { "epoch": 1.55, "learning_rate": 6.755464888110092e-05, "loss": 0.0093, "step": 597820 }, { "epoch": 1.55, "learning_rate": 6.755076066472946e-05, "loss": 0.0114, "step": 597830 }, { "epoch": 1.55, "learning_rate": 6.754687244835799e-05, "loss": 0.0076, "step": 597840 }, { "epoch": 1.55, "learning_rate": 6.754298423198653e-05, "loss": 0.0081, "step": 597850 }, { "epoch": 1.55, "learning_rate": 6.753909601561507e-05, "loss": 0.0066, "step": 597860 }, { "epoch": 1.55, "learning_rate": 6.75352077992436e-05, "loss": 0.0067, "step": 597870 }, { "epoch": 1.55, "learning_rate": 6.753131958287214e-05, "loss": 0.0106, "step": 597880 }, { "epoch": 1.55, "learning_rate": 6.752743136650067e-05, "loss": 0.0092, "step": 597890 }, { "epoch": 1.55, "learning_rate": 6.752354315012921e-05, "loss": 0.0083, "step": 597900 }, { "epoch": 1.55, "learning_rate": 6.751965493375774e-05, "loss": 0.0082, "step": 597910 }, { "epoch": 1.55, "learning_rate": 6.751576671738628e-05, "loss": 0.0097, "step": 597920 }, { "epoch": 1.55, "learning_rate": 6.751187850101482e-05, "loss": 0.0093, "step": 597930 }, { "epoch": 1.55, "learning_rate": 6.750799028464335e-05, "loss": 0.0105, "step": 597940 }, { "epoch": 1.55, "learning_rate": 6.75041020682719e-05, "loss": 0.0084, "step": 597950 }, { "epoch": 1.55, "learning_rate": 6.750021385190042e-05, "loss": 0.0066, "step": 597960 }, { "epoch": 1.55, "learning_rate": 6.749632563552896e-05, "loss": 0.0056, "step": 597970 }, { "epoch": 1.55, "learning_rate": 6.749243741915749e-05, "loss": 0.0096, "step": 597980 }, { "epoch": 1.55, "learning_rate": 6.748854920278603e-05, "loss": 0.0092, "step": 597990 }, { "epoch": 1.55, "learning_rate": 6.748466098641456e-05, "loss": 0.0084, "step": 598000 }, { "epoch": 1.55, "eval_cer": 0.8816844910430235, "eval_loss": 0.005743164103478193, "eval_runtime": 107.8556, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 598000 }, { "epoch": 1.55, "learning_rate": 6.74807727700431e-05, "loss": 0.0088, "step": 598010 }, { "epoch": 1.55, "learning_rate": 6.747688455367164e-05, "loss": 0.0096, "step": 598020 }, { "epoch": 1.55, "learning_rate": 6.747299633730017e-05, "loss": 0.0087, "step": 598030 }, { "epoch": 1.55, "learning_rate": 6.746910812092871e-05, "loss": 0.0078, "step": 598040 }, { "epoch": 1.55, "learning_rate": 6.746521990455724e-05, "loss": 0.0102, "step": 598050 }, { "epoch": 1.55, "learning_rate": 6.746133168818578e-05, "loss": 0.0082, "step": 598060 }, { "epoch": 1.55, "learning_rate": 6.745744347181431e-05, "loss": 0.0084, "step": 598070 }, { "epoch": 1.55, "learning_rate": 6.745355525544284e-05, "loss": 0.0091, "step": 598080 }, { "epoch": 1.55, "learning_rate": 6.744966703907138e-05, "loss": 0.0083, "step": 598090 }, { "epoch": 1.55, "learning_rate": 6.744577882269991e-05, "loss": 0.0124, "step": 598100 }, { "epoch": 1.55, "learning_rate": 6.744189060632845e-05, "loss": 0.0096, "step": 598110 }, { "epoch": 1.55, "learning_rate": 6.7438002389957e-05, "loss": 0.0068, "step": 598120 }, { "epoch": 1.55, "learning_rate": 6.743411417358552e-05, "loss": 0.009, "step": 598130 }, { "epoch": 1.55, "learning_rate": 6.743022595721406e-05, "loss": 0.0118, "step": 598140 }, { "epoch": 1.55, "learning_rate": 6.742633774084259e-05, "loss": 0.0095, "step": 598150 }, { "epoch": 1.55, "learning_rate": 6.742244952447113e-05, "loss": 0.0091, "step": 598160 }, { "epoch": 1.55, "learning_rate": 6.741856130809966e-05, "loss": 0.0113, "step": 598170 }, { "epoch": 1.55, "learning_rate": 6.74146730917282e-05, "loss": 0.0085, "step": 598180 }, { "epoch": 1.55, "learning_rate": 6.741078487535674e-05, "loss": 0.009, "step": 598190 }, { "epoch": 1.55, "learning_rate": 6.740689665898527e-05, "loss": 0.0117, "step": 598200 }, { "epoch": 1.55, "learning_rate": 6.740300844261381e-05, "loss": 0.0108, "step": 598210 }, { "epoch": 1.55, "learning_rate": 6.739912022624234e-05, "loss": 0.0073, "step": 598220 }, { "epoch": 1.55, "learning_rate": 6.739523200987088e-05, "loss": 0.0077, "step": 598230 }, { "epoch": 1.55, "learning_rate": 6.739134379349941e-05, "loss": 0.0071, "step": 598240 }, { "epoch": 1.55, "learning_rate": 6.738745557712795e-05, "loss": 0.0083, "step": 598250 }, { "epoch": 1.55, "learning_rate": 6.738356736075648e-05, "loss": 0.0106, "step": 598260 }, { "epoch": 1.55, "learning_rate": 6.737967914438502e-05, "loss": 0.0122, "step": 598270 }, { "epoch": 1.55, "learning_rate": 6.737579092801356e-05, "loss": 0.0135, "step": 598280 }, { "epoch": 1.55, "learning_rate": 6.737190271164209e-05, "loss": 0.0074, "step": 598290 }, { "epoch": 1.55, "learning_rate": 6.736801449527063e-05, "loss": 0.0068, "step": 598300 }, { "epoch": 1.55, "learning_rate": 6.736412627889916e-05, "loss": 0.0078, "step": 598310 }, { "epoch": 1.55, "learning_rate": 6.736023806252769e-05, "loss": 0.0116, "step": 598320 }, { "epoch": 1.55, "learning_rate": 6.735634984615623e-05, "loss": 0.0076, "step": 598330 }, { "epoch": 1.55, "learning_rate": 6.735246162978476e-05, "loss": 0.0107, "step": 598340 }, { "epoch": 1.55, "learning_rate": 6.73485734134133e-05, "loss": 0.0072, "step": 598350 }, { "epoch": 1.55, "learning_rate": 6.734468519704183e-05, "loss": 0.0096, "step": 598360 }, { "epoch": 1.55, "learning_rate": 6.734079698067037e-05, "loss": 0.0116, "step": 598370 }, { "epoch": 1.55, "learning_rate": 6.733690876429891e-05, "loss": 0.0118, "step": 598380 }, { "epoch": 1.55, "learning_rate": 6.733302054792744e-05, "loss": 0.0073, "step": 598390 }, { "epoch": 1.55, "learning_rate": 6.732913233155598e-05, "loss": 0.0094, "step": 598400 }, { "epoch": 1.55, "learning_rate": 6.732524411518451e-05, "loss": 0.0083, "step": 598410 }, { "epoch": 1.55, "learning_rate": 6.732135589881305e-05, "loss": 0.0092, "step": 598420 }, { "epoch": 1.55, "learning_rate": 6.731746768244158e-05, "loss": 0.0091, "step": 598430 }, { "epoch": 1.55, "learning_rate": 6.731357946607012e-05, "loss": 0.0132, "step": 598440 }, { "epoch": 1.55, "learning_rate": 6.730969124969866e-05, "loss": 0.0083, "step": 598450 }, { "epoch": 1.55, "learning_rate": 6.730580303332719e-05, "loss": 0.0097, "step": 598460 }, { "epoch": 1.55, "learning_rate": 6.730191481695573e-05, "loss": 0.0086, "step": 598470 }, { "epoch": 1.55, "learning_rate": 6.729802660058426e-05, "loss": 0.0115, "step": 598480 }, { "epoch": 1.55, "learning_rate": 6.72941383842128e-05, "loss": 0.0094, "step": 598490 }, { "epoch": 1.55, "learning_rate": 6.729025016784133e-05, "loss": 0.009, "step": 598500 }, { "epoch": 1.55, "learning_rate": 6.728636195146987e-05, "loss": 0.0087, "step": 598510 }, { "epoch": 1.55, "learning_rate": 6.72824737350984e-05, "loss": 0.0075, "step": 598520 }, { "epoch": 1.55, "learning_rate": 6.727858551872694e-05, "loss": 0.0088, "step": 598530 }, { "epoch": 1.55, "learning_rate": 6.727469730235548e-05, "loss": 0.0098, "step": 598540 }, { "epoch": 1.55, "learning_rate": 6.727080908598401e-05, "loss": 0.0133, "step": 598550 }, { "epoch": 1.55, "learning_rate": 6.726692086961254e-05, "loss": 0.0083, "step": 598560 }, { "epoch": 1.55, "learning_rate": 6.726303265324108e-05, "loss": 0.0066, "step": 598570 }, { "epoch": 1.55, "learning_rate": 6.725914443686961e-05, "loss": 0.0095, "step": 598580 }, { "epoch": 1.55, "learning_rate": 6.725525622049815e-05, "loss": 0.0102, "step": 598590 }, { "epoch": 1.55, "learning_rate": 6.725136800412668e-05, "loss": 0.0114, "step": 598600 }, { "epoch": 1.55, "learning_rate": 6.724747978775522e-05, "loss": 0.0077, "step": 598610 }, { "epoch": 1.55, "learning_rate": 6.724359157138375e-05, "loss": 0.0076, "step": 598620 }, { "epoch": 1.55, "learning_rate": 6.723970335501229e-05, "loss": 0.0092, "step": 598630 }, { "epoch": 1.55, "learning_rate": 6.723581513864083e-05, "loss": 0.0097, "step": 598640 }, { "epoch": 1.55, "learning_rate": 6.723192692226936e-05, "loss": 0.0081, "step": 598650 }, { "epoch": 1.55, "learning_rate": 6.72280387058979e-05, "loss": 0.0099, "step": 598660 }, { "epoch": 1.55, "learning_rate": 6.722415048952643e-05, "loss": 0.0105, "step": 598670 }, { "epoch": 1.55, "learning_rate": 6.722026227315497e-05, "loss": 0.0103, "step": 598680 }, { "epoch": 1.55, "learning_rate": 6.72163740567835e-05, "loss": 0.007, "step": 598690 }, { "epoch": 1.55, "learning_rate": 6.721248584041204e-05, "loss": 0.0073, "step": 598700 }, { "epoch": 1.55, "learning_rate": 6.720859762404058e-05, "loss": 0.0077, "step": 598710 }, { "epoch": 1.55, "learning_rate": 6.720470940766911e-05, "loss": 0.0091, "step": 598720 }, { "epoch": 1.55, "learning_rate": 6.720082119129765e-05, "loss": 0.0082, "step": 598730 }, { "epoch": 1.55, "learning_rate": 6.719693297492618e-05, "loss": 0.0102, "step": 598740 }, { "epoch": 1.55, "learning_rate": 6.719304475855472e-05, "loss": 0.0079, "step": 598750 }, { "epoch": 1.55, "learning_rate": 6.718915654218325e-05, "loss": 0.0085, "step": 598760 }, { "epoch": 1.55, "learning_rate": 6.71852683258118e-05, "loss": 0.0099, "step": 598770 }, { "epoch": 1.55, "learning_rate": 6.718138010944032e-05, "loss": 0.0075, "step": 598780 }, { "epoch": 1.55, "learning_rate": 6.717749189306886e-05, "loss": 0.0074, "step": 598790 }, { "epoch": 1.55, "learning_rate": 6.71736036766974e-05, "loss": 0.0107, "step": 598800 }, { "epoch": 1.55, "learning_rate": 6.716971546032593e-05, "loss": 0.0078, "step": 598810 }, { "epoch": 1.55, "learning_rate": 6.716582724395446e-05, "loss": 0.0078, "step": 598820 }, { "epoch": 1.55, "learning_rate": 6.7161939027583e-05, "loss": 0.0097, "step": 598830 }, { "epoch": 1.55, "learning_rate": 6.715805081121153e-05, "loss": 0.01, "step": 598840 }, { "epoch": 1.55, "learning_rate": 6.715416259484007e-05, "loss": 0.0053, "step": 598850 }, { "epoch": 1.55, "learning_rate": 6.71502743784686e-05, "loss": 0.0083, "step": 598860 }, { "epoch": 1.55, "learning_rate": 6.714638616209714e-05, "loss": 0.0096, "step": 598870 }, { "epoch": 1.55, "learning_rate": 6.714249794572567e-05, "loss": 0.0084, "step": 598880 }, { "epoch": 1.55, "learning_rate": 6.713860972935421e-05, "loss": 0.0073, "step": 598890 }, { "epoch": 1.55, "learning_rate": 6.713472151298275e-05, "loss": 0.0142, "step": 598900 }, { "epoch": 1.55, "learning_rate": 6.713083329661128e-05, "loss": 0.0083, "step": 598910 }, { "epoch": 1.55, "learning_rate": 6.712694508023982e-05, "loss": 0.0108, "step": 598920 }, { "epoch": 1.55, "learning_rate": 6.712305686386835e-05, "loss": 0.0088, "step": 598930 }, { "epoch": 1.55, "learning_rate": 6.711916864749689e-05, "loss": 0.0088, "step": 598940 }, { "epoch": 1.55, "learning_rate": 6.711528043112542e-05, "loss": 0.0081, "step": 598950 }, { "epoch": 1.55, "learning_rate": 6.711139221475396e-05, "loss": 0.0073, "step": 598960 }, { "epoch": 1.55, "learning_rate": 6.710750399838249e-05, "loss": 0.0096, "step": 598970 }, { "epoch": 1.55, "learning_rate": 6.710361578201103e-05, "loss": 0.0088, "step": 598980 }, { "epoch": 1.55, "learning_rate": 6.709972756563957e-05, "loss": 0.0084, "step": 598990 }, { "epoch": 1.55, "learning_rate": 6.70958393492681e-05, "loss": 0.0112, "step": 599000 }, { "epoch": 1.55, "eval_cer": 0.881704085960102, "eval_loss": 0.005739094223827124, "eval_runtime": 107.7697, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.64, "step": 599000 }, { "epoch": 1.55, "learning_rate": 6.709195113289664e-05, "loss": 0.0065, "step": 599010 }, { "epoch": 1.55, "learning_rate": 6.708806291652517e-05, "loss": 0.0084, "step": 599020 }, { "epoch": 1.55, "learning_rate": 6.708417470015371e-05, "loss": 0.0085, "step": 599030 }, { "epoch": 1.55, "learning_rate": 6.708028648378224e-05, "loss": 0.0077, "step": 599040 }, { "epoch": 1.55, "learning_rate": 6.707639826741078e-05, "loss": 0.0118, "step": 599050 }, { "epoch": 1.55, "learning_rate": 6.707251005103931e-05, "loss": 0.008, "step": 599060 }, { "epoch": 1.55, "learning_rate": 6.706862183466785e-05, "loss": 0.0112, "step": 599070 }, { "epoch": 1.55, "learning_rate": 6.706473361829638e-05, "loss": 0.0076, "step": 599080 }, { "epoch": 1.55, "learning_rate": 6.706084540192492e-05, "loss": 0.0082, "step": 599090 }, { "epoch": 1.55, "learning_rate": 6.705695718555345e-05, "loss": 0.012, "step": 599100 }, { "epoch": 1.55, "learning_rate": 6.705306896918199e-05, "loss": 0.0068, "step": 599110 }, { "epoch": 1.55, "learning_rate": 6.704918075281052e-05, "loss": 0.0095, "step": 599120 }, { "epoch": 1.55, "learning_rate": 6.704529253643906e-05, "loss": 0.0082, "step": 599130 }, { "epoch": 1.55, "learning_rate": 6.704140432006759e-05, "loss": 0.0098, "step": 599140 }, { "epoch": 1.55, "learning_rate": 6.703751610369613e-05, "loss": 0.0087, "step": 599150 }, { "epoch": 1.55, "learning_rate": 6.703362788732467e-05, "loss": 0.0081, "step": 599160 }, { "epoch": 1.55, "learning_rate": 6.70297396709532e-05, "loss": 0.007, "step": 599170 }, { "epoch": 1.55, "learning_rate": 6.702585145458174e-05, "loss": 0.0097, "step": 599180 }, { "epoch": 1.55, "learning_rate": 6.702196323821027e-05, "loss": 0.008, "step": 599190 }, { "epoch": 1.55, "learning_rate": 6.701807502183881e-05, "loss": 0.0105, "step": 599200 }, { "epoch": 1.55, "learning_rate": 6.701418680546734e-05, "loss": 0.0087, "step": 599210 }, { "epoch": 1.55, "learning_rate": 6.701029858909588e-05, "loss": 0.0122, "step": 599220 }, { "epoch": 1.55, "learning_rate": 6.700641037272441e-05, "loss": 0.0083, "step": 599230 }, { "epoch": 1.55, "learning_rate": 6.700252215635295e-05, "loss": 0.0099, "step": 599240 }, { "epoch": 1.55, "learning_rate": 6.69986339399815e-05, "loss": 0.0188, "step": 599250 }, { "epoch": 1.55, "learning_rate": 6.699474572361002e-05, "loss": 0.0099, "step": 599260 }, { "epoch": 1.55, "learning_rate": 6.699085750723856e-05, "loss": 0.0088, "step": 599270 }, { "epoch": 1.55, "learning_rate": 6.698696929086709e-05, "loss": 0.0106, "step": 599280 }, { "epoch": 1.55, "learning_rate": 6.698308107449563e-05, "loss": 0.0096, "step": 599290 }, { "epoch": 1.55, "learning_rate": 6.697919285812416e-05, "loss": 0.0082, "step": 599300 }, { "epoch": 1.55, "learning_rate": 6.697530464175269e-05, "loss": 0.0108, "step": 599310 }, { "epoch": 1.55, "learning_rate": 6.697141642538123e-05, "loss": 0.0085, "step": 599320 }, { "epoch": 1.55, "learning_rate": 6.696752820900976e-05, "loss": 0.0092, "step": 599330 }, { "epoch": 1.55, "learning_rate": 6.69636399926383e-05, "loss": 0.0109, "step": 599340 }, { "epoch": 1.55, "learning_rate": 6.695975177626684e-05, "loss": 0.0089, "step": 599350 }, { "epoch": 1.55, "learning_rate": 6.695586355989537e-05, "loss": 0.009, "step": 599360 }, { "epoch": 1.55, "learning_rate": 6.695197534352391e-05, "loss": 0.0098, "step": 599370 }, { "epoch": 1.55, "learning_rate": 6.694808712715244e-05, "loss": 0.0071, "step": 599380 }, { "epoch": 1.55, "learning_rate": 6.694419891078098e-05, "loss": 0.0101, "step": 599390 }, { "epoch": 1.55, "learning_rate": 6.694031069440951e-05, "loss": 0.0071, "step": 599400 }, { "epoch": 1.55, "learning_rate": 6.693642247803805e-05, "loss": 0.0089, "step": 599410 }, { "epoch": 1.55, "learning_rate": 6.69325342616666e-05, "loss": 0.0098, "step": 599420 }, { "epoch": 1.55, "learning_rate": 6.692864604529512e-05, "loss": 0.0073, "step": 599430 }, { "epoch": 1.55, "learning_rate": 6.692475782892366e-05, "loss": 0.0079, "step": 599440 }, { "epoch": 1.55, "learning_rate": 6.692086961255219e-05, "loss": 0.0134, "step": 599450 }, { "epoch": 1.55, "learning_rate": 6.691698139618073e-05, "loss": 0.0066, "step": 599460 }, { "epoch": 1.55, "learning_rate": 6.691309317980926e-05, "loss": 0.0067, "step": 599470 }, { "epoch": 1.55, "learning_rate": 6.69092049634378e-05, "loss": 0.0087, "step": 599480 }, { "epoch": 1.55, "learning_rate": 6.690531674706633e-05, "loss": 0.0085, "step": 599490 }, { "epoch": 1.55, "learning_rate": 6.690142853069487e-05, "loss": 0.0096, "step": 599500 }, { "epoch": 1.55, "learning_rate": 6.689754031432341e-05, "loss": 0.0118, "step": 599510 }, { "epoch": 1.55, "learning_rate": 6.689365209795194e-05, "loss": 0.0102, "step": 599520 }, { "epoch": 1.55, "learning_rate": 6.688976388158048e-05, "loss": 0.0079, "step": 599530 }, { "epoch": 1.55, "learning_rate": 6.688587566520901e-05, "loss": 0.0082, "step": 599540 }, { "epoch": 1.55, "learning_rate": 6.688198744883754e-05, "loss": 0.0094, "step": 599550 }, { "epoch": 1.55, "learning_rate": 6.687809923246608e-05, "loss": 0.0134, "step": 599560 }, { "epoch": 1.55, "learning_rate": 6.687421101609461e-05, "loss": 0.0088, "step": 599570 }, { "epoch": 1.55, "learning_rate": 6.687032279972315e-05, "loss": 0.0068, "step": 599580 }, { "epoch": 1.55, "learning_rate": 6.686643458335168e-05, "loss": 0.0087, "step": 599590 }, { "epoch": 1.55, "learning_rate": 6.686254636698022e-05, "loss": 0.0071, "step": 599600 }, { "epoch": 1.55, "learning_rate": 6.685865815060876e-05, "loss": 0.014, "step": 599610 }, { "epoch": 1.55, "learning_rate": 6.685476993423729e-05, "loss": 0.0076, "step": 599620 }, { "epoch": 1.55, "learning_rate": 6.685088171786583e-05, "loss": 0.0071, "step": 599630 }, { "epoch": 1.55, "learning_rate": 6.684699350149436e-05, "loss": 0.0113, "step": 599640 }, { "epoch": 1.55, "learning_rate": 6.68431052851229e-05, "loss": 0.0092, "step": 599650 }, { "epoch": 1.55, "learning_rate": 6.683921706875143e-05, "loss": 0.0128, "step": 599660 }, { "epoch": 1.55, "learning_rate": 6.683532885237997e-05, "loss": 0.0106, "step": 599670 }, { "epoch": 1.55, "learning_rate": 6.683144063600851e-05, "loss": 0.0065, "step": 599680 }, { "epoch": 1.55, "learning_rate": 6.682755241963704e-05, "loss": 0.0067, "step": 599690 }, { "epoch": 1.55, "learning_rate": 6.682366420326558e-05, "loss": 0.0109, "step": 599700 }, { "epoch": 1.55, "learning_rate": 6.681977598689411e-05, "loss": 0.0079, "step": 599710 }, { "epoch": 1.55, "learning_rate": 6.681588777052265e-05, "loss": 0.0082, "step": 599720 }, { "epoch": 1.55, "learning_rate": 6.681199955415118e-05, "loss": 0.0092, "step": 599730 }, { "epoch": 1.55, "learning_rate": 6.680811133777972e-05, "loss": 0.0078, "step": 599740 }, { "epoch": 1.55, "learning_rate": 6.680422312140825e-05, "loss": 0.0088, "step": 599750 }, { "epoch": 1.55, "learning_rate": 6.680033490503679e-05, "loss": 0.0063, "step": 599760 }, { "epoch": 1.55, "learning_rate": 6.679644668866533e-05, "loss": 0.0087, "step": 599770 }, { "epoch": 1.55, "learning_rate": 6.679255847229386e-05, "loss": 0.0092, "step": 599780 }, { "epoch": 1.55, "learning_rate": 6.67886702559224e-05, "loss": 0.009, "step": 599790 }, { "epoch": 1.55, "learning_rate": 6.678478203955093e-05, "loss": 0.0072, "step": 599800 }, { "epoch": 1.55, "learning_rate": 6.678089382317946e-05, "loss": 0.0078, "step": 599810 }, { "epoch": 1.55, "learning_rate": 6.6777005606808e-05, "loss": 0.008, "step": 599820 }, { "epoch": 1.55, "learning_rate": 6.677311739043653e-05, "loss": 0.0087, "step": 599830 }, { "epoch": 1.55, "learning_rate": 6.676922917406507e-05, "loss": 0.0121, "step": 599840 }, { "epoch": 1.55, "learning_rate": 6.67653409576936e-05, "loss": 0.0079, "step": 599850 }, { "epoch": 1.55, "learning_rate": 6.676145274132214e-05, "loss": 0.0091, "step": 599860 }, { "epoch": 1.55, "learning_rate": 6.675756452495068e-05, "loss": 0.0075, "step": 599870 }, { "epoch": 1.55, "learning_rate": 6.675367630857921e-05, "loss": 0.0072, "step": 599880 }, { "epoch": 1.56, "learning_rate": 6.674978809220775e-05, "loss": 0.0102, "step": 599890 }, { "epoch": 1.56, "learning_rate": 6.674589987583628e-05, "loss": 0.0079, "step": 599900 }, { "epoch": 1.56, "learning_rate": 6.674201165946482e-05, "loss": 0.0082, "step": 599910 }, { "epoch": 1.56, "learning_rate": 6.673812344309335e-05, "loss": 0.0095, "step": 599920 }, { "epoch": 1.56, "learning_rate": 6.673423522672189e-05, "loss": 0.0092, "step": 599930 }, { "epoch": 1.56, "learning_rate": 6.673034701035043e-05, "loss": 0.0092, "step": 599940 }, { "epoch": 1.56, "learning_rate": 6.672645879397896e-05, "loss": 0.0078, "step": 599950 }, { "epoch": 1.56, "learning_rate": 6.67225705776075e-05, "loss": 0.0104, "step": 599960 }, { "epoch": 1.56, "learning_rate": 6.671868236123603e-05, "loss": 0.0087, "step": 599970 }, { "epoch": 1.56, "learning_rate": 6.671479414486457e-05, "loss": 0.0091, "step": 599980 }, { "epoch": 1.56, "learning_rate": 6.67109059284931e-05, "loss": 0.0086, "step": 599990 }, { "epoch": 1.56, "learning_rate": 6.670701771212164e-05, "loss": 0.0143, "step": 600000 }, { "epoch": 1.56, "eval_cer": 0.88167329394755, "eval_loss": 0.005724812392145395, "eval_runtime": 107.7634, "eval_samples_per_second": 18.559, "eval_steps_per_second": 4.64, "step": 600000 }, { "epoch": 1.56, "learning_rate": 6.670312949575017e-05, "loss": 0.0087, "step": 600010 }, { "epoch": 1.56, "learning_rate": 6.669924127937871e-05, "loss": 0.0082, "step": 600020 }, { "epoch": 1.56, "learning_rate": 6.669535306300725e-05, "loss": 0.0091, "step": 600030 }, { "epoch": 1.56, "learning_rate": 6.669146484663578e-05, "loss": 0.009, "step": 600040 }, { "epoch": 1.56, "learning_rate": 6.668757663026431e-05, "loss": 0.0082, "step": 600050 }, { "epoch": 1.56, "learning_rate": 6.668368841389285e-05, "loss": 0.0089, "step": 600060 }, { "epoch": 1.56, "learning_rate": 6.667980019752138e-05, "loss": 0.01, "step": 600070 }, { "epoch": 1.56, "learning_rate": 6.667591198114992e-05, "loss": 0.0091, "step": 600080 }, { "epoch": 1.56, "learning_rate": 6.667202376477845e-05, "loss": 0.0097, "step": 600090 }, { "epoch": 1.56, "learning_rate": 6.666813554840699e-05, "loss": 0.0077, "step": 600100 }, { "epoch": 1.56, "learning_rate": 6.666424733203552e-05, "loss": 0.0079, "step": 600110 }, { "epoch": 1.56, "learning_rate": 6.666035911566406e-05, "loss": 0.0107, "step": 600120 }, { "epoch": 1.56, "learning_rate": 6.66564708992926e-05, "loss": 0.0074, "step": 600130 }, { "epoch": 1.56, "learning_rate": 6.665258268292113e-05, "loss": 0.008, "step": 600140 }, { "epoch": 1.56, "learning_rate": 6.664869446654967e-05, "loss": 0.0108, "step": 600150 }, { "epoch": 1.56, "learning_rate": 6.66448062501782e-05, "loss": 0.0075, "step": 600160 }, { "epoch": 1.56, "learning_rate": 6.664091803380674e-05, "loss": 0.007, "step": 600170 }, { "epoch": 1.56, "learning_rate": 6.663702981743527e-05, "loss": 0.0065, "step": 600180 }, { "epoch": 1.56, "learning_rate": 6.663314160106381e-05, "loss": 0.0062, "step": 600190 }, { "epoch": 1.56, "learning_rate": 6.662925338469235e-05, "loss": 0.0082, "step": 600200 }, { "epoch": 1.56, "learning_rate": 6.662536516832088e-05, "loss": 0.008, "step": 600210 }, { "epoch": 1.56, "learning_rate": 6.662147695194942e-05, "loss": 0.0093, "step": 600220 }, { "epoch": 1.56, "learning_rate": 6.661758873557795e-05, "loss": 0.0108, "step": 600230 }, { "epoch": 1.56, "learning_rate": 6.661370051920649e-05, "loss": 0.011, "step": 600240 }, { "epoch": 1.56, "learning_rate": 6.660981230283502e-05, "loss": 0.0079, "step": 600250 }, { "epoch": 1.56, "learning_rate": 6.660592408646356e-05, "loss": 0.0108, "step": 600260 }, { "epoch": 1.56, "learning_rate": 6.660203587009209e-05, "loss": 0.0105, "step": 600270 }, { "epoch": 1.56, "learning_rate": 6.659814765372063e-05, "loss": 0.0119, "step": 600280 }, { "epoch": 1.56, "learning_rate": 6.659425943734917e-05, "loss": 0.0065, "step": 600290 }, { "epoch": 1.56, "learning_rate": 6.65903712209777e-05, "loss": 0.0105, "step": 600300 }, { "epoch": 1.56, "learning_rate": 6.658648300460623e-05, "loss": 0.0068, "step": 600310 }, { "epoch": 1.56, "learning_rate": 6.658259478823477e-05, "loss": 0.0079, "step": 600320 }, { "epoch": 1.56, "learning_rate": 6.65787065718633e-05, "loss": 0.0062, "step": 600330 }, { "epoch": 1.56, "learning_rate": 6.657481835549184e-05, "loss": 0.0082, "step": 600340 }, { "epoch": 1.56, "learning_rate": 6.657093013912037e-05, "loss": 0.008, "step": 600350 }, { "epoch": 1.56, "learning_rate": 6.656704192274891e-05, "loss": 0.0094, "step": 600360 }, { "epoch": 1.56, "learning_rate": 6.656315370637744e-05, "loss": 0.0088, "step": 600370 }, { "epoch": 1.56, "learning_rate": 6.655926549000598e-05, "loss": 0.0056, "step": 600380 }, { "epoch": 1.56, "learning_rate": 6.655537727363452e-05, "loss": 0.008, "step": 600390 }, { "epoch": 1.56, "learning_rate": 6.655148905726305e-05, "loss": 0.0077, "step": 600400 }, { "epoch": 1.56, "learning_rate": 6.654760084089159e-05, "loss": 0.0078, "step": 600410 }, { "epoch": 1.56, "learning_rate": 6.654371262452012e-05, "loss": 0.0121, "step": 600420 }, { "epoch": 1.56, "learning_rate": 6.653982440814866e-05, "loss": 0.0121, "step": 600430 }, { "epoch": 1.56, "learning_rate": 6.653593619177719e-05, "loss": 0.0083, "step": 600440 }, { "epoch": 1.56, "learning_rate": 6.653204797540573e-05, "loss": 0.0074, "step": 600450 }, { "epoch": 1.56, "learning_rate": 6.652815975903426e-05, "loss": 0.01, "step": 600460 }, { "epoch": 1.56, "learning_rate": 6.65242715426628e-05, "loss": 0.009, "step": 600470 }, { "epoch": 1.56, "learning_rate": 6.652038332629134e-05, "loss": 0.0098, "step": 600480 }, { "epoch": 1.56, "learning_rate": 6.651649510991987e-05, "loss": 0.0093, "step": 600490 }, { "epoch": 1.56, "learning_rate": 6.651260689354841e-05, "loss": 0.0069, "step": 600500 }, { "epoch": 1.56, "learning_rate": 6.650871867717694e-05, "loss": 0.0128, "step": 600510 }, { "epoch": 1.56, "learning_rate": 6.650483046080548e-05, "loss": 0.0101, "step": 600520 }, { "epoch": 1.56, "learning_rate": 6.650094224443401e-05, "loss": 0.0082, "step": 600530 }, { "epoch": 1.56, "learning_rate": 6.649705402806255e-05, "loss": 0.009, "step": 600540 }, { "epoch": 1.56, "learning_rate": 6.649316581169108e-05, "loss": 0.0088, "step": 600550 }, { "epoch": 1.56, "learning_rate": 6.648927759531961e-05, "loss": 0.0079, "step": 600560 }, { "epoch": 1.56, "learning_rate": 6.648538937894815e-05, "loss": 0.0088, "step": 600570 }, { "epoch": 1.56, "learning_rate": 6.648150116257669e-05, "loss": 0.0119, "step": 600580 }, { "epoch": 1.56, "learning_rate": 6.647761294620522e-05, "loss": 0.011, "step": 600590 }, { "epoch": 1.56, "learning_rate": 6.647372472983376e-05, "loss": 0.0096, "step": 600600 }, { "epoch": 1.56, "learning_rate": 6.646983651346229e-05, "loss": 0.0096, "step": 600610 }, { "epoch": 1.56, "learning_rate": 6.646594829709083e-05, "loss": 0.0112, "step": 600620 }, { "epoch": 1.56, "learning_rate": 6.646206008071936e-05, "loss": 0.01, "step": 600630 }, { "epoch": 1.56, "learning_rate": 6.64581718643479e-05, "loss": 0.008, "step": 600640 }, { "epoch": 1.56, "learning_rate": 6.645428364797644e-05, "loss": 0.0132, "step": 600650 }, { "epoch": 1.56, "learning_rate": 6.645039543160497e-05, "loss": 0.0124, "step": 600660 }, { "epoch": 1.56, "learning_rate": 6.644650721523351e-05, "loss": 0.0085, "step": 600670 }, { "epoch": 1.56, "learning_rate": 6.644261899886204e-05, "loss": 0.0087, "step": 600680 }, { "epoch": 1.56, "learning_rate": 6.643873078249058e-05, "loss": 0.007, "step": 600690 }, { "epoch": 1.56, "learning_rate": 6.643484256611911e-05, "loss": 0.0091, "step": 600700 }, { "epoch": 1.56, "learning_rate": 6.643095434974765e-05, "loss": 0.01, "step": 600710 }, { "epoch": 1.56, "learning_rate": 6.642706613337618e-05, "loss": 0.0101, "step": 600720 }, { "epoch": 1.56, "learning_rate": 6.642317791700472e-05, "loss": 0.009, "step": 600730 }, { "epoch": 1.56, "learning_rate": 6.641928970063326e-05, "loss": 0.0071, "step": 600740 }, { "epoch": 1.56, "learning_rate": 6.641540148426179e-05, "loss": 0.0078, "step": 600750 }, { "epoch": 1.56, "learning_rate": 6.641151326789033e-05, "loss": 0.0092, "step": 600760 }, { "epoch": 1.56, "learning_rate": 6.640762505151886e-05, "loss": 0.0087, "step": 600770 }, { "epoch": 1.56, "learning_rate": 6.64037368351474e-05, "loss": 0.0089, "step": 600780 }, { "epoch": 1.56, "learning_rate": 6.639984861877593e-05, "loss": 0.0089, "step": 600790 }, { "epoch": 1.56, "learning_rate": 6.639596040240446e-05, "loss": 0.0158, "step": 600800 }, { "epoch": 1.56, "learning_rate": 6.6392072186033e-05, "loss": 0.0106, "step": 600810 }, { "epoch": 1.56, "learning_rate": 6.638818396966153e-05, "loss": 0.0124, "step": 600820 }, { "epoch": 1.56, "learning_rate": 6.638429575329007e-05, "loss": 0.0094, "step": 600830 }, { "epoch": 1.56, "learning_rate": 6.638040753691861e-05, "loss": 0.0108, "step": 600840 }, { "epoch": 1.56, "learning_rate": 6.637651932054714e-05, "loss": 0.0098, "step": 600850 }, { "epoch": 1.56, "learning_rate": 6.637263110417568e-05, "loss": 0.0073, "step": 600860 }, { "epoch": 1.56, "learning_rate": 6.636874288780421e-05, "loss": 0.0097, "step": 600870 }, { "epoch": 1.56, "learning_rate": 6.636485467143275e-05, "loss": 0.0109, "step": 600880 }, { "epoch": 1.56, "learning_rate": 6.636096645506128e-05, "loss": 0.0088, "step": 600890 }, { "epoch": 1.56, "learning_rate": 6.635707823868982e-05, "loss": 0.0098, "step": 600900 }, { "epoch": 1.56, "learning_rate": 6.635319002231836e-05, "loss": 0.0078, "step": 600910 }, { "epoch": 1.56, "learning_rate": 6.634930180594689e-05, "loss": 0.0076, "step": 600920 }, { "epoch": 1.56, "learning_rate": 6.634541358957543e-05, "loss": 0.0075, "step": 600930 }, { "epoch": 1.56, "learning_rate": 6.634152537320396e-05, "loss": 0.0098, "step": 600940 }, { "epoch": 1.56, "learning_rate": 6.63376371568325e-05, "loss": 0.0087, "step": 600950 }, { "epoch": 1.56, "learning_rate": 6.633374894046103e-05, "loss": 0.007, "step": 600960 }, { "epoch": 1.56, "learning_rate": 6.632986072408957e-05, "loss": 0.0064, "step": 600970 }, { "epoch": 1.56, "learning_rate": 6.63259725077181e-05, "loss": 0.0097, "step": 600980 }, { "epoch": 1.56, "learning_rate": 6.632208429134664e-05, "loss": 0.0065, "step": 600990 }, { "epoch": 1.56, "learning_rate": 6.631819607497518e-05, "loss": 0.0124, "step": 601000 }, { "epoch": 1.56, "eval_cer": 0.8817110841447728, "eval_loss": 0.005832574795931578, "eval_runtime": 107.8162, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.638, "step": 601000 }, { "epoch": 1.56, "learning_rate": 6.631430785860371e-05, "loss": 0.0098, "step": 601010 }, { "epoch": 1.56, "learning_rate": 6.631041964223225e-05, "loss": 0.0111, "step": 601020 }, { "epoch": 1.56, "learning_rate": 6.630653142586078e-05, "loss": 0.0087, "step": 601030 }, { "epoch": 1.56, "learning_rate": 6.630264320948931e-05, "loss": 0.0086, "step": 601040 }, { "epoch": 1.56, "learning_rate": 6.629875499311785e-05, "loss": 0.0123, "step": 601050 }, { "epoch": 1.56, "learning_rate": 6.629486677674638e-05, "loss": 0.0113, "step": 601060 }, { "epoch": 1.56, "learning_rate": 6.629097856037492e-05, "loss": 0.0111, "step": 601070 }, { "epoch": 1.56, "learning_rate": 6.628709034400345e-05, "loss": 0.01, "step": 601080 }, { "epoch": 1.56, "learning_rate": 6.628320212763199e-05, "loss": 0.0083, "step": 601090 }, { "epoch": 1.56, "learning_rate": 6.627931391126053e-05, "loss": 0.0084, "step": 601100 }, { "epoch": 1.56, "learning_rate": 6.627542569488906e-05, "loss": 0.0065, "step": 601110 }, { "epoch": 1.56, "learning_rate": 6.62715374785176e-05, "loss": 0.0061, "step": 601120 }, { "epoch": 1.56, "learning_rate": 6.626764926214613e-05, "loss": 0.0102, "step": 601130 }, { "epoch": 1.56, "learning_rate": 6.626376104577467e-05, "loss": 0.0075, "step": 601140 }, { "epoch": 1.56, "learning_rate": 6.62598728294032e-05, "loss": 0.0083, "step": 601150 }, { "epoch": 1.56, "learning_rate": 6.625598461303174e-05, "loss": 0.008, "step": 601160 }, { "epoch": 1.56, "learning_rate": 6.625209639666028e-05, "loss": 0.01, "step": 601170 }, { "epoch": 1.56, "learning_rate": 6.624820818028881e-05, "loss": 0.0061, "step": 601180 }, { "epoch": 1.56, "learning_rate": 6.624431996391735e-05, "loss": 0.0123, "step": 601190 }, { "epoch": 1.56, "learning_rate": 6.624043174754588e-05, "loss": 0.0075, "step": 601200 }, { "epoch": 1.56, "learning_rate": 6.623654353117442e-05, "loss": 0.0097, "step": 601210 }, { "epoch": 1.56, "learning_rate": 6.623265531480295e-05, "loss": 0.0089, "step": 601220 }, { "epoch": 1.56, "learning_rate": 6.622876709843149e-05, "loss": 0.0095, "step": 601230 }, { "epoch": 1.56, "learning_rate": 6.622487888206002e-05, "loss": 0.0077, "step": 601240 }, { "epoch": 1.56, "learning_rate": 6.622099066568856e-05, "loss": 0.0075, "step": 601250 }, { "epoch": 1.56, "learning_rate": 6.62171024493171e-05, "loss": 0.0133, "step": 601260 }, { "epoch": 1.56, "learning_rate": 6.621321423294563e-05, "loss": 0.0081, "step": 601270 }, { "epoch": 1.56, "learning_rate": 6.620932601657417e-05, "loss": 0.0083, "step": 601280 }, { "epoch": 1.56, "learning_rate": 6.62054378002027e-05, "loss": 0.0116, "step": 601290 }, { "epoch": 1.56, "learning_rate": 6.620154958383123e-05, "loss": 0.0101, "step": 601300 }, { "epoch": 1.56, "learning_rate": 6.619766136745977e-05, "loss": 0.0072, "step": 601310 }, { "epoch": 1.56, "learning_rate": 6.61937731510883e-05, "loss": 0.0084, "step": 601320 }, { "epoch": 1.56, "learning_rate": 6.618988493471684e-05, "loss": 0.0081, "step": 601330 }, { "epoch": 1.56, "learning_rate": 6.618599671834537e-05, "loss": 0.0105, "step": 601340 }, { "epoch": 1.56, "learning_rate": 6.618210850197391e-05, "loss": 0.0088, "step": 601350 }, { "epoch": 1.56, "learning_rate": 6.617822028560245e-05, "loss": 0.0083, "step": 601360 }, { "epoch": 1.56, "learning_rate": 6.617433206923098e-05, "loss": 0.0077, "step": 601370 }, { "epoch": 1.56, "learning_rate": 6.617044385285952e-05, "loss": 0.0097, "step": 601380 }, { "epoch": 1.56, "learning_rate": 6.616655563648805e-05, "loss": 0.0105, "step": 601390 }, { "epoch": 1.56, "learning_rate": 6.616266742011659e-05, "loss": 0.0101, "step": 601400 }, { "epoch": 1.56, "learning_rate": 6.615877920374512e-05, "loss": 0.0087, "step": 601410 }, { "epoch": 1.56, "learning_rate": 6.615489098737366e-05, "loss": 0.0107, "step": 601420 }, { "epoch": 1.56, "learning_rate": 6.61510027710022e-05, "loss": 0.0099, "step": 601430 }, { "epoch": 1.56, "learning_rate": 6.614711455463073e-05, "loss": 0.0076, "step": 601440 }, { "epoch": 1.56, "learning_rate": 6.614322633825927e-05, "loss": 0.0069, "step": 601450 }, { "epoch": 1.56, "learning_rate": 6.61393381218878e-05, "loss": 0.0065, "step": 601460 }, { "epoch": 1.56, "learning_rate": 6.613544990551634e-05, "loss": 0.0108, "step": 601470 }, { "epoch": 1.56, "learning_rate": 6.613156168914487e-05, "loss": 0.0078, "step": 601480 }, { "epoch": 1.56, "learning_rate": 6.612767347277341e-05, "loss": 0.0104, "step": 601490 }, { "epoch": 1.56, "learning_rate": 6.612378525640194e-05, "loss": 0.0084, "step": 601500 }, { "epoch": 1.56, "learning_rate": 6.611989704003048e-05, "loss": 0.0081, "step": 601510 }, { "epoch": 1.56, "learning_rate": 6.611600882365902e-05, "loss": 0.0097, "step": 601520 }, { "epoch": 1.56, "learning_rate": 6.611212060728755e-05, "loss": 0.0078, "step": 601530 }, { "epoch": 1.56, "learning_rate": 6.610823239091608e-05, "loss": 0.0094, "step": 601540 }, { "epoch": 1.56, "learning_rate": 6.610434417454462e-05, "loss": 0.0078, "step": 601550 }, { "epoch": 1.56, "learning_rate": 6.610045595817315e-05, "loss": 0.009, "step": 601560 }, { "epoch": 1.56, "learning_rate": 6.609656774180169e-05, "loss": 0.0087, "step": 601570 }, { "epoch": 1.56, "learning_rate": 6.609267952543022e-05, "loss": 0.0075, "step": 601580 }, { "epoch": 1.56, "learning_rate": 6.608879130905876e-05, "loss": 0.0071, "step": 601590 }, { "epoch": 1.56, "learning_rate": 6.608490309268729e-05, "loss": 0.0077, "step": 601600 }, { "epoch": 1.56, "learning_rate": 6.608101487631583e-05, "loss": 0.0088, "step": 601610 }, { "epoch": 1.56, "learning_rate": 6.607712665994437e-05, "loss": 0.0073, "step": 601620 }, { "epoch": 1.56, "learning_rate": 6.60732384435729e-05, "loss": 0.0099, "step": 601630 }, { "epoch": 1.56, "learning_rate": 6.606935022720144e-05, "loss": 0.0121, "step": 601640 }, { "epoch": 1.56, "learning_rate": 6.606546201082997e-05, "loss": 0.0078, "step": 601650 }, { "epoch": 1.56, "learning_rate": 6.606157379445851e-05, "loss": 0.0079, "step": 601660 }, { "epoch": 1.56, "learning_rate": 6.605768557808704e-05, "loss": 0.0097, "step": 601670 }, { "epoch": 1.56, "learning_rate": 6.605379736171558e-05, "loss": 0.0083, "step": 601680 }, { "epoch": 1.56, "learning_rate": 6.604990914534412e-05, "loss": 0.0093, "step": 601690 }, { "epoch": 1.56, "learning_rate": 6.604602092897265e-05, "loss": 0.0095, "step": 601700 }, { "epoch": 1.56, "learning_rate": 6.604213271260119e-05, "loss": 0.0134, "step": 601710 }, { "epoch": 1.56, "learning_rate": 6.603824449622972e-05, "loss": 0.0096, "step": 601720 }, { "epoch": 1.56, "learning_rate": 6.603435627985826e-05, "loss": 0.0075, "step": 601730 }, { "epoch": 1.56, "learning_rate": 6.603046806348679e-05, "loss": 0.0077, "step": 601740 }, { "epoch": 1.56, "learning_rate": 6.602657984711533e-05, "loss": 0.0071, "step": 601750 }, { "epoch": 1.56, "learning_rate": 6.602269163074386e-05, "loss": 0.0073, "step": 601760 }, { "epoch": 1.56, "learning_rate": 6.60188034143724e-05, "loss": 0.0092, "step": 601770 }, { "epoch": 1.56, "learning_rate": 6.601491519800094e-05, "loss": 0.0067, "step": 601780 }, { "epoch": 1.56, "learning_rate": 6.601102698162947e-05, "loss": 0.0103, "step": 601790 }, { "epoch": 1.56, "learning_rate": 6.6007138765258e-05, "loss": 0.0107, "step": 601800 }, { "epoch": 1.56, "learning_rate": 6.600325054888654e-05, "loss": 0.009, "step": 601810 }, { "epoch": 1.56, "learning_rate": 6.599936233251507e-05, "loss": 0.0071, "step": 601820 }, { "epoch": 1.56, "learning_rate": 6.599547411614361e-05, "loss": 0.0101, "step": 601830 }, { "epoch": 1.56, "learning_rate": 6.599158589977214e-05, "loss": 0.007, "step": 601840 }, { "epoch": 1.56, "learning_rate": 6.598769768340068e-05, "loss": 0.0064, "step": 601850 }, { "epoch": 1.56, "learning_rate": 6.598380946702921e-05, "loss": 0.0088, "step": 601860 }, { "epoch": 1.56, "learning_rate": 6.597992125065775e-05, "loss": 0.0098, "step": 601870 }, { "epoch": 1.56, "learning_rate": 6.597603303428629e-05, "loss": 0.0095, "step": 601880 }, { "epoch": 1.56, "learning_rate": 6.597214481791482e-05, "loss": 0.01, "step": 601890 }, { "epoch": 1.56, "learning_rate": 6.596825660154336e-05, "loss": 0.0119, "step": 601900 }, { "epoch": 1.56, "learning_rate": 6.596436838517189e-05, "loss": 0.0071, "step": 601910 }, { "epoch": 1.56, "learning_rate": 6.596048016880043e-05, "loss": 0.0076, "step": 601920 }, { "epoch": 1.56, "learning_rate": 6.595659195242896e-05, "loss": 0.0066, "step": 601930 }, { "epoch": 1.56, "learning_rate": 6.59527037360575e-05, "loss": 0.006, "step": 601940 }, { "epoch": 1.56, "learning_rate": 6.594881551968603e-05, "loss": 0.01, "step": 601950 }, { "epoch": 1.56, "learning_rate": 6.594492730331457e-05, "loss": 0.0086, "step": 601960 }, { "epoch": 1.56, "learning_rate": 6.594103908694311e-05, "loss": 0.0081, "step": 601970 }, { "epoch": 1.56, "learning_rate": 6.593715087057164e-05, "loss": 0.0072, "step": 601980 }, { "epoch": 1.56, "learning_rate": 6.593326265420018e-05, "loss": 0.0094, "step": 601990 }, { "epoch": 1.56, "learning_rate": 6.592937443782871e-05, "loss": 0.0099, "step": 602000 }, { "epoch": 1.56, "eval_cer": 0.8817208816033121, "eval_loss": 0.005837557837367058, "eval_runtime": 107.7975, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 602000 }, { "epoch": 1.56, "learning_rate": 6.592548622145725e-05, "loss": 0.0063, "step": 602010 }, { "epoch": 1.56, "learning_rate": 6.592159800508578e-05, "loss": 0.0104, "step": 602020 }, { "epoch": 1.56, "learning_rate": 6.591770978871432e-05, "loss": 0.0086, "step": 602030 }, { "epoch": 1.56, "learning_rate": 6.591382157234285e-05, "loss": 0.0066, "step": 602040 }, { "epoch": 1.56, "learning_rate": 6.590993335597138e-05, "loss": 0.0067, "step": 602050 }, { "epoch": 1.56, "learning_rate": 6.590604513959992e-05, "loss": 0.0074, "step": 602060 }, { "epoch": 1.56, "learning_rate": 6.590215692322846e-05, "loss": 0.011, "step": 602070 }, { "epoch": 1.56, "learning_rate": 6.589826870685699e-05, "loss": 0.0068, "step": 602080 }, { "epoch": 1.56, "learning_rate": 6.589438049048553e-05, "loss": 0.0078, "step": 602090 }, { "epoch": 1.56, "learning_rate": 6.589049227411406e-05, "loss": 0.0103, "step": 602100 }, { "epoch": 1.56, "learning_rate": 6.58866040577426e-05, "loss": 0.0112, "step": 602110 }, { "epoch": 1.56, "learning_rate": 6.588271584137113e-05, "loss": 0.0069, "step": 602120 }, { "epoch": 1.56, "learning_rate": 6.587882762499967e-05, "loss": 0.0076, "step": 602130 }, { "epoch": 1.56, "learning_rate": 6.587493940862821e-05, "loss": 0.0092, "step": 602140 }, { "epoch": 1.56, "learning_rate": 6.587105119225674e-05, "loss": 0.0118, "step": 602150 }, { "epoch": 1.56, "learning_rate": 6.586716297588528e-05, "loss": 0.013, "step": 602160 }, { "epoch": 1.56, "learning_rate": 6.586327475951381e-05, "loss": 0.0072, "step": 602170 }, { "epoch": 1.56, "learning_rate": 6.585938654314235e-05, "loss": 0.0082, "step": 602180 }, { "epoch": 1.56, "learning_rate": 6.585549832677088e-05, "loss": 0.0095, "step": 602190 }, { "epoch": 1.56, "learning_rate": 6.585161011039942e-05, "loss": 0.0088, "step": 602200 }, { "epoch": 1.56, "learning_rate": 6.584772189402795e-05, "loss": 0.0056, "step": 602210 }, { "epoch": 1.56, "learning_rate": 6.584383367765649e-05, "loss": 0.0086, "step": 602220 }, { "epoch": 1.56, "learning_rate": 6.583994546128503e-05, "loss": 0.0081, "step": 602230 }, { "epoch": 1.56, "learning_rate": 6.583605724491356e-05, "loss": 0.0093, "step": 602240 }, { "epoch": 1.56, "learning_rate": 6.58321690285421e-05, "loss": 0.0087, "step": 602250 }, { "epoch": 1.56, "learning_rate": 6.582828081217063e-05, "loss": 0.0085, "step": 602260 }, { "epoch": 1.56, "learning_rate": 6.582439259579917e-05, "loss": 0.0095, "step": 602270 }, { "epoch": 1.56, "learning_rate": 6.58205043794277e-05, "loss": 0.0097, "step": 602280 }, { "epoch": 1.56, "learning_rate": 6.581661616305623e-05, "loss": 0.0081, "step": 602290 }, { "epoch": 1.56, "learning_rate": 6.581272794668477e-05, "loss": 0.008, "step": 602300 }, { "epoch": 1.56, "learning_rate": 6.58088397303133e-05, "loss": 0.0082, "step": 602310 }, { "epoch": 1.56, "learning_rate": 6.580495151394184e-05, "loss": 0.0102, "step": 602320 }, { "epoch": 1.56, "learning_rate": 6.580106329757038e-05, "loss": 0.0092, "step": 602330 }, { "epoch": 1.56, "learning_rate": 6.579717508119891e-05, "loss": 0.0069, "step": 602340 }, { "epoch": 1.56, "learning_rate": 6.579328686482745e-05, "loss": 0.0093, "step": 602350 }, { "epoch": 1.56, "learning_rate": 6.578939864845598e-05, "loss": 0.0068, "step": 602360 }, { "epoch": 1.56, "learning_rate": 6.578551043208452e-05, "loss": 0.0105, "step": 602370 }, { "epoch": 1.56, "learning_rate": 6.578162221571305e-05, "loss": 0.0087, "step": 602380 }, { "epoch": 1.56, "learning_rate": 6.577773399934159e-05, "loss": 0.0084, "step": 602390 }, { "epoch": 1.56, "learning_rate": 6.577384578297013e-05, "loss": 0.008, "step": 602400 }, { "epoch": 1.56, "learning_rate": 6.576995756659866e-05, "loss": 0.0096, "step": 602410 }, { "epoch": 1.56, "learning_rate": 6.57660693502272e-05, "loss": 0.0142, "step": 602420 }, { "epoch": 1.56, "learning_rate": 6.576218113385573e-05, "loss": 0.0094, "step": 602430 }, { "epoch": 1.56, "learning_rate": 6.575829291748427e-05, "loss": 0.0077, "step": 602440 }, { "epoch": 1.56, "learning_rate": 6.57544047011128e-05, "loss": 0.0091, "step": 602450 }, { "epoch": 1.56, "learning_rate": 6.575051648474134e-05, "loss": 0.0113, "step": 602460 }, { "epoch": 1.56, "learning_rate": 6.574662826836987e-05, "loss": 0.0102, "step": 602470 }, { "epoch": 1.56, "learning_rate": 6.574274005199841e-05, "loss": 0.0086, "step": 602480 }, { "epoch": 1.56, "learning_rate": 6.573885183562695e-05, "loss": 0.0086, "step": 602490 }, { "epoch": 1.56, "learning_rate": 6.573496361925548e-05, "loss": 0.0062, "step": 602500 }, { "epoch": 1.56, "learning_rate": 6.573107540288402e-05, "loss": 0.0085, "step": 602510 }, { "epoch": 1.56, "learning_rate": 6.572718718651255e-05, "loss": 0.0078, "step": 602520 }, { "epoch": 1.56, "learning_rate": 6.572329897014108e-05, "loss": 0.0067, "step": 602530 }, { "epoch": 1.56, "learning_rate": 6.571941075376962e-05, "loss": 0.0092, "step": 602540 }, { "epoch": 1.56, "learning_rate": 6.571552253739815e-05, "loss": 0.0078, "step": 602550 }, { "epoch": 1.56, "learning_rate": 6.571163432102669e-05, "loss": 0.0066, "step": 602560 }, { "epoch": 1.56, "learning_rate": 6.570774610465522e-05, "loss": 0.0103, "step": 602570 }, { "epoch": 1.56, "learning_rate": 6.570385788828376e-05, "loss": 0.0101, "step": 602580 }, { "epoch": 1.56, "learning_rate": 6.56999696719123e-05, "loss": 0.0081, "step": 602590 }, { "epoch": 1.56, "learning_rate": 6.569608145554083e-05, "loss": 0.0068, "step": 602600 }, { "epoch": 1.56, "learning_rate": 6.569219323916937e-05, "loss": 0.0084, "step": 602610 }, { "epoch": 1.56, "learning_rate": 6.56883050227979e-05, "loss": 0.01, "step": 602620 }, { "epoch": 1.56, "learning_rate": 6.568441680642644e-05, "loss": 0.0064, "step": 602630 }, { "epoch": 1.56, "learning_rate": 6.568052859005497e-05, "loss": 0.0087, "step": 602640 }, { "epoch": 1.56, "learning_rate": 6.567664037368351e-05, "loss": 0.0111, "step": 602650 }, { "epoch": 1.56, "learning_rate": 6.567275215731205e-05, "loss": 0.0072, "step": 602660 }, { "epoch": 1.56, "learning_rate": 6.566886394094058e-05, "loss": 0.0126, "step": 602670 }, { "epoch": 1.56, "learning_rate": 6.566497572456912e-05, "loss": 0.0094, "step": 602680 }, { "epoch": 1.56, "learning_rate": 6.566108750819765e-05, "loss": 0.0078, "step": 602690 }, { "epoch": 1.56, "learning_rate": 6.565719929182619e-05, "loss": 0.0101, "step": 602700 }, { "epoch": 1.56, "learning_rate": 6.565331107545472e-05, "loss": 0.008, "step": 602710 }, { "epoch": 1.56, "learning_rate": 6.564942285908326e-05, "loss": 0.0092, "step": 602720 }, { "epoch": 1.56, "learning_rate": 6.564553464271179e-05, "loss": 0.0085, "step": 602730 }, { "epoch": 1.56, "learning_rate": 6.564164642634033e-05, "loss": 0.0111, "step": 602740 }, { "epoch": 1.56, "learning_rate": 6.563775820996887e-05, "loss": 0.0061, "step": 602750 }, { "epoch": 1.56, "learning_rate": 6.56338699935974e-05, "loss": 0.008, "step": 602760 }, { "epoch": 1.56, "learning_rate": 6.562998177722594e-05, "loss": 0.0063, "step": 602770 }, { "epoch": 1.56, "learning_rate": 6.562609356085447e-05, "loss": 0.0057, "step": 602780 }, { "epoch": 1.56, "learning_rate": 6.5622205344483e-05, "loss": 0.0087, "step": 602790 }, { "epoch": 1.56, "learning_rate": 6.561831712811154e-05, "loss": 0.0088, "step": 602800 }, { "epoch": 1.56, "learning_rate": 6.561442891174007e-05, "loss": 0.0102, "step": 602810 }, { "epoch": 1.56, "learning_rate": 6.561054069536861e-05, "loss": 0.012, "step": 602820 }, { "epoch": 1.56, "learning_rate": 6.560665247899714e-05, "loss": 0.0084, "step": 602830 }, { "epoch": 1.56, "learning_rate": 6.560276426262568e-05, "loss": 0.0079, "step": 602840 }, { "epoch": 1.56, "learning_rate": 6.559887604625422e-05, "loss": 0.009, "step": 602850 }, { "epoch": 1.56, "learning_rate": 6.559498782988275e-05, "loss": 0.0085, "step": 602860 }, { "epoch": 1.56, "learning_rate": 6.559109961351129e-05, "loss": 0.0114, "step": 602870 }, { "epoch": 1.56, "learning_rate": 6.558721139713982e-05, "loss": 0.0096, "step": 602880 }, { "epoch": 1.56, "learning_rate": 6.558332318076836e-05, "loss": 0.0084, "step": 602890 }, { "epoch": 1.56, "learning_rate": 6.557943496439689e-05, "loss": 0.0115, "step": 602900 }, { "epoch": 1.56, "learning_rate": 6.557554674802543e-05, "loss": 0.0069, "step": 602910 }, { "epoch": 1.56, "learning_rate": 6.557165853165397e-05, "loss": 0.0104, "step": 602920 }, { "epoch": 1.56, "learning_rate": 6.55677703152825e-05, "loss": 0.0089, "step": 602930 }, { "epoch": 1.56, "learning_rate": 6.556388209891104e-05, "loss": 0.0081, "step": 602940 }, { "epoch": 1.56, "learning_rate": 6.555999388253957e-05, "loss": 0.0067, "step": 602950 }, { "epoch": 1.56, "learning_rate": 6.555610566616811e-05, "loss": 0.0093, "step": 602960 }, { "epoch": 1.56, "learning_rate": 6.555221744979664e-05, "loss": 0.0086, "step": 602970 }, { "epoch": 1.56, "learning_rate": 6.554832923342518e-05, "loss": 0.0063, "step": 602980 }, { "epoch": 1.56, "learning_rate": 6.554444101705371e-05, "loss": 0.0088, "step": 602990 }, { "epoch": 1.56, "learning_rate": 6.554055280068225e-05, "loss": 0.0106, "step": 603000 }, { "epoch": 1.56, "eval_cer": 0.8816788924952867, "eval_loss": 0.005703043192625046, "eval_runtime": 107.9387, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 603000 }, { "epoch": 1.56, "learning_rate": 6.553666458431079e-05, "loss": 0.0093, "step": 603010 }, { "epoch": 1.56, "learning_rate": 6.553277636793932e-05, "loss": 0.0096, "step": 603020 }, { "epoch": 1.56, "learning_rate": 6.552888815156785e-05, "loss": 0.01, "step": 603030 }, { "epoch": 1.56, "learning_rate": 6.552499993519639e-05, "loss": 0.0116, "step": 603040 }, { "epoch": 1.56, "learning_rate": 6.552111171882492e-05, "loss": 0.011, "step": 603050 }, { "epoch": 1.56, "learning_rate": 6.551722350245346e-05, "loss": 0.0083, "step": 603060 }, { "epoch": 1.56, "learning_rate": 6.551333528608199e-05, "loss": 0.009, "step": 603070 }, { "epoch": 1.56, "learning_rate": 6.550944706971053e-05, "loss": 0.0116, "step": 603080 }, { "epoch": 1.56, "learning_rate": 6.550555885333906e-05, "loss": 0.0072, "step": 603090 }, { "epoch": 1.56, "learning_rate": 6.55016706369676e-05, "loss": 0.0077, "step": 603100 }, { "epoch": 1.56, "learning_rate": 6.549778242059614e-05, "loss": 0.008, "step": 603110 }, { "epoch": 1.56, "learning_rate": 6.549389420422467e-05, "loss": 0.0132, "step": 603120 }, { "epoch": 1.56, "learning_rate": 6.549000598785321e-05, "loss": 0.0094, "step": 603130 }, { "epoch": 1.56, "learning_rate": 6.548611777148174e-05, "loss": 0.0091, "step": 603140 }, { "epoch": 1.56, "learning_rate": 6.548222955511028e-05, "loss": 0.0097, "step": 603150 }, { "epoch": 1.56, "learning_rate": 6.547834133873881e-05, "loss": 0.0079, "step": 603160 }, { "epoch": 1.56, "learning_rate": 6.547445312236735e-05, "loss": 0.01, "step": 603170 }, { "epoch": 1.56, "learning_rate": 6.547056490599588e-05, "loss": 0.0101, "step": 603180 }, { "epoch": 1.56, "learning_rate": 6.546667668962442e-05, "loss": 0.0098, "step": 603190 }, { "epoch": 1.56, "learning_rate": 6.546278847325296e-05, "loss": 0.0079, "step": 603200 }, { "epoch": 1.56, "learning_rate": 6.545890025688149e-05, "loss": 0.0103, "step": 603210 }, { "epoch": 1.56, "learning_rate": 6.545501204051003e-05, "loss": 0.0077, "step": 603220 }, { "epoch": 1.56, "learning_rate": 6.545112382413856e-05, "loss": 0.0092, "step": 603230 }, { "epoch": 1.56, "learning_rate": 6.54472356077671e-05, "loss": 0.0085, "step": 603240 }, { "epoch": 1.56, "learning_rate": 6.544334739139563e-05, "loss": 0.0058, "step": 603250 }, { "epoch": 1.56, "learning_rate": 6.543945917502417e-05, "loss": 0.0074, "step": 603260 }, { "epoch": 1.56, "learning_rate": 6.543557095865271e-05, "loss": 0.0076, "step": 603270 }, { "epoch": 1.56, "learning_rate": 6.543168274228124e-05, "loss": 0.0091, "step": 603280 }, { "epoch": 1.56, "learning_rate": 6.542779452590977e-05, "loss": 0.0113, "step": 603290 }, { "epoch": 1.56, "learning_rate": 6.542390630953831e-05, "loss": 0.008, "step": 603300 }, { "epoch": 1.56, "learning_rate": 6.542001809316684e-05, "loss": 0.0099, "step": 603310 }, { "epoch": 1.56, "learning_rate": 6.541612987679538e-05, "loss": 0.012, "step": 603320 }, { "epoch": 1.56, "learning_rate": 6.541224166042391e-05, "loss": 0.0093, "step": 603330 }, { "epoch": 1.56, "learning_rate": 6.540835344405245e-05, "loss": 0.0082, "step": 603340 }, { "epoch": 1.56, "learning_rate": 6.540446522768098e-05, "loss": 0.0074, "step": 603350 }, { "epoch": 1.56, "learning_rate": 6.540057701130952e-05, "loss": 0.0072, "step": 603360 }, { "epoch": 1.56, "learning_rate": 6.539668879493806e-05, "loss": 0.0072, "step": 603370 }, { "epoch": 1.56, "learning_rate": 6.539280057856659e-05, "loss": 0.0062, "step": 603380 }, { "epoch": 1.56, "learning_rate": 6.538891236219513e-05, "loss": 0.007, "step": 603390 }, { "epoch": 1.56, "learning_rate": 6.538502414582366e-05, "loss": 0.0099, "step": 603400 }, { "epoch": 1.56, "learning_rate": 6.53811359294522e-05, "loss": 0.0091, "step": 603410 }, { "epoch": 1.56, "learning_rate": 6.537724771308073e-05, "loss": 0.0061, "step": 603420 }, { "epoch": 1.56, "learning_rate": 6.537335949670927e-05, "loss": 0.0082, "step": 603430 }, { "epoch": 1.56, "learning_rate": 6.53694712803378e-05, "loss": 0.0073, "step": 603440 }, { "epoch": 1.56, "learning_rate": 6.536558306396634e-05, "loss": 0.0079, "step": 603450 }, { "epoch": 1.56, "learning_rate": 6.536169484759488e-05, "loss": 0.0112, "step": 603460 }, { "epoch": 1.56, "learning_rate": 6.535780663122341e-05, "loss": 0.0101, "step": 603470 }, { "epoch": 1.56, "learning_rate": 6.535391841485195e-05, "loss": 0.0089, "step": 603480 }, { "epoch": 1.56, "learning_rate": 6.535003019848048e-05, "loss": 0.0096, "step": 603490 }, { "epoch": 1.56, "learning_rate": 6.534614198210902e-05, "loss": 0.0066, "step": 603500 }, { "epoch": 1.56, "learning_rate": 6.534225376573755e-05, "loss": 0.0087, "step": 603510 }, { "epoch": 1.56, "learning_rate": 6.533836554936608e-05, "loss": 0.0075, "step": 603520 }, { "epoch": 1.56, "learning_rate": 6.533447733299462e-05, "loss": 0.0098, "step": 603530 }, { "epoch": 1.56, "learning_rate": 6.533058911662315e-05, "loss": 0.0079, "step": 603540 }, { "epoch": 1.56, "learning_rate": 6.532670090025169e-05, "loss": 0.0102, "step": 603550 }, { "epoch": 1.56, "learning_rate": 6.532281268388023e-05, "loss": 0.0108, "step": 603560 }, { "epoch": 1.56, "learning_rate": 6.531892446750876e-05, "loss": 0.0078, "step": 603570 }, { "epoch": 1.56, "learning_rate": 6.53150362511373e-05, "loss": 0.0098, "step": 603580 }, { "epoch": 1.56, "learning_rate": 6.531114803476583e-05, "loss": 0.0082, "step": 603590 }, { "epoch": 1.56, "learning_rate": 6.530725981839437e-05, "loss": 0.0072, "step": 603600 }, { "epoch": 1.56, "learning_rate": 6.53033716020229e-05, "loss": 0.0086, "step": 603610 }, { "epoch": 1.56, "learning_rate": 6.529948338565144e-05, "loss": 0.006, "step": 603620 }, { "epoch": 1.56, "learning_rate": 6.529559516927998e-05, "loss": 0.0064, "step": 603630 }, { "epoch": 1.56, "learning_rate": 6.529170695290851e-05, "loss": 0.01, "step": 603640 }, { "epoch": 1.56, "learning_rate": 6.528781873653705e-05, "loss": 0.006, "step": 603650 }, { "epoch": 1.56, "learning_rate": 6.528393052016558e-05, "loss": 0.0105, "step": 603660 }, { "epoch": 1.56, "learning_rate": 6.528004230379412e-05, "loss": 0.0127, "step": 603670 }, { "epoch": 1.56, "learning_rate": 6.527615408742265e-05, "loss": 0.0078, "step": 603680 }, { "epoch": 1.56, "learning_rate": 6.527226587105119e-05, "loss": 0.0077, "step": 603690 }, { "epoch": 1.56, "learning_rate": 6.526837765467972e-05, "loss": 0.0075, "step": 603700 }, { "epoch": 1.56, "learning_rate": 6.526448943830826e-05, "loss": 0.0091, "step": 603710 }, { "epoch": 1.56, "learning_rate": 6.52606012219368e-05, "loss": 0.0106, "step": 603720 }, { "epoch": 1.56, "learning_rate": 6.525671300556533e-05, "loss": 0.0073, "step": 603730 }, { "epoch": 1.56, "learning_rate": 6.525282478919387e-05, "loss": 0.0079, "step": 603740 }, { "epoch": 1.57, "learning_rate": 6.52489365728224e-05, "loss": 0.0097, "step": 603750 }, { "epoch": 1.57, "learning_rate": 6.524504835645094e-05, "loss": 0.0102, "step": 603760 }, { "epoch": 1.57, "learning_rate": 6.524116014007947e-05, "loss": 0.0089, "step": 603770 }, { "epoch": 1.57, "learning_rate": 6.5237271923708e-05, "loss": 0.0085, "step": 603780 }, { "epoch": 1.57, "learning_rate": 6.523338370733654e-05, "loss": 0.0058, "step": 603790 }, { "epoch": 1.57, "learning_rate": 6.522949549096507e-05, "loss": 0.0075, "step": 603800 }, { "epoch": 1.57, "learning_rate": 6.522560727459361e-05, "loss": 0.0123, "step": 603810 }, { "epoch": 1.57, "learning_rate": 6.522171905822215e-05, "loss": 0.0083, "step": 603820 }, { "epoch": 1.57, "learning_rate": 6.521783084185068e-05, "loss": 0.0099, "step": 603830 }, { "epoch": 1.57, "learning_rate": 6.521394262547922e-05, "loss": 0.0064, "step": 603840 }, { "epoch": 1.57, "learning_rate": 6.521005440910775e-05, "loss": 0.008, "step": 603850 }, { "epoch": 1.57, "learning_rate": 6.520616619273629e-05, "loss": 0.01, "step": 603860 }, { "epoch": 1.57, "learning_rate": 6.520227797636482e-05, "loss": 0.0113, "step": 603870 }, { "epoch": 1.57, "learning_rate": 6.519838975999336e-05, "loss": 0.0079, "step": 603880 }, { "epoch": 1.57, "learning_rate": 6.51945015436219e-05, "loss": 0.0084, "step": 603890 }, { "epoch": 1.57, "learning_rate": 6.519061332725043e-05, "loss": 0.0073, "step": 603900 }, { "epoch": 1.57, "learning_rate": 6.518672511087897e-05, "loss": 0.0081, "step": 603910 }, { "epoch": 1.57, "learning_rate": 6.51828368945075e-05, "loss": 0.0092, "step": 603920 }, { "epoch": 1.57, "learning_rate": 6.517894867813604e-05, "loss": 0.0129, "step": 603930 }, { "epoch": 1.57, "learning_rate": 6.517506046176457e-05, "loss": 0.0075, "step": 603940 }, { "epoch": 1.57, "learning_rate": 6.517117224539311e-05, "loss": 0.0062, "step": 603950 }, { "epoch": 1.57, "learning_rate": 6.516728402902164e-05, "loss": 0.0077, "step": 603960 }, { "epoch": 1.57, "learning_rate": 6.516339581265018e-05, "loss": 0.0072, "step": 603970 }, { "epoch": 1.57, "learning_rate": 6.515950759627872e-05, "loss": 0.0118, "step": 603980 }, { "epoch": 1.57, "learning_rate": 6.515561937990725e-05, "loss": 0.0097, "step": 603990 }, { "epoch": 1.57, "learning_rate": 6.515173116353579e-05, "loss": 0.0073, "step": 604000 }, { "epoch": 1.57, "eval_cer": 0.8817110841447728, "eval_loss": 0.005707249511033297, "eval_runtime": 107.7161, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 604000 }, { "epoch": 1.57, "learning_rate": 6.514784294716432e-05, "loss": 0.0092, "step": 604010 }, { "epoch": 1.57, "learning_rate": 6.514395473079285e-05, "loss": 0.0114, "step": 604020 }, { "epoch": 1.57, "learning_rate": 6.514006651442139e-05, "loss": 0.008, "step": 604030 }, { "epoch": 1.57, "learning_rate": 6.513617829804992e-05, "loss": 0.0076, "step": 604040 }, { "epoch": 1.57, "learning_rate": 6.513229008167846e-05, "loss": 0.0082, "step": 604050 }, { "epoch": 1.57, "learning_rate": 6.512840186530699e-05, "loss": 0.0106, "step": 604060 }, { "epoch": 1.57, "learning_rate": 6.512451364893553e-05, "loss": 0.0069, "step": 604070 }, { "epoch": 1.57, "learning_rate": 6.512062543256407e-05, "loss": 0.0091, "step": 604080 }, { "epoch": 1.57, "learning_rate": 6.51167372161926e-05, "loss": 0.0106, "step": 604090 }, { "epoch": 1.57, "learning_rate": 6.511284899982114e-05, "loss": 0.0103, "step": 604100 }, { "epoch": 1.57, "learning_rate": 6.510896078344967e-05, "loss": 0.007, "step": 604110 }, { "epoch": 1.57, "learning_rate": 6.510507256707821e-05, "loss": 0.0099, "step": 604120 }, { "epoch": 1.57, "learning_rate": 6.510118435070674e-05, "loss": 0.0082, "step": 604130 }, { "epoch": 1.57, "learning_rate": 6.509729613433528e-05, "loss": 0.0073, "step": 604140 }, { "epoch": 1.57, "learning_rate": 6.509340791796382e-05, "loss": 0.0098, "step": 604150 }, { "epoch": 1.57, "learning_rate": 6.508951970159235e-05, "loss": 0.0075, "step": 604160 }, { "epoch": 1.57, "learning_rate": 6.508563148522089e-05, "loss": 0.0104, "step": 604170 }, { "epoch": 1.57, "learning_rate": 6.508174326884942e-05, "loss": 0.0075, "step": 604180 }, { "epoch": 1.57, "learning_rate": 6.507785505247796e-05, "loss": 0.0068, "step": 604190 }, { "epoch": 1.57, "learning_rate": 6.507396683610649e-05, "loss": 0.0065, "step": 604200 }, { "epoch": 1.57, "learning_rate": 6.507007861973503e-05, "loss": 0.0076, "step": 604210 }, { "epoch": 1.57, "learning_rate": 6.506619040336356e-05, "loss": 0.0071, "step": 604220 }, { "epoch": 1.57, "learning_rate": 6.50623021869921e-05, "loss": 0.0079, "step": 604230 }, { "epoch": 1.57, "learning_rate": 6.505841397062064e-05, "loss": 0.0113, "step": 604240 }, { "epoch": 1.57, "learning_rate": 6.505452575424917e-05, "loss": 0.0107, "step": 604250 }, { "epoch": 1.57, "learning_rate": 6.505063753787771e-05, "loss": 0.0104, "step": 604260 }, { "epoch": 1.57, "learning_rate": 6.504674932150624e-05, "loss": 0.0076, "step": 604270 }, { "epoch": 1.57, "learning_rate": 6.504286110513477e-05, "loss": 0.0116, "step": 604280 }, { "epoch": 1.57, "learning_rate": 6.503897288876331e-05, "loss": 0.0079, "step": 604290 }, { "epoch": 1.57, "learning_rate": 6.503508467239184e-05, "loss": 0.0081, "step": 604300 }, { "epoch": 1.57, "learning_rate": 6.503119645602038e-05, "loss": 0.0093, "step": 604310 }, { "epoch": 1.57, "learning_rate": 6.50273082396489e-05, "loss": 0.0114, "step": 604320 }, { "epoch": 1.57, "learning_rate": 6.502342002327745e-05, "loss": 0.0088, "step": 604330 }, { "epoch": 1.57, "learning_rate": 6.501953180690599e-05, "loss": 0.0112, "step": 604340 }, { "epoch": 1.57, "learning_rate": 6.501564359053452e-05, "loss": 0.0077, "step": 604350 }, { "epoch": 1.57, "learning_rate": 6.501175537416306e-05, "loss": 0.0091, "step": 604360 }, { "epoch": 1.57, "learning_rate": 6.500786715779159e-05, "loss": 0.0114, "step": 604370 }, { "epoch": 1.57, "learning_rate": 6.500397894142013e-05, "loss": 0.0074, "step": 604380 }, { "epoch": 1.57, "learning_rate": 6.500009072504866e-05, "loss": 0.0107, "step": 604390 }, { "epoch": 1.57, "learning_rate": 6.49962025086772e-05, "loss": 0.0096, "step": 604400 }, { "epoch": 1.57, "learning_rate": 6.499231429230574e-05, "loss": 0.0122, "step": 604410 }, { "epoch": 1.57, "learning_rate": 6.498842607593427e-05, "loss": 0.0082, "step": 604420 }, { "epoch": 1.57, "learning_rate": 6.498453785956281e-05, "loss": 0.0051, "step": 604430 }, { "epoch": 1.57, "learning_rate": 6.498064964319134e-05, "loss": 0.0089, "step": 604440 }, { "epoch": 1.57, "learning_rate": 6.497676142681988e-05, "loss": 0.0103, "step": 604450 }, { "epoch": 1.57, "learning_rate": 6.497287321044841e-05, "loss": 0.0063, "step": 604460 }, { "epoch": 1.57, "learning_rate": 6.496898499407695e-05, "loss": 0.0094, "step": 604470 }, { "epoch": 1.57, "learning_rate": 6.496509677770548e-05, "loss": 0.0092, "step": 604480 }, { "epoch": 1.57, "learning_rate": 6.496120856133402e-05, "loss": 0.0058, "step": 604490 }, { "epoch": 1.57, "learning_rate": 6.495732034496256e-05, "loss": 0.01, "step": 604500 }, { "epoch": 1.57, "learning_rate": 6.495343212859109e-05, "loss": 0.0087, "step": 604510 }, { "epoch": 1.57, "learning_rate": 6.494954391221962e-05, "loss": 0.0089, "step": 604520 }, { "epoch": 1.57, "learning_rate": 6.494565569584816e-05, "loss": 0.0108, "step": 604530 }, { "epoch": 1.57, "learning_rate": 6.494176747947669e-05, "loss": 0.0077, "step": 604540 }, { "epoch": 1.57, "learning_rate": 6.493787926310523e-05, "loss": 0.01, "step": 604550 }, { "epoch": 1.57, "learning_rate": 6.493399104673376e-05, "loss": 0.0098, "step": 604560 }, { "epoch": 1.57, "learning_rate": 6.49301028303623e-05, "loss": 0.0083, "step": 604570 }, { "epoch": 1.57, "learning_rate": 6.492621461399083e-05, "loss": 0.0095, "step": 604580 }, { "epoch": 1.57, "learning_rate": 6.492232639761937e-05, "loss": 0.0068, "step": 604590 }, { "epoch": 1.57, "learning_rate": 6.491843818124791e-05, "loss": 0.0123, "step": 604600 }, { "epoch": 1.57, "learning_rate": 6.491454996487644e-05, "loss": 0.0084, "step": 604610 }, { "epoch": 1.57, "learning_rate": 6.491066174850498e-05, "loss": 0.0064, "step": 604620 }, { "epoch": 1.57, "learning_rate": 6.490677353213351e-05, "loss": 0.0074, "step": 604630 }, { "epoch": 1.57, "learning_rate": 6.490288531576205e-05, "loss": 0.0075, "step": 604640 }, { "epoch": 1.57, "learning_rate": 6.489899709939058e-05, "loss": 0.0099, "step": 604650 }, { "epoch": 1.57, "learning_rate": 6.489510888301912e-05, "loss": 0.0072, "step": 604660 }, { "epoch": 1.57, "learning_rate": 6.489122066664765e-05, "loss": 0.0096, "step": 604670 }, { "epoch": 1.57, "learning_rate": 6.488733245027619e-05, "loss": 0.0082, "step": 604680 }, { "epoch": 1.57, "learning_rate": 6.488344423390473e-05, "loss": 0.0089, "step": 604690 }, { "epoch": 1.57, "learning_rate": 6.487955601753326e-05, "loss": 0.0087, "step": 604700 }, { "epoch": 1.57, "learning_rate": 6.48756678011618e-05, "loss": 0.0096, "step": 604710 }, { "epoch": 1.57, "learning_rate": 6.487177958479033e-05, "loss": 0.0085, "step": 604720 }, { "epoch": 1.57, "learning_rate": 6.486789136841887e-05, "loss": 0.0083, "step": 604730 }, { "epoch": 1.57, "learning_rate": 6.48640031520474e-05, "loss": 0.0089, "step": 604740 }, { "epoch": 1.57, "learning_rate": 6.486011493567594e-05, "loss": 0.0073, "step": 604750 }, { "epoch": 1.57, "learning_rate": 6.485622671930447e-05, "loss": 0.0088, "step": 604760 }, { "epoch": 1.57, "learning_rate": 6.4852338502933e-05, "loss": 0.0091, "step": 604770 }, { "epoch": 1.57, "learning_rate": 6.484845028656154e-05, "loss": 0.0067, "step": 604780 }, { "epoch": 1.57, "learning_rate": 6.484456207019008e-05, "loss": 0.0061, "step": 604790 }, { "epoch": 1.57, "learning_rate": 6.48406738538186e-05, "loss": 0.0115, "step": 604800 }, { "epoch": 1.57, "learning_rate": 6.483678563744715e-05, "loss": 0.0086, "step": 604810 }, { "epoch": 1.57, "learning_rate": 6.483289742107568e-05, "loss": 0.009, "step": 604820 }, { "epoch": 1.57, "learning_rate": 6.482900920470422e-05, "loss": 0.0137, "step": 604830 }, { "epoch": 1.57, "learning_rate": 6.482512098833275e-05, "loss": 0.0081, "step": 604840 }, { "epoch": 1.57, "learning_rate": 6.482123277196129e-05, "loss": 0.011, "step": 604850 }, { "epoch": 1.57, "learning_rate": 6.481734455558983e-05, "loss": 0.0094, "step": 604860 }, { "epoch": 1.57, "learning_rate": 6.481345633921836e-05, "loss": 0.0067, "step": 604870 }, { "epoch": 1.57, "learning_rate": 6.48095681228469e-05, "loss": 0.0082, "step": 604880 }, { "epoch": 1.57, "learning_rate": 6.480567990647543e-05, "loss": 0.0106, "step": 604890 }, { "epoch": 1.57, "learning_rate": 6.480179169010397e-05, "loss": 0.0076, "step": 604900 }, { "epoch": 1.57, "learning_rate": 6.47979034737325e-05, "loss": 0.0091, "step": 604910 }, { "epoch": 1.57, "learning_rate": 6.479401525736104e-05, "loss": 0.0078, "step": 604920 }, { "epoch": 1.57, "learning_rate": 6.479012704098957e-05, "loss": 0.0114, "step": 604930 }, { "epoch": 1.57, "learning_rate": 6.478623882461811e-05, "loss": 0.008, "step": 604940 }, { "epoch": 1.57, "learning_rate": 6.478235060824665e-05, "loss": 0.0084, "step": 604950 }, { "epoch": 1.57, "learning_rate": 6.477846239187518e-05, "loss": 0.0072, "step": 604960 }, { "epoch": 1.57, "learning_rate": 6.477457417550372e-05, "loss": 0.0094, "step": 604970 }, { "epoch": 1.57, "learning_rate": 6.477068595913225e-05, "loss": 0.008, "step": 604980 }, { "epoch": 1.57, "learning_rate": 6.476679774276079e-05, "loss": 0.0077, "step": 604990 }, { "epoch": 1.57, "learning_rate": 6.476290952638932e-05, "loss": 0.0078, "step": 605000 }, { "epoch": 1.57, "eval_cer": 0.8816830914060892, "eval_loss": 0.005784572102129459, "eval_runtime": 107.7017, "eval_samples_per_second": 18.57, "eval_steps_per_second": 4.642, "step": 605000 }, { "epoch": 1.57, "learning_rate": 6.475902131001785e-05, "loss": 0.0078, "step": 605010 }, { "epoch": 1.57, "learning_rate": 6.475513309364639e-05, "loss": 0.0067, "step": 605020 }, { "epoch": 1.57, "learning_rate": 6.475124487727491e-05, "loss": 0.007, "step": 605030 }, { "epoch": 1.57, "learning_rate": 6.474735666090346e-05, "loss": 0.009, "step": 605040 }, { "epoch": 1.57, "learning_rate": 6.4743468444532e-05, "loss": 0.0076, "step": 605050 }, { "epoch": 1.57, "learning_rate": 6.473958022816053e-05, "loss": 0.01, "step": 605060 }, { "epoch": 1.57, "learning_rate": 6.473569201178907e-05, "loss": 0.0085, "step": 605070 }, { "epoch": 1.57, "learning_rate": 6.47318037954176e-05, "loss": 0.0084, "step": 605080 }, { "epoch": 1.57, "learning_rate": 6.472791557904614e-05, "loss": 0.0078, "step": 605090 }, { "epoch": 1.57, "learning_rate": 6.472402736267467e-05, "loss": 0.0083, "step": 605100 }, { "epoch": 1.57, "learning_rate": 6.472013914630321e-05, "loss": 0.0079, "step": 605110 }, { "epoch": 1.57, "learning_rate": 6.471625092993175e-05, "loss": 0.0086, "step": 605120 }, { "epoch": 1.57, "learning_rate": 6.471236271356028e-05, "loss": 0.0067, "step": 605130 }, { "epoch": 1.57, "learning_rate": 6.470847449718882e-05, "loss": 0.0073, "step": 605140 }, { "epoch": 1.57, "learning_rate": 6.470458628081735e-05, "loss": 0.0085, "step": 605150 }, { "epoch": 1.57, "learning_rate": 6.470069806444589e-05, "loss": 0.0082, "step": 605160 }, { "epoch": 1.57, "learning_rate": 6.469680984807442e-05, "loss": 0.0125, "step": 605170 }, { "epoch": 1.57, "learning_rate": 6.469292163170296e-05, "loss": 0.009, "step": 605180 }, { "epoch": 1.57, "learning_rate": 6.468903341533149e-05, "loss": 0.0085, "step": 605190 }, { "epoch": 1.57, "learning_rate": 6.468514519896003e-05, "loss": 0.0081, "step": 605200 }, { "epoch": 1.57, "learning_rate": 6.468125698258857e-05, "loss": 0.0104, "step": 605210 }, { "epoch": 1.57, "learning_rate": 6.46773687662171e-05, "loss": 0.0112, "step": 605220 }, { "epoch": 1.57, "learning_rate": 6.467348054984564e-05, "loss": 0.009, "step": 605230 }, { "epoch": 1.57, "learning_rate": 6.466959233347417e-05, "loss": 0.0094, "step": 605240 }, { "epoch": 1.57, "learning_rate": 6.466570411710271e-05, "loss": 0.0083, "step": 605250 }, { "epoch": 1.57, "learning_rate": 6.466181590073124e-05, "loss": 0.0089, "step": 605260 }, { "epoch": 1.57, "learning_rate": 6.465792768435977e-05, "loss": 0.0104, "step": 605270 }, { "epoch": 1.57, "learning_rate": 6.465403946798831e-05, "loss": 0.0098, "step": 605280 }, { "epoch": 1.57, "learning_rate": 6.465015125161683e-05, "loss": 0.0129, "step": 605290 }, { "epoch": 1.57, "learning_rate": 6.464626303524538e-05, "loss": 0.0141, "step": 605300 }, { "epoch": 1.57, "learning_rate": 6.464237481887392e-05, "loss": 0.0125, "step": 605310 }, { "epoch": 1.57, "learning_rate": 6.463848660250245e-05, "loss": 0.0098, "step": 605320 }, { "epoch": 1.57, "learning_rate": 6.463459838613099e-05, "loss": 0.0082, "step": 605330 }, { "epoch": 1.57, "learning_rate": 6.463071016975952e-05, "loss": 0.0075, "step": 605340 }, { "epoch": 1.57, "learning_rate": 6.462682195338806e-05, "loss": 0.0107, "step": 605350 }, { "epoch": 1.57, "learning_rate": 6.462293373701659e-05, "loss": 0.009, "step": 605360 }, { "epoch": 1.57, "learning_rate": 6.461904552064513e-05, "loss": 0.0107, "step": 605370 }, { "epoch": 1.57, "learning_rate": 6.461515730427367e-05, "loss": 0.0097, "step": 605380 }, { "epoch": 1.57, "learning_rate": 6.46112690879022e-05, "loss": 0.0064, "step": 605390 }, { "epoch": 1.57, "learning_rate": 6.460738087153074e-05, "loss": 0.0078, "step": 605400 }, { "epoch": 1.57, "learning_rate": 6.460349265515927e-05, "loss": 0.0075, "step": 605410 }, { "epoch": 1.57, "learning_rate": 6.459960443878781e-05, "loss": 0.0063, "step": 605420 }, { "epoch": 1.57, "learning_rate": 6.459571622241634e-05, "loss": 0.0074, "step": 605430 }, { "epoch": 1.57, "learning_rate": 6.459182800604488e-05, "loss": 0.0067, "step": 605440 }, { "epoch": 1.57, "learning_rate": 6.45879397896734e-05, "loss": 0.0059, "step": 605450 }, { "epoch": 1.57, "learning_rate": 6.458405157330195e-05, "loss": 0.0086, "step": 605460 }, { "epoch": 1.57, "learning_rate": 6.458016335693049e-05, "loss": 0.0071, "step": 605470 }, { "epoch": 1.57, "learning_rate": 6.457627514055902e-05, "loss": 0.0095, "step": 605480 }, { "epoch": 1.57, "learning_rate": 6.457238692418756e-05, "loss": 0.0079, "step": 605490 }, { "epoch": 1.57, "learning_rate": 6.456849870781609e-05, "loss": 0.0077, "step": 605500 }, { "epoch": 1.57, "learning_rate": 6.456461049144462e-05, "loss": 0.0108, "step": 605510 }, { "epoch": 1.57, "learning_rate": 6.456072227507316e-05, "loss": 0.0084, "step": 605520 }, { "epoch": 1.57, "learning_rate": 6.455683405870169e-05, "loss": 0.0071, "step": 605530 }, { "epoch": 1.57, "learning_rate": 6.455294584233023e-05, "loss": 0.0067, "step": 605540 }, { "epoch": 1.57, "learning_rate": 6.454905762595875e-05, "loss": 0.0092, "step": 605550 }, { "epoch": 1.57, "learning_rate": 6.45451694095873e-05, "loss": 0.0092, "step": 605560 }, { "epoch": 1.57, "learning_rate": 6.454128119321584e-05, "loss": 0.0067, "step": 605570 }, { "epoch": 1.57, "learning_rate": 6.453739297684437e-05, "loss": 0.0087, "step": 605580 }, { "epoch": 1.57, "learning_rate": 6.453350476047291e-05, "loss": 0.0061, "step": 605590 }, { "epoch": 1.57, "learning_rate": 6.452961654410144e-05, "loss": 0.0069, "step": 605600 }, { "epoch": 1.57, "learning_rate": 6.452572832772998e-05, "loss": 0.0095, "step": 605610 }, { "epoch": 1.57, "learning_rate": 6.45218401113585e-05, "loss": 0.0079, "step": 605620 }, { "epoch": 1.57, "learning_rate": 6.451795189498705e-05, "loss": 0.0102, "step": 605630 }, { "epoch": 1.57, "learning_rate": 6.451406367861559e-05, "loss": 0.0091, "step": 605640 }, { "epoch": 1.57, "learning_rate": 6.451017546224412e-05, "loss": 0.0077, "step": 605650 }, { "epoch": 1.57, "learning_rate": 6.450628724587266e-05, "loss": 0.0062, "step": 605660 }, { "epoch": 1.57, "learning_rate": 6.450239902950119e-05, "loss": 0.0074, "step": 605670 }, { "epoch": 1.57, "learning_rate": 6.449851081312973e-05, "loss": 0.0054, "step": 605680 }, { "epoch": 1.57, "learning_rate": 6.449462259675826e-05, "loss": 0.0062, "step": 605690 }, { "epoch": 1.57, "learning_rate": 6.44907343803868e-05, "loss": 0.0061, "step": 605700 }, { "epoch": 1.57, "learning_rate": 6.448684616401533e-05, "loss": 0.0076, "step": 605710 }, { "epoch": 1.57, "learning_rate": 6.448295794764387e-05, "loss": 0.0095, "step": 605720 }, { "epoch": 1.57, "learning_rate": 6.447906973127241e-05, "loss": 0.0094, "step": 605730 }, { "epoch": 1.57, "learning_rate": 6.447518151490094e-05, "loss": 0.0061, "step": 605740 }, { "epoch": 1.57, "learning_rate": 6.447129329852948e-05, "loss": 0.0073, "step": 605750 }, { "epoch": 1.57, "learning_rate": 6.446740508215801e-05, "loss": 0.0101, "step": 605760 }, { "epoch": 1.57, "learning_rate": 6.446351686578654e-05, "loss": 0.0081, "step": 605770 }, { "epoch": 1.57, "learning_rate": 6.445962864941508e-05, "loss": 0.0133, "step": 605780 }, { "epoch": 1.57, "learning_rate": 6.44557404330436e-05, "loss": 0.0083, "step": 605790 }, { "epoch": 1.57, "learning_rate": 6.445185221667215e-05, "loss": 0.0091, "step": 605800 }, { "epoch": 1.57, "learning_rate": 6.444796400030067e-05, "loss": 0.0079, "step": 605810 }, { "epoch": 1.57, "learning_rate": 6.444407578392922e-05, "loss": 0.0078, "step": 605820 }, { "epoch": 1.57, "learning_rate": 6.444018756755776e-05, "loss": 0.0076, "step": 605830 }, { "epoch": 1.57, "learning_rate": 6.443629935118629e-05, "loss": 0.0098, "step": 605840 }, { "epoch": 1.57, "learning_rate": 6.443241113481483e-05, "loss": 0.0159, "step": 605850 }, { "epoch": 1.57, "learning_rate": 6.442852291844336e-05, "loss": 0.0102, "step": 605860 }, { "epoch": 1.57, "learning_rate": 6.44246347020719e-05, "loss": 0.0093, "step": 605870 }, { "epoch": 1.57, "learning_rate": 6.442074648570043e-05, "loss": 0.0074, "step": 605880 }, { "epoch": 1.57, "learning_rate": 6.441685826932897e-05, "loss": 0.0086, "step": 605890 }, { "epoch": 1.57, "learning_rate": 6.441297005295751e-05, "loss": 0.0106, "step": 605900 }, { "epoch": 1.57, "learning_rate": 6.440908183658604e-05, "loss": 0.0108, "step": 605910 }, { "epoch": 1.57, "learning_rate": 6.440519362021458e-05, "loss": 0.0086, "step": 605920 }, { "epoch": 1.57, "learning_rate": 6.44013054038431e-05, "loss": 0.0082, "step": 605930 }, { "epoch": 1.57, "learning_rate": 6.439741718747165e-05, "loss": 0.0092, "step": 605940 }, { "epoch": 1.57, "learning_rate": 6.439352897110018e-05, "loss": 0.0116, "step": 605950 }, { "epoch": 1.57, "learning_rate": 6.438964075472872e-05, "loss": 0.0117, "step": 605960 }, { "epoch": 1.57, "learning_rate": 6.438575253835725e-05, "loss": 0.008, "step": 605970 }, { "epoch": 1.57, "learning_rate": 6.438186432198579e-05, "loss": 0.0118, "step": 605980 }, { "epoch": 1.57, "learning_rate": 6.437797610561433e-05, "loss": 0.0124, "step": 605990 }, { "epoch": 1.57, "learning_rate": 6.437408788924286e-05, "loss": 0.0088, "step": 606000 }, { "epoch": 1.57, "eval_cer": 0.8817124837817071, "eval_loss": 0.005717435386031866, "eval_runtime": 107.7826, "eval_samples_per_second": 18.556, "eval_steps_per_second": 4.639, "step": 606000 }, { "epoch": 1.57, "learning_rate": 6.437019967287139e-05, "loss": 0.0095, "step": 606010 }, { "epoch": 1.57, "learning_rate": 6.436631145649993e-05, "loss": 0.0098, "step": 606020 }, { "epoch": 1.57, "learning_rate": 6.436242324012846e-05, "loss": 0.0092, "step": 606030 }, { "epoch": 1.57, "learning_rate": 6.4358535023757e-05, "loss": 0.0089, "step": 606040 }, { "epoch": 1.57, "learning_rate": 6.435464680738553e-05, "loss": 0.01, "step": 606050 }, { "epoch": 1.57, "learning_rate": 6.435075859101407e-05, "loss": 0.0067, "step": 606060 }, { "epoch": 1.57, "learning_rate": 6.43468703746426e-05, "loss": 0.0085, "step": 606070 }, { "epoch": 1.57, "learning_rate": 6.434298215827114e-05, "loss": 0.0066, "step": 606080 }, { "epoch": 1.57, "learning_rate": 6.433909394189968e-05, "loss": 0.0086, "step": 606090 }, { "epoch": 1.57, "learning_rate": 6.43352057255282e-05, "loss": 0.0092, "step": 606100 }, { "epoch": 1.57, "learning_rate": 6.433131750915675e-05, "loss": 0.0096, "step": 606110 }, { "epoch": 1.57, "learning_rate": 6.432742929278528e-05, "loss": 0.0081, "step": 606120 }, { "epoch": 1.57, "learning_rate": 6.432354107641382e-05, "loss": 0.0097, "step": 606130 }, { "epoch": 1.57, "learning_rate": 6.431965286004235e-05, "loss": 0.0066, "step": 606140 }, { "epoch": 1.57, "learning_rate": 6.431576464367089e-05, "loss": 0.011, "step": 606150 }, { "epoch": 1.57, "learning_rate": 6.431187642729942e-05, "loss": 0.0066, "step": 606160 }, { "epoch": 1.57, "learning_rate": 6.430798821092796e-05, "loss": 0.0097, "step": 606170 }, { "epoch": 1.57, "learning_rate": 6.43040999945565e-05, "loss": 0.0073, "step": 606180 }, { "epoch": 1.57, "learning_rate": 6.430021177818503e-05, "loss": 0.0103, "step": 606190 }, { "epoch": 1.57, "learning_rate": 6.429632356181357e-05, "loss": 0.0079, "step": 606200 }, { "epoch": 1.57, "learning_rate": 6.42924353454421e-05, "loss": 0.0087, "step": 606210 }, { "epoch": 1.57, "learning_rate": 6.428854712907064e-05, "loss": 0.0102, "step": 606220 }, { "epoch": 1.57, "learning_rate": 6.428465891269917e-05, "loss": 0.0059, "step": 606230 }, { "epoch": 1.57, "learning_rate": 6.428077069632771e-05, "loss": 0.0071, "step": 606240 }, { "epoch": 1.57, "learning_rate": 6.427688247995624e-05, "loss": 0.0075, "step": 606250 }, { "epoch": 1.57, "learning_rate": 6.427299426358476e-05, "loss": 0.0086, "step": 606260 }, { "epoch": 1.57, "learning_rate": 6.42691060472133e-05, "loss": 0.0089, "step": 606270 }, { "epoch": 1.57, "learning_rate": 6.426521783084185e-05, "loss": 0.0061, "step": 606280 }, { "epoch": 1.57, "learning_rate": 6.426132961447038e-05, "loss": 0.0081, "step": 606290 }, { "epoch": 1.57, "learning_rate": 6.425744139809892e-05, "loss": 0.0093, "step": 606300 }, { "epoch": 1.57, "learning_rate": 6.425355318172744e-05, "loss": 0.0096, "step": 606310 }, { "epoch": 1.57, "learning_rate": 6.424966496535599e-05, "loss": 0.0099, "step": 606320 }, { "epoch": 1.57, "learning_rate": 6.424577674898451e-05, "loss": 0.0082, "step": 606330 }, { "epoch": 1.57, "learning_rate": 6.424188853261306e-05, "loss": 0.0069, "step": 606340 }, { "epoch": 1.57, "learning_rate": 6.42380003162416e-05, "loss": 0.0077, "step": 606350 }, { "epoch": 1.57, "learning_rate": 6.423411209987013e-05, "loss": 0.01, "step": 606360 }, { "epoch": 1.57, "learning_rate": 6.423022388349867e-05, "loss": 0.0076, "step": 606370 }, { "epoch": 1.57, "learning_rate": 6.42263356671272e-05, "loss": 0.0077, "step": 606380 }, { "epoch": 1.57, "learning_rate": 6.422244745075574e-05, "loss": 0.0088, "step": 606390 }, { "epoch": 1.57, "learning_rate": 6.421855923438427e-05, "loss": 0.0103, "step": 606400 }, { "epoch": 1.57, "learning_rate": 6.421467101801281e-05, "loss": 0.0085, "step": 606410 }, { "epoch": 1.57, "learning_rate": 6.421078280164134e-05, "loss": 0.0108, "step": 606420 }, { "epoch": 1.57, "learning_rate": 6.420689458526988e-05, "loss": 0.0055, "step": 606430 }, { "epoch": 1.57, "learning_rate": 6.420300636889842e-05, "loss": 0.0097, "step": 606440 }, { "epoch": 1.57, "learning_rate": 6.419911815252695e-05, "loss": 0.0083, "step": 606450 }, { "epoch": 1.57, "learning_rate": 6.419522993615549e-05, "loss": 0.0073, "step": 606460 }, { "epoch": 1.57, "learning_rate": 6.419134171978402e-05, "loss": 0.0103, "step": 606470 }, { "epoch": 1.57, "learning_rate": 6.418745350341256e-05, "loss": 0.0075, "step": 606480 }, { "epoch": 1.57, "learning_rate": 6.418356528704109e-05, "loss": 0.0084, "step": 606490 }, { "epoch": 1.57, "learning_rate": 6.417967707066961e-05, "loss": 0.0083, "step": 606500 }, { "epoch": 1.57, "learning_rate": 6.417578885429816e-05, "loss": 0.0073, "step": 606510 }, { "epoch": 1.57, "learning_rate": 6.417190063792668e-05, "loss": 0.0129, "step": 606520 }, { "epoch": 1.57, "learning_rate": 6.416801242155523e-05, "loss": 0.0072, "step": 606530 }, { "epoch": 1.57, "learning_rate": 6.416412420518377e-05, "loss": 0.0082, "step": 606540 }, { "epoch": 1.57, "learning_rate": 6.41602359888123e-05, "loss": 0.009, "step": 606550 }, { "epoch": 1.57, "learning_rate": 6.415634777244084e-05, "loss": 0.0065, "step": 606560 }, { "epoch": 1.57, "learning_rate": 6.415245955606936e-05, "loss": 0.0121, "step": 606570 }, { "epoch": 1.57, "learning_rate": 6.41485713396979e-05, "loss": 0.0091, "step": 606580 }, { "epoch": 1.57, "learning_rate": 6.414468312332643e-05, "loss": 0.0092, "step": 606590 }, { "epoch": 1.57, "learning_rate": 6.414079490695498e-05, "loss": 0.009, "step": 606600 }, { "epoch": 1.57, "learning_rate": 6.413690669058352e-05, "loss": 0.0097, "step": 606610 }, { "epoch": 1.57, "learning_rate": 6.413301847421205e-05, "loss": 0.0162, "step": 606620 }, { "epoch": 1.57, "learning_rate": 6.412913025784059e-05, "loss": 0.0067, "step": 606630 }, { "epoch": 1.57, "learning_rate": 6.412524204146912e-05, "loss": 0.0081, "step": 606640 }, { "epoch": 1.57, "learning_rate": 6.412135382509766e-05, "loss": 0.0074, "step": 606650 }, { "epoch": 1.57, "learning_rate": 6.411746560872619e-05, "loss": 0.011, "step": 606660 }, { "epoch": 1.57, "learning_rate": 6.411357739235473e-05, "loss": 0.0106, "step": 606670 }, { "epoch": 1.57, "learning_rate": 6.410968917598326e-05, "loss": 0.0088, "step": 606680 }, { "epoch": 1.57, "learning_rate": 6.41058009596118e-05, "loss": 0.0097, "step": 606690 }, { "epoch": 1.57, "learning_rate": 6.410191274324034e-05, "loss": 0.0089, "step": 606700 }, { "epoch": 1.57, "learning_rate": 6.409802452686887e-05, "loss": 0.0089, "step": 606710 }, { "epoch": 1.57, "learning_rate": 6.409413631049741e-05, "loss": 0.0081, "step": 606720 }, { "epoch": 1.57, "learning_rate": 6.409024809412594e-05, "loss": 0.0072, "step": 606730 }, { "epoch": 1.57, "learning_rate": 6.408635987775448e-05, "loss": 0.0108, "step": 606740 }, { "epoch": 1.57, "learning_rate": 6.4082471661383e-05, "loss": 0.0078, "step": 606750 }, { "epoch": 1.57, "learning_rate": 6.407858344501153e-05, "loss": 0.0079, "step": 606760 }, { "epoch": 1.57, "learning_rate": 6.407469522864008e-05, "loss": 0.0107, "step": 606770 }, { "epoch": 1.57, "learning_rate": 6.40708070122686e-05, "loss": 0.0111, "step": 606780 }, { "epoch": 1.57, "learning_rate": 6.406691879589715e-05, "loss": 0.008, "step": 606790 }, { "epoch": 1.57, "learning_rate": 6.406303057952569e-05, "loss": 0.0095, "step": 606800 }, { "epoch": 1.57, "learning_rate": 6.405914236315422e-05, "loss": 0.008, "step": 606810 }, { "epoch": 1.57, "learning_rate": 6.405525414678276e-05, "loss": 0.0088, "step": 606820 }, { "epoch": 1.57, "learning_rate": 6.405136593041128e-05, "loss": 0.0105, "step": 606830 }, { "epoch": 1.57, "learning_rate": 6.404747771403983e-05, "loss": 0.0061, "step": 606840 }, { "epoch": 1.57, "learning_rate": 6.404358949766835e-05, "loss": 0.0109, "step": 606850 }, { "epoch": 1.57, "learning_rate": 6.40397012812969e-05, "loss": 0.0089, "step": 606860 }, { "epoch": 1.57, "learning_rate": 6.403581306492544e-05, "loss": 0.0093, "step": 606870 }, { "epoch": 1.57, "learning_rate": 6.403192484855397e-05, "loss": 0.011, "step": 606880 }, { "epoch": 1.57, "learning_rate": 6.402803663218251e-05, "loss": 0.0101, "step": 606890 }, { "epoch": 1.57, "learning_rate": 6.402414841581104e-05, "loss": 0.0097, "step": 606900 }, { "epoch": 1.57, "learning_rate": 6.402026019943958e-05, "loss": 0.0097, "step": 606910 }, { "epoch": 1.57, "learning_rate": 6.40163719830681e-05, "loss": 0.0096, "step": 606920 }, { "epoch": 1.57, "learning_rate": 6.401248376669665e-05, "loss": 0.0086, "step": 606930 }, { "epoch": 1.57, "learning_rate": 6.400859555032518e-05, "loss": 0.0077, "step": 606940 }, { "epoch": 1.57, "learning_rate": 6.400470733395372e-05, "loss": 0.01, "step": 606950 }, { "epoch": 1.57, "learning_rate": 6.400081911758226e-05, "loss": 0.0292, "step": 606960 }, { "epoch": 1.57, "learning_rate": 6.399693090121079e-05, "loss": 0.0104, "step": 606970 }, { "epoch": 1.57, "learning_rate": 6.399304268483933e-05, "loss": 0.0074, "step": 606980 }, { "epoch": 1.57, "learning_rate": 6.398915446846786e-05, "loss": 0.0117, "step": 606990 }, { "epoch": 1.57, "learning_rate": 6.398526625209638e-05, "loss": 0.0089, "step": 607000 }, { "epoch": 1.57, "eval_cer": 0.8816746935844841, "eval_loss": 0.00562703050673008, "eval_runtime": 107.9194, "eval_samples_per_second": 18.532, "eval_steps_per_second": 4.633, "step": 607000 }, { "epoch": 1.57, "learning_rate": 6.398137803572493e-05, "loss": 0.0116, "step": 607010 }, { "epoch": 1.57, "learning_rate": 6.397748981935345e-05, "loss": 0.0076, "step": 607020 }, { "epoch": 1.57, "learning_rate": 6.3973601602982e-05, "loss": 0.0134, "step": 607030 }, { "epoch": 1.57, "learning_rate": 6.396971338661052e-05, "loss": 0.0097, "step": 607040 }, { "epoch": 1.57, "learning_rate": 6.396582517023907e-05, "loss": 0.0113, "step": 607050 }, { "epoch": 1.57, "learning_rate": 6.396193695386761e-05, "loss": 0.0079, "step": 607060 }, { "epoch": 1.57, "learning_rate": 6.395804873749614e-05, "loss": 0.0114, "step": 607070 }, { "epoch": 1.57, "learning_rate": 6.395416052112468e-05, "loss": 0.0079, "step": 607080 }, { "epoch": 1.57, "learning_rate": 6.39502723047532e-05, "loss": 0.0101, "step": 607090 }, { "epoch": 1.57, "learning_rate": 6.394638408838175e-05, "loss": 0.0067, "step": 607100 }, { "epoch": 1.57, "learning_rate": 6.394249587201027e-05, "loss": 0.0082, "step": 607110 }, { "epoch": 1.57, "learning_rate": 6.393860765563882e-05, "loss": 0.0103, "step": 607120 }, { "epoch": 1.57, "learning_rate": 6.393471943926736e-05, "loss": 0.0074, "step": 607130 }, { "epoch": 1.57, "learning_rate": 6.393083122289589e-05, "loss": 0.0105, "step": 607140 }, { "epoch": 1.57, "learning_rate": 6.392694300652443e-05, "loss": 0.0072, "step": 607150 }, { "epoch": 1.57, "learning_rate": 6.392305479015296e-05, "loss": 0.008, "step": 607160 }, { "epoch": 1.57, "learning_rate": 6.39191665737815e-05, "loss": 0.0087, "step": 607170 }, { "epoch": 1.57, "learning_rate": 6.391527835741003e-05, "loss": 0.0067, "step": 607180 }, { "epoch": 1.57, "learning_rate": 6.391139014103857e-05, "loss": 0.008, "step": 607190 }, { "epoch": 1.57, "learning_rate": 6.39075019246671e-05, "loss": 0.0083, "step": 607200 }, { "epoch": 1.57, "learning_rate": 6.390361370829564e-05, "loss": 0.0104, "step": 607210 }, { "epoch": 1.57, "learning_rate": 6.389972549192418e-05, "loss": 0.0082, "step": 607220 }, { "epoch": 1.57, "learning_rate": 6.38958372755527e-05, "loss": 0.0093, "step": 607230 }, { "epoch": 1.57, "learning_rate": 6.389194905918125e-05, "loss": 0.0092, "step": 607240 }, { "epoch": 1.57, "learning_rate": 6.388806084280978e-05, "loss": 0.0085, "step": 607250 }, { "epoch": 1.57, "learning_rate": 6.38841726264383e-05, "loss": 0.0104, "step": 607260 }, { "epoch": 1.57, "learning_rate": 6.388028441006685e-05, "loss": 0.0073, "step": 607270 }, { "epoch": 1.57, "learning_rate": 6.387639619369537e-05, "loss": 0.0078, "step": 607280 }, { "epoch": 1.57, "learning_rate": 6.387250797732392e-05, "loss": 0.0078, "step": 607290 }, { "epoch": 1.57, "learning_rate": 6.386861976095244e-05, "loss": 0.0093, "step": 607300 }, { "epoch": 1.57, "learning_rate": 6.386473154458099e-05, "loss": 0.0088, "step": 607310 }, { "epoch": 1.57, "learning_rate": 6.386084332820953e-05, "loss": 0.0074, "step": 607320 }, { "epoch": 1.57, "learning_rate": 6.385695511183806e-05, "loss": 0.009, "step": 607330 }, { "epoch": 1.57, "learning_rate": 6.38530668954666e-05, "loss": 0.0093, "step": 607340 }, { "epoch": 1.57, "learning_rate": 6.384917867909512e-05, "loss": 0.0075, "step": 607350 }, { "epoch": 1.57, "learning_rate": 6.384529046272367e-05, "loss": 0.0088, "step": 607360 }, { "epoch": 1.57, "learning_rate": 6.38414022463522e-05, "loss": 0.0109, "step": 607370 }, { "epoch": 1.57, "learning_rate": 6.383751402998074e-05, "loss": 0.0113, "step": 607380 }, { "epoch": 1.57, "learning_rate": 6.383362581360926e-05, "loss": 0.008, "step": 607390 }, { "epoch": 1.57, "learning_rate": 6.38297375972378e-05, "loss": 0.0072, "step": 607400 }, { "epoch": 1.57, "learning_rate": 6.382584938086635e-05, "loss": 0.0079, "step": 607410 }, { "epoch": 1.57, "learning_rate": 6.382196116449488e-05, "loss": 0.0074, "step": 607420 }, { "epoch": 1.57, "learning_rate": 6.381807294812342e-05, "loss": 0.0095, "step": 607430 }, { "epoch": 1.57, "learning_rate": 6.381418473175195e-05, "loss": 0.01, "step": 607440 }, { "epoch": 1.57, "learning_rate": 6.381029651538049e-05, "loss": 0.0077, "step": 607450 }, { "epoch": 1.57, "learning_rate": 6.380640829900902e-05, "loss": 0.0067, "step": 607460 }, { "epoch": 1.57, "learning_rate": 6.380252008263756e-05, "loss": 0.0076, "step": 607470 }, { "epoch": 1.57, "learning_rate": 6.37986318662661e-05, "loss": 0.0075, "step": 607480 }, { "epoch": 1.57, "learning_rate": 6.379474364989461e-05, "loss": 0.0074, "step": 607490 }, { "epoch": 1.57, "learning_rate": 6.379085543352315e-05, "loss": 0.007, "step": 607500 }, { "epoch": 1.57, "learning_rate": 6.37869672171517e-05, "loss": 0.0075, "step": 607510 }, { "epoch": 1.57, "learning_rate": 6.378307900078022e-05, "loss": 0.0108, "step": 607520 }, { "epoch": 1.57, "learning_rate": 6.377919078440877e-05, "loss": 0.0067, "step": 607530 }, { "epoch": 1.57, "learning_rate": 6.37753025680373e-05, "loss": 0.01, "step": 607540 }, { "epoch": 1.57, "learning_rate": 6.377141435166584e-05, "loss": 0.0115, "step": 607550 }, { "epoch": 1.57, "learning_rate": 6.376752613529436e-05, "loss": 0.0072, "step": 607560 }, { "epoch": 1.57, "learning_rate": 6.37636379189229e-05, "loss": 0.0065, "step": 607570 }, { "epoch": 1.57, "learning_rate": 6.375974970255145e-05, "loss": 0.011, "step": 607580 }, { "epoch": 1.57, "learning_rate": 6.375586148617998e-05, "loss": 0.0087, "step": 607590 }, { "epoch": 1.57, "learning_rate": 6.375197326980852e-05, "loss": 0.0091, "step": 607600 }, { "epoch": 1.58, "learning_rate": 6.374808505343704e-05, "loss": 0.0111, "step": 607610 }, { "epoch": 1.58, "learning_rate": 6.374419683706559e-05, "loss": 0.0079, "step": 607620 }, { "epoch": 1.58, "learning_rate": 6.374030862069411e-05, "loss": 0.0089, "step": 607630 }, { "epoch": 1.58, "learning_rate": 6.373642040432266e-05, "loss": 0.0104, "step": 607640 }, { "epoch": 1.58, "learning_rate": 6.373253218795118e-05, "loss": 0.0083, "step": 607650 }, { "epoch": 1.58, "learning_rate": 6.372864397157973e-05, "loss": 0.0099, "step": 607660 }, { "epoch": 1.58, "learning_rate": 6.372475575520827e-05, "loss": 0.0081, "step": 607670 }, { "epoch": 1.58, "learning_rate": 6.37208675388368e-05, "loss": 0.0065, "step": 607680 }, { "epoch": 1.58, "learning_rate": 6.371697932246534e-05, "loss": 0.0099, "step": 607690 }, { "epoch": 1.58, "learning_rate": 6.371309110609387e-05, "loss": 0.0094, "step": 607700 }, { "epoch": 1.58, "learning_rate": 6.370920288972241e-05, "loss": 0.0085, "step": 607710 }, { "epoch": 1.58, "learning_rate": 6.370531467335093e-05, "loss": 0.0085, "step": 607720 }, { "epoch": 1.58, "learning_rate": 6.370142645697948e-05, "loss": 0.0126, "step": 607730 }, { "epoch": 1.58, "learning_rate": 6.3697538240608e-05, "loss": 0.0096, "step": 607740 }, { "epoch": 1.58, "learning_rate": 6.369365002423653e-05, "loss": 0.0065, "step": 607750 }, { "epoch": 1.58, "learning_rate": 6.368976180786507e-05, "loss": 0.007, "step": 607760 }, { "epoch": 1.58, "learning_rate": 6.368587359149362e-05, "loss": 0.0064, "step": 607770 }, { "epoch": 1.58, "learning_rate": 6.368198537512214e-05, "loss": 0.0093, "step": 607780 }, { "epoch": 1.58, "learning_rate": 6.367809715875069e-05, "loss": 0.0093, "step": 607790 }, { "epoch": 1.58, "learning_rate": 6.367420894237921e-05, "loss": 0.0072, "step": 607800 }, { "epoch": 1.58, "learning_rate": 6.367032072600776e-05, "loss": 0.0105, "step": 607810 }, { "epoch": 1.58, "learning_rate": 6.366643250963628e-05, "loss": 0.0072, "step": 607820 }, { "epoch": 1.58, "learning_rate": 6.366254429326483e-05, "loss": 0.0067, "step": 607830 }, { "epoch": 1.58, "learning_rate": 6.365865607689337e-05, "loss": 0.0075, "step": 607840 }, { "epoch": 1.58, "learning_rate": 6.36547678605219e-05, "loss": 0.0075, "step": 607850 }, { "epoch": 1.58, "learning_rate": 6.365087964415044e-05, "loss": 0.0102, "step": 607860 }, { "epoch": 1.58, "learning_rate": 6.364699142777896e-05, "loss": 0.0088, "step": 607870 }, { "epoch": 1.58, "learning_rate": 6.36431032114075e-05, "loss": 0.0076, "step": 607880 }, { "epoch": 1.58, "learning_rate": 6.363921499503603e-05, "loss": 0.0075, "step": 607890 }, { "epoch": 1.58, "learning_rate": 6.363532677866458e-05, "loss": 0.0095, "step": 607900 }, { "epoch": 1.58, "learning_rate": 6.36314385622931e-05, "loss": 0.0078, "step": 607910 }, { "epoch": 1.58, "learning_rate": 6.362755034592165e-05, "loss": 0.0077, "step": 607920 }, { "epoch": 1.58, "learning_rate": 6.362366212955019e-05, "loss": 0.0079, "step": 607930 }, { "epoch": 1.58, "learning_rate": 6.361977391317872e-05, "loss": 0.0069, "step": 607940 }, { "epoch": 1.58, "learning_rate": 6.361588569680726e-05, "loss": 0.0073, "step": 607950 }, { "epoch": 1.58, "learning_rate": 6.361199748043579e-05, "loss": 0.0083, "step": 607960 }, { "epoch": 1.58, "learning_rate": 6.360810926406433e-05, "loss": 0.011, "step": 607970 }, { "epoch": 1.58, "learning_rate": 6.360422104769285e-05, "loss": 0.0072, "step": 607980 }, { "epoch": 1.58, "learning_rate": 6.360033283132138e-05, "loss": 0.0073, "step": 607990 }, { "epoch": 1.58, "learning_rate": 6.359644461494992e-05, "loss": 0.0085, "step": 608000 }, { "epoch": 1.58, "eval_cer": 0.8816942885015627, "eval_loss": 0.00566211948171258, "eval_runtime": 107.9004, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 608000 }, { "epoch": 1.58, "learning_rate": 6.359255639857845e-05, "loss": 0.0093, "step": 608010 }, { "epoch": 1.58, "learning_rate": 6.3588668182207e-05, "loss": 0.0104, "step": 608020 }, { "epoch": 1.58, "learning_rate": 6.358477996583554e-05, "loss": 0.0075, "step": 608030 }, { "epoch": 1.58, "learning_rate": 6.358089174946406e-05, "loss": 0.0093, "step": 608040 }, { "epoch": 1.58, "learning_rate": 6.35770035330926e-05, "loss": 0.0088, "step": 608050 }, { "epoch": 1.58, "learning_rate": 6.357311531672113e-05, "loss": 0.0116, "step": 608060 }, { "epoch": 1.58, "learning_rate": 6.356922710034968e-05, "loss": 0.0075, "step": 608070 }, { "epoch": 1.58, "learning_rate": 6.35653388839782e-05, "loss": 0.0087, "step": 608080 }, { "epoch": 1.58, "learning_rate": 6.356145066760675e-05, "loss": 0.0078, "step": 608090 }, { "epoch": 1.58, "learning_rate": 6.355756245123529e-05, "loss": 0.0079, "step": 608100 }, { "epoch": 1.58, "learning_rate": 6.355367423486381e-05, "loss": 0.0094, "step": 608110 }, { "epoch": 1.58, "learning_rate": 6.354978601849236e-05, "loss": 0.0062, "step": 608120 }, { "epoch": 1.58, "learning_rate": 6.354589780212088e-05, "loss": 0.0075, "step": 608130 }, { "epoch": 1.58, "learning_rate": 6.354200958574943e-05, "loss": 0.0066, "step": 608140 }, { "epoch": 1.58, "learning_rate": 6.353812136937795e-05, "loss": 0.0077, "step": 608150 }, { "epoch": 1.58, "learning_rate": 6.35342331530065e-05, "loss": 0.0084, "step": 608160 }, { "epoch": 1.58, "learning_rate": 6.353034493663502e-05, "loss": 0.0091, "step": 608170 }, { "epoch": 1.58, "learning_rate": 6.352645672026357e-05, "loss": 0.0101, "step": 608180 }, { "epoch": 1.58, "learning_rate": 6.352256850389211e-05, "loss": 0.008, "step": 608190 }, { "epoch": 1.58, "learning_rate": 6.351868028752064e-05, "loss": 0.0082, "step": 608200 }, { "epoch": 1.58, "learning_rate": 6.351479207114918e-05, "loss": 0.0056, "step": 608210 }, { "epoch": 1.58, "learning_rate": 6.35109038547777e-05, "loss": 0.0082, "step": 608220 }, { "epoch": 1.58, "learning_rate": 6.350701563840625e-05, "loss": 0.0096, "step": 608230 }, { "epoch": 1.58, "learning_rate": 6.350312742203477e-05, "loss": 0.0103, "step": 608240 }, { "epoch": 1.58, "learning_rate": 6.34992392056633e-05, "loss": 0.0067, "step": 608250 }, { "epoch": 1.58, "learning_rate": 6.349535098929184e-05, "loss": 0.0069, "step": 608260 }, { "epoch": 1.58, "learning_rate": 6.349146277292037e-05, "loss": 0.0072, "step": 608270 }, { "epoch": 1.58, "learning_rate": 6.348757455654891e-05, "loss": 0.0074, "step": 608280 }, { "epoch": 1.58, "learning_rate": 6.348368634017746e-05, "loss": 0.0101, "step": 608290 }, { "epoch": 1.58, "learning_rate": 6.347979812380598e-05, "loss": 0.0082, "step": 608300 }, { "epoch": 1.58, "learning_rate": 6.347590990743453e-05, "loss": 0.0149, "step": 608310 }, { "epoch": 1.58, "learning_rate": 6.347202169106305e-05, "loss": 0.0079, "step": 608320 }, { "epoch": 1.58, "learning_rate": 6.34681334746916e-05, "loss": 0.0097, "step": 608330 }, { "epoch": 1.58, "learning_rate": 6.346424525832012e-05, "loss": 0.0074, "step": 608340 }, { "epoch": 1.58, "learning_rate": 6.346035704194867e-05, "loss": 0.008, "step": 608350 }, { "epoch": 1.58, "learning_rate": 6.345646882557721e-05, "loss": 0.0067, "step": 608360 }, { "epoch": 1.58, "learning_rate": 6.345258060920573e-05, "loss": 0.0087, "step": 608370 }, { "epoch": 1.58, "learning_rate": 6.344869239283428e-05, "loss": 0.0135, "step": 608380 }, { "epoch": 1.58, "learning_rate": 6.34448041764628e-05, "loss": 0.0079, "step": 608390 }, { "epoch": 1.58, "learning_rate": 6.344091596009135e-05, "loss": 0.0115, "step": 608400 }, { "epoch": 1.58, "learning_rate": 6.343702774371987e-05, "loss": 0.0098, "step": 608410 }, { "epoch": 1.58, "learning_rate": 6.343313952734842e-05, "loss": 0.0106, "step": 608420 }, { "epoch": 1.58, "learning_rate": 6.342925131097694e-05, "loss": 0.0091, "step": 608430 }, { "epoch": 1.58, "learning_rate": 6.342536309460549e-05, "loss": 0.0094, "step": 608440 }, { "epoch": 1.58, "learning_rate": 6.342147487823403e-05, "loss": 0.0104, "step": 608450 }, { "epoch": 1.58, "learning_rate": 6.341758666186256e-05, "loss": 0.0076, "step": 608460 }, { "epoch": 1.58, "learning_rate": 6.34136984454911e-05, "loss": 0.008, "step": 608470 }, { "epoch": 1.58, "learning_rate": 6.340981022911963e-05, "loss": 0.0115, "step": 608480 }, { "epoch": 1.58, "learning_rate": 6.340592201274815e-05, "loss": 0.0095, "step": 608490 }, { "epoch": 1.58, "learning_rate": 6.34020337963767e-05, "loss": 0.0061, "step": 608500 }, { "epoch": 1.58, "learning_rate": 6.339814558000522e-05, "loss": 0.0105, "step": 608510 }, { "epoch": 1.58, "learning_rate": 6.339425736363376e-05, "loss": 0.0063, "step": 608520 }, { "epoch": 1.58, "learning_rate": 6.339036914726229e-05, "loss": 0.0085, "step": 608530 }, { "epoch": 1.58, "learning_rate": 6.338648093089083e-05, "loss": 0.0102, "step": 608540 }, { "epoch": 1.58, "learning_rate": 6.338259271451938e-05, "loss": 0.0076, "step": 608550 }, { "epoch": 1.58, "learning_rate": 6.33787044981479e-05, "loss": 0.01, "step": 608560 }, { "epoch": 1.58, "learning_rate": 6.337481628177645e-05, "loss": 0.0069, "step": 608570 }, { "epoch": 1.58, "learning_rate": 6.337092806540497e-05, "loss": 0.0078, "step": 608580 }, { "epoch": 1.58, "learning_rate": 6.336703984903352e-05, "loss": 0.0099, "step": 608590 }, { "epoch": 1.58, "learning_rate": 6.336315163266204e-05, "loss": 0.0074, "step": 608600 }, { "epoch": 1.58, "learning_rate": 6.335926341629059e-05, "loss": 0.0066, "step": 608610 }, { "epoch": 1.58, "learning_rate": 6.335537519991913e-05, "loss": 0.0099, "step": 608620 }, { "epoch": 1.58, "learning_rate": 6.335148698354765e-05, "loss": 0.0069, "step": 608630 }, { "epoch": 1.58, "learning_rate": 6.33475987671762e-05, "loss": 0.0099, "step": 608640 }, { "epoch": 1.58, "learning_rate": 6.334371055080472e-05, "loss": 0.0067, "step": 608650 }, { "epoch": 1.58, "learning_rate": 6.333982233443327e-05, "loss": 0.0074, "step": 608660 }, { "epoch": 1.58, "learning_rate": 6.33359341180618e-05, "loss": 0.0087, "step": 608670 }, { "epoch": 1.58, "learning_rate": 6.333204590169034e-05, "loss": 0.0087, "step": 608680 }, { "epoch": 1.58, "learning_rate": 6.332815768531886e-05, "loss": 0.0127, "step": 608690 }, { "epoch": 1.58, "learning_rate": 6.33242694689474e-05, "loss": 0.0119, "step": 608700 }, { "epoch": 1.58, "learning_rate": 6.332038125257595e-05, "loss": 0.0083, "step": 608710 }, { "epoch": 1.58, "learning_rate": 6.331649303620448e-05, "loss": 0.0081, "step": 608720 }, { "epoch": 1.58, "learning_rate": 6.3312604819833e-05, "loss": 0.007, "step": 608730 }, { "epoch": 1.58, "learning_rate": 6.330871660346155e-05, "loss": 0.007, "step": 608740 }, { "epoch": 1.58, "learning_rate": 6.330482838709007e-05, "loss": 0.0093, "step": 608750 }, { "epoch": 1.58, "learning_rate": 6.330094017071861e-05, "loss": 0.0086, "step": 608760 }, { "epoch": 1.58, "learning_rate": 6.329705195434714e-05, "loss": 0.0089, "step": 608770 }, { "epoch": 1.58, "learning_rate": 6.329316373797568e-05, "loss": 0.0134, "step": 608780 }, { "epoch": 1.58, "learning_rate": 6.328927552160421e-05, "loss": 0.0069, "step": 608790 }, { "epoch": 1.58, "learning_rate": 6.328538730523275e-05, "loss": 0.008, "step": 608800 }, { "epoch": 1.58, "learning_rate": 6.32814990888613e-05, "loss": 0.0083, "step": 608810 }, { "epoch": 1.58, "learning_rate": 6.327761087248982e-05, "loss": 0.0086, "step": 608820 }, { "epoch": 1.58, "learning_rate": 6.327372265611837e-05, "loss": 0.0087, "step": 608830 }, { "epoch": 1.58, "learning_rate": 6.32698344397469e-05, "loss": 0.0118, "step": 608840 }, { "epoch": 1.58, "learning_rate": 6.326594622337544e-05, "loss": 0.0106, "step": 608850 }, { "epoch": 1.58, "learning_rate": 6.326205800700396e-05, "loss": 0.0078, "step": 608860 }, { "epoch": 1.58, "learning_rate": 6.32581697906325e-05, "loss": 0.0082, "step": 608870 }, { "epoch": 1.58, "learning_rate": 6.325428157426103e-05, "loss": 0.0062, "step": 608880 }, { "epoch": 1.58, "learning_rate": 6.325039335788957e-05, "loss": 0.0092, "step": 608890 }, { "epoch": 1.58, "learning_rate": 6.324650514151812e-05, "loss": 0.0085, "step": 608900 }, { "epoch": 1.58, "learning_rate": 6.324261692514664e-05, "loss": 0.0095, "step": 608910 }, { "epoch": 1.58, "learning_rate": 6.323872870877519e-05, "loss": 0.0161, "step": 608920 }, { "epoch": 1.58, "learning_rate": 6.323484049240371e-05, "loss": 0.0093, "step": 608930 }, { "epoch": 1.58, "learning_rate": 6.323095227603226e-05, "loss": 0.0085, "step": 608940 }, { "epoch": 1.58, "learning_rate": 6.322706405966078e-05, "loss": 0.0085, "step": 608950 }, { "epoch": 1.58, "learning_rate": 6.322317584328933e-05, "loss": 0.0081, "step": 608960 }, { "epoch": 1.58, "learning_rate": 6.321928762691787e-05, "loss": 0.006, "step": 608970 }, { "epoch": 1.58, "learning_rate": 6.321539941054638e-05, "loss": 0.01, "step": 608980 }, { "epoch": 1.58, "learning_rate": 6.321151119417492e-05, "loss": 0.006, "step": 608990 }, { "epoch": 1.58, "learning_rate": 6.320762297780347e-05, "loss": 0.0114, "step": 609000 }, { "epoch": 1.58, "eval_cer": 0.8816942885015627, "eval_loss": 0.005694786552339792, "eval_runtime": 107.9833, "eval_samples_per_second": 18.521, "eval_steps_per_second": 4.63, "step": 609000 }, { "epoch": 1.58, "learning_rate": 6.320373476143199e-05, "loss": 0.0093, "step": 609010 }, { "epoch": 1.58, "learning_rate": 6.319984654506053e-05, "loss": 0.0085, "step": 609020 }, { "epoch": 1.58, "learning_rate": 6.319595832868906e-05, "loss": 0.0108, "step": 609030 }, { "epoch": 1.58, "learning_rate": 6.31920701123176e-05, "loss": 0.0069, "step": 609040 }, { "epoch": 1.58, "learning_rate": 6.318818189594613e-05, "loss": 0.0056, "step": 609050 }, { "epoch": 1.58, "learning_rate": 6.318429367957467e-05, "loss": 0.0079, "step": 609060 }, { "epoch": 1.58, "learning_rate": 6.318040546320322e-05, "loss": 0.0079, "step": 609070 }, { "epoch": 1.58, "learning_rate": 6.317651724683174e-05, "loss": 0.0078, "step": 609080 }, { "epoch": 1.58, "learning_rate": 6.317262903046029e-05, "loss": 0.0129, "step": 609090 }, { "epoch": 1.58, "learning_rate": 6.316874081408881e-05, "loss": 0.0087, "step": 609100 }, { "epoch": 1.58, "learning_rate": 6.316485259771736e-05, "loss": 0.008, "step": 609110 }, { "epoch": 1.58, "learning_rate": 6.316096438134588e-05, "loss": 0.0079, "step": 609120 }, { "epoch": 1.58, "learning_rate": 6.315707616497442e-05, "loss": 0.0104, "step": 609130 }, { "epoch": 1.58, "learning_rate": 6.315318794860295e-05, "loss": 0.0074, "step": 609140 }, { "epoch": 1.58, "learning_rate": 6.31492997322315e-05, "loss": 0.0069, "step": 609150 }, { "epoch": 1.58, "learning_rate": 6.314541151586004e-05, "loss": 0.0095, "step": 609160 }, { "epoch": 1.58, "learning_rate": 6.314152329948856e-05, "loss": 0.0094, "step": 609170 }, { "epoch": 1.58, "learning_rate": 6.31376350831171e-05, "loss": 0.0081, "step": 609180 }, { "epoch": 1.58, "learning_rate": 6.313374686674563e-05, "loss": 0.0087, "step": 609190 }, { "epoch": 1.58, "learning_rate": 6.312985865037418e-05, "loss": 0.0069, "step": 609200 }, { "epoch": 1.58, "learning_rate": 6.31259704340027e-05, "loss": 0.0088, "step": 609210 }, { "epoch": 1.58, "learning_rate": 6.312208221763125e-05, "loss": 0.0069, "step": 609220 }, { "epoch": 1.58, "learning_rate": 6.311819400125977e-05, "loss": 0.0083, "step": 609230 }, { "epoch": 1.58, "learning_rate": 6.31143057848883e-05, "loss": 0.0057, "step": 609240 }, { "epoch": 1.58, "learning_rate": 6.311041756851684e-05, "loss": 0.0091, "step": 609250 }, { "epoch": 1.58, "learning_rate": 6.310652935214538e-05, "loss": 0.0085, "step": 609260 }, { "epoch": 1.58, "learning_rate": 6.310264113577391e-05, "loss": 0.0078, "step": 609270 }, { "epoch": 1.58, "learning_rate": 6.309875291940245e-05, "loss": 0.0067, "step": 609280 }, { "epoch": 1.58, "learning_rate": 6.309486470303098e-05, "loss": 0.0065, "step": 609290 }, { "epoch": 1.58, "learning_rate": 6.309097648665952e-05, "loss": 0.0079, "step": 609300 }, { "epoch": 1.58, "learning_rate": 6.308708827028805e-05, "loss": 0.0086, "step": 609310 }, { "epoch": 1.58, "learning_rate": 6.30832000539166e-05, "loss": 0.0082, "step": 609320 }, { "epoch": 1.58, "learning_rate": 6.307931183754514e-05, "loss": 0.0085, "step": 609330 }, { "epoch": 1.58, "learning_rate": 6.307542362117366e-05, "loss": 0.0072, "step": 609340 }, { "epoch": 1.58, "learning_rate": 6.30715354048022e-05, "loss": 0.0059, "step": 609350 }, { "epoch": 1.58, "learning_rate": 6.306764718843073e-05, "loss": 0.0105, "step": 609360 }, { "epoch": 1.58, "learning_rate": 6.306375897205928e-05, "loss": 0.0061, "step": 609370 }, { "epoch": 1.58, "learning_rate": 6.30598707556878e-05, "loss": 0.0107, "step": 609380 }, { "epoch": 1.58, "learning_rate": 6.305598253931634e-05, "loss": 0.0069, "step": 609390 }, { "epoch": 1.58, "learning_rate": 6.305209432294487e-05, "loss": 0.0093, "step": 609400 }, { "epoch": 1.58, "learning_rate": 6.304820610657341e-05, "loss": 0.0071, "step": 609410 }, { "epoch": 1.58, "learning_rate": 6.304431789020196e-05, "loss": 0.0089, "step": 609420 }, { "epoch": 1.58, "learning_rate": 6.304042967383048e-05, "loss": 0.0087, "step": 609430 }, { "epoch": 1.58, "learning_rate": 6.303654145745903e-05, "loss": 0.01, "step": 609440 }, { "epoch": 1.58, "learning_rate": 6.303265324108755e-05, "loss": 0.0092, "step": 609450 }, { "epoch": 1.58, "learning_rate": 6.30287650247161e-05, "loss": 0.0066, "step": 609460 }, { "epoch": 1.58, "learning_rate": 6.302487680834462e-05, "loss": 0.0083, "step": 609470 }, { "epoch": 1.58, "learning_rate": 6.302098859197315e-05, "loss": 0.0084, "step": 609480 }, { "epoch": 1.58, "learning_rate": 6.30171003756017e-05, "loss": 0.01, "step": 609490 }, { "epoch": 1.58, "learning_rate": 6.301321215923022e-05, "loss": 0.0096, "step": 609500 }, { "epoch": 1.58, "learning_rate": 6.300932394285876e-05, "loss": 0.0078, "step": 609510 }, { "epoch": 1.58, "learning_rate": 6.30054357264873e-05, "loss": 0.0108, "step": 609520 }, { "epoch": 1.58, "learning_rate": 6.300154751011583e-05, "loss": 0.0085, "step": 609530 }, { "epoch": 1.58, "learning_rate": 6.299765929374437e-05, "loss": 0.0094, "step": 609540 }, { "epoch": 1.58, "learning_rate": 6.29937710773729e-05, "loss": 0.0098, "step": 609550 }, { "epoch": 1.58, "learning_rate": 6.298988286100144e-05, "loss": 0.0078, "step": 609560 }, { "epoch": 1.58, "learning_rate": 6.298599464462997e-05, "loss": 0.0143, "step": 609570 }, { "epoch": 1.58, "learning_rate": 6.298210642825851e-05, "loss": 0.0069, "step": 609580 }, { "epoch": 1.58, "learning_rate": 6.297821821188706e-05, "loss": 0.0091, "step": 609590 }, { "epoch": 1.58, "learning_rate": 6.297432999551558e-05, "loss": 0.007, "step": 609600 }, { "epoch": 1.58, "learning_rate": 6.297044177914413e-05, "loss": 0.0113, "step": 609610 }, { "epoch": 1.58, "learning_rate": 6.296655356277265e-05, "loss": 0.0108, "step": 609620 }, { "epoch": 1.58, "learning_rate": 6.29626653464012e-05, "loss": 0.0111, "step": 609630 }, { "epoch": 1.58, "learning_rate": 6.295877713002972e-05, "loss": 0.0092, "step": 609640 }, { "epoch": 1.58, "learning_rate": 6.295488891365826e-05, "loss": 0.0096, "step": 609650 }, { "epoch": 1.58, "learning_rate": 6.295100069728679e-05, "loss": 0.0084, "step": 609660 }, { "epoch": 1.58, "learning_rate": 6.294711248091533e-05, "loss": 0.0084, "step": 609670 }, { "epoch": 1.58, "learning_rate": 6.294322426454388e-05, "loss": 0.0065, "step": 609680 }, { "epoch": 1.58, "learning_rate": 6.29393360481724e-05, "loss": 0.0062, "step": 609690 }, { "epoch": 1.58, "learning_rate": 6.293544783180095e-05, "loss": 0.0087, "step": 609700 }, { "epoch": 1.58, "learning_rate": 6.293155961542947e-05, "loss": 0.009, "step": 609710 }, { "epoch": 1.58, "learning_rate": 6.292767139905802e-05, "loss": 0.0075, "step": 609720 }, { "epoch": 1.58, "learning_rate": 6.292378318268654e-05, "loss": 0.0063, "step": 609730 }, { "epoch": 1.58, "learning_rate": 6.291989496631507e-05, "loss": 0.0054, "step": 609740 }, { "epoch": 1.58, "learning_rate": 6.291600674994361e-05, "loss": 0.0105, "step": 609750 }, { "epoch": 1.58, "learning_rate": 6.291211853357214e-05, "loss": 0.008, "step": 609760 }, { "epoch": 1.58, "learning_rate": 6.290823031720068e-05, "loss": 0.0063, "step": 609770 }, { "epoch": 1.58, "learning_rate": 6.290434210082922e-05, "loss": 0.0085, "step": 609780 }, { "epoch": 1.58, "learning_rate": 6.290045388445775e-05, "loss": 0.0074, "step": 609790 }, { "epoch": 1.58, "learning_rate": 6.28965656680863e-05, "loss": 0.0081, "step": 609800 }, { "epoch": 1.58, "learning_rate": 6.289267745171482e-05, "loss": 0.0069, "step": 609810 }, { "epoch": 1.58, "learning_rate": 6.288878923534336e-05, "loss": 0.0093, "step": 609820 }, { "epoch": 1.58, "learning_rate": 6.288490101897189e-05, "loss": 0.0061, "step": 609830 }, { "epoch": 1.58, "learning_rate": 6.288101280260043e-05, "loss": 0.0077, "step": 609840 }, { "epoch": 1.58, "learning_rate": 6.287712458622898e-05, "loss": 0.0091, "step": 609850 }, { "epoch": 1.58, "learning_rate": 6.28732363698575e-05, "loss": 0.0086, "step": 609860 }, { "epoch": 1.58, "learning_rate": 6.286934815348605e-05, "loss": 0.0097, "step": 609870 }, { "epoch": 1.58, "learning_rate": 6.286545993711457e-05, "loss": 0.0081, "step": 609880 }, { "epoch": 1.58, "learning_rate": 6.286157172074312e-05, "loss": 0.0089, "step": 609890 }, { "epoch": 1.58, "learning_rate": 6.285768350437164e-05, "loss": 0.0091, "step": 609900 }, { "epoch": 1.58, "learning_rate": 6.285379528800018e-05, "loss": 0.0071, "step": 609910 }, { "epoch": 1.58, "learning_rate": 6.284990707162871e-05, "loss": 0.0076, "step": 609920 }, { "epoch": 1.58, "learning_rate": 6.284601885525725e-05, "loss": 0.0086, "step": 609930 }, { "epoch": 1.58, "learning_rate": 6.28421306388858e-05, "loss": 0.0063, "step": 609940 }, { "epoch": 1.58, "learning_rate": 6.283824242251432e-05, "loss": 0.0101, "step": 609950 }, { "epoch": 1.58, "learning_rate": 6.283435420614287e-05, "loss": 0.0117, "step": 609960 }, { "epoch": 1.58, "learning_rate": 6.28304659897714e-05, "loss": 0.0076, "step": 609970 }, { "epoch": 1.58, "learning_rate": 6.282657777339992e-05, "loss": 0.0063, "step": 609980 }, { "epoch": 1.58, "learning_rate": 6.282268955702846e-05, "loss": 0.0114, "step": 609990 }, { "epoch": 1.58, "learning_rate": 6.281880134065699e-05, "loss": 0.0159, "step": 610000 }, { "epoch": 1.58, "eval_cer": 0.8816956881384969, "eval_loss": 0.005619341507554054, "eval_runtime": 107.799, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 610000 }, { "epoch": 1.58, "learning_rate": 6.281491312428553e-05, "loss": 0.0054, "step": 610010 }, { "epoch": 1.58, "learning_rate": 6.281102490791406e-05, "loss": 0.008, "step": 610020 }, { "epoch": 1.58, "learning_rate": 6.28071366915426e-05, "loss": 0.0133, "step": 610030 }, { "epoch": 1.58, "learning_rate": 6.280324847517114e-05, "loss": 0.0086, "step": 610040 }, { "epoch": 1.58, "learning_rate": 6.279936025879967e-05, "loss": 0.0084, "step": 610050 }, { "epoch": 1.58, "learning_rate": 6.279547204242821e-05, "loss": 0.0081, "step": 610060 }, { "epoch": 1.58, "learning_rate": 6.279158382605674e-05, "loss": 0.0099, "step": 610070 }, { "epoch": 1.58, "learning_rate": 6.278769560968528e-05, "loss": 0.0092, "step": 610080 }, { "epoch": 1.58, "learning_rate": 6.278380739331381e-05, "loss": 0.0096, "step": 610090 }, { "epoch": 1.58, "learning_rate": 6.277991917694235e-05, "loss": 0.0092, "step": 610100 }, { "epoch": 1.58, "learning_rate": 6.27760309605709e-05, "loss": 0.0076, "step": 610110 }, { "epoch": 1.58, "learning_rate": 6.277214274419942e-05, "loss": 0.009, "step": 610120 }, { "epoch": 1.58, "learning_rate": 6.276825452782797e-05, "loss": 0.0109, "step": 610130 }, { "epoch": 1.58, "learning_rate": 6.27643663114565e-05, "loss": 0.0092, "step": 610140 }, { "epoch": 1.58, "learning_rate": 6.276047809508504e-05, "loss": 0.0126, "step": 610150 }, { "epoch": 1.58, "learning_rate": 6.275658987871356e-05, "loss": 0.0071, "step": 610160 }, { "epoch": 1.58, "learning_rate": 6.27527016623421e-05, "loss": 0.007, "step": 610170 }, { "epoch": 1.58, "learning_rate": 6.274881344597063e-05, "loss": 0.0106, "step": 610180 }, { "epoch": 1.58, "learning_rate": 6.274492522959917e-05, "loss": 0.0088, "step": 610190 }, { "epoch": 1.58, "learning_rate": 6.274103701322772e-05, "loss": 0.0074, "step": 610200 }, { "epoch": 1.58, "learning_rate": 6.273714879685624e-05, "loss": 0.0089, "step": 610210 }, { "epoch": 1.58, "learning_rate": 6.273326058048477e-05, "loss": 0.0062, "step": 610220 }, { "epoch": 1.58, "learning_rate": 6.272937236411331e-05, "loss": 0.0096, "step": 610230 }, { "epoch": 1.58, "learning_rate": 6.272548414774184e-05, "loss": 0.0094, "step": 610240 }, { "epoch": 1.58, "learning_rate": 6.272159593137038e-05, "loss": 0.0086, "step": 610250 }, { "epoch": 1.58, "learning_rate": 6.271770771499891e-05, "loss": 0.0115, "step": 610260 }, { "epoch": 1.58, "learning_rate": 6.271381949862745e-05, "loss": 0.0091, "step": 610270 }, { "epoch": 1.58, "learning_rate": 6.270993128225598e-05, "loss": 0.0082, "step": 610280 }, { "epoch": 1.58, "learning_rate": 6.270604306588452e-05, "loss": 0.0095, "step": 610290 }, { "epoch": 1.58, "learning_rate": 6.270215484951306e-05, "loss": 0.0085, "step": 610300 }, { "epoch": 1.58, "learning_rate": 6.269826663314159e-05, "loss": 0.0124, "step": 610310 }, { "epoch": 1.58, "learning_rate": 6.269437841677013e-05, "loss": 0.0123, "step": 610320 }, { "epoch": 1.58, "learning_rate": 6.269049020039866e-05, "loss": 0.0128, "step": 610330 }, { "epoch": 1.58, "learning_rate": 6.26866019840272e-05, "loss": 0.0088, "step": 610340 }, { "epoch": 1.58, "learning_rate": 6.268271376765573e-05, "loss": 0.0073, "step": 610350 }, { "epoch": 1.58, "learning_rate": 6.267882555128427e-05, "loss": 0.0092, "step": 610360 }, { "epoch": 1.58, "learning_rate": 6.26749373349128e-05, "loss": 0.0102, "step": 610370 }, { "epoch": 1.58, "learning_rate": 6.267104911854134e-05, "loss": 0.0076, "step": 610380 }, { "epoch": 1.58, "learning_rate": 6.266716090216989e-05, "loss": 0.0093, "step": 610390 }, { "epoch": 1.58, "learning_rate": 6.266327268579841e-05, "loss": 0.0075, "step": 610400 }, { "epoch": 1.58, "learning_rate": 6.265938446942696e-05, "loss": 0.0152, "step": 610410 }, { "epoch": 1.58, "learning_rate": 6.265549625305548e-05, "loss": 0.009, "step": 610420 }, { "epoch": 1.58, "learning_rate": 6.265160803668402e-05, "loss": 0.0072, "step": 610430 }, { "epoch": 1.58, "learning_rate": 6.264771982031255e-05, "loss": 0.007, "step": 610440 }, { "epoch": 1.58, "learning_rate": 6.26438316039411e-05, "loss": 0.0064, "step": 610450 }, { "epoch": 1.58, "learning_rate": 6.263994338756964e-05, "loss": 0.0089, "step": 610460 }, { "epoch": 1.58, "learning_rate": 6.263605517119815e-05, "loss": 0.0094, "step": 610470 }, { "epoch": 1.58, "learning_rate": 6.263216695482669e-05, "loss": 0.0082, "step": 610480 }, { "epoch": 1.58, "learning_rate": 6.262827873845523e-05, "loss": 0.0086, "step": 610490 }, { "epoch": 1.58, "learning_rate": 6.262439052208376e-05, "loss": 0.0066, "step": 610500 }, { "epoch": 1.58, "learning_rate": 6.26205023057123e-05, "loss": 0.0078, "step": 610510 }, { "epoch": 1.58, "learning_rate": 6.261661408934083e-05, "loss": 0.0087, "step": 610520 }, { "epoch": 1.58, "learning_rate": 6.261272587296937e-05, "loss": 0.0086, "step": 610530 }, { "epoch": 1.58, "learning_rate": 6.26088376565979e-05, "loss": 0.0095, "step": 610540 }, { "epoch": 1.58, "learning_rate": 6.260494944022644e-05, "loss": 0.0066, "step": 610550 }, { "epoch": 1.58, "learning_rate": 6.260106122385498e-05, "loss": 0.0108, "step": 610560 }, { "epoch": 1.58, "learning_rate": 6.259717300748351e-05, "loss": 0.0086, "step": 610570 }, { "epoch": 1.58, "learning_rate": 6.259328479111205e-05, "loss": 0.0117, "step": 610580 }, { "epoch": 1.58, "learning_rate": 6.258939657474058e-05, "loss": 0.0083, "step": 610590 }, { "epoch": 1.58, "learning_rate": 6.258550835836912e-05, "loss": 0.0061, "step": 610600 }, { "epoch": 1.58, "learning_rate": 6.258162014199765e-05, "loss": 0.009, "step": 610610 }, { "epoch": 1.58, "learning_rate": 6.25777319256262e-05, "loss": 0.0106, "step": 610620 }, { "epoch": 1.58, "learning_rate": 6.257384370925472e-05, "loss": 0.0094, "step": 610630 }, { "epoch": 1.58, "learning_rate": 6.256995549288326e-05, "loss": 0.0073, "step": 610640 }, { "epoch": 1.58, "learning_rate": 6.25660672765118e-05, "loss": 0.0112, "step": 610650 }, { "epoch": 1.58, "learning_rate": 6.256217906014033e-05, "loss": 0.0087, "step": 610660 }, { "epoch": 1.58, "learning_rate": 6.255829084376887e-05, "loss": 0.0085, "step": 610670 }, { "epoch": 1.58, "learning_rate": 6.25544026273974e-05, "loss": 0.0092, "step": 610680 }, { "epoch": 1.58, "learning_rate": 6.255051441102594e-05, "loss": 0.0099, "step": 610690 }, { "epoch": 1.58, "learning_rate": 6.254662619465447e-05, "loss": 0.0099, "step": 610700 }, { "epoch": 1.58, "learning_rate": 6.254273797828301e-05, "loss": 0.0095, "step": 610710 }, { "epoch": 1.58, "learning_rate": 6.253884976191154e-05, "loss": 0.0078, "step": 610720 }, { "epoch": 1.58, "learning_rate": 6.253496154554007e-05, "loss": 0.0085, "step": 610730 }, { "epoch": 1.58, "learning_rate": 6.253107332916861e-05, "loss": 0.0076, "step": 610740 }, { "epoch": 1.58, "learning_rate": 6.252718511279715e-05, "loss": 0.0088, "step": 610750 }, { "epoch": 1.58, "learning_rate": 6.252329689642568e-05, "loss": 0.0074, "step": 610760 }, { "epoch": 1.58, "learning_rate": 6.251940868005422e-05, "loss": 0.0068, "step": 610770 }, { "epoch": 1.58, "learning_rate": 6.251552046368275e-05, "loss": 0.0082, "step": 610780 }, { "epoch": 1.58, "learning_rate": 6.25116322473113e-05, "loss": 0.0078, "step": 610790 }, { "epoch": 1.58, "learning_rate": 6.250774403093982e-05, "loss": 0.008, "step": 610800 }, { "epoch": 1.58, "learning_rate": 6.250385581456836e-05, "loss": 0.0127, "step": 610810 }, { "epoch": 1.58, "learning_rate": 6.24999675981969e-05, "loss": 0.009, "step": 610820 }, { "epoch": 1.58, "learning_rate": 6.249607938182543e-05, "loss": 0.0092, "step": 610830 }, { "epoch": 1.58, "learning_rate": 6.249219116545397e-05, "loss": 0.0073, "step": 610840 }, { "epoch": 1.58, "learning_rate": 6.24883029490825e-05, "loss": 0.0109, "step": 610850 }, { "epoch": 1.58, "learning_rate": 6.248441473271104e-05, "loss": 0.0071, "step": 610860 }, { "epoch": 1.58, "learning_rate": 6.248052651633957e-05, "loss": 0.0081, "step": 610870 }, { "epoch": 1.58, "learning_rate": 6.247663829996811e-05, "loss": 0.0107, "step": 610880 }, { "epoch": 1.58, "learning_rate": 6.247275008359664e-05, "loss": 0.0085, "step": 610890 }, { "epoch": 1.58, "learning_rate": 6.246886186722518e-05, "loss": 0.0065, "step": 610900 }, { "epoch": 1.58, "learning_rate": 6.246497365085373e-05, "loss": 0.0081, "step": 610910 }, { "epoch": 1.58, "learning_rate": 6.246108543448225e-05, "loss": 0.0102, "step": 610920 }, { "epoch": 1.58, "learning_rate": 6.24571972181108e-05, "loss": 0.0111, "step": 610930 }, { "epoch": 1.58, "learning_rate": 6.245330900173932e-05, "loss": 0.0108, "step": 610940 }, { "epoch": 1.58, "learning_rate": 6.244942078536786e-05, "loss": 0.0114, "step": 610950 }, { "epoch": 1.58, "learning_rate": 6.244553256899639e-05, "loss": 0.0094, "step": 610960 }, { "epoch": 1.58, "learning_rate": 6.244164435262492e-05, "loss": 0.0092, "step": 610970 }, { "epoch": 1.58, "learning_rate": 6.243775613625346e-05, "loss": 0.0064, "step": 610980 }, { "epoch": 1.58, "learning_rate": 6.243386791988199e-05, "loss": 0.0104, "step": 610990 }, { "epoch": 1.58, "learning_rate": 6.242997970351053e-05, "loss": 0.0091, "step": 611000 }, { "epoch": 1.58, "eval_cer": 0.8816872903168917, "eval_loss": 0.005523571744561195, "eval_runtime": 107.8962, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 611000 }, { "epoch": 1.58, "learning_rate": 6.242609148713907e-05, "loss": 0.0079, "step": 611010 }, { "epoch": 1.58, "learning_rate": 6.24222032707676e-05, "loss": 0.0078, "step": 611020 }, { "epoch": 1.58, "learning_rate": 6.241831505439614e-05, "loss": 0.0083, "step": 611030 }, { "epoch": 1.58, "learning_rate": 6.241442683802467e-05, "loss": 0.0077, "step": 611040 }, { "epoch": 1.58, "learning_rate": 6.241053862165321e-05, "loss": 0.0089, "step": 611050 }, { "epoch": 1.58, "learning_rate": 6.240665040528174e-05, "loss": 0.0097, "step": 611060 }, { "epoch": 1.58, "learning_rate": 6.240276218891028e-05, "loss": 0.0075, "step": 611070 }, { "epoch": 1.58, "learning_rate": 6.239887397253882e-05, "loss": 0.0077, "step": 611080 }, { "epoch": 1.58, "learning_rate": 6.239498575616735e-05, "loss": 0.0078, "step": 611090 }, { "epoch": 1.58, "learning_rate": 6.23910975397959e-05, "loss": 0.0093, "step": 611100 }, { "epoch": 1.58, "learning_rate": 6.238720932342442e-05, "loss": 0.0083, "step": 611110 }, { "epoch": 1.58, "learning_rate": 6.238332110705296e-05, "loss": 0.0104, "step": 611120 }, { "epoch": 1.58, "learning_rate": 6.237943289068149e-05, "loss": 0.0045, "step": 611130 }, { "epoch": 1.58, "learning_rate": 6.237554467431003e-05, "loss": 0.0143, "step": 611140 }, { "epoch": 1.58, "learning_rate": 6.237165645793856e-05, "loss": 0.0081, "step": 611150 }, { "epoch": 1.58, "learning_rate": 6.23677682415671e-05, "loss": 0.0083, "step": 611160 }, { "epoch": 1.58, "learning_rate": 6.236388002519565e-05, "loss": 0.0076, "step": 611170 }, { "epoch": 1.58, "learning_rate": 6.235999180882417e-05, "loss": 0.0093, "step": 611180 }, { "epoch": 1.58, "learning_rate": 6.235610359245271e-05, "loss": 0.008, "step": 611190 }, { "epoch": 1.58, "learning_rate": 6.235221537608124e-05, "loss": 0.0112, "step": 611200 }, { "epoch": 1.58, "learning_rate": 6.234832715970978e-05, "loss": 0.0109, "step": 611210 }, { "epoch": 1.58, "learning_rate": 6.234443894333831e-05, "loss": 0.0107, "step": 611220 }, { "epoch": 1.58, "learning_rate": 6.234055072696684e-05, "loss": 0.0097, "step": 611230 }, { "epoch": 1.58, "learning_rate": 6.233666251059538e-05, "loss": 0.0085, "step": 611240 }, { "epoch": 1.58, "learning_rate": 6.233277429422391e-05, "loss": 0.0059, "step": 611250 }, { "epoch": 1.58, "learning_rate": 6.232888607785245e-05, "loss": 0.0079, "step": 611260 }, { "epoch": 1.58, "learning_rate": 6.2324997861481e-05, "loss": 0.006, "step": 611270 }, { "epoch": 1.58, "learning_rate": 6.232110964510952e-05, "loss": 0.0128, "step": 611280 }, { "epoch": 1.58, "learning_rate": 6.231722142873806e-05, "loss": 0.0096, "step": 611290 }, { "epoch": 1.58, "learning_rate": 6.231333321236659e-05, "loss": 0.0078, "step": 611300 }, { "epoch": 1.58, "learning_rate": 6.230944499599513e-05, "loss": 0.0096, "step": 611310 }, { "epoch": 1.58, "learning_rate": 6.230555677962366e-05, "loss": 0.0096, "step": 611320 }, { "epoch": 1.58, "learning_rate": 6.23016685632522e-05, "loss": 0.0116, "step": 611330 }, { "epoch": 1.58, "learning_rate": 6.229778034688074e-05, "loss": 0.0077, "step": 611340 }, { "epoch": 1.58, "learning_rate": 6.229389213050927e-05, "loss": 0.0073, "step": 611350 }, { "epoch": 1.58, "learning_rate": 6.229000391413781e-05, "loss": 0.0107, "step": 611360 }, { "epoch": 1.58, "learning_rate": 6.228611569776634e-05, "loss": 0.0068, "step": 611370 }, { "epoch": 1.58, "learning_rate": 6.228222748139488e-05, "loss": 0.0069, "step": 611380 }, { "epoch": 1.58, "learning_rate": 6.227833926502341e-05, "loss": 0.0126, "step": 611390 }, { "epoch": 1.58, "learning_rate": 6.227445104865195e-05, "loss": 0.0084, "step": 611400 }, { "epoch": 1.58, "learning_rate": 6.227056283228048e-05, "loss": 0.0109, "step": 611410 }, { "epoch": 1.58, "learning_rate": 6.226667461590902e-05, "loss": 0.0094, "step": 611420 }, { "epoch": 1.58, "learning_rate": 6.226278639953757e-05, "loss": 0.007, "step": 611430 }, { "epoch": 1.58, "learning_rate": 6.225889818316609e-05, "loss": 0.0073, "step": 611440 }, { "epoch": 1.58, "learning_rate": 6.225500996679463e-05, "loss": 0.0074, "step": 611450 }, { "epoch": 1.58, "learning_rate": 6.225112175042316e-05, "loss": 0.0082, "step": 611460 }, { "epoch": 1.59, "learning_rate": 6.224723353405169e-05, "loss": 0.0115, "step": 611470 }, { "epoch": 1.59, "learning_rate": 6.224334531768023e-05, "loss": 0.0088, "step": 611480 }, { "epoch": 1.59, "learning_rate": 6.223945710130876e-05, "loss": 0.0082, "step": 611490 }, { "epoch": 1.59, "learning_rate": 6.22355688849373e-05, "loss": 0.0101, "step": 611500 }, { "epoch": 1.59, "learning_rate": 6.223168066856583e-05, "loss": 0.0069, "step": 611510 }, { "epoch": 1.59, "learning_rate": 6.222779245219437e-05, "loss": 0.0074, "step": 611520 }, { "epoch": 1.59, "learning_rate": 6.222390423582291e-05, "loss": 0.0074, "step": 611530 }, { "epoch": 1.59, "learning_rate": 6.222001601945144e-05, "loss": 0.0077, "step": 611540 }, { "epoch": 1.59, "learning_rate": 6.221612780307998e-05, "loss": 0.0082, "step": 611550 }, { "epoch": 1.59, "learning_rate": 6.221223958670851e-05, "loss": 0.0082, "step": 611560 }, { "epoch": 1.59, "learning_rate": 6.220835137033705e-05, "loss": 0.0081, "step": 611570 }, { "epoch": 1.59, "learning_rate": 6.220446315396558e-05, "loss": 0.0085, "step": 611580 }, { "epoch": 1.59, "learning_rate": 6.220057493759412e-05, "loss": 0.0087, "step": 611590 }, { "epoch": 1.59, "learning_rate": 6.219668672122265e-05, "loss": 0.009, "step": 611600 }, { "epoch": 1.59, "learning_rate": 6.219279850485119e-05, "loss": 0.0072, "step": 611610 }, { "epoch": 1.59, "learning_rate": 6.218891028847973e-05, "loss": 0.0067, "step": 611620 }, { "epoch": 1.59, "learning_rate": 6.218502207210826e-05, "loss": 0.0068, "step": 611630 }, { "epoch": 1.59, "learning_rate": 6.21811338557368e-05, "loss": 0.0115, "step": 611640 }, { "epoch": 1.59, "learning_rate": 6.217724563936533e-05, "loss": 0.0055, "step": 611650 }, { "epoch": 1.59, "learning_rate": 6.217335742299387e-05, "loss": 0.0091, "step": 611660 }, { "epoch": 1.59, "learning_rate": 6.21694692066224e-05, "loss": 0.0078, "step": 611670 }, { "epoch": 1.59, "learning_rate": 6.216558099025094e-05, "loss": 0.0076, "step": 611680 }, { "epoch": 1.59, "learning_rate": 6.216169277387949e-05, "loss": 0.0092, "step": 611690 }, { "epoch": 1.59, "learning_rate": 6.215780455750801e-05, "loss": 0.0108, "step": 611700 }, { "epoch": 1.59, "learning_rate": 6.215391634113654e-05, "loss": 0.0119, "step": 611710 }, { "epoch": 1.59, "learning_rate": 6.215002812476508e-05, "loss": 0.014, "step": 611720 }, { "epoch": 1.59, "learning_rate": 6.214613990839361e-05, "loss": 0.0077, "step": 611730 }, { "epoch": 1.59, "learning_rate": 6.214225169202215e-05, "loss": 0.0078, "step": 611740 }, { "epoch": 1.59, "learning_rate": 6.213836347565068e-05, "loss": 0.0082, "step": 611750 }, { "epoch": 1.59, "learning_rate": 6.213447525927922e-05, "loss": 0.0105, "step": 611760 }, { "epoch": 1.59, "learning_rate": 6.213058704290775e-05, "loss": 0.0096, "step": 611770 }, { "epoch": 1.59, "learning_rate": 6.212669882653629e-05, "loss": 0.0079, "step": 611780 }, { "epoch": 1.59, "learning_rate": 6.212281061016483e-05, "loss": 0.0074, "step": 611790 }, { "epoch": 1.59, "learning_rate": 6.211892239379336e-05, "loss": 0.0082, "step": 611800 }, { "epoch": 1.59, "learning_rate": 6.21150341774219e-05, "loss": 0.0099, "step": 611810 }, { "epoch": 1.59, "learning_rate": 6.211114596105043e-05, "loss": 0.0073, "step": 611820 }, { "epoch": 1.59, "learning_rate": 6.210725774467897e-05, "loss": 0.008, "step": 611830 }, { "epoch": 1.59, "learning_rate": 6.21033695283075e-05, "loss": 0.0094, "step": 611840 }, { "epoch": 1.59, "learning_rate": 6.209948131193604e-05, "loss": 0.0084, "step": 611850 }, { "epoch": 1.59, "learning_rate": 6.209559309556457e-05, "loss": 0.008, "step": 611860 }, { "epoch": 1.59, "learning_rate": 6.209170487919311e-05, "loss": 0.0094, "step": 611870 }, { "epoch": 1.59, "learning_rate": 6.208781666282165e-05, "loss": 0.0101, "step": 611880 }, { "epoch": 1.59, "learning_rate": 6.208392844645018e-05, "loss": 0.0052, "step": 611890 }, { "epoch": 1.59, "learning_rate": 6.208004023007872e-05, "loss": 0.0068, "step": 611900 }, { "epoch": 1.59, "learning_rate": 6.207615201370725e-05, "loss": 0.0136, "step": 611910 }, { "epoch": 1.59, "learning_rate": 6.20722637973358e-05, "loss": 0.0086, "step": 611920 }, { "epoch": 1.59, "learning_rate": 6.206837558096432e-05, "loss": 0.0099, "step": 611930 }, { "epoch": 1.59, "learning_rate": 6.206448736459286e-05, "loss": 0.0076, "step": 611940 }, { "epoch": 1.59, "learning_rate": 6.20605991482214e-05, "loss": 0.0138, "step": 611950 }, { "epoch": 1.59, "learning_rate": 6.205671093184992e-05, "loss": 0.0099, "step": 611960 }, { "epoch": 1.59, "learning_rate": 6.205282271547846e-05, "loss": 0.0095, "step": 611970 }, { "epoch": 1.59, "learning_rate": 6.2048934499107e-05, "loss": 0.0111, "step": 611980 }, { "epoch": 1.59, "learning_rate": 6.204504628273553e-05, "loss": 0.0091, "step": 611990 }, { "epoch": 1.59, "learning_rate": 6.204115806636407e-05, "loss": 0.0058, "step": 612000 }, { "epoch": 1.59, "eval_cer": 0.8816942885015627, "eval_loss": 0.005586665123701096, "eval_runtime": 107.9859, "eval_samples_per_second": 18.521, "eval_steps_per_second": 4.63, "step": 612000 }, { "epoch": 1.59, "learning_rate": 6.20372698499926e-05, "loss": 0.0136, "step": 612010 }, { "epoch": 1.59, "learning_rate": 6.203338163362114e-05, "loss": 0.0122, "step": 612020 }, { "epoch": 1.59, "learning_rate": 6.202949341724967e-05, "loss": 0.0098, "step": 612030 }, { "epoch": 1.59, "learning_rate": 6.202560520087821e-05, "loss": 0.0118, "step": 612040 }, { "epoch": 1.59, "learning_rate": 6.202171698450675e-05, "loss": 0.0087, "step": 612050 }, { "epoch": 1.59, "learning_rate": 6.201782876813528e-05, "loss": 0.0096, "step": 612060 }, { "epoch": 1.59, "learning_rate": 6.201394055176382e-05, "loss": 0.0073, "step": 612070 }, { "epoch": 1.59, "learning_rate": 6.201005233539235e-05, "loss": 0.0076, "step": 612080 }, { "epoch": 1.59, "learning_rate": 6.200616411902089e-05, "loss": 0.0095, "step": 612090 }, { "epoch": 1.59, "learning_rate": 6.200227590264942e-05, "loss": 0.0048, "step": 612100 }, { "epoch": 1.59, "learning_rate": 6.199838768627796e-05, "loss": 0.0101, "step": 612110 }, { "epoch": 1.59, "learning_rate": 6.199449946990649e-05, "loss": 0.0068, "step": 612120 }, { "epoch": 1.59, "learning_rate": 6.199061125353503e-05, "loss": 0.0105, "step": 612130 }, { "epoch": 1.59, "learning_rate": 6.198672303716357e-05, "loss": 0.0054, "step": 612140 }, { "epoch": 1.59, "learning_rate": 6.19828348207921e-05, "loss": 0.0082, "step": 612150 }, { "epoch": 1.59, "learning_rate": 6.197894660442064e-05, "loss": 0.0099, "step": 612160 }, { "epoch": 1.59, "learning_rate": 6.197505838804917e-05, "loss": 0.0066, "step": 612170 }, { "epoch": 1.59, "learning_rate": 6.197117017167771e-05, "loss": 0.0073, "step": 612180 }, { "epoch": 1.59, "learning_rate": 6.196728195530624e-05, "loss": 0.0098, "step": 612190 }, { "epoch": 1.59, "learning_rate": 6.196339373893478e-05, "loss": 0.0091, "step": 612200 }, { "epoch": 1.59, "learning_rate": 6.195950552256331e-05, "loss": 0.0114, "step": 612210 }, { "epoch": 1.59, "learning_rate": 6.195561730619184e-05, "loss": 0.0092, "step": 612220 }, { "epoch": 1.59, "learning_rate": 6.195172908982038e-05, "loss": 0.0078, "step": 612230 }, { "epoch": 1.59, "learning_rate": 6.194784087344892e-05, "loss": 0.0098, "step": 612240 }, { "epoch": 1.59, "learning_rate": 6.194395265707745e-05, "loss": 0.0085, "step": 612250 }, { "epoch": 1.59, "learning_rate": 6.194006444070599e-05, "loss": 0.0072, "step": 612260 }, { "epoch": 1.59, "learning_rate": 6.193617622433452e-05, "loss": 0.0096, "step": 612270 }, { "epoch": 1.59, "learning_rate": 6.193228800796306e-05, "loss": 0.0098, "step": 612280 }, { "epoch": 1.59, "learning_rate": 6.192839979159159e-05, "loss": 0.0094, "step": 612290 }, { "epoch": 1.59, "learning_rate": 6.192451157522013e-05, "loss": 0.0096, "step": 612300 }, { "epoch": 1.59, "learning_rate": 6.192062335884867e-05, "loss": 0.0078, "step": 612310 }, { "epoch": 1.59, "learning_rate": 6.19167351424772e-05, "loss": 0.0105, "step": 612320 }, { "epoch": 1.59, "learning_rate": 6.191284692610574e-05, "loss": 0.0084, "step": 612330 }, { "epoch": 1.59, "learning_rate": 6.190895870973427e-05, "loss": 0.008, "step": 612340 }, { "epoch": 1.59, "learning_rate": 6.190507049336281e-05, "loss": 0.0098, "step": 612350 }, { "epoch": 1.59, "learning_rate": 6.190118227699134e-05, "loss": 0.0088, "step": 612360 }, { "epoch": 1.59, "learning_rate": 6.189729406061988e-05, "loss": 0.0072, "step": 612370 }, { "epoch": 1.59, "learning_rate": 6.189340584424841e-05, "loss": 0.0077, "step": 612380 }, { "epoch": 1.59, "learning_rate": 6.188951762787695e-05, "loss": 0.0069, "step": 612390 }, { "epoch": 1.59, "learning_rate": 6.18856294115055e-05, "loss": 0.0092, "step": 612400 }, { "epoch": 1.59, "learning_rate": 6.188174119513402e-05, "loss": 0.0088, "step": 612410 }, { "epoch": 1.59, "learning_rate": 6.187785297876256e-05, "loss": 0.0103, "step": 612420 }, { "epoch": 1.59, "learning_rate": 6.187396476239109e-05, "loss": 0.0075, "step": 612430 }, { "epoch": 1.59, "learning_rate": 6.187007654601963e-05, "loss": 0.0085, "step": 612440 }, { "epoch": 1.59, "learning_rate": 6.186618832964816e-05, "loss": 0.006, "step": 612450 }, { "epoch": 1.59, "learning_rate": 6.186230011327669e-05, "loss": 0.0086, "step": 612460 }, { "epoch": 1.59, "learning_rate": 6.185841189690523e-05, "loss": 0.0096, "step": 612470 }, { "epoch": 1.59, "learning_rate": 6.185452368053376e-05, "loss": 0.0077, "step": 612480 }, { "epoch": 1.59, "learning_rate": 6.18506354641623e-05, "loss": 0.009, "step": 612490 }, { "epoch": 1.59, "learning_rate": 6.184674724779084e-05, "loss": 0.012, "step": 612500 }, { "epoch": 1.59, "learning_rate": 6.184285903141937e-05, "loss": 0.0099, "step": 612510 }, { "epoch": 1.59, "learning_rate": 6.183897081504791e-05, "loss": 0.0106, "step": 612520 }, { "epoch": 1.59, "learning_rate": 6.183508259867644e-05, "loss": 0.009, "step": 612530 }, { "epoch": 1.59, "learning_rate": 6.183119438230498e-05, "loss": 0.0086, "step": 612540 }, { "epoch": 1.59, "learning_rate": 6.182730616593351e-05, "loss": 0.0094, "step": 612550 }, { "epoch": 1.59, "learning_rate": 6.182341794956205e-05, "loss": 0.0087, "step": 612560 }, { "epoch": 1.59, "learning_rate": 6.18195297331906e-05, "loss": 0.0058, "step": 612570 }, { "epoch": 1.59, "learning_rate": 6.181564151681912e-05, "loss": 0.0101, "step": 612580 }, { "epoch": 1.59, "learning_rate": 6.181175330044766e-05, "loss": 0.0099, "step": 612590 }, { "epoch": 1.59, "learning_rate": 6.180786508407619e-05, "loss": 0.0074, "step": 612600 }, { "epoch": 1.59, "learning_rate": 6.180397686770473e-05, "loss": 0.0088, "step": 612610 }, { "epoch": 1.59, "learning_rate": 6.180008865133326e-05, "loss": 0.0061, "step": 612620 }, { "epoch": 1.59, "learning_rate": 6.17962004349618e-05, "loss": 0.0073, "step": 612630 }, { "epoch": 1.59, "learning_rate": 6.179231221859033e-05, "loss": 0.007, "step": 612640 }, { "epoch": 1.59, "learning_rate": 6.178842400221887e-05, "loss": 0.008, "step": 612650 }, { "epoch": 1.59, "learning_rate": 6.178453578584741e-05, "loss": 0.0075, "step": 612660 }, { "epoch": 1.59, "learning_rate": 6.178064756947594e-05, "loss": 0.0088, "step": 612670 }, { "epoch": 1.59, "learning_rate": 6.177675935310448e-05, "loss": 0.0093, "step": 612680 }, { "epoch": 1.59, "learning_rate": 6.177287113673301e-05, "loss": 0.0071, "step": 612690 }, { "epoch": 1.59, "learning_rate": 6.176898292036154e-05, "loss": 0.0088, "step": 612700 }, { "epoch": 1.59, "learning_rate": 6.176509470399008e-05, "loss": 0.012, "step": 612710 }, { "epoch": 1.59, "learning_rate": 6.176120648761861e-05, "loss": 0.0116, "step": 612720 }, { "epoch": 1.59, "learning_rate": 6.175731827124715e-05, "loss": 0.0076, "step": 612730 }, { "epoch": 1.59, "learning_rate": 6.175343005487568e-05, "loss": 0.0057, "step": 612740 }, { "epoch": 1.59, "learning_rate": 6.174954183850422e-05, "loss": 0.0081, "step": 612750 }, { "epoch": 1.59, "learning_rate": 6.174565362213276e-05, "loss": 0.0091, "step": 612760 }, { "epoch": 1.59, "learning_rate": 6.174176540576129e-05, "loss": 0.008, "step": 612770 }, { "epoch": 1.59, "learning_rate": 6.173787718938983e-05, "loss": 0.014, "step": 612780 }, { "epoch": 1.59, "learning_rate": 6.173398897301836e-05, "loss": 0.0104, "step": 612790 }, { "epoch": 1.59, "learning_rate": 6.17301007566469e-05, "loss": 0.0062, "step": 612800 }, { "epoch": 1.59, "learning_rate": 6.172621254027543e-05, "loss": 0.0081, "step": 612810 }, { "epoch": 1.59, "learning_rate": 6.172232432390397e-05, "loss": 0.0105, "step": 612820 }, { "epoch": 1.59, "learning_rate": 6.171843610753251e-05, "loss": 0.0088, "step": 612830 }, { "epoch": 1.59, "learning_rate": 6.171454789116104e-05, "loss": 0.0114, "step": 612840 }, { "epoch": 1.59, "learning_rate": 6.171065967478958e-05, "loss": 0.0074, "step": 612850 }, { "epoch": 1.59, "learning_rate": 6.170677145841811e-05, "loss": 0.0075, "step": 612860 }, { "epoch": 1.59, "learning_rate": 6.170288324204665e-05, "loss": 0.0071, "step": 612870 }, { "epoch": 1.59, "learning_rate": 6.169899502567518e-05, "loss": 0.0063, "step": 612880 }, { "epoch": 1.59, "learning_rate": 6.169510680930372e-05, "loss": 0.0077, "step": 612890 }, { "epoch": 1.59, "learning_rate": 6.169121859293225e-05, "loss": 0.008, "step": 612900 }, { "epoch": 1.59, "learning_rate": 6.168733037656079e-05, "loss": 0.0101, "step": 612910 }, { "epoch": 1.59, "learning_rate": 6.168344216018933e-05, "loss": 0.0094, "step": 612920 }, { "epoch": 1.59, "learning_rate": 6.167955394381786e-05, "loss": 0.009, "step": 612930 }, { "epoch": 1.59, "learning_rate": 6.16756657274464e-05, "loss": 0.0103, "step": 612940 }, { "epoch": 1.59, "learning_rate": 6.167177751107493e-05, "loss": 0.0084, "step": 612950 }, { "epoch": 1.59, "learning_rate": 6.166788929470346e-05, "loss": 0.01, "step": 612960 }, { "epoch": 1.59, "learning_rate": 6.1664001078332e-05, "loss": 0.0084, "step": 612970 }, { "epoch": 1.59, "learning_rate": 6.166011286196053e-05, "loss": 0.012, "step": 612980 }, { "epoch": 1.59, "learning_rate": 6.165622464558907e-05, "loss": 0.007, "step": 612990 }, { "epoch": 1.59, "learning_rate": 6.16523364292176e-05, "loss": 0.007, "step": 613000 }, { "epoch": 1.59, "eval_cer": 0.8816774928583525, "eval_loss": 0.005634871311485767, "eval_runtime": 107.6649, "eval_samples_per_second": 18.576, "eval_steps_per_second": 4.644, "step": 613000 }, { "epoch": 1.59, "learning_rate": 6.164844821284614e-05, "loss": 0.0105, "step": 613010 }, { "epoch": 1.59, "learning_rate": 6.164455999647468e-05, "loss": 0.009, "step": 613020 }, { "epoch": 1.59, "learning_rate": 6.164067178010321e-05, "loss": 0.0083, "step": 613030 }, { "epoch": 1.59, "learning_rate": 6.163678356373175e-05, "loss": 0.011, "step": 613040 }, { "epoch": 1.59, "learning_rate": 6.163289534736028e-05, "loss": 0.0064, "step": 613050 }, { "epoch": 1.59, "learning_rate": 6.162900713098882e-05, "loss": 0.0091, "step": 613060 }, { "epoch": 1.59, "learning_rate": 6.162511891461735e-05, "loss": 0.0101, "step": 613070 }, { "epoch": 1.59, "learning_rate": 6.162123069824589e-05, "loss": 0.009, "step": 613080 }, { "epoch": 1.59, "learning_rate": 6.161734248187442e-05, "loss": 0.0073, "step": 613090 }, { "epoch": 1.59, "learning_rate": 6.161345426550296e-05, "loss": 0.008, "step": 613100 }, { "epoch": 1.59, "learning_rate": 6.16095660491315e-05, "loss": 0.0082, "step": 613110 }, { "epoch": 1.59, "learning_rate": 6.160567783276003e-05, "loss": 0.0091, "step": 613120 }, { "epoch": 1.59, "learning_rate": 6.160178961638857e-05, "loss": 0.0062, "step": 613130 }, { "epoch": 1.59, "learning_rate": 6.15979014000171e-05, "loss": 0.0068, "step": 613140 }, { "epoch": 1.59, "learning_rate": 6.159401318364564e-05, "loss": 0.0103, "step": 613150 }, { "epoch": 1.59, "learning_rate": 6.159012496727417e-05, "loss": 0.0078, "step": 613160 }, { "epoch": 1.59, "learning_rate": 6.158623675090271e-05, "loss": 0.0053, "step": 613170 }, { "epoch": 1.59, "learning_rate": 6.158234853453125e-05, "loss": 0.0098, "step": 613180 }, { "epoch": 1.59, "learning_rate": 6.157846031815978e-05, "loss": 0.0104, "step": 613190 }, { "epoch": 1.59, "learning_rate": 6.157457210178831e-05, "loss": 0.0099, "step": 613200 }, { "epoch": 1.59, "learning_rate": 6.157068388541685e-05, "loss": 0.0092, "step": 613210 }, { "epoch": 1.59, "learning_rate": 6.156679566904538e-05, "loss": 0.0081, "step": 613220 }, { "epoch": 1.59, "learning_rate": 6.156290745267392e-05, "loss": 0.0067, "step": 613230 }, { "epoch": 1.59, "learning_rate": 6.155901923630245e-05, "loss": 0.0151, "step": 613240 }, { "epoch": 1.59, "learning_rate": 6.155513101993099e-05, "loss": 0.011, "step": 613250 }, { "epoch": 1.59, "learning_rate": 6.155124280355952e-05, "loss": 0.0072, "step": 613260 }, { "epoch": 1.59, "learning_rate": 6.154735458718806e-05, "loss": 0.0106, "step": 613270 }, { "epoch": 1.59, "learning_rate": 6.15434663708166e-05, "loss": 0.0071, "step": 613280 }, { "epoch": 1.59, "learning_rate": 6.153957815444513e-05, "loss": 0.0106, "step": 613290 }, { "epoch": 1.59, "learning_rate": 6.153568993807367e-05, "loss": 0.0097, "step": 613300 }, { "epoch": 1.59, "learning_rate": 6.15318017217022e-05, "loss": 0.0076, "step": 613310 }, { "epoch": 1.59, "learning_rate": 6.152791350533074e-05, "loss": 0.0089, "step": 613320 }, { "epoch": 1.59, "learning_rate": 6.152402528895927e-05, "loss": 0.0075, "step": 613330 }, { "epoch": 1.59, "learning_rate": 6.152013707258781e-05, "loss": 0.0086, "step": 613340 }, { "epoch": 1.59, "learning_rate": 6.151624885621634e-05, "loss": 0.009, "step": 613350 }, { "epoch": 1.59, "learning_rate": 6.151236063984488e-05, "loss": 0.0087, "step": 613360 }, { "epoch": 1.59, "learning_rate": 6.150847242347342e-05, "loss": 0.0066, "step": 613370 }, { "epoch": 1.59, "learning_rate": 6.150458420710195e-05, "loss": 0.0069, "step": 613380 }, { "epoch": 1.59, "learning_rate": 6.150069599073049e-05, "loss": 0.009, "step": 613390 }, { "epoch": 1.59, "learning_rate": 6.149680777435902e-05, "loss": 0.0073, "step": 613400 }, { "epoch": 1.59, "learning_rate": 6.149291955798756e-05, "loss": 0.0087, "step": 613410 }, { "epoch": 1.59, "learning_rate": 6.148903134161609e-05, "loss": 0.0078, "step": 613420 }, { "epoch": 1.59, "learning_rate": 6.148514312524463e-05, "loss": 0.0061, "step": 613430 }, { "epoch": 1.59, "learning_rate": 6.148125490887317e-05, "loss": 0.0083, "step": 613440 }, { "epoch": 1.59, "learning_rate": 6.147736669250169e-05, "loss": 0.0068, "step": 613450 }, { "epoch": 1.59, "learning_rate": 6.147347847613023e-05, "loss": 0.009, "step": 613460 }, { "epoch": 1.59, "learning_rate": 6.146959025975877e-05, "loss": 0.007, "step": 613470 }, { "epoch": 1.59, "learning_rate": 6.14657020433873e-05, "loss": 0.0053, "step": 613480 }, { "epoch": 1.59, "learning_rate": 6.146181382701584e-05, "loss": 0.0077, "step": 613490 }, { "epoch": 1.59, "learning_rate": 6.145792561064437e-05, "loss": 0.0061, "step": 613500 }, { "epoch": 1.59, "learning_rate": 6.145403739427291e-05, "loss": 0.0091, "step": 613510 }, { "epoch": 1.59, "learning_rate": 6.145014917790144e-05, "loss": 0.0097, "step": 613520 }, { "epoch": 1.59, "learning_rate": 6.144626096152998e-05, "loss": 0.009, "step": 613530 }, { "epoch": 1.59, "learning_rate": 6.144237274515852e-05, "loss": 0.0067, "step": 613540 }, { "epoch": 1.59, "learning_rate": 6.143848452878705e-05, "loss": 0.0084, "step": 613550 }, { "epoch": 1.59, "learning_rate": 6.143459631241559e-05, "loss": 0.0114, "step": 613560 }, { "epoch": 1.59, "learning_rate": 6.143070809604412e-05, "loss": 0.0098, "step": 613570 }, { "epoch": 1.59, "learning_rate": 6.142681987967266e-05, "loss": 0.0088, "step": 613580 }, { "epoch": 1.59, "learning_rate": 6.142293166330119e-05, "loss": 0.0093, "step": 613590 }, { "epoch": 1.59, "learning_rate": 6.141904344692973e-05, "loss": 0.0065, "step": 613600 }, { "epoch": 1.59, "learning_rate": 6.141515523055826e-05, "loss": 0.0072, "step": 613610 }, { "epoch": 1.59, "learning_rate": 6.14112670141868e-05, "loss": 0.0084, "step": 613620 }, { "epoch": 1.59, "learning_rate": 6.140737879781534e-05, "loss": 0.0122, "step": 613630 }, { "epoch": 1.59, "learning_rate": 6.140349058144387e-05, "loss": 0.0079, "step": 613640 }, { "epoch": 1.59, "learning_rate": 6.139960236507241e-05, "loss": 0.0081, "step": 613650 }, { "epoch": 1.59, "learning_rate": 6.139571414870094e-05, "loss": 0.0095, "step": 613660 }, { "epoch": 1.59, "learning_rate": 6.139182593232948e-05, "loss": 0.009, "step": 613670 }, { "epoch": 1.59, "learning_rate": 6.138793771595801e-05, "loss": 0.008, "step": 613680 }, { "epoch": 1.59, "learning_rate": 6.138404949958655e-05, "loss": 0.009, "step": 613690 }, { "epoch": 1.59, "learning_rate": 6.138016128321508e-05, "loss": 0.0077, "step": 613700 }, { "epoch": 1.59, "learning_rate": 6.137627306684361e-05, "loss": 0.0079, "step": 613710 }, { "epoch": 1.59, "learning_rate": 6.137238485047215e-05, "loss": 0.006, "step": 613720 }, { "epoch": 1.59, "learning_rate": 6.136849663410069e-05, "loss": 0.0101, "step": 613730 }, { "epoch": 1.59, "learning_rate": 6.136460841772922e-05, "loss": 0.0102, "step": 613740 }, { "epoch": 1.59, "learning_rate": 6.136072020135776e-05, "loss": 0.0083, "step": 613750 }, { "epoch": 1.59, "learning_rate": 6.135683198498629e-05, "loss": 0.0115, "step": 613760 }, { "epoch": 1.59, "learning_rate": 6.135294376861483e-05, "loss": 0.0085, "step": 613770 }, { "epoch": 1.59, "learning_rate": 6.134905555224336e-05, "loss": 0.0094, "step": 613780 }, { "epoch": 1.59, "learning_rate": 6.13451673358719e-05, "loss": 0.0071, "step": 613790 }, { "epoch": 1.59, "learning_rate": 6.134127911950044e-05, "loss": 0.0083, "step": 613800 }, { "epoch": 1.59, "learning_rate": 6.133739090312897e-05, "loss": 0.0094, "step": 613810 }, { "epoch": 1.59, "learning_rate": 6.133350268675751e-05, "loss": 0.0086, "step": 613820 }, { "epoch": 1.59, "learning_rate": 6.132961447038604e-05, "loss": 0.0086, "step": 613830 }, { "epoch": 1.59, "learning_rate": 6.132572625401458e-05, "loss": 0.0083, "step": 613840 }, { "epoch": 1.59, "learning_rate": 6.132183803764311e-05, "loss": 0.0097, "step": 613850 }, { "epoch": 1.59, "learning_rate": 6.131794982127165e-05, "loss": 0.0088, "step": 613860 }, { "epoch": 1.59, "learning_rate": 6.131406160490018e-05, "loss": 0.0074, "step": 613870 }, { "epoch": 1.59, "learning_rate": 6.131017338852872e-05, "loss": 0.0073, "step": 613880 }, { "epoch": 1.59, "learning_rate": 6.130628517215726e-05, "loss": 0.009, "step": 613890 }, { "epoch": 1.59, "learning_rate": 6.130239695578579e-05, "loss": 0.0102, "step": 613900 }, { "epoch": 1.59, "learning_rate": 6.129850873941433e-05, "loss": 0.009, "step": 613910 }, { "epoch": 1.59, "learning_rate": 6.129462052304286e-05, "loss": 0.0085, "step": 613920 }, { "epoch": 1.59, "learning_rate": 6.12907323066714e-05, "loss": 0.0079, "step": 613930 }, { "epoch": 1.59, "learning_rate": 6.128684409029993e-05, "loss": 0.0121, "step": 613940 }, { "epoch": 1.59, "learning_rate": 6.128295587392846e-05, "loss": 0.0083, "step": 613950 }, { "epoch": 1.59, "learning_rate": 6.1279067657557e-05, "loss": 0.0103, "step": 613960 }, { "epoch": 1.59, "learning_rate": 6.127517944118553e-05, "loss": 0.0076, "step": 613970 }, { "epoch": 1.59, "learning_rate": 6.127129122481407e-05, "loss": 0.0086, "step": 613980 }, { "epoch": 1.59, "learning_rate": 6.126740300844261e-05, "loss": 0.0134, "step": 613990 }, { "epoch": 1.59, "learning_rate": 6.126351479207114e-05, "loss": 0.0076, "step": 614000 }, { "epoch": 1.59, "eval_cer": 0.8816704946736816, "eval_loss": 0.005931103602051735, "eval_runtime": 107.8086, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 614000 }, { "epoch": 1.59, "learning_rate": 6.125962657569968e-05, "loss": 0.0103, "step": 614010 }, { "epoch": 1.59, "learning_rate": 6.125573835932821e-05, "loss": 0.0106, "step": 614020 }, { "epoch": 1.59, "learning_rate": 6.125185014295675e-05, "loss": 0.0114, "step": 614030 }, { "epoch": 1.59, "learning_rate": 6.124796192658528e-05, "loss": 0.0078, "step": 614040 }, { "epoch": 1.59, "learning_rate": 6.124407371021382e-05, "loss": 0.0077, "step": 614050 }, { "epoch": 1.59, "learning_rate": 6.124018549384236e-05, "loss": 0.0098, "step": 614060 }, { "epoch": 1.59, "learning_rate": 6.123629727747089e-05, "loss": 0.0072, "step": 614070 }, { "epoch": 1.59, "learning_rate": 6.123240906109943e-05, "loss": 0.0098, "step": 614080 }, { "epoch": 1.59, "learning_rate": 6.122852084472796e-05, "loss": 0.0097, "step": 614090 }, { "epoch": 1.59, "learning_rate": 6.12246326283565e-05, "loss": 0.0079, "step": 614100 }, { "epoch": 1.59, "learning_rate": 6.122074441198503e-05, "loss": 0.0093, "step": 614110 }, { "epoch": 1.59, "learning_rate": 6.121685619561357e-05, "loss": 0.0078, "step": 614120 }, { "epoch": 1.59, "learning_rate": 6.12129679792421e-05, "loss": 0.0077, "step": 614130 }, { "epoch": 1.59, "learning_rate": 6.120907976287064e-05, "loss": 0.0096, "step": 614140 }, { "epoch": 1.59, "learning_rate": 6.120519154649918e-05, "loss": 0.0106, "step": 614150 }, { "epoch": 1.59, "learning_rate": 6.120130333012771e-05, "loss": 0.0078, "step": 614160 }, { "epoch": 1.59, "learning_rate": 6.119741511375625e-05, "loss": 0.0093, "step": 614170 }, { "epoch": 1.59, "learning_rate": 6.119352689738478e-05, "loss": 0.0077, "step": 614180 }, { "epoch": 1.59, "learning_rate": 6.118963868101331e-05, "loss": 0.0069, "step": 614190 }, { "epoch": 1.59, "learning_rate": 6.118575046464185e-05, "loss": 0.0099, "step": 614200 }, { "epoch": 1.59, "learning_rate": 6.118186224827038e-05, "loss": 0.0117, "step": 614210 }, { "epoch": 1.59, "learning_rate": 6.117797403189892e-05, "loss": 0.0098, "step": 614220 }, { "epoch": 1.59, "learning_rate": 6.117408581552745e-05, "loss": 0.0094, "step": 614230 }, { "epoch": 1.59, "learning_rate": 6.117019759915599e-05, "loss": 0.0108, "step": 614240 }, { "epoch": 1.59, "learning_rate": 6.116630938278453e-05, "loss": 0.0068, "step": 614250 }, { "epoch": 1.59, "learning_rate": 6.116242116641306e-05, "loss": 0.0085, "step": 614260 }, { "epoch": 1.59, "learning_rate": 6.11585329500416e-05, "loss": 0.0095, "step": 614270 }, { "epoch": 1.59, "learning_rate": 6.115464473367013e-05, "loss": 0.0077, "step": 614280 }, { "epoch": 1.59, "learning_rate": 6.115075651729867e-05, "loss": 0.0062, "step": 614290 }, { "epoch": 1.59, "learning_rate": 6.11468683009272e-05, "loss": 0.0064, "step": 614300 }, { "epoch": 1.59, "learning_rate": 6.114298008455574e-05, "loss": 0.0068, "step": 614310 }, { "epoch": 1.59, "learning_rate": 6.113909186818428e-05, "loss": 0.0117, "step": 614320 }, { "epoch": 1.59, "learning_rate": 6.113520365181281e-05, "loss": 0.0107, "step": 614330 }, { "epoch": 1.59, "learning_rate": 6.113131543544135e-05, "loss": 0.0084, "step": 614340 }, { "epoch": 1.59, "learning_rate": 6.112742721906988e-05, "loss": 0.0123, "step": 614350 }, { "epoch": 1.59, "learning_rate": 6.112353900269842e-05, "loss": 0.0085, "step": 614360 }, { "epoch": 1.59, "learning_rate": 6.111965078632695e-05, "loss": 0.0066, "step": 614370 }, { "epoch": 1.59, "learning_rate": 6.111576256995549e-05, "loss": 0.0102, "step": 614380 }, { "epoch": 1.59, "learning_rate": 6.111187435358402e-05, "loss": 0.0122, "step": 614390 }, { "epoch": 1.59, "learning_rate": 6.110798613721256e-05, "loss": 0.0078, "step": 614400 }, { "epoch": 1.59, "learning_rate": 6.11040979208411e-05, "loss": 0.0114, "step": 614410 }, { "epoch": 1.59, "learning_rate": 6.110020970446963e-05, "loss": 0.0114, "step": 614420 }, { "epoch": 1.59, "learning_rate": 6.109632148809817e-05, "loss": 0.008, "step": 614430 }, { "epoch": 1.59, "learning_rate": 6.10924332717267e-05, "loss": 0.0075, "step": 614440 }, { "epoch": 1.59, "learning_rate": 6.108854505535523e-05, "loss": 0.0079, "step": 614450 }, { "epoch": 1.59, "learning_rate": 6.108465683898377e-05, "loss": 0.0096, "step": 614460 }, { "epoch": 1.59, "learning_rate": 6.10807686226123e-05, "loss": 0.0088, "step": 614470 }, { "epoch": 1.59, "learning_rate": 6.107688040624084e-05, "loss": 0.0077, "step": 614480 }, { "epoch": 1.59, "learning_rate": 6.107299218986937e-05, "loss": 0.0087, "step": 614490 }, { "epoch": 1.59, "learning_rate": 6.106910397349791e-05, "loss": 0.0086, "step": 614500 }, { "epoch": 1.59, "learning_rate": 6.106521575712645e-05, "loss": 0.0063, "step": 614510 }, { "epoch": 1.59, "learning_rate": 6.106132754075498e-05, "loss": 0.0071, "step": 614520 }, { "epoch": 1.59, "learning_rate": 6.105743932438352e-05, "loss": 0.01, "step": 614530 }, { "epoch": 1.59, "learning_rate": 6.105355110801205e-05, "loss": 0.0073, "step": 614540 }, { "epoch": 1.59, "learning_rate": 6.104966289164059e-05, "loss": 0.0057, "step": 614550 }, { "epoch": 1.59, "learning_rate": 6.104577467526912e-05, "loss": 0.0092, "step": 614560 }, { "epoch": 1.59, "learning_rate": 6.104188645889766e-05, "loss": 0.0073, "step": 614570 }, { "epoch": 1.59, "learning_rate": 6.103799824252619e-05, "loss": 0.008, "step": 614580 }, { "epoch": 1.59, "learning_rate": 6.103411002615473e-05, "loss": 0.0098, "step": 614590 }, { "epoch": 1.59, "learning_rate": 6.1030221809783265e-05, "loss": 0.0099, "step": 614600 }, { "epoch": 1.59, "learning_rate": 6.10263335934118e-05, "loss": 0.0106, "step": 614610 }, { "epoch": 1.59, "learning_rate": 6.1022445377040335e-05, "loss": 0.0082, "step": 614620 }, { "epoch": 1.59, "learning_rate": 6.101855716066888e-05, "loss": 0.0092, "step": 614630 }, { "epoch": 1.59, "learning_rate": 6.101466894429741e-05, "loss": 0.0119, "step": 614640 }, { "epoch": 1.59, "learning_rate": 6.1010780727925946e-05, "loss": 0.0078, "step": 614650 }, { "epoch": 1.59, "learning_rate": 6.100689251155448e-05, "loss": 0.0062, "step": 614660 }, { "epoch": 1.59, "learning_rate": 6.1003004295183016e-05, "loss": 0.0072, "step": 614670 }, { "epoch": 1.59, "learning_rate": 6.099911607881155e-05, "loss": 0.0082, "step": 614680 }, { "epoch": 1.59, "learning_rate": 6.099522786244008e-05, "loss": 0.0071, "step": 614690 }, { "epoch": 1.59, "learning_rate": 6.0991339646068614e-05, "loss": 0.01, "step": 614700 }, { "epoch": 1.59, "learning_rate": 6.098745142969715e-05, "loss": 0.0099, "step": 614710 }, { "epoch": 1.59, "learning_rate": 6.0983563213325684e-05, "loss": 0.0071, "step": 614720 }, { "epoch": 1.59, "learning_rate": 6.0979674996954225e-05, "loss": 0.008, "step": 614730 }, { "epoch": 1.59, "learning_rate": 6.097578678058276e-05, "loss": 0.01, "step": 614740 }, { "epoch": 1.59, "learning_rate": 6.0971898564211295e-05, "loss": 0.0061, "step": 614750 }, { "epoch": 1.59, "learning_rate": 6.096801034783983e-05, "loss": 0.0093, "step": 614760 }, { "epoch": 1.59, "learning_rate": 6.0964122131468365e-05, "loss": 0.0079, "step": 614770 }, { "epoch": 1.59, "learning_rate": 6.09602339150969e-05, "loss": 0.0086, "step": 614780 }, { "epoch": 1.59, "learning_rate": 6.0956345698725434e-05, "loss": 0.0074, "step": 614790 }, { "epoch": 1.59, "learning_rate": 6.095245748235397e-05, "loss": 0.0099, "step": 614800 }, { "epoch": 1.59, "learning_rate": 6.094856926598251e-05, "loss": 0.007, "step": 614810 }, { "epoch": 1.59, "learning_rate": 6.0944681049611046e-05, "loss": 0.0092, "step": 614820 }, { "epoch": 1.59, "learning_rate": 6.094079283323958e-05, "loss": 0.0077, "step": 614830 }, { "epoch": 1.59, "learning_rate": 6.0936904616868116e-05, "loss": 0.0094, "step": 614840 }, { "epoch": 1.59, "learning_rate": 6.093301640049665e-05, "loss": 0.0082, "step": 614850 }, { "epoch": 1.59, "learning_rate": 6.0929128184125185e-05, "loss": 0.0089, "step": 614860 }, { "epoch": 1.59, "learning_rate": 6.092523996775372e-05, "loss": 0.007, "step": 614870 }, { "epoch": 1.59, "learning_rate": 6.0921351751382255e-05, "loss": 0.0066, "step": 614880 }, { "epoch": 1.59, "learning_rate": 6.0917463535010797e-05, "loss": 0.0063, "step": 614890 }, { "epoch": 1.59, "learning_rate": 6.091357531863933e-05, "loss": 0.0097, "step": 614900 }, { "epoch": 1.59, "learning_rate": 6.0909687102267866e-05, "loss": 0.0083, "step": 614910 }, { "epoch": 1.59, "learning_rate": 6.09057988858964e-05, "loss": 0.009, "step": 614920 }, { "epoch": 1.59, "learning_rate": 6.0901910669524936e-05, "loss": 0.0089, "step": 614930 }, { "epoch": 1.59, "learning_rate": 6.0898022453153464e-05, "loss": 0.0085, "step": 614940 }, { "epoch": 1.59, "learning_rate": 6.0894134236782e-05, "loss": 0.006, "step": 614950 }, { "epoch": 1.59, "learning_rate": 6.0890246020410534e-05, "loss": 0.01, "step": 614960 }, { "epoch": 1.59, "learning_rate": 6.088635780403907e-05, "loss": 0.0076, "step": 614970 }, { "epoch": 1.59, "learning_rate": 6.0882469587667604e-05, "loss": 0.0088, "step": 614980 }, { "epoch": 1.59, "learning_rate": 6.0878581371296145e-05, "loss": 0.0089, "step": 614990 }, { "epoch": 1.59, "learning_rate": 6.087469315492468e-05, "loss": 0.0113, "step": 615000 }, { "epoch": 1.59, "eval_cer": 0.8816998870492994, "eval_loss": 0.005477694794535637, "eval_runtime": 107.7529, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 615000 }, { "epoch": 1.59, "learning_rate": 6.0870804938553215e-05, "loss": 0.0063, "step": 615010 }, { "epoch": 1.59, "learning_rate": 6.086691672218175e-05, "loss": 0.0062, "step": 615020 }, { "epoch": 1.59, "learning_rate": 6.0863028505810285e-05, "loss": 0.0091, "step": 615030 }, { "epoch": 1.59, "learning_rate": 6.085914028943882e-05, "loss": 0.0098, "step": 615040 }, { "epoch": 1.59, "learning_rate": 6.0855252073067354e-05, "loss": 0.008, "step": 615050 }, { "epoch": 1.59, "learning_rate": 6.085136385669589e-05, "loss": 0.0072, "step": 615060 }, { "epoch": 1.59, "learning_rate": 6.084747564032443e-05, "loss": 0.0098, "step": 615070 }, { "epoch": 1.59, "learning_rate": 6.0843587423952966e-05, "loss": 0.011, "step": 615080 }, { "epoch": 1.59, "learning_rate": 6.08396992075815e-05, "loss": 0.0052, "step": 615090 }, { "epoch": 1.59, "learning_rate": 6.0835810991210035e-05, "loss": 0.0065, "step": 615100 }, { "epoch": 1.59, "learning_rate": 6.083192277483857e-05, "loss": 0.0088, "step": 615110 }, { "epoch": 1.59, "learning_rate": 6.0828034558467105e-05, "loss": 0.0105, "step": 615120 }, { "epoch": 1.59, "learning_rate": 6.082414634209564e-05, "loss": 0.0106, "step": 615130 }, { "epoch": 1.59, "learning_rate": 6.0820258125724175e-05, "loss": 0.0065, "step": 615140 }, { "epoch": 1.59, "learning_rate": 6.0816369909352717e-05, "loss": 0.0066, "step": 615150 }, { "epoch": 1.59, "learning_rate": 6.081248169298125e-05, "loss": 0.0093, "step": 615160 }, { "epoch": 1.59, "learning_rate": 6.0808593476609786e-05, "loss": 0.0078, "step": 615170 }, { "epoch": 1.59, "learning_rate": 6.080470526023832e-05, "loss": 0.0065, "step": 615180 }, { "epoch": 1.59, "learning_rate": 6.080081704386685e-05, "loss": 0.0079, "step": 615190 }, { "epoch": 1.59, "learning_rate": 6.0796928827495384e-05, "loss": 0.0088, "step": 615200 }, { "epoch": 1.59, "learning_rate": 6.079304061112392e-05, "loss": 0.0069, "step": 615210 }, { "epoch": 1.59, "learning_rate": 6.0789152394752454e-05, "loss": 0.0065, "step": 615220 }, { "epoch": 1.59, "learning_rate": 6.078526417838099e-05, "loss": 0.0085, "step": 615230 }, { "epoch": 1.59, "learning_rate": 6.0781375962009524e-05, "loss": 0.0074, "step": 615240 }, { "epoch": 1.59, "learning_rate": 6.0777487745638065e-05, "loss": 0.0092, "step": 615250 }, { "epoch": 1.59, "learning_rate": 6.07735995292666e-05, "loss": 0.01, "step": 615260 }, { "epoch": 1.59, "learning_rate": 6.0769711312895135e-05, "loss": 0.0086, "step": 615270 }, { "epoch": 1.59, "learning_rate": 6.076582309652367e-05, "loss": 0.0072, "step": 615280 }, { "epoch": 1.59, "learning_rate": 6.0761934880152205e-05, "loss": 0.0087, "step": 615290 }, { "epoch": 1.59, "learning_rate": 6.075804666378074e-05, "loss": 0.0074, "step": 615300 }, { "epoch": 1.59, "learning_rate": 6.0754158447409274e-05, "loss": 0.0066, "step": 615310 }, { "epoch": 1.59, "learning_rate": 6.075027023103781e-05, "loss": 0.0087, "step": 615320 }, { "epoch": 1.6, "learning_rate": 6.074638201466635e-05, "loss": 0.0086, "step": 615330 }, { "epoch": 1.6, "learning_rate": 6.0742493798294886e-05, "loss": 0.0074, "step": 615340 }, { "epoch": 1.6, "learning_rate": 6.073860558192342e-05, "loss": 0.0052, "step": 615350 }, { "epoch": 1.6, "learning_rate": 6.0734717365551955e-05, "loss": 0.0111, "step": 615360 }, { "epoch": 1.6, "learning_rate": 6.073082914918049e-05, "loss": 0.008, "step": 615370 }, { "epoch": 1.6, "learning_rate": 6.0726940932809025e-05, "loss": 0.0087, "step": 615380 }, { "epoch": 1.6, "learning_rate": 6.072305271643756e-05, "loss": 0.0076, "step": 615390 }, { "epoch": 1.6, "learning_rate": 6.0719164500066095e-05, "loss": 0.0098, "step": 615400 }, { "epoch": 1.6, "learning_rate": 6.0715276283694637e-05, "loss": 0.0078, "step": 615410 }, { "epoch": 1.6, "learning_rate": 6.071138806732317e-05, "loss": 0.0088, "step": 615420 }, { "epoch": 1.6, "learning_rate": 6.07074998509517e-05, "loss": 0.0083, "step": 615430 }, { "epoch": 1.6, "learning_rate": 6.0703611634580234e-05, "loss": 0.0088, "step": 615440 }, { "epoch": 1.6, "learning_rate": 6.069972341820877e-05, "loss": 0.0092, "step": 615450 }, { "epoch": 1.6, "learning_rate": 6.0695835201837304e-05, "loss": 0.0086, "step": 615460 }, { "epoch": 1.6, "learning_rate": 6.069194698546584e-05, "loss": 0.0081, "step": 615470 }, { "epoch": 1.6, "learning_rate": 6.0688058769094374e-05, "loss": 0.0061, "step": 615480 }, { "epoch": 1.6, "learning_rate": 6.068417055272291e-05, "loss": 0.0073, "step": 615490 }, { "epoch": 1.6, "learning_rate": 6.0680282336351443e-05, "loss": 0.0115, "step": 615500 }, { "epoch": 1.6, "learning_rate": 6.0676394119979985e-05, "loss": 0.0085, "step": 615510 }, { "epoch": 1.6, "learning_rate": 6.067250590360852e-05, "loss": 0.0094, "step": 615520 }, { "epoch": 1.6, "learning_rate": 6.0668617687237055e-05, "loss": 0.007, "step": 615530 }, { "epoch": 1.6, "learning_rate": 6.066472947086559e-05, "loss": 0.0063, "step": 615540 }, { "epoch": 1.6, "learning_rate": 6.0660841254494125e-05, "loss": 0.0104, "step": 615550 }, { "epoch": 1.6, "learning_rate": 6.065695303812266e-05, "loss": 0.0089, "step": 615560 }, { "epoch": 1.6, "learning_rate": 6.0653064821751194e-05, "loss": 0.0068, "step": 615570 }, { "epoch": 1.6, "learning_rate": 6.064917660537973e-05, "loss": 0.0073, "step": 615580 }, { "epoch": 1.6, "learning_rate": 6.064528838900827e-05, "loss": 0.0061, "step": 615590 }, { "epoch": 1.6, "learning_rate": 6.0641400172636806e-05, "loss": 0.0087, "step": 615600 }, { "epoch": 1.6, "learning_rate": 6.063751195626534e-05, "loss": 0.0094, "step": 615610 }, { "epoch": 1.6, "learning_rate": 6.0633623739893875e-05, "loss": 0.0099, "step": 615620 }, { "epoch": 1.6, "learning_rate": 6.062973552352241e-05, "loss": 0.0093, "step": 615630 }, { "epoch": 1.6, "learning_rate": 6.0625847307150945e-05, "loss": 0.0075, "step": 615640 }, { "epoch": 1.6, "learning_rate": 6.062195909077948e-05, "loss": 0.0108, "step": 615650 }, { "epoch": 1.6, "learning_rate": 6.0618070874408015e-05, "loss": 0.0081, "step": 615660 }, { "epoch": 1.6, "learning_rate": 6.061418265803655e-05, "loss": 0.0099, "step": 615670 }, { "epoch": 1.6, "learning_rate": 6.061029444166508e-05, "loss": 0.0074, "step": 615680 }, { "epoch": 1.6, "learning_rate": 6.060640622529362e-05, "loss": 0.0049, "step": 615690 }, { "epoch": 1.6, "learning_rate": 6.0602518008922154e-05, "loss": 0.0095, "step": 615700 }, { "epoch": 1.6, "learning_rate": 6.059862979255069e-05, "loss": 0.009, "step": 615710 }, { "epoch": 1.6, "learning_rate": 6.0594741576179224e-05, "loss": 0.0054, "step": 615720 }, { "epoch": 1.6, "learning_rate": 6.059085335980776e-05, "loss": 0.0083, "step": 615730 }, { "epoch": 1.6, "learning_rate": 6.0586965143436294e-05, "loss": 0.0097, "step": 615740 }, { "epoch": 1.6, "learning_rate": 6.058307692706483e-05, "loss": 0.0113, "step": 615750 }, { "epoch": 1.6, "learning_rate": 6.0579188710693363e-05, "loss": 0.0083, "step": 615760 }, { "epoch": 1.6, "learning_rate": 6.0575300494321905e-05, "loss": 0.0096, "step": 615770 }, { "epoch": 1.6, "learning_rate": 6.057141227795044e-05, "loss": 0.0096, "step": 615780 }, { "epoch": 1.6, "learning_rate": 6.0567524061578975e-05, "loss": 0.0079, "step": 615790 }, { "epoch": 1.6, "learning_rate": 6.056363584520751e-05, "loss": 0.0086, "step": 615800 }, { "epoch": 1.6, "learning_rate": 6.0559747628836045e-05, "loss": 0.0103, "step": 615810 }, { "epoch": 1.6, "learning_rate": 6.055585941246458e-05, "loss": 0.0109, "step": 615820 }, { "epoch": 1.6, "learning_rate": 6.0551971196093114e-05, "loss": 0.0074, "step": 615830 }, { "epoch": 1.6, "learning_rate": 6.054808297972165e-05, "loss": 0.0094, "step": 615840 }, { "epoch": 1.6, "learning_rate": 6.0544194763350184e-05, "loss": 0.0105, "step": 615850 }, { "epoch": 1.6, "learning_rate": 6.0540306546978726e-05, "loss": 0.0078, "step": 615860 }, { "epoch": 1.6, "learning_rate": 6.053641833060726e-05, "loss": 0.0108, "step": 615870 }, { "epoch": 1.6, "learning_rate": 6.0532530114235795e-05, "loss": 0.0067, "step": 615880 }, { "epoch": 1.6, "learning_rate": 6.052864189786433e-05, "loss": 0.0079, "step": 615890 }, { "epoch": 1.6, "learning_rate": 6.0524753681492865e-05, "loss": 0.008, "step": 615900 }, { "epoch": 1.6, "learning_rate": 6.05208654651214e-05, "loss": 0.0072, "step": 615910 }, { "epoch": 1.6, "learning_rate": 6.0516977248749935e-05, "loss": 0.0078, "step": 615920 }, { "epoch": 1.6, "learning_rate": 6.051308903237846e-05, "loss": 0.0079, "step": 615930 }, { "epoch": 1.6, "learning_rate": 6.0509200816007e-05, "loss": 0.0079, "step": 615940 }, { "epoch": 1.6, "learning_rate": 6.050531259963553e-05, "loss": 0.0113, "step": 615950 }, { "epoch": 1.6, "learning_rate": 6.0501424383264074e-05, "loss": 0.0073, "step": 615960 }, { "epoch": 1.6, "learning_rate": 6.049753616689261e-05, "loss": 0.0085, "step": 615970 }, { "epoch": 1.6, "learning_rate": 6.0493647950521144e-05, "loss": 0.0081, "step": 615980 }, { "epoch": 1.6, "learning_rate": 6.048975973414968e-05, "loss": 0.0078, "step": 615990 }, { "epoch": 1.6, "learning_rate": 6.0485871517778214e-05, "loss": 0.0076, "step": 616000 }, { "epoch": 1.6, "eval_cer": 0.8817124837817071, "eval_loss": 0.005670115817338228, "eval_runtime": 107.9064, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 616000 }, { "epoch": 1.6, "learning_rate": 6.048198330140675e-05, "loss": 0.0088, "step": 616010 }, { "epoch": 1.6, "learning_rate": 6.0478095085035283e-05, "loss": 0.0101, "step": 616020 }, { "epoch": 1.6, "learning_rate": 6.047420686866382e-05, "loss": 0.0117, "step": 616030 }, { "epoch": 1.6, "learning_rate": 6.047031865229236e-05, "loss": 0.0092, "step": 616040 }, { "epoch": 1.6, "learning_rate": 6.0466430435920895e-05, "loss": 0.0069, "step": 616050 }, { "epoch": 1.6, "learning_rate": 6.046254221954943e-05, "loss": 0.0073, "step": 616060 }, { "epoch": 1.6, "learning_rate": 6.0458654003177964e-05, "loss": 0.0078, "step": 616070 }, { "epoch": 1.6, "learning_rate": 6.04547657868065e-05, "loss": 0.0061, "step": 616080 }, { "epoch": 1.6, "learning_rate": 6.0450877570435034e-05, "loss": 0.0103, "step": 616090 }, { "epoch": 1.6, "learning_rate": 6.044698935406357e-05, "loss": 0.0096, "step": 616100 }, { "epoch": 1.6, "learning_rate": 6.0443101137692104e-05, "loss": 0.0094, "step": 616110 }, { "epoch": 1.6, "learning_rate": 6.0439212921320646e-05, "loss": 0.0089, "step": 616120 }, { "epoch": 1.6, "learning_rate": 6.043532470494918e-05, "loss": 0.0084, "step": 616130 }, { "epoch": 1.6, "learning_rate": 6.0431436488577715e-05, "loss": 0.007, "step": 616140 }, { "epoch": 1.6, "learning_rate": 6.042754827220625e-05, "loss": 0.01, "step": 616150 }, { "epoch": 1.6, "learning_rate": 6.0423660055834785e-05, "loss": 0.0065, "step": 616160 }, { "epoch": 1.6, "learning_rate": 6.041977183946332e-05, "loss": 0.0095, "step": 616170 }, { "epoch": 1.6, "learning_rate": 6.041588362309185e-05, "loss": 0.0111, "step": 616180 }, { "epoch": 1.6, "learning_rate": 6.041199540672038e-05, "loss": 0.0068, "step": 616190 }, { "epoch": 1.6, "learning_rate": 6.040810719034892e-05, "loss": 0.0094, "step": 616200 }, { "epoch": 1.6, "learning_rate": 6.040421897397745e-05, "loss": 0.0101, "step": 616210 }, { "epoch": 1.6, "learning_rate": 6.0400330757605994e-05, "loss": 0.0109, "step": 616220 }, { "epoch": 1.6, "learning_rate": 6.039644254123453e-05, "loss": 0.0077, "step": 616230 }, { "epoch": 1.6, "learning_rate": 6.0392554324863064e-05, "loss": 0.0078, "step": 616240 }, { "epoch": 1.6, "learning_rate": 6.03886661084916e-05, "loss": 0.0073, "step": 616250 }, { "epoch": 1.6, "learning_rate": 6.0384777892120134e-05, "loss": 0.0078, "step": 616260 }, { "epoch": 1.6, "learning_rate": 6.038088967574867e-05, "loss": 0.0075, "step": 616270 }, { "epoch": 1.6, "learning_rate": 6.03770014593772e-05, "loss": 0.0061, "step": 616280 }, { "epoch": 1.6, "learning_rate": 6.037311324300574e-05, "loss": 0.0093, "step": 616290 }, { "epoch": 1.6, "learning_rate": 6.036922502663428e-05, "loss": 0.0123, "step": 616300 }, { "epoch": 1.6, "learning_rate": 6.0365336810262815e-05, "loss": 0.0088, "step": 616310 }, { "epoch": 1.6, "learning_rate": 6.036144859389135e-05, "loss": 0.0078, "step": 616320 }, { "epoch": 1.6, "learning_rate": 6.0357560377519884e-05, "loss": 0.0074, "step": 616330 }, { "epoch": 1.6, "learning_rate": 6.035367216114842e-05, "loss": 0.011, "step": 616340 }, { "epoch": 1.6, "learning_rate": 6.0349783944776954e-05, "loss": 0.0108, "step": 616350 }, { "epoch": 1.6, "learning_rate": 6.034589572840549e-05, "loss": 0.0074, "step": 616360 }, { "epoch": 1.6, "learning_rate": 6.0342007512034024e-05, "loss": 0.008, "step": 616370 }, { "epoch": 1.6, "learning_rate": 6.0338119295662566e-05, "loss": 0.0075, "step": 616380 }, { "epoch": 1.6, "learning_rate": 6.03342310792911e-05, "loss": 0.0084, "step": 616390 }, { "epoch": 1.6, "learning_rate": 6.0330342862919635e-05, "loss": 0.0098, "step": 616400 }, { "epoch": 1.6, "learning_rate": 6.032645464654817e-05, "loss": 0.0101, "step": 616410 }, { "epoch": 1.6, "learning_rate": 6.0322566430176705e-05, "loss": 0.0086, "step": 616420 }, { "epoch": 1.6, "learning_rate": 6.031867821380523e-05, "loss": 0.009, "step": 616430 }, { "epoch": 1.6, "learning_rate": 6.031478999743377e-05, "loss": 0.01, "step": 616440 }, { "epoch": 1.6, "learning_rate": 6.03109017810623e-05, "loss": 0.0097, "step": 616450 }, { "epoch": 1.6, "learning_rate": 6.030701356469084e-05, "loss": 0.0109, "step": 616460 }, { "epoch": 1.6, "learning_rate": 6.030312534831937e-05, "loss": 0.0091, "step": 616470 }, { "epoch": 1.6, "learning_rate": 6.0299237131947914e-05, "loss": 0.0078, "step": 616480 }, { "epoch": 1.6, "learning_rate": 6.029534891557645e-05, "loss": 0.0101, "step": 616490 }, { "epoch": 1.6, "learning_rate": 6.0291460699204984e-05, "loss": 0.0109, "step": 616500 }, { "epoch": 1.6, "learning_rate": 6.028757248283352e-05, "loss": 0.0084, "step": 616510 }, { "epoch": 1.6, "learning_rate": 6.0283684266462054e-05, "loss": 0.0109, "step": 616520 }, { "epoch": 1.6, "learning_rate": 6.027979605009059e-05, "loss": 0.0083, "step": 616530 }, { "epoch": 1.6, "learning_rate": 6.027590783371912e-05, "loss": 0.0071, "step": 616540 }, { "epoch": 1.6, "learning_rate": 6.027201961734766e-05, "loss": 0.0109, "step": 616550 }, { "epoch": 1.6, "learning_rate": 6.02681314009762e-05, "loss": 0.0101, "step": 616560 }, { "epoch": 1.6, "learning_rate": 6.0264243184604735e-05, "loss": 0.0083, "step": 616570 }, { "epoch": 1.6, "learning_rate": 6.026035496823327e-05, "loss": 0.0076, "step": 616580 }, { "epoch": 1.6, "learning_rate": 6.0256466751861804e-05, "loss": 0.008, "step": 616590 }, { "epoch": 1.6, "learning_rate": 6.025257853549034e-05, "loss": 0.0107, "step": 616600 }, { "epoch": 1.6, "learning_rate": 6.0248690319118874e-05, "loss": 0.0078, "step": 616610 }, { "epoch": 1.6, "learning_rate": 6.024480210274741e-05, "loss": 0.0076, "step": 616620 }, { "epoch": 1.6, "learning_rate": 6.0240913886375944e-05, "loss": 0.0094, "step": 616630 }, { "epoch": 1.6, "learning_rate": 6.0237025670004485e-05, "loss": 0.0086, "step": 616640 }, { "epoch": 1.6, "learning_rate": 6.023313745363302e-05, "loss": 0.0069, "step": 616650 }, { "epoch": 1.6, "learning_rate": 6.0229249237261555e-05, "loss": 0.0088, "step": 616660 }, { "epoch": 1.6, "learning_rate": 6.022536102089008e-05, "loss": 0.0084, "step": 616670 }, { "epoch": 1.6, "learning_rate": 6.022147280451862e-05, "loss": 0.008, "step": 616680 }, { "epoch": 1.6, "learning_rate": 6.021758458814715e-05, "loss": 0.0092, "step": 616690 }, { "epoch": 1.6, "learning_rate": 6.021369637177569e-05, "loss": 0.0075, "step": 616700 }, { "epoch": 1.6, "learning_rate": 6.020980815540422e-05, "loss": 0.0086, "step": 616710 }, { "epoch": 1.6, "learning_rate": 6.020591993903276e-05, "loss": 0.0063, "step": 616720 }, { "epoch": 1.6, "learning_rate": 6.020203172266129e-05, "loss": 0.0093, "step": 616730 }, { "epoch": 1.6, "learning_rate": 6.0198143506289834e-05, "loss": 0.0119, "step": 616740 }, { "epoch": 1.6, "learning_rate": 6.019425528991837e-05, "loss": 0.0067, "step": 616750 }, { "epoch": 1.6, "learning_rate": 6.0190367073546904e-05, "loss": 0.0097, "step": 616760 }, { "epoch": 1.6, "learning_rate": 6.018647885717544e-05, "loss": 0.007, "step": 616770 }, { "epoch": 1.6, "learning_rate": 6.0182590640803974e-05, "loss": 0.0084, "step": 616780 }, { "epoch": 1.6, "learning_rate": 6.017870242443251e-05, "loss": 0.0105, "step": 616790 }, { "epoch": 1.6, "learning_rate": 6.017481420806104e-05, "loss": 0.0094, "step": 616800 }, { "epoch": 1.6, "learning_rate": 6.017092599168958e-05, "loss": 0.0088, "step": 616810 }, { "epoch": 1.6, "learning_rate": 6.016703777531812e-05, "loss": 0.0092, "step": 616820 }, { "epoch": 1.6, "learning_rate": 6.0163149558946655e-05, "loss": 0.0064, "step": 616830 }, { "epoch": 1.6, "learning_rate": 6.015926134257519e-05, "loss": 0.0075, "step": 616840 }, { "epoch": 1.6, "learning_rate": 6.0155373126203724e-05, "loss": 0.009, "step": 616850 }, { "epoch": 1.6, "learning_rate": 6.015148490983226e-05, "loss": 0.0083, "step": 616860 }, { "epoch": 1.6, "learning_rate": 6.0147596693460794e-05, "loss": 0.0081, "step": 616870 }, { "epoch": 1.6, "learning_rate": 6.014370847708933e-05, "loss": 0.0093, "step": 616880 }, { "epoch": 1.6, "learning_rate": 6.0139820260717864e-05, "loss": 0.008, "step": 616890 }, { "epoch": 1.6, "learning_rate": 6.0135932044346405e-05, "loss": 0.0084, "step": 616900 }, { "epoch": 1.6, "learning_rate": 6.013204382797494e-05, "loss": 0.0085, "step": 616910 }, { "epoch": 1.6, "learning_rate": 6.012815561160347e-05, "loss": 0.0088, "step": 616920 }, { "epoch": 1.6, "learning_rate": 6.0124267395232e-05, "loss": 0.0076, "step": 616930 }, { "epoch": 1.6, "learning_rate": 6.012037917886054e-05, "loss": 0.0061, "step": 616940 }, { "epoch": 1.6, "learning_rate": 6.011649096248907e-05, "loss": 0.0088, "step": 616950 }, { "epoch": 1.6, "learning_rate": 6.011260274611761e-05, "loss": 0.0097, "step": 616960 }, { "epoch": 1.6, "learning_rate": 6.010871452974614e-05, "loss": 0.0108, "step": 616970 }, { "epoch": 1.6, "learning_rate": 6.010482631337468e-05, "loss": 0.0058, "step": 616980 }, { "epoch": 1.6, "learning_rate": 6.010093809700321e-05, "loss": 0.0095, "step": 616990 }, { "epoch": 1.6, "learning_rate": 6.0097049880631754e-05, "loss": 0.007, "step": 617000 }, { "epoch": 1.6, "eval_cer": 0.8816690950367475, "eval_loss": 0.005568648222833872, "eval_runtime": 107.8731, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 617000 }, { "epoch": 1.6, "learning_rate": 6.009316166426029e-05, "loss": 0.0089, "step": 617010 }, { "epoch": 1.6, "learning_rate": 6.0089273447888824e-05, "loss": 0.0068, "step": 617020 }, { "epoch": 1.6, "learning_rate": 6.008538523151736e-05, "loss": 0.0102, "step": 617030 }, { "epoch": 1.6, "learning_rate": 6.0081497015145893e-05, "loss": 0.0088, "step": 617040 }, { "epoch": 1.6, "learning_rate": 6.007760879877443e-05, "loss": 0.0097, "step": 617050 }, { "epoch": 1.6, "learning_rate": 6.007372058240296e-05, "loss": 0.0086, "step": 617060 }, { "epoch": 1.6, "learning_rate": 6.00698323660315e-05, "loss": 0.0093, "step": 617070 }, { "epoch": 1.6, "learning_rate": 6.006594414966004e-05, "loss": 0.01, "step": 617080 }, { "epoch": 1.6, "learning_rate": 6.0062055933288575e-05, "loss": 0.0075, "step": 617090 }, { "epoch": 1.6, "learning_rate": 6.005816771691711e-05, "loss": 0.0076, "step": 617100 }, { "epoch": 1.6, "learning_rate": 6.0054279500545644e-05, "loss": 0.0062, "step": 617110 }, { "epoch": 1.6, "learning_rate": 6.005039128417418e-05, "loss": 0.0093, "step": 617120 }, { "epoch": 1.6, "learning_rate": 6.0046503067802714e-05, "loss": 0.011, "step": 617130 }, { "epoch": 1.6, "learning_rate": 6.004261485143125e-05, "loss": 0.0099, "step": 617140 }, { "epoch": 1.6, "learning_rate": 6.0038726635059784e-05, "loss": 0.0084, "step": 617150 }, { "epoch": 1.6, "learning_rate": 6.003483841868832e-05, "loss": 0.0084, "step": 617160 }, { "epoch": 1.6, "learning_rate": 6.003095020231685e-05, "loss": 0.0087, "step": 617170 }, { "epoch": 1.6, "learning_rate": 6.002706198594539e-05, "loss": 0.0097, "step": 617180 }, { "epoch": 1.6, "learning_rate": 6.002317376957392e-05, "loss": 0.0061, "step": 617190 }, { "epoch": 1.6, "learning_rate": 6.001928555320246e-05, "loss": 0.0093, "step": 617200 }, { "epoch": 1.6, "learning_rate": 6.001539733683099e-05, "loss": 0.0128, "step": 617210 }, { "epoch": 1.6, "learning_rate": 6.001150912045953e-05, "loss": 0.008, "step": 617220 }, { "epoch": 1.6, "learning_rate": 6.000762090408806e-05, "loss": 0.008, "step": 617230 }, { "epoch": 1.6, "learning_rate": 6.00037326877166e-05, "loss": 0.0093, "step": 617240 }, { "epoch": 1.6, "learning_rate": 5.999984447134513e-05, "loss": 0.0071, "step": 617250 }, { "epoch": 1.6, "learning_rate": 5.999595625497367e-05, "loss": 0.0077, "step": 617260 }, { "epoch": 1.6, "learning_rate": 5.999206803860221e-05, "loss": 0.009, "step": 617270 }, { "epoch": 1.6, "learning_rate": 5.9988179822230744e-05, "loss": 0.0076, "step": 617280 }, { "epoch": 1.6, "learning_rate": 5.998429160585928e-05, "loss": 0.0085, "step": 617290 }, { "epoch": 1.6, "learning_rate": 5.9980403389487813e-05, "loss": 0.0086, "step": 617300 }, { "epoch": 1.6, "learning_rate": 5.997651517311635e-05, "loss": 0.0101, "step": 617310 }, { "epoch": 1.6, "learning_rate": 5.997262695674488e-05, "loss": 0.0074, "step": 617320 }, { "epoch": 1.6, "learning_rate": 5.996873874037342e-05, "loss": 0.0055, "step": 617330 }, { "epoch": 1.6, "learning_rate": 5.996485052400195e-05, "loss": 0.0065, "step": 617340 }, { "epoch": 1.6, "learning_rate": 5.9960962307630495e-05, "loss": 0.0102, "step": 617350 }, { "epoch": 1.6, "learning_rate": 5.995707409125903e-05, "loss": 0.0088, "step": 617360 }, { "epoch": 1.6, "learning_rate": 5.9953185874887564e-05, "loss": 0.0099, "step": 617370 }, { "epoch": 1.6, "learning_rate": 5.99492976585161e-05, "loss": 0.0079, "step": 617380 }, { "epoch": 1.6, "learning_rate": 5.9945409442144634e-05, "loss": 0.007, "step": 617390 }, { "epoch": 1.6, "learning_rate": 5.994152122577317e-05, "loss": 0.0109, "step": 617400 }, { "epoch": 1.6, "learning_rate": 5.9937633009401704e-05, "loss": 0.0078, "step": 617410 }, { "epoch": 1.6, "learning_rate": 5.993374479303023e-05, "loss": 0.0072, "step": 617420 }, { "epoch": 1.6, "learning_rate": 5.992985657665877e-05, "loss": 0.0101, "step": 617430 }, { "epoch": 1.6, "learning_rate": 5.99259683602873e-05, "loss": 0.0066, "step": 617440 }, { "epoch": 1.6, "learning_rate": 5.992208014391584e-05, "loss": 0.0092, "step": 617450 }, { "epoch": 1.6, "learning_rate": 5.991819192754438e-05, "loss": 0.0076, "step": 617460 }, { "epoch": 1.6, "learning_rate": 5.991430371117291e-05, "loss": 0.0096, "step": 617470 }, { "epoch": 1.6, "learning_rate": 5.991041549480145e-05, "loss": 0.0077, "step": 617480 }, { "epoch": 1.6, "learning_rate": 5.990652727842998e-05, "loss": 0.0078, "step": 617490 }, { "epoch": 1.6, "learning_rate": 5.990263906205852e-05, "loss": 0.0091, "step": 617500 }, { "epoch": 1.6, "learning_rate": 5.989875084568705e-05, "loss": 0.0106, "step": 617510 }, { "epoch": 1.6, "learning_rate": 5.989486262931559e-05, "loss": 0.0077, "step": 617520 }, { "epoch": 1.6, "learning_rate": 5.989097441294413e-05, "loss": 0.0088, "step": 617530 }, { "epoch": 1.6, "learning_rate": 5.9887086196572664e-05, "loss": 0.009, "step": 617540 }, { "epoch": 1.6, "learning_rate": 5.98831979802012e-05, "loss": 0.0078, "step": 617550 }, { "epoch": 1.6, "learning_rate": 5.987930976382973e-05, "loss": 0.0076, "step": 617560 }, { "epoch": 1.6, "learning_rate": 5.987542154745827e-05, "loss": 0.0103, "step": 617570 }, { "epoch": 1.6, "learning_rate": 5.98715333310868e-05, "loss": 0.0095, "step": 617580 }, { "epoch": 1.6, "learning_rate": 5.986764511471534e-05, "loss": 0.0105, "step": 617590 }, { "epoch": 1.6, "learning_rate": 5.986375689834387e-05, "loss": 0.008, "step": 617600 }, { "epoch": 1.6, "learning_rate": 5.9859868681972414e-05, "loss": 0.0098, "step": 617610 }, { "epoch": 1.6, "learning_rate": 5.985598046560095e-05, "loss": 0.0094, "step": 617620 }, { "epoch": 1.6, "learning_rate": 5.9852092249229484e-05, "loss": 0.009, "step": 617630 }, { "epoch": 1.6, "learning_rate": 5.984820403285802e-05, "loss": 0.0077, "step": 617640 }, { "epoch": 1.6, "learning_rate": 5.9844315816486554e-05, "loss": 0.0092, "step": 617650 }, { "epoch": 1.6, "learning_rate": 5.984042760011509e-05, "loss": 0.0082, "step": 617660 }, { "epoch": 1.6, "learning_rate": 5.983653938374362e-05, "loss": 0.0067, "step": 617670 }, { "epoch": 1.6, "learning_rate": 5.983265116737215e-05, "loss": 0.0103, "step": 617680 }, { "epoch": 1.6, "learning_rate": 5.9828762951000687e-05, "loss": 0.0077, "step": 617690 }, { "epoch": 1.6, "learning_rate": 5.982487473462922e-05, "loss": 0.0082, "step": 617700 }, { "epoch": 1.6, "learning_rate": 5.982098651825776e-05, "loss": 0.0089, "step": 617710 }, { "epoch": 1.6, "learning_rate": 5.98170983018863e-05, "loss": 0.0077, "step": 617720 }, { "epoch": 1.6, "learning_rate": 5.981321008551483e-05, "loss": 0.0094, "step": 617730 }, { "epoch": 1.6, "learning_rate": 5.980932186914337e-05, "loss": 0.0096, "step": 617740 }, { "epoch": 1.6, "learning_rate": 5.98054336527719e-05, "loss": 0.0086, "step": 617750 }, { "epoch": 1.6, "learning_rate": 5.980154543640044e-05, "loss": 0.0071, "step": 617760 }, { "epoch": 1.6, "learning_rate": 5.979765722002897e-05, "loss": 0.0104, "step": 617770 }, { "epoch": 1.6, "learning_rate": 5.979376900365751e-05, "loss": 0.0065, "step": 617780 }, { "epoch": 1.6, "learning_rate": 5.978988078728605e-05, "loss": 0.0069, "step": 617790 }, { "epoch": 1.6, "learning_rate": 5.9785992570914584e-05, "loss": 0.0084, "step": 617800 }, { "epoch": 1.6, "learning_rate": 5.978210435454312e-05, "loss": 0.0066, "step": 617810 }, { "epoch": 1.6, "learning_rate": 5.977821613817165e-05, "loss": 0.0074, "step": 617820 }, { "epoch": 1.6, "learning_rate": 5.977432792180019e-05, "loss": 0.007, "step": 617830 }, { "epoch": 1.6, "learning_rate": 5.977043970542872e-05, "loss": 0.0089, "step": 617840 }, { "epoch": 1.6, "learning_rate": 5.976655148905726e-05, "loss": 0.0098, "step": 617850 }, { "epoch": 1.6, "learning_rate": 5.976266327268579e-05, "loss": 0.0124, "step": 617860 }, { "epoch": 1.6, "learning_rate": 5.9758775056314334e-05, "loss": 0.0098, "step": 617870 }, { "epoch": 1.6, "learning_rate": 5.975488683994287e-05, "loss": 0.0074, "step": 617880 }, { "epoch": 1.6, "learning_rate": 5.9750998623571404e-05, "loss": 0.0098, "step": 617890 }, { "epoch": 1.6, "learning_rate": 5.974711040719994e-05, "loss": 0.0075, "step": 617900 }, { "epoch": 1.6, "learning_rate": 5.974322219082847e-05, "loss": 0.0065, "step": 617910 }, { "epoch": 1.6, "learning_rate": 5.9739333974457e-05, "loss": 0.007, "step": 617920 }, { "epoch": 1.6, "learning_rate": 5.973544575808554e-05, "loss": 0.0089, "step": 617930 }, { "epoch": 1.6, "learning_rate": 5.973155754171407e-05, "loss": 0.009, "step": 617940 }, { "epoch": 1.6, "learning_rate": 5.9727669325342607e-05, "loss": 0.0083, "step": 617950 }, { "epoch": 1.6, "learning_rate": 5.972378110897114e-05, "loss": 0.0075, "step": 617960 }, { "epoch": 1.6, "learning_rate": 5.971989289259968e-05, "loss": 0.0096, "step": 617970 }, { "epoch": 1.6, "learning_rate": 5.971600467622822e-05, "loss": 0.0105, "step": 617980 }, { "epoch": 1.6, "learning_rate": 5.971211645985675e-05, "loss": 0.0084, "step": 617990 }, { "epoch": 1.6, "learning_rate": 5.970822824348529e-05, "loss": 0.0095, "step": 618000 }, { "epoch": 1.6, "eval_cer": 0.8816816917691551, "eval_loss": 0.0055539365857839584, "eval_runtime": 107.9153, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 618000 }, { "epoch": 1.6, "learning_rate": 5.970434002711382e-05, "loss": 0.0072, "step": 618010 }, { "epoch": 1.6, "learning_rate": 5.970045181074236e-05, "loss": 0.0086, "step": 618020 }, { "epoch": 1.6, "learning_rate": 5.969656359437089e-05, "loss": 0.0121, "step": 618030 }, { "epoch": 1.6, "learning_rate": 5.969267537799943e-05, "loss": 0.0078, "step": 618040 }, { "epoch": 1.6, "learning_rate": 5.968878716162797e-05, "loss": 0.0083, "step": 618050 }, { "epoch": 1.6, "learning_rate": 5.9684898945256504e-05, "loss": 0.0115, "step": 618060 }, { "epoch": 1.6, "learning_rate": 5.968101072888504e-05, "loss": 0.0074, "step": 618070 }, { "epoch": 1.6, "learning_rate": 5.967712251251357e-05, "loss": 0.0129, "step": 618080 }, { "epoch": 1.6, "learning_rate": 5.967323429614211e-05, "loss": 0.0113, "step": 618090 }, { "epoch": 1.6, "learning_rate": 5.966934607977064e-05, "loss": 0.0076, "step": 618100 }, { "epoch": 1.6, "learning_rate": 5.966545786339918e-05, "loss": 0.0101, "step": 618110 }, { "epoch": 1.6, "learning_rate": 5.966156964702771e-05, "loss": 0.0092, "step": 618120 }, { "epoch": 1.6, "learning_rate": 5.9657681430656254e-05, "loss": 0.0085, "step": 618130 }, { "epoch": 1.6, "learning_rate": 5.965379321428479e-05, "loss": 0.0084, "step": 618140 }, { "epoch": 1.6, "learning_rate": 5.9649904997913324e-05, "loss": 0.0091, "step": 618150 }, { "epoch": 1.6, "learning_rate": 5.964601678154185e-05, "loss": 0.0066, "step": 618160 }, { "epoch": 1.6, "learning_rate": 5.964212856517039e-05, "loss": 0.01, "step": 618170 }, { "epoch": 1.6, "learning_rate": 5.963824034879892e-05, "loss": 0.0082, "step": 618180 }, { "epoch": 1.6, "learning_rate": 5.963435213242746e-05, "loss": 0.0091, "step": 618190 }, { "epoch": 1.6, "learning_rate": 5.963046391605599e-05, "loss": 0.0084, "step": 618200 }, { "epoch": 1.6, "learning_rate": 5.9626575699684526e-05, "loss": 0.0076, "step": 618210 }, { "epoch": 1.6, "learning_rate": 5.962268748331306e-05, "loss": 0.0075, "step": 618220 }, { "epoch": 1.6, "learning_rate": 5.96187992669416e-05, "loss": 0.0098, "step": 618230 }, { "epoch": 1.6, "learning_rate": 5.961491105057014e-05, "loss": 0.0083, "step": 618240 }, { "epoch": 1.6, "learning_rate": 5.961102283419867e-05, "loss": 0.0082, "step": 618250 }, { "epoch": 1.6, "learning_rate": 5.960713461782721e-05, "loss": 0.0113, "step": 618260 }, { "epoch": 1.6, "learning_rate": 5.960324640145574e-05, "loss": 0.0068, "step": 618270 }, { "epoch": 1.6, "learning_rate": 5.959935818508428e-05, "loss": 0.0077, "step": 618280 }, { "epoch": 1.6, "learning_rate": 5.959546996871281e-05, "loss": 0.0111, "step": 618290 }, { "epoch": 1.6, "learning_rate": 5.959158175234135e-05, "loss": 0.0094, "step": 618300 }, { "epoch": 1.6, "learning_rate": 5.958769353596989e-05, "loss": 0.0091, "step": 618310 }, { "epoch": 1.6, "learning_rate": 5.9583805319598424e-05, "loss": 0.0081, "step": 618320 }, { "epoch": 1.6, "learning_rate": 5.957991710322696e-05, "loss": 0.0052, "step": 618330 }, { "epoch": 1.6, "learning_rate": 5.957602888685549e-05, "loss": 0.0104, "step": 618340 }, { "epoch": 1.6, "learning_rate": 5.957214067048403e-05, "loss": 0.0099, "step": 618350 }, { "epoch": 1.6, "learning_rate": 5.956825245411256e-05, "loss": 0.0088, "step": 618360 }, { "epoch": 1.6, "learning_rate": 5.95643642377411e-05, "loss": 0.0078, "step": 618370 }, { "epoch": 1.6, "learning_rate": 5.956047602136963e-05, "loss": 0.0089, "step": 618380 }, { "epoch": 1.6, "learning_rate": 5.9556587804998174e-05, "loss": 0.0087, "step": 618390 }, { "epoch": 1.6, "learning_rate": 5.955269958862671e-05, "loss": 0.0103, "step": 618400 }, { "epoch": 1.6, "learning_rate": 5.954881137225524e-05, "loss": 0.0135, "step": 618410 }, { "epoch": 1.6, "learning_rate": 5.954492315588377e-05, "loss": 0.0093, "step": 618420 }, { "epoch": 1.6, "learning_rate": 5.954103493951231e-05, "loss": 0.0088, "step": 618430 }, { "epoch": 1.6, "learning_rate": 5.953714672314084e-05, "loss": 0.0119, "step": 618440 }, { "epoch": 1.6, "learning_rate": 5.953325850676938e-05, "loss": 0.0099, "step": 618450 }, { "epoch": 1.6, "learning_rate": 5.952937029039791e-05, "loss": 0.0079, "step": 618460 }, { "epoch": 1.6, "learning_rate": 5.9525482074026446e-05, "loss": 0.0093, "step": 618470 }, { "epoch": 1.6, "learning_rate": 5.952159385765498e-05, "loss": 0.009, "step": 618480 }, { "epoch": 1.6, "learning_rate": 5.951770564128352e-05, "loss": 0.0087, "step": 618490 }, { "epoch": 1.6, "learning_rate": 5.951381742491206e-05, "loss": 0.0079, "step": 618500 }, { "epoch": 1.6, "learning_rate": 5.950992920854059e-05, "loss": 0.0064, "step": 618510 }, { "epoch": 1.6, "learning_rate": 5.950604099216913e-05, "loss": 0.0111, "step": 618520 }, { "epoch": 1.6, "learning_rate": 5.950215277579766e-05, "loss": 0.0067, "step": 618530 }, { "epoch": 1.6, "learning_rate": 5.94982645594262e-05, "loss": 0.0102, "step": 618540 }, { "epoch": 1.6, "learning_rate": 5.949437634305473e-05, "loss": 0.0096, "step": 618550 }, { "epoch": 1.6, "learning_rate": 5.949048812668327e-05, "loss": 0.0113, "step": 618560 }, { "epoch": 1.6, "learning_rate": 5.94865999103118e-05, "loss": 0.0067, "step": 618570 }, { "epoch": 1.6, "learning_rate": 5.9482711693940343e-05, "loss": 0.0106, "step": 618580 }, { "epoch": 1.6, "learning_rate": 5.947882347756888e-05, "loss": 0.0092, "step": 618590 }, { "epoch": 1.6, "learning_rate": 5.947493526119741e-05, "loss": 0.006, "step": 618600 }, { "epoch": 1.6, "learning_rate": 5.947104704482595e-05, "loss": 0.0072, "step": 618610 }, { "epoch": 1.6, "learning_rate": 5.946715882845448e-05, "loss": 0.0108, "step": 618620 }, { "epoch": 1.6, "learning_rate": 5.946327061208302e-05, "loss": 0.0078, "step": 618630 }, { "epoch": 1.6, "learning_rate": 5.945938239571155e-05, "loss": 0.0095, "step": 618640 }, { "epoch": 1.6, "learning_rate": 5.945549417934009e-05, "loss": 0.0093, "step": 618650 }, { "epoch": 1.6, "learning_rate": 5.9451605962968616e-05, "loss": 0.0077, "step": 618660 }, { "epoch": 1.6, "learning_rate": 5.944771774659715e-05, "loss": 0.0074, "step": 618670 }, { "epoch": 1.6, "learning_rate": 5.944382953022569e-05, "loss": 0.0059, "step": 618680 }, { "epoch": 1.6, "learning_rate": 5.943994131385423e-05, "loss": 0.0068, "step": 618690 }, { "epoch": 1.6, "learning_rate": 5.943605309748276e-05, "loss": 0.0096, "step": 618700 }, { "epoch": 1.6, "learning_rate": 5.94321648811113e-05, "loss": 0.0083, "step": 618710 }, { "epoch": 1.6, "learning_rate": 5.942827666473983e-05, "loss": 0.0106, "step": 618720 }, { "epoch": 1.6, "learning_rate": 5.9424388448368366e-05, "loss": 0.0064, "step": 618730 }, { "epoch": 1.6, "learning_rate": 5.94205002319969e-05, "loss": 0.0083, "step": 618740 }, { "epoch": 1.6, "learning_rate": 5.9416612015625436e-05, "loss": 0.0068, "step": 618750 }, { "epoch": 1.6, "learning_rate": 5.941272379925398e-05, "loss": 0.0071, "step": 618760 }, { "epoch": 1.6, "learning_rate": 5.940883558288251e-05, "loss": 0.01, "step": 618770 }, { "epoch": 1.6, "learning_rate": 5.940494736651105e-05, "loss": 0.0072, "step": 618780 }, { "epoch": 1.6, "learning_rate": 5.940105915013958e-05, "loss": 0.011, "step": 618790 }, { "epoch": 1.6, "learning_rate": 5.939717093376812e-05, "loss": 0.0114, "step": 618800 }, { "epoch": 1.6, "learning_rate": 5.939328271739665e-05, "loss": 0.0091, "step": 618810 }, { "epoch": 1.6, "learning_rate": 5.938939450102519e-05, "loss": 0.0084, "step": 618820 }, { "epoch": 1.6, "learning_rate": 5.938550628465372e-05, "loss": 0.0078, "step": 618830 }, { "epoch": 1.6, "learning_rate": 5.9381618068282263e-05, "loss": 0.0085, "step": 618840 }, { "epoch": 1.6, "learning_rate": 5.93777298519108e-05, "loss": 0.0094, "step": 618850 }, { "epoch": 1.6, "learning_rate": 5.937384163553933e-05, "loss": 0.0069, "step": 618860 }, { "epoch": 1.6, "learning_rate": 5.936995341916787e-05, "loss": 0.0095, "step": 618870 }, { "epoch": 1.6, "learning_rate": 5.93660652027964e-05, "loss": 0.0068, "step": 618880 }, { "epoch": 1.6, "learning_rate": 5.936217698642494e-05, "loss": 0.0075, "step": 618890 }, { "epoch": 1.6, "learning_rate": 5.935828877005347e-05, "loss": 0.0106, "step": 618900 }, { "epoch": 1.6, "learning_rate": 5.9354400553682e-05, "loss": 0.0097, "step": 618910 }, { "epoch": 1.6, "learning_rate": 5.9350512337310536e-05, "loss": 0.0115, "step": 618920 }, { "epoch": 1.6, "learning_rate": 5.934662412093907e-05, "loss": 0.0099, "step": 618930 }, { "epoch": 1.6, "learning_rate": 5.934273590456761e-05, "loss": 0.01, "step": 618940 }, { "epoch": 1.6, "learning_rate": 5.933884768819615e-05, "loss": 0.0067, "step": 618950 }, { "epoch": 1.6, "learning_rate": 5.933495947182468e-05, "loss": 0.0072, "step": 618960 }, { "epoch": 1.6, "learning_rate": 5.933107125545322e-05, "loss": 0.0076, "step": 618970 }, { "epoch": 1.6, "learning_rate": 5.932718303908175e-05, "loss": 0.0057, "step": 618980 }, { "epoch": 1.6, "learning_rate": 5.9323294822710286e-05, "loss": 0.0091, "step": 618990 }, { "epoch": 1.6, "learning_rate": 5.931940660633882e-05, "loss": 0.0083, "step": 619000 }, { "epoch": 1.6, "eval_cer": 0.8816872903168917, "eval_loss": 0.005528622306883335, "eval_runtime": 107.7525, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 619000 }, { "epoch": 1.6, "learning_rate": 5.9315518389967356e-05, "loss": 0.0105, "step": 619010 }, { "epoch": 1.6, "learning_rate": 5.93116301735959e-05, "loss": 0.0101, "step": 619020 }, { "epoch": 1.6, "learning_rate": 5.930774195722443e-05, "loss": 0.0105, "step": 619030 }, { "epoch": 1.6, "learning_rate": 5.930385374085297e-05, "loss": 0.0083, "step": 619040 }, { "epoch": 1.6, "learning_rate": 5.92999655244815e-05, "loss": 0.0111, "step": 619050 }, { "epoch": 1.6, "learning_rate": 5.929607730811004e-05, "loss": 0.0077, "step": 619060 }, { "epoch": 1.6, "learning_rate": 5.929218909173857e-05, "loss": 0.0093, "step": 619070 }, { "epoch": 1.6, "learning_rate": 5.928830087536711e-05, "loss": 0.008, "step": 619080 }, { "epoch": 1.6, "learning_rate": 5.928441265899564e-05, "loss": 0.0089, "step": 619090 }, { "epoch": 1.6, "learning_rate": 5.928052444262418e-05, "loss": 0.0103, "step": 619100 }, { "epoch": 1.6, "learning_rate": 5.927663622625272e-05, "loss": 0.007, "step": 619110 }, { "epoch": 1.6, "learning_rate": 5.927274800988125e-05, "loss": 0.0106, "step": 619120 }, { "epoch": 1.6, "learning_rate": 5.926885979350979e-05, "loss": 0.0085, "step": 619130 }, { "epoch": 1.6, "learning_rate": 5.926497157713832e-05, "loss": 0.0086, "step": 619140 }, { "epoch": 1.6, "learning_rate": 5.926108336076686e-05, "loss": 0.006, "step": 619150 }, { "epoch": 1.6, "learning_rate": 5.9257195144395386e-05, "loss": 0.0073, "step": 619160 }, { "epoch": 1.6, "learning_rate": 5.925330692802392e-05, "loss": 0.006, "step": 619170 }, { "epoch": 1.61, "learning_rate": 5.9249418711652455e-05, "loss": 0.0092, "step": 619180 }, { "epoch": 1.61, "learning_rate": 5.924553049528099e-05, "loss": 0.0096, "step": 619190 }, { "epoch": 1.61, "learning_rate": 5.924164227890953e-05, "loss": 0.0078, "step": 619200 }, { "epoch": 1.61, "learning_rate": 5.923775406253807e-05, "loss": 0.0095, "step": 619210 }, { "epoch": 1.61, "learning_rate": 5.92338658461666e-05, "loss": 0.0091, "step": 619220 }, { "epoch": 1.61, "learning_rate": 5.9229977629795137e-05, "loss": 0.0084, "step": 619230 }, { "epoch": 1.61, "learning_rate": 5.922608941342367e-05, "loss": 0.008, "step": 619240 }, { "epoch": 1.61, "learning_rate": 5.9222201197052206e-05, "loss": 0.0123, "step": 619250 }, { "epoch": 1.61, "learning_rate": 5.921831298068074e-05, "loss": 0.0085, "step": 619260 }, { "epoch": 1.61, "learning_rate": 5.9214424764309276e-05, "loss": 0.0098, "step": 619270 }, { "epoch": 1.61, "learning_rate": 5.921053654793782e-05, "loss": 0.0083, "step": 619280 }, { "epoch": 1.61, "learning_rate": 5.920664833156635e-05, "loss": 0.011, "step": 619290 }, { "epoch": 1.61, "learning_rate": 5.920276011519489e-05, "loss": 0.0088, "step": 619300 }, { "epoch": 1.61, "learning_rate": 5.919887189882342e-05, "loss": 0.0082, "step": 619310 }, { "epoch": 1.61, "learning_rate": 5.919498368245196e-05, "loss": 0.0109, "step": 619320 }, { "epoch": 1.61, "learning_rate": 5.919109546608049e-05, "loss": 0.0107, "step": 619330 }, { "epoch": 1.61, "learning_rate": 5.918720724970903e-05, "loss": 0.0053, "step": 619340 }, { "epoch": 1.61, "learning_rate": 5.918331903333756e-05, "loss": 0.0061, "step": 619350 }, { "epoch": 1.61, "learning_rate": 5.91794308169661e-05, "loss": 0.008, "step": 619360 }, { "epoch": 1.61, "learning_rate": 5.917554260059464e-05, "loss": 0.0088, "step": 619370 }, { "epoch": 1.61, "learning_rate": 5.917165438422317e-05, "loss": 0.012, "step": 619380 }, { "epoch": 1.61, "learning_rate": 5.916776616785171e-05, "loss": 0.0085, "step": 619390 }, { "epoch": 1.61, "learning_rate": 5.9163877951480236e-05, "loss": 0.0091, "step": 619400 }, { "epoch": 1.61, "learning_rate": 5.915998973510877e-05, "loss": 0.0129, "step": 619410 }, { "epoch": 1.61, "learning_rate": 5.9156101518737306e-05, "loss": 0.0103, "step": 619420 }, { "epoch": 1.61, "learning_rate": 5.915221330236584e-05, "loss": 0.0088, "step": 619430 }, { "epoch": 1.61, "learning_rate": 5.9148325085994375e-05, "loss": 0.0084, "step": 619440 }, { "epoch": 1.61, "learning_rate": 5.914443686962291e-05, "loss": 0.009, "step": 619450 }, { "epoch": 1.61, "learning_rate": 5.914054865325145e-05, "loss": 0.011, "step": 619460 }, { "epoch": 1.61, "learning_rate": 5.913666043687999e-05, "loss": 0.0068, "step": 619470 }, { "epoch": 1.61, "learning_rate": 5.913277222050852e-05, "loss": 0.0109, "step": 619480 }, { "epoch": 1.61, "learning_rate": 5.9128884004137057e-05, "loss": 0.0089, "step": 619490 }, { "epoch": 1.61, "learning_rate": 5.912499578776559e-05, "loss": 0.0096, "step": 619500 }, { "epoch": 1.61, "learning_rate": 5.9121107571394126e-05, "loss": 0.0106, "step": 619510 }, { "epoch": 1.61, "learning_rate": 5.911721935502266e-05, "loss": 0.0089, "step": 619520 }, { "epoch": 1.61, "learning_rate": 5.9113331138651196e-05, "loss": 0.0117, "step": 619530 }, { "epoch": 1.61, "learning_rate": 5.910944292227974e-05, "loss": 0.0087, "step": 619540 }, { "epoch": 1.61, "learning_rate": 5.910555470590827e-05, "loss": 0.0085, "step": 619550 }, { "epoch": 1.61, "learning_rate": 5.910166648953681e-05, "loss": 0.0087, "step": 619560 }, { "epoch": 1.61, "learning_rate": 5.909777827316534e-05, "loss": 0.0078, "step": 619570 }, { "epoch": 1.61, "learning_rate": 5.909389005679388e-05, "loss": 0.0061, "step": 619580 }, { "epoch": 1.61, "learning_rate": 5.909000184042241e-05, "loss": 0.0081, "step": 619590 }, { "epoch": 1.61, "learning_rate": 5.908611362405095e-05, "loss": 0.0114, "step": 619600 }, { "epoch": 1.61, "learning_rate": 5.908222540767948e-05, "loss": 0.0086, "step": 619610 }, { "epoch": 1.61, "learning_rate": 5.907833719130802e-05, "loss": 0.0108, "step": 619620 }, { "epoch": 1.61, "learning_rate": 5.907444897493656e-05, "loss": 0.0077, "step": 619630 }, { "epoch": 1.61, "learning_rate": 5.907056075856509e-05, "loss": 0.0091, "step": 619640 }, { "epoch": 1.61, "learning_rate": 5.906667254219362e-05, "loss": 0.0087, "step": 619650 }, { "epoch": 1.61, "learning_rate": 5.9062784325822156e-05, "loss": 0.0086, "step": 619660 }, { "epoch": 1.61, "learning_rate": 5.905889610945069e-05, "loss": 0.0076, "step": 619670 }, { "epoch": 1.61, "learning_rate": 5.9055007893079226e-05, "loss": 0.0091, "step": 619680 }, { "epoch": 1.61, "learning_rate": 5.905111967670776e-05, "loss": 0.0111, "step": 619690 }, { "epoch": 1.61, "learning_rate": 5.9047231460336295e-05, "loss": 0.0091, "step": 619700 }, { "epoch": 1.61, "learning_rate": 5.904334324396483e-05, "loss": 0.0087, "step": 619710 }, { "epoch": 1.61, "learning_rate": 5.903945502759337e-05, "loss": 0.0068, "step": 619720 }, { "epoch": 1.61, "learning_rate": 5.903556681122191e-05, "loss": 0.0055, "step": 619730 }, { "epoch": 1.61, "learning_rate": 5.903167859485044e-05, "loss": 0.0089, "step": 619740 }, { "epoch": 1.61, "learning_rate": 5.9027790378478976e-05, "loss": 0.0101, "step": 619750 }, { "epoch": 1.61, "learning_rate": 5.902390216210751e-05, "loss": 0.0072, "step": 619760 }, { "epoch": 1.61, "learning_rate": 5.9020013945736046e-05, "loss": 0.0119, "step": 619770 }, { "epoch": 1.61, "learning_rate": 5.901612572936458e-05, "loss": 0.0073, "step": 619780 }, { "epoch": 1.61, "learning_rate": 5.9012237512993116e-05, "loss": 0.0083, "step": 619790 }, { "epoch": 1.61, "learning_rate": 5.900834929662166e-05, "loss": 0.0072, "step": 619800 }, { "epoch": 1.61, "learning_rate": 5.900446108025019e-05, "loss": 0.0057, "step": 619810 }, { "epoch": 1.61, "learning_rate": 5.900057286387873e-05, "loss": 0.0092, "step": 619820 }, { "epoch": 1.61, "learning_rate": 5.899668464750726e-05, "loss": 0.009, "step": 619830 }, { "epoch": 1.61, "learning_rate": 5.89927964311358e-05, "loss": 0.0101, "step": 619840 }, { "epoch": 1.61, "learning_rate": 5.898890821476433e-05, "loss": 0.0097, "step": 619850 }, { "epoch": 1.61, "learning_rate": 5.898501999839287e-05, "loss": 0.0103, "step": 619860 }, { "epoch": 1.61, "learning_rate": 5.89811317820214e-05, "loss": 0.0081, "step": 619870 }, { "epoch": 1.61, "learning_rate": 5.8977243565649936e-05, "loss": 0.0081, "step": 619880 }, { "epoch": 1.61, "learning_rate": 5.897335534927848e-05, "loss": 0.0082, "step": 619890 }, { "epoch": 1.61, "learning_rate": 5.8969467132907006e-05, "loss": 0.0057, "step": 619900 }, { "epoch": 1.61, "learning_rate": 5.896557891653554e-05, "loss": 0.0075, "step": 619910 }, { "epoch": 1.61, "learning_rate": 5.8961690700164076e-05, "loss": 0.0074, "step": 619920 }, { "epoch": 1.61, "learning_rate": 5.895780248379261e-05, "loss": 0.0076, "step": 619930 }, { "epoch": 1.61, "learning_rate": 5.8953914267421146e-05, "loss": 0.0077, "step": 619940 }, { "epoch": 1.61, "learning_rate": 5.895002605104968e-05, "loss": 0.0094, "step": 619950 }, { "epoch": 1.61, "learning_rate": 5.8946137834678215e-05, "loss": 0.0114, "step": 619960 }, { "epoch": 1.61, "learning_rate": 5.894224961830675e-05, "loss": 0.01, "step": 619970 }, { "epoch": 1.61, "learning_rate": 5.8938361401935285e-05, "loss": 0.0067, "step": 619980 }, { "epoch": 1.61, "learning_rate": 5.893447318556383e-05, "loss": 0.0074, "step": 619990 }, { "epoch": 1.61, "learning_rate": 5.893058496919236e-05, "loss": 0.0073, "step": 620000 }, { "epoch": 1.61, "eval_cer": 0.8816830914060892, "eval_loss": 0.00557528343051672, "eval_runtime": 107.8677, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 620000 }, { "epoch": 1.61, "learning_rate": 5.8926696752820896e-05, "loss": 0.0118, "step": 620010 }, { "epoch": 1.61, "learning_rate": 5.892280853644943e-05, "loss": 0.0103, "step": 620020 }, { "epoch": 1.61, "learning_rate": 5.8918920320077966e-05, "loss": 0.0076, "step": 620030 }, { "epoch": 1.61, "learning_rate": 5.89150321037065e-05, "loss": 0.0097, "step": 620040 }, { "epoch": 1.61, "learning_rate": 5.8911143887335036e-05, "loss": 0.0078, "step": 620050 }, { "epoch": 1.61, "learning_rate": 5.890725567096357e-05, "loss": 0.0137, "step": 620060 }, { "epoch": 1.61, "learning_rate": 5.890336745459211e-05, "loss": 0.009, "step": 620070 }, { "epoch": 1.61, "learning_rate": 5.889947923822065e-05, "loss": 0.0091, "step": 620080 }, { "epoch": 1.61, "learning_rate": 5.889559102184918e-05, "loss": 0.0088, "step": 620090 }, { "epoch": 1.61, "learning_rate": 5.889170280547772e-05, "loss": 0.0084, "step": 620100 }, { "epoch": 1.61, "learning_rate": 5.888781458910625e-05, "loss": 0.0085, "step": 620110 }, { "epoch": 1.61, "learning_rate": 5.888392637273479e-05, "loss": 0.0066, "step": 620120 }, { "epoch": 1.61, "learning_rate": 5.888003815636332e-05, "loss": 0.0092, "step": 620130 }, { "epoch": 1.61, "learning_rate": 5.8876149939991856e-05, "loss": 0.0133, "step": 620140 }, { "epoch": 1.61, "learning_rate": 5.8872261723620384e-05, "loss": 0.0087, "step": 620150 }, { "epoch": 1.61, "learning_rate": 5.886837350724892e-05, "loss": 0.0111, "step": 620160 }, { "epoch": 1.61, "learning_rate": 5.886448529087746e-05, "loss": 0.0097, "step": 620170 }, { "epoch": 1.61, "learning_rate": 5.8860597074505996e-05, "loss": 0.0101, "step": 620180 }, { "epoch": 1.61, "learning_rate": 5.885670885813453e-05, "loss": 0.0055, "step": 620190 }, { "epoch": 1.61, "learning_rate": 5.8852820641763066e-05, "loss": 0.0084, "step": 620200 }, { "epoch": 1.61, "learning_rate": 5.88489324253916e-05, "loss": 0.0096, "step": 620210 }, { "epoch": 1.61, "learning_rate": 5.8845044209020135e-05, "loss": 0.0065, "step": 620220 }, { "epoch": 1.61, "learning_rate": 5.884115599264867e-05, "loss": 0.0062, "step": 620230 }, { "epoch": 1.61, "learning_rate": 5.8837267776277205e-05, "loss": 0.0087, "step": 620240 }, { "epoch": 1.61, "learning_rate": 5.883337955990575e-05, "loss": 0.0071, "step": 620250 }, { "epoch": 1.61, "learning_rate": 5.882949134353428e-05, "loss": 0.0092, "step": 620260 }, { "epoch": 1.61, "learning_rate": 5.8825603127162816e-05, "loss": 0.0068, "step": 620270 }, { "epoch": 1.61, "learning_rate": 5.882171491079135e-05, "loss": 0.0128, "step": 620280 }, { "epoch": 1.61, "learning_rate": 5.8817826694419886e-05, "loss": 0.0084, "step": 620290 }, { "epoch": 1.61, "learning_rate": 5.881393847804842e-05, "loss": 0.0074, "step": 620300 }, { "epoch": 1.61, "learning_rate": 5.8810050261676956e-05, "loss": 0.0078, "step": 620310 }, { "epoch": 1.61, "learning_rate": 5.880616204530549e-05, "loss": 0.0074, "step": 620320 }, { "epoch": 1.61, "learning_rate": 5.880227382893403e-05, "loss": 0.0103, "step": 620330 }, { "epoch": 1.61, "learning_rate": 5.879838561256257e-05, "loss": 0.0063, "step": 620340 }, { "epoch": 1.61, "learning_rate": 5.87944973961911e-05, "loss": 0.0093, "step": 620350 }, { "epoch": 1.61, "learning_rate": 5.879060917981964e-05, "loss": 0.0082, "step": 620360 }, { "epoch": 1.61, "learning_rate": 5.878672096344817e-05, "loss": 0.0145, "step": 620370 }, { "epoch": 1.61, "learning_rate": 5.878283274707671e-05, "loss": 0.0089, "step": 620380 }, { "epoch": 1.61, "learning_rate": 5.877894453070524e-05, "loss": 0.0078, "step": 620390 }, { "epoch": 1.61, "learning_rate": 5.877505631433377e-05, "loss": 0.0116, "step": 620400 }, { "epoch": 1.61, "learning_rate": 5.8771168097962304e-05, "loss": 0.0096, "step": 620410 }, { "epoch": 1.61, "learning_rate": 5.876727988159084e-05, "loss": 0.0077, "step": 620420 }, { "epoch": 1.61, "learning_rate": 5.876339166521938e-05, "loss": 0.0127, "step": 620430 }, { "epoch": 1.61, "learning_rate": 5.8759503448847916e-05, "loss": 0.0114, "step": 620440 }, { "epoch": 1.61, "learning_rate": 5.875561523247645e-05, "loss": 0.008, "step": 620450 }, { "epoch": 1.61, "learning_rate": 5.8751727016104986e-05, "loss": 0.0085, "step": 620460 }, { "epoch": 1.61, "learning_rate": 5.874783879973352e-05, "loss": 0.0093, "step": 620470 }, { "epoch": 1.61, "learning_rate": 5.8743950583362055e-05, "loss": 0.0071, "step": 620480 }, { "epoch": 1.61, "learning_rate": 5.874006236699059e-05, "loss": 0.0112, "step": 620490 }, { "epoch": 1.61, "learning_rate": 5.8736174150619125e-05, "loss": 0.0073, "step": 620500 }, { "epoch": 1.61, "learning_rate": 5.8732285934247667e-05, "loss": 0.0083, "step": 620510 }, { "epoch": 1.61, "learning_rate": 5.87283977178762e-05, "loss": 0.0072, "step": 620520 }, { "epoch": 1.61, "learning_rate": 5.8724509501504736e-05, "loss": 0.0088, "step": 620530 }, { "epoch": 1.61, "learning_rate": 5.872062128513327e-05, "loss": 0.0111, "step": 620540 }, { "epoch": 1.61, "learning_rate": 5.8716733068761806e-05, "loss": 0.0079, "step": 620550 }, { "epoch": 1.61, "learning_rate": 5.871284485239034e-05, "loss": 0.008, "step": 620560 }, { "epoch": 1.61, "learning_rate": 5.8708956636018876e-05, "loss": 0.011, "step": 620570 }, { "epoch": 1.61, "learning_rate": 5.870506841964741e-05, "loss": 0.0089, "step": 620580 }, { "epoch": 1.61, "learning_rate": 5.870118020327595e-05, "loss": 0.0079, "step": 620590 }, { "epoch": 1.61, "learning_rate": 5.869729198690449e-05, "loss": 0.007, "step": 620600 }, { "epoch": 1.61, "learning_rate": 5.869340377053302e-05, "loss": 0.0081, "step": 620610 }, { "epoch": 1.61, "learning_rate": 5.868951555416156e-05, "loss": 0.009, "step": 620620 }, { "epoch": 1.61, "learning_rate": 5.868562733779009e-05, "loss": 0.006, "step": 620630 }, { "epoch": 1.61, "learning_rate": 5.868173912141862e-05, "loss": 0.0086, "step": 620640 }, { "epoch": 1.61, "learning_rate": 5.8677850905047155e-05, "loss": 0.0079, "step": 620650 }, { "epoch": 1.61, "learning_rate": 5.867396268867569e-05, "loss": 0.0091, "step": 620660 }, { "epoch": 1.61, "learning_rate": 5.8670074472304224e-05, "loss": 0.0074, "step": 620670 }, { "epoch": 1.61, "learning_rate": 5.866618625593276e-05, "loss": 0.007, "step": 620680 }, { "epoch": 1.61, "learning_rate": 5.86622980395613e-05, "loss": 0.0083, "step": 620690 }, { "epoch": 1.61, "learning_rate": 5.8658409823189836e-05, "loss": 0.0077, "step": 620700 }, { "epoch": 1.61, "learning_rate": 5.865452160681837e-05, "loss": 0.0073, "step": 620710 }, { "epoch": 1.61, "learning_rate": 5.8650633390446905e-05, "loss": 0.01, "step": 620720 }, { "epoch": 1.61, "learning_rate": 5.864674517407544e-05, "loss": 0.0075, "step": 620730 }, { "epoch": 1.61, "learning_rate": 5.8642856957703975e-05, "loss": 0.0091, "step": 620740 }, { "epoch": 1.61, "learning_rate": 5.863896874133251e-05, "loss": 0.0065, "step": 620750 }, { "epoch": 1.61, "learning_rate": 5.8635080524961045e-05, "loss": 0.0104, "step": 620760 }, { "epoch": 1.61, "learning_rate": 5.8631192308589587e-05, "loss": 0.009, "step": 620770 }, { "epoch": 1.61, "learning_rate": 5.862730409221812e-05, "loss": 0.0056, "step": 620780 }, { "epoch": 1.61, "learning_rate": 5.8623415875846656e-05, "loss": 0.0079, "step": 620790 }, { "epoch": 1.61, "learning_rate": 5.861952765947519e-05, "loss": 0.0081, "step": 620800 }, { "epoch": 1.61, "learning_rate": 5.8615639443103726e-05, "loss": 0.0074, "step": 620810 }, { "epoch": 1.61, "learning_rate": 5.861175122673226e-05, "loss": 0.0121, "step": 620820 }, { "epoch": 1.61, "learning_rate": 5.8607863010360796e-05, "loss": 0.0066, "step": 620830 }, { "epoch": 1.61, "learning_rate": 5.860397479398933e-05, "loss": 0.0104, "step": 620840 }, { "epoch": 1.61, "learning_rate": 5.860008657761787e-05, "loss": 0.0101, "step": 620850 }, { "epoch": 1.61, "learning_rate": 5.859619836124641e-05, "loss": 0.0079, "step": 620860 }, { "epoch": 1.61, "learning_rate": 5.859231014487494e-05, "loss": 0.008, "step": 620870 }, { "epoch": 1.61, "learning_rate": 5.858842192850348e-05, "loss": 0.0092, "step": 620880 }, { "epoch": 1.61, "learning_rate": 5.8584533712132005e-05, "loss": 0.0093, "step": 620890 }, { "epoch": 1.61, "learning_rate": 5.858064549576054e-05, "loss": 0.0102, "step": 620900 }, { "epoch": 1.61, "learning_rate": 5.8576757279389075e-05, "loss": 0.0069, "step": 620910 }, { "epoch": 1.61, "learning_rate": 5.857286906301761e-05, "loss": 0.0114, "step": 620920 }, { "epoch": 1.61, "learning_rate": 5.8568980846646144e-05, "loss": 0.0072, "step": 620930 }, { "epoch": 1.61, "learning_rate": 5.856509263027468e-05, "loss": 0.0072, "step": 620940 }, { "epoch": 1.61, "learning_rate": 5.856120441390322e-05, "loss": 0.0082, "step": 620950 }, { "epoch": 1.61, "learning_rate": 5.8557316197531756e-05, "loss": 0.0101, "step": 620960 }, { "epoch": 1.61, "learning_rate": 5.855342798116029e-05, "loss": 0.01, "step": 620970 }, { "epoch": 1.61, "learning_rate": 5.8549539764788825e-05, "loss": 0.0083, "step": 620980 }, { "epoch": 1.61, "learning_rate": 5.854565154841736e-05, "loss": 0.0074, "step": 620990 }, { "epoch": 1.61, "learning_rate": 5.8541763332045895e-05, "loss": 0.0092, "step": 621000 }, { "epoch": 1.61, "eval_cer": 0.881704085960102, "eval_loss": 0.0054284194484353065, "eval_runtime": 107.746, "eval_samples_per_second": 18.562, "eval_steps_per_second": 4.641, "step": 621000 }, { "epoch": 1.61, "learning_rate": 5.853787511567443e-05, "loss": 0.0138, "step": 621010 }, { "epoch": 1.61, "learning_rate": 5.8533986899302965e-05, "loss": 0.0113, "step": 621020 }, { "epoch": 1.61, "learning_rate": 5.8530098682931507e-05, "loss": 0.0077, "step": 621030 }, { "epoch": 1.61, "learning_rate": 5.852621046656004e-05, "loss": 0.0081, "step": 621040 }, { "epoch": 1.61, "learning_rate": 5.8522322250188576e-05, "loss": 0.008, "step": 621050 }, { "epoch": 1.61, "learning_rate": 5.851843403381711e-05, "loss": 0.0094, "step": 621060 }, { "epoch": 1.61, "learning_rate": 5.8514545817445646e-05, "loss": 0.0089, "step": 621070 }, { "epoch": 1.61, "learning_rate": 5.851065760107418e-05, "loss": 0.0103, "step": 621080 }, { "epoch": 1.61, "learning_rate": 5.8506769384702716e-05, "loss": 0.0078, "step": 621090 }, { "epoch": 1.61, "learning_rate": 5.850288116833125e-05, "loss": 0.0051, "step": 621100 }, { "epoch": 1.61, "learning_rate": 5.849899295195979e-05, "loss": 0.0089, "step": 621110 }, { "epoch": 1.61, "learning_rate": 5.849510473558833e-05, "loss": 0.0083, "step": 621120 }, { "epoch": 1.61, "learning_rate": 5.849121651921686e-05, "loss": 0.0077, "step": 621130 }, { "epoch": 1.61, "learning_rate": 5.848732830284539e-05, "loss": 0.0076, "step": 621140 }, { "epoch": 1.61, "learning_rate": 5.8483440086473925e-05, "loss": 0.0088, "step": 621150 }, { "epoch": 1.61, "learning_rate": 5.847955187010246e-05, "loss": 0.0105, "step": 621160 }, { "epoch": 1.61, "learning_rate": 5.8475663653730995e-05, "loss": 0.0077, "step": 621170 }, { "epoch": 1.61, "learning_rate": 5.847177543735953e-05, "loss": 0.0082, "step": 621180 }, { "epoch": 1.61, "learning_rate": 5.8467887220988064e-05, "loss": 0.0091, "step": 621190 }, { "epoch": 1.61, "learning_rate": 5.84639990046166e-05, "loss": 0.0103, "step": 621200 }, { "epoch": 1.61, "learning_rate": 5.846011078824514e-05, "loss": 0.0123, "step": 621210 }, { "epoch": 1.61, "learning_rate": 5.8456222571873676e-05, "loss": 0.0088, "step": 621220 }, { "epoch": 1.61, "learning_rate": 5.845233435550221e-05, "loss": 0.0067, "step": 621230 }, { "epoch": 1.61, "learning_rate": 5.8448446139130745e-05, "loss": 0.0099, "step": 621240 }, { "epoch": 1.61, "learning_rate": 5.844455792275928e-05, "loss": 0.0075, "step": 621250 }, { "epoch": 1.61, "learning_rate": 5.8440669706387815e-05, "loss": 0.0109, "step": 621260 }, { "epoch": 1.61, "learning_rate": 5.843678149001635e-05, "loss": 0.0086, "step": 621270 }, { "epoch": 1.61, "learning_rate": 5.8432893273644885e-05, "loss": 0.0079, "step": 621280 }, { "epoch": 1.61, "learning_rate": 5.8429005057273426e-05, "loss": 0.0073, "step": 621290 }, { "epoch": 1.61, "learning_rate": 5.842511684090196e-05, "loss": 0.0109, "step": 621300 }, { "epoch": 1.61, "learning_rate": 5.8421228624530496e-05, "loss": 0.0105, "step": 621310 }, { "epoch": 1.61, "learning_rate": 5.841734040815903e-05, "loss": 0.0084, "step": 621320 }, { "epoch": 1.61, "learning_rate": 5.8413452191787566e-05, "loss": 0.0074, "step": 621330 }, { "epoch": 1.61, "learning_rate": 5.84095639754161e-05, "loss": 0.0066, "step": 621340 }, { "epoch": 1.61, "learning_rate": 5.8405675759044636e-05, "loss": 0.0099, "step": 621350 }, { "epoch": 1.61, "learning_rate": 5.840178754267317e-05, "loss": 0.0106, "step": 621360 }, { "epoch": 1.61, "learning_rate": 5.8397899326301705e-05, "loss": 0.0089, "step": 621370 }, { "epoch": 1.61, "learning_rate": 5.839401110993025e-05, "loss": 0.0095, "step": 621380 }, { "epoch": 1.61, "learning_rate": 5.8390122893558775e-05, "loss": 0.0075, "step": 621390 }, { "epoch": 1.61, "learning_rate": 5.838623467718731e-05, "loss": 0.0111, "step": 621400 }, { "epoch": 1.61, "learning_rate": 5.8382346460815845e-05, "loss": 0.006, "step": 621410 }, { "epoch": 1.61, "learning_rate": 5.837845824444438e-05, "loss": 0.0074, "step": 621420 }, { "epoch": 1.61, "learning_rate": 5.8374570028072915e-05, "loss": 0.0074, "step": 621430 }, { "epoch": 1.61, "learning_rate": 5.837068181170145e-05, "loss": 0.0079, "step": 621440 }, { "epoch": 1.61, "learning_rate": 5.8366793595329984e-05, "loss": 0.0101, "step": 621450 }, { "epoch": 1.61, "learning_rate": 5.836290537895852e-05, "loss": 0.009, "step": 621460 }, { "epoch": 1.61, "learning_rate": 5.8359017162587054e-05, "loss": 0.0066, "step": 621470 }, { "epoch": 1.61, "learning_rate": 5.8355128946215596e-05, "loss": 0.0106, "step": 621480 }, { "epoch": 1.61, "learning_rate": 5.835124072984413e-05, "loss": 0.0084, "step": 621490 }, { "epoch": 1.61, "learning_rate": 5.8347352513472665e-05, "loss": 0.0092, "step": 621500 }, { "epoch": 1.61, "learning_rate": 5.83434642971012e-05, "loss": 0.0077, "step": 621510 }, { "epoch": 1.61, "learning_rate": 5.8339576080729735e-05, "loss": 0.0076, "step": 621520 }, { "epoch": 1.61, "learning_rate": 5.833568786435827e-05, "loss": 0.0085, "step": 621530 }, { "epoch": 1.61, "learning_rate": 5.8331799647986805e-05, "loss": 0.009, "step": 621540 }, { "epoch": 1.61, "learning_rate": 5.832791143161534e-05, "loss": 0.0077, "step": 621550 }, { "epoch": 1.61, "learning_rate": 5.832402321524388e-05, "loss": 0.0066, "step": 621560 }, { "epoch": 1.61, "learning_rate": 5.8320134998872416e-05, "loss": 0.0072, "step": 621570 }, { "epoch": 1.61, "learning_rate": 5.831624678250095e-05, "loss": 0.0097, "step": 621580 }, { "epoch": 1.61, "learning_rate": 5.8312358566129486e-05, "loss": 0.0096, "step": 621590 }, { "epoch": 1.61, "learning_rate": 5.830847034975802e-05, "loss": 0.0071, "step": 621600 }, { "epoch": 1.61, "learning_rate": 5.8304582133386556e-05, "loss": 0.0076, "step": 621610 }, { "epoch": 1.61, "learning_rate": 5.830069391701509e-05, "loss": 0.007, "step": 621620 }, { "epoch": 1.61, "learning_rate": 5.8296805700643625e-05, "loss": 0.0081, "step": 621630 }, { "epoch": 1.61, "learning_rate": 5.829291748427215e-05, "loss": 0.0075, "step": 621640 }, { "epoch": 1.61, "learning_rate": 5.828902926790069e-05, "loss": 0.0106, "step": 621650 }, { "epoch": 1.61, "learning_rate": 5.828514105152923e-05, "loss": 0.0085, "step": 621660 }, { "epoch": 1.61, "learning_rate": 5.8281252835157765e-05, "loss": 0.0078, "step": 621670 }, { "epoch": 1.61, "learning_rate": 5.82773646187863e-05, "loss": 0.007, "step": 621680 }, { "epoch": 1.61, "learning_rate": 5.8273476402414834e-05, "loss": 0.0078, "step": 621690 }, { "epoch": 1.61, "learning_rate": 5.826958818604337e-05, "loss": 0.0097, "step": 621700 }, { "epoch": 1.61, "learning_rate": 5.8265699969671904e-05, "loss": 0.0073, "step": 621710 }, { "epoch": 1.61, "learning_rate": 5.826181175330044e-05, "loss": 0.0082, "step": 621720 }, { "epoch": 1.61, "learning_rate": 5.8257923536928974e-05, "loss": 0.0089, "step": 621730 }, { "epoch": 1.61, "learning_rate": 5.8254035320557516e-05, "loss": 0.0079, "step": 621740 }, { "epoch": 1.61, "learning_rate": 5.825014710418605e-05, "loss": 0.0114, "step": 621750 }, { "epoch": 1.61, "learning_rate": 5.8246258887814585e-05, "loss": 0.008, "step": 621760 }, { "epoch": 1.61, "learning_rate": 5.824237067144312e-05, "loss": 0.0098, "step": 621770 }, { "epoch": 1.61, "learning_rate": 5.8238482455071655e-05, "loss": 0.0062, "step": 621780 }, { "epoch": 1.61, "learning_rate": 5.823459423870019e-05, "loss": 0.0113, "step": 621790 }, { "epoch": 1.61, "learning_rate": 5.8230706022328725e-05, "loss": 0.0068, "step": 621800 }, { "epoch": 1.61, "learning_rate": 5.822681780595726e-05, "loss": 0.0098, "step": 621810 }, { "epoch": 1.61, "learning_rate": 5.82229295895858e-05, "loss": 0.0122, "step": 621820 }, { "epoch": 1.61, "learning_rate": 5.8219041373214336e-05, "loss": 0.0097, "step": 621830 }, { "epoch": 1.61, "learning_rate": 5.821515315684287e-05, "loss": 0.0074, "step": 621840 }, { "epoch": 1.61, "learning_rate": 5.8211264940471406e-05, "loss": 0.0069, "step": 621850 }, { "epoch": 1.61, "learning_rate": 5.820737672409994e-05, "loss": 0.007, "step": 621860 }, { "epoch": 1.61, "learning_rate": 5.8203488507728476e-05, "loss": 0.008, "step": 621870 }, { "epoch": 1.61, "learning_rate": 5.8199600291357004e-05, "loss": 0.0098, "step": 621880 }, { "epoch": 1.61, "learning_rate": 5.819571207498554e-05, "loss": 0.0065, "step": 621890 }, { "epoch": 1.61, "learning_rate": 5.819182385861407e-05, "loss": 0.0085, "step": 621900 }, { "epoch": 1.61, "learning_rate": 5.818793564224261e-05, "loss": 0.0075, "step": 621910 }, { "epoch": 1.61, "learning_rate": 5.818404742587115e-05, "loss": 0.0083, "step": 621920 }, { "epoch": 1.61, "learning_rate": 5.8180159209499685e-05, "loss": 0.0083, "step": 621930 }, { "epoch": 1.61, "learning_rate": 5.817627099312822e-05, "loss": 0.0085, "step": 621940 }, { "epoch": 1.61, "learning_rate": 5.8172382776756754e-05, "loss": 0.0088, "step": 621950 }, { "epoch": 1.61, "learning_rate": 5.816849456038529e-05, "loss": 0.0122, "step": 621960 }, { "epoch": 1.61, "learning_rate": 5.8164606344013824e-05, "loss": 0.006, "step": 621970 }, { "epoch": 1.61, "learning_rate": 5.816071812764236e-05, "loss": 0.0066, "step": 621980 }, { "epoch": 1.61, "learning_rate": 5.8156829911270894e-05, "loss": 0.0066, "step": 621990 }, { "epoch": 1.61, "learning_rate": 5.8152941694899436e-05, "loss": 0.0106, "step": 622000 }, { "epoch": 1.61, "eval_cer": 0.881688689953826, "eval_loss": 0.005423935130238533, "eval_runtime": 108.0541, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 622000 }, { "epoch": 1.61, "learning_rate": 5.814905347852797e-05, "loss": 0.0078, "step": 622010 }, { "epoch": 1.61, "learning_rate": 5.8145165262156505e-05, "loss": 0.0088, "step": 622020 }, { "epoch": 1.61, "learning_rate": 5.814127704578504e-05, "loss": 0.0119, "step": 622030 }, { "epoch": 1.61, "learning_rate": 5.8137388829413575e-05, "loss": 0.0068, "step": 622040 }, { "epoch": 1.61, "learning_rate": 5.813350061304211e-05, "loss": 0.0105, "step": 622050 }, { "epoch": 1.61, "learning_rate": 5.8129612396670645e-05, "loss": 0.0076, "step": 622060 }, { "epoch": 1.61, "learning_rate": 5.812572418029918e-05, "loss": 0.0064, "step": 622070 }, { "epoch": 1.61, "learning_rate": 5.812183596392772e-05, "loss": 0.0074, "step": 622080 }, { "epoch": 1.61, "learning_rate": 5.8117947747556256e-05, "loss": 0.0076, "step": 622090 }, { "epoch": 1.61, "learning_rate": 5.811405953118479e-05, "loss": 0.008, "step": 622100 }, { "epoch": 1.61, "learning_rate": 5.8110171314813326e-05, "loss": 0.0067, "step": 622110 }, { "epoch": 1.61, "learning_rate": 5.810628309844186e-05, "loss": 0.008, "step": 622120 }, { "epoch": 1.61, "learning_rate": 5.810239488207039e-05, "loss": 0.0111, "step": 622130 }, { "epoch": 1.61, "learning_rate": 5.8098506665698924e-05, "loss": 0.0098, "step": 622140 }, { "epoch": 1.61, "learning_rate": 5.809461844932746e-05, "loss": 0.0081, "step": 622150 }, { "epoch": 1.61, "learning_rate": 5.809073023295599e-05, "loss": 0.0096, "step": 622160 }, { "epoch": 1.61, "learning_rate": 5.808684201658453e-05, "loss": 0.0102, "step": 622170 }, { "epoch": 1.61, "learning_rate": 5.808295380021307e-05, "loss": 0.0111, "step": 622180 }, { "epoch": 1.61, "learning_rate": 5.8079065583841605e-05, "loss": 0.0095, "step": 622190 }, { "epoch": 1.61, "learning_rate": 5.807517736747014e-05, "loss": 0.0067, "step": 622200 }, { "epoch": 1.61, "learning_rate": 5.8071289151098674e-05, "loss": 0.0108, "step": 622210 }, { "epoch": 1.61, "learning_rate": 5.806740093472721e-05, "loss": 0.0091, "step": 622220 }, { "epoch": 1.61, "learning_rate": 5.8063512718355744e-05, "loss": 0.0111, "step": 622230 }, { "epoch": 1.61, "learning_rate": 5.805962450198428e-05, "loss": 0.007, "step": 622240 }, { "epoch": 1.61, "learning_rate": 5.8055736285612814e-05, "loss": 0.007, "step": 622250 }, { "epoch": 1.61, "learning_rate": 5.8051848069241355e-05, "loss": 0.0073, "step": 622260 }, { "epoch": 1.61, "learning_rate": 5.804795985286989e-05, "loss": 0.0107, "step": 622270 }, { "epoch": 1.61, "learning_rate": 5.8044071636498425e-05, "loss": 0.0088, "step": 622280 }, { "epoch": 1.61, "learning_rate": 5.804018342012696e-05, "loss": 0.0092, "step": 622290 }, { "epoch": 1.61, "learning_rate": 5.8036295203755495e-05, "loss": 0.0081, "step": 622300 }, { "epoch": 1.61, "learning_rate": 5.803240698738403e-05, "loss": 0.0098, "step": 622310 }, { "epoch": 1.61, "learning_rate": 5.8028518771012565e-05, "loss": 0.0094, "step": 622320 }, { "epoch": 1.61, "learning_rate": 5.80246305546411e-05, "loss": 0.008, "step": 622330 }, { "epoch": 1.61, "learning_rate": 5.802074233826964e-05, "loss": 0.008, "step": 622340 }, { "epoch": 1.61, "learning_rate": 5.8016854121898176e-05, "loss": 0.0089, "step": 622350 }, { "epoch": 1.61, "learning_rate": 5.801296590552671e-05, "loss": 0.0118, "step": 622360 }, { "epoch": 1.61, "learning_rate": 5.8009077689155246e-05, "loss": 0.0084, "step": 622370 }, { "epoch": 1.61, "learning_rate": 5.8005189472783774e-05, "loss": 0.0078, "step": 622380 }, { "epoch": 1.61, "learning_rate": 5.800130125641231e-05, "loss": 0.0075, "step": 622390 }, { "epoch": 1.61, "learning_rate": 5.7997413040040844e-05, "loss": 0.0072, "step": 622400 }, { "epoch": 1.61, "learning_rate": 5.799352482366938e-05, "loss": 0.0077, "step": 622410 }, { "epoch": 1.61, "learning_rate": 5.798963660729791e-05, "loss": 0.0105, "step": 622420 }, { "epoch": 1.61, "learning_rate": 5.798574839092645e-05, "loss": 0.0069, "step": 622430 }, { "epoch": 1.61, "learning_rate": 5.798186017455499e-05, "loss": 0.0078, "step": 622440 }, { "epoch": 1.61, "learning_rate": 5.7977971958183525e-05, "loss": 0.0107, "step": 622450 }, { "epoch": 1.61, "learning_rate": 5.797408374181206e-05, "loss": 0.0093, "step": 622460 }, { "epoch": 1.61, "learning_rate": 5.7970195525440594e-05, "loss": 0.0062, "step": 622470 }, { "epoch": 1.61, "learning_rate": 5.796630730906913e-05, "loss": 0.0117, "step": 622480 }, { "epoch": 1.61, "learning_rate": 5.7962419092697664e-05, "loss": 0.0114, "step": 622490 }, { "epoch": 1.61, "learning_rate": 5.79585308763262e-05, "loss": 0.0085, "step": 622500 }, { "epoch": 1.61, "learning_rate": 5.7954642659954734e-05, "loss": 0.0102, "step": 622510 }, { "epoch": 1.61, "learning_rate": 5.7950754443583275e-05, "loss": 0.0084, "step": 622520 }, { "epoch": 1.61, "learning_rate": 5.794686622721181e-05, "loss": 0.0068, "step": 622530 }, { "epoch": 1.61, "learning_rate": 5.7942978010840345e-05, "loss": 0.0067, "step": 622540 }, { "epoch": 1.61, "learning_rate": 5.793908979446888e-05, "loss": 0.0083, "step": 622550 }, { "epoch": 1.61, "learning_rate": 5.7935201578097415e-05, "loss": 0.0086, "step": 622560 }, { "epoch": 1.61, "learning_rate": 5.793131336172595e-05, "loss": 0.0076, "step": 622570 }, { "epoch": 1.61, "learning_rate": 5.7927425145354485e-05, "loss": 0.0134, "step": 622580 }, { "epoch": 1.61, "learning_rate": 5.792353692898302e-05, "loss": 0.0087, "step": 622590 }, { "epoch": 1.61, "learning_rate": 5.791964871261156e-05, "loss": 0.0081, "step": 622600 }, { "epoch": 1.61, "learning_rate": 5.7915760496240096e-05, "loss": 0.0081, "step": 622610 }, { "epoch": 1.61, "learning_rate": 5.791187227986863e-05, "loss": 0.0095, "step": 622620 }, { "epoch": 1.61, "learning_rate": 5.790798406349716e-05, "loss": 0.0106, "step": 622630 }, { "epoch": 1.61, "learning_rate": 5.7904095847125694e-05, "loss": 0.0081, "step": 622640 }, { "epoch": 1.61, "learning_rate": 5.790020763075423e-05, "loss": 0.0103, "step": 622650 }, { "epoch": 1.61, "learning_rate": 5.7896319414382763e-05, "loss": 0.0089, "step": 622660 }, { "epoch": 1.61, "learning_rate": 5.78924311980113e-05, "loss": 0.0093, "step": 622670 }, { "epoch": 1.61, "learning_rate": 5.788854298163983e-05, "loss": 0.0089, "step": 622680 }, { "epoch": 1.61, "learning_rate": 5.788465476526837e-05, "loss": 0.0077, "step": 622690 }, { "epoch": 1.61, "learning_rate": 5.788076654889691e-05, "loss": 0.009, "step": 622700 }, { "epoch": 1.61, "learning_rate": 5.7876878332525445e-05, "loss": 0.0092, "step": 622710 }, { "epoch": 1.61, "learning_rate": 5.787299011615398e-05, "loss": 0.0102, "step": 622720 }, { "epoch": 1.61, "learning_rate": 5.7869101899782514e-05, "loss": 0.008, "step": 622730 }, { "epoch": 1.61, "learning_rate": 5.786521368341105e-05, "loss": 0.0103, "step": 622740 }, { "epoch": 1.61, "learning_rate": 5.7861325467039584e-05, "loss": 0.0077, "step": 622750 }, { "epoch": 1.61, "learning_rate": 5.785743725066812e-05, "loss": 0.0078, "step": 622760 }, { "epoch": 1.61, "learning_rate": 5.7853549034296654e-05, "loss": 0.0061, "step": 622770 }, { "epoch": 1.61, "learning_rate": 5.784966081792519e-05, "loss": 0.009, "step": 622780 }, { "epoch": 1.61, "learning_rate": 5.784577260155373e-05, "loss": 0.0089, "step": 622790 }, { "epoch": 1.61, "learning_rate": 5.7841884385182265e-05, "loss": 0.0091, "step": 622800 }, { "epoch": 1.61, "learning_rate": 5.78379961688108e-05, "loss": 0.0089, "step": 622810 }, { "epoch": 1.61, "learning_rate": 5.7834107952439335e-05, "loss": 0.0089, "step": 622820 }, { "epoch": 1.61, "learning_rate": 5.783021973606787e-05, "loss": 0.0081, "step": 622830 }, { "epoch": 1.61, "learning_rate": 5.7826331519696405e-05, "loss": 0.0074, "step": 622840 }, { "epoch": 1.61, "learning_rate": 5.782244330332494e-05, "loss": 0.0061, "step": 622850 }, { "epoch": 1.61, "learning_rate": 5.7818555086953474e-05, "loss": 0.0078, "step": 622860 }, { "epoch": 1.61, "learning_rate": 5.7814666870582016e-05, "loss": 0.0088, "step": 622870 }, { "epoch": 1.61, "learning_rate": 5.781077865421054e-05, "loss": 0.0097, "step": 622880 }, { "epoch": 1.61, "learning_rate": 5.780689043783908e-05, "loss": 0.0079, "step": 622890 }, { "epoch": 1.61, "learning_rate": 5.7803002221467614e-05, "loss": 0.0072, "step": 622900 }, { "epoch": 1.61, "learning_rate": 5.779911400509615e-05, "loss": 0.0087, "step": 622910 }, { "epoch": 1.61, "learning_rate": 5.7795225788724683e-05, "loss": 0.0079, "step": 622920 }, { "epoch": 1.61, "learning_rate": 5.779133757235322e-05, "loss": 0.0117, "step": 622930 }, { "epoch": 1.61, "learning_rate": 5.778744935598175e-05, "loss": 0.0119, "step": 622940 }, { "epoch": 1.61, "learning_rate": 5.778356113961029e-05, "loss": 0.008, "step": 622950 }, { "epoch": 1.61, "learning_rate": 5.777967292323882e-05, "loss": 0.0098, "step": 622960 }, { "epoch": 1.61, "learning_rate": 5.7775784706867365e-05, "loss": 0.0075, "step": 622970 }, { "epoch": 1.61, "learning_rate": 5.77718964904959e-05, "loss": 0.0073, "step": 622980 }, { "epoch": 1.61, "learning_rate": 5.7768008274124434e-05, "loss": 0.0078, "step": 622990 }, { "epoch": 1.61, "learning_rate": 5.776412005775297e-05, "loss": 0.0109, "step": 623000 }, { "epoch": 1.61, "eval_cer": 0.8816634964890108, "eval_loss": 0.005499746184796095, "eval_runtime": 107.9534, "eval_samples_per_second": 18.527, "eval_steps_per_second": 4.632, "step": 623000 }, { "epoch": 1.61, "learning_rate": 5.7760231841381504e-05, "loss": 0.0086, "step": 623010 }, { "epoch": 1.61, "learning_rate": 5.775634362501004e-05, "loss": 0.0082, "step": 623020 }, { "epoch": 1.61, "learning_rate": 5.7752455408638574e-05, "loss": 0.0082, "step": 623030 }, { "epoch": 1.62, "learning_rate": 5.774856719226711e-05, "loss": 0.0071, "step": 623040 }, { "epoch": 1.62, "learning_rate": 5.774467897589565e-05, "loss": 0.0083, "step": 623050 }, { "epoch": 1.62, "learning_rate": 5.7740790759524185e-05, "loss": 0.0066, "step": 623060 }, { "epoch": 1.62, "learning_rate": 5.773690254315272e-05, "loss": 0.0068, "step": 623070 }, { "epoch": 1.62, "learning_rate": 5.7733014326781255e-05, "loss": 0.009, "step": 623080 }, { "epoch": 1.62, "learning_rate": 5.772912611040979e-05, "loss": 0.014, "step": 623090 }, { "epoch": 1.62, "learning_rate": 5.7725237894038324e-05, "loss": 0.0103, "step": 623100 }, { "epoch": 1.62, "learning_rate": 5.772134967766686e-05, "loss": 0.0091, "step": 623110 }, { "epoch": 1.62, "learning_rate": 5.771746146129539e-05, "loss": 0.0086, "step": 623120 }, { "epoch": 1.62, "learning_rate": 5.771357324492392e-05, "loss": 0.0074, "step": 623130 }, { "epoch": 1.62, "learning_rate": 5.770968502855246e-05, "loss": 0.0116, "step": 623140 }, { "epoch": 1.62, "learning_rate": 5.7705796812181e-05, "loss": 0.009, "step": 623150 }, { "epoch": 1.62, "learning_rate": 5.7701908595809534e-05, "loss": 0.0077, "step": 623160 }, { "epoch": 1.62, "learning_rate": 5.769802037943807e-05, "loss": 0.0091, "step": 623170 }, { "epoch": 1.62, "learning_rate": 5.76941321630666e-05, "loss": 0.0083, "step": 623180 }, { "epoch": 1.62, "learning_rate": 5.769024394669514e-05, "loss": 0.0073, "step": 623190 }, { "epoch": 1.62, "learning_rate": 5.768635573032367e-05, "loss": 0.008, "step": 623200 }, { "epoch": 1.62, "learning_rate": 5.768246751395221e-05, "loss": 0.0081, "step": 623210 }, { "epoch": 1.62, "learning_rate": 5.767857929758074e-05, "loss": 0.0084, "step": 623220 }, { "epoch": 1.62, "learning_rate": 5.7674691081209284e-05, "loss": 0.0079, "step": 623230 }, { "epoch": 1.62, "learning_rate": 5.767080286483782e-05, "loss": 0.008, "step": 623240 }, { "epoch": 1.62, "learning_rate": 5.7666914648466354e-05, "loss": 0.0077, "step": 623250 }, { "epoch": 1.62, "learning_rate": 5.766302643209489e-05, "loss": 0.0094, "step": 623260 }, { "epoch": 1.62, "learning_rate": 5.7659138215723424e-05, "loss": 0.0063, "step": 623270 }, { "epoch": 1.62, "learning_rate": 5.765524999935196e-05, "loss": 0.0072, "step": 623280 }, { "epoch": 1.62, "learning_rate": 5.7651361782980494e-05, "loss": 0.0103, "step": 623290 }, { "epoch": 1.62, "learning_rate": 5.764747356660903e-05, "loss": 0.0076, "step": 623300 }, { "epoch": 1.62, "learning_rate": 5.764358535023757e-05, "loss": 0.007, "step": 623310 }, { "epoch": 1.62, "learning_rate": 5.7639697133866105e-05, "loss": 0.0072, "step": 623320 }, { "epoch": 1.62, "learning_rate": 5.763580891749464e-05, "loss": 0.0093, "step": 623330 }, { "epoch": 1.62, "learning_rate": 5.7631920701123175e-05, "loss": 0.0074, "step": 623340 }, { "epoch": 1.62, "learning_rate": 5.762803248475171e-05, "loss": 0.0091, "step": 623350 }, { "epoch": 1.62, "learning_rate": 5.7624144268380244e-05, "loss": 0.0105, "step": 623360 }, { "epoch": 1.62, "learning_rate": 5.762025605200877e-05, "loss": 0.0089, "step": 623370 }, { "epoch": 1.62, "learning_rate": 5.761636783563731e-05, "loss": 0.0077, "step": 623380 }, { "epoch": 1.62, "learning_rate": 5.761247961926584e-05, "loss": 0.0088, "step": 623390 }, { "epoch": 1.62, "learning_rate": 5.760859140289438e-05, "loss": 0.0073, "step": 623400 }, { "epoch": 1.62, "learning_rate": 5.760470318652292e-05, "loss": 0.0065, "step": 623410 }, { "epoch": 1.62, "learning_rate": 5.7600814970151454e-05, "loss": 0.0081, "step": 623420 }, { "epoch": 1.62, "learning_rate": 5.759692675377999e-05, "loss": 0.0087, "step": 623430 }, { "epoch": 1.62, "learning_rate": 5.759303853740852e-05, "loss": 0.0083, "step": 623440 }, { "epoch": 1.62, "learning_rate": 5.758915032103706e-05, "loss": 0.0062, "step": 623450 }, { "epoch": 1.62, "learning_rate": 5.758526210466559e-05, "loss": 0.0067, "step": 623460 }, { "epoch": 1.62, "learning_rate": 5.758137388829413e-05, "loss": 0.0103, "step": 623470 }, { "epoch": 1.62, "learning_rate": 5.757748567192266e-05, "loss": 0.0081, "step": 623480 }, { "epoch": 1.62, "learning_rate": 5.7573597455551204e-05, "loss": 0.0085, "step": 623490 }, { "epoch": 1.62, "learning_rate": 5.756970923917974e-05, "loss": 0.0081, "step": 623500 }, { "epoch": 1.62, "learning_rate": 5.7565821022808274e-05, "loss": 0.0087, "step": 623510 }, { "epoch": 1.62, "learning_rate": 5.756193280643681e-05, "loss": 0.0072, "step": 623520 }, { "epoch": 1.62, "learning_rate": 5.7558044590065344e-05, "loss": 0.0079, "step": 623530 }, { "epoch": 1.62, "learning_rate": 5.755415637369388e-05, "loss": 0.01, "step": 623540 }, { "epoch": 1.62, "learning_rate": 5.7550268157322414e-05, "loss": 0.0073, "step": 623550 }, { "epoch": 1.62, "learning_rate": 5.754637994095095e-05, "loss": 0.0109, "step": 623560 }, { "epoch": 1.62, "learning_rate": 5.754249172457949e-05, "loss": 0.0079, "step": 623570 }, { "epoch": 1.62, "learning_rate": 5.7538603508208025e-05, "loss": 0.0076, "step": 623580 }, { "epoch": 1.62, "learning_rate": 5.753471529183656e-05, "loss": 0.0074, "step": 623590 }, { "epoch": 1.62, "learning_rate": 5.7530827075465095e-05, "loss": 0.0081, "step": 623600 }, { "epoch": 1.62, "learning_rate": 5.752693885909363e-05, "loss": 0.0077, "step": 623610 }, { "epoch": 1.62, "learning_rate": 5.752305064272216e-05, "loss": 0.0074, "step": 623620 }, { "epoch": 1.62, "learning_rate": 5.751916242635069e-05, "loss": 0.0095, "step": 623630 }, { "epoch": 1.62, "learning_rate": 5.751527420997923e-05, "loss": 0.0078, "step": 623640 }, { "epoch": 1.62, "learning_rate": 5.751138599360776e-05, "loss": 0.0088, "step": 623650 }, { "epoch": 1.62, "learning_rate": 5.75074977772363e-05, "loss": 0.0084, "step": 623660 }, { "epoch": 1.62, "learning_rate": 5.750360956086484e-05, "loss": 0.0079, "step": 623670 }, { "epoch": 1.62, "learning_rate": 5.7499721344493374e-05, "loss": 0.0081, "step": 623680 }, { "epoch": 1.62, "learning_rate": 5.749583312812191e-05, "loss": 0.0074, "step": 623690 }, { "epoch": 1.62, "learning_rate": 5.749194491175044e-05, "loss": 0.0081, "step": 623700 }, { "epoch": 1.62, "learning_rate": 5.748805669537898e-05, "loss": 0.0131, "step": 623710 }, { "epoch": 1.62, "learning_rate": 5.748416847900751e-05, "loss": 0.0096, "step": 623720 }, { "epoch": 1.62, "learning_rate": 5.748028026263605e-05, "loss": 0.0059, "step": 623730 }, { "epoch": 1.62, "learning_rate": 5.747639204626458e-05, "loss": 0.0076, "step": 623740 }, { "epoch": 1.62, "learning_rate": 5.7472503829893124e-05, "loss": 0.0079, "step": 623750 }, { "epoch": 1.62, "learning_rate": 5.746861561352166e-05, "loss": 0.0092, "step": 623760 }, { "epoch": 1.62, "learning_rate": 5.7464727397150194e-05, "loss": 0.0093, "step": 623770 }, { "epoch": 1.62, "learning_rate": 5.746083918077873e-05, "loss": 0.0097, "step": 623780 }, { "epoch": 1.62, "learning_rate": 5.7456950964407264e-05, "loss": 0.0114, "step": 623790 }, { "epoch": 1.62, "learning_rate": 5.74530627480358e-05, "loss": 0.0065, "step": 623800 }, { "epoch": 1.62, "learning_rate": 5.7449174531664334e-05, "loss": 0.0091, "step": 623810 }, { "epoch": 1.62, "learning_rate": 5.744528631529287e-05, "loss": 0.0065, "step": 623820 }, { "epoch": 1.62, "learning_rate": 5.744139809892141e-05, "loss": 0.0074, "step": 623830 }, { "epoch": 1.62, "learning_rate": 5.7437509882549945e-05, "loss": 0.0114, "step": 623840 }, { "epoch": 1.62, "learning_rate": 5.743362166617848e-05, "loss": 0.0092, "step": 623850 }, { "epoch": 1.62, "learning_rate": 5.7429733449807015e-05, "loss": 0.0086, "step": 623860 }, { "epoch": 1.62, "learning_rate": 5.742584523343554e-05, "loss": 0.0078, "step": 623870 }, { "epoch": 1.62, "learning_rate": 5.742195701706408e-05, "loss": 0.0085, "step": 623880 }, { "epoch": 1.62, "learning_rate": 5.741806880069261e-05, "loss": 0.0085, "step": 623890 }, { "epoch": 1.62, "learning_rate": 5.741418058432115e-05, "loss": 0.0086, "step": 623900 }, { "epoch": 1.62, "learning_rate": 5.741029236794968e-05, "loss": 0.0097, "step": 623910 }, { "epoch": 1.62, "learning_rate": 5.740640415157822e-05, "loss": 0.0068, "step": 623920 }, { "epoch": 1.62, "learning_rate": 5.740251593520676e-05, "loss": 0.01, "step": 623930 }, { "epoch": 1.62, "learning_rate": 5.7398627718835294e-05, "loss": 0.0072, "step": 623940 }, { "epoch": 1.62, "learning_rate": 5.739473950246383e-05, "loss": 0.0094, "step": 623950 }, { "epoch": 1.62, "learning_rate": 5.739085128609236e-05, "loss": 0.0081, "step": 623960 }, { "epoch": 1.62, "learning_rate": 5.73869630697209e-05, "loss": 0.0083, "step": 623970 }, { "epoch": 1.62, "learning_rate": 5.738307485334943e-05, "loss": 0.0067, "step": 623980 }, { "epoch": 1.62, "learning_rate": 5.737918663697797e-05, "loss": 0.0101, "step": 623990 }, { "epoch": 1.62, "learning_rate": 5.73752984206065e-05, "loss": 0.0086, "step": 624000 }, { "epoch": 1.62, "eval_cer": 0.8816634964890108, "eval_loss": 0.005575355142354965, "eval_runtime": 107.7874, "eval_samples_per_second": 18.555, "eval_steps_per_second": 4.639, "step": 624000 }, { "epoch": 1.62, "learning_rate": 5.7371410204235044e-05, "loss": 0.009, "step": 624010 }, { "epoch": 1.62, "learning_rate": 5.736752198786358e-05, "loss": 0.0066, "step": 624020 }, { "epoch": 1.62, "learning_rate": 5.7363633771492114e-05, "loss": 0.007, "step": 624030 }, { "epoch": 1.62, "learning_rate": 5.735974555512065e-05, "loss": 0.0092, "step": 624040 }, { "epoch": 1.62, "learning_rate": 5.7355857338749184e-05, "loss": 0.0092, "step": 624050 }, { "epoch": 1.62, "learning_rate": 5.735196912237772e-05, "loss": 0.0084, "step": 624060 }, { "epoch": 1.62, "learning_rate": 5.7348080906006253e-05, "loss": 0.01, "step": 624070 }, { "epoch": 1.62, "learning_rate": 5.734419268963479e-05, "loss": 0.0102, "step": 624080 }, { "epoch": 1.62, "learning_rate": 5.734030447326332e-05, "loss": 0.0083, "step": 624090 }, { "epoch": 1.62, "learning_rate": 5.7336416256891865e-05, "loss": 0.008, "step": 624100 }, { "epoch": 1.62, "learning_rate": 5.73325280405204e-05, "loss": 0.0078, "step": 624110 }, { "epoch": 1.62, "learning_rate": 5.732863982414893e-05, "loss": 0.0085, "step": 624120 }, { "epoch": 1.62, "learning_rate": 5.732475160777746e-05, "loss": 0.0147, "step": 624130 }, { "epoch": 1.62, "learning_rate": 5.7320863391406e-05, "loss": 0.0068, "step": 624140 }, { "epoch": 1.62, "learning_rate": 5.731697517503453e-05, "loss": 0.0066, "step": 624150 }, { "epoch": 1.62, "learning_rate": 5.731308695866307e-05, "loss": 0.0069, "step": 624160 }, { "epoch": 1.62, "learning_rate": 5.73091987422916e-05, "loss": 0.0062, "step": 624170 }, { "epoch": 1.62, "learning_rate": 5.730531052592014e-05, "loss": 0.0082, "step": 624180 }, { "epoch": 1.62, "learning_rate": 5.730142230954867e-05, "loss": 0.0081, "step": 624190 }, { "epoch": 1.62, "learning_rate": 5.7297534093177213e-05, "loss": 0.0077, "step": 624200 }, { "epoch": 1.62, "learning_rate": 5.729364587680575e-05, "loss": 0.0093, "step": 624210 }, { "epoch": 1.62, "learning_rate": 5.728975766043428e-05, "loss": 0.0082, "step": 624220 }, { "epoch": 1.62, "learning_rate": 5.728586944406282e-05, "loss": 0.0086, "step": 624230 }, { "epoch": 1.62, "learning_rate": 5.728198122769135e-05, "loss": 0.007, "step": 624240 }, { "epoch": 1.62, "learning_rate": 5.727809301131989e-05, "loss": 0.0077, "step": 624250 }, { "epoch": 1.62, "learning_rate": 5.727420479494842e-05, "loss": 0.0093, "step": 624260 }, { "epoch": 1.62, "learning_rate": 5.727031657857696e-05, "loss": 0.0084, "step": 624270 }, { "epoch": 1.62, "learning_rate": 5.72664283622055e-05, "loss": 0.0063, "step": 624280 }, { "epoch": 1.62, "learning_rate": 5.7262540145834034e-05, "loss": 0.0108, "step": 624290 }, { "epoch": 1.62, "learning_rate": 5.725865192946257e-05, "loss": 0.0064, "step": 624300 }, { "epoch": 1.62, "learning_rate": 5.7254763713091104e-05, "loss": 0.0064, "step": 624310 }, { "epoch": 1.62, "learning_rate": 5.725087549671964e-05, "loss": 0.0088, "step": 624320 }, { "epoch": 1.62, "learning_rate": 5.7246987280348173e-05, "loss": 0.0121, "step": 624330 }, { "epoch": 1.62, "learning_rate": 5.724309906397671e-05, "loss": 0.0069, "step": 624340 }, { "epoch": 1.62, "learning_rate": 5.723921084760524e-05, "loss": 0.008, "step": 624350 }, { "epoch": 1.62, "learning_rate": 5.7235322631233785e-05, "loss": 0.0102, "step": 624360 }, { "epoch": 1.62, "learning_rate": 5.7231434414862306e-05, "loss": 0.0089, "step": 624370 }, { "epoch": 1.62, "learning_rate": 5.722754619849085e-05, "loss": 0.0068, "step": 624380 }, { "epoch": 1.62, "learning_rate": 5.722365798211938e-05, "loss": 0.0054, "step": 624390 }, { "epoch": 1.62, "learning_rate": 5.721976976574792e-05, "loss": 0.0098, "step": 624400 }, { "epoch": 1.62, "learning_rate": 5.721588154937645e-05, "loss": 0.008, "step": 624410 }, { "epoch": 1.62, "learning_rate": 5.721199333300499e-05, "loss": 0.0055, "step": 624420 }, { "epoch": 1.62, "learning_rate": 5.720810511663352e-05, "loss": 0.01, "step": 624430 }, { "epoch": 1.62, "learning_rate": 5.720421690026206e-05, "loss": 0.0097, "step": 624440 }, { "epoch": 1.62, "learning_rate": 5.720032868389059e-05, "loss": 0.0083, "step": 624450 }, { "epoch": 1.62, "learning_rate": 5.7196440467519133e-05, "loss": 0.0075, "step": 624460 }, { "epoch": 1.62, "learning_rate": 5.719255225114767e-05, "loss": 0.0081, "step": 624470 }, { "epoch": 1.62, "learning_rate": 5.71886640347762e-05, "loss": 0.0076, "step": 624480 }, { "epoch": 1.62, "learning_rate": 5.718477581840474e-05, "loss": 0.008, "step": 624490 }, { "epoch": 1.62, "learning_rate": 5.718088760203327e-05, "loss": 0.0094, "step": 624500 }, { "epoch": 1.62, "learning_rate": 5.717699938566181e-05, "loss": 0.0105, "step": 624510 }, { "epoch": 1.62, "learning_rate": 5.717311116929034e-05, "loss": 0.01, "step": 624520 }, { "epoch": 1.62, "learning_rate": 5.716922295291888e-05, "loss": 0.0138, "step": 624530 }, { "epoch": 1.62, "learning_rate": 5.716533473654742e-05, "loss": 0.0067, "step": 624540 }, { "epoch": 1.62, "learning_rate": 5.7161446520175954e-05, "loss": 0.0093, "step": 624550 }, { "epoch": 1.62, "learning_rate": 5.715755830380449e-05, "loss": 0.0064, "step": 624560 }, { "epoch": 1.62, "learning_rate": 5.7153670087433024e-05, "loss": 0.0076, "step": 624570 }, { "epoch": 1.62, "learning_rate": 5.714978187106156e-05, "loss": 0.0084, "step": 624580 }, { "epoch": 1.62, "learning_rate": 5.714589365469009e-05, "loss": 0.0071, "step": 624590 }, { "epoch": 1.62, "learning_rate": 5.714200543831863e-05, "loss": 0.0091, "step": 624600 }, { "epoch": 1.62, "learning_rate": 5.7138117221947156e-05, "loss": 0.0095, "step": 624610 }, { "epoch": 1.62, "learning_rate": 5.713422900557569e-05, "loss": 0.0089, "step": 624620 }, { "epoch": 1.62, "learning_rate": 5.7130340789204226e-05, "loss": 0.0162, "step": 624630 }, { "epoch": 1.62, "learning_rate": 5.712645257283277e-05, "loss": 0.0081, "step": 624640 }, { "epoch": 1.62, "learning_rate": 5.71225643564613e-05, "loss": 0.0082, "step": 624650 }, { "epoch": 1.62, "learning_rate": 5.711867614008984e-05, "loss": 0.0107, "step": 624660 }, { "epoch": 1.62, "learning_rate": 5.711478792371837e-05, "loss": 0.0083, "step": 624670 }, { "epoch": 1.62, "learning_rate": 5.711089970734691e-05, "loss": 0.0125, "step": 624680 }, { "epoch": 1.62, "learning_rate": 5.710701149097544e-05, "loss": 0.0063, "step": 624690 }, { "epoch": 1.62, "learning_rate": 5.710312327460398e-05, "loss": 0.0076, "step": 624700 }, { "epoch": 1.62, "learning_rate": 5.709923505823251e-05, "loss": 0.0071, "step": 624710 }, { "epoch": 1.62, "learning_rate": 5.709534684186105e-05, "loss": 0.0071, "step": 624720 }, { "epoch": 1.62, "learning_rate": 5.709145862548959e-05, "loss": 0.0085, "step": 624730 }, { "epoch": 1.62, "learning_rate": 5.708757040911812e-05, "loss": 0.0081, "step": 624740 }, { "epoch": 1.62, "learning_rate": 5.708368219274666e-05, "loss": 0.0096, "step": 624750 }, { "epoch": 1.62, "learning_rate": 5.707979397637519e-05, "loss": 0.0113, "step": 624760 }, { "epoch": 1.62, "learning_rate": 5.707590576000373e-05, "loss": 0.0063, "step": 624770 }, { "epoch": 1.62, "learning_rate": 5.707201754363226e-05, "loss": 0.009, "step": 624780 }, { "epoch": 1.62, "learning_rate": 5.70681293272608e-05, "loss": 0.0099, "step": 624790 }, { "epoch": 1.62, "learning_rate": 5.706424111088934e-05, "loss": 0.0077, "step": 624800 }, { "epoch": 1.62, "learning_rate": 5.7060352894517874e-05, "loss": 0.0074, "step": 624810 }, { "epoch": 1.62, "learning_rate": 5.705646467814641e-05, "loss": 0.0066, "step": 624820 }, { "epoch": 1.62, "learning_rate": 5.7052576461774944e-05, "loss": 0.0067, "step": 624830 }, { "epoch": 1.62, "learning_rate": 5.704868824540348e-05, "loss": 0.0087, "step": 624840 }, { "epoch": 1.62, "learning_rate": 5.704480002903201e-05, "loss": 0.0103, "step": 624850 }, { "epoch": 1.62, "learning_rate": 5.704091181266054e-05, "loss": 0.0077, "step": 624860 }, { "epoch": 1.62, "learning_rate": 5.7037023596289076e-05, "loss": 0.008, "step": 624870 }, { "epoch": 1.62, "learning_rate": 5.703313537991761e-05, "loss": 0.0111, "step": 624880 }, { "epoch": 1.62, "learning_rate": 5.7029247163546146e-05, "loss": 0.0079, "step": 624890 }, { "epoch": 1.62, "learning_rate": 5.702535894717469e-05, "loss": 0.0094, "step": 624900 }, { "epoch": 1.62, "learning_rate": 5.702147073080322e-05, "loss": 0.007, "step": 624910 }, { "epoch": 1.62, "learning_rate": 5.701758251443176e-05, "loss": 0.0106, "step": 624920 }, { "epoch": 1.62, "learning_rate": 5.701369429806029e-05, "loss": 0.0079, "step": 624930 }, { "epoch": 1.62, "learning_rate": 5.700980608168883e-05, "loss": 0.0099, "step": 624940 }, { "epoch": 1.62, "learning_rate": 5.700591786531736e-05, "loss": 0.0075, "step": 624950 }, { "epoch": 1.62, "learning_rate": 5.70020296489459e-05, "loss": 0.0094, "step": 624960 }, { "epoch": 1.62, "learning_rate": 5.699814143257443e-05, "loss": 0.0082, "step": 624970 }, { "epoch": 1.62, "learning_rate": 5.699425321620297e-05, "loss": 0.0117, "step": 624980 }, { "epoch": 1.62, "learning_rate": 5.699036499983151e-05, "loss": 0.0079, "step": 624990 }, { "epoch": 1.62, "learning_rate": 5.698647678346004e-05, "loss": 0.0066, "step": 625000 }, { "epoch": 1.62, "eval_cer": 0.8816481004827348, "eval_loss": 0.005520543083548546, "eval_runtime": 107.9384, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 625000 }, { "epoch": 1.62, "learning_rate": 5.698258856708858e-05, "loss": 0.0059, "step": 625010 }, { "epoch": 1.62, "learning_rate": 5.697870035071711e-05, "loss": 0.0106, "step": 625020 }, { "epoch": 1.62, "learning_rate": 5.697481213434565e-05, "loss": 0.0072, "step": 625030 }, { "epoch": 1.62, "learning_rate": 5.697092391797418e-05, "loss": 0.0103, "step": 625040 }, { "epoch": 1.62, "learning_rate": 5.696703570160272e-05, "loss": 0.0078, "step": 625050 }, { "epoch": 1.62, "learning_rate": 5.696314748523126e-05, "loss": 0.0076, "step": 625060 }, { "epoch": 1.62, "learning_rate": 5.6959259268859794e-05, "loss": 0.0113, "step": 625070 }, { "epoch": 1.62, "learning_rate": 5.695537105248833e-05, "loss": 0.0071, "step": 625080 }, { "epoch": 1.62, "learning_rate": 5.6951482836116864e-05, "loss": 0.0064, "step": 625090 }, { "epoch": 1.62, "learning_rate": 5.69475946197454e-05, "loss": 0.0098, "step": 625100 }, { "epoch": 1.62, "learning_rate": 5.6943706403373927e-05, "loss": 0.006, "step": 625110 }, { "epoch": 1.62, "learning_rate": 5.693981818700246e-05, "loss": 0.0066, "step": 625120 }, { "epoch": 1.62, "learning_rate": 5.6935929970630996e-05, "loss": 0.0082, "step": 625130 }, { "epoch": 1.62, "learning_rate": 5.693204175425953e-05, "loss": 0.0094, "step": 625140 }, { "epoch": 1.62, "learning_rate": 5.6928153537888066e-05, "loss": 0.0076, "step": 625150 }, { "epoch": 1.62, "learning_rate": 5.692426532151661e-05, "loss": 0.0084, "step": 625160 }, { "epoch": 1.62, "learning_rate": 5.692037710514514e-05, "loss": 0.0077, "step": 625170 }, { "epoch": 1.62, "learning_rate": 5.691648888877368e-05, "loss": 0.0073, "step": 625180 }, { "epoch": 1.62, "learning_rate": 5.691260067240221e-05, "loss": 0.0129, "step": 625190 }, { "epoch": 1.62, "learning_rate": 5.690871245603075e-05, "loss": 0.0085, "step": 625200 }, { "epoch": 1.62, "learning_rate": 5.690482423965928e-05, "loss": 0.0077, "step": 625210 }, { "epoch": 1.62, "learning_rate": 5.690093602328782e-05, "loss": 0.0081, "step": 625220 }, { "epoch": 1.62, "learning_rate": 5.689704780691635e-05, "loss": 0.0062, "step": 625230 }, { "epoch": 1.62, "learning_rate": 5.689315959054489e-05, "loss": 0.0093, "step": 625240 }, { "epoch": 1.62, "learning_rate": 5.688927137417343e-05, "loss": 0.0094, "step": 625250 }, { "epoch": 1.62, "learning_rate": 5.688538315780196e-05, "loss": 0.0081, "step": 625260 }, { "epoch": 1.62, "learning_rate": 5.68814949414305e-05, "loss": 0.011, "step": 625270 }, { "epoch": 1.62, "learning_rate": 5.687760672505903e-05, "loss": 0.0108, "step": 625280 }, { "epoch": 1.62, "learning_rate": 5.687371850868757e-05, "loss": 0.006, "step": 625290 }, { "epoch": 1.62, "learning_rate": 5.68698302923161e-05, "loss": 0.0094, "step": 625300 }, { "epoch": 1.62, "learning_rate": 5.686594207594464e-05, "loss": 0.0092, "step": 625310 }, { "epoch": 1.62, "learning_rate": 5.686205385957318e-05, "loss": 0.0076, "step": 625320 }, { "epoch": 1.62, "learning_rate": 5.6858165643201714e-05, "loss": 0.0075, "step": 625330 }, { "epoch": 1.62, "learning_rate": 5.685427742683025e-05, "loss": 0.0092, "step": 625340 }, { "epoch": 1.62, "learning_rate": 5.6850389210458784e-05, "loss": 0.0108, "step": 625350 }, { "epoch": 1.62, "learning_rate": 5.684650099408731e-05, "loss": 0.0077, "step": 625360 }, { "epoch": 1.62, "learning_rate": 5.6842612777715846e-05, "loss": 0.0066, "step": 625370 }, { "epoch": 1.62, "learning_rate": 5.683872456134438e-05, "loss": 0.008, "step": 625380 }, { "epoch": 1.62, "learning_rate": 5.6834836344972916e-05, "loss": 0.008, "step": 625390 }, { "epoch": 1.62, "learning_rate": 5.683094812860145e-05, "loss": 0.0083, "step": 625400 }, { "epoch": 1.62, "learning_rate": 5.6827059912229986e-05, "loss": 0.0083, "step": 625410 }, { "epoch": 1.62, "learning_rate": 5.682317169585853e-05, "loss": 0.0059, "step": 625420 }, { "epoch": 1.62, "learning_rate": 5.681928347948706e-05, "loss": 0.0104, "step": 625430 }, { "epoch": 1.62, "learning_rate": 5.68153952631156e-05, "loss": 0.0092, "step": 625440 }, { "epoch": 1.62, "learning_rate": 5.681150704674413e-05, "loss": 0.0083, "step": 625450 }, { "epoch": 1.62, "learning_rate": 5.680761883037267e-05, "loss": 0.0087, "step": 625460 }, { "epoch": 1.62, "learning_rate": 5.68037306140012e-05, "loss": 0.0101, "step": 625470 }, { "epoch": 1.62, "learning_rate": 5.679984239762974e-05, "loss": 0.0125, "step": 625480 }, { "epoch": 1.62, "learning_rate": 5.679595418125827e-05, "loss": 0.0112, "step": 625490 }, { "epoch": 1.62, "learning_rate": 5.6792065964886806e-05, "loss": 0.0086, "step": 625500 }, { "epoch": 1.62, "learning_rate": 5.678817774851535e-05, "loss": 0.0085, "step": 625510 }, { "epoch": 1.62, "learning_rate": 5.678428953214388e-05, "loss": 0.0091, "step": 625520 }, { "epoch": 1.62, "learning_rate": 5.678040131577242e-05, "loss": 0.0115, "step": 625530 }, { "epoch": 1.62, "learning_rate": 5.677651309940095e-05, "loss": 0.0069, "step": 625540 }, { "epoch": 1.62, "learning_rate": 5.677262488302949e-05, "loss": 0.0089, "step": 625550 }, { "epoch": 1.62, "learning_rate": 5.676873666665802e-05, "loss": 0.0077, "step": 625560 }, { "epoch": 1.62, "learning_rate": 5.676484845028656e-05, "loss": 0.0092, "step": 625570 }, { "epoch": 1.62, "learning_rate": 5.676096023391509e-05, "loss": 0.006, "step": 625580 }, { "epoch": 1.62, "learning_rate": 5.6757072017543634e-05, "loss": 0.0142, "step": 625590 }, { "epoch": 1.62, "learning_rate": 5.675318380117217e-05, "loss": 0.0089, "step": 625600 }, { "epoch": 1.62, "learning_rate": 5.67492955848007e-05, "loss": 0.0096, "step": 625610 }, { "epoch": 1.62, "learning_rate": 5.674540736842923e-05, "loss": 0.0086, "step": 625620 }, { "epoch": 1.62, "learning_rate": 5.6741519152057766e-05, "loss": 0.009, "step": 625630 }, { "epoch": 1.62, "learning_rate": 5.67376309356863e-05, "loss": 0.0078, "step": 625640 }, { "epoch": 1.62, "learning_rate": 5.6733742719314836e-05, "loss": 0.0091, "step": 625650 }, { "epoch": 1.62, "learning_rate": 5.672985450294337e-05, "loss": 0.0122, "step": 625660 }, { "epoch": 1.62, "learning_rate": 5.6725966286571906e-05, "loss": 0.0074, "step": 625670 }, { "epoch": 1.62, "learning_rate": 5.672207807020044e-05, "loss": 0.0077, "step": 625680 }, { "epoch": 1.62, "learning_rate": 5.671818985382898e-05, "loss": 0.0078, "step": 625690 }, { "epoch": 1.62, "learning_rate": 5.671430163745752e-05, "loss": 0.0084, "step": 625700 }, { "epoch": 1.62, "learning_rate": 5.671041342108605e-05, "loss": 0.0098, "step": 625710 }, { "epoch": 1.62, "learning_rate": 5.670652520471459e-05, "loss": 0.0101, "step": 625720 }, { "epoch": 1.62, "learning_rate": 5.670263698834312e-05, "loss": 0.0089, "step": 625730 }, { "epoch": 1.62, "learning_rate": 5.669874877197166e-05, "loss": 0.0087, "step": 625740 }, { "epoch": 1.62, "learning_rate": 5.669486055560019e-05, "loss": 0.0059, "step": 625750 }, { "epoch": 1.62, "learning_rate": 5.6690972339228726e-05, "loss": 0.0068, "step": 625760 }, { "epoch": 1.62, "learning_rate": 5.668708412285727e-05, "loss": 0.0054, "step": 625770 }, { "epoch": 1.62, "learning_rate": 5.66831959064858e-05, "loss": 0.0091, "step": 625780 }, { "epoch": 1.62, "learning_rate": 5.667930769011434e-05, "loss": 0.008, "step": 625790 }, { "epoch": 1.62, "learning_rate": 5.667541947374287e-05, "loss": 0.0105, "step": 625800 }, { "epoch": 1.62, "learning_rate": 5.667153125737141e-05, "loss": 0.0079, "step": 625810 }, { "epoch": 1.62, "learning_rate": 5.666764304099994e-05, "loss": 0.0074, "step": 625820 }, { "epoch": 1.62, "learning_rate": 5.666375482462848e-05, "loss": 0.0097, "step": 625830 }, { "epoch": 1.62, "learning_rate": 5.665986660825701e-05, "loss": 0.0079, "step": 625840 }, { "epoch": 1.62, "learning_rate": 5.665597839188554e-05, "loss": 0.008, "step": 625850 }, { "epoch": 1.62, "learning_rate": 5.6652090175514075e-05, "loss": 0.0087, "step": 625860 }, { "epoch": 1.62, "learning_rate": 5.664820195914262e-05, "loss": 0.0084, "step": 625870 }, { "epoch": 1.62, "learning_rate": 5.664431374277115e-05, "loss": 0.0077, "step": 625880 }, { "epoch": 1.62, "learning_rate": 5.6640425526399686e-05, "loss": 0.0117, "step": 625890 }, { "epoch": 1.62, "learning_rate": 5.663653731002822e-05, "loss": 0.0089, "step": 625900 }, { "epoch": 1.62, "learning_rate": 5.6632649093656756e-05, "loss": 0.0127, "step": 625910 }, { "epoch": 1.62, "learning_rate": 5.662876087728529e-05, "loss": 0.0082, "step": 625920 }, { "epoch": 1.62, "learning_rate": 5.6624872660913826e-05, "loss": 0.0057, "step": 625930 }, { "epoch": 1.62, "learning_rate": 5.662098444454236e-05, "loss": 0.008, "step": 625940 }, { "epoch": 1.62, "learning_rate": 5.66170962281709e-05, "loss": 0.0093, "step": 625950 }, { "epoch": 1.62, "learning_rate": 5.661320801179944e-05, "loss": 0.008, "step": 625960 }, { "epoch": 1.62, "learning_rate": 5.660931979542797e-05, "loss": 0.0085, "step": 625970 }, { "epoch": 1.62, "learning_rate": 5.660543157905651e-05, "loss": 0.0102, "step": 625980 }, { "epoch": 1.62, "learning_rate": 5.660154336268504e-05, "loss": 0.0139, "step": 625990 }, { "epoch": 1.62, "learning_rate": 5.659765514631358e-05, "loss": 0.0084, "step": 626000 }, { "epoch": 1.62, "eval_cer": 0.8816858906799576, "eval_loss": 0.005688130855560303, "eval_runtime": 107.8597, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 626000 }, { "epoch": 1.62, "learning_rate": 5.659376692994211e-05, "loss": 0.0085, "step": 626010 }, { "epoch": 1.62, "learning_rate": 5.6589878713570646e-05, "loss": 0.0101, "step": 626020 }, { "epoch": 1.62, "learning_rate": 5.658599049719919e-05, "loss": 0.009, "step": 626030 }, { "epoch": 1.62, "learning_rate": 5.658210228082772e-05, "loss": 0.0052, "step": 626040 }, { "epoch": 1.62, "learning_rate": 5.657821406445626e-05, "loss": 0.0077, "step": 626050 }, { "epoch": 1.62, "learning_rate": 5.657432584808479e-05, "loss": 0.0085, "step": 626060 }, { "epoch": 1.62, "learning_rate": 5.657043763171333e-05, "loss": 0.0052, "step": 626070 }, { "epoch": 1.62, "learning_rate": 5.656654941534186e-05, "loss": 0.01, "step": 626080 }, { "epoch": 1.62, "learning_rate": 5.65626611989704e-05, "loss": 0.0099, "step": 626090 }, { "epoch": 1.62, "learning_rate": 5.6558772982598925e-05, "loss": 0.0107, "step": 626100 }, { "epoch": 1.62, "learning_rate": 5.655488476622746e-05, "loss": 0.0086, "step": 626110 }, { "epoch": 1.62, "learning_rate": 5.6550996549855995e-05, "loss": 0.008, "step": 626120 }, { "epoch": 1.62, "learning_rate": 5.6547108333484537e-05, "loss": 0.0096, "step": 626130 }, { "epoch": 1.62, "learning_rate": 5.654322011711307e-05, "loss": 0.0107, "step": 626140 }, { "epoch": 1.62, "learning_rate": 5.6539331900741606e-05, "loss": 0.0083, "step": 626150 }, { "epoch": 1.62, "learning_rate": 5.653544368437014e-05, "loss": 0.0085, "step": 626160 }, { "epoch": 1.62, "learning_rate": 5.6531555467998676e-05, "loss": 0.0068, "step": 626170 }, { "epoch": 1.62, "learning_rate": 5.652766725162721e-05, "loss": 0.0076, "step": 626180 }, { "epoch": 1.62, "learning_rate": 5.6523779035255746e-05, "loss": 0.0074, "step": 626190 }, { "epoch": 1.62, "learning_rate": 5.651989081888428e-05, "loss": 0.0066, "step": 626200 }, { "epoch": 1.62, "learning_rate": 5.651600260251282e-05, "loss": 0.0061, "step": 626210 }, { "epoch": 1.62, "learning_rate": 5.651211438614136e-05, "loss": 0.0073, "step": 626220 }, { "epoch": 1.62, "learning_rate": 5.650822616976989e-05, "loss": 0.0098, "step": 626230 }, { "epoch": 1.62, "learning_rate": 5.650433795339843e-05, "loss": 0.0093, "step": 626240 }, { "epoch": 1.62, "learning_rate": 5.650044973702696e-05, "loss": 0.0099, "step": 626250 }, { "epoch": 1.62, "learning_rate": 5.6496561520655497e-05, "loss": 0.0086, "step": 626260 }, { "epoch": 1.62, "learning_rate": 5.649267330428403e-05, "loss": 0.0073, "step": 626270 }, { "epoch": 1.62, "learning_rate": 5.6488785087912566e-05, "loss": 0.007, "step": 626280 }, { "epoch": 1.62, "learning_rate": 5.648489687154111e-05, "loss": 0.0084, "step": 626290 }, { "epoch": 1.62, "learning_rate": 5.648100865516964e-05, "loss": 0.0077, "step": 626300 }, { "epoch": 1.62, "learning_rate": 5.647712043879818e-05, "loss": 0.0085, "step": 626310 }, { "epoch": 1.62, "learning_rate": 5.647323222242671e-05, "loss": 0.0093, "step": 626320 }, { "epoch": 1.62, "learning_rate": 5.646934400605525e-05, "loss": 0.0083, "step": 626330 }, { "epoch": 1.62, "learning_rate": 5.646545578968378e-05, "loss": 0.0087, "step": 626340 }, { "epoch": 1.62, "learning_rate": 5.646156757331231e-05, "loss": 0.007, "step": 626350 }, { "epoch": 1.62, "learning_rate": 5.6457679356940845e-05, "loss": 0.0112, "step": 626360 }, { "epoch": 1.62, "learning_rate": 5.645379114056938e-05, "loss": 0.0135, "step": 626370 }, { "epoch": 1.62, "learning_rate": 5.6449902924197915e-05, "loss": 0.0081, "step": 626380 }, { "epoch": 1.62, "learning_rate": 5.6446014707826457e-05, "loss": 0.0095, "step": 626390 }, { "epoch": 1.62, "learning_rate": 5.644212649145499e-05, "loss": 0.0093, "step": 626400 }, { "epoch": 1.62, "learning_rate": 5.6438238275083526e-05, "loss": 0.008, "step": 626410 }, { "epoch": 1.62, "learning_rate": 5.643435005871206e-05, "loss": 0.0082, "step": 626420 }, { "epoch": 1.62, "learning_rate": 5.6430461842340596e-05, "loss": 0.0059, "step": 626430 }, { "epoch": 1.62, "learning_rate": 5.642657362596913e-05, "loss": 0.0056, "step": 626440 }, { "epoch": 1.62, "learning_rate": 5.6422685409597666e-05, "loss": 0.009, "step": 626450 }, { "epoch": 1.62, "learning_rate": 5.64187971932262e-05, "loss": 0.0098, "step": 626460 }, { "epoch": 1.62, "learning_rate": 5.641490897685474e-05, "loss": 0.0096, "step": 626470 }, { "epoch": 1.62, "learning_rate": 5.641102076048328e-05, "loss": 0.0078, "step": 626480 }, { "epoch": 1.62, "learning_rate": 5.640713254411181e-05, "loss": 0.0091, "step": 626490 }, { "epoch": 1.62, "learning_rate": 5.640324432774035e-05, "loss": 0.0073, "step": 626500 }, { "epoch": 1.62, "learning_rate": 5.639935611136888e-05, "loss": 0.007, "step": 626510 }, { "epoch": 1.62, "learning_rate": 5.6395467894997417e-05, "loss": 0.0084, "step": 626520 }, { "epoch": 1.62, "learning_rate": 5.639157967862595e-05, "loss": 0.011, "step": 626530 }, { "epoch": 1.62, "learning_rate": 5.6387691462254486e-05, "loss": 0.0089, "step": 626540 }, { "epoch": 1.62, "learning_rate": 5.638380324588303e-05, "loss": 0.0063, "step": 626550 }, { "epoch": 1.62, "learning_rate": 5.637991502951156e-05, "loss": 0.0067, "step": 626560 }, { "epoch": 1.62, "learning_rate": 5.63760268131401e-05, "loss": 0.0097, "step": 626570 }, { "epoch": 1.62, "learning_rate": 5.637213859676863e-05, "loss": 0.0078, "step": 626580 }, { "epoch": 1.62, "learning_rate": 5.636825038039717e-05, "loss": 0.0075, "step": 626590 }, { "epoch": 1.62, "learning_rate": 5.6364362164025695e-05, "loss": 0.0067, "step": 626600 }, { "epoch": 1.62, "learning_rate": 5.636047394765423e-05, "loss": 0.0109, "step": 626610 }, { "epoch": 1.62, "learning_rate": 5.6356585731282765e-05, "loss": 0.0077, "step": 626620 }, { "epoch": 1.62, "learning_rate": 5.63526975149113e-05, "loss": 0.0084, "step": 626630 }, { "epoch": 1.62, "learning_rate": 5.6348809298539835e-05, "loss": 0.0067, "step": 626640 }, { "epoch": 1.62, "learning_rate": 5.6344921082168377e-05, "loss": 0.0096, "step": 626650 }, { "epoch": 1.62, "learning_rate": 5.634103286579691e-05, "loss": 0.0086, "step": 626660 }, { "epoch": 1.62, "learning_rate": 5.6337144649425446e-05, "loss": 0.0111, "step": 626670 }, { "epoch": 1.62, "learning_rate": 5.633325643305398e-05, "loss": 0.0099, "step": 626680 }, { "epoch": 1.62, "learning_rate": 5.6329368216682516e-05, "loss": 0.0078, "step": 626690 }, { "epoch": 1.62, "learning_rate": 5.632548000031105e-05, "loss": 0.0094, "step": 626700 }, { "epoch": 1.62, "learning_rate": 5.6321591783939586e-05, "loss": 0.0106, "step": 626710 }, { "epoch": 1.62, "learning_rate": 5.631770356756812e-05, "loss": 0.0066, "step": 626720 }, { "epoch": 1.62, "learning_rate": 5.631381535119666e-05, "loss": 0.0079, "step": 626730 }, { "epoch": 1.62, "learning_rate": 5.63099271348252e-05, "loss": 0.0077, "step": 626740 }, { "epoch": 1.62, "learning_rate": 5.630603891845373e-05, "loss": 0.0068, "step": 626750 }, { "epoch": 1.62, "learning_rate": 5.630215070208227e-05, "loss": 0.0105, "step": 626760 }, { "epoch": 1.62, "learning_rate": 5.62982624857108e-05, "loss": 0.0064, "step": 626770 }, { "epoch": 1.62, "learning_rate": 5.6294374269339336e-05, "loss": 0.0075, "step": 626780 }, { "epoch": 1.62, "learning_rate": 5.629048605296787e-05, "loss": 0.0054, "step": 626790 }, { "epoch": 1.62, "learning_rate": 5.6286597836596406e-05, "loss": 0.0065, "step": 626800 }, { "epoch": 1.62, "learning_rate": 5.628270962022495e-05, "loss": 0.0088, "step": 626810 }, { "epoch": 1.62, "learning_rate": 5.627882140385348e-05, "loss": 0.0093, "step": 626820 }, { "epoch": 1.62, "learning_rate": 5.627493318748202e-05, "loss": 0.0099, "step": 626830 }, { "epoch": 1.62, "learning_rate": 5.627104497111055e-05, "loss": 0.0059, "step": 626840 }, { "epoch": 1.62, "learning_rate": 5.626715675473908e-05, "loss": 0.0104, "step": 626850 }, { "epoch": 1.62, "learning_rate": 5.6263268538367615e-05, "loss": 0.0059, "step": 626860 }, { "epoch": 1.62, "learning_rate": 5.625938032199615e-05, "loss": 0.0086, "step": 626870 }, { "epoch": 1.62, "learning_rate": 5.6255492105624685e-05, "loss": 0.0075, "step": 626880 }, { "epoch": 1.62, "learning_rate": 5.625160388925322e-05, "loss": 0.0072, "step": 626890 }, { "epoch": 1.63, "learning_rate": 5.6247715672881755e-05, "loss": 0.0076, "step": 626900 }, { "epoch": 1.63, "learning_rate": 5.6243827456510296e-05, "loss": 0.009, "step": 626910 }, { "epoch": 1.63, "learning_rate": 5.623993924013883e-05, "loss": 0.0095, "step": 626920 }, { "epoch": 1.63, "learning_rate": 5.6236051023767366e-05, "loss": 0.0078, "step": 626930 }, { "epoch": 1.63, "learning_rate": 5.62321628073959e-05, "loss": 0.0099, "step": 626940 }, { "epoch": 1.63, "learning_rate": 5.6228274591024436e-05, "loss": 0.0083, "step": 626950 }, { "epoch": 1.63, "learning_rate": 5.622438637465297e-05, "loss": 0.0089, "step": 626960 }, { "epoch": 1.63, "learning_rate": 5.6220498158281506e-05, "loss": 0.0104, "step": 626970 }, { "epoch": 1.63, "learning_rate": 5.621660994191004e-05, "loss": 0.0067, "step": 626980 }, { "epoch": 1.63, "learning_rate": 5.6212721725538575e-05, "loss": 0.0085, "step": 626990 }, { "epoch": 1.63, "learning_rate": 5.620883350916712e-05, "loss": 0.0098, "step": 627000 }, { "epoch": 1.63, "eval_cer": 0.8816397026611297, "eval_loss": 0.005602034740149975, "eval_runtime": 108.0184, "eval_samples_per_second": 18.515, "eval_steps_per_second": 4.629, "step": 627000 }, { "epoch": 1.63, "learning_rate": 5.620494529279565e-05, "loss": 0.0061, "step": 627010 }, { "epoch": 1.63, "learning_rate": 5.620105707642419e-05, "loss": 0.0078, "step": 627020 }, { "epoch": 1.63, "learning_rate": 5.619716886005272e-05, "loss": 0.0106, "step": 627030 }, { "epoch": 1.63, "learning_rate": 5.6193280643681256e-05, "loss": 0.0078, "step": 627040 }, { "epoch": 1.63, "learning_rate": 5.618939242730979e-05, "loss": 0.0089, "step": 627050 }, { "epoch": 1.63, "learning_rate": 5.6185504210938326e-05, "loss": 0.0101, "step": 627060 }, { "epoch": 1.63, "learning_rate": 5.618161599456686e-05, "loss": 0.0119, "step": 627070 }, { "epoch": 1.63, "learning_rate": 5.61777277781954e-05, "loss": 0.0078, "step": 627080 }, { "epoch": 1.63, "learning_rate": 5.6173839561823924e-05, "loss": 0.0101, "step": 627090 }, { "epoch": 1.63, "learning_rate": 5.6169951345452466e-05, "loss": 0.0102, "step": 627100 }, { "epoch": 1.63, "learning_rate": 5.6166063129081e-05, "loss": 0.0077, "step": 627110 }, { "epoch": 1.63, "learning_rate": 5.6162174912709535e-05, "loss": 0.006, "step": 627120 }, { "epoch": 1.63, "learning_rate": 5.615828669633807e-05, "loss": 0.0085, "step": 627130 }, { "epoch": 1.63, "learning_rate": 5.6154398479966605e-05, "loss": 0.0094, "step": 627140 }, { "epoch": 1.63, "learning_rate": 5.615051026359514e-05, "loss": 0.0098, "step": 627150 }, { "epoch": 1.63, "learning_rate": 5.6146622047223675e-05, "loss": 0.0084, "step": 627160 }, { "epoch": 1.63, "learning_rate": 5.614273383085221e-05, "loss": 0.0066, "step": 627170 }, { "epoch": 1.63, "learning_rate": 5.613884561448075e-05, "loss": 0.0079, "step": 627180 }, { "epoch": 1.63, "learning_rate": 5.6134957398109286e-05, "loss": 0.0091, "step": 627190 }, { "epoch": 1.63, "learning_rate": 5.613106918173782e-05, "loss": 0.0128, "step": 627200 }, { "epoch": 1.63, "learning_rate": 5.6127180965366356e-05, "loss": 0.0069, "step": 627210 }, { "epoch": 1.63, "learning_rate": 5.612329274899489e-05, "loss": 0.0072, "step": 627220 }, { "epoch": 1.63, "learning_rate": 5.6119404532623426e-05, "loss": 0.0093, "step": 627230 }, { "epoch": 1.63, "learning_rate": 5.611551631625196e-05, "loss": 0.0054, "step": 627240 }, { "epoch": 1.63, "learning_rate": 5.6111628099880495e-05, "loss": 0.0094, "step": 627250 }, { "epoch": 1.63, "learning_rate": 5.610773988350904e-05, "loss": 0.008, "step": 627260 }, { "epoch": 1.63, "learning_rate": 5.610385166713757e-05, "loss": 0.008, "step": 627270 }, { "epoch": 1.63, "learning_rate": 5.609996345076611e-05, "loss": 0.0096, "step": 627280 }, { "epoch": 1.63, "learning_rate": 5.609607523439464e-05, "loss": 0.006, "step": 627290 }, { "epoch": 1.63, "learning_rate": 5.6092187018023176e-05, "loss": 0.009, "step": 627300 }, { "epoch": 1.63, "learning_rate": 5.608829880165171e-05, "loss": 0.008, "step": 627310 }, { "epoch": 1.63, "learning_rate": 5.6084410585280246e-05, "loss": 0.0092, "step": 627320 }, { "epoch": 1.63, "learning_rate": 5.608052236890878e-05, "loss": 0.0071, "step": 627330 }, { "epoch": 1.63, "learning_rate": 5.607663415253731e-05, "loss": 0.0089, "step": 627340 }, { "epoch": 1.63, "learning_rate": 5.6072745936165844e-05, "loss": 0.0067, "step": 627350 }, { "epoch": 1.63, "learning_rate": 5.6068857719794386e-05, "loss": 0.0076, "step": 627360 }, { "epoch": 1.63, "learning_rate": 5.606496950342292e-05, "loss": 0.007, "step": 627370 }, { "epoch": 1.63, "learning_rate": 5.6061081287051455e-05, "loss": 0.0075, "step": 627380 }, { "epoch": 1.63, "learning_rate": 5.605719307067999e-05, "loss": 0.0107, "step": 627390 }, { "epoch": 1.63, "learning_rate": 5.6053304854308525e-05, "loss": 0.0076, "step": 627400 }, { "epoch": 1.63, "learning_rate": 5.604941663793706e-05, "loss": 0.0101, "step": 627410 }, { "epoch": 1.63, "learning_rate": 5.6045528421565595e-05, "loss": 0.012, "step": 627420 }, { "epoch": 1.63, "learning_rate": 5.604164020519413e-05, "loss": 0.0103, "step": 627430 }, { "epoch": 1.63, "learning_rate": 5.603775198882267e-05, "loss": 0.0092, "step": 627440 }, { "epoch": 1.63, "learning_rate": 5.6033863772451206e-05, "loss": 0.0075, "step": 627450 }, { "epoch": 1.63, "learning_rate": 5.602997555607974e-05, "loss": 0.0082, "step": 627460 }, { "epoch": 1.63, "learning_rate": 5.6026087339708276e-05, "loss": 0.0096, "step": 627470 }, { "epoch": 1.63, "learning_rate": 5.602219912333681e-05, "loss": 0.0078, "step": 627480 }, { "epoch": 1.63, "learning_rate": 5.6018310906965346e-05, "loss": 0.0095, "step": 627490 }, { "epoch": 1.63, "learning_rate": 5.601442269059388e-05, "loss": 0.0093, "step": 627500 }, { "epoch": 1.63, "learning_rate": 5.6010534474222415e-05, "loss": 0.0088, "step": 627510 }, { "epoch": 1.63, "learning_rate": 5.600664625785096e-05, "loss": 0.0083, "step": 627520 }, { "epoch": 1.63, "learning_rate": 5.600275804147949e-05, "loss": 0.0078, "step": 627530 }, { "epoch": 1.63, "learning_rate": 5.5998869825108027e-05, "loss": 0.0063, "step": 627540 }, { "epoch": 1.63, "learning_rate": 5.599498160873656e-05, "loss": 0.0095, "step": 627550 }, { "epoch": 1.63, "learning_rate": 5.5991093392365096e-05, "loss": 0.0105, "step": 627560 }, { "epoch": 1.63, "learning_rate": 5.598720517599363e-05, "loss": 0.0078, "step": 627570 }, { "epoch": 1.63, "learning_rate": 5.5983316959622166e-05, "loss": 0.0075, "step": 627580 }, { "epoch": 1.63, "learning_rate": 5.5979428743250694e-05, "loss": 0.0083, "step": 627590 }, { "epoch": 1.63, "learning_rate": 5.597554052687923e-05, "loss": 0.007, "step": 627600 }, { "epoch": 1.63, "learning_rate": 5.5971652310507764e-05, "loss": 0.0123, "step": 627610 }, { "epoch": 1.63, "learning_rate": 5.5967764094136306e-05, "loss": 0.0078, "step": 627620 }, { "epoch": 1.63, "learning_rate": 5.596387587776484e-05, "loss": 0.0089, "step": 627630 }, { "epoch": 1.63, "learning_rate": 5.5959987661393375e-05, "loss": 0.0096, "step": 627640 }, { "epoch": 1.63, "learning_rate": 5.595609944502191e-05, "loss": 0.0083, "step": 627650 }, { "epoch": 1.63, "learning_rate": 5.5952211228650445e-05, "loss": 0.0067, "step": 627660 }, { "epoch": 1.63, "learning_rate": 5.594832301227898e-05, "loss": 0.008, "step": 627670 }, { "epoch": 1.63, "learning_rate": 5.5944434795907515e-05, "loss": 0.0088, "step": 627680 }, { "epoch": 1.63, "learning_rate": 5.594054657953605e-05, "loss": 0.0074, "step": 627690 }, { "epoch": 1.63, "learning_rate": 5.593665836316459e-05, "loss": 0.0082, "step": 627700 }, { "epoch": 1.63, "learning_rate": 5.5932770146793126e-05, "loss": 0.0082, "step": 627710 }, { "epoch": 1.63, "learning_rate": 5.592888193042166e-05, "loss": 0.0091, "step": 627720 }, { "epoch": 1.63, "learning_rate": 5.5924993714050196e-05, "loss": 0.0075, "step": 627730 }, { "epoch": 1.63, "learning_rate": 5.592110549767873e-05, "loss": 0.0077, "step": 627740 }, { "epoch": 1.63, "learning_rate": 5.5917217281307265e-05, "loss": 0.0074, "step": 627750 }, { "epoch": 1.63, "learning_rate": 5.59133290649358e-05, "loss": 0.0089, "step": 627760 }, { "epoch": 1.63, "learning_rate": 5.5909440848564335e-05, "loss": 0.0122, "step": 627770 }, { "epoch": 1.63, "learning_rate": 5.590555263219288e-05, "loss": 0.0095, "step": 627780 }, { "epoch": 1.63, "learning_rate": 5.590166441582141e-05, "loss": 0.0077, "step": 627790 }, { "epoch": 1.63, "learning_rate": 5.5897776199449947e-05, "loss": 0.0096, "step": 627800 }, { "epoch": 1.63, "learning_rate": 5.589388798307848e-05, "loss": 0.0084, "step": 627810 }, { "epoch": 1.63, "learning_rate": 5.5889999766707016e-05, "loss": 0.0073, "step": 627820 }, { "epoch": 1.63, "learning_rate": 5.588611155033555e-05, "loss": 0.0102, "step": 627830 }, { "epoch": 1.63, "learning_rate": 5.588222333396408e-05, "loss": 0.0075, "step": 627840 }, { "epoch": 1.63, "learning_rate": 5.5878335117592614e-05, "loss": 0.0079, "step": 627850 }, { "epoch": 1.63, "learning_rate": 5.587444690122115e-05, "loss": 0.008, "step": 627860 }, { "epoch": 1.63, "learning_rate": 5.5870558684849684e-05, "loss": 0.0082, "step": 627870 }, { "epoch": 1.63, "learning_rate": 5.5866670468478225e-05, "loss": 0.0103, "step": 627880 }, { "epoch": 1.63, "learning_rate": 5.586278225210676e-05, "loss": 0.0093, "step": 627890 }, { "epoch": 1.63, "learning_rate": 5.5858894035735295e-05, "loss": 0.0079, "step": 627900 }, { "epoch": 1.63, "learning_rate": 5.585500581936383e-05, "loss": 0.0078, "step": 627910 }, { "epoch": 1.63, "learning_rate": 5.5851117602992365e-05, "loss": 0.0073, "step": 627920 }, { "epoch": 1.63, "learning_rate": 5.58472293866209e-05, "loss": 0.0083, "step": 627930 }, { "epoch": 1.63, "learning_rate": 5.5843341170249435e-05, "loss": 0.0078, "step": 627940 }, { "epoch": 1.63, "learning_rate": 5.583945295387797e-05, "loss": 0.0079, "step": 627950 }, { "epoch": 1.63, "learning_rate": 5.583556473750651e-05, "loss": 0.0077, "step": 627960 }, { "epoch": 1.63, "learning_rate": 5.5831676521135046e-05, "loss": 0.0098, "step": 627970 }, { "epoch": 1.63, "learning_rate": 5.582778830476358e-05, "loss": 0.01, "step": 627980 }, { "epoch": 1.63, "learning_rate": 5.5823900088392116e-05, "loss": 0.0097, "step": 627990 }, { "epoch": 1.63, "learning_rate": 5.582001187202065e-05, "loss": 0.0107, "step": 628000 }, { "epoch": 1.63, "eval_cer": 0.8816844910430235, "eval_loss": 0.005415888503193855, "eval_runtime": 107.942, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 628000 }, { "epoch": 1.63, "learning_rate": 5.5816123655649185e-05, "loss": 0.0066, "step": 628010 }, { "epoch": 1.63, "learning_rate": 5.581223543927772e-05, "loss": 0.0096, "step": 628020 }, { "epoch": 1.63, "learning_rate": 5.5808347222906255e-05, "loss": 0.01, "step": 628030 }, { "epoch": 1.63, "learning_rate": 5.58044590065348e-05, "loss": 0.0069, "step": 628040 }, { "epoch": 1.63, "learning_rate": 5.580057079016333e-05, "loss": 0.008, "step": 628050 }, { "epoch": 1.63, "learning_rate": 5.5796682573791867e-05, "loss": 0.0089, "step": 628060 }, { "epoch": 1.63, "learning_rate": 5.57927943574204e-05, "loss": 0.0079, "step": 628070 }, { "epoch": 1.63, "learning_rate": 5.5788906141048936e-05, "loss": 0.0094, "step": 628080 }, { "epoch": 1.63, "learning_rate": 5.5785017924677464e-05, "loss": 0.0086, "step": 628090 }, { "epoch": 1.63, "learning_rate": 5.5781129708306e-05, "loss": 0.0074, "step": 628100 }, { "epoch": 1.63, "learning_rate": 5.5777241491934534e-05, "loss": 0.0072, "step": 628110 }, { "epoch": 1.63, "learning_rate": 5.577335327556307e-05, "loss": 0.0085, "step": 628120 }, { "epoch": 1.63, "learning_rate": 5.5769465059191604e-05, "loss": 0.0078, "step": 628130 }, { "epoch": 1.63, "learning_rate": 5.5765576842820145e-05, "loss": 0.0063, "step": 628140 }, { "epoch": 1.63, "learning_rate": 5.576168862644868e-05, "loss": 0.0079, "step": 628150 }, { "epoch": 1.63, "learning_rate": 5.5757800410077215e-05, "loss": 0.0067, "step": 628160 }, { "epoch": 1.63, "learning_rate": 5.575391219370575e-05, "loss": 0.0094, "step": 628170 }, { "epoch": 1.63, "learning_rate": 5.5750023977334285e-05, "loss": 0.007, "step": 628180 }, { "epoch": 1.63, "learning_rate": 5.574613576096282e-05, "loss": 0.0094, "step": 628190 }, { "epoch": 1.63, "learning_rate": 5.5742247544591355e-05, "loss": 0.0077, "step": 628200 }, { "epoch": 1.63, "learning_rate": 5.573835932821989e-05, "loss": 0.0088, "step": 628210 }, { "epoch": 1.63, "learning_rate": 5.573447111184843e-05, "loss": 0.0098, "step": 628220 }, { "epoch": 1.63, "learning_rate": 5.5730582895476966e-05, "loss": 0.0094, "step": 628230 }, { "epoch": 1.63, "learning_rate": 5.57266946791055e-05, "loss": 0.0088, "step": 628240 }, { "epoch": 1.63, "learning_rate": 5.5722806462734036e-05, "loss": 0.0065, "step": 628250 }, { "epoch": 1.63, "learning_rate": 5.571891824636257e-05, "loss": 0.0085, "step": 628260 }, { "epoch": 1.63, "learning_rate": 5.5715030029991105e-05, "loss": 0.0094, "step": 628270 }, { "epoch": 1.63, "learning_rate": 5.571114181361964e-05, "loss": 0.0104, "step": 628280 }, { "epoch": 1.63, "learning_rate": 5.5707253597248175e-05, "loss": 0.0071, "step": 628290 }, { "epoch": 1.63, "learning_rate": 5.570336538087671e-05, "loss": 0.007, "step": 628300 }, { "epoch": 1.63, "learning_rate": 5.569947716450525e-05, "loss": 0.007, "step": 628310 }, { "epoch": 1.63, "learning_rate": 5.5695588948133786e-05, "loss": 0.0076, "step": 628320 }, { "epoch": 1.63, "learning_rate": 5.569170073176232e-05, "loss": 0.0098, "step": 628330 }, { "epoch": 1.63, "learning_rate": 5.568781251539085e-05, "loss": 0.0093, "step": 628340 }, { "epoch": 1.63, "learning_rate": 5.5683924299019384e-05, "loss": 0.0082, "step": 628350 }, { "epoch": 1.63, "learning_rate": 5.568003608264792e-05, "loss": 0.0088, "step": 628360 }, { "epoch": 1.63, "learning_rate": 5.5676147866276454e-05, "loss": 0.0067, "step": 628370 }, { "epoch": 1.63, "learning_rate": 5.567225964990499e-05, "loss": 0.0092, "step": 628380 }, { "epoch": 1.63, "learning_rate": 5.5668371433533524e-05, "loss": 0.0096, "step": 628390 }, { "epoch": 1.63, "learning_rate": 5.566448321716206e-05, "loss": 0.0073, "step": 628400 }, { "epoch": 1.63, "learning_rate": 5.56605950007906e-05, "loss": 0.0064, "step": 628410 }, { "epoch": 1.63, "learning_rate": 5.5656706784419135e-05, "loss": 0.0087, "step": 628420 }, { "epoch": 1.63, "learning_rate": 5.565281856804767e-05, "loss": 0.0079, "step": 628430 }, { "epoch": 1.63, "learning_rate": 5.5648930351676205e-05, "loss": 0.0079, "step": 628440 }, { "epoch": 1.63, "learning_rate": 5.564504213530474e-05, "loss": 0.0054, "step": 628450 }, { "epoch": 1.63, "learning_rate": 5.5641153918933275e-05, "loss": 0.0097, "step": 628460 }, { "epoch": 1.63, "learning_rate": 5.563726570256181e-05, "loss": 0.0101, "step": 628470 }, { "epoch": 1.63, "learning_rate": 5.5633377486190344e-05, "loss": 0.0095, "step": 628480 }, { "epoch": 1.63, "learning_rate": 5.5629489269818886e-05, "loss": 0.0109, "step": 628490 }, { "epoch": 1.63, "learning_rate": 5.562560105344742e-05, "loss": 0.0073, "step": 628500 }, { "epoch": 1.63, "learning_rate": 5.5621712837075956e-05, "loss": 0.0075, "step": 628510 }, { "epoch": 1.63, "learning_rate": 5.561782462070449e-05, "loss": 0.0079, "step": 628520 }, { "epoch": 1.63, "learning_rate": 5.5613936404333025e-05, "loss": 0.009, "step": 628530 }, { "epoch": 1.63, "learning_rate": 5.561004818796156e-05, "loss": 0.0064, "step": 628540 }, { "epoch": 1.63, "learning_rate": 5.5606159971590095e-05, "loss": 0.0081, "step": 628550 }, { "epoch": 1.63, "learning_rate": 5.560227175521863e-05, "loss": 0.0069, "step": 628560 }, { "epoch": 1.63, "learning_rate": 5.559838353884717e-05, "loss": 0.0097, "step": 628570 }, { "epoch": 1.63, "learning_rate": 5.559449532247569e-05, "loss": 0.0073, "step": 628580 }, { "epoch": 1.63, "learning_rate": 5.5590607106104235e-05, "loss": 0.0092, "step": 628590 }, { "epoch": 1.63, "learning_rate": 5.558671888973277e-05, "loss": 0.0125, "step": 628600 }, { "epoch": 1.63, "learning_rate": 5.5582830673361304e-05, "loss": 0.0113, "step": 628610 }, { "epoch": 1.63, "learning_rate": 5.557894245698984e-05, "loss": 0.007, "step": 628620 }, { "epoch": 1.63, "learning_rate": 5.5575054240618374e-05, "loss": 0.0075, "step": 628630 }, { "epoch": 1.63, "learning_rate": 5.557116602424691e-05, "loss": 0.0076, "step": 628640 }, { "epoch": 1.63, "learning_rate": 5.5567277807875444e-05, "loss": 0.0061, "step": 628650 }, { "epoch": 1.63, "learning_rate": 5.556338959150398e-05, "loss": 0.0088, "step": 628660 }, { "epoch": 1.63, "learning_rate": 5.555950137513252e-05, "loss": 0.009, "step": 628670 }, { "epoch": 1.63, "learning_rate": 5.5555613158761055e-05, "loss": 0.0064, "step": 628680 }, { "epoch": 1.63, "learning_rate": 5.555172494238959e-05, "loss": 0.0126, "step": 628690 }, { "epoch": 1.63, "learning_rate": 5.5547836726018125e-05, "loss": 0.0083, "step": 628700 }, { "epoch": 1.63, "learning_rate": 5.554394850964666e-05, "loss": 0.007, "step": 628710 }, { "epoch": 1.63, "learning_rate": 5.5540060293275194e-05, "loss": 0.0082, "step": 628720 }, { "epoch": 1.63, "learning_rate": 5.553617207690373e-05, "loss": 0.0054, "step": 628730 }, { "epoch": 1.63, "learning_rate": 5.5532283860532264e-05, "loss": 0.007, "step": 628740 }, { "epoch": 1.63, "learning_rate": 5.5528395644160806e-05, "loss": 0.0143, "step": 628750 }, { "epoch": 1.63, "learning_rate": 5.552450742778934e-05, "loss": 0.0075, "step": 628760 }, { "epoch": 1.63, "learning_rate": 5.5520619211417876e-05, "loss": 0.0079, "step": 628770 }, { "epoch": 1.63, "learning_rate": 5.551673099504641e-05, "loss": 0.0079, "step": 628780 }, { "epoch": 1.63, "learning_rate": 5.5512842778674945e-05, "loss": 0.0084, "step": 628790 }, { "epoch": 1.63, "learning_rate": 5.550895456230348e-05, "loss": 0.0073, "step": 628800 }, { "epoch": 1.63, "learning_rate": 5.5505066345932015e-05, "loss": 0.0091, "step": 628810 }, { "epoch": 1.63, "learning_rate": 5.550117812956055e-05, "loss": 0.007, "step": 628820 }, { "epoch": 1.63, "learning_rate": 5.549728991318908e-05, "loss": 0.0088, "step": 628830 }, { "epoch": 1.63, "learning_rate": 5.549340169681761e-05, "loss": 0.0068, "step": 628840 }, { "epoch": 1.63, "learning_rate": 5.5489513480446154e-05, "loss": 0.0087, "step": 628850 }, { "epoch": 1.63, "learning_rate": 5.548562526407469e-05, "loss": 0.0072, "step": 628860 }, { "epoch": 1.63, "learning_rate": 5.5481737047703224e-05, "loss": 0.0082, "step": 628870 }, { "epoch": 1.63, "learning_rate": 5.547784883133176e-05, "loss": 0.0058, "step": 628880 }, { "epoch": 1.63, "learning_rate": 5.5473960614960294e-05, "loss": 0.0063, "step": 628890 }, { "epoch": 1.63, "learning_rate": 5.547007239858883e-05, "loss": 0.0077, "step": 628900 }, { "epoch": 1.63, "learning_rate": 5.5466184182217364e-05, "loss": 0.0073, "step": 628910 }, { "epoch": 1.63, "learning_rate": 5.54622959658459e-05, "loss": 0.0096, "step": 628920 }, { "epoch": 1.63, "learning_rate": 5.545840774947444e-05, "loss": 0.0103, "step": 628930 }, { "epoch": 1.63, "learning_rate": 5.5454519533102975e-05, "loss": 0.0075, "step": 628940 }, { "epoch": 1.63, "learning_rate": 5.545063131673151e-05, "loss": 0.0082, "step": 628950 }, { "epoch": 1.63, "learning_rate": 5.5446743100360045e-05, "loss": 0.0089, "step": 628960 }, { "epoch": 1.63, "learning_rate": 5.544285488398858e-05, "loss": 0.0086, "step": 628970 }, { "epoch": 1.63, "learning_rate": 5.5438966667617114e-05, "loss": 0.0067, "step": 628980 }, { "epoch": 1.63, "learning_rate": 5.543507845124565e-05, "loss": 0.0101, "step": 628990 }, { "epoch": 1.63, "learning_rate": 5.5431190234874184e-05, "loss": 0.0123, "step": 629000 }, { "epoch": 1.63, "eval_cer": 0.8816522993935373, "eval_loss": 0.005537708289921284, "eval_runtime": 107.8233, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 629000 }, { "epoch": 1.63, "learning_rate": 5.5427302018502726e-05, "loss": 0.0107, "step": 629010 }, { "epoch": 1.63, "learning_rate": 5.542341380213126e-05, "loss": 0.0085, "step": 629020 }, { "epoch": 1.63, "learning_rate": 5.5419525585759796e-05, "loss": 0.0109, "step": 629030 }, { "epoch": 1.63, "learning_rate": 5.541563736938833e-05, "loss": 0.0099, "step": 629040 }, { "epoch": 1.63, "learning_rate": 5.5411749153016865e-05, "loss": 0.0118, "step": 629050 }, { "epoch": 1.63, "learning_rate": 5.54078609366454e-05, "loss": 0.0122, "step": 629060 }, { "epoch": 1.63, "learning_rate": 5.5403972720273935e-05, "loss": 0.0075, "step": 629070 }, { "epoch": 1.63, "learning_rate": 5.540008450390246e-05, "loss": 0.0108, "step": 629080 }, { "epoch": 1.63, "learning_rate": 5.5396196287531e-05, "loss": 0.0087, "step": 629090 }, { "epoch": 1.63, "learning_rate": 5.539230807115953e-05, "loss": 0.0069, "step": 629100 }, { "epoch": 1.63, "learning_rate": 5.5388419854788074e-05, "loss": 0.0104, "step": 629110 }, { "epoch": 1.63, "learning_rate": 5.538453163841661e-05, "loss": 0.0085, "step": 629120 }, { "epoch": 1.63, "learning_rate": 5.5380643422045144e-05, "loss": 0.0107, "step": 629130 }, { "epoch": 1.63, "learning_rate": 5.537675520567368e-05, "loss": 0.0102, "step": 629140 }, { "epoch": 1.63, "learning_rate": 5.5372866989302214e-05, "loss": 0.0089, "step": 629150 }, { "epoch": 1.63, "learning_rate": 5.536897877293075e-05, "loss": 0.0075, "step": 629160 }, { "epoch": 1.63, "learning_rate": 5.5365090556559284e-05, "loss": 0.014, "step": 629170 }, { "epoch": 1.63, "learning_rate": 5.536120234018782e-05, "loss": 0.0115, "step": 629180 }, { "epoch": 1.63, "learning_rate": 5.535731412381636e-05, "loss": 0.0078, "step": 629190 }, { "epoch": 1.63, "learning_rate": 5.5353425907444895e-05, "loss": 0.008, "step": 629200 }, { "epoch": 1.63, "learning_rate": 5.534953769107343e-05, "loss": 0.0062, "step": 629210 }, { "epoch": 1.63, "learning_rate": 5.5345649474701965e-05, "loss": 0.0081, "step": 629220 }, { "epoch": 1.63, "learning_rate": 5.53417612583305e-05, "loss": 0.0095, "step": 629230 }, { "epoch": 1.63, "learning_rate": 5.5337873041959034e-05, "loss": 0.009, "step": 629240 }, { "epoch": 1.63, "learning_rate": 5.533398482558757e-05, "loss": 0.009, "step": 629250 }, { "epoch": 1.63, "learning_rate": 5.5330096609216104e-05, "loss": 0.0097, "step": 629260 }, { "epoch": 1.63, "learning_rate": 5.5326208392844646e-05, "loss": 0.0071, "step": 629270 }, { "epoch": 1.63, "learning_rate": 5.532232017647318e-05, "loss": 0.0073, "step": 629280 }, { "epoch": 1.63, "learning_rate": 5.5318431960101715e-05, "loss": 0.0099, "step": 629290 }, { "epoch": 1.63, "learning_rate": 5.531454374373025e-05, "loss": 0.0076, "step": 629300 }, { "epoch": 1.63, "learning_rate": 5.5310655527358785e-05, "loss": 0.0086, "step": 629310 }, { "epoch": 1.63, "learning_rate": 5.530676731098732e-05, "loss": 0.0096, "step": 629320 }, { "epoch": 1.63, "learning_rate": 5.530287909461585e-05, "loss": 0.009, "step": 629330 }, { "epoch": 1.63, "learning_rate": 5.529899087824438e-05, "loss": 0.0081, "step": 629340 }, { "epoch": 1.63, "learning_rate": 5.529510266187292e-05, "loss": 0.0083, "step": 629350 }, { "epoch": 1.63, "learning_rate": 5.529121444550145e-05, "loss": 0.0069, "step": 629360 }, { "epoch": 1.63, "learning_rate": 5.5287326229129994e-05, "loss": 0.0098, "step": 629370 }, { "epoch": 1.63, "learning_rate": 5.528343801275853e-05, "loss": 0.0065, "step": 629380 }, { "epoch": 1.63, "learning_rate": 5.5279549796387064e-05, "loss": 0.0094, "step": 629390 }, { "epoch": 1.63, "learning_rate": 5.52756615800156e-05, "loss": 0.0086, "step": 629400 }, { "epoch": 1.63, "learning_rate": 5.5271773363644134e-05, "loss": 0.01, "step": 629410 }, { "epoch": 1.63, "learning_rate": 5.526788514727267e-05, "loss": 0.0088, "step": 629420 }, { "epoch": 1.63, "learning_rate": 5.5263996930901204e-05, "loss": 0.0096, "step": 629430 }, { "epoch": 1.63, "learning_rate": 5.526010871452974e-05, "loss": 0.0103, "step": 629440 }, { "epoch": 1.63, "learning_rate": 5.525622049815828e-05, "loss": 0.0106, "step": 629450 }, { "epoch": 1.63, "learning_rate": 5.5252332281786815e-05, "loss": 0.0066, "step": 629460 }, { "epoch": 1.63, "learning_rate": 5.524844406541535e-05, "loss": 0.008, "step": 629470 }, { "epoch": 1.63, "learning_rate": 5.5244555849043885e-05, "loss": 0.0084, "step": 629480 }, { "epoch": 1.63, "learning_rate": 5.524066763267242e-05, "loss": 0.0091, "step": 629490 }, { "epoch": 1.63, "learning_rate": 5.5236779416300954e-05, "loss": 0.009, "step": 629500 }, { "epoch": 1.63, "learning_rate": 5.523289119992949e-05, "loss": 0.0076, "step": 629510 }, { "epoch": 1.63, "learning_rate": 5.5229002983558024e-05, "loss": 0.0087, "step": 629520 }, { "epoch": 1.63, "learning_rate": 5.5225114767186566e-05, "loss": 0.0076, "step": 629530 }, { "epoch": 1.63, "learning_rate": 5.52212265508151e-05, "loss": 0.0073, "step": 629540 }, { "epoch": 1.63, "learning_rate": 5.5217338334443635e-05, "loss": 0.0076, "step": 629550 }, { "epoch": 1.63, "learning_rate": 5.521345011807217e-05, "loss": 0.0088, "step": 629560 }, { "epoch": 1.63, "learning_rate": 5.5209561901700705e-05, "loss": 0.0089, "step": 629570 }, { "epoch": 1.63, "learning_rate": 5.520567368532923e-05, "loss": 0.008, "step": 629580 }, { "epoch": 1.63, "learning_rate": 5.520178546895777e-05, "loss": 0.0069, "step": 629590 }, { "epoch": 1.63, "learning_rate": 5.51978972525863e-05, "loss": 0.0101, "step": 629600 }, { "epoch": 1.63, "learning_rate": 5.519400903621484e-05, "loss": 0.0094, "step": 629610 }, { "epoch": 1.63, "learning_rate": 5.519012081984337e-05, "loss": 0.0102, "step": 629620 }, { "epoch": 1.63, "learning_rate": 5.5186232603471914e-05, "loss": 0.0107, "step": 629630 }, { "epoch": 1.63, "learning_rate": 5.518234438710045e-05, "loss": 0.0071, "step": 629640 }, { "epoch": 1.63, "learning_rate": 5.5178456170728984e-05, "loss": 0.008, "step": 629650 }, { "epoch": 1.63, "learning_rate": 5.517456795435752e-05, "loss": 0.0081, "step": 629660 }, { "epoch": 1.63, "learning_rate": 5.5170679737986054e-05, "loss": 0.0099, "step": 629670 }, { "epoch": 1.63, "learning_rate": 5.516679152161459e-05, "loss": 0.0074, "step": 629680 }, { "epoch": 1.63, "learning_rate": 5.5162903305243123e-05, "loss": 0.0078, "step": 629690 }, { "epoch": 1.63, "learning_rate": 5.515901508887166e-05, "loss": 0.0103, "step": 629700 }, { "epoch": 1.63, "learning_rate": 5.515512687250019e-05, "loss": 0.0089, "step": 629710 }, { "epoch": 1.63, "learning_rate": 5.5151238656128735e-05, "loss": 0.0092, "step": 629720 }, { "epoch": 1.63, "learning_rate": 5.514735043975727e-05, "loss": 0.009, "step": 629730 }, { "epoch": 1.63, "learning_rate": 5.5143462223385805e-05, "loss": 0.0097, "step": 629740 }, { "epoch": 1.63, "learning_rate": 5.513957400701434e-05, "loss": 0.0109, "step": 629750 }, { "epoch": 1.63, "learning_rate": 5.5135685790642874e-05, "loss": 0.0083, "step": 629760 }, { "epoch": 1.63, "learning_rate": 5.513179757427141e-05, "loss": 0.0106, "step": 629770 }, { "epoch": 1.63, "learning_rate": 5.5127909357899944e-05, "loss": 0.0077, "step": 629780 }, { "epoch": 1.63, "learning_rate": 5.512402114152848e-05, "loss": 0.0075, "step": 629790 }, { "epoch": 1.63, "learning_rate": 5.512013292515702e-05, "loss": 0.008, "step": 629800 }, { "epoch": 1.63, "learning_rate": 5.5116244708785555e-05, "loss": 0.0086, "step": 629810 }, { "epoch": 1.63, "learning_rate": 5.5112356492414083e-05, "loss": 0.0099, "step": 629820 }, { "epoch": 1.63, "learning_rate": 5.510846827604262e-05, "loss": 0.0072, "step": 629830 }, { "epoch": 1.63, "learning_rate": 5.510458005967115e-05, "loss": 0.0093, "step": 629840 }, { "epoch": 1.63, "learning_rate": 5.510069184329969e-05, "loss": 0.0085, "step": 629850 }, { "epoch": 1.63, "learning_rate": 5.509680362692822e-05, "loss": 0.0097, "step": 629860 }, { "epoch": 1.63, "learning_rate": 5.509291541055676e-05, "loss": 0.0116, "step": 629870 }, { "epoch": 1.63, "learning_rate": 5.508902719418529e-05, "loss": 0.0092, "step": 629880 }, { "epoch": 1.63, "learning_rate": 5.508513897781383e-05, "loss": 0.0086, "step": 629890 }, { "epoch": 1.63, "learning_rate": 5.508125076144237e-05, "loss": 0.0073, "step": 629900 }, { "epoch": 1.63, "learning_rate": 5.5077362545070904e-05, "loss": 0.008, "step": 629910 }, { "epoch": 1.63, "learning_rate": 5.507347432869944e-05, "loss": 0.0069, "step": 629920 }, { "epoch": 1.63, "learning_rate": 5.5069586112327974e-05, "loss": 0.0096, "step": 629930 }, { "epoch": 1.63, "learning_rate": 5.506569789595651e-05, "loss": 0.0081, "step": 629940 }, { "epoch": 1.63, "learning_rate": 5.5061809679585043e-05, "loss": 0.0102, "step": 629950 }, { "epoch": 1.63, "learning_rate": 5.505792146321358e-05, "loss": 0.0071, "step": 629960 }, { "epoch": 1.63, "learning_rate": 5.505403324684211e-05, "loss": 0.0083, "step": 629970 }, { "epoch": 1.63, "learning_rate": 5.5050145030470655e-05, "loss": 0.0082, "step": 629980 }, { "epoch": 1.63, "learning_rate": 5.504625681409919e-05, "loss": 0.0109, "step": 629990 }, { "epoch": 1.63, "learning_rate": 5.5042368597727725e-05, "loss": 0.0115, "step": 630000 }, { "epoch": 1.63, "eval_cer": 0.8816774928583525, "eval_loss": 0.005582030396908522, "eval_runtime": 107.8577, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 630000 }, { "epoch": 1.63, "learning_rate": 5.503848038135626e-05, "loss": 0.0085, "step": 630010 }, { "epoch": 1.63, "learning_rate": 5.5034592164984794e-05, "loss": 0.0082, "step": 630020 }, { "epoch": 1.63, "learning_rate": 5.503070394861333e-05, "loss": 0.0082, "step": 630030 }, { "epoch": 1.63, "learning_rate": 5.5026815732241864e-05, "loss": 0.007, "step": 630040 }, { "epoch": 1.63, "learning_rate": 5.50229275158704e-05, "loss": 0.01, "step": 630050 }, { "epoch": 1.63, "learning_rate": 5.501903929949894e-05, "loss": 0.0066, "step": 630060 }, { "epoch": 1.63, "learning_rate": 5.501515108312746e-05, "loss": 0.0118, "step": 630070 }, { "epoch": 1.63, "learning_rate": 5.5011262866756003e-05, "loss": 0.0174, "step": 630080 }, { "epoch": 1.63, "learning_rate": 5.500737465038454e-05, "loss": 0.008, "step": 630090 }, { "epoch": 1.63, "learning_rate": 5.500348643401307e-05, "loss": 0.0092, "step": 630100 }, { "epoch": 1.63, "learning_rate": 5.499959821764161e-05, "loss": 0.0082, "step": 630110 }, { "epoch": 1.63, "learning_rate": 5.499571000127014e-05, "loss": 0.0089, "step": 630120 }, { "epoch": 1.63, "learning_rate": 5.499182178489868e-05, "loss": 0.0064, "step": 630130 }, { "epoch": 1.63, "learning_rate": 5.498793356852721e-05, "loss": 0.0072, "step": 630140 }, { "epoch": 1.63, "learning_rate": 5.498404535215575e-05, "loss": 0.0085, "step": 630150 }, { "epoch": 1.63, "learning_rate": 5.498015713578429e-05, "loss": 0.0095, "step": 630160 }, { "epoch": 1.63, "learning_rate": 5.4976268919412824e-05, "loss": 0.0072, "step": 630170 }, { "epoch": 1.63, "learning_rate": 5.497238070304136e-05, "loss": 0.0097, "step": 630180 }, { "epoch": 1.63, "learning_rate": 5.4968492486669894e-05, "loss": 0.0106, "step": 630190 }, { "epoch": 1.63, "learning_rate": 5.496460427029843e-05, "loss": 0.0113, "step": 630200 }, { "epoch": 1.63, "learning_rate": 5.496071605392696e-05, "loss": 0.0092, "step": 630210 }, { "epoch": 1.63, "learning_rate": 5.49568278375555e-05, "loss": 0.007, "step": 630220 }, { "epoch": 1.63, "learning_rate": 5.495293962118403e-05, "loss": 0.0088, "step": 630230 }, { "epoch": 1.63, "learning_rate": 5.4949051404812575e-05, "loss": 0.0059, "step": 630240 }, { "epoch": 1.63, "learning_rate": 5.494516318844111e-05, "loss": 0.0103, "step": 630250 }, { "epoch": 1.63, "learning_rate": 5.4941274972069644e-05, "loss": 0.0084, "step": 630260 }, { "epoch": 1.63, "learning_rate": 5.493738675569818e-05, "loss": 0.007, "step": 630270 }, { "epoch": 1.63, "learning_rate": 5.4933498539326714e-05, "loss": 0.0057, "step": 630280 }, { "epoch": 1.63, "learning_rate": 5.492961032295525e-05, "loss": 0.0079, "step": 630290 }, { "epoch": 1.63, "learning_rate": 5.4925722106583784e-05, "loss": 0.0083, "step": 630300 }, { "epoch": 1.63, "learning_rate": 5.492183389021232e-05, "loss": 0.0088, "step": 630310 }, { "epoch": 1.63, "learning_rate": 5.491794567384085e-05, "loss": 0.0098, "step": 630320 }, { "epoch": 1.63, "learning_rate": 5.491405745746938e-05, "loss": 0.0083, "step": 630330 }, { "epoch": 1.63, "learning_rate": 5.491016924109792e-05, "loss": 0.0072, "step": 630340 }, { "epoch": 1.63, "learning_rate": 5.490628102472646e-05, "loss": 0.0079, "step": 630350 }, { "epoch": 1.63, "learning_rate": 5.490239280835499e-05, "loss": 0.01, "step": 630360 }, { "epoch": 1.63, "learning_rate": 5.489850459198353e-05, "loss": 0.0101, "step": 630370 }, { "epoch": 1.63, "learning_rate": 5.489461637561206e-05, "loss": 0.0073, "step": 630380 }, { "epoch": 1.63, "learning_rate": 5.48907281592406e-05, "loss": 0.0078, "step": 630390 }, { "epoch": 1.63, "learning_rate": 5.488683994286913e-05, "loss": 0.0113, "step": 630400 }, { "epoch": 1.63, "learning_rate": 5.488295172649767e-05, "loss": 0.0072, "step": 630410 }, { "epoch": 1.63, "learning_rate": 5.487906351012621e-05, "loss": 0.0091, "step": 630420 }, { "epoch": 1.63, "learning_rate": 5.4875175293754744e-05, "loss": 0.0085, "step": 630430 }, { "epoch": 1.63, "learning_rate": 5.487128707738328e-05, "loss": 0.0086, "step": 630440 }, { "epoch": 1.63, "learning_rate": 5.4867398861011814e-05, "loss": 0.0097, "step": 630450 }, { "epoch": 1.63, "learning_rate": 5.486351064464035e-05, "loss": 0.0075, "step": 630460 }, { "epoch": 1.63, "learning_rate": 5.485962242826888e-05, "loss": 0.0087, "step": 630470 }, { "epoch": 1.63, "learning_rate": 5.485573421189742e-05, "loss": 0.0077, "step": 630480 }, { "epoch": 1.63, "learning_rate": 5.485184599552595e-05, "loss": 0.0074, "step": 630490 }, { "epoch": 1.63, "learning_rate": 5.4847957779154495e-05, "loss": 0.0088, "step": 630500 }, { "epoch": 1.63, "learning_rate": 5.484406956278303e-05, "loss": 0.007, "step": 630510 }, { "epoch": 1.63, "learning_rate": 5.4840181346411564e-05, "loss": 0.0098, "step": 630520 }, { "epoch": 1.63, "learning_rate": 5.48362931300401e-05, "loss": 0.0074, "step": 630530 }, { "epoch": 1.63, "learning_rate": 5.4832404913668634e-05, "loss": 0.0066, "step": 630540 }, { "epoch": 1.63, "learning_rate": 5.482851669729717e-05, "loss": 0.0088, "step": 630550 }, { "epoch": 1.63, "learning_rate": 5.4824628480925704e-05, "loss": 0.0056, "step": 630560 }, { "epoch": 1.63, "learning_rate": 5.482074026455423e-05, "loss": 0.0084, "step": 630570 }, { "epoch": 1.63, "learning_rate": 5.481685204818277e-05, "loss": 0.0119, "step": 630580 }, { "epoch": 1.63, "learning_rate": 5.48129638318113e-05, "loss": 0.0084, "step": 630590 }, { "epoch": 1.63, "learning_rate": 5.480907561543984e-05, "loss": 0.0074, "step": 630600 }, { "epoch": 1.63, "learning_rate": 5.480518739906838e-05, "loss": 0.0078, "step": 630610 }, { "epoch": 1.63, "learning_rate": 5.480129918269691e-05, "loss": 0.0095, "step": 630620 }, { "epoch": 1.63, "learning_rate": 5.479741096632545e-05, "loss": 0.0076, "step": 630630 }, { "epoch": 1.63, "learning_rate": 5.479352274995398e-05, "loss": 0.0051, "step": 630640 }, { "epoch": 1.63, "learning_rate": 5.478963453358252e-05, "loss": 0.0073, "step": 630650 }, { "epoch": 1.63, "learning_rate": 5.478574631721105e-05, "loss": 0.01, "step": 630660 }, { "epoch": 1.63, "learning_rate": 5.478185810083959e-05, "loss": 0.0072, "step": 630670 }, { "epoch": 1.63, "learning_rate": 5.477796988446813e-05, "loss": 0.0103, "step": 630680 }, { "epoch": 1.63, "learning_rate": 5.4774081668096664e-05, "loss": 0.0044, "step": 630690 }, { "epoch": 1.63, "learning_rate": 5.47701934517252e-05, "loss": 0.0072, "step": 630700 }, { "epoch": 1.63, "learning_rate": 5.4766305235353734e-05, "loss": 0.0088, "step": 630710 }, { "epoch": 1.63, "learning_rate": 5.476241701898227e-05, "loss": 0.0092, "step": 630720 }, { "epoch": 1.63, "learning_rate": 5.47585288026108e-05, "loss": 0.0097, "step": 630730 }, { "epoch": 1.63, "learning_rate": 5.475464058623934e-05, "loss": 0.0075, "step": 630740 }, { "epoch": 1.63, "learning_rate": 5.475075236986787e-05, "loss": 0.0076, "step": 630750 }, { "epoch": 1.64, "learning_rate": 5.4746864153496415e-05, "loss": 0.0091, "step": 630760 }, { "epoch": 1.64, "learning_rate": 5.474297593712495e-05, "loss": 0.0126, "step": 630770 }, { "epoch": 1.64, "learning_rate": 5.4739087720753484e-05, "loss": 0.0083, "step": 630780 }, { "epoch": 1.64, "learning_rate": 5.473519950438202e-05, "loss": 0.0119, "step": 630790 }, { "epoch": 1.64, "learning_rate": 5.4731311288010554e-05, "loss": 0.009, "step": 630800 }, { "epoch": 1.64, "learning_rate": 5.472742307163909e-05, "loss": 0.0091, "step": 630810 }, { "epoch": 1.64, "learning_rate": 5.472353485526762e-05, "loss": 0.0099, "step": 630820 }, { "epoch": 1.64, "learning_rate": 5.471964663889615e-05, "loss": 0.0069, "step": 630830 }, { "epoch": 1.64, "learning_rate": 5.471575842252469e-05, "loss": 0.0143, "step": 630840 }, { "epoch": 1.64, "learning_rate": 5.471187020615322e-05, "loss": 0.0071, "step": 630850 }, { "epoch": 1.64, "learning_rate": 5.470798198978176e-05, "loss": 0.0123, "step": 630860 }, { "epoch": 1.64, "learning_rate": 5.47040937734103e-05, "loss": 0.0072, "step": 630870 }, { "epoch": 1.64, "learning_rate": 5.470020555703883e-05, "loss": 0.0073, "step": 630880 }, { "epoch": 1.64, "learning_rate": 5.469631734066737e-05, "loss": 0.0088, "step": 630890 }, { "epoch": 1.64, "learning_rate": 5.46924291242959e-05, "loss": 0.01, "step": 630900 }, { "epoch": 1.64, "learning_rate": 5.468854090792444e-05, "loss": 0.0102, "step": 630910 }, { "epoch": 1.64, "learning_rate": 5.468465269155297e-05, "loss": 0.0104, "step": 630920 }, { "epoch": 1.64, "learning_rate": 5.468076447518151e-05, "loss": 0.0091, "step": 630930 }, { "epoch": 1.64, "learning_rate": 5.467687625881005e-05, "loss": 0.0088, "step": 630940 }, { "epoch": 1.64, "learning_rate": 5.4672988042438584e-05, "loss": 0.008, "step": 630950 }, { "epoch": 1.64, "learning_rate": 5.466909982606712e-05, "loss": 0.0078, "step": 630960 }, { "epoch": 1.64, "learning_rate": 5.4665211609695654e-05, "loss": 0.0062, "step": 630970 }, { "epoch": 1.64, "learning_rate": 5.466132339332419e-05, "loss": 0.0098, "step": 630980 }, { "epoch": 1.64, "learning_rate": 5.465743517695272e-05, "loss": 0.0073, "step": 630990 }, { "epoch": 1.64, "learning_rate": 5.465354696058126e-05, "loss": 0.0064, "step": 631000 }, { "epoch": 1.64, "eval_cer": 0.8816858906799576, "eval_loss": 0.0054400768131017685, "eval_runtime": 107.7582, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 631000 }, { "epoch": 1.64, "learning_rate": 5.464965874420979e-05, "loss": 0.0078, "step": 631010 }, { "epoch": 1.64, "learning_rate": 5.464577052783833e-05, "loss": 0.0093, "step": 631020 }, { "epoch": 1.64, "learning_rate": 5.464188231146687e-05, "loss": 0.0082, "step": 631030 }, { "epoch": 1.64, "learning_rate": 5.4637994095095404e-05, "loss": 0.0068, "step": 631040 }, { "epoch": 1.64, "learning_rate": 5.463410587872394e-05, "loss": 0.0077, "step": 631050 }, { "epoch": 1.64, "learning_rate": 5.463021766235247e-05, "loss": 0.0074, "step": 631060 }, { "epoch": 1.64, "learning_rate": 5.4626329445981e-05, "loss": 0.008, "step": 631070 }, { "epoch": 1.64, "learning_rate": 5.462244122960954e-05, "loss": 0.0093, "step": 631080 }, { "epoch": 1.64, "learning_rate": 5.461855301323807e-05, "loss": 0.0074, "step": 631090 }, { "epoch": 1.64, "learning_rate": 5.461466479686661e-05, "loss": 0.0087, "step": 631100 }, { "epoch": 1.64, "learning_rate": 5.461077658049514e-05, "loss": 0.0095, "step": 631110 }, { "epoch": 1.64, "learning_rate": 5.460688836412368e-05, "loss": 0.0087, "step": 631120 }, { "epoch": 1.64, "learning_rate": 5.460300014775222e-05, "loss": 0.0066, "step": 631130 }, { "epoch": 1.64, "learning_rate": 5.459911193138075e-05, "loss": 0.0076, "step": 631140 }, { "epoch": 1.64, "learning_rate": 5.459522371500929e-05, "loss": 0.0087, "step": 631150 }, { "epoch": 1.64, "learning_rate": 5.459133549863782e-05, "loss": 0.0122, "step": 631160 }, { "epoch": 1.64, "learning_rate": 5.458744728226636e-05, "loss": 0.0104, "step": 631170 }, { "epoch": 1.64, "learning_rate": 5.458355906589489e-05, "loss": 0.0079, "step": 631180 }, { "epoch": 1.64, "learning_rate": 5.457967084952343e-05, "loss": 0.0062, "step": 631190 }, { "epoch": 1.64, "learning_rate": 5.457578263315196e-05, "loss": 0.0081, "step": 631200 }, { "epoch": 1.64, "learning_rate": 5.4571894416780504e-05, "loss": 0.0112, "step": 631210 }, { "epoch": 1.64, "learning_rate": 5.456800620040904e-05, "loss": 0.0104, "step": 631220 }, { "epoch": 1.64, "learning_rate": 5.4564117984037573e-05, "loss": 0.0129, "step": 631230 }, { "epoch": 1.64, "learning_rate": 5.456022976766611e-05, "loss": 0.0067, "step": 631240 }, { "epoch": 1.64, "learning_rate": 5.455634155129464e-05, "loss": 0.0105, "step": 631250 }, { "epoch": 1.64, "learning_rate": 5.455245333492318e-05, "loss": 0.0095, "step": 631260 }, { "epoch": 1.64, "learning_rate": 5.454856511855171e-05, "loss": 0.0077, "step": 631270 }, { "epoch": 1.64, "learning_rate": 5.454467690218025e-05, "loss": 0.0075, "step": 631280 }, { "epoch": 1.64, "learning_rate": 5.454078868580879e-05, "loss": 0.0071, "step": 631290 }, { "epoch": 1.64, "learning_rate": 5.4536900469437324e-05, "loss": 0.0075, "step": 631300 }, { "epoch": 1.64, "learning_rate": 5.453301225306585e-05, "loss": 0.0094, "step": 631310 }, { "epoch": 1.64, "learning_rate": 5.452912403669439e-05, "loss": 0.0076, "step": 631320 }, { "epoch": 1.64, "learning_rate": 5.452523582032292e-05, "loss": 0.0107, "step": 631330 }, { "epoch": 1.64, "learning_rate": 5.452134760395146e-05, "loss": 0.0088, "step": 631340 }, { "epoch": 1.64, "learning_rate": 5.451745938757999e-05, "loss": 0.0072, "step": 631350 }, { "epoch": 1.64, "learning_rate": 5.451357117120853e-05, "loss": 0.0092, "step": 631360 }, { "epoch": 1.64, "learning_rate": 5.450968295483706e-05, "loss": 0.0059, "step": 631370 }, { "epoch": 1.64, "learning_rate": 5.4505794738465596e-05, "loss": 0.0082, "step": 631380 }, { "epoch": 1.64, "learning_rate": 5.450190652209414e-05, "loss": 0.009, "step": 631390 }, { "epoch": 1.64, "learning_rate": 5.449801830572267e-05, "loss": 0.0098, "step": 631400 }, { "epoch": 1.64, "learning_rate": 5.449413008935121e-05, "loss": 0.0109, "step": 631410 }, { "epoch": 1.64, "learning_rate": 5.449024187297974e-05, "loss": 0.0115, "step": 631420 }, { "epoch": 1.64, "learning_rate": 5.448635365660828e-05, "loss": 0.0081, "step": 631430 }, { "epoch": 1.64, "learning_rate": 5.448246544023681e-05, "loss": 0.0086, "step": 631440 }, { "epoch": 1.64, "learning_rate": 5.447857722386535e-05, "loss": 0.0124, "step": 631450 }, { "epoch": 1.64, "learning_rate": 5.447468900749388e-05, "loss": 0.0078, "step": 631460 }, { "epoch": 1.64, "learning_rate": 5.4470800791122424e-05, "loss": 0.0094, "step": 631470 }, { "epoch": 1.64, "learning_rate": 5.446691257475096e-05, "loss": 0.0068, "step": 631480 }, { "epoch": 1.64, "learning_rate": 5.4463024358379493e-05, "loss": 0.0062, "step": 631490 }, { "epoch": 1.64, "learning_rate": 5.445913614200803e-05, "loss": 0.0087, "step": 631500 }, { "epoch": 1.64, "learning_rate": 5.445524792563656e-05, "loss": 0.0088, "step": 631510 }, { "epoch": 1.64, "learning_rate": 5.44513597092651e-05, "loss": 0.0071, "step": 631520 }, { "epoch": 1.64, "learning_rate": 5.444747149289363e-05, "loss": 0.009, "step": 631530 }, { "epoch": 1.64, "learning_rate": 5.444358327652217e-05, "loss": 0.0128, "step": 631540 }, { "epoch": 1.64, "learning_rate": 5.443969506015071e-05, "loss": 0.0095, "step": 631550 }, { "epoch": 1.64, "learning_rate": 5.443580684377923e-05, "loss": 0.0053, "step": 631560 }, { "epoch": 1.64, "learning_rate": 5.443191862740777e-05, "loss": 0.0072, "step": 631570 }, { "epoch": 1.64, "learning_rate": 5.442803041103631e-05, "loss": 0.0115, "step": 631580 }, { "epoch": 1.64, "learning_rate": 5.442414219466484e-05, "loss": 0.0083, "step": 631590 }, { "epoch": 1.64, "learning_rate": 5.442025397829338e-05, "loss": 0.0062, "step": 631600 }, { "epoch": 1.64, "learning_rate": 5.441636576192191e-05, "loss": 0.0095, "step": 631610 }, { "epoch": 1.64, "learning_rate": 5.441247754555045e-05, "loss": 0.0097, "step": 631620 }, { "epoch": 1.64, "learning_rate": 5.440858932917898e-05, "loss": 0.008, "step": 631630 }, { "epoch": 1.64, "learning_rate": 5.4404701112807516e-05, "loss": 0.0069, "step": 631640 }, { "epoch": 1.64, "learning_rate": 5.440081289643606e-05, "loss": 0.0069, "step": 631650 }, { "epoch": 1.64, "learning_rate": 5.439692468006459e-05, "loss": 0.0072, "step": 631660 }, { "epoch": 1.64, "learning_rate": 5.439303646369313e-05, "loss": 0.0071, "step": 631670 }, { "epoch": 1.64, "learning_rate": 5.438914824732166e-05, "loss": 0.0095, "step": 631680 }, { "epoch": 1.64, "learning_rate": 5.43852600309502e-05, "loss": 0.0078, "step": 631690 }, { "epoch": 1.64, "learning_rate": 5.438137181457873e-05, "loss": 0.0073, "step": 631700 }, { "epoch": 1.64, "learning_rate": 5.437748359820727e-05, "loss": 0.0075, "step": 631710 }, { "epoch": 1.64, "learning_rate": 5.43735953818358e-05, "loss": 0.0094, "step": 631720 }, { "epoch": 1.64, "learning_rate": 5.4369707165464344e-05, "loss": 0.006, "step": 631730 }, { "epoch": 1.64, "learning_rate": 5.436581894909288e-05, "loss": 0.0081, "step": 631740 }, { "epoch": 1.64, "learning_rate": 5.436193073272141e-05, "loss": 0.0059, "step": 631750 }, { "epoch": 1.64, "learning_rate": 5.435804251634995e-05, "loss": 0.0067, "step": 631760 }, { "epoch": 1.64, "learning_rate": 5.435415429997848e-05, "loss": 0.0117, "step": 631770 }, { "epoch": 1.64, "learning_rate": 5.435026608360702e-05, "loss": 0.0079, "step": 631780 }, { "epoch": 1.64, "learning_rate": 5.434637786723555e-05, "loss": 0.0081, "step": 631790 }, { "epoch": 1.64, "learning_rate": 5.434248965086409e-05, "loss": 0.009, "step": 631800 }, { "epoch": 1.64, "learning_rate": 5.4338601434492616e-05, "loss": 0.0085, "step": 631810 }, { "epoch": 1.64, "learning_rate": 5.433471321812115e-05, "loss": 0.0067, "step": 631820 }, { "epoch": 1.64, "learning_rate": 5.433082500174969e-05, "loss": 0.0077, "step": 631830 }, { "epoch": 1.64, "learning_rate": 5.432693678537823e-05, "loss": 0.0078, "step": 631840 }, { "epoch": 1.64, "learning_rate": 5.432304856900676e-05, "loss": 0.0097, "step": 631850 }, { "epoch": 1.64, "learning_rate": 5.43191603526353e-05, "loss": 0.01, "step": 631860 }, { "epoch": 1.64, "learning_rate": 5.431527213626383e-05, "loss": 0.009, "step": 631870 }, { "epoch": 1.64, "learning_rate": 5.4311383919892367e-05, "loss": 0.0064, "step": 631880 }, { "epoch": 1.64, "learning_rate": 5.43074957035209e-05, "loss": 0.008, "step": 631890 }, { "epoch": 1.64, "learning_rate": 5.4303607487149436e-05, "loss": 0.0066, "step": 631900 }, { "epoch": 1.64, "learning_rate": 5.429971927077798e-05, "loss": 0.0056, "step": 631910 }, { "epoch": 1.64, "learning_rate": 5.429583105440651e-05, "loss": 0.0093, "step": 631920 }, { "epoch": 1.64, "learning_rate": 5.429194283803505e-05, "loss": 0.0099, "step": 631930 }, { "epoch": 1.64, "learning_rate": 5.428805462166358e-05, "loss": 0.0087, "step": 631940 }, { "epoch": 1.64, "learning_rate": 5.428416640529212e-05, "loss": 0.0073, "step": 631950 }, { "epoch": 1.64, "learning_rate": 5.428027818892065e-05, "loss": 0.0068, "step": 631960 }, { "epoch": 1.64, "learning_rate": 5.427638997254919e-05, "loss": 0.0083, "step": 631970 }, { "epoch": 1.64, "learning_rate": 5.427250175617772e-05, "loss": 0.006, "step": 631980 }, { "epoch": 1.64, "learning_rate": 5.4268613539806264e-05, "loss": 0.0083, "step": 631990 }, { "epoch": 1.64, "learning_rate": 5.42647253234348e-05, "loss": 0.0084, "step": 632000 }, { "epoch": 1.64, "eval_cer": 0.8816634964890108, "eval_loss": 0.005452393088489771, "eval_runtime": 107.8252, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 632000 }, { "epoch": 1.64, "learning_rate": 5.426083710706333e-05, "loss": 0.0071, "step": 632010 }, { "epoch": 1.64, "learning_rate": 5.425694889069187e-05, "loss": 0.0097, "step": 632020 }, { "epoch": 1.64, "learning_rate": 5.42530606743204e-05, "loss": 0.0083, "step": 632030 }, { "epoch": 1.64, "learning_rate": 5.424917245794894e-05, "loss": 0.0072, "step": 632040 }, { "epoch": 1.64, "learning_rate": 5.424528424157747e-05, "loss": 0.0069, "step": 632050 }, { "epoch": 1.64, "learning_rate": 5.4241396025206e-05, "loss": 0.007, "step": 632060 }, { "epoch": 1.64, "learning_rate": 5.4237507808834536e-05, "loss": 0.0086, "step": 632070 }, { "epoch": 1.64, "learning_rate": 5.423361959246307e-05, "loss": 0.008, "step": 632080 }, { "epoch": 1.64, "learning_rate": 5.422973137609161e-05, "loss": 0.0063, "step": 632090 }, { "epoch": 1.64, "learning_rate": 5.422584315972015e-05, "loss": 0.0073, "step": 632100 }, { "epoch": 1.64, "learning_rate": 5.422195494334868e-05, "loss": 0.0111, "step": 632110 }, { "epoch": 1.64, "learning_rate": 5.421806672697722e-05, "loss": 0.0084, "step": 632120 }, { "epoch": 1.64, "learning_rate": 5.421417851060575e-05, "loss": 0.0102, "step": 632130 }, { "epoch": 1.64, "learning_rate": 5.4210290294234287e-05, "loss": 0.0074, "step": 632140 }, { "epoch": 1.64, "learning_rate": 5.420640207786282e-05, "loss": 0.007, "step": 632150 }, { "epoch": 1.64, "learning_rate": 5.4202513861491356e-05, "loss": 0.0102, "step": 632160 }, { "epoch": 1.64, "learning_rate": 5.41986256451199e-05, "loss": 0.008, "step": 632170 }, { "epoch": 1.64, "learning_rate": 5.419473742874843e-05, "loss": 0.0083, "step": 632180 }, { "epoch": 1.64, "learning_rate": 5.419084921237697e-05, "loss": 0.0083, "step": 632190 }, { "epoch": 1.64, "learning_rate": 5.41869609960055e-05, "loss": 0.0073, "step": 632200 }, { "epoch": 1.64, "learning_rate": 5.418307277963404e-05, "loss": 0.009, "step": 632210 }, { "epoch": 1.64, "learning_rate": 5.417918456326257e-05, "loss": 0.0077, "step": 632220 }, { "epoch": 1.64, "learning_rate": 5.417529634689111e-05, "loss": 0.0081, "step": 632230 }, { "epoch": 1.64, "learning_rate": 5.417140813051964e-05, "loss": 0.0047, "step": 632240 }, { "epoch": 1.64, "learning_rate": 5.4167519914148184e-05, "loss": 0.0086, "step": 632250 }, { "epoch": 1.64, "learning_rate": 5.416363169777672e-05, "loss": 0.0054, "step": 632260 }, { "epoch": 1.64, "learning_rate": 5.415974348140525e-05, "loss": 0.0091, "step": 632270 }, { "epoch": 1.64, "learning_rate": 5.415585526503379e-05, "loss": 0.0054, "step": 632280 }, { "epoch": 1.64, "learning_rate": 5.415196704866232e-05, "loss": 0.006, "step": 632290 }, { "epoch": 1.64, "learning_rate": 5.414807883229085e-05, "loss": 0.0068, "step": 632300 }, { "epoch": 1.64, "learning_rate": 5.4144190615919386e-05, "loss": 0.0062, "step": 632310 }, { "epoch": 1.64, "learning_rate": 5.414030239954792e-05, "loss": 0.0098, "step": 632320 }, { "epoch": 1.64, "learning_rate": 5.4136414183176456e-05, "loss": 0.0068, "step": 632330 }, { "epoch": 1.64, "learning_rate": 5.413252596680499e-05, "loss": 0.0095, "step": 632340 }, { "epoch": 1.64, "learning_rate": 5.412863775043353e-05, "loss": 0.0091, "step": 632350 }, { "epoch": 1.64, "learning_rate": 5.412474953406207e-05, "loss": 0.0076, "step": 632360 }, { "epoch": 1.64, "learning_rate": 5.41208613176906e-05, "loss": 0.0106, "step": 632370 }, { "epoch": 1.64, "learning_rate": 5.411697310131914e-05, "loss": 0.0082, "step": 632380 }, { "epoch": 1.64, "learning_rate": 5.411308488494767e-05, "loss": 0.0068, "step": 632390 }, { "epoch": 1.64, "learning_rate": 5.4109196668576206e-05, "loss": 0.0085, "step": 632400 }, { "epoch": 1.64, "learning_rate": 5.410530845220474e-05, "loss": 0.0086, "step": 632410 }, { "epoch": 1.64, "learning_rate": 5.4101420235833276e-05, "loss": 0.0086, "step": 632420 }, { "epoch": 1.64, "learning_rate": 5.409753201946182e-05, "loss": 0.0065, "step": 632430 }, { "epoch": 1.64, "learning_rate": 5.409364380309035e-05, "loss": 0.0061, "step": 632440 }, { "epoch": 1.64, "learning_rate": 5.408975558671889e-05, "loss": 0.0082, "step": 632450 }, { "epoch": 1.64, "learning_rate": 5.408586737034742e-05, "loss": 0.0061, "step": 632460 }, { "epoch": 1.64, "learning_rate": 5.408197915397596e-05, "loss": 0.0067, "step": 632470 }, { "epoch": 1.64, "learning_rate": 5.407809093760449e-05, "loss": 0.0067, "step": 632480 }, { "epoch": 1.64, "learning_rate": 5.407420272123303e-05, "loss": 0.0084, "step": 632490 }, { "epoch": 1.64, "learning_rate": 5.407031450486156e-05, "loss": 0.0081, "step": 632500 }, { "epoch": 1.64, "learning_rate": 5.40664262884901e-05, "loss": 0.0088, "step": 632510 }, { "epoch": 1.64, "learning_rate": 5.406253807211864e-05, "loss": 0.0089, "step": 632520 }, { "epoch": 1.64, "learning_rate": 5.405864985574717e-05, "loss": 0.0075, "step": 632530 }, { "epoch": 1.64, "learning_rate": 5.405476163937571e-05, "loss": 0.0084, "step": 632540 }, { "epoch": 1.64, "learning_rate": 5.4050873423004236e-05, "loss": 0.0091, "step": 632550 }, { "epoch": 1.64, "learning_rate": 5.404698520663277e-05, "loss": 0.0109, "step": 632560 }, { "epoch": 1.64, "learning_rate": 5.4043096990261306e-05, "loss": 0.0078, "step": 632570 }, { "epoch": 1.64, "learning_rate": 5.403920877388984e-05, "loss": 0.0096, "step": 632580 }, { "epoch": 1.64, "learning_rate": 5.4035320557518376e-05, "loss": 0.0085, "step": 632590 }, { "epoch": 1.64, "learning_rate": 5.403143234114691e-05, "loss": 0.007, "step": 632600 }, { "epoch": 1.64, "learning_rate": 5.4027544124775445e-05, "loss": 0.008, "step": 632610 }, { "epoch": 1.64, "learning_rate": 5.402365590840399e-05, "loss": 0.0095, "step": 632620 }, { "epoch": 1.64, "learning_rate": 5.401976769203252e-05, "loss": 0.0091, "step": 632630 }, { "epoch": 1.64, "learning_rate": 5.401587947566106e-05, "loss": 0.0099, "step": 632640 }, { "epoch": 1.64, "learning_rate": 5.401199125928959e-05, "loss": 0.01, "step": 632650 }, { "epoch": 1.64, "learning_rate": 5.4008103042918126e-05, "loss": 0.0054, "step": 632660 }, { "epoch": 1.64, "learning_rate": 5.400421482654666e-05, "loss": 0.015, "step": 632670 }, { "epoch": 1.64, "learning_rate": 5.4000326610175196e-05, "loss": 0.0087, "step": 632680 }, { "epoch": 1.64, "learning_rate": 5.399643839380373e-05, "loss": 0.0092, "step": 632690 }, { "epoch": 1.64, "learning_rate": 5.399255017743227e-05, "loss": 0.0107, "step": 632700 }, { "epoch": 1.64, "learning_rate": 5.398866196106081e-05, "loss": 0.0077, "step": 632710 }, { "epoch": 1.64, "learning_rate": 5.398477374468934e-05, "loss": 0.0086, "step": 632720 }, { "epoch": 1.64, "learning_rate": 5.398088552831788e-05, "loss": 0.0075, "step": 632730 }, { "epoch": 1.64, "learning_rate": 5.397699731194641e-05, "loss": 0.0094, "step": 632740 }, { "epoch": 1.64, "learning_rate": 5.397310909557495e-05, "loss": 0.0114, "step": 632750 }, { "epoch": 1.64, "learning_rate": 5.396922087920348e-05, "loss": 0.0091, "step": 632760 }, { "epoch": 1.64, "learning_rate": 5.396533266283202e-05, "loss": 0.0109, "step": 632770 }, { "epoch": 1.64, "learning_rate": 5.396144444646056e-05, "loss": 0.0069, "step": 632780 }, { "epoch": 1.64, "learning_rate": 5.395755623008909e-05, "loss": 0.0063, "step": 632790 }, { "epoch": 1.64, "learning_rate": 5.395366801371762e-05, "loss": 0.0088, "step": 632800 }, { "epoch": 1.64, "learning_rate": 5.3949779797346156e-05, "loss": 0.0087, "step": 632810 }, { "epoch": 1.64, "learning_rate": 5.394589158097469e-05, "loss": 0.009, "step": 632820 }, { "epoch": 1.64, "learning_rate": 5.3942003364603226e-05, "loss": 0.008, "step": 632830 }, { "epoch": 1.64, "learning_rate": 5.393811514823176e-05, "loss": 0.0078, "step": 632840 }, { "epoch": 1.64, "learning_rate": 5.3934226931860296e-05, "loss": 0.0069, "step": 632850 }, { "epoch": 1.64, "learning_rate": 5.393033871548883e-05, "loss": 0.0085, "step": 632860 }, { "epoch": 1.64, "learning_rate": 5.3926450499117365e-05, "loss": 0.0123, "step": 632870 }, { "epoch": 1.64, "learning_rate": 5.392256228274591e-05, "loss": 0.0078, "step": 632880 }, { "epoch": 1.64, "learning_rate": 5.391867406637444e-05, "loss": 0.0075, "step": 632890 }, { "epoch": 1.64, "learning_rate": 5.391478585000298e-05, "loss": 0.008, "step": 632900 }, { "epoch": 1.64, "learning_rate": 5.391089763363151e-05, "loss": 0.0068, "step": 632910 }, { "epoch": 1.64, "learning_rate": 5.3907009417260046e-05, "loss": 0.0087, "step": 632920 }, { "epoch": 1.64, "learning_rate": 5.390312120088858e-05, "loss": 0.0086, "step": 632930 }, { "epoch": 1.64, "learning_rate": 5.3899232984517116e-05, "loss": 0.0061, "step": 632940 }, { "epoch": 1.64, "learning_rate": 5.389534476814565e-05, "loss": 0.0111, "step": 632950 }, { "epoch": 1.64, "learning_rate": 5.389145655177419e-05, "loss": 0.0106, "step": 632960 }, { "epoch": 1.64, "learning_rate": 5.388756833540273e-05, "loss": 0.0109, "step": 632970 }, { "epoch": 1.64, "learning_rate": 5.388368011903126e-05, "loss": 0.014, "step": 632980 }, { "epoch": 1.64, "learning_rate": 5.38797919026598e-05, "loss": 0.0063, "step": 632990 }, { "epoch": 1.64, "learning_rate": 5.387590368628833e-05, "loss": 0.0107, "step": 633000 }, { "epoch": 1.64, "eval_cer": 0.8816536990304715, "eval_loss": 0.005239309277385473, "eval_runtime": 107.9136, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 633000 }, { "epoch": 1.64, "learning_rate": 5.387201546991687e-05, "loss": 0.0074, "step": 633010 }, { "epoch": 1.64, "learning_rate": 5.38681272535454e-05, "loss": 0.0081, "step": 633020 }, { "epoch": 1.64, "learning_rate": 5.386423903717394e-05, "loss": 0.0056, "step": 633030 }, { "epoch": 1.64, "learning_rate": 5.386035082080248e-05, "loss": 0.01, "step": 633040 }, { "epoch": 1.64, "learning_rate": 5.3856462604431e-05, "loss": 0.0107, "step": 633050 }, { "epoch": 1.64, "learning_rate": 5.385257438805954e-05, "loss": 0.0072, "step": 633060 }, { "epoch": 1.64, "learning_rate": 5.3848686171688076e-05, "loss": 0.01, "step": 633070 }, { "epoch": 1.64, "learning_rate": 5.384479795531661e-05, "loss": 0.0072, "step": 633080 }, { "epoch": 1.64, "learning_rate": 5.3840909738945146e-05, "loss": 0.0103, "step": 633090 }, { "epoch": 1.64, "learning_rate": 5.383702152257368e-05, "loss": 0.0077, "step": 633100 }, { "epoch": 1.64, "learning_rate": 5.3833133306202216e-05, "loss": 0.0078, "step": 633110 }, { "epoch": 1.64, "learning_rate": 5.382924508983075e-05, "loss": 0.0083, "step": 633120 }, { "epoch": 1.64, "learning_rate": 5.3825356873459285e-05, "loss": 0.0091, "step": 633130 }, { "epoch": 1.64, "learning_rate": 5.382146865708783e-05, "loss": 0.0098, "step": 633140 }, { "epoch": 1.64, "learning_rate": 5.381758044071636e-05, "loss": 0.0065, "step": 633150 }, { "epoch": 1.64, "learning_rate": 5.3813692224344897e-05, "loss": 0.0062, "step": 633160 }, { "epoch": 1.64, "learning_rate": 5.380980400797343e-05, "loss": 0.0055, "step": 633170 }, { "epoch": 1.64, "learning_rate": 5.3805915791601966e-05, "loss": 0.0078, "step": 633180 }, { "epoch": 1.64, "learning_rate": 5.38020275752305e-05, "loss": 0.0099, "step": 633190 }, { "epoch": 1.64, "learning_rate": 5.3798139358859036e-05, "loss": 0.0086, "step": 633200 }, { "epoch": 1.64, "learning_rate": 5.379425114248757e-05, "loss": 0.0091, "step": 633210 }, { "epoch": 1.64, "learning_rate": 5.379036292611611e-05, "loss": 0.0101, "step": 633220 }, { "epoch": 1.64, "learning_rate": 5.378647470974465e-05, "loss": 0.0073, "step": 633230 }, { "epoch": 1.64, "learning_rate": 5.378258649337318e-05, "loss": 0.0053, "step": 633240 }, { "epoch": 1.64, "learning_rate": 5.377869827700172e-05, "loss": 0.0066, "step": 633250 }, { "epoch": 1.64, "learning_rate": 5.377481006063025e-05, "loss": 0.01, "step": 633260 }, { "epoch": 1.64, "learning_rate": 5.377092184425879e-05, "loss": 0.0068, "step": 633270 }, { "epoch": 1.64, "learning_rate": 5.376703362788732e-05, "loss": 0.0086, "step": 633280 }, { "epoch": 1.64, "learning_rate": 5.3763145411515857e-05, "loss": 0.0089, "step": 633290 }, { "epoch": 1.64, "learning_rate": 5.3759257195144385e-05, "loss": 0.0091, "step": 633300 }, { "epoch": 1.64, "learning_rate": 5.375536897877292e-05, "loss": 0.009, "step": 633310 }, { "epoch": 1.64, "learning_rate": 5.375148076240146e-05, "loss": 0.0089, "step": 633320 }, { "epoch": 1.64, "learning_rate": 5.3747592546029996e-05, "loss": 0.0088, "step": 633330 }, { "epoch": 1.64, "learning_rate": 5.374370432965853e-05, "loss": 0.0126, "step": 633340 }, { "epoch": 1.64, "learning_rate": 5.3739816113287066e-05, "loss": 0.0063, "step": 633350 }, { "epoch": 1.64, "learning_rate": 5.37359278969156e-05, "loss": 0.0114, "step": 633360 }, { "epoch": 1.64, "learning_rate": 5.3732039680544135e-05, "loss": 0.0104, "step": 633370 }, { "epoch": 1.64, "learning_rate": 5.372815146417267e-05, "loss": 0.0086, "step": 633380 }, { "epoch": 1.64, "learning_rate": 5.3724263247801205e-05, "loss": 0.0068, "step": 633390 }, { "epoch": 1.64, "learning_rate": 5.372037503142975e-05, "loss": 0.0074, "step": 633400 }, { "epoch": 1.64, "learning_rate": 5.371648681505828e-05, "loss": 0.0074, "step": 633410 }, { "epoch": 1.64, "learning_rate": 5.3712598598686817e-05, "loss": 0.0074, "step": 633420 }, { "epoch": 1.64, "learning_rate": 5.370871038231535e-05, "loss": 0.0075, "step": 633430 }, { "epoch": 1.64, "learning_rate": 5.3704822165943886e-05, "loss": 0.0058, "step": 633440 }, { "epoch": 1.64, "learning_rate": 5.370093394957242e-05, "loss": 0.0077, "step": 633450 }, { "epoch": 1.64, "learning_rate": 5.3697045733200956e-05, "loss": 0.0075, "step": 633460 }, { "epoch": 1.64, "learning_rate": 5.369315751682949e-05, "loss": 0.0102, "step": 633470 }, { "epoch": 1.64, "learning_rate": 5.368926930045803e-05, "loss": 0.0066, "step": 633480 }, { "epoch": 1.64, "learning_rate": 5.368538108408657e-05, "loss": 0.0093, "step": 633490 }, { "epoch": 1.64, "learning_rate": 5.36814928677151e-05, "loss": 0.0073, "step": 633500 }, { "epoch": 1.64, "learning_rate": 5.367760465134364e-05, "loss": 0.0106, "step": 633510 }, { "epoch": 1.64, "learning_rate": 5.367371643497217e-05, "loss": 0.007, "step": 633520 }, { "epoch": 1.64, "learning_rate": 5.366982821860071e-05, "loss": 0.0086, "step": 633530 }, { "epoch": 1.64, "learning_rate": 5.366594000222924e-05, "loss": 0.0073, "step": 633540 }, { "epoch": 1.64, "learning_rate": 5.366205178585777e-05, "loss": 0.0085, "step": 633550 }, { "epoch": 1.64, "learning_rate": 5.3658163569486305e-05, "loss": 0.0064, "step": 633560 }, { "epoch": 1.64, "learning_rate": 5.365427535311484e-05, "loss": 0.0091, "step": 633570 }, { "epoch": 1.64, "learning_rate": 5.365038713674338e-05, "loss": 0.0092, "step": 633580 }, { "epoch": 1.64, "learning_rate": 5.3646498920371916e-05, "loss": 0.009, "step": 633590 }, { "epoch": 1.64, "learning_rate": 5.364261070400045e-05, "loss": 0.0071, "step": 633600 }, { "epoch": 1.64, "learning_rate": 5.3638722487628986e-05, "loss": 0.0084, "step": 633610 }, { "epoch": 1.64, "learning_rate": 5.363483427125752e-05, "loss": 0.0106, "step": 633620 }, { "epoch": 1.64, "learning_rate": 5.3630946054886055e-05, "loss": 0.0083, "step": 633630 }, { "epoch": 1.64, "learning_rate": 5.362705783851459e-05, "loss": 0.0094, "step": 633640 }, { "epoch": 1.64, "learning_rate": 5.3623169622143125e-05, "loss": 0.0088, "step": 633650 }, { "epoch": 1.64, "learning_rate": 5.361928140577167e-05, "loss": 0.0106, "step": 633660 }, { "epoch": 1.64, "learning_rate": 5.36153931894002e-05, "loss": 0.0099, "step": 633670 }, { "epoch": 1.64, "learning_rate": 5.3611504973028737e-05, "loss": 0.0075, "step": 633680 }, { "epoch": 1.64, "learning_rate": 5.360761675665727e-05, "loss": 0.0083, "step": 633690 }, { "epoch": 1.64, "learning_rate": 5.3603728540285806e-05, "loss": 0.0049, "step": 633700 }, { "epoch": 1.64, "learning_rate": 5.359984032391434e-05, "loss": 0.0085, "step": 633710 }, { "epoch": 1.64, "learning_rate": 5.3595952107542876e-05, "loss": 0.0125, "step": 633720 }, { "epoch": 1.64, "learning_rate": 5.359206389117141e-05, "loss": 0.0073, "step": 633730 }, { "epoch": 1.64, "learning_rate": 5.358817567479995e-05, "loss": 0.0078, "step": 633740 }, { "epoch": 1.64, "learning_rate": 5.358428745842849e-05, "loss": 0.0082, "step": 633750 }, { "epoch": 1.64, "learning_rate": 5.358039924205702e-05, "loss": 0.0072, "step": 633760 }, { "epoch": 1.64, "learning_rate": 5.357651102568556e-05, "loss": 0.0084, "step": 633770 }, { "epoch": 1.64, "learning_rate": 5.357262280931409e-05, "loss": 0.0077, "step": 633780 }, { "epoch": 1.64, "learning_rate": 5.356873459294262e-05, "loss": 0.0088, "step": 633790 }, { "epoch": 1.64, "learning_rate": 5.3564846376571155e-05, "loss": 0.0102, "step": 633800 }, { "epoch": 1.64, "learning_rate": 5.356095816019969e-05, "loss": 0.0063, "step": 633810 }, { "epoch": 1.64, "learning_rate": 5.3557069943828225e-05, "loss": 0.0085, "step": 633820 }, { "epoch": 1.64, "learning_rate": 5.355318172745676e-05, "loss": 0.0092, "step": 633830 }, { "epoch": 1.64, "learning_rate": 5.35492935110853e-05, "loss": 0.0067, "step": 633840 }, { "epoch": 1.64, "learning_rate": 5.3545405294713836e-05, "loss": 0.0093, "step": 633850 }, { "epoch": 1.64, "learning_rate": 5.354151707834237e-05, "loss": 0.0088, "step": 633860 }, { "epoch": 1.64, "learning_rate": 5.3537628861970906e-05, "loss": 0.0092, "step": 633870 }, { "epoch": 1.64, "learning_rate": 5.353374064559944e-05, "loss": 0.0087, "step": 633880 }, { "epoch": 1.64, "learning_rate": 5.3529852429227975e-05, "loss": 0.0081, "step": 633890 }, { "epoch": 1.64, "learning_rate": 5.352596421285651e-05, "loss": 0.0095, "step": 633900 }, { "epoch": 1.64, "learning_rate": 5.3522075996485045e-05, "loss": 0.0103, "step": 633910 }, { "epoch": 1.64, "learning_rate": 5.351818778011358e-05, "loss": 0.0113, "step": 633920 }, { "epoch": 1.64, "learning_rate": 5.351429956374212e-05, "loss": 0.0094, "step": 633930 }, { "epoch": 1.64, "learning_rate": 5.3510411347370656e-05, "loss": 0.0062, "step": 633940 }, { "epoch": 1.64, "learning_rate": 5.350652313099919e-05, "loss": 0.0096, "step": 633950 }, { "epoch": 1.64, "learning_rate": 5.3502634914627726e-05, "loss": 0.0088, "step": 633960 }, { "epoch": 1.64, "learning_rate": 5.349874669825626e-05, "loss": 0.0079, "step": 633970 }, { "epoch": 1.64, "learning_rate": 5.3494858481884796e-05, "loss": 0.0102, "step": 633980 }, { "epoch": 1.64, "learning_rate": 5.349097026551333e-05, "loss": 0.0083, "step": 633990 }, { "epoch": 1.64, "learning_rate": 5.3487082049141866e-05, "loss": 0.0062, "step": 634000 }, { "epoch": 1.64, "eval_cer": 0.8816830914060892, "eval_loss": 0.005355716682970524, "eval_runtime": 107.9589, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.631, "step": 634000 }, { "epoch": 1.64, "learning_rate": 5.348319383277041e-05, "loss": 0.0087, "step": 634010 }, { "epoch": 1.64, "learning_rate": 5.347930561639894e-05, "loss": 0.0063, "step": 634020 }, { "epoch": 1.64, "learning_rate": 5.347541740002748e-05, "loss": 0.0094, "step": 634030 }, { "epoch": 1.64, "learning_rate": 5.3471529183656005e-05, "loss": 0.0075, "step": 634040 }, { "epoch": 1.64, "learning_rate": 5.346764096728454e-05, "loss": 0.0092, "step": 634050 }, { "epoch": 1.64, "learning_rate": 5.3463752750913075e-05, "loss": 0.0074, "step": 634060 }, { "epoch": 1.64, "learning_rate": 5.345986453454161e-05, "loss": 0.0064, "step": 634070 }, { "epoch": 1.64, "learning_rate": 5.3455976318170145e-05, "loss": 0.0109, "step": 634080 }, { "epoch": 1.64, "learning_rate": 5.345208810179868e-05, "loss": 0.0085, "step": 634090 }, { "epoch": 1.64, "learning_rate": 5.3448199885427214e-05, "loss": 0.0068, "step": 634100 }, { "epoch": 1.64, "learning_rate": 5.3444311669055756e-05, "loss": 0.0077, "step": 634110 }, { "epoch": 1.64, "learning_rate": 5.344042345268429e-05, "loss": 0.0069, "step": 634120 }, { "epoch": 1.64, "learning_rate": 5.3436535236312826e-05, "loss": 0.0074, "step": 634130 }, { "epoch": 1.64, "learning_rate": 5.343264701994136e-05, "loss": 0.0082, "step": 634140 }, { "epoch": 1.64, "learning_rate": 5.3428758803569895e-05, "loss": 0.0094, "step": 634150 }, { "epoch": 1.64, "learning_rate": 5.342487058719843e-05, "loss": 0.0087, "step": 634160 }, { "epoch": 1.64, "learning_rate": 5.3420982370826965e-05, "loss": 0.0088, "step": 634170 }, { "epoch": 1.64, "learning_rate": 5.34170941544555e-05, "loss": 0.0067, "step": 634180 }, { "epoch": 1.64, "learning_rate": 5.341320593808404e-05, "loss": 0.0072, "step": 634190 }, { "epoch": 1.64, "learning_rate": 5.3409317721712576e-05, "loss": 0.0078, "step": 634200 }, { "epoch": 1.64, "learning_rate": 5.340542950534111e-05, "loss": 0.0075, "step": 634210 }, { "epoch": 1.64, "learning_rate": 5.3401541288969646e-05, "loss": 0.0077, "step": 634220 }, { "epoch": 1.64, "learning_rate": 5.339765307259818e-05, "loss": 0.0111, "step": 634230 }, { "epoch": 1.64, "learning_rate": 5.3393764856226716e-05, "loss": 0.0064, "step": 634240 }, { "epoch": 1.64, "learning_rate": 5.338987663985525e-05, "loss": 0.0086, "step": 634250 }, { "epoch": 1.64, "learning_rate": 5.3385988423483786e-05, "loss": 0.0087, "step": 634260 }, { "epoch": 1.64, "learning_rate": 5.338210020711233e-05, "loss": 0.0061, "step": 634270 }, { "epoch": 1.64, "learning_rate": 5.337821199074086e-05, "loss": 0.0072, "step": 634280 }, { "epoch": 1.64, "learning_rate": 5.337432377436939e-05, "loss": 0.0116, "step": 634290 }, { "epoch": 1.64, "learning_rate": 5.3370435557997925e-05, "loss": 0.0079, "step": 634300 }, { "epoch": 1.64, "learning_rate": 5.336654734162646e-05, "loss": 0.0079, "step": 634310 }, { "epoch": 1.64, "learning_rate": 5.3362659125254995e-05, "loss": 0.0053, "step": 634320 }, { "epoch": 1.64, "learning_rate": 5.335877090888353e-05, "loss": 0.0057, "step": 634330 }, { "epoch": 1.64, "learning_rate": 5.3354882692512064e-05, "loss": 0.0114, "step": 634340 }, { "epoch": 1.64, "learning_rate": 5.33509944761406e-05, "loss": 0.0073, "step": 634350 }, { "epoch": 1.64, "learning_rate": 5.3347106259769134e-05, "loss": 0.0075, "step": 634360 }, { "epoch": 1.64, "learning_rate": 5.3343218043397676e-05, "loss": 0.0073, "step": 634370 }, { "epoch": 1.64, "learning_rate": 5.333932982702621e-05, "loss": 0.0109, "step": 634380 }, { "epoch": 1.64, "learning_rate": 5.3335441610654746e-05, "loss": 0.0083, "step": 634390 }, { "epoch": 1.64, "learning_rate": 5.333155339428328e-05, "loss": 0.0078, "step": 634400 }, { "epoch": 1.64, "learning_rate": 5.3327665177911815e-05, "loss": 0.0087, "step": 634410 }, { "epoch": 1.64, "learning_rate": 5.332377696154035e-05, "loss": 0.0108, "step": 634420 }, { "epoch": 1.64, "learning_rate": 5.3319888745168885e-05, "loss": 0.0116, "step": 634430 }, { "epoch": 1.64, "learning_rate": 5.331600052879742e-05, "loss": 0.0072, "step": 634440 }, { "epoch": 1.64, "learning_rate": 5.331211231242596e-05, "loss": 0.0112, "step": 634450 }, { "epoch": 1.64, "learning_rate": 5.3308224096054496e-05, "loss": 0.0097, "step": 634460 }, { "epoch": 1.64, "learning_rate": 5.330433587968303e-05, "loss": 0.0081, "step": 634470 }, { "epoch": 1.64, "learning_rate": 5.3300447663311566e-05, "loss": 0.0066, "step": 634480 }, { "epoch": 1.64, "learning_rate": 5.32965594469401e-05, "loss": 0.008, "step": 634490 }, { "epoch": 1.64, "learning_rate": 5.3292671230568636e-05, "loss": 0.01, "step": 634500 }, { "epoch": 1.64, "learning_rate": 5.328878301419717e-05, "loss": 0.0096, "step": 634510 }, { "epoch": 1.64, "learning_rate": 5.3284894797825706e-05, "loss": 0.0083, "step": 634520 }, { "epoch": 1.64, "learning_rate": 5.328100658145425e-05, "loss": 0.0104, "step": 634530 }, { "epoch": 1.64, "learning_rate": 5.327711836508277e-05, "loss": 0.0097, "step": 634540 }, { "epoch": 1.64, "learning_rate": 5.327323014871131e-05, "loss": 0.0067, "step": 634550 }, { "epoch": 1.64, "learning_rate": 5.3269341932339845e-05, "loss": 0.0109, "step": 634560 }, { "epoch": 1.64, "learning_rate": 5.326545371596838e-05, "loss": 0.0095, "step": 634570 }, { "epoch": 1.64, "learning_rate": 5.3261565499596915e-05, "loss": 0.0126, "step": 634580 }, { "epoch": 1.64, "learning_rate": 5.325767728322545e-05, "loss": 0.0077, "step": 634590 }, { "epoch": 1.64, "learning_rate": 5.3253789066853984e-05, "loss": 0.0112, "step": 634600 }, { "epoch": 1.64, "learning_rate": 5.324990085048252e-05, "loss": 0.0087, "step": 634610 }, { "epoch": 1.65, "learning_rate": 5.3246012634111054e-05, "loss": 0.0089, "step": 634620 }, { "epoch": 1.65, "learning_rate": 5.3242124417739596e-05, "loss": 0.006, "step": 634630 }, { "epoch": 1.65, "learning_rate": 5.323823620136813e-05, "loss": 0.0074, "step": 634640 }, { "epoch": 1.65, "learning_rate": 5.3234347984996666e-05, "loss": 0.0076, "step": 634650 }, { "epoch": 1.65, "learning_rate": 5.32304597686252e-05, "loss": 0.0068, "step": 634660 }, { "epoch": 1.65, "learning_rate": 5.3226571552253735e-05, "loss": 0.0085, "step": 634670 }, { "epoch": 1.65, "learning_rate": 5.322268333588227e-05, "loss": 0.0099, "step": 634680 }, { "epoch": 1.65, "learning_rate": 5.3218795119510805e-05, "loss": 0.0096, "step": 634690 }, { "epoch": 1.65, "learning_rate": 5.321490690313934e-05, "loss": 0.0089, "step": 634700 }, { "epoch": 1.65, "learning_rate": 5.321101868676788e-05, "loss": 0.0081, "step": 634710 }, { "epoch": 1.65, "learning_rate": 5.3207130470396416e-05, "loss": 0.0085, "step": 634720 }, { "epoch": 1.65, "learning_rate": 5.320324225402495e-05, "loss": 0.0101, "step": 634730 }, { "epoch": 1.65, "learning_rate": 5.3199354037653486e-05, "loss": 0.0083, "step": 634740 }, { "epoch": 1.65, "learning_rate": 5.319546582128202e-05, "loss": 0.0068, "step": 634750 }, { "epoch": 1.65, "learning_rate": 5.3191577604910556e-05, "loss": 0.0117, "step": 634760 }, { "epoch": 1.65, "learning_rate": 5.318768938853909e-05, "loss": 0.0104, "step": 634770 }, { "epoch": 1.65, "learning_rate": 5.3183801172167625e-05, "loss": 0.0065, "step": 634780 }, { "epoch": 1.65, "learning_rate": 5.3179912955796154e-05, "loss": 0.0112, "step": 634790 }, { "epoch": 1.65, "learning_rate": 5.317602473942469e-05, "loss": 0.0105, "step": 634800 }, { "epoch": 1.65, "learning_rate": 5.317213652305323e-05, "loss": 0.0068, "step": 634810 }, { "epoch": 1.65, "learning_rate": 5.3168248306681765e-05, "loss": 0.0074, "step": 634820 }, { "epoch": 1.65, "learning_rate": 5.31643600903103e-05, "loss": 0.0082, "step": 634830 }, { "epoch": 1.65, "learning_rate": 5.3160471873938835e-05, "loss": 0.008, "step": 634840 }, { "epoch": 1.65, "learning_rate": 5.315658365756737e-05, "loss": 0.0069, "step": 634850 }, { "epoch": 1.65, "learning_rate": 5.3152695441195904e-05, "loss": 0.0074, "step": 634860 }, { "epoch": 1.65, "learning_rate": 5.314880722482444e-05, "loss": 0.0077, "step": 634870 }, { "epoch": 1.65, "learning_rate": 5.3144919008452974e-05, "loss": 0.009, "step": 634880 }, { "epoch": 1.65, "learning_rate": 5.3141030792081516e-05, "loss": 0.0125, "step": 634890 }, { "epoch": 1.65, "learning_rate": 5.313714257571005e-05, "loss": 0.0087, "step": 634900 }, { "epoch": 1.65, "learning_rate": 5.3133254359338585e-05, "loss": 0.009, "step": 634910 }, { "epoch": 1.65, "learning_rate": 5.312936614296712e-05, "loss": 0.0077, "step": 634920 }, { "epoch": 1.65, "learning_rate": 5.3125477926595655e-05, "loss": 0.0085, "step": 634930 }, { "epoch": 1.65, "learning_rate": 5.312158971022419e-05, "loss": 0.0093, "step": 634940 }, { "epoch": 1.65, "learning_rate": 5.3117701493852725e-05, "loss": 0.0077, "step": 634950 }, { "epoch": 1.65, "learning_rate": 5.311381327748126e-05, "loss": 0.007, "step": 634960 }, { "epoch": 1.65, "learning_rate": 5.31099250611098e-05, "loss": 0.0056, "step": 634970 }, { "epoch": 1.65, "learning_rate": 5.3106036844738336e-05, "loss": 0.0117, "step": 634980 }, { "epoch": 1.65, "learning_rate": 5.310214862836687e-05, "loss": 0.0078, "step": 634990 }, { "epoch": 1.65, "learning_rate": 5.3098260411995406e-05, "loss": 0.0047, "step": 635000 }, { "epoch": 1.65, "eval_cer": 0.8816718943106159, "eval_loss": 0.005286786239594221, "eval_runtime": 107.9393, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 635000 }, { "epoch": 1.65, "learning_rate": 5.309437219562394e-05, "loss": 0.0077, "step": 635010 }, { "epoch": 1.65, "learning_rate": 5.3090483979252476e-05, "loss": 0.0082, "step": 635020 }, { "epoch": 1.65, "learning_rate": 5.3086595762881004e-05, "loss": 0.0077, "step": 635030 }, { "epoch": 1.65, "learning_rate": 5.308270754650954e-05, "loss": 0.0109, "step": 635040 }, { "epoch": 1.65, "learning_rate": 5.3078819330138074e-05, "loss": 0.0085, "step": 635050 }, { "epoch": 1.65, "learning_rate": 5.307493111376661e-05, "loss": 0.0095, "step": 635060 }, { "epoch": 1.65, "learning_rate": 5.307104289739515e-05, "loss": 0.01, "step": 635070 }, { "epoch": 1.65, "learning_rate": 5.3067154681023685e-05, "loss": 0.0074, "step": 635080 }, { "epoch": 1.65, "learning_rate": 5.306326646465222e-05, "loss": 0.0093, "step": 635090 }, { "epoch": 1.65, "learning_rate": 5.3059378248280755e-05, "loss": 0.0082, "step": 635100 }, { "epoch": 1.65, "learning_rate": 5.305549003190929e-05, "loss": 0.0091, "step": 635110 }, { "epoch": 1.65, "learning_rate": 5.3051601815537824e-05, "loss": 0.0084, "step": 635120 }, { "epoch": 1.65, "learning_rate": 5.304771359916636e-05, "loss": 0.0093, "step": 635130 }, { "epoch": 1.65, "learning_rate": 5.3043825382794894e-05, "loss": 0.0081, "step": 635140 }, { "epoch": 1.65, "learning_rate": 5.3039937166423436e-05, "loss": 0.0084, "step": 635150 }, { "epoch": 1.65, "learning_rate": 5.303604895005197e-05, "loss": 0.0082, "step": 635160 }, { "epoch": 1.65, "learning_rate": 5.3032160733680505e-05, "loss": 0.0072, "step": 635170 }, { "epoch": 1.65, "learning_rate": 5.302827251730904e-05, "loss": 0.0101, "step": 635180 }, { "epoch": 1.65, "learning_rate": 5.3024384300937575e-05, "loss": 0.0076, "step": 635190 }, { "epoch": 1.65, "learning_rate": 5.302049608456611e-05, "loss": 0.0084, "step": 635200 }, { "epoch": 1.65, "learning_rate": 5.3016607868194645e-05, "loss": 0.0073, "step": 635210 }, { "epoch": 1.65, "learning_rate": 5.301271965182318e-05, "loss": 0.0092, "step": 635220 }, { "epoch": 1.65, "learning_rate": 5.3008831435451715e-05, "loss": 0.0096, "step": 635230 }, { "epoch": 1.65, "learning_rate": 5.3004943219080256e-05, "loss": 0.0088, "step": 635240 }, { "epoch": 1.65, "learning_rate": 5.300105500270879e-05, "loss": 0.0075, "step": 635250 }, { "epoch": 1.65, "learning_rate": 5.2997166786337326e-05, "loss": 0.0079, "step": 635260 }, { "epoch": 1.65, "learning_rate": 5.299327856996586e-05, "loss": 0.0076, "step": 635270 }, { "epoch": 1.65, "learning_rate": 5.298939035359439e-05, "loss": 0.0071, "step": 635280 }, { "epoch": 1.65, "learning_rate": 5.2985502137222924e-05, "loss": 0.0135, "step": 635290 }, { "epoch": 1.65, "learning_rate": 5.298161392085146e-05, "loss": 0.0078, "step": 635300 }, { "epoch": 1.65, "learning_rate": 5.2977725704479993e-05, "loss": 0.0108, "step": 635310 }, { "epoch": 1.65, "learning_rate": 5.297383748810853e-05, "loss": 0.0077, "step": 635320 }, { "epoch": 1.65, "learning_rate": 5.296994927173707e-05, "loss": 0.0091, "step": 635330 }, { "epoch": 1.65, "learning_rate": 5.2966061055365605e-05, "loss": 0.0081, "step": 635340 }, { "epoch": 1.65, "learning_rate": 5.296217283899414e-05, "loss": 0.0097, "step": 635350 }, { "epoch": 1.65, "learning_rate": 5.2958284622622675e-05, "loss": 0.0085, "step": 635360 }, { "epoch": 1.65, "learning_rate": 5.295439640625121e-05, "loss": 0.0081, "step": 635370 }, { "epoch": 1.65, "learning_rate": 5.2950508189879744e-05, "loss": 0.0059, "step": 635380 }, { "epoch": 1.65, "learning_rate": 5.294661997350828e-05, "loss": 0.0081, "step": 635390 }, { "epoch": 1.65, "learning_rate": 5.2942731757136814e-05, "loss": 0.0095, "step": 635400 }, { "epoch": 1.65, "learning_rate": 5.293884354076535e-05, "loss": 0.0081, "step": 635410 }, { "epoch": 1.65, "learning_rate": 5.293495532439389e-05, "loss": 0.0092, "step": 635420 }, { "epoch": 1.65, "learning_rate": 5.2931067108022425e-05, "loss": 0.009, "step": 635430 }, { "epoch": 1.65, "learning_rate": 5.292717889165096e-05, "loss": 0.0156, "step": 635440 }, { "epoch": 1.65, "learning_rate": 5.2923290675279495e-05, "loss": 0.0079, "step": 635450 }, { "epoch": 1.65, "learning_rate": 5.291940245890803e-05, "loss": 0.0083, "step": 635460 }, { "epoch": 1.65, "learning_rate": 5.2915514242536565e-05, "loss": 0.0086, "step": 635470 }, { "epoch": 1.65, "learning_rate": 5.29116260261651e-05, "loss": 0.0078, "step": 635480 }, { "epoch": 1.65, "learning_rate": 5.2907737809793635e-05, "loss": 0.0094, "step": 635490 }, { "epoch": 1.65, "learning_rate": 5.2903849593422176e-05, "loss": 0.0072, "step": 635500 }, { "epoch": 1.65, "learning_rate": 5.289996137705071e-05, "loss": 0.0099, "step": 635510 }, { "epoch": 1.65, "learning_rate": 5.2896073160679246e-05, "loss": 0.0067, "step": 635520 }, { "epoch": 1.65, "learning_rate": 5.2892184944307774e-05, "loss": 0.0061, "step": 635530 }, { "epoch": 1.65, "learning_rate": 5.288829672793631e-05, "loss": 0.0086, "step": 635540 }, { "epoch": 1.65, "learning_rate": 5.2884408511564844e-05, "loss": 0.0077, "step": 635550 }, { "epoch": 1.65, "learning_rate": 5.288052029519338e-05, "loss": 0.008, "step": 635560 }, { "epoch": 1.65, "learning_rate": 5.2876632078821913e-05, "loss": 0.0067, "step": 635570 }, { "epoch": 1.65, "learning_rate": 5.287274386245045e-05, "loss": 0.0095, "step": 635580 }, { "epoch": 1.65, "learning_rate": 5.286885564607898e-05, "loss": 0.0089, "step": 635590 }, { "epoch": 1.65, "learning_rate": 5.2864967429707525e-05, "loss": 0.0099, "step": 635600 }, { "epoch": 1.65, "learning_rate": 5.286107921333606e-05, "loss": 0.0069, "step": 635610 }, { "epoch": 1.65, "learning_rate": 5.2857190996964595e-05, "loss": 0.0073, "step": 635620 }, { "epoch": 1.65, "learning_rate": 5.285330278059313e-05, "loss": 0.0079, "step": 635630 }, { "epoch": 1.65, "learning_rate": 5.2849414564221664e-05, "loss": 0.0076, "step": 635640 }, { "epoch": 1.65, "learning_rate": 5.28455263478502e-05, "loss": 0.008, "step": 635650 }, { "epoch": 1.65, "learning_rate": 5.2841638131478734e-05, "loss": 0.0072, "step": 635660 }, { "epoch": 1.65, "learning_rate": 5.283774991510727e-05, "loss": 0.0115, "step": 635670 }, { "epoch": 1.65, "learning_rate": 5.283386169873581e-05, "loss": 0.0081, "step": 635680 }, { "epoch": 1.65, "learning_rate": 5.2829973482364345e-05, "loss": 0.0091, "step": 635690 }, { "epoch": 1.65, "learning_rate": 5.282608526599288e-05, "loss": 0.0097, "step": 635700 }, { "epoch": 1.65, "learning_rate": 5.2822197049621415e-05, "loss": 0.0061, "step": 635710 }, { "epoch": 1.65, "learning_rate": 5.281830883324995e-05, "loss": 0.0062, "step": 635720 }, { "epoch": 1.65, "learning_rate": 5.2814420616878485e-05, "loss": 0.0073, "step": 635730 }, { "epoch": 1.65, "learning_rate": 5.281053240050702e-05, "loss": 0.0094, "step": 635740 }, { "epoch": 1.65, "learning_rate": 5.2806644184135554e-05, "loss": 0.0077, "step": 635750 }, { "epoch": 1.65, "learning_rate": 5.2802755967764096e-05, "loss": 0.0094, "step": 635760 }, { "epoch": 1.65, "learning_rate": 5.279886775139263e-05, "loss": 0.0086, "step": 635770 }, { "epoch": 1.65, "learning_rate": 5.279497953502116e-05, "loss": 0.0078, "step": 635780 }, { "epoch": 1.65, "learning_rate": 5.2791091318649694e-05, "loss": 0.0123, "step": 635790 }, { "epoch": 1.65, "learning_rate": 5.278720310227823e-05, "loss": 0.0065, "step": 635800 }, { "epoch": 1.65, "learning_rate": 5.2783314885906764e-05, "loss": 0.0051, "step": 635810 }, { "epoch": 1.65, "learning_rate": 5.27794266695353e-05, "loss": 0.0077, "step": 635820 }, { "epoch": 1.65, "learning_rate": 5.277553845316383e-05, "loss": 0.0092, "step": 635830 }, { "epoch": 1.65, "learning_rate": 5.277165023679237e-05, "loss": 0.008, "step": 635840 }, { "epoch": 1.65, "learning_rate": 5.27677620204209e-05, "loss": 0.0092, "step": 635850 }, { "epoch": 1.65, "learning_rate": 5.2763873804049445e-05, "loss": 0.0079, "step": 635860 }, { "epoch": 1.65, "learning_rate": 5.275998558767798e-05, "loss": 0.0101, "step": 635870 }, { "epoch": 1.65, "learning_rate": 5.2756097371306514e-05, "loss": 0.0087, "step": 635880 }, { "epoch": 1.65, "learning_rate": 5.275220915493505e-05, "loss": 0.0096, "step": 635890 }, { "epoch": 1.65, "learning_rate": 5.2748320938563584e-05, "loss": 0.008, "step": 635900 }, { "epoch": 1.65, "learning_rate": 5.274443272219212e-05, "loss": 0.0102, "step": 635910 }, { "epoch": 1.65, "learning_rate": 5.2740544505820654e-05, "loss": 0.0115, "step": 635920 }, { "epoch": 1.65, "learning_rate": 5.273665628944919e-05, "loss": 0.0074, "step": 635930 }, { "epoch": 1.65, "learning_rate": 5.273276807307773e-05, "loss": 0.008, "step": 635940 }, { "epoch": 1.65, "learning_rate": 5.2728879856706265e-05, "loss": 0.0084, "step": 635950 }, { "epoch": 1.65, "learning_rate": 5.27249916403348e-05, "loss": 0.0092, "step": 635960 }, { "epoch": 1.65, "learning_rate": 5.2721103423963335e-05, "loss": 0.0104, "step": 635970 }, { "epoch": 1.65, "learning_rate": 5.271721520759187e-05, "loss": 0.011, "step": 635980 }, { "epoch": 1.65, "learning_rate": 5.2713326991220405e-05, "loss": 0.0051, "step": 635990 }, { "epoch": 1.65, "learning_rate": 5.270943877484894e-05, "loss": 0.0082, "step": 636000 }, { "epoch": 1.65, "eval_cer": 0.8817012866862336, "eval_loss": 0.005146949551999569, "eval_runtime": 108.0488, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.628, "step": 636000 }, { "epoch": 1.65, "learning_rate": 5.2705550558477474e-05, "loss": 0.0081, "step": 636010 }, { "epoch": 1.65, "learning_rate": 5.2701662342106016e-05, "loss": 0.0068, "step": 636020 }, { "epoch": 1.65, "learning_rate": 5.269777412573454e-05, "loss": 0.0096, "step": 636030 }, { "epoch": 1.65, "learning_rate": 5.269388590936308e-05, "loss": 0.0072, "step": 636040 }, { "epoch": 1.65, "learning_rate": 5.2689997692991614e-05, "loss": 0.0082, "step": 636050 }, { "epoch": 1.65, "learning_rate": 5.268610947662015e-05, "loss": 0.0062, "step": 636060 }, { "epoch": 1.65, "learning_rate": 5.2682221260248684e-05, "loss": 0.0086, "step": 636070 }, { "epoch": 1.65, "learning_rate": 5.267833304387722e-05, "loss": 0.0073, "step": 636080 }, { "epoch": 1.65, "learning_rate": 5.267444482750575e-05, "loss": 0.0081, "step": 636090 }, { "epoch": 1.65, "learning_rate": 5.267055661113429e-05, "loss": 0.0093, "step": 636100 }, { "epoch": 1.65, "learning_rate": 5.266666839476282e-05, "loss": 0.0101, "step": 636110 }, { "epoch": 1.65, "learning_rate": 5.2662780178391365e-05, "loss": 0.0071, "step": 636120 }, { "epoch": 1.65, "learning_rate": 5.26588919620199e-05, "loss": 0.0057, "step": 636130 }, { "epoch": 1.65, "learning_rate": 5.2655003745648434e-05, "loss": 0.0091, "step": 636140 }, { "epoch": 1.65, "learning_rate": 5.265111552927697e-05, "loss": 0.01, "step": 636150 }, { "epoch": 1.65, "learning_rate": 5.2647227312905504e-05, "loss": 0.0081, "step": 636160 }, { "epoch": 1.65, "learning_rate": 5.264333909653404e-05, "loss": 0.0059, "step": 636170 }, { "epoch": 1.65, "learning_rate": 5.2639450880162574e-05, "loss": 0.0093, "step": 636180 }, { "epoch": 1.65, "learning_rate": 5.263556266379111e-05, "loss": 0.006, "step": 636190 }, { "epoch": 1.65, "learning_rate": 5.263167444741965e-05, "loss": 0.0081, "step": 636200 }, { "epoch": 1.65, "learning_rate": 5.2627786231048185e-05, "loss": 0.0089, "step": 636210 }, { "epoch": 1.65, "learning_rate": 5.262389801467672e-05, "loss": 0.0068, "step": 636220 }, { "epoch": 1.65, "learning_rate": 5.2620009798305255e-05, "loss": 0.0052, "step": 636230 }, { "epoch": 1.65, "learning_rate": 5.261612158193379e-05, "loss": 0.0122, "step": 636240 }, { "epoch": 1.65, "learning_rate": 5.2612233365562325e-05, "loss": 0.0116, "step": 636250 }, { "epoch": 1.65, "learning_rate": 5.260834514919086e-05, "loss": 0.0093, "step": 636260 }, { "epoch": 1.65, "learning_rate": 5.260445693281939e-05, "loss": 0.0076, "step": 636270 }, { "epoch": 1.65, "learning_rate": 5.260056871644792e-05, "loss": 0.0065, "step": 636280 }, { "epoch": 1.65, "learning_rate": 5.259668050007646e-05, "loss": 0.0101, "step": 636290 }, { "epoch": 1.65, "learning_rate": 5.2592792283705e-05, "loss": 0.0089, "step": 636300 }, { "epoch": 1.65, "learning_rate": 5.2588904067333534e-05, "loss": 0.0082, "step": 636310 }, { "epoch": 1.65, "learning_rate": 5.258501585096207e-05, "loss": 0.008, "step": 636320 }, { "epoch": 1.65, "learning_rate": 5.2581127634590604e-05, "loss": 0.008, "step": 636330 }, { "epoch": 1.65, "learning_rate": 5.257723941821914e-05, "loss": 0.0094, "step": 636340 }, { "epoch": 1.65, "learning_rate": 5.257335120184767e-05, "loss": 0.0066, "step": 636350 }, { "epoch": 1.65, "learning_rate": 5.256946298547621e-05, "loss": 0.0068, "step": 636360 }, { "epoch": 1.65, "learning_rate": 5.256557476910474e-05, "loss": 0.0062, "step": 636370 }, { "epoch": 1.65, "learning_rate": 5.2561686552733285e-05, "loss": 0.0061, "step": 636380 }, { "epoch": 1.65, "learning_rate": 5.255779833636182e-05, "loss": 0.0073, "step": 636390 }, { "epoch": 1.65, "learning_rate": 5.2553910119990354e-05, "loss": 0.0099, "step": 636400 }, { "epoch": 1.65, "learning_rate": 5.255002190361889e-05, "loss": 0.0073, "step": 636410 }, { "epoch": 1.65, "learning_rate": 5.2546133687247424e-05, "loss": 0.007, "step": 636420 }, { "epoch": 1.65, "learning_rate": 5.254224547087596e-05, "loss": 0.0106, "step": 636430 }, { "epoch": 1.65, "learning_rate": 5.2538357254504494e-05, "loss": 0.0073, "step": 636440 }, { "epoch": 1.65, "learning_rate": 5.253446903813303e-05, "loss": 0.0075, "step": 636450 }, { "epoch": 1.65, "learning_rate": 5.253058082176157e-05, "loss": 0.0101, "step": 636460 }, { "epoch": 1.65, "learning_rate": 5.2526692605390105e-05, "loss": 0.0088, "step": 636470 }, { "epoch": 1.65, "learning_rate": 5.252280438901864e-05, "loss": 0.0092, "step": 636480 }, { "epoch": 1.65, "learning_rate": 5.2518916172647175e-05, "loss": 0.0093, "step": 636490 }, { "epoch": 1.65, "learning_rate": 5.251502795627571e-05, "loss": 0.0067, "step": 636500 }, { "epoch": 1.65, "learning_rate": 5.2511139739904245e-05, "loss": 0.0104, "step": 636510 }, { "epoch": 1.65, "learning_rate": 5.250725152353277e-05, "loss": 0.009, "step": 636520 }, { "epoch": 1.65, "learning_rate": 5.250336330716131e-05, "loss": 0.0063, "step": 636530 }, { "epoch": 1.65, "learning_rate": 5.249947509078984e-05, "loss": 0.0066, "step": 636540 }, { "epoch": 1.65, "learning_rate": 5.249558687441838e-05, "loss": 0.007, "step": 636550 }, { "epoch": 1.65, "learning_rate": 5.249169865804692e-05, "loss": 0.0054, "step": 636560 }, { "epoch": 1.65, "learning_rate": 5.2487810441675454e-05, "loss": 0.0054, "step": 636570 }, { "epoch": 1.65, "learning_rate": 5.248392222530399e-05, "loss": 0.0087, "step": 636580 }, { "epoch": 1.65, "learning_rate": 5.2480034008932524e-05, "loss": 0.0083, "step": 636590 }, { "epoch": 1.65, "learning_rate": 5.247614579256106e-05, "loss": 0.0087, "step": 636600 }, { "epoch": 1.65, "learning_rate": 5.247225757618959e-05, "loss": 0.0098, "step": 636610 }, { "epoch": 1.65, "learning_rate": 5.246836935981813e-05, "loss": 0.0087, "step": 636620 }, { "epoch": 1.65, "learning_rate": 5.246448114344666e-05, "loss": 0.0092, "step": 636630 }, { "epoch": 1.65, "learning_rate": 5.2460592927075205e-05, "loss": 0.0113, "step": 636640 }, { "epoch": 1.65, "learning_rate": 5.245670471070374e-05, "loss": 0.0069, "step": 636650 }, { "epoch": 1.65, "learning_rate": 5.2452816494332274e-05, "loss": 0.0068, "step": 636660 }, { "epoch": 1.65, "learning_rate": 5.244892827796081e-05, "loss": 0.0112, "step": 636670 }, { "epoch": 1.65, "learning_rate": 5.2445040061589344e-05, "loss": 0.0094, "step": 636680 }, { "epoch": 1.65, "learning_rate": 5.244115184521788e-05, "loss": 0.0073, "step": 636690 }, { "epoch": 1.65, "learning_rate": 5.2437263628846414e-05, "loss": 0.0083, "step": 636700 }, { "epoch": 1.65, "learning_rate": 5.243337541247495e-05, "loss": 0.0085, "step": 636710 }, { "epoch": 1.65, "learning_rate": 5.2429487196103483e-05, "loss": 0.0088, "step": 636720 }, { "epoch": 1.65, "learning_rate": 5.2425598979732025e-05, "loss": 0.0111, "step": 636730 }, { "epoch": 1.65, "learning_rate": 5.242171076336056e-05, "loss": 0.0058, "step": 636740 }, { "epoch": 1.65, "learning_rate": 5.2417822546989095e-05, "loss": 0.0103, "step": 636750 }, { "epoch": 1.65, "learning_rate": 5.241393433061763e-05, "loss": 0.0072, "step": 636760 }, { "epoch": 1.65, "learning_rate": 5.241004611424616e-05, "loss": 0.0069, "step": 636770 }, { "epoch": 1.65, "learning_rate": 5.240615789787469e-05, "loss": 0.0105, "step": 636780 }, { "epoch": 1.65, "learning_rate": 5.240226968150323e-05, "loss": 0.009, "step": 636790 }, { "epoch": 1.65, "learning_rate": 5.239838146513176e-05, "loss": 0.0099, "step": 636800 }, { "epoch": 1.65, "learning_rate": 5.23944932487603e-05, "loss": 0.0075, "step": 636810 }, { "epoch": 1.65, "learning_rate": 5.239060503238883e-05, "loss": 0.0113, "step": 636820 }, { "epoch": 1.65, "learning_rate": 5.2386716816017374e-05, "loss": 0.0067, "step": 636830 }, { "epoch": 1.65, "learning_rate": 5.238282859964591e-05, "loss": 0.0096, "step": 636840 }, { "epoch": 1.65, "learning_rate": 5.2378940383274443e-05, "loss": 0.0085, "step": 636850 }, { "epoch": 1.65, "learning_rate": 5.237505216690298e-05, "loss": 0.0096, "step": 636860 }, { "epoch": 1.65, "learning_rate": 5.237116395053151e-05, "loss": 0.0099, "step": 636870 }, { "epoch": 1.65, "learning_rate": 5.236727573416005e-05, "loss": 0.0082, "step": 636880 }, { "epoch": 1.65, "learning_rate": 5.236338751778858e-05, "loss": 0.0096, "step": 636890 }, { "epoch": 1.65, "learning_rate": 5.235949930141712e-05, "loss": 0.0076, "step": 636900 }, { "epoch": 1.65, "learning_rate": 5.235561108504566e-05, "loss": 0.0057, "step": 636910 }, { "epoch": 1.65, "learning_rate": 5.2351722868674194e-05, "loss": 0.0095, "step": 636920 }, { "epoch": 1.65, "learning_rate": 5.234783465230273e-05, "loss": 0.0089, "step": 636930 }, { "epoch": 1.65, "learning_rate": 5.2343946435931264e-05, "loss": 0.0064, "step": 636940 }, { "epoch": 1.65, "learning_rate": 5.23400582195598e-05, "loss": 0.007, "step": 636950 }, { "epoch": 1.65, "learning_rate": 5.2336170003188334e-05, "loss": 0.0055, "step": 636960 }, { "epoch": 1.65, "learning_rate": 5.233228178681687e-05, "loss": 0.0091, "step": 636970 }, { "epoch": 1.65, "learning_rate": 5.2328393570445403e-05, "loss": 0.007, "step": 636980 }, { "epoch": 1.65, "learning_rate": 5.2324505354073945e-05, "loss": 0.0087, "step": 636990 }, { "epoch": 1.65, "learning_rate": 5.232061713770248e-05, "loss": 0.0057, "step": 637000 }, { "epoch": 1.65, "eval_cer": 0.8816718943106159, "eval_loss": 0.005305544938892126, "eval_runtime": 107.7801, "eval_samples_per_second": 18.556, "eval_steps_per_second": 4.639, "step": 637000 }, { "epoch": 1.65, "learning_rate": 5.2316728921331015e-05, "loss": 0.0079, "step": 637010 }, { "epoch": 1.65, "learning_rate": 5.231284070495954e-05, "loss": 0.0086, "step": 637020 }, { "epoch": 1.65, "learning_rate": 5.230895248858808e-05, "loss": 0.0111, "step": 637030 }, { "epoch": 1.65, "learning_rate": 5.230506427221661e-05, "loss": 0.0082, "step": 637040 }, { "epoch": 1.65, "learning_rate": 5.230117605584515e-05, "loss": 0.0091, "step": 637050 }, { "epoch": 1.65, "learning_rate": 5.229728783947368e-05, "loss": 0.009, "step": 637060 }, { "epoch": 1.65, "learning_rate": 5.229339962310222e-05, "loss": 0.007, "step": 637070 }, { "epoch": 1.65, "learning_rate": 5.228951140673075e-05, "loss": 0.0087, "step": 637080 }, { "epoch": 1.65, "learning_rate": 5.2285623190359294e-05, "loss": 0.0097, "step": 637090 }, { "epoch": 1.65, "learning_rate": 5.228173497398783e-05, "loss": 0.008, "step": 637100 }, { "epoch": 1.65, "learning_rate": 5.2277846757616363e-05, "loss": 0.0085, "step": 637110 }, { "epoch": 1.65, "learning_rate": 5.22739585412449e-05, "loss": 0.0104, "step": 637120 }, { "epoch": 1.65, "learning_rate": 5.227007032487343e-05, "loss": 0.0109, "step": 637130 }, { "epoch": 1.65, "learning_rate": 5.226618210850197e-05, "loss": 0.0112, "step": 637140 }, { "epoch": 1.65, "learning_rate": 5.22622938921305e-05, "loss": 0.0107, "step": 637150 }, { "epoch": 1.65, "learning_rate": 5.225840567575904e-05, "loss": 0.0074, "step": 637160 }, { "epoch": 1.65, "learning_rate": 5.225451745938758e-05, "loss": 0.0085, "step": 637170 }, { "epoch": 1.65, "learning_rate": 5.2250629243016114e-05, "loss": 0.0066, "step": 637180 }, { "epoch": 1.65, "learning_rate": 5.224674102664465e-05, "loss": 0.0101, "step": 637190 }, { "epoch": 1.65, "learning_rate": 5.2242852810273184e-05, "loss": 0.0096, "step": 637200 }, { "epoch": 1.65, "learning_rate": 5.223896459390172e-05, "loss": 0.0089, "step": 637210 }, { "epoch": 1.65, "learning_rate": 5.2235076377530254e-05, "loss": 0.0085, "step": 637220 }, { "epoch": 1.65, "learning_rate": 5.223118816115879e-05, "loss": 0.0113, "step": 637230 }, { "epoch": 1.65, "learning_rate": 5.222729994478732e-05, "loss": 0.0092, "step": 637240 }, { "epoch": 1.65, "learning_rate": 5.2223411728415865e-05, "loss": 0.0066, "step": 637250 }, { "epoch": 1.65, "learning_rate": 5.22195235120444e-05, "loss": 0.0077, "step": 637260 }, { "epoch": 1.65, "learning_rate": 5.221563529567293e-05, "loss": 0.0107, "step": 637270 }, { "epoch": 1.65, "learning_rate": 5.221174707930146e-05, "loss": 0.0096, "step": 637280 }, { "epoch": 1.65, "learning_rate": 5.220785886293e-05, "loss": 0.0089, "step": 637290 }, { "epoch": 1.65, "learning_rate": 5.220397064655853e-05, "loss": 0.0078, "step": 637300 }, { "epoch": 1.65, "learning_rate": 5.220008243018707e-05, "loss": 0.0108, "step": 637310 }, { "epoch": 1.65, "learning_rate": 5.21961942138156e-05, "loss": 0.0069, "step": 637320 }, { "epoch": 1.65, "learning_rate": 5.219230599744414e-05, "loss": 0.0065, "step": 637330 }, { "epoch": 1.65, "learning_rate": 5.218841778107267e-05, "loss": 0.0089, "step": 637340 }, { "epoch": 1.65, "learning_rate": 5.2184529564701214e-05, "loss": 0.0074, "step": 637350 }, { "epoch": 1.65, "learning_rate": 5.218064134832975e-05, "loss": 0.0083, "step": 637360 }, { "epoch": 1.65, "learning_rate": 5.217675313195828e-05, "loss": 0.006, "step": 637370 }, { "epoch": 1.65, "learning_rate": 5.217286491558682e-05, "loss": 0.0094, "step": 637380 }, { "epoch": 1.65, "learning_rate": 5.216897669921535e-05, "loss": 0.0094, "step": 637390 }, { "epoch": 1.65, "learning_rate": 5.216508848284389e-05, "loss": 0.0087, "step": 637400 }, { "epoch": 1.65, "learning_rate": 5.216120026647242e-05, "loss": 0.0071, "step": 637410 }, { "epoch": 1.65, "learning_rate": 5.215731205010096e-05, "loss": 0.0096, "step": 637420 }, { "epoch": 1.65, "learning_rate": 5.21534238337295e-05, "loss": 0.0111, "step": 637430 }, { "epoch": 1.65, "learning_rate": 5.2149535617358034e-05, "loss": 0.0074, "step": 637440 }, { "epoch": 1.65, "learning_rate": 5.214564740098657e-05, "loss": 0.0079, "step": 637450 }, { "epoch": 1.65, "learning_rate": 5.2141759184615104e-05, "loss": 0.0085, "step": 637460 }, { "epoch": 1.65, "learning_rate": 5.213787096824364e-05, "loss": 0.0077, "step": 637470 }, { "epoch": 1.65, "learning_rate": 5.2133982751872174e-05, "loss": 0.0079, "step": 637480 }, { "epoch": 1.65, "learning_rate": 5.213009453550071e-05, "loss": 0.0062, "step": 637490 }, { "epoch": 1.65, "learning_rate": 5.212620631912924e-05, "loss": 0.0083, "step": 637500 }, { "epoch": 1.65, "learning_rate": 5.212231810275777e-05, "loss": 0.0082, "step": 637510 }, { "epoch": 1.65, "learning_rate": 5.2118429886386306e-05, "loss": 0.0082, "step": 637520 }, { "epoch": 1.65, "learning_rate": 5.211454167001485e-05, "loss": 0.0126, "step": 637530 }, { "epoch": 1.65, "learning_rate": 5.211065345364338e-05, "loss": 0.0067, "step": 637540 }, { "epoch": 1.65, "learning_rate": 5.210676523727192e-05, "loss": 0.0061, "step": 637550 }, { "epoch": 1.65, "learning_rate": 5.210287702090045e-05, "loss": 0.0086, "step": 637560 }, { "epoch": 1.65, "learning_rate": 5.209898880452899e-05, "loss": 0.0059, "step": 637570 }, { "epoch": 1.65, "learning_rate": 5.209510058815752e-05, "loss": 0.0083, "step": 637580 }, { "epoch": 1.65, "learning_rate": 5.209121237178606e-05, "loss": 0.0056, "step": 637590 }, { "epoch": 1.65, "learning_rate": 5.208732415541459e-05, "loss": 0.0091, "step": 637600 }, { "epoch": 1.65, "learning_rate": 5.2083435939043134e-05, "loss": 0.0107, "step": 637610 }, { "epoch": 1.65, "learning_rate": 5.207954772267167e-05, "loss": 0.0101, "step": 637620 }, { "epoch": 1.65, "learning_rate": 5.20756595063002e-05, "loss": 0.0087, "step": 637630 }, { "epoch": 1.65, "learning_rate": 5.207177128992874e-05, "loss": 0.0075, "step": 637640 }, { "epoch": 1.65, "learning_rate": 5.206788307355727e-05, "loss": 0.0078, "step": 637650 }, { "epoch": 1.65, "learning_rate": 5.206399485718581e-05, "loss": 0.0071, "step": 637660 }, { "epoch": 1.65, "learning_rate": 5.206010664081434e-05, "loss": 0.0099, "step": 637670 }, { "epoch": 1.65, "learning_rate": 5.205621842444288e-05, "loss": 0.0091, "step": 637680 }, { "epoch": 1.65, "learning_rate": 5.205233020807142e-05, "loss": 0.0078, "step": 637690 }, { "epoch": 1.65, "learning_rate": 5.2048441991699954e-05, "loss": 0.0089, "step": 637700 }, { "epoch": 1.65, "learning_rate": 5.204455377532849e-05, "loss": 0.0074, "step": 637710 }, { "epoch": 1.65, "learning_rate": 5.2040665558957024e-05, "loss": 0.0094, "step": 637720 }, { "epoch": 1.65, "learning_rate": 5.203677734258556e-05, "loss": 0.0101, "step": 637730 }, { "epoch": 1.65, "learning_rate": 5.2032889126214094e-05, "loss": 0.0082, "step": 637740 }, { "epoch": 1.65, "learning_rate": 5.202900090984263e-05, "loss": 0.0073, "step": 637750 }, { "epoch": 1.65, "learning_rate": 5.2025112693471157e-05, "loss": 0.0108, "step": 637760 }, { "epoch": 1.65, "learning_rate": 5.202122447709969e-05, "loss": 0.0075, "step": 637770 }, { "epoch": 1.65, "learning_rate": 5.2017336260728226e-05, "loss": 0.013, "step": 637780 }, { "epoch": 1.65, "learning_rate": 5.201344804435677e-05, "loss": 0.008, "step": 637790 }, { "epoch": 1.65, "learning_rate": 5.20095598279853e-05, "loss": 0.008, "step": 637800 }, { "epoch": 1.65, "learning_rate": 5.200567161161384e-05, "loss": 0.008, "step": 637810 }, { "epoch": 1.65, "learning_rate": 5.200178339524237e-05, "loss": 0.0081, "step": 637820 }, { "epoch": 1.65, "learning_rate": 5.199789517887091e-05, "loss": 0.0094, "step": 637830 }, { "epoch": 1.65, "learning_rate": 5.199400696249944e-05, "loss": 0.0061, "step": 637840 }, { "epoch": 1.65, "learning_rate": 5.199011874612798e-05, "loss": 0.0084, "step": 637850 }, { "epoch": 1.65, "learning_rate": 5.198623052975651e-05, "loss": 0.0109, "step": 637860 }, { "epoch": 1.65, "learning_rate": 5.1982342313385054e-05, "loss": 0.0083, "step": 637870 }, { "epoch": 1.65, "learning_rate": 5.197845409701359e-05, "loss": 0.0097, "step": 637880 }, { "epoch": 1.65, "learning_rate": 5.197456588064212e-05, "loss": 0.0085, "step": 637890 }, { "epoch": 1.65, "learning_rate": 5.197067766427066e-05, "loss": 0.0057, "step": 637900 }, { "epoch": 1.65, "learning_rate": 5.196678944789919e-05, "loss": 0.0068, "step": 637910 }, { "epoch": 1.65, "learning_rate": 5.196290123152773e-05, "loss": 0.0088, "step": 637920 }, { "epoch": 1.65, "learning_rate": 5.195901301515626e-05, "loss": 0.0098, "step": 637930 }, { "epoch": 1.65, "learning_rate": 5.19551247987848e-05, "loss": 0.0075, "step": 637940 }, { "epoch": 1.65, "learning_rate": 5.195123658241334e-05, "loss": 0.0078, "step": 637950 }, { "epoch": 1.65, "learning_rate": 5.1947348366041874e-05, "loss": 0.0079, "step": 637960 }, { "epoch": 1.65, "learning_rate": 5.194346014967041e-05, "loss": 0.0081, "step": 637970 }, { "epoch": 1.65, "learning_rate": 5.1939571933298944e-05, "loss": 0.0074, "step": 637980 }, { "epoch": 1.65, "learning_rate": 5.193568371692748e-05, "loss": 0.0083, "step": 637990 }, { "epoch": 1.65, "learning_rate": 5.1931795500556014e-05, "loss": 0.01, "step": 638000 }, { "epoch": 1.65, "eval_cer": 0.8816718943106159, "eval_loss": 0.005293059162795544, "eval_runtime": 107.9559, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.632, "step": 638000 }, { "epoch": 1.65, "learning_rate": 5.192790728418454e-05, "loss": 0.0094, "step": 638010 }, { "epoch": 1.65, "learning_rate": 5.1924019067813076e-05, "loss": 0.0091, "step": 638020 }, { "epoch": 1.65, "learning_rate": 5.192013085144161e-05, "loss": 0.0063, "step": 638030 }, { "epoch": 1.65, "learning_rate": 5.1916242635070146e-05, "loss": 0.0101, "step": 638040 }, { "epoch": 1.65, "learning_rate": 5.191235441869869e-05, "loss": 0.0066, "step": 638050 }, { "epoch": 1.65, "learning_rate": 5.190846620232722e-05, "loss": 0.0069, "step": 638060 }, { "epoch": 1.65, "learning_rate": 5.190457798595576e-05, "loss": 0.011, "step": 638070 }, { "epoch": 1.65, "learning_rate": 5.190068976958429e-05, "loss": 0.0091, "step": 638080 }, { "epoch": 1.65, "learning_rate": 5.189680155321283e-05, "loss": 0.0091, "step": 638090 }, { "epoch": 1.65, "learning_rate": 5.189291333684136e-05, "loss": 0.0068, "step": 638100 }, { "epoch": 1.65, "learning_rate": 5.18890251204699e-05, "loss": 0.0094, "step": 638110 }, { "epoch": 1.65, "learning_rate": 5.188513690409843e-05, "loss": 0.0064, "step": 638120 }, { "epoch": 1.65, "learning_rate": 5.188124868772697e-05, "loss": 0.011, "step": 638130 }, { "epoch": 1.65, "learning_rate": 5.187736047135551e-05, "loss": 0.0071, "step": 638140 }, { "epoch": 1.65, "learning_rate": 5.187347225498404e-05, "loss": 0.0097, "step": 638150 }, { "epoch": 1.65, "learning_rate": 5.186958403861258e-05, "loss": 0.0101, "step": 638160 }, { "epoch": 1.65, "learning_rate": 5.186569582224111e-05, "loss": 0.0078, "step": 638170 }, { "epoch": 1.65, "learning_rate": 5.186180760586965e-05, "loss": 0.0084, "step": 638180 }, { "epoch": 1.65, "learning_rate": 5.185791938949818e-05, "loss": 0.0065, "step": 638190 }, { "epoch": 1.65, "learning_rate": 5.185403117312672e-05, "loss": 0.01, "step": 638200 }, { "epoch": 1.65, "learning_rate": 5.185014295675525e-05, "loss": 0.0067, "step": 638210 }, { "epoch": 1.65, "learning_rate": 5.1846254740383794e-05, "loss": 0.0074, "step": 638220 }, { "epoch": 1.65, "learning_rate": 5.184236652401233e-05, "loss": 0.0072, "step": 638230 }, { "epoch": 1.65, "learning_rate": 5.1838478307640864e-05, "loss": 0.0067, "step": 638240 }, { "epoch": 1.65, "learning_rate": 5.18345900912694e-05, "loss": 0.01, "step": 638250 }, { "epoch": 1.65, "learning_rate": 5.183070187489793e-05, "loss": 0.009, "step": 638260 }, { "epoch": 1.65, "learning_rate": 5.182681365852646e-05, "loss": 0.0091, "step": 638270 }, { "epoch": 1.65, "learning_rate": 5.1822925442154996e-05, "loss": 0.007, "step": 638280 }, { "epoch": 1.65, "learning_rate": 5.181903722578353e-05, "loss": 0.0109, "step": 638290 }, { "epoch": 1.65, "learning_rate": 5.1815149009412066e-05, "loss": 0.0067, "step": 638300 }, { "epoch": 1.65, "learning_rate": 5.18112607930406e-05, "loss": 0.0089, "step": 638310 }, { "epoch": 1.65, "learning_rate": 5.180737257666914e-05, "loss": 0.0067, "step": 638320 }, { "epoch": 1.65, "learning_rate": 5.180348436029768e-05, "loss": 0.009, "step": 638330 }, { "epoch": 1.65, "learning_rate": 5.179959614392621e-05, "loss": 0.0072, "step": 638340 }, { "epoch": 1.65, "learning_rate": 5.179570792755475e-05, "loss": 0.0096, "step": 638350 }, { "epoch": 1.65, "learning_rate": 5.179181971118328e-05, "loss": 0.0081, "step": 638360 }, { "epoch": 1.65, "learning_rate": 5.178793149481182e-05, "loss": 0.0094, "step": 638370 }, { "epoch": 1.65, "learning_rate": 5.178404327844035e-05, "loss": 0.0099, "step": 638380 }, { "epoch": 1.65, "learning_rate": 5.178015506206889e-05, "loss": 0.0095, "step": 638390 }, { "epoch": 1.65, "learning_rate": 5.177626684569743e-05, "loss": 0.0066, "step": 638400 }, { "epoch": 1.65, "learning_rate": 5.177237862932596e-05, "loss": 0.0101, "step": 638410 }, { "epoch": 1.65, "learning_rate": 5.17684904129545e-05, "loss": 0.0077, "step": 638420 }, { "epoch": 1.65, "learning_rate": 5.176460219658303e-05, "loss": 0.009, "step": 638430 }, { "epoch": 1.65, "learning_rate": 5.176071398021157e-05, "loss": 0.0076, "step": 638440 }, { "epoch": 1.65, "learning_rate": 5.17568257638401e-05, "loss": 0.0085, "step": 638450 }, { "epoch": 1.65, "learning_rate": 5.175293754746864e-05, "loss": 0.0069, "step": 638460 }, { "epoch": 1.66, "learning_rate": 5.174904933109717e-05, "loss": 0.0078, "step": 638470 }, { "epoch": 1.66, "learning_rate": 5.1745161114725714e-05, "loss": 0.0062, "step": 638480 }, { "epoch": 1.66, "learning_rate": 5.174127289835425e-05, "loss": 0.0068, "step": 638490 }, { "epoch": 1.66, "learning_rate": 5.1737384681982784e-05, "loss": 0.0088, "step": 638500 }, { "epoch": 1.66, "learning_rate": 5.173349646561131e-05, "loss": 0.0079, "step": 638510 }, { "epoch": 1.66, "learning_rate": 5.172960824923985e-05, "loss": 0.0069, "step": 638520 }, { "epoch": 1.66, "learning_rate": 5.172572003286838e-05, "loss": 0.0098, "step": 638530 }, { "epoch": 1.66, "learning_rate": 5.1721831816496916e-05, "loss": 0.0057, "step": 638540 }, { "epoch": 1.66, "learning_rate": 5.171794360012545e-05, "loss": 0.0101, "step": 638550 }, { "epoch": 1.66, "learning_rate": 5.1714055383753986e-05, "loss": 0.0111, "step": 638560 }, { "epoch": 1.66, "learning_rate": 5.171016716738252e-05, "loss": 0.0077, "step": 638570 }, { "epoch": 1.66, "learning_rate": 5.170627895101106e-05, "loss": 0.0082, "step": 638580 }, { "epoch": 1.66, "learning_rate": 5.17023907346396e-05, "loss": 0.0118, "step": 638590 }, { "epoch": 1.66, "learning_rate": 5.169850251826813e-05, "loss": 0.0143, "step": 638600 }, { "epoch": 1.66, "learning_rate": 5.169461430189667e-05, "loss": 0.0069, "step": 638610 }, { "epoch": 1.66, "learning_rate": 5.16907260855252e-05, "loss": 0.0069, "step": 638620 }, { "epoch": 1.66, "learning_rate": 5.168683786915374e-05, "loss": 0.008, "step": 638630 }, { "epoch": 1.66, "learning_rate": 5.168294965278227e-05, "loss": 0.0063, "step": 638640 }, { "epoch": 1.66, "learning_rate": 5.167906143641081e-05, "loss": 0.0067, "step": 638650 }, { "epoch": 1.66, "learning_rate": 5.167517322003935e-05, "loss": 0.0081, "step": 638660 }, { "epoch": 1.66, "learning_rate": 5.167128500366788e-05, "loss": 0.0059, "step": 638670 }, { "epoch": 1.66, "learning_rate": 5.166739678729642e-05, "loss": 0.0086, "step": 638680 }, { "epoch": 1.66, "learning_rate": 5.166350857092495e-05, "loss": 0.0094, "step": 638690 }, { "epoch": 1.66, "learning_rate": 5.165962035455349e-05, "loss": 0.009, "step": 638700 }, { "epoch": 1.66, "learning_rate": 5.165573213818202e-05, "loss": 0.0095, "step": 638710 }, { "epoch": 1.66, "learning_rate": 5.165184392181056e-05, "loss": 0.007, "step": 638720 }, { "epoch": 1.66, "learning_rate": 5.164795570543909e-05, "loss": 0.0072, "step": 638730 }, { "epoch": 1.66, "learning_rate": 5.1644067489067634e-05, "loss": 0.0076, "step": 638740 }, { "epoch": 1.66, "learning_rate": 5.164017927269617e-05, "loss": 0.0077, "step": 638750 }, { "epoch": 1.66, "learning_rate": 5.16362910563247e-05, "loss": 0.0129, "step": 638760 }, { "epoch": 1.66, "learning_rate": 5.163240283995323e-05, "loss": 0.0085, "step": 638770 }, { "epoch": 1.66, "learning_rate": 5.1628514623581767e-05, "loss": 0.0098, "step": 638780 }, { "epoch": 1.66, "learning_rate": 5.16246264072103e-05, "loss": 0.0072, "step": 638790 }, { "epoch": 1.66, "learning_rate": 5.1620738190838836e-05, "loss": 0.0076, "step": 638800 }, { "epoch": 1.66, "learning_rate": 5.161684997446737e-05, "loss": 0.0099, "step": 638810 }, { "epoch": 1.66, "learning_rate": 5.1612961758095906e-05, "loss": 0.0073, "step": 638820 }, { "epoch": 1.66, "learning_rate": 5.160907354172444e-05, "loss": 0.0073, "step": 638830 }, { "epoch": 1.66, "learning_rate": 5.160518532535298e-05, "loss": 0.0087, "step": 638840 }, { "epoch": 1.66, "learning_rate": 5.160129710898152e-05, "loss": 0.0086, "step": 638850 }, { "epoch": 1.66, "learning_rate": 5.159740889261005e-05, "loss": 0.0084, "step": 638860 }, { "epoch": 1.66, "learning_rate": 5.159352067623859e-05, "loss": 0.0068, "step": 638870 }, { "epoch": 1.66, "learning_rate": 5.158963245986712e-05, "loss": 0.0067, "step": 638880 }, { "epoch": 1.66, "learning_rate": 5.158574424349566e-05, "loss": 0.0073, "step": 638890 }, { "epoch": 1.66, "learning_rate": 5.158185602712419e-05, "loss": 0.0137, "step": 638900 }, { "epoch": 1.66, "learning_rate": 5.1577967810752727e-05, "loss": 0.0084, "step": 638910 }, { "epoch": 1.66, "learning_rate": 5.157407959438127e-05, "loss": 0.009, "step": 638920 }, { "epoch": 1.66, "learning_rate": 5.15701913780098e-05, "loss": 0.0068, "step": 638930 }, { "epoch": 1.66, "learning_rate": 5.156630316163834e-05, "loss": 0.0098, "step": 638940 }, { "epoch": 1.66, "learning_rate": 5.156241494526687e-05, "loss": 0.0076, "step": 638950 }, { "epoch": 1.66, "learning_rate": 5.155852672889541e-05, "loss": 0.0055, "step": 638960 }, { "epoch": 1.66, "learning_rate": 5.155463851252394e-05, "loss": 0.0105, "step": 638970 }, { "epoch": 1.66, "learning_rate": 5.155075029615248e-05, "loss": 0.0071, "step": 638980 }, { "epoch": 1.66, "learning_rate": 5.154686207978101e-05, "loss": 0.0101, "step": 638990 }, { "epoch": 1.66, "learning_rate": 5.154297386340954e-05, "loss": 0.0095, "step": 639000 }, { "epoch": 1.66, "eval_cer": 0.8816564983043399, "eval_loss": 0.005335902329534292, "eval_runtime": 107.8798, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 639000 }, { "epoch": 1.66, "learning_rate": 5.1539085647038075e-05, "loss": 0.0056, "step": 639010 }, { "epoch": 1.66, "learning_rate": 5.153519743066662e-05, "loss": 0.0079, "step": 639020 }, { "epoch": 1.66, "learning_rate": 5.153130921429515e-05, "loss": 0.0089, "step": 639030 }, { "epoch": 1.66, "learning_rate": 5.1527420997923687e-05, "loss": 0.0075, "step": 639040 }, { "epoch": 1.66, "learning_rate": 5.152353278155222e-05, "loss": 0.0065, "step": 639050 }, { "epoch": 1.66, "learning_rate": 5.1519644565180756e-05, "loss": 0.0092, "step": 639060 }, { "epoch": 1.66, "learning_rate": 5.151575634880929e-05, "loss": 0.0095, "step": 639070 }, { "epoch": 1.66, "learning_rate": 5.1511868132437826e-05, "loss": 0.0112, "step": 639080 }, { "epoch": 1.66, "learning_rate": 5.150797991606636e-05, "loss": 0.0095, "step": 639090 }, { "epoch": 1.66, "learning_rate": 5.15040916996949e-05, "loss": 0.0078, "step": 639100 }, { "epoch": 1.66, "learning_rate": 5.150020348332344e-05, "loss": 0.011, "step": 639110 }, { "epoch": 1.66, "learning_rate": 5.149631526695197e-05, "loss": 0.0076, "step": 639120 }, { "epoch": 1.66, "learning_rate": 5.149242705058051e-05, "loss": 0.0079, "step": 639130 }, { "epoch": 1.66, "learning_rate": 5.148853883420904e-05, "loss": 0.0061, "step": 639140 }, { "epoch": 1.66, "learning_rate": 5.148465061783758e-05, "loss": 0.0065, "step": 639150 }, { "epoch": 1.66, "learning_rate": 5.148076240146611e-05, "loss": 0.0067, "step": 639160 }, { "epoch": 1.66, "learning_rate": 5.1476874185094647e-05, "loss": 0.0093, "step": 639170 }, { "epoch": 1.66, "learning_rate": 5.147298596872319e-05, "loss": 0.0065, "step": 639180 }, { "epoch": 1.66, "learning_rate": 5.146909775235172e-05, "loss": 0.0067, "step": 639190 }, { "epoch": 1.66, "learning_rate": 5.146520953598026e-05, "loss": 0.0074, "step": 639200 }, { "epoch": 1.66, "learning_rate": 5.146132131960879e-05, "loss": 0.0065, "step": 639210 }, { "epoch": 1.66, "learning_rate": 5.145743310323733e-05, "loss": 0.0093, "step": 639220 }, { "epoch": 1.66, "learning_rate": 5.145354488686586e-05, "loss": 0.0079, "step": 639230 }, { "epoch": 1.66, "learning_rate": 5.14496566704944e-05, "loss": 0.0083, "step": 639240 }, { "epoch": 1.66, "learning_rate": 5.1445768454122925e-05, "loss": 0.0073, "step": 639250 }, { "epoch": 1.66, "learning_rate": 5.144188023775146e-05, "loss": 0.0101, "step": 639260 }, { "epoch": 1.66, "learning_rate": 5.1437992021379995e-05, "loss": 0.0081, "step": 639270 }, { "epoch": 1.66, "learning_rate": 5.143410380500854e-05, "loss": 0.008, "step": 639280 }, { "epoch": 1.66, "learning_rate": 5.143021558863707e-05, "loss": 0.0099, "step": 639290 }, { "epoch": 1.66, "learning_rate": 5.1426327372265607e-05, "loss": 0.0084, "step": 639300 }, { "epoch": 1.66, "learning_rate": 5.142243915589414e-05, "loss": 0.0057, "step": 639310 }, { "epoch": 1.66, "learning_rate": 5.1418550939522676e-05, "loss": 0.0068, "step": 639320 }, { "epoch": 1.66, "learning_rate": 5.141466272315121e-05, "loss": 0.012, "step": 639330 }, { "epoch": 1.66, "learning_rate": 5.1410774506779746e-05, "loss": 0.0088, "step": 639340 }, { "epoch": 1.66, "learning_rate": 5.140688629040828e-05, "loss": 0.009, "step": 639350 }, { "epoch": 1.66, "learning_rate": 5.140299807403682e-05, "loss": 0.0092, "step": 639360 }, { "epoch": 1.66, "learning_rate": 5.139910985766536e-05, "loss": 0.0081, "step": 639370 }, { "epoch": 1.66, "learning_rate": 5.139522164129389e-05, "loss": 0.0096, "step": 639380 }, { "epoch": 1.66, "learning_rate": 5.139133342492243e-05, "loss": 0.0085, "step": 639390 }, { "epoch": 1.66, "learning_rate": 5.138744520855096e-05, "loss": 0.0064, "step": 639400 }, { "epoch": 1.66, "learning_rate": 5.13835569921795e-05, "loss": 0.0085, "step": 639410 }, { "epoch": 1.66, "learning_rate": 5.137966877580803e-05, "loss": 0.0106, "step": 639420 }, { "epoch": 1.66, "learning_rate": 5.1375780559436566e-05, "loss": 0.0118, "step": 639430 }, { "epoch": 1.66, "learning_rate": 5.13718923430651e-05, "loss": 0.0062, "step": 639440 }, { "epoch": 1.66, "learning_rate": 5.136800412669364e-05, "loss": 0.0066, "step": 639450 }, { "epoch": 1.66, "learning_rate": 5.136411591032218e-05, "loss": 0.0094, "step": 639460 }, { "epoch": 1.66, "learning_rate": 5.136022769395071e-05, "loss": 0.0073, "step": 639470 }, { "epoch": 1.66, "learning_rate": 5.135633947757925e-05, "loss": 0.0073, "step": 639480 }, { "epoch": 1.66, "learning_rate": 5.135245126120778e-05, "loss": 0.0093, "step": 639490 }, { "epoch": 1.66, "learning_rate": 5.134856304483631e-05, "loss": 0.0068, "step": 639500 }, { "epoch": 1.66, "learning_rate": 5.1344674828464845e-05, "loss": 0.0087, "step": 639510 }, { "epoch": 1.66, "learning_rate": 5.134078661209338e-05, "loss": 0.0064, "step": 639520 }, { "epoch": 1.66, "learning_rate": 5.1336898395721915e-05, "loss": 0.0092, "step": 639530 }, { "epoch": 1.66, "learning_rate": 5.133301017935046e-05, "loss": 0.0077, "step": 639540 }, { "epoch": 1.66, "learning_rate": 5.132912196297899e-05, "loss": 0.0098, "step": 639550 }, { "epoch": 1.66, "learning_rate": 5.1325233746607526e-05, "loss": 0.0072, "step": 639560 }, { "epoch": 1.66, "learning_rate": 5.132134553023606e-05, "loss": 0.0072, "step": 639570 }, { "epoch": 1.66, "learning_rate": 5.1317457313864596e-05, "loss": 0.0096, "step": 639580 }, { "epoch": 1.66, "learning_rate": 5.131356909749313e-05, "loss": 0.0048, "step": 639590 }, { "epoch": 1.66, "learning_rate": 5.1309680881121666e-05, "loss": 0.0069, "step": 639600 }, { "epoch": 1.66, "learning_rate": 5.13057926647502e-05, "loss": 0.0092, "step": 639610 }, { "epoch": 1.66, "learning_rate": 5.1301904448378736e-05, "loss": 0.0125, "step": 639620 }, { "epoch": 1.66, "learning_rate": 5.129801623200728e-05, "loss": 0.008, "step": 639630 }, { "epoch": 1.66, "learning_rate": 5.129412801563581e-05, "loss": 0.0072, "step": 639640 }, { "epoch": 1.66, "learning_rate": 5.129023979926435e-05, "loss": 0.0103, "step": 639650 }, { "epoch": 1.66, "learning_rate": 5.128635158289288e-05, "loss": 0.0077, "step": 639660 }, { "epoch": 1.66, "learning_rate": 5.128246336652142e-05, "loss": 0.01, "step": 639670 }, { "epoch": 1.66, "learning_rate": 5.127857515014995e-05, "loss": 0.0075, "step": 639680 }, { "epoch": 1.66, "learning_rate": 5.1274686933778486e-05, "loss": 0.009, "step": 639690 }, { "epoch": 1.66, "learning_rate": 5.127079871740702e-05, "loss": 0.0087, "step": 639700 }, { "epoch": 1.66, "learning_rate": 5.126691050103556e-05, "loss": 0.0072, "step": 639710 }, { "epoch": 1.66, "learning_rate": 5.12630222846641e-05, "loss": 0.0075, "step": 639720 }, { "epoch": 1.66, "learning_rate": 5.125913406829263e-05, "loss": 0.007, "step": 639730 }, { "epoch": 1.66, "learning_rate": 5.125524585192117e-05, "loss": 0.0083, "step": 639740 }, { "epoch": 1.66, "learning_rate": 5.1251357635549696e-05, "loss": 0.0079, "step": 639750 }, { "epoch": 1.66, "learning_rate": 5.124746941917823e-05, "loss": 0.0042, "step": 639760 }, { "epoch": 1.66, "learning_rate": 5.1243581202806765e-05, "loss": 0.0068, "step": 639770 }, { "epoch": 1.66, "learning_rate": 5.12396929864353e-05, "loss": 0.009, "step": 639780 }, { "epoch": 1.66, "learning_rate": 5.1235804770063835e-05, "loss": 0.0104, "step": 639790 }, { "epoch": 1.66, "learning_rate": 5.123191655369237e-05, "loss": 0.0099, "step": 639800 }, { "epoch": 1.66, "learning_rate": 5.122802833732091e-05, "loss": 0.007, "step": 639810 }, { "epoch": 1.66, "learning_rate": 5.1224140120949446e-05, "loss": 0.0111, "step": 639820 }, { "epoch": 1.66, "learning_rate": 5.122025190457798e-05, "loss": 0.0068, "step": 639830 }, { "epoch": 1.66, "learning_rate": 5.1216363688206516e-05, "loss": 0.0097, "step": 639840 }, { "epoch": 1.66, "learning_rate": 5.121247547183505e-05, "loss": 0.0075, "step": 639850 }, { "epoch": 1.66, "learning_rate": 5.1208587255463586e-05, "loss": 0.0094, "step": 639860 }, { "epoch": 1.66, "learning_rate": 5.120469903909212e-05, "loss": 0.0103, "step": 639870 }, { "epoch": 1.66, "learning_rate": 5.1200810822720656e-05, "loss": 0.0095, "step": 639880 }, { "epoch": 1.66, "learning_rate": 5.11969226063492e-05, "loss": 0.0069, "step": 639890 }, { "epoch": 1.66, "learning_rate": 5.119303438997773e-05, "loss": 0.0076, "step": 639900 }, { "epoch": 1.66, "learning_rate": 5.118914617360627e-05, "loss": 0.0105, "step": 639910 }, { "epoch": 1.66, "learning_rate": 5.11852579572348e-05, "loss": 0.0092, "step": 639920 }, { "epoch": 1.66, "learning_rate": 5.118136974086334e-05, "loss": 0.0116, "step": 639930 }, { "epoch": 1.66, "learning_rate": 5.117748152449187e-05, "loss": 0.0077, "step": 639940 }, { "epoch": 1.66, "learning_rate": 5.1173593308120406e-05, "loss": 0.013, "step": 639950 }, { "epoch": 1.66, "learning_rate": 5.116970509174894e-05, "loss": 0.0077, "step": 639960 }, { "epoch": 1.66, "learning_rate": 5.116581687537748e-05, "loss": 0.0085, "step": 639970 }, { "epoch": 1.66, "learning_rate": 5.116192865900602e-05, "loss": 0.0098, "step": 639980 }, { "epoch": 1.66, "learning_rate": 5.115804044263455e-05, "loss": 0.0072, "step": 639990 }, { "epoch": 1.66, "learning_rate": 5.115415222626308e-05, "loss": 0.008, "step": 640000 }, { "epoch": 1.66, "eval_cer": 0.8816830914060892, "eval_loss": 0.005218719597905874, "eval_runtime": 107.9407, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 640000 }, { "epoch": 1.66, "learning_rate": 5.1150264009891616e-05, "loss": 0.0117, "step": 640010 }, { "epoch": 1.66, "learning_rate": 5.114637579352015e-05, "loss": 0.0093, "step": 640020 }, { "epoch": 1.66, "learning_rate": 5.1142487577148685e-05, "loss": 0.0089, "step": 640030 }, { "epoch": 1.66, "learning_rate": 5.113859936077722e-05, "loss": 0.0073, "step": 640040 }, { "epoch": 1.66, "learning_rate": 5.1134711144405755e-05, "loss": 0.0078, "step": 640050 }, { "epoch": 1.66, "learning_rate": 5.113082292803429e-05, "loss": 0.0091, "step": 640060 }, { "epoch": 1.66, "learning_rate": 5.112693471166283e-05, "loss": 0.0061, "step": 640070 }, { "epoch": 1.66, "learning_rate": 5.1123046495291366e-05, "loss": 0.0078, "step": 640080 }, { "epoch": 1.66, "learning_rate": 5.11191582789199e-05, "loss": 0.007, "step": 640090 }, { "epoch": 1.66, "learning_rate": 5.1115270062548436e-05, "loss": 0.011, "step": 640100 }, { "epoch": 1.66, "learning_rate": 5.111138184617697e-05, "loss": 0.0079, "step": 640110 }, { "epoch": 1.66, "learning_rate": 5.1107493629805506e-05, "loss": 0.0063, "step": 640120 }, { "epoch": 1.66, "learning_rate": 5.110360541343404e-05, "loss": 0.0076, "step": 640130 }, { "epoch": 1.66, "learning_rate": 5.1099717197062576e-05, "loss": 0.0075, "step": 640140 }, { "epoch": 1.66, "learning_rate": 5.109582898069112e-05, "loss": 0.0055, "step": 640150 }, { "epoch": 1.66, "learning_rate": 5.109194076431965e-05, "loss": 0.0074, "step": 640160 }, { "epoch": 1.66, "learning_rate": 5.108805254794819e-05, "loss": 0.0072, "step": 640170 }, { "epoch": 1.66, "learning_rate": 5.108416433157672e-05, "loss": 0.0078, "step": 640180 }, { "epoch": 1.66, "learning_rate": 5.1080276115205257e-05, "loss": 0.0106, "step": 640190 }, { "epoch": 1.66, "learning_rate": 5.107638789883379e-05, "loss": 0.0065, "step": 640200 }, { "epoch": 1.66, "learning_rate": 5.1072499682462326e-05, "loss": 0.01, "step": 640210 }, { "epoch": 1.66, "learning_rate": 5.106861146609086e-05, "loss": 0.0101, "step": 640220 }, { "epoch": 1.66, "learning_rate": 5.10647232497194e-05, "loss": 0.0089, "step": 640230 }, { "epoch": 1.66, "learning_rate": 5.1060835033347924e-05, "loss": 0.0092, "step": 640240 }, { "epoch": 1.66, "learning_rate": 5.1056946816976466e-05, "loss": 0.0071, "step": 640250 }, { "epoch": 1.66, "learning_rate": 5.1053058600605e-05, "loss": 0.0084, "step": 640260 }, { "epoch": 1.66, "learning_rate": 5.1049170384233536e-05, "loss": 0.0083, "step": 640270 }, { "epoch": 1.66, "learning_rate": 5.104528216786207e-05, "loss": 0.0112, "step": 640280 }, { "epoch": 1.66, "learning_rate": 5.1041393951490605e-05, "loss": 0.0114, "step": 640290 }, { "epoch": 1.66, "learning_rate": 5.103750573511914e-05, "loss": 0.0088, "step": 640300 }, { "epoch": 1.66, "learning_rate": 5.1033617518747675e-05, "loss": 0.0112, "step": 640310 }, { "epoch": 1.66, "learning_rate": 5.102972930237621e-05, "loss": 0.0069, "step": 640320 }, { "epoch": 1.66, "learning_rate": 5.102584108600475e-05, "loss": 0.0083, "step": 640330 }, { "epoch": 1.66, "learning_rate": 5.1021952869633286e-05, "loss": 0.0101, "step": 640340 }, { "epoch": 1.66, "learning_rate": 5.101806465326182e-05, "loss": 0.0082, "step": 640350 }, { "epoch": 1.66, "learning_rate": 5.1014176436890356e-05, "loss": 0.0089, "step": 640360 }, { "epoch": 1.66, "learning_rate": 5.101028822051889e-05, "loss": 0.0114, "step": 640370 }, { "epoch": 1.66, "learning_rate": 5.1006400004147426e-05, "loss": 0.0085, "step": 640380 }, { "epoch": 1.66, "learning_rate": 5.100251178777596e-05, "loss": 0.0129, "step": 640390 }, { "epoch": 1.66, "learning_rate": 5.0998623571404495e-05, "loss": 0.0101, "step": 640400 }, { "epoch": 1.66, "learning_rate": 5.099473535503304e-05, "loss": 0.0124, "step": 640410 }, { "epoch": 1.66, "learning_rate": 5.099084713866157e-05, "loss": 0.0064, "step": 640420 }, { "epoch": 1.66, "learning_rate": 5.098695892229011e-05, "loss": 0.0084, "step": 640430 }, { "epoch": 1.66, "learning_rate": 5.098307070591864e-05, "loss": 0.0068, "step": 640440 }, { "epoch": 1.66, "learning_rate": 5.0979182489547177e-05, "loss": 0.0079, "step": 640450 }, { "epoch": 1.66, "learning_rate": 5.097529427317571e-05, "loss": 0.0069, "step": 640460 }, { "epoch": 1.66, "learning_rate": 5.0971406056804246e-05, "loss": 0.0082, "step": 640470 }, { "epoch": 1.66, "learning_rate": 5.096751784043278e-05, "loss": 0.0062, "step": 640480 }, { "epoch": 1.66, "learning_rate": 5.096362962406131e-05, "loss": 0.0109, "step": 640490 }, { "epoch": 1.66, "learning_rate": 5.0959741407689844e-05, "loss": 0.0134, "step": 640500 }, { "epoch": 1.66, "learning_rate": 5.0955853191318386e-05, "loss": 0.009, "step": 640510 }, { "epoch": 1.66, "learning_rate": 5.095196497494692e-05, "loss": 0.0061, "step": 640520 }, { "epoch": 1.66, "learning_rate": 5.0948076758575455e-05, "loss": 0.0109, "step": 640530 }, { "epoch": 1.66, "learning_rate": 5.094418854220399e-05, "loss": 0.0103, "step": 640540 }, { "epoch": 1.66, "learning_rate": 5.0940300325832525e-05, "loss": 0.0069, "step": 640550 }, { "epoch": 1.66, "learning_rate": 5.093641210946106e-05, "loss": 0.0064, "step": 640560 }, { "epoch": 1.66, "learning_rate": 5.0932523893089595e-05, "loss": 0.0067, "step": 640570 }, { "epoch": 1.66, "learning_rate": 5.092863567671813e-05, "loss": 0.0088, "step": 640580 }, { "epoch": 1.66, "learning_rate": 5.092474746034667e-05, "loss": 0.011, "step": 640590 }, { "epoch": 1.66, "learning_rate": 5.0920859243975206e-05, "loss": 0.0072, "step": 640600 }, { "epoch": 1.66, "learning_rate": 5.091697102760374e-05, "loss": 0.0089, "step": 640610 }, { "epoch": 1.66, "learning_rate": 5.0913082811232276e-05, "loss": 0.0065, "step": 640620 }, { "epoch": 1.66, "learning_rate": 5.090919459486081e-05, "loss": 0.0067, "step": 640630 }, { "epoch": 1.66, "learning_rate": 5.0905306378489346e-05, "loss": 0.0073, "step": 640640 }, { "epoch": 1.66, "learning_rate": 5.090141816211788e-05, "loss": 0.0075, "step": 640650 }, { "epoch": 1.66, "learning_rate": 5.0897529945746415e-05, "loss": 0.0068, "step": 640660 }, { "epoch": 1.66, "learning_rate": 5.089364172937496e-05, "loss": 0.0091, "step": 640670 }, { "epoch": 1.66, "learning_rate": 5.088975351300349e-05, "loss": 0.009, "step": 640680 }, { "epoch": 1.66, "learning_rate": 5.088586529663203e-05, "loss": 0.0082, "step": 640690 }, { "epoch": 1.66, "learning_rate": 5.088197708026056e-05, "loss": 0.0081, "step": 640700 }, { "epoch": 1.66, "learning_rate": 5.0878088863889097e-05, "loss": 0.006, "step": 640710 }, { "epoch": 1.66, "learning_rate": 5.087420064751763e-05, "loss": 0.0098, "step": 640720 }, { "epoch": 1.66, "learning_rate": 5.0870312431146166e-05, "loss": 0.0089, "step": 640730 }, { "epoch": 1.66, "learning_rate": 5.0866424214774694e-05, "loss": 0.0115, "step": 640740 }, { "epoch": 1.66, "learning_rate": 5.086253599840323e-05, "loss": 0.0078, "step": 640750 }, { "epoch": 1.66, "learning_rate": 5.0858647782031764e-05, "loss": 0.0092, "step": 640760 }, { "epoch": 1.66, "learning_rate": 5.0854759565660306e-05, "loss": 0.0066, "step": 640770 }, { "epoch": 1.66, "learning_rate": 5.085087134928884e-05, "loss": 0.0098, "step": 640780 }, { "epoch": 1.66, "learning_rate": 5.0846983132917375e-05, "loss": 0.0084, "step": 640790 }, { "epoch": 1.66, "learning_rate": 5.084309491654591e-05, "loss": 0.0051, "step": 640800 }, { "epoch": 1.66, "learning_rate": 5.0839206700174445e-05, "loss": 0.0105, "step": 640810 }, { "epoch": 1.66, "learning_rate": 5.083531848380298e-05, "loss": 0.0091, "step": 640820 }, { "epoch": 1.66, "learning_rate": 5.0831430267431515e-05, "loss": 0.0119, "step": 640830 }, { "epoch": 1.66, "learning_rate": 5.082754205106005e-05, "loss": 0.0094, "step": 640840 }, { "epoch": 1.66, "learning_rate": 5.082365383468859e-05, "loss": 0.008, "step": 640850 }, { "epoch": 1.66, "learning_rate": 5.0819765618317126e-05, "loss": 0.0085, "step": 640860 }, { "epoch": 1.66, "learning_rate": 5.081587740194566e-05, "loss": 0.0086, "step": 640870 }, { "epoch": 1.66, "learning_rate": 5.0811989185574196e-05, "loss": 0.0129, "step": 640880 }, { "epoch": 1.66, "learning_rate": 5.080810096920273e-05, "loss": 0.0087, "step": 640890 }, { "epoch": 1.66, "learning_rate": 5.0804212752831266e-05, "loss": 0.0064, "step": 640900 }, { "epoch": 1.66, "learning_rate": 5.08003245364598e-05, "loss": 0.0064, "step": 640910 }, { "epoch": 1.66, "learning_rate": 5.0796436320088335e-05, "loss": 0.0071, "step": 640920 }, { "epoch": 1.66, "learning_rate": 5.079254810371687e-05, "loss": 0.0069, "step": 640930 }, { "epoch": 1.66, "learning_rate": 5.078865988734541e-05, "loss": 0.0095, "step": 640940 }, { "epoch": 1.66, "learning_rate": 5.078477167097395e-05, "loss": 0.01, "step": 640950 }, { "epoch": 1.66, "learning_rate": 5.078088345460248e-05, "loss": 0.0091, "step": 640960 }, { "epoch": 1.66, "learning_rate": 5.0776995238231016e-05, "loss": 0.0103, "step": 640970 }, { "epoch": 1.66, "learning_rate": 5.077310702185955e-05, "loss": 0.0057, "step": 640980 }, { "epoch": 1.66, "learning_rate": 5.076921880548808e-05, "loss": 0.0085, "step": 640990 }, { "epoch": 1.66, "learning_rate": 5.0765330589116614e-05, "loss": 0.0097, "step": 641000 }, { "epoch": 1.66, "eval_cer": 0.8816746935844841, "eval_loss": 0.005241747945547104, "eval_runtime": 107.7049, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 641000 }, { "epoch": 1.66, "learning_rate": 5.076144237274515e-05, "loss": 0.0089, "step": 641010 }, { "epoch": 1.66, "learning_rate": 5.0757554156373684e-05, "loss": 0.0068, "step": 641020 }, { "epoch": 1.66, "learning_rate": 5.075366594000222e-05, "loss": 0.0067, "step": 641030 }, { "epoch": 1.66, "learning_rate": 5.074977772363076e-05, "loss": 0.0076, "step": 641040 }, { "epoch": 1.66, "learning_rate": 5.0745889507259295e-05, "loss": 0.0081, "step": 641050 }, { "epoch": 1.66, "learning_rate": 5.074200129088783e-05, "loss": 0.0069, "step": 641060 }, { "epoch": 1.66, "learning_rate": 5.0738113074516365e-05, "loss": 0.0076, "step": 641070 }, { "epoch": 1.66, "learning_rate": 5.07342248581449e-05, "loss": 0.0095, "step": 641080 }, { "epoch": 1.66, "learning_rate": 5.0730336641773435e-05, "loss": 0.0071, "step": 641090 }, { "epoch": 1.66, "learning_rate": 5.072644842540197e-05, "loss": 0.0086, "step": 641100 }, { "epoch": 1.66, "learning_rate": 5.0722560209030505e-05, "loss": 0.0108, "step": 641110 }, { "epoch": 1.66, "learning_rate": 5.0718671992659046e-05, "loss": 0.0111, "step": 641120 }, { "epoch": 1.66, "learning_rate": 5.071478377628758e-05, "loss": 0.0088, "step": 641130 }, { "epoch": 1.66, "learning_rate": 5.0710895559916116e-05, "loss": 0.0073, "step": 641140 }, { "epoch": 1.66, "learning_rate": 5.070700734354465e-05, "loss": 0.0096, "step": 641150 }, { "epoch": 1.66, "learning_rate": 5.0703119127173186e-05, "loss": 0.0077, "step": 641160 }, { "epoch": 1.66, "learning_rate": 5.069923091080172e-05, "loss": 0.0072, "step": 641170 }, { "epoch": 1.66, "learning_rate": 5.0695342694430255e-05, "loss": 0.0106, "step": 641180 }, { "epoch": 1.66, "learning_rate": 5.069145447805879e-05, "loss": 0.0117, "step": 641190 }, { "epoch": 1.66, "learning_rate": 5.068756626168733e-05, "loss": 0.0076, "step": 641200 }, { "epoch": 1.66, "learning_rate": 5.068367804531587e-05, "loss": 0.0066, "step": 641210 }, { "epoch": 1.66, "learning_rate": 5.06797898289444e-05, "loss": 0.0082, "step": 641220 }, { "epoch": 1.66, "learning_rate": 5.0675901612572936e-05, "loss": 0.0092, "step": 641230 }, { "epoch": 1.66, "learning_rate": 5.0672013396201465e-05, "loss": 0.0096, "step": 641240 }, { "epoch": 1.66, "learning_rate": 5.066812517983e-05, "loss": 0.0099, "step": 641250 }, { "epoch": 1.66, "learning_rate": 5.0664236963458534e-05, "loss": 0.0086, "step": 641260 }, { "epoch": 1.66, "learning_rate": 5.066034874708707e-05, "loss": 0.0079, "step": 641270 }, { "epoch": 1.66, "learning_rate": 5.0656460530715604e-05, "loss": 0.0078, "step": 641280 }, { "epoch": 1.66, "learning_rate": 5.065257231434414e-05, "loss": 0.0082, "step": 641290 }, { "epoch": 1.66, "learning_rate": 5.064868409797268e-05, "loss": 0.0074, "step": 641300 }, { "epoch": 1.66, "learning_rate": 5.0644795881601215e-05, "loss": 0.0094, "step": 641310 }, { "epoch": 1.66, "learning_rate": 5.064090766522975e-05, "loss": 0.0081, "step": 641320 }, { "epoch": 1.66, "learning_rate": 5.0637019448858285e-05, "loss": 0.009, "step": 641330 }, { "epoch": 1.66, "learning_rate": 5.063313123248682e-05, "loss": 0.0102, "step": 641340 }, { "epoch": 1.66, "learning_rate": 5.0629243016115355e-05, "loss": 0.0084, "step": 641350 }, { "epoch": 1.66, "learning_rate": 5.062535479974389e-05, "loss": 0.007, "step": 641360 }, { "epoch": 1.66, "learning_rate": 5.0621466583372424e-05, "loss": 0.007, "step": 641370 }, { "epoch": 1.66, "learning_rate": 5.0617578367000966e-05, "loss": 0.0084, "step": 641380 }, { "epoch": 1.66, "learning_rate": 5.06136901506295e-05, "loss": 0.011, "step": 641390 }, { "epoch": 1.66, "learning_rate": 5.0609801934258036e-05, "loss": 0.0075, "step": 641400 }, { "epoch": 1.66, "learning_rate": 5.060591371788657e-05, "loss": 0.0072, "step": 641410 }, { "epoch": 1.66, "learning_rate": 5.0602025501515106e-05, "loss": 0.0097, "step": 641420 }, { "epoch": 1.66, "learning_rate": 5.059813728514364e-05, "loss": 0.0058, "step": 641430 }, { "epoch": 1.66, "learning_rate": 5.0594249068772175e-05, "loss": 0.0142, "step": 641440 }, { "epoch": 1.66, "learning_rate": 5.059036085240071e-05, "loss": 0.0063, "step": 641450 }, { "epoch": 1.66, "learning_rate": 5.058647263602925e-05, "loss": 0.0084, "step": 641460 }, { "epoch": 1.66, "learning_rate": 5.058258441965779e-05, "loss": 0.0083, "step": 641470 }, { "epoch": 1.66, "learning_rate": 5.0578696203286315e-05, "loss": 0.01, "step": 641480 }, { "epoch": 1.66, "learning_rate": 5.057480798691485e-05, "loss": 0.0073, "step": 641490 }, { "epoch": 1.66, "learning_rate": 5.0570919770543384e-05, "loss": 0.0076, "step": 641500 }, { "epoch": 1.66, "learning_rate": 5.056703155417192e-05, "loss": 0.0098, "step": 641510 }, { "epoch": 1.66, "learning_rate": 5.0563143337800454e-05, "loss": 0.0086, "step": 641520 }, { "epoch": 1.66, "learning_rate": 5.055925512142899e-05, "loss": 0.0095, "step": 641530 }, { "epoch": 1.66, "learning_rate": 5.0555366905057524e-05, "loss": 0.0082, "step": 641540 }, { "epoch": 1.66, "learning_rate": 5.055147868868606e-05, "loss": 0.008, "step": 641550 }, { "epoch": 1.66, "learning_rate": 5.05475904723146e-05, "loss": 0.0061, "step": 641560 }, { "epoch": 1.66, "learning_rate": 5.0543702255943135e-05, "loss": 0.0095, "step": 641570 }, { "epoch": 1.66, "learning_rate": 5.053981403957167e-05, "loss": 0.0083, "step": 641580 }, { "epoch": 1.66, "learning_rate": 5.0535925823200205e-05, "loss": 0.0065, "step": 641590 }, { "epoch": 1.66, "learning_rate": 5.053203760682874e-05, "loss": 0.0087, "step": 641600 }, { "epoch": 1.66, "learning_rate": 5.0528149390457275e-05, "loss": 0.0067, "step": 641610 }, { "epoch": 1.66, "learning_rate": 5.052426117408581e-05, "loss": 0.0113, "step": 641620 }, { "epoch": 1.66, "learning_rate": 5.0520372957714344e-05, "loss": 0.0102, "step": 641630 }, { "epoch": 1.66, "learning_rate": 5.0516484741342886e-05, "loss": 0.0072, "step": 641640 }, { "epoch": 1.66, "learning_rate": 5.051259652497142e-05, "loss": 0.0094, "step": 641650 }, { "epoch": 1.66, "learning_rate": 5.0508708308599956e-05, "loss": 0.0094, "step": 641660 }, { "epoch": 1.66, "learning_rate": 5.050482009222849e-05, "loss": 0.006, "step": 641670 }, { "epoch": 1.66, "learning_rate": 5.0500931875857026e-05, "loss": 0.0073, "step": 641680 }, { "epoch": 1.66, "learning_rate": 5.049704365948556e-05, "loss": 0.0079, "step": 641690 }, { "epoch": 1.66, "learning_rate": 5.0493155443114095e-05, "loss": 0.0133, "step": 641700 }, { "epoch": 1.66, "learning_rate": 5.048926722674263e-05, "loss": 0.0065, "step": 641710 }, { "epoch": 1.66, "learning_rate": 5.048537901037117e-05, "loss": 0.0087, "step": 641720 }, { "epoch": 1.66, "learning_rate": 5.048149079399969e-05, "loss": 0.0079, "step": 641730 }, { "epoch": 1.66, "learning_rate": 5.0477602577628235e-05, "loss": 0.0109, "step": 641740 }, { "epoch": 1.66, "learning_rate": 5.047371436125677e-05, "loss": 0.0125, "step": 641750 }, { "epoch": 1.66, "learning_rate": 5.0469826144885304e-05, "loss": 0.0116, "step": 641760 }, { "epoch": 1.66, "learning_rate": 5.046593792851384e-05, "loss": 0.0076, "step": 641770 }, { "epoch": 1.66, "learning_rate": 5.0462049712142374e-05, "loss": 0.0071, "step": 641780 }, { "epoch": 1.66, "learning_rate": 5.045816149577091e-05, "loss": 0.0097, "step": 641790 }, { "epoch": 1.66, "learning_rate": 5.0454273279399444e-05, "loss": 0.0125, "step": 641800 }, { "epoch": 1.66, "learning_rate": 5.045038506302798e-05, "loss": 0.0068, "step": 641810 }, { "epoch": 1.66, "learning_rate": 5.044649684665652e-05, "loss": 0.0093, "step": 641820 }, { "epoch": 1.66, "learning_rate": 5.0442608630285055e-05, "loss": 0.0088, "step": 641830 }, { "epoch": 1.66, "learning_rate": 5.043872041391359e-05, "loss": 0.0097, "step": 641840 }, { "epoch": 1.66, "learning_rate": 5.0434832197542125e-05, "loss": 0.0081, "step": 641850 }, { "epoch": 1.66, "learning_rate": 5.043094398117066e-05, "loss": 0.0073, "step": 641860 }, { "epoch": 1.66, "learning_rate": 5.0427055764799195e-05, "loss": 0.0079, "step": 641870 }, { "epoch": 1.66, "learning_rate": 5.042316754842773e-05, "loss": 0.0069, "step": 641880 }, { "epoch": 1.66, "learning_rate": 5.0419279332056264e-05, "loss": 0.0106, "step": 641890 }, { "epoch": 1.66, "learning_rate": 5.0415391115684806e-05, "loss": 0.0072, "step": 641900 }, { "epoch": 1.66, "learning_rate": 5.041150289931334e-05, "loss": 0.0096, "step": 641910 }, { "epoch": 1.66, "learning_rate": 5.0407614682941876e-05, "loss": 0.0075, "step": 641920 }, { "epoch": 1.66, "learning_rate": 5.040372646657041e-05, "loss": 0.0094, "step": 641930 }, { "epoch": 1.66, "learning_rate": 5.0399838250198945e-05, "loss": 0.0093, "step": 641940 }, { "epoch": 1.66, "learning_rate": 5.039595003382748e-05, "loss": 0.0104, "step": 641950 }, { "epoch": 1.66, "learning_rate": 5.0392061817456015e-05, "loss": 0.0093, "step": 641960 }, { "epoch": 1.66, "learning_rate": 5.038817360108455e-05, "loss": 0.0069, "step": 641970 }, { "epoch": 1.66, "learning_rate": 5.038428538471308e-05, "loss": 0.0076, "step": 641980 }, { "epoch": 1.66, "learning_rate": 5.038039716834161e-05, "loss": 0.006, "step": 641990 }, { "epoch": 1.66, "learning_rate": 5.0376508951970155e-05, "loss": 0.0082, "step": 642000 }, { "epoch": 1.66, "eval_cer": 0.88167329394755, "eval_loss": 0.005268983077257872, "eval_runtime": 107.7603, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 642000 }, { "epoch": 1.66, "learning_rate": 5.037262073559869e-05, "loss": 0.0058, "step": 642010 }, { "epoch": 1.66, "learning_rate": 5.0368732519227224e-05, "loss": 0.0084, "step": 642020 }, { "epoch": 1.66, "learning_rate": 5.036484430285576e-05, "loss": 0.0084, "step": 642030 }, { "epoch": 1.66, "learning_rate": 5.0360956086484294e-05, "loss": 0.0079, "step": 642040 }, { "epoch": 1.66, "learning_rate": 5.035706787011283e-05, "loss": 0.0053, "step": 642050 }, { "epoch": 1.66, "learning_rate": 5.0353179653741364e-05, "loss": 0.0094, "step": 642060 }, { "epoch": 1.66, "learning_rate": 5.03492914373699e-05, "loss": 0.0087, "step": 642070 }, { "epoch": 1.66, "learning_rate": 5.034540322099844e-05, "loss": 0.0054, "step": 642080 }, { "epoch": 1.66, "learning_rate": 5.0341515004626975e-05, "loss": 0.0093, "step": 642090 }, { "epoch": 1.66, "learning_rate": 5.033762678825551e-05, "loss": 0.01, "step": 642100 }, { "epoch": 1.66, "learning_rate": 5.0333738571884045e-05, "loss": 0.0093, "step": 642110 }, { "epoch": 1.66, "learning_rate": 5.032985035551258e-05, "loss": 0.0092, "step": 642120 }, { "epoch": 1.66, "learning_rate": 5.0325962139141115e-05, "loss": 0.0097, "step": 642130 }, { "epoch": 1.66, "learning_rate": 5.032207392276965e-05, "loss": 0.0107, "step": 642140 }, { "epoch": 1.66, "learning_rate": 5.0318185706398184e-05, "loss": 0.0076, "step": 642150 }, { "epoch": 1.66, "learning_rate": 5.0314297490026726e-05, "loss": 0.0069, "step": 642160 }, { "epoch": 1.66, "learning_rate": 5.031040927365526e-05, "loss": 0.008, "step": 642170 }, { "epoch": 1.66, "learning_rate": 5.0306521057283796e-05, "loss": 0.009, "step": 642180 }, { "epoch": 1.66, "learning_rate": 5.030263284091233e-05, "loss": 0.0072, "step": 642190 }, { "epoch": 1.66, "learning_rate": 5.0298744624540865e-05, "loss": 0.0061, "step": 642200 }, { "epoch": 1.66, "learning_rate": 5.02948564081694e-05, "loss": 0.0086, "step": 642210 }, { "epoch": 1.66, "learning_rate": 5.0290968191797935e-05, "loss": 0.0089, "step": 642220 }, { "epoch": 1.66, "learning_rate": 5.028707997542646e-05, "loss": 0.0101, "step": 642230 }, { "epoch": 1.66, "learning_rate": 5.0283191759055e-05, "loss": 0.0102, "step": 642240 }, { "epoch": 1.66, "learning_rate": 5.027930354268353e-05, "loss": 0.0075, "step": 642250 }, { "epoch": 1.66, "learning_rate": 5.0275415326312075e-05, "loss": 0.0084, "step": 642260 }, { "epoch": 1.66, "learning_rate": 5.027152710994061e-05, "loss": 0.0081, "step": 642270 }, { "epoch": 1.66, "learning_rate": 5.0267638893569144e-05, "loss": 0.0093, "step": 642280 }, { "epoch": 1.66, "learning_rate": 5.026375067719768e-05, "loss": 0.0071, "step": 642290 }, { "epoch": 1.66, "learning_rate": 5.0259862460826214e-05, "loss": 0.0099, "step": 642300 }, { "epoch": 1.66, "learning_rate": 5.025597424445475e-05, "loss": 0.0084, "step": 642310 }, { "epoch": 1.66, "learning_rate": 5.0252086028083284e-05, "loss": 0.0108, "step": 642320 }, { "epoch": 1.67, "learning_rate": 5.024819781171182e-05, "loss": 0.0072, "step": 642330 }, { "epoch": 1.67, "learning_rate": 5.0244309595340353e-05, "loss": 0.0065, "step": 642340 }, { "epoch": 1.67, "learning_rate": 5.0240421378968895e-05, "loss": 0.0097, "step": 642350 }, { "epoch": 1.67, "learning_rate": 5.023653316259743e-05, "loss": 0.0092, "step": 642360 }, { "epoch": 1.67, "learning_rate": 5.0232644946225965e-05, "loss": 0.0076, "step": 642370 }, { "epoch": 1.67, "learning_rate": 5.02287567298545e-05, "loss": 0.0078, "step": 642380 }, { "epoch": 1.67, "learning_rate": 5.0224868513483035e-05, "loss": 0.0065, "step": 642390 }, { "epoch": 1.67, "learning_rate": 5.022098029711157e-05, "loss": 0.0093, "step": 642400 }, { "epoch": 1.67, "learning_rate": 5.0217092080740104e-05, "loss": 0.0082, "step": 642410 }, { "epoch": 1.67, "learning_rate": 5.021320386436864e-05, "loss": 0.0093, "step": 642420 }, { "epoch": 1.67, "learning_rate": 5.020931564799718e-05, "loss": 0.0093, "step": 642430 }, { "epoch": 1.67, "learning_rate": 5.0205427431625716e-05, "loss": 0.0078, "step": 642440 }, { "epoch": 1.67, "learning_rate": 5.020153921525425e-05, "loss": 0.0059, "step": 642450 }, { "epoch": 1.67, "learning_rate": 5.0197650998882785e-05, "loss": 0.0073, "step": 642460 }, { "epoch": 1.67, "learning_rate": 5.019376278251132e-05, "loss": 0.0066, "step": 642470 }, { "epoch": 1.67, "learning_rate": 5.018987456613985e-05, "loss": 0.0085, "step": 642480 }, { "epoch": 1.67, "learning_rate": 5.018598634976838e-05, "loss": 0.0075, "step": 642490 }, { "epoch": 1.67, "learning_rate": 5.018209813339692e-05, "loss": 0.0069, "step": 642500 }, { "epoch": 1.67, "learning_rate": 5.017820991702545e-05, "loss": 0.0107, "step": 642510 }, { "epoch": 1.67, "learning_rate": 5.017432170065399e-05, "loss": 0.0081, "step": 642520 }, { "epoch": 1.67, "learning_rate": 5.017043348428253e-05, "loss": 0.0086, "step": 642530 }, { "epoch": 1.67, "learning_rate": 5.0166545267911064e-05, "loss": 0.009, "step": 642540 }, { "epoch": 1.67, "learning_rate": 5.01626570515396e-05, "loss": 0.0073, "step": 642550 }, { "epoch": 1.67, "learning_rate": 5.0158768835168134e-05, "loss": 0.0059, "step": 642560 }, { "epoch": 1.67, "learning_rate": 5.015488061879667e-05, "loss": 0.006, "step": 642570 }, { "epoch": 1.67, "learning_rate": 5.0150992402425204e-05, "loss": 0.0085, "step": 642580 }, { "epoch": 1.67, "learning_rate": 5.014710418605374e-05, "loss": 0.011, "step": 642590 }, { "epoch": 1.67, "learning_rate": 5.0143215969682273e-05, "loss": 0.009, "step": 642600 }, { "epoch": 1.67, "learning_rate": 5.0139327753310815e-05, "loss": 0.0083, "step": 642610 }, { "epoch": 1.67, "learning_rate": 5.013543953693935e-05, "loss": 0.007, "step": 642620 }, { "epoch": 1.67, "learning_rate": 5.0131551320567885e-05, "loss": 0.0089, "step": 642630 }, { "epoch": 1.67, "learning_rate": 5.012766310419642e-05, "loss": 0.0066, "step": 642640 }, { "epoch": 1.67, "learning_rate": 5.0123774887824955e-05, "loss": 0.0098, "step": 642650 }, { "epoch": 1.67, "learning_rate": 5.011988667145349e-05, "loss": 0.0065, "step": 642660 }, { "epoch": 1.67, "learning_rate": 5.0115998455082024e-05, "loss": 0.0075, "step": 642670 }, { "epoch": 1.67, "learning_rate": 5.011211023871056e-05, "loss": 0.0077, "step": 642680 }, { "epoch": 1.67, "learning_rate": 5.01082220223391e-05, "loss": 0.0071, "step": 642690 }, { "epoch": 1.67, "learning_rate": 5.0104333805967636e-05, "loss": 0.0101, "step": 642700 }, { "epoch": 1.67, "learning_rate": 5.010044558959617e-05, "loss": 0.008, "step": 642710 }, { "epoch": 1.67, "learning_rate": 5.0096557373224705e-05, "loss": 0.0091, "step": 642720 }, { "epoch": 1.67, "learning_rate": 5.0092669156853233e-05, "loss": 0.0062, "step": 642730 }, { "epoch": 1.67, "learning_rate": 5.008878094048177e-05, "loss": 0.0068, "step": 642740 }, { "epoch": 1.67, "learning_rate": 5.00848927241103e-05, "loss": 0.0098, "step": 642750 }, { "epoch": 1.67, "learning_rate": 5.008100450773884e-05, "loss": 0.0067, "step": 642760 }, { "epoch": 1.67, "learning_rate": 5.007711629136737e-05, "loss": 0.0061, "step": 642770 }, { "epoch": 1.67, "learning_rate": 5.007322807499591e-05, "loss": 0.0076, "step": 642780 }, { "epoch": 1.67, "learning_rate": 5.006933985862445e-05, "loss": 0.0069, "step": 642790 }, { "epoch": 1.67, "learning_rate": 5.0065451642252984e-05, "loss": 0.0075, "step": 642800 }, { "epoch": 1.67, "learning_rate": 5.006156342588152e-05, "loss": 0.0077, "step": 642810 }, { "epoch": 1.67, "learning_rate": 5.0057675209510054e-05, "loss": 0.0087, "step": 642820 }, { "epoch": 1.67, "learning_rate": 5.005378699313859e-05, "loss": 0.0063, "step": 642830 }, { "epoch": 1.67, "learning_rate": 5.0049898776767124e-05, "loss": 0.0059, "step": 642840 }, { "epoch": 1.67, "learning_rate": 5.004601056039566e-05, "loss": 0.0103, "step": 642850 }, { "epoch": 1.67, "learning_rate": 5.004212234402419e-05, "loss": 0.0102, "step": 642860 }, { "epoch": 1.67, "learning_rate": 5.0038234127652735e-05, "loss": 0.0089, "step": 642870 }, { "epoch": 1.67, "learning_rate": 5.003434591128127e-05, "loss": 0.0111, "step": 642880 }, { "epoch": 1.67, "learning_rate": 5.0030457694909805e-05, "loss": 0.0094, "step": 642890 }, { "epoch": 1.67, "learning_rate": 5.002656947853834e-05, "loss": 0.0084, "step": 642900 }, { "epoch": 1.67, "learning_rate": 5.0022681262166874e-05, "loss": 0.0088, "step": 642910 }, { "epoch": 1.67, "learning_rate": 5.001879304579541e-05, "loss": 0.0093, "step": 642920 }, { "epoch": 1.67, "learning_rate": 5.0014904829423944e-05, "loss": 0.0057, "step": 642930 }, { "epoch": 1.67, "learning_rate": 5.001101661305248e-05, "loss": 0.0081, "step": 642940 }, { "epoch": 1.67, "learning_rate": 5.000712839668102e-05, "loss": 0.0087, "step": 642950 }, { "epoch": 1.67, "learning_rate": 5.0003240180309556e-05, "loss": 0.0082, "step": 642960 }, { "epoch": 1.67, "learning_rate": 4.9999351963938084e-05, "loss": 0.0099, "step": 642970 }, { "epoch": 1.67, "learning_rate": 4.999546374756662e-05, "loss": 0.0076, "step": 642980 }, { "epoch": 1.67, "learning_rate": 4.999157553119515e-05, "loss": 0.0067, "step": 642990 }, { "epoch": 1.67, "learning_rate": 4.998768731482369e-05, "loss": 0.0089, "step": 643000 }, { "epoch": 1.67, "eval_cer": 0.8816956881384969, "eval_loss": 0.005269117187708616, "eval_runtime": 107.7748, "eval_samples_per_second": 18.557, "eval_steps_per_second": 4.639, "step": 643000 }, { "epoch": 1.67, "learning_rate": 4.998379909845222e-05, "loss": 0.0094, "step": 643010 }, { "epoch": 1.67, "learning_rate": 4.997991088208076e-05, "loss": 0.0074, "step": 643020 }, { "epoch": 1.67, "learning_rate": 4.997602266570929e-05, "loss": 0.0074, "step": 643030 }, { "epoch": 1.67, "learning_rate": 4.997213444933783e-05, "loss": 0.0068, "step": 643040 }, { "epoch": 1.67, "learning_rate": 4.996824623296637e-05, "loss": 0.0079, "step": 643050 }, { "epoch": 1.67, "learning_rate": 4.9964358016594904e-05, "loss": 0.0081, "step": 643060 }, { "epoch": 1.67, "learning_rate": 4.996046980022344e-05, "loss": 0.0068, "step": 643070 }, { "epoch": 1.67, "learning_rate": 4.9956581583851974e-05, "loss": 0.0061, "step": 643080 }, { "epoch": 1.67, "learning_rate": 4.995269336748051e-05, "loss": 0.0071, "step": 643090 }, { "epoch": 1.67, "learning_rate": 4.9948805151109044e-05, "loss": 0.0065, "step": 643100 }, { "epoch": 1.67, "learning_rate": 4.994491693473758e-05, "loss": 0.0091, "step": 643110 }, { "epoch": 1.67, "learning_rate": 4.994102871836611e-05, "loss": 0.0063, "step": 643120 }, { "epoch": 1.67, "learning_rate": 4.9937140501994655e-05, "loss": 0.007, "step": 643130 }, { "epoch": 1.67, "learning_rate": 4.993325228562319e-05, "loss": 0.0081, "step": 643140 }, { "epoch": 1.67, "learning_rate": 4.9929364069251725e-05, "loss": 0.0089, "step": 643150 }, { "epoch": 1.67, "learning_rate": 4.992547585288026e-05, "loss": 0.0076, "step": 643160 }, { "epoch": 1.67, "learning_rate": 4.9921587636508794e-05, "loss": 0.0091, "step": 643170 }, { "epoch": 1.67, "learning_rate": 4.991769942013733e-05, "loss": 0.008, "step": 643180 }, { "epoch": 1.67, "learning_rate": 4.9913811203765864e-05, "loss": 0.0102, "step": 643190 }, { "epoch": 1.67, "learning_rate": 4.99099229873944e-05, "loss": 0.0088, "step": 643200 }, { "epoch": 1.67, "learning_rate": 4.990603477102294e-05, "loss": 0.0099, "step": 643210 }, { "epoch": 1.67, "learning_rate": 4.990214655465146e-05, "loss": 0.0084, "step": 643220 }, { "epoch": 1.67, "learning_rate": 4.9898258338280004e-05, "loss": 0.0096, "step": 643230 }, { "epoch": 1.67, "learning_rate": 4.989437012190854e-05, "loss": 0.008, "step": 643240 }, { "epoch": 1.67, "learning_rate": 4.989048190553707e-05, "loss": 0.007, "step": 643250 }, { "epoch": 1.67, "learning_rate": 4.988659368916561e-05, "loss": 0.0081, "step": 643260 }, { "epoch": 1.67, "learning_rate": 4.988270547279414e-05, "loss": 0.0076, "step": 643270 }, { "epoch": 1.67, "learning_rate": 4.987881725642268e-05, "loss": 0.0072, "step": 643280 }, { "epoch": 1.67, "learning_rate": 4.987492904005121e-05, "loss": 0.0091, "step": 643290 }, { "epoch": 1.67, "learning_rate": 4.987104082367975e-05, "loss": 0.0083, "step": 643300 }, { "epoch": 1.67, "learning_rate": 4.986715260730829e-05, "loss": 0.0062, "step": 643310 }, { "epoch": 1.67, "learning_rate": 4.9863264390936824e-05, "loss": 0.0097, "step": 643320 }, { "epoch": 1.67, "learning_rate": 4.985937617456536e-05, "loss": 0.0065, "step": 643330 }, { "epoch": 1.67, "learning_rate": 4.9855487958193894e-05, "loss": 0.0084, "step": 643340 }, { "epoch": 1.67, "learning_rate": 4.985159974182243e-05, "loss": 0.0134, "step": 643350 }, { "epoch": 1.67, "learning_rate": 4.9847711525450964e-05, "loss": 0.0078, "step": 643360 }, { "epoch": 1.67, "learning_rate": 4.98438233090795e-05, "loss": 0.0089, "step": 643370 }, { "epoch": 1.67, "learning_rate": 4.983993509270803e-05, "loss": 0.0065, "step": 643380 }, { "epoch": 1.67, "learning_rate": 4.9836046876336575e-05, "loss": 0.0093, "step": 643390 }, { "epoch": 1.67, "learning_rate": 4.983215865996511e-05, "loss": 0.0088, "step": 643400 }, { "epoch": 1.67, "learning_rate": 4.9828270443593645e-05, "loss": 0.007, "step": 643410 }, { "epoch": 1.67, "learning_rate": 4.982438222722218e-05, "loss": 0.0082, "step": 643420 }, { "epoch": 1.67, "learning_rate": 4.9820494010850714e-05, "loss": 0.0096, "step": 643430 }, { "epoch": 1.67, "learning_rate": 4.981660579447925e-05, "loss": 0.0069, "step": 643440 }, { "epoch": 1.67, "learning_rate": 4.9812717578107784e-05, "loss": 0.0121, "step": 643450 }, { "epoch": 1.67, "learning_rate": 4.980882936173632e-05, "loss": 0.007, "step": 643460 }, { "epoch": 1.67, "learning_rate": 4.980494114536485e-05, "loss": 0.0076, "step": 643470 }, { "epoch": 1.67, "learning_rate": 4.980105292899338e-05, "loss": 0.0138, "step": 643480 }, { "epoch": 1.67, "learning_rate": 4.9797164712621924e-05, "loss": 0.0055, "step": 643490 }, { "epoch": 1.67, "learning_rate": 4.979327649625046e-05, "loss": 0.0076, "step": 643500 }, { "epoch": 1.67, "learning_rate": 4.978938827987899e-05, "loss": 0.0081, "step": 643510 }, { "epoch": 1.67, "learning_rate": 4.978550006350753e-05, "loss": 0.0076, "step": 643520 }, { "epoch": 1.67, "learning_rate": 4.978161184713606e-05, "loss": 0.0095, "step": 643530 }, { "epoch": 1.67, "learning_rate": 4.97777236307646e-05, "loss": 0.0078, "step": 643540 }, { "epoch": 1.67, "learning_rate": 4.977383541439313e-05, "loss": 0.0088, "step": 643550 }, { "epoch": 1.67, "learning_rate": 4.976994719802167e-05, "loss": 0.0108, "step": 643560 }, { "epoch": 1.67, "learning_rate": 4.976605898165021e-05, "loss": 0.0098, "step": 643570 }, { "epoch": 1.67, "learning_rate": 4.9762170765278744e-05, "loss": 0.0069, "step": 643580 }, { "epoch": 1.67, "learning_rate": 4.975828254890728e-05, "loss": 0.0063, "step": 643590 }, { "epoch": 1.67, "learning_rate": 4.9754394332535814e-05, "loss": 0.0109, "step": 643600 }, { "epoch": 1.67, "learning_rate": 4.975050611616435e-05, "loss": 0.0052, "step": 643610 }, { "epoch": 1.67, "learning_rate": 4.9746617899792884e-05, "loss": 0.0084, "step": 643620 }, { "epoch": 1.67, "learning_rate": 4.974272968342142e-05, "loss": 0.0074, "step": 643630 }, { "epoch": 1.67, "learning_rate": 4.973884146704995e-05, "loss": 0.0073, "step": 643640 }, { "epoch": 1.67, "learning_rate": 4.973495325067849e-05, "loss": 0.0069, "step": 643650 }, { "epoch": 1.67, "learning_rate": 4.973106503430703e-05, "loss": 0.0096, "step": 643660 }, { "epoch": 1.67, "learning_rate": 4.9727176817935565e-05, "loss": 0.0077, "step": 643670 }, { "epoch": 1.67, "learning_rate": 4.97232886015641e-05, "loss": 0.0096, "step": 643680 }, { "epoch": 1.67, "learning_rate": 4.9719400385192634e-05, "loss": 0.0076, "step": 643690 }, { "epoch": 1.67, "learning_rate": 4.971551216882117e-05, "loss": 0.0085, "step": 643700 }, { "epoch": 1.67, "learning_rate": 4.9711623952449704e-05, "loss": 0.0104, "step": 643710 }, { "epoch": 1.67, "learning_rate": 4.970773573607823e-05, "loss": 0.0094, "step": 643720 }, { "epoch": 1.67, "learning_rate": 4.970384751970677e-05, "loss": 0.0073, "step": 643730 }, { "epoch": 1.67, "learning_rate": 4.96999593033353e-05, "loss": 0.0062, "step": 643740 }, { "epoch": 1.67, "learning_rate": 4.969607108696384e-05, "loss": 0.0097, "step": 643750 }, { "epoch": 1.67, "learning_rate": 4.969218287059238e-05, "loss": 0.0074, "step": 643760 }, { "epoch": 1.67, "learning_rate": 4.968829465422091e-05, "loss": 0.0089, "step": 643770 }, { "epoch": 1.67, "learning_rate": 4.968440643784945e-05, "loss": 0.0062, "step": 643780 }, { "epoch": 1.67, "learning_rate": 4.968051822147798e-05, "loss": 0.009, "step": 643790 }, { "epoch": 1.67, "learning_rate": 4.967663000510652e-05, "loss": 0.0099, "step": 643800 }, { "epoch": 1.67, "learning_rate": 4.967274178873505e-05, "loss": 0.008, "step": 643810 }, { "epoch": 1.67, "learning_rate": 4.966885357236359e-05, "loss": 0.0062, "step": 643820 }, { "epoch": 1.67, "learning_rate": 4.966496535599212e-05, "loss": 0.0079, "step": 643830 }, { "epoch": 1.67, "learning_rate": 4.9661077139620664e-05, "loss": 0.0076, "step": 643840 }, { "epoch": 1.67, "learning_rate": 4.96571889232492e-05, "loss": 0.0086, "step": 643850 }, { "epoch": 1.67, "learning_rate": 4.9653300706877734e-05, "loss": 0.0073, "step": 643860 }, { "epoch": 1.67, "learning_rate": 4.964941249050627e-05, "loss": 0.0073, "step": 643870 }, { "epoch": 1.67, "learning_rate": 4.9645524274134803e-05, "loss": 0.0073, "step": 643880 }, { "epoch": 1.67, "learning_rate": 4.964163605776334e-05, "loss": 0.0076, "step": 643890 }, { "epoch": 1.67, "learning_rate": 4.963774784139187e-05, "loss": 0.0059, "step": 643900 }, { "epoch": 1.67, "learning_rate": 4.963385962502041e-05, "loss": 0.008, "step": 643910 }, { "epoch": 1.67, "learning_rate": 4.962997140864895e-05, "loss": 0.0107, "step": 643920 }, { "epoch": 1.67, "learning_rate": 4.9626083192277485e-05, "loss": 0.0067, "step": 643930 }, { "epoch": 1.67, "learning_rate": 4.962219497590602e-05, "loss": 0.0072, "step": 643940 }, { "epoch": 1.67, "learning_rate": 4.9618306759534554e-05, "loss": 0.0092, "step": 643950 }, { "epoch": 1.67, "learning_rate": 4.961441854316309e-05, "loss": 0.0069, "step": 643960 }, { "epoch": 1.67, "learning_rate": 4.961053032679162e-05, "loss": 0.008, "step": 643970 }, { "epoch": 1.67, "learning_rate": 4.960664211042015e-05, "loss": 0.0088, "step": 643980 }, { "epoch": 1.67, "learning_rate": 4.960275389404869e-05, "loss": 0.0077, "step": 643990 }, { "epoch": 1.67, "learning_rate": 4.959886567767722e-05, "loss": 0.0075, "step": 644000 }, { "epoch": 1.67, "eval_cer": 0.8816690950367475, "eval_loss": 0.005179722793400288, "eval_runtime": 107.801, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 644000 }, { "epoch": 1.67, "learning_rate": 4.959497746130576e-05, "loss": 0.0078, "step": 644010 }, { "epoch": 1.67, "learning_rate": 4.95910892449343e-05, "loss": 0.0082, "step": 644020 }, { "epoch": 1.67, "learning_rate": 4.958720102856283e-05, "loss": 0.0074, "step": 644030 }, { "epoch": 1.67, "learning_rate": 4.958331281219137e-05, "loss": 0.0083, "step": 644040 }, { "epoch": 1.67, "learning_rate": 4.95794245958199e-05, "loss": 0.0081, "step": 644050 }, { "epoch": 1.67, "learning_rate": 4.957553637944844e-05, "loss": 0.0077, "step": 644060 }, { "epoch": 1.67, "learning_rate": 4.957164816307697e-05, "loss": 0.0063, "step": 644070 }, { "epoch": 1.67, "learning_rate": 4.956775994670551e-05, "loss": 0.0093, "step": 644080 }, { "epoch": 1.67, "learning_rate": 4.956387173033404e-05, "loss": 0.0118, "step": 644090 }, { "epoch": 1.67, "learning_rate": 4.9559983513962584e-05, "loss": 0.008, "step": 644100 }, { "epoch": 1.67, "learning_rate": 4.955609529759112e-05, "loss": 0.0088, "step": 644110 }, { "epoch": 1.67, "learning_rate": 4.9552207081219654e-05, "loss": 0.0103, "step": 644120 }, { "epoch": 1.67, "learning_rate": 4.954831886484819e-05, "loss": 0.0083, "step": 644130 }, { "epoch": 1.67, "learning_rate": 4.9544430648476723e-05, "loss": 0.0086, "step": 644140 }, { "epoch": 1.67, "learning_rate": 4.954054243210526e-05, "loss": 0.0134, "step": 644150 }, { "epoch": 1.67, "learning_rate": 4.953665421573379e-05, "loss": 0.0079, "step": 644160 }, { "epoch": 1.67, "learning_rate": 4.953276599936233e-05, "loss": 0.0072, "step": 644170 }, { "epoch": 1.67, "learning_rate": 4.952887778299087e-05, "loss": 0.011, "step": 644180 }, { "epoch": 1.67, "learning_rate": 4.9524989566619405e-05, "loss": 0.0056, "step": 644190 }, { "epoch": 1.67, "learning_rate": 4.952110135024794e-05, "loss": 0.0078, "step": 644200 }, { "epoch": 1.67, "learning_rate": 4.951721313387647e-05, "loss": 0.0088, "step": 644210 }, { "epoch": 1.67, "learning_rate": 4.9513324917505e-05, "loss": 0.0066, "step": 644220 }, { "epoch": 1.67, "learning_rate": 4.950943670113354e-05, "loss": 0.0073, "step": 644230 }, { "epoch": 1.67, "learning_rate": 4.950554848476207e-05, "loss": 0.0098, "step": 644240 }, { "epoch": 1.67, "learning_rate": 4.950166026839061e-05, "loss": 0.0113, "step": 644250 }, { "epoch": 1.67, "learning_rate": 4.949777205201914e-05, "loss": 0.0104, "step": 644260 }, { "epoch": 1.67, "learning_rate": 4.949388383564768e-05, "loss": 0.0078, "step": 644270 }, { "epoch": 1.67, "learning_rate": 4.948999561927622e-05, "loss": 0.0079, "step": 644280 }, { "epoch": 1.67, "learning_rate": 4.948610740290475e-05, "loss": 0.0087, "step": 644290 }, { "epoch": 1.67, "learning_rate": 4.948221918653329e-05, "loss": 0.0085, "step": 644300 }, { "epoch": 1.67, "learning_rate": 4.947833097016182e-05, "loss": 0.007, "step": 644310 }, { "epoch": 1.67, "learning_rate": 4.947444275379036e-05, "loss": 0.0067, "step": 644320 }, { "epoch": 1.67, "learning_rate": 4.947055453741889e-05, "loss": 0.01, "step": 644330 }, { "epoch": 1.67, "learning_rate": 4.946666632104743e-05, "loss": 0.0076, "step": 644340 }, { "epoch": 1.67, "learning_rate": 4.946277810467596e-05, "loss": 0.0081, "step": 644350 }, { "epoch": 1.67, "learning_rate": 4.9458889888304504e-05, "loss": 0.0101, "step": 644360 }, { "epoch": 1.67, "learning_rate": 4.945500167193304e-05, "loss": 0.0096, "step": 644370 }, { "epoch": 1.67, "learning_rate": 4.9451113455561574e-05, "loss": 0.0083, "step": 644380 }, { "epoch": 1.67, "learning_rate": 4.944722523919011e-05, "loss": 0.0078, "step": 644390 }, { "epoch": 1.67, "learning_rate": 4.944333702281864e-05, "loss": 0.0079, "step": 644400 }, { "epoch": 1.67, "learning_rate": 4.943944880644718e-05, "loss": 0.0077, "step": 644410 }, { "epoch": 1.67, "learning_rate": 4.943556059007571e-05, "loss": 0.0061, "step": 644420 }, { "epoch": 1.67, "learning_rate": 4.943167237370425e-05, "loss": 0.009, "step": 644430 }, { "epoch": 1.67, "learning_rate": 4.942778415733279e-05, "loss": 0.0077, "step": 644440 }, { "epoch": 1.67, "learning_rate": 4.9423895940961324e-05, "loss": 0.0075, "step": 644450 }, { "epoch": 1.67, "learning_rate": 4.942000772458985e-05, "loss": 0.0102, "step": 644460 }, { "epoch": 1.67, "learning_rate": 4.941611950821839e-05, "loss": 0.0058, "step": 644470 }, { "epoch": 1.67, "learning_rate": 4.941223129184692e-05, "loss": 0.0084, "step": 644480 }, { "epoch": 1.67, "learning_rate": 4.940834307547546e-05, "loss": 0.0079, "step": 644490 }, { "epoch": 1.67, "learning_rate": 4.940445485910399e-05, "loss": 0.0115, "step": 644500 }, { "epoch": 1.67, "learning_rate": 4.940056664273253e-05, "loss": 0.0077, "step": 644510 }, { "epoch": 1.67, "learning_rate": 4.939667842636106e-05, "loss": 0.0117, "step": 644520 }, { "epoch": 1.67, "learning_rate": 4.9392790209989597e-05, "loss": 0.0054, "step": 644530 }, { "epoch": 1.67, "learning_rate": 4.938890199361814e-05, "loss": 0.0057, "step": 644540 }, { "epoch": 1.67, "learning_rate": 4.938501377724667e-05, "loss": 0.0082, "step": 644550 }, { "epoch": 1.67, "learning_rate": 4.938112556087521e-05, "loss": 0.0073, "step": 644560 }, { "epoch": 1.67, "learning_rate": 4.937723734450374e-05, "loss": 0.01, "step": 644570 }, { "epoch": 1.67, "learning_rate": 4.937334912813228e-05, "loss": 0.0062, "step": 644580 }, { "epoch": 1.67, "learning_rate": 4.936946091176081e-05, "loss": 0.0058, "step": 644590 }, { "epoch": 1.67, "learning_rate": 4.936557269538935e-05, "loss": 0.0084, "step": 644600 }, { "epoch": 1.67, "learning_rate": 4.936168447901788e-05, "loss": 0.0102, "step": 644610 }, { "epoch": 1.67, "learning_rate": 4.9357796262646424e-05, "loss": 0.0082, "step": 644620 }, { "epoch": 1.67, "learning_rate": 4.935390804627496e-05, "loss": 0.0095, "step": 644630 }, { "epoch": 1.67, "learning_rate": 4.9350019829903494e-05, "loss": 0.0077, "step": 644640 }, { "epoch": 1.67, "learning_rate": 4.934613161353203e-05, "loss": 0.0095, "step": 644650 }, { "epoch": 1.67, "learning_rate": 4.934224339716056e-05, "loss": 0.0078, "step": 644660 }, { "epoch": 1.67, "learning_rate": 4.93383551807891e-05, "loss": 0.007, "step": 644670 }, { "epoch": 1.67, "learning_rate": 4.933446696441763e-05, "loss": 0.0079, "step": 644680 }, { "epoch": 1.67, "learning_rate": 4.933057874804617e-05, "loss": 0.0102, "step": 644690 }, { "epoch": 1.67, "learning_rate": 4.932669053167471e-05, "loss": 0.0082, "step": 644700 }, { "epoch": 1.67, "learning_rate": 4.932280231530323e-05, "loss": 0.007, "step": 644710 }, { "epoch": 1.67, "learning_rate": 4.931891409893177e-05, "loss": 0.0103, "step": 644720 }, { "epoch": 1.67, "learning_rate": 4.931502588256031e-05, "loss": 0.0093, "step": 644730 }, { "epoch": 1.67, "learning_rate": 4.931113766618884e-05, "loss": 0.0077, "step": 644740 }, { "epoch": 1.67, "learning_rate": 4.930724944981738e-05, "loss": 0.0067, "step": 644750 }, { "epoch": 1.67, "learning_rate": 4.930336123344591e-05, "loss": 0.0113, "step": 644760 }, { "epoch": 1.67, "learning_rate": 4.929947301707445e-05, "loss": 0.0062, "step": 644770 }, { "epoch": 1.67, "learning_rate": 4.929558480070298e-05, "loss": 0.0081, "step": 644780 }, { "epoch": 1.67, "learning_rate": 4.9291696584331517e-05, "loss": 0.0166, "step": 644790 }, { "epoch": 1.67, "learning_rate": 4.928780836796006e-05, "loss": 0.0076, "step": 644800 }, { "epoch": 1.67, "learning_rate": 4.928392015158859e-05, "loss": 0.0115, "step": 644810 }, { "epoch": 1.67, "learning_rate": 4.928003193521713e-05, "loss": 0.0126, "step": 644820 }, { "epoch": 1.67, "learning_rate": 4.927614371884566e-05, "loss": 0.008, "step": 644830 }, { "epoch": 1.67, "learning_rate": 4.92722555024742e-05, "loss": 0.0057, "step": 644840 }, { "epoch": 1.67, "learning_rate": 4.926836728610273e-05, "loss": 0.0086, "step": 644850 }, { "epoch": 1.67, "learning_rate": 4.926447906973127e-05, "loss": 0.0077, "step": 644860 }, { "epoch": 1.67, "learning_rate": 4.92605908533598e-05, "loss": 0.0099, "step": 644870 }, { "epoch": 1.67, "learning_rate": 4.9256702636988344e-05, "loss": 0.0087, "step": 644880 }, { "epoch": 1.67, "learning_rate": 4.925281442061688e-05, "loss": 0.0075, "step": 644890 }, { "epoch": 1.67, "learning_rate": 4.9248926204245414e-05, "loss": 0.0089, "step": 644900 }, { "epoch": 1.67, "learning_rate": 4.924503798787395e-05, "loss": 0.0074, "step": 644910 }, { "epoch": 1.67, "learning_rate": 4.924114977150248e-05, "loss": 0.0161, "step": 644920 }, { "epoch": 1.67, "learning_rate": 4.923726155513102e-05, "loss": 0.0085, "step": 644930 }, { "epoch": 1.67, "learning_rate": 4.923337333875955e-05, "loss": 0.0082, "step": 644940 }, { "epoch": 1.67, "learning_rate": 4.922948512238809e-05, "loss": 0.0105, "step": 644950 }, { "epoch": 1.67, "learning_rate": 4.9225596906016616e-05, "loss": 0.0071, "step": 644960 }, { "epoch": 1.67, "learning_rate": 4.922170868964515e-05, "loss": 0.006, "step": 644970 }, { "epoch": 1.67, "learning_rate": 4.921782047327369e-05, "loss": 0.0082, "step": 644980 }, { "epoch": 1.67, "learning_rate": 4.921393225690223e-05, "loss": 0.0102, "step": 644990 }, { "epoch": 1.67, "learning_rate": 4.921004404053076e-05, "loss": 0.0078, "step": 645000 }, { "epoch": 1.67, "eval_cer": 0.8816718943106159, "eval_loss": 0.0051052626222372055, "eval_runtime": 107.7487, "eval_samples_per_second": 18.562, "eval_steps_per_second": 4.64, "step": 645000 }, { "epoch": 1.67, "learning_rate": 4.92061558241593e-05, "loss": 0.0079, "step": 645010 }, { "epoch": 1.67, "learning_rate": 4.920226760778783e-05, "loss": 0.0077, "step": 645020 }, { "epoch": 1.67, "learning_rate": 4.919837939141637e-05, "loss": 0.0115, "step": 645030 }, { "epoch": 1.67, "learning_rate": 4.91944911750449e-05, "loss": 0.0078, "step": 645040 }, { "epoch": 1.67, "learning_rate": 4.9190602958673436e-05, "loss": 0.0093, "step": 645050 }, { "epoch": 1.67, "learning_rate": 4.918671474230198e-05, "loss": 0.0077, "step": 645060 }, { "epoch": 1.67, "learning_rate": 4.918282652593051e-05, "loss": 0.0088, "step": 645070 }, { "epoch": 1.67, "learning_rate": 4.917893830955905e-05, "loss": 0.0091, "step": 645080 }, { "epoch": 1.67, "learning_rate": 4.917505009318758e-05, "loss": 0.0081, "step": 645090 }, { "epoch": 1.67, "learning_rate": 4.917116187681612e-05, "loss": 0.0059, "step": 645100 }, { "epoch": 1.67, "learning_rate": 4.916727366044465e-05, "loss": 0.0067, "step": 645110 }, { "epoch": 1.67, "learning_rate": 4.916338544407319e-05, "loss": 0.0077, "step": 645120 }, { "epoch": 1.67, "learning_rate": 4.915949722770172e-05, "loss": 0.0088, "step": 645130 }, { "epoch": 1.67, "learning_rate": 4.915560901133026e-05, "loss": 0.0095, "step": 645140 }, { "epoch": 1.67, "learning_rate": 4.91517207949588e-05, "loss": 0.0082, "step": 645150 }, { "epoch": 1.67, "learning_rate": 4.9147832578587334e-05, "loss": 0.0071, "step": 645160 }, { "epoch": 1.67, "learning_rate": 4.914394436221587e-05, "loss": 0.0083, "step": 645170 }, { "epoch": 1.67, "learning_rate": 4.91400561458444e-05, "loss": 0.0095, "step": 645180 }, { "epoch": 1.67, "learning_rate": 4.913616792947294e-05, "loss": 0.0072, "step": 645190 }, { "epoch": 1.67, "learning_rate": 4.913227971310147e-05, "loss": 0.0095, "step": 645200 }, { "epoch": 1.67, "learning_rate": 4.912839149673e-05, "loss": 0.0074, "step": 645210 }, { "epoch": 1.67, "learning_rate": 4.9124503280358536e-05, "loss": 0.0066, "step": 645220 }, { "epoch": 1.67, "learning_rate": 4.912061506398707e-05, "loss": 0.0083, "step": 645230 }, { "epoch": 1.67, "learning_rate": 4.9116726847615606e-05, "loss": 0.0066, "step": 645240 }, { "epoch": 1.67, "learning_rate": 4.911283863124415e-05, "loss": 0.0093, "step": 645250 }, { "epoch": 1.67, "learning_rate": 4.910895041487268e-05, "loss": 0.0089, "step": 645260 }, { "epoch": 1.67, "learning_rate": 4.910506219850122e-05, "loss": 0.0092, "step": 645270 }, { "epoch": 1.67, "learning_rate": 4.910117398212975e-05, "loss": 0.0069, "step": 645280 }, { "epoch": 1.67, "learning_rate": 4.909728576575829e-05, "loss": 0.006, "step": 645290 }, { "epoch": 1.67, "learning_rate": 4.909339754938682e-05, "loss": 0.0116, "step": 645300 }, { "epoch": 1.67, "learning_rate": 4.9089509333015356e-05, "loss": 0.0071, "step": 645310 }, { "epoch": 1.67, "learning_rate": 4.908562111664389e-05, "loss": 0.0073, "step": 645320 }, { "epoch": 1.67, "learning_rate": 4.908173290027243e-05, "loss": 0.0071, "step": 645330 }, { "epoch": 1.67, "learning_rate": 4.907784468390097e-05, "loss": 0.0105, "step": 645340 }, { "epoch": 1.67, "learning_rate": 4.90739564675295e-05, "loss": 0.0085, "step": 645350 }, { "epoch": 1.67, "learning_rate": 4.907006825115804e-05, "loss": 0.0121, "step": 645360 }, { "epoch": 1.67, "learning_rate": 4.906618003478657e-05, "loss": 0.0091, "step": 645370 }, { "epoch": 1.67, "learning_rate": 4.906229181841511e-05, "loss": 0.0113, "step": 645380 }, { "epoch": 1.67, "learning_rate": 4.905840360204364e-05, "loss": 0.005, "step": 645390 }, { "epoch": 1.67, "learning_rate": 4.905451538567218e-05, "loss": 0.0053, "step": 645400 }, { "epoch": 1.67, "learning_rate": 4.905062716930072e-05, "loss": 0.0073, "step": 645410 }, { "epoch": 1.67, "learning_rate": 4.9046738952929253e-05, "loss": 0.0077, "step": 645420 }, { "epoch": 1.67, "learning_rate": 4.904285073655779e-05, "loss": 0.0098, "step": 645430 }, { "epoch": 1.67, "learning_rate": 4.903896252018632e-05, "loss": 0.0079, "step": 645440 }, { "epoch": 1.67, "learning_rate": 4.903507430381485e-05, "loss": 0.0073, "step": 645450 }, { "epoch": 1.67, "learning_rate": 4.9031186087443386e-05, "loss": 0.011, "step": 645460 }, { "epoch": 1.67, "learning_rate": 4.902729787107192e-05, "loss": 0.0096, "step": 645470 }, { "epoch": 1.67, "learning_rate": 4.9023409654700456e-05, "loss": 0.0093, "step": 645480 }, { "epoch": 1.67, "learning_rate": 4.901952143832899e-05, "loss": 0.0094, "step": 645490 }, { "epoch": 1.67, "learning_rate": 4.9015633221957526e-05, "loss": 0.0066, "step": 645500 }, { "epoch": 1.67, "learning_rate": 4.901174500558607e-05, "loss": 0.0096, "step": 645510 }, { "epoch": 1.67, "learning_rate": 4.90078567892146e-05, "loss": 0.0108, "step": 645520 }, { "epoch": 1.67, "learning_rate": 4.900396857284314e-05, "loss": 0.0064, "step": 645530 }, { "epoch": 1.67, "learning_rate": 4.900008035647167e-05, "loss": 0.008, "step": 645540 }, { "epoch": 1.67, "learning_rate": 4.899619214010021e-05, "loss": 0.0066, "step": 645550 }, { "epoch": 1.67, "learning_rate": 4.899230392372874e-05, "loss": 0.0106, "step": 645560 }, { "epoch": 1.67, "learning_rate": 4.8988415707357276e-05, "loss": 0.0079, "step": 645570 }, { "epoch": 1.67, "learning_rate": 4.898452749098581e-05, "loss": 0.0137, "step": 645580 }, { "epoch": 1.67, "learning_rate": 4.898063927461435e-05, "loss": 0.0101, "step": 645590 }, { "epoch": 1.67, "learning_rate": 4.897675105824289e-05, "loss": 0.0089, "step": 645600 }, { "epoch": 1.67, "learning_rate": 4.897286284187142e-05, "loss": 0.0107, "step": 645610 }, { "epoch": 1.67, "learning_rate": 4.896897462549996e-05, "loss": 0.0096, "step": 645620 }, { "epoch": 1.67, "learning_rate": 4.896508640912849e-05, "loss": 0.0106, "step": 645630 }, { "epoch": 1.67, "learning_rate": 4.896119819275703e-05, "loss": 0.0104, "step": 645640 }, { "epoch": 1.67, "learning_rate": 4.895730997638556e-05, "loss": 0.007, "step": 645650 }, { "epoch": 1.67, "learning_rate": 4.89534217600141e-05, "loss": 0.008, "step": 645660 }, { "epoch": 1.67, "learning_rate": 4.894953354364264e-05, "loss": 0.0065, "step": 645670 }, { "epoch": 1.67, "learning_rate": 4.8945645327271173e-05, "loss": 0.0074, "step": 645680 }, { "epoch": 1.67, "learning_rate": 4.894175711089971e-05, "loss": 0.0074, "step": 645690 }, { "epoch": 1.67, "learning_rate": 4.8937868894528236e-05, "loss": 0.0103, "step": 645700 }, { "epoch": 1.67, "learning_rate": 4.893398067815677e-05, "loss": 0.0105, "step": 645710 }, { "epoch": 1.67, "learning_rate": 4.8930092461785306e-05, "loss": 0.0081, "step": 645720 }, { "epoch": 1.67, "learning_rate": 4.892620424541384e-05, "loss": 0.0086, "step": 645730 }, { "epoch": 1.67, "learning_rate": 4.8922316029042376e-05, "loss": 0.0065, "step": 645740 }, { "epoch": 1.67, "learning_rate": 4.891842781267091e-05, "loss": 0.0073, "step": 645750 }, { "epoch": 1.67, "learning_rate": 4.8914539596299446e-05, "loss": 0.0071, "step": 645760 }, { "epoch": 1.67, "learning_rate": 4.891065137992799e-05, "loss": 0.008, "step": 645770 }, { "epoch": 1.67, "learning_rate": 4.890676316355652e-05, "loss": 0.0079, "step": 645780 }, { "epoch": 1.67, "learning_rate": 4.890287494718506e-05, "loss": 0.0071, "step": 645790 }, { "epoch": 1.67, "learning_rate": 4.889898673081359e-05, "loss": 0.0069, "step": 645800 }, { "epoch": 1.67, "learning_rate": 4.8895098514442127e-05, "loss": 0.0073, "step": 645810 }, { "epoch": 1.67, "learning_rate": 4.889121029807066e-05, "loss": 0.0092, "step": 645820 }, { "epoch": 1.67, "learning_rate": 4.8887322081699196e-05, "loss": 0.0088, "step": 645830 }, { "epoch": 1.67, "learning_rate": 4.888343386532773e-05, "loss": 0.0066, "step": 645840 }, { "epoch": 1.67, "learning_rate": 4.887954564895627e-05, "loss": 0.008, "step": 645850 }, { "epoch": 1.67, "learning_rate": 4.887565743258481e-05, "loss": 0.0072, "step": 645860 }, { "epoch": 1.67, "learning_rate": 4.887176921621334e-05, "loss": 0.0087, "step": 645870 }, { "epoch": 1.67, "learning_rate": 4.886788099984188e-05, "loss": 0.0065, "step": 645880 }, { "epoch": 1.67, "learning_rate": 4.886399278347041e-05, "loss": 0.0088, "step": 645890 }, { "epoch": 1.67, "learning_rate": 4.886010456709895e-05, "loss": 0.0083, "step": 645900 }, { "epoch": 1.67, "learning_rate": 4.885621635072748e-05, "loss": 0.0084, "step": 645910 }, { "epoch": 1.67, "learning_rate": 4.885232813435602e-05, "loss": 0.0076, "step": 645920 }, { "epoch": 1.67, "learning_rate": 4.884843991798456e-05, "loss": 0.0154, "step": 645930 }, { "epoch": 1.67, "learning_rate": 4.884455170161309e-05, "loss": 0.0092, "step": 645940 }, { "epoch": 1.67, "learning_rate": 4.884066348524162e-05, "loss": 0.0093, "step": 645950 }, { "epoch": 1.67, "learning_rate": 4.8836775268870156e-05, "loss": 0.0099, "step": 645960 }, { "epoch": 1.67, "learning_rate": 4.883288705249869e-05, "loss": 0.0086, "step": 645970 }, { "epoch": 1.67, "learning_rate": 4.8828998836127226e-05, "loss": 0.012, "step": 645980 }, { "epoch": 1.67, "learning_rate": 4.882511061975576e-05, "loss": 0.0079, "step": 645990 }, { "epoch": 1.67, "learning_rate": 4.8821222403384296e-05, "loss": 0.0097, "step": 646000 }, { "epoch": 1.67, "eval_cer": 0.8816830914060892, "eval_loss": 0.00513434037566185, "eval_runtime": 108.0024, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.63, "step": 646000 }, { "epoch": 1.67, "learning_rate": 4.881733418701283e-05, "loss": 0.0096, "step": 646010 }, { "epoch": 1.67, "learning_rate": 4.8813445970641365e-05, "loss": 0.0062, "step": 646020 }, { "epoch": 1.67, "learning_rate": 4.880955775426991e-05, "loss": 0.0069, "step": 646030 }, { "epoch": 1.67, "learning_rate": 4.880566953789844e-05, "loss": 0.0081, "step": 646040 }, { "epoch": 1.67, "learning_rate": 4.880178132152698e-05, "loss": 0.0072, "step": 646050 }, { "epoch": 1.67, "learning_rate": 4.879789310515551e-05, "loss": 0.0086, "step": 646060 }, { "epoch": 1.67, "learning_rate": 4.8794004888784047e-05, "loss": 0.0078, "step": 646070 }, { "epoch": 1.67, "learning_rate": 4.879011667241258e-05, "loss": 0.008, "step": 646080 }, { "epoch": 1.67, "learning_rate": 4.8786228456041116e-05, "loss": 0.0066, "step": 646090 }, { "epoch": 1.67, "learning_rate": 4.878234023966965e-05, "loss": 0.0088, "step": 646100 }, { "epoch": 1.67, "learning_rate": 4.877845202329819e-05, "loss": 0.0111, "step": 646110 }, { "epoch": 1.67, "learning_rate": 4.877456380692673e-05, "loss": 0.01, "step": 646120 }, { "epoch": 1.67, "learning_rate": 4.877067559055526e-05, "loss": 0.0059, "step": 646130 }, { "epoch": 1.67, "learning_rate": 4.87667873741838e-05, "loss": 0.0075, "step": 646140 }, { "epoch": 1.67, "learning_rate": 4.876289915781233e-05, "loss": 0.0065, "step": 646150 }, { "epoch": 1.67, "learning_rate": 4.875901094144087e-05, "loss": 0.0077, "step": 646160 }, { "epoch": 1.67, "learning_rate": 4.87551227250694e-05, "loss": 0.0091, "step": 646170 }, { "epoch": 1.67, "learning_rate": 4.875123450869794e-05, "loss": 0.0078, "step": 646180 }, { "epoch": 1.68, "learning_rate": 4.874734629232648e-05, "loss": 0.0069, "step": 646190 }, { "epoch": 1.68, "learning_rate": 4.8743458075955e-05, "loss": 0.0086, "step": 646200 }, { "epoch": 1.68, "learning_rate": 4.873956985958354e-05, "loss": 0.0088, "step": 646210 }, { "epoch": 1.68, "learning_rate": 4.8735681643212076e-05, "loss": 0.0069, "step": 646220 }, { "epoch": 1.68, "learning_rate": 4.873179342684061e-05, "loss": 0.0062, "step": 646230 }, { "epoch": 1.68, "learning_rate": 4.8727905210469146e-05, "loss": 0.0074, "step": 646240 }, { "epoch": 1.68, "learning_rate": 4.872401699409768e-05, "loss": 0.0087, "step": 646250 }, { "epoch": 1.68, "learning_rate": 4.8720128777726216e-05, "loss": 0.009, "step": 646260 }, { "epoch": 1.68, "learning_rate": 4.871624056135475e-05, "loss": 0.007, "step": 646270 }, { "epoch": 1.68, "learning_rate": 4.8712352344983285e-05, "loss": 0.0067, "step": 646280 }, { "epoch": 1.68, "learning_rate": 4.870846412861183e-05, "loss": 0.0073, "step": 646290 }, { "epoch": 1.68, "learning_rate": 4.870457591224036e-05, "loss": 0.0075, "step": 646300 }, { "epoch": 1.68, "learning_rate": 4.87006876958689e-05, "loss": 0.0091, "step": 646310 }, { "epoch": 1.68, "learning_rate": 4.869679947949743e-05, "loss": 0.0071, "step": 646320 }, { "epoch": 1.68, "learning_rate": 4.8692911263125967e-05, "loss": 0.0062, "step": 646330 }, { "epoch": 1.68, "learning_rate": 4.86890230467545e-05, "loss": 0.007, "step": 646340 }, { "epoch": 1.68, "learning_rate": 4.8685134830383036e-05, "loss": 0.0074, "step": 646350 }, { "epoch": 1.68, "learning_rate": 4.868124661401157e-05, "loss": 0.0067, "step": 646360 }, { "epoch": 1.68, "learning_rate": 4.867735839764011e-05, "loss": 0.0102, "step": 646370 }, { "epoch": 1.68, "learning_rate": 4.867347018126865e-05, "loss": 0.0073, "step": 646380 }, { "epoch": 1.68, "learning_rate": 4.866958196489718e-05, "loss": 0.0073, "step": 646390 }, { "epoch": 1.68, "learning_rate": 4.866569374852572e-05, "loss": 0.008, "step": 646400 }, { "epoch": 1.68, "learning_rate": 4.866180553215425e-05, "loss": 0.0067, "step": 646410 }, { "epoch": 1.68, "learning_rate": 4.865791731578279e-05, "loss": 0.0099, "step": 646420 }, { "epoch": 1.68, "learning_rate": 4.865402909941132e-05, "loss": 0.0083, "step": 646430 }, { "epoch": 1.68, "learning_rate": 4.865014088303986e-05, "loss": 0.0078, "step": 646440 }, { "epoch": 1.68, "learning_rate": 4.8646252666668385e-05, "loss": 0.0087, "step": 646450 }, { "epoch": 1.68, "learning_rate": 4.864236445029692e-05, "loss": 0.0091, "step": 646460 }, { "epoch": 1.68, "learning_rate": 4.863847623392546e-05, "loss": 0.0087, "step": 646470 }, { "epoch": 1.68, "learning_rate": 4.8634588017553996e-05, "loss": 0.0084, "step": 646480 }, { "epoch": 1.68, "learning_rate": 4.863069980118253e-05, "loss": 0.0061, "step": 646490 }, { "epoch": 1.68, "learning_rate": 4.8626811584811066e-05, "loss": 0.0118, "step": 646500 }, { "epoch": 1.68, "learning_rate": 4.86229233684396e-05, "loss": 0.0082, "step": 646510 }, { "epoch": 1.68, "learning_rate": 4.8619035152068136e-05, "loss": 0.0065, "step": 646520 }, { "epoch": 1.68, "learning_rate": 4.861514693569667e-05, "loss": 0.0082, "step": 646530 }, { "epoch": 1.68, "learning_rate": 4.8611258719325205e-05, "loss": 0.0077, "step": 646540 }, { "epoch": 1.68, "learning_rate": 4.860737050295374e-05, "loss": 0.0085, "step": 646550 }, { "epoch": 1.68, "learning_rate": 4.860348228658228e-05, "loss": 0.0105, "step": 646560 }, { "epoch": 1.68, "learning_rate": 4.859959407021082e-05, "loss": 0.0079, "step": 646570 }, { "epoch": 1.68, "learning_rate": 4.859570585383935e-05, "loss": 0.0111, "step": 646580 }, { "epoch": 1.68, "learning_rate": 4.8591817637467886e-05, "loss": 0.0097, "step": 646590 }, { "epoch": 1.68, "learning_rate": 4.858792942109642e-05, "loss": 0.0113, "step": 646600 }, { "epoch": 1.68, "learning_rate": 4.8584041204724956e-05, "loss": 0.0079, "step": 646610 }, { "epoch": 1.68, "learning_rate": 4.858015298835349e-05, "loss": 0.0093, "step": 646620 }, { "epoch": 1.68, "learning_rate": 4.8576264771982026e-05, "loss": 0.013, "step": 646630 }, { "epoch": 1.68, "learning_rate": 4.857237655561057e-05, "loss": 0.0096, "step": 646640 }, { "epoch": 1.68, "learning_rate": 4.85684883392391e-05, "loss": 0.0065, "step": 646650 }, { "epoch": 1.68, "learning_rate": 4.856460012286764e-05, "loss": 0.0073, "step": 646660 }, { "epoch": 1.68, "learning_rate": 4.856071190649617e-05, "loss": 0.0089, "step": 646670 }, { "epoch": 1.68, "learning_rate": 4.855682369012471e-05, "loss": 0.0086, "step": 646680 }, { "epoch": 1.68, "learning_rate": 4.8552935473753235e-05, "loss": 0.0058, "step": 646690 }, { "epoch": 1.68, "learning_rate": 4.854904725738177e-05, "loss": 0.0084, "step": 646700 }, { "epoch": 1.68, "learning_rate": 4.8545159041010305e-05, "loss": 0.006, "step": 646710 }, { "epoch": 1.68, "learning_rate": 4.854127082463884e-05, "loss": 0.0105, "step": 646720 }, { "epoch": 1.68, "learning_rate": 4.8537382608267375e-05, "loss": 0.0111, "step": 646730 }, { "epoch": 1.68, "learning_rate": 4.8533494391895916e-05, "loss": 0.0105, "step": 646740 }, { "epoch": 1.68, "learning_rate": 4.852960617552445e-05, "loss": 0.0096, "step": 646750 }, { "epoch": 1.68, "learning_rate": 4.8525717959152986e-05, "loss": 0.0081, "step": 646760 }, { "epoch": 1.68, "learning_rate": 4.852182974278152e-05, "loss": 0.0071, "step": 646770 }, { "epoch": 1.68, "learning_rate": 4.8517941526410056e-05, "loss": 0.007, "step": 646780 }, { "epoch": 1.68, "learning_rate": 4.851405331003859e-05, "loss": 0.0089, "step": 646790 }, { "epoch": 1.68, "learning_rate": 4.8510165093667125e-05, "loss": 0.0102, "step": 646800 }, { "epoch": 1.68, "learning_rate": 4.850627687729566e-05, "loss": 0.0081, "step": 646810 }, { "epoch": 1.68, "learning_rate": 4.85023886609242e-05, "loss": 0.0137, "step": 646820 }, { "epoch": 1.68, "learning_rate": 4.849850044455274e-05, "loss": 0.0087, "step": 646830 }, { "epoch": 1.68, "learning_rate": 4.849461222818127e-05, "loss": 0.0066, "step": 646840 }, { "epoch": 1.68, "learning_rate": 4.8490724011809806e-05, "loss": 0.0064, "step": 646850 }, { "epoch": 1.68, "learning_rate": 4.848683579543834e-05, "loss": 0.0087, "step": 646860 }, { "epoch": 1.68, "learning_rate": 4.8482947579066876e-05, "loss": 0.0064, "step": 646870 }, { "epoch": 1.68, "learning_rate": 4.847905936269541e-05, "loss": 0.0093, "step": 646880 }, { "epoch": 1.68, "learning_rate": 4.8475171146323946e-05, "loss": 0.0102, "step": 646890 }, { "epoch": 1.68, "learning_rate": 4.847128292995249e-05, "loss": 0.0076, "step": 646900 }, { "epoch": 1.68, "learning_rate": 4.846739471358102e-05, "loss": 0.008, "step": 646910 }, { "epoch": 1.68, "learning_rate": 4.846350649720956e-05, "loss": 0.006, "step": 646920 }, { "epoch": 1.68, "learning_rate": 4.845961828083809e-05, "loss": 0.0076, "step": 646930 }, { "epoch": 1.68, "learning_rate": 4.845573006446662e-05, "loss": 0.0104, "step": 646940 }, { "epoch": 1.68, "learning_rate": 4.8451841848095155e-05, "loss": 0.0089, "step": 646950 }, { "epoch": 1.68, "learning_rate": 4.844795363172369e-05, "loss": 0.0071, "step": 646960 }, { "epoch": 1.68, "learning_rate": 4.8444065415352225e-05, "loss": 0.008, "step": 646970 }, { "epoch": 1.68, "learning_rate": 4.844017719898076e-05, "loss": 0.0091, "step": 646980 }, { "epoch": 1.68, "learning_rate": 4.8436288982609294e-05, "loss": 0.0118, "step": 646990 }, { "epoch": 1.68, "learning_rate": 4.8432400766237836e-05, "loss": 0.0079, "step": 647000 }, { "epoch": 1.68, "eval_cer": 0.8816746935844841, "eval_loss": 0.005205851048231125, "eval_runtime": 107.5257, "eval_samples_per_second": 18.6, "eval_steps_per_second": 4.65, "step": 647000 }, { "epoch": 1.68, "learning_rate": 4.842851254986637e-05, "loss": 0.0118, "step": 647010 }, { "epoch": 1.68, "learning_rate": 4.8424624333494906e-05, "loss": 0.0064, "step": 647020 }, { "epoch": 1.68, "learning_rate": 4.842073611712344e-05, "loss": 0.0095, "step": 647030 }, { "epoch": 1.68, "learning_rate": 4.8416847900751976e-05, "loss": 0.009, "step": 647040 }, { "epoch": 1.68, "learning_rate": 4.841295968438051e-05, "loss": 0.0079, "step": 647050 }, { "epoch": 1.68, "learning_rate": 4.8409071468009045e-05, "loss": 0.0088, "step": 647060 }, { "epoch": 1.68, "learning_rate": 4.840518325163758e-05, "loss": 0.0096, "step": 647070 }, { "epoch": 1.68, "learning_rate": 4.840129503526612e-05, "loss": 0.0128, "step": 647080 }, { "epoch": 1.68, "learning_rate": 4.839740681889466e-05, "loss": 0.0104, "step": 647090 }, { "epoch": 1.68, "learning_rate": 4.839351860252319e-05, "loss": 0.0089, "step": 647100 }, { "epoch": 1.68, "learning_rate": 4.8389630386151726e-05, "loss": 0.0077, "step": 647110 }, { "epoch": 1.68, "learning_rate": 4.838574216978026e-05, "loss": 0.0066, "step": 647120 }, { "epoch": 1.68, "learning_rate": 4.8381853953408796e-05, "loss": 0.0098, "step": 647130 }, { "epoch": 1.68, "learning_rate": 4.837796573703733e-05, "loss": 0.0071, "step": 647140 }, { "epoch": 1.68, "learning_rate": 4.8374077520665866e-05, "loss": 0.0069, "step": 647150 }, { "epoch": 1.68, "learning_rate": 4.837018930429441e-05, "loss": 0.0086, "step": 647160 }, { "epoch": 1.68, "learning_rate": 4.836630108792294e-05, "loss": 0.0093, "step": 647170 }, { "epoch": 1.68, "learning_rate": 4.836241287155148e-05, "loss": 0.0062, "step": 647180 }, { "epoch": 1.68, "learning_rate": 4.8358524655180005e-05, "loss": 0.0067, "step": 647190 }, { "epoch": 1.68, "learning_rate": 4.835463643880854e-05, "loss": 0.0095, "step": 647200 }, { "epoch": 1.68, "learning_rate": 4.8350748222437075e-05, "loss": 0.0076, "step": 647210 }, { "epoch": 1.68, "learning_rate": 4.834686000606561e-05, "loss": 0.0103, "step": 647220 }, { "epoch": 1.68, "learning_rate": 4.8342971789694145e-05, "loss": 0.0051, "step": 647230 }, { "epoch": 1.68, "learning_rate": 4.833908357332268e-05, "loss": 0.0103, "step": 647240 }, { "epoch": 1.68, "learning_rate": 4.8335195356951214e-05, "loss": 0.0092, "step": 647250 }, { "epoch": 1.68, "learning_rate": 4.8331307140579756e-05, "loss": 0.0065, "step": 647260 }, { "epoch": 1.68, "learning_rate": 4.832741892420829e-05, "loss": 0.0091, "step": 647270 }, { "epoch": 1.68, "learning_rate": 4.8323530707836826e-05, "loss": 0.0082, "step": 647280 }, { "epoch": 1.68, "learning_rate": 4.831964249146536e-05, "loss": 0.0076, "step": 647290 }, { "epoch": 1.68, "learning_rate": 4.8315754275093896e-05, "loss": 0.0073, "step": 647300 }, { "epoch": 1.68, "learning_rate": 4.831186605872243e-05, "loss": 0.0102, "step": 647310 }, { "epoch": 1.68, "learning_rate": 4.8307977842350965e-05, "loss": 0.0077, "step": 647320 }, { "epoch": 1.68, "learning_rate": 4.83040896259795e-05, "loss": 0.0096, "step": 647330 }, { "epoch": 1.68, "learning_rate": 4.830020140960804e-05, "loss": 0.006, "step": 647340 }, { "epoch": 1.68, "learning_rate": 4.8296313193236577e-05, "loss": 0.0075, "step": 647350 }, { "epoch": 1.68, "learning_rate": 4.829242497686511e-05, "loss": 0.0086, "step": 647360 }, { "epoch": 1.68, "learning_rate": 4.8288536760493646e-05, "loss": 0.0098, "step": 647370 }, { "epoch": 1.68, "learning_rate": 4.828464854412218e-05, "loss": 0.0067, "step": 647380 }, { "epoch": 1.68, "learning_rate": 4.8280760327750716e-05, "loss": 0.0094, "step": 647390 }, { "epoch": 1.68, "learning_rate": 4.827687211137925e-05, "loss": 0.0084, "step": 647400 }, { "epoch": 1.68, "learning_rate": 4.8272983895007786e-05, "loss": 0.0081, "step": 647410 }, { "epoch": 1.68, "learning_rate": 4.826909567863633e-05, "loss": 0.009, "step": 647420 }, { "epoch": 1.68, "learning_rate": 4.826520746226486e-05, "loss": 0.0072, "step": 647430 }, { "epoch": 1.68, "learning_rate": 4.826131924589339e-05, "loss": 0.0096, "step": 647440 }, { "epoch": 1.68, "learning_rate": 4.8257431029521925e-05, "loss": 0.0067, "step": 647450 }, { "epoch": 1.68, "learning_rate": 4.825354281315046e-05, "loss": 0.0104, "step": 647460 }, { "epoch": 1.68, "learning_rate": 4.8249654596778995e-05, "loss": 0.0077, "step": 647470 }, { "epoch": 1.68, "learning_rate": 4.824576638040753e-05, "loss": 0.0092, "step": 647480 }, { "epoch": 1.68, "learning_rate": 4.8241878164036065e-05, "loss": 0.0062, "step": 647490 }, { "epoch": 1.68, "learning_rate": 4.82379899476646e-05, "loss": 0.0106, "step": 647500 }, { "epoch": 1.68, "learning_rate": 4.8234101731293134e-05, "loss": 0.0102, "step": 647510 }, { "epoch": 1.68, "learning_rate": 4.8230213514921676e-05, "loss": 0.0083, "step": 647520 }, { "epoch": 1.68, "learning_rate": 4.822632529855021e-05, "loss": 0.0086, "step": 647530 }, { "epoch": 1.68, "learning_rate": 4.8222437082178746e-05, "loss": 0.008, "step": 647540 }, { "epoch": 1.68, "learning_rate": 4.821854886580728e-05, "loss": 0.0074, "step": 647550 }, { "epoch": 1.68, "learning_rate": 4.8214660649435815e-05, "loss": 0.0086, "step": 647560 }, { "epoch": 1.68, "learning_rate": 4.821077243306435e-05, "loss": 0.0058, "step": 647570 }, { "epoch": 1.68, "learning_rate": 4.8206884216692885e-05, "loss": 0.0073, "step": 647580 }, { "epoch": 1.68, "learning_rate": 4.820299600032142e-05, "loss": 0.007, "step": 647590 }, { "epoch": 1.68, "learning_rate": 4.819910778394996e-05, "loss": 0.0065, "step": 647600 }, { "epoch": 1.68, "learning_rate": 4.8195219567578497e-05, "loss": 0.0098, "step": 647610 }, { "epoch": 1.68, "learning_rate": 4.819133135120703e-05, "loss": 0.0091, "step": 647620 }, { "epoch": 1.68, "learning_rate": 4.8187443134835566e-05, "loss": 0.0065, "step": 647630 }, { "epoch": 1.68, "learning_rate": 4.81835549184641e-05, "loss": 0.008, "step": 647640 }, { "epoch": 1.68, "learning_rate": 4.8179666702092636e-05, "loss": 0.01, "step": 647650 }, { "epoch": 1.68, "learning_rate": 4.817577848572117e-05, "loss": 0.0079, "step": 647660 }, { "epoch": 1.68, "learning_rate": 4.8171890269349706e-05, "loss": 0.008, "step": 647670 }, { "epoch": 1.68, "learning_rate": 4.816800205297825e-05, "loss": 0.0092, "step": 647680 }, { "epoch": 1.68, "learning_rate": 4.816411383660677e-05, "loss": 0.0066, "step": 647690 }, { "epoch": 1.68, "learning_rate": 4.816022562023531e-05, "loss": 0.0083, "step": 647700 }, { "epoch": 1.68, "learning_rate": 4.8156337403863845e-05, "loss": 0.0077, "step": 647710 }, { "epoch": 1.68, "learning_rate": 4.815244918749238e-05, "loss": 0.0073, "step": 647720 }, { "epoch": 1.68, "learning_rate": 4.8148560971120915e-05, "loss": 0.0123, "step": 647730 }, { "epoch": 1.68, "learning_rate": 4.814467275474945e-05, "loss": 0.0081, "step": 647740 }, { "epoch": 1.68, "learning_rate": 4.8140784538377985e-05, "loss": 0.0084, "step": 647750 }, { "epoch": 1.68, "learning_rate": 4.813689632200652e-05, "loss": 0.0065, "step": 647760 }, { "epoch": 1.68, "learning_rate": 4.8133008105635054e-05, "loss": 0.0111, "step": 647770 }, { "epoch": 1.68, "learning_rate": 4.8129119889263596e-05, "loss": 0.0078, "step": 647780 }, { "epoch": 1.68, "learning_rate": 4.812523167289213e-05, "loss": 0.0067, "step": 647790 }, { "epoch": 1.68, "learning_rate": 4.8121343456520666e-05, "loss": 0.0077, "step": 647800 }, { "epoch": 1.68, "learning_rate": 4.81174552401492e-05, "loss": 0.0071, "step": 647810 }, { "epoch": 1.68, "learning_rate": 4.8113567023777735e-05, "loss": 0.008, "step": 647820 }, { "epoch": 1.68, "learning_rate": 4.810967880740627e-05, "loss": 0.0071, "step": 647830 }, { "epoch": 1.68, "learning_rate": 4.8105790591034805e-05, "loss": 0.0053, "step": 647840 }, { "epoch": 1.68, "learning_rate": 4.810190237466334e-05, "loss": 0.0072, "step": 647850 }, { "epoch": 1.68, "learning_rate": 4.8098014158291875e-05, "loss": 0.0102, "step": 647860 }, { "epoch": 1.68, "learning_rate": 4.8094125941920416e-05, "loss": 0.0065, "step": 647870 }, { "epoch": 1.68, "learning_rate": 4.809023772554895e-05, "loss": 0.0132, "step": 647880 }, { "epoch": 1.68, "learning_rate": 4.8086349509177486e-05, "loss": 0.0079, "step": 647890 }, { "epoch": 1.68, "learning_rate": 4.808246129280602e-05, "loss": 0.0074, "step": 647900 }, { "epoch": 1.68, "learning_rate": 4.8078573076434556e-05, "loss": 0.0086, "step": 647910 }, { "epoch": 1.68, "learning_rate": 4.807468486006309e-05, "loss": 0.0088, "step": 647920 }, { "epoch": 1.68, "learning_rate": 4.8070796643691626e-05, "loss": 0.0074, "step": 647930 }, { "epoch": 1.68, "learning_rate": 4.8066908427320154e-05, "loss": 0.0075, "step": 647940 }, { "epoch": 1.68, "learning_rate": 4.806302021094869e-05, "loss": 0.0086, "step": 647950 }, { "epoch": 1.68, "learning_rate": 4.8059131994577223e-05, "loss": 0.0109, "step": 647960 }, { "epoch": 1.68, "learning_rate": 4.8055243778205765e-05, "loss": 0.0097, "step": 647970 }, { "epoch": 1.68, "learning_rate": 4.80513555618343e-05, "loss": 0.0074, "step": 647980 }, { "epoch": 1.68, "learning_rate": 4.8047467345462835e-05, "loss": 0.0073, "step": 647990 }, { "epoch": 1.68, "learning_rate": 4.804357912909137e-05, "loss": 0.0071, "step": 648000 }, { "epoch": 1.68, "eval_cer": 0.8816802921322209, "eval_loss": 0.005112422164529562, "eval_runtime": 107.9114, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.633, "step": 648000 }, { "epoch": 1.68, "learning_rate": 4.8039690912719905e-05, "loss": 0.0072, "step": 648010 }, { "epoch": 1.68, "learning_rate": 4.803580269634844e-05, "loss": 0.0086, "step": 648020 }, { "epoch": 1.68, "learning_rate": 4.8031914479976974e-05, "loss": 0.01, "step": 648030 }, { "epoch": 1.68, "learning_rate": 4.802802626360551e-05, "loss": 0.0065, "step": 648040 }, { "epoch": 1.68, "learning_rate": 4.802413804723405e-05, "loss": 0.0096, "step": 648050 }, { "epoch": 1.68, "learning_rate": 4.8020249830862586e-05, "loss": 0.0089, "step": 648060 }, { "epoch": 1.68, "learning_rate": 4.801636161449112e-05, "loss": 0.0082, "step": 648070 }, { "epoch": 1.68, "learning_rate": 4.8012473398119655e-05, "loss": 0.0069, "step": 648080 }, { "epoch": 1.68, "learning_rate": 4.800858518174819e-05, "loss": 0.0098, "step": 648090 }, { "epoch": 1.68, "learning_rate": 4.8004696965376725e-05, "loss": 0.015, "step": 648100 }, { "epoch": 1.68, "learning_rate": 4.800080874900526e-05, "loss": 0.0063, "step": 648110 }, { "epoch": 1.68, "learning_rate": 4.7996920532633795e-05, "loss": 0.0086, "step": 648120 }, { "epoch": 1.68, "learning_rate": 4.7993032316262336e-05, "loss": 0.0083, "step": 648130 }, { "epoch": 1.68, "learning_rate": 4.798914409989087e-05, "loss": 0.0081, "step": 648140 }, { "epoch": 1.68, "learning_rate": 4.7985255883519406e-05, "loss": 0.0072, "step": 648150 }, { "epoch": 1.68, "learning_rate": 4.798136766714794e-05, "loss": 0.0069, "step": 648160 }, { "epoch": 1.68, "learning_rate": 4.7977479450776476e-05, "loss": 0.0074, "step": 648170 }, { "epoch": 1.68, "learning_rate": 4.7973591234405004e-05, "loss": 0.0064, "step": 648180 }, { "epoch": 1.68, "learning_rate": 4.796970301803354e-05, "loss": 0.0075, "step": 648190 }, { "epoch": 1.68, "learning_rate": 4.7965814801662074e-05, "loss": 0.0087, "step": 648200 }, { "epoch": 1.68, "learning_rate": 4.796192658529061e-05, "loss": 0.0072, "step": 648210 }, { "epoch": 1.68, "learning_rate": 4.7958038368919143e-05, "loss": 0.0076, "step": 648220 }, { "epoch": 1.68, "learning_rate": 4.7954150152547685e-05, "loss": 0.0081, "step": 648230 }, { "epoch": 1.68, "learning_rate": 4.795026193617622e-05, "loss": 0.0081, "step": 648240 }, { "epoch": 1.68, "learning_rate": 4.7946373719804755e-05, "loss": 0.0087, "step": 648250 }, { "epoch": 1.68, "learning_rate": 4.794248550343329e-05, "loss": 0.0072, "step": 648260 }, { "epoch": 1.68, "learning_rate": 4.7938597287061825e-05, "loss": 0.0098, "step": 648270 }, { "epoch": 1.68, "learning_rate": 4.793470907069036e-05, "loss": 0.0089, "step": 648280 }, { "epoch": 1.68, "learning_rate": 4.7930820854318894e-05, "loss": 0.0092, "step": 648290 }, { "epoch": 1.68, "learning_rate": 4.792693263794743e-05, "loss": 0.0091, "step": 648300 }, { "epoch": 1.68, "learning_rate": 4.792304442157597e-05, "loss": 0.0078, "step": 648310 }, { "epoch": 1.68, "learning_rate": 4.7919156205204506e-05, "loss": 0.0083, "step": 648320 }, { "epoch": 1.68, "learning_rate": 4.791526798883304e-05, "loss": 0.0079, "step": 648330 }, { "epoch": 1.68, "learning_rate": 4.7911379772461575e-05, "loss": 0.0105, "step": 648340 }, { "epoch": 1.68, "learning_rate": 4.790749155609011e-05, "loss": 0.0091, "step": 648350 }, { "epoch": 1.68, "learning_rate": 4.7903603339718645e-05, "loss": 0.0098, "step": 648360 }, { "epoch": 1.68, "learning_rate": 4.789971512334718e-05, "loss": 0.0079, "step": 648370 }, { "epoch": 1.68, "learning_rate": 4.7895826906975715e-05, "loss": 0.0081, "step": 648380 }, { "epoch": 1.68, "learning_rate": 4.7891938690604256e-05, "loss": 0.0078, "step": 648390 }, { "epoch": 1.68, "learning_rate": 4.788805047423279e-05, "loss": 0.0062, "step": 648400 }, { "epoch": 1.68, "learning_rate": 4.7884162257861326e-05, "loss": 0.0052, "step": 648410 }, { "epoch": 1.68, "learning_rate": 4.788027404148986e-05, "loss": 0.0061, "step": 648420 }, { "epoch": 1.68, "learning_rate": 4.787638582511839e-05, "loss": 0.0087, "step": 648430 }, { "epoch": 1.68, "learning_rate": 4.7872497608746924e-05, "loss": 0.0091, "step": 648440 }, { "epoch": 1.68, "learning_rate": 4.786860939237546e-05, "loss": 0.0087, "step": 648450 }, { "epoch": 1.68, "learning_rate": 4.7864721176003994e-05, "loss": 0.0077, "step": 648460 }, { "epoch": 1.68, "learning_rate": 4.786083295963253e-05, "loss": 0.0104, "step": 648470 }, { "epoch": 1.68, "learning_rate": 4.785694474326106e-05, "loss": 0.006, "step": 648480 }, { "epoch": 1.68, "learning_rate": 4.7853056526889605e-05, "loss": 0.0055, "step": 648490 }, { "epoch": 1.68, "learning_rate": 4.784916831051814e-05, "loss": 0.0076, "step": 648500 }, { "epoch": 1.68, "learning_rate": 4.7845280094146675e-05, "loss": 0.0082, "step": 648510 }, { "epoch": 1.68, "learning_rate": 4.784139187777521e-05, "loss": 0.01, "step": 648520 }, { "epoch": 1.68, "learning_rate": 4.7837503661403744e-05, "loss": 0.006, "step": 648530 }, { "epoch": 1.68, "learning_rate": 4.783361544503228e-05, "loss": 0.0073, "step": 648540 }, { "epoch": 1.68, "learning_rate": 4.7829727228660814e-05, "loss": 0.0088, "step": 648550 }, { "epoch": 1.68, "learning_rate": 4.782583901228935e-05, "loss": 0.0069, "step": 648560 }, { "epoch": 1.68, "learning_rate": 4.782195079591789e-05, "loss": 0.0095, "step": 648570 }, { "epoch": 1.68, "learning_rate": 4.7818062579546426e-05, "loss": 0.0089, "step": 648580 }, { "epoch": 1.68, "learning_rate": 4.781417436317496e-05, "loss": 0.0072, "step": 648590 }, { "epoch": 1.68, "learning_rate": 4.7810286146803495e-05, "loss": 0.0092, "step": 648600 }, { "epoch": 1.68, "learning_rate": 4.780639793043203e-05, "loss": 0.006, "step": 648610 }, { "epoch": 1.68, "learning_rate": 4.7802509714060565e-05, "loss": 0.0084, "step": 648620 }, { "epoch": 1.68, "learning_rate": 4.77986214976891e-05, "loss": 0.0087, "step": 648630 }, { "epoch": 1.68, "learning_rate": 4.7794733281317635e-05, "loss": 0.008, "step": 648640 }, { "epoch": 1.68, "learning_rate": 4.7790845064946176e-05, "loss": 0.0091, "step": 648650 }, { "epoch": 1.68, "learning_rate": 4.778695684857471e-05, "loss": 0.0063, "step": 648660 }, { "epoch": 1.68, "learning_rate": 4.7783068632203246e-05, "loss": 0.0082, "step": 648670 }, { "epoch": 1.68, "learning_rate": 4.7779180415831774e-05, "loss": 0.009, "step": 648680 }, { "epoch": 1.68, "learning_rate": 4.777529219946031e-05, "loss": 0.0078, "step": 648690 }, { "epoch": 1.68, "learning_rate": 4.7771403983088844e-05, "loss": 0.0113, "step": 648700 }, { "epoch": 1.68, "learning_rate": 4.776751576671738e-05, "loss": 0.0104, "step": 648710 }, { "epoch": 1.68, "learning_rate": 4.7763627550345914e-05, "loss": 0.0085, "step": 648720 }, { "epoch": 1.68, "learning_rate": 4.775973933397445e-05, "loss": 0.0077, "step": 648730 }, { "epoch": 1.68, "learning_rate": 4.775585111760298e-05, "loss": 0.0074, "step": 648740 }, { "epoch": 1.68, "learning_rate": 4.7751962901231525e-05, "loss": 0.007, "step": 648750 }, { "epoch": 1.68, "learning_rate": 4.774807468486006e-05, "loss": 0.0108, "step": 648760 }, { "epoch": 1.68, "learning_rate": 4.7744186468488595e-05, "loss": 0.0083, "step": 648770 }, { "epoch": 1.68, "learning_rate": 4.774029825211713e-05, "loss": 0.0077, "step": 648780 }, { "epoch": 1.68, "learning_rate": 4.7736410035745664e-05, "loss": 0.0085, "step": 648790 }, { "epoch": 1.68, "learning_rate": 4.77325218193742e-05, "loss": 0.0076, "step": 648800 }, { "epoch": 1.68, "learning_rate": 4.7728633603002734e-05, "loss": 0.0089, "step": 648810 }, { "epoch": 1.68, "learning_rate": 4.772474538663127e-05, "loss": 0.007, "step": 648820 }, { "epoch": 1.68, "learning_rate": 4.772085717025981e-05, "loss": 0.008, "step": 648830 }, { "epoch": 1.68, "learning_rate": 4.7716968953888345e-05, "loss": 0.0081, "step": 648840 }, { "epoch": 1.68, "learning_rate": 4.771308073751688e-05, "loss": 0.0065, "step": 648850 }, { "epoch": 1.68, "learning_rate": 4.7709192521145415e-05, "loss": 0.0101, "step": 648860 }, { "epoch": 1.68, "learning_rate": 4.770530430477395e-05, "loss": 0.0068, "step": 648870 }, { "epoch": 1.68, "learning_rate": 4.7701416088402485e-05, "loss": 0.008, "step": 648880 }, { "epoch": 1.68, "learning_rate": 4.769752787203102e-05, "loss": 0.0102, "step": 648890 }, { "epoch": 1.68, "learning_rate": 4.7693639655659555e-05, "loss": 0.0078, "step": 648900 }, { "epoch": 1.68, "learning_rate": 4.7689751439288096e-05, "loss": 0.0075, "step": 648910 }, { "epoch": 1.68, "learning_rate": 4.768586322291663e-05, "loss": 0.0105, "step": 648920 }, { "epoch": 1.68, "learning_rate": 4.768197500654516e-05, "loss": 0.0078, "step": 648930 }, { "epoch": 1.68, "learning_rate": 4.7678086790173694e-05, "loss": 0.0103, "step": 648940 }, { "epoch": 1.68, "learning_rate": 4.767419857380223e-05, "loss": 0.006, "step": 648950 }, { "epoch": 1.68, "learning_rate": 4.7670310357430764e-05, "loss": 0.0122, "step": 648960 }, { "epoch": 1.68, "learning_rate": 4.76664221410593e-05, "loss": 0.0097, "step": 648970 }, { "epoch": 1.68, "learning_rate": 4.7662533924687834e-05, "loss": 0.0078, "step": 648980 }, { "epoch": 1.68, "learning_rate": 4.765864570831637e-05, "loss": 0.0069, "step": 648990 }, { "epoch": 1.68, "learning_rate": 4.76547574919449e-05, "loss": 0.0087, "step": 649000 }, { "epoch": 1.68, "eval_cer": 0.8816606972151424, "eval_loss": 0.005129742436110973, "eval_runtime": 108.1719, "eval_samples_per_second": 18.489, "eval_steps_per_second": 4.622, "step": 649000 }, { "epoch": 1.68, "learning_rate": 4.7650869275573445e-05, "loss": 0.0078, "step": 649010 }, { "epoch": 1.68, "learning_rate": 4.764698105920198e-05, "loss": 0.0075, "step": 649020 }, { "epoch": 1.68, "learning_rate": 4.7643092842830515e-05, "loss": 0.011, "step": 649030 }, { "epoch": 1.68, "learning_rate": 4.763920462645905e-05, "loss": 0.0101, "step": 649040 }, { "epoch": 1.68, "learning_rate": 4.7635316410087584e-05, "loss": 0.0108, "step": 649050 }, { "epoch": 1.68, "learning_rate": 4.763142819371612e-05, "loss": 0.0073, "step": 649060 }, { "epoch": 1.68, "learning_rate": 4.7627539977344654e-05, "loss": 0.0096, "step": 649070 }, { "epoch": 1.68, "learning_rate": 4.762365176097319e-05, "loss": 0.0075, "step": 649080 }, { "epoch": 1.68, "learning_rate": 4.761976354460173e-05, "loss": 0.0068, "step": 649090 }, { "epoch": 1.68, "learning_rate": 4.7615875328230265e-05, "loss": 0.0105, "step": 649100 }, { "epoch": 1.68, "learning_rate": 4.76119871118588e-05, "loss": 0.0086, "step": 649110 }, { "epoch": 1.68, "learning_rate": 4.7608098895487335e-05, "loss": 0.0071, "step": 649120 }, { "epoch": 1.68, "learning_rate": 4.760421067911587e-05, "loss": 0.0119, "step": 649130 }, { "epoch": 1.68, "learning_rate": 4.7600322462744405e-05, "loss": 0.01, "step": 649140 }, { "epoch": 1.68, "learning_rate": 4.759643424637294e-05, "loss": 0.0113, "step": 649150 }, { "epoch": 1.68, "learning_rate": 4.7592546030001475e-05, "loss": 0.0089, "step": 649160 }, { "epoch": 1.68, "learning_rate": 4.758865781363001e-05, "loss": 0.0074, "step": 649170 }, { "epoch": 1.68, "learning_rate": 4.758476959725854e-05, "loss": 0.0062, "step": 649180 }, { "epoch": 1.68, "learning_rate": 4.758088138088708e-05, "loss": 0.0085, "step": 649190 }, { "epoch": 1.68, "learning_rate": 4.7576993164515614e-05, "loss": 0.0088, "step": 649200 }, { "epoch": 1.68, "learning_rate": 4.757310494814415e-05, "loss": 0.0096, "step": 649210 }, { "epoch": 1.68, "learning_rate": 4.7569216731772684e-05, "loss": 0.0075, "step": 649220 }, { "epoch": 1.68, "learning_rate": 4.756532851540122e-05, "loss": 0.0093, "step": 649230 }, { "epoch": 1.68, "learning_rate": 4.7561440299029754e-05, "loss": 0.0046, "step": 649240 }, { "epoch": 1.68, "learning_rate": 4.755755208265829e-05, "loss": 0.0091, "step": 649250 }, { "epoch": 1.68, "learning_rate": 4.755366386628682e-05, "loss": 0.0071, "step": 649260 }, { "epoch": 1.68, "learning_rate": 4.7549775649915365e-05, "loss": 0.007, "step": 649270 }, { "epoch": 1.68, "learning_rate": 4.75458874335439e-05, "loss": 0.0075, "step": 649280 }, { "epoch": 1.68, "learning_rate": 4.7541999217172435e-05, "loss": 0.0093, "step": 649290 }, { "epoch": 1.68, "learning_rate": 4.753811100080097e-05, "loss": 0.0118, "step": 649300 }, { "epoch": 1.68, "learning_rate": 4.7534222784429504e-05, "loss": 0.0089, "step": 649310 }, { "epoch": 1.68, "learning_rate": 4.753033456805804e-05, "loss": 0.0098, "step": 649320 }, { "epoch": 1.68, "learning_rate": 4.7526446351686574e-05, "loss": 0.0091, "step": 649330 }, { "epoch": 1.68, "learning_rate": 4.752255813531511e-05, "loss": 0.0076, "step": 649340 }, { "epoch": 1.68, "learning_rate": 4.7518669918943644e-05, "loss": 0.0047, "step": 649350 }, { "epoch": 1.68, "learning_rate": 4.7514781702572185e-05, "loss": 0.0074, "step": 649360 }, { "epoch": 1.68, "learning_rate": 4.751089348620072e-05, "loss": 0.009, "step": 649370 }, { "epoch": 1.68, "learning_rate": 4.7507005269829255e-05, "loss": 0.0057, "step": 649380 }, { "epoch": 1.68, "learning_rate": 4.750311705345779e-05, "loss": 0.0095, "step": 649390 }, { "epoch": 1.68, "learning_rate": 4.7499228837086325e-05, "loss": 0.009, "step": 649400 }, { "epoch": 1.68, "learning_rate": 4.749534062071486e-05, "loss": 0.01, "step": 649410 }, { "epoch": 1.68, "learning_rate": 4.749145240434339e-05, "loss": 0.0081, "step": 649420 }, { "epoch": 1.68, "learning_rate": 4.748756418797192e-05, "loss": 0.0065, "step": 649430 }, { "epoch": 1.68, "learning_rate": 4.748367597160046e-05, "loss": 0.0085, "step": 649440 }, { "epoch": 1.68, "learning_rate": 4.747978775522899e-05, "loss": 0.0091, "step": 649450 }, { "epoch": 1.68, "learning_rate": 4.7475899538857534e-05, "loss": 0.0082, "step": 649460 }, { "epoch": 1.68, "learning_rate": 4.747201132248607e-05, "loss": 0.0059, "step": 649470 }, { "epoch": 1.68, "learning_rate": 4.7468123106114604e-05, "loss": 0.007, "step": 649480 }, { "epoch": 1.68, "learning_rate": 4.746423488974314e-05, "loss": 0.0083, "step": 649490 }, { "epoch": 1.68, "learning_rate": 4.7460346673371673e-05, "loss": 0.0099, "step": 649500 }, { "epoch": 1.68, "learning_rate": 4.745645845700021e-05, "loss": 0.0088, "step": 649510 }, { "epoch": 1.68, "learning_rate": 4.745257024062874e-05, "loss": 0.0068, "step": 649520 }, { "epoch": 1.68, "learning_rate": 4.744868202425728e-05, "loss": 0.0074, "step": 649530 }, { "epoch": 1.68, "learning_rate": 4.744479380788582e-05, "loss": 0.0073, "step": 649540 }, { "epoch": 1.68, "learning_rate": 4.7440905591514355e-05, "loss": 0.0068, "step": 649550 }, { "epoch": 1.68, "learning_rate": 4.743701737514289e-05, "loss": 0.0061, "step": 649560 }, { "epoch": 1.68, "learning_rate": 4.7433129158771424e-05, "loss": 0.0092, "step": 649570 }, { "epoch": 1.68, "learning_rate": 4.742924094239996e-05, "loss": 0.0095, "step": 649580 }, { "epoch": 1.68, "learning_rate": 4.7425352726028494e-05, "loss": 0.0086, "step": 649590 }, { "epoch": 1.68, "learning_rate": 4.742146450965703e-05, "loss": 0.007, "step": 649600 }, { "epoch": 1.68, "learning_rate": 4.7417576293285564e-05, "loss": 0.0077, "step": 649610 }, { "epoch": 1.68, "learning_rate": 4.7413688076914105e-05, "loss": 0.0069, "step": 649620 }, { "epoch": 1.68, "learning_rate": 4.740979986054264e-05, "loss": 0.009, "step": 649630 }, { "epoch": 1.68, "learning_rate": 4.7405911644171175e-05, "loss": 0.0098, "step": 649640 }, { "epoch": 1.68, "learning_rate": 4.740202342779971e-05, "loss": 0.0068, "step": 649650 }, { "epoch": 1.68, "learning_rate": 4.7398135211428245e-05, "loss": 0.0086, "step": 649660 }, { "epoch": 1.68, "learning_rate": 4.739424699505677e-05, "loss": 0.0092, "step": 649670 }, { "epoch": 1.68, "learning_rate": 4.739035877868531e-05, "loss": 0.0065, "step": 649680 }, { "epoch": 1.68, "learning_rate": 4.738647056231384e-05, "loss": 0.0088, "step": 649690 }, { "epoch": 1.68, "learning_rate": 4.738258234594238e-05, "loss": 0.0077, "step": 649700 }, { "epoch": 1.68, "learning_rate": 4.737869412957091e-05, "loss": 0.0094, "step": 649710 }, { "epoch": 1.68, "learning_rate": 4.7374805913199454e-05, "loss": 0.0065, "step": 649720 }, { "epoch": 1.68, "learning_rate": 4.737091769682799e-05, "loss": 0.0069, "step": 649730 }, { "epoch": 1.68, "learning_rate": 4.7367029480456524e-05, "loss": 0.0087, "step": 649740 }, { "epoch": 1.68, "learning_rate": 4.736314126408506e-05, "loss": 0.0068, "step": 649750 }, { "epoch": 1.68, "learning_rate": 4.7359253047713593e-05, "loss": 0.0105, "step": 649760 }, { "epoch": 1.68, "learning_rate": 4.735536483134213e-05, "loss": 0.0073, "step": 649770 }, { "epoch": 1.68, "learning_rate": 4.735147661497066e-05, "loss": 0.0084, "step": 649780 }, { "epoch": 1.68, "learning_rate": 4.73475883985992e-05, "loss": 0.0108, "step": 649790 }, { "epoch": 1.68, "learning_rate": 4.734370018222774e-05, "loss": 0.0072, "step": 649800 }, { "epoch": 1.68, "learning_rate": 4.7339811965856274e-05, "loss": 0.0082, "step": 649810 }, { "epoch": 1.68, "learning_rate": 4.733592374948481e-05, "loss": 0.0063, "step": 649820 }, { "epoch": 1.68, "learning_rate": 4.7332035533113344e-05, "loss": 0.0086, "step": 649830 }, { "epoch": 1.68, "learning_rate": 4.732814731674188e-05, "loss": 0.0069, "step": 649840 }, { "epoch": 1.68, "learning_rate": 4.7324259100370414e-05, "loss": 0.0059, "step": 649850 }, { "epoch": 1.68, "learning_rate": 4.732037088399895e-05, "loss": 0.0108, "step": 649860 }, { "epoch": 1.68, "learning_rate": 4.7316482667627484e-05, "loss": 0.0069, "step": 649870 }, { "epoch": 1.68, "learning_rate": 4.7312594451256025e-05, "loss": 0.0091, "step": 649880 }, { "epoch": 1.68, "learning_rate": 4.730870623488456e-05, "loss": 0.0103, "step": 649890 }, { "epoch": 1.68, "learning_rate": 4.7304818018513095e-05, "loss": 0.0065, "step": 649900 }, { "epoch": 1.68, "learning_rate": 4.730092980214163e-05, "loss": 0.0075, "step": 649910 }, { "epoch": 1.68, "learning_rate": 4.729704158577016e-05, "loss": 0.0082, "step": 649920 }, { "epoch": 1.68, "learning_rate": 4.729315336939869e-05, "loss": 0.0057, "step": 649930 }, { "epoch": 1.68, "learning_rate": 4.728926515302723e-05, "loss": 0.0083, "step": 649940 }, { "epoch": 1.68, "learning_rate": 4.728537693665576e-05, "loss": 0.007, "step": 649950 }, { "epoch": 1.68, "learning_rate": 4.72814887202843e-05, "loss": 0.011, "step": 649960 }, { "epoch": 1.68, "learning_rate": 4.727760050391283e-05, "loss": 0.0097, "step": 649970 }, { "epoch": 1.68, "learning_rate": 4.7273712287541374e-05, "loss": 0.0079, "step": 649980 }, { "epoch": 1.68, "learning_rate": 4.726982407116991e-05, "loss": 0.0071, "step": 649990 }, { "epoch": 1.68, "learning_rate": 4.7265935854798444e-05, "loss": 0.0083, "step": 650000 }, { "epoch": 1.68, "eval_cer": 0.8816774928583525, "eval_loss": 0.005187535658478737, "eval_runtime": 107.9437, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 650000 }, { "epoch": 1.68, "learning_rate": 4.726204763842698e-05, "loss": 0.0114, "step": 650010 }, { "epoch": 1.68, "learning_rate": 4.725815942205551e-05, "loss": 0.0081, "step": 650020 }, { "epoch": 1.68, "learning_rate": 4.725427120568405e-05, "loss": 0.0079, "step": 650030 }, { "epoch": 1.68, "learning_rate": 4.725038298931258e-05, "loss": 0.0084, "step": 650040 }, { "epoch": 1.69, "learning_rate": 4.724649477294112e-05, "loss": 0.0077, "step": 650050 }, { "epoch": 1.69, "learning_rate": 4.724260655656966e-05, "loss": 0.0075, "step": 650060 }, { "epoch": 1.69, "learning_rate": 4.7238718340198194e-05, "loss": 0.0078, "step": 650070 }, { "epoch": 1.69, "learning_rate": 4.723483012382673e-05, "loss": 0.007, "step": 650080 }, { "epoch": 1.69, "learning_rate": 4.7230941907455264e-05, "loss": 0.0063, "step": 650090 }, { "epoch": 1.69, "learning_rate": 4.72270536910838e-05, "loss": 0.0066, "step": 650100 }, { "epoch": 1.69, "learning_rate": 4.7223165474712334e-05, "loss": 0.0096, "step": 650110 }, { "epoch": 1.69, "learning_rate": 4.721927725834087e-05, "loss": 0.0072, "step": 650120 }, { "epoch": 1.69, "learning_rate": 4.7215389041969404e-05, "loss": 0.0092, "step": 650130 }, { "epoch": 1.69, "learning_rate": 4.7211500825597945e-05, "loss": 0.0079, "step": 650140 }, { "epoch": 1.69, "learning_rate": 4.720761260922648e-05, "loss": 0.0083, "step": 650150 }, { "epoch": 1.69, "learning_rate": 4.7203724392855015e-05, "loss": 0.006, "step": 650160 }, { "epoch": 1.69, "learning_rate": 4.719983617648354e-05, "loss": 0.0087, "step": 650170 }, { "epoch": 1.69, "learning_rate": 4.719594796011208e-05, "loss": 0.008, "step": 650180 }, { "epoch": 1.69, "learning_rate": 4.719205974374061e-05, "loss": 0.0084, "step": 650190 }, { "epoch": 1.69, "learning_rate": 4.718817152736915e-05, "loss": 0.007, "step": 650200 }, { "epoch": 1.69, "learning_rate": 4.718428331099768e-05, "loss": 0.008, "step": 650210 }, { "epoch": 1.69, "learning_rate": 4.718039509462622e-05, "loss": 0.0051, "step": 650220 }, { "epoch": 1.69, "learning_rate": 4.717650687825475e-05, "loss": 0.0061, "step": 650230 }, { "epoch": 1.69, "learning_rate": 4.7172618661883294e-05, "loss": 0.0069, "step": 650240 }, { "epoch": 1.69, "learning_rate": 4.716873044551183e-05, "loss": 0.0098, "step": 650250 }, { "epoch": 1.69, "learning_rate": 4.7164842229140364e-05, "loss": 0.0097, "step": 650260 }, { "epoch": 1.69, "learning_rate": 4.71609540127689e-05, "loss": 0.0064, "step": 650270 }, { "epoch": 1.69, "learning_rate": 4.715706579639743e-05, "loss": 0.0068, "step": 650280 }, { "epoch": 1.69, "learning_rate": 4.715317758002597e-05, "loss": 0.0071, "step": 650290 }, { "epoch": 1.69, "learning_rate": 4.71492893636545e-05, "loss": 0.0078, "step": 650300 }, { "epoch": 1.69, "learning_rate": 4.714540114728304e-05, "loss": 0.0069, "step": 650310 }, { "epoch": 1.69, "learning_rate": 4.714151293091158e-05, "loss": 0.0061, "step": 650320 }, { "epoch": 1.69, "learning_rate": 4.7137624714540114e-05, "loss": 0.0087, "step": 650330 }, { "epoch": 1.69, "learning_rate": 4.713373649816865e-05, "loss": 0.0084, "step": 650340 }, { "epoch": 1.69, "learning_rate": 4.7129848281797184e-05, "loss": 0.0097, "step": 650350 }, { "epoch": 1.69, "learning_rate": 4.712596006542572e-05, "loss": 0.0088, "step": 650360 }, { "epoch": 1.69, "learning_rate": 4.7122071849054254e-05, "loss": 0.0075, "step": 650370 }, { "epoch": 1.69, "learning_rate": 4.711818363268279e-05, "loss": 0.0148, "step": 650380 }, { "epoch": 1.69, "learning_rate": 4.7114295416311324e-05, "loss": 0.009, "step": 650390 }, { "epoch": 1.69, "learning_rate": 4.7110407199939865e-05, "loss": 0.007, "step": 650400 }, { "epoch": 1.69, "learning_rate": 4.71065189835684e-05, "loss": 0.0107, "step": 650410 }, { "epoch": 1.69, "learning_rate": 4.710263076719693e-05, "loss": 0.0081, "step": 650420 }, { "epoch": 1.69, "learning_rate": 4.709874255082546e-05, "loss": 0.0098, "step": 650430 }, { "epoch": 1.69, "learning_rate": 4.7094854334454e-05, "loss": 0.0068, "step": 650440 }, { "epoch": 1.69, "learning_rate": 4.709096611808253e-05, "loss": 0.0089, "step": 650450 }, { "epoch": 1.69, "learning_rate": 4.708707790171107e-05, "loss": 0.0069, "step": 650460 }, { "epoch": 1.69, "learning_rate": 4.70831896853396e-05, "loss": 0.0114, "step": 650470 }, { "epoch": 1.69, "learning_rate": 4.707930146896814e-05, "loss": 0.0114, "step": 650480 }, { "epoch": 1.69, "learning_rate": 4.707541325259667e-05, "loss": 0.006, "step": 650490 }, { "epoch": 1.69, "learning_rate": 4.7071525036225214e-05, "loss": 0.0085, "step": 650500 }, { "epoch": 1.69, "learning_rate": 4.706763681985375e-05, "loss": 0.007, "step": 650510 }, { "epoch": 1.69, "learning_rate": 4.7063748603482284e-05, "loss": 0.0071, "step": 650520 }, { "epoch": 1.69, "learning_rate": 4.705986038711082e-05, "loss": 0.0068, "step": 650530 }, { "epoch": 1.69, "learning_rate": 4.705597217073935e-05, "loss": 0.0069, "step": 650540 }, { "epoch": 1.69, "learning_rate": 4.705208395436789e-05, "loss": 0.0092, "step": 650550 }, { "epoch": 1.69, "learning_rate": 4.704819573799642e-05, "loss": 0.0067, "step": 650560 }, { "epoch": 1.69, "learning_rate": 4.704430752162496e-05, "loss": 0.0093, "step": 650570 }, { "epoch": 1.69, "learning_rate": 4.70404193052535e-05, "loss": 0.0075, "step": 650580 }, { "epoch": 1.69, "learning_rate": 4.7036531088882034e-05, "loss": 0.01, "step": 650590 }, { "epoch": 1.69, "learning_rate": 4.703264287251057e-05, "loss": 0.0083, "step": 650600 }, { "epoch": 1.69, "learning_rate": 4.7028754656139104e-05, "loss": 0.0104, "step": 650610 }, { "epoch": 1.69, "learning_rate": 4.702486643976764e-05, "loss": 0.007, "step": 650620 }, { "epoch": 1.69, "learning_rate": 4.7020978223396174e-05, "loss": 0.0077, "step": 650630 }, { "epoch": 1.69, "learning_rate": 4.701709000702471e-05, "loss": 0.0107, "step": 650640 }, { "epoch": 1.69, "learning_rate": 4.7013201790653244e-05, "loss": 0.0072, "step": 650650 }, { "epoch": 1.69, "learning_rate": 4.700931357428177e-05, "loss": 0.0075, "step": 650660 }, { "epoch": 1.69, "learning_rate": 4.7005425357910306e-05, "loss": 0.007, "step": 650670 }, { "epoch": 1.69, "learning_rate": 4.700153714153885e-05, "loss": 0.0068, "step": 650680 }, { "epoch": 1.69, "learning_rate": 4.699764892516738e-05, "loss": 0.0077, "step": 650690 }, { "epoch": 1.69, "learning_rate": 4.699376070879592e-05, "loss": 0.0077, "step": 650700 }, { "epoch": 1.69, "learning_rate": 4.698987249242445e-05, "loss": 0.0056, "step": 650710 }, { "epoch": 1.69, "learning_rate": 4.698598427605299e-05, "loss": 0.0075, "step": 650720 }, { "epoch": 1.69, "learning_rate": 4.698209605968152e-05, "loss": 0.0101, "step": 650730 }, { "epoch": 1.69, "learning_rate": 4.697820784331006e-05, "loss": 0.0078, "step": 650740 }, { "epoch": 1.69, "learning_rate": 4.697431962693859e-05, "loss": 0.0061, "step": 650750 }, { "epoch": 1.69, "learning_rate": 4.697043141056713e-05, "loss": 0.0095, "step": 650760 }, { "epoch": 1.69, "learning_rate": 4.696654319419567e-05, "loss": 0.0092, "step": 650770 }, { "epoch": 1.69, "learning_rate": 4.6962654977824203e-05, "loss": 0.0086, "step": 650780 }, { "epoch": 1.69, "learning_rate": 4.695876676145274e-05, "loss": 0.0071, "step": 650790 }, { "epoch": 1.69, "learning_rate": 4.695487854508127e-05, "loss": 0.0059, "step": 650800 }, { "epoch": 1.69, "learning_rate": 4.695099032870981e-05, "loss": 0.0058, "step": 650810 }, { "epoch": 1.69, "learning_rate": 4.694710211233834e-05, "loss": 0.006, "step": 650820 }, { "epoch": 1.69, "learning_rate": 4.694321389596688e-05, "loss": 0.0072, "step": 650830 }, { "epoch": 1.69, "learning_rate": 4.693932567959541e-05, "loss": 0.0079, "step": 650840 }, { "epoch": 1.69, "learning_rate": 4.6935437463223954e-05, "loss": 0.0063, "step": 650850 }, { "epoch": 1.69, "learning_rate": 4.693154924685249e-05, "loss": 0.0065, "step": 650860 }, { "epoch": 1.69, "learning_rate": 4.6927661030481024e-05, "loss": 0.0097, "step": 650870 }, { "epoch": 1.69, "learning_rate": 4.692377281410956e-05, "loss": 0.0133, "step": 650880 }, { "epoch": 1.69, "learning_rate": 4.6919884597738094e-05, "loss": 0.0077, "step": 650890 }, { "epoch": 1.69, "learning_rate": 4.691599638136663e-05, "loss": 0.0061, "step": 650900 }, { "epoch": 1.69, "learning_rate": 4.691210816499516e-05, "loss": 0.0107, "step": 650910 }, { "epoch": 1.69, "learning_rate": 4.690821994862369e-05, "loss": 0.0074, "step": 650920 }, { "epoch": 1.69, "learning_rate": 4.6904331732252226e-05, "loss": 0.0071, "step": 650930 }, { "epoch": 1.69, "learning_rate": 4.690044351588076e-05, "loss": 0.0094, "step": 650940 }, { "epoch": 1.69, "learning_rate": 4.68965552995093e-05, "loss": 0.0073, "step": 650950 }, { "epoch": 1.69, "learning_rate": 4.689266708313784e-05, "loss": 0.0078, "step": 650960 }, { "epoch": 1.69, "learning_rate": 4.688877886676637e-05, "loss": 0.0072, "step": 650970 }, { "epoch": 1.69, "learning_rate": 4.688489065039491e-05, "loss": 0.0104, "step": 650980 }, { "epoch": 1.69, "learning_rate": 4.688100243402344e-05, "loss": 0.0054, "step": 650990 }, { "epoch": 1.69, "learning_rate": 4.687711421765198e-05, "loss": 0.0129, "step": 651000 }, { "epoch": 1.69, "eval_cer": 0.8816648961259449, "eval_loss": 0.005368160083889961, "eval_runtime": 107.9578, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.631, "step": 651000 }, { "epoch": 1.69, "learning_rate": 4.687322600128051e-05, "loss": 0.0092, "step": 651010 }, { "epoch": 1.69, "learning_rate": 4.686933778490905e-05, "loss": 0.0078, "step": 651020 }, { "epoch": 1.69, "learning_rate": 4.686544956853759e-05, "loss": 0.0087, "step": 651030 }, { "epoch": 1.69, "learning_rate": 4.6861561352166123e-05, "loss": 0.0068, "step": 651040 }, { "epoch": 1.69, "learning_rate": 4.685767313579466e-05, "loss": 0.01, "step": 651050 }, { "epoch": 1.69, "learning_rate": 4.685378491942319e-05, "loss": 0.0064, "step": 651060 }, { "epoch": 1.69, "learning_rate": 4.684989670305173e-05, "loss": 0.0075, "step": 651070 }, { "epoch": 1.69, "learning_rate": 4.684600848668026e-05, "loss": 0.0065, "step": 651080 }, { "epoch": 1.69, "learning_rate": 4.68421202703088e-05, "loss": 0.0101, "step": 651090 }, { "epoch": 1.69, "learning_rate": 4.683823205393733e-05, "loss": 0.0084, "step": 651100 }, { "epoch": 1.69, "learning_rate": 4.6834343837565874e-05, "loss": 0.009, "step": 651110 }, { "epoch": 1.69, "learning_rate": 4.683045562119441e-05, "loss": 0.0075, "step": 651120 }, { "epoch": 1.69, "learning_rate": 4.6826567404822944e-05, "loss": 0.0075, "step": 651130 }, { "epoch": 1.69, "learning_rate": 4.682267918845148e-05, "loss": 0.0069, "step": 651140 }, { "epoch": 1.69, "learning_rate": 4.6818790972080014e-05, "loss": 0.0074, "step": 651150 }, { "epoch": 1.69, "learning_rate": 4.681490275570854e-05, "loss": 0.0084, "step": 651160 }, { "epoch": 1.69, "learning_rate": 4.681101453933708e-05, "loss": 0.0063, "step": 651170 }, { "epoch": 1.69, "learning_rate": 4.680712632296561e-05, "loss": 0.0085, "step": 651180 }, { "epoch": 1.69, "learning_rate": 4.6803238106594146e-05, "loss": 0.0082, "step": 651190 }, { "epoch": 1.69, "learning_rate": 4.679934989022268e-05, "loss": 0.0093, "step": 651200 }, { "epoch": 1.69, "learning_rate": 4.679546167385122e-05, "loss": 0.0075, "step": 651210 }, { "epoch": 1.69, "learning_rate": 4.679157345747976e-05, "loss": 0.0092, "step": 651220 }, { "epoch": 1.69, "learning_rate": 4.678768524110829e-05, "loss": 0.0096, "step": 651230 }, { "epoch": 1.69, "learning_rate": 4.678379702473683e-05, "loss": 0.0074, "step": 651240 }, { "epoch": 1.69, "learning_rate": 4.677990880836536e-05, "loss": 0.0065, "step": 651250 }, { "epoch": 1.69, "learning_rate": 4.67760205919939e-05, "loss": 0.0066, "step": 651260 }, { "epoch": 1.69, "learning_rate": 4.677213237562243e-05, "loss": 0.0131, "step": 651270 }, { "epoch": 1.69, "learning_rate": 4.676824415925097e-05, "loss": 0.0083, "step": 651280 }, { "epoch": 1.69, "learning_rate": 4.676435594287951e-05, "loss": 0.0095, "step": 651290 }, { "epoch": 1.69, "learning_rate": 4.6760467726508043e-05, "loss": 0.0104, "step": 651300 }, { "epoch": 1.69, "learning_rate": 4.675657951013658e-05, "loss": 0.0086, "step": 651310 }, { "epoch": 1.69, "learning_rate": 4.675269129376511e-05, "loss": 0.0067, "step": 651320 }, { "epoch": 1.69, "learning_rate": 4.674880307739365e-05, "loss": 0.0071, "step": 651330 }, { "epoch": 1.69, "learning_rate": 4.674491486102218e-05, "loss": 0.0087, "step": 651340 }, { "epoch": 1.69, "learning_rate": 4.674102664465072e-05, "loss": 0.0088, "step": 651350 }, { "epoch": 1.69, "learning_rate": 4.673713842827925e-05, "loss": 0.0083, "step": 651360 }, { "epoch": 1.69, "learning_rate": 4.6733250211907794e-05, "loss": 0.0078, "step": 651370 }, { "epoch": 1.69, "learning_rate": 4.672936199553633e-05, "loss": 0.0057, "step": 651380 }, { "epoch": 1.69, "learning_rate": 4.6725473779164864e-05, "loss": 0.0085, "step": 651390 }, { "epoch": 1.69, "learning_rate": 4.67215855627934e-05, "loss": 0.0116, "step": 651400 }, { "epoch": 1.69, "learning_rate": 4.671769734642193e-05, "loss": 0.0077, "step": 651410 }, { "epoch": 1.69, "learning_rate": 4.671380913005046e-05, "loss": 0.0081, "step": 651420 }, { "epoch": 1.69, "learning_rate": 4.6709920913678997e-05, "loss": 0.0068, "step": 651430 }, { "epoch": 1.69, "learning_rate": 4.670603269730753e-05, "loss": 0.0095, "step": 651440 }, { "epoch": 1.69, "learning_rate": 4.6702144480936066e-05, "loss": 0.006, "step": 651450 }, { "epoch": 1.69, "learning_rate": 4.66982562645646e-05, "loss": 0.0084, "step": 651460 }, { "epoch": 1.69, "learning_rate": 4.669436804819314e-05, "loss": 0.0055, "step": 651470 }, { "epoch": 1.69, "learning_rate": 4.669047983182168e-05, "loss": 0.0068, "step": 651480 }, { "epoch": 1.69, "learning_rate": 4.668659161545021e-05, "loss": 0.0065, "step": 651490 }, { "epoch": 1.69, "learning_rate": 4.668270339907875e-05, "loss": 0.0071, "step": 651500 }, { "epoch": 1.69, "learning_rate": 4.667881518270728e-05, "loss": 0.0099, "step": 651510 }, { "epoch": 1.69, "learning_rate": 4.667492696633582e-05, "loss": 0.0067, "step": 651520 }, { "epoch": 1.69, "learning_rate": 4.667103874996435e-05, "loss": 0.0072, "step": 651530 }, { "epoch": 1.69, "learning_rate": 4.666715053359289e-05, "loss": 0.0083, "step": 651540 }, { "epoch": 1.69, "learning_rate": 4.666326231722143e-05, "loss": 0.0073, "step": 651550 }, { "epoch": 1.69, "learning_rate": 4.665937410084996e-05, "loss": 0.0083, "step": 651560 }, { "epoch": 1.69, "learning_rate": 4.66554858844785e-05, "loss": 0.0078, "step": 651570 }, { "epoch": 1.69, "learning_rate": 4.665159766810703e-05, "loss": 0.0078, "step": 651580 }, { "epoch": 1.69, "learning_rate": 4.664770945173557e-05, "loss": 0.0073, "step": 651590 }, { "epoch": 1.69, "learning_rate": 4.66438212353641e-05, "loss": 0.0086, "step": 651600 }, { "epoch": 1.69, "learning_rate": 4.663993301899264e-05, "loss": 0.0079, "step": 651610 }, { "epoch": 1.69, "learning_rate": 4.663604480262117e-05, "loss": 0.0086, "step": 651620 }, { "epoch": 1.69, "learning_rate": 4.6632156586249714e-05, "loss": 0.0096, "step": 651630 }, { "epoch": 1.69, "learning_rate": 4.662826836987825e-05, "loss": 0.0097, "step": 651640 }, { "epoch": 1.69, "learning_rate": 4.6624380153506784e-05, "loss": 0.0078, "step": 651650 }, { "epoch": 1.69, "learning_rate": 4.662049193713531e-05, "loss": 0.0074, "step": 651660 }, { "epoch": 1.69, "learning_rate": 4.661660372076385e-05, "loss": 0.0067, "step": 651670 }, { "epoch": 1.69, "learning_rate": 4.661271550439238e-05, "loss": 0.0073, "step": 651680 }, { "epoch": 1.69, "learning_rate": 4.6608827288020917e-05, "loss": 0.0085, "step": 651690 }, { "epoch": 1.69, "learning_rate": 4.660493907164945e-05, "loss": 0.009, "step": 651700 }, { "epoch": 1.69, "learning_rate": 4.6601050855277986e-05, "loss": 0.009, "step": 651710 }, { "epoch": 1.69, "learning_rate": 4.659716263890652e-05, "loss": 0.0172, "step": 651720 }, { "epoch": 1.69, "learning_rate": 4.659327442253506e-05, "loss": 0.0089, "step": 651730 }, { "epoch": 1.69, "learning_rate": 4.65893862061636e-05, "loss": 0.008, "step": 651740 }, { "epoch": 1.69, "learning_rate": 4.658549798979213e-05, "loss": 0.0073, "step": 651750 }, { "epoch": 1.69, "learning_rate": 4.658160977342067e-05, "loss": 0.0106, "step": 651760 }, { "epoch": 1.69, "learning_rate": 4.65777215570492e-05, "loss": 0.0056, "step": 651770 }, { "epoch": 1.69, "learning_rate": 4.657383334067774e-05, "loss": 0.0108, "step": 651780 }, { "epoch": 1.69, "learning_rate": 4.656994512430627e-05, "loss": 0.0078, "step": 651790 }, { "epoch": 1.69, "learning_rate": 4.656605690793481e-05, "loss": 0.0071, "step": 651800 }, { "epoch": 1.69, "learning_rate": 4.656216869156335e-05, "loss": 0.0093, "step": 651810 }, { "epoch": 1.69, "learning_rate": 4.655828047519188e-05, "loss": 0.0058, "step": 651820 }, { "epoch": 1.69, "learning_rate": 4.655439225882042e-05, "loss": 0.0078, "step": 651830 }, { "epoch": 1.69, "learning_rate": 4.655050404244895e-05, "loss": 0.0069, "step": 651840 }, { "epoch": 1.69, "learning_rate": 4.654661582607749e-05, "loss": 0.0073, "step": 651850 }, { "epoch": 1.69, "learning_rate": 4.654272760970602e-05, "loss": 0.0084, "step": 651860 }, { "epoch": 1.69, "learning_rate": 4.653883939333456e-05, "loss": 0.0109, "step": 651870 }, { "epoch": 1.69, "learning_rate": 4.653495117696309e-05, "loss": 0.0059, "step": 651880 }, { "epoch": 1.69, "learning_rate": 4.6531062960591634e-05, "loss": 0.0099, "step": 651890 }, { "epoch": 1.69, "learning_rate": 4.652717474422017e-05, "loss": 0.0065, "step": 651900 }, { "epoch": 1.69, "learning_rate": 4.65232865278487e-05, "loss": 0.0069, "step": 651910 }, { "epoch": 1.69, "learning_rate": 4.651939831147723e-05, "loss": 0.0065, "step": 651920 }, { "epoch": 1.69, "learning_rate": 4.651551009510577e-05, "loss": 0.005, "step": 651930 }, { "epoch": 1.69, "learning_rate": 4.65116218787343e-05, "loss": 0.0102, "step": 651940 }, { "epoch": 1.69, "learning_rate": 4.6507733662362837e-05, "loss": 0.0101, "step": 651950 }, { "epoch": 1.69, "learning_rate": 4.650384544599137e-05, "loss": 0.0082, "step": 651960 }, { "epoch": 1.69, "learning_rate": 4.6499957229619906e-05, "loss": 0.0069, "step": 651970 }, { "epoch": 1.69, "learning_rate": 4.649606901324844e-05, "loss": 0.0092, "step": 651980 }, { "epoch": 1.69, "learning_rate": 4.649218079687698e-05, "loss": 0.0107, "step": 651990 }, { "epoch": 1.69, "learning_rate": 4.648829258050552e-05, "loss": 0.0075, "step": 652000 }, { "epoch": 1.69, "eval_cer": 0.8816774928583525, "eval_loss": 0.005205278750509024, "eval_runtime": 107.7051, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 652000 }, { "epoch": 1.69, "learning_rate": 4.648440436413405e-05, "loss": 0.0078, "step": 652010 }, { "epoch": 1.69, "learning_rate": 4.648051614776259e-05, "loss": 0.0067, "step": 652020 }, { "epoch": 1.69, "learning_rate": 4.647662793139112e-05, "loss": 0.006, "step": 652030 }, { "epoch": 1.69, "learning_rate": 4.647273971501966e-05, "loss": 0.008, "step": 652040 }, { "epoch": 1.69, "learning_rate": 4.646885149864819e-05, "loss": 0.0059, "step": 652050 }, { "epoch": 1.69, "learning_rate": 4.646496328227673e-05, "loss": 0.0106, "step": 652060 }, { "epoch": 1.69, "learning_rate": 4.646107506590526e-05, "loss": 0.0094, "step": 652070 }, { "epoch": 1.69, "learning_rate": 4.64571868495338e-05, "loss": 0.0065, "step": 652080 }, { "epoch": 1.69, "learning_rate": 4.645329863316234e-05, "loss": 0.0079, "step": 652090 }, { "epoch": 1.69, "learning_rate": 4.644941041679087e-05, "loss": 0.0106, "step": 652100 }, { "epoch": 1.69, "learning_rate": 4.644552220041941e-05, "loss": 0.0062, "step": 652110 }, { "epoch": 1.69, "learning_rate": 4.644163398404794e-05, "loss": 0.0108, "step": 652120 }, { "epoch": 1.69, "learning_rate": 4.643774576767648e-05, "loss": 0.0106, "step": 652130 }, { "epoch": 1.69, "learning_rate": 4.643385755130501e-05, "loss": 0.0082, "step": 652140 }, { "epoch": 1.69, "learning_rate": 4.642996933493354e-05, "loss": 0.007, "step": 652150 }, { "epoch": 1.69, "learning_rate": 4.6426081118562075e-05, "loss": 0.0086, "step": 652160 }, { "epoch": 1.69, "learning_rate": 4.642219290219061e-05, "loss": 0.0094, "step": 652170 }, { "epoch": 1.69, "learning_rate": 4.641830468581915e-05, "loss": 0.0074, "step": 652180 }, { "epoch": 1.69, "learning_rate": 4.641441646944769e-05, "loss": 0.0099, "step": 652190 }, { "epoch": 1.69, "learning_rate": 4.641052825307622e-05, "loss": 0.0079, "step": 652200 }, { "epoch": 1.69, "learning_rate": 4.6406640036704756e-05, "loss": 0.0072, "step": 652210 }, { "epoch": 1.69, "learning_rate": 4.640275182033329e-05, "loss": 0.0085, "step": 652220 }, { "epoch": 1.69, "learning_rate": 4.6398863603961826e-05, "loss": 0.0102, "step": 652230 }, { "epoch": 1.69, "learning_rate": 4.639497538759036e-05, "loss": 0.0097, "step": 652240 }, { "epoch": 1.69, "learning_rate": 4.6391087171218896e-05, "loss": 0.0092, "step": 652250 }, { "epoch": 1.69, "learning_rate": 4.638719895484744e-05, "loss": 0.0064, "step": 652260 }, { "epoch": 1.69, "learning_rate": 4.638331073847597e-05, "loss": 0.0073, "step": 652270 }, { "epoch": 1.69, "learning_rate": 4.637942252210451e-05, "loss": 0.0085, "step": 652280 }, { "epoch": 1.69, "learning_rate": 4.637553430573304e-05, "loss": 0.0071, "step": 652290 }, { "epoch": 1.69, "learning_rate": 4.637164608936158e-05, "loss": 0.0101, "step": 652300 }, { "epoch": 1.69, "learning_rate": 4.636775787299011e-05, "loss": 0.0087, "step": 652310 }, { "epoch": 1.69, "learning_rate": 4.636386965661865e-05, "loss": 0.0098, "step": 652320 }, { "epoch": 1.69, "learning_rate": 4.635998144024718e-05, "loss": 0.0087, "step": 652330 }, { "epoch": 1.69, "learning_rate": 4.635609322387572e-05, "loss": 0.0095, "step": 652340 }, { "epoch": 1.69, "learning_rate": 4.635220500750426e-05, "loss": 0.0076, "step": 652350 }, { "epoch": 1.69, "learning_rate": 4.634831679113279e-05, "loss": 0.0093, "step": 652360 }, { "epoch": 1.69, "learning_rate": 4.634442857476133e-05, "loss": 0.0085, "step": 652370 }, { "epoch": 1.69, "learning_rate": 4.634054035838986e-05, "loss": 0.0066, "step": 652380 }, { "epoch": 1.69, "learning_rate": 4.63366521420184e-05, "loss": 0.0079, "step": 652390 }, { "epoch": 1.69, "learning_rate": 4.6332763925646926e-05, "loss": 0.0072, "step": 652400 }, { "epoch": 1.69, "learning_rate": 4.632887570927546e-05, "loss": 0.0078, "step": 652410 }, { "epoch": 1.69, "learning_rate": 4.6324987492903995e-05, "loss": 0.0066, "step": 652420 }, { "epoch": 1.69, "learning_rate": 4.632109927653253e-05, "loss": 0.0079, "step": 652430 }, { "epoch": 1.69, "learning_rate": 4.631721106016107e-05, "loss": 0.0089, "step": 652440 }, { "epoch": 1.69, "learning_rate": 4.631332284378961e-05, "loss": 0.0055, "step": 652450 }, { "epoch": 1.69, "learning_rate": 4.630943462741814e-05, "loss": 0.0065, "step": 652460 }, { "epoch": 1.69, "learning_rate": 4.6305546411046676e-05, "loss": 0.008, "step": 652470 }, { "epoch": 1.69, "learning_rate": 4.630165819467521e-05, "loss": 0.0098, "step": 652480 }, { "epoch": 1.69, "learning_rate": 4.6297769978303746e-05, "loss": 0.008, "step": 652490 }, { "epoch": 1.69, "learning_rate": 4.629388176193228e-05, "loss": 0.0081, "step": 652500 }, { "epoch": 1.69, "learning_rate": 4.6289993545560816e-05, "loss": 0.0089, "step": 652510 }, { "epoch": 1.69, "learning_rate": 4.628610532918936e-05, "loss": 0.007, "step": 652520 }, { "epoch": 1.69, "learning_rate": 4.628221711281789e-05, "loss": 0.0074, "step": 652530 }, { "epoch": 1.69, "learning_rate": 4.627832889644643e-05, "loss": 0.0095, "step": 652540 }, { "epoch": 1.69, "learning_rate": 4.627444068007496e-05, "loss": 0.008, "step": 652550 }, { "epoch": 1.69, "learning_rate": 4.62705524637035e-05, "loss": 0.0094, "step": 652560 }, { "epoch": 1.69, "learning_rate": 4.626666424733203e-05, "loss": 0.0076, "step": 652570 }, { "epoch": 1.69, "learning_rate": 4.626277603096057e-05, "loss": 0.0091, "step": 652580 }, { "epoch": 1.69, "learning_rate": 4.62588878145891e-05, "loss": 0.0092, "step": 652590 }, { "epoch": 1.69, "learning_rate": 4.625499959821764e-05, "loss": 0.0066, "step": 652600 }, { "epoch": 1.69, "learning_rate": 4.625111138184618e-05, "loss": 0.0097, "step": 652610 }, { "epoch": 1.69, "learning_rate": 4.624722316547471e-05, "loss": 0.0085, "step": 652620 }, { "epoch": 1.69, "learning_rate": 4.624333494910325e-05, "loss": 0.0082, "step": 652630 }, { "epoch": 1.69, "learning_rate": 4.623944673273178e-05, "loss": 0.0066, "step": 652640 }, { "epoch": 1.69, "learning_rate": 4.623555851636031e-05, "loss": 0.0097, "step": 652650 }, { "epoch": 1.69, "learning_rate": 4.6231670299988846e-05, "loss": 0.0087, "step": 652660 }, { "epoch": 1.69, "learning_rate": 4.622778208361738e-05, "loss": 0.0073, "step": 652670 }, { "epoch": 1.69, "learning_rate": 4.6223893867245915e-05, "loss": 0.0087, "step": 652680 }, { "epoch": 1.69, "learning_rate": 4.622000565087445e-05, "loss": 0.0238, "step": 652690 }, { "epoch": 1.69, "learning_rate": 4.621611743450299e-05, "loss": 0.0074, "step": 652700 }, { "epoch": 1.69, "learning_rate": 4.621222921813153e-05, "loss": 0.006, "step": 652710 }, { "epoch": 1.69, "learning_rate": 4.620834100176006e-05, "loss": 0.0086, "step": 652720 }, { "epoch": 1.69, "learning_rate": 4.6204452785388596e-05, "loss": 0.0056, "step": 652730 }, { "epoch": 1.69, "learning_rate": 4.620056456901713e-05, "loss": 0.0058, "step": 652740 }, { "epoch": 1.69, "learning_rate": 4.6196676352645666e-05, "loss": 0.0083, "step": 652750 }, { "epoch": 1.69, "learning_rate": 4.61927881362742e-05, "loss": 0.0066, "step": 652760 }, { "epoch": 1.69, "learning_rate": 4.6188899919902736e-05, "loss": 0.0089, "step": 652770 }, { "epoch": 1.69, "learning_rate": 4.618501170353128e-05, "loss": 0.0073, "step": 652780 }, { "epoch": 1.69, "learning_rate": 4.618112348715981e-05, "loss": 0.0097, "step": 652790 }, { "epoch": 1.69, "learning_rate": 4.617723527078835e-05, "loss": 0.0105, "step": 652800 }, { "epoch": 1.69, "learning_rate": 4.617334705441688e-05, "loss": 0.0066, "step": 652810 }, { "epoch": 1.69, "learning_rate": 4.616945883804542e-05, "loss": 0.0067, "step": 652820 }, { "epoch": 1.69, "learning_rate": 4.616557062167395e-05, "loss": 0.0076, "step": 652830 }, { "epoch": 1.69, "learning_rate": 4.6161682405302487e-05, "loss": 0.0098, "step": 652840 }, { "epoch": 1.69, "learning_rate": 4.615779418893102e-05, "loss": 0.005, "step": 652850 }, { "epoch": 1.69, "learning_rate": 4.615390597255956e-05, "loss": 0.0088, "step": 652860 }, { "epoch": 1.69, "learning_rate": 4.61500177561881e-05, "loss": 0.0077, "step": 652870 }, { "epoch": 1.69, "learning_rate": 4.614612953981663e-05, "loss": 0.0068, "step": 652880 }, { "epoch": 1.69, "learning_rate": 4.614224132344517e-05, "loss": 0.0073, "step": 652890 }, { "epoch": 1.69, "learning_rate": 4.6138353107073696e-05, "loss": 0.015, "step": 652900 }, { "epoch": 1.69, "learning_rate": 4.613446489070223e-05, "loss": 0.0102, "step": 652910 }, { "epoch": 1.69, "learning_rate": 4.6130576674330766e-05, "loss": 0.0074, "step": 652920 }, { "epoch": 1.69, "learning_rate": 4.61266884579593e-05, "loss": 0.0083, "step": 652930 }, { "epoch": 1.69, "learning_rate": 4.6122800241587835e-05, "loss": 0.0094, "step": 652940 }, { "epoch": 1.69, "learning_rate": 4.611891202521637e-05, "loss": 0.0086, "step": 652950 }, { "epoch": 1.69, "learning_rate": 4.611502380884491e-05, "loss": 0.0087, "step": 652960 }, { "epoch": 1.69, "learning_rate": 4.6111135592473447e-05, "loss": 0.0111, "step": 652970 }, { "epoch": 1.69, "learning_rate": 4.610724737610198e-05, "loss": 0.0075, "step": 652980 }, { "epoch": 1.69, "learning_rate": 4.6103359159730516e-05, "loss": 0.0063, "step": 652990 }, { "epoch": 1.69, "learning_rate": 4.609947094335905e-05, "loss": 0.0068, "step": 653000 }, { "epoch": 1.69, "eval_cer": 0.8816914892276944, "eval_loss": 0.005161790177226067, "eval_runtime": 107.7473, "eval_samples_per_second": 18.562, "eval_steps_per_second": 4.64, "step": 653000 }, { "epoch": 1.69, "learning_rate": 4.6095582726987586e-05, "loss": 0.0063, "step": 653010 }, { "epoch": 1.69, "learning_rate": 4.609169451061612e-05, "loss": 0.0101, "step": 653020 }, { "epoch": 1.69, "learning_rate": 4.6087806294244656e-05, "loss": 0.0066, "step": 653030 }, { "epoch": 1.69, "learning_rate": 4.60839180778732e-05, "loss": 0.0091, "step": 653040 }, { "epoch": 1.69, "learning_rate": 4.608002986150173e-05, "loss": 0.0058, "step": 653050 }, { "epoch": 1.69, "learning_rate": 4.607614164513027e-05, "loss": 0.0062, "step": 653060 }, { "epoch": 1.69, "learning_rate": 4.60722534287588e-05, "loss": 0.0063, "step": 653070 }, { "epoch": 1.69, "learning_rate": 4.606836521238734e-05, "loss": 0.0061, "step": 653080 }, { "epoch": 1.69, "learning_rate": 4.606447699601587e-05, "loss": 0.0077, "step": 653090 }, { "epoch": 1.69, "learning_rate": 4.6060588779644407e-05, "loss": 0.0068, "step": 653100 }, { "epoch": 1.69, "learning_rate": 4.605670056327294e-05, "loss": 0.008, "step": 653110 }, { "epoch": 1.69, "learning_rate": 4.605281234690148e-05, "loss": 0.0088, "step": 653120 }, { "epoch": 1.69, "learning_rate": 4.604892413053002e-05, "loss": 0.0079, "step": 653130 }, { "epoch": 1.69, "learning_rate": 4.604503591415855e-05, "loss": 0.0091, "step": 653140 }, { "epoch": 1.69, "learning_rate": 4.604114769778708e-05, "loss": 0.0069, "step": 653150 }, { "epoch": 1.69, "learning_rate": 4.6037259481415616e-05, "loss": 0.0067, "step": 653160 }, { "epoch": 1.69, "learning_rate": 4.603337126504415e-05, "loss": 0.0056, "step": 653170 }, { "epoch": 1.69, "learning_rate": 4.6029483048672685e-05, "loss": 0.0088, "step": 653180 }, { "epoch": 1.69, "learning_rate": 4.602559483230122e-05, "loss": 0.0099, "step": 653190 }, { "epoch": 1.69, "learning_rate": 4.6021706615929755e-05, "loss": 0.0092, "step": 653200 }, { "epoch": 1.69, "learning_rate": 4.601781839955829e-05, "loss": 0.0074, "step": 653210 }, { "epoch": 1.69, "learning_rate": 4.601393018318683e-05, "loss": 0.0071, "step": 653220 }, { "epoch": 1.69, "learning_rate": 4.6010041966815367e-05, "loss": 0.0062, "step": 653230 }, { "epoch": 1.69, "learning_rate": 4.60061537504439e-05, "loss": 0.0068, "step": 653240 }, { "epoch": 1.69, "learning_rate": 4.6002265534072436e-05, "loss": 0.0066, "step": 653250 }, { "epoch": 1.69, "learning_rate": 4.599837731770097e-05, "loss": 0.0079, "step": 653260 }, { "epoch": 1.69, "learning_rate": 4.5994489101329506e-05, "loss": 0.0069, "step": 653270 }, { "epoch": 1.69, "learning_rate": 4.599060088495804e-05, "loss": 0.0081, "step": 653280 }, { "epoch": 1.69, "learning_rate": 4.5986712668586576e-05, "loss": 0.0095, "step": 653290 }, { "epoch": 1.69, "learning_rate": 4.598282445221512e-05, "loss": 0.0076, "step": 653300 }, { "epoch": 1.69, "learning_rate": 4.597893623584365e-05, "loss": 0.0078, "step": 653310 }, { "epoch": 1.69, "learning_rate": 4.597504801947219e-05, "loss": 0.0105, "step": 653320 }, { "epoch": 1.69, "learning_rate": 4.597115980310072e-05, "loss": 0.0091, "step": 653330 }, { "epoch": 1.69, "learning_rate": 4.596727158672926e-05, "loss": 0.008, "step": 653340 }, { "epoch": 1.69, "learning_rate": 4.596338337035779e-05, "loss": 0.0096, "step": 653350 }, { "epoch": 1.69, "learning_rate": 4.5959495153986327e-05, "loss": 0.0059, "step": 653360 }, { "epoch": 1.69, "learning_rate": 4.595560693761486e-05, "loss": 0.0088, "step": 653370 }, { "epoch": 1.69, "learning_rate": 4.5951718721243396e-05, "loss": 0.0102, "step": 653380 }, { "epoch": 1.69, "learning_rate": 4.5947830504871924e-05, "loss": 0.008, "step": 653390 }, { "epoch": 1.69, "learning_rate": 4.5943942288500466e-05, "loss": 0.0108, "step": 653400 }, { "epoch": 1.69, "learning_rate": 4.5940054072129e-05, "loss": 0.0095, "step": 653410 }, { "epoch": 1.69, "learning_rate": 4.5936165855757536e-05, "loss": 0.0067, "step": 653420 }, { "epoch": 1.69, "learning_rate": 4.593227763938607e-05, "loss": 0.0068, "step": 653430 }, { "epoch": 1.69, "learning_rate": 4.5928389423014605e-05, "loss": 0.007, "step": 653440 }, { "epoch": 1.69, "learning_rate": 4.592450120664314e-05, "loss": 0.0088, "step": 653450 }, { "epoch": 1.69, "learning_rate": 4.5920612990271675e-05, "loss": 0.0074, "step": 653460 }, { "epoch": 1.69, "learning_rate": 4.591672477390021e-05, "loss": 0.009, "step": 653470 }, { "epoch": 1.69, "learning_rate": 4.5912836557528745e-05, "loss": 0.0096, "step": 653480 }, { "epoch": 1.69, "learning_rate": 4.5908948341157286e-05, "loss": 0.0065, "step": 653490 }, { "epoch": 1.69, "learning_rate": 4.590506012478582e-05, "loss": 0.0113, "step": 653500 }, { "epoch": 1.69, "learning_rate": 4.5901171908414356e-05, "loss": 0.008, "step": 653510 }, { "epoch": 1.69, "learning_rate": 4.589728369204289e-05, "loss": 0.016, "step": 653520 }, { "epoch": 1.69, "learning_rate": 4.5893395475671426e-05, "loss": 0.0124, "step": 653530 }, { "epoch": 1.69, "learning_rate": 4.588950725929996e-05, "loss": 0.0067, "step": 653540 }, { "epoch": 1.69, "learning_rate": 4.5885619042928496e-05, "loss": 0.007, "step": 653550 }, { "epoch": 1.69, "learning_rate": 4.588173082655703e-05, "loss": 0.0067, "step": 653560 }, { "epoch": 1.69, "learning_rate": 4.587784261018557e-05, "loss": 0.0059, "step": 653570 }, { "epoch": 1.69, "learning_rate": 4.587395439381411e-05, "loss": 0.0102, "step": 653580 }, { "epoch": 1.69, "learning_rate": 4.587006617744264e-05, "loss": 0.0063, "step": 653590 }, { "epoch": 1.69, "learning_rate": 4.586617796107118e-05, "loss": 0.0085, "step": 653600 }, { "epoch": 1.69, "learning_rate": 4.586228974469971e-05, "loss": 0.0076, "step": 653610 }, { "epoch": 1.69, "learning_rate": 4.5858401528328246e-05, "loss": 0.0067, "step": 653620 }, { "epoch": 1.69, "learning_rate": 4.585451331195678e-05, "loss": 0.0063, "step": 653630 }, { "epoch": 1.69, "learning_rate": 4.585062509558531e-05, "loss": 0.0096, "step": 653640 }, { "epoch": 1.69, "learning_rate": 4.5846736879213844e-05, "loss": 0.0069, "step": 653650 }, { "epoch": 1.69, "learning_rate": 4.584284866284238e-05, "loss": 0.0082, "step": 653660 }, { "epoch": 1.69, "learning_rate": 4.583896044647092e-05, "loss": 0.0073, "step": 653670 }, { "epoch": 1.69, "learning_rate": 4.5835072230099456e-05, "loss": 0.0074, "step": 653680 }, { "epoch": 1.69, "learning_rate": 4.583118401372799e-05, "loss": 0.0074, "step": 653690 }, { "epoch": 1.69, "learning_rate": 4.5827295797356525e-05, "loss": 0.011, "step": 653700 }, { "epoch": 1.69, "learning_rate": 4.582340758098506e-05, "loss": 0.0091, "step": 653710 }, { "epoch": 1.69, "learning_rate": 4.5819519364613595e-05, "loss": 0.0077, "step": 653720 }, { "epoch": 1.69, "learning_rate": 4.581563114824213e-05, "loss": 0.0116, "step": 653730 }, { "epoch": 1.69, "learning_rate": 4.5811742931870665e-05, "loss": 0.0073, "step": 653740 }, { "epoch": 1.69, "learning_rate": 4.5807854715499206e-05, "loss": 0.0087, "step": 653750 }, { "epoch": 1.69, "learning_rate": 4.580396649912774e-05, "loss": 0.0074, "step": 653760 }, { "epoch": 1.69, "learning_rate": 4.5800078282756276e-05, "loss": 0.0062, "step": 653770 }, { "epoch": 1.69, "learning_rate": 4.579619006638481e-05, "loss": 0.0095, "step": 653780 }, { "epoch": 1.69, "learning_rate": 4.5792301850013346e-05, "loss": 0.0141, "step": 653790 }, { "epoch": 1.69, "learning_rate": 4.578841363364188e-05, "loss": 0.0087, "step": 653800 }, { "epoch": 1.69, "learning_rate": 4.5784525417270416e-05, "loss": 0.0103, "step": 653810 }, { "epoch": 1.69, "learning_rate": 4.578063720089895e-05, "loss": 0.0082, "step": 653820 }, { "epoch": 1.69, "learning_rate": 4.577674898452749e-05, "loss": 0.0088, "step": 653830 }, { "epoch": 1.69, "learning_rate": 4.577286076815603e-05, "loss": 0.0064, "step": 653840 }, { "epoch": 1.69, "learning_rate": 4.576897255178456e-05, "loss": 0.0059, "step": 653850 }, { "epoch": 1.69, "learning_rate": 4.57650843354131e-05, "loss": 0.0089, "step": 653860 }, { "epoch": 1.69, "learning_rate": 4.576119611904163e-05, "loss": 0.0063, "step": 653870 }, { "epoch": 1.69, "learning_rate": 4.5757307902670166e-05, "loss": 0.0091, "step": 653880 }, { "epoch": 1.69, "learning_rate": 4.5753419686298695e-05, "loss": 0.007, "step": 653890 }, { "epoch": 1.7, "learning_rate": 4.574953146992723e-05, "loss": 0.01, "step": 653900 }, { "epoch": 1.7, "learning_rate": 4.5745643253555764e-05, "loss": 0.0067, "step": 653910 }, { "epoch": 1.7, "learning_rate": 4.57417550371843e-05, "loss": 0.0088, "step": 653920 }, { "epoch": 1.7, "learning_rate": 4.573786682081284e-05, "loss": 0.0107, "step": 653930 }, { "epoch": 1.7, "learning_rate": 4.5733978604441376e-05, "loss": 0.0094, "step": 653940 }, { "epoch": 1.7, "learning_rate": 4.573009038806991e-05, "loss": 0.0098, "step": 653950 }, { "epoch": 1.7, "learning_rate": 4.5726202171698445e-05, "loss": 0.0083, "step": 653960 }, { "epoch": 1.7, "learning_rate": 4.572231395532698e-05, "loss": 0.0073, "step": 653970 }, { "epoch": 1.7, "learning_rate": 4.5718425738955515e-05, "loss": 0.0077, "step": 653980 }, { "epoch": 1.7, "learning_rate": 4.571453752258405e-05, "loss": 0.0092, "step": 653990 }, { "epoch": 1.7, "learning_rate": 4.5710649306212585e-05, "loss": 0.0054, "step": 654000 }, { "epoch": 1.7, "eval_cer": 0.8816662957628791, "eval_loss": 0.005244317930191755, "eval_runtime": 108.0147, "eval_samples_per_second": 18.516, "eval_steps_per_second": 4.629, "step": 654000 }, { "epoch": 1.7, "learning_rate": 4.5706761089841126e-05, "loss": 0.0084, "step": 654010 }, { "epoch": 1.7, "learning_rate": 4.570287287346966e-05, "loss": 0.0106, "step": 654020 }, { "epoch": 1.7, "learning_rate": 4.5698984657098196e-05, "loss": 0.0073, "step": 654030 }, { "epoch": 1.7, "learning_rate": 4.569509644072673e-05, "loss": 0.01, "step": 654040 }, { "epoch": 1.7, "learning_rate": 4.5691208224355266e-05, "loss": 0.0078, "step": 654050 }, { "epoch": 1.7, "learning_rate": 4.56873200079838e-05, "loss": 0.0067, "step": 654060 }, { "epoch": 1.7, "learning_rate": 4.5683431791612336e-05, "loss": 0.0083, "step": 654070 }, { "epoch": 1.7, "learning_rate": 4.567954357524087e-05, "loss": 0.0069, "step": 654080 }, { "epoch": 1.7, "learning_rate": 4.567565535886941e-05, "loss": 0.0073, "step": 654090 }, { "epoch": 1.7, "learning_rate": 4.567176714249795e-05, "loss": 0.0076, "step": 654100 }, { "epoch": 1.7, "learning_rate": 4.566787892612648e-05, "loss": 0.0071, "step": 654110 }, { "epoch": 1.7, "learning_rate": 4.566399070975502e-05, "loss": 0.0059, "step": 654120 }, { "epoch": 1.7, "learning_rate": 4.566010249338355e-05, "loss": 0.007, "step": 654130 }, { "epoch": 1.7, "learning_rate": 4.565621427701208e-05, "loss": 0.0114, "step": 654140 }, { "epoch": 1.7, "learning_rate": 4.5652326060640614e-05, "loss": 0.0121, "step": 654150 }, { "epoch": 1.7, "learning_rate": 4.564843784426915e-05, "loss": 0.0132, "step": 654160 }, { "epoch": 1.7, "learning_rate": 4.5644549627897684e-05, "loss": 0.0075, "step": 654170 }, { "epoch": 1.7, "learning_rate": 4.564066141152622e-05, "loss": 0.0062, "step": 654180 }, { "epoch": 1.7, "learning_rate": 4.563677319515476e-05, "loss": 0.0089, "step": 654190 }, { "epoch": 1.7, "learning_rate": 4.5632884978783296e-05, "loss": 0.007, "step": 654200 }, { "epoch": 1.7, "learning_rate": 4.562899676241183e-05, "loss": 0.0076, "step": 654210 }, { "epoch": 1.7, "learning_rate": 4.5625108546040365e-05, "loss": 0.0086, "step": 654220 }, { "epoch": 1.7, "learning_rate": 4.56212203296689e-05, "loss": 0.0073, "step": 654230 }, { "epoch": 1.7, "learning_rate": 4.5617332113297435e-05, "loss": 0.008, "step": 654240 }, { "epoch": 1.7, "learning_rate": 4.561344389692597e-05, "loss": 0.0103, "step": 654250 }, { "epoch": 1.7, "learning_rate": 4.5609555680554505e-05, "loss": 0.0099, "step": 654260 }, { "epoch": 1.7, "learning_rate": 4.5605667464183046e-05, "loss": 0.0115, "step": 654270 }, { "epoch": 1.7, "learning_rate": 4.560177924781158e-05, "loss": 0.0068, "step": 654280 }, { "epoch": 1.7, "learning_rate": 4.5597891031440116e-05, "loss": 0.0109, "step": 654290 }, { "epoch": 1.7, "learning_rate": 4.559400281506865e-05, "loss": 0.0084, "step": 654300 }, { "epoch": 1.7, "learning_rate": 4.5590114598697186e-05, "loss": 0.008, "step": 654310 }, { "epoch": 1.7, "learning_rate": 4.558622638232572e-05, "loss": 0.0051, "step": 654320 }, { "epoch": 1.7, "learning_rate": 4.5582338165954256e-05, "loss": 0.0066, "step": 654330 }, { "epoch": 1.7, "learning_rate": 4.557844994958279e-05, "loss": 0.007, "step": 654340 }, { "epoch": 1.7, "learning_rate": 4.557456173321133e-05, "loss": 0.0099, "step": 654350 }, { "epoch": 1.7, "learning_rate": 4.557067351683987e-05, "loss": 0.0096, "step": 654360 }, { "epoch": 1.7, "learning_rate": 4.55667853004684e-05, "loss": 0.0087, "step": 654370 }, { "epoch": 1.7, "learning_rate": 4.5562897084096937e-05, "loss": 0.0083, "step": 654380 }, { "epoch": 1.7, "learning_rate": 4.5559008867725465e-05, "loss": 0.007, "step": 654390 }, { "epoch": 1.7, "learning_rate": 4.5555120651354e-05, "loss": 0.008, "step": 654400 }, { "epoch": 1.7, "learning_rate": 4.5551232434982534e-05, "loss": 0.0076, "step": 654410 }, { "epoch": 1.7, "learning_rate": 4.554734421861107e-05, "loss": 0.0086, "step": 654420 }, { "epoch": 1.7, "learning_rate": 4.5543456002239604e-05, "loss": 0.0075, "step": 654430 }, { "epoch": 1.7, "learning_rate": 4.553956778586814e-05, "loss": 0.008, "step": 654440 }, { "epoch": 1.7, "learning_rate": 4.553567956949668e-05, "loss": 0.0083, "step": 654450 }, { "epoch": 1.7, "learning_rate": 4.5531791353125215e-05, "loss": 0.0081, "step": 654460 }, { "epoch": 1.7, "learning_rate": 4.552790313675375e-05, "loss": 0.0081, "step": 654470 }, { "epoch": 1.7, "learning_rate": 4.5524014920382285e-05, "loss": 0.0061, "step": 654480 }, { "epoch": 1.7, "learning_rate": 4.552012670401082e-05, "loss": 0.006, "step": 654490 }, { "epoch": 1.7, "learning_rate": 4.5516238487639355e-05, "loss": 0.0084, "step": 654500 }, { "epoch": 1.7, "learning_rate": 4.551235027126789e-05, "loss": 0.021, "step": 654510 }, { "epoch": 1.7, "learning_rate": 4.5508462054896425e-05, "loss": 0.0095, "step": 654520 }, { "epoch": 1.7, "learning_rate": 4.5504573838524966e-05, "loss": 0.0079, "step": 654530 }, { "epoch": 1.7, "learning_rate": 4.55006856221535e-05, "loss": 0.009, "step": 654540 }, { "epoch": 1.7, "learning_rate": 4.5496797405782036e-05, "loss": 0.0087, "step": 654550 }, { "epoch": 1.7, "learning_rate": 4.549290918941057e-05, "loss": 0.0086, "step": 654560 }, { "epoch": 1.7, "learning_rate": 4.5489020973039106e-05, "loss": 0.0086, "step": 654570 }, { "epoch": 1.7, "learning_rate": 4.548513275666764e-05, "loss": 0.0083, "step": 654580 }, { "epoch": 1.7, "learning_rate": 4.5481244540296175e-05, "loss": 0.009, "step": 654590 }, { "epoch": 1.7, "learning_rate": 4.547735632392471e-05, "loss": 0.0079, "step": 654600 }, { "epoch": 1.7, "learning_rate": 4.547346810755325e-05, "loss": 0.009, "step": 654610 }, { "epoch": 1.7, "learning_rate": 4.546957989118179e-05, "loss": 0.008, "step": 654620 }, { "epoch": 1.7, "learning_rate": 4.5465691674810315e-05, "loss": 0.0064, "step": 654630 }, { "epoch": 1.7, "learning_rate": 4.546180345843885e-05, "loss": 0.0067, "step": 654640 }, { "epoch": 1.7, "learning_rate": 4.5457915242067385e-05, "loss": 0.0076, "step": 654650 }, { "epoch": 1.7, "learning_rate": 4.545402702569592e-05, "loss": 0.0073, "step": 654660 }, { "epoch": 1.7, "learning_rate": 4.5450138809324454e-05, "loss": 0.0107, "step": 654670 }, { "epoch": 1.7, "learning_rate": 4.544625059295299e-05, "loss": 0.0063, "step": 654680 }, { "epoch": 1.7, "learning_rate": 4.5442362376581524e-05, "loss": 0.012, "step": 654690 }, { "epoch": 1.7, "learning_rate": 4.543847416021006e-05, "loss": 0.0091, "step": 654700 }, { "epoch": 1.7, "learning_rate": 4.54345859438386e-05, "loss": 0.0075, "step": 654710 }, { "epoch": 1.7, "learning_rate": 4.5430697727467135e-05, "loss": 0.0065, "step": 654720 }, { "epoch": 1.7, "learning_rate": 4.542680951109567e-05, "loss": 0.0049, "step": 654730 }, { "epoch": 1.7, "learning_rate": 4.5422921294724205e-05, "loss": 0.0061, "step": 654740 }, { "epoch": 1.7, "learning_rate": 4.541903307835274e-05, "loss": 0.0066, "step": 654750 }, { "epoch": 1.7, "learning_rate": 4.5415144861981275e-05, "loss": 0.0056, "step": 654760 }, { "epoch": 1.7, "learning_rate": 4.541125664560981e-05, "loss": 0.0086, "step": 654770 }, { "epoch": 1.7, "learning_rate": 4.5407368429238345e-05, "loss": 0.0113, "step": 654780 }, { "epoch": 1.7, "learning_rate": 4.5403480212866886e-05, "loss": 0.0059, "step": 654790 }, { "epoch": 1.7, "learning_rate": 4.539959199649542e-05, "loss": 0.0081, "step": 654800 }, { "epoch": 1.7, "learning_rate": 4.5395703780123956e-05, "loss": 0.0075, "step": 654810 }, { "epoch": 1.7, "learning_rate": 4.539181556375249e-05, "loss": 0.0087, "step": 654820 }, { "epoch": 1.7, "learning_rate": 4.5387927347381026e-05, "loss": 0.0084, "step": 654830 }, { "epoch": 1.7, "learning_rate": 4.538403913100956e-05, "loss": 0.0104, "step": 654840 }, { "epoch": 1.7, "learning_rate": 4.5380150914638095e-05, "loss": 0.009, "step": 654850 }, { "epoch": 1.7, "learning_rate": 4.537626269826663e-05, "loss": 0.0071, "step": 654860 }, { "epoch": 1.7, "learning_rate": 4.5372374481895165e-05, "loss": 0.0059, "step": 654870 }, { "epoch": 1.7, "learning_rate": 4.536848626552369e-05, "loss": 0.0089, "step": 654880 }, { "epoch": 1.7, "learning_rate": 4.5364598049152235e-05, "loss": 0.0066, "step": 654890 }, { "epoch": 1.7, "learning_rate": 4.536070983278077e-05, "loss": 0.007, "step": 654900 }, { "epoch": 1.7, "learning_rate": 4.5356821616409305e-05, "loss": 0.0095, "step": 654910 }, { "epoch": 1.7, "learning_rate": 4.535293340003784e-05, "loss": 0.0072, "step": 654920 }, { "epoch": 1.7, "learning_rate": 4.5349045183666374e-05, "loss": 0.0093, "step": 654930 }, { "epoch": 1.7, "learning_rate": 4.534515696729491e-05, "loss": 0.0076, "step": 654940 }, { "epoch": 1.7, "learning_rate": 4.5341268750923444e-05, "loss": 0.009, "step": 654950 }, { "epoch": 1.7, "learning_rate": 4.533738053455198e-05, "loss": 0.0092, "step": 654960 }, { "epoch": 1.7, "learning_rate": 4.5333492318180514e-05, "loss": 0.0094, "step": 654970 }, { "epoch": 1.7, "learning_rate": 4.5329604101809055e-05, "loss": 0.0062, "step": 654980 }, { "epoch": 1.7, "learning_rate": 4.532571588543759e-05, "loss": 0.0063, "step": 654990 }, { "epoch": 1.7, "learning_rate": 4.5321827669066125e-05, "loss": 0.0078, "step": 655000 }, { "epoch": 1.7, "eval_cer": 0.8816942885015627, "eval_loss": 0.005221130792051554, "eval_runtime": 107.696, "eval_samples_per_second": 18.571, "eval_steps_per_second": 4.643, "step": 655000 }, { "epoch": 1.7, "learning_rate": 4.531793945269466e-05, "loss": 0.0087, "step": 655010 }, { "epoch": 1.7, "learning_rate": 4.5314051236323195e-05, "loss": 0.0102, "step": 655020 }, { "epoch": 1.7, "learning_rate": 4.531016301995173e-05, "loss": 0.0071, "step": 655030 }, { "epoch": 1.7, "learning_rate": 4.5306274803580265e-05, "loss": 0.0068, "step": 655040 }, { "epoch": 1.7, "learning_rate": 4.53023865872088e-05, "loss": 0.008, "step": 655050 }, { "epoch": 1.7, "learning_rate": 4.529849837083734e-05, "loss": 0.0071, "step": 655060 }, { "epoch": 1.7, "learning_rate": 4.5294610154465876e-05, "loss": 0.0084, "step": 655070 }, { "epoch": 1.7, "learning_rate": 4.529072193809441e-05, "loss": 0.0103, "step": 655080 }, { "epoch": 1.7, "learning_rate": 4.5286833721722946e-05, "loss": 0.0092, "step": 655090 }, { "epoch": 1.7, "learning_rate": 4.528294550535148e-05, "loss": 0.0084, "step": 655100 }, { "epoch": 1.7, "learning_rate": 4.5279057288980015e-05, "loss": 0.0067, "step": 655110 }, { "epoch": 1.7, "learning_rate": 4.527516907260855e-05, "loss": 0.0064, "step": 655120 }, { "epoch": 1.7, "learning_rate": 4.527128085623708e-05, "loss": 0.0105, "step": 655130 }, { "epoch": 1.7, "learning_rate": 4.526739263986561e-05, "loss": 0.01, "step": 655140 }, { "epoch": 1.7, "learning_rate": 4.526350442349415e-05, "loss": 0.009, "step": 655150 }, { "epoch": 1.7, "learning_rate": 4.525961620712269e-05, "loss": 0.0073, "step": 655160 }, { "epoch": 1.7, "learning_rate": 4.5255727990751225e-05, "loss": 0.009, "step": 655170 }, { "epoch": 1.7, "learning_rate": 4.525183977437976e-05, "loss": 0.0097, "step": 655180 }, { "epoch": 1.7, "learning_rate": 4.5247951558008294e-05, "loss": 0.0064, "step": 655190 }, { "epoch": 1.7, "learning_rate": 4.524406334163683e-05, "loss": 0.0065, "step": 655200 }, { "epoch": 1.7, "learning_rate": 4.5240175125265364e-05, "loss": 0.0081, "step": 655210 }, { "epoch": 1.7, "learning_rate": 4.52362869088939e-05, "loss": 0.0057, "step": 655220 }, { "epoch": 1.7, "learning_rate": 4.5232398692522434e-05, "loss": 0.0081, "step": 655230 }, { "epoch": 1.7, "learning_rate": 4.5228510476150975e-05, "loss": 0.0086, "step": 655240 }, { "epoch": 1.7, "learning_rate": 4.522462225977951e-05, "loss": 0.0075, "step": 655250 }, { "epoch": 1.7, "learning_rate": 4.5220734043408045e-05, "loss": 0.0073, "step": 655260 }, { "epoch": 1.7, "learning_rate": 4.521684582703658e-05, "loss": 0.009, "step": 655270 }, { "epoch": 1.7, "learning_rate": 4.5212957610665115e-05, "loss": 0.0094, "step": 655280 }, { "epoch": 1.7, "learning_rate": 4.520906939429365e-05, "loss": 0.0066, "step": 655290 }, { "epoch": 1.7, "learning_rate": 4.5205181177922185e-05, "loss": 0.0072, "step": 655300 }, { "epoch": 1.7, "learning_rate": 4.520129296155072e-05, "loss": 0.0073, "step": 655310 }, { "epoch": 1.7, "learning_rate": 4.519740474517926e-05, "loss": 0.0071, "step": 655320 }, { "epoch": 1.7, "learning_rate": 4.5193516528807796e-05, "loss": 0.0129, "step": 655330 }, { "epoch": 1.7, "learning_rate": 4.518962831243633e-05, "loss": 0.0079, "step": 655340 }, { "epoch": 1.7, "learning_rate": 4.5185740096064866e-05, "loss": 0.0096, "step": 655350 }, { "epoch": 1.7, "learning_rate": 4.51818518796934e-05, "loss": 0.0091, "step": 655360 }, { "epoch": 1.7, "learning_rate": 4.5177963663321935e-05, "loss": 0.0076, "step": 655370 }, { "epoch": 1.7, "learning_rate": 4.5174075446950463e-05, "loss": 0.0073, "step": 655380 }, { "epoch": 1.7, "learning_rate": 4.5170187230579e-05, "loss": 0.0103, "step": 655390 }, { "epoch": 1.7, "learning_rate": 4.516629901420753e-05, "loss": 0.0085, "step": 655400 }, { "epoch": 1.7, "learning_rate": 4.516241079783607e-05, "loss": 0.0087, "step": 655410 }, { "epoch": 1.7, "learning_rate": 4.515852258146461e-05, "loss": 0.0089, "step": 655420 }, { "epoch": 1.7, "learning_rate": 4.5154634365093144e-05, "loss": 0.0088, "step": 655430 }, { "epoch": 1.7, "learning_rate": 4.515074614872168e-05, "loss": 0.008, "step": 655440 }, { "epoch": 1.7, "learning_rate": 4.5146857932350214e-05, "loss": 0.0072, "step": 655450 }, { "epoch": 1.7, "learning_rate": 4.514296971597875e-05, "loss": 0.0082, "step": 655460 }, { "epoch": 1.7, "learning_rate": 4.5139081499607284e-05, "loss": 0.0073, "step": 655470 }, { "epoch": 1.7, "learning_rate": 4.513519328323582e-05, "loss": 0.0059, "step": 655480 }, { "epoch": 1.7, "learning_rate": 4.5131305066864354e-05, "loss": 0.0068, "step": 655490 }, { "epoch": 1.7, "learning_rate": 4.5127416850492895e-05, "loss": 0.0081, "step": 655500 }, { "epoch": 1.7, "learning_rate": 4.512352863412143e-05, "loss": 0.0079, "step": 655510 }, { "epoch": 1.7, "learning_rate": 4.5119640417749965e-05, "loss": 0.0086, "step": 655520 }, { "epoch": 1.7, "learning_rate": 4.51157522013785e-05, "loss": 0.0064, "step": 655530 }, { "epoch": 1.7, "learning_rate": 4.5111863985007035e-05, "loss": 0.0074, "step": 655540 }, { "epoch": 1.7, "learning_rate": 4.510797576863557e-05, "loss": 0.0053, "step": 655550 }, { "epoch": 1.7, "learning_rate": 4.5104087552264104e-05, "loss": 0.0095, "step": 655560 }, { "epoch": 1.7, "learning_rate": 4.510019933589264e-05, "loss": 0.0096, "step": 655570 }, { "epoch": 1.7, "learning_rate": 4.509631111952118e-05, "loss": 0.0096, "step": 655580 }, { "epoch": 1.7, "learning_rate": 4.5092422903149716e-05, "loss": 0.0063, "step": 655590 }, { "epoch": 1.7, "learning_rate": 4.508853468677825e-05, "loss": 0.0087, "step": 655600 }, { "epoch": 1.7, "learning_rate": 4.5084646470406786e-05, "loss": 0.0111, "step": 655610 }, { "epoch": 1.7, "learning_rate": 4.508075825403532e-05, "loss": 0.0079, "step": 655620 }, { "epoch": 1.7, "learning_rate": 4.507687003766385e-05, "loss": 0.0125, "step": 655630 }, { "epoch": 1.7, "learning_rate": 4.507298182129238e-05, "loss": 0.008, "step": 655640 }, { "epoch": 1.7, "learning_rate": 4.506909360492092e-05, "loss": 0.0094, "step": 655650 }, { "epoch": 1.7, "learning_rate": 4.506520538854945e-05, "loss": 0.007, "step": 655660 }, { "epoch": 1.7, "learning_rate": 4.506131717217799e-05, "loss": 0.0065, "step": 655670 }, { "epoch": 1.7, "learning_rate": 4.505742895580653e-05, "loss": 0.008, "step": 655680 }, { "epoch": 1.7, "learning_rate": 4.5053540739435064e-05, "loss": 0.0079, "step": 655690 }, { "epoch": 1.7, "learning_rate": 4.50496525230636e-05, "loss": 0.0087, "step": 655700 }, { "epoch": 1.7, "learning_rate": 4.5045764306692134e-05, "loss": 0.0073, "step": 655710 }, { "epoch": 1.7, "learning_rate": 4.504187609032067e-05, "loss": 0.0083, "step": 655720 }, { "epoch": 1.7, "learning_rate": 4.5037987873949204e-05, "loss": 0.0072, "step": 655730 }, { "epoch": 1.7, "learning_rate": 4.503409965757774e-05, "loss": 0.0066, "step": 655740 }, { "epoch": 1.7, "learning_rate": 4.5030211441206274e-05, "loss": 0.0057, "step": 655750 }, { "epoch": 1.7, "learning_rate": 4.5026323224834815e-05, "loss": 0.0082, "step": 655760 }, { "epoch": 1.7, "learning_rate": 4.502243500846335e-05, "loss": 0.0109, "step": 655770 }, { "epoch": 1.7, "learning_rate": 4.5018546792091885e-05, "loss": 0.0073, "step": 655780 }, { "epoch": 1.7, "learning_rate": 4.501465857572042e-05, "loss": 0.0084, "step": 655790 }, { "epoch": 1.7, "learning_rate": 4.5010770359348955e-05, "loss": 0.0063, "step": 655800 }, { "epoch": 1.7, "learning_rate": 4.500688214297749e-05, "loss": 0.0091, "step": 655810 }, { "epoch": 1.7, "learning_rate": 4.5002993926606024e-05, "loss": 0.008, "step": 655820 }, { "epoch": 1.7, "learning_rate": 4.499910571023456e-05, "loss": 0.0094, "step": 655830 }, { "epoch": 1.7, "learning_rate": 4.49952174938631e-05, "loss": 0.0081, "step": 655840 }, { "epoch": 1.7, "learning_rate": 4.4991329277491636e-05, "loss": 0.0076, "step": 655850 }, { "epoch": 1.7, "learning_rate": 4.498744106112017e-05, "loss": 0.0107, "step": 655860 }, { "epoch": 1.7, "learning_rate": 4.49835528447487e-05, "loss": 0.0063, "step": 655870 }, { "epoch": 1.7, "learning_rate": 4.4979664628377234e-05, "loss": 0.0065, "step": 655880 }, { "epoch": 1.7, "learning_rate": 4.497577641200577e-05, "loss": 0.0093, "step": 655890 }, { "epoch": 1.7, "learning_rate": 4.49718881956343e-05, "loss": 0.0065, "step": 655900 }, { "epoch": 1.7, "learning_rate": 4.496799997926284e-05, "loss": 0.006, "step": 655910 }, { "epoch": 1.7, "learning_rate": 4.496411176289137e-05, "loss": 0.0066, "step": 655920 }, { "epoch": 1.7, "learning_rate": 4.496022354651991e-05, "loss": 0.0081, "step": 655930 }, { "epoch": 1.7, "learning_rate": 4.495633533014845e-05, "loss": 0.009, "step": 655940 }, { "epoch": 1.7, "learning_rate": 4.4952447113776984e-05, "loss": 0.0114, "step": 655950 }, { "epoch": 1.7, "learning_rate": 4.494855889740552e-05, "loss": 0.0075, "step": 655960 }, { "epoch": 1.7, "learning_rate": 4.4944670681034054e-05, "loss": 0.0069, "step": 655970 }, { "epoch": 1.7, "learning_rate": 4.494078246466259e-05, "loss": 0.0083, "step": 655980 }, { "epoch": 1.7, "learning_rate": 4.4936894248291124e-05, "loss": 0.0066, "step": 655990 }, { "epoch": 1.7, "learning_rate": 4.493300603191966e-05, "loss": 0.0096, "step": 656000 }, { "epoch": 1.7, "eval_cer": 0.8816676953998133, "eval_loss": 0.005197363439947367, "eval_runtime": 108.0429, "eval_samples_per_second": 18.511, "eval_steps_per_second": 4.628, "step": 656000 }, { "epoch": 1.7, "learning_rate": 4.4929117815548194e-05, "loss": 0.0084, "step": 656010 }, { "epoch": 1.7, "learning_rate": 4.4925229599176735e-05, "loss": 0.0082, "step": 656020 }, { "epoch": 1.7, "learning_rate": 4.492134138280527e-05, "loss": 0.0084, "step": 656030 }, { "epoch": 1.7, "learning_rate": 4.4917453166433805e-05, "loss": 0.0106, "step": 656040 }, { "epoch": 1.7, "learning_rate": 4.491356495006234e-05, "loss": 0.0129, "step": 656050 }, { "epoch": 1.7, "learning_rate": 4.4909676733690875e-05, "loss": 0.0082, "step": 656060 }, { "epoch": 1.7, "learning_rate": 4.490578851731941e-05, "loss": 0.0083, "step": 656070 }, { "epoch": 1.7, "learning_rate": 4.4901900300947944e-05, "loss": 0.0063, "step": 656080 }, { "epoch": 1.7, "learning_rate": 4.489801208457648e-05, "loss": 0.0063, "step": 656090 }, { "epoch": 1.7, "learning_rate": 4.489412386820502e-05, "loss": 0.0079, "step": 656100 }, { "epoch": 1.7, "learning_rate": 4.4890235651833556e-05, "loss": 0.009, "step": 656110 }, { "epoch": 1.7, "learning_rate": 4.4886347435462084e-05, "loss": 0.0081, "step": 656120 }, { "epoch": 1.7, "learning_rate": 4.488245921909062e-05, "loss": 0.0082, "step": 656130 }, { "epoch": 1.7, "learning_rate": 4.4878571002719154e-05, "loss": 0.0072, "step": 656140 }, { "epoch": 1.7, "learning_rate": 4.487468278634769e-05, "loss": 0.0064, "step": 656150 }, { "epoch": 1.7, "learning_rate": 4.487079456997622e-05, "loss": 0.0084, "step": 656160 }, { "epoch": 1.7, "learning_rate": 4.486690635360476e-05, "loss": 0.0073, "step": 656170 }, { "epoch": 1.7, "learning_rate": 4.486301813723329e-05, "loss": 0.0073, "step": 656180 }, { "epoch": 1.7, "learning_rate": 4.485912992086183e-05, "loss": 0.0068, "step": 656190 }, { "epoch": 1.7, "learning_rate": 4.485524170449037e-05, "loss": 0.0085, "step": 656200 }, { "epoch": 1.7, "learning_rate": 4.4851353488118904e-05, "loss": 0.0084, "step": 656210 }, { "epoch": 1.7, "learning_rate": 4.484746527174744e-05, "loss": 0.01, "step": 656220 }, { "epoch": 1.7, "learning_rate": 4.4843577055375974e-05, "loss": 0.01, "step": 656230 }, { "epoch": 1.7, "learning_rate": 4.483968883900451e-05, "loss": 0.0112, "step": 656240 }, { "epoch": 1.7, "learning_rate": 4.4835800622633044e-05, "loss": 0.0089, "step": 656250 }, { "epoch": 1.7, "learning_rate": 4.483191240626158e-05, "loss": 0.0076, "step": 656260 }, { "epoch": 1.7, "learning_rate": 4.4828024189890114e-05, "loss": 0.0071, "step": 656270 }, { "epoch": 1.7, "learning_rate": 4.482413597351865e-05, "loss": 0.0071, "step": 656280 }, { "epoch": 1.7, "learning_rate": 4.482024775714719e-05, "loss": 0.0071, "step": 656290 }, { "epoch": 1.7, "learning_rate": 4.4816359540775725e-05, "loss": 0.009, "step": 656300 }, { "epoch": 1.7, "learning_rate": 4.481247132440426e-05, "loss": 0.006, "step": 656310 }, { "epoch": 1.7, "learning_rate": 4.4808583108032795e-05, "loss": 0.0074, "step": 656320 }, { "epoch": 1.7, "learning_rate": 4.480469489166133e-05, "loss": 0.0066, "step": 656330 }, { "epoch": 1.7, "learning_rate": 4.4800806675289864e-05, "loss": 0.0083, "step": 656340 }, { "epoch": 1.7, "learning_rate": 4.47969184589184e-05, "loss": 0.0073, "step": 656350 }, { "epoch": 1.7, "learning_rate": 4.4793030242546934e-05, "loss": 0.0077, "step": 656360 }, { "epoch": 1.7, "learning_rate": 4.478914202617546e-05, "loss": 0.0079, "step": 656370 }, { "epoch": 1.7, "learning_rate": 4.4785253809804e-05, "loss": 0.0081, "step": 656380 }, { "epoch": 1.7, "learning_rate": 4.478136559343254e-05, "loss": 0.0058, "step": 656390 }, { "epoch": 1.7, "learning_rate": 4.4777477377061073e-05, "loss": 0.008, "step": 656400 }, { "epoch": 1.7, "learning_rate": 4.477358916068961e-05, "loss": 0.0086, "step": 656410 }, { "epoch": 1.7, "learning_rate": 4.476970094431814e-05, "loss": 0.0074, "step": 656420 }, { "epoch": 1.7, "learning_rate": 4.476581272794668e-05, "loss": 0.0082, "step": 656430 }, { "epoch": 1.7, "learning_rate": 4.476192451157521e-05, "loss": 0.0081, "step": 656440 }, { "epoch": 1.7, "learning_rate": 4.475803629520375e-05, "loss": 0.0084, "step": 656450 }, { "epoch": 1.7, "learning_rate": 4.475414807883228e-05, "loss": 0.007, "step": 656460 }, { "epoch": 1.7, "learning_rate": 4.4750259862460824e-05, "loss": 0.0102, "step": 656470 }, { "epoch": 1.7, "learning_rate": 4.474637164608936e-05, "loss": 0.0085, "step": 656480 }, { "epoch": 1.7, "learning_rate": 4.4742483429717894e-05, "loss": 0.0056, "step": 656490 }, { "epoch": 1.7, "learning_rate": 4.473859521334643e-05, "loss": 0.0064, "step": 656500 }, { "epoch": 1.7, "learning_rate": 4.4734706996974964e-05, "loss": 0.0079, "step": 656510 }, { "epoch": 1.7, "learning_rate": 4.47308187806035e-05, "loss": 0.0096, "step": 656520 }, { "epoch": 1.7, "learning_rate": 4.4726930564232033e-05, "loss": 0.0067, "step": 656530 }, { "epoch": 1.7, "learning_rate": 4.472304234786057e-05, "loss": 0.0097, "step": 656540 }, { "epoch": 1.7, "learning_rate": 4.471915413148911e-05, "loss": 0.011, "step": 656550 }, { "epoch": 1.7, "learning_rate": 4.4715265915117645e-05, "loss": 0.0078, "step": 656560 }, { "epoch": 1.7, "learning_rate": 4.471137769874618e-05, "loss": 0.011, "step": 656570 }, { "epoch": 1.7, "learning_rate": 4.4707489482374715e-05, "loss": 0.0091, "step": 656580 }, { "epoch": 1.7, "learning_rate": 4.470360126600325e-05, "loss": 0.0065, "step": 656590 }, { "epoch": 1.7, "learning_rate": 4.4699713049631784e-05, "loss": 0.0075, "step": 656600 }, { "epoch": 1.7, "learning_rate": 4.469582483326032e-05, "loss": 0.0106, "step": 656610 }, { "epoch": 1.7, "learning_rate": 4.469193661688885e-05, "loss": 0.006, "step": 656620 }, { "epoch": 1.7, "learning_rate": 4.468804840051738e-05, "loss": 0.0093, "step": 656630 }, { "epoch": 1.7, "learning_rate": 4.468416018414592e-05, "loss": 0.0091, "step": 656640 }, { "epoch": 1.7, "learning_rate": 4.468027196777446e-05, "loss": 0.0072, "step": 656650 }, { "epoch": 1.7, "learning_rate": 4.4676383751402993e-05, "loss": 0.0072, "step": 656660 }, { "epoch": 1.7, "learning_rate": 4.467249553503153e-05, "loss": 0.0095, "step": 656670 }, { "epoch": 1.7, "learning_rate": 4.466860731866006e-05, "loss": 0.0078, "step": 656680 }, { "epoch": 1.7, "learning_rate": 4.46647191022886e-05, "loss": 0.01, "step": 656690 }, { "epoch": 1.7, "learning_rate": 4.466083088591713e-05, "loss": 0.0089, "step": 656700 }, { "epoch": 1.7, "learning_rate": 4.465694266954567e-05, "loss": 0.0069, "step": 656710 }, { "epoch": 1.7, "learning_rate": 4.46530544531742e-05, "loss": 0.0092, "step": 656720 }, { "epoch": 1.7, "learning_rate": 4.4649166236802744e-05, "loss": 0.0063, "step": 656730 }, { "epoch": 1.7, "learning_rate": 4.464527802043128e-05, "loss": 0.0085, "step": 656740 }, { "epoch": 1.7, "learning_rate": 4.4641389804059814e-05, "loss": 0.0105, "step": 656750 }, { "epoch": 1.7, "learning_rate": 4.463750158768835e-05, "loss": 0.0085, "step": 656760 }, { "epoch": 1.7, "learning_rate": 4.4633613371316884e-05, "loss": 0.0069, "step": 656770 }, { "epoch": 1.7, "learning_rate": 4.462972515494542e-05, "loss": 0.0074, "step": 656780 }, { "epoch": 1.7, "learning_rate": 4.4625836938573953e-05, "loss": 0.007, "step": 656790 }, { "epoch": 1.7, "learning_rate": 4.462194872220249e-05, "loss": 0.0091, "step": 656800 }, { "epoch": 1.7, "learning_rate": 4.461806050583103e-05, "loss": 0.0091, "step": 656810 }, { "epoch": 1.7, "learning_rate": 4.4614172289459565e-05, "loss": 0.0097, "step": 656820 }, { "epoch": 1.7, "learning_rate": 4.46102840730881e-05, "loss": 0.0075, "step": 656830 }, { "epoch": 1.7, "learning_rate": 4.4606395856716635e-05, "loss": 0.0091, "step": 656840 }, { "epoch": 1.7, "learning_rate": 4.460250764034517e-05, "loss": 0.0073, "step": 656850 }, { "epoch": 1.7, "learning_rate": 4.4598619423973704e-05, "loss": 0.0072, "step": 656860 }, { "epoch": 1.7, "learning_rate": 4.459473120760223e-05, "loss": 0.0087, "step": 656870 }, { "epoch": 1.7, "learning_rate": 4.459084299123077e-05, "loss": 0.0072, "step": 656880 }, { "epoch": 1.7, "learning_rate": 4.45869547748593e-05, "loss": 0.0194, "step": 656890 }, { "epoch": 1.7, "learning_rate": 4.458306655848784e-05, "loss": 0.0083, "step": 656900 }, { "epoch": 1.7, "learning_rate": 4.457917834211638e-05, "loss": 0.0087, "step": 656910 }, { "epoch": 1.7, "learning_rate": 4.4575290125744913e-05, "loss": 0.0066, "step": 656920 }, { "epoch": 1.7, "learning_rate": 4.457140190937345e-05, "loss": 0.0118, "step": 656930 }, { "epoch": 1.7, "learning_rate": 4.456751369300198e-05, "loss": 0.0075, "step": 656940 }, { "epoch": 1.7, "learning_rate": 4.456362547663052e-05, "loss": 0.0077, "step": 656950 }, { "epoch": 1.7, "learning_rate": 4.455973726025905e-05, "loss": 0.0065, "step": 656960 }, { "epoch": 1.7, "learning_rate": 4.455584904388759e-05, "loss": 0.0065, "step": 656970 }, { "epoch": 1.7, "learning_rate": 4.455196082751612e-05, "loss": 0.0091, "step": 656980 }, { "epoch": 1.7, "learning_rate": 4.4548072611144664e-05, "loss": 0.0074, "step": 656990 }, { "epoch": 1.7, "learning_rate": 4.45441843947732e-05, "loss": 0.0077, "step": 657000 }, { "epoch": 1.7, "eval_cer": 0.88167329394755, "eval_loss": 0.005158776883035898, "eval_runtime": 108.0407, "eval_samples_per_second": 18.512, "eval_steps_per_second": 4.628, "step": 657000 }, { "epoch": 1.7, "learning_rate": 4.4540296178401734e-05, "loss": 0.0071, "step": 657010 }, { "epoch": 1.7, "learning_rate": 4.453640796203027e-05, "loss": 0.009, "step": 657020 }, { "epoch": 1.7, "learning_rate": 4.4532519745658804e-05, "loss": 0.0086, "step": 657030 }, { "epoch": 1.7, "learning_rate": 4.452863152928734e-05, "loss": 0.0072, "step": 657040 }, { "epoch": 1.7, "learning_rate": 4.452474331291587e-05, "loss": 0.0076, "step": 657050 }, { "epoch": 1.7, "learning_rate": 4.452085509654441e-05, "loss": 0.0076, "step": 657060 }, { "epoch": 1.7, "learning_rate": 4.451696688017295e-05, "loss": 0.0077, "step": 657070 }, { "epoch": 1.7, "learning_rate": 4.4513078663801485e-05, "loss": 0.0086, "step": 657080 }, { "epoch": 1.7, "learning_rate": 4.450919044743002e-05, "loss": 0.0084, "step": 657090 }, { "epoch": 1.7, "learning_rate": 4.4505302231058554e-05, "loss": 0.0084, "step": 657100 }, { "epoch": 1.7, "learning_rate": 4.450141401468709e-05, "loss": 0.0069, "step": 657110 }, { "epoch": 1.7, "learning_rate": 4.449752579831562e-05, "loss": 0.0087, "step": 657120 }, { "epoch": 1.7, "learning_rate": 4.449363758194415e-05, "loss": 0.0064, "step": 657130 }, { "epoch": 1.7, "learning_rate": 4.448974936557269e-05, "loss": 0.0075, "step": 657140 }, { "epoch": 1.7, "learning_rate": 4.448586114920122e-05, "loss": 0.0068, "step": 657150 }, { "epoch": 1.7, "learning_rate": 4.448197293282976e-05, "loss": 0.005, "step": 657160 }, { "epoch": 1.7, "learning_rate": 4.44780847164583e-05, "loss": 0.0065, "step": 657170 }, { "epoch": 1.7, "learning_rate": 4.447419650008683e-05, "loss": 0.0055, "step": 657180 }, { "epoch": 1.7, "learning_rate": 4.447030828371537e-05, "loss": 0.0076, "step": 657190 }, { "epoch": 1.7, "learning_rate": 4.44664200673439e-05, "loss": 0.0071, "step": 657200 }, { "epoch": 1.7, "learning_rate": 4.446253185097244e-05, "loss": 0.0091, "step": 657210 }, { "epoch": 1.7, "learning_rate": 4.445864363460097e-05, "loss": 0.0081, "step": 657220 }, { "epoch": 1.7, "learning_rate": 4.445475541822951e-05, "loss": 0.0071, "step": 657230 }, { "epoch": 1.7, "learning_rate": 4.445086720185804e-05, "loss": 0.0075, "step": 657240 }, { "epoch": 1.7, "learning_rate": 4.4446978985486584e-05, "loss": 0.0071, "step": 657250 }, { "epoch": 1.7, "learning_rate": 4.444309076911512e-05, "loss": 0.0072, "step": 657260 }, { "epoch": 1.7, "learning_rate": 4.4439202552743654e-05, "loss": 0.0067, "step": 657270 }, { "epoch": 1.7, "learning_rate": 4.443531433637219e-05, "loss": 0.0091, "step": 657280 }, { "epoch": 1.7, "learning_rate": 4.4431426120000724e-05, "loss": 0.0049, "step": 657290 }, { "epoch": 1.7, "learning_rate": 4.442753790362926e-05, "loss": 0.0081, "step": 657300 }, { "epoch": 1.7, "learning_rate": 4.442364968725779e-05, "loss": 0.0089, "step": 657310 }, { "epoch": 1.7, "learning_rate": 4.441976147088633e-05, "loss": 0.0072, "step": 657320 }, { "epoch": 1.7, "learning_rate": 4.441587325451487e-05, "loss": 0.0074, "step": 657330 }, { "epoch": 1.7, "learning_rate": 4.4411985038143405e-05, "loss": 0.0117, "step": 657340 }, { "epoch": 1.7, "learning_rate": 4.440809682177194e-05, "loss": 0.0105, "step": 657350 }, { "epoch": 1.7, "learning_rate": 4.440420860540047e-05, "loss": 0.0095, "step": 657360 }, { "epoch": 1.7, "learning_rate": 4.4400320389029e-05, "loss": 0.0099, "step": 657370 }, { "epoch": 1.7, "learning_rate": 4.439643217265754e-05, "loss": 0.0086, "step": 657380 }, { "epoch": 1.7, "learning_rate": 4.439254395628607e-05, "loss": 0.0096, "step": 657390 }, { "epoch": 1.7, "learning_rate": 4.438865573991461e-05, "loss": 0.0093, "step": 657400 }, { "epoch": 1.7, "learning_rate": 4.438476752354314e-05, "loss": 0.0109, "step": 657410 }, { "epoch": 1.7, "learning_rate": 4.438087930717168e-05, "loss": 0.0068, "step": 657420 }, { "epoch": 1.7, "learning_rate": 4.437699109080022e-05, "loss": 0.0092, "step": 657430 }, { "epoch": 1.7, "learning_rate": 4.437310287442875e-05, "loss": 0.007, "step": 657440 }, { "epoch": 1.7, "learning_rate": 4.436921465805729e-05, "loss": 0.0087, "step": 657450 }, { "epoch": 1.7, "learning_rate": 4.436532644168582e-05, "loss": 0.0088, "step": 657460 }, { "epoch": 1.7, "learning_rate": 4.436143822531436e-05, "loss": 0.0093, "step": 657470 }, { "epoch": 1.7, "learning_rate": 4.435755000894289e-05, "loss": 0.0061, "step": 657480 }, { "epoch": 1.7, "learning_rate": 4.435366179257143e-05, "loss": 0.0064, "step": 657490 }, { "epoch": 1.7, "learning_rate": 4.434977357619996e-05, "loss": 0.0065, "step": 657500 }, { "epoch": 1.7, "learning_rate": 4.4345885359828504e-05, "loss": 0.0087, "step": 657510 }, { "epoch": 1.7, "learning_rate": 4.434199714345704e-05, "loss": 0.0079, "step": 657520 }, { "epoch": 1.7, "learning_rate": 4.4338108927085574e-05, "loss": 0.0066, "step": 657530 }, { "epoch": 1.7, "learning_rate": 4.433422071071411e-05, "loss": 0.0064, "step": 657540 }, { "epoch": 1.7, "learning_rate": 4.4330332494342644e-05, "loss": 0.0076, "step": 657550 }, { "epoch": 1.7, "learning_rate": 4.432644427797118e-05, "loss": 0.0079, "step": 657560 }, { "epoch": 1.7, "learning_rate": 4.432255606159971e-05, "loss": 0.0079, "step": 657570 }, { "epoch": 1.7, "learning_rate": 4.431866784522825e-05, "loss": 0.0094, "step": 657580 }, { "epoch": 1.7, "learning_rate": 4.431477962885678e-05, "loss": 0.0097, "step": 657590 }, { "epoch": 1.7, "learning_rate": 4.4310891412485325e-05, "loss": 0.0083, "step": 657600 }, { "epoch": 1.7, "learning_rate": 4.430700319611385e-05, "loss": 0.0064, "step": 657610 }, { "epoch": 1.7, "learning_rate": 4.430311497974239e-05, "loss": 0.0055, "step": 657620 }, { "epoch": 1.7, "learning_rate": 4.429922676337092e-05, "loss": 0.0077, "step": 657630 }, { "epoch": 1.7, "learning_rate": 4.429533854699946e-05, "loss": 0.01, "step": 657640 }, { "epoch": 1.7, "learning_rate": 4.429145033062799e-05, "loss": 0.0083, "step": 657650 }, { "epoch": 1.7, "learning_rate": 4.428756211425653e-05, "loss": 0.0127, "step": 657660 }, { "epoch": 1.7, "learning_rate": 4.428367389788506e-05, "loss": 0.0044, "step": 657670 }, { "epoch": 1.7, "learning_rate": 4.42797856815136e-05, "loss": 0.0121, "step": 657680 }, { "epoch": 1.7, "learning_rate": 4.427589746514213e-05, "loss": 0.0115, "step": 657690 }, { "epoch": 1.7, "learning_rate": 4.427200924877067e-05, "loss": 0.0074, "step": 657700 }, { "epoch": 1.7, "learning_rate": 4.426812103239921e-05, "loss": 0.0078, "step": 657710 }, { "epoch": 1.7, "learning_rate": 4.426423281602774e-05, "loss": 0.008, "step": 657720 }, { "epoch": 1.7, "learning_rate": 4.426034459965628e-05, "loss": 0.0081, "step": 657730 }, { "epoch": 1.7, "learning_rate": 4.425645638328481e-05, "loss": 0.0083, "step": 657740 }, { "epoch": 1.7, "learning_rate": 4.425256816691335e-05, "loss": 0.0075, "step": 657750 }, { "epoch": 1.71, "learning_rate": 4.424867995054188e-05, "loss": 0.0087, "step": 657760 }, { "epoch": 1.71, "learning_rate": 4.424479173417042e-05, "loss": 0.0071, "step": 657770 }, { "epoch": 1.71, "learning_rate": 4.424090351779896e-05, "loss": 0.0076, "step": 657780 }, { "epoch": 1.71, "learning_rate": 4.4237015301427494e-05, "loss": 0.0051, "step": 657790 }, { "epoch": 1.71, "learning_rate": 4.423312708505603e-05, "loss": 0.0073, "step": 657800 }, { "epoch": 1.71, "learning_rate": 4.4229238868684564e-05, "loss": 0.0078, "step": 657810 }, { "epoch": 1.71, "learning_rate": 4.42253506523131e-05, "loss": 0.01, "step": 657820 }, { "epoch": 1.71, "learning_rate": 4.422146243594163e-05, "loss": 0.0079, "step": 657830 }, { "epoch": 1.71, "learning_rate": 4.421757421957017e-05, "loss": 0.0078, "step": 657840 }, { "epoch": 1.71, "learning_rate": 4.42136860031987e-05, "loss": 0.0078, "step": 657850 }, { "epoch": 1.71, "learning_rate": 4.420979778682723e-05, "loss": 0.0075, "step": 657860 }, { "epoch": 1.71, "learning_rate": 4.4205909570455766e-05, "loss": 0.0052, "step": 657870 }, { "epoch": 1.71, "learning_rate": 4.420202135408431e-05, "loss": 0.009, "step": 657880 }, { "epoch": 1.71, "learning_rate": 4.419813313771284e-05, "loss": 0.0052, "step": 657890 }, { "epoch": 1.71, "learning_rate": 4.419424492134138e-05, "loss": 0.0072, "step": 657900 }, { "epoch": 1.71, "learning_rate": 4.419035670496991e-05, "loss": 0.0088, "step": 657910 }, { "epoch": 1.71, "learning_rate": 4.418646848859845e-05, "loss": 0.007, "step": 657920 }, { "epoch": 1.71, "learning_rate": 4.418258027222698e-05, "loss": 0.0118, "step": 657930 }, { "epoch": 1.71, "learning_rate": 4.417869205585552e-05, "loss": 0.0083, "step": 657940 }, { "epoch": 1.71, "learning_rate": 4.417480383948405e-05, "loss": 0.0106, "step": 657950 }, { "epoch": 1.71, "learning_rate": 4.417091562311259e-05, "loss": 0.0069, "step": 657960 }, { "epoch": 1.71, "learning_rate": 4.416702740674113e-05, "loss": 0.0052, "step": 657970 }, { "epoch": 1.71, "learning_rate": 4.416313919036966e-05, "loss": 0.0084, "step": 657980 }, { "epoch": 1.71, "learning_rate": 4.41592509739982e-05, "loss": 0.0079, "step": 657990 }, { "epoch": 1.71, "learning_rate": 4.415536275762673e-05, "loss": 0.0094, "step": 658000 }, { "epoch": 1.71, "eval_cer": 0.8816830914060892, "eval_loss": 0.005186532158404589, "eval_runtime": 107.9432, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 658000 }, { "epoch": 1.71, "learning_rate": 4.415147454125527e-05, "loss": 0.008, "step": 658010 }, { "epoch": 1.71, "learning_rate": 4.41475863248838e-05, "loss": 0.0104, "step": 658020 }, { "epoch": 1.71, "learning_rate": 4.414369810851234e-05, "loss": 0.0098, "step": 658030 }, { "epoch": 1.71, "learning_rate": 4.413980989214088e-05, "loss": 0.0079, "step": 658040 }, { "epoch": 1.71, "learning_rate": 4.4135921675769414e-05, "loss": 0.0062, "step": 658050 }, { "epoch": 1.71, "learning_rate": 4.413203345939795e-05, "loss": 0.0086, "step": 658060 }, { "epoch": 1.71, "learning_rate": 4.4128145243026483e-05, "loss": 0.0085, "step": 658070 }, { "epoch": 1.71, "learning_rate": 4.412425702665502e-05, "loss": 0.0074, "step": 658080 }, { "epoch": 1.71, "learning_rate": 4.412036881028355e-05, "loss": 0.0091, "step": 658090 }, { "epoch": 1.71, "learning_rate": 4.411648059391209e-05, "loss": 0.0085, "step": 658100 }, { "epoch": 1.71, "learning_rate": 4.4112592377540616e-05, "loss": 0.0089, "step": 658110 }, { "epoch": 1.71, "learning_rate": 4.410870416116915e-05, "loss": 0.0066, "step": 658120 }, { "epoch": 1.71, "learning_rate": 4.4104815944797686e-05, "loss": 0.0118, "step": 658130 }, { "epoch": 1.71, "learning_rate": 4.410092772842623e-05, "loss": 0.0075, "step": 658140 }, { "epoch": 1.71, "learning_rate": 4.409703951205476e-05, "loss": 0.0087, "step": 658150 }, { "epoch": 1.71, "learning_rate": 4.40931512956833e-05, "loss": 0.0066, "step": 658160 }, { "epoch": 1.71, "learning_rate": 4.408926307931183e-05, "loss": 0.0065, "step": 658170 }, { "epoch": 1.71, "learning_rate": 4.408537486294037e-05, "loss": 0.0097, "step": 658180 }, { "epoch": 1.71, "learning_rate": 4.40814866465689e-05, "loss": 0.0082, "step": 658190 }, { "epoch": 1.71, "learning_rate": 4.407759843019744e-05, "loss": 0.0081, "step": 658200 }, { "epoch": 1.71, "learning_rate": 4.407371021382597e-05, "loss": 0.0067, "step": 658210 }, { "epoch": 1.71, "learning_rate": 4.406982199745451e-05, "loss": 0.0059, "step": 658220 }, { "epoch": 1.71, "learning_rate": 4.406593378108305e-05, "loss": 0.0065, "step": 658230 }, { "epoch": 1.71, "learning_rate": 4.406204556471158e-05, "loss": 0.0103, "step": 658240 }, { "epoch": 1.71, "learning_rate": 4.405815734834012e-05, "loss": 0.0078, "step": 658250 }, { "epoch": 1.71, "learning_rate": 4.405426913196865e-05, "loss": 0.0082, "step": 658260 }, { "epoch": 1.71, "learning_rate": 4.405038091559719e-05, "loss": 0.0068, "step": 658270 }, { "epoch": 1.71, "learning_rate": 4.404649269922572e-05, "loss": 0.0086, "step": 658280 }, { "epoch": 1.71, "learning_rate": 4.404260448285426e-05, "loss": 0.0072, "step": 658290 }, { "epoch": 1.71, "learning_rate": 4.40387162664828e-05, "loss": 0.01, "step": 658300 }, { "epoch": 1.71, "learning_rate": 4.4034828050111334e-05, "loss": 0.01, "step": 658310 }, { "epoch": 1.71, "learning_rate": 4.403093983373987e-05, "loss": 0.0062, "step": 658320 }, { "epoch": 1.71, "learning_rate": 4.4027051617368403e-05, "loss": 0.0063, "step": 658330 }, { "epoch": 1.71, "learning_rate": 4.402316340099694e-05, "loss": 0.0064, "step": 658340 }, { "epoch": 1.71, "learning_rate": 4.401927518462547e-05, "loss": 0.0093, "step": 658350 }, { "epoch": 1.71, "learning_rate": 4.4015386968254e-05, "loss": 0.0116, "step": 658360 }, { "epoch": 1.71, "learning_rate": 4.4011498751882536e-05, "loss": 0.0067, "step": 658370 }, { "epoch": 1.71, "learning_rate": 4.400761053551107e-05, "loss": 0.0086, "step": 658380 }, { "epoch": 1.71, "learning_rate": 4.4003722319139606e-05, "loss": 0.0084, "step": 658390 }, { "epoch": 1.71, "learning_rate": 4.399983410276815e-05, "loss": 0.0075, "step": 658400 }, { "epoch": 1.71, "learning_rate": 4.399594588639668e-05, "loss": 0.0108, "step": 658410 }, { "epoch": 1.71, "learning_rate": 4.399205767002522e-05, "loss": 0.0089, "step": 658420 }, { "epoch": 1.71, "learning_rate": 4.398816945365375e-05, "loss": 0.0088, "step": 658430 }, { "epoch": 1.71, "learning_rate": 4.398428123728229e-05, "loss": 0.0087, "step": 658440 }, { "epoch": 1.71, "learning_rate": 4.398039302091082e-05, "loss": 0.0075, "step": 658450 }, { "epoch": 1.71, "learning_rate": 4.3976504804539357e-05, "loss": 0.0105, "step": 658460 }, { "epoch": 1.71, "learning_rate": 4.397261658816789e-05, "loss": 0.0085, "step": 658470 }, { "epoch": 1.71, "learning_rate": 4.396872837179643e-05, "loss": 0.0058, "step": 658480 }, { "epoch": 1.71, "learning_rate": 4.396484015542497e-05, "loss": 0.0088, "step": 658490 }, { "epoch": 1.71, "learning_rate": 4.39609519390535e-05, "loss": 0.0089, "step": 658500 }, { "epoch": 1.71, "learning_rate": 4.395706372268204e-05, "loss": 0.0093, "step": 658510 }, { "epoch": 1.71, "learning_rate": 4.395317550631057e-05, "loss": 0.007, "step": 658520 }, { "epoch": 1.71, "learning_rate": 4.394928728993911e-05, "loss": 0.0086, "step": 658530 }, { "epoch": 1.71, "learning_rate": 4.394539907356764e-05, "loss": 0.0076, "step": 658540 }, { "epoch": 1.71, "learning_rate": 4.394151085719618e-05, "loss": 0.0097, "step": 658550 }, { "epoch": 1.71, "learning_rate": 4.393762264082472e-05, "loss": 0.0084, "step": 658560 }, { "epoch": 1.71, "learning_rate": 4.3933734424453254e-05, "loss": 0.0083, "step": 658570 }, { "epoch": 1.71, "learning_rate": 4.392984620808179e-05, "loss": 0.0089, "step": 658580 }, { "epoch": 1.71, "learning_rate": 4.392595799171032e-05, "loss": 0.0079, "step": 658590 }, { "epoch": 1.71, "learning_rate": 4.392206977533885e-05, "loss": 0.009, "step": 658600 }, { "epoch": 1.71, "learning_rate": 4.3918181558967386e-05, "loss": 0.0093, "step": 658610 }, { "epoch": 1.71, "learning_rate": 4.391429334259592e-05, "loss": 0.0055, "step": 658620 }, { "epoch": 1.71, "learning_rate": 4.3910405126224456e-05, "loss": 0.0071, "step": 658630 }, { "epoch": 1.71, "learning_rate": 4.390651690985299e-05, "loss": 0.008, "step": 658640 }, { "epoch": 1.71, "learning_rate": 4.3902628693481526e-05, "loss": 0.0067, "step": 658650 }, { "epoch": 1.71, "learning_rate": 4.389874047711007e-05, "loss": 0.0071, "step": 658660 }, { "epoch": 1.71, "learning_rate": 4.38948522607386e-05, "loss": 0.0084, "step": 658670 }, { "epoch": 1.71, "learning_rate": 4.389096404436714e-05, "loss": 0.009, "step": 658680 }, { "epoch": 1.71, "learning_rate": 4.388707582799567e-05, "loss": 0.0098, "step": 658690 }, { "epoch": 1.71, "learning_rate": 4.388318761162421e-05, "loss": 0.0104, "step": 658700 }, { "epoch": 1.71, "learning_rate": 4.387929939525274e-05, "loss": 0.0071, "step": 658710 }, { "epoch": 1.71, "learning_rate": 4.3875411178881277e-05, "loss": 0.0084, "step": 658720 }, { "epoch": 1.71, "learning_rate": 4.387152296250981e-05, "loss": 0.0095, "step": 658730 }, { "epoch": 1.71, "learning_rate": 4.386763474613835e-05, "loss": 0.0073, "step": 658740 }, { "epoch": 1.71, "learning_rate": 4.386374652976689e-05, "loss": 0.0096, "step": 658750 }, { "epoch": 1.71, "learning_rate": 4.385985831339542e-05, "loss": 0.0076, "step": 658760 }, { "epoch": 1.71, "learning_rate": 4.385597009702396e-05, "loss": 0.0161, "step": 658770 }, { "epoch": 1.71, "learning_rate": 4.385208188065249e-05, "loss": 0.0053, "step": 658780 }, { "epoch": 1.71, "learning_rate": 4.384819366428103e-05, "loss": 0.0045, "step": 658790 }, { "epoch": 1.71, "learning_rate": 4.384430544790956e-05, "loss": 0.0085, "step": 658800 }, { "epoch": 1.71, "learning_rate": 4.38404172315381e-05, "loss": 0.0075, "step": 658810 }, { "epoch": 1.71, "learning_rate": 4.383652901516664e-05, "loss": 0.0061, "step": 658820 }, { "epoch": 1.71, "learning_rate": 4.3832640798795174e-05, "loss": 0.0075, "step": 658830 }, { "epoch": 1.71, "learning_rate": 4.382875258242371e-05, "loss": 0.0071, "step": 658840 }, { "epoch": 1.71, "learning_rate": 4.3824864366052237e-05, "loss": 0.0085, "step": 658850 }, { "epoch": 1.71, "learning_rate": 4.382097614968077e-05, "loss": 0.0079, "step": 658860 }, { "epoch": 1.71, "learning_rate": 4.3817087933309306e-05, "loss": 0.0124, "step": 658870 }, { "epoch": 1.71, "learning_rate": 4.381319971693784e-05, "loss": 0.0067, "step": 658880 }, { "epoch": 1.71, "learning_rate": 4.3809311500566376e-05, "loss": 0.0085, "step": 658890 }, { "epoch": 1.71, "learning_rate": 4.380542328419491e-05, "loss": 0.0088, "step": 658900 }, { "epoch": 1.71, "learning_rate": 4.3801535067823446e-05, "loss": 0.0088, "step": 658910 }, { "epoch": 1.71, "learning_rate": 4.379764685145199e-05, "loss": 0.0067, "step": 658920 }, { "epoch": 1.71, "learning_rate": 4.379375863508052e-05, "loss": 0.0096, "step": 658930 }, { "epoch": 1.71, "learning_rate": 4.378987041870906e-05, "loss": 0.0081, "step": 658940 }, { "epoch": 1.71, "learning_rate": 4.378598220233759e-05, "loss": 0.0097, "step": 658950 }, { "epoch": 1.71, "learning_rate": 4.378209398596613e-05, "loss": 0.0077, "step": 658960 }, { "epoch": 1.71, "learning_rate": 4.377820576959466e-05, "loss": 0.0076, "step": 658970 }, { "epoch": 1.71, "learning_rate": 4.3774317553223197e-05, "loss": 0.0086, "step": 658980 }, { "epoch": 1.71, "learning_rate": 4.377042933685173e-05, "loss": 0.0084, "step": 658990 }, { "epoch": 1.71, "learning_rate": 4.3766541120480266e-05, "loss": 0.0061, "step": 659000 }, { "epoch": 1.71, "eval_cer": 0.8816704946736816, "eval_loss": 0.005243065766990185, "eval_runtime": 107.9368, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 659000 }, { "epoch": 1.71, "learning_rate": 4.376265290410881e-05, "loss": 0.0086, "step": 659010 }, { "epoch": 1.71, "learning_rate": 4.375876468773734e-05, "loss": 0.0087, "step": 659020 }, { "epoch": 1.71, "learning_rate": 4.375487647136588e-05, "loss": 0.0077, "step": 659030 }, { "epoch": 1.71, "learning_rate": 4.375098825499441e-05, "loss": 0.0067, "step": 659040 }, { "epoch": 1.71, "learning_rate": 4.374710003862295e-05, "loss": 0.0092, "step": 659050 }, { "epoch": 1.71, "learning_rate": 4.374321182225148e-05, "loss": 0.0118, "step": 659060 }, { "epoch": 1.71, "learning_rate": 4.373932360588002e-05, "loss": 0.0092, "step": 659070 }, { "epoch": 1.71, "learning_rate": 4.373543538950855e-05, "loss": 0.0084, "step": 659080 }, { "epoch": 1.71, "learning_rate": 4.3731547173137094e-05, "loss": 0.006, "step": 659090 }, { "epoch": 1.71, "learning_rate": 4.372765895676562e-05, "loss": 0.0103, "step": 659100 }, { "epoch": 1.71, "learning_rate": 4.3723770740394156e-05, "loss": 0.0094, "step": 659110 }, { "epoch": 1.71, "learning_rate": 4.371988252402269e-05, "loss": 0.0075, "step": 659120 }, { "epoch": 1.71, "learning_rate": 4.3715994307651226e-05, "loss": 0.0087, "step": 659130 }, { "epoch": 1.71, "learning_rate": 4.371210609127976e-05, "loss": 0.0069, "step": 659140 }, { "epoch": 1.71, "learning_rate": 4.3708217874908296e-05, "loss": 0.0079, "step": 659150 }, { "epoch": 1.71, "learning_rate": 4.370432965853683e-05, "loss": 0.0077, "step": 659160 }, { "epoch": 1.71, "learning_rate": 4.3700441442165366e-05, "loss": 0.0073, "step": 659170 }, { "epoch": 1.71, "learning_rate": 4.36965532257939e-05, "loss": 0.0071, "step": 659180 }, { "epoch": 1.71, "learning_rate": 4.369266500942244e-05, "loss": 0.0088, "step": 659190 }, { "epoch": 1.71, "learning_rate": 4.368877679305098e-05, "loss": 0.0073, "step": 659200 }, { "epoch": 1.71, "learning_rate": 4.368488857667951e-05, "loss": 0.0076, "step": 659210 }, { "epoch": 1.71, "learning_rate": 4.368100036030805e-05, "loss": 0.0075, "step": 659220 }, { "epoch": 1.71, "learning_rate": 4.367711214393658e-05, "loss": 0.0052, "step": 659230 }, { "epoch": 1.71, "learning_rate": 4.3673223927565116e-05, "loss": 0.007, "step": 659240 }, { "epoch": 1.71, "learning_rate": 4.366933571119365e-05, "loss": 0.0071, "step": 659250 }, { "epoch": 1.71, "learning_rate": 4.3665447494822186e-05, "loss": 0.01, "step": 659260 }, { "epoch": 1.71, "learning_rate": 4.366155927845073e-05, "loss": 0.0105, "step": 659270 }, { "epoch": 1.71, "learning_rate": 4.365767106207926e-05, "loss": 0.0097, "step": 659280 }, { "epoch": 1.71, "learning_rate": 4.36537828457078e-05, "loss": 0.0069, "step": 659290 }, { "epoch": 1.71, "learning_rate": 4.364989462933633e-05, "loss": 0.0101, "step": 659300 }, { "epoch": 1.71, "learning_rate": 4.364600641296487e-05, "loss": 0.0072, "step": 659310 }, { "epoch": 1.71, "learning_rate": 4.36421181965934e-05, "loss": 0.0081, "step": 659320 }, { "epoch": 1.71, "learning_rate": 4.363822998022194e-05, "loss": 0.0092, "step": 659330 }, { "epoch": 1.71, "learning_rate": 4.363434176385047e-05, "loss": 0.0073, "step": 659340 }, { "epoch": 1.71, "learning_rate": 4.3630453547479e-05, "loss": 0.0106, "step": 659350 }, { "epoch": 1.71, "learning_rate": 4.3626565331107535e-05, "loss": 0.01, "step": 659360 }, { "epoch": 1.71, "learning_rate": 4.3622677114736076e-05, "loss": 0.009, "step": 659370 }, { "epoch": 1.71, "learning_rate": 4.361878889836461e-05, "loss": 0.0073, "step": 659380 }, { "epoch": 1.71, "learning_rate": 4.3614900681993146e-05, "loss": 0.0062, "step": 659390 }, { "epoch": 1.71, "learning_rate": 4.361101246562168e-05, "loss": 0.006, "step": 659400 }, { "epoch": 1.71, "learning_rate": 4.3607124249250216e-05, "loss": 0.0108, "step": 659410 }, { "epoch": 1.71, "learning_rate": 4.360323603287875e-05, "loss": 0.0106, "step": 659420 }, { "epoch": 1.71, "learning_rate": 4.3599347816507286e-05, "loss": 0.0079, "step": 659430 }, { "epoch": 1.71, "learning_rate": 4.359545960013582e-05, "loss": 0.0084, "step": 659440 }, { "epoch": 1.71, "learning_rate": 4.359157138376436e-05, "loss": 0.007, "step": 659450 }, { "epoch": 1.71, "learning_rate": 4.35876831673929e-05, "loss": 0.0111, "step": 659460 }, { "epoch": 1.71, "learning_rate": 4.358379495102143e-05, "loss": 0.0093, "step": 659470 }, { "epoch": 1.71, "learning_rate": 4.357990673464997e-05, "loss": 0.0067, "step": 659480 }, { "epoch": 1.71, "learning_rate": 4.35760185182785e-05, "loss": 0.0056, "step": 659490 }, { "epoch": 1.71, "learning_rate": 4.3572130301907036e-05, "loss": 0.0118, "step": 659500 }, { "epoch": 1.71, "learning_rate": 4.356824208553557e-05, "loss": 0.007, "step": 659510 }, { "epoch": 1.71, "learning_rate": 4.3564353869164106e-05, "loss": 0.0071, "step": 659520 }, { "epoch": 1.71, "learning_rate": 4.356046565279265e-05, "loss": 0.0078, "step": 659530 }, { "epoch": 1.71, "learning_rate": 4.355657743642118e-05, "loss": 0.0085, "step": 659540 }, { "epoch": 1.71, "learning_rate": 4.355268922004972e-05, "loss": 0.0059, "step": 659550 }, { "epoch": 1.71, "learning_rate": 4.354880100367825e-05, "loss": 0.007, "step": 659560 }, { "epoch": 1.71, "learning_rate": 4.354491278730679e-05, "loss": 0.0092, "step": 659570 }, { "epoch": 1.71, "learning_rate": 4.354102457093532e-05, "loss": 0.0065, "step": 659580 }, { "epoch": 1.71, "learning_rate": 4.353713635456386e-05, "loss": 0.0062, "step": 659590 }, { "epoch": 1.71, "learning_rate": 4.3533248138192385e-05, "loss": 0.0078, "step": 659600 }, { "epoch": 1.71, "learning_rate": 4.352935992182092e-05, "loss": 0.0084, "step": 659610 }, { "epoch": 1.71, "learning_rate": 4.3525471705449455e-05, "loss": 0.0063, "step": 659620 }, { "epoch": 1.71, "learning_rate": 4.3521583489077996e-05, "loss": 0.0066, "step": 659630 }, { "epoch": 1.71, "learning_rate": 4.351769527270653e-05, "loss": 0.0079, "step": 659640 }, { "epoch": 1.71, "learning_rate": 4.3513807056335066e-05, "loss": 0.0072, "step": 659650 }, { "epoch": 1.71, "learning_rate": 4.35099188399636e-05, "loss": 0.0094, "step": 659660 }, { "epoch": 1.71, "learning_rate": 4.3506030623592136e-05, "loss": 0.0099, "step": 659670 }, { "epoch": 1.71, "learning_rate": 4.350214240722067e-05, "loss": 0.0067, "step": 659680 }, { "epoch": 1.71, "learning_rate": 4.3498254190849206e-05, "loss": 0.0061, "step": 659690 }, { "epoch": 1.71, "learning_rate": 4.349436597447774e-05, "loss": 0.0077, "step": 659700 }, { "epoch": 1.71, "learning_rate": 4.349047775810628e-05, "loss": 0.0064, "step": 659710 }, { "epoch": 1.71, "learning_rate": 4.348658954173482e-05, "loss": 0.0092, "step": 659720 }, { "epoch": 1.71, "learning_rate": 4.348270132536335e-05, "loss": 0.0106, "step": 659730 }, { "epoch": 1.71, "learning_rate": 4.347881310899189e-05, "loss": 0.0062, "step": 659740 }, { "epoch": 1.71, "learning_rate": 4.347492489262042e-05, "loss": 0.0062, "step": 659750 }, { "epoch": 1.71, "learning_rate": 4.3471036676248956e-05, "loss": 0.0106, "step": 659760 }, { "epoch": 1.71, "learning_rate": 4.346714845987749e-05, "loss": 0.0101, "step": 659770 }, { "epoch": 1.71, "learning_rate": 4.3463260243506026e-05, "loss": 0.0134, "step": 659780 }, { "epoch": 1.71, "learning_rate": 4.345937202713457e-05, "loss": 0.0098, "step": 659790 }, { "epoch": 1.71, "learning_rate": 4.34554838107631e-05, "loss": 0.0066, "step": 659800 }, { "epoch": 1.71, "learning_rate": 4.345159559439164e-05, "loss": 0.0066, "step": 659810 }, { "epoch": 1.71, "learning_rate": 4.344770737802017e-05, "loss": 0.0081, "step": 659820 }, { "epoch": 1.71, "learning_rate": 4.344381916164871e-05, "loss": 0.0122, "step": 659830 }, { "epoch": 1.71, "learning_rate": 4.3439930945277235e-05, "loss": 0.0075, "step": 659840 }, { "epoch": 1.71, "learning_rate": 4.343604272890577e-05, "loss": 0.0104, "step": 659850 }, { "epoch": 1.71, "learning_rate": 4.3432154512534305e-05, "loss": 0.0087, "step": 659860 }, { "epoch": 1.71, "learning_rate": 4.342826629616284e-05, "loss": 0.0069, "step": 659870 }, { "epoch": 1.71, "learning_rate": 4.3424378079791375e-05, "loss": 0.0073, "step": 659880 }, { "epoch": 1.71, "learning_rate": 4.3420489863419916e-05, "loss": 0.0097, "step": 659890 }, { "epoch": 1.71, "learning_rate": 4.341660164704845e-05, "loss": 0.0087, "step": 659900 }, { "epoch": 1.71, "learning_rate": 4.3412713430676986e-05, "loss": 0.0085, "step": 659910 }, { "epoch": 1.71, "learning_rate": 4.340882521430552e-05, "loss": 0.0067, "step": 659920 }, { "epoch": 1.71, "learning_rate": 4.3404936997934056e-05, "loss": 0.0059, "step": 659930 }, { "epoch": 1.71, "learning_rate": 4.340104878156259e-05, "loss": 0.0091, "step": 659940 }, { "epoch": 1.71, "learning_rate": 4.3397160565191126e-05, "loss": 0.0076, "step": 659950 }, { "epoch": 1.71, "learning_rate": 4.339327234881966e-05, "loss": 0.0087, "step": 659960 }, { "epoch": 1.71, "learning_rate": 4.33893841324482e-05, "loss": 0.0078, "step": 659970 }, { "epoch": 1.71, "learning_rate": 4.338549591607674e-05, "loss": 0.0074, "step": 659980 }, { "epoch": 1.71, "learning_rate": 4.338160769970527e-05, "loss": 0.0069, "step": 659990 }, { "epoch": 1.71, "learning_rate": 4.3377719483333807e-05, "loss": 0.0097, "step": 660000 }, { "epoch": 1.71, "eval_cer": 0.8816648961259449, "eval_loss": 0.0051537686958909035, "eval_runtime": 107.9648, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 660000 }, { "epoch": 1.71, "learning_rate": 4.337383126696234e-05, "loss": 0.0066, "step": 660010 }, { "epoch": 1.71, "learning_rate": 4.3369943050590876e-05, "loss": 0.0065, "step": 660020 }, { "epoch": 1.71, "learning_rate": 4.336605483421941e-05, "loss": 0.0064, "step": 660030 }, { "epoch": 1.71, "learning_rate": 4.3362166617847946e-05, "loss": 0.0087, "step": 660040 }, { "epoch": 1.71, "learning_rate": 4.335827840147649e-05, "loss": 0.007, "step": 660050 }, { "epoch": 1.71, "learning_rate": 4.335439018510502e-05, "loss": 0.0065, "step": 660060 }, { "epoch": 1.71, "learning_rate": 4.335050196873356e-05, "loss": 0.0113, "step": 660070 }, { "epoch": 1.71, "learning_rate": 4.334661375236209e-05, "loss": 0.0077, "step": 660080 }, { "epoch": 1.71, "learning_rate": 4.334272553599062e-05, "loss": 0.0071, "step": 660090 }, { "epoch": 1.71, "learning_rate": 4.3338837319619155e-05, "loss": 0.0101, "step": 660100 }, { "epoch": 1.71, "learning_rate": 4.333494910324769e-05, "loss": 0.0076, "step": 660110 }, { "epoch": 1.71, "learning_rate": 4.3331060886876225e-05, "loss": 0.0088, "step": 660120 }, { "epoch": 1.71, "learning_rate": 4.332717267050476e-05, "loss": 0.0061, "step": 660130 }, { "epoch": 1.71, "learning_rate": 4.3323284454133295e-05, "loss": 0.0086, "step": 660140 }, { "epoch": 1.71, "learning_rate": 4.3319396237761836e-05, "loss": 0.0088, "step": 660150 }, { "epoch": 1.71, "learning_rate": 4.331550802139037e-05, "loss": 0.0071, "step": 660160 }, { "epoch": 1.71, "learning_rate": 4.3311619805018906e-05, "loss": 0.0083, "step": 660170 }, { "epoch": 1.71, "learning_rate": 4.330773158864744e-05, "loss": 0.0078, "step": 660180 }, { "epoch": 1.71, "learning_rate": 4.3303843372275976e-05, "loss": 0.0087, "step": 660190 }, { "epoch": 1.71, "learning_rate": 4.329995515590451e-05, "loss": 0.0096, "step": 660200 }, { "epoch": 1.71, "learning_rate": 4.3296066939533045e-05, "loss": 0.0108, "step": 660210 }, { "epoch": 1.71, "learning_rate": 4.329217872316158e-05, "loss": 0.0069, "step": 660220 }, { "epoch": 1.71, "learning_rate": 4.328829050679012e-05, "loss": 0.0098, "step": 660230 }, { "epoch": 1.71, "learning_rate": 4.328440229041866e-05, "loss": 0.0055, "step": 660240 }, { "epoch": 1.71, "learning_rate": 4.328051407404719e-05, "loss": 0.01, "step": 660250 }, { "epoch": 1.71, "learning_rate": 4.3276625857675727e-05, "loss": 0.0088, "step": 660260 }, { "epoch": 1.71, "learning_rate": 4.327273764130426e-05, "loss": 0.008, "step": 660270 }, { "epoch": 1.71, "learning_rate": 4.3268849424932796e-05, "loss": 0.0082, "step": 660280 }, { "epoch": 1.71, "learning_rate": 4.326496120856133e-05, "loss": 0.0102, "step": 660290 }, { "epoch": 1.71, "learning_rate": 4.3261072992189866e-05, "loss": 0.0062, "step": 660300 }, { "epoch": 1.71, "learning_rate": 4.325718477581841e-05, "loss": 0.0135, "step": 660310 }, { "epoch": 1.71, "learning_rate": 4.325329655944694e-05, "loss": 0.0046, "step": 660320 }, { "epoch": 1.71, "learning_rate": 4.324940834307548e-05, "loss": 0.0062, "step": 660330 }, { "epoch": 1.71, "learning_rate": 4.3245520126704005e-05, "loss": 0.0073, "step": 660340 }, { "epoch": 1.71, "learning_rate": 4.324163191033254e-05, "loss": 0.0085, "step": 660350 }, { "epoch": 1.71, "learning_rate": 4.3237743693961075e-05, "loss": 0.0071, "step": 660360 }, { "epoch": 1.71, "learning_rate": 4.323385547758961e-05, "loss": 0.0105, "step": 660370 }, { "epoch": 1.71, "learning_rate": 4.3229967261218145e-05, "loss": 0.0088, "step": 660380 }, { "epoch": 1.71, "learning_rate": 4.322607904484668e-05, "loss": 0.0059, "step": 660390 }, { "epoch": 1.71, "learning_rate": 4.3222190828475215e-05, "loss": 0.0088, "step": 660400 }, { "epoch": 1.71, "learning_rate": 4.3218302612103756e-05, "loss": 0.0087, "step": 660410 }, { "epoch": 1.71, "learning_rate": 4.321441439573229e-05, "loss": 0.0088, "step": 660420 }, { "epoch": 1.71, "learning_rate": 4.3210526179360826e-05, "loss": 0.0091, "step": 660430 }, { "epoch": 1.71, "learning_rate": 4.320663796298936e-05, "loss": 0.008, "step": 660440 }, { "epoch": 1.71, "learning_rate": 4.3202749746617896e-05, "loss": 0.009, "step": 660450 }, { "epoch": 1.71, "learning_rate": 4.319886153024643e-05, "loss": 0.0101, "step": 660460 }, { "epoch": 1.71, "learning_rate": 4.3194973313874965e-05, "loss": 0.0087, "step": 660470 }, { "epoch": 1.71, "learning_rate": 4.31910850975035e-05, "loss": 0.0075, "step": 660480 }, { "epoch": 1.71, "learning_rate": 4.3187196881132035e-05, "loss": 0.0079, "step": 660490 }, { "epoch": 1.71, "learning_rate": 4.318330866476058e-05, "loss": 0.0095, "step": 660500 }, { "epoch": 1.71, "learning_rate": 4.317942044838911e-05, "loss": 0.0079, "step": 660510 }, { "epoch": 1.71, "learning_rate": 4.3175532232017646e-05, "loss": 0.007, "step": 660520 }, { "epoch": 1.71, "learning_rate": 4.317164401564618e-05, "loss": 0.007, "step": 660530 }, { "epoch": 1.71, "learning_rate": 4.3167755799274716e-05, "loss": 0.0093, "step": 660540 }, { "epoch": 1.71, "learning_rate": 4.316386758290325e-05, "loss": 0.0091, "step": 660550 }, { "epoch": 1.71, "learning_rate": 4.3159979366531786e-05, "loss": 0.0077, "step": 660560 }, { "epoch": 1.71, "learning_rate": 4.315609115016032e-05, "loss": 0.0099, "step": 660570 }, { "epoch": 1.71, "learning_rate": 4.315220293378886e-05, "loss": 0.0096, "step": 660580 }, { "epoch": 1.71, "learning_rate": 4.3148314717417384e-05, "loss": 0.0073, "step": 660590 }, { "epoch": 1.71, "learning_rate": 4.3144426501045925e-05, "loss": 0.0118, "step": 660600 }, { "epoch": 1.71, "learning_rate": 4.314053828467446e-05, "loss": 0.0062, "step": 660610 }, { "epoch": 1.71, "learning_rate": 4.3136650068302995e-05, "loss": 0.0119, "step": 660620 }, { "epoch": 1.71, "learning_rate": 4.313276185193153e-05, "loss": 0.008, "step": 660630 }, { "epoch": 1.71, "learning_rate": 4.3128873635560065e-05, "loss": 0.0062, "step": 660640 }, { "epoch": 1.71, "learning_rate": 4.31249854191886e-05, "loss": 0.0092, "step": 660650 }, { "epoch": 1.71, "learning_rate": 4.3121097202817135e-05, "loss": 0.0085, "step": 660660 }, { "epoch": 1.71, "learning_rate": 4.311720898644567e-05, "loss": 0.0105, "step": 660670 }, { "epoch": 1.71, "learning_rate": 4.311332077007421e-05, "loss": 0.008, "step": 660680 }, { "epoch": 1.71, "learning_rate": 4.3109432553702746e-05, "loss": 0.0077, "step": 660690 }, { "epoch": 1.71, "learning_rate": 4.310554433733128e-05, "loss": 0.0054, "step": 660700 }, { "epoch": 1.71, "learning_rate": 4.3101656120959816e-05, "loss": 0.009, "step": 660710 }, { "epoch": 1.71, "learning_rate": 4.309776790458835e-05, "loss": 0.0066, "step": 660720 }, { "epoch": 1.71, "learning_rate": 4.3093879688216885e-05, "loss": 0.0061, "step": 660730 }, { "epoch": 1.71, "learning_rate": 4.308999147184542e-05, "loss": 0.0084, "step": 660740 }, { "epoch": 1.71, "learning_rate": 4.3086103255473955e-05, "loss": 0.0053, "step": 660750 }, { "epoch": 1.71, "learning_rate": 4.30822150391025e-05, "loss": 0.0086, "step": 660760 }, { "epoch": 1.71, "learning_rate": 4.307832682273103e-05, "loss": 0.0064, "step": 660770 }, { "epoch": 1.71, "learning_rate": 4.3074438606359566e-05, "loss": 0.0059, "step": 660780 }, { "epoch": 1.71, "learning_rate": 4.30705503899881e-05, "loss": 0.0068, "step": 660790 }, { "epoch": 1.71, "learning_rate": 4.3066662173616636e-05, "loss": 0.0086, "step": 660800 }, { "epoch": 1.71, "learning_rate": 4.306277395724517e-05, "loss": 0.008, "step": 660810 }, { "epoch": 1.71, "learning_rate": 4.3058885740873706e-05, "loss": 0.0052, "step": 660820 }, { "epoch": 1.71, "learning_rate": 4.305499752450224e-05, "loss": 0.0066, "step": 660830 }, { "epoch": 1.71, "learning_rate": 4.305110930813077e-05, "loss": 0.0075, "step": 660840 }, { "epoch": 1.71, "learning_rate": 4.3047221091759304e-05, "loss": 0.0103, "step": 660850 }, { "epoch": 1.71, "learning_rate": 4.3043332875387845e-05, "loss": 0.0078, "step": 660860 }, { "epoch": 1.71, "learning_rate": 4.303944465901638e-05, "loss": 0.0104, "step": 660870 }, { "epoch": 1.71, "learning_rate": 4.3035556442644915e-05, "loss": 0.01, "step": 660880 }, { "epoch": 1.71, "learning_rate": 4.303166822627345e-05, "loss": 0.0065, "step": 660890 }, { "epoch": 1.71, "learning_rate": 4.3027780009901985e-05, "loss": 0.0069, "step": 660900 }, { "epoch": 1.71, "learning_rate": 4.302389179353052e-05, "loss": 0.01, "step": 660910 }, { "epoch": 1.71, "learning_rate": 4.3020003577159055e-05, "loss": 0.0084, "step": 660920 }, { "epoch": 1.71, "learning_rate": 4.301611536078759e-05, "loss": 0.0097, "step": 660930 }, { "epoch": 1.71, "learning_rate": 4.301222714441613e-05, "loss": 0.0082, "step": 660940 }, { "epoch": 1.71, "learning_rate": 4.3008338928044666e-05, "loss": 0.0066, "step": 660950 }, { "epoch": 1.71, "learning_rate": 4.30044507116732e-05, "loss": 0.0079, "step": 660960 }, { "epoch": 1.71, "learning_rate": 4.3000562495301736e-05, "loss": 0.0077, "step": 660970 }, { "epoch": 1.71, "learning_rate": 4.299667427893027e-05, "loss": 0.0068, "step": 660980 }, { "epoch": 1.71, "learning_rate": 4.2992786062558805e-05, "loss": 0.0069, "step": 660990 }, { "epoch": 1.71, "learning_rate": 4.298889784618734e-05, "loss": 0.0074, "step": 661000 }, { "epoch": 1.71, "eval_cer": 0.8816522993935373, "eval_loss": 0.00525335967540741, "eval_runtime": 107.9903, "eval_samples_per_second": 18.52, "eval_steps_per_second": 4.63, "step": 661000 }, { "epoch": 1.71, "learning_rate": 4.2985009629815875e-05, "loss": 0.009, "step": 661010 }, { "epoch": 1.71, "learning_rate": 4.298112141344442e-05, "loss": 0.0088, "step": 661020 }, { "epoch": 1.71, "learning_rate": 4.297723319707295e-05, "loss": 0.0087, "step": 661030 }, { "epoch": 1.71, "learning_rate": 4.2973344980701486e-05, "loss": 0.008, "step": 661040 }, { "epoch": 1.71, "learning_rate": 4.296945676433002e-05, "loss": 0.0101, "step": 661050 }, { "epoch": 1.71, "learning_rate": 4.2965568547958556e-05, "loss": 0.0077, "step": 661060 }, { "epoch": 1.71, "learning_rate": 4.296168033158709e-05, "loss": 0.0077, "step": 661070 }, { "epoch": 1.71, "learning_rate": 4.2957792115215626e-05, "loss": 0.0066, "step": 661080 }, { "epoch": 1.71, "learning_rate": 4.2953903898844154e-05, "loss": 0.0085, "step": 661090 }, { "epoch": 1.71, "learning_rate": 4.295001568247269e-05, "loss": 0.0092, "step": 661100 }, { "epoch": 1.71, "learning_rate": 4.2946127466101224e-05, "loss": 0.0099, "step": 661110 }, { "epoch": 1.71, "learning_rate": 4.2942239249729765e-05, "loss": 0.009, "step": 661120 }, { "epoch": 1.71, "learning_rate": 4.29383510333583e-05, "loss": 0.0052, "step": 661130 }, { "epoch": 1.71, "learning_rate": 4.2934462816986835e-05, "loss": 0.0055, "step": 661140 }, { "epoch": 1.71, "learning_rate": 4.293057460061537e-05, "loss": 0.0074, "step": 661150 }, { "epoch": 1.71, "learning_rate": 4.2926686384243905e-05, "loss": 0.0071, "step": 661160 }, { "epoch": 1.71, "learning_rate": 4.292279816787244e-05, "loss": 0.0083, "step": 661170 }, { "epoch": 1.71, "learning_rate": 4.2918909951500974e-05, "loss": 0.0076, "step": 661180 }, { "epoch": 1.71, "learning_rate": 4.291502173512951e-05, "loss": 0.0081, "step": 661190 }, { "epoch": 1.71, "learning_rate": 4.291113351875805e-05, "loss": 0.007, "step": 661200 }, { "epoch": 1.71, "learning_rate": 4.2907245302386586e-05, "loss": 0.007, "step": 661210 }, { "epoch": 1.71, "learning_rate": 4.290335708601512e-05, "loss": 0.008, "step": 661220 }, { "epoch": 1.71, "learning_rate": 4.2899468869643656e-05, "loss": 0.0085, "step": 661230 }, { "epoch": 1.71, "learning_rate": 4.289558065327219e-05, "loss": 0.0077, "step": 661240 }, { "epoch": 1.71, "learning_rate": 4.2891692436900725e-05, "loss": 0.0084, "step": 661250 }, { "epoch": 1.71, "learning_rate": 4.288780422052926e-05, "loss": 0.0071, "step": 661260 }, { "epoch": 1.71, "learning_rate": 4.2883916004157795e-05, "loss": 0.0083, "step": 661270 }, { "epoch": 1.71, "learning_rate": 4.288002778778634e-05, "loss": 0.0063, "step": 661280 }, { "epoch": 1.71, "learning_rate": 4.287613957141487e-05, "loss": 0.0081, "step": 661290 }, { "epoch": 1.71, "learning_rate": 4.2872251355043406e-05, "loss": 0.0093, "step": 661300 }, { "epoch": 1.71, "learning_rate": 4.286836313867194e-05, "loss": 0.0107, "step": 661310 }, { "epoch": 1.71, "learning_rate": 4.2864474922300476e-05, "loss": 0.0067, "step": 661320 }, { "epoch": 1.71, "learning_rate": 4.2860586705929004e-05, "loss": 0.0068, "step": 661330 }, { "epoch": 1.71, "learning_rate": 4.285669848955754e-05, "loss": 0.0075, "step": 661340 }, { "epoch": 1.71, "learning_rate": 4.2852810273186074e-05, "loss": 0.0091, "step": 661350 }, { "epoch": 1.71, "learning_rate": 4.284892205681461e-05, "loss": 0.0098, "step": 661360 }, { "epoch": 1.71, "learning_rate": 4.2845033840443144e-05, "loss": 0.0078, "step": 661370 }, { "epoch": 1.71, "learning_rate": 4.2841145624071685e-05, "loss": 0.0068, "step": 661380 }, { "epoch": 1.71, "learning_rate": 4.283725740770022e-05, "loss": 0.0111, "step": 661390 }, { "epoch": 1.71, "learning_rate": 4.2833369191328755e-05, "loss": 0.0091, "step": 661400 }, { "epoch": 1.71, "learning_rate": 4.282948097495729e-05, "loss": 0.0073, "step": 661410 }, { "epoch": 1.71, "learning_rate": 4.2825592758585825e-05, "loss": 0.0123, "step": 661420 }, { "epoch": 1.71, "learning_rate": 4.282170454221436e-05, "loss": 0.0076, "step": 661430 }, { "epoch": 1.71, "learning_rate": 4.2817816325842894e-05, "loss": 0.0112, "step": 661440 }, { "epoch": 1.71, "learning_rate": 4.281392810947143e-05, "loss": 0.009, "step": 661450 }, { "epoch": 1.71, "learning_rate": 4.281003989309997e-05, "loss": 0.0074, "step": 661460 }, { "epoch": 1.71, "learning_rate": 4.2806151676728506e-05, "loss": 0.0068, "step": 661470 }, { "epoch": 1.71, "learning_rate": 4.280226346035704e-05, "loss": 0.0092, "step": 661480 }, { "epoch": 1.71, "learning_rate": 4.2798375243985575e-05, "loss": 0.0087, "step": 661490 }, { "epoch": 1.71, "learning_rate": 4.279448702761411e-05, "loss": 0.0092, "step": 661500 }, { "epoch": 1.71, "learning_rate": 4.2790598811242645e-05, "loss": 0.0075, "step": 661510 }, { "epoch": 1.71, "learning_rate": 4.278671059487118e-05, "loss": 0.0062, "step": 661520 }, { "epoch": 1.71, "learning_rate": 4.2782822378499715e-05, "loss": 0.0097, "step": 661530 }, { "epoch": 1.71, "learning_rate": 4.2778934162128257e-05, "loss": 0.0074, "step": 661540 }, { "epoch": 1.71, "learning_rate": 4.277504594575679e-05, "loss": 0.0102, "step": 661550 }, { "epoch": 1.71, "learning_rate": 4.2771157729385326e-05, "loss": 0.0073, "step": 661560 }, { "epoch": 1.71, "learning_rate": 4.276726951301386e-05, "loss": 0.0077, "step": 661570 }, { "epoch": 1.71, "learning_rate": 4.276338129664239e-05, "loss": 0.0098, "step": 661580 }, { "epoch": 1.71, "learning_rate": 4.2759493080270924e-05, "loss": 0.0097, "step": 661590 }, { "epoch": 1.71, "learning_rate": 4.275560486389946e-05, "loss": 0.0088, "step": 661600 }, { "epoch": 1.71, "learning_rate": 4.2751716647527994e-05, "loss": 0.0112, "step": 661610 }, { "epoch": 1.72, "learning_rate": 4.274782843115653e-05, "loss": 0.0084, "step": 661620 }, { "epoch": 1.72, "learning_rate": 4.2743940214785064e-05, "loss": 0.0118, "step": 661630 }, { "epoch": 1.72, "learning_rate": 4.2740051998413605e-05, "loss": 0.0085, "step": 661640 }, { "epoch": 1.72, "learning_rate": 4.273616378204214e-05, "loss": 0.0084, "step": 661650 }, { "epoch": 1.72, "learning_rate": 4.2732275565670675e-05, "loss": 0.0079, "step": 661660 }, { "epoch": 1.72, "learning_rate": 4.272838734929921e-05, "loss": 0.0086, "step": 661670 }, { "epoch": 1.72, "learning_rate": 4.2724499132927745e-05, "loss": 0.0065, "step": 661680 }, { "epoch": 1.72, "learning_rate": 4.272061091655628e-05, "loss": 0.0075, "step": 661690 }, { "epoch": 1.72, "learning_rate": 4.2716722700184814e-05, "loss": 0.0053, "step": 661700 }, { "epoch": 1.72, "learning_rate": 4.271283448381335e-05, "loss": 0.0083, "step": 661710 }, { "epoch": 1.72, "learning_rate": 4.270894626744189e-05, "loss": 0.0063, "step": 661720 }, { "epoch": 1.72, "learning_rate": 4.2705058051070426e-05, "loss": 0.0065, "step": 661730 }, { "epoch": 1.72, "learning_rate": 4.270116983469896e-05, "loss": 0.009, "step": 661740 }, { "epoch": 1.72, "learning_rate": 4.2697281618327495e-05, "loss": 0.0095, "step": 661750 }, { "epoch": 1.72, "learning_rate": 4.269339340195603e-05, "loss": 0.0092, "step": 661760 }, { "epoch": 1.72, "learning_rate": 4.2689505185584565e-05, "loss": 0.0064, "step": 661770 }, { "epoch": 1.72, "learning_rate": 4.26856169692131e-05, "loss": 0.0095, "step": 661780 }, { "epoch": 1.72, "learning_rate": 4.2681728752841635e-05, "loss": 0.0085, "step": 661790 }, { "epoch": 1.72, "learning_rate": 4.267784053647017e-05, "loss": 0.0084, "step": 661800 }, { "epoch": 1.72, "learning_rate": 4.267395232009871e-05, "loss": 0.0075, "step": 661810 }, { "epoch": 1.72, "learning_rate": 4.2670064103727246e-05, "loss": 0.0096, "step": 661820 }, { "epoch": 1.72, "learning_rate": 4.2666175887355774e-05, "loss": 0.0082, "step": 661830 }, { "epoch": 1.72, "learning_rate": 4.266228767098431e-05, "loss": 0.0093, "step": 661840 }, { "epoch": 1.72, "learning_rate": 4.2658399454612844e-05, "loss": 0.0069, "step": 661850 }, { "epoch": 1.72, "learning_rate": 4.265451123824138e-05, "loss": 0.0079, "step": 661860 }, { "epoch": 1.72, "learning_rate": 4.2650623021869914e-05, "loss": 0.0069, "step": 661870 }, { "epoch": 1.72, "learning_rate": 4.264673480549845e-05, "loss": 0.0101, "step": 661880 }, { "epoch": 1.72, "learning_rate": 4.2642846589126984e-05, "loss": 0.0065, "step": 661890 }, { "epoch": 1.72, "learning_rate": 4.263895837275552e-05, "loss": 0.0068, "step": 661900 }, { "epoch": 1.72, "learning_rate": 4.263507015638406e-05, "loss": 0.008, "step": 661910 }, { "epoch": 1.72, "learning_rate": 4.2631181940012595e-05, "loss": 0.0102, "step": 661920 }, { "epoch": 1.72, "learning_rate": 4.262729372364113e-05, "loss": 0.0067, "step": 661930 }, { "epoch": 1.72, "learning_rate": 4.2623405507269665e-05, "loss": 0.0091, "step": 661940 }, { "epoch": 1.72, "learning_rate": 4.26195172908982e-05, "loss": 0.009, "step": 661950 }, { "epoch": 1.72, "learning_rate": 4.2615629074526734e-05, "loss": 0.0065, "step": 661960 }, { "epoch": 1.72, "learning_rate": 4.261174085815527e-05, "loss": 0.0078, "step": 661970 }, { "epoch": 1.72, "learning_rate": 4.2607852641783804e-05, "loss": 0.0074, "step": 661980 }, { "epoch": 1.72, "learning_rate": 4.2603964425412346e-05, "loss": 0.0072, "step": 661990 }, { "epoch": 1.72, "learning_rate": 4.260007620904088e-05, "loss": 0.0109, "step": 662000 }, { "epoch": 1.72, "eval_cer": 0.8816606972151424, "eval_loss": 0.005079487804323435, "eval_runtime": 107.8535, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 662000 }, { "epoch": 1.72, "learning_rate": 4.2596187992669415e-05, "loss": 0.0105, "step": 662010 }, { "epoch": 1.72, "learning_rate": 4.259229977629795e-05, "loss": 0.0075, "step": 662020 }, { "epoch": 1.72, "learning_rate": 4.2588411559926485e-05, "loss": 0.0106, "step": 662030 }, { "epoch": 1.72, "learning_rate": 4.258452334355502e-05, "loss": 0.0101, "step": 662040 }, { "epoch": 1.72, "learning_rate": 4.2580635127183555e-05, "loss": 0.0072, "step": 662050 }, { "epoch": 1.72, "learning_rate": 4.257674691081209e-05, "loss": 0.0161, "step": 662060 }, { "epoch": 1.72, "learning_rate": 4.257285869444063e-05, "loss": 0.0093, "step": 662070 }, { "epoch": 1.72, "learning_rate": 4.256897047806915e-05, "loss": 0.0073, "step": 662080 }, { "epoch": 1.72, "learning_rate": 4.2565082261697694e-05, "loss": 0.0066, "step": 662090 }, { "epoch": 1.72, "learning_rate": 4.256119404532623e-05, "loss": 0.0104, "step": 662100 }, { "epoch": 1.72, "learning_rate": 4.2557305828954764e-05, "loss": 0.0092, "step": 662110 }, { "epoch": 1.72, "learning_rate": 4.25534176125833e-05, "loss": 0.0059, "step": 662120 }, { "epoch": 1.72, "learning_rate": 4.2549529396211834e-05, "loss": 0.0074, "step": 662130 }, { "epoch": 1.72, "learning_rate": 4.254564117984037e-05, "loss": 0.0056, "step": 662140 }, { "epoch": 1.72, "learning_rate": 4.2541752963468903e-05, "loss": 0.006, "step": 662150 }, { "epoch": 1.72, "learning_rate": 4.253786474709744e-05, "loss": 0.0084, "step": 662160 }, { "epoch": 1.72, "learning_rate": 4.253397653072598e-05, "loss": 0.0105, "step": 662170 }, { "epoch": 1.72, "learning_rate": 4.2530088314354515e-05, "loss": 0.0074, "step": 662180 }, { "epoch": 1.72, "learning_rate": 4.252620009798305e-05, "loss": 0.0071, "step": 662190 }, { "epoch": 1.72, "learning_rate": 4.2522311881611585e-05, "loss": 0.0071, "step": 662200 }, { "epoch": 1.72, "learning_rate": 4.251842366524012e-05, "loss": 0.0081, "step": 662210 }, { "epoch": 1.72, "learning_rate": 4.2514535448868654e-05, "loss": 0.011, "step": 662220 }, { "epoch": 1.72, "learning_rate": 4.251064723249719e-05, "loss": 0.0068, "step": 662230 }, { "epoch": 1.72, "learning_rate": 4.2506759016125724e-05, "loss": 0.0077, "step": 662240 }, { "epoch": 1.72, "learning_rate": 4.2502870799754266e-05, "loss": 0.0075, "step": 662250 }, { "epoch": 1.72, "learning_rate": 4.24989825833828e-05, "loss": 0.0133, "step": 662260 }, { "epoch": 1.72, "learning_rate": 4.2495094367011335e-05, "loss": 0.0097, "step": 662270 }, { "epoch": 1.72, "learning_rate": 4.249120615063987e-05, "loss": 0.0068, "step": 662280 }, { "epoch": 1.72, "learning_rate": 4.2487317934268405e-05, "loss": 0.0074, "step": 662290 }, { "epoch": 1.72, "learning_rate": 4.248342971789694e-05, "loss": 0.0097, "step": 662300 }, { "epoch": 1.72, "learning_rate": 4.2479541501525475e-05, "loss": 0.0097, "step": 662310 }, { "epoch": 1.72, "learning_rate": 4.247565328515401e-05, "loss": 0.0087, "step": 662320 }, { "epoch": 1.72, "learning_rate": 4.247176506878254e-05, "loss": 0.0072, "step": 662330 }, { "epoch": 1.72, "learning_rate": 4.246787685241107e-05, "loss": 0.0096, "step": 662340 }, { "epoch": 1.72, "learning_rate": 4.2463988636039614e-05, "loss": 0.0101, "step": 662350 }, { "epoch": 1.72, "learning_rate": 4.246010041966815e-05, "loss": 0.0097, "step": 662360 }, { "epoch": 1.72, "learning_rate": 4.2456212203296684e-05, "loss": 0.0095, "step": 662370 }, { "epoch": 1.72, "learning_rate": 4.245232398692522e-05, "loss": 0.0082, "step": 662380 }, { "epoch": 1.72, "learning_rate": 4.2448435770553754e-05, "loss": 0.0076, "step": 662390 }, { "epoch": 1.72, "learning_rate": 4.244454755418229e-05, "loss": 0.0064, "step": 662400 }, { "epoch": 1.72, "learning_rate": 4.2440659337810823e-05, "loss": 0.0087, "step": 662410 }, { "epoch": 1.72, "learning_rate": 4.243677112143936e-05, "loss": 0.0062, "step": 662420 }, { "epoch": 1.72, "learning_rate": 4.24328829050679e-05, "loss": 0.0069, "step": 662430 }, { "epoch": 1.72, "learning_rate": 4.2428994688696435e-05, "loss": 0.0068, "step": 662440 }, { "epoch": 1.72, "learning_rate": 4.242510647232497e-05, "loss": 0.0128, "step": 662450 }, { "epoch": 1.72, "learning_rate": 4.2421218255953504e-05, "loss": 0.0079, "step": 662460 }, { "epoch": 1.72, "learning_rate": 4.241733003958204e-05, "loss": 0.0082, "step": 662470 }, { "epoch": 1.72, "learning_rate": 4.2413441823210574e-05, "loss": 0.0094, "step": 662480 }, { "epoch": 1.72, "learning_rate": 4.240955360683911e-05, "loss": 0.01, "step": 662490 }, { "epoch": 1.72, "learning_rate": 4.2405665390467644e-05, "loss": 0.0105, "step": 662500 }, { "epoch": 1.72, "learning_rate": 4.2401777174096186e-05, "loss": 0.0085, "step": 662510 }, { "epoch": 1.72, "learning_rate": 4.239788895772472e-05, "loss": 0.0051, "step": 662520 }, { "epoch": 1.72, "learning_rate": 4.2394000741353255e-05, "loss": 0.0067, "step": 662530 }, { "epoch": 1.72, "learning_rate": 4.239011252498179e-05, "loss": 0.007, "step": 662540 }, { "epoch": 1.72, "learning_rate": 4.2386224308610325e-05, "loss": 0.0081, "step": 662550 }, { "epoch": 1.72, "learning_rate": 4.238233609223886e-05, "loss": 0.0098, "step": 662560 }, { "epoch": 1.72, "learning_rate": 4.237844787586739e-05, "loss": 0.0078, "step": 662570 }, { "epoch": 1.72, "learning_rate": 4.237455965949592e-05, "loss": 0.0059, "step": 662580 }, { "epoch": 1.72, "learning_rate": 4.237067144312446e-05, "loss": 0.0078, "step": 662590 }, { "epoch": 1.72, "learning_rate": 4.236678322675299e-05, "loss": 0.0082, "step": 662600 }, { "epoch": 1.72, "learning_rate": 4.2362895010381534e-05, "loss": 0.008, "step": 662610 }, { "epoch": 1.72, "learning_rate": 4.235900679401007e-05, "loss": 0.0087, "step": 662620 }, { "epoch": 1.72, "learning_rate": 4.2355118577638604e-05, "loss": 0.0066, "step": 662630 }, { "epoch": 1.72, "learning_rate": 4.235123036126714e-05, "loss": 0.007, "step": 662640 }, { "epoch": 1.72, "learning_rate": 4.2347342144895674e-05, "loss": 0.0066, "step": 662650 }, { "epoch": 1.72, "learning_rate": 4.234345392852421e-05, "loss": 0.0074, "step": 662660 }, { "epoch": 1.72, "learning_rate": 4.233956571215274e-05, "loss": 0.0064, "step": 662670 }, { "epoch": 1.72, "learning_rate": 4.233567749578128e-05, "loss": 0.0099, "step": 662680 }, { "epoch": 1.72, "learning_rate": 4.233178927940982e-05, "loss": 0.0067, "step": 662690 }, { "epoch": 1.72, "learning_rate": 4.2327901063038355e-05, "loss": 0.0062, "step": 662700 }, { "epoch": 1.72, "learning_rate": 4.232401284666689e-05, "loss": 0.0076, "step": 662710 }, { "epoch": 1.72, "learning_rate": 4.2320124630295424e-05, "loss": 0.0073, "step": 662720 }, { "epoch": 1.72, "learning_rate": 4.231623641392396e-05, "loss": 0.01, "step": 662730 }, { "epoch": 1.72, "learning_rate": 4.2312348197552494e-05, "loss": 0.0077, "step": 662740 }, { "epoch": 1.72, "learning_rate": 4.230845998118103e-05, "loss": 0.008, "step": 662750 }, { "epoch": 1.72, "learning_rate": 4.2304571764809564e-05, "loss": 0.0097, "step": 662760 }, { "epoch": 1.72, "learning_rate": 4.2300683548438106e-05, "loss": 0.0151, "step": 662770 }, { "epoch": 1.72, "learning_rate": 4.229679533206664e-05, "loss": 0.0065, "step": 662780 }, { "epoch": 1.72, "learning_rate": 4.2292907115695175e-05, "loss": 0.0084, "step": 662790 }, { "epoch": 1.72, "learning_rate": 4.228901889932371e-05, "loss": 0.0104, "step": 662800 }, { "epoch": 1.72, "learning_rate": 4.2285130682952245e-05, "loss": 0.0082, "step": 662810 }, { "epoch": 1.72, "learning_rate": 4.228124246658077e-05, "loss": 0.0075, "step": 662820 }, { "epoch": 1.72, "learning_rate": 4.227735425020931e-05, "loss": 0.0091, "step": 662830 }, { "epoch": 1.72, "learning_rate": 4.227346603383784e-05, "loss": 0.0099, "step": 662840 }, { "epoch": 1.72, "learning_rate": 4.226957781746638e-05, "loss": 0.0091, "step": 662850 }, { "epoch": 1.72, "learning_rate": 4.226568960109491e-05, "loss": 0.0065, "step": 662860 }, { "epoch": 1.72, "learning_rate": 4.2261801384723454e-05, "loss": 0.0086, "step": 662870 }, { "epoch": 1.72, "learning_rate": 4.225791316835199e-05, "loss": 0.0055, "step": 662880 }, { "epoch": 1.72, "learning_rate": 4.2254024951980524e-05, "loss": 0.0073, "step": 662890 }, { "epoch": 1.72, "learning_rate": 4.225013673560906e-05, "loss": 0.0068, "step": 662900 }, { "epoch": 1.72, "learning_rate": 4.2246248519237594e-05, "loss": 0.0096, "step": 662910 }, { "epoch": 1.72, "learning_rate": 4.224236030286613e-05, "loss": 0.0119, "step": 662920 }, { "epoch": 1.72, "learning_rate": 4.223847208649466e-05, "loss": 0.0088, "step": 662930 }, { "epoch": 1.72, "learning_rate": 4.22345838701232e-05, "loss": 0.0076, "step": 662940 }, { "epoch": 1.72, "learning_rate": 4.223069565375174e-05, "loss": 0.0062, "step": 662950 }, { "epoch": 1.72, "learning_rate": 4.2226807437380275e-05, "loss": 0.0063, "step": 662960 }, { "epoch": 1.72, "learning_rate": 4.222291922100881e-05, "loss": 0.0074, "step": 662970 }, { "epoch": 1.72, "learning_rate": 4.2219031004637344e-05, "loss": 0.0085, "step": 662980 }, { "epoch": 1.72, "learning_rate": 4.221514278826588e-05, "loss": 0.0079, "step": 662990 }, { "epoch": 1.72, "learning_rate": 4.2211254571894414e-05, "loss": 0.007, "step": 663000 }, { "epoch": 1.72, "eval_cer": 0.8816718943106159, "eval_loss": 0.005077589303255081, "eval_runtime": 107.9194, "eval_samples_per_second": 18.532, "eval_steps_per_second": 4.633, "step": 663000 }, { "epoch": 1.72, "learning_rate": 4.220736635552295e-05, "loss": 0.0058, "step": 663010 }, { "epoch": 1.72, "learning_rate": 4.2203478139151484e-05, "loss": 0.0078, "step": 663020 }, { "epoch": 1.72, "learning_rate": 4.2199589922780025e-05, "loss": 0.0084, "step": 663030 }, { "epoch": 1.72, "learning_rate": 4.219570170640856e-05, "loss": 0.0083, "step": 663040 }, { "epoch": 1.72, "learning_rate": 4.2191813490037095e-05, "loss": 0.0057, "step": 663050 }, { "epoch": 1.72, "learning_rate": 4.218792527366563e-05, "loss": 0.0078, "step": 663060 }, { "epoch": 1.72, "learning_rate": 4.218403705729416e-05, "loss": 0.0073, "step": 663070 }, { "epoch": 1.72, "learning_rate": 4.218014884092269e-05, "loss": 0.0084, "step": 663080 }, { "epoch": 1.72, "learning_rate": 4.217626062455123e-05, "loss": 0.0083, "step": 663090 }, { "epoch": 1.72, "learning_rate": 4.217237240817976e-05, "loss": 0.007, "step": 663100 }, { "epoch": 1.72, "learning_rate": 4.21684841918083e-05, "loss": 0.0093, "step": 663110 }, { "epoch": 1.72, "learning_rate": 4.216459597543683e-05, "loss": 0.0094, "step": 663120 }, { "epoch": 1.72, "learning_rate": 4.2160707759065374e-05, "loss": 0.0072, "step": 663130 }, { "epoch": 1.72, "learning_rate": 4.215681954269391e-05, "loss": 0.0096, "step": 663140 }, { "epoch": 1.72, "learning_rate": 4.2152931326322444e-05, "loss": 0.0076, "step": 663150 }, { "epoch": 1.72, "learning_rate": 4.214904310995098e-05, "loss": 0.0089, "step": 663160 }, { "epoch": 1.72, "learning_rate": 4.2145154893579514e-05, "loss": 0.0059, "step": 663170 }, { "epoch": 1.72, "learning_rate": 4.214126667720805e-05, "loss": 0.0143, "step": 663180 }, { "epoch": 1.72, "learning_rate": 4.213737846083658e-05, "loss": 0.0093, "step": 663190 }, { "epoch": 1.72, "learning_rate": 4.213349024446512e-05, "loss": 0.0071, "step": 663200 }, { "epoch": 1.72, "learning_rate": 4.212960202809365e-05, "loss": 0.0096, "step": 663210 }, { "epoch": 1.72, "learning_rate": 4.2125713811722195e-05, "loss": 0.0093, "step": 663220 }, { "epoch": 1.72, "learning_rate": 4.212182559535073e-05, "loss": 0.0078, "step": 663230 }, { "epoch": 1.72, "learning_rate": 4.2117937378979264e-05, "loss": 0.0111, "step": 663240 }, { "epoch": 1.72, "learning_rate": 4.21140491626078e-05, "loss": 0.0073, "step": 663250 }, { "epoch": 1.72, "learning_rate": 4.2110160946236334e-05, "loss": 0.0108, "step": 663260 }, { "epoch": 1.72, "learning_rate": 4.210627272986487e-05, "loss": 0.0092, "step": 663270 }, { "epoch": 1.72, "learning_rate": 4.2102384513493404e-05, "loss": 0.0097, "step": 663280 }, { "epoch": 1.72, "learning_rate": 4.209849629712194e-05, "loss": 0.011, "step": 663290 }, { "epoch": 1.72, "learning_rate": 4.209460808075048e-05, "loss": 0.007, "step": 663300 }, { "epoch": 1.72, "learning_rate": 4.2090719864379015e-05, "loss": 0.0064, "step": 663310 }, { "epoch": 1.72, "learning_rate": 4.208683164800754e-05, "loss": 0.0096, "step": 663320 }, { "epoch": 1.72, "learning_rate": 4.208294343163608e-05, "loss": 0.0073, "step": 663330 }, { "epoch": 1.72, "learning_rate": 4.207905521526461e-05, "loss": 0.0089, "step": 663340 }, { "epoch": 1.72, "learning_rate": 4.207516699889315e-05, "loss": 0.0055, "step": 663350 }, { "epoch": 1.72, "learning_rate": 4.207127878252168e-05, "loss": 0.009, "step": 663360 }, { "epoch": 1.72, "learning_rate": 4.206739056615022e-05, "loss": 0.0077, "step": 663370 }, { "epoch": 1.72, "learning_rate": 4.206350234977875e-05, "loss": 0.0051, "step": 663380 }, { "epoch": 1.72, "learning_rate": 4.205961413340729e-05, "loss": 0.0124, "step": 663390 }, { "epoch": 1.72, "learning_rate": 4.205572591703583e-05, "loss": 0.0092, "step": 663400 }, { "epoch": 1.72, "learning_rate": 4.2051837700664364e-05, "loss": 0.006, "step": 663410 }, { "epoch": 1.72, "learning_rate": 4.20479494842929e-05, "loss": 0.0086, "step": 663420 }, { "epoch": 1.72, "learning_rate": 4.2044061267921433e-05, "loss": 0.0069, "step": 663430 }, { "epoch": 1.72, "learning_rate": 4.204017305154997e-05, "loss": 0.0074, "step": 663440 }, { "epoch": 1.72, "learning_rate": 4.20362848351785e-05, "loss": 0.0073, "step": 663450 }, { "epoch": 1.72, "learning_rate": 4.203239661880704e-05, "loss": 0.0103, "step": 663460 }, { "epoch": 1.72, "learning_rate": 4.202850840243557e-05, "loss": 0.0223, "step": 663470 }, { "epoch": 1.72, "learning_rate": 4.2024620186064115e-05, "loss": 0.0087, "step": 663480 }, { "epoch": 1.72, "learning_rate": 4.202073196969265e-05, "loss": 0.0101, "step": 663490 }, { "epoch": 1.72, "learning_rate": 4.2016843753321184e-05, "loss": 0.0092, "step": 663500 }, { "epoch": 1.72, "learning_rate": 4.201295553694972e-05, "loss": 0.0058, "step": 663510 }, { "epoch": 1.72, "learning_rate": 4.2009067320578254e-05, "loss": 0.0063, "step": 663520 }, { "epoch": 1.72, "learning_rate": 4.200517910420679e-05, "loss": 0.0094, "step": 663530 }, { "epoch": 1.72, "learning_rate": 4.2001290887835324e-05, "loss": 0.0068, "step": 663540 }, { "epoch": 1.72, "learning_rate": 4.199740267146386e-05, "loss": 0.011, "step": 663550 }, { "epoch": 1.72, "learning_rate": 4.19935144550924e-05, "loss": 0.0085, "step": 663560 }, { "epoch": 1.72, "learning_rate": 4.198962623872092e-05, "loss": 0.0105, "step": 663570 }, { "epoch": 1.72, "learning_rate": 4.198573802234946e-05, "loss": 0.0073, "step": 663580 }, { "epoch": 1.72, "learning_rate": 4.1981849805978e-05, "loss": 0.0071, "step": 663590 }, { "epoch": 1.72, "learning_rate": 4.197796158960653e-05, "loss": 0.0087, "step": 663600 }, { "epoch": 1.72, "learning_rate": 4.197407337323507e-05, "loss": 0.0067, "step": 663610 }, { "epoch": 1.72, "learning_rate": 4.19701851568636e-05, "loss": 0.0065, "step": 663620 }, { "epoch": 1.72, "learning_rate": 4.196629694049214e-05, "loss": 0.0085, "step": 663630 }, { "epoch": 1.72, "learning_rate": 4.196240872412067e-05, "loss": 0.0065, "step": 663640 }, { "epoch": 1.72, "learning_rate": 4.195852050774921e-05, "loss": 0.0086, "step": 663650 }, { "epoch": 1.72, "learning_rate": 4.195463229137775e-05, "loss": 0.0068, "step": 663660 }, { "epoch": 1.72, "learning_rate": 4.1950744075006284e-05, "loss": 0.0088, "step": 663670 }, { "epoch": 1.72, "learning_rate": 4.194685585863482e-05, "loss": 0.0114, "step": 663680 }, { "epoch": 1.72, "learning_rate": 4.1942967642263353e-05, "loss": 0.0068, "step": 663690 }, { "epoch": 1.72, "learning_rate": 4.193907942589189e-05, "loss": 0.0114, "step": 663700 }, { "epoch": 1.72, "learning_rate": 4.193519120952042e-05, "loss": 0.0093, "step": 663710 }, { "epoch": 1.72, "learning_rate": 4.193130299314896e-05, "loss": 0.0099, "step": 663720 }, { "epoch": 1.72, "learning_rate": 4.192741477677749e-05, "loss": 0.0101, "step": 663730 }, { "epoch": 1.72, "learning_rate": 4.1923526560406035e-05, "loss": 0.007, "step": 663740 }, { "epoch": 1.72, "learning_rate": 4.191963834403457e-05, "loss": 0.0085, "step": 663750 }, { "epoch": 1.72, "learning_rate": 4.1915750127663104e-05, "loss": 0.0071, "step": 663760 }, { "epoch": 1.72, "learning_rate": 4.191186191129164e-05, "loss": 0.0099, "step": 663770 }, { "epoch": 1.72, "learning_rate": 4.1907973694920174e-05, "loss": 0.0072, "step": 663780 }, { "epoch": 1.72, "learning_rate": 4.190408547854871e-05, "loss": 0.0094, "step": 663790 }, { "epoch": 1.72, "learning_rate": 4.1900197262177244e-05, "loss": 0.007, "step": 663800 }, { "epoch": 1.72, "learning_rate": 4.189630904580577e-05, "loss": 0.0083, "step": 663810 }, { "epoch": 1.72, "learning_rate": 4.189242082943431e-05, "loss": 0.0085, "step": 663820 }, { "epoch": 1.72, "learning_rate": 4.188853261306284e-05, "loss": 0.0078, "step": 663830 }, { "epoch": 1.72, "learning_rate": 4.188464439669138e-05, "loss": 0.0071, "step": 663840 }, { "epoch": 1.72, "learning_rate": 4.188075618031992e-05, "loss": 0.0084, "step": 663850 }, { "epoch": 1.72, "learning_rate": 4.187686796394845e-05, "loss": 0.0115, "step": 663860 }, { "epoch": 1.72, "learning_rate": 4.187297974757699e-05, "loss": 0.0081, "step": 663870 }, { "epoch": 1.72, "learning_rate": 4.186909153120552e-05, "loss": 0.0084, "step": 663880 }, { "epoch": 1.72, "learning_rate": 4.186520331483406e-05, "loss": 0.0102, "step": 663890 }, { "epoch": 1.72, "learning_rate": 4.186131509846259e-05, "loss": 0.0067, "step": 663900 }, { "epoch": 1.72, "learning_rate": 4.185742688209113e-05, "loss": 0.0079, "step": 663910 }, { "epoch": 1.72, "learning_rate": 4.185353866571967e-05, "loss": 0.0104, "step": 663920 }, { "epoch": 1.72, "learning_rate": 4.1849650449348204e-05, "loss": 0.0093, "step": 663930 }, { "epoch": 1.72, "learning_rate": 4.184576223297674e-05, "loss": 0.0067, "step": 663940 }, { "epoch": 1.72, "learning_rate": 4.1841874016605273e-05, "loss": 0.0076, "step": 663950 }, { "epoch": 1.72, "learning_rate": 4.183798580023381e-05, "loss": 0.0068, "step": 663960 }, { "epoch": 1.72, "learning_rate": 4.183409758386234e-05, "loss": 0.0079, "step": 663970 }, { "epoch": 1.72, "learning_rate": 4.183020936749088e-05, "loss": 0.0081, "step": 663980 }, { "epoch": 1.72, "learning_rate": 4.182632115111941e-05, "loss": 0.0068, "step": 663990 }, { "epoch": 1.72, "learning_rate": 4.1822432934747954e-05, "loss": 0.0069, "step": 664000 }, { "epoch": 1.72, "eval_cer": 0.8816536990304715, "eval_loss": 0.0050833625718951225, "eval_runtime": 107.9937, "eval_samples_per_second": 18.52, "eval_steps_per_second": 4.63, "step": 664000 }, { "epoch": 1.72, "learning_rate": 4.181854471837649e-05, "loss": 0.0101, "step": 664010 }, { "epoch": 1.72, "learning_rate": 4.1814656502005024e-05, "loss": 0.0087, "step": 664020 }, { "epoch": 1.72, "learning_rate": 4.181076828563356e-05, "loss": 0.0086, "step": 664030 }, { "epoch": 1.72, "learning_rate": 4.1806880069262094e-05, "loss": 0.0108, "step": 664040 }, { "epoch": 1.72, "learning_rate": 4.180299185289063e-05, "loss": 0.0092, "step": 664050 }, { "epoch": 1.72, "learning_rate": 4.179910363651916e-05, "loss": 0.0067, "step": 664060 }, { "epoch": 1.72, "learning_rate": 4.179521542014769e-05, "loss": 0.0079, "step": 664070 }, { "epoch": 1.72, "learning_rate": 4.1791327203776227e-05, "loss": 0.0079, "step": 664080 }, { "epoch": 1.72, "learning_rate": 4.178743898740476e-05, "loss": 0.0077, "step": 664090 }, { "epoch": 1.72, "learning_rate": 4.17835507710333e-05, "loss": 0.0068, "step": 664100 }, { "epoch": 1.72, "learning_rate": 4.177966255466184e-05, "loss": 0.0065, "step": 664110 }, { "epoch": 1.72, "learning_rate": 4.177577433829037e-05, "loss": 0.0082, "step": 664120 }, { "epoch": 1.72, "learning_rate": 4.177188612191891e-05, "loss": 0.0058, "step": 664130 }, { "epoch": 1.72, "learning_rate": 4.176799790554744e-05, "loss": 0.0132, "step": 664140 }, { "epoch": 1.72, "learning_rate": 4.176410968917598e-05, "loss": 0.0088, "step": 664150 }, { "epoch": 1.72, "learning_rate": 4.176022147280451e-05, "loss": 0.0083, "step": 664160 }, { "epoch": 1.72, "learning_rate": 4.175633325643305e-05, "loss": 0.0071, "step": 664170 }, { "epoch": 1.72, "learning_rate": 4.175244504006159e-05, "loss": 0.0084, "step": 664180 }, { "epoch": 1.72, "learning_rate": 4.1748556823690124e-05, "loss": 0.0067, "step": 664190 }, { "epoch": 1.72, "learning_rate": 4.174466860731866e-05, "loss": 0.008, "step": 664200 }, { "epoch": 1.72, "learning_rate": 4.174078039094719e-05, "loss": 0.0092, "step": 664210 }, { "epoch": 1.72, "learning_rate": 4.173689217457573e-05, "loss": 0.0076, "step": 664220 }, { "epoch": 1.72, "learning_rate": 4.173300395820426e-05, "loss": 0.0078, "step": 664230 }, { "epoch": 1.72, "learning_rate": 4.17291157418328e-05, "loss": 0.0091, "step": 664240 }, { "epoch": 1.72, "learning_rate": 4.172522752546133e-05, "loss": 0.0136, "step": 664250 }, { "epoch": 1.72, "learning_rate": 4.1721339309089874e-05, "loss": 0.0069, "step": 664260 }, { "epoch": 1.72, "learning_rate": 4.171745109271841e-05, "loss": 0.0071, "step": 664270 }, { "epoch": 1.72, "learning_rate": 4.1713562876346944e-05, "loss": 0.0066, "step": 664280 }, { "epoch": 1.72, "learning_rate": 4.170967465997548e-05, "loss": 0.0114, "step": 664290 }, { "epoch": 1.72, "learning_rate": 4.1705786443604014e-05, "loss": 0.0105, "step": 664300 }, { "epoch": 1.72, "learning_rate": 4.170189822723254e-05, "loss": 0.0078, "step": 664310 }, { "epoch": 1.72, "learning_rate": 4.169801001086108e-05, "loss": 0.0086, "step": 664320 }, { "epoch": 1.72, "learning_rate": 4.169412179448961e-05, "loss": 0.0083, "step": 664330 }, { "epoch": 1.72, "learning_rate": 4.1690233578118147e-05, "loss": 0.0071, "step": 664340 }, { "epoch": 1.72, "learning_rate": 4.168634536174668e-05, "loss": 0.0069, "step": 664350 }, { "epoch": 1.72, "learning_rate": 4.168245714537522e-05, "loss": 0.0111, "step": 664360 }, { "epoch": 1.72, "learning_rate": 4.167856892900376e-05, "loss": 0.0065, "step": 664370 }, { "epoch": 1.72, "learning_rate": 4.167468071263229e-05, "loss": 0.012, "step": 664380 }, { "epoch": 1.72, "learning_rate": 4.167079249626083e-05, "loss": 0.008, "step": 664390 }, { "epoch": 1.72, "learning_rate": 4.166690427988936e-05, "loss": 0.0098, "step": 664400 }, { "epoch": 1.72, "learning_rate": 4.16630160635179e-05, "loss": 0.0059, "step": 664410 }, { "epoch": 1.72, "learning_rate": 4.165912784714643e-05, "loss": 0.0106, "step": 664420 }, { "epoch": 1.72, "learning_rate": 4.165523963077497e-05, "loss": 0.0097, "step": 664430 }, { "epoch": 1.72, "learning_rate": 4.165135141440351e-05, "loss": 0.0089, "step": 664440 }, { "epoch": 1.72, "learning_rate": 4.1647463198032044e-05, "loss": 0.0088, "step": 664450 }, { "epoch": 1.72, "learning_rate": 4.164357498166058e-05, "loss": 0.0081, "step": 664460 }, { "epoch": 1.72, "learning_rate": 4.163968676528911e-05, "loss": 0.0082, "step": 664470 }, { "epoch": 1.72, "learning_rate": 4.163579854891765e-05, "loss": 0.0092, "step": 664480 }, { "epoch": 1.72, "learning_rate": 4.163191033254618e-05, "loss": 0.0084, "step": 664490 }, { "epoch": 1.72, "learning_rate": 4.162802211617472e-05, "loss": 0.0061, "step": 664500 }, { "epoch": 1.72, "learning_rate": 4.162413389980325e-05, "loss": 0.007, "step": 664510 }, { "epoch": 1.72, "learning_rate": 4.1620245683431794e-05, "loss": 0.0059, "step": 664520 }, { "epoch": 1.72, "learning_rate": 4.161635746706033e-05, "loss": 0.0074, "step": 664530 }, { "epoch": 1.72, "learning_rate": 4.1612469250688864e-05, "loss": 0.0066, "step": 664540 }, { "epoch": 1.72, "learning_rate": 4.16085810343174e-05, "loss": 0.0058, "step": 664550 }, { "epoch": 1.72, "learning_rate": 4.160469281794593e-05, "loss": 0.0065, "step": 664560 }, { "epoch": 1.72, "learning_rate": 4.160080460157446e-05, "loss": 0.009, "step": 664570 }, { "epoch": 1.72, "learning_rate": 4.1596916385203e-05, "loss": 0.0076, "step": 664580 }, { "epoch": 1.72, "learning_rate": 4.159302816883153e-05, "loss": 0.0078, "step": 664590 }, { "epoch": 1.72, "learning_rate": 4.1589139952460067e-05, "loss": 0.0108, "step": 664600 }, { "epoch": 1.72, "learning_rate": 4.15852517360886e-05, "loss": 0.0056, "step": 664610 }, { "epoch": 1.72, "learning_rate": 4.158136351971714e-05, "loss": 0.0086, "step": 664620 }, { "epoch": 1.72, "learning_rate": 4.157747530334568e-05, "loss": 0.0103, "step": 664630 }, { "epoch": 1.72, "learning_rate": 4.157358708697421e-05, "loss": 0.006, "step": 664640 }, { "epoch": 1.72, "learning_rate": 4.156969887060275e-05, "loss": 0.01, "step": 664650 }, { "epoch": 1.72, "learning_rate": 4.156581065423128e-05, "loss": 0.0062, "step": 664660 }, { "epoch": 1.72, "learning_rate": 4.156192243785982e-05, "loss": 0.0079, "step": 664670 }, { "epoch": 1.72, "learning_rate": 4.155803422148835e-05, "loss": 0.0063, "step": 664680 }, { "epoch": 1.72, "learning_rate": 4.155414600511689e-05, "loss": 0.011, "step": 664690 }, { "epoch": 1.72, "learning_rate": 4.155025778874542e-05, "loss": 0.0065, "step": 664700 }, { "epoch": 1.72, "learning_rate": 4.1546369572373964e-05, "loss": 0.0094, "step": 664710 }, { "epoch": 1.72, "learning_rate": 4.15424813560025e-05, "loss": 0.0092, "step": 664720 }, { "epoch": 1.72, "learning_rate": 4.153859313963103e-05, "loss": 0.0067, "step": 664730 }, { "epoch": 1.72, "learning_rate": 4.153470492325957e-05, "loss": 0.0085, "step": 664740 }, { "epoch": 1.72, "learning_rate": 4.15308167068881e-05, "loss": 0.009, "step": 664750 }, { "epoch": 1.72, "learning_rate": 4.152692849051664e-05, "loss": 0.0066, "step": 664760 }, { "epoch": 1.72, "learning_rate": 4.152304027414517e-05, "loss": 0.0094, "step": 664770 }, { "epoch": 1.72, "learning_rate": 4.151915205777371e-05, "loss": 0.0068, "step": 664780 }, { "epoch": 1.72, "learning_rate": 4.151526384140225e-05, "loss": 0.0075, "step": 664790 }, { "epoch": 1.72, "learning_rate": 4.1511375625030784e-05, "loss": 0.0086, "step": 664800 }, { "epoch": 1.72, "learning_rate": 4.150748740865931e-05, "loss": 0.0079, "step": 664810 }, { "epoch": 1.72, "learning_rate": 4.150359919228785e-05, "loss": 0.0073, "step": 664820 }, { "epoch": 1.72, "learning_rate": 4.149971097591638e-05, "loss": 0.0097, "step": 664830 }, { "epoch": 1.72, "learning_rate": 4.149582275954492e-05, "loss": 0.0118, "step": 664840 }, { "epoch": 1.72, "learning_rate": 4.149193454317345e-05, "loss": 0.0073, "step": 664850 }, { "epoch": 1.72, "learning_rate": 4.1488046326801986e-05, "loss": 0.009, "step": 664860 }, { "epoch": 1.72, "learning_rate": 4.148415811043052e-05, "loss": 0.0076, "step": 664870 }, { "epoch": 1.72, "learning_rate": 4.1480269894059056e-05, "loss": 0.0069, "step": 664880 }, { "epoch": 1.72, "learning_rate": 4.14763816776876e-05, "loss": 0.0072, "step": 664890 }, { "epoch": 1.72, "learning_rate": 4.147249346131613e-05, "loss": 0.009, "step": 664900 }, { "epoch": 1.72, "learning_rate": 4.146860524494467e-05, "loss": 0.0118, "step": 664910 }, { "epoch": 1.72, "learning_rate": 4.14647170285732e-05, "loss": 0.0091, "step": 664920 }, { "epoch": 1.72, "learning_rate": 4.146082881220174e-05, "loss": 0.0112, "step": 664930 }, { "epoch": 1.72, "learning_rate": 4.145694059583027e-05, "loss": 0.0082, "step": 664940 }, { "epoch": 1.72, "learning_rate": 4.145305237945881e-05, "loss": 0.007, "step": 664950 }, { "epoch": 1.72, "learning_rate": 4.144916416308734e-05, "loss": 0.0095, "step": 664960 }, { "epoch": 1.72, "learning_rate": 4.1445275946715883e-05, "loss": 0.0092, "step": 664970 }, { "epoch": 1.72, "learning_rate": 4.144138773034442e-05, "loss": 0.0082, "step": 664980 }, { "epoch": 1.72, "learning_rate": 4.143749951397295e-05, "loss": 0.0077, "step": 664990 }, { "epoch": 1.72, "learning_rate": 4.143361129760149e-05, "loss": 0.0068, "step": 665000 }, { "epoch": 1.72, "eval_cer": 0.8816620968520765, "eval_loss": 0.004966807551681995, "eval_runtime": 107.8902, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 665000 }, { "epoch": 1.72, "learning_rate": 4.142972308123002e-05, "loss": 0.0067, "step": 665010 }, { "epoch": 1.72, "learning_rate": 4.142583486485856e-05, "loss": 0.0095, "step": 665020 }, { "epoch": 1.72, "learning_rate": 4.142194664848709e-05, "loss": 0.0089, "step": 665030 }, { "epoch": 1.72, "learning_rate": 4.141805843211563e-05, "loss": 0.0061, "step": 665040 }, { "epoch": 1.72, "learning_rate": 4.1414170215744156e-05, "loss": 0.0104, "step": 665050 }, { "epoch": 1.72, "learning_rate": 4.141028199937269e-05, "loss": 0.0076, "step": 665060 }, { "epoch": 1.72, "learning_rate": 4.140639378300123e-05, "loss": 0.0071, "step": 665070 }, { "epoch": 1.72, "learning_rate": 4.140250556662977e-05, "loss": 0.0062, "step": 665080 }, { "epoch": 1.72, "learning_rate": 4.13986173502583e-05, "loss": 0.0087, "step": 665090 }, { "epoch": 1.72, "learning_rate": 4.139472913388684e-05, "loss": 0.0062, "step": 665100 }, { "epoch": 1.72, "learning_rate": 4.139084091751537e-05, "loss": 0.0091, "step": 665110 }, { "epoch": 1.72, "learning_rate": 4.1386952701143906e-05, "loss": 0.0074, "step": 665120 }, { "epoch": 1.72, "learning_rate": 4.138306448477244e-05, "loss": 0.0089, "step": 665130 }, { "epoch": 1.72, "learning_rate": 4.1379176268400976e-05, "loss": 0.0077, "step": 665140 }, { "epoch": 1.72, "learning_rate": 4.137528805202952e-05, "loss": 0.0075, "step": 665150 }, { "epoch": 1.72, "learning_rate": 4.137139983565805e-05, "loss": 0.0071, "step": 665160 }, { "epoch": 1.72, "learning_rate": 4.136751161928659e-05, "loss": 0.0089, "step": 665170 }, { "epoch": 1.72, "learning_rate": 4.136362340291512e-05, "loss": 0.0083, "step": 665180 }, { "epoch": 1.72, "learning_rate": 4.135973518654366e-05, "loss": 0.0092, "step": 665190 }, { "epoch": 1.72, "learning_rate": 4.135584697017219e-05, "loss": 0.0095, "step": 665200 }, { "epoch": 1.72, "learning_rate": 4.135195875380073e-05, "loss": 0.0084, "step": 665210 }, { "epoch": 1.72, "learning_rate": 4.134807053742926e-05, "loss": 0.0079, "step": 665220 }, { "epoch": 1.72, "learning_rate": 4.1344182321057803e-05, "loss": 0.0134, "step": 665230 }, { "epoch": 1.72, "learning_rate": 4.134029410468634e-05, "loss": 0.0083, "step": 665240 }, { "epoch": 1.72, "learning_rate": 4.133640588831487e-05, "loss": 0.0071, "step": 665250 }, { "epoch": 1.72, "learning_rate": 4.133251767194341e-05, "loss": 0.0056, "step": 665260 }, { "epoch": 1.72, "learning_rate": 4.132862945557194e-05, "loss": 0.0082, "step": 665270 }, { "epoch": 1.72, "learning_rate": 4.132474123920048e-05, "loss": 0.009, "step": 665280 }, { "epoch": 1.72, "learning_rate": 4.132085302282901e-05, "loss": 0.0051, "step": 665290 }, { "epoch": 1.72, "learning_rate": 4.131696480645754e-05, "loss": 0.0077, "step": 665300 }, { "epoch": 1.72, "learning_rate": 4.1313076590086076e-05, "loss": 0.0069, "step": 665310 }, { "epoch": 1.72, "learning_rate": 4.130918837371461e-05, "loss": 0.0076, "step": 665320 }, { "epoch": 1.72, "learning_rate": 4.130530015734315e-05, "loss": 0.0052, "step": 665330 }, { "epoch": 1.72, "learning_rate": 4.130141194097169e-05, "loss": 0.0096, "step": 665340 }, { "epoch": 1.72, "learning_rate": 4.129752372460022e-05, "loss": 0.0102, "step": 665350 }, { "epoch": 1.72, "learning_rate": 4.129363550822876e-05, "loss": 0.0086, "step": 665360 }, { "epoch": 1.72, "learning_rate": 4.128974729185729e-05, "loss": 0.0075, "step": 665370 }, { "epoch": 1.72, "learning_rate": 4.1285859075485826e-05, "loss": 0.0059, "step": 665380 }, { "epoch": 1.72, "learning_rate": 4.128197085911436e-05, "loss": 0.0079, "step": 665390 }, { "epoch": 1.72, "learning_rate": 4.1278082642742896e-05, "loss": 0.0077, "step": 665400 }, { "epoch": 1.72, "learning_rate": 4.127419442637144e-05, "loss": 0.0075, "step": 665410 }, { "epoch": 1.72, "learning_rate": 4.127030620999997e-05, "loss": 0.008, "step": 665420 }, { "epoch": 1.72, "learning_rate": 4.126641799362851e-05, "loss": 0.011, "step": 665430 }, { "epoch": 1.72, "learning_rate": 4.126252977725704e-05, "loss": 0.0068, "step": 665440 }, { "epoch": 1.72, "learning_rate": 4.125864156088558e-05, "loss": 0.0065, "step": 665450 }, { "epoch": 1.72, "learning_rate": 4.125475334451411e-05, "loss": 0.0066, "step": 665460 }, { "epoch": 1.72, "learning_rate": 4.125086512814265e-05, "loss": 0.0082, "step": 665470 }, { "epoch": 1.73, "learning_rate": 4.124697691177118e-05, "loss": 0.0071, "step": 665480 }, { "epoch": 1.73, "learning_rate": 4.124308869539972e-05, "loss": 0.0082, "step": 665490 }, { "epoch": 1.73, "learning_rate": 4.123920047902826e-05, "loss": 0.0099, "step": 665500 }, { "epoch": 1.73, "learning_rate": 4.123531226265679e-05, "loss": 0.009, "step": 665510 }, { "epoch": 1.73, "learning_rate": 4.123142404628533e-05, "loss": 0.0061, "step": 665520 }, { "epoch": 1.73, "learning_rate": 4.122753582991386e-05, "loss": 0.0067, "step": 665530 }, { "epoch": 1.73, "learning_rate": 4.12236476135424e-05, "loss": 0.0084, "step": 665540 }, { "epoch": 1.73, "learning_rate": 4.1219759397170926e-05, "loss": 0.0073, "step": 665550 }, { "epoch": 1.73, "learning_rate": 4.121587118079946e-05, "loss": 0.0065, "step": 665560 }, { "epoch": 1.73, "learning_rate": 4.1211982964427996e-05, "loss": 0.0101, "step": 665570 }, { "epoch": 1.73, "learning_rate": 4.120809474805653e-05, "loss": 0.0061, "step": 665580 }, { "epoch": 1.73, "learning_rate": 4.120420653168507e-05, "loss": 0.0073, "step": 665590 }, { "epoch": 1.73, "learning_rate": 4.120031831531361e-05, "loss": 0.0102, "step": 665600 }, { "epoch": 1.73, "learning_rate": 4.119643009894214e-05, "loss": 0.0089, "step": 665610 }, { "epoch": 1.73, "learning_rate": 4.1192541882570677e-05, "loss": 0.007, "step": 665620 }, { "epoch": 1.73, "learning_rate": 4.118865366619921e-05, "loss": 0.0091, "step": 665630 }, { "epoch": 1.73, "learning_rate": 4.1184765449827746e-05, "loss": 0.0061, "step": 665640 }, { "epoch": 1.73, "learning_rate": 4.118087723345628e-05, "loss": 0.0074, "step": 665650 }, { "epoch": 1.73, "learning_rate": 4.1176989017084816e-05, "loss": 0.0077, "step": 665660 }, { "epoch": 1.73, "learning_rate": 4.117310080071336e-05, "loss": 0.0089, "step": 665670 }, { "epoch": 1.73, "learning_rate": 4.116921258434189e-05, "loss": 0.0075, "step": 665680 }, { "epoch": 1.73, "learning_rate": 4.116532436797043e-05, "loss": 0.0074, "step": 665690 }, { "epoch": 1.73, "learning_rate": 4.116143615159896e-05, "loss": 0.0084, "step": 665700 }, { "epoch": 1.73, "learning_rate": 4.11575479352275e-05, "loss": 0.0082, "step": 665710 }, { "epoch": 1.73, "learning_rate": 4.115365971885603e-05, "loss": 0.0067, "step": 665720 }, { "epoch": 1.73, "learning_rate": 4.114977150248457e-05, "loss": 0.0071, "step": 665730 }, { "epoch": 1.73, "learning_rate": 4.11458832861131e-05, "loss": 0.0069, "step": 665740 }, { "epoch": 1.73, "learning_rate": 4.114199506974164e-05, "loss": 0.0069, "step": 665750 }, { "epoch": 1.73, "learning_rate": 4.113810685337018e-05, "loss": 0.0079, "step": 665760 }, { "epoch": 1.73, "learning_rate": 4.113421863699871e-05, "loss": 0.0071, "step": 665770 }, { "epoch": 1.73, "learning_rate": 4.113033042062725e-05, "loss": 0.0057, "step": 665780 }, { "epoch": 1.73, "learning_rate": 4.112644220425578e-05, "loss": 0.0054, "step": 665790 }, { "epoch": 1.73, "learning_rate": 4.112255398788431e-05, "loss": 0.0112, "step": 665800 }, { "epoch": 1.73, "learning_rate": 4.1118665771512846e-05, "loss": 0.0096, "step": 665810 }, { "epoch": 1.73, "learning_rate": 4.111477755514138e-05, "loss": 0.0087, "step": 665820 }, { "epoch": 1.73, "learning_rate": 4.1110889338769915e-05, "loss": 0.0088, "step": 665830 }, { "epoch": 1.73, "learning_rate": 4.110700112239845e-05, "loss": 0.0068, "step": 665840 }, { "epoch": 1.73, "learning_rate": 4.110311290602699e-05, "loss": 0.0099, "step": 665850 }, { "epoch": 1.73, "learning_rate": 4.109922468965553e-05, "loss": 0.0083, "step": 665860 }, { "epoch": 1.73, "learning_rate": 4.109533647328406e-05, "loss": 0.0072, "step": 665870 }, { "epoch": 1.73, "learning_rate": 4.1091448256912597e-05, "loss": 0.0089, "step": 665880 }, { "epoch": 1.73, "learning_rate": 4.108756004054113e-05, "loss": 0.009, "step": 665890 }, { "epoch": 1.73, "learning_rate": 4.1083671824169666e-05, "loss": 0.0101, "step": 665900 }, { "epoch": 1.73, "learning_rate": 4.10797836077982e-05, "loss": 0.0058, "step": 665910 }, { "epoch": 1.73, "learning_rate": 4.1075895391426736e-05, "loss": 0.0095, "step": 665920 }, { "epoch": 1.73, "learning_rate": 4.107200717505528e-05, "loss": 0.0072, "step": 665930 }, { "epoch": 1.73, "learning_rate": 4.106811895868381e-05, "loss": 0.009, "step": 665940 }, { "epoch": 1.73, "learning_rate": 4.106423074231235e-05, "loss": 0.0085, "step": 665950 }, { "epoch": 1.73, "learning_rate": 4.106034252594088e-05, "loss": 0.0097, "step": 665960 }, { "epoch": 1.73, "learning_rate": 4.105645430956942e-05, "loss": 0.009, "step": 665970 }, { "epoch": 1.73, "learning_rate": 4.105256609319795e-05, "loss": 0.0086, "step": 665980 }, { "epoch": 1.73, "learning_rate": 4.104867787682649e-05, "loss": 0.0063, "step": 665990 }, { "epoch": 1.73, "learning_rate": 4.104478966045502e-05, "loss": 0.0063, "step": 666000 }, { "epoch": 1.73, "eval_cer": 0.8816746935844841, "eval_loss": 0.005011801607906818, "eval_runtime": 107.759, "eval_samples_per_second": 18.56, "eval_steps_per_second": 4.64, "step": 666000 }, { "epoch": 1.73, "learning_rate": 4.1040901444083557e-05, "loss": 0.0064, "step": 666010 }, { "epoch": 1.73, "learning_rate": 4.10370132277121e-05, "loss": 0.0094, "step": 666020 }, { "epoch": 1.73, "learning_rate": 4.103312501134063e-05, "loss": 0.0114, "step": 666030 }, { "epoch": 1.73, "learning_rate": 4.102923679496917e-05, "loss": 0.0072, "step": 666040 }, { "epoch": 1.73, "learning_rate": 4.1025348578597696e-05, "loss": 0.0058, "step": 666050 }, { "epoch": 1.73, "learning_rate": 4.102146036222623e-05, "loss": 0.0075, "step": 666060 }, { "epoch": 1.73, "learning_rate": 4.1017572145854766e-05, "loss": 0.0094, "step": 666070 }, { "epoch": 1.73, "learning_rate": 4.10136839294833e-05, "loss": 0.01, "step": 666080 }, { "epoch": 1.73, "learning_rate": 4.1009795713111835e-05, "loss": 0.0104, "step": 666090 }, { "epoch": 1.73, "learning_rate": 4.100590749674037e-05, "loss": 0.0071, "step": 666100 }, { "epoch": 1.73, "learning_rate": 4.1002019280368905e-05, "loss": 0.0085, "step": 666110 }, { "epoch": 1.73, "learning_rate": 4.099813106399745e-05, "loss": 0.0076, "step": 666120 }, { "epoch": 1.73, "learning_rate": 4.099424284762598e-05, "loss": 0.0066, "step": 666130 }, { "epoch": 1.73, "learning_rate": 4.0990354631254516e-05, "loss": 0.0073, "step": 666140 }, { "epoch": 1.73, "learning_rate": 4.098646641488305e-05, "loss": 0.0069, "step": 666150 }, { "epoch": 1.73, "learning_rate": 4.0982578198511586e-05, "loss": 0.0063, "step": 666160 }, { "epoch": 1.73, "learning_rate": 4.097868998214012e-05, "loss": 0.0083, "step": 666170 }, { "epoch": 1.73, "learning_rate": 4.0974801765768656e-05, "loss": 0.0073, "step": 666180 }, { "epoch": 1.73, "learning_rate": 4.097091354939719e-05, "loss": 0.0079, "step": 666190 }, { "epoch": 1.73, "learning_rate": 4.096702533302573e-05, "loss": 0.008, "step": 666200 }, { "epoch": 1.73, "learning_rate": 4.096313711665427e-05, "loss": 0.0091, "step": 666210 }, { "epoch": 1.73, "learning_rate": 4.09592489002828e-05, "loss": 0.0071, "step": 666220 }, { "epoch": 1.73, "learning_rate": 4.095536068391134e-05, "loss": 0.0056, "step": 666230 }, { "epoch": 1.73, "learning_rate": 4.095147246753987e-05, "loss": 0.0057, "step": 666240 }, { "epoch": 1.73, "learning_rate": 4.094758425116841e-05, "loss": 0.0108, "step": 666250 }, { "epoch": 1.73, "learning_rate": 4.094369603479694e-05, "loss": 0.0062, "step": 666260 }, { "epoch": 1.73, "learning_rate": 4.0939807818425476e-05, "loss": 0.0075, "step": 666270 }, { "epoch": 1.73, "learning_rate": 4.093591960205402e-05, "loss": 0.0062, "step": 666280 }, { "epoch": 1.73, "learning_rate": 4.093203138568255e-05, "loss": 0.0075, "step": 666290 }, { "epoch": 1.73, "learning_rate": 4.092814316931108e-05, "loss": 0.0076, "step": 666300 }, { "epoch": 1.73, "learning_rate": 4.0924254952939616e-05, "loss": 0.0074, "step": 666310 }, { "epoch": 1.73, "learning_rate": 4.092036673656815e-05, "loss": 0.0077, "step": 666320 }, { "epoch": 1.73, "learning_rate": 4.0916478520196686e-05, "loss": 0.0054, "step": 666330 }, { "epoch": 1.73, "learning_rate": 4.091259030382522e-05, "loss": 0.0085, "step": 666340 }, { "epoch": 1.73, "learning_rate": 4.0908702087453755e-05, "loss": 0.0073, "step": 666350 }, { "epoch": 1.73, "learning_rate": 4.090481387108229e-05, "loss": 0.0089, "step": 666360 }, { "epoch": 1.73, "learning_rate": 4.0900925654710825e-05, "loss": 0.0069, "step": 666370 }, { "epoch": 1.73, "learning_rate": 4.089703743833937e-05, "loss": 0.006, "step": 666380 }, { "epoch": 1.73, "learning_rate": 4.08931492219679e-05, "loss": 0.0069, "step": 666390 }, { "epoch": 1.73, "learning_rate": 4.0889261005596436e-05, "loss": 0.0092, "step": 666400 }, { "epoch": 1.73, "learning_rate": 4.088537278922497e-05, "loss": 0.0079, "step": 666410 }, { "epoch": 1.73, "learning_rate": 4.0881484572853506e-05, "loss": 0.0095, "step": 666420 }, { "epoch": 1.73, "learning_rate": 4.087759635648204e-05, "loss": 0.0104, "step": 666430 }, { "epoch": 1.73, "learning_rate": 4.0873708140110576e-05, "loss": 0.0088, "step": 666440 }, { "epoch": 1.73, "learning_rate": 4.086981992373911e-05, "loss": 0.0074, "step": 666450 }, { "epoch": 1.73, "learning_rate": 4.086593170736765e-05, "loss": 0.0082, "step": 666460 }, { "epoch": 1.73, "learning_rate": 4.086204349099619e-05, "loss": 0.01, "step": 666470 }, { "epoch": 1.73, "learning_rate": 4.085815527462472e-05, "loss": 0.0075, "step": 666480 }, { "epoch": 1.73, "learning_rate": 4.085426705825326e-05, "loss": 0.0066, "step": 666490 }, { "epoch": 1.73, "learning_rate": 4.085037884188179e-05, "loss": 0.0061, "step": 666500 }, { "epoch": 1.73, "learning_rate": 4.084649062551033e-05, "loss": 0.0071, "step": 666510 }, { "epoch": 1.73, "learning_rate": 4.084260240913886e-05, "loss": 0.0057, "step": 666520 }, { "epoch": 1.73, "learning_rate": 4.0838714192767396e-05, "loss": 0.0074, "step": 666530 }, { "epoch": 1.73, "learning_rate": 4.0834825976395925e-05, "loss": 0.0063, "step": 666540 }, { "epoch": 1.73, "learning_rate": 4.083093776002446e-05, "loss": 0.0079, "step": 666550 }, { "epoch": 1.73, "learning_rate": 4.0827049543653e-05, "loss": 0.006, "step": 666560 }, { "epoch": 1.73, "learning_rate": 4.0823161327281536e-05, "loss": 0.0119, "step": 666570 }, { "epoch": 1.73, "learning_rate": 4.081927311091007e-05, "loss": 0.0088, "step": 666580 }, { "epoch": 1.73, "learning_rate": 4.0815384894538606e-05, "loss": 0.0071, "step": 666590 }, { "epoch": 1.73, "learning_rate": 4.081149667816714e-05, "loss": 0.0056, "step": 666600 }, { "epoch": 1.73, "learning_rate": 4.0807608461795675e-05, "loss": 0.006, "step": 666610 }, { "epoch": 1.73, "learning_rate": 4.080372024542421e-05, "loss": 0.0078, "step": 666620 }, { "epoch": 1.73, "learning_rate": 4.0799832029052745e-05, "loss": 0.0066, "step": 666630 }, { "epoch": 1.73, "learning_rate": 4.079594381268129e-05, "loss": 0.0082, "step": 666640 }, { "epoch": 1.73, "learning_rate": 4.079205559630982e-05, "loss": 0.0061, "step": 666650 }, { "epoch": 1.73, "learning_rate": 4.0788167379938356e-05, "loss": 0.0072, "step": 666660 }, { "epoch": 1.73, "learning_rate": 4.078427916356689e-05, "loss": 0.0104, "step": 666670 }, { "epoch": 1.73, "learning_rate": 4.0780390947195426e-05, "loss": 0.0073, "step": 666680 }, { "epoch": 1.73, "learning_rate": 4.077650273082396e-05, "loss": 0.0074, "step": 666690 }, { "epoch": 1.73, "learning_rate": 4.0772614514452496e-05, "loss": 0.0072, "step": 666700 }, { "epoch": 1.73, "learning_rate": 4.076872629808103e-05, "loss": 0.0098, "step": 666710 }, { "epoch": 1.73, "learning_rate": 4.076483808170957e-05, "loss": 0.0083, "step": 666720 }, { "epoch": 1.73, "learning_rate": 4.076094986533811e-05, "loss": 0.0082, "step": 666730 }, { "epoch": 1.73, "learning_rate": 4.075706164896664e-05, "loss": 0.0085, "step": 666740 }, { "epoch": 1.73, "learning_rate": 4.075317343259518e-05, "loss": 0.0095, "step": 666750 }, { "epoch": 1.73, "learning_rate": 4.074928521622371e-05, "loss": 0.0084, "step": 666760 }, { "epoch": 1.73, "learning_rate": 4.074539699985225e-05, "loss": 0.0087, "step": 666770 }, { "epoch": 1.73, "learning_rate": 4.074150878348078e-05, "loss": 0.0065, "step": 666780 }, { "epoch": 1.73, "learning_rate": 4.073762056710931e-05, "loss": 0.0096, "step": 666790 }, { "epoch": 1.73, "learning_rate": 4.0733732350737844e-05, "loss": 0.0084, "step": 666800 }, { "epoch": 1.73, "learning_rate": 4.072984413436638e-05, "loss": 0.0084, "step": 666810 }, { "epoch": 1.73, "learning_rate": 4.072595591799492e-05, "loss": 0.0053, "step": 666820 }, { "epoch": 1.73, "learning_rate": 4.0722067701623456e-05, "loss": 0.0065, "step": 666830 }, { "epoch": 1.73, "learning_rate": 4.071817948525199e-05, "loss": 0.0084, "step": 666840 }, { "epoch": 1.73, "learning_rate": 4.0714291268880526e-05, "loss": 0.0067, "step": 666850 }, { "epoch": 1.73, "learning_rate": 4.071040305250906e-05, "loss": 0.007, "step": 666860 }, { "epoch": 1.73, "learning_rate": 4.0706514836137595e-05, "loss": 0.0064, "step": 666870 }, { "epoch": 1.73, "learning_rate": 4.070262661976613e-05, "loss": 0.0084, "step": 666880 }, { "epoch": 1.73, "learning_rate": 4.0698738403394665e-05, "loss": 0.0076, "step": 666890 }, { "epoch": 1.73, "learning_rate": 4.069485018702321e-05, "loss": 0.0104, "step": 666900 }, { "epoch": 1.73, "learning_rate": 4.069096197065174e-05, "loss": 0.0063, "step": 666910 }, { "epoch": 1.73, "learning_rate": 4.0687073754280276e-05, "loss": 0.0071, "step": 666920 }, { "epoch": 1.73, "learning_rate": 4.068318553790881e-05, "loss": 0.0143, "step": 666930 }, { "epoch": 1.73, "learning_rate": 4.0679297321537346e-05, "loss": 0.008, "step": 666940 }, { "epoch": 1.73, "learning_rate": 4.067540910516588e-05, "loss": 0.0089, "step": 666950 }, { "epoch": 1.73, "learning_rate": 4.0671520888794416e-05, "loss": 0.0095, "step": 666960 }, { "epoch": 1.73, "learning_rate": 4.066763267242295e-05, "loss": 0.0065, "step": 666970 }, { "epoch": 1.73, "learning_rate": 4.066374445605149e-05, "loss": 0.009, "step": 666980 }, { "epoch": 1.73, "learning_rate": 4.065985623968003e-05, "loss": 0.0066, "step": 666990 }, { "epoch": 1.73, "learning_rate": 4.065596802330856e-05, "loss": 0.0083, "step": 667000 }, { "epoch": 1.73, "eval_cer": 0.8816704946736816, "eval_loss": 0.005013938993215561, "eval_runtime": 107.9123, "eval_samples_per_second": 18.534, "eval_steps_per_second": 4.633, "step": 667000 }, { "epoch": 1.73, "learning_rate": 4.06520798069371e-05, "loss": 0.0077, "step": 667010 }, { "epoch": 1.73, "learning_rate": 4.064819159056563e-05, "loss": 0.0072, "step": 667020 }, { "epoch": 1.73, "learning_rate": 4.0644303374194167e-05, "loss": 0.0095, "step": 667030 }, { "epoch": 1.73, "learning_rate": 4.0640415157822695e-05, "loss": 0.0068, "step": 667040 }, { "epoch": 1.73, "learning_rate": 4.063652694145123e-05, "loss": 0.0068, "step": 667050 }, { "epoch": 1.73, "learning_rate": 4.0632638725079764e-05, "loss": 0.0079, "step": 667060 }, { "epoch": 1.73, "learning_rate": 4.06287505087083e-05, "loss": 0.0094, "step": 667070 }, { "epoch": 1.73, "learning_rate": 4.062486229233684e-05, "loss": 0.0073, "step": 667080 }, { "epoch": 1.73, "learning_rate": 4.0620974075965376e-05, "loss": 0.0073, "step": 667090 }, { "epoch": 1.73, "learning_rate": 4.061708585959391e-05, "loss": 0.0056, "step": 667100 }, { "epoch": 1.73, "learning_rate": 4.0613197643222445e-05, "loss": 0.0104, "step": 667110 }, { "epoch": 1.73, "learning_rate": 4.060930942685098e-05, "loss": 0.0081, "step": 667120 }, { "epoch": 1.73, "learning_rate": 4.0605421210479515e-05, "loss": 0.0069, "step": 667130 }, { "epoch": 1.73, "learning_rate": 4.060153299410805e-05, "loss": 0.0053, "step": 667140 }, { "epoch": 1.73, "learning_rate": 4.0597644777736585e-05, "loss": 0.0073, "step": 667150 }, { "epoch": 1.73, "learning_rate": 4.0593756561365127e-05, "loss": 0.011, "step": 667160 }, { "epoch": 1.73, "learning_rate": 4.058986834499366e-05, "loss": 0.0113, "step": 667170 }, { "epoch": 1.73, "learning_rate": 4.0585980128622196e-05, "loss": 0.0082, "step": 667180 }, { "epoch": 1.73, "learning_rate": 4.058209191225073e-05, "loss": 0.0089, "step": 667190 }, { "epoch": 1.73, "learning_rate": 4.0578203695879266e-05, "loss": 0.0094, "step": 667200 }, { "epoch": 1.73, "learning_rate": 4.05743154795078e-05, "loss": 0.0066, "step": 667210 }, { "epoch": 1.73, "learning_rate": 4.0570427263136336e-05, "loss": 0.0077, "step": 667220 }, { "epoch": 1.73, "learning_rate": 4.056653904676487e-05, "loss": 0.0077, "step": 667230 }, { "epoch": 1.73, "learning_rate": 4.056265083039341e-05, "loss": 0.0082, "step": 667240 }, { "epoch": 1.73, "learning_rate": 4.055876261402195e-05, "loss": 0.0082, "step": 667250 }, { "epoch": 1.73, "learning_rate": 4.055487439765048e-05, "loss": 0.0075, "step": 667260 }, { "epoch": 1.73, "learning_rate": 4.055098618127902e-05, "loss": 0.0074, "step": 667270 }, { "epoch": 1.73, "learning_rate": 4.054709796490755e-05, "loss": 0.0065, "step": 667280 }, { "epoch": 1.73, "learning_rate": 4.054320974853608e-05, "loss": 0.0093, "step": 667290 }, { "epoch": 1.73, "learning_rate": 4.0539321532164615e-05, "loss": 0.0093, "step": 667300 }, { "epoch": 1.73, "learning_rate": 4.053543331579315e-05, "loss": 0.0129, "step": 667310 }, { "epoch": 1.73, "learning_rate": 4.0531545099421684e-05, "loss": 0.0105, "step": 667320 }, { "epoch": 1.73, "learning_rate": 4.052765688305022e-05, "loss": 0.0096, "step": 667330 }, { "epoch": 1.73, "learning_rate": 4.052376866667876e-05, "loss": 0.0091, "step": 667340 }, { "epoch": 1.73, "learning_rate": 4.0519880450307296e-05, "loss": 0.009, "step": 667350 }, { "epoch": 1.73, "learning_rate": 4.051599223393583e-05, "loss": 0.0086, "step": 667360 }, { "epoch": 1.73, "learning_rate": 4.0512104017564365e-05, "loss": 0.0083, "step": 667370 }, { "epoch": 1.73, "learning_rate": 4.05082158011929e-05, "loss": 0.008, "step": 667380 }, { "epoch": 1.73, "learning_rate": 4.0504327584821435e-05, "loss": 0.0066, "step": 667390 }, { "epoch": 1.73, "learning_rate": 4.050043936844997e-05, "loss": 0.0063, "step": 667400 }, { "epoch": 1.73, "learning_rate": 4.0496551152078505e-05, "loss": 0.0062, "step": 667410 }, { "epoch": 1.73, "learning_rate": 4.049266293570704e-05, "loss": 0.0078, "step": 667420 }, { "epoch": 1.73, "learning_rate": 4.048877471933558e-05, "loss": 0.0117, "step": 667430 }, { "epoch": 1.73, "learning_rate": 4.0484886502964116e-05, "loss": 0.0073, "step": 667440 }, { "epoch": 1.73, "learning_rate": 4.048099828659265e-05, "loss": 0.0069, "step": 667450 }, { "epoch": 1.73, "learning_rate": 4.0477110070221186e-05, "loss": 0.0074, "step": 667460 }, { "epoch": 1.73, "learning_rate": 4.047322185384972e-05, "loss": 0.0099, "step": 667470 }, { "epoch": 1.73, "learning_rate": 4.0469333637478256e-05, "loss": 0.0089, "step": 667480 }, { "epoch": 1.73, "learning_rate": 4.046544542110679e-05, "loss": 0.0071, "step": 667490 }, { "epoch": 1.73, "learning_rate": 4.0461557204735325e-05, "loss": 0.0071, "step": 667500 }, { "epoch": 1.73, "learning_rate": 4.045766898836387e-05, "loss": 0.0077, "step": 667510 }, { "epoch": 1.73, "learning_rate": 4.04537807719924e-05, "loss": 0.007, "step": 667520 }, { "epoch": 1.73, "learning_rate": 4.044989255562094e-05, "loss": 0.0121, "step": 667530 }, { "epoch": 1.73, "learning_rate": 4.0446004339249465e-05, "loss": 0.0083, "step": 667540 }, { "epoch": 1.73, "learning_rate": 4.0442116122878e-05, "loss": 0.0068, "step": 667550 }, { "epoch": 1.73, "learning_rate": 4.0438227906506535e-05, "loss": 0.008, "step": 667560 }, { "epoch": 1.73, "learning_rate": 4.043433969013507e-05, "loss": 0.0074, "step": 667570 }, { "epoch": 1.73, "learning_rate": 4.0430451473763604e-05, "loss": 0.0097, "step": 667580 }, { "epoch": 1.73, "learning_rate": 4.042656325739214e-05, "loss": 0.0072, "step": 667590 }, { "epoch": 1.73, "learning_rate": 4.0422675041020674e-05, "loss": 0.0071, "step": 667600 }, { "epoch": 1.73, "learning_rate": 4.0418786824649216e-05, "loss": 0.0076, "step": 667610 }, { "epoch": 1.73, "learning_rate": 4.041489860827775e-05, "loss": 0.0062, "step": 667620 }, { "epoch": 1.73, "learning_rate": 4.0411010391906285e-05, "loss": 0.009, "step": 667630 }, { "epoch": 1.73, "learning_rate": 4.040712217553482e-05, "loss": 0.0099, "step": 667640 }, { "epoch": 1.73, "learning_rate": 4.0403233959163355e-05, "loss": 0.0065, "step": 667650 }, { "epoch": 1.73, "learning_rate": 4.039934574279189e-05, "loss": 0.0091, "step": 667660 }, { "epoch": 1.73, "learning_rate": 4.0395457526420425e-05, "loss": 0.0066, "step": 667670 }, { "epoch": 1.73, "learning_rate": 4.039156931004896e-05, "loss": 0.01, "step": 667680 }, { "epoch": 1.73, "learning_rate": 4.03876810936775e-05, "loss": 0.0059, "step": 667690 }, { "epoch": 1.73, "learning_rate": 4.0383792877306036e-05, "loss": 0.0095, "step": 667700 }, { "epoch": 1.73, "learning_rate": 4.037990466093457e-05, "loss": 0.0076, "step": 667710 }, { "epoch": 1.73, "learning_rate": 4.0376016444563106e-05, "loss": 0.0096, "step": 667720 }, { "epoch": 1.73, "learning_rate": 4.037212822819164e-05, "loss": 0.0069, "step": 667730 }, { "epoch": 1.73, "learning_rate": 4.0368240011820176e-05, "loss": 0.0078, "step": 667740 }, { "epoch": 1.73, "learning_rate": 4.036435179544871e-05, "loss": 0.0079, "step": 667750 }, { "epoch": 1.73, "learning_rate": 4.0360463579077245e-05, "loss": 0.0081, "step": 667760 }, { "epoch": 1.73, "learning_rate": 4.035657536270579e-05, "loss": 0.0106, "step": 667770 }, { "epoch": 1.73, "learning_rate": 4.035268714633431e-05, "loss": 0.0066, "step": 667780 }, { "epoch": 1.73, "learning_rate": 4.034879892996285e-05, "loss": 0.0056, "step": 667790 }, { "epoch": 1.73, "learning_rate": 4.0344910713591385e-05, "loss": 0.0074, "step": 667800 }, { "epoch": 1.73, "learning_rate": 4.034102249721992e-05, "loss": 0.0078, "step": 667810 }, { "epoch": 1.73, "learning_rate": 4.0337134280848455e-05, "loss": 0.0066, "step": 667820 }, { "epoch": 1.73, "learning_rate": 4.033324606447699e-05, "loss": 0.0081, "step": 667830 }, { "epoch": 1.73, "learning_rate": 4.0329357848105524e-05, "loss": 0.0084, "step": 667840 }, { "epoch": 1.73, "learning_rate": 4.032546963173406e-05, "loss": 0.008, "step": 667850 }, { "epoch": 1.73, "learning_rate": 4.0321581415362594e-05, "loss": 0.0071, "step": 667860 }, { "epoch": 1.73, "learning_rate": 4.0317693198991136e-05, "loss": 0.0115, "step": 667870 }, { "epoch": 1.73, "learning_rate": 4.031380498261967e-05, "loss": 0.0075, "step": 667880 }, { "epoch": 1.73, "learning_rate": 4.0309916766248205e-05, "loss": 0.0073, "step": 667890 }, { "epoch": 1.73, "learning_rate": 4.030602854987674e-05, "loss": 0.006, "step": 667900 }, { "epoch": 1.73, "learning_rate": 4.0302140333505275e-05, "loss": 0.0109, "step": 667910 }, { "epoch": 1.73, "learning_rate": 4.029825211713381e-05, "loss": 0.0077, "step": 667920 }, { "epoch": 1.73, "learning_rate": 4.0294363900762345e-05, "loss": 0.0108, "step": 667930 }, { "epoch": 1.73, "learning_rate": 4.029047568439088e-05, "loss": 0.0077, "step": 667940 }, { "epoch": 1.73, "learning_rate": 4.028658746801942e-05, "loss": 0.0099, "step": 667950 }, { "epoch": 1.73, "learning_rate": 4.0282699251647956e-05, "loss": 0.0059, "step": 667960 }, { "epoch": 1.73, "learning_rate": 4.027881103527649e-05, "loss": 0.0082, "step": 667970 }, { "epoch": 1.73, "learning_rate": 4.0274922818905026e-05, "loss": 0.0104, "step": 667980 }, { "epoch": 1.73, "learning_rate": 4.027103460253356e-05, "loss": 0.0077, "step": 667990 }, { "epoch": 1.73, "learning_rate": 4.0267146386162096e-05, "loss": 0.0069, "step": 668000 }, { "epoch": 1.73, "eval_cer": 0.8816620968520765, "eval_loss": 0.005121828522533178, "eval_runtime": 107.7417, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 668000 }, { "epoch": 1.73, "learning_rate": 4.026325816979063e-05, "loss": 0.0053, "step": 668010 }, { "epoch": 1.73, "learning_rate": 4.0259369953419165e-05, "loss": 0.0096, "step": 668020 }, { "epoch": 1.73, "learning_rate": 4.0255481737047693e-05, "loss": 0.0078, "step": 668030 }, { "epoch": 1.73, "learning_rate": 4.025159352067623e-05, "loss": 0.0107, "step": 668040 }, { "epoch": 1.73, "learning_rate": 4.024770530430477e-05, "loss": 0.0074, "step": 668050 }, { "epoch": 1.73, "learning_rate": 4.0243817087933305e-05, "loss": 0.0083, "step": 668060 }, { "epoch": 1.73, "learning_rate": 4.023992887156184e-05, "loss": 0.0077, "step": 668070 }, { "epoch": 1.73, "learning_rate": 4.0236040655190374e-05, "loss": 0.0067, "step": 668080 }, { "epoch": 1.73, "learning_rate": 4.023215243881891e-05, "loss": 0.0066, "step": 668090 }, { "epoch": 1.73, "learning_rate": 4.0228264222447444e-05, "loss": 0.0081, "step": 668100 }, { "epoch": 1.73, "learning_rate": 4.022437600607598e-05, "loss": 0.0103, "step": 668110 }, { "epoch": 1.73, "learning_rate": 4.0220487789704514e-05, "loss": 0.0074, "step": 668120 }, { "epoch": 1.73, "learning_rate": 4.0216599573333056e-05, "loss": 0.0064, "step": 668130 }, { "epoch": 1.73, "learning_rate": 4.021271135696159e-05, "loss": 0.0093, "step": 668140 }, { "epoch": 1.73, "learning_rate": 4.0208823140590125e-05, "loss": 0.0088, "step": 668150 }, { "epoch": 1.73, "learning_rate": 4.020493492421866e-05, "loss": 0.0061, "step": 668160 }, { "epoch": 1.73, "learning_rate": 4.0201046707847195e-05, "loss": 0.0064, "step": 668170 }, { "epoch": 1.73, "learning_rate": 4.019715849147573e-05, "loss": 0.0065, "step": 668180 }, { "epoch": 1.73, "learning_rate": 4.0193270275104265e-05, "loss": 0.007, "step": 668190 }, { "epoch": 1.73, "learning_rate": 4.01893820587328e-05, "loss": 0.0109, "step": 668200 }, { "epoch": 1.73, "learning_rate": 4.018549384236134e-05, "loss": 0.0073, "step": 668210 }, { "epoch": 1.73, "learning_rate": 4.0181605625989876e-05, "loss": 0.0101, "step": 668220 }, { "epoch": 1.73, "learning_rate": 4.017771740961841e-05, "loss": 0.0088, "step": 668230 }, { "epoch": 1.73, "learning_rate": 4.0173829193246946e-05, "loss": 0.0069, "step": 668240 }, { "epoch": 1.73, "learning_rate": 4.016994097687548e-05, "loss": 0.0122, "step": 668250 }, { "epoch": 1.73, "learning_rate": 4.0166052760504016e-05, "loss": 0.0068, "step": 668260 }, { "epoch": 1.73, "learning_rate": 4.016216454413255e-05, "loss": 0.0099, "step": 668270 }, { "epoch": 1.73, "learning_rate": 4.015827632776108e-05, "loss": 0.0073, "step": 668280 }, { "epoch": 1.73, "learning_rate": 4.015438811138961e-05, "loss": 0.0082, "step": 668290 }, { "epoch": 1.73, "learning_rate": 4.015049989501815e-05, "loss": 0.0088, "step": 668300 }, { "epoch": 1.73, "learning_rate": 4.014661167864669e-05, "loss": 0.0079, "step": 668310 }, { "epoch": 1.73, "learning_rate": 4.0142723462275225e-05, "loss": 0.0085, "step": 668320 }, { "epoch": 1.73, "learning_rate": 4.013883524590376e-05, "loss": 0.0096, "step": 668330 }, { "epoch": 1.73, "learning_rate": 4.0134947029532294e-05, "loss": 0.0104, "step": 668340 }, { "epoch": 1.73, "learning_rate": 4.013105881316083e-05, "loss": 0.0096, "step": 668350 }, { "epoch": 1.73, "learning_rate": 4.0127170596789364e-05, "loss": 0.0094, "step": 668360 }, { "epoch": 1.73, "learning_rate": 4.01232823804179e-05, "loss": 0.0077, "step": 668370 }, { "epoch": 1.73, "learning_rate": 4.0119394164046434e-05, "loss": 0.007, "step": 668380 }, { "epoch": 1.73, "learning_rate": 4.0115505947674976e-05, "loss": 0.0085, "step": 668390 }, { "epoch": 1.73, "learning_rate": 4.011161773130351e-05, "loss": 0.0051, "step": 668400 }, { "epoch": 1.73, "learning_rate": 4.0107729514932045e-05, "loss": 0.0072, "step": 668410 }, { "epoch": 1.73, "learning_rate": 4.010384129856058e-05, "loss": 0.0092, "step": 668420 }, { "epoch": 1.73, "learning_rate": 4.0099953082189115e-05, "loss": 0.0075, "step": 668430 }, { "epoch": 1.73, "learning_rate": 4.009606486581765e-05, "loss": 0.006, "step": 668440 }, { "epoch": 1.73, "learning_rate": 4.0092176649446185e-05, "loss": 0.0061, "step": 668450 }, { "epoch": 1.73, "learning_rate": 4.008828843307472e-05, "loss": 0.0084, "step": 668460 }, { "epoch": 1.73, "learning_rate": 4.008440021670326e-05, "loss": 0.0088, "step": 668470 }, { "epoch": 1.73, "learning_rate": 4.0080512000331796e-05, "loss": 0.0073, "step": 668480 }, { "epoch": 1.73, "learning_rate": 4.007662378396033e-05, "loss": 0.0081, "step": 668490 }, { "epoch": 1.73, "learning_rate": 4.0072735567588866e-05, "loss": 0.009, "step": 668500 }, { "epoch": 1.73, "learning_rate": 4.00688473512174e-05, "loss": 0.0082, "step": 668510 }, { "epoch": 1.73, "learning_rate": 4.0064959134845936e-05, "loss": 0.0064, "step": 668520 }, { "epoch": 1.73, "learning_rate": 4.0061070918474464e-05, "loss": 0.0068, "step": 668530 }, { "epoch": 1.73, "learning_rate": 4.0057182702103e-05, "loss": 0.0072, "step": 668540 }, { "epoch": 1.73, "learning_rate": 4.005329448573153e-05, "loss": 0.0079, "step": 668550 }, { "epoch": 1.73, "learning_rate": 4.004940626936007e-05, "loss": 0.0073, "step": 668560 }, { "epoch": 1.73, "learning_rate": 4.004551805298861e-05, "loss": 0.0093, "step": 668570 }, { "epoch": 1.73, "learning_rate": 4.0041629836617145e-05, "loss": 0.0088, "step": 668580 }, { "epoch": 1.73, "learning_rate": 4.003774162024568e-05, "loss": 0.0093, "step": 668590 }, { "epoch": 1.73, "learning_rate": 4.0033853403874214e-05, "loss": 0.008, "step": 668600 }, { "epoch": 1.73, "learning_rate": 4.002996518750275e-05, "loss": 0.0098, "step": 668610 }, { "epoch": 1.73, "learning_rate": 4.0026076971131284e-05, "loss": 0.0115, "step": 668620 }, { "epoch": 1.73, "learning_rate": 4.002218875475982e-05, "loss": 0.0071, "step": 668630 }, { "epoch": 1.73, "learning_rate": 4.0018300538388354e-05, "loss": 0.0078, "step": 668640 }, { "epoch": 1.73, "learning_rate": 4.0014412322016895e-05, "loss": 0.0101, "step": 668650 }, { "epoch": 1.73, "learning_rate": 4.001052410564543e-05, "loss": 0.006, "step": 668660 }, { "epoch": 1.73, "learning_rate": 4.0006635889273965e-05, "loss": 0.0064, "step": 668670 }, { "epoch": 1.73, "learning_rate": 4.00027476729025e-05, "loss": 0.0091, "step": 668680 }, { "epoch": 1.73, "learning_rate": 3.9998859456531035e-05, "loss": 0.0062, "step": 668690 }, { "epoch": 1.73, "learning_rate": 3.999497124015957e-05, "loss": 0.0084, "step": 668700 }, { "epoch": 1.73, "learning_rate": 3.9991083023788105e-05, "loss": 0.0077, "step": 668710 }, { "epoch": 1.73, "learning_rate": 3.998719480741664e-05, "loss": 0.0081, "step": 668720 }, { "epoch": 1.73, "learning_rate": 3.9983306591045174e-05, "loss": 0.0074, "step": 668730 }, { "epoch": 1.73, "learning_rate": 3.9979418374673716e-05, "loss": 0.0079, "step": 668740 }, { "epoch": 1.73, "learning_rate": 3.997553015830225e-05, "loss": 0.0098, "step": 668750 }, { "epoch": 1.73, "learning_rate": 3.9971641941930786e-05, "loss": 0.0092, "step": 668760 }, { "epoch": 1.73, "learning_rate": 3.996775372555932e-05, "loss": 0.0094, "step": 668770 }, { "epoch": 1.73, "learning_rate": 3.996386550918785e-05, "loss": 0.0077, "step": 668780 }, { "epoch": 1.73, "learning_rate": 3.9959977292816384e-05, "loss": 0.0078, "step": 668790 }, { "epoch": 1.73, "learning_rate": 3.995608907644492e-05, "loss": 0.011, "step": 668800 }, { "epoch": 1.73, "learning_rate": 3.995220086007345e-05, "loss": 0.0089, "step": 668810 }, { "epoch": 1.73, "learning_rate": 3.994831264370199e-05, "loss": 0.0067, "step": 668820 }, { "epoch": 1.73, "learning_rate": 3.994442442733053e-05, "loss": 0.0106, "step": 668830 }, { "epoch": 1.73, "learning_rate": 3.9940536210959065e-05, "loss": 0.0132, "step": 668840 }, { "epoch": 1.73, "learning_rate": 3.99366479945876e-05, "loss": 0.0074, "step": 668850 }, { "epoch": 1.73, "learning_rate": 3.9932759778216134e-05, "loss": 0.0081, "step": 668860 }, { "epoch": 1.73, "learning_rate": 3.992887156184467e-05, "loss": 0.0071, "step": 668870 }, { "epoch": 1.73, "learning_rate": 3.9924983345473204e-05, "loss": 0.008, "step": 668880 }, { "epoch": 1.73, "learning_rate": 3.992109512910174e-05, "loss": 0.0072, "step": 668890 }, { "epoch": 1.73, "learning_rate": 3.9917206912730274e-05, "loss": 0.0084, "step": 668900 }, { "epoch": 1.73, "learning_rate": 3.991331869635881e-05, "loss": 0.0081, "step": 668910 }, { "epoch": 1.73, "learning_rate": 3.990943047998735e-05, "loss": 0.0102, "step": 668920 }, { "epoch": 1.73, "learning_rate": 3.9905542263615885e-05, "loss": 0.0112, "step": 668930 }, { "epoch": 1.73, "learning_rate": 3.990165404724442e-05, "loss": 0.0096, "step": 668940 }, { "epoch": 1.73, "learning_rate": 3.9897765830872955e-05, "loss": 0.0089, "step": 668950 }, { "epoch": 1.73, "learning_rate": 3.989387761450149e-05, "loss": 0.0078, "step": 668960 }, { "epoch": 1.73, "learning_rate": 3.9889989398130025e-05, "loss": 0.0099, "step": 668970 }, { "epoch": 1.73, "learning_rate": 3.988610118175856e-05, "loss": 0.0069, "step": 668980 }, { "epoch": 1.73, "learning_rate": 3.9882212965387094e-05, "loss": 0.0089, "step": 668990 }, { "epoch": 1.73, "learning_rate": 3.9878324749015636e-05, "loss": 0.01, "step": 669000 }, { "epoch": 1.73, "eval_cer": 0.8816592975782083, "eval_loss": 0.005148761440068483, "eval_runtime": 107.7864, "eval_samples_per_second": 18.555, "eval_steps_per_second": 4.639, "step": 669000 }, { "epoch": 1.73, "learning_rate": 3.987443653264417e-05, "loss": 0.0073, "step": 669010 }, { "epoch": 1.73, "learning_rate": 3.98705483162727e-05, "loss": 0.0071, "step": 669020 }, { "epoch": 1.73, "learning_rate": 3.9866660099901234e-05, "loss": 0.0073, "step": 669030 }, { "epoch": 1.73, "learning_rate": 3.986277188352977e-05, "loss": 0.008, "step": 669040 }, { "epoch": 1.73, "learning_rate": 3.9858883667158303e-05, "loss": 0.0085, "step": 669050 }, { "epoch": 1.73, "learning_rate": 3.985499545078684e-05, "loss": 0.0091, "step": 669060 }, { "epoch": 1.73, "learning_rate": 3.985110723441537e-05, "loss": 0.0085, "step": 669070 }, { "epoch": 1.73, "learning_rate": 3.984721901804391e-05, "loss": 0.007, "step": 669080 }, { "epoch": 1.73, "learning_rate": 3.984333080167244e-05, "loss": 0.0076, "step": 669090 }, { "epoch": 1.73, "learning_rate": 3.9839442585300985e-05, "loss": 0.0071, "step": 669100 }, { "epoch": 1.73, "learning_rate": 3.983555436892952e-05, "loss": 0.0072, "step": 669110 }, { "epoch": 1.73, "learning_rate": 3.9831666152558054e-05, "loss": 0.0076, "step": 669120 }, { "epoch": 1.73, "learning_rate": 3.982777793618659e-05, "loss": 0.0064, "step": 669130 }, { "epoch": 1.73, "learning_rate": 3.9823889719815124e-05, "loss": 0.0079, "step": 669140 }, { "epoch": 1.73, "learning_rate": 3.982000150344366e-05, "loss": 0.0114, "step": 669150 }, { "epoch": 1.73, "learning_rate": 3.9816113287072194e-05, "loss": 0.0073, "step": 669160 }, { "epoch": 1.73, "learning_rate": 3.981222507070073e-05, "loss": 0.0061, "step": 669170 }, { "epoch": 1.73, "learning_rate": 3.980833685432927e-05, "loss": 0.0068, "step": 669180 }, { "epoch": 1.73, "learning_rate": 3.9804448637957805e-05, "loss": 0.0076, "step": 669190 }, { "epoch": 1.73, "learning_rate": 3.980056042158634e-05, "loss": 0.0084, "step": 669200 }, { "epoch": 1.73, "learning_rate": 3.9796672205214875e-05, "loss": 0.0047, "step": 669210 }, { "epoch": 1.73, "learning_rate": 3.979278398884341e-05, "loss": 0.0102, "step": 669220 }, { "epoch": 1.73, "learning_rate": 3.9788895772471945e-05, "loss": 0.0075, "step": 669230 }, { "epoch": 1.73, "learning_rate": 3.978500755610048e-05, "loss": 0.0073, "step": 669240 }, { "epoch": 1.73, "learning_rate": 3.9781119339729014e-05, "loss": 0.008, "step": 669250 }, { "epoch": 1.73, "learning_rate": 3.9777231123357556e-05, "loss": 0.0092, "step": 669260 }, { "epoch": 1.73, "learning_rate": 3.977334290698608e-05, "loss": 0.007, "step": 669270 }, { "epoch": 1.73, "learning_rate": 3.976945469061462e-05, "loss": 0.006, "step": 669280 }, { "epoch": 1.73, "learning_rate": 3.9765566474243154e-05, "loss": 0.0091, "step": 669290 }, { "epoch": 1.73, "learning_rate": 3.976167825787169e-05, "loss": 0.0093, "step": 669300 }, { "epoch": 1.73, "learning_rate": 3.9757790041500223e-05, "loss": 0.0072, "step": 669310 }, { "epoch": 1.73, "learning_rate": 3.975390182512876e-05, "loss": 0.0062, "step": 669320 }, { "epoch": 1.73, "learning_rate": 3.975001360875729e-05, "loss": 0.0077, "step": 669330 }, { "epoch": 1.74, "learning_rate": 3.974612539238583e-05, "loss": 0.0064, "step": 669340 }, { "epoch": 1.74, "learning_rate": 3.974223717601436e-05, "loss": 0.008, "step": 669350 }, { "epoch": 1.74, "learning_rate": 3.9738348959642905e-05, "loss": 0.0086, "step": 669360 }, { "epoch": 1.74, "learning_rate": 3.973446074327144e-05, "loss": 0.0061, "step": 669370 }, { "epoch": 1.74, "learning_rate": 3.9730572526899974e-05, "loss": 0.009, "step": 669380 }, { "epoch": 1.74, "learning_rate": 3.972668431052851e-05, "loss": 0.0072, "step": 669390 }, { "epoch": 1.74, "learning_rate": 3.9722796094157044e-05, "loss": 0.008, "step": 669400 }, { "epoch": 1.74, "learning_rate": 3.971890787778558e-05, "loss": 0.0098, "step": 669410 }, { "epoch": 1.74, "learning_rate": 3.9715019661414114e-05, "loss": 0.0057, "step": 669420 }, { "epoch": 1.74, "learning_rate": 3.971113144504265e-05, "loss": 0.0095, "step": 669430 }, { "epoch": 1.74, "learning_rate": 3.970724322867119e-05, "loss": 0.0076, "step": 669440 }, { "epoch": 1.74, "learning_rate": 3.9703355012299725e-05, "loss": 0.0061, "step": 669450 }, { "epoch": 1.74, "learning_rate": 3.969946679592826e-05, "loss": 0.0094, "step": 669460 }, { "epoch": 1.74, "learning_rate": 3.9695578579556795e-05, "loss": 0.0082, "step": 669470 }, { "epoch": 1.74, "learning_rate": 3.969169036318533e-05, "loss": 0.0184, "step": 669480 }, { "epoch": 1.74, "learning_rate": 3.9687802146813865e-05, "loss": 0.0087, "step": 669490 }, { "epoch": 1.74, "learning_rate": 3.96839139304424e-05, "loss": 0.0088, "step": 669500 }, { "epoch": 1.74, "learning_rate": 3.9680025714070934e-05, "loss": 0.0099, "step": 669510 }, { "epoch": 1.74, "learning_rate": 3.967613749769946e-05, "loss": 0.0078, "step": 669520 }, { "epoch": 1.74, "learning_rate": 3.9672249281328e-05, "loss": 0.0082, "step": 669530 }, { "epoch": 1.74, "learning_rate": 3.966836106495654e-05, "loss": 0.0072, "step": 669540 }, { "epoch": 1.74, "learning_rate": 3.9664472848585074e-05, "loss": 0.0073, "step": 669550 }, { "epoch": 1.74, "learning_rate": 3.966058463221361e-05, "loss": 0.0114, "step": 669560 }, { "epoch": 1.74, "learning_rate": 3.9656696415842143e-05, "loss": 0.0092, "step": 669570 }, { "epoch": 1.74, "learning_rate": 3.965280819947068e-05, "loss": 0.0062, "step": 669580 }, { "epoch": 1.74, "learning_rate": 3.964891998309921e-05, "loss": 0.0078, "step": 669590 }, { "epoch": 1.74, "learning_rate": 3.964503176672775e-05, "loss": 0.0111, "step": 669600 }, { "epoch": 1.74, "learning_rate": 3.964114355035628e-05, "loss": 0.0107, "step": 669610 }, { "epoch": 1.74, "learning_rate": 3.9637255333984824e-05, "loss": 0.0092, "step": 669620 }, { "epoch": 1.74, "learning_rate": 3.963336711761336e-05, "loss": 0.0097, "step": 669630 }, { "epoch": 1.74, "learning_rate": 3.9629478901241894e-05, "loss": 0.0079, "step": 669640 }, { "epoch": 1.74, "learning_rate": 3.962559068487043e-05, "loss": 0.008, "step": 669650 }, { "epoch": 1.74, "learning_rate": 3.9621702468498964e-05, "loss": 0.0114, "step": 669660 }, { "epoch": 1.74, "learning_rate": 3.96178142521275e-05, "loss": 0.0119, "step": 669670 }, { "epoch": 1.74, "learning_rate": 3.9613926035756034e-05, "loss": 0.0093, "step": 669680 }, { "epoch": 1.74, "learning_rate": 3.961003781938457e-05, "loss": 0.0077, "step": 669690 }, { "epoch": 1.74, "learning_rate": 3.960614960301311e-05, "loss": 0.0061, "step": 669700 }, { "epoch": 1.74, "learning_rate": 3.9602261386641645e-05, "loss": 0.0081, "step": 669710 }, { "epoch": 1.74, "learning_rate": 3.959837317027018e-05, "loss": 0.007, "step": 669720 }, { "epoch": 1.74, "learning_rate": 3.9594484953898715e-05, "loss": 0.0048, "step": 669730 }, { "epoch": 1.74, "learning_rate": 3.959059673752725e-05, "loss": 0.0077, "step": 669740 }, { "epoch": 1.74, "learning_rate": 3.9586708521155784e-05, "loss": 0.0098, "step": 669750 }, { "epoch": 1.74, "learning_rate": 3.958282030478432e-05, "loss": 0.0081, "step": 669760 }, { "epoch": 1.74, "learning_rate": 3.957893208841285e-05, "loss": 0.0076, "step": 669770 }, { "epoch": 1.74, "learning_rate": 3.957504387204138e-05, "loss": 0.0081, "step": 669780 }, { "epoch": 1.74, "learning_rate": 3.957115565566992e-05, "loss": 0.0056, "step": 669790 }, { "epoch": 1.74, "learning_rate": 3.956726743929846e-05, "loss": 0.0087, "step": 669800 }, { "epoch": 1.74, "learning_rate": 3.9563379222926994e-05, "loss": 0.008, "step": 669810 }, { "epoch": 1.74, "learning_rate": 3.955949100655553e-05, "loss": 0.0087, "step": 669820 }, { "epoch": 1.74, "learning_rate": 3.955560279018406e-05, "loss": 0.0071, "step": 669830 }, { "epoch": 1.74, "learning_rate": 3.95517145738126e-05, "loss": 0.0173, "step": 669840 }, { "epoch": 1.74, "learning_rate": 3.954782635744113e-05, "loss": 0.0066, "step": 669850 }, { "epoch": 1.74, "learning_rate": 3.954393814106967e-05, "loss": 0.0083, "step": 669860 }, { "epoch": 1.74, "learning_rate": 3.95400499246982e-05, "loss": 0.0066, "step": 669870 }, { "epoch": 1.74, "learning_rate": 3.9536161708326744e-05, "loss": 0.0098, "step": 669880 }, { "epoch": 1.74, "learning_rate": 3.953227349195528e-05, "loss": 0.0087, "step": 669890 }, { "epoch": 1.74, "learning_rate": 3.9528385275583814e-05, "loss": 0.0057, "step": 669900 }, { "epoch": 1.74, "learning_rate": 3.952449705921235e-05, "loss": 0.0088, "step": 669910 }, { "epoch": 1.74, "learning_rate": 3.9520608842840884e-05, "loss": 0.0111, "step": 669920 }, { "epoch": 1.74, "learning_rate": 3.951672062646942e-05, "loss": 0.0072, "step": 669930 }, { "epoch": 1.74, "learning_rate": 3.9512832410097954e-05, "loss": 0.007, "step": 669940 }, { "epoch": 1.74, "learning_rate": 3.950894419372649e-05, "loss": 0.0119, "step": 669950 }, { "epoch": 1.74, "learning_rate": 3.950505597735503e-05, "loss": 0.0062, "step": 669960 }, { "epoch": 1.74, "learning_rate": 3.9501167760983565e-05, "loss": 0.0096, "step": 669970 }, { "epoch": 1.74, "learning_rate": 3.94972795446121e-05, "loss": 0.0061, "step": 669980 }, { "epoch": 1.74, "learning_rate": 3.9493391328240635e-05, "loss": 0.0078, "step": 669990 }, { "epoch": 1.74, "learning_rate": 3.948950311186917e-05, "loss": 0.0099, "step": 670000 }, { "epoch": 1.74, "eval_cer": 0.8816634964890108, "eval_loss": 0.005133858881890774, "eval_runtime": 107.9299, "eval_samples_per_second": 18.531, "eval_steps_per_second": 4.633, "step": 670000 }, { "epoch": 1.74, "learning_rate": 3.9485614895497704e-05, "loss": 0.0056, "step": 670010 }, { "epoch": 1.74, "learning_rate": 3.948172667912623e-05, "loss": 0.0103, "step": 670020 }, { "epoch": 1.74, "learning_rate": 3.947783846275477e-05, "loss": 0.0142, "step": 670030 }, { "epoch": 1.74, "learning_rate": 3.94739502463833e-05, "loss": 0.0069, "step": 670040 }, { "epoch": 1.74, "learning_rate": 3.947006203001184e-05, "loss": 0.0089, "step": 670050 }, { "epoch": 1.74, "learning_rate": 3.946617381364038e-05, "loss": 0.0086, "step": 670060 }, { "epoch": 1.74, "learning_rate": 3.9462285597268914e-05, "loss": 0.0107, "step": 670070 }, { "epoch": 1.74, "learning_rate": 3.945839738089745e-05, "loss": 0.0117, "step": 670080 }, { "epoch": 1.74, "learning_rate": 3.945450916452598e-05, "loss": 0.007, "step": 670090 }, { "epoch": 1.74, "learning_rate": 3.945062094815452e-05, "loss": 0.0081, "step": 670100 }, { "epoch": 1.74, "learning_rate": 3.944673273178305e-05, "loss": 0.007, "step": 670110 }, { "epoch": 1.74, "learning_rate": 3.944284451541159e-05, "loss": 0.0073, "step": 670120 }, { "epoch": 1.74, "learning_rate": 3.943895629904012e-05, "loss": 0.0079, "step": 670130 }, { "epoch": 1.74, "learning_rate": 3.9435068082668664e-05, "loss": 0.007, "step": 670140 }, { "epoch": 1.74, "learning_rate": 3.94311798662972e-05, "loss": 0.0072, "step": 670150 }, { "epoch": 1.74, "learning_rate": 3.9427291649925734e-05, "loss": 0.008, "step": 670160 }, { "epoch": 1.74, "learning_rate": 3.942340343355427e-05, "loss": 0.0085, "step": 670170 }, { "epoch": 1.74, "learning_rate": 3.9419515217182804e-05, "loss": 0.0069, "step": 670180 }, { "epoch": 1.74, "learning_rate": 3.941562700081134e-05, "loss": 0.0118, "step": 670190 }, { "epoch": 1.74, "learning_rate": 3.9411738784439874e-05, "loss": 0.008, "step": 670200 }, { "epoch": 1.74, "learning_rate": 3.940785056806841e-05, "loss": 0.0079, "step": 670210 }, { "epoch": 1.74, "learning_rate": 3.940396235169694e-05, "loss": 0.0098, "step": 670220 }, { "epoch": 1.74, "learning_rate": 3.9400074135325485e-05, "loss": 0.0074, "step": 670230 }, { "epoch": 1.74, "learning_rate": 3.939618591895402e-05, "loss": 0.0085, "step": 670240 }, { "epoch": 1.74, "learning_rate": 3.9392297702582555e-05, "loss": 0.0081, "step": 670250 }, { "epoch": 1.74, "learning_rate": 3.938840948621109e-05, "loss": 0.0068, "step": 670260 }, { "epoch": 1.74, "learning_rate": 3.938452126983962e-05, "loss": 0.006, "step": 670270 }, { "epoch": 1.74, "learning_rate": 3.938063305346815e-05, "loss": 0.0066, "step": 670280 }, { "epoch": 1.74, "learning_rate": 3.937674483709669e-05, "loss": 0.0068, "step": 670290 }, { "epoch": 1.74, "learning_rate": 3.937285662072522e-05, "loss": 0.008, "step": 670300 }, { "epoch": 1.74, "learning_rate": 3.936896840435376e-05, "loss": 0.0096, "step": 670310 }, { "epoch": 1.74, "learning_rate": 3.936508018798229e-05, "loss": 0.0084, "step": 670320 }, { "epoch": 1.74, "learning_rate": 3.9361191971610834e-05, "loss": 0.0068, "step": 670330 }, { "epoch": 1.74, "learning_rate": 3.935730375523937e-05, "loss": 0.0067, "step": 670340 }, { "epoch": 1.74, "learning_rate": 3.93534155388679e-05, "loss": 0.0064, "step": 670350 }, { "epoch": 1.74, "learning_rate": 3.934952732249644e-05, "loss": 0.0077, "step": 670360 }, { "epoch": 1.74, "learning_rate": 3.934563910612497e-05, "loss": 0.006, "step": 670370 }, { "epoch": 1.74, "learning_rate": 3.934175088975351e-05, "loss": 0.0075, "step": 670380 }, { "epoch": 1.74, "learning_rate": 3.933786267338204e-05, "loss": 0.0084, "step": 670390 }, { "epoch": 1.74, "learning_rate": 3.933397445701058e-05, "loss": 0.0076, "step": 670400 }, { "epoch": 1.74, "learning_rate": 3.933008624063912e-05, "loss": 0.0084, "step": 670410 }, { "epoch": 1.74, "learning_rate": 3.9326198024267654e-05, "loss": 0.0076, "step": 670420 }, { "epoch": 1.74, "learning_rate": 3.932230980789619e-05, "loss": 0.0054, "step": 670430 }, { "epoch": 1.74, "learning_rate": 3.9318421591524724e-05, "loss": 0.0057, "step": 670440 }, { "epoch": 1.74, "learning_rate": 3.931453337515326e-05, "loss": 0.0083, "step": 670450 }, { "epoch": 1.74, "learning_rate": 3.9310645158781794e-05, "loss": 0.0099, "step": 670460 }, { "epoch": 1.74, "learning_rate": 3.930675694241033e-05, "loss": 0.006, "step": 670470 }, { "epoch": 1.74, "learning_rate": 3.930286872603886e-05, "loss": 0.0067, "step": 670480 }, { "epoch": 1.74, "learning_rate": 3.9298980509667405e-05, "loss": 0.0079, "step": 670490 }, { "epoch": 1.74, "learning_rate": 3.929509229329594e-05, "loss": 0.0087, "step": 670500 }, { "epoch": 1.74, "learning_rate": 3.929120407692447e-05, "loss": 0.006, "step": 670510 }, { "epoch": 1.74, "learning_rate": 3.9287315860553e-05, "loss": 0.0081, "step": 670520 }, { "epoch": 1.74, "learning_rate": 3.928342764418154e-05, "loss": 0.007, "step": 670530 }, { "epoch": 1.74, "learning_rate": 3.927953942781007e-05, "loss": 0.0107, "step": 670540 }, { "epoch": 1.74, "learning_rate": 3.927565121143861e-05, "loss": 0.0075, "step": 670550 }, { "epoch": 1.74, "learning_rate": 3.927176299506714e-05, "loss": 0.007, "step": 670560 }, { "epoch": 1.74, "learning_rate": 3.926787477869568e-05, "loss": 0.0078, "step": 670570 }, { "epoch": 1.74, "learning_rate": 3.926398656232421e-05, "loss": 0.0064, "step": 670580 }, { "epoch": 1.74, "learning_rate": 3.9260098345952753e-05, "loss": 0.0101, "step": 670590 }, { "epoch": 1.74, "learning_rate": 3.925621012958129e-05, "loss": 0.007, "step": 670600 }, { "epoch": 1.74, "learning_rate": 3.925232191320982e-05, "loss": 0.0079, "step": 670610 }, { "epoch": 1.74, "learning_rate": 3.924843369683836e-05, "loss": 0.0083, "step": 670620 }, { "epoch": 1.74, "learning_rate": 3.924454548046689e-05, "loss": 0.0084, "step": 670630 }, { "epoch": 1.74, "learning_rate": 3.924065726409543e-05, "loss": 0.0075, "step": 670640 }, { "epoch": 1.74, "learning_rate": 3.923676904772396e-05, "loss": 0.0093, "step": 670650 }, { "epoch": 1.74, "learning_rate": 3.92328808313525e-05, "loss": 0.0073, "step": 670660 }, { "epoch": 1.74, "learning_rate": 3.922899261498104e-05, "loss": 0.0092, "step": 670670 }, { "epoch": 1.74, "learning_rate": 3.9225104398609574e-05, "loss": 0.0065, "step": 670680 }, { "epoch": 1.74, "learning_rate": 3.922121618223811e-05, "loss": 0.0066, "step": 670690 }, { "epoch": 1.74, "learning_rate": 3.9217327965866644e-05, "loss": 0.0061, "step": 670700 }, { "epoch": 1.74, "learning_rate": 3.921343974949518e-05, "loss": 0.0088, "step": 670710 }, { "epoch": 1.74, "learning_rate": 3.9209551533123713e-05, "loss": 0.0097, "step": 670720 }, { "epoch": 1.74, "learning_rate": 3.920566331675225e-05, "loss": 0.0065, "step": 670730 }, { "epoch": 1.74, "learning_rate": 3.920177510038078e-05, "loss": 0.0083, "step": 670740 }, { "epoch": 1.74, "learning_rate": 3.9197886884009325e-05, "loss": 0.0067, "step": 670750 }, { "epoch": 1.74, "learning_rate": 3.9193998667637846e-05, "loss": 0.0067, "step": 670760 }, { "epoch": 1.74, "learning_rate": 3.919011045126639e-05, "loss": 0.0103, "step": 670770 }, { "epoch": 1.74, "learning_rate": 3.918622223489492e-05, "loss": 0.0085, "step": 670780 }, { "epoch": 1.74, "learning_rate": 3.918233401852346e-05, "loss": 0.0083, "step": 670790 }, { "epoch": 1.74, "learning_rate": 3.917844580215199e-05, "loss": 0.006, "step": 670800 }, { "epoch": 1.74, "learning_rate": 3.917455758578053e-05, "loss": 0.0061, "step": 670810 }, { "epoch": 1.74, "learning_rate": 3.917066936940906e-05, "loss": 0.0084, "step": 670820 }, { "epoch": 1.74, "learning_rate": 3.91667811530376e-05, "loss": 0.0077, "step": 670830 }, { "epoch": 1.74, "learning_rate": 3.916289293666613e-05, "loss": 0.006, "step": 670840 }, { "epoch": 1.74, "learning_rate": 3.9159004720294673e-05, "loss": 0.006, "step": 670850 }, { "epoch": 1.74, "learning_rate": 3.915511650392321e-05, "loss": 0.0062, "step": 670860 }, { "epoch": 1.74, "learning_rate": 3.915122828755174e-05, "loss": 0.0074, "step": 670870 }, { "epoch": 1.74, "learning_rate": 3.914734007118028e-05, "loss": 0.0074, "step": 670880 }, { "epoch": 1.74, "learning_rate": 3.914345185480881e-05, "loss": 0.0095, "step": 670890 }, { "epoch": 1.74, "learning_rate": 3.913956363843735e-05, "loss": 0.006, "step": 670900 }, { "epoch": 1.74, "learning_rate": 3.913567542206588e-05, "loss": 0.0055, "step": 670910 }, { "epoch": 1.74, "learning_rate": 3.913178720569442e-05, "loss": 0.0085, "step": 670920 }, { "epoch": 1.74, "learning_rate": 3.912789898932296e-05, "loss": 0.0088, "step": 670930 }, { "epoch": 1.74, "learning_rate": 3.9124010772951494e-05, "loss": 0.0117, "step": 670940 }, { "epoch": 1.74, "learning_rate": 3.912012255658003e-05, "loss": 0.0078, "step": 670950 }, { "epoch": 1.74, "learning_rate": 3.9116234340208564e-05, "loss": 0.0097, "step": 670960 }, { "epoch": 1.74, "learning_rate": 3.91123461238371e-05, "loss": 0.0067, "step": 670970 }, { "epoch": 1.74, "learning_rate": 3.9108457907465633e-05, "loss": 0.0073, "step": 670980 }, { "epoch": 1.74, "learning_rate": 3.910456969109417e-05, "loss": 0.0103, "step": 670990 }, { "epoch": 1.74, "learning_rate": 3.91006814747227e-05, "loss": 0.0069, "step": 671000 }, { "epoch": 1.74, "eval_cer": 0.8816662957628791, "eval_loss": 0.005163580644875765, "eval_runtime": 107.8528, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 671000 }, { "epoch": 1.74, "learning_rate": 3.909679325835123e-05, "loss": 0.0099, "step": 671010 }, { "epoch": 1.74, "learning_rate": 3.9092905041979766e-05, "loss": 0.007, "step": 671020 }, { "epoch": 1.74, "learning_rate": 3.908901682560831e-05, "loss": 0.0075, "step": 671030 }, { "epoch": 1.74, "learning_rate": 3.908512860923684e-05, "loss": 0.0086, "step": 671040 }, { "epoch": 1.74, "learning_rate": 3.908124039286538e-05, "loss": 0.0076, "step": 671050 }, { "epoch": 1.74, "learning_rate": 3.907735217649391e-05, "loss": 0.0082, "step": 671060 }, { "epoch": 1.74, "learning_rate": 3.907346396012245e-05, "loss": 0.0084, "step": 671070 }, { "epoch": 1.74, "learning_rate": 3.906957574375098e-05, "loss": 0.0098, "step": 671080 }, { "epoch": 1.74, "learning_rate": 3.906568752737952e-05, "loss": 0.0157, "step": 671090 }, { "epoch": 1.74, "learning_rate": 3.906179931100805e-05, "loss": 0.0093, "step": 671100 }, { "epoch": 1.74, "learning_rate": 3.905791109463659e-05, "loss": 0.0092, "step": 671110 }, { "epoch": 1.74, "learning_rate": 3.905402287826513e-05, "loss": 0.0094, "step": 671120 }, { "epoch": 1.74, "learning_rate": 3.905013466189366e-05, "loss": 0.0082, "step": 671130 }, { "epoch": 1.74, "learning_rate": 3.90462464455222e-05, "loss": 0.0063, "step": 671140 }, { "epoch": 1.74, "learning_rate": 3.904235822915073e-05, "loss": 0.0079, "step": 671150 }, { "epoch": 1.74, "learning_rate": 3.903847001277927e-05, "loss": 0.0088, "step": 671160 }, { "epoch": 1.74, "learning_rate": 3.90345817964078e-05, "loss": 0.0092, "step": 671170 }, { "epoch": 1.74, "learning_rate": 3.903069358003634e-05, "loss": 0.0077, "step": 671180 }, { "epoch": 1.74, "learning_rate": 3.902680536366488e-05, "loss": 0.0092, "step": 671190 }, { "epoch": 1.74, "learning_rate": 3.9022917147293414e-05, "loss": 0.0075, "step": 671200 }, { "epoch": 1.74, "learning_rate": 3.901902893092195e-05, "loss": 0.0075, "step": 671210 }, { "epoch": 1.74, "learning_rate": 3.9015140714550484e-05, "loss": 0.007, "step": 671220 }, { "epoch": 1.74, "learning_rate": 3.901125249817902e-05, "loss": 0.0096, "step": 671230 }, { "epoch": 1.74, "learning_rate": 3.900736428180755e-05, "loss": 0.0086, "step": 671240 }, { "epoch": 1.74, "learning_rate": 3.900347606543609e-05, "loss": 0.0084, "step": 671250 }, { "epoch": 1.74, "learning_rate": 3.8999587849064616e-05, "loss": 0.0078, "step": 671260 }, { "epoch": 1.74, "learning_rate": 3.899569963269315e-05, "loss": 0.0109, "step": 671270 }, { "epoch": 1.74, "learning_rate": 3.8991811416321686e-05, "loss": 0.0104, "step": 671280 }, { "epoch": 1.74, "learning_rate": 3.898792319995023e-05, "loss": 0.0081, "step": 671290 }, { "epoch": 1.74, "learning_rate": 3.898403498357876e-05, "loss": 0.0066, "step": 671300 }, { "epoch": 1.74, "learning_rate": 3.89801467672073e-05, "loss": 0.0097, "step": 671310 }, { "epoch": 1.74, "learning_rate": 3.897625855083583e-05, "loss": 0.0083, "step": 671320 }, { "epoch": 1.74, "learning_rate": 3.897237033446437e-05, "loss": 0.0065, "step": 671330 }, { "epoch": 1.74, "learning_rate": 3.89684821180929e-05, "loss": 0.0073, "step": 671340 }, { "epoch": 1.74, "learning_rate": 3.896459390172144e-05, "loss": 0.0056, "step": 671350 }, { "epoch": 1.74, "learning_rate": 3.896070568534997e-05, "loss": 0.0062, "step": 671360 }, { "epoch": 1.74, "learning_rate": 3.895681746897851e-05, "loss": 0.0091, "step": 671370 }, { "epoch": 1.74, "learning_rate": 3.895292925260705e-05, "loss": 0.0068, "step": 671380 }, { "epoch": 1.74, "learning_rate": 3.894904103623558e-05, "loss": 0.0072, "step": 671390 }, { "epoch": 1.74, "learning_rate": 3.894515281986412e-05, "loss": 0.0065, "step": 671400 }, { "epoch": 1.74, "learning_rate": 3.894126460349265e-05, "loss": 0.0081, "step": 671410 }, { "epoch": 1.74, "learning_rate": 3.893737638712119e-05, "loss": 0.0058, "step": 671420 }, { "epoch": 1.74, "learning_rate": 3.893348817074972e-05, "loss": 0.0061, "step": 671430 }, { "epoch": 1.74, "learning_rate": 3.892959995437826e-05, "loss": 0.0064, "step": 671440 }, { "epoch": 1.74, "learning_rate": 3.89257117380068e-05, "loss": 0.0069, "step": 671450 }, { "epoch": 1.74, "learning_rate": 3.8921823521635334e-05, "loss": 0.0083, "step": 671460 }, { "epoch": 1.74, "learning_rate": 3.891793530526387e-05, "loss": 0.0071, "step": 671470 }, { "epoch": 1.74, "learning_rate": 3.8914047088892404e-05, "loss": 0.0101, "step": 671480 }, { "epoch": 1.74, "learning_rate": 3.891015887252094e-05, "loss": 0.0086, "step": 671490 }, { "epoch": 1.74, "learning_rate": 3.890627065614947e-05, "loss": 0.0069, "step": 671500 }, { "epoch": 1.74, "learning_rate": 3.8902382439778e-05, "loss": 0.0083, "step": 671510 }, { "epoch": 1.74, "learning_rate": 3.8898494223406536e-05, "loss": 0.0068, "step": 671520 }, { "epoch": 1.74, "learning_rate": 3.889460600703507e-05, "loss": 0.0102, "step": 671530 }, { "epoch": 1.74, "learning_rate": 3.8890717790663606e-05, "loss": 0.0114, "step": 671540 }, { "epoch": 1.74, "learning_rate": 3.888682957429215e-05, "loss": 0.007, "step": 671550 }, { "epoch": 1.74, "learning_rate": 3.888294135792068e-05, "loss": 0.0077, "step": 671560 }, { "epoch": 1.74, "learning_rate": 3.887905314154922e-05, "loss": 0.0078, "step": 671570 }, { "epoch": 1.74, "learning_rate": 3.887516492517775e-05, "loss": 0.0095, "step": 671580 }, { "epoch": 1.74, "learning_rate": 3.887127670880629e-05, "loss": 0.0124, "step": 671590 }, { "epoch": 1.74, "learning_rate": 3.886738849243482e-05, "loss": 0.0076, "step": 671600 }, { "epoch": 1.74, "learning_rate": 3.886350027606336e-05, "loss": 0.0064, "step": 671610 }, { "epoch": 1.74, "learning_rate": 3.885961205969189e-05, "loss": 0.0073, "step": 671620 }, { "epoch": 1.74, "learning_rate": 3.8855723843320427e-05, "loss": 0.0057, "step": 671630 }, { "epoch": 1.74, "learning_rate": 3.885183562694897e-05, "loss": 0.0067, "step": 671640 }, { "epoch": 1.74, "learning_rate": 3.88479474105775e-05, "loss": 0.0075, "step": 671650 }, { "epoch": 1.74, "learning_rate": 3.884405919420604e-05, "loss": 0.0074, "step": 671660 }, { "epoch": 1.74, "learning_rate": 3.884017097783457e-05, "loss": 0.0094, "step": 671670 }, { "epoch": 1.74, "learning_rate": 3.883628276146311e-05, "loss": 0.0082, "step": 671680 }, { "epoch": 1.74, "learning_rate": 3.883239454509164e-05, "loss": 0.0118, "step": 671690 }, { "epoch": 1.74, "learning_rate": 3.882850632872018e-05, "loss": 0.0062, "step": 671700 }, { "epoch": 1.74, "learning_rate": 3.882461811234871e-05, "loss": 0.0065, "step": 671710 }, { "epoch": 1.74, "learning_rate": 3.8820729895977254e-05, "loss": 0.0064, "step": 671720 }, { "epoch": 1.74, "learning_rate": 3.881684167960579e-05, "loss": 0.0066, "step": 671730 }, { "epoch": 1.74, "learning_rate": 3.8812953463234324e-05, "loss": 0.0071, "step": 671740 }, { "epoch": 1.74, "learning_rate": 3.880906524686285e-05, "loss": 0.0071, "step": 671750 }, { "epoch": 1.74, "learning_rate": 3.8805177030491386e-05, "loss": 0.0059, "step": 671760 }, { "epoch": 1.74, "learning_rate": 3.880128881411992e-05, "loss": 0.0069, "step": 671770 }, { "epoch": 1.74, "learning_rate": 3.8797400597748456e-05, "loss": 0.0085, "step": 671780 }, { "epoch": 1.74, "learning_rate": 3.879351238137699e-05, "loss": 0.0076, "step": 671790 }, { "epoch": 1.74, "learning_rate": 3.8789624165005526e-05, "loss": 0.0076, "step": 671800 }, { "epoch": 1.74, "learning_rate": 3.878573594863406e-05, "loss": 0.0102, "step": 671810 }, { "epoch": 1.74, "learning_rate": 3.87818477322626e-05, "loss": 0.0079, "step": 671820 }, { "epoch": 1.74, "learning_rate": 3.877795951589114e-05, "loss": 0.0073, "step": 671830 }, { "epoch": 1.74, "learning_rate": 3.877407129951967e-05, "loss": 0.0055, "step": 671840 }, { "epoch": 1.74, "learning_rate": 3.877018308314821e-05, "loss": 0.0058, "step": 671850 }, { "epoch": 1.74, "learning_rate": 3.876629486677674e-05, "loss": 0.0074, "step": 671860 }, { "epoch": 1.74, "learning_rate": 3.876240665040528e-05, "loss": 0.0078, "step": 671870 }, { "epoch": 1.74, "learning_rate": 3.875851843403381e-05, "loss": 0.0056, "step": 671880 }, { "epoch": 1.74, "learning_rate": 3.8754630217662346e-05, "loss": 0.0065, "step": 671890 }, { "epoch": 1.74, "learning_rate": 3.875074200129089e-05, "loss": 0.0093, "step": 671900 }, { "epoch": 1.74, "learning_rate": 3.874685378491942e-05, "loss": 0.0069, "step": 671910 }, { "epoch": 1.74, "learning_rate": 3.874296556854796e-05, "loss": 0.008, "step": 671920 }, { "epoch": 1.74, "learning_rate": 3.873907735217649e-05, "loss": 0.0091, "step": 671930 }, { "epoch": 1.74, "learning_rate": 3.873518913580503e-05, "loss": 0.0084, "step": 671940 }, { "epoch": 1.74, "learning_rate": 3.873130091943356e-05, "loss": 0.0098, "step": 671950 }, { "epoch": 1.74, "learning_rate": 3.87274127030621e-05, "loss": 0.0065, "step": 671960 }, { "epoch": 1.74, "learning_rate": 3.872352448669063e-05, "loss": 0.009, "step": 671970 }, { "epoch": 1.74, "learning_rate": 3.8719636270319174e-05, "loss": 0.0073, "step": 671980 }, { "epoch": 1.74, "learning_rate": 3.871574805394771e-05, "loss": 0.0052, "step": 671990 }, { "epoch": 1.74, "learning_rate": 3.871185983757624e-05, "loss": 0.008, "step": 672000 }, { "epoch": 1.74, "eval_cer": 0.8816508997566032, "eval_loss": 0.00507059833034873, "eval_runtime": 107.8496, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 672000 }, { "epoch": 1.74, "learning_rate": 3.870797162120477e-05, "loss": 0.01, "step": 672010 }, { "epoch": 1.74, "learning_rate": 3.8704083404833306e-05, "loss": 0.0073, "step": 672020 }, { "epoch": 1.74, "learning_rate": 3.870019518846184e-05, "loss": 0.0084, "step": 672030 }, { "epoch": 1.74, "learning_rate": 3.8696306972090376e-05, "loss": 0.0082, "step": 672040 }, { "epoch": 1.74, "learning_rate": 3.869241875571891e-05, "loss": 0.0114, "step": 672050 }, { "epoch": 1.74, "learning_rate": 3.8688530539347446e-05, "loss": 0.0093, "step": 672060 }, { "epoch": 1.74, "learning_rate": 3.868464232297598e-05, "loss": 0.0082, "step": 672070 }, { "epoch": 1.74, "learning_rate": 3.868075410660452e-05, "loss": 0.0097, "step": 672080 }, { "epoch": 1.74, "learning_rate": 3.867686589023306e-05, "loss": 0.0088, "step": 672090 }, { "epoch": 1.74, "learning_rate": 3.867297767386159e-05, "loss": 0.0108, "step": 672100 }, { "epoch": 1.74, "learning_rate": 3.866908945749013e-05, "loss": 0.0081, "step": 672110 }, { "epoch": 1.74, "learning_rate": 3.866520124111866e-05, "loss": 0.0071, "step": 672120 }, { "epoch": 1.74, "learning_rate": 3.86613130247472e-05, "loss": 0.0078, "step": 672130 }, { "epoch": 1.74, "learning_rate": 3.865742480837573e-05, "loss": 0.0068, "step": 672140 }, { "epoch": 1.74, "learning_rate": 3.8653536592004266e-05, "loss": 0.0081, "step": 672150 }, { "epoch": 1.74, "learning_rate": 3.864964837563281e-05, "loss": 0.0085, "step": 672160 }, { "epoch": 1.74, "learning_rate": 3.864576015926134e-05, "loss": 0.01, "step": 672170 }, { "epoch": 1.74, "learning_rate": 3.864187194288988e-05, "loss": 0.0081, "step": 672180 }, { "epoch": 1.74, "learning_rate": 3.863798372651841e-05, "loss": 0.0069, "step": 672190 }, { "epoch": 1.74, "learning_rate": 3.863409551014695e-05, "loss": 0.0081, "step": 672200 }, { "epoch": 1.74, "learning_rate": 3.863020729377548e-05, "loss": 0.0086, "step": 672210 }, { "epoch": 1.74, "learning_rate": 3.862631907740402e-05, "loss": 0.0101, "step": 672220 }, { "epoch": 1.74, "learning_rate": 3.862243086103255e-05, "loss": 0.0099, "step": 672230 }, { "epoch": 1.74, "learning_rate": 3.8618542644661094e-05, "loss": 0.0079, "step": 672240 }, { "epoch": 1.74, "learning_rate": 3.8614654428289615e-05, "loss": 0.0054, "step": 672250 }, { "epoch": 1.74, "learning_rate": 3.861076621191816e-05, "loss": 0.0095, "step": 672260 }, { "epoch": 1.74, "learning_rate": 3.860687799554669e-05, "loss": 0.0058, "step": 672270 }, { "epoch": 1.74, "learning_rate": 3.8602989779175226e-05, "loss": 0.01, "step": 672280 }, { "epoch": 1.74, "learning_rate": 3.859910156280376e-05, "loss": 0.0062, "step": 672290 }, { "epoch": 1.74, "learning_rate": 3.8595213346432296e-05, "loss": 0.0065, "step": 672300 }, { "epoch": 1.74, "learning_rate": 3.859132513006083e-05, "loss": 0.0119, "step": 672310 }, { "epoch": 1.74, "learning_rate": 3.8587436913689366e-05, "loss": 0.006, "step": 672320 }, { "epoch": 1.74, "learning_rate": 3.85835486973179e-05, "loss": 0.0091, "step": 672330 }, { "epoch": 1.74, "learning_rate": 3.857966048094644e-05, "loss": 0.0073, "step": 672340 }, { "epoch": 1.74, "learning_rate": 3.857577226457498e-05, "loss": 0.007, "step": 672350 }, { "epoch": 1.74, "learning_rate": 3.857188404820351e-05, "loss": 0.0094, "step": 672360 }, { "epoch": 1.74, "learning_rate": 3.856799583183205e-05, "loss": 0.0065, "step": 672370 }, { "epoch": 1.74, "learning_rate": 3.856410761546058e-05, "loss": 0.0083, "step": 672380 }, { "epoch": 1.74, "learning_rate": 3.856021939908912e-05, "loss": 0.0088, "step": 672390 }, { "epoch": 1.74, "learning_rate": 3.855633118271765e-05, "loss": 0.0136, "step": 672400 }, { "epoch": 1.74, "learning_rate": 3.8552442966346186e-05, "loss": 0.0099, "step": 672410 }, { "epoch": 1.74, "learning_rate": 3.854855474997473e-05, "loss": 0.0157, "step": 672420 }, { "epoch": 1.74, "learning_rate": 3.854466653360326e-05, "loss": 0.0082, "step": 672430 }, { "epoch": 1.74, "learning_rate": 3.85407783172318e-05, "loss": 0.007, "step": 672440 }, { "epoch": 1.74, "learning_rate": 3.853689010086033e-05, "loss": 0.0067, "step": 672450 }, { "epoch": 1.74, "learning_rate": 3.853300188448887e-05, "loss": 0.013, "step": 672460 }, { "epoch": 1.74, "learning_rate": 3.85291136681174e-05, "loss": 0.0075, "step": 672470 }, { "epoch": 1.74, "learning_rate": 3.852522545174594e-05, "loss": 0.0093, "step": 672480 }, { "epoch": 1.74, "learning_rate": 3.852133723537447e-05, "loss": 0.0096, "step": 672490 }, { "epoch": 1.74, "learning_rate": 3.8517449019003e-05, "loss": 0.0073, "step": 672500 }, { "epoch": 1.74, "learning_rate": 3.8513560802631535e-05, "loss": 0.0065, "step": 672510 }, { "epoch": 1.74, "learning_rate": 3.850967258626008e-05, "loss": 0.0089, "step": 672520 }, { "epoch": 1.74, "learning_rate": 3.850578436988861e-05, "loss": 0.0097, "step": 672530 }, { "epoch": 1.74, "learning_rate": 3.8501896153517146e-05, "loss": 0.0111, "step": 672540 }, { "epoch": 1.74, "learning_rate": 3.849800793714568e-05, "loss": 0.0068, "step": 672550 }, { "epoch": 1.74, "learning_rate": 3.8494119720774216e-05, "loss": 0.0066, "step": 672560 }, { "epoch": 1.74, "learning_rate": 3.849023150440275e-05, "loss": 0.0056, "step": 672570 }, { "epoch": 1.74, "learning_rate": 3.8486343288031286e-05, "loss": 0.0095, "step": 672580 }, { "epoch": 1.74, "learning_rate": 3.848245507165982e-05, "loss": 0.0087, "step": 672590 }, { "epoch": 1.74, "learning_rate": 3.847856685528836e-05, "loss": 0.0088, "step": 672600 }, { "epoch": 1.74, "learning_rate": 3.84746786389169e-05, "loss": 0.0084, "step": 672610 }, { "epoch": 1.74, "learning_rate": 3.847079042254543e-05, "loss": 0.0101, "step": 672620 }, { "epoch": 1.74, "learning_rate": 3.846690220617397e-05, "loss": 0.0087, "step": 672630 }, { "epoch": 1.74, "learning_rate": 3.84630139898025e-05, "loss": 0.0073, "step": 672640 }, { "epoch": 1.74, "learning_rate": 3.8459125773431037e-05, "loss": 0.0088, "step": 672650 }, { "epoch": 1.74, "learning_rate": 3.845523755705957e-05, "loss": 0.0088, "step": 672660 }, { "epoch": 1.74, "learning_rate": 3.8451349340688106e-05, "loss": 0.0069, "step": 672670 }, { "epoch": 1.74, "learning_rate": 3.844746112431665e-05, "loss": 0.0075, "step": 672680 }, { "epoch": 1.74, "learning_rate": 3.844357290794518e-05, "loss": 0.0079, "step": 672690 }, { "epoch": 1.74, "learning_rate": 3.843968469157372e-05, "loss": 0.0063, "step": 672700 }, { "epoch": 1.74, "learning_rate": 3.843579647520225e-05, "loss": 0.0065, "step": 672710 }, { "epoch": 1.74, "learning_rate": 3.843190825883079e-05, "loss": 0.0093, "step": 672720 }, { "epoch": 1.74, "learning_rate": 3.842802004245932e-05, "loss": 0.007, "step": 672730 }, { "epoch": 1.74, "learning_rate": 3.842413182608786e-05, "loss": 0.0076, "step": 672740 }, { "epoch": 1.74, "learning_rate": 3.8420243609716385e-05, "loss": 0.0078, "step": 672750 }, { "epoch": 1.74, "learning_rate": 3.841635539334492e-05, "loss": 0.0103, "step": 672760 }, { "epoch": 1.74, "learning_rate": 3.8412467176973455e-05, "loss": 0.0075, "step": 672770 }, { "epoch": 1.74, "learning_rate": 3.8408578960601997e-05, "loss": 0.0084, "step": 672780 }, { "epoch": 1.74, "learning_rate": 3.840469074423053e-05, "loss": 0.007, "step": 672790 }, { "epoch": 1.74, "learning_rate": 3.8400802527859066e-05, "loss": 0.008, "step": 672800 }, { "epoch": 1.74, "learning_rate": 3.83969143114876e-05, "loss": 0.0078, "step": 672810 }, { "epoch": 1.74, "learning_rate": 3.8393026095116136e-05, "loss": 0.0102, "step": 672820 }, { "epoch": 1.74, "learning_rate": 3.838913787874467e-05, "loss": 0.0068, "step": 672830 }, { "epoch": 1.74, "learning_rate": 3.8385249662373206e-05, "loss": 0.0077, "step": 672840 }, { "epoch": 1.74, "learning_rate": 3.838136144600174e-05, "loss": 0.0081, "step": 672850 }, { "epoch": 1.74, "learning_rate": 3.837747322963028e-05, "loss": 0.0091, "step": 672860 }, { "epoch": 1.74, "learning_rate": 3.837358501325882e-05, "loss": 0.0087, "step": 672870 }, { "epoch": 1.74, "learning_rate": 3.836969679688735e-05, "loss": 0.0072, "step": 672880 }, { "epoch": 1.74, "learning_rate": 3.836580858051589e-05, "loss": 0.0096, "step": 672890 }, { "epoch": 1.74, "learning_rate": 3.836192036414442e-05, "loss": 0.0073, "step": 672900 }, { "epoch": 1.74, "learning_rate": 3.8358032147772957e-05, "loss": 0.0102, "step": 672910 }, { "epoch": 1.74, "learning_rate": 3.835414393140149e-05, "loss": 0.0068, "step": 672920 }, { "epoch": 1.74, "learning_rate": 3.8350255715030026e-05, "loss": 0.0075, "step": 672930 }, { "epoch": 1.74, "learning_rate": 3.834636749865856e-05, "loss": 0.0088, "step": 672940 }, { "epoch": 1.74, "learning_rate": 3.83424792822871e-05, "loss": 0.0048, "step": 672950 }, { "epoch": 1.74, "learning_rate": 3.833859106591564e-05, "loss": 0.009, "step": 672960 }, { "epoch": 1.74, "learning_rate": 3.833470284954417e-05, "loss": 0.0073, "step": 672970 }, { "epoch": 1.74, "learning_rate": 3.833081463317271e-05, "loss": 0.0082, "step": 672980 }, { "epoch": 1.74, "learning_rate": 3.8326926416801235e-05, "loss": 0.0086, "step": 672990 }, { "epoch": 1.74, "learning_rate": 3.832303820042977e-05, "loss": 0.0095, "step": 673000 }, { "epoch": 1.74, "eval_cer": 0.8816620968520765, "eval_loss": 0.005063023883849382, "eval_runtime": 108.0509, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.627, "step": 673000 }, { "epoch": 1.74, "learning_rate": 3.8319149984058305e-05, "loss": 0.0098, "step": 673010 }, { "epoch": 1.74, "learning_rate": 3.831526176768684e-05, "loss": 0.0068, "step": 673020 }, { "epoch": 1.74, "learning_rate": 3.8311373551315375e-05, "loss": 0.0071, "step": 673030 }, { "epoch": 1.74, "learning_rate": 3.8307485334943917e-05, "loss": 0.0094, "step": 673040 }, { "epoch": 1.74, "learning_rate": 3.830359711857245e-05, "loss": 0.006, "step": 673050 }, { "epoch": 1.74, "learning_rate": 3.8299708902200986e-05, "loss": 0.0064, "step": 673060 }, { "epoch": 1.74, "learning_rate": 3.829582068582952e-05, "loss": 0.0074, "step": 673070 }, { "epoch": 1.74, "learning_rate": 3.8291932469458056e-05, "loss": 0.0081, "step": 673080 }, { "epoch": 1.74, "learning_rate": 3.828804425308659e-05, "loss": 0.0069, "step": 673090 }, { "epoch": 1.74, "learning_rate": 3.8284156036715126e-05, "loss": 0.0052, "step": 673100 }, { "epoch": 1.74, "learning_rate": 3.828026782034366e-05, "loss": 0.0088, "step": 673110 }, { "epoch": 1.74, "learning_rate": 3.8276379603972195e-05, "loss": 0.0078, "step": 673120 }, { "epoch": 1.74, "learning_rate": 3.827249138760074e-05, "loss": 0.0086, "step": 673130 }, { "epoch": 1.74, "learning_rate": 3.826860317122927e-05, "loss": 0.0077, "step": 673140 }, { "epoch": 1.74, "learning_rate": 3.826471495485781e-05, "loss": 0.0086, "step": 673150 }, { "epoch": 1.74, "learning_rate": 3.826082673848634e-05, "loss": 0.0064, "step": 673160 }, { "epoch": 1.74, "learning_rate": 3.8256938522114876e-05, "loss": 0.0062, "step": 673170 }, { "epoch": 1.74, "learning_rate": 3.825305030574341e-05, "loss": 0.0074, "step": 673180 }, { "epoch": 1.75, "learning_rate": 3.8249162089371946e-05, "loss": 0.0068, "step": 673190 }, { "epoch": 1.75, "learning_rate": 3.824527387300048e-05, "loss": 0.007, "step": 673200 }, { "epoch": 1.75, "learning_rate": 3.824138565662902e-05, "loss": 0.0056, "step": 673210 }, { "epoch": 1.75, "learning_rate": 3.823749744025756e-05, "loss": 0.0083, "step": 673220 }, { "epoch": 1.75, "learning_rate": 3.823360922388609e-05, "loss": 0.0081, "step": 673230 }, { "epoch": 1.75, "learning_rate": 3.822972100751462e-05, "loss": 0.0076, "step": 673240 }, { "epoch": 1.75, "learning_rate": 3.8225832791143155e-05, "loss": 0.007, "step": 673250 }, { "epoch": 1.75, "learning_rate": 3.822194457477169e-05, "loss": 0.0075, "step": 673260 }, { "epoch": 1.75, "learning_rate": 3.8218056358400225e-05, "loss": 0.006, "step": 673270 }, { "epoch": 1.75, "learning_rate": 3.821416814202876e-05, "loss": 0.0114, "step": 673280 }, { "epoch": 1.75, "learning_rate": 3.8210279925657295e-05, "loss": 0.0084, "step": 673290 }, { "epoch": 1.75, "learning_rate": 3.820639170928583e-05, "loss": 0.0068, "step": 673300 }, { "epoch": 1.75, "learning_rate": 3.820250349291437e-05, "loss": 0.0094, "step": 673310 }, { "epoch": 1.75, "learning_rate": 3.8198615276542906e-05, "loss": 0.0078, "step": 673320 }, { "epoch": 1.75, "learning_rate": 3.819472706017144e-05, "loss": 0.0066, "step": 673330 }, { "epoch": 1.75, "learning_rate": 3.8190838843799976e-05, "loss": 0.0091, "step": 673340 }, { "epoch": 1.75, "learning_rate": 3.818695062742851e-05, "loss": 0.0078, "step": 673350 }, { "epoch": 1.75, "learning_rate": 3.8183062411057046e-05, "loss": 0.0059, "step": 673360 }, { "epoch": 1.75, "learning_rate": 3.817917419468558e-05, "loss": 0.0065, "step": 673370 }, { "epoch": 1.75, "learning_rate": 3.8175285978314115e-05, "loss": 0.0108, "step": 673380 }, { "epoch": 1.75, "learning_rate": 3.817139776194266e-05, "loss": 0.012, "step": 673390 }, { "epoch": 1.75, "learning_rate": 3.816750954557119e-05, "loss": 0.0106, "step": 673400 }, { "epoch": 1.75, "learning_rate": 3.816362132919973e-05, "loss": 0.009, "step": 673410 }, { "epoch": 1.75, "learning_rate": 3.815973311282826e-05, "loss": 0.0063, "step": 673420 }, { "epoch": 1.75, "learning_rate": 3.8155844896456796e-05, "loss": 0.0094, "step": 673430 }, { "epoch": 1.75, "learning_rate": 3.815195668008533e-05, "loss": 0.0112, "step": 673440 }, { "epoch": 1.75, "learning_rate": 3.8148068463713866e-05, "loss": 0.0072, "step": 673450 }, { "epoch": 1.75, "learning_rate": 3.81441802473424e-05, "loss": 0.0081, "step": 673460 }, { "epoch": 1.75, "learning_rate": 3.814029203097094e-05, "loss": 0.0056, "step": 673470 }, { "epoch": 1.75, "learning_rate": 3.813640381459948e-05, "loss": 0.0075, "step": 673480 }, { "epoch": 1.75, "learning_rate": 3.8132515598228006e-05, "loss": 0.0084, "step": 673490 }, { "epoch": 1.75, "learning_rate": 3.812862738185654e-05, "loss": 0.0088, "step": 673500 }, { "epoch": 1.75, "learning_rate": 3.8124739165485075e-05, "loss": 0.0078, "step": 673510 }, { "epoch": 1.75, "learning_rate": 3.812085094911361e-05, "loss": 0.0066, "step": 673520 }, { "epoch": 1.75, "learning_rate": 3.8116962732742145e-05, "loss": 0.0076, "step": 673530 }, { "epoch": 1.75, "learning_rate": 3.811307451637068e-05, "loss": 0.0071, "step": 673540 }, { "epoch": 1.75, "learning_rate": 3.8109186299999215e-05, "loss": 0.0094, "step": 673550 }, { "epoch": 1.75, "learning_rate": 3.810529808362775e-05, "loss": 0.0073, "step": 673560 }, { "epoch": 1.75, "learning_rate": 3.810140986725629e-05, "loss": 0.0065, "step": 673570 }, { "epoch": 1.75, "learning_rate": 3.8097521650884826e-05, "loss": 0.0073, "step": 673580 }, { "epoch": 1.75, "learning_rate": 3.809363343451336e-05, "loss": 0.0078, "step": 673590 }, { "epoch": 1.75, "learning_rate": 3.8089745218141896e-05, "loss": 0.0073, "step": 673600 }, { "epoch": 1.75, "learning_rate": 3.808585700177043e-05, "loss": 0.0073, "step": 673610 }, { "epoch": 1.75, "learning_rate": 3.8081968785398966e-05, "loss": 0.0094, "step": 673620 }, { "epoch": 1.75, "learning_rate": 3.80780805690275e-05, "loss": 0.0085, "step": 673630 }, { "epoch": 1.75, "learning_rate": 3.8074192352656035e-05, "loss": 0.008, "step": 673640 }, { "epoch": 1.75, "learning_rate": 3.807030413628458e-05, "loss": 0.0106, "step": 673650 }, { "epoch": 1.75, "learning_rate": 3.806641591991311e-05, "loss": 0.0088, "step": 673660 }, { "epoch": 1.75, "learning_rate": 3.806252770354165e-05, "loss": 0.0075, "step": 673670 }, { "epoch": 1.75, "learning_rate": 3.805863948717018e-05, "loss": 0.0051, "step": 673680 }, { "epoch": 1.75, "learning_rate": 3.8054751270798716e-05, "loss": 0.0068, "step": 673690 }, { "epoch": 1.75, "learning_rate": 3.805086305442725e-05, "loss": 0.0116, "step": 673700 }, { "epoch": 1.75, "learning_rate": 3.8046974838055786e-05, "loss": 0.0081, "step": 673710 }, { "epoch": 1.75, "learning_rate": 3.804308662168432e-05, "loss": 0.008, "step": 673720 }, { "epoch": 1.75, "learning_rate": 3.803919840531286e-05, "loss": 0.008, "step": 673730 }, { "epoch": 1.75, "learning_rate": 3.8035310188941384e-05, "loss": 0.0089, "step": 673740 }, { "epoch": 1.75, "learning_rate": 3.8031421972569926e-05, "loss": 0.0064, "step": 673750 }, { "epoch": 1.75, "learning_rate": 3.802753375619846e-05, "loss": 0.0059, "step": 673760 }, { "epoch": 1.75, "learning_rate": 3.8023645539826995e-05, "loss": 0.0063, "step": 673770 }, { "epoch": 1.75, "learning_rate": 3.801975732345553e-05, "loss": 0.0086, "step": 673780 }, { "epoch": 1.75, "learning_rate": 3.8015869107084065e-05, "loss": 0.0074, "step": 673790 }, { "epoch": 1.75, "learning_rate": 3.80119808907126e-05, "loss": 0.0082, "step": 673800 }, { "epoch": 1.75, "learning_rate": 3.8008092674341135e-05, "loss": 0.0078, "step": 673810 }, { "epoch": 1.75, "learning_rate": 3.800420445796967e-05, "loss": 0.0085, "step": 673820 }, { "epoch": 1.75, "learning_rate": 3.800031624159821e-05, "loss": 0.0078, "step": 673830 }, { "epoch": 1.75, "learning_rate": 3.7996428025226746e-05, "loss": 0.0092, "step": 673840 }, { "epoch": 1.75, "learning_rate": 3.799253980885528e-05, "loss": 0.007, "step": 673850 }, { "epoch": 1.75, "learning_rate": 3.7988651592483816e-05, "loss": 0.0084, "step": 673860 }, { "epoch": 1.75, "learning_rate": 3.798476337611235e-05, "loss": 0.0074, "step": 673870 }, { "epoch": 1.75, "learning_rate": 3.7980875159740886e-05, "loss": 0.0088, "step": 673880 }, { "epoch": 1.75, "learning_rate": 3.797698694336942e-05, "loss": 0.0064, "step": 673890 }, { "epoch": 1.75, "learning_rate": 3.7973098726997955e-05, "loss": 0.0075, "step": 673900 }, { "epoch": 1.75, "learning_rate": 3.79692105106265e-05, "loss": 0.0077, "step": 673910 }, { "epoch": 1.75, "learning_rate": 3.796532229425503e-05, "loss": 0.0057, "step": 673920 }, { "epoch": 1.75, "learning_rate": 3.796143407788357e-05, "loss": 0.0093, "step": 673930 }, { "epoch": 1.75, "learning_rate": 3.79575458615121e-05, "loss": 0.0072, "step": 673940 }, { "epoch": 1.75, "learning_rate": 3.7953657645140636e-05, "loss": 0.0066, "step": 673950 }, { "epoch": 1.75, "learning_rate": 3.794976942876917e-05, "loss": 0.0074, "step": 673960 }, { "epoch": 1.75, "learning_rate": 3.7945881212397706e-05, "loss": 0.0097, "step": 673970 }, { "epoch": 1.75, "learning_rate": 3.794199299602624e-05, "loss": 0.0086, "step": 673980 }, { "epoch": 1.75, "learning_rate": 3.793810477965477e-05, "loss": 0.0078, "step": 673990 }, { "epoch": 1.75, "learning_rate": 3.7934216563283304e-05, "loss": 0.0062, "step": 674000 }, { "epoch": 1.75, "eval_cer": 0.8816830914060892, "eval_loss": 0.004991509020328522, "eval_runtime": 108.0875, "eval_samples_per_second": 18.504, "eval_steps_per_second": 4.626, "step": 674000 }, { "epoch": 1.75, "learning_rate": 3.7930328346911846e-05, "loss": 0.0074, "step": 674010 }, { "epoch": 1.75, "learning_rate": 3.792644013054038e-05, "loss": 0.0093, "step": 674020 }, { "epoch": 1.75, "learning_rate": 3.7922551914168915e-05, "loss": 0.0126, "step": 674030 }, { "epoch": 1.75, "learning_rate": 3.791866369779745e-05, "loss": 0.0077, "step": 674040 }, { "epoch": 1.75, "learning_rate": 3.7914775481425985e-05, "loss": 0.0088, "step": 674050 }, { "epoch": 1.75, "learning_rate": 3.791088726505452e-05, "loss": 0.0074, "step": 674060 }, { "epoch": 1.75, "learning_rate": 3.7906999048683055e-05, "loss": 0.0102, "step": 674070 }, { "epoch": 1.75, "learning_rate": 3.790311083231159e-05, "loss": 0.0074, "step": 674080 }, { "epoch": 1.75, "learning_rate": 3.789922261594013e-05, "loss": 0.0116, "step": 674090 }, { "epoch": 1.75, "learning_rate": 3.7895334399568666e-05, "loss": 0.0064, "step": 674100 }, { "epoch": 1.75, "learning_rate": 3.78914461831972e-05, "loss": 0.0081, "step": 674110 }, { "epoch": 1.75, "learning_rate": 3.7887557966825736e-05, "loss": 0.007, "step": 674120 }, { "epoch": 1.75, "learning_rate": 3.788366975045427e-05, "loss": 0.0058, "step": 674130 }, { "epoch": 1.75, "learning_rate": 3.7879781534082805e-05, "loss": 0.0073, "step": 674140 }, { "epoch": 1.75, "learning_rate": 3.787589331771134e-05, "loss": 0.0061, "step": 674150 }, { "epoch": 1.75, "learning_rate": 3.7872005101339875e-05, "loss": 0.0061, "step": 674160 }, { "epoch": 1.75, "learning_rate": 3.786811688496842e-05, "loss": 0.0094, "step": 674170 }, { "epoch": 1.75, "learning_rate": 3.786422866859695e-05, "loss": 0.0046, "step": 674180 }, { "epoch": 1.75, "learning_rate": 3.7860340452225487e-05, "loss": 0.0078, "step": 674190 }, { "epoch": 1.75, "learning_rate": 3.785645223585402e-05, "loss": 0.009, "step": 674200 }, { "epoch": 1.75, "learning_rate": 3.7852564019482556e-05, "loss": 0.01, "step": 674210 }, { "epoch": 1.75, "learning_rate": 3.784867580311109e-05, "loss": 0.0055, "step": 674220 }, { "epoch": 1.75, "learning_rate": 3.784478758673962e-05, "loss": 0.0096, "step": 674230 }, { "epoch": 1.75, "learning_rate": 3.7840899370368154e-05, "loss": 0.0155, "step": 674240 }, { "epoch": 1.75, "learning_rate": 3.783701115399669e-05, "loss": 0.0081, "step": 674250 }, { "epoch": 1.75, "learning_rate": 3.7833122937625224e-05, "loss": 0.0075, "step": 674260 }, { "epoch": 1.75, "learning_rate": 3.7829234721253765e-05, "loss": 0.0084, "step": 674270 }, { "epoch": 1.75, "learning_rate": 3.78253465048823e-05, "loss": 0.0068, "step": 674280 }, { "epoch": 1.75, "learning_rate": 3.7821458288510835e-05, "loss": 0.0068, "step": 674290 }, { "epoch": 1.75, "learning_rate": 3.781757007213937e-05, "loss": 0.0085, "step": 674300 }, { "epoch": 1.75, "learning_rate": 3.7813681855767905e-05, "loss": 0.0078, "step": 674310 }, { "epoch": 1.75, "learning_rate": 3.780979363939644e-05, "loss": 0.0072, "step": 674320 }, { "epoch": 1.75, "learning_rate": 3.7805905423024975e-05, "loss": 0.0088, "step": 674330 }, { "epoch": 1.75, "learning_rate": 3.780201720665351e-05, "loss": 0.0095, "step": 674340 }, { "epoch": 1.75, "learning_rate": 3.779812899028205e-05, "loss": 0.0075, "step": 674350 }, { "epoch": 1.75, "learning_rate": 3.7794240773910586e-05, "loss": 0.0077, "step": 674360 }, { "epoch": 1.75, "learning_rate": 3.779035255753912e-05, "loss": 0.0056, "step": 674370 }, { "epoch": 1.75, "learning_rate": 3.7786464341167656e-05, "loss": 0.0078, "step": 674380 }, { "epoch": 1.75, "learning_rate": 3.778257612479619e-05, "loss": 0.008, "step": 674390 }, { "epoch": 1.75, "learning_rate": 3.7778687908424725e-05, "loss": 0.0064, "step": 674400 }, { "epoch": 1.75, "learning_rate": 3.777479969205326e-05, "loss": 0.0082, "step": 674410 }, { "epoch": 1.75, "learning_rate": 3.7770911475681795e-05, "loss": 0.0081, "step": 674420 }, { "epoch": 1.75, "learning_rate": 3.776702325931033e-05, "loss": 0.0099, "step": 674430 }, { "epoch": 1.75, "learning_rate": 3.776313504293887e-05, "loss": 0.0081, "step": 674440 }, { "epoch": 1.75, "learning_rate": 3.7759246826567407e-05, "loss": 0.0101, "step": 674450 }, { "epoch": 1.75, "learning_rate": 3.775535861019594e-05, "loss": 0.0101, "step": 674460 }, { "epoch": 1.75, "learning_rate": 3.7751470393824476e-05, "loss": 0.0068, "step": 674470 }, { "epoch": 1.75, "learning_rate": 3.7747582177453004e-05, "loss": 0.0057, "step": 674480 }, { "epoch": 1.75, "learning_rate": 3.774369396108154e-05, "loss": 0.0082, "step": 674490 }, { "epoch": 1.75, "learning_rate": 3.7739805744710074e-05, "loss": 0.0085, "step": 674500 }, { "epoch": 1.75, "learning_rate": 3.773591752833861e-05, "loss": 0.0083, "step": 674510 }, { "epoch": 1.75, "learning_rate": 3.7732029311967144e-05, "loss": 0.0047, "step": 674520 }, { "epoch": 1.75, "learning_rate": 3.772814109559568e-05, "loss": 0.006, "step": 674530 }, { "epoch": 1.75, "learning_rate": 3.772425287922422e-05, "loss": 0.0056, "step": 674540 }, { "epoch": 1.75, "learning_rate": 3.7720364662852755e-05, "loss": 0.008, "step": 674550 }, { "epoch": 1.75, "learning_rate": 3.771647644648129e-05, "loss": 0.0059, "step": 674560 }, { "epoch": 1.75, "learning_rate": 3.7712588230109825e-05, "loss": 0.0064, "step": 674570 }, { "epoch": 1.75, "learning_rate": 3.770870001373836e-05, "loss": 0.0088, "step": 674580 }, { "epoch": 1.75, "learning_rate": 3.7704811797366895e-05, "loss": 0.007, "step": 674590 }, { "epoch": 1.75, "learning_rate": 3.770092358099543e-05, "loss": 0.0085, "step": 674600 }, { "epoch": 1.75, "learning_rate": 3.7697035364623964e-05, "loss": 0.0091, "step": 674610 }, { "epoch": 1.75, "learning_rate": 3.7693147148252506e-05, "loss": 0.0097, "step": 674620 }, { "epoch": 1.75, "learning_rate": 3.768925893188104e-05, "loss": 0.0066, "step": 674630 }, { "epoch": 1.75, "learning_rate": 3.7685370715509576e-05, "loss": 0.0066, "step": 674640 }, { "epoch": 1.75, "learning_rate": 3.768148249913811e-05, "loss": 0.0075, "step": 674650 }, { "epoch": 1.75, "learning_rate": 3.7677594282766645e-05, "loss": 0.0078, "step": 674660 }, { "epoch": 1.75, "learning_rate": 3.767370606639518e-05, "loss": 0.0062, "step": 674670 }, { "epoch": 1.75, "learning_rate": 3.7669817850023715e-05, "loss": 0.0077, "step": 674680 }, { "epoch": 1.75, "learning_rate": 3.766592963365225e-05, "loss": 0.0077, "step": 674690 }, { "epoch": 1.75, "learning_rate": 3.766204141728079e-05, "loss": 0.0065, "step": 674700 }, { "epoch": 1.75, "learning_rate": 3.7658153200909326e-05, "loss": 0.0062, "step": 674710 }, { "epoch": 1.75, "learning_rate": 3.765426498453786e-05, "loss": 0.0079, "step": 674720 }, { "epoch": 1.75, "learning_rate": 3.765037676816639e-05, "loss": 0.0085, "step": 674730 }, { "epoch": 1.75, "learning_rate": 3.7646488551794924e-05, "loss": 0.0085, "step": 674740 }, { "epoch": 1.75, "learning_rate": 3.764260033542346e-05, "loss": 0.0085, "step": 674750 }, { "epoch": 1.75, "learning_rate": 3.7638712119051994e-05, "loss": 0.008, "step": 674760 }, { "epoch": 1.75, "learning_rate": 3.763482390268053e-05, "loss": 0.0078, "step": 674770 }, { "epoch": 1.75, "learning_rate": 3.7630935686309064e-05, "loss": 0.0111, "step": 674780 }, { "epoch": 1.75, "learning_rate": 3.76270474699376e-05, "loss": 0.0095, "step": 674790 }, { "epoch": 1.75, "learning_rate": 3.762315925356614e-05, "loss": 0.0079, "step": 674800 }, { "epoch": 1.75, "learning_rate": 3.7619271037194675e-05, "loss": 0.0082, "step": 674810 }, { "epoch": 1.75, "learning_rate": 3.761538282082321e-05, "loss": 0.0073, "step": 674820 }, { "epoch": 1.75, "learning_rate": 3.7611494604451745e-05, "loss": 0.0073, "step": 674830 }, { "epoch": 1.75, "learning_rate": 3.760760638808028e-05, "loss": 0.0072, "step": 674840 }, { "epoch": 1.75, "learning_rate": 3.7603718171708815e-05, "loss": 0.0062, "step": 674850 }, { "epoch": 1.75, "learning_rate": 3.759982995533735e-05, "loss": 0.0077, "step": 674860 }, { "epoch": 1.75, "learning_rate": 3.7595941738965884e-05, "loss": 0.005, "step": 674870 }, { "epoch": 1.75, "learning_rate": 3.7592053522594426e-05, "loss": 0.0076, "step": 674880 }, { "epoch": 1.75, "learning_rate": 3.758816530622296e-05, "loss": 0.0102, "step": 674890 }, { "epoch": 1.75, "learning_rate": 3.7584277089851496e-05, "loss": 0.0062, "step": 674900 }, { "epoch": 1.75, "learning_rate": 3.758038887348003e-05, "loss": 0.0094, "step": 674910 }, { "epoch": 1.75, "learning_rate": 3.7576500657108565e-05, "loss": 0.0057, "step": 674920 }, { "epoch": 1.75, "learning_rate": 3.75726124407371e-05, "loss": 0.012, "step": 674930 }, { "epoch": 1.75, "learning_rate": 3.7568724224365635e-05, "loss": 0.0097, "step": 674940 }, { "epoch": 1.75, "learning_rate": 3.756483600799417e-05, "loss": 0.01, "step": 674950 }, { "epoch": 1.75, "learning_rate": 3.756094779162271e-05, "loss": 0.0079, "step": 674960 }, { "epoch": 1.75, "learning_rate": 3.7557059575251246e-05, "loss": 0.0078, "step": 674970 }, { "epoch": 1.75, "learning_rate": 3.7553171358879775e-05, "loss": 0.007, "step": 674980 }, { "epoch": 1.75, "learning_rate": 3.754928314250831e-05, "loss": 0.0074, "step": 674990 }, { "epoch": 1.75, "learning_rate": 3.7545394926136844e-05, "loss": 0.0091, "step": 675000 }, { "epoch": 1.75, "eval_cer": 0.8816704946736816, "eval_loss": 0.00502510741353035, "eval_runtime": 108.0489, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.628, "step": 675000 }, { "epoch": 1.75, "learning_rate": 3.754150670976538e-05, "loss": 0.0073, "step": 675010 }, { "epoch": 1.75, "learning_rate": 3.7537618493393914e-05, "loss": 0.0076, "step": 675020 }, { "epoch": 1.75, "learning_rate": 3.753373027702245e-05, "loss": 0.0047, "step": 675030 }, { "epoch": 1.75, "learning_rate": 3.7529842060650984e-05, "loss": 0.0078, "step": 675040 }, { "epoch": 1.75, "learning_rate": 3.752595384427952e-05, "loss": 0.0072, "step": 675050 }, { "epoch": 1.75, "learning_rate": 3.752206562790806e-05, "loss": 0.0073, "step": 675060 }, { "epoch": 1.75, "learning_rate": 3.7518177411536595e-05, "loss": 0.0061, "step": 675070 }, { "epoch": 1.75, "learning_rate": 3.751428919516513e-05, "loss": 0.0091, "step": 675080 }, { "epoch": 1.75, "learning_rate": 3.7510400978793665e-05, "loss": 0.0083, "step": 675090 }, { "epoch": 1.75, "learning_rate": 3.75065127624222e-05, "loss": 0.0083, "step": 675100 }, { "epoch": 1.75, "learning_rate": 3.7502624546050734e-05, "loss": 0.0077, "step": 675110 }, { "epoch": 1.75, "learning_rate": 3.749873632967927e-05, "loss": 0.0094, "step": 675120 }, { "epoch": 1.75, "learning_rate": 3.7494848113307804e-05, "loss": 0.0057, "step": 675130 }, { "epoch": 1.75, "learning_rate": 3.7490959896936346e-05, "loss": 0.008, "step": 675140 }, { "epoch": 1.75, "learning_rate": 3.748707168056488e-05, "loss": 0.0087, "step": 675150 }, { "epoch": 1.75, "learning_rate": 3.7483183464193416e-05, "loss": 0.0074, "step": 675160 }, { "epoch": 1.75, "learning_rate": 3.7479295247821944e-05, "loss": 0.0092, "step": 675170 }, { "epoch": 1.75, "learning_rate": 3.747540703145048e-05, "loss": 0.0057, "step": 675180 }, { "epoch": 1.75, "learning_rate": 3.747151881507902e-05, "loss": 0.0072, "step": 675190 }, { "epoch": 1.75, "learning_rate": 3.7467630598707555e-05, "loss": 0.007, "step": 675200 }, { "epoch": 1.75, "learning_rate": 3.746374238233609e-05, "loss": 0.0123, "step": 675210 }, { "epoch": 1.75, "learning_rate": 3.7459854165964625e-05, "loss": 0.0109, "step": 675220 }, { "epoch": 1.75, "learning_rate": 3.745596594959316e-05, "loss": 0.0092, "step": 675230 }, { "epoch": 1.75, "learning_rate": 3.7452077733221694e-05, "loss": 0.0082, "step": 675240 }, { "epoch": 1.75, "learning_rate": 3.744818951685023e-05, "loss": 0.0075, "step": 675250 }, { "epoch": 1.75, "learning_rate": 3.7444301300478764e-05, "loss": 0.007, "step": 675260 }, { "epoch": 1.75, "learning_rate": 3.7440413084107306e-05, "loss": 0.006, "step": 675270 }, { "epoch": 1.75, "learning_rate": 3.743652486773584e-05, "loss": 0.0084, "step": 675280 }, { "epoch": 1.75, "learning_rate": 3.743263665136437e-05, "loss": 0.0073, "step": 675290 }, { "epoch": 1.75, "learning_rate": 3.7428748434992904e-05, "loss": 0.0057, "step": 675300 }, { "epoch": 1.75, "learning_rate": 3.742486021862144e-05, "loss": 0.0056, "step": 675310 }, { "epoch": 1.75, "learning_rate": 3.742097200224998e-05, "loss": 0.0077, "step": 675320 }, { "epoch": 1.75, "learning_rate": 3.7417083785878515e-05, "loss": 0.0086, "step": 675330 }, { "epoch": 1.75, "learning_rate": 3.741319556950705e-05, "loss": 0.0072, "step": 675340 }, { "epoch": 1.75, "learning_rate": 3.7409307353135585e-05, "loss": 0.0094, "step": 675350 }, { "epoch": 1.75, "learning_rate": 3.740541913676412e-05, "loss": 0.0073, "step": 675360 }, { "epoch": 1.75, "learning_rate": 3.7401530920392654e-05, "loss": 0.0067, "step": 675370 }, { "epoch": 1.75, "learning_rate": 3.739764270402119e-05, "loss": 0.0076, "step": 675380 }, { "epoch": 1.75, "learning_rate": 3.7393754487649724e-05, "loss": 0.0075, "step": 675390 }, { "epoch": 1.75, "learning_rate": 3.7389866271278266e-05, "loss": 0.011, "step": 675400 }, { "epoch": 1.75, "learning_rate": 3.7385978054906794e-05, "loss": 0.0094, "step": 675410 }, { "epoch": 1.75, "learning_rate": 3.738208983853533e-05, "loss": 0.006, "step": 675420 }, { "epoch": 1.75, "learning_rate": 3.7378201622163864e-05, "loss": 0.0075, "step": 675430 }, { "epoch": 1.75, "learning_rate": 3.73743134057924e-05, "loss": 0.0075, "step": 675440 }, { "epoch": 1.75, "learning_rate": 3.737042518942094e-05, "loss": 0.0068, "step": 675450 }, { "epoch": 1.75, "learning_rate": 3.7366536973049475e-05, "loss": 0.008, "step": 675460 }, { "epoch": 1.75, "learning_rate": 3.736264875667801e-05, "loss": 0.0079, "step": 675470 }, { "epoch": 1.75, "learning_rate": 3.7358760540306545e-05, "loss": 0.0075, "step": 675480 }, { "epoch": 1.75, "learning_rate": 3.735487232393508e-05, "loss": 0.0072, "step": 675490 }, { "epoch": 1.75, "learning_rate": 3.7350984107563614e-05, "loss": 0.0085, "step": 675500 }, { "epoch": 1.75, "learning_rate": 3.734709589119215e-05, "loss": 0.0061, "step": 675510 }, { "epoch": 1.75, "learning_rate": 3.7343207674820684e-05, "loss": 0.0075, "step": 675520 }, { "epoch": 1.75, "learning_rate": 3.7339319458449226e-05, "loss": 0.0072, "step": 675530 }, { "epoch": 1.75, "learning_rate": 3.7335431242077754e-05, "loss": 0.0093, "step": 675540 }, { "epoch": 1.75, "learning_rate": 3.733154302570629e-05, "loss": 0.0116, "step": 675550 }, { "epoch": 1.75, "learning_rate": 3.7327654809334824e-05, "loss": 0.0081, "step": 675560 }, { "epoch": 1.75, "learning_rate": 3.732376659296336e-05, "loss": 0.0053, "step": 675570 }, { "epoch": 1.75, "learning_rate": 3.73198783765919e-05, "loss": 0.0087, "step": 675580 }, { "epoch": 1.75, "learning_rate": 3.7315990160220435e-05, "loss": 0.0066, "step": 675590 }, { "epoch": 1.75, "learning_rate": 3.731210194384897e-05, "loss": 0.0083, "step": 675600 }, { "epoch": 1.75, "learning_rate": 3.7308213727477505e-05, "loss": 0.0078, "step": 675610 }, { "epoch": 1.75, "learning_rate": 3.730432551110604e-05, "loss": 0.0059, "step": 675620 }, { "epoch": 1.75, "learning_rate": 3.7300437294734574e-05, "loss": 0.0118, "step": 675630 }, { "epoch": 1.75, "learning_rate": 3.729654907836311e-05, "loss": 0.0076, "step": 675640 }, { "epoch": 1.75, "learning_rate": 3.7292660861991644e-05, "loss": 0.007, "step": 675650 }, { "epoch": 1.75, "learning_rate": 3.728877264562018e-05, "loss": 0.0129, "step": 675660 }, { "epoch": 1.75, "learning_rate": 3.7284884429248714e-05, "loss": 0.0083, "step": 675670 }, { "epoch": 1.75, "learning_rate": 3.728099621287725e-05, "loss": 0.0099, "step": 675680 }, { "epoch": 1.75, "learning_rate": 3.7277107996505784e-05, "loss": 0.0111, "step": 675690 }, { "epoch": 1.75, "learning_rate": 3.727321978013432e-05, "loss": 0.0105, "step": 675700 }, { "epoch": 1.75, "learning_rate": 3.726933156376286e-05, "loss": 0.006, "step": 675710 }, { "epoch": 1.75, "learning_rate": 3.7265443347391395e-05, "loss": 0.009, "step": 675720 }, { "epoch": 1.75, "learning_rate": 3.726155513101993e-05, "loss": 0.0109, "step": 675730 }, { "epoch": 1.75, "learning_rate": 3.7257666914648465e-05, "loss": 0.0072, "step": 675740 }, { "epoch": 1.75, "learning_rate": 3.7253778698277e-05, "loss": 0.0088, "step": 675750 }, { "epoch": 1.75, "learning_rate": 3.7249890481905534e-05, "loss": 0.009, "step": 675760 }, { "epoch": 1.75, "learning_rate": 3.724600226553407e-05, "loss": 0.0069, "step": 675770 }, { "epoch": 1.75, "learning_rate": 3.7242114049162604e-05, "loss": 0.0095, "step": 675780 }, { "epoch": 1.75, "learning_rate": 3.723822583279114e-05, "loss": 0.0086, "step": 675790 }, { "epoch": 1.75, "learning_rate": 3.7234337616419674e-05, "loss": 0.0099, "step": 675800 }, { "epoch": 1.75, "learning_rate": 3.723044940004821e-05, "loss": 0.0073, "step": 675810 }, { "epoch": 1.75, "learning_rate": 3.7226561183676744e-05, "loss": 0.0092, "step": 675820 }, { "epoch": 1.75, "learning_rate": 3.722267296730528e-05, "loss": 0.0076, "step": 675830 }, { "epoch": 1.75, "learning_rate": 3.721878475093381e-05, "loss": 0.0076, "step": 675840 }, { "epoch": 1.75, "learning_rate": 3.7214896534562355e-05, "loss": 0.0105, "step": 675850 }, { "epoch": 1.75, "learning_rate": 3.721100831819089e-05, "loss": 0.0087, "step": 675860 }, { "epoch": 1.75, "learning_rate": 3.7207120101819425e-05, "loss": 0.008, "step": 675870 }, { "epoch": 1.75, "learning_rate": 3.720323188544796e-05, "loss": 0.0062, "step": 675880 }, { "epoch": 1.75, "learning_rate": 3.7199343669076494e-05, "loss": 0.007, "step": 675890 }, { "epoch": 1.75, "learning_rate": 3.719545545270503e-05, "loss": 0.0082, "step": 675900 }, { "epoch": 1.75, "learning_rate": 3.7191567236333564e-05, "loss": 0.0101, "step": 675910 }, { "epoch": 1.75, "learning_rate": 3.71876790199621e-05, "loss": 0.0072, "step": 675920 }, { "epoch": 1.75, "learning_rate": 3.7183790803590634e-05, "loss": 0.0068, "step": 675930 }, { "epoch": 1.75, "learning_rate": 3.717990258721917e-05, "loss": 0.0079, "step": 675940 }, { "epoch": 1.75, "learning_rate": 3.7176014370847704e-05, "loss": 0.0104, "step": 675950 }, { "epoch": 1.75, "learning_rate": 3.717212615447624e-05, "loss": 0.0084, "step": 675960 }, { "epoch": 1.75, "learning_rate": 3.716823793810477e-05, "loss": 0.0049, "step": 675970 }, { "epoch": 1.75, "learning_rate": 3.7164349721733315e-05, "loss": 0.0097, "step": 675980 }, { "epoch": 1.75, "learning_rate": 3.716046150536185e-05, "loss": 0.0078, "step": 675990 }, { "epoch": 1.75, "learning_rate": 3.7156573288990385e-05, "loss": 0.0102, "step": 676000 }, { "epoch": 1.75, "eval_cer": 0.8816662957628791, "eval_loss": 0.005067652557045221, "eval_runtime": 107.7059, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 676000 }, { "epoch": 1.75, "learning_rate": 3.715268507261892e-05, "loss": 0.0069, "step": 676010 }, { "epoch": 1.75, "learning_rate": 3.7148796856247454e-05, "loss": 0.0073, "step": 676020 }, { "epoch": 1.75, "learning_rate": 3.714490863987599e-05, "loss": 0.0096, "step": 676030 }, { "epoch": 1.75, "learning_rate": 3.7141020423504524e-05, "loss": 0.007, "step": 676040 }, { "epoch": 1.75, "learning_rate": 3.713713220713306e-05, "loss": 0.01, "step": 676050 }, { "epoch": 1.75, "learning_rate": 3.7133243990761594e-05, "loss": 0.0067, "step": 676060 }, { "epoch": 1.75, "learning_rate": 3.712935577439013e-05, "loss": 0.0067, "step": 676070 }, { "epoch": 1.75, "learning_rate": 3.7125467558018663e-05, "loss": 0.0054, "step": 676080 }, { "epoch": 1.75, "learning_rate": 3.71215793416472e-05, "loss": 0.0079, "step": 676090 }, { "epoch": 1.75, "learning_rate": 3.711769112527573e-05, "loss": 0.0074, "step": 676100 }, { "epoch": 1.75, "learning_rate": 3.7113802908904275e-05, "loss": 0.0075, "step": 676110 }, { "epoch": 1.75, "learning_rate": 3.710991469253281e-05, "loss": 0.0073, "step": 676120 }, { "epoch": 1.75, "learning_rate": 3.7106026476161345e-05, "loss": 0.0078, "step": 676130 }, { "epoch": 1.75, "learning_rate": 3.710213825978988e-05, "loss": 0.0089, "step": 676140 }, { "epoch": 1.75, "learning_rate": 3.7098250043418414e-05, "loss": 0.0081, "step": 676150 }, { "epoch": 1.75, "learning_rate": 3.709436182704695e-05, "loss": 0.0075, "step": 676160 }, { "epoch": 1.75, "learning_rate": 3.7090473610675484e-05, "loss": 0.0084, "step": 676170 }, { "epoch": 1.75, "learning_rate": 3.708658539430402e-05, "loss": 0.009, "step": 676180 }, { "epoch": 1.75, "learning_rate": 3.7082697177932554e-05, "loss": 0.0084, "step": 676190 }, { "epoch": 1.75, "learning_rate": 3.707880896156109e-05, "loss": 0.0096, "step": 676200 }, { "epoch": 1.75, "learning_rate": 3.7074920745189623e-05, "loss": 0.0131, "step": 676210 }, { "epoch": 1.75, "learning_rate": 3.707103252881816e-05, "loss": 0.0081, "step": 676220 }, { "epoch": 1.75, "learning_rate": 3.706714431244669e-05, "loss": 0.0091, "step": 676230 }, { "epoch": 1.75, "learning_rate": 3.7063256096075235e-05, "loss": 0.0108, "step": 676240 }, { "epoch": 1.75, "learning_rate": 3.705936787970377e-05, "loss": 0.0087, "step": 676250 }, { "epoch": 1.75, "learning_rate": 3.7055479663332305e-05, "loss": 0.0091, "step": 676260 }, { "epoch": 1.75, "learning_rate": 3.705159144696084e-05, "loss": 0.0066, "step": 676270 }, { "epoch": 1.75, "learning_rate": 3.704770323058937e-05, "loss": 0.0071, "step": 676280 }, { "epoch": 1.75, "learning_rate": 3.704381501421791e-05, "loss": 0.0064, "step": 676290 }, { "epoch": 1.75, "learning_rate": 3.7039926797846444e-05, "loss": 0.0076, "step": 676300 }, { "epoch": 1.75, "learning_rate": 3.703603858147498e-05, "loss": 0.0061, "step": 676310 }, { "epoch": 1.75, "learning_rate": 3.7032150365103514e-05, "loss": 0.0079, "step": 676320 }, { "epoch": 1.75, "learning_rate": 3.702826214873205e-05, "loss": 0.0077, "step": 676330 }, { "epoch": 1.75, "learning_rate": 3.7024373932360583e-05, "loss": 0.0065, "step": 676340 }, { "epoch": 1.75, "learning_rate": 3.702048571598912e-05, "loss": 0.0085, "step": 676350 }, { "epoch": 1.75, "learning_rate": 3.701659749961765e-05, "loss": 0.0064, "step": 676360 }, { "epoch": 1.75, "learning_rate": 3.7012709283246195e-05, "loss": 0.0072, "step": 676370 }, { "epoch": 1.75, "learning_rate": 3.700882106687473e-05, "loss": 0.0048, "step": 676380 }, { "epoch": 1.75, "learning_rate": 3.7004932850503265e-05, "loss": 0.006, "step": 676390 }, { "epoch": 1.75, "learning_rate": 3.70010446341318e-05, "loss": 0.0084, "step": 676400 }, { "epoch": 1.75, "learning_rate": 3.699715641776033e-05, "loss": 0.008, "step": 676410 }, { "epoch": 1.75, "learning_rate": 3.699326820138887e-05, "loss": 0.0072, "step": 676420 }, { "epoch": 1.75, "learning_rate": 3.6989379985017404e-05, "loss": 0.0118, "step": 676430 }, { "epoch": 1.75, "learning_rate": 3.698549176864594e-05, "loss": 0.0065, "step": 676440 }, { "epoch": 1.75, "learning_rate": 3.6981603552274474e-05, "loss": 0.0101, "step": 676450 }, { "epoch": 1.75, "learning_rate": 3.697771533590301e-05, "loss": 0.0059, "step": 676460 }, { "epoch": 1.75, "learning_rate": 3.6973827119531543e-05, "loss": 0.0065, "step": 676470 }, { "epoch": 1.75, "learning_rate": 3.696993890316008e-05, "loss": 0.01, "step": 676480 }, { "epoch": 1.75, "learning_rate": 3.696605068678861e-05, "loss": 0.0073, "step": 676490 }, { "epoch": 1.75, "learning_rate": 3.6962162470417155e-05, "loss": 0.0089, "step": 676500 }, { "epoch": 1.75, "learning_rate": 3.695827425404569e-05, "loss": 0.0086, "step": 676510 }, { "epoch": 1.75, "learning_rate": 3.6954386037674225e-05, "loss": 0.0078, "step": 676520 }, { "epoch": 1.75, "learning_rate": 3.695049782130275e-05, "loss": 0.0064, "step": 676530 }, { "epoch": 1.75, "learning_rate": 3.694660960493129e-05, "loss": 0.0097, "step": 676540 }, { "epoch": 1.75, "learning_rate": 3.694272138855983e-05, "loss": 0.0078, "step": 676550 }, { "epoch": 1.75, "learning_rate": 3.6938833172188364e-05, "loss": 0.0089, "step": 676560 }, { "epoch": 1.75, "learning_rate": 3.69349449558169e-05, "loss": 0.0081, "step": 676570 }, { "epoch": 1.75, "learning_rate": 3.6931056739445434e-05, "loss": 0.0102, "step": 676580 }, { "epoch": 1.75, "learning_rate": 3.692716852307397e-05, "loss": 0.0076, "step": 676590 }, { "epoch": 1.75, "learning_rate": 3.6923280306702503e-05, "loss": 0.0076, "step": 676600 }, { "epoch": 1.75, "learning_rate": 3.691939209033104e-05, "loss": 0.0055, "step": 676610 }, { "epoch": 1.75, "learning_rate": 3.691550387395957e-05, "loss": 0.006, "step": 676620 }, { "epoch": 1.75, "learning_rate": 3.6911615657588115e-05, "loss": 0.0091, "step": 676630 }, { "epoch": 1.75, "learning_rate": 3.690772744121665e-05, "loss": 0.0081, "step": 676640 }, { "epoch": 1.75, "learning_rate": 3.690383922484518e-05, "loss": 0.0075, "step": 676650 }, { "epoch": 1.75, "learning_rate": 3.689995100847371e-05, "loss": 0.0076, "step": 676660 }, { "epoch": 1.75, "learning_rate": 3.689606279210225e-05, "loss": 0.0071, "step": 676670 }, { "epoch": 1.75, "learning_rate": 3.689217457573079e-05, "loss": 0.0074, "step": 676680 }, { "epoch": 1.75, "learning_rate": 3.6888286359359324e-05, "loss": 0.0082, "step": 676690 }, { "epoch": 1.75, "learning_rate": 3.688439814298786e-05, "loss": 0.0064, "step": 676700 }, { "epoch": 1.75, "learning_rate": 3.6880509926616394e-05, "loss": 0.0078, "step": 676710 }, { "epoch": 1.75, "learning_rate": 3.687662171024493e-05, "loss": 0.0121, "step": 676720 }, { "epoch": 1.75, "learning_rate": 3.687273349387346e-05, "loss": 0.0101, "step": 676730 }, { "epoch": 1.75, "learning_rate": 3.6868845277502e-05, "loss": 0.0066, "step": 676740 }, { "epoch": 1.75, "learning_rate": 3.686495706113053e-05, "loss": 0.0086, "step": 676750 }, { "epoch": 1.75, "learning_rate": 3.6861068844759075e-05, "loss": 0.0075, "step": 676760 }, { "epoch": 1.75, "learning_rate": 3.685718062838761e-05, "loss": 0.0096, "step": 676770 }, { "epoch": 1.75, "learning_rate": 3.685329241201614e-05, "loss": 0.0083, "step": 676780 }, { "epoch": 1.75, "learning_rate": 3.684940419564467e-05, "loss": 0.0079, "step": 676790 }, { "epoch": 1.75, "learning_rate": 3.684551597927321e-05, "loss": 0.0069, "step": 676800 }, { "epoch": 1.75, "learning_rate": 3.684162776290175e-05, "loss": 0.0088, "step": 676810 }, { "epoch": 1.75, "learning_rate": 3.6837739546530284e-05, "loss": 0.0073, "step": 676820 }, { "epoch": 1.75, "learning_rate": 3.683385133015882e-05, "loss": 0.0079, "step": 676830 }, { "epoch": 1.75, "learning_rate": 3.6829963113787354e-05, "loss": 0.0069, "step": 676840 }, { "epoch": 1.75, "learning_rate": 3.682607489741589e-05, "loss": 0.0063, "step": 676850 }, { "epoch": 1.75, "learning_rate": 3.682218668104442e-05, "loss": 0.0056, "step": 676860 }, { "epoch": 1.75, "learning_rate": 3.681829846467296e-05, "loss": 0.0055, "step": 676870 }, { "epoch": 1.75, "learning_rate": 3.681441024830149e-05, "loss": 0.0054, "step": 676880 }, { "epoch": 1.75, "learning_rate": 3.6810522031930035e-05, "loss": 0.009, "step": 676890 }, { "epoch": 1.75, "learning_rate": 3.680663381555856e-05, "loss": 0.0063, "step": 676900 }, { "epoch": 1.75, "learning_rate": 3.68027455991871e-05, "loss": 0.0085, "step": 676910 }, { "epoch": 1.75, "learning_rate": 3.679885738281563e-05, "loss": 0.0077, "step": 676920 }, { "epoch": 1.75, "learning_rate": 3.679496916644417e-05, "loss": 0.0093, "step": 676930 }, { "epoch": 1.75, "learning_rate": 3.679108095007271e-05, "loss": 0.0063, "step": 676940 }, { "epoch": 1.75, "learning_rate": 3.6787192733701244e-05, "loss": 0.0072, "step": 676950 }, { "epoch": 1.75, "learning_rate": 3.678330451732978e-05, "loss": 0.0075, "step": 676960 }, { "epoch": 1.75, "learning_rate": 3.6779416300958314e-05, "loss": 0.0077, "step": 676970 }, { "epoch": 1.75, "learning_rate": 3.677552808458685e-05, "loss": 0.0093, "step": 676980 }, { "epoch": 1.75, "learning_rate": 3.677163986821538e-05, "loss": 0.0085, "step": 676990 }, { "epoch": 1.75, "learning_rate": 3.676775165184392e-05, "loss": 0.0086, "step": 677000 }, { "epoch": 1.75, "eval_cer": 0.8816690950367475, "eval_loss": 0.005042629782110453, "eval_runtime": 108.0533, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 677000 }, { "epoch": 1.75, "learning_rate": 3.676386343547245e-05, "loss": 0.0103, "step": 677010 }, { "epoch": 1.75, "learning_rate": 3.6759975219100995e-05, "loss": 0.0082, "step": 677020 }, { "epoch": 1.75, "learning_rate": 3.675608700272952e-05, "loss": 0.0064, "step": 677030 }, { "epoch": 1.75, "learning_rate": 3.675219878635806e-05, "loss": 0.0082, "step": 677040 }, { "epoch": 1.76, "learning_rate": 3.674831056998659e-05, "loss": 0.0071, "step": 677050 }, { "epoch": 1.76, "learning_rate": 3.674442235361513e-05, "loss": 0.0061, "step": 677060 }, { "epoch": 1.76, "learning_rate": 3.674053413724367e-05, "loss": 0.0075, "step": 677070 }, { "epoch": 1.76, "learning_rate": 3.6736645920872204e-05, "loss": 0.0084, "step": 677080 }, { "epoch": 1.76, "learning_rate": 3.673275770450074e-05, "loss": 0.0072, "step": 677090 }, { "epoch": 1.76, "learning_rate": 3.6728869488129274e-05, "loss": 0.009, "step": 677100 }, { "epoch": 1.76, "learning_rate": 3.672498127175781e-05, "loss": 0.0065, "step": 677110 }, { "epoch": 1.76, "learning_rate": 3.672109305538634e-05, "loss": 0.008, "step": 677120 }, { "epoch": 1.76, "learning_rate": 3.671720483901488e-05, "loss": 0.0082, "step": 677130 }, { "epoch": 1.76, "learning_rate": 3.671331662264341e-05, "loss": 0.0072, "step": 677140 }, { "epoch": 1.76, "learning_rate": 3.670942840627195e-05, "loss": 0.0069, "step": 677150 }, { "epoch": 1.76, "learning_rate": 3.670554018990048e-05, "loss": 0.0072, "step": 677160 }, { "epoch": 1.76, "learning_rate": 3.670165197352902e-05, "loss": 0.0058, "step": 677170 }, { "epoch": 1.76, "learning_rate": 3.669776375715755e-05, "loss": 0.0076, "step": 677180 }, { "epoch": 1.76, "learning_rate": 3.669387554078609e-05, "loss": 0.0101, "step": 677190 }, { "epoch": 1.76, "learning_rate": 3.668998732441462e-05, "loss": 0.0072, "step": 677200 }, { "epoch": 1.76, "learning_rate": 3.6686099108043164e-05, "loss": 0.017, "step": 677210 }, { "epoch": 1.76, "learning_rate": 3.66822108916717e-05, "loss": 0.009, "step": 677220 }, { "epoch": 1.76, "learning_rate": 3.6678322675300234e-05, "loss": 0.0084, "step": 677230 }, { "epoch": 1.76, "learning_rate": 3.667443445892877e-05, "loss": 0.0074, "step": 677240 }, { "epoch": 1.76, "learning_rate": 3.66705462425573e-05, "loss": 0.0069, "step": 677250 }, { "epoch": 1.76, "learning_rate": 3.666665802618584e-05, "loss": 0.0073, "step": 677260 }, { "epoch": 1.76, "learning_rate": 3.666276980981437e-05, "loss": 0.0153, "step": 677270 }, { "epoch": 1.76, "learning_rate": 3.665888159344291e-05, "loss": 0.0058, "step": 677280 }, { "epoch": 1.76, "learning_rate": 3.665499337707144e-05, "loss": 0.0062, "step": 677290 }, { "epoch": 1.76, "learning_rate": 3.665110516069998e-05, "loss": 0.0086, "step": 677300 }, { "epoch": 1.76, "learning_rate": 3.664721694432851e-05, "loss": 0.0075, "step": 677310 }, { "epoch": 1.76, "learning_rate": 3.664332872795705e-05, "loss": 0.0067, "step": 677320 }, { "epoch": 1.76, "learning_rate": 3.663944051158558e-05, "loss": 0.0103, "step": 677330 }, { "epoch": 1.76, "learning_rate": 3.6635552295214124e-05, "loss": 0.0092, "step": 677340 }, { "epoch": 1.76, "learning_rate": 3.663166407884266e-05, "loss": 0.0079, "step": 677350 }, { "epoch": 1.76, "learning_rate": 3.6627775862471194e-05, "loss": 0.0063, "step": 677360 }, { "epoch": 1.76, "learning_rate": 3.662388764609973e-05, "loss": 0.0073, "step": 677370 }, { "epoch": 1.76, "learning_rate": 3.661999942972826e-05, "loss": 0.0071, "step": 677380 }, { "epoch": 1.76, "learning_rate": 3.66161112133568e-05, "loss": 0.0077, "step": 677390 }, { "epoch": 1.76, "learning_rate": 3.661222299698533e-05, "loss": 0.0066, "step": 677400 }, { "epoch": 1.76, "learning_rate": 3.660833478061387e-05, "loss": 0.0069, "step": 677410 }, { "epoch": 1.76, "learning_rate": 3.66044465642424e-05, "loss": 0.0091, "step": 677420 }, { "epoch": 1.76, "learning_rate": 3.660055834787094e-05, "loss": 0.0079, "step": 677430 }, { "epoch": 1.76, "learning_rate": 3.659667013149947e-05, "loss": 0.0078, "step": 677440 }, { "epoch": 1.76, "learning_rate": 3.659278191512801e-05, "loss": 0.006, "step": 677450 }, { "epoch": 1.76, "learning_rate": 3.658889369875654e-05, "loss": 0.0074, "step": 677460 }, { "epoch": 1.76, "learning_rate": 3.6585005482385084e-05, "loss": 0.0096, "step": 677470 }, { "epoch": 1.76, "learning_rate": 3.658111726601362e-05, "loss": 0.0073, "step": 677480 }, { "epoch": 1.76, "learning_rate": 3.6577229049642154e-05, "loss": 0.0068, "step": 677490 }, { "epoch": 1.76, "learning_rate": 3.657334083327069e-05, "loss": 0.0066, "step": 677500 }, { "epoch": 1.76, "learning_rate": 3.656945261689922e-05, "loss": 0.0079, "step": 677510 }, { "epoch": 1.76, "learning_rate": 3.656556440052776e-05, "loss": 0.0079, "step": 677520 }, { "epoch": 1.76, "learning_rate": 3.656167618415629e-05, "loss": 0.0072, "step": 677530 }, { "epoch": 1.76, "learning_rate": 3.655778796778483e-05, "loss": 0.0074, "step": 677540 }, { "epoch": 1.76, "learning_rate": 3.655389975141336e-05, "loss": 0.0058, "step": 677550 }, { "epoch": 1.76, "learning_rate": 3.65500115350419e-05, "loss": 0.0076, "step": 677560 }, { "epoch": 1.76, "learning_rate": 3.654612331867043e-05, "loss": 0.0097, "step": 677570 }, { "epoch": 1.76, "learning_rate": 3.654223510229897e-05, "loss": 0.008, "step": 677580 }, { "epoch": 1.76, "learning_rate": 3.65383468859275e-05, "loss": 0.0047, "step": 677590 }, { "epoch": 1.76, "learning_rate": 3.6534458669556044e-05, "loss": 0.0085, "step": 677600 }, { "epoch": 1.76, "learning_rate": 3.653057045318458e-05, "loss": 0.0067, "step": 677610 }, { "epoch": 1.76, "learning_rate": 3.6526682236813113e-05, "loss": 0.0073, "step": 677620 }, { "epoch": 1.76, "learning_rate": 3.652279402044165e-05, "loss": 0.007, "step": 677630 }, { "epoch": 1.76, "learning_rate": 3.651890580407018e-05, "loss": 0.0088, "step": 677640 }, { "epoch": 1.76, "learning_rate": 3.651501758769872e-05, "loss": 0.0062, "step": 677650 }, { "epoch": 1.76, "learning_rate": 3.651112937132725e-05, "loss": 0.0112, "step": 677660 }, { "epoch": 1.76, "learning_rate": 3.650724115495579e-05, "loss": 0.0082, "step": 677670 }, { "epoch": 1.76, "learning_rate": 3.650335293858432e-05, "loss": 0.0075, "step": 677680 }, { "epoch": 1.76, "learning_rate": 3.649946472221286e-05, "loss": 0.0089, "step": 677690 }, { "epoch": 1.76, "learning_rate": 3.649557650584139e-05, "loss": 0.0073, "step": 677700 }, { "epoch": 1.76, "learning_rate": 3.649168828946993e-05, "loss": 0.0074, "step": 677710 }, { "epoch": 1.76, "learning_rate": 3.648780007309846e-05, "loss": 0.0053, "step": 677720 }, { "epoch": 1.76, "learning_rate": 3.6483911856727004e-05, "loss": 0.0083, "step": 677730 }, { "epoch": 1.76, "learning_rate": 3.648002364035554e-05, "loss": 0.0083, "step": 677740 }, { "epoch": 1.76, "learning_rate": 3.6476135423984073e-05, "loss": 0.0082, "step": 677750 }, { "epoch": 1.76, "learning_rate": 3.647224720761261e-05, "loss": 0.0067, "step": 677760 }, { "epoch": 1.76, "learning_rate": 3.6468358991241136e-05, "loss": 0.0064, "step": 677770 }, { "epoch": 1.76, "learning_rate": 3.646447077486968e-05, "loss": 0.0085, "step": 677780 }, { "epoch": 1.76, "learning_rate": 3.646058255849821e-05, "loss": 0.0056, "step": 677790 }, { "epoch": 1.76, "learning_rate": 3.645669434212675e-05, "loss": 0.009, "step": 677800 }, { "epoch": 1.76, "learning_rate": 3.645280612575528e-05, "loss": 0.0073, "step": 677810 }, { "epoch": 1.76, "learning_rate": 3.644891790938382e-05, "loss": 0.0081, "step": 677820 }, { "epoch": 1.76, "learning_rate": 3.644502969301235e-05, "loss": 0.0078, "step": 677830 }, { "epoch": 1.76, "learning_rate": 3.644114147664089e-05, "loss": 0.0095, "step": 677840 }, { "epoch": 1.76, "learning_rate": 3.643725326026942e-05, "loss": 0.0093, "step": 677850 }, { "epoch": 1.76, "learning_rate": 3.6433365043897964e-05, "loss": 0.007, "step": 677860 }, { "epoch": 1.76, "learning_rate": 3.64294768275265e-05, "loss": 0.0087, "step": 677870 }, { "epoch": 1.76, "learning_rate": 3.6425588611155033e-05, "loss": 0.0128, "step": 677880 }, { "epoch": 1.76, "learning_rate": 3.642170039478356e-05, "loss": 0.0058, "step": 677890 }, { "epoch": 1.76, "learning_rate": 3.6417812178412096e-05, "loss": 0.0078, "step": 677900 }, { "epoch": 1.76, "learning_rate": 3.641392396204064e-05, "loss": 0.0058, "step": 677910 }, { "epoch": 1.76, "learning_rate": 3.641003574566917e-05, "loss": 0.0081, "step": 677920 }, { "epoch": 1.76, "learning_rate": 3.640614752929771e-05, "loss": 0.0062, "step": 677930 }, { "epoch": 1.76, "learning_rate": 3.640225931292624e-05, "loss": 0.0081, "step": 677940 }, { "epoch": 1.76, "learning_rate": 3.639837109655478e-05, "loss": 0.0063, "step": 677950 }, { "epoch": 1.76, "learning_rate": 3.639448288018331e-05, "loss": 0.0094, "step": 677960 }, { "epoch": 1.76, "learning_rate": 3.639059466381185e-05, "loss": 0.0067, "step": 677970 }, { "epoch": 1.76, "learning_rate": 3.638670644744038e-05, "loss": 0.0051, "step": 677980 }, { "epoch": 1.76, "learning_rate": 3.6382818231068924e-05, "loss": 0.0096, "step": 677990 }, { "epoch": 1.76, "learning_rate": 3.637893001469746e-05, "loss": 0.0085, "step": 678000 }, { "epoch": 1.76, "eval_cer": 0.8817012866862336, "eval_loss": 0.0050600310787558556, "eval_runtime": 107.7885, "eval_samples_per_second": 18.555, "eval_steps_per_second": 4.639, "step": 678000 }, { "epoch": 1.76, "learning_rate": 3.6375041798325993e-05, "loss": 0.0085, "step": 678010 }, { "epoch": 1.76, "learning_rate": 3.637115358195452e-05, "loss": 0.0086, "step": 678020 }, { "epoch": 1.76, "learning_rate": 3.6367265365583056e-05, "loss": 0.0069, "step": 678030 }, { "epoch": 1.76, "learning_rate": 3.63633771492116e-05, "loss": 0.0071, "step": 678040 }, { "epoch": 1.76, "learning_rate": 3.635948893284013e-05, "loss": 0.0077, "step": 678050 }, { "epoch": 1.76, "learning_rate": 3.635560071646867e-05, "loss": 0.0053, "step": 678060 }, { "epoch": 1.76, "learning_rate": 3.63517125000972e-05, "loss": 0.0091, "step": 678070 }, { "epoch": 1.76, "learning_rate": 3.634782428372574e-05, "loss": 0.0075, "step": 678080 }, { "epoch": 1.76, "learning_rate": 3.634393606735427e-05, "loss": 0.008, "step": 678090 }, { "epoch": 1.76, "learning_rate": 3.634004785098281e-05, "loss": 0.0065, "step": 678100 }, { "epoch": 1.76, "learning_rate": 3.633615963461134e-05, "loss": 0.007, "step": 678110 }, { "epoch": 1.76, "learning_rate": 3.6332271418239884e-05, "loss": 0.0081, "step": 678120 }, { "epoch": 1.76, "learning_rate": 3.632838320186842e-05, "loss": 0.0081, "step": 678130 }, { "epoch": 1.76, "learning_rate": 3.632449498549695e-05, "loss": 0.0078, "step": 678140 }, { "epoch": 1.76, "learning_rate": 3.632060676912548e-05, "loss": 0.0081, "step": 678150 }, { "epoch": 1.76, "learning_rate": 3.6316718552754016e-05, "loss": 0.0092, "step": 678160 }, { "epoch": 1.76, "learning_rate": 3.631283033638256e-05, "loss": 0.0078, "step": 678170 }, { "epoch": 1.76, "learning_rate": 3.630894212001109e-05, "loss": 0.0096, "step": 678180 }, { "epoch": 1.76, "learning_rate": 3.630505390363963e-05, "loss": 0.0087, "step": 678190 }, { "epoch": 1.76, "learning_rate": 3.630116568726816e-05, "loss": 0.0105, "step": 678200 }, { "epoch": 1.76, "learning_rate": 3.62972774708967e-05, "loss": 0.015, "step": 678210 }, { "epoch": 1.76, "learning_rate": 3.629338925452523e-05, "loss": 0.009, "step": 678220 }, { "epoch": 1.76, "learning_rate": 3.628950103815377e-05, "loss": 0.0074, "step": 678230 }, { "epoch": 1.76, "learning_rate": 3.62856128217823e-05, "loss": 0.0084, "step": 678240 }, { "epoch": 1.76, "learning_rate": 3.6281724605410844e-05, "loss": 0.0078, "step": 678250 }, { "epoch": 1.76, "learning_rate": 3.627783638903938e-05, "loss": 0.008, "step": 678260 }, { "epoch": 1.76, "learning_rate": 3.6273948172667907e-05, "loss": 0.0074, "step": 678270 }, { "epoch": 1.76, "learning_rate": 3.627005995629644e-05, "loss": 0.0056, "step": 678280 }, { "epoch": 1.76, "learning_rate": 3.6266171739924976e-05, "loss": 0.0106, "step": 678290 }, { "epoch": 1.76, "learning_rate": 3.626228352355352e-05, "loss": 0.0073, "step": 678300 }, { "epoch": 1.76, "learning_rate": 3.625839530718205e-05, "loss": 0.0077, "step": 678310 }, { "epoch": 1.76, "learning_rate": 3.625450709081059e-05, "loss": 0.0094, "step": 678320 }, { "epoch": 1.76, "learning_rate": 3.625061887443912e-05, "loss": 0.0081, "step": 678330 }, { "epoch": 1.76, "learning_rate": 3.624673065806766e-05, "loss": 0.0061, "step": 678340 }, { "epoch": 1.76, "learning_rate": 3.624284244169619e-05, "loss": 0.0073, "step": 678350 }, { "epoch": 1.76, "learning_rate": 3.623895422532473e-05, "loss": 0.0069, "step": 678360 }, { "epoch": 1.76, "learning_rate": 3.623506600895326e-05, "loss": 0.0075, "step": 678370 }, { "epoch": 1.76, "learning_rate": 3.6231177792581804e-05, "loss": 0.0077, "step": 678380 }, { "epoch": 1.76, "learning_rate": 3.622728957621033e-05, "loss": 0.0128, "step": 678390 }, { "epoch": 1.76, "learning_rate": 3.6223401359838867e-05, "loss": 0.0071, "step": 678400 }, { "epoch": 1.76, "learning_rate": 3.62195131434674e-05, "loss": 0.0054, "step": 678410 }, { "epoch": 1.76, "learning_rate": 3.6215624927095936e-05, "loss": 0.0086, "step": 678420 }, { "epoch": 1.76, "learning_rate": 3.621173671072448e-05, "loss": 0.0057, "step": 678430 }, { "epoch": 1.76, "learning_rate": 3.620784849435301e-05, "loss": 0.011, "step": 678440 }, { "epoch": 1.76, "learning_rate": 3.620396027798155e-05, "loss": 0.0076, "step": 678450 }, { "epoch": 1.76, "learning_rate": 3.620007206161008e-05, "loss": 0.007, "step": 678460 }, { "epoch": 1.76, "learning_rate": 3.619618384523862e-05, "loss": 0.0151, "step": 678470 }, { "epoch": 1.76, "learning_rate": 3.619229562886715e-05, "loss": 0.0063, "step": 678480 }, { "epoch": 1.76, "learning_rate": 3.618840741249569e-05, "loss": 0.0087, "step": 678490 }, { "epoch": 1.76, "learning_rate": 3.618451919612422e-05, "loss": 0.0057, "step": 678500 }, { "epoch": 1.76, "learning_rate": 3.618063097975276e-05, "loss": 0.0078, "step": 678510 }, { "epoch": 1.76, "learning_rate": 3.617674276338129e-05, "loss": 0.0082, "step": 678520 }, { "epoch": 1.76, "learning_rate": 3.6172854547009827e-05, "loss": 0.0071, "step": 678530 }, { "epoch": 1.76, "learning_rate": 3.616896633063836e-05, "loss": 0.009, "step": 678540 }, { "epoch": 1.76, "learning_rate": 3.6165078114266896e-05, "loss": 0.007, "step": 678550 }, { "epoch": 1.76, "learning_rate": 3.616118989789544e-05, "loss": 0.0086, "step": 678560 }, { "epoch": 1.76, "learning_rate": 3.615730168152397e-05, "loss": 0.0061, "step": 678570 }, { "epoch": 1.76, "learning_rate": 3.615341346515251e-05, "loss": 0.009, "step": 678580 }, { "epoch": 1.76, "learning_rate": 3.614952524878104e-05, "loss": 0.0085, "step": 678590 }, { "epoch": 1.76, "learning_rate": 3.614563703240958e-05, "loss": 0.0092, "step": 678600 }, { "epoch": 1.76, "learning_rate": 3.614174881603811e-05, "loss": 0.0062, "step": 678610 }, { "epoch": 1.76, "learning_rate": 3.613786059966665e-05, "loss": 0.0058, "step": 678620 }, { "epoch": 1.76, "learning_rate": 3.613397238329518e-05, "loss": 0.0101, "step": 678630 }, { "epoch": 1.76, "learning_rate": 3.613008416692372e-05, "loss": 0.0059, "step": 678640 }, { "epoch": 1.76, "learning_rate": 3.612619595055225e-05, "loss": 0.0067, "step": 678650 }, { "epoch": 1.76, "learning_rate": 3.6122307734180787e-05, "loss": 0.0103, "step": 678660 }, { "epoch": 1.76, "learning_rate": 3.611841951780932e-05, "loss": 0.0072, "step": 678670 }, { "epoch": 1.76, "learning_rate": 3.6114531301437856e-05, "loss": 0.0063, "step": 678680 }, { "epoch": 1.76, "learning_rate": 3.611064308506639e-05, "loss": 0.0071, "step": 678690 }, { "epoch": 1.76, "learning_rate": 3.610675486869493e-05, "loss": 0.0113, "step": 678700 }, { "epoch": 1.76, "learning_rate": 3.610286665232347e-05, "loss": 0.0056, "step": 678710 }, { "epoch": 1.76, "learning_rate": 3.6098978435952e-05, "loss": 0.0085, "step": 678720 }, { "epoch": 1.76, "learning_rate": 3.609509021958054e-05, "loss": 0.0088, "step": 678730 }, { "epoch": 1.76, "learning_rate": 3.609120200320907e-05, "loss": 0.0051, "step": 678740 }, { "epoch": 1.76, "learning_rate": 3.608731378683761e-05, "loss": 0.0101, "step": 678750 }, { "epoch": 1.76, "learning_rate": 3.608342557046614e-05, "loss": 0.0083, "step": 678760 }, { "epoch": 1.76, "learning_rate": 3.607953735409468e-05, "loss": 0.0064, "step": 678770 }, { "epoch": 1.76, "learning_rate": 3.607564913772321e-05, "loss": 0.0075, "step": 678780 }, { "epoch": 1.76, "learning_rate": 3.6071760921351746e-05, "loss": 0.0069, "step": 678790 }, { "epoch": 1.76, "learning_rate": 3.606787270498028e-05, "loss": 0.0072, "step": 678800 }, { "epoch": 1.76, "learning_rate": 3.6063984488608816e-05, "loss": 0.0065, "step": 678810 }, { "epoch": 1.76, "learning_rate": 3.606009627223735e-05, "loss": 0.0086, "step": 678820 }, { "epoch": 1.76, "learning_rate": 3.605620805586589e-05, "loss": 0.0055, "step": 678830 }, { "epoch": 1.76, "learning_rate": 3.605231983949443e-05, "loss": 0.008, "step": 678840 }, { "epoch": 1.76, "learning_rate": 3.604843162312296e-05, "loss": 0.0095, "step": 678850 }, { "epoch": 1.76, "learning_rate": 3.60445434067515e-05, "loss": 0.0061, "step": 678860 }, { "epoch": 1.76, "learning_rate": 3.604065519038003e-05, "loss": 0.0077, "step": 678870 }, { "epoch": 1.76, "learning_rate": 3.603676697400857e-05, "loss": 0.0067, "step": 678880 }, { "epoch": 1.76, "learning_rate": 3.60328787576371e-05, "loss": 0.0059, "step": 678890 }, { "epoch": 1.76, "learning_rate": 3.602899054126564e-05, "loss": 0.0097, "step": 678900 }, { "epoch": 1.76, "learning_rate": 3.602510232489417e-05, "loss": 0.0074, "step": 678910 }, { "epoch": 1.76, "learning_rate": 3.6021214108522706e-05, "loss": 0.0075, "step": 678920 }, { "epoch": 1.76, "learning_rate": 3.601732589215124e-05, "loss": 0.0069, "step": 678930 }, { "epoch": 1.76, "learning_rate": 3.6013437675779776e-05, "loss": 0.0071, "step": 678940 }, { "epoch": 1.76, "learning_rate": 3.600954945940831e-05, "loss": 0.0083, "step": 678950 }, { "epoch": 1.76, "learning_rate": 3.600566124303685e-05, "loss": 0.0065, "step": 678960 }, { "epoch": 1.76, "learning_rate": 3.600177302666539e-05, "loss": 0.008, "step": 678970 }, { "epoch": 1.76, "learning_rate": 3.599788481029392e-05, "loss": 0.0056, "step": 678980 }, { "epoch": 1.76, "learning_rate": 3.599399659392246e-05, "loss": 0.0069, "step": 678990 }, { "epoch": 1.76, "learning_rate": 3.599010837755099e-05, "loss": 0.0079, "step": 679000 }, { "epoch": 1.76, "eval_cer": 0.8816592975782083, "eval_loss": 0.00512329675257206, "eval_runtime": 108.0539, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 679000 }, { "epoch": 1.76, "learning_rate": 3.598622016117953e-05, "loss": 0.0068, "step": 679010 }, { "epoch": 1.76, "learning_rate": 3.598233194480806e-05, "loss": 0.0103, "step": 679020 }, { "epoch": 1.76, "learning_rate": 3.59784437284366e-05, "loss": 0.0082, "step": 679030 }, { "epoch": 1.76, "learning_rate": 3.597455551206513e-05, "loss": 0.0083, "step": 679040 }, { "epoch": 1.76, "learning_rate": 3.5970667295693666e-05, "loss": 0.0123, "step": 679050 }, { "epoch": 1.76, "learning_rate": 3.59667790793222e-05, "loss": 0.0088, "step": 679060 }, { "epoch": 1.76, "learning_rate": 3.5962890862950736e-05, "loss": 0.0074, "step": 679070 }, { "epoch": 1.76, "learning_rate": 3.595900264657927e-05, "loss": 0.0068, "step": 679080 }, { "epoch": 1.76, "learning_rate": 3.595511443020781e-05, "loss": 0.0083, "step": 679090 }, { "epoch": 1.76, "learning_rate": 3.595122621383635e-05, "loss": 0.0058, "step": 679100 }, { "epoch": 1.76, "learning_rate": 3.594733799746488e-05, "loss": 0.0071, "step": 679110 }, { "epoch": 1.76, "learning_rate": 3.594344978109342e-05, "loss": 0.0099, "step": 679120 }, { "epoch": 1.76, "learning_rate": 3.5939561564721945e-05, "loss": 0.0072, "step": 679130 }, { "epoch": 1.76, "learning_rate": 3.593567334835049e-05, "loss": 0.0107, "step": 679140 }, { "epoch": 1.76, "learning_rate": 3.593178513197902e-05, "loss": 0.0064, "step": 679150 }, { "epoch": 1.76, "learning_rate": 3.592789691560756e-05, "loss": 0.0069, "step": 679160 }, { "epoch": 1.76, "learning_rate": 3.592400869923609e-05, "loss": 0.0094, "step": 679170 }, { "epoch": 1.76, "learning_rate": 3.5920120482864626e-05, "loss": 0.0081, "step": 679180 }, { "epoch": 1.76, "learning_rate": 3.591623226649316e-05, "loss": 0.0074, "step": 679190 }, { "epoch": 1.76, "learning_rate": 3.5912344050121696e-05, "loss": 0.01, "step": 679200 }, { "epoch": 1.76, "learning_rate": 3.590845583375023e-05, "loss": 0.0091, "step": 679210 }, { "epoch": 1.76, "learning_rate": 3.590456761737877e-05, "loss": 0.0109, "step": 679220 }, { "epoch": 1.76, "learning_rate": 3.590067940100731e-05, "loss": 0.0082, "step": 679230 }, { "epoch": 1.76, "learning_rate": 3.589679118463584e-05, "loss": 0.0077, "step": 679240 }, { "epoch": 1.76, "learning_rate": 3.589290296826438e-05, "loss": 0.0099, "step": 679250 }, { "epoch": 1.76, "learning_rate": 3.5889014751892905e-05, "loss": 0.0106, "step": 679260 }, { "epoch": 1.76, "learning_rate": 3.588512653552145e-05, "loss": 0.0067, "step": 679270 }, { "epoch": 1.76, "learning_rate": 3.588123831914998e-05, "loss": 0.008, "step": 679280 }, { "epoch": 1.76, "learning_rate": 3.587735010277852e-05, "loss": 0.0099, "step": 679290 }, { "epoch": 1.76, "learning_rate": 3.587346188640705e-05, "loss": 0.007, "step": 679300 }, { "epoch": 1.76, "learning_rate": 3.5869573670035586e-05, "loss": 0.0088, "step": 679310 }, { "epoch": 1.76, "learning_rate": 3.586568545366412e-05, "loss": 0.0057, "step": 679320 }, { "epoch": 1.76, "learning_rate": 3.5861797237292656e-05, "loss": 0.0073, "step": 679330 }, { "epoch": 1.76, "learning_rate": 3.585790902092119e-05, "loss": 0.0075, "step": 679340 }, { "epoch": 1.76, "learning_rate": 3.585402080454973e-05, "loss": 0.0078, "step": 679350 }, { "epoch": 1.76, "learning_rate": 3.585013258817827e-05, "loss": 0.0058, "step": 679360 }, { "epoch": 1.76, "learning_rate": 3.58462443718068e-05, "loss": 0.0073, "step": 679370 }, { "epoch": 1.76, "learning_rate": 3.584235615543533e-05, "loss": 0.0093, "step": 679380 }, { "epoch": 1.76, "learning_rate": 3.5838467939063865e-05, "loss": 0.0095, "step": 679390 }, { "epoch": 1.76, "learning_rate": 3.583457972269241e-05, "loss": 0.0112, "step": 679400 }, { "epoch": 1.76, "learning_rate": 3.583069150632094e-05, "loss": 0.0135, "step": 679410 }, { "epoch": 1.76, "learning_rate": 3.582680328994948e-05, "loss": 0.0098, "step": 679420 }, { "epoch": 1.76, "learning_rate": 3.582291507357801e-05, "loss": 0.0088, "step": 679430 }, { "epoch": 1.76, "learning_rate": 3.5819026857206546e-05, "loss": 0.008, "step": 679440 }, { "epoch": 1.76, "learning_rate": 3.581513864083508e-05, "loss": 0.0068, "step": 679450 }, { "epoch": 1.76, "learning_rate": 3.5811250424463616e-05, "loss": 0.0077, "step": 679460 }, { "epoch": 1.76, "learning_rate": 3.580736220809215e-05, "loss": 0.009, "step": 679470 }, { "epoch": 1.76, "learning_rate": 3.580347399172069e-05, "loss": 0.0073, "step": 679480 }, { "epoch": 1.76, "learning_rate": 3.579958577534923e-05, "loss": 0.0076, "step": 679490 }, { "epoch": 1.76, "learning_rate": 3.579569755897776e-05, "loss": 0.0088, "step": 679500 }, { "epoch": 1.76, "learning_rate": 3.579180934260629e-05, "loss": 0.012, "step": 679510 }, { "epoch": 1.76, "learning_rate": 3.5787921126234825e-05, "loss": 0.0068, "step": 679520 }, { "epoch": 1.76, "learning_rate": 3.578403290986337e-05, "loss": 0.0077, "step": 679530 }, { "epoch": 1.76, "learning_rate": 3.57801446934919e-05, "loss": 0.0047, "step": 679540 }, { "epoch": 1.76, "learning_rate": 3.577625647712044e-05, "loss": 0.0062, "step": 679550 }, { "epoch": 1.76, "learning_rate": 3.577236826074897e-05, "loss": 0.0074, "step": 679560 }, { "epoch": 1.76, "learning_rate": 3.5768480044377506e-05, "loss": 0.0087, "step": 679570 }, { "epoch": 1.76, "learning_rate": 3.576459182800604e-05, "loss": 0.0083, "step": 679580 }, { "epoch": 1.76, "learning_rate": 3.5760703611634576e-05, "loss": 0.0082, "step": 679590 }, { "epoch": 1.76, "learning_rate": 3.575681539526311e-05, "loss": 0.0101, "step": 679600 }, { "epoch": 1.76, "learning_rate": 3.575292717889165e-05, "loss": 0.0088, "step": 679610 }, { "epoch": 1.76, "learning_rate": 3.574903896252019e-05, "loss": 0.0091, "step": 679620 }, { "epoch": 1.76, "learning_rate": 3.5745150746148716e-05, "loss": 0.0091, "step": 679630 }, { "epoch": 1.76, "learning_rate": 3.574126252977725e-05, "loss": 0.009, "step": 679640 }, { "epoch": 1.76, "learning_rate": 3.5737374313405785e-05, "loss": 0.0098, "step": 679650 }, { "epoch": 1.76, "learning_rate": 3.573348609703433e-05, "loss": 0.0065, "step": 679660 }, { "epoch": 1.76, "learning_rate": 3.572959788066286e-05, "loss": 0.0115, "step": 679670 }, { "epoch": 1.76, "learning_rate": 3.5725709664291397e-05, "loss": 0.0108, "step": 679680 }, { "epoch": 1.76, "learning_rate": 3.572182144791993e-05, "loss": 0.008, "step": 679690 }, { "epoch": 1.76, "learning_rate": 3.5717933231548466e-05, "loss": 0.0111, "step": 679700 }, { "epoch": 1.76, "learning_rate": 3.5714045015177e-05, "loss": 0.0081, "step": 679710 }, { "epoch": 1.76, "learning_rate": 3.5710156798805536e-05, "loss": 0.0104, "step": 679720 }, { "epoch": 1.76, "learning_rate": 3.570626858243407e-05, "loss": 0.0064, "step": 679730 }, { "epoch": 1.76, "learning_rate": 3.570238036606261e-05, "loss": 0.0073, "step": 679740 }, { "epoch": 1.76, "learning_rate": 3.569849214969115e-05, "loss": 0.0069, "step": 679750 }, { "epoch": 1.76, "learning_rate": 3.5694603933319675e-05, "loss": 0.0078, "step": 679760 }, { "epoch": 1.76, "learning_rate": 3.569071571694821e-05, "loss": 0.0067, "step": 679770 }, { "epoch": 1.76, "learning_rate": 3.5686827500576745e-05, "loss": 0.0057, "step": 679780 }, { "epoch": 1.76, "learning_rate": 3.568293928420529e-05, "loss": 0.011, "step": 679790 }, { "epoch": 1.76, "learning_rate": 3.567905106783382e-05, "loss": 0.0083, "step": 679800 }, { "epoch": 1.76, "learning_rate": 3.5675162851462357e-05, "loss": 0.0084, "step": 679810 }, { "epoch": 1.76, "learning_rate": 3.567127463509089e-05, "loss": 0.0063, "step": 679820 }, { "epoch": 1.76, "learning_rate": 3.5667386418719426e-05, "loss": 0.0089, "step": 679830 }, { "epoch": 1.76, "learning_rate": 3.566349820234796e-05, "loss": 0.0079, "step": 679840 }, { "epoch": 1.76, "learning_rate": 3.5659609985976496e-05, "loss": 0.0077, "step": 679850 }, { "epoch": 1.76, "learning_rate": 3.565572176960503e-05, "loss": 0.0068, "step": 679860 }, { "epoch": 1.76, "learning_rate": 3.565183355323357e-05, "loss": 0.0089, "step": 679870 }, { "epoch": 1.76, "learning_rate": 3.56479453368621e-05, "loss": 0.0122, "step": 679880 }, { "epoch": 1.76, "learning_rate": 3.5644057120490635e-05, "loss": 0.006, "step": 679890 }, { "epoch": 1.76, "learning_rate": 3.564016890411917e-05, "loss": 0.0073, "step": 679900 }, { "epoch": 1.76, "learning_rate": 3.5636280687747705e-05, "loss": 0.0082, "step": 679910 }, { "epoch": 1.76, "learning_rate": 3.563239247137625e-05, "loss": 0.008, "step": 679920 }, { "epoch": 1.76, "learning_rate": 3.562850425500478e-05, "loss": 0.0097, "step": 679930 }, { "epoch": 1.76, "learning_rate": 3.5624616038633317e-05, "loss": 0.0061, "step": 679940 }, { "epoch": 1.76, "learning_rate": 3.562072782226185e-05, "loss": 0.0077, "step": 679950 }, { "epoch": 1.76, "learning_rate": 3.5616839605890386e-05, "loss": 0.0089, "step": 679960 }, { "epoch": 1.76, "learning_rate": 3.561295138951892e-05, "loss": 0.0087, "step": 679970 }, { "epoch": 1.76, "learning_rate": 3.5609063173147456e-05, "loss": 0.0092, "step": 679980 }, { "epoch": 1.76, "learning_rate": 3.560517495677599e-05, "loss": 0.0096, "step": 679990 }, { "epoch": 1.76, "learning_rate": 3.5601286740404526e-05, "loss": 0.006, "step": 680000 }, { "epoch": 1.76, "eval_cer": 0.8816858906799576, "eval_loss": 0.005062996409833431, "eval_runtime": 107.9149, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 680000 }, { "epoch": 1.76, "learning_rate": 3.559739852403306e-05, "loss": 0.0052, "step": 680010 }, { "epoch": 1.76, "learning_rate": 3.5593510307661595e-05, "loss": 0.0064, "step": 680020 }, { "epoch": 1.76, "learning_rate": 3.558962209129013e-05, "loss": 0.0052, "step": 680030 }, { "epoch": 1.76, "learning_rate": 3.5585733874918665e-05, "loss": 0.0084, "step": 680040 }, { "epoch": 1.76, "learning_rate": 3.55818456585472e-05, "loss": 0.0117, "step": 680050 }, { "epoch": 1.76, "learning_rate": 3.557795744217574e-05, "loss": 0.005, "step": 680060 }, { "epoch": 1.76, "learning_rate": 3.5574069225804277e-05, "loss": 0.0104, "step": 680070 }, { "epoch": 1.76, "learning_rate": 3.557018100943281e-05, "loss": 0.0075, "step": 680080 }, { "epoch": 1.76, "learning_rate": 3.5566292793061346e-05, "loss": 0.0066, "step": 680090 }, { "epoch": 1.76, "learning_rate": 3.556240457668988e-05, "loss": 0.0076, "step": 680100 }, { "epoch": 1.76, "learning_rate": 3.5558516360318416e-05, "loss": 0.0114, "step": 680110 }, { "epoch": 1.76, "learning_rate": 3.555462814394695e-05, "loss": 0.0079, "step": 680120 }, { "epoch": 1.76, "learning_rate": 3.5550739927575486e-05, "loss": 0.0092, "step": 680130 }, { "epoch": 1.76, "learning_rate": 3.554685171120402e-05, "loss": 0.0092, "step": 680140 }, { "epoch": 1.76, "learning_rate": 3.5542963494832555e-05, "loss": 0.0058, "step": 680150 }, { "epoch": 1.76, "learning_rate": 3.553907527846109e-05, "loss": 0.0093, "step": 680160 }, { "epoch": 1.76, "learning_rate": 3.5535187062089625e-05, "loss": 0.0071, "step": 680170 }, { "epoch": 1.76, "learning_rate": 3.553129884571816e-05, "loss": 0.0083, "step": 680180 }, { "epoch": 1.76, "learning_rate": 3.55274106293467e-05, "loss": 0.0076, "step": 680190 }, { "epoch": 1.76, "learning_rate": 3.5523522412975237e-05, "loss": 0.0111, "step": 680200 }, { "epoch": 1.76, "learning_rate": 3.551963419660377e-05, "loss": 0.006, "step": 680210 }, { "epoch": 1.76, "learning_rate": 3.5515745980232306e-05, "loss": 0.0066, "step": 680220 }, { "epoch": 1.76, "learning_rate": 3.551185776386084e-05, "loss": 0.0064, "step": 680230 }, { "epoch": 1.76, "learning_rate": 3.5507969547489376e-05, "loss": 0.0072, "step": 680240 }, { "epoch": 1.76, "learning_rate": 3.550408133111791e-05, "loss": 0.0062, "step": 680250 }, { "epoch": 1.76, "learning_rate": 3.5500193114746446e-05, "loss": 0.0074, "step": 680260 }, { "epoch": 1.76, "learning_rate": 3.549630489837498e-05, "loss": 0.0074, "step": 680270 }, { "epoch": 1.76, "learning_rate": 3.5492416682003515e-05, "loss": 0.0067, "step": 680280 }, { "epoch": 1.76, "learning_rate": 3.548852846563205e-05, "loss": 0.0066, "step": 680290 }, { "epoch": 1.76, "learning_rate": 3.5484640249260585e-05, "loss": 0.0069, "step": 680300 }, { "epoch": 1.76, "learning_rate": 3.548075203288912e-05, "loss": 0.007, "step": 680310 }, { "epoch": 1.76, "learning_rate": 3.547686381651766e-05, "loss": 0.0094, "step": 680320 }, { "epoch": 1.76, "learning_rate": 3.5472975600146196e-05, "loss": 0.0077, "step": 680330 }, { "epoch": 1.76, "learning_rate": 3.546908738377473e-05, "loss": 0.0073, "step": 680340 }, { "epoch": 1.76, "learning_rate": 3.5465199167403266e-05, "loss": 0.0086, "step": 680350 }, { "epoch": 1.76, "learning_rate": 3.54613109510318e-05, "loss": 0.0066, "step": 680360 }, { "epoch": 1.76, "learning_rate": 3.5457422734660336e-05, "loss": 0.0077, "step": 680370 }, { "epoch": 1.76, "learning_rate": 3.545353451828887e-05, "loss": 0.0051, "step": 680380 }, { "epoch": 1.76, "learning_rate": 3.5449646301917406e-05, "loss": 0.0067, "step": 680390 }, { "epoch": 1.76, "learning_rate": 3.544575808554594e-05, "loss": 0.0091, "step": 680400 }, { "epoch": 1.76, "learning_rate": 3.5441869869174475e-05, "loss": 0.0091, "step": 680410 }, { "epoch": 1.76, "learning_rate": 3.543798165280301e-05, "loss": 0.007, "step": 680420 }, { "epoch": 1.76, "learning_rate": 3.5434093436431545e-05, "loss": 0.0088, "step": 680430 }, { "epoch": 1.76, "learning_rate": 3.543020522006008e-05, "loss": 0.0061, "step": 680440 }, { "epoch": 1.76, "learning_rate": 3.542631700368862e-05, "loss": 0.0087, "step": 680450 }, { "epoch": 1.76, "learning_rate": 3.5422428787317156e-05, "loss": 0.0092, "step": 680460 }, { "epoch": 1.76, "learning_rate": 3.541854057094569e-05, "loss": 0.0072, "step": 680470 }, { "epoch": 1.76, "learning_rate": 3.5414652354574226e-05, "loss": 0.0068, "step": 680480 }, { "epoch": 1.76, "learning_rate": 3.541076413820276e-05, "loss": 0.0065, "step": 680490 }, { "epoch": 1.76, "learning_rate": 3.5406875921831296e-05, "loss": 0.0072, "step": 680500 }, { "epoch": 1.76, "learning_rate": 3.540298770545983e-05, "loss": 0.0086, "step": 680510 }, { "epoch": 1.76, "learning_rate": 3.5399099489088366e-05, "loss": 0.0089, "step": 680520 }, { "epoch": 1.76, "learning_rate": 3.53952112727169e-05, "loss": 0.0081, "step": 680530 }, { "epoch": 1.76, "learning_rate": 3.5391323056345435e-05, "loss": 0.0095, "step": 680540 }, { "epoch": 1.76, "learning_rate": 3.538743483997397e-05, "loss": 0.0069, "step": 680550 }, { "epoch": 1.76, "learning_rate": 3.5383546623602505e-05, "loss": 0.0084, "step": 680560 }, { "epoch": 1.76, "learning_rate": 3.537965840723104e-05, "loss": 0.0086, "step": 680570 }, { "epoch": 1.76, "learning_rate": 3.537577019085958e-05, "loss": 0.0072, "step": 680580 }, { "epoch": 1.76, "learning_rate": 3.5371881974488116e-05, "loss": 0.0057, "step": 680590 }, { "epoch": 1.76, "learning_rate": 3.536799375811665e-05, "loss": 0.0086, "step": 680600 }, { "epoch": 1.76, "learning_rate": 3.5364105541745186e-05, "loss": 0.0066, "step": 680610 }, { "epoch": 1.76, "learning_rate": 3.5360217325373714e-05, "loss": 0.0075, "step": 680620 }, { "epoch": 1.76, "learning_rate": 3.5356329109002256e-05, "loss": 0.0082, "step": 680630 }, { "epoch": 1.76, "learning_rate": 3.535244089263079e-05, "loss": 0.0058, "step": 680640 }, { "epoch": 1.76, "learning_rate": 3.5348552676259326e-05, "loss": 0.0077, "step": 680650 }, { "epoch": 1.76, "learning_rate": 3.534466445988786e-05, "loss": 0.005, "step": 680660 }, { "epoch": 1.76, "learning_rate": 3.5340776243516395e-05, "loss": 0.006, "step": 680670 }, { "epoch": 1.76, "learning_rate": 3.533688802714493e-05, "loss": 0.0075, "step": 680680 }, { "epoch": 1.76, "learning_rate": 3.5332999810773465e-05, "loss": 0.0079, "step": 680690 }, { "epoch": 1.76, "learning_rate": 3.5329111594402e-05, "loss": 0.0068, "step": 680700 }, { "epoch": 1.76, "learning_rate": 3.532522337803054e-05, "loss": 0.007, "step": 680710 }, { "epoch": 1.76, "learning_rate": 3.5321335161659076e-05, "loss": 0.0056, "step": 680720 }, { "epoch": 1.76, "learning_rate": 3.531744694528761e-05, "loss": 0.0107, "step": 680730 }, { "epoch": 1.76, "learning_rate": 3.5313558728916146e-05, "loss": 0.0066, "step": 680740 }, { "epoch": 1.76, "learning_rate": 3.5309670512544674e-05, "loss": 0.0076, "step": 680750 }, { "epoch": 1.76, "learning_rate": 3.5305782296173216e-05, "loss": 0.0087, "step": 680760 }, { "epoch": 1.76, "learning_rate": 3.530189407980175e-05, "loss": 0.0103, "step": 680770 }, { "epoch": 1.76, "learning_rate": 3.5298005863430286e-05, "loss": 0.0085, "step": 680780 }, { "epoch": 1.76, "learning_rate": 3.529411764705882e-05, "loss": 0.0055, "step": 680790 }, { "epoch": 1.76, "learning_rate": 3.5290229430687355e-05, "loss": 0.0068, "step": 680800 }, { "epoch": 1.76, "learning_rate": 3.528634121431589e-05, "loss": 0.0096, "step": 680810 }, { "epoch": 1.76, "learning_rate": 3.5282452997944425e-05, "loss": 0.008, "step": 680820 }, { "epoch": 1.76, "learning_rate": 3.527856478157296e-05, "loss": 0.0058, "step": 680830 }, { "epoch": 1.76, "learning_rate": 3.52746765652015e-05, "loss": 0.0068, "step": 680840 }, { "epoch": 1.76, "learning_rate": 3.5270788348830036e-05, "loss": 0.0105, "step": 680850 }, { "epoch": 1.76, "learning_rate": 3.526690013245857e-05, "loss": 0.006, "step": 680860 }, { "epoch": 1.76, "learning_rate": 3.52630119160871e-05, "loss": 0.0064, "step": 680870 }, { "epoch": 1.76, "learning_rate": 3.5259123699715634e-05, "loss": 0.0062, "step": 680880 }, { "epoch": 1.76, "learning_rate": 3.5255235483344176e-05, "loss": 0.0093, "step": 680890 }, { "epoch": 1.76, "learning_rate": 3.525134726697271e-05, "loss": 0.0089, "step": 680900 }, { "epoch": 1.77, "learning_rate": 3.5247459050601246e-05, "loss": 0.0075, "step": 680910 }, { "epoch": 1.77, "learning_rate": 3.524357083422978e-05, "loss": 0.0074, "step": 680920 }, { "epoch": 1.77, "learning_rate": 3.5239682617858315e-05, "loss": 0.0093, "step": 680930 }, { "epoch": 1.77, "learning_rate": 3.523579440148685e-05, "loss": 0.0096, "step": 680940 }, { "epoch": 1.77, "learning_rate": 3.5231906185115385e-05, "loss": 0.0079, "step": 680950 }, { "epoch": 1.77, "learning_rate": 3.522801796874392e-05, "loss": 0.0076, "step": 680960 }, { "epoch": 1.77, "learning_rate": 3.522412975237246e-05, "loss": 0.0073, "step": 680970 }, { "epoch": 1.77, "learning_rate": 3.5220241536000996e-05, "loss": 0.008, "step": 680980 }, { "epoch": 1.77, "learning_rate": 3.521635331962953e-05, "loss": 0.0072, "step": 680990 }, { "epoch": 1.77, "learning_rate": 3.521246510325806e-05, "loss": 0.0071, "step": 681000 }, { "epoch": 1.77, "eval_cer": 0.88167329394755, "eval_loss": 0.004988801199942827, "eval_runtime": 107.9177, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 681000 }, { "epoch": 1.77, "learning_rate": 3.5208576886886594e-05, "loss": 0.0076, "step": 681010 }, { "epoch": 1.77, "learning_rate": 3.5204688670515136e-05, "loss": 0.0057, "step": 681020 }, { "epoch": 1.77, "learning_rate": 3.520080045414367e-05, "loss": 0.0067, "step": 681030 }, { "epoch": 1.77, "learning_rate": 3.5196912237772206e-05, "loss": 0.007, "step": 681040 }, { "epoch": 1.77, "learning_rate": 3.519302402140074e-05, "loss": 0.0066, "step": 681050 }, { "epoch": 1.77, "learning_rate": 3.5189135805029275e-05, "loss": 0.0092, "step": 681060 }, { "epoch": 1.77, "learning_rate": 3.518524758865781e-05, "loss": 0.0083, "step": 681070 }, { "epoch": 1.77, "learning_rate": 3.5181359372286345e-05, "loss": 0.0078, "step": 681080 }, { "epoch": 1.77, "learning_rate": 3.517747115591488e-05, "loss": 0.0072, "step": 681090 }, { "epoch": 1.77, "learning_rate": 3.517358293954342e-05, "loss": 0.0077, "step": 681100 }, { "epoch": 1.77, "learning_rate": 3.5169694723171956e-05, "loss": 0.0082, "step": 681110 }, { "epoch": 1.77, "learning_rate": 3.5165806506800484e-05, "loss": 0.0107, "step": 681120 }, { "epoch": 1.77, "learning_rate": 3.516191829042902e-05, "loss": 0.0091, "step": 681130 }, { "epoch": 1.77, "learning_rate": 3.5158030074057554e-05, "loss": 0.0066, "step": 681140 }, { "epoch": 1.77, "learning_rate": 3.5154141857686096e-05, "loss": 0.0078, "step": 681150 }, { "epoch": 1.77, "learning_rate": 3.515025364131463e-05, "loss": 0.0052, "step": 681160 }, { "epoch": 1.77, "learning_rate": 3.5146365424943166e-05, "loss": 0.0103, "step": 681170 }, { "epoch": 1.77, "learning_rate": 3.51424772085717e-05, "loss": 0.0071, "step": 681180 }, { "epoch": 1.77, "learning_rate": 3.5138588992200235e-05, "loss": 0.0073, "step": 681190 }, { "epoch": 1.77, "learning_rate": 3.513470077582877e-05, "loss": 0.0075, "step": 681200 }, { "epoch": 1.77, "learning_rate": 3.5130812559457305e-05, "loss": 0.0074, "step": 681210 }, { "epoch": 1.77, "learning_rate": 3.512692434308584e-05, "loss": 0.0106, "step": 681220 }, { "epoch": 1.77, "learning_rate": 3.512303612671438e-05, "loss": 0.0076, "step": 681230 }, { "epoch": 1.77, "learning_rate": 3.511914791034291e-05, "loss": 0.0106, "step": 681240 }, { "epoch": 1.77, "learning_rate": 3.5115259693971444e-05, "loss": 0.0083, "step": 681250 }, { "epoch": 1.77, "learning_rate": 3.511137147759998e-05, "loss": 0.0073, "step": 681260 }, { "epoch": 1.77, "learning_rate": 3.5107483261228514e-05, "loss": 0.0096, "step": 681270 }, { "epoch": 1.77, "learning_rate": 3.5103595044857056e-05, "loss": 0.0058, "step": 681280 }, { "epoch": 1.77, "learning_rate": 3.509970682848559e-05, "loss": 0.0071, "step": 681290 }, { "epoch": 1.77, "learning_rate": 3.5095818612114125e-05, "loss": 0.0062, "step": 681300 }, { "epoch": 1.77, "learning_rate": 3.509193039574266e-05, "loss": 0.0094, "step": 681310 }, { "epoch": 1.77, "learning_rate": 3.5088042179371195e-05, "loss": 0.0097, "step": 681320 }, { "epoch": 1.77, "learning_rate": 3.508415396299973e-05, "loss": 0.0076, "step": 681330 }, { "epoch": 1.77, "learning_rate": 3.5080265746628265e-05, "loss": 0.0072, "step": 681340 }, { "epoch": 1.77, "learning_rate": 3.50763775302568e-05, "loss": 0.0071, "step": 681350 }, { "epoch": 1.77, "learning_rate": 3.5072489313885335e-05, "loss": 0.0064, "step": 681360 }, { "epoch": 1.77, "learning_rate": 3.506860109751387e-05, "loss": 0.0072, "step": 681370 }, { "epoch": 1.77, "learning_rate": 3.5064712881142404e-05, "loss": 0.0056, "step": 681380 }, { "epoch": 1.77, "learning_rate": 3.506082466477094e-05, "loss": 0.0069, "step": 681390 }, { "epoch": 1.77, "learning_rate": 3.5056936448399474e-05, "loss": 0.0077, "step": 681400 }, { "epoch": 1.77, "learning_rate": 3.505304823202801e-05, "loss": 0.0074, "step": 681410 }, { "epoch": 1.77, "learning_rate": 3.504916001565655e-05, "loss": 0.0068, "step": 681420 }, { "epoch": 1.77, "learning_rate": 3.5045271799285085e-05, "loss": 0.0088, "step": 681430 }, { "epoch": 1.77, "learning_rate": 3.504138358291362e-05, "loss": 0.0063, "step": 681440 }, { "epoch": 1.77, "learning_rate": 3.5037495366542155e-05, "loss": 0.0071, "step": 681450 }, { "epoch": 1.77, "learning_rate": 3.503360715017069e-05, "loss": 0.0077, "step": 681460 }, { "epoch": 1.77, "learning_rate": 3.5029718933799225e-05, "loss": 0.0061, "step": 681470 }, { "epoch": 1.77, "learning_rate": 3.502583071742776e-05, "loss": 0.0067, "step": 681480 }, { "epoch": 1.77, "learning_rate": 3.5021942501056295e-05, "loss": 0.0055, "step": 681490 }, { "epoch": 1.77, "learning_rate": 3.501805428468483e-05, "loss": 0.006, "step": 681500 }, { "epoch": 1.77, "learning_rate": 3.5014166068313364e-05, "loss": 0.0084, "step": 681510 }, { "epoch": 1.77, "learning_rate": 3.50102778519419e-05, "loss": 0.0094, "step": 681520 }, { "epoch": 1.77, "learning_rate": 3.5006389635570434e-05, "loss": 0.0064, "step": 681530 }, { "epoch": 1.77, "learning_rate": 3.500250141919897e-05, "loss": 0.0068, "step": 681540 }, { "epoch": 1.77, "learning_rate": 3.499861320282751e-05, "loss": 0.0092, "step": 681550 }, { "epoch": 1.77, "learning_rate": 3.4994724986456045e-05, "loss": 0.0056, "step": 681560 }, { "epoch": 1.77, "learning_rate": 3.499083677008458e-05, "loss": 0.0063, "step": 681570 }, { "epoch": 1.77, "learning_rate": 3.4986948553713115e-05, "loss": 0.0069, "step": 681580 }, { "epoch": 1.77, "learning_rate": 3.498306033734165e-05, "loss": 0.0096, "step": 681590 }, { "epoch": 1.77, "learning_rate": 3.4979172120970185e-05, "loss": 0.0076, "step": 681600 }, { "epoch": 1.77, "learning_rate": 3.497528390459872e-05, "loss": 0.0085, "step": 681610 }, { "epoch": 1.77, "learning_rate": 3.4971395688227255e-05, "loss": 0.0088, "step": 681620 }, { "epoch": 1.77, "learning_rate": 3.496750747185579e-05, "loss": 0.0079, "step": 681630 }, { "epoch": 1.77, "learning_rate": 3.4963619255484324e-05, "loss": 0.0082, "step": 681640 }, { "epoch": 1.77, "learning_rate": 3.495973103911286e-05, "loss": 0.0087, "step": 681650 }, { "epoch": 1.77, "learning_rate": 3.4955842822741394e-05, "loss": 0.0136, "step": 681660 }, { "epoch": 1.77, "learning_rate": 3.495195460636993e-05, "loss": 0.0079, "step": 681670 }, { "epoch": 1.77, "learning_rate": 3.494806638999847e-05, "loss": 0.0068, "step": 681680 }, { "epoch": 1.77, "learning_rate": 3.4944178173627005e-05, "loss": 0.0074, "step": 681690 }, { "epoch": 1.77, "learning_rate": 3.494028995725554e-05, "loss": 0.0065, "step": 681700 }, { "epoch": 1.77, "learning_rate": 3.4936401740884075e-05, "loss": 0.0062, "step": 681710 }, { "epoch": 1.77, "learning_rate": 3.493251352451261e-05, "loss": 0.0069, "step": 681720 }, { "epoch": 1.77, "learning_rate": 3.4928625308141145e-05, "loss": 0.0059, "step": 681730 }, { "epoch": 1.77, "learning_rate": 3.492473709176968e-05, "loss": 0.0069, "step": 681740 }, { "epoch": 1.77, "learning_rate": 3.4920848875398215e-05, "loss": 0.0085, "step": 681750 }, { "epoch": 1.77, "learning_rate": 3.491696065902675e-05, "loss": 0.0069, "step": 681760 }, { "epoch": 1.77, "learning_rate": 3.4913072442655284e-05, "loss": 0.0086, "step": 681770 }, { "epoch": 1.77, "learning_rate": 3.490918422628382e-05, "loss": 0.0071, "step": 681780 }, { "epoch": 1.77, "learning_rate": 3.4905296009912354e-05, "loss": 0.0058, "step": 681790 }, { "epoch": 1.77, "learning_rate": 3.490140779354089e-05, "loss": 0.0097, "step": 681800 }, { "epoch": 1.77, "learning_rate": 3.489751957716943e-05, "loss": 0.0056, "step": 681810 }, { "epoch": 1.77, "learning_rate": 3.4893631360797965e-05, "loss": 0.0079, "step": 681820 }, { "epoch": 1.77, "learning_rate": 3.48897431444265e-05, "loss": 0.0094, "step": 681830 }, { "epoch": 1.77, "learning_rate": 3.4885854928055035e-05, "loss": 0.0057, "step": 681840 }, { "epoch": 1.77, "learning_rate": 3.488196671168357e-05, "loss": 0.006, "step": 681850 }, { "epoch": 1.77, "learning_rate": 3.4878078495312105e-05, "loss": 0.0081, "step": 681860 }, { "epoch": 1.77, "learning_rate": 3.487419027894064e-05, "loss": 0.0055, "step": 681870 }, { "epoch": 1.77, "learning_rate": 3.4870302062569175e-05, "loss": 0.0067, "step": 681880 }, { "epoch": 1.77, "learning_rate": 3.486641384619771e-05, "loss": 0.0086, "step": 681890 }, { "epoch": 1.77, "learning_rate": 3.4862525629826244e-05, "loss": 0.0048, "step": 681900 }, { "epoch": 1.77, "learning_rate": 3.485863741345478e-05, "loss": 0.0067, "step": 681910 }, { "epoch": 1.77, "learning_rate": 3.4854749197083314e-05, "loss": 0.0091, "step": 681920 }, { "epoch": 1.77, "learning_rate": 3.485086098071185e-05, "loss": 0.0094, "step": 681930 }, { "epoch": 1.77, "learning_rate": 3.484697276434039e-05, "loss": 0.0077, "step": 681940 }, { "epoch": 1.77, "learning_rate": 3.4843084547968925e-05, "loss": 0.0094, "step": 681950 }, { "epoch": 1.77, "learning_rate": 3.483919633159746e-05, "loss": 0.0075, "step": 681960 }, { "epoch": 1.77, "learning_rate": 3.4835308115225995e-05, "loss": 0.0092, "step": 681970 }, { "epoch": 1.77, "learning_rate": 3.483141989885453e-05, "loss": 0.0086, "step": 681980 }, { "epoch": 1.77, "learning_rate": 3.4827531682483065e-05, "loss": 0.0071, "step": 681990 }, { "epoch": 1.77, "learning_rate": 3.48236434661116e-05, "loss": 0.0079, "step": 682000 }, { "epoch": 1.77, "eval_cer": 0.8816774928583525, "eval_loss": 0.004874969832599163, "eval_runtime": 107.8015, "eval_samples_per_second": 18.553, "eval_steps_per_second": 4.638, "step": 682000 }, { "epoch": 1.77, "learning_rate": 3.4819755249740135e-05, "loss": 0.0052, "step": 682010 }, { "epoch": 1.77, "learning_rate": 3.481586703336867e-05, "loss": 0.0065, "step": 682020 }, { "epoch": 1.77, "learning_rate": 3.4811978816997204e-05, "loss": 0.0099, "step": 682030 }, { "epoch": 1.77, "learning_rate": 3.480809060062574e-05, "loss": 0.0072, "step": 682040 }, { "epoch": 1.77, "learning_rate": 3.4804202384254274e-05, "loss": 0.0047, "step": 682050 }, { "epoch": 1.77, "learning_rate": 3.480031416788281e-05, "loss": 0.0061, "step": 682060 }, { "epoch": 1.77, "learning_rate": 3.479642595151135e-05, "loss": 0.0079, "step": 682070 }, { "epoch": 1.77, "learning_rate": 3.4792537735139885e-05, "loss": 0.0074, "step": 682080 }, { "epoch": 1.77, "learning_rate": 3.478864951876842e-05, "loss": 0.0069, "step": 682090 }, { "epoch": 1.77, "learning_rate": 3.4784761302396955e-05, "loss": 0.0082, "step": 682100 }, { "epoch": 1.77, "learning_rate": 3.478087308602548e-05, "loss": 0.0067, "step": 682110 }, { "epoch": 1.77, "learning_rate": 3.4776984869654025e-05, "loss": 0.0051, "step": 682120 }, { "epoch": 1.77, "learning_rate": 3.477309665328256e-05, "loss": 0.0066, "step": 682130 }, { "epoch": 1.77, "learning_rate": 3.4769208436911095e-05, "loss": 0.0076, "step": 682140 }, { "epoch": 1.77, "learning_rate": 3.476532022053963e-05, "loss": 0.0062, "step": 682150 }, { "epoch": 1.77, "learning_rate": 3.4761432004168164e-05, "loss": 0.0058, "step": 682160 }, { "epoch": 1.77, "learning_rate": 3.47575437877967e-05, "loss": 0.0102, "step": 682170 }, { "epoch": 1.77, "learning_rate": 3.4753655571425234e-05, "loss": 0.0135, "step": 682180 }, { "epoch": 1.77, "learning_rate": 3.474976735505377e-05, "loss": 0.0088, "step": 682190 }, { "epoch": 1.77, "learning_rate": 3.474587913868231e-05, "loss": 0.0111, "step": 682200 }, { "epoch": 1.77, "learning_rate": 3.4741990922310845e-05, "loss": 0.0073, "step": 682210 }, { "epoch": 1.77, "learning_rate": 3.473810270593938e-05, "loss": 0.0054, "step": 682220 }, { "epoch": 1.77, "learning_rate": 3.4734214489567915e-05, "loss": 0.0091, "step": 682230 }, { "epoch": 1.77, "learning_rate": 3.473032627319644e-05, "loss": 0.0058, "step": 682240 }, { "epoch": 1.77, "learning_rate": 3.4726438056824985e-05, "loss": 0.0073, "step": 682250 }, { "epoch": 1.77, "learning_rate": 3.472254984045352e-05, "loss": 0.0091, "step": 682260 }, { "epoch": 1.77, "learning_rate": 3.4718661624082054e-05, "loss": 0.0085, "step": 682270 }, { "epoch": 1.77, "learning_rate": 3.471477340771059e-05, "loss": 0.0067, "step": 682280 }, { "epoch": 1.77, "learning_rate": 3.4710885191339124e-05, "loss": 0.0086, "step": 682290 }, { "epoch": 1.77, "learning_rate": 3.470699697496766e-05, "loss": 0.0078, "step": 682300 }, { "epoch": 1.77, "learning_rate": 3.4703108758596194e-05, "loss": 0.0061, "step": 682310 }, { "epoch": 1.77, "learning_rate": 3.469922054222473e-05, "loss": 0.0084, "step": 682320 }, { "epoch": 1.77, "learning_rate": 3.469533232585327e-05, "loss": 0.0101, "step": 682330 }, { "epoch": 1.77, "learning_rate": 3.4691444109481805e-05, "loss": 0.0072, "step": 682340 }, { "epoch": 1.77, "learning_rate": 3.468755589311034e-05, "loss": 0.0054, "step": 682350 }, { "epoch": 1.77, "learning_rate": 3.468366767673887e-05, "loss": 0.0078, "step": 682360 }, { "epoch": 1.77, "learning_rate": 3.46797794603674e-05, "loss": 0.0102, "step": 682370 }, { "epoch": 1.77, "learning_rate": 3.4675891243995945e-05, "loss": 0.0078, "step": 682380 }, { "epoch": 1.77, "learning_rate": 3.467200302762448e-05, "loss": 0.0089, "step": 682390 }, { "epoch": 1.77, "learning_rate": 3.4668114811253014e-05, "loss": 0.0077, "step": 682400 }, { "epoch": 1.77, "learning_rate": 3.466422659488155e-05, "loss": 0.0071, "step": 682410 }, { "epoch": 1.77, "learning_rate": 3.4660338378510084e-05, "loss": 0.0071, "step": 682420 }, { "epoch": 1.77, "learning_rate": 3.465645016213862e-05, "loss": 0.0089, "step": 682430 }, { "epoch": 1.77, "learning_rate": 3.4652561945767154e-05, "loss": 0.0072, "step": 682440 }, { "epoch": 1.77, "learning_rate": 3.464867372939569e-05, "loss": 0.0065, "step": 682450 }, { "epoch": 1.77, "learning_rate": 3.464478551302423e-05, "loss": 0.0096, "step": 682460 }, { "epoch": 1.77, "learning_rate": 3.4640897296652765e-05, "loss": 0.0081, "step": 682470 }, { "epoch": 1.77, "learning_rate": 3.463700908028129e-05, "loss": 0.0079, "step": 682480 }, { "epoch": 1.77, "learning_rate": 3.463312086390983e-05, "loss": 0.0052, "step": 682490 }, { "epoch": 1.77, "learning_rate": 3.462923264753836e-05, "loss": 0.0062, "step": 682500 }, { "epoch": 1.77, "learning_rate": 3.4625344431166905e-05, "loss": 0.0062, "step": 682510 }, { "epoch": 1.77, "learning_rate": 3.462145621479544e-05, "loss": 0.0087, "step": 682520 }, { "epoch": 1.77, "learning_rate": 3.4617567998423974e-05, "loss": 0.0082, "step": 682530 }, { "epoch": 1.77, "learning_rate": 3.461367978205251e-05, "loss": 0.0057, "step": 682540 }, { "epoch": 1.77, "learning_rate": 3.4609791565681044e-05, "loss": 0.008, "step": 682550 }, { "epoch": 1.77, "learning_rate": 3.460590334930958e-05, "loss": 0.0094, "step": 682560 }, { "epoch": 1.77, "learning_rate": 3.4602015132938114e-05, "loss": 0.0075, "step": 682570 }, { "epoch": 1.77, "learning_rate": 3.459812691656665e-05, "loss": 0.0069, "step": 682580 }, { "epoch": 1.77, "learning_rate": 3.459423870019519e-05, "loss": 0.0065, "step": 682590 }, { "epoch": 1.77, "learning_rate": 3.4590350483823725e-05, "loss": 0.0047, "step": 682600 }, { "epoch": 1.77, "learning_rate": 3.458646226745225e-05, "loss": 0.0068, "step": 682610 }, { "epoch": 1.77, "learning_rate": 3.458257405108079e-05, "loss": 0.0054, "step": 682620 }, { "epoch": 1.77, "learning_rate": 3.457868583470932e-05, "loss": 0.0094, "step": 682630 }, { "epoch": 1.77, "learning_rate": 3.4574797618337865e-05, "loss": 0.0097, "step": 682640 }, { "epoch": 1.77, "learning_rate": 3.45709094019664e-05, "loss": 0.0076, "step": 682650 }, { "epoch": 1.77, "learning_rate": 3.4567021185594934e-05, "loss": 0.0053, "step": 682660 }, { "epoch": 1.77, "learning_rate": 3.456313296922347e-05, "loss": 0.0072, "step": 682670 }, { "epoch": 1.77, "learning_rate": 3.4559244752852004e-05, "loss": 0.0079, "step": 682680 }, { "epoch": 1.77, "learning_rate": 3.455535653648054e-05, "loss": 0.0078, "step": 682690 }, { "epoch": 1.77, "learning_rate": 3.4551468320109074e-05, "loss": 0.0053, "step": 682700 }, { "epoch": 1.77, "learning_rate": 3.454758010373761e-05, "loss": 0.0096, "step": 682710 }, { "epoch": 1.77, "learning_rate": 3.4543691887366144e-05, "loss": 0.006, "step": 682720 }, { "epoch": 1.77, "learning_rate": 3.453980367099468e-05, "loss": 0.0042, "step": 682730 }, { "epoch": 1.77, "learning_rate": 3.453591545462321e-05, "loss": 0.0055, "step": 682740 }, { "epoch": 1.77, "learning_rate": 3.453202723825175e-05, "loss": 0.0108, "step": 682750 }, { "epoch": 1.77, "learning_rate": 3.452813902188028e-05, "loss": 0.0059, "step": 682760 }, { "epoch": 1.77, "learning_rate": 3.4524250805508825e-05, "loss": 0.0083, "step": 682770 }, { "epoch": 1.77, "learning_rate": 3.452036258913736e-05, "loss": 0.0089, "step": 682780 }, { "epoch": 1.77, "learning_rate": 3.4516474372765894e-05, "loss": 0.006, "step": 682790 }, { "epoch": 1.77, "learning_rate": 3.451258615639443e-05, "loss": 0.0071, "step": 682800 }, { "epoch": 1.77, "learning_rate": 3.4508697940022964e-05, "loss": 0.0071, "step": 682810 }, { "epoch": 1.77, "learning_rate": 3.45048097236515e-05, "loss": 0.0075, "step": 682820 }, { "epoch": 1.77, "learning_rate": 3.4500921507280034e-05, "loss": 0.0085, "step": 682830 }, { "epoch": 1.77, "learning_rate": 3.449703329090857e-05, "loss": 0.0088, "step": 682840 }, { "epoch": 1.77, "learning_rate": 3.4493145074537104e-05, "loss": 0.0069, "step": 682850 }, { "epoch": 1.77, "learning_rate": 3.448925685816564e-05, "loss": 0.0104, "step": 682860 }, { "epoch": 1.77, "learning_rate": 3.448536864179417e-05, "loss": 0.0112, "step": 682870 }, { "epoch": 1.77, "learning_rate": 3.448148042542271e-05, "loss": 0.0077, "step": 682880 }, { "epoch": 1.77, "learning_rate": 3.447759220905124e-05, "loss": 0.0082, "step": 682890 }, { "epoch": 1.77, "learning_rate": 3.447370399267978e-05, "loss": 0.0063, "step": 682900 }, { "epoch": 1.77, "learning_rate": 3.446981577630832e-05, "loss": 0.0098, "step": 682910 }, { "epoch": 1.77, "learning_rate": 3.4465927559936854e-05, "loss": 0.0072, "step": 682920 }, { "epoch": 1.77, "learning_rate": 3.446203934356539e-05, "loss": 0.0054, "step": 682930 }, { "epoch": 1.77, "learning_rate": 3.4458151127193924e-05, "loss": 0.0123, "step": 682940 }, { "epoch": 1.77, "learning_rate": 3.445426291082246e-05, "loss": 0.0075, "step": 682950 }, { "epoch": 1.77, "learning_rate": 3.4450374694450994e-05, "loss": 0.0074, "step": 682960 }, { "epoch": 1.77, "learning_rate": 3.444648647807953e-05, "loss": 0.008, "step": 682970 }, { "epoch": 1.77, "learning_rate": 3.4442598261708064e-05, "loss": 0.0071, "step": 682980 }, { "epoch": 1.77, "learning_rate": 3.44387100453366e-05, "loss": 0.0079, "step": 682990 }, { "epoch": 1.77, "learning_rate": 3.443482182896513e-05, "loss": 0.0072, "step": 683000 }, { "epoch": 1.77, "eval_cer": 0.8816788924952867, "eval_loss": 0.00494320597499609, "eval_runtime": 107.8159, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.638, "step": 683000 }, { "epoch": 1.77, "learning_rate": 3.443093361259367e-05, "loss": 0.0079, "step": 683010 }, { "epoch": 1.77, "learning_rate": 3.44270453962222e-05, "loss": 0.0058, "step": 683020 }, { "epoch": 1.77, "learning_rate": 3.442315717985074e-05, "loss": 0.0086, "step": 683030 }, { "epoch": 1.77, "learning_rate": 3.441926896347928e-05, "loss": 0.0087, "step": 683040 }, { "epoch": 1.77, "learning_rate": 3.4415380747107814e-05, "loss": 0.0076, "step": 683050 }, { "epoch": 1.77, "learning_rate": 3.441149253073635e-05, "loss": 0.005, "step": 683060 }, { "epoch": 1.77, "learning_rate": 3.4407604314364884e-05, "loss": 0.0059, "step": 683070 }, { "epoch": 1.77, "learning_rate": 3.440371609799342e-05, "loss": 0.0065, "step": 683080 }, { "epoch": 1.77, "learning_rate": 3.4399827881621954e-05, "loss": 0.0073, "step": 683090 }, { "epoch": 1.77, "learning_rate": 3.439593966525049e-05, "loss": 0.0065, "step": 683100 }, { "epoch": 1.77, "learning_rate": 3.4392051448879024e-05, "loss": 0.0071, "step": 683110 }, { "epoch": 1.77, "learning_rate": 3.438816323250756e-05, "loss": 0.0084, "step": 683120 }, { "epoch": 1.77, "learning_rate": 3.438427501613609e-05, "loss": 0.0089, "step": 683130 }, { "epoch": 1.77, "learning_rate": 3.438038679976463e-05, "loss": 0.0064, "step": 683140 }, { "epoch": 1.77, "learning_rate": 3.437649858339316e-05, "loss": 0.0065, "step": 683150 }, { "epoch": 1.77, "learning_rate": 3.43726103670217e-05, "loss": 0.0048, "step": 683160 }, { "epoch": 1.77, "learning_rate": 3.436872215065024e-05, "loss": 0.0072, "step": 683170 }, { "epoch": 1.77, "learning_rate": 3.4364833934278774e-05, "loss": 0.0066, "step": 683180 }, { "epoch": 1.77, "learning_rate": 3.436094571790731e-05, "loss": 0.0114, "step": 683190 }, { "epoch": 1.77, "learning_rate": 3.4357057501535844e-05, "loss": 0.009, "step": 683200 }, { "epoch": 1.77, "learning_rate": 3.435316928516438e-05, "loss": 0.0098, "step": 683210 }, { "epoch": 1.77, "learning_rate": 3.4349281068792914e-05, "loss": 0.0093, "step": 683220 }, { "epoch": 1.77, "learning_rate": 3.434539285242145e-05, "loss": 0.008, "step": 683230 }, { "epoch": 1.77, "learning_rate": 3.4341504636049983e-05, "loss": 0.0076, "step": 683240 }, { "epoch": 1.77, "learning_rate": 3.433761641967852e-05, "loss": 0.0115, "step": 683250 }, { "epoch": 1.77, "learning_rate": 3.433372820330705e-05, "loss": 0.005, "step": 683260 }, { "epoch": 1.77, "learning_rate": 3.432983998693559e-05, "loss": 0.0066, "step": 683270 }, { "epoch": 1.77, "learning_rate": 3.432595177056412e-05, "loss": 0.0081, "step": 683280 }, { "epoch": 1.77, "learning_rate": 3.432206355419266e-05, "loss": 0.0065, "step": 683290 }, { "epoch": 1.77, "learning_rate": 3.43181753378212e-05, "loss": 0.0077, "step": 683300 }, { "epoch": 1.77, "learning_rate": 3.4314287121449734e-05, "loss": 0.008, "step": 683310 }, { "epoch": 1.77, "learning_rate": 3.431039890507827e-05, "loss": 0.0063, "step": 683320 }, { "epoch": 1.77, "learning_rate": 3.4306510688706804e-05, "loss": 0.0071, "step": 683330 }, { "epoch": 1.77, "learning_rate": 3.430262247233534e-05, "loss": 0.0071, "step": 683340 }, { "epoch": 1.77, "learning_rate": 3.4298734255963874e-05, "loss": 0.0143, "step": 683350 }, { "epoch": 1.77, "learning_rate": 3.429484603959241e-05, "loss": 0.009, "step": 683360 }, { "epoch": 1.77, "learning_rate": 3.4290957823220943e-05, "loss": 0.0097, "step": 683370 }, { "epoch": 1.77, "learning_rate": 3.428706960684948e-05, "loss": 0.0074, "step": 683380 }, { "epoch": 1.77, "learning_rate": 3.428318139047801e-05, "loss": 0.0064, "step": 683390 }, { "epoch": 1.77, "learning_rate": 3.427929317410655e-05, "loss": 0.0077, "step": 683400 }, { "epoch": 1.77, "learning_rate": 3.427540495773508e-05, "loss": 0.0066, "step": 683410 }, { "epoch": 1.77, "learning_rate": 3.427151674136362e-05, "loss": 0.0051, "step": 683420 }, { "epoch": 1.77, "learning_rate": 3.426762852499216e-05, "loss": 0.0069, "step": 683430 }, { "epoch": 1.77, "learning_rate": 3.4263740308620694e-05, "loss": 0.0084, "step": 683440 }, { "epoch": 1.77, "learning_rate": 3.425985209224923e-05, "loss": 0.0059, "step": 683450 }, { "epoch": 1.77, "learning_rate": 3.4255963875877764e-05, "loss": 0.0082, "step": 683460 }, { "epoch": 1.77, "learning_rate": 3.42520756595063e-05, "loss": 0.0069, "step": 683470 }, { "epoch": 1.77, "learning_rate": 3.4248187443134834e-05, "loss": 0.0079, "step": 683480 }, { "epoch": 1.77, "learning_rate": 3.424429922676337e-05, "loss": 0.0099, "step": 683490 }, { "epoch": 1.77, "learning_rate": 3.4240411010391903e-05, "loss": 0.0105, "step": 683500 }, { "epoch": 1.77, "learning_rate": 3.423652279402044e-05, "loss": 0.0087, "step": 683510 }, { "epoch": 1.77, "learning_rate": 3.423263457764897e-05, "loss": 0.0093, "step": 683520 }, { "epoch": 1.77, "learning_rate": 3.422874636127751e-05, "loss": 0.0059, "step": 683530 }, { "epoch": 1.77, "learning_rate": 3.422485814490604e-05, "loss": 0.0075, "step": 683540 }, { "epoch": 1.77, "learning_rate": 3.422096992853458e-05, "loss": 0.0086, "step": 683550 }, { "epoch": 1.77, "learning_rate": 3.421708171216312e-05, "loss": 0.0092, "step": 683560 }, { "epoch": 1.77, "learning_rate": 3.4213193495791654e-05, "loss": 0.0071, "step": 683570 }, { "epoch": 1.77, "learning_rate": 3.420930527942019e-05, "loss": 0.0096, "step": 683580 }, { "epoch": 1.77, "learning_rate": 3.4205417063048724e-05, "loss": 0.0091, "step": 683590 }, { "epoch": 1.77, "learning_rate": 3.420152884667725e-05, "loss": 0.0059, "step": 683600 }, { "epoch": 1.77, "learning_rate": 3.4197640630305794e-05, "loss": 0.0062, "step": 683610 }, { "epoch": 1.77, "learning_rate": 3.419375241393433e-05, "loss": 0.0064, "step": 683620 }, { "epoch": 1.77, "learning_rate": 3.4189864197562863e-05, "loss": 0.0116, "step": 683630 }, { "epoch": 1.77, "learning_rate": 3.41859759811914e-05, "loss": 0.0124, "step": 683640 }, { "epoch": 1.77, "learning_rate": 3.418208776481993e-05, "loss": 0.0061, "step": 683650 }, { "epoch": 1.77, "learning_rate": 3.417819954844847e-05, "loss": 0.0078, "step": 683660 }, { "epoch": 1.77, "learning_rate": 3.4174311332077e-05, "loss": 0.0058, "step": 683670 }, { "epoch": 1.77, "learning_rate": 3.417042311570554e-05, "loss": 0.0074, "step": 683680 }, { "epoch": 1.77, "learning_rate": 3.416653489933408e-05, "loss": 0.0067, "step": 683690 }, { "epoch": 1.77, "learning_rate": 3.4162646682962614e-05, "loss": 0.0086, "step": 683700 }, { "epoch": 1.77, "learning_rate": 3.415875846659115e-05, "loss": 0.0088, "step": 683710 }, { "epoch": 1.77, "learning_rate": 3.415487025021968e-05, "loss": 0.0131, "step": 683720 }, { "epoch": 1.77, "learning_rate": 3.415098203384821e-05, "loss": 0.0076, "step": 683730 }, { "epoch": 1.77, "learning_rate": 3.4147093817476754e-05, "loss": 0.0083, "step": 683740 }, { "epoch": 1.77, "learning_rate": 3.414320560110529e-05, "loss": 0.0166, "step": 683750 }, { "epoch": 1.77, "learning_rate": 3.413931738473382e-05, "loss": 0.0072, "step": 683760 }, { "epoch": 1.77, "learning_rate": 3.413542916836236e-05, "loss": 0.0076, "step": 683770 }, { "epoch": 1.77, "learning_rate": 3.413154095199089e-05, "loss": 0.0093, "step": 683780 }, { "epoch": 1.77, "learning_rate": 3.412765273561943e-05, "loss": 0.0065, "step": 683790 }, { "epoch": 1.77, "learning_rate": 3.412376451924796e-05, "loss": 0.0071, "step": 683800 }, { "epoch": 1.77, "learning_rate": 3.41198763028765e-05, "loss": 0.0086, "step": 683810 }, { "epoch": 1.77, "learning_rate": 3.411598808650504e-05, "loss": 0.01, "step": 683820 }, { "epoch": 1.77, "learning_rate": 3.4112099870133574e-05, "loss": 0.0068, "step": 683830 }, { "epoch": 1.77, "learning_rate": 3.410821165376211e-05, "loss": 0.0089, "step": 683840 }, { "epoch": 1.77, "learning_rate": 3.410432343739064e-05, "loss": 0.0064, "step": 683850 }, { "epoch": 1.77, "learning_rate": 3.410043522101917e-05, "loss": 0.0086, "step": 683860 }, { "epoch": 1.77, "learning_rate": 3.4096547004647714e-05, "loss": 0.0066, "step": 683870 }, { "epoch": 1.77, "learning_rate": 3.409265878827625e-05, "loss": 0.0062, "step": 683880 }, { "epoch": 1.77, "learning_rate": 3.408877057190478e-05, "loss": 0.007, "step": 683890 }, { "epoch": 1.77, "learning_rate": 3.408488235553332e-05, "loss": 0.0059, "step": 683900 }, { "epoch": 1.77, "learning_rate": 3.408099413916185e-05, "loss": 0.0096, "step": 683910 }, { "epoch": 1.77, "learning_rate": 3.407710592279039e-05, "loss": 0.0093, "step": 683920 }, { "epoch": 1.77, "learning_rate": 3.407321770641892e-05, "loss": 0.0095, "step": 683930 }, { "epoch": 1.77, "learning_rate": 3.406932949004746e-05, "loss": 0.0068, "step": 683940 }, { "epoch": 1.77, "learning_rate": 3.4065441273676e-05, "loss": 0.0075, "step": 683950 }, { "epoch": 1.77, "learning_rate": 3.4061553057304534e-05, "loss": 0.0073, "step": 683960 }, { "epoch": 1.77, "learning_rate": 3.405766484093306e-05, "loss": 0.0068, "step": 683970 }, { "epoch": 1.77, "learning_rate": 3.40537766245616e-05, "loss": 0.0067, "step": 683980 }, { "epoch": 1.77, "learning_rate": 3.404988840819013e-05, "loss": 0.0065, "step": 683990 }, { "epoch": 1.77, "learning_rate": 3.4046000191818674e-05, "loss": 0.0057, "step": 684000 }, { "epoch": 1.77, "eval_cer": 0.8816802921322209, "eval_loss": 0.005055462475866079, "eval_runtime": 107.5085, "eval_samples_per_second": 18.603, "eval_steps_per_second": 4.651, "step": 684000 }, { "epoch": 1.77, "learning_rate": 3.404211197544721e-05, "loss": 0.0084, "step": 684010 }, { "epoch": 1.77, "learning_rate": 3.403822375907574e-05, "loss": 0.0081, "step": 684020 }, { "epoch": 1.77, "learning_rate": 3.403433554270428e-05, "loss": 0.0093, "step": 684030 }, { "epoch": 1.77, "learning_rate": 3.403044732633281e-05, "loss": 0.0074, "step": 684040 }, { "epoch": 1.77, "learning_rate": 3.402655910996135e-05, "loss": 0.0088, "step": 684050 }, { "epoch": 1.77, "learning_rate": 3.402267089358988e-05, "loss": 0.0059, "step": 684060 }, { "epoch": 1.77, "learning_rate": 3.401878267721842e-05, "loss": 0.0076, "step": 684070 }, { "epoch": 1.77, "learning_rate": 3.401489446084696e-05, "loss": 0.0063, "step": 684080 }, { "epoch": 1.77, "learning_rate": 3.4011006244475494e-05, "loss": 0.0075, "step": 684090 }, { "epoch": 1.77, "learning_rate": 3.400711802810402e-05, "loss": 0.0068, "step": 684100 }, { "epoch": 1.77, "learning_rate": 3.400322981173256e-05, "loss": 0.0079, "step": 684110 }, { "epoch": 1.77, "learning_rate": 3.399934159536109e-05, "loss": 0.009, "step": 684120 }, { "epoch": 1.77, "learning_rate": 3.3995453378989634e-05, "loss": 0.0058, "step": 684130 }, { "epoch": 1.77, "learning_rate": 3.399156516261817e-05, "loss": 0.0089, "step": 684140 }, { "epoch": 1.77, "learning_rate": 3.39876769462467e-05, "loss": 0.0068, "step": 684150 }, { "epoch": 1.77, "learning_rate": 3.398378872987524e-05, "loss": 0.0066, "step": 684160 }, { "epoch": 1.77, "learning_rate": 3.397990051350377e-05, "loss": 0.0065, "step": 684170 }, { "epoch": 1.77, "learning_rate": 3.397601229713231e-05, "loss": 0.0102, "step": 684180 }, { "epoch": 1.77, "learning_rate": 3.397212408076084e-05, "loss": 0.0089, "step": 684190 }, { "epoch": 1.77, "learning_rate": 3.396823586438938e-05, "loss": 0.0094, "step": 684200 }, { "epoch": 1.77, "learning_rate": 3.396434764801791e-05, "loss": 0.0076, "step": 684210 }, { "epoch": 1.77, "learning_rate": 3.396045943164645e-05, "loss": 0.0078, "step": 684220 }, { "epoch": 1.77, "learning_rate": 3.395657121527498e-05, "loss": 0.0054, "step": 684230 }, { "epoch": 1.77, "learning_rate": 3.395268299890352e-05, "loss": 0.0107, "step": 684240 }, { "epoch": 1.77, "learning_rate": 3.394879478253205e-05, "loss": 0.0068, "step": 684250 }, { "epoch": 1.77, "learning_rate": 3.394490656616059e-05, "loss": 0.007, "step": 684260 }, { "epoch": 1.77, "learning_rate": 3.394101834978913e-05, "loss": 0.0106, "step": 684270 }, { "epoch": 1.77, "learning_rate": 3.393713013341766e-05, "loss": 0.0083, "step": 684280 }, { "epoch": 1.77, "learning_rate": 3.39332419170462e-05, "loss": 0.0087, "step": 684290 }, { "epoch": 1.77, "learning_rate": 3.392935370067473e-05, "loss": 0.008, "step": 684300 }, { "epoch": 1.77, "learning_rate": 3.392546548430327e-05, "loss": 0.0069, "step": 684310 }, { "epoch": 1.77, "learning_rate": 3.39215772679318e-05, "loss": 0.0071, "step": 684320 }, { "epoch": 1.77, "learning_rate": 3.391768905156034e-05, "loss": 0.007, "step": 684330 }, { "epoch": 1.77, "learning_rate": 3.391380083518887e-05, "loss": 0.0099, "step": 684340 }, { "epoch": 1.77, "learning_rate": 3.390991261881741e-05, "loss": 0.0103, "step": 684350 }, { "epoch": 1.77, "learning_rate": 3.390602440244594e-05, "loss": 0.0067, "step": 684360 }, { "epoch": 1.77, "learning_rate": 3.390213618607448e-05, "loss": 0.0066, "step": 684370 }, { "epoch": 1.77, "learning_rate": 3.389824796970301e-05, "loss": 0.0077, "step": 684380 }, { "epoch": 1.77, "learning_rate": 3.389435975333155e-05, "loss": 0.0071, "step": 684390 }, { "epoch": 1.77, "learning_rate": 3.389047153696009e-05, "loss": 0.0126, "step": 684400 }, { "epoch": 1.77, "learning_rate": 3.388658332058862e-05, "loss": 0.0087, "step": 684410 }, { "epoch": 1.77, "learning_rate": 3.388269510421716e-05, "loss": 0.0082, "step": 684420 }, { "epoch": 1.77, "learning_rate": 3.387880688784569e-05, "loss": 0.0045, "step": 684430 }, { "epoch": 1.77, "learning_rate": 3.387491867147423e-05, "loss": 0.0087, "step": 684440 }, { "epoch": 1.77, "learning_rate": 3.387103045510276e-05, "loss": 0.0058, "step": 684450 }, { "epoch": 1.77, "learning_rate": 3.38671422387313e-05, "loss": 0.0083, "step": 684460 }, { "epoch": 1.77, "learning_rate": 3.386325402235983e-05, "loss": 0.0091, "step": 684470 }, { "epoch": 1.77, "learning_rate": 3.385936580598837e-05, "loss": 0.0069, "step": 684480 }, { "epoch": 1.77, "learning_rate": 3.38554775896169e-05, "loss": 0.0081, "step": 684490 }, { "epoch": 1.77, "learning_rate": 3.385158937324544e-05, "loss": 0.0085, "step": 684500 }, { "epoch": 1.77, "learning_rate": 3.384770115687397e-05, "loss": 0.0093, "step": 684510 }, { "epoch": 1.77, "learning_rate": 3.384381294050251e-05, "loss": 0.0067, "step": 684520 }, { "epoch": 1.77, "learning_rate": 3.383992472413105e-05, "loss": 0.0066, "step": 684530 }, { "epoch": 1.77, "learning_rate": 3.383603650775958e-05, "loss": 0.0057, "step": 684540 }, { "epoch": 1.77, "learning_rate": 3.383214829138812e-05, "loss": 0.0094, "step": 684550 }, { "epoch": 1.77, "learning_rate": 3.382826007501665e-05, "loss": 0.0065, "step": 684560 }, { "epoch": 1.77, "learning_rate": 3.382437185864519e-05, "loss": 0.0072, "step": 684570 }, { "epoch": 1.77, "learning_rate": 3.382048364227372e-05, "loss": 0.0081, "step": 684580 }, { "epoch": 1.77, "learning_rate": 3.381659542590226e-05, "loss": 0.0078, "step": 684590 }, { "epoch": 1.77, "learning_rate": 3.381270720953079e-05, "loss": 0.0073, "step": 684600 }, { "epoch": 1.77, "learning_rate": 3.380881899315933e-05, "loss": 0.0063, "step": 684610 }, { "epoch": 1.77, "learning_rate": 3.380493077678786e-05, "loss": 0.0065, "step": 684620 }, { "epoch": 1.77, "learning_rate": 3.38010425604164e-05, "loss": 0.0068, "step": 684630 }, { "epoch": 1.77, "learning_rate": 3.379715434404493e-05, "loss": 0.0075, "step": 684640 }, { "epoch": 1.77, "learning_rate": 3.379326612767347e-05, "loss": 0.0068, "step": 684650 }, { "epoch": 1.77, "learning_rate": 3.378937791130201e-05, "loss": 0.0079, "step": 684660 }, { "epoch": 1.77, "learning_rate": 3.378548969493054e-05, "loss": 0.0073, "step": 684670 }, { "epoch": 1.77, "learning_rate": 3.378160147855908e-05, "loss": 0.0065, "step": 684680 }, { "epoch": 1.77, "learning_rate": 3.377771326218761e-05, "loss": 0.0076, "step": 684690 }, { "epoch": 1.77, "learning_rate": 3.377382504581615e-05, "loss": 0.0045, "step": 684700 }, { "epoch": 1.77, "learning_rate": 3.376993682944468e-05, "loss": 0.0069, "step": 684710 }, { "epoch": 1.77, "learning_rate": 3.376604861307322e-05, "loss": 0.0082, "step": 684720 }, { "epoch": 1.77, "learning_rate": 3.376216039670175e-05, "loss": 0.0055, "step": 684730 }, { "epoch": 1.77, "learning_rate": 3.375827218033029e-05, "loss": 0.0073, "step": 684740 }, { "epoch": 1.77, "learning_rate": 3.375438396395882e-05, "loss": 0.0071, "step": 684750 }, { "epoch": 1.77, "learning_rate": 3.375049574758736e-05, "loss": 0.0106, "step": 684760 }, { "epoch": 1.78, "learning_rate": 3.374660753121589e-05, "loss": 0.0074, "step": 684770 }, { "epoch": 1.78, "learning_rate": 3.374271931484443e-05, "loss": 0.0081, "step": 684780 }, { "epoch": 1.78, "learning_rate": 3.373883109847297e-05, "loss": 0.0082, "step": 684790 }, { "epoch": 1.78, "learning_rate": 3.37349428821015e-05, "loss": 0.0077, "step": 684800 }, { "epoch": 1.78, "learning_rate": 3.373105466573004e-05, "loss": 0.0075, "step": 684810 }, { "epoch": 1.78, "learning_rate": 3.372716644935857e-05, "loss": 0.0068, "step": 684820 }, { "epoch": 1.78, "learning_rate": 3.372327823298711e-05, "loss": 0.0078, "step": 684830 }, { "epoch": 1.78, "learning_rate": 3.371939001661564e-05, "loss": 0.0083, "step": 684840 }, { "epoch": 1.78, "learning_rate": 3.371550180024418e-05, "loss": 0.0074, "step": 684850 }, { "epoch": 1.78, "learning_rate": 3.371161358387271e-05, "loss": 0.0074, "step": 684860 }, { "epoch": 1.78, "learning_rate": 3.370772536750125e-05, "loss": 0.0107, "step": 684870 }, { "epoch": 1.78, "learning_rate": 3.370383715112978e-05, "loss": 0.0078, "step": 684880 }, { "epoch": 1.78, "learning_rate": 3.369994893475832e-05, "loss": 0.0069, "step": 684890 }, { "epoch": 1.78, "learning_rate": 3.369606071838685e-05, "loss": 0.0073, "step": 684900 }, { "epoch": 1.78, "learning_rate": 3.369217250201539e-05, "loss": 0.008, "step": 684910 }, { "epoch": 1.78, "learning_rate": 3.368828428564393e-05, "loss": 0.0061, "step": 684920 }, { "epoch": 1.78, "learning_rate": 3.368439606927246e-05, "loss": 0.0072, "step": 684930 }, { "epoch": 1.78, "learning_rate": 3.3680507852901e-05, "loss": 0.0075, "step": 684940 }, { "epoch": 1.78, "learning_rate": 3.367661963652953e-05, "loss": 0.0099, "step": 684950 }, { "epoch": 1.78, "learning_rate": 3.367273142015807e-05, "loss": 0.0072, "step": 684960 }, { "epoch": 1.78, "learning_rate": 3.36688432037866e-05, "loss": 0.0065, "step": 684970 }, { "epoch": 1.78, "learning_rate": 3.366495498741514e-05, "loss": 0.0092, "step": 684980 }, { "epoch": 1.78, "learning_rate": 3.366106677104367e-05, "loss": 0.0129, "step": 684990 }, { "epoch": 1.78, "learning_rate": 3.365717855467221e-05, "loss": 0.0097, "step": 685000 }, { "epoch": 1.78, "eval_cer": 0.881688689953826, "eval_loss": 0.004874881356954575, "eval_runtime": 107.9053, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 685000 }, { "epoch": 1.78, "learning_rate": 3.365329033830074e-05, "loss": 0.0082, "step": 685010 }, { "epoch": 1.78, "learning_rate": 3.364940212192928e-05, "loss": 0.0099, "step": 685020 }, { "epoch": 1.78, "learning_rate": 3.364551390555781e-05, "loss": 0.0086, "step": 685030 }, { "epoch": 1.78, "learning_rate": 3.364162568918635e-05, "loss": 0.0072, "step": 685040 }, { "epoch": 1.78, "learning_rate": 3.363773747281489e-05, "loss": 0.0082, "step": 685050 }, { "epoch": 1.78, "learning_rate": 3.363384925644342e-05, "loss": 0.0096, "step": 685060 }, { "epoch": 1.78, "learning_rate": 3.362996104007196e-05, "loss": 0.0063, "step": 685070 }, { "epoch": 1.78, "learning_rate": 3.362607282370049e-05, "loss": 0.0074, "step": 685080 }, { "epoch": 1.78, "learning_rate": 3.362218460732902e-05, "loss": 0.0078, "step": 685090 }, { "epoch": 1.78, "learning_rate": 3.361829639095756e-05, "loss": 0.0064, "step": 685100 }, { "epoch": 1.78, "learning_rate": 3.36144081745861e-05, "loss": 0.0073, "step": 685110 }, { "epoch": 1.78, "learning_rate": 3.361051995821463e-05, "loss": 0.0066, "step": 685120 }, { "epoch": 1.78, "learning_rate": 3.360663174184317e-05, "loss": 0.0082, "step": 685130 }, { "epoch": 1.78, "learning_rate": 3.36027435254717e-05, "loss": 0.0118, "step": 685140 }, { "epoch": 1.78, "learning_rate": 3.359885530910024e-05, "loss": 0.0082, "step": 685150 }, { "epoch": 1.78, "learning_rate": 3.359496709272877e-05, "loss": 0.0077, "step": 685160 }, { "epoch": 1.78, "learning_rate": 3.359107887635731e-05, "loss": 0.0081, "step": 685170 }, { "epoch": 1.78, "learning_rate": 3.358719065998585e-05, "loss": 0.0075, "step": 685180 }, { "epoch": 1.78, "learning_rate": 3.358330244361438e-05, "loss": 0.0071, "step": 685190 }, { "epoch": 1.78, "learning_rate": 3.357941422724292e-05, "loss": 0.0069, "step": 685200 }, { "epoch": 1.78, "learning_rate": 3.3575526010871446e-05, "loss": 0.009, "step": 685210 }, { "epoch": 1.78, "learning_rate": 3.357163779449998e-05, "loss": 0.0065, "step": 685220 }, { "epoch": 1.78, "learning_rate": 3.356774957812852e-05, "loss": 0.0049, "step": 685230 }, { "epoch": 1.78, "learning_rate": 3.356386136175706e-05, "loss": 0.0079, "step": 685240 }, { "epoch": 1.78, "learning_rate": 3.355997314538559e-05, "loss": 0.0082, "step": 685250 }, { "epoch": 1.78, "learning_rate": 3.355608492901413e-05, "loss": 0.0107, "step": 685260 }, { "epoch": 1.78, "learning_rate": 3.355219671264266e-05, "loss": 0.0074, "step": 685270 }, { "epoch": 1.78, "learning_rate": 3.35483084962712e-05, "loss": 0.0079, "step": 685280 }, { "epoch": 1.78, "learning_rate": 3.354442027989973e-05, "loss": 0.008, "step": 685290 }, { "epoch": 1.78, "learning_rate": 3.3540532063528267e-05, "loss": 0.0106, "step": 685300 }, { "epoch": 1.78, "learning_rate": 3.353664384715681e-05, "loss": 0.007, "step": 685310 }, { "epoch": 1.78, "learning_rate": 3.353275563078534e-05, "loss": 0.0063, "step": 685320 }, { "epoch": 1.78, "learning_rate": 3.352886741441388e-05, "loss": 0.0116, "step": 685330 }, { "epoch": 1.78, "learning_rate": 3.3524979198042406e-05, "loss": 0.0076, "step": 685340 }, { "epoch": 1.78, "learning_rate": 3.352109098167094e-05, "loss": 0.0101, "step": 685350 }, { "epoch": 1.78, "learning_rate": 3.351720276529948e-05, "loss": 0.0061, "step": 685360 }, { "epoch": 1.78, "learning_rate": 3.351331454892802e-05, "loss": 0.0079, "step": 685370 }, { "epoch": 1.78, "learning_rate": 3.350942633255655e-05, "loss": 0.0092, "step": 685380 }, { "epoch": 1.78, "learning_rate": 3.350553811618509e-05, "loss": 0.0097, "step": 685390 }, { "epoch": 1.78, "learning_rate": 3.350164989981362e-05, "loss": 0.0135, "step": 685400 }, { "epoch": 1.78, "learning_rate": 3.349776168344216e-05, "loss": 0.0074, "step": 685410 }, { "epoch": 1.78, "learning_rate": 3.349387346707069e-05, "loss": 0.0075, "step": 685420 }, { "epoch": 1.78, "learning_rate": 3.3489985250699227e-05, "loss": 0.0089, "step": 685430 }, { "epoch": 1.78, "learning_rate": 3.348609703432777e-05, "loss": 0.0082, "step": 685440 }, { "epoch": 1.78, "learning_rate": 3.34822088179563e-05, "loss": 0.0054, "step": 685450 }, { "epoch": 1.78, "learning_rate": 3.347832060158483e-05, "loss": 0.0064, "step": 685460 }, { "epoch": 1.78, "learning_rate": 3.3474432385213366e-05, "loss": 0.0065, "step": 685470 }, { "epoch": 1.78, "learning_rate": 3.34705441688419e-05, "loss": 0.0103, "step": 685480 }, { "epoch": 1.78, "learning_rate": 3.346665595247044e-05, "loss": 0.0104, "step": 685490 }, { "epoch": 1.78, "learning_rate": 3.346276773609898e-05, "loss": 0.0078, "step": 685500 }, { "epoch": 1.78, "learning_rate": 3.345887951972751e-05, "loss": 0.0073, "step": 685510 }, { "epoch": 1.78, "learning_rate": 3.345499130335605e-05, "loss": 0.0074, "step": 685520 }, { "epoch": 1.78, "learning_rate": 3.345110308698458e-05, "loss": 0.0078, "step": 685530 }, { "epoch": 1.78, "learning_rate": 3.344721487061312e-05, "loss": 0.0063, "step": 685540 }, { "epoch": 1.78, "learning_rate": 3.344332665424165e-05, "loss": 0.0123, "step": 685550 }, { "epoch": 1.78, "learning_rate": 3.3439438437870187e-05, "loss": 0.0067, "step": 685560 }, { "epoch": 1.78, "learning_rate": 3.343555022149872e-05, "loss": 0.0095, "step": 685570 }, { "epoch": 1.78, "learning_rate": 3.343166200512726e-05, "loss": 0.0071, "step": 685580 }, { "epoch": 1.78, "learning_rate": 3.342777378875579e-05, "loss": 0.0072, "step": 685590 }, { "epoch": 1.78, "learning_rate": 3.3423885572384326e-05, "loss": 0.0056, "step": 685600 }, { "epoch": 1.78, "learning_rate": 3.341999735601286e-05, "loss": 0.0069, "step": 685610 }, { "epoch": 1.78, "learning_rate": 3.3416109139641396e-05, "loss": 0.008, "step": 685620 }, { "epoch": 1.78, "learning_rate": 3.341222092326994e-05, "loss": 0.0076, "step": 685630 }, { "epoch": 1.78, "learning_rate": 3.340833270689847e-05, "loss": 0.0088, "step": 685640 }, { "epoch": 1.78, "learning_rate": 3.340444449052701e-05, "loss": 0.0096, "step": 685650 }, { "epoch": 1.78, "learning_rate": 3.340055627415554e-05, "loss": 0.0053, "step": 685660 }, { "epoch": 1.78, "learning_rate": 3.339666805778408e-05, "loss": 0.0078, "step": 685670 }, { "epoch": 1.78, "learning_rate": 3.339277984141261e-05, "loss": 0.0074, "step": 685680 }, { "epoch": 1.78, "learning_rate": 3.3388891625041147e-05, "loss": 0.0085, "step": 685690 }, { "epoch": 1.78, "learning_rate": 3.338500340866968e-05, "loss": 0.0078, "step": 685700 }, { "epoch": 1.78, "learning_rate": 3.3381115192298216e-05, "loss": 0.011, "step": 685710 }, { "epoch": 1.78, "learning_rate": 3.337722697592675e-05, "loss": 0.009, "step": 685720 }, { "epoch": 1.78, "learning_rate": 3.3373338759555286e-05, "loss": 0.0065, "step": 685730 }, { "epoch": 1.78, "learning_rate": 3.336945054318382e-05, "loss": 0.0064, "step": 685740 }, { "epoch": 1.78, "learning_rate": 3.3365562326812356e-05, "loss": 0.0059, "step": 685750 }, { "epoch": 1.78, "learning_rate": 3.33616741104409e-05, "loss": 0.0058, "step": 685760 }, { "epoch": 1.78, "learning_rate": 3.335778589406943e-05, "loss": 0.0075, "step": 685770 }, { "epoch": 1.78, "learning_rate": 3.335389767769797e-05, "loss": 0.0057, "step": 685780 }, { "epoch": 1.78, "learning_rate": 3.33500094613265e-05, "loss": 0.0085, "step": 685790 }, { "epoch": 1.78, "learning_rate": 3.334612124495504e-05, "loss": 0.0078, "step": 685800 }, { "epoch": 1.78, "learning_rate": 3.334223302858357e-05, "loss": 0.0054, "step": 685810 }, { "epoch": 1.78, "learning_rate": 3.3338344812212106e-05, "loss": 0.0112, "step": 685820 }, { "epoch": 1.78, "learning_rate": 3.333445659584064e-05, "loss": 0.0086, "step": 685830 }, { "epoch": 1.78, "learning_rate": 3.3330568379469176e-05, "loss": 0.0119, "step": 685840 }, { "epoch": 1.78, "learning_rate": 3.332668016309771e-05, "loss": 0.0054, "step": 685850 }, { "epoch": 1.78, "learning_rate": 3.3322791946726246e-05, "loss": 0.0076, "step": 685860 }, { "epoch": 1.78, "learning_rate": 3.331890373035478e-05, "loss": 0.009, "step": 685870 }, { "epoch": 1.78, "learning_rate": 3.3315015513983316e-05, "loss": 0.0089, "step": 685880 }, { "epoch": 1.78, "learning_rate": 3.331112729761186e-05, "loss": 0.0068, "step": 685890 }, { "epoch": 1.78, "learning_rate": 3.330723908124039e-05, "loss": 0.0081, "step": 685900 }, { "epoch": 1.78, "learning_rate": 3.330335086486893e-05, "loss": 0.009, "step": 685910 }, { "epoch": 1.78, "learning_rate": 3.329946264849746e-05, "loss": 0.0084, "step": 685920 }, { "epoch": 1.78, "learning_rate": 3.3295574432126e-05, "loss": 0.0084, "step": 685930 }, { "epoch": 1.78, "learning_rate": 3.329168621575453e-05, "loss": 0.0112, "step": 685940 }, { "epoch": 1.78, "learning_rate": 3.3287797999383066e-05, "loss": 0.008, "step": 685950 }, { "epoch": 1.78, "learning_rate": 3.32839097830116e-05, "loss": 0.005, "step": 685960 }, { "epoch": 1.78, "learning_rate": 3.3280021566640136e-05, "loss": 0.0063, "step": 685970 }, { "epoch": 1.78, "learning_rate": 3.327613335026867e-05, "loss": 0.0068, "step": 685980 }, { "epoch": 1.78, "learning_rate": 3.3272245133897206e-05, "loss": 0.0093, "step": 685990 }, { "epoch": 1.78, "learning_rate": 3.326835691752574e-05, "loss": 0.0074, "step": 686000 }, { "epoch": 1.78, "eval_cer": 0.8816746935844841, "eval_loss": 0.004924887791275978, "eval_runtime": 107.9307, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 686000 }, { "epoch": 1.78, "learning_rate": 3.3264468701154276e-05, "loss": 0.0065, "step": 686010 }, { "epoch": 1.78, "learning_rate": 3.326058048478282e-05, "loss": 0.0071, "step": 686020 }, { "epoch": 1.78, "learning_rate": 3.325669226841135e-05, "loss": 0.0117, "step": 686030 }, { "epoch": 1.78, "learning_rate": 3.325280405203989e-05, "loss": 0.0079, "step": 686040 }, { "epoch": 1.78, "learning_rate": 3.324891583566842e-05, "loss": 0.0103, "step": 686050 }, { "epoch": 1.78, "learning_rate": 3.324502761929696e-05, "loss": 0.0077, "step": 686060 }, { "epoch": 1.78, "learning_rate": 3.324113940292549e-05, "loss": 0.007, "step": 686070 }, { "epoch": 1.78, "learning_rate": 3.3237251186554026e-05, "loss": 0.0069, "step": 686080 }, { "epoch": 1.78, "learning_rate": 3.323336297018256e-05, "loss": 0.01, "step": 686090 }, { "epoch": 1.78, "learning_rate": 3.3229474753811096e-05, "loss": 0.0075, "step": 686100 }, { "epoch": 1.78, "learning_rate": 3.322558653743963e-05, "loss": 0.0079, "step": 686110 }, { "epoch": 1.78, "learning_rate": 3.3221698321068166e-05, "loss": 0.0097, "step": 686120 }, { "epoch": 1.78, "learning_rate": 3.32178101046967e-05, "loss": 0.0054, "step": 686130 }, { "epoch": 1.78, "learning_rate": 3.3213921888325236e-05, "loss": 0.006, "step": 686140 }, { "epoch": 1.78, "learning_rate": 3.321003367195378e-05, "loss": 0.006, "step": 686150 }, { "epoch": 1.78, "learning_rate": 3.320614545558231e-05, "loss": 0.0096, "step": 686160 }, { "epoch": 1.78, "learning_rate": 3.320225723921085e-05, "loss": 0.0086, "step": 686170 }, { "epoch": 1.78, "learning_rate": 3.319836902283938e-05, "loss": 0.007, "step": 686180 }, { "epoch": 1.78, "learning_rate": 3.319448080646792e-05, "loss": 0.0061, "step": 686190 }, { "epoch": 1.78, "learning_rate": 3.319059259009645e-05, "loss": 0.0064, "step": 686200 }, { "epoch": 1.78, "learning_rate": 3.3186704373724986e-05, "loss": 0.007, "step": 686210 }, { "epoch": 1.78, "learning_rate": 3.318281615735352e-05, "loss": 0.0076, "step": 686220 }, { "epoch": 1.78, "learning_rate": 3.3178927940982056e-05, "loss": 0.0054, "step": 686230 }, { "epoch": 1.78, "learning_rate": 3.317503972461059e-05, "loss": 0.0098, "step": 686240 }, { "epoch": 1.78, "learning_rate": 3.3171151508239126e-05, "loss": 0.0072, "step": 686250 }, { "epoch": 1.78, "learning_rate": 3.316726329186766e-05, "loss": 0.0095, "step": 686260 }, { "epoch": 1.78, "learning_rate": 3.3163375075496196e-05, "loss": 0.0084, "step": 686270 }, { "epoch": 1.78, "learning_rate": 3.315948685912474e-05, "loss": 0.0067, "step": 686280 }, { "epoch": 1.78, "learning_rate": 3.315559864275327e-05, "loss": 0.0081, "step": 686290 }, { "epoch": 1.78, "learning_rate": 3.315171042638181e-05, "loss": 0.0062, "step": 686300 }, { "epoch": 1.78, "learning_rate": 3.314782221001034e-05, "loss": 0.0089, "step": 686310 }, { "epoch": 1.78, "learning_rate": 3.314393399363888e-05, "loss": 0.0078, "step": 686320 }, { "epoch": 1.78, "learning_rate": 3.314004577726741e-05, "loss": 0.0072, "step": 686330 }, { "epoch": 1.78, "learning_rate": 3.3136157560895946e-05, "loss": 0.0149, "step": 686340 }, { "epoch": 1.78, "learning_rate": 3.313226934452448e-05, "loss": 0.0058, "step": 686350 }, { "epoch": 1.78, "learning_rate": 3.3128381128153016e-05, "loss": 0.0061, "step": 686360 }, { "epoch": 1.78, "learning_rate": 3.312449291178155e-05, "loss": 0.0052, "step": 686370 }, { "epoch": 1.78, "learning_rate": 3.3120604695410086e-05, "loss": 0.0069, "step": 686380 }, { "epoch": 1.78, "learning_rate": 3.311671647903862e-05, "loss": 0.0063, "step": 686390 }, { "epoch": 1.78, "learning_rate": 3.3112828262667156e-05, "loss": 0.006, "step": 686400 }, { "epoch": 1.78, "learning_rate": 3.31089400462957e-05, "loss": 0.0077, "step": 686410 }, { "epoch": 1.78, "learning_rate": 3.310505182992423e-05, "loss": 0.0067, "step": 686420 }, { "epoch": 1.78, "learning_rate": 3.310116361355277e-05, "loss": 0.0083, "step": 686430 }, { "epoch": 1.78, "learning_rate": 3.30972753971813e-05, "loss": 0.0084, "step": 686440 }, { "epoch": 1.78, "learning_rate": 3.309338718080983e-05, "loss": 0.0084, "step": 686450 }, { "epoch": 1.78, "learning_rate": 3.308949896443837e-05, "loss": 0.0071, "step": 686460 }, { "epoch": 1.78, "learning_rate": 3.3085610748066906e-05, "loss": 0.0061, "step": 686470 }, { "epoch": 1.78, "learning_rate": 3.308172253169544e-05, "loss": 0.0068, "step": 686480 }, { "epoch": 1.78, "learning_rate": 3.3077834315323976e-05, "loss": 0.0073, "step": 686490 }, { "epoch": 1.78, "learning_rate": 3.307394609895251e-05, "loss": 0.0066, "step": 686500 }, { "epoch": 1.78, "learning_rate": 3.3070057882581046e-05, "loss": 0.0073, "step": 686510 }, { "epoch": 1.78, "learning_rate": 3.306616966620958e-05, "loss": 0.0071, "step": 686520 }, { "epoch": 1.78, "learning_rate": 3.3062281449838116e-05, "loss": 0.0081, "step": 686530 }, { "epoch": 1.78, "learning_rate": 3.305839323346666e-05, "loss": 0.0059, "step": 686540 }, { "epoch": 1.78, "learning_rate": 3.305450501709519e-05, "loss": 0.0088, "step": 686550 }, { "epoch": 1.78, "learning_rate": 3.305061680072373e-05, "loss": 0.0073, "step": 686560 }, { "epoch": 1.78, "learning_rate": 3.304672858435226e-05, "loss": 0.007, "step": 686570 }, { "epoch": 1.78, "learning_rate": 3.304284036798079e-05, "loss": 0.0077, "step": 686580 }, { "epoch": 1.78, "learning_rate": 3.303895215160933e-05, "loss": 0.007, "step": 686590 }, { "epoch": 1.78, "learning_rate": 3.3035063935237866e-05, "loss": 0.0062, "step": 686600 }, { "epoch": 1.78, "learning_rate": 3.30311757188664e-05, "loss": 0.0061, "step": 686610 }, { "epoch": 1.78, "learning_rate": 3.3027287502494936e-05, "loss": 0.0065, "step": 686620 }, { "epoch": 1.78, "learning_rate": 3.302339928612347e-05, "loss": 0.0089, "step": 686630 }, { "epoch": 1.78, "learning_rate": 3.3019511069752006e-05, "loss": 0.0064, "step": 686640 }, { "epoch": 1.78, "learning_rate": 3.301562285338054e-05, "loss": 0.007, "step": 686650 }, { "epoch": 1.78, "learning_rate": 3.3011734637009076e-05, "loss": 0.0065, "step": 686660 }, { "epoch": 1.78, "learning_rate": 3.300784642063762e-05, "loss": 0.0094, "step": 686670 }, { "epoch": 1.78, "learning_rate": 3.300395820426615e-05, "loss": 0.0074, "step": 686680 }, { "epoch": 1.78, "learning_rate": 3.300006998789469e-05, "loss": 0.0065, "step": 686690 }, { "epoch": 1.78, "learning_rate": 3.2996181771523215e-05, "loss": 0.0083, "step": 686700 }, { "epoch": 1.78, "learning_rate": 3.299229355515175e-05, "loss": 0.0064, "step": 686710 }, { "epoch": 1.78, "learning_rate": 3.298840533878029e-05, "loss": 0.0078, "step": 686720 }, { "epoch": 1.78, "learning_rate": 3.2984517122408826e-05, "loss": 0.0113, "step": 686730 }, { "epoch": 1.78, "learning_rate": 3.298062890603736e-05, "loss": 0.005, "step": 686740 }, { "epoch": 1.78, "learning_rate": 3.2976740689665896e-05, "loss": 0.0062, "step": 686750 }, { "epoch": 1.78, "learning_rate": 3.297285247329443e-05, "loss": 0.0065, "step": 686760 }, { "epoch": 1.78, "learning_rate": 3.2968964256922966e-05, "loss": 0.0071, "step": 686770 }, { "epoch": 1.78, "learning_rate": 3.29650760405515e-05, "loss": 0.0081, "step": 686780 }, { "epoch": 1.78, "learning_rate": 3.2961187824180035e-05, "loss": 0.0058, "step": 686790 }, { "epoch": 1.78, "learning_rate": 3.295729960780858e-05, "loss": 0.0089, "step": 686800 }, { "epoch": 1.78, "learning_rate": 3.295341139143711e-05, "loss": 0.0082, "step": 686810 }, { "epoch": 1.78, "learning_rate": 3.294952317506565e-05, "loss": 0.0064, "step": 686820 }, { "epoch": 1.78, "learning_rate": 3.2945634958694175e-05, "loss": 0.0067, "step": 686830 }, { "epoch": 1.78, "learning_rate": 3.294174674232271e-05, "loss": 0.0055, "step": 686840 }, { "epoch": 1.78, "learning_rate": 3.293785852595125e-05, "loss": 0.0109, "step": 686850 }, { "epoch": 1.78, "learning_rate": 3.2933970309579786e-05, "loss": 0.0075, "step": 686860 }, { "epoch": 1.78, "learning_rate": 3.293008209320832e-05, "loss": 0.0083, "step": 686870 }, { "epoch": 1.78, "learning_rate": 3.2926193876836856e-05, "loss": 0.008, "step": 686880 }, { "epoch": 1.78, "learning_rate": 3.292230566046539e-05, "loss": 0.0085, "step": 686890 }, { "epoch": 1.78, "learning_rate": 3.2918417444093926e-05, "loss": 0.0095, "step": 686900 }, { "epoch": 1.78, "learning_rate": 3.291452922772246e-05, "loss": 0.0082, "step": 686910 }, { "epoch": 1.78, "learning_rate": 3.2910641011350995e-05, "loss": 0.0086, "step": 686920 }, { "epoch": 1.78, "learning_rate": 3.290675279497953e-05, "loss": 0.0103, "step": 686930 }, { "epoch": 1.78, "learning_rate": 3.290286457860807e-05, "loss": 0.0084, "step": 686940 }, { "epoch": 1.78, "learning_rate": 3.28989763622366e-05, "loss": 0.0093, "step": 686950 }, { "epoch": 1.78, "learning_rate": 3.2895088145865135e-05, "loss": 0.0084, "step": 686960 }, { "epoch": 1.78, "learning_rate": 3.289119992949367e-05, "loss": 0.0088, "step": 686970 }, { "epoch": 1.78, "learning_rate": 3.2887311713122205e-05, "loss": 0.0093, "step": 686980 }, { "epoch": 1.78, "learning_rate": 3.2883423496750746e-05, "loss": 0.0066, "step": 686990 }, { "epoch": 1.78, "learning_rate": 3.287953528037928e-05, "loss": 0.0064, "step": 687000 }, { "epoch": 1.78, "eval_cer": 0.8816662957628791, "eval_loss": 0.004868320655077696, "eval_runtime": 107.8854, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.635, "step": 687000 }, { "epoch": 1.78, "learning_rate": 3.2875647064007816e-05, "loss": 0.0093, "step": 687010 }, { "epoch": 1.78, "learning_rate": 3.287175884763635e-05, "loss": 0.0051, "step": 687020 }, { "epoch": 1.78, "learning_rate": 3.2867870631264886e-05, "loss": 0.0068, "step": 687030 }, { "epoch": 1.78, "learning_rate": 3.286398241489342e-05, "loss": 0.0066, "step": 687040 }, { "epoch": 1.78, "learning_rate": 3.2860094198521955e-05, "loss": 0.0083, "step": 687050 }, { "epoch": 1.78, "learning_rate": 3.285620598215049e-05, "loss": 0.0089, "step": 687060 }, { "epoch": 1.78, "learning_rate": 3.2852317765779025e-05, "loss": 0.0077, "step": 687070 }, { "epoch": 1.78, "learning_rate": 3.284842954940756e-05, "loss": 0.0076, "step": 687080 }, { "epoch": 1.78, "learning_rate": 3.2844541333036095e-05, "loss": 0.0122, "step": 687090 }, { "epoch": 1.78, "learning_rate": 3.284065311666463e-05, "loss": 0.0073, "step": 687100 }, { "epoch": 1.78, "learning_rate": 3.2836764900293165e-05, "loss": 0.0101, "step": 687110 }, { "epoch": 1.78, "learning_rate": 3.2832876683921706e-05, "loss": 0.0085, "step": 687120 }, { "epoch": 1.78, "learning_rate": 3.282898846755024e-05, "loss": 0.0078, "step": 687130 }, { "epoch": 1.78, "learning_rate": 3.2825100251178776e-05, "loss": 0.0062, "step": 687140 }, { "epoch": 1.78, "learning_rate": 3.282121203480731e-05, "loss": 0.0093, "step": 687150 }, { "epoch": 1.78, "learning_rate": 3.2817323818435846e-05, "loss": 0.0081, "step": 687160 }, { "epoch": 1.78, "learning_rate": 3.281343560206438e-05, "loss": 0.0061, "step": 687170 }, { "epoch": 1.78, "learning_rate": 3.2809547385692915e-05, "loss": 0.0075, "step": 687180 }, { "epoch": 1.78, "learning_rate": 3.280565916932145e-05, "loss": 0.0095, "step": 687190 }, { "epoch": 1.78, "learning_rate": 3.2801770952949985e-05, "loss": 0.0086, "step": 687200 }, { "epoch": 1.78, "learning_rate": 3.279788273657852e-05, "loss": 0.008, "step": 687210 }, { "epoch": 1.78, "learning_rate": 3.2793994520207055e-05, "loss": 0.007, "step": 687220 }, { "epoch": 1.78, "learning_rate": 3.279010630383559e-05, "loss": 0.0073, "step": 687230 }, { "epoch": 1.78, "learning_rate": 3.2786218087464125e-05, "loss": 0.0079, "step": 687240 }, { "epoch": 1.78, "learning_rate": 3.2782329871092666e-05, "loss": 0.0058, "step": 687250 }, { "epoch": 1.78, "learning_rate": 3.27784416547212e-05, "loss": 0.0062, "step": 687260 }, { "epoch": 1.78, "learning_rate": 3.2774553438349736e-05, "loss": 0.0112, "step": 687270 }, { "epoch": 1.78, "learning_rate": 3.277066522197827e-05, "loss": 0.0095, "step": 687280 }, { "epoch": 1.78, "learning_rate": 3.2766777005606806e-05, "loss": 0.0077, "step": 687290 }, { "epoch": 1.78, "learning_rate": 3.276288878923534e-05, "loss": 0.0064, "step": 687300 }, { "epoch": 1.78, "learning_rate": 3.2759000572863875e-05, "loss": 0.0066, "step": 687310 }, { "epoch": 1.78, "learning_rate": 3.275511235649241e-05, "loss": 0.0082, "step": 687320 }, { "epoch": 1.78, "learning_rate": 3.2751224140120945e-05, "loss": 0.0075, "step": 687330 }, { "epoch": 1.78, "learning_rate": 3.274733592374948e-05, "loss": 0.006, "step": 687340 }, { "epoch": 1.78, "learning_rate": 3.2743447707378015e-05, "loss": 0.0073, "step": 687350 }, { "epoch": 1.78, "learning_rate": 3.273955949100655e-05, "loss": 0.0064, "step": 687360 }, { "epoch": 1.78, "learning_rate": 3.2735671274635085e-05, "loss": 0.0082, "step": 687370 }, { "epoch": 1.78, "learning_rate": 3.2731783058263626e-05, "loss": 0.0063, "step": 687380 }, { "epoch": 1.78, "learning_rate": 3.272789484189216e-05, "loss": 0.0056, "step": 687390 }, { "epoch": 1.78, "learning_rate": 3.2724006625520696e-05, "loss": 0.0104, "step": 687400 }, { "epoch": 1.78, "learning_rate": 3.272011840914923e-05, "loss": 0.0094, "step": 687410 }, { "epoch": 1.78, "learning_rate": 3.2716230192777766e-05, "loss": 0.0103, "step": 687420 }, { "epoch": 1.78, "learning_rate": 3.27123419764063e-05, "loss": 0.008, "step": 687430 }, { "epoch": 1.78, "learning_rate": 3.2708453760034835e-05, "loss": 0.0074, "step": 687440 }, { "epoch": 1.78, "learning_rate": 3.270456554366337e-05, "loss": 0.0057, "step": 687450 }, { "epoch": 1.78, "learning_rate": 3.2700677327291905e-05, "loss": 0.0078, "step": 687460 }, { "epoch": 1.78, "learning_rate": 3.269678911092044e-05, "loss": 0.0078, "step": 687470 }, { "epoch": 1.78, "learning_rate": 3.2692900894548975e-05, "loss": 0.0104, "step": 687480 }, { "epoch": 1.78, "learning_rate": 3.268901267817751e-05, "loss": 0.0094, "step": 687490 }, { "epoch": 1.78, "learning_rate": 3.2685124461806045e-05, "loss": 0.008, "step": 687500 }, { "epoch": 1.78, "learning_rate": 3.2681236245434586e-05, "loss": 0.0078, "step": 687510 }, { "epoch": 1.78, "learning_rate": 3.267734802906312e-05, "loss": 0.0076, "step": 687520 }, { "epoch": 1.78, "learning_rate": 3.2673459812691656e-05, "loss": 0.007, "step": 687530 }, { "epoch": 1.78, "learning_rate": 3.266957159632019e-05, "loss": 0.0082, "step": 687540 }, { "epoch": 1.78, "learning_rate": 3.2665683379948726e-05, "loss": 0.0063, "step": 687550 }, { "epoch": 1.78, "learning_rate": 3.266179516357726e-05, "loss": 0.006, "step": 687560 }, { "epoch": 1.78, "learning_rate": 3.2657906947205795e-05, "loss": 0.0081, "step": 687570 }, { "epoch": 1.78, "learning_rate": 3.265401873083433e-05, "loss": 0.009, "step": 687580 }, { "epoch": 1.78, "learning_rate": 3.2650130514462865e-05, "loss": 0.008, "step": 687590 }, { "epoch": 1.78, "learning_rate": 3.26462422980914e-05, "loss": 0.0057, "step": 687600 }, { "epoch": 1.78, "learning_rate": 3.2642354081719935e-05, "loss": 0.0083, "step": 687610 }, { "epoch": 1.78, "learning_rate": 3.263846586534847e-05, "loss": 0.0093, "step": 687620 }, { "epoch": 1.78, "learning_rate": 3.2634577648977005e-05, "loss": 0.0091, "step": 687630 }, { "epoch": 1.78, "learning_rate": 3.2630689432605546e-05, "loss": 0.006, "step": 687640 }, { "epoch": 1.78, "learning_rate": 3.262680121623408e-05, "loss": 0.0085, "step": 687650 }, { "epoch": 1.78, "learning_rate": 3.2622912999862616e-05, "loss": 0.0086, "step": 687660 }, { "epoch": 1.78, "learning_rate": 3.261902478349115e-05, "loss": 0.0073, "step": 687670 }, { "epoch": 1.78, "learning_rate": 3.2615136567119686e-05, "loss": 0.0076, "step": 687680 }, { "epoch": 1.78, "learning_rate": 3.261124835074822e-05, "loss": 0.0068, "step": 687690 }, { "epoch": 1.78, "learning_rate": 3.2607360134376755e-05, "loss": 0.0054, "step": 687700 }, { "epoch": 1.78, "learning_rate": 3.260347191800529e-05, "loss": 0.008, "step": 687710 }, { "epoch": 1.78, "learning_rate": 3.2599583701633825e-05, "loss": 0.007, "step": 687720 }, { "epoch": 1.78, "learning_rate": 3.259569548526236e-05, "loss": 0.007, "step": 687730 }, { "epoch": 1.78, "learning_rate": 3.2591807268890895e-05, "loss": 0.0073, "step": 687740 }, { "epoch": 1.78, "learning_rate": 3.258791905251943e-05, "loss": 0.0071, "step": 687750 }, { "epoch": 1.78, "learning_rate": 3.2584030836147964e-05, "loss": 0.0072, "step": 687760 }, { "epoch": 1.78, "learning_rate": 3.2580142619776506e-05, "loss": 0.0072, "step": 687770 }, { "epoch": 1.78, "learning_rate": 3.257625440340504e-05, "loss": 0.0072, "step": 687780 }, { "epoch": 1.78, "learning_rate": 3.2572366187033576e-05, "loss": 0.0066, "step": 687790 }, { "epoch": 1.78, "learning_rate": 3.256847797066211e-05, "loss": 0.0075, "step": 687800 }, { "epoch": 1.78, "learning_rate": 3.2564589754290646e-05, "loss": 0.0093, "step": 687810 }, { "epoch": 1.78, "learning_rate": 3.256070153791918e-05, "loss": 0.0079, "step": 687820 }, { "epoch": 1.78, "learning_rate": 3.2556813321547715e-05, "loss": 0.0083, "step": 687830 }, { "epoch": 1.78, "learning_rate": 3.255292510517625e-05, "loss": 0.0072, "step": 687840 }, { "epoch": 1.78, "learning_rate": 3.2549036888804785e-05, "loss": 0.0123, "step": 687850 }, { "epoch": 1.78, "learning_rate": 3.254514867243332e-05, "loss": 0.0125, "step": 687860 }, { "epoch": 1.78, "learning_rate": 3.2541260456061855e-05, "loss": 0.0087, "step": 687870 }, { "epoch": 1.78, "learning_rate": 3.253737223969039e-05, "loss": 0.0067, "step": 687880 }, { "epoch": 1.78, "learning_rate": 3.2533484023318924e-05, "loss": 0.0069, "step": 687890 }, { "epoch": 1.78, "learning_rate": 3.2529595806947466e-05, "loss": 0.0073, "step": 687900 }, { "epoch": 1.78, "learning_rate": 3.2525707590576e-05, "loss": 0.0084, "step": 687910 }, { "epoch": 1.78, "learning_rate": 3.2521819374204536e-05, "loss": 0.0082, "step": 687920 }, { "epoch": 1.78, "learning_rate": 3.251793115783307e-05, "loss": 0.0063, "step": 687930 }, { "epoch": 1.78, "learning_rate": 3.25140429414616e-05, "loss": 0.0073, "step": 687940 }, { "epoch": 1.78, "learning_rate": 3.251015472509014e-05, "loss": 0.0078, "step": 687950 }, { "epoch": 1.78, "learning_rate": 3.2506266508718675e-05, "loss": 0.0093, "step": 687960 }, { "epoch": 1.78, "learning_rate": 3.250237829234721e-05, "loss": 0.0071, "step": 687970 }, { "epoch": 1.78, "learning_rate": 3.2498490075975745e-05, "loss": 0.0065, "step": 687980 }, { "epoch": 1.78, "learning_rate": 3.249460185960428e-05, "loss": 0.0078, "step": 687990 }, { "epoch": 1.78, "learning_rate": 3.2490713643232815e-05, "loss": 0.0107, "step": 688000 }, { "epoch": 1.78, "eval_cer": 0.8816928888646285, "eval_loss": 0.004783975426107645, "eval_runtime": 108.0049, "eval_samples_per_second": 18.518, "eval_steps_per_second": 4.629, "step": 688000 }, { "epoch": 1.78, "learning_rate": 3.248682542686135e-05, "loss": 0.0049, "step": 688010 }, { "epoch": 1.78, "learning_rate": 3.2482937210489884e-05, "loss": 0.0076, "step": 688020 }, { "epoch": 1.78, "learning_rate": 3.2479048994118426e-05, "loss": 0.0085, "step": 688030 }, { "epoch": 1.78, "learning_rate": 3.247516077774696e-05, "loss": 0.0049, "step": 688040 }, { "epoch": 1.78, "learning_rate": 3.2471272561375496e-05, "loss": 0.0089, "step": 688050 }, { "epoch": 1.78, "learning_rate": 3.246738434500403e-05, "loss": 0.0059, "step": 688060 }, { "epoch": 1.78, "learning_rate": 3.246349612863256e-05, "loss": 0.0085, "step": 688070 }, { "epoch": 1.78, "learning_rate": 3.24596079122611e-05, "loss": 0.0078, "step": 688080 }, { "epoch": 1.78, "learning_rate": 3.2455719695889635e-05, "loss": 0.0109, "step": 688090 }, { "epoch": 1.78, "learning_rate": 3.245183147951817e-05, "loss": 0.0076, "step": 688100 }, { "epoch": 1.78, "learning_rate": 3.2447943263146705e-05, "loss": 0.0114, "step": 688110 }, { "epoch": 1.78, "learning_rate": 3.244405504677524e-05, "loss": 0.0083, "step": 688120 }, { "epoch": 1.78, "learning_rate": 3.2440166830403775e-05, "loss": 0.005, "step": 688130 }, { "epoch": 1.78, "learning_rate": 3.243627861403231e-05, "loss": 0.008, "step": 688140 }, { "epoch": 1.78, "learning_rate": 3.2432390397660844e-05, "loss": 0.0078, "step": 688150 }, { "epoch": 1.78, "learning_rate": 3.2428502181289386e-05, "loss": 0.0086, "step": 688160 }, { "epoch": 1.78, "learning_rate": 3.242461396491792e-05, "loss": 0.006, "step": 688170 }, { "epoch": 1.78, "learning_rate": 3.2420725748546456e-05, "loss": 0.0111, "step": 688180 }, { "epoch": 1.78, "learning_rate": 3.2416837532174984e-05, "loss": 0.0073, "step": 688190 }, { "epoch": 1.78, "learning_rate": 3.241294931580352e-05, "loss": 0.0089, "step": 688200 }, { "epoch": 1.78, "learning_rate": 3.240906109943206e-05, "loss": 0.0112, "step": 688210 }, { "epoch": 1.78, "learning_rate": 3.2405172883060595e-05, "loss": 0.0077, "step": 688220 }, { "epoch": 1.78, "learning_rate": 3.240128466668913e-05, "loss": 0.0075, "step": 688230 }, { "epoch": 1.78, "learning_rate": 3.2397396450317665e-05, "loss": 0.0073, "step": 688240 }, { "epoch": 1.78, "learning_rate": 3.23935082339462e-05, "loss": 0.0068, "step": 688250 }, { "epoch": 1.78, "learning_rate": 3.2389620017574735e-05, "loss": 0.0091, "step": 688260 }, { "epoch": 1.78, "learning_rate": 3.238573180120327e-05, "loss": 0.0059, "step": 688270 }, { "epoch": 1.78, "learning_rate": 3.2381843584831804e-05, "loss": 0.0077, "step": 688280 }, { "epoch": 1.78, "learning_rate": 3.2377955368460346e-05, "loss": 0.0067, "step": 688290 }, { "epoch": 1.78, "learning_rate": 3.237406715208888e-05, "loss": 0.0055, "step": 688300 }, { "epoch": 1.78, "learning_rate": 3.237017893571741e-05, "loss": 0.0092, "step": 688310 }, { "epoch": 1.78, "learning_rate": 3.2366290719345944e-05, "loss": 0.0105, "step": 688320 }, { "epoch": 1.78, "learning_rate": 3.236240250297448e-05, "loss": 0.0072, "step": 688330 }, { "epoch": 1.78, "learning_rate": 3.235851428660302e-05, "loss": 0.0098, "step": 688340 }, { "epoch": 1.78, "learning_rate": 3.2354626070231555e-05, "loss": 0.0066, "step": 688350 }, { "epoch": 1.78, "learning_rate": 3.235073785386009e-05, "loss": 0.0076, "step": 688360 }, { "epoch": 1.78, "learning_rate": 3.2346849637488625e-05, "loss": 0.0085, "step": 688370 }, { "epoch": 1.78, "learning_rate": 3.234296142111716e-05, "loss": 0.0067, "step": 688380 }, { "epoch": 1.78, "learning_rate": 3.2339073204745695e-05, "loss": 0.0176, "step": 688390 }, { "epoch": 1.78, "learning_rate": 3.233518498837423e-05, "loss": 0.0105, "step": 688400 }, { "epoch": 1.78, "learning_rate": 3.2331296772002764e-05, "loss": 0.01, "step": 688410 }, { "epoch": 1.78, "learning_rate": 3.23274085556313e-05, "loss": 0.0085, "step": 688420 }, { "epoch": 1.78, "learning_rate": 3.232352033925984e-05, "loss": 0.007, "step": 688430 }, { "epoch": 1.78, "learning_rate": 3.231963212288837e-05, "loss": 0.0084, "step": 688440 }, { "epoch": 1.78, "learning_rate": 3.2315743906516904e-05, "loss": 0.0064, "step": 688450 }, { "epoch": 1.78, "learning_rate": 3.231185569014544e-05, "loss": 0.0095, "step": 688460 }, { "epoch": 1.78, "learning_rate": 3.2307967473773974e-05, "loss": 0.0086, "step": 688470 }, { "epoch": 1.78, "learning_rate": 3.2304079257402515e-05, "loss": 0.0088, "step": 688480 }, { "epoch": 1.78, "learning_rate": 3.230019104103105e-05, "loss": 0.0096, "step": 688490 }, { "epoch": 1.78, "learning_rate": 3.2296302824659585e-05, "loss": 0.0062, "step": 688500 }, { "epoch": 1.78, "learning_rate": 3.229241460828812e-05, "loss": 0.0059, "step": 688510 }, { "epoch": 1.78, "learning_rate": 3.2288526391916655e-05, "loss": 0.0058, "step": 688520 }, { "epoch": 1.78, "learning_rate": 3.228463817554519e-05, "loss": 0.0073, "step": 688530 }, { "epoch": 1.78, "learning_rate": 3.2280749959173724e-05, "loss": 0.0091, "step": 688540 }, { "epoch": 1.78, "learning_rate": 3.227686174280226e-05, "loss": 0.0086, "step": 688550 }, { "epoch": 1.78, "learning_rate": 3.2272973526430794e-05, "loss": 0.0062, "step": 688560 }, { "epoch": 1.78, "learning_rate": 3.226908531005933e-05, "loss": 0.0071, "step": 688570 }, { "epoch": 1.78, "learning_rate": 3.2265197093687864e-05, "loss": 0.0086, "step": 688580 }, { "epoch": 1.78, "learning_rate": 3.22613088773164e-05, "loss": 0.0076, "step": 688590 }, { "epoch": 1.78, "learning_rate": 3.2257420660944934e-05, "loss": 0.0086, "step": 688600 }, { "epoch": 1.78, "learning_rate": 3.2253532444573475e-05, "loss": 0.0102, "step": 688610 }, { "epoch": 1.79, "learning_rate": 3.224964422820201e-05, "loss": 0.0107, "step": 688620 }, { "epoch": 1.79, "learning_rate": 3.2245756011830545e-05, "loss": 0.0073, "step": 688630 }, { "epoch": 1.79, "learning_rate": 3.224186779545908e-05, "loss": 0.0069, "step": 688640 }, { "epoch": 1.79, "learning_rate": 3.2237979579087615e-05, "loss": 0.0089, "step": 688650 }, { "epoch": 1.79, "learning_rate": 3.223409136271615e-05, "loss": 0.0079, "step": 688660 }, { "epoch": 1.79, "learning_rate": 3.2230203146344684e-05, "loss": 0.0083, "step": 688670 }, { "epoch": 1.79, "learning_rate": 3.222631492997322e-05, "loss": 0.0073, "step": 688680 }, { "epoch": 1.79, "learning_rate": 3.2222426713601754e-05, "loss": 0.0079, "step": 688690 }, { "epoch": 1.79, "learning_rate": 3.221853849723029e-05, "loss": 0.0072, "step": 688700 }, { "epoch": 1.79, "learning_rate": 3.2214650280858824e-05, "loss": 0.0072, "step": 688710 }, { "epoch": 1.79, "learning_rate": 3.221076206448736e-05, "loss": 0.0052, "step": 688720 }, { "epoch": 1.79, "learning_rate": 3.2206873848115893e-05, "loss": 0.0061, "step": 688730 }, { "epoch": 1.79, "learning_rate": 3.2202985631744435e-05, "loss": 0.008, "step": 688740 }, { "epoch": 1.79, "learning_rate": 3.219909741537297e-05, "loss": 0.0052, "step": 688750 }, { "epoch": 1.79, "learning_rate": 3.2195209199001505e-05, "loss": 0.0071, "step": 688760 }, { "epoch": 1.79, "learning_rate": 3.219132098263004e-05, "loss": 0.0072, "step": 688770 }, { "epoch": 1.79, "learning_rate": 3.2187432766258575e-05, "loss": 0.0098, "step": 688780 }, { "epoch": 1.79, "learning_rate": 3.218354454988711e-05, "loss": 0.0095, "step": 688790 }, { "epoch": 1.79, "learning_rate": 3.2179656333515644e-05, "loss": 0.0076, "step": 688800 }, { "epoch": 1.79, "learning_rate": 3.217576811714418e-05, "loss": 0.0086, "step": 688810 }, { "epoch": 1.79, "learning_rate": 3.2171879900772714e-05, "loss": 0.0077, "step": 688820 }, { "epoch": 1.79, "learning_rate": 3.216799168440125e-05, "loss": 0.0081, "step": 688830 }, { "epoch": 1.79, "learning_rate": 3.2164103468029784e-05, "loss": 0.0078, "step": 688840 }, { "epoch": 1.79, "learning_rate": 3.216021525165832e-05, "loss": 0.0065, "step": 688850 }, { "epoch": 1.79, "learning_rate": 3.2156327035286853e-05, "loss": 0.0081, "step": 688860 }, { "epoch": 1.79, "learning_rate": 3.2152438818915395e-05, "loss": 0.007, "step": 688870 }, { "epoch": 1.79, "learning_rate": 3.214855060254393e-05, "loss": 0.0081, "step": 688880 }, { "epoch": 1.79, "learning_rate": 3.2144662386172465e-05, "loss": 0.0053, "step": 688890 }, { "epoch": 1.79, "learning_rate": 3.2140774169801e-05, "loss": 0.0048, "step": 688900 }, { "epoch": 1.79, "learning_rate": 3.2136885953429535e-05, "loss": 0.0073, "step": 688910 }, { "epoch": 1.79, "learning_rate": 3.213299773705807e-05, "loss": 0.0058, "step": 688920 }, { "epoch": 1.79, "learning_rate": 3.2129109520686604e-05, "loss": 0.0085, "step": 688930 }, { "epoch": 1.79, "learning_rate": 3.212522130431514e-05, "loss": 0.007, "step": 688940 }, { "epoch": 1.79, "learning_rate": 3.2121333087943674e-05, "loss": 0.0116, "step": 688950 }, { "epoch": 1.79, "learning_rate": 3.211744487157221e-05, "loss": 0.0109, "step": 688960 }, { "epoch": 1.79, "learning_rate": 3.2113556655200744e-05, "loss": 0.0059, "step": 688970 }, { "epoch": 1.79, "learning_rate": 3.210966843882928e-05, "loss": 0.0073, "step": 688980 }, { "epoch": 1.79, "learning_rate": 3.2105780222457813e-05, "loss": 0.006, "step": 688990 }, { "epoch": 1.79, "learning_rate": 3.2101892006086355e-05, "loss": 0.0075, "step": 689000 }, { "epoch": 1.79, "eval_cer": 0.881657897941274, "eval_loss": 0.0048148115165531635, "eval_runtime": 107.906, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 689000 }, { "epoch": 1.79, "learning_rate": 3.209800378971489e-05, "loss": 0.0083, "step": 689010 }, { "epoch": 1.79, "learning_rate": 3.2094115573343425e-05, "loss": 0.0053, "step": 689020 }, { "epoch": 1.79, "learning_rate": 3.209022735697196e-05, "loss": 0.0062, "step": 689030 }, { "epoch": 1.79, "learning_rate": 3.2086339140600495e-05, "loss": 0.0073, "step": 689040 }, { "epoch": 1.79, "learning_rate": 3.208245092422903e-05, "loss": 0.0072, "step": 689050 }, { "epoch": 1.79, "learning_rate": 3.2078562707857564e-05, "loss": 0.0068, "step": 689060 }, { "epoch": 1.79, "learning_rate": 3.20746744914861e-05, "loss": 0.0071, "step": 689070 }, { "epoch": 1.79, "learning_rate": 3.2070786275114634e-05, "loss": 0.0048, "step": 689080 }, { "epoch": 1.79, "learning_rate": 3.206689805874317e-05, "loss": 0.0067, "step": 689090 }, { "epoch": 1.79, "learning_rate": 3.2063009842371704e-05, "loss": 0.0065, "step": 689100 }, { "epoch": 1.79, "learning_rate": 3.205912162600024e-05, "loss": 0.0061, "step": 689110 }, { "epoch": 1.79, "learning_rate": 3.2055233409628773e-05, "loss": 0.0061, "step": 689120 }, { "epoch": 1.79, "learning_rate": 3.2051345193257315e-05, "loss": 0.0069, "step": 689130 }, { "epoch": 1.79, "learning_rate": 3.204745697688585e-05, "loss": 0.0068, "step": 689140 }, { "epoch": 1.79, "learning_rate": 3.2043568760514385e-05, "loss": 0.0071, "step": 689150 }, { "epoch": 1.79, "learning_rate": 3.203968054414292e-05, "loss": 0.0072, "step": 689160 }, { "epoch": 1.79, "learning_rate": 3.2035792327771455e-05, "loss": 0.0052, "step": 689170 }, { "epoch": 1.79, "learning_rate": 3.203190411139999e-05, "loss": 0.0079, "step": 689180 }, { "epoch": 1.79, "learning_rate": 3.2028015895028524e-05, "loss": 0.0061, "step": 689190 }, { "epoch": 1.79, "learning_rate": 3.202412767865706e-05, "loss": 0.01, "step": 689200 }, { "epoch": 1.79, "learning_rate": 3.2020239462285594e-05, "loss": 0.007, "step": 689210 }, { "epoch": 1.79, "learning_rate": 3.201635124591413e-05, "loss": 0.0057, "step": 689220 }, { "epoch": 1.79, "learning_rate": 3.2012463029542664e-05, "loss": 0.0075, "step": 689230 }, { "epoch": 1.79, "learning_rate": 3.20085748131712e-05, "loss": 0.0062, "step": 689240 }, { "epoch": 1.79, "learning_rate": 3.2004686596799733e-05, "loss": 0.0078, "step": 689250 }, { "epoch": 1.79, "learning_rate": 3.2000798380428275e-05, "loss": 0.006, "step": 689260 }, { "epoch": 1.79, "learning_rate": 3.199691016405681e-05, "loss": 0.0052, "step": 689270 }, { "epoch": 1.79, "learning_rate": 3.1993021947685345e-05, "loss": 0.0102, "step": 689280 }, { "epoch": 1.79, "learning_rate": 3.198913373131388e-05, "loss": 0.0055, "step": 689290 }, { "epoch": 1.79, "learning_rate": 3.1985245514942414e-05, "loss": 0.0082, "step": 689300 }, { "epoch": 1.79, "learning_rate": 3.198135729857095e-05, "loss": 0.0069, "step": 689310 }, { "epoch": 1.79, "learning_rate": 3.1977469082199484e-05, "loss": 0.008, "step": 689320 }, { "epoch": 1.79, "learning_rate": 3.197358086582802e-05, "loss": 0.0073, "step": 689330 }, { "epoch": 1.79, "learning_rate": 3.1969692649456554e-05, "loss": 0.007, "step": 689340 }, { "epoch": 1.79, "learning_rate": 3.196580443308509e-05, "loss": 0.0064, "step": 689350 }, { "epoch": 1.79, "learning_rate": 3.1961916216713624e-05, "loss": 0.0069, "step": 689360 }, { "epoch": 1.79, "learning_rate": 3.195802800034216e-05, "loss": 0.0071, "step": 689370 }, { "epoch": 1.79, "learning_rate": 3.195413978397069e-05, "loss": 0.0112, "step": 689380 }, { "epoch": 1.79, "learning_rate": 3.1950251567599235e-05, "loss": 0.0082, "step": 689390 }, { "epoch": 1.79, "learning_rate": 3.194636335122777e-05, "loss": 0.0082, "step": 689400 }, { "epoch": 1.79, "learning_rate": 3.1942475134856305e-05, "loss": 0.0074, "step": 689410 }, { "epoch": 1.79, "learning_rate": 3.193858691848484e-05, "loss": 0.0076, "step": 689420 }, { "epoch": 1.79, "learning_rate": 3.193469870211337e-05, "loss": 0.0089, "step": 689430 }, { "epoch": 1.79, "learning_rate": 3.193081048574191e-05, "loss": 0.0109, "step": 689440 }, { "epoch": 1.79, "learning_rate": 3.1926922269370444e-05, "loss": 0.0075, "step": 689450 }, { "epoch": 1.79, "learning_rate": 3.192303405299898e-05, "loss": 0.0067, "step": 689460 }, { "epoch": 1.79, "learning_rate": 3.1919145836627514e-05, "loss": 0.0088, "step": 689470 }, { "epoch": 1.79, "learning_rate": 3.191525762025605e-05, "loss": 0.0073, "step": 689480 }, { "epoch": 1.79, "learning_rate": 3.1911369403884584e-05, "loss": 0.0067, "step": 689490 }, { "epoch": 1.79, "learning_rate": 3.190748118751312e-05, "loss": 0.006, "step": 689500 }, { "epoch": 1.79, "learning_rate": 3.190359297114165e-05, "loss": 0.0072, "step": 689510 }, { "epoch": 1.79, "learning_rate": 3.1899704754770195e-05, "loss": 0.0085, "step": 689520 }, { "epoch": 1.79, "learning_rate": 3.189581653839873e-05, "loss": 0.0076, "step": 689530 }, { "epoch": 1.79, "learning_rate": 3.1891928322027265e-05, "loss": 0.0045, "step": 689540 }, { "epoch": 1.79, "learning_rate": 3.18880401056558e-05, "loss": 0.0066, "step": 689550 }, { "epoch": 1.79, "learning_rate": 3.188415188928433e-05, "loss": 0.0137, "step": 689560 }, { "epoch": 1.79, "learning_rate": 3.188026367291287e-05, "loss": 0.0096, "step": 689570 }, { "epoch": 1.79, "learning_rate": 3.1876375456541404e-05, "loss": 0.0116, "step": 689580 }, { "epoch": 1.79, "learning_rate": 3.187248724016994e-05, "loss": 0.0061, "step": 689590 }, { "epoch": 1.79, "learning_rate": 3.1868599023798474e-05, "loss": 0.0083, "step": 689600 }, { "epoch": 1.79, "learning_rate": 3.186471080742701e-05, "loss": 0.0071, "step": 689610 }, { "epoch": 1.79, "learning_rate": 3.1860822591055544e-05, "loss": 0.0076, "step": 689620 }, { "epoch": 1.79, "learning_rate": 3.185693437468408e-05, "loss": 0.0086, "step": 689630 }, { "epoch": 1.79, "learning_rate": 3.185304615831261e-05, "loss": 0.0083, "step": 689640 }, { "epoch": 1.79, "learning_rate": 3.1849157941941155e-05, "loss": 0.0094, "step": 689650 }, { "epoch": 1.79, "learning_rate": 3.184526972556969e-05, "loss": 0.0078, "step": 689660 }, { "epoch": 1.79, "learning_rate": 3.1841381509198225e-05, "loss": 0.0108, "step": 689670 }, { "epoch": 1.79, "learning_rate": 3.183749329282675e-05, "loss": 0.0056, "step": 689680 }, { "epoch": 1.79, "learning_rate": 3.183360507645529e-05, "loss": 0.0095, "step": 689690 }, { "epoch": 1.79, "learning_rate": 3.182971686008383e-05, "loss": 0.0095, "step": 689700 }, { "epoch": 1.79, "learning_rate": 3.1825828643712364e-05, "loss": 0.008, "step": 689710 }, { "epoch": 1.79, "learning_rate": 3.18219404273409e-05, "loss": 0.0107, "step": 689720 }, { "epoch": 1.79, "learning_rate": 3.1818052210969434e-05, "loss": 0.006, "step": 689730 }, { "epoch": 1.79, "learning_rate": 3.181416399459797e-05, "loss": 0.0093, "step": 689740 }, { "epoch": 1.79, "learning_rate": 3.1810275778226504e-05, "loss": 0.0081, "step": 689750 }, { "epoch": 1.79, "learning_rate": 3.180638756185504e-05, "loss": 0.006, "step": 689760 }, { "epoch": 1.79, "learning_rate": 3.180249934548357e-05, "loss": 0.0087, "step": 689770 }, { "epoch": 1.79, "learning_rate": 3.179861112911211e-05, "loss": 0.0122, "step": 689780 }, { "epoch": 1.79, "learning_rate": 3.179472291274065e-05, "loss": 0.0103, "step": 689790 }, { "epoch": 1.79, "learning_rate": 3.179083469636918e-05, "loss": 0.0106, "step": 689800 }, { "epoch": 1.79, "learning_rate": 3.178694647999771e-05, "loss": 0.0074, "step": 689810 }, { "epoch": 1.79, "learning_rate": 3.178305826362625e-05, "loss": 0.0052, "step": 689820 }, { "epoch": 1.79, "learning_rate": 3.177917004725478e-05, "loss": 0.0074, "step": 689830 }, { "epoch": 1.79, "learning_rate": 3.1775281830883324e-05, "loss": 0.0075, "step": 689840 }, { "epoch": 1.79, "learning_rate": 3.177139361451186e-05, "loss": 0.0081, "step": 689850 }, { "epoch": 1.79, "learning_rate": 3.1767505398140394e-05, "loss": 0.0065, "step": 689860 }, { "epoch": 1.79, "learning_rate": 3.176361718176893e-05, "loss": 0.01, "step": 689870 }, { "epoch": 1.79, "learning_rate": 3.1759728965397464e-05, "loss": 0.0082, "step": 689880 }, { "epoch": 1.79, "learning_rate": 3.1755840749026e-05, "loss": 0.0065, "step": 689890 }, { "epoch": 1.79, "learning_rate": 3.175195253265453e-05, "loss": 0.0063, "step": 689900 }, { "epoch": 1.79, "learning_rate": 3.174806431628307e-05, "loss": 0.0077, "step": 689910 }, { "epoch": 1.79, "learning_rate": 3.174417609991161e-05, "loss": 0.0088, "step": 689920 }, { "epoch": 1.79, "learning_rate": 3.174028788354014e-05, "loss": 0.0093, "step": 689930 }, { "epoch": 1.79, "learning_rate": 3.173639966716867e-05, "loss": 0.0088, "step": 689940 }, { "epoch": 1.79, "learning_rate": 3.173251145079721e-05, "loss": 0.007, "step": 689950 }, { "epoch": 1.79, "learning_rate": 3.172862323442574e-05, "loss": 0.0065, "step": 689960 }, { "epoch": 1.79, "learning_rate": 3.1724735018054284e-05, "loss": 0.0097, "step": 689970 }, { "epoch": 1.79, "learning_rate": 3.172084680168282e-05, "loss": 0.0081, "step": 689980 }, { "epoch": 1.79, "learning_rate": 3.1716958585311354e-05, "loss": 0.0098, "step": 689990 }, { "epoch": 1.79, "learning_rate": 3.171307036893989e-05, "loss": 0.0066, "step": 690000 }, { "epoch": 1.79, "eval_cer": 0.88167329394755, "eval_loss": 0.004875406622886658, "eval_runtime": 107.9167, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 690000 }, { "epoch": 1.79, "learning_rate": 3.1709182152568424e-05, "loss": 0.0085, "step": 690010 }, { "epoch": 1.79, "learning_rate": 3.170529393619696e-05, "loss": 0.0063, "step": 690020 }, { "epoch": 1.79, "learning_rate": 3.170140571982549e-05, "loss": 0.0071, "step": 690030 }, { "epoch": 1.79, "learning_rate": 3.169751750345403e-05, "loss": 0.0078, "step": 690040 }, { "epoch": 1.79, "learning_rate": 3.169362928708256e-05, "loss": 0.007, "step": 690050 }, { "epoch": 1.79, "learning_rate": 3.16897410707111e-05, "loss": 0.007, "step": 690060 }, { "epoch": 1.79, "learning_rate": 3.168585285433963e-05, "loss": 0.0056, "step": 690070 }, { "epoch": 1.79, "learning_rate": 3.168196463796817e-05, "loss": 0.0078, "step": 690080 }, { "epoch": 1.79, "learning_rate": 3.16780764215967e-05, "loss": 0.0084, "step": 690090 }, { "epoch": 1.79, "learning_rate": 3.1674188205225244e-05, "loss": 0.0066, "step": 690100 }, { "epoch": 1.79, "learning_rate": 3.167029998885378e-05, "loss": 0.0089, "step": 690110 }, { "epoch": 1.79, "learning_rate": 3.1666411772482314e-05, "loss": 0.0069, "step": 690120 }, { "epoch": 1.79, "learning_rate": 3.166252355611085e-05, "loss": 0.0065, "step": 690130 }, { "epoch": 1.79, "learning_rate": 3.1658635339739384e-05, "loss": 0.0098, "step": 690140 }, { "epoch": 1.79, "learning_rate": 3.165474712336792e-05, "loss": 0.0079, "step": 690150 }, { "epoch": 1.79, "learning_rate": 3.165085890699645e-05, "loss": 0.0097, "step": 690160 }, { "epoch": 1.79, "learning_rate": 3.164697069062499e-05, "loss": 0.0072, "step": 690170 }, { "epoch": 1.79, "learning_rate": 3.164308247425352e-05, "loss": 0.0113, "step": 690180 }, { "epoch": 1.79, "learning_rate": 3.163919425788206e-05, "loss": 0.0086, "step": 690190 }, { "epoch": 1.79, "learning_rate": 3.163530604151059e-05, "loss": 0.0079, "step": 690200 }, { "epoch": 1.79, "learning_rate": 3.163141782513913e-05, "loss": 0.008, "step": 690210 }, { "epoch": 1.79, "learning_rate": 3.162752960876766e-05, "loss": 0.0079, "step": 690220 }, { "epoch": 1.79, "learning_rate": 3.1623641392396204e-05, "loss": 0.0075, "step": 690230 }, { "epoch": 1.79, "learning_rate": 3.161975317602474e-05, "loss": 0.0077, "step": 690240 }, { "epoch": 1.79, "learning_rate": 3.1615864959653274e-05, "loss": 0.0089, "step": 690250 }, { "epoch": 1.79, "learning_rate": 3.161197674328181e-05, "loss": 0.0052, "step": 690260 }, { "epoch": 1.79, "learning_rate": 3.1608088526910343e-05, "loss": 0.0069, "step": 690270 }, { "epoch": 1.79, "learning_rate": 3.160420031053888e-05, "loss": 0.0096, "step": 690280 }, { "epoch": 1.79, "learning_rate": 3.160031209416741e-05, "loss": 0.0073, "step": 690290 }, { "epoch": 1.79, "learning_rate": 3.159642387779595e-05, "loss": 0.0093, "step": 690300 }, { "epoch": 1.79, "learning_rate": 3.159253566142448e-05, "loss": 0.0095, "step": 690310 }, { "epoch": 1.79, "learning_rate": 3.158864744505302e-05, "loss": 0.0068, "step": 690320 }, { "epoch": 1.79, "learning_rate": 3.158475922868155e-05, "loss": 0.011, "step": 690330 }, { "epoch": 1.79, "learning_rate": 3.158087101231009e-05, "loss": 0.0079, "step": 690340 }, { "epoch": 1.79, "learning_rate": 3.157698279593862e-05, "loss": 0.0059, "step": 690350 }, { "epoch": 1.79, "learning_rate": 3.1573094579567164e-05, "loss": 0.0067, "step": 690360 }, { "epoch": 1.79, "learning_rate": 3.15692063631957e-05, "loss": 0.0055, "step": 690370 }, { "epoch": 1.79, "learning_rate": 3.1565318146824234e-05, "loss": 0.0091, "step": 690380 }, { "epoch": 1.79, "learning_rate": 3.156142993045277e-05, "loss": 0.0101, "step": 690390 }, { "epoch": 1.79, "learning_rate": 3.1557541714081303e-05, "loss": 0.0067, "step": 690400 }, { "epoch": 1.79, "learning_rate": 3.155365349770984e-05, "loss": 0.0091, "step": 690410 }, { "epoch": 1.79, "learning_rate": 3.154976528133837e-05, "loss": 0.0071, "step": 690420 }, { "epoch": 1.79, "learning_rate": 3.154587706496691e-05, "loss": 0.0073, "step": 690430 }, { "epoch": 1.79, "learning_rate": 3.154198884859544e-05, "loss": 0.0075, "step": 690440 }, { "epoch": 1.79, "learning_rate": 3.153810063222398e-05, "loss": 0.0061, "step": 690450 }, { "epoch": 1.79, "learning_rate": 3.153421241585251e-05, "loss": 0.0067, "step": 690460 }, { "epoch": 1.79, "learning_rate": 3.153032419948105e-05, "loss": 0.0092, "step": 690470 }, { "epoch": 1.79, "learning_rate": 3.152643598310958e-05, "loss": 0.0071, "step": 690480 }, { "epoch": 1.79, "learning_rate": 3.1522547766738124e-05, "loss": 0.0072, "step": 690490 }, { "epoch": 1.79, "learning_rate": 3.151865955036666e-05, "loss": 0.008, "step": 690500 }, { "epoch": 1.79, "learning_rate": 3.1514771333995194e-05, "loss": 0.006, "step": 690510 }, { "epoch": 1.79, "learning_rate": 3.151088311762373e-05, "loss": 0.0089, "step": 690520 }, { "epoch": 1.79, "learning_rate": 3.1506994901252263e-05, "loss": 0.0071, "step": 690530 }, { "epoch": 1.79, "learning_rate": 3.15031066848808e-05, "loss": 0.0088, "step": 690540 }, { "epoch": 1.79, "learning_rate": 3.149921846850933e-05, "loss": 0.0059, "step": 690550 }, { "epoch": 1.79, "learning_rate": 3.149533025213787e-05, "loss": 0.0062, "step": 690560 }, { "epoch": 1.79, "learning_rate": 3.14914420357664e-05, "loss": 0.0068, "step": 690570 }, { "epoch": 1.79, "learning_rate": 3.148755381939494e-05, "loss": 0.0067, "step": 690580 }, { "epoch": 1.79, "learning_rate": 3.148366560302347e-05, "loss": 0.0093, "step": 690590 }, { "epoch": 1.79, "learning_rate": 3.147977738665201e-05, "loss": 0.0098, "step": 690600 }, { "epoch": 1.79, "learning_rate": 3.147588917028054e-05, "loss": 0.0064, "step": 690610 }, { "epoch": 1.79, "learning_rate": 3.1472000953909084e-05, "loss": 0.0058, "step": 690620 }, { "epoch": 1.79, "learning_rate": 3.146811273753762e-05, "loss": 0.0107, "step": 690630 }, { "epoch": 1.79, "learning_rate": 3.1464224521166154e-05, "loss": 0.0154, "step": 690640 }, { "epoch": 1.79, "learning_rate": 3.146033630479469e-05, "loss": 0.0094, "step": 690650 }, { "epoch": 1.79, "learning_rate": 3.1456448088423223e-05, "loss": 0.0071, "step": 690660 }, { "epoch": 1.79, "learning_rate": 3.145255987205176e-05, "loss": 0.008, "step": 690670 }, { "epoch": 1.79, "learning_rate": 3.144867165568029e-05, "loss": 0.006, "step": 690680 }, { "epoch": 1.79, "learning_rate": 3.144478343930883e-05, "loss": 0.0054, "step": 690690 }, { "epoch": 1.79, "learning_rate": 3.144089522293736e-05, "loss": 0.0082, "step": 690700 }, { "epoch": 1.79, "learning_rate": 3.14370070065659e-05, "loss": 0.0079, "step": 690710 }, { "epoch": 1.79, "learning_rate": 3.143311879019443e-05, "loss": 0.0101, "step": 690720 }, { "epoch": 1.79, "learning_rate": 3.142923057382297e-05, "loss": 0.0085, "step": 690730 }, { "epoch": 1.79, "learning_rate": 3.14253423574515e-05, "loss": 0.0064, "step": 690740 }, { "epoch": 1.79, "learning_rate": 3.1421454141080044e-05, "loss": 0.0088, "step": 690750 }, { "epoch": 1.79, "learning_rate": 3.141756592470858e-05, "loss": 0.0071, "step": 690760 }, { "epoch": 1.79, "learning_rate": 3.1413677708337114e-05, "loss": 0.008, "step": 690770 }, { "epoch": 1.79, "learning_rate": 3.140978949196565e-05, "loss": 0.0072, "step": 690780 }, { "epoch": 1.79, "learning_rate": 3.1405901275594183e-05, "loss": 0.0079, "step": 690790 }, { "epoch": 1.79, "learning_rate": 3.140201305922272e-05, "loss": 0.0068, "step": 690800 }, { "epoch": 1.79, "learning_rate": 3.139812484285125e-05, "loss": 0.0072, "step": 690810 }, { "epoch": 1.79, "learning_rate": 3.139423662647979e-05, "loss": 0.0084, "step": 690820 }, { "epoch": 1.79, "learning_rate": 3.139034841010832e-05, "loss": 0.0084, "step": 690830 }, { "epoch": 1.79, "learning_rate": 3.138646019373686e-05, "loss": 0.0051, "step": 690840 }, { "epoch": 1.79, "learning_rate": 3.138257197736539e-05, "loss": 0.0073, "step": 690850 }, { "epoch": 1.79, "learning_rate": 3.137868376099393e-05, "loss": 0.0054, "step": 690860 }, { "epoch": 1.79, "learning_rate": 3.137479554462246e-05, "loss": 0.0068, "step": 690870 }, { "epoch": 1.79, "learning_rate": 3.1370907328251004e-05, "loss": 0.0056, "step": 690880 }, { "epoch": 1.79, "learning_rate": 3.136701911187954e-05, "loss": 0.0059, "step": 690890 }, { "epoch": 1.79, "learning_rate": 3.1363130895508074e-05, "loss": 0.0104, "step": 690900 }, { "epoch": 1.79, "learning_rate": 3.135924267913661e-05, "loss": 0.0102, "step": 690910 }, { "epoch": 1.79, "learning_rate": 3.1355354462765137e-05, "loss": 0.0082, "step": 690920 }, { "epoch": 1.79, "learning_rate": 3.135146624639368e-05, "loss": 0.0076, "step": 690930 }, { "epoch": 1.79, "learning_rate": 3.134757803002221e-05, "loss": 0.0089, "step": 690940 }, { "epoch": 1.79, "learning_rate": 3.134368981365075e-05, "loss": 0.0086, "step": 690950 }, { "epoch": 1.79, "learning_rate": 3.133980159727928e-05, "loss": 0.0079, "step": 690960 }, { "epoch": 1.79, "learning_rate": 3.133591338090782e-05, "loss": 0.0083, "step": 690970 }, { "epoch": 1.79, "learning_rate": 3.133202516453635e-05, "loss": 0.0078, "step": 690980 }, { "epoch": 1.79, "learning_rate": 3.132813694816489e-05, "loss": 0.0126, "step": 690990 }, { "epoch": 1.79, "learning_rate": 3.132424873179342e-05, "loss": 0.0087, "step": 691000 }, { "epoch": 1.79, "eval_cer": 0.8816550986674057, "eval_loss": 0.004775453358888626, "eval_runtime": 107.7867, "eval_samples_per_second": 18.555, "eval_steps_per_second": 4.639, "step": 691000 }, { "epoch": 1.79, "learning_rate": 3.1320360515421964e-05, "loss": 0.0098, "step": 691010 }, { "epoch": 1.79, "learning_rate": 3.13164722990505e-05, "loss": 0.0075, "step": 691020 }, { "epoch": 1.79, "learning_rate": 3.1312584082679034e-05, "loss": 0.0059, "step": 691030 }, { "epoch": 1.79, "learning_rate": 3.130869586630756e-05, "loss": 0.0068, "step": 691040 }, { "epoch": 1.79, "learning_rate": 3.1304807649936097e-05, "loss": 0.0073, "step": 691050 }, { "epoch": 1.79, "learning_rate": 3.130091943356464e-05, "loss": 0.0073, "step": 691060 }, { "epoch": 1.79, "learning_rate": 3.129703121719317e-05, "loss": 0.0116, "step": 691070 }, { "epoch": 1.79, "learning_rate": 3.129314300082171e-05, "loss": 0.0089, "step": 691080 }, { "epoch": 1.79, "learning_rate": 3.128925478445024e-05, "loss": 0.0085, "step": 691090 }, { "epoch": 1.79, "learning_rate": 3.128536656807878e-05, "loss": 0.0069, "step": 691100 }, { "epoch": 1.79, "learning_rate": 3.128147835170731e-05, "loss": 0.0068, "step": 691110 }, { "epoch": 1.79, "learning_rate": 3.127759013533585e-05, "loss": 0.0068, "step": 691120 }, { "epoch": 1.79, "learning_rate": 3.127370191896438e-05, "loss": 0.0092, "step": 691130 }, { "epoch": 1.79, "learning_rate": 3.126981370259292e-05, "loss": 0.0079, "step": 691140 }, { "epoch": 1.79, "learning_rate": 3.126592548622146e-05, "loss": 0.0093, "step": 691150 }, { "epoch": 1.79, "learning_rate": 3.1262037269849994e-05, "loss": 0.0065, "step": 691160 }, { "epoch": 1.79, "learning_rate": 3.125814905347852e-05, "loss": 0.007, "step": 691170 }, { "epoch": 1.79, "learning_rate": 3.1254260837107057e-05, "loss": 0.0071, "step": 691180 }, { "epoch": 1.79, "learning_rate": 3.125037262073559e-05, "loss": 0.006, "step": 691190 }, { "epoch": 1.79, "learning_rate": 3.124648440436413e-05, "loss": 0.0065, "step": 691200 }, { "epoch": 1.79, "learning_rate": 3.124259618799267e-05, "loss": 0.0067, "step": 691210 }, { "epoch": 1.79, "learning_rate": 3.12387079716212e-05, "loss": 0.0073, "step": 691220 }, { "epoch": 1.79, "learning_rate": 3.123481975524974e-05, "loss": 0.0058, "step": 691230 }, { "epoch": 1.79, "learning_rate": 3.123093153887827e-05, "loss": 0.0069, "step": 691240 }, { "epoch": 1.79, "learning_rate": 3.122704332250681e-05, "loss": 0.0086, "step": 691250 }, { "epoch": 1.79, "learning_rate": 3.122315510613534e-05, "loss": 0.0072, "step": 691260 }, { "epoch": 1.79, "learning_rate": 3.121926688976388e-05, "loss": 0.0066, "step": 691270 }, { "epoch": 1.79, "learning_rate": 3.121537867339242e-05, "loss": 0.0071, "step": 691280 }, { "epoch": 1.79, "learning_rate": 3.121149045702095e-05, "loss": 0.0072, "step": 691290 }, { "epoch": 1.79, "learning_rate": 3.120760224064948e-05, "loss": 0.0098, "step": 691300 }, { "epoch": 1.79, "learning_rate": 3.1203714024278017e-05, "loss": 0.0067, "step": 691310 }, { "epoch": 1.79, "learning_rate": 3.119982580790655e-05, "loss": 0.0089, "step": 691320 }, { "epoch": 1.79, "learning_rate": 3.119593759153509e-05, "loss": 0.0087, "step": 691330 }, { "epoch": 1.79, "learning_rate": 3.119204937516363e-05, "loss": 0.008, "step": 691340 }, { "epoch": 1.79, "learning_rate": 3.118816115879216e-05, "loss": 0.0109, "step": 691350 }, { "epoch": 1.79, "learning_rate": 3.11842729424207e-05, "loss": 0.0072, "step": 691360 }, { "epoch": 1.79, "learning_rate": 3.118038472604923e-05, "loss": 0.0067, "step": 691370 }, { "epoch": 1.79, "learning_rate": 3.117649650967777e-05, "loss": 0.0088, "step": 691380 }, { "epoch": 1.79, "learning_rate": 3.11726082933063e-05, "loss": 0.0061, "step": 691390 }, { "epoch": 1.79, "learning_rate": 3.116872007693484e-05, "loss": 0.0077, "step": 691400 }, { "epoch": 1.79, "learning_rate": 3.116483186056338e-05, "loss": 0.0101, "step": 691410 }, { "epoch": 1.79, "learning_rate": 3.116094364419191e-05, "loss": 0.0094, "step": 691420 }, { "epoch": 1.79, "learning_rate": 3.115705542782044e-05, "loss": 0.0072, "step": 691430 }, { "epoch": 1.79, "learning_rate": 3.1153167211448976e-05, "loss": 0.0091, "step": 691440 }, { "epoch": 1.79, "learning_rate": 3.114927899507751e-05, "loss": 0.0093, "step": 691450 }, { "epoch": 1.79, "learning_rate": 3.114539077870605e-05, "loss": 0.0069, "step": 691460 }, { "epoch": 1.79, "learning_rate": 3.114150256233459e-05, "loss": 0.0086, "step": 691470 }, { "epoch": 1.79, "learning_rate": 3.113761434596312e-05, "loss": 0.006, "step": 691480 }, { "epoch": 1.79, "learning_rate": 3.113372612959166e-05, "loss": 0.0072, "step": 691490 }, { "epoch": 1.79, "learning_rate": 3.112983791322019e-05, "loss": 0.0083, "step": 691500 }, { "epoch": 1.79, "learning_rate": 3.112594969684873e-05, "loss": 0.0078, "step": 691510 }, { "epoch": 1.79, "learning_rate": 3.112206148047726e-05, "loss": 0.0105, "step": 691520 }, { "epoch": 1.79, "learning_rate": 3.11181732641058e-05, "loss": 0.0074, "step": 691530 }, { "epoch": 1.79, "learning_rate": 3.111428504773433e-05, "loss": 0.0069, "step": 691540 }, { "epoch": 1.79, "learning_rate": 3.111039683136287e-05, "loss": 0.0084, "step": 691550 }, { "epoch": 1.79, "learning_rate": 3.11065086149914e-05, "loss": 0.0071, "step": 691560 }, { "epoch": 1.79, "learning_rate": 3.1102620398619936e-05, "loss": 0.0078, "step": 691570 }, { "epoch": 1.79, "learning_rate": 3.109873218224847e-05, "loss": 0.0067, "step": 691580 }, { "epoch": 1.79, "learning_rate": 3.109484396587701e-05, "loss": 0.0043, "step": 691590 }, { "epoch": 1.79, "learning_rate": 3.109095574950555e-05, "loss": 0.0063, "step": 691600 }, { "epoch": 1.79, "learning_rate": 3.108706753313408e-05, "loss": 0.0082, "step": 691610 }, { "epoch": 1.79, "learning_rate": 3.108317931676262e-05, "loss": 0.0103, "step": 691620 }, { "epoch": 1.79, "learning_rate": 3.107929110039115e-05, "loss": 0.0088, "step": 691630 }, { "epoch": 1.79, "learning_rate": 3.107540288401969e-05, "loss": 0.009, "step": 691640 }, { "epoch": 1.79, "learning_rate": 3.107151466764822e-05, "loss": 0.008, "step": 691650 }, { "epoch": 1.79, "learning_rate": 3.106762645127676e-05, "loss": 0.0109, "step": 691660 }, { "epoch": 1.79, "learning_rate": 3.106373823490529e-05, "loss": 0.0069, "step": 691670 }, { "epoch": 1.79, "learning_rate": 3.105985001853383e-05, "loss": 0.007, "step": 691680 }, { "epoch": 1.79, "learning_rate": 3.105596180216236e-05, "loss": 0.0062, "step": 691690 }, { "epoch": 1.79, "learning_rate": 3.1052073585790896e-05, "loss": 0.0087, "step": 691700 }, { "epoch": 1.79, "learning_rate": 3.104818536941943e-05, "loss": 0.0076, "step": 691710 }, { "epoch": 1.79, "learning_rate": 3.104429715304797e-05, "loss": 0.0082, "step": 691720 }, { "epoch": 1.79, "learning_rate": 3.104040893667651e-05, "loss": 0.0083, "step": 691730 }, { "epoch": 1.79, "learning_rate": 3.103652072030504e-05, "loss": 0.0073, "step": 691740 }, { "epoch": 1.79, "learning_rate": 3.103263250393358e-05, "loss": 0.0109, "step": 691750 }, { "epoch": 1.79, "learning_rate": 3.102874428756211e-05, "loss": 0.0072, "step": 691760 }, { "epoch": 1.79, "learning_rate": 3.102485607119065e-05, "loss": 0.0072, "step": 691770 }, { "epoch": 1.79, "learning_rate": 3.102096785481918e-05, "loss": 0.0077, "step": 691780 }, { "epoch": 1.79, "learning_rate": 3.101707963844772e-05, "loss": 0.013, "step": 691790 }, { "epoch": 1.79, "learning_rate": 3.101319142207625e-05, "loss": 0.0075, "step": 691800 }, { "epoch": 1.79, "learning_rate": 3.100930320570479e-05, "loss": 0.0074, "step": 691810 }, { "epoch": 1.79, "learning_rate": 3.100541498933332e-05, "loss": 0.0089, "step": 691820 }, { "epoch": 1.79, "learning_rate": 3.1001526772961856e-05, "loss": 0.0109, "step": 691830 }, { "epoch": 1.79, "learning_rate": 3.099763855659039e-05, "loss": 0.0076, "step": 691840 }, { "epoch": 1.79, "learning_rate": 3.099375034021893e-05, "loss": 0.0058, "step": 691850 }, { "epoch": 1.79, "learning_rate": 3.098986212384747e-05, "loss": 0.0063, "step": 691860 }, { "epoch": 1.79, "learning_rate": 3.0985973907476e-05, "loss": 0.0097, "step": 691870 }, { "epoch": 1.79, "learning_rate": 3.098208569110454e-05, "loss": 0.0078, "step": 691880 }, { "epoch": 1.79, "learning_rate": 3.097819747473307e-05, "loss": 0.0068, "step": 691890 }, { "epoch": 1.79, "learning_rate": 3.097430925836161e-05, "loss": 0.0072, "step": 691900 }, { "epoch": 1.79, "learning_rate": 3.097042104199014e-05, "loss": 0.0073, "step": 691910 }, { "epoch": 1.79, "learning_rate": 3.096653282561868e-05, "loss": 0.0081, "step": 691920 }, { "epoch": 1.79, "learning_rate": 3.096264460924721e-05, "loss": 0.0092, "step": 691930 }, { "epoch": 1.79, "learning_rate": 3.095875639287575e-05, "loss": 0.0049, "step": 691940 }, { "epoch": 1.79, "learning_rate": 3.095486817650428e-05, "loss": 0.0072, "step": 691950 }, { "epoch": 1.79, "learning_rate": 3.0950979960132816e-05, "loss": 0.0058, "step": 691960 }, { "epoch": 1.79, "learning_rate": 3.094709174376135e-05, "loss": 0.0059, "step": 691970 }, { "epoch": 1.79, "learning_rate": 3.094320352738989e-05, "loss": 0.0078, "step": 691980 }, { "epoch": 1.79, "learning_rate": 3.093931531101843e-05, "loss": 0.0105, "step": 691990 }, { "epoch": 1.79, "learning_rate": 3.093542709464696e-05, "loss": 0.0078, "step": 692000 }, { "epoch": 1.79, "eval_cer": 0.8816606972151424, "eval_loss": 0.0048337411135435104, "eval_runtime": 107.7159, "eval_samples_per_second": 18.567, "eval_steps_per_second": 4.642, "step": 692000 }, { "epoch": 1.79, "learning_rate": 3.09315388782755e-05, "loss": 0.0086, "step": 692010 }, { "epoch": 1.79, "learning_rate": 3.092765066190403e-05, "loss": 0.0076, "step": 692020 }, { "epoch": 1.79, "learning_rate": 3.092376244553257e-05, "loss": 0.0056, "step": 692030 }, { "epoch": 1.79, "learning_rate": 3.09198742291611e-05, "loss": 0.006, "step": 692040 }, { "epoch": 1.79, "learning_rate": 3.091598601278964e-05, "loss": 0.0092, "step": 692050 }, { "epoch": 1.79, "learning_rate": 3.091209779641817e-05, "loss": 0.0089, "step": 692060 }, { "epoch": 1.79, "learning_rate": 3.090820958004671e-05, "loss": 0.0081, "step": 692070 }, { "epoch": 1.79, "learning_rate": 3.090432136367524e-05, "loss": 0.0061, "step": 692080 }, { "epoch": 1.79, "learning_rate": 3.0900433147303776e-05, "loss": 0.008, "step": 692090 }, { "epoch": 1.79, "learning_rate": 3.089654493093231e-05, "loss": 0.0086, "step": 692100 }, { "epoch": 1.79, "learning_rate": 3.089265671456085e-05, "loss": 0.0096, "step": 692110 }, { "epoch": 1.79, "learning_rate": 3.088876849818939e-05, "loss": 0.0098, "step": 692120 }, { "epoch": 1.79, "learning_rate": 3.088488028181792e-05, "loss": 0.007, "step": 692130 }, { "epoch": 1.79, "learning_rate": 3.088099206544646e-05, "loss": 0.0103, "step": 692140 }, { "epoch": 1.79, "learning_rate": 3.087710384907499e-05, "loss": 0.0088, "step": 692150 }, { "epoch": 1.79, "learning_rate": 3.087321563270353e-05, "loss": 0.0101, "step": 692160 }, { "epoch": 1.79, "learning_rate": 3.086932741633206e-05, "loss": 0.0055, "step": 692170 }, { "epoch": 1.79, "learning_rate": 3.08654391999606e-05, "loss": 0.0074, "step": 692180 }, { "epoch": 1.79, "learning_rate": 3.086155098358913e-05, "loss": 0.0056, "step": 692190 }, { "epoch": 1.79, "learning_rate": 3.085766276721767e-05, "loss": 0.0086, "step": 692200 }, { "epoch": 1.79, "learning_rate": 3.08537745508462e-05, "loss": 0.0078, "step": 692210 }, { "epoch": 1.79, "learning_rate": 3.0849886334474736e-05, "loss": 0.0099, "step": 692220 }, { "epoch": 1.79, "learning_rate": 3.084599811810327e-05, "loss": 0.0074, "step": 692230 }, { "epoch": 1.79, "learning_rate": 3.084210990173181e-05, "loss": 0.007, "step": 692240 }, { "epoch": 1.79, "learning_rate": 3.083822168536035e-05, "loss": 0.008, "step": 692250 }, { "epoch": 1.79, "learning_rate": 3.083433346898888e-05, "loss": 0.0073, "step": 692260 }, { "epoch": 1.79, "learning_rate": 3.083044525261742e-05, "loss": 0.0069, "step": 692270 }, { "epoch": 1.79, "learning_rate": 3.0826557036245946e-05, "loss": 0.0068, "step": 692280 }, { "epoch": 1.79, "learning_rate": 3.082266881987449e-05, "loss": 0.007, "step": 692290 }, { "epoch": 1.79, "learning_rate": 3.081878060350302e-05, "loss": 0.0126, "step": 692300 }, { "epoch": 1.79, "learning_rate": 3.081489238713156e-05, "loss": 0.0072, "step": 692310 }, { "epoch": 1.79, "learning_rate": 3.081100417076009e-05, "loss": 0.0063, "step": 692320 }, { "epoch": 1.79, "learning_rate": 3.0807115954388627e-05, "loss": 0.0082, "step": 692330 }, { "epoch": 1.79, "learning_rate": 3.080322773801716e-05, "loss": 0.0065, "step": 692340 }, { "epoch": 1.79, "learning_rate": 3.0799339521645696e-05, "loss": 0.0096, "step": 692350 }, { "epoch": 1.79, "learning_rate": 3.079545130527423e-05, "loss": 0.0068, "step": 692360 }, { "epoch": 1.79, "learning_rate": 3.079156308890277e-05, "loss": 0.0069, "step": 692370 }, { "epoch": 1.79, "learning_rate": 3.078767487253131e-05, "loss": 0.0068, "step": 692380 }, { "epoch": 1.79, "learning_rate": 3.078378665615984e-05, "loss": 0.0056, "step": 692390 }, { "epoch": 1.79, "learning_rate": 3.077989843978838e-05, "loss": 0.0075, "step": 692400 }, { "epoch": 1.79, "learning_rate": 3.0776010223416905e-05, "loss": 0.0088, "step": 692410 }, { "epoch": 1.79, "learning_rate": 3.077212200704545e-05, "loss": 0.0059, "step": 692420 }, { "epoch": 1.79, "learning_rate": 3.076823379067398e-05, "loss": 0.0102, "step": 692430 }, { "epoch": 1.79, "learning_rate": 3.076434557430252e-05, "loss": 0.0067, "step": 692440 }, { "epoch": 1.79, "learning_rate": 3.076045735793105e-05, "loss": 0.0114, "step": 692450 }, { "epoch": 1.79, "learning_rate": 3.0756569141559587e-05, "loss": 0.0069, "step": 692460 }, { "epoch": 1.79, "learning_rate": 3.075268092518812e-05, "loss": 0.0062, "step": 692470 }, { "epoch": 1.8, "learning_rate": 3.0748792708816656e-05, "loss": 0.0091, "step": 692480 }, { "epoch": 1.8, "learning_rate": 3.074490449244519e-05, "loss": 0.0093, "step": 692490 }, { "epoch": 1.8, "learning_rate": 3.074101627607373e-05, "loss": 0.0069, "step": 692500 }, { "epoch": 1.8, "learning_rate": 3.073712805970227e-05, "loss": 0.0063, "step": 692510 }, { "epoch": 1.8, "learning_rate": 3.07332398433308e-05, "loss": 0.0065, "step": 692520 }, { "epoch": 1.8, "learning_rate": 3.072935162695933e-05, "loss": 0.0064, "step": 692530 }, { "epoch": 1.8, "learning_rate": 3.0725463410587865e-05, "loss": 0.0079, "step": 692540 }, { "epoch": 1.8, "learning_rate": 3.072157519421641e-05, "loss": 0.0062, "step": 692550 }, { "epoch": 1.8, "learning_rate": 3.071768697784494e-05, "loss": 0.0079, "step": 692560 }, { "epoch": 1.8, "learning_rate": 3.071379876147348e-05, "loss": 0.0086, "step": 692570 }, { "epoch": 1.8, "learning_rate": 3.070991054510201e-05, "loss": 0.0051, "step": 692580 }, { "epoch": 1.8, "learning_rate": 3.0706022328730547e-05, "loss": 0.006, "step": 692590 }, { "epoch": 1.8, "learning_rate": 3.070213411235908e-05, "loss": 0.008, "step": 692600 }, { "epoch": 1.8, "learning_rate": 3.0698245895987616e-05, "loss": 0.0076, "step": 692610 }, { "epoch": 1.8, "learning_rate": 3.069435767961615e-05, "loss": 0.0046, "step": 692620 }, { "epoch": 1.8, "learning_rate": 3.0690469463244686e-05, "loss": 0.008, "step": 692630 }, { "epoch": 1.8, "learning_rate": 3.068658124687323e-05, "loss": 0.0085, "step": 692640 }, { "epoch": 1.8, "learning_rate": 3.068269303050176e-05, "loss": 0.0074, "step": 692650 }, { "epoch": 1.8, "learning_rate": 3.067880481413029e-05, "loss": 0.0075, "step": 692660 }, { "epoch": 1.8, "learning_rate": 3.0674916597758825e-05, "loss": 0.0069, "step": 692670 }, { "epoch": 1.8, "learning_rate": 3.067102838138736e-05, "loss": 0.0074, "step": 692680 }, { "epoch": 1.8, "learning_rate": 3.06671401650159e-05, "loss": 0.0085, "step": 692690 }, { "epoch": 1.8, "learning_rate": 3.066325194864444e-05, "loss": 0.0049, "step": 692700 }, { "epoch": 1.8, "learning_rate": 3.065936373227297e-05, "loss": 0.0075, "step": 692710 }, { "epoch": 1.8, "learning_rate": 3.0655475515901507e-05, "loss": 0.0071, "step": 692720 }, { "epoch": 1.8, "learning_rate": 3.065158729953004e-05, "loss": 0.0048, "step": 692730 }, { "epoch": 1.8, "learning_rate": 3.0647699083158576e-05, "loss": 0.0067, "step": 692740 }, { "epoch": 1.8, "learning_rate": 3.064381086678711e-05, "loss": 0.0066, "step": 692750 }, { "epoch": 1.8, "learning_rate": 3.0639922650415646e-05, "loss": 0.0095, "step": 692760 }, { "epoch": 1.8, "learning_rate": 3.063603443404419e-05, "loss": 0.007, "step": 692770 }, { "epoch": 1.8, "learning_rate": 3.0632146217672716e-05, "loss": 0.0095, "step": 692780 }, { "epoch": 1.8, "learning_rate": 3.062825800130125e-05, "loss": 0.007, "step": 692790 }, { "epoch": 1.8, "learning_rate": 3.0624369784929785e-05, "loss": 0.0089, "step": 692800 }, { "epoch": 1.8, "learning_rate": 3.062048156855832e-05, "loss": 0.0064, "step": 692810 }, { "epoch": 1.8, "learning_rate": 3.061659335218686e-05, "loss": 0.0077, "step": 692820 }, { "epoch": 1.8, "learning_rate": 3.06127051358154e-05, "loss": 0.0086, "step": 692830 }, { "epoch": 1.8, "learning_rate": 3.060881691944393e-05, "loss": 0.0069, "step": 692840 }, { "epoch": 1.8, "learning_rate": 3.0604928703072467e-05, "loss": 0.0076, "step": 692850 }, { "epoch": 1.8, "learning_rate": 3.0601040486701e-05, "loss": 0.01, "step": 692860 }, { "epoch": 1.8, "learning_rate": 3.0597152270329536e-05, "loss": 0.0073, "step": 692870 }, { "epoch": 1.8, "learning_rate": 3.059326405395807e-05, "loss": 0.0079, "step": 692880 }, { "epoch": 1.8, "learning_rate": 3.0589375837586606e-05, "loss": 0.0094, "step": 692890 }, { "epoch": 1.8, "learning_rate": 3.058548762121514e-05, "loss": 0.0068, "step": 692900 }, { "epoch": 1.8, "learning_rate": 3.0581599404843676e-05, "loss": 0.011, "step": 692910 }, { "epoch": 1.8, "learning_rate": 3.057771118847221e-05, "loss": 0.0069, "step": 692920 }, { "epoch": 1.8, "learning_rate": 3.0573822972100745e-05, "loss": 0.0057, "step": 692930 }, { "epoch": 1.8, "learning_rate": 3.056993475572928e-05, "loss": 0.0117, "step": 692940 }, { "epoch": 1.8, "learning_rate": 3.056604653935782e-05, "loss": 0.008, "step": 692950 }, { "epoch": 1.8, "learning_rate": 3.056215832298636e-05, "loss": 0.01, "step": 692960 }, { "epoch": 1.8, "learning_rate": 3.055827010661489e-05, "loss": 0.0088, "step": 692970 }, { "epoch": 1.8, "learning_rate": 3.0554381890243426e-05, "loss": 0.0077, "step": 692980 }, { "epoch": 1.8, "learning_rate": 3.055049367387196e-05, "loss": 0.0051, "step": 692990 }, { "epoch": 1.8, "learning_rate": 3.0546605457500496e-05, "loss": 0.0101, "step": 693000 }, { "epoch": 1.8, "eval_cer": 0.8816495001196689, "eval_loss": 0.004749494604766369, "eval_runtime": 107.7534, "eval_samples_per_second": 18.561, "eval_steps_per_second": 4.64, "step": 693000 }, { "epoch": 1.8, "learning_rate": 3.054271724112903e-05, "loss": 0.0095, "step": 693010 }, { "epoch": 1.8, "learning_rate": 3.0538829024757566e-05, "loss": 0.0098, "step": 693020 }, { "epoch": 1.8, "learning_rate": 3.05349408083861e-05, "loss": 0.0081, "step": 693030 }, { "epoch": 1.8, "learning_rate": 3.0531052592014636e-05, "loss": 0.0101, "step": 693040 }, { "epoch": 1.8, "learning_rate": 3.052716437564317e-05, "loss": 0.0067, "step": 693050 }, { "epoch": 1.8, "learning_rate": 3.0523276159271705e-05, "loss": 0.0094, "step": 693060 }, { "epoch": 1.8, "learning_rate": 3.051938794290024e-05, "loss": 0.0082, "step": 693070 }, { "epoch": 1.8, "learning_rate": 3.051549972652878e-05, "loss": 0.0078, "step": 693080 }, { "epoch": 1.8, "learning_rate": 3.0511611510157313e-05, "loss": 0.0077, "step": 693090 }, { "epoch": 1.8, "learning_rate": 3.050772329378585e-05, "loss": 0.0063, "step": 693100 }, { "epoch": 1.8, "learning_rate": 3.0503835077414386e-05, "loss": 0.0076, "step": 693110 }, { "epoch": 1.8, "learning_rate": 3.049994686104292e-05, "loss": 0.0085, "step": 693120 }, { "epoch": 1.8, "learning_rate": 3.0496058644671456e-05, "loss": 0.0059, "step": 693130 }, { "epoch": 1.8, "learning_rate": 3.0492170428299994e-05, "loss": 0.0096, "step": 693140 }, { "epoch": 1.8, "learning_rate": 3.0488282211928526e-05, "loss": 0.0056, "step": 693150 }, { "epoch": 1.8, "learning_rate": 3.048439399555706e-05, "loss": 0.0072, "step": 693160 }, { "epoch": 1.8, "learning_rate": 3.0480505779185596e-05, "loss": 0.0051, "step": 693170 }, { "epoch": 1.8, "learning_rate": 3.047661756281413e-05, "loss": 0.0062, "step": 693180 }, { "epoch": 1.8, "learning_rate": 3.047272934644267e-05, "loss": 0.0079, "step": 693190 }, { "epoch": 1.8, "learning_rate": 3.0468841130071204e-05, "loss": 0.0073, "step": 693200 }, { "epoch": 1.8, "learning_rate": 3.046495291369974e-05, "loss": 0.0084, "step": 693210 }, { "epoch": 1.8, "learning_rate": 3.0461064697328273e-05, "loss": 0.0073, "step": 693220 }, { "epoch": 1.8, "learning_rate": 3.045717648095681e-05, "loss": 0.0073, "step": 693230 }, { "epoch": 1.8, "learning_rate": 3.0453288264585346e-05, "loss": 0.0048, "step": 693240 }, { "epoch": 1.8, "learning_rate": 3.044940004821388e-05, "loss": 0.0102, "step": 693250 }, { "epoch": 1.8, "learning_rate": 3.0445511831842416e-05, "loss": 0.0093, "step": 693260 }, { "epoch": 1.8, "learning_rate": 3.0441623615470954e-05, "loss": 0.0064, "step": 693270 }, { "epoch": 1.8, "learning_rate": 3.0437735399099486e-05, "loss": 0.0091, "step": 693280 }, { "epoch": 1.8, "learning_rate": 3.043384718272802e-05, "loss": 0.0074, "step": 693290 }, { "epoch": 1.8, "learning_rate": 3.0429958966356556e-05, "loss": 0.008, "step": 693300 }, { "epoch": 1.8, "learning_rate": 3.042607074998509e-05, "loss": 0.0085, "step": 693310 }, { "epoch": 1.8, "learning_rate": 3.042218253361363e-05, "loss": 0.0093, "step": 693320 }, { "epoch": 1.8, "learning_rate": 3.0418294317242164e-05, "loss": 0.0062, "step": 693330 }, { "epoch": 1.8, "learning_rate": 3.04144061008707e-05, "loss": 0.0081, "step": 693340 }, { "epoch": 1.8, "learning_rate": 3.0410517884499233e-05, "loss": 0.0095, "step": 693350 }, { "epoch": 1.8, "learning_rate": 3.040662966812777e-05, "loss": 0.0085, "step": 693360 }, { "epoch": 1.8, "learning_rate": 3.0402741451756306e-05, "loss": 0.0078, "step": 693370 }, { "epoch": 1.8, "learning_rate": 3.039885323538484e-05, "loss": 0.007, "step": 693380 }, { "epoch": 1.8, "learning_rate": 3.0394965019013376e-05, "loss": 0.0087, "step": 693390 }, { "epoch": 1.8, "learning_rate": 3.0391076802641908e-05, "loss": 0.0087, "step": 693400 }, { "epoch": 1.8, "learning_rate": 3.0387188586270446e-05, "loss": 0.0043, "step": 693410 }, { "epoch": 1.8, "learning_rate": 3.038330036989898e-05, "loss": 0.0086, "step": 693420 }, { "epoch": 1.8, "learning_rate": 3.0379412153527516e-05, "loss": 0.0085, "step": 693430 }, { "epoch": 1.8, "learning_rate": 3.037552393715605e-05, "loss": 0.0059, "step": 693440 }, { "epoch": 1.8, "learning_rate": 3.037163572078459e-05, "loss": 0.0065, "step": 693450 }, { "epoch": 1.8, "learning_rate": 3.0367747504413124e-05, "loss": 0.0062, "step": 693460 }, { "epoch": 1.8, "learning_rate": 3.036385928804166e-05, "loss": 0.012, "step": 693470 }, { "epoch": 1.8, "learning_rate": 3.0359971071670193e-05, "loss": 0.0097, "step": 693480 }, { "epoch": 1.8, "learning_rate": 3.035608285529873e-05, "loss": 0.0073, "step": 693490 }, { "epoch": 1.8, "learning_rate": 3.0352194638927266e-05, "loss": 0.0085, "step": 693500 }, { "epoch": 1.8, "learning_rate": 3.03483064225558e-05, "loss": 0.0051, "step": 693510 }, { "epoch": 1.8, "learning_rate": 3.0344418206184336e-05, "loss": 0.006, "step": 693520 }, { "epoch": 1.8, "learning_rate": 3.0340529989812868e-05, "loss": 0.0079, "step": 693530 }, { "epoch": 1.8, "learning_rate": 3.0336641773441406e-05, "loss": 0.0069, "step": 693540 }, { "epoch": 1.8, "learning_rate": 3.033275355706994e-05, "loss": 0.0067, "step": 693550 }, { "epoch": 1.8, "learning_rate": 3.0328865340698476e-05, "loss": 0.0064, "step": 693560 }, { "epoch": 1.8, "learning_rate": 3.032497712432701e-05, "loss": 0.0083, "step": 693570 }, { "epoch": 1.8, "learning_rate": 3.032108890795555e-05, "loss": 0.0091, "step": 693580 }, { "epoch": 1.8, "learning_rate": 3.0317200691584084e-05, "loss": 0.0073, "step": 693590 }, { "epoch": 1.8, "learning_rate": 3.031331247521262e-05, "loss": 0.0061, "step": 693600 }, { "epoch": 1.8, "learning_rate": 3.0309424258841153e-05, "loss": 0.0078, "step": 693610 }, { "epoch": 1.8, "learning_rate": 3.030553604246969e-05, "loss": 0.0076, "step": 693620 }, { "epoch": 1.8, "learning_rate": 3.0301647826098226e-05, "loss": 0.0086, "step": 693630 }, { "epoch": 1.8, "learning_rate": 3.029775960972676e-05, "loss": 0.0075, "step": 693640 }, { "epoch": 1.8, "learning_rate": 3.0293871393355293e-05, "loss": 0.0074, "step": 693650 }, { "epoch": 1.8, "learning_rate": 3.0289983176983828e-05, "loss": 0.0059, "step": 693660 }, { "epoch": 1.8, "learning_rate": 3.0286094960612366e-05, "loss": 0.008, "step": 693670 }, { "epoch": 1.8, "learning_rate": 3.02822067442409e-05, "loss": 0.0063, "step": 693680 }, { "epoch": 1.8, "learning_rate": 3.0278318527869436e-05, "loss": 0.0066, "step": 693690 }, { "epoch": 1.8, "learning_rate": 3.027443031149797e-05, "loss": 0.0074, "step": 693700 }, { "epoch": 1.8, "learning_rate": 3.027054209512651e-05, "loss": 0.0076, "step": 693710 }, { "epoch": 1.8, "learning_rate": 3.0266653878755044e-05, "loss": 0.0089, "step": 693720 }, { "epoch": 1.8, "learning_rate": 3.026276566238358e-05, "loss": 0.0085, "step": 693730 }, { "epoch": 1.8, "learning_rate": 3.0258877446012113e-05, "loss": 0.0093, "step": 693740 }, { "epoch": 1.8, "learning_rate": 3.025498922964065e-05, "loss": 0.0068, "step": 693750 }, { "epoch": 1.8, "learning_rate": 3.0251101013269186e-05, "loss": 0.0084, "step": 693760 }, { "epoch": 1.8, "learning_rate": 3.0247212796897718e-05, "loss": 0.0095, "step": 693770 }, { "epoch": 1.8, "learning_rate": 3.0243324580526253e-05, "loss": 0.0083, "step": 693780 }, { "epoch": 1.8, "learning_rate": 3.0239436364154788e-05, "loss": 0.0114, "step": 693790 }, { "epoch": 1.8, "learning_rate": 3.0235548147783326e-05, "loss": 0.0059, "step": 693800 }, { "epoch": 1.8, "learning_rate": 3.023165993141186e-05, "loss": 0.0071, "step": 693810 }, { "epoch": 1.8, "learning_rate": 3.0227771715040396e-05, "loss": 0.0078, "step": 693820 }, { "epoch": 1.8, "learning_rate": 3.022388349866893e-05, "loss": 0.0057, "step": 693830 }, { "epoch": 1.8, "learning_rate": 3.021999528229747e-05, "loss": 0.0082, "step": 693840 }, { "epoch": 1.8, "learning_rate": 3.0216107065926003e-05, "loss": 0.0058, "step": 693850 }, { "epoch": 1.8, "learning_rate": 3.021221884955454e-05, "loss": 0.0056, "step": 693860 }, { "epoch": 1.8, "learning_rate": 3.0208330633183073e-05, "loss": 0.0099, "step": 693870 }, { "epoch": 1.8, "learning_rate": 3.020444241681161e-05, "loss": 0.007, "step": 693880 }, { "epoch": 1.8, "learning_rate": 3.0200554200440146e-05, "loss": 0.0064, "step": 693890 }, { "epoch": 1.8, "learning_rate": 3.0196665984068678e-05, "loss": 0.0073, "step": 693900 }, { "epoch": 1.8, "learning_rate": 3.0192777767697213e-05, "loss": 0.0082, "step": 693910 }, { "epoch": 1.8, "learning_rate": 3.0188889551325748e-05, "loss": 0.0074, "step": 693920 }, { "epoch": 1.8, "learning_rate": 3.0185001334954286e-05, "loss": 0.0084, "step": 693930 }, { "epoch": 1.8, "learning_rate": 3.018111311858282e-05, "loss": 0.0077, "step": 693940 }, { "epoch": 1.8, "learning_rate": 3.0177224902211355e-05, "loss": 0.0073, "step": 693950 }, { "epoch": 1.8, "learning_rate": 3.017333668583989e-05, "loss": 0.0083, "step": 693960 }, { "epoch": 1.8, "learning_rate": 3.0169448469468425e-05, "loss": 0.0098, "step": 693970 }, { "epoch": 1.8, "learning_rate": 3.0165560253096963e-05, "loss": 0.0079, "step": 693980 }, { "epoch": 1.8, "learning_rate": 3.01616720367255e-05, "loss": 0.0069, "step": 693990 }, { "epoch": 1.8, "learning_rate": 3.0157783820354033e-05, "loss": 0.0054, "step": 694000 }, { "epoch": 1.8, "eval_cer": 0.8816662957628791, "eval_loss": 0.004784898832440376, "eval_runtime": 107.6263, "eval_samples_per_second": 18.583, "eval_steps_per_second": 4.646, "step": 694000 }, { "epoch": 1.8, "learning_rate": 3.0153895603982568e-05, "loss": 0.0083, "step": 694010 }, { "epoch": 1.8, "learning_rate": 3.01500073876111e-05, "loss": 0.0052, "step": 694020 }, { "epoch": 1.8, "learning_rate": 3.0146119171239638e-05, "loss": 0.0085, "step": 694030 }, { "epoch": 1.8, "learning_rate": 3.0142230954868173e-05, "loss": 0.0062, "step": 694040 }, { "epoch": 1.8, "learning_rate": 3.0138342738496707e-05, "loss": 0.0069, "step": 694050 }, { "epoch": 1.8, "learning_rate": 3.0134454522125242e-05, "loss": 0.0099, "step": 694060 }, { "epoch": 1.8, "learning_rate": 3.013056630575378e-05, "loss": 0.0084, "step": 694070 }, { "epoch": 1.8, "learning_rate": 3.0126678089382315e-05, "loss": 0.0077, "step": 694080 }, { "epoch": 1.8, "learning_rate": 3.012278987301085e-05, "loss": 0.009, "step": 694090 }, { "epoch": 1.8, "learning_rate": 3.0118901656639385e-05, "loss": 0.0085, "step": 694100 }, { "epoch": 1.8, "learning_rate": 3.0115013440267923e-05, "loss": 0.0083, "step": 694110 }, { "epoch": 1.8, "learning_rate": 3.0111125223896458e-05, "loss": 0.0064, "step": 694120 }, { "epoch": 1.8, "learning_rate": 3.0107237007524993e-05, "loss": 0.0077, "step": 694130 }, { "epoch": 1.8, "learning_rate": 3.0103348791153528e-05, "loss": 0.0094, "step": 694140 }, { "epoch": 1.8, "learning_rate": 3.009946057478206e-05, "loss": 0.0068, "step": 694150 }, { "epoch": 1.8, "learning_rate": 3.0095572358410598e-05, "loss": 0.0071, "step": 694160 }, { "epoch": 1.8, "learning_rate": 3.0091684142039133e-05, "loss": 0.0049, "step": 694170 }, { "epoch": 1.8, "learning_rate": 3.0087795925667667e-05, "loss": 0.0085, "step": 694180 }, { "epoch": 1.8, "learning_rate": 3.0083907709296202e-05, "loss": 0.0061, "step": 694190 }, { "epoch": 1.8, "learning_rate": 3.008001949292474e-05, "loss": 0.0077, "step": 694200 }, { "epoch": 1.8, "learning_rate": 3.0076131276553275e-05, "loss": 0.0078, "step": 694210 }, { "epoch": 1.8, "learning_rate": 3.007224306018181e-05, "loss": 0.0052, "step": 694220 }, { "epoch": 1.8, "learning_rate": 3.0068354843810345e-05, "loss": 0.0056, "step": 694230 }, { "epoch": 1.8, "learning_rate": 3.0064466627438883e-05, "loss": 0.0077, "step": 694240 }, { "epoch": 1.8, "learning_rate": 3.0060578411067418e-05, "loss": 0.0086, "step": 694250 }, { "epoch": 1.8, "learning_rate": 3.0056690194695953e-05, "loss": 0.008, "step": 694260 }, { "epoch": 1.8, "learning_rate": 3.0052801978324485e-05, "loss": 0.0077, "step": 694270 }, { "epoch": 1.8, "learning_rate": 3.004891376195302e-05, "loss": 0.0058, "step": 694280 }, { "epoch": 1.8, "learning_rate": 3.0045025545581558e-05, "loss": 0.0093, "step": 694290 }, { "epoch": 1.8, "learning_rate": 3.0041137329210093e-05, "loss": 0.0075, "step": 694300 }, { "epoch": 1.8, "learning_rate": 3.0037249112838627e-05, "loss": 0.0066, "step": 694310 }, { "epoch": 1.8, "learning_rate": 3.0033360896467162e-05, "loss": 0.0063, "step": 694320 }, { "epoch": 1.8, "learning_rate": 3.00294726800957e-05, "loss": 0.0088, "step": 694330 }, { "epoch": 1.8, "learning_rate": 3.0025584463724235e-05, "loss": 0.0078, "step": 694340 }, { "epoch": 1.8, "learning_rate": 3.002169624735277e-05, "loss": 0.0088, "step": 694350 }, { "epoch": 1.8, "learning_rate": 3.0017808030981305e-05, "loss": 0.01, "step": 694360 }, { "epoch": 1.8, "learning_rate": 3.0013919814609843e-05, "loss": 0.0057, "step": 694370 }, { "epoch": 1.8, "learning_rate": 3.0010031598238378e-05, "loss": 0.0085, "step": 694380 }, { "epoch": 1.8, "learning_rate": 3.000614338186691e-05, "loss": 0.0082, "step": 694390 }, { "epoch": 1.8, "learning_rate": 3.0002255165495445e-05, "loss": 0.0072, "step": 694400 }, { "epoch": 1.8, "learning_rate": 2.999836694912398e-05, "loss": 0.007, "step": 694410 }, { "epoch": 1.8, "learning_rate": 2.9994478732752518e-05, "loss": 0.0086, "step": 694420 }, { "epoch": 1.8, "learning_rate": 2.9990590516381053e-05, "loss": 0.0055, "step": 694430 }, { "epoch": 1.8, "learning_rate": 2.9986702300009587e-05, "loss": 0.0075, "step": 694440 }, { "epoch": 1.8, "learning_rate": 2.9982814083638122e-05, "loss": 0.0054, "step": 694450 }, { "epoch": 1.8, "learning_rate": 2.997892586726666e-05, "loss": 0.0064, "step": 694460 }, { "epoch": 1.8, "learning_rate": 2.9975037650895195e-05, "loss": 0.007, "step": 694470 }, { "epoch": 1.8, "learning_rate": 2.997114943452373e-05, "loss": 0.0065, "step": 694480 }, { "epoch": 1.8, "learning_rate": 2.9967261218152265e-05, "loss": 0.0161, "step": 694490 }, { "epoch": 1.8, "learning_rate": 2.9963373001780803e-05, "loss": 0.0084, "step": 694500 }, { "epoch": 1.8, "learning_rate": 2.9959484785409338e-05, "loss": 0.0044, "step": 694510 }, { "epoch": 1.8, "learning_rate": 2.995559656903787e-05, "loss": 0.0082, "step": 694520 }, { "epoch": 1.8, "learning_rate": 2.9951708352666405e-05, "loss": 0.01, "step": 694530 }, { "epoch": 1.8, "learning_rate": 2.994782013629494e-05, "loss": 0.0047, "step": 694540 }, { "epoch": 1.8, "learning_rate": 2.9943931919923478e-05, "loss": 0.0069, "step": 694550 }, { "epoch": 1.8, "learning_rate": 2.9940043703552013e-05, "loss": 0.006, "step": 694560 }, { "epoch": 1.8, "learning_rate": 2.9936155487180547e-05, "loss": 0.0093, "step": 694570 }, { "epoch": 1.8, "learning_rate": 2.9932267270809082e-05, "loss": 0.0117, "step": 694580 }, { "epoch": 1.8, "learning_rate": 2.992837905443762e-05, "loss": 0.0067, "step": 694590 }, { "epoch": 1.8, "learning_rate": 2.9924490838066155e-05, "loss": 0.0082, "step": 694600 }, { "epoch": 1.8, "learning_rate": 2.992060262169469e-05, "loss": 0.0077, "step": 694610 }, { "epoch": 1.8, "learning_rate": 2.9916714405323225e-05, "loss": 0.0084, "step": 694620 }, { "epoch": 1.8, "learning_rate": 2.9912826188951763e-05, "loss": 0.0068, "step": 694630 }, { "epoch": 1.8, "learning_rate": 2.9908937972580295e-05, "loss": 0.01, "step": 694640 }, { "epoch": 1.8, "learning_rate": 2.990504975620883e-05, "loss": 0.0085, "step": 694650 }, { "epoch": 1.8, "learning_rate": 2.9901161539837365e-05, "loss": 0.0065, "step": 694660 }, { "epoch": 1.8, "learning_rate": 2.98972733234659e-05, "loss": 0.0091, "step": 694670 }, { "epoch": 1.8, "learning_rate": 2.9893385107094438e-05, "loss": 0.0089, "step": 694680 }, { "epoch": 1.8, "learning_rate": 2.9889496890722973e-05, "loss": 0.0081, "step": 694690 }, { "epoch": 1.8, "learning_rate": 2.9885608674351507e-05, "loss": 0.0082, "step": 694700 }, { "epoch": 1.8, "learning_rate": 2.9881720457980042e-05, "loss": 0.0085, "step": 694710 }, { "epoch": 1.8, "learning_rate": 2.987783224160858e-05, "loss": 0.008, "step": 694720 }, { "epoch": 1.8, "learning_rate": 2.9873944025237115e-05, "loss": 0.0071, "step": 694730 }, { "epoch": 1.8, "learning_rate": 2.987005580886565e-05, "loss": 0.0084, "step": 694740 }, { "epoch": 1.8, "learning_rate": 2.9866167592494185e-05, "loss": 0.0079, "step": 694750 }, { "epoch": 1.8, "learning_rate": 2.9862279376122723e-05, "loss": 0.0062, "step": 694760 }, { "epoch": 1.8, "learning_rate": 2.9858391159751255e-05, "loss": 0.0104, "step": 694770 }, { "epoch": 1.8, "learning_rate": 2.985450294337979e-05, "loss": 0.0079, "step": 694780 }, { "epoch": 1.8, "learning_rate": 2.9850614727008325e-05, "loss": 0.008, "step": 694790 }, { "epoch": 1.8, "learning_rate": 2.984672651063686e-05, "loss": 0.006, "step": 694800 }, { "epoch": 1.8, "learning_rate": 2.9842838294265398e-05, "loss": 0.0117, "step": 694810 }, { "epoch": 1.8, "learning_rate": 2.9838950077893932e-05, "loss": 0.0093, "step": 694820 }, { "epoch": 1.8, "learning_rate": 2.9835061861522467e-05, "loss": 0.0068, "step": 694830 }, { "epoch": 1.8, "learning_rate": 2.9831173645151002e-05, "loss": 0.0088, "step": 694840 }, { "epoch": 1.8, "learning_rate": 2.982728542877954e-05, "loss": 0.0091, "step": 694850 }, { "epoch": 1.8, "learning_rate": 2.9823397212408075e-05, "loss": 0.0075, "step": 694860 }, { "epoch": 1.8, "learning_rate": 2.981950899603661e-05, "loss": 0.0054, "step": 694870 }, { "epoch": 1.8, "learning_rate": 2.9815620779665145e-05, "loss": 0.0076, "step": 694880 }, { "epoch": 1.8, "learning_rate": 2.9811732563293677e-05, "loss": 0.0092, "step": 694890 }, { "epoch": 1.8, "learning_rate": 2.9807844346922215e-05, "loss": 0.0069, "step": 694900 }, { "epoch": 1.8, "learning_rate": 2.980395613055075e-05, "loss": 0.0064, "step": 694910 }, { "epoch": 1.8, "learning_rate": 2.9800067914179284e-05, "loss": 0.0075, "step": 694920 }, { "epoch": 1.8, "learning_rate": 2.979617969780782e-05, "loss": 0.0073, "step": 694930 }, { "epoch": 1.8, "learning_rate": 2.9792291481436358e-05, "loss": 0.0077, "step": 694940 }, { "epoch": 1.8, "learning_rate": 2.9788403265064892e-05, "loss": 0.008, "step": 694950 }, { "epoch": 1.8, "learning_rate": 2.9784515048693427e-05, "loss": 0.0084, "step": 694960 }, { "epoch": 1.8, "learning_rate": 2.9780626832321962e-05, "loss": 0.0057, "step": 694970 }, { "epoch": 1.8, "learning_rate": 2.97767386159505e-05, "loss": 0.0087, "step": 694980 }, { "epoch": 1.8, "learning_rate": 2.9772850399579035e-05, "loss": 0.0091, "step": 694990 }, { "epoch": 1.8, "learning_rate": 2.976896218320757e-05, "loss": 0.006, "step": 695000 }, { "epoch": 1.8, "eval_cer": 0.8816872903168917, "eval_loss": 0.004791451618075371, "eval_runtime": 107.7436, "eval_samples_per_second": 18.563, "eval_steps_per_second": 4.641, "step": 695000 }, { "epoch": 1.8, "learning_rate": 2.97650739668361e-05, "loss": 0.0068, "step": 695010 }, { "epoch": 1.8, "learning_rate": 2.9761185750464636e-05, "loss": 0.0071, "step": 695020 }, { "epoch": 1.8, "learning_rate": 2.9757297534093175e-05, "loss": 0.0068, "step": 695030 }, { "epoch": 1.8, "learning_rate": 2.975340931772171e-05, "loss": 0.0083, "step": 695040 }, { "epoch": 1.8, "learning_rate": 2.9749521101350244e-05, "loss": 0.0074, "step": 695050 }, { "epoch": 1.8, "learning_rate": 2.974563288497878e-05, "loss": 0.0067, "step": 695060 }, { "epoch": 1.8, "learning_rate": 2.9741744668607318e-05, "loss": 0.0067, "step": 695070 }, { "epoch": 1.8, "learning_rate": 2.9737856452235852e-05, "loss": 0.0086, "step": 695080 }, { "epoch": 1.8, "learning_rate": 2.9733968235864387e-05, "loss": 0.0098, "step": 695090 }, { "epoch": 1.8, "learning_rate": 2.9730080019492922e-05, "loss": 0.0082, "step": 695100 }, { "epoch": 1.8, "learning_rate": 2.972619180312146e-05, "loss": 0.0086, "step": 695110 }, { "epoch": 1.8, "learning_rate": 2.9722303586749995e-05, "loss": 0.0067, "step": 695120 }, { "epoch": 1.8, "learning_rate": 2.971841537037853e-05, "loss": 0.0071, "step": 695130 }, { "epoch": 1.8, "learning_rate": 2.971452715400706e-05, "loss": 0.0089, "step": 695140 }, { "epoch": 1.8, "learning_rate": 2.9710638937635596e-05, "loss": 0.0102, "step": 695150 }, { "epoch": 1.8, "learning_rate": 2.9706750721264135e-05, "loss": 0.0084, "step": 695160 }, { "epoch": 1.8, "learning_rate": 2.970286250489267e-05, "loss": 0.009, "step": 695170 }, { "epoch": 1.8, "learning_rate": 2.9698974288521204e-05, "loss": 0.0071, "step": 695180 }, { "epoch": 1.8, "learning_rate": 2.969508607214974e-05, "loss": 0.0072, "step": 695190 }, { "epoch": 1.8, "learning_rate": 2.9691197855778278e-05, "loss": 0.0094, "step": 695200 }, { "epoch": 1.8, "learning_rate": 2.9687309639406812e-05, "loss": 0.0067, "step": 695210 }, { "epoch": 1.8, "learning_rate": 2.9683421423035347e-05, "loss": 0.0068, "step": 695220 }, { "epoch": 1.8, "learning_rate": 2.9679533206663882e-05, "loss": 0.0092, "step": 695230 }, { "epoch": 1.8, "learning_rate": 2.967564499029242e-05, "loss": 0.0066, "step": 695240 }, { "epoch": 1.8, "learning_rate": 2.9671756773920955e-05, "loss": 0.0068, "step": 695250 }, { "epoch": 1.8, "learning_rate": 2.9667868557549487e-05, "loss": 0.009, "step": 695260 }, { "epoch": 1.8, "learning_rate": 2.966398034117802e-05, "loss": 0.0072, "step": 695270 }, { "epoch": 1.8, "learning_rate": 2.9660092124806556e-05, "loss": 0.0061, "step": 695280 }, { "epoch": 1.8, "learning_rate": 2.9656203908435095e-05, "loss": 0.0067, "step": 695290 }, { "epoch": 1.8, "learning_rate": 2.965231569206363e-05, "loss": 0.0115, "step": 695300 }, { "epoch": 1.8, "learning_rate": 2.9648427475692164e-05, "loss": 0.0072, "step": 695310 }, { "epoch": 1.8, "learning_rate": 2.96445392593207e-05, "loss": 0.007, "step": 695320 }, { "epoch": 1.8, "learning_rate": 2.9640651042949234e-05, "loss": 0.0072, "step": 695330 }, { "epoch": 1.8, "learning_rate": 2.9636762826577772e-05, "loss": 0.0081, "step": 695340 }, { "epoch": 1.8, "learning_rate": 2.9632874610206307e-05, "loss": 0.0044, "step": 695350 }, { "epoch": 1.8, "learning_rate": 2.9628986393834842e-05, "loss": 0.0065, "step": 695360 }, { "epoch": 1.8, "learning_rate": 2.9625098177463377e-05, "loss": 0.0087, "step": 695370 }, { "epoch": 1.8, "learning_rate": 2.9621209961091915e-05, "loss": 0.0099, "step": 695380 }, { "epoch": 1.8, "learning_rate": 2.9617321744720447e-05, "loss": 0.0067, "step": 695390 }, { "epoch": 1.8, "learning_rate": 2.961343352834898e-05, "loss": 0.0068, "step": 695400 }, { "epoch": 1.8, "learning_rate": 2.9609545311977516e-05, "loss": 0.0074, "step": 695410 }, { "epoch": 1.8, "learning_rate": 2.960565709560605e-05, "loss": 0.0064, "step": 695420 }, { "epoch": 1.8, "learning_rate": 2.960176887923459e-05, "loss": 0.009, "step": 695430 }, { "epoch": 1.8, "learning_rate": 2.9597880662863124e-05, "loss": 0.0077, "step": 695440 }, { "epoch": 1.8, "learning_rate": 2.959399244649166e-05, "loss": 0.0077, "step": 695450 }, { "epoch": 1.8, "learning_rate": 2.9590104230120194e-05, "loss": 0.0069, "step": 695460 }, { "epoch": 1.8, "learning_rate": 2.9586216013748732e-05, "loss": 0.0089, "step": 695470 }, { "epoch": 1.8, "learning_rate": 2.9582327797377267e-05, "loss": 0.0056, "step": 695480 }, { "epoch": 1.8, "learning_rate": 2.9578439581005802e-05, "loss": 0.0116, "step": 695490 }, { "epoch": 1.8, "learning_rate": 2.9574551364634337e-05, "loss": 0.006, "step": 695500 }, { "epoch": 1.8, "learning_rate": 2.957066314826287e-05, "loss": 0.0073, "step": 695510 }, { "epoch": 1.8, "learning_rate": 2.9566774931891407e-05, "loss": 0.0092, "step": 695520 }, { "epoch": 1.8, "learning_rate": 2.956288671551994e-05, "loss": 0.0064, "step": 695530 }, { "epoch": 1.8, "learning_rate": 2.9558998499148476e-05, "loss": 0.0062, "step": 695540 }, { "epoch": 1.8, "learning_rate": 2.955511028277701e-05, "loss": 0.0077, "step": 695550 }, { "epoch": 1.8, "learning_rate": 2.955122206640555e-05, "loss": 0.009, "step": 695560 }, { "epoch": 1.8, "learning_rate": 2.9547333850034084e-05, "loss": 0.0082, "step": 695570 }, { "epoch": 1.8, "learning_rate": 2.954344563366262e-05, "loss": 0.0051, "step": 695580 }, { "epoch": 1.8, "learning_rate": 2.9539557417291154e-05, "loss": 0.0059, "step": 695590 }, { "epoch": 1.8, "learning_rate": 2.9535669200919692e-05, "loss": 0.0086, "step": 695600 }, { "epoch": 1.8, "learning_rate": 2.9531780984548227e-05, "loss": 0.0071, "step": 695610 }, { "epoch": 1.8, "learning_rate": 2.9527892768176762e-05, "loss": 0.0065, "step": 695620 }, { "epoch": 1.8, "learning_rate": 2.9524004551805294e-05, "loss": 0.0085, "step": 695630 }, { "epoch": 1.8, "learning_rate": 2.952011633543383e-05, "loss": 0.0078, "step": 695640 }, { "epoch": 1.8, "learning_rate": 2.9516228119062367e-05, "loss": 0.0067, "step": 695650 }, { "epoch": 1.8, "learning_rate": 2.95123399026909e-05, "loss": 0.0103, "step": 695660 }, { "epoch": 1.8, "learning_rate": 2.9508451686319436e-05, "loss": 0.0055, "step": 695670 }, { "epoch": 1.8, "learning_rate": 2.950456346994797e-05, "loss": 0.0063, "step": 695680 }, { "epoch": 1.8, "learning_rate": 2.950067525357651e-05, "loss": 0.0054, "step": 695690 }, { "epoch": 1.8, "learning_rate": 2.9496787037205044e-05, "loss": 0.0066, "step": 695700 }, { "epoch": 1.8, "learning_rate": 2.949289882083358e-05, "loss": 0.0071, "step": 695710 }, { "epoch": 1.8, "learning_rate": 2.9489010604462114e-05, "loss": 0.0051, "step": 695720 }, { "epoch": 1.8, "learning_rate": 2.9485122388090652e-05, "loss": 0.0071, "step": 695730 }, { "epoch": 1.8, "learning_rate": 2.9481234171719187e-05, "loss": 0.0062, "step": 695740 }, { "epoch": 1.8, "learning_rate": 2.9477345955347722e-05, "loss": 0.0094, "step": 695750 }, { "epoch": 1.8, "learning_rate": 2.9473457738976254e-05, "loss": 0.0092, "step": 695760 }, { "epoch": 1.8, "learning_rate": 2.946956952260479e-05, "loss": 0.0071, "step": 695770 }, { "epoch": 1.8, "learning_rate": 2.9465681306233327e-05, "loss": 0.0079, "step": 695780 }, { "epoch": 1.8, "learning_rate": 2.946179308986186e-05, "loss": 0.0091, "step": 695790 }, { "epoch": 1.8, "learning_rate": 2.9457904873490396e-05, "loss": 0.0066, "step": 695800 }, { "epoch": 1.8, "learning_rate": 2.945401665711893e-05, "loss": 0.0074, "step": 695810 }, { "epoch": 1.8, "learning_rate": 2.945012844074747e-05, "loss": 0.0069, "step": 695820 }, { "epoch": 1.8, "learning_rate": 2.9446240224376004e-05, "loss": 0.0087, "step": 695830 }, { "epoch": 1.8, "learning_rate": 2.944235200800454e-05, "loss": 0.0058, "step": 695840 }, { "epoch": 1.8, "learning_rate": 2.9438463791633074e-05, "loss": 0.0069, "step": 695850 }, { "epoch": 1.8, "learning_rate": 2.9434575575261612e-05, "loss": 0.0063, "step": 695860 }, { "epoch": 1.8, "learning_rate": 2.9430687358890147e-05, "loss": 0.0102, "step": 695870 }, { "epoch": 1.8, "learning_rate": 2.942679914251868e-05, "loss": 0.0098, "step": 695880 }, { "epoch": 1.8, "learning_rate": 2.9422910926147213e-05, "loss": 0.0089, "step": 695890 }, { "epoch": 1.8, "learning_rate": 2.941902270977575e-05, "loss": 0.0072, "step": 695900 }, { "epoch": 1.8, "learning_rate": 2.9415134493404287e-05, "loss": 0.0076, "step": 695910 }, { "epoch": 1.8, "learning_rate": 2.941124627703282e-05, "loss": 0.0105, "step": 695920 }, { "epoch": 1.8, "learning_rate": 2.9407358060661356e-05, "loss": 0.0059, "step": 695930 }, { "epoch": 1.8, "learning_rate": 2.940346984428989e-05, "loss": 0.009, "step": 695940 }, { "epoch": 1.8, "learning_rate": 2.939958162791843e-05, "loss": 0.0087, "step": 695950 }, { "epoch": 1.8, "learning_rate": 2.9395693411546964e-05, "loss": 0.0071, "step": 695960 }, { "epoch": 1.8, "learning_rate": 2.93918051951755e-05, "loss": 0.008, "step": 695970 }, { "epoch": 1.8, "learning_rate": 2.9387916978804034e-05, "loss": 0.0101, "step": 695980 }, { "epoch": 1.8, "learning_rate": 2.9384028762432572e-05, "loss": 0.0097, "step": 695990 }, { "epoch": 1.8, "learning_rate": 2.9380140546061107e-05, "loss": 0.0075, "step": 696000 }, { "epoch": 1.8, "eval_cer": 0.8816327044764588, "eval_loss": 0.004856035113334656, "eval_runtime": 107.862, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.636, "step": 696000 }, { "epoch": 1.8, "learning_rate": 2.937625232968964e-05, "loss": 0.0067, "step": 696010 }, { "epoch": 1.8, "learning_rate": 2.9372364113318173e-05, "loss": 0.0093, "step": 696020 }, { "epoch": 1.8, "learning_rate": 2.936847589694671e-05, "loss": 0.0081, "step": 696030 }, { "epoch": 1.8, "learning_rate": 2.9364587680575247e-05, "loss": 0.0079, "step": 696040 }, { "epoch": 1.8, "learning_rate": 2.936069946420378e-05, "loss": 0.0092, "step": 696050 }, { "epoch": 1.8, "learning_rate": 2.9356811247832316e-05, "loss": 0.0074, "step": 696060 }, { "epoch": 1.8, "learning_rate": 2.935292303146085e-05, "loss": 0.0087, "step": 696070 }, { "epoch": 1.8, "learning_rate": 2.934903481508939e-05, "loss": 0.0082, "step": 696080 }, { "epoch": 1.8, "learning_rate": 2.9345146598717924e-05, "loss": 0.0094, "step": 696090 }, { "epoch": 1.8, "learning_rate": 2.934125838234646e-05, "loss": 0.0068, "step": 696100 }, { "epoch": 1.8, "learning_rate": 2.9337370165974994e-05, "loss": 0.01, "step": 696110 }, { "epoch": 1.8, "learning_rate": 2.9333481949603532e-05, "loss": 0.0044, "step": 696120 }, { "epoch": 1.8, "learning_rate": 2.9329593733232064e-05, "loss": 0.0076, "step": 696130 }, { "epoch": 1.8, "learning_rate": 2.93257055168606e-05, "loss": 0.0076, "step": 696140 }, { "epoch": 1.8, "learning_rate": 2.9321817300489133e-05, "loss": 0.0061, "step": 696150 }, { "epoch": 1.8, "learning_rate": 2.9317929084117668e-05, "loss": 0.0067, "step": 696160 }, { "epoch": 1.8, "learning_rate": 2.9314040867746207e-05, "loss": 0.0063, "step": 696170 }, { "epoch": 1.8, "learning_rate": 2.931015265137474e-05, "loss": 0.0075, "step": 696180 }, { "epoch": 1.8, "learning_rate": 2.9306264435003276e-05, "loss": 0.0074, "step": 696190 }, { "epoch": 1.8, "learning_rate": 2.930237621863181e-05, "loss": 0.0049, "step": 696200 }, { "epoch": 1.8, "learning_rate": 2.929848800226035e-05, "loss": 0.0107, "step": 696210 }, { "epoch": 1.8, "learning_rate": 2.9294599785888884e-05, "loss": 0.0104, "step": 696220 }, { "epoch": 1.8, "learning_rate": 2.929071156951742e-05, "loss": 0.0075, "step": 696230 }, { "epoch": 1.8, "learning_rate": 2.9286823353145954e-05, "loss": 0.0061, "step": 696240 }, { "epoch": 1.8, "learning_rate": 2.9282935136774485e-05, "loss": 0.0098, "step": 696250 }, { "epoch": 1.8, "learning_rate": 2.9279046920403024e-05, "loss": 0.0066, "step": 696260 }, { "epoch": 1.8, "learning_rate": 2.927515870403156e-05, "loss": 0.0059, "step": 696270 }, { "epoch": 1.8, "learning_rate": 2.9271270487660093e-05, "loss": 0.0063, "step": 696280 }, { "epoch": 1.8, "learning_rate": 2.9267382271288628e-05, "loss": 0.0095, "step": 696290 }, { "epoch": 1.8, "learning_rate": 2.9263494054917167e-05, "loss": 0.0061, "step": 696300 }, { "epoch": 1.8, "learning_rate": 2.92596058385457e-05, "loss": 0.0081, "step": 696310 }, { "epoch": 1.8, "learning_rate": 2.9255717622174236e-05, "loss": 0.0081, "step": 696320 }, { "epoch": 1.8, "learning_rate": 2.925182940580277e-05, "loss": 0.0075, "step": 696330 }, { "epoch": 1.81, "learning_rate": 2.924794118943131e-05, "loss": 0.0068, "step": 696340 }, { "epoch": 1.81, "learning_rate": 2.9244052973059844e-05, "loss": 0.0119, "step": 696350 }, { "epoch": 1.81, "learning_rate": 2.924016475668838e-05, "loss": 0.0085, "step": 696360 }, { "epoch": 1.81, "learning_rate": 2.9236276540316914e-05, "loss": 0.0096, "step": 696370 }, { "epoch": 1.81, "learning_rate": 2.9232388323945445e-05, "loss": 0.0063, "step": 696380 }, { "epoch": 1.81, "learning_rate": 2.9228500107573984e-05, "loss": 0.0064, "step": 696390 }, { "epoch": 1.81, "learning_rate": 2.922461189120252e-05, "loss": 0.0083, "step": 696400 }, { "epoch": 1.81, "learning_rate": 2.9220723674831053e-05, "loss": 0.0079, "step": 696410 }, { "epoch": 1.81, "learning_rate": 2.9216835458459588e-05, "loss": 0.0084, "step": 696420 }, { "epoch": 1.81, "learning_rate": 2.9212947242088126e-05, "loss": 0.0059, "step": 696430 }, { "epoch": 1.81, "learning_rate": 2.920905902571666e-05, "loss": 0.0082, "step": 696440 }, { "epoch": 1.81, "learning_rate": 2.9205170809345196e-05, "loss": 0.0092, "step": 696450 }, { "epoch": 1.81, "learning_rate": 2.920128259297373e-05, "loss": 0.0068, "step": 696460 }, { "epoch": 1.81, "learning_rate": 2.919739437660227e-05, "loss": 0.0056, "step": 696470 }, { "epoch": 1.81, "learning_rate": 2.9193506160230804e-05, "loss": 0.0143, "step": 696480 }, { "epoch": 1.81, "learning_rate": 2.918961794385934e-05, "loss": 0.0075, "step": 696490 }, { "epoch": 1.81, "learning_rate": 2.918572972748787e-05, "loss": 0.011, "step": 696500 }, { "epoch": 1.81, "learning_rate": 2.9181841511116405e-05, "loss": 0.0062, "step": 696510 }, { "epoch": 1.81, "learning_rate": 2.9177953294744944e-05, "loss": 0.0065, "step": 696520 }, { "epoch": 1.81, "learning_rate": 2.917406507837348e-05, "loss": 0.0081, "step": 696530 }, { "epoch": 1.81, "learning_rate": 2.9170176862002013e-05, "loss": 0.0065, "step": 696540 }, { "epoch": 1.81, "learning_rate": 2.9166288645630548e-05, "loss": 0.0058, "step": 696550 }, { "epoch": 1.81, "learning_rate": 2.9162400429259086e-05, "loss": 0.0086, "step": 696560 }, { "epoch": 1.81, "learning_rate": 2.915851221288762e-05, "loss": 0.0067, "step": 696570 }, { "epoch": 1.81, "learning_rate": 2.9154623996516156e-05, "loss": 0.006, "step": 696580 }, { "epoch": 1.81, "learning_rate": 2.915073578014469e-05, "loss": 0.0071, "step": 696590 }, { "epoch": 1.81, "learning_rate": 2.914684756377323e-05, "loss": 0.0083, "step": 696600 }, { "epoch": 1.81, "learning_rate": 2.9142959347401764e-05, "loss": 0.0078, "step": 696610 }, { "epoch": 1.81, "learning_rate": 2.91390711310303e-05, "loss": 0.0063, "step": 696620 }, { "epoch": 1.81, "learning_rate": 2.913518291465883e-05, "loss": 0.0056, "step": 696630 }, { "epoch": 1.81, "learning_rate": 2.9131294698287365e-05, "loss": 0.0087, "step": 696640 }, { "epoch": 1.81, "learning_rate": 2.9127406481915904e-05, "loss": 0.0079, "step": 696650 }, { "epoch": 1.81, "learning_rate": 2.912351826554444e-05, "loss": 0.0077, "step": 696660 }, { "epoch": 1.81, "learning_rate": 2.9119630049172973e-05, "loss": 0.0091, "step": 696670 }, { "epoch": 1.81, "learning_rate": 2.9115741832801508e-05, "loss": 0.0072, "step": 696680 }, { "epoch": 1.81, "learning_rate": 2.9111853616430046e-05, "loss": 0.0057, "step": 696690 }, { "epoch": 1.81, "learning_rate": 2.910796540005858e-05, "loss": 0.0048, "step": 696700 }, { "epoch": 1.81, "learning_rate": 2.9104077183687116e-05, "loss": 0.0088, "step": 696710 }, { "epoch": 1.81, "learning_rate": 2.910018896731565e-05, "loss": 0.0059, "step": 696720 }, { "epoch": 1.81, "learning_rate": 2.9096300750944186e-05, "loss": 0.0071, "step": 696730 }, { "epoch": 1.81, "learning_rate": 2.9092412534572724e-05, "loss": 0.0062, "step": 696740 }, { "epoch": 1.81, "learning_rate": 2.9088524318201256e-05, "loss": 0.0076, "step": 696750 }, { "epoch": 1.81, "learning_rate": 2.908463610182979e-05, "loss": 0.0071, "step": 696760 }, { "epoch": 1.81, "learning_rate": 2.9080747885458325e-05, "loss": 0.0107, "step": 696770 }, { "epoch": 1.81, "learning_rate": 2.907685966908686e-05, "loss": 0.0069, "step": 696780 }, { "epoch": 1.81, "learning_rate": 2.90729714527154e-05, "loss": 0.0057, "step": 696790 }, { "epoch": 1.81, "learning_rate": 2.9069083236343933e-05, "loss": 0.0078, "step": 696800 }, { "epoch": 1.81, "learning_rate": 2.9065195019972468e-05, "loss": 0.007, "step": 696810 }, { "epoch": 1.81, "learning_rate": 2.9061306803601003e-05, "loss": 0.0079, "step": 696820 }, { "epoch": 1.81, "learning_rate": 2.905741858722954e-05, "loss": 0.0082, "step": 696830 }, { "epoch": 1.81, "learning_rate": 2.9053530370858076e-05, "loss": 0.0082, "step": 696840 }, { "epoch": 1.81, "learning_rate": 2.904964215448661e-05, "loss": 0.0071, "step": 696850 }, { "epoch": 1.81, "learning_rate": 2.9045753938115146e-05, "loss": 0.0075, "step": 696860 }, { "epoch": 1.81, "learning_rate": 2.9041865721743677e-05, "loss": 0.0085, "step": 696870 }, { "epoch": 1.81, "learning_rate": 2.9037977505372216e-05, "loss": 0.0078, "step": 696880 }, { "epoch": 1.81, "learning_rate": 2.903408928900075e-05, "loss": 0.0073, "step": 696890 }, { "epoch": 1.81, "learning_rate": 2.9030201072629285e-05, "loss": 0.0089, "step": 696900 }, { "epoch": 1.81, "learning_rate": 2.902631285625782e-05, "loss": 0.0078, "step": 696910 }, { "epoch": 1.81, "learning_rate": 2.902242463988636e-05, "loss": 0.007, "step": 696920 }, { "epoch": 1.81, "learning_rate": 2.9018536423514893e-05, "loss": 0.0085, "step": 696930 }, { "epoch": 1.81, "learning_rate": 2.9014648207143428e-05, "loss": 0.0078, "step": 696940 }, { "epoch": 1.81, "learning_rate": 2.9010759990771963e-05, "loss": 0.0088, "step": 696950 }, { "epoch": 1.81, "learning_rate": 2.90068717744005e-05, "loss": 0.0065, "step": 696960 }, { "epoch": 1.81, "learning_rate": 2.9002983558029036e-05, "loss": 0.0059, "step": 696970 }, { "epoch": 1.81, "learning_rate": 2.899909534165757e-05, "loss": 0.0056, "step": 696980 }, { "epoch": 1.81, "learning_rate": 2.8995207125286106e-05, "loss": 0.0086, "step": 696990 }, { "epoch": 1.81, "learning_rate": 2.8991318908914637e-05, "loss": 0.0083, "step": 697000 }, { "epoch": 1.81, "eval_cer": 0.8816564983043399, "eval_loss": 0.004735656548291445, "eval_runtime": 107.8044, "eval_samples_per_second": 18.552, "eval_steps_per_second": 4.638, "step": 697000 }, { "epoch": 1.81, "learning_rate": 2.8987430692543176e-05, "loss": 0.0103, "step": 697010 }, { "epoch": 1.81, "learning_rate": 2.898354247617171e-05, "loss": 0.0063, "step": 697020 }, { "epoch": 1.81, "learning_rate": 2.8979654259800245e-05, "loss": 0.0114, "step": 697030 }, { "epoch": 1.81, "learning_rate": 2.897576604342878e-05, "loss": 0.0059, "step": 697040 }, { "epoch": 1.81, "learning_rate": 2.897187782705732e-05, "loss": 0.0089, "step": 697050 }, { "epoch": 1.81, "learning_rate": 2.8967989610685853e-05, "loss": 0.0079, "step": 697060 }, { "epoch": 1.81, "learning_rate": 2.8964101394314388e-05, "loss": 0.0086, "step": 697070 }, { "epoch": 1.81, "learning_rate": 2.8960213177942923e-05, "loss": 0.0051, "step": 697080 }, { "epoch": 1.81, "learning_rate": 2.895632496157146e-05, "loss": 0.0071, "step": 697090 }, { "epoch": 1.81, "learning_rate": 2.8952436745199996e-05, "loss": 0.007, "step": 697100 }, { "epoch": 1.81, "learning_rate": 2.894854852882853e-05, "loss": 0.007, "step": 697110 }, { "epoch": 1.81, "learning_rate": 2.8944660312457062e-05, "loss": 0.0074, "step": 697120 }, { "epoch": 1.81, "learning_rate": 2.8940772096085597e-05, "loss": 0.0054, "step": 697130 }, { "epoch": 1.81, "learning_rate": 2.8936883879714136e-05, "loss": 0.0055, "step": 697140 }, { "epoch": 1.81, "learning_rate": 2.893299566334267e-05, "loss": 0.0064, "step": 697150 }, { "epoch": 1.81, "learning_rate": 2.8929107446971205e-05, "loss": 0.0115, "step": 697160 }, { "epoch": 1.81, "learning_rate": 2.892521923059974e-05, "loss": 0.0075, "step": 697170 }, { "epoch": 1.81, "learning_rate": 2.892133101422828e-05, "loss": 0.0052, "step": 697180 }, { "epoch": 1.81, "learning_rate": 2.8917442797856813e-05, "loss": 0.0078, "step": 697190 }, { "epoch": 1.81, "learning_rate": 2.8913554581485348e-05, "loss": 0.0065, "step": 697200 }, { "epoch": 1.81, "learning_rate": 2.8909666365113883e-05, "loss": 0.0071, "step": 697210 }, { "epoch": 1.81, "learning_rate": 2.890577814874242e-05, "loss": 0.0052, "step": 697220 }, { "epoch": 1.81, "learning_rate": 2.8901889932370956e-05, "loss": 0.0093, "step": 697230 }, { "epoch": 1.81, "learning_rate": 2.889800171599949e-05, "loss": 0.0075, "step": 697240 }, { "epoch": 1.81, "learning_rate": 2.8894113499628022e-05, "loss": 0.0135, "step": 697250 }, { "epoch": 1.81, "learning_rate": 2.8890225283256557e-05, "loss": 0.0079, "step": 697260 }, { "epoch": 1.81, "learning_rate": 2.8886337066885096e-05, "loss": 0.0066, "step": 697270 }, { "epoch": 1.81, "learning_rate": 2.888244885051363e-05, "loss": 0.0062, "step": 697280 }, { "epoch": 1.81, "learning_rate": 2.8878560634142165e-05, "loss": 0.0074, "step": 697290 }, { "epoch": 1.81, "learning_rate": 2.88746724177707e-05, "loss": 0.0064, "step": 697300 }, { "epoch": 1.81, "learning_rate": 2.887078420139924e-05, "loss": 0.0104, "step": 697310 }, { "epoch": 1.81, "learning_rate": 2.8866895985027773e-05, "loss": 0.0066, "step": 697320 }, { "epoch": 1.81, "learning_rate": 2.8863007768656308e-05, "loss": 0.0092, "step": 697330 }, { "epoch": 1.81, "learning_rate": 2.8859119552284843e-05, "loss": 0.0074, "step": 697340 }, { "epoch": 1.81, "learning_rate": 2.885523133591338e-05, "loss": 0.0051, "step": 697350 }, { "epoch": 1.81, "learning_rate": 2.8851343119541916e-05, "loss": 0.0061, "step": 697360 }, { "epoch": 1.81, "learning_rate": 2.8847454903170448e-05, "loss": 0.0082, "step": 697370 }, { "epoch": 1.81, "learning_rate": 2.8843566686798982e-05, "loss": 0.0082, "step": 697380 }, { "epoch": 1.81, "learning_rate": 2.8839678470427517e-05, "loss": 0.0061, "step": 697390 }, { "epoch": 1.81, "learning_rate": 2.8835790254056055e-05, "loss": 0.0071, "step": 697400 }, { "epoch": 1.81, "learning_rate": 2.883190203768459e-05, "loss": 0.0086, "step": 697410 }, { "epoch": 1.81, "learning_rate": 2.8828013821313125e-05, "loss": 0.0071, "step": 697420 }, { "epoch": 1.81, "learning_rate": 2.882412560494166e-05, "loss": 0.0064, "step": 697430 }, { "epoch": 1.81, "learning_rate": 2.88202373885702e-05, "loss": 0.0093, "step": 697440 }, { "epoch": 1.81, "learning_rate": 2.8816349172198733e-05, "loss": 0.0079, "step": 697450 }, { "epoch": 1.81, "learning_rate": 2.8812460955827268e-05, "loss": 0.0094, "step": 697460 }, { "epoch": 1.81, "learning_rate": 2.8808572739455803e-05, "loss": 0.0091, "step": 697470 }, { "epoch": 1.81, "learning_rate": 2.880468452308434e-05, "loss": 0.0076, "step": 697480 }, { "epoch": 1.81, "learning_rate": 2.8800796306712873e-05, "loss": 0.005, "step": 697490 }, { "epoch": 1.81, "learning_rate": 2.8796908090341407e-05, "loss": 0.0099, "step": 697500 }, { "epoch": 1.81, "learning_rate": 2.8793019873969942e-05, "loss": 0.007, "step": 697510 }, { "epoch": 1.81, "learning_rate": 2.8789131657598477e-05, "loss": 0.0109, "step": 697520 }, { "epoch": 1.81, "learning_rate": 2.8785243441227015e-05, "loss": 0.0319, "step": 697530 }, { "epoch": 1.81, "learning_rate": 2.878135522485555e-05, "loss": 0.0065, "step": 697540 }, { "epoch": 1.81, "learning_rate": 2.8777467008484085e-05, "loss": 0.0073, "step": 697550 }, { "epoch": 1.81, "learning_rate": 2.877357879211262e-05, "loss": 0.0058, "step": 697560 }, { "epoch": 1.81, "learning_rate": 2.8769690575741158e-05, "loss": 0.0123, "step": 697570 }, { "epoch": 1.81, "learning_rate": 2.8765802359369693e-05, "loss": 0.0098, "step": 697580 }, { "epoch": 1.81, "learning_rate": 2.8761914142998228e-05, "loss": 0.0076, "step": 697590 }, { "epoch": 1.81, "learning_rate": 2.8758025926626763e-05, "loss": 0.0075, "step": 697600 }, { "epoch": 1.81, "learning_rate": 2.87541377102553e-05, "loss": 0.0059, "step": 697610 }, { "epoch": 1.81, "learning_rate": 2.8750249493883833e-05, "loss": 0.0075, "step": 697620 }, { "epoch": 1.81, "learning_rate": 2.8746361277512367e-05, "loss": 0.0069, "step": 697630 }, { "epoch": 1.81, "learning_rate": 2.8742473061140902e-05, "loss": 0.0081, "step": 697640 }, { "epoch": 1.81, "learning_rate": 2.8738584844769437e-05, "loss": 0.0063, "step": 697650 }, { "epoch": 1.81, "learning_rate": 2.8734696628397975e-05, "loss": 0.0068, "step": 697660 }, { "epoch": 1.81, "learning_rate": 2.873080841202651e-05, "loss": 0.0069, "step": 697670 }, { "epoch": 1.81, "learning_rate": 2.8726920195655045e-05, "loss": 0.0105, "step": 697680 }, { "epoch": 1.81, "learning_rate": 2.872303197928358e-05, "loss": 0.0084, "step": 697690 }, { "epoch": 1.81, "learning_rate": 2.8719143762912118e-05, "loss": 0.0112, "step": 697700 }, { "epoch": 1.81, "learning_rate": 2.8715255546540653e-05, "loss": 0.0093, "step": 697710 }, { "epoch": 1.81, "learning_rate": 2.8711367330169188e-05, "loss": 0.008, "step": 697720 }, { "epoch": 1.81, "learning_rate": 2.8707479113797723e-05, "loss": 0.0122, "step": 697730 }, { "epoch": 1.81, "learning_rate": 2.8703590897426254e-05, "loss": 0.0082, "step": 697740 }, { "epoch": 1.81, "learning_rate": 2.8699702681054793e-05, "loss": 0.0082, "step": 697750 }, { "epoch": 1.81, "learning_rate": 2.8695814464683327e-05, "loss": 0.0069, "step": 697760 }, { "epoch": 1.81, "learning_rate": 2.8691926248311862e-05, "loss": 0.0054, "step": 697770 }, { "epoch": 1.81, "learning_rate": 2.8688038031940397e-05, "loss": 0.0081, "step": 697780 }, { "epoch": 1.81, "learning_rate": 2.8684149815568935e-05, "loss": 0.0068, "step": 697790 }, { "epoch": 1.81, "learning_rate": 2.868026159919747e-05, "loss": 0.0066, "step": 697800 }, { "epoch": 1.81, "learning_rate": 2.8676373382826005e-05, "loss": 0.0066, "step": 697810 }, { "epoch": 1.81, "learning_rate": 2.867248516645454e-05, "loss": 0.0089, "step": 697820 }, { "epoch": 1.81, "learning_rate": 2.8668596950083078e-05, "loss": 0.0086, "step": 697830 }, { "epoch": 1.81, "learning_rate": 2.8664708733711613e-05, "loss": 0.0068, "step": 697840 }, { "epoch": 1.81, "learning_rate": 2.8660820517340148e-05, "loss": 0.0124, "step": 697850 }, { "epoch": 1.81, "learning_rate": 2.8656932300968683e-05, "loss": 0.0119, "step": 697860 }, { "epoch": 1.81, "learning_rate": 2.8653044084597214e-05, "loss": 0.0069, "step": 697870 }, { "epoch": 1.81, "learning_rate": 2.8649155868225753e-05, "loss": 0.0082, "step": 697880 }, { "epoch": 1.81, "learning_rate": 2.8645267651854287e-05, "loss": 0.0058, "step": 697890 }, { "epoch": 1.81, "learning_rate": 2.8641379435482822e-05, "loss": 0.0116, "step": 697900 }, { "epoch": 1.81, "learning_rate": 2.8637491219111357e-05, "loss": 0.0089, "step": 697910 }, { "epoch": 1.81, "learning_rate": 2.8633603002739895e-05, "loss": 0.0063, "step": 697920 }, { "epoch": 1.81, "learning_rate": 2.862971478636843e-05, "loss": 0.0066, "step": 697930 }, { "epoch": 1.81, "learning_rate": 2.8625826569996965e-05, "loss": 0.0056, "step": 697940 }, { "epoch": 1.81, "learning_rate": 2.86219383536255e-05, "loss": 0.0061, "step": 697950 }, { "epoch": 1.81, "learning_rate": 2.8618050137254038e-05, "loss": 0.0073, "step": 697960 }, { "epoch": 1.81, "learning_rate": 2.8614161920882573e-05, "loss": 0.0062, "step": 697970 }, { "epoch": 1.81, "learning_rate": 2.8610273704511108e-05, "loss": 0.0077, "step": 697980 }, { "epoch": 1.81, "learning_rate": 2.860638548813964e-05, "loss": 0.0052, "step": 697990 }, { "epoch": 1.81, "learning_rate": 2.8602497271768174e-05, "loss": 0.0049, "step": 698000 }, { "epoch": 1.81, "eval_cer": 0.8816467008458005, "eval_loss": 0.004819649271667004, "eval_runtime": 107.8195, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.637, "step": 698000 }, { "epoch": 1.81, "learning_rate": 2.8598609055396713e-05, "loss": 0.0071, "step": 698010 }, { "epoch": 1.81, "learning_rate": 2.8594720839025247e-05, "loss": 0.0065, "step": 698020 }, { "epoch": 1.81, "learning_rate": 2.8590832622653782e-05, "loss": 0.0103, "step": 698030 }, { "epoch": 1.81, "learning_rate": 2.8586944406282317e-05, "loss": 0.0074, "step": 698040 }, { "epoch": 1.81, "learning_rate": 2.8583056189910855e-05, "loss": 0.0084, "step": 698050 }, { "epoch": 1.81, "learning_rate": 2.857916797353939e-05, "loss": 0.007, "step": 698060 }, { "epoch": 1.81, "learning_rate": 2.8575279757167925e-05, "loss": 0.0078, "step": 698070 }, { "epoch": 1.81, "learning_rate": 2.857139154079646e-05, "loss": 0.0089, "step": 698080 }, { "epoch": 1.81, "learning_rate": 2.8567503324424995e-05, "loss": 0.0065, "step": 698090 }, { "epoch": 1.81, "learning_rate": 2.8563615108053533e-05, "loss": 0.0052, "step": 698100 }, { "epoch": 1.81, "learning_rate": 2.8559726891682068e-05, "loss": 0.0071, "step": 698110 }, { "epoch": 1.81, "learning_rate": 2.85558386753106e-05, "loss": 0.0076, "step": 698120 }, { "epoch": 1.81, "learning_rate": 2.8551950458939134e-05, "loss": 0.0068, "step": 698130 }, { "epoch": 1.81, "learning_rate": 2.8548062242567673e-05, "loss": 0.0067, "step": 698140 }, { "epoch": 1.81, "learning_rate": 2.8544174026196207e-05, "loss": 0.0105, "step": 698150 }, { "epoch": 1.81, "learning_rate": 2.8540285809824742e-05, "loss": 0.0073, "step": 698160 }, { "epoch": 1.81, "learning_rate": 2.8536397593453277e-05, "loss": 0.009, "step": 698170 }, { "epoch": 1.81, "learning_rate": 2.8532509377081812e-05, "loss": 0.0076, "step": 698180 }, { "epoch": 1.81, "learning_rate": 2.852862116071035e-05, "loss": 0.0103, "step": 698190 }, { "epoch": 1.81, "learning_rate": 2.8524732944338885e-05, "loss": 0.0071, "step": 698200 }, { "epoch": 1.81, "learning_rate": 2.852084472796742e-05, "loss": 0.0078, "step": 698210 }, { "epoch": 1.81, "learning_rate": 2.8516956511595955e-05, "loss": 0.0067, "step": 698220 }, { "epoch": 1.81, "learning_rate": 2.8513068295224493e-05, "loss": 0.009, "step": 698230 }, { "epoch": 1.81, "learning_rate": 2.8509180078853025e-05, "loss": 0.0096, "step": 698240 }, { "epoch": 1.81, "learning_rate": 2.850529186248156e-05, "loss": 0.0082, "step": 698250 }, { "epoch": 1.81, "learning_rate": 2.8501403646110094e-05, "loss": 0.0052, "step": 698260 }, { "epoch": 1.81, "learning_rate": 2.849751542973863e-05, "loss": 0.0048, "step": 698270 }, { "epoch": 1.81, "learning_rate": 2.8493627213367167e-05, "loss": 0.0065, "step": 698280 }, { "epoch": 1.81, "learning_rate": 2.8489738996995702e-05, "loss": 0.0069, "step": 698290 }, { "epoch": 1.81, "learning_rate": 2.8485850780624237e-05, "loss": 0.007, "step": 698300 }, { "epoch": 1.81, "learning_rate": 2.8481962564252772e-05, "loss": 0.0073, "step": 698310 }, { "epoch": 1.81, "learning_rate": 2.847807434788131e-05, "loss": 0.0066, "step": 698320 }, { "epoch": 1.81, "learning_rate": 2.8474186131509845e-05, "loss": 0.0131, "step": 698330 }, { "epoch": 1.81, "learning_rate": 2.847029791513838e-05, "loss": 0.0089, "step": 698340 }, { "epoch": 1.81, "learning_rate": 2.8466409698766915e-05, "loss": 0.0103, "step": 698350 }, { "epoch": 1.81, "learning_rate": 2.8462521482395446e-05, "loss": 0.0066, "step": 698360 }, { "epoch": 1.81, "learning_rate": 2.8458633266023984e-05, "loss": 0.0094, "step": 698370 }, { "epoch": 1.81, "learning_rate": 2.845474504965252e-05, "loss": 0.01, "step": 698380 }, { "epoch": 1.81, "learning_rate": 2.8450856833281054e-05, "loss": 0.0078, "step": 698390 }, { "epoch": 1.81, "learning_rate": 2.844696861690959e-05, "loss": 0.0092, "step": 698400 }, { "epoch": 1.81, "learning_rate": 2.8443080400538127e-05, "loss": 0.0057, "step": 698410 }, { "epoch": 1.81, "learning_rate": 2.8439192184166662e-05, "loss": 0.0057, "step": 698420 }, { "epoch": 1.81, "learning_rate": 2.8435303967795197e-05, "loss": 0.0059, "step": 698430 }, { "epoch": 1.81, "learning_rate": 2.8431415751423732e-05, "loss": 0.0083, "step": 698440 }, { "epoch": 1.81, "learning_rate": 2.842752753505227e-05, "loss": 0.0087, "step": 698450 }, { "epoch": 1.81, "learning_rate": 2.8423639318680805e-05, "loss": 0.0098, "step": 698460 }, { "epoch": 1.81, "learning_rate": 2.841975110230934e-05, "loss": 0.0058, "step": 698470 }, { "epoch": 1.81, "learning_rate": 2.8415862885937875e-05, "loss": 0.0097, "step": 698480 }, { "epoch": 1.81, "learning_rate": 2.8411974669566406e-05, "loss": 0.0066, "step": 698490 }, { "epoch": 1.81, "learning_rate": 2.8408086453194944e-05, "loss": 0.0068, "step": 698500 }, { "epoch": 1.81, "learning_rate": 2.840419823682348e-05, "loss": 0.0073, "step": 698510 }, { "epoch": 1.81, "learning_rate": 2.8400310020452014e-05, "loss": 0.0071, "step": 698520 }, { "epoch": 1.81, "learning_rate": 2.839642180408055e-05, "loss": 0.01, "step": 698530 }, { "epoch": 1.81, "learning_rate": 2.8392533587709087e-05, "loss": 0.0085, "step": 698540 }, { "epoch": 1.81, "learning_rate": 2.8388645371337622e-05, "loss": 0.0088, "step": 698550 }, { "epoch": 1.81, "learning_rate": 2.8384757154966157e-05, "loss": 0.006, "step": 698560 }, { "epoch": 1.81, "learning_rate": 2.8380868938594692e-05, "loss": 0.0073, "step": 698570 }, { "epoch": 1.81, "learning_rate": 2.837698072222323e-05, "loss": 0.009, "step": 698580 }, { "epoch": 1.81, "learning_rate": 2.8373092505851765e-05, "loss": 0.0096, "step": 698590 }, { "epoch": 1.81, "learning_rate": 2.83692042894803e-05, "loss": 0.0067, "step": 698600 }, { "epoch": 1.81, "learning_rate": 2.836531607310883e-05, "loss": 0.0076, "step": 698610 }, { "epoch": 1.81, "learning_rate": 2.8361427856737366e-05, "loss": 0.0061, "step": 698620 }, { "epoch": 1.81, "learning_rate": 2.8357539640365904e-05, "loss": 0.0084, "step": 698630 }, { "epoch": 1.81, "learning_rate": 2.835365142399444e-05, "loss": 0.008, "step": 698640 }, { "epoch": 1.81, "learning_rate": 2.8349763207622974e-05, "loss": 0.0077, "step": 698650 }, { "epoch": 1.81, "learning_rate": 2.834587499125151e-05, "loss": 0.0065, "step": 698660 }, { "epoch": 1.81, "learning_rate": 2.8341986774880047e-05, "loss": 0.0084, "step": 698670 }, { "epoch": 1.81, "learning_rate": 2.8338098558508582e-05, "loss": 0.0069, "step": 698680 }, { "epoch": 1.81, "learning_rate": 2.8334210342137117e-05, "loss": 0.0065, "step": 698690 }, { "epoch": 1.81, "learning_rate": 2.8330322125765652e-05, "loss": 0.0088, "step": 698700 }, { "epoch": 1.81, "learning_rate": 2.832643390939419e-05, "loss": 0.0072, "step": 698710 }, { "epoch": 1.81, "learning_rate": 2.8322545693022725e-05, "loss": 0.0069, "step": 698720 }, { "epoch": 1.81, "learning_rate": 2.831865747665126e-05, "loss": 0.0068, "step": 698730 }, { "epoch": 1.81, "learning_rate": 2.831476926027979e-05, "loss": 0.0082, "step": 698740 }, { "epoch": 1.81, "learning_rate": 2.8310881043908326e-05, "loss": 0.0086, "step": 698750 }, { "epoch": 1.81, "learning_rate": 2.8306992827536864e-05, "loss": 0.0069, "step": 698760 }, { "epoch": 1.81, "learning_rate": 2.83031046111654e-05, "loss": 0.006, "step": 698770 }, { "epoch": 1.81, "learning_rate": 2.8299216394793934e-05, "loss": 0.007, "step": 698780 }, { "epoch": 1.81, "learning_rate": 2.829532817842247e-05, "loss": 0.0062, "step": 698790 }, { "epoch": 1.81, "learning_rate": 2.8291439962051007e-05, "loss": 0.0083, "step": 698800 }, { "epoch": 1.81, "learning_rate": 2.8287551745679542e-05, "loss": 0.0063, "step": 698810 }, { "epoch": 1.81, "learning_rate": 2.8283663529308077e-05, "loss": 0.006, "step": 698820 }, { "epoch": 1.81, "learning_rate": 2.8279775312936612e-05, "loss": 0.0068, "step": 698830 }, { "epoch": 1.81, "learning_rate": 2.827588709656515e-05, "loss": 0.0057, "step": 698840 }, { "epoch": 1.81, "learning_rate": 2.8271998880193685e-05, "loss": 0.0057, "step": 698850 }, { "epoch": 1.81, "learning_rate": 2.8268110663822216e-05, "loss": 0.0071, "step": 698860 }, { "epoch": 1.81, "learning_rate": 2.826422244745075e-05, "loss": 0.0066, "step": 698870 }, { "epoch": 1.81, "learning_rate": 2.8260334231079286e-05, "loss": 0.0078, "step": 698880 }, { "epoch": 1.81, "learning_rate": 2.8256446014707824e-05, "loss": 0.0063, "step": 698890 }, { "epoch": 1.81, "learning_rate": 2.825255779833636e-05, "loss": 0.0072, "step": 698900 }, { "epoch": 1.81, "learning_rate": 2.8248669581964894e-05, "loss": 0.0078, "step": 698910 }, { "epoch": 1.81, "learning_rate": 2.824478136559343e-05, "loss": 0.0069, "step": 698920 }, { "epoch": 1.81, "learning_rate": 2.8240893149221967e-05, "loss": 0.0047, "step": 698930 }, { "epoch": 1.81, "learning_rate": 2.8237004932850502e-05, "loss": 0.0078, "step": 698940 }, { "epoch": 1.81, "learning_rate": 2.8233116716479037e-05, "loss": 0.0082, "step": 698950 }, { "epoch": 1.81, "learning_rate": 2.8229228500107572e-05, "loss": 0.0067, "step": 698960 }, { "epoch": 1.81, "learning_rate": 2.822534028373611e-05, "loss": 0.0062, "step": 698970 }, { "epoch": 1.81, "learning_rate": 2.822145206736464e-05, "loss": 0.0054, "step": 698980 }, { "epoch": 1.81, "learning_rate": 2.8217563850993176e-05, "loss": 0.009, "step": 698990 }, { "epoch": 1.81, "learning_rate": 2.821367563462171e-05, "loss": 0.007, "step": 699000 }, { "epoch": 1.81, "eval_cer": 0.8816564983043399, "eval_loss": 0.004687727894634008, "eval_runtime": 107.7875, "eval_samples_per_second": 18.555, "eval_steps_per_second": 4.639, "step": 699000 }, { "epoch": 1.81, "learning_rate": 2.8209787418250246e-05, "loss": 0.0046, "step": 699010 }, { "epoch": 1.81, "learning_rate": 2.8205899201878784e-05, "loss": 0.0052, "step": 699020 }, { "epoch": 1.81, "learning_rate": 2.820201098550732e-05, "loss": 0.0068, "step": 699030 }, { "epoch": 1.81, "learning_rate": 2.8198122769135854e-05, "loss": 0.0071, "step": 699040 }, { "epoch": 1.81, "learning_rate": 2.819423455276439e-05, "loss": 0.008, "step": 699050 }, { "epoch": 1.81, "learning_rate": 2.8190346336392927e-05, "loss": 0.0079, "step": 699060 }, { "epoch": 1.81, "learning_rate": 2.8186458120021462e-05, "loss": 0.0078, "step": 699070 }, { "epoch": 1.81, "learning_rate": 2.8182569903649997e-05, "loss": 0.0077, "step": 699080 }, { "epoch": 1.81, "learning_rate": 2.8178681687278532e-05, "loss": 0.0068, "step": 699090 }, { "epoch": 1.81, "learning_rate": 2.817479347090707e-05, "loss": 0.0061, "step": 699100 }, { "epoch": 1.81, "learning_rate": 2.81709052545356e-05, "loss": 0.0066, "step": 699110 }, { "epoch": 1.81, "learning_rate": 2.8167017038164136e-05, "loss": 0.0059, "step": 699120 }, { "epoch": 1.81, "learning_rate": 2.816312882179267e-05, "loss": 0.0071, "step": 699130 }, { "epoch": 1.81, "learning_rate": 2.8159240605421206e-05, "loss": 0.008, "step": 699140 }, { "epoch": 1.81, "learning_rate": 2.8155352389049744e-05, "loss": 0.0072, "step": 699150 }, { "epoch": 1.81, "learning_rate": 2.815146417267828e-05, "loss": 0.0059, "step": 699160 }, { "epoch": 1.81, "learning_rate": 2.8147575956306814e-05, "loss": 0.0074, "step": 699170 }, { "epoch": 1.81, "learning_rate": 2.814368773993535e-05, "loss": 0.0082, "step": 699180 }, { "epoch": 1.81, "learning_rate": 2.8139799523563887e-05, "loss": 0.0088, "step": 699190 }, { "epoch": 1.81, "learning_rate": 2.8135911307192422e-05, "loss": 0.0066, "step": 699200 }, { "epoch": 1.81, "learning_rate": 2.8132023090820957e-05, "loss": 0.0084, "step": 699210 }, { "epoch": 1.81, "learning_rate": 2.8128134874449492e-05, "loss": 0.0083, "step": 699220 }, { "epoch": 1.81, "learning_rate": 2.8124246658078023e-05, "loss": 0.0072, "step": 699230 }, { "epoch": 1.81, "learning_rate": 2.812035844170656e-05, "loss": 0.0052, "step": 699240 }, { "epoch": 1.81, "learning_rate": 2.8116470225335096e-05, "loss": 0.0115, "step": 699250 }, { "epoch": 1.81, "learning_rate": 2.811258200896363e-05, "loss": 0.0097, "step": 699260 }, { "epoch": 1.81, "learning_rate": 2.8108693792592166e-05, "loss": 0.0079, "step": 699270 }, { "epoch": 1.81, "learning_rate": 2.8104805576220704e-05, "loss": 0.009, "step": 699280 }, { "epoch": 1.81, "learning_rate": 2.810091735984924e-05, "loss": 0.0074, "step": 699290 }, { "epoch": 1.81, "learning_rate": 2.8097029143477774e-05, "loss": 0.0067, "step": 699300 }, { "epoch": 1.81, "learning_rate": 2.809314092710631e-05, "loss": 0.0059, "step": 699310 }, { "epoch": 1.81, "learning_rate": 2.8089252710734847e-05, "loss": 0.0089, "step": 699320 }, { "epoch": 1.81, "learning_rate": 2.8085364494363382e-05, "loss": 0.0062, "step": 699330 }, { "epoch": 1.81, "learning_rate": 2.8081476277991917e-05, "loss": 0.0114, "step": 699340 }, { "epoch": 1.81, "learning_rate": 2.8077588061620452e-05, "loss": 0.0053, "step": 699350 }, { "epoch": 1.81, "learning_rate": 2.8073699845248983e-05, "loss": 0.0069, "step": 699360 }, { "epoch": 1.81, "learning_rate": 2.806981162887752e-05, "loss": 0.0119, "step": 699370 }, { "epoch": 1.81, "learning_rate": 2.8065923412506056e-05, "loss": 0.006, "step": 699380 }, { "epoch": 1.81, "learning_rate": 2.806203519613459e-05, "loss": 0.0059, "step": 699390 }, { "epoch": 1.81, "learning_rate": 2.8058146979763126e-05, "loss": 0.0079, "step": 699400 }, { "epoch": 1.81, "learning_rate": 2.8054258763391664e-05, "loss": 0.0083, "step": 699410 }, { "epoch": 1.81, "learning_rate": 2.80503705470202e-05, "loss": 0.0065, "step": 699420 }, { "epoch": 1.81, "learning_rate": 2.8046482330648734e-05, "loss": 0.0092, "step": 699430 }, { "epoch": 1.81, "learning_rate": 2.804259411427727e-05, "loss": 0.0063, "step": 699440 }, { "epoch": 1.81, "learning_rate": 2.8038705897905807e-05, "loss": 0.0059, "step": 699450 }, { "epoch": 1.81, "learning_rate": 2.8034817681534342e-05, "loss": 0.0064, "step": 699460 }, { "epoch": 1.81, "learning_rate": 2.8030929465162877e-05, "loss": 0.0086, "step": 699470 }, { "epoch": 1.81, "learning_rate": 2.802704124879141e-05, "loss": 0.0096, "step": 699480 }, { "epoch": 1.81, "learning_rate": 2.8023153032419943e-05, "loss": 0.0074, "step": 699490 }, { "epoch": 1.81, "learning_rate": 2.801926481604848e-05, "loss": 0.0046, "step": 699500 }, { "epoch": 1.81, "learning_rate": 2.8015376599677016e-05, "loss": 0.0061, "step": 699510 }, { "epoch": 1.81, "learning_rate": 2.801148838330555e-05, "loss": 0.009, "step": 699520 }, { "epoch": 1.81, "learning_rate": 2.8007600166934086e-05, "loss": 0.0069, "step": 699530 }, { "epoch": 1.81, "learning_rate": 2.800371195056262e-05, "loss": 0.0065, "step": 699540 }, { "epoch": 1.81, "learning_rate": 2.799982373419116e-05, "loss": 0.0061, "step": 699550 }, { "epoch": 1.81, "learning_rate": 2.7995935517819694e-05, "loss": 0.0067, "step": 699560 }, { "epoch": 1.81, "learning_rate": 2.799204730144823e-05, "loss": 0.008, "step": 699570 }, { "epoch": 1.81, "learning_rate": 2.7988159085076764e-05, "loss": 0.005, "step": 699580 }, { "epoch": 1.81, "learning_rate": 2.7984270868705302e-05, "loss": 0.0113, "step": 699590 }, { "epoch": 1.81, "learning_rate": 2.7980382652333833e-05, "loss": 0.006, "step": 699600 }, { "epoch": 1.81, "learning_rate": 2.797649443596237e-05, "loss": 0.0089, "step": 699610 }, { "epoch": 1.81, "learning_rate": 2.7972606219590903e-05, "loss": 0.0054, "step": 699620 }, { "epoch": 1.81, "learning_rate": 2.7968718003219438e-05, "loss": 0.0101, "step": 699630 }, { "epoch": 1.81, "learning_rate": 2.7964829786847976e-05, "loss": 0.0075, "step": 699640 }, { "epoch": 1.81, "learning_rate": 2.796094157047651e-05, "loss": 0.0085, "step": 699650 }, { "epoch": 1.81, "learning_rate": 2.7957053354105046e-05, "loss": 0.0078, "step": 699660 }, { "epoch": 1.81, "learning_rate": 2.795316513773358e-05, "loss": 0.0078, "step": 699670 }, { "epoch": 1.81, "learning_rate": 2.794927692136212e-05, "loss": 0.0081, "step": 699680 }, { "epoch": 1.81, "learning_rate": 2.7945388704990654e-05, "loss": 0.008, "step": 699690 }, { "epoch": 1.81, "learning_rate": 2.794150048861919e-05, "loss": 0.006, "step": 699700 }, { "epoch": 1.81, "learning_rate": 2.7937612272247724e-05, "loss": 0.0071, "step": 699710 }, { "epoch": 1.81, "learning_rate": 2.7933724055876262e-05, "loss": 0.006, "step": 699720 }, { "epoch": 1.81, "learning_rate": 2.7929835839504793e-05, "loss": 0.0096, "step": 699730 }, { "epoch": 1.81, "learning_rate": 2.7925947623133328e-05, "loss": 0.0067, "step": 699740 }, { "epoch": 1.81, "learning_rate": 2.7922059406761863e-05, "loss": 0.0067, "step": 699750 }, { "epoch": 1.81, "learning_rate": 2.7918171190390398e-05, "loss": 0.0053, "step": 699760 }, { "epoch": 1.81, "learning_rate": 2.7914282974018936e-05, "loss": 0.0068, "step": 699770 }, { "epoch": 1.81, "learning_rate": 2.791039475764747e-05, "loss": 0.0063, "step": 699780 }, { "epoch": 1.81, "learning_rate": 2.7906506541276006e-05, "loss": 0.0068, "step": 699790 }, { "epoch": 1.81, "learning_rate": 2.790261832490454e-05, "loss": 0.006, "step": 699800 }, { "epoch": 1.81, "learning_rate": 2.789873010853308e-05, "loss": 0.0075, "step": 699810 }, { "epoch": 1.81, "learning_rate": 2.7894841892161614e-05, "loss": 0.007, "step": 699820 }, { "epoch": 1.81, "learning_rate": 2.789095367579015e-05, "loss": 0.0091, "step": 699830 }, { "epoch": 1.81, "learning_rate": 2.7887065459418684e-05, "loss": 0.0078, "step": 699840 }, { "epoch": 1.81, "learning_rate": 2.7883177243047215e-05, "loss": 0.0066, "step": 699850 }, { "epoch": 1.81, "learning_rate": 2.7879289026675753e-05, "loss": 0.0091, "step": 699860 }, { "epoch": 1.81, "learning_rate": 2.7875400810304288e-05, "loss": 0.0064, "step": 699870 }, { "epoch": 1.81, "learning_rate": 2.7871512593932823e-05, "loss": 0.0096, "step": 699880 }, { "epoch": 1.81, "learning_rate": 2.7867624377561358e-05, "loss": 0.0068, "step": 699890 }, { "epoch": 1.81, "learning_rate": 2.7863736161189896e-05, "loss": 0.0061, "step": 699900 }, { "epoch": 1.81, "learning_rate": 2.785984794481843e-05, "loss": 0.0062, "step": 699910 }, { "epoch": 1.81, "learning_rate": 2.7855959728446966e-05, "loss": 0.0072, "step": 699920 }, { "epoch": 1.81, "learning_rate": 2.78520715120755e-05, "loss": 0.0057, "step": 699930 }, { "epoch": 1.81, "learning_rate": 2.784818329570404e-05, "loss": 0.0067, "step": 699940 }, { "epoch": 1.81, "learning_rate": 2.7844295079332574e-05, "loss": 0.0077, "step": 699950 }, { "epoch": 1.81, "learning_rate": 2.784040686296111e-05, "loss": 0.0087, "step": 699960 }, { "epoch": 1.81, "learning_rate": 2.7836518646589644e-05, "loss": 0.0066, "step": 699970 }, { "epoch": 1.81, "learning_rate": 2.7832630430218175e-05, "loss": 0.007, "step": 699980 }, { "epoch": 1.81, "learning_rate": 2.7828742213846713e-05, "loss": 0.0084, "step": 699990 }, { "epoch": 1.81, "learning_rate": 2.7824853997475248e-05, "loss": 0.0151, "step": 700000 }, { "epoch": 1.81, "eval_cer": 0.88167329394755, "eval_loss": 0.004671318922191858, "eval_runtime": 107.97, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 700000 }, { "epoch": 1.81, "learning_rate": 2.7820965781103783e-05, "loss": 0.0065, "step": 700010 }, { "epoch": 1.81, "learning_rate": 2.7817077564732318e-05, "loss": 0.007, "step": 700020 }, { "epoch": 1.81, "learning_rate": 2.7813189348360856e-05, "loss": 0.0085, "step": 700030 }, { "epoch": 1.81, "learning_rate": 2.780930113198939e-05, "loss": 0.008, "step": 700040 }, { "epoch": 1.81, "learning_rate": 2.7805412915617926e-05, "loss": 0.0107, "step": 700050 }, { "epoch": 1.81, "learning_rate": 2.780152469924646e-05, "loss": 0.0078, "step": 700060 }, { "epoch": 1.81, "learning_rate": 2.7797636482875e-05, "loss": 0.0056, "step": 700070 }, { "epoch": 1.81, "learning_rate": 2.7793748266503534e-05, "loss": 0.0058, "step": 700080 }, { "epoch": 1.81, "learning_rate": 2.778986005013207e-05, "loss": 0.0086, "step": 700090 }, { "epoch": 1.81, "learning_rate": 2.77859718337606e-05, "loss": 0.0075, "step": 700100 }, { "epoch": 1.81, "learning_rate": 2.7782083617389135e-05, "loss": 0.0072, "step": 700110 }, { "epoch": 1.81, "learning_rate": 2.7778195401017673e-05, "loss": 0.0071, "step": 700120 }, { "epoch": 1.81, "learning_rate": 2.7774307184646208e-05, "loss": 0.0101, "step": 700130 }, { "epoch": 1.81, "learning_rate": 2.7770418968274743e-05, "loss": 0.0056, "step": 700140 }, { "epoch": 1.81, "learning_rate": 2.7766530751903278e-05, "loss": 0.0063, "step": 700150 }, { "epoch": 1.81, "learning_rate": 2.7762642535531816e-05, "loss": 0.006, "step": 700160 }, { "epoch": 1.81, "learning_rate": 2.775875431916035e-05, "loss": 0.0072, "step": 700170 }, { "epoch": 1.81, "learning_rate": 2.7754866102788886e-05, "loss": 0.0081, "step": 700180 }, { "epoch": 1.81, "learning_rate": 2.775097788641742e-05, "loss": 0.0066, "step": 700190 }, { "epoch": 1.82, "learning_rate": 2.774708967004596e-05, "loss": 0.007, "step": 700200 }, { "epoch": 1.82, "learning_rate": 2.7743201453674494e-05, "loss": 0.0076, "step": 700210 }, { "epoch": 1.82, "learning_rate": 2.7739313237303025e-05, "loss": 0.0098, "step": 700220 }, { "epoch": 1.82, "learning_rate": 2.773542502093156e-05, "loss": 0.0065, "step": 700230 }, { "epoch": 1.82, "learning_rate": 2.7731536804560095e-05, "loss": 0.0074, "step": 700240 }, { "epoch": 1.82, "learning_rate": 2.7727648588188633e-05, "loss": 0.0077, "step": 700250 }, { "epoch": 1.82, "learning_rate": 2.7723760371817168e-05, "loss": 0.008, "step": 700260 }, { "epoch": 1.82, "learning_rate": 2.7719872155445703e-05, "loss": 0.0071, "step": 700270 }, { "epoch": 1.82, "learning_rate": 2.7715983939074238e-05, "loss": 0.0062, "step": 700280 }, { "epoch": 1.82, "learning_rate": 2.7712095722702776e-05, "loss": 0.0071, "step": 700290 }, { "epoch": 1.82, "learning_rate": 2.770820750633131e-05, "loss": 0.0087, "step": 700300 }, { "epoch": 1.82, "learning_rate": 2.7704319289959846e-05, "loss": 0.007, "step": 700310 }, { "epoch": 1.82, "learning_rate": 2.770043107358838e-05, "loss": 0.009, "step": 700320 }, { "epoch": 1.82, "learning_rate": 2.769654285721692e-05, "loss": 0.0089, "step": 700330 }, { "epoch": 1.82, "learning_rate": 2.7692654640845454e-05, "loss": 0.0073, "step": 700340 }, { "epoch": 1.82, "learning_rate": 2.7688766424473985e-05, "loss": 0.008, "step": 700350 }, { "epoch": 1.82, "learning_rate": 2.768487820810252e-05, "loss": 0.0068, "step": 700360 }, { "epoch": 1.82, "learning_rate": 2.7680989991731055e-05, "loss": 0.0068, "step": 700370 }, { "epoch": 1.82, "learning_rate": 2.7677101775359593e-05, "loss": 0.0074, "step": 700380 }, { "epoch": 1.82, "learning_rate": 2.7673213558988128e-05, "loss": 0.0075, "step": 700390 }, { "epoch": 1.82, "learning_rate": 2.7669325342616663e-05, "loss": 0.008, "step": 700400 }, { "epoch": 1.82, "learning_rate": 2.7665437126245198e-05, "loss": 0.0074, "step": 700410 }, { "epoch": 1.82, "learning_rate": 2.7661548909873736e-05, "loss": 0.0056, "step": 700420 }, { "epoch": 1.82, "learning_rate": 2.765766069350227e-05, "loss": 0.0071, "step": 700430 }, { "epoch": 1.82, "learning_rate": 2.7653772477130806e-05, "loss": 0.0064, "step": 700440 }, { "epoch": 1.82, "learning_rate": 2.764988426075934e-05, "loss": 0.005, "step": 700450 }, { "epoch": 1.82, "learning_rate": 2.764599604438788e-05, "loss": 0.0098, "step": 700460 }, { "epoch": 1.82, "learning_rate": 2.764210782801641e-05, "loss": 0.0063, "step": 700470 }, { "epoch": 1.82, "learning_rate": 2.7638219611644945e-05, "loss": 0.0069, "step": 700480 }, { "epoch": 1.82, "learning_rate": 2.763433139527348e-05, "loss": 0.0083, "step": 700490 }, { "epoch": 1.82, "learning_rate": 2.7630443178902015e-05, "loss": 0.0069, "step": 700500 }, { "epoch": 1.82, "learning_rate": 2.7626554962530553e-05, "loss": 0.0093, "step": 700510 }, { "epoch": 1.82, "learning_rate": 2.7622666746159088e-05, "loss": 0.0071, "step": 700520 }, { "epoch": 1.82, "learning_rate": 2.7618778529787623e-05, "loss": 0.0076, "step": 700530 }, { "epoch": 1.82, "learning_rate": 2.7614890313416158e-05, "loss": 0.0067, "step": 700540 }, { "epoch": 1.82, "learning_rate": 2.7611002097044696e-05, "loss": 0.0078, "step": 700550 }, { "epoch": 1.82, "learning_rate": 2.760711388067323e-05, "loss": 0.0116, "step": 700560 }, { "epoch": 1.82, "learning_rate": 2.7603225664301766e-05, "loss": 0.0048, "step": 700570 }, { "epoch": 1.82, "learning_rate": 2.75993374479303e-05, "loss": 0.0077, "step": 700580 }, { "epoch": 1.82, "learning_rate": 2.759544923155884e-05, "loss": 0.0073, "step": 700590 }, { "epoch": 1.82, "learning_rate": 2.759156101518737e-05, "loss": 0.0086, "step": 700600 }, { "epoch": 1.82, "learning_rate": 2.7587672798815905e-05, "loss": 0.0069, "step": 700610 }, { "epoch": 1.82, "learning_rate": 2.758378458244444e-05, "loss": 0.0063, "step": 700620 }, { "epoch": 1.82, "learning_rate": 2.7579896366072975e-05, "loss": 0.0084, "step": 700630 }, { "epoch": 1.82, "learning_rate": 2.7576008149701513e-05, "loss": 0.0053, "step": 700640 }, { "epoch": 1.82, "learning_rate": 2.7572119933330048e-05, "loss": 0.009, "step": 700650 }, { "epoch": 1.82, "learning_rate": 2.7568231716958583e-05, "loss": 0.0064, "step": 700660 }, { "epoch": 1.82, "learning_rate": 2.7564343500587118e-05, "loss": 0.0086, "step": 700670 }, { "epoch": 1.82, "learning_rate": 2.7560455284215656e-05, "loss": 0.0101, "step": 700680 }, { "epoch": 1.82, "learning_rate": 2.755656706784419e-05, "loss": 0.0077, "step": 700690 }, { "epoch": 1.82, "learning_rate": 2.7552678851472726e-05, "loss": 0.0074, "step": 700700 }, { "epoch": 1.82, "learning_rate": 2.754879063510126e-05, "loss": 0.0067, "step": 700710 }, { "epoch": 1.82, "learning_rate": 2.7544902418729792e-05, "loss": 0.0074, "step": 700720 }, { "epoch": 1.82, "learning_rate": 2.754101420235833e-05, "loss": 0.0058, "step": 700730 }, { "epoch": 1.82, "learning_rate": 2.7537125985986865e-05, "loss": 0.007, "step": 700740 }, { "epoch": 1.82, "learning_rate": 2.75332377696154e-05, "loss": 0.0078, "step": 700750 }, { "epoch": 1.82, "learning_rate": 2.7529349553243935e-05, "loss": 0.0054, "step": 700760 }, { "epoch": 1.82, "learning_rate": 2.7525461336872473e-05, "loss": 0.0077, "step": 700770 }, { "epoch": 1.82, "learning_rate": 2.7521573120501008e-05, "loss": 0.0056, "step": 700780 }, { "epoch": 1.82, "learning_rate": 2.7517684904129543e-05, "loss": 0.0094, "step": 700790 }, { "epoch": 1.82, "learning_rate": 2.7513796687758078e-05, "loss": 0.0066, "step": 700800 }, { "epoch": 1.82, "learning_rate": 2.7509908471386616e-05, "loss": 0.0066, "step": 700810 }, { "epoch": 1.82, "learning_rate": 2.750602025501515e-05, "loss": 0.0067, "step": 700820 }, { "epoch": 1.82, "learning_rate": 2.7502132038643686e-05, "loss": 0.0104, "step": 700830 }, { "epoch": 1.82, "learning_rate": 2.7498243822272217e-05, "loss": 0.0075, "step": 700840 }, { "epoch": 1.82, "learning_rate": 2.7494355605900752e-05, "loss": 0.0081, "step": 700850 }, { "epoch": 1.82, "learning_rate": 2.749046738952929e-05, "loss": 0.0086, "step": 700860 }, { "epoch": 1.82, "learning_rate": 2.7486579173157825e-05, "loss": 0.0087, "step": 700870 }, { "epoch": 1.82, "learning_rate": 2.748269095678636e-05, "loss": 0.0052, "step": 700880 }, { "epoch": 1.82, "learning_rate": 2.7478802740414895e-05, "loss": 0.0082, "step": 700890 }, { "epoch": 1.82, "learning_rate": 2.7474914524043433e-05, "loss": 0.0059, "step": 700900 }, { "epoch": 1.82, "learning_rate": 2.7471026307671968e-05, "loss": 0.0096, "step": 700910 }, { "epoch": 1.82, "learning_rate": 2.7467138091300503e-05, "loss": 0.0057, "step": 700920 }, { "epoch": 1.82, "learning_rate": 2.7463249874929038e-05, "loss": 0.0095, "step": 700930 }, { "epoch": 1.82, "learning_rate": 2.7459361658557573e-05, "loss": 0.0105, "step": 700940 }, { "epoch": 1.82, "learning_rate": 2.745547344218611e-05, "loss": 0.0063, "step": 700950 }, { "epoch": 1.82, "learning_rate": 2.7451585225814646e-05, "loss": 0.01, "step": 700960 }, { "epoch": 1.82, "learning_rate": 2.7447697009443177e-05, "loss": 0.0058, "step": 700970 }, { "epoch": 1.82, "learning_rate": 2.7443808793071712e-05, "loss": 0.0057, "step": 700980 }, { "epoch": 1.82, "learning_rate": 2.7439920576700247e-05, "loss": 0.0089, "step": 700990 }, { "epoch": 1.82, "learning_rate": 2.7436032360328785e-05, "loss": 0.0071, "step": 701000 }, { "epoch": 1.82, "eval_cer": 0.8816704946736816, "eval_loss": 0.0047097280621528625, "eval_runtime": 107.7701, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.64, "step": 701000 }, { "epoch": 1.82, "learning_rate": 2.743214414395732e-05, "loss": 0.0093, "step": 701010 }, { "epoch": 1.82, "learning_rate": 2.7428255927585855e-05, "loss": 0.0052, "step": 701020 }, { "epoch": 1.82, "learning_rate": 2.742436771121439e-05, "loss": 0.0073, "step": 701030 }, { "epoch": 1.82, "learning_rate": 2.7420479494842928e-05, "loss": 0.004, "step": 701040 }, { "epoch": 1.82, "learning_rate": 2.7416591278471463e-05, "loss": 0.0088, "step": 701050 }, { "epoch": 1.82, "learning_rate": 2.7412703062099998e-05, "loss": 0.0077, "step": 701060 }, { "epoch": 1.82, "learning_rate": 2.7408814845728533e-05, "loss": 0.0071, "step": 701070 }, { "epoch": 1.82, "learning_rate": 2.740492662935707e-05, "loss": 0.007, "step": 701080 }, { "epoch": 1.82, "learning_rate": 2.7401038412985602e-05, "loss": 0.0057, "step": 701090 }, { "epoch": 1.82, "learning_rate": 2.7397150196614137e-05, "loss": 0.0064, "step": 701100 }, { "epoch": 1.82, "learning_rate": 2.7393261980242672e-05, "loss": 0.008, "step": 701110 }, { "epoch": 1.82, "learning_rate": 2.7389373763871207e-05, "loss": 0.0078, "step": 701120 }, { "epoch": 1.82, "learning_rate": 2.7385485547499745e-05, "loss": 0.0082, "step": 701130 }, { "epoch": 1.82, "learning_rate": 2.738159733112828e-05, "loss": 0.0068, "step": 701140 }, { "epoch": 1.82, "learning_rate": 2.7377709114756815e-05, "loss": 0.0072, "step": 701150 }, { "epoch": 1.82, "learning_rate": 2.737382089838535e-05, "loss": 0.0077, "step": 701160 }, { "epoch": 1.82, "learning_rate": 2.7369932682013888e-05, "loss": 0.007, "step": 701170 }, { "epoch": 1.82, "learning_rate": 2.7366044465642423e-05, "loss": 0.0107, "step": 701180 }, { "epoch": 1.82, "learning_rate": 2.7362156249270958e-05, "loss": 0.0069, "step": 701190 }, { "epoch": 1.82, "learning_rate": 2.7358268032899493e-05, "loss": 0.0089, "step": 701200 }, { "epoch": 1.82, "learning_rate": 2.735437981652803e-05, "loss": 0.0071, "step": 701210 }, { "epoch": 1.82, "learning_rate": 2.7350491600156562e-05, "loss": 0.0068, "step": 701220 }, { "epoch": 1.82, "learning_rate": 2.7346603383785097e-05, "loss": 0.0094, "step": 701230 }, { "epoch": 1.82, "learning_rate": 2.7342715167413632e-05, "loss": 0.0094, "step": 701240 }, { "epoch": 1.82, "learning_rate": 2.7338826951042167e-05, "loss": 0.0063, "step": 701250 }, { "epoch": 1.82, "learning_rate": 2.7334938734670705e-05, "loss": 0.0073, "step": 701260 }, { "epoch": 1.82, "learning_rate": 2.733105051829924e-05, "loss": 0.0062, "step": 701270 }, { "epoch": 1.82, "learning_rate": 2.7327162301927775e-05, "loss": 0.0089, "step": 701280 }, { "epoch": 1.82, "learning_rate": 2.732327408555631e-05, "loss": 0.0074, "step": 701290 }, { "epoch": 1.82, "learning_rate": 2.7319385869184848e-05, "loss": 0.0062, "step": 701300 }, { "epoch": 1.82, "learning_rate": 2.7315497652813383e-05, "loss": 0.0063, "step": 701310 }, { "epoch": 1.82, "learning_rate": 2.7311609436441918e-05, "loss": 0.0062, "step": 701320 }, { "epoch": 1.82, "learning_rate": 2.7307721220070453e-05, "loss": 0.0061, "step": 701330 }, { "epoch": 1.82, "learning_rate": 2.7303833003698984e-05, "loss": 0.0088, "step": 701340 }, { "epoch": 1.82, "learning_rate": 2.7299944787327522e-05, "loss": 0.0075, "step": 701350 }, { "epoch": 1.82, "learning_rate": 2.7296056570956057e-05, "loss": 0.0071, "step": 701360 }, { "epoch": 1.82, "learning_rate": 2.7292168354584592e-05, "loss": 0.0054, "step": 701370 }, { "epoch": 1.82, "learning_rate": 2.7288280138213127e-05, "loss": 0.0126, "step": 701380 }, { "epoch": 1.82, "learning_rate": 2.7284391921841665e-05, "loss": 0.0069, "step": 701390 }, { "epoch": 1.82, "learning_rate": 2.72805037054702e-05, "loss": 0.0065, "step": 701400 }, { "epoch": 1.82, "learning_rate": 2.7276615489098735e-05, "loss": 0.0071, "step": 701410 }, { "epoch": 1.82, "learning_rate": 2.727272727272727e-05, "loss": 0.0075, "step": 701420 }, { "epoch": 1.82, "learning_rate": 2.7268839056355808e-05, "loss": 0.0131, "step": 701430 }, { "epoch": 1.82, "learning_rate": 2.7264950839984343e-05, "loss": 0.0075, "step": 701440 }, { "epoch": 1.82, "learning_rate": 2.7261062623612878e-05, "loss": 0.0078, "step": 701450 }, { "epoch": 1.82, "learning_rate": 2.725717440724141e-05, "loss": 0.0069, "step": 701460 }, { "epoch": 1.82, "learning_rate": 2.7253286190869944e-05, "loss": 0.0084, "step": 701470 }, { "epoch": 1.82, "learning_rate": 2.7249397974498482e-05, "loss": 0.0061, "step": 701480 }, { "epoch": 1.82, "learning_rate": 2.7245509758127017e-05, "loss": 0.0073, "step": 701490 }, { "epoch": 1.82, "learning_rate": 2.7241621541755552e-05, "loss": 0.0086, "step": 701500 }, { "epoch": 1.82, "learning_rate": 2.7237733325384087e-05, "loss": 0.0058, "step": 701510 }, { "epoch": 1.82, "learning_rate": 2.7233845109012625e-05, "loss": 0.0071, "step": 701520 }, { "epoch": 1.82, "learning_rate": 2.722995689264116e-05, "loss": 0.0049, "step": 701530 }, { "epoch": 1.82, "learning_rate": 2.7226068676269695e-05, "loss": 0.0067, "step": 701540 }, { "epoch": 1.82, "learning_rate": 2.722218045989823e-05, "loss": 0.0106, "step": 701550 }, { "epoch": 1.82, "learning_rate": 2.7218292243526768e-05, "loss": 0.0057, "step": 701560 }, { "epoch": 1.82, "learning_rate": 2.7214404027155303e-05, "loss": 0.01, "step": 701570 }, { "epoch": 1.82, "learning_rate": 2.7210515810783838e-05, "loss": 0.0082, "step": 701580 }, { "epoch": 1.82, "learning_rate": 2.720662759441237e-05, "loss": 0.0071, "step": 701590 }, { "epoch": 1.82, "learning_rate": 2.7202739378040904e-05, "loss": 0.0074, "step": 701600 }, { "epoch": 1.82, "learning_rate": 2.7198851161669442e-05, "loss": 0.0089, "step": 701610 }, { "epoch": 1.82, "learning_rate": 2.7194962945297977e-05, "loss": 0.0082, "step": 701620 }, { "epoch": 1.82, "learning_rate": 2.7191074728926512e-05, "loss": 0.0057, "step": 701630 }, { "epoch": 1.82, "learning_rate": 2.7187186512555047e-05, "loss": 0.0075, "step": 701640 }, { "epoch": 1.82, "learning_rate": 2.7183298296183585e-05, "loss": 0.0063, "step": 701650 }, { "epoch": 1.82, "learning_rate": 2.717941007981212e-05, "loss": 0.0075, "step": 701660 }, { "epoch": 1.82, "learning_rate": 2.7175521863440655e-05, "loss": 0.0076, "step": 701670 }, { "epoch": 1.82, "learning_rate": 2.717163364706919e-05, "loss": 0.0098, "step": 701680 }, { "epoch": 1.82, "learning_rate": 2.7167745430697728e-05, "loss": 0.0097, "step": 701690 }, { "epoch": 1.82, "learning_rate": 2.7163857214326263e-05, "loss": 0.008, "step": 701700 }, { "epoch": 1.82, "learning_rate": 2.7159968997954794e-05, "loss": 0.0054, "step": 701710 }, { "epoch": 1.82, "learning_rate": 2.715608078158333e-05, "loss": 0.0062, "step": 701720 }, { "epoch": 1.82, "learning_rate": 2.7152192565211864e-05, "loss": 0.0065, "step": 701730 }, { "epoch": 1.82, "learning_rate": 2.7148304348840402e-05, "loss": 0.011, "step": 701740 }, { "epoch": 1.82, "learning_rate": 2.7144416132468937e-05, "loss": 0.0068, "step": 701750 }, { "epoch": 1.82, "learning_rate": 2.7140527916097472e-05, "loss": 0.0066, "step": 701760 }, { "epoch": 1.82, "learning_rate": 2.7136639699726007e-05, "loss": 0.0081, "step": 701770 }, { "epoch": 1.82, "learning_rate": 2.7132751483354545e-05, "loss": 0.0058, "step": 701780 }, { "epoch": 1.82, "learning_rate": 2.712886326698308e-05, "loss": 0.0081, "step": 701790 }, { "epoch": 1.82, "learning_rate": 2.7124975050611615e-05, "loss": 0.008, "step": 701800 }, { "epoch": 1.82, "learning_rate": 2.712108683424015e-05, "loss": 0.008, "step": 701810 }, { "epoch": 1.82, "learning_rate": 2.7117198617868688e-05, "loss": 0.0056, "step": 701820 }, { "epoch": 1.82, "learning_rate": 2.7113310401497223e-05, "loss": 0.0082, "step": 701830 }, { "epoch": 1.82, "learning_rate": 2.7109422185125754e-05, "loss": 0.0066, "step": 701840 }, { "epoch": 1.82, "learning_rate": 2.710553396875429e-05, "loss": 0.005, "step": 701850 }, { "epoch": 1.82, "learning_rate": 2.7101645752382824e-05, "loss": 0.0055, "step": 701860 }, { "epoch": 1.82, "learning_rate": 2.7097757536011362e-05, "loss": 0.0083, "step": 701870 }, { "epoch": 1.82, "learning_rate": 2.7093869319639897e-05, "loss": 0.0067, "step": 701880 }, { "epoch": 1.82, "learning_rate": 2.7089981103268432e-05, "loss": 0.0079, "step": 701890 }, { "epoch": 1.82, "learning_rate": 2.7086092886896967e-05, "loss": 0.0091, "step": 701900 }, { "epoch": 1.82, "learning_rate": 2.7082204670525505e-05, "loss": 0.0086, "step": 701910 }, { "epoch": 1.82, "learning_rate": 2.707831645415404e-05, "loss": 0.0077, "step": 701920 }, { "epoch": 1.82, "learning_rate": 2.7074428237782575e-05, "loss": 0.0082, "step": 701930 }, { "epoch": 1.82, "learning_rate": 2.707054002141111e-05, "loss": 0.0087, "step": 701940 }, { "epoch": 1.82, "learning_rate": 2.7066651805039648e-05, "loss": 0.0089, "step": 701950 }, { "epoch": 1.82, "learning_rate": 2.706276358866818e-05, "loss": 0.0074, "step": 701960 }, { "epoch": 1.82, "learning_rate": 2.7058875372296714e-05, "loss": 0.007, "step": 701970 }, { "epoch": 1.82, "learning_rate": 2.705498715592525e-05, "loss": 0.0049, "step": 701980 }, { "epoch": 1.82, "learning_rate": 2.7051098939553784e-05, "loss": 0.0074, "step": 701990 }, { "epoch": 1.82, "learning_rate": 2.7047210723182322e-05, "loss": 0.0054, "step": 702000 }, { "epoch": 1.82, "eval_cer": 0.8816662957628791, "eval_loss": 0.004621751606464386, "eval_runtime": 107.8759, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 702000 }, { "epoch": 1.82, "learning_rate": 2.7043322506810857e-05, "loss": 0.0067, "step": 702010 }, { "epoch": 1.82, "learning_rate": 2.7039434290439392e-05, "loss": 0.0087, "step": 702020 }, { "epoch": 1.82, "learning_rate": 2.7035546074067927e-05, "loss": 0.01, "step": 702030 }, { "epoch": 1.82, "learning_rate": 2.7031657857696465e-05, "loss": 0.0076, "step": 702040 }, { "epoch": 1.82, "learning_rate": 2.7027769641325e-05, "loss": 0.0104, "step": 702050 }, { "epoch": 1.82, "learning_rate": 2.7023881424953535e-05, "loss": 0.0057, "step": 702060 }, { "epoch": 1.82, "learning_rate": 2.701999320858207e-05, "loss": 0.0092, "step": 702070 }, { "epoch": 1.82, "learning_rate": 2.70161049922106e-05, "loss": 0.0079, "step": 702080 }, { "epoch": 1.82, "learning_rate": 2.701221677583914e-05, "loss": 0.0052, "step": 702090 }, { "epoch": 1.82, "learning_rate": 2.7008328559467674e-05, "loss": 0.0057, "step": 702100 }, { "epoch": 1.82, "learning_rate": 2.700444034309621e-05, "loss": 0.008, "step": 702110 }, { "epoch": 1.82, "learning_rate": 2.7000552126724744e-05, "loss": 0.008, "step": 702120 }, { "epoch": 1.82, "learning_rate": 2.6996663910353282e-05, "loss": 0.0093, "step": 702130 }, { "epoch": 1.82, "learning_rate": 2.6992775693981817e-05, "loss": 0.0076, "step": 702140 }, { "epoch": 1.82, "learning_rate": 2.6988887477610352e-05, "loss": 0.0077, "step": 702150 }, { "epoch": 1.82, "learning_rate": 2.6984999261238887e-05, "loss": 0.0047, "step": 702160 }, { "epoch": 1.82, "learning_rate": 2.6981111044867425e-05, "loss": 0.0049, "step": 702170 }, { "epoch": 1.82, "learning_rate": 2.697722282849596e-05, "loss": 0.0064, "step": 702180 }, { "epoch": 1.82, "learning_rate": 2.6973334612124495e-05, "loss": 0.0092, "step": 702190 }, { "epoch": 1.82, "learning_rate": 2.696944639575303e-05, "loss": 0.006, "step": 702200 }, { "epoch": 1.82, "learning_rate": 2.696555817938156e-05, "loss": 0.0071, "step": 702210 }, { "epoch": 1.82, "learning_rate": 2.69616699630101e-05, "loss": 0.0087, "step": 702220 }, { "epoch": 1.82, "learning_rate": 2.6957781746638634e-05, "loss": 0.0081, "step": 702230 }, { "epoch": 1.82, "learning_rate": 2.695389353026717e-05, "loss": 0.0066, "step": 702240 }, { "epoch": 1.82, "learning_rate": 2.6950005313895704e-05, "loss": 0.0085, "step": 702250 }, { "epoch": 1.82, "learning_rate": 2.6946117097524242e-05, "loss": 0.0112, "step": 702260 }, { "epoch": 1.82, "learning_rate": 2.6942228881152777e-05, "loss": 0.0129, "step": 702270 }, { "epoch": 1.82, "learning_rate": 2.6938340664781312e-05, "loss": 0.0087, "step": 702280 }, { "epoch": 1.82, "learning_rate": 2.6934452448409847e-05, "loss": 0.006, "step": 702290 }, { "epoch": 1.82, "learning_rate": 2.693056423203838e-05, "loss": 0.006, "step": 702300 }, { "epoch": 1.82, "learning_rate": 2.692667601566692e-05, "loss": 0.0049, "step": 702310 }, { "epoch": 1.82, "learning_rate": 2.6922787799295455e-05, "loss": 0.0062, "step": 702320 }, { "epoch": 1.82, "learning_rate": 2.6918899582923986e-05, "loss": 0.0056, "step": 702330 }, { "epoch": 1.82, "learning_rate": 2.691501136655252e-05, "loss": 0.0087, "step": 702340 }, { "epoch": 1.82, "learning_rate": 2.6911123150181056e-05, "loss": 0.0091, "step": 702350 }, { "epoch": 1.82, "learning_rate": 2.6907234933809594e-05, "loss": 0.0101, "step": 702360 }, { "epoch": 1.82, "learning_rate": 2.690334671743813e-05, "loss": 0.0064, "step": 702370 }, { "epoch": 1.82, "learning_rate": 2.6899458501066664e-05, "loss": 0.0083, "step": 702380 }, { "epoch": 1.82, "learning_rate": 2.68955702846952e-05, "loss": 0.006, "step": 702390 }, { "epoch": 1.82, "learning_rate": 2.6891682068323737e-05, "loss": 0.0066, "step": 702400 }, { "epoch": 1.82, "learning_rate": 2.6887793851952272e-05, "loss": 0.0072, "step": 702410 }, { "epoch": 1.82, "learning_rate": 2.6883905635580807e-05, "loss": 0.0069, "step": 702420 }, { "epoch": 1.82, "learning_rate": 2.688001741920934e-05, "loss": 0.0087, "step": 702430 }, { "epoch": 1.82, "learning_rate": 2.687612920283788e-05, "loss": 0.0084, "step": 702440 }, { "epoch": 1.82, "learning_rate": 2.6872240986466415e-05, "loss": 0.0083, "step": 702450 }, { "epoch": 1.82, "learning_rate": 2.6868352770094946e-05, "loss": 0.0114, "step": 702460 }, { "epoch": 1.82, "learning_rate": 2.686446455372348e-05, "loss": 0.0067, "step": 702470 }, { "epoch": 1.82, "learning_rate": 2.6860576337352016e-05, "loss": 0.0084, "step": 702480 }, { "epoch": 1.82, "learning_rate": 2.6856688120980554e-05, "loss": 0.0068, "step": 702490 }, { "epoch": 1.82, "learning_rate": 2.685279990460909e-05, "loss": 0.0064, "step": 702500 }, { "epoch": 1.82, "learning_rate": 2.6848911688237624e-05, "loss": 0.0054, "step": 702510 }, { "epoch": 1.82, "learning_rate": 2.684502347186616e-05, "loss": 0.0077, "step": 702520 }, { "epoch": 1.82, "learning_rate": 2.6841135255494697e-05, "loss": 0.0096, "step": 702530 }, { "epoch": 1.82, "learning_rate": 2.6837247039123232e-05, "loss": 0.007, "step": 702540 }, { "epoch": 1.82, "learning_rate": 2.6833358822751767e-05, "loss": 0.0062, "step": 702550 }, { "epoch": 1.82, "learning_rate": 2.68294706063803e-05, "loss": 0.0062, "step": 702560 }, { "epoch": 1.82, "learning_rate": 2.682558239000884e-05, "loss": 0.0075, "step": 702570 }, { "epoch": 1.82, "learning_rate": 2.682169417363737e-05, "loss": 0.0068, "step": 702580 }, { "epoch": 1.82, "learning_rate": 2.6817805957265906e-05, "loss": 0.0079, "step": 702590 }, { "epoch": 1.82, "learning_rate": 2.681391774089444e-05, "loss": 0.0097, "step": 702600 }, { "epoch": 1.82, "learning_rate": 2.6810029524522976e-05, "loss": 0.0071, "step": 702610 }, { "epoch": 1.82, "learning_rate": 2.6806141308151514e-05, "loss": 0.0061, "step": 702620 }, { "epoch": 1.82, "learning_rate": 2.680225309178005e-05, "loss": 0.0058, "step": 702630 }, { "epoch": 1.82, "learning_rate": 2.6798364875408584e-05, "loss": 0.0063, "step": 702640 }, { "epoch": 1.82, "learning_rate": 2.679447665903712e-05, "loss": 0.0082, "step": 702650 }, { "epoch": 1.82, "learning_rate": 2.6790588442665657e-05, "loss": 0.0104, "step": 702660 }, { "epoch": 1.82, "learning_rate": 2.6786700226294192e-05, "loss": 0.0073, "step": 702670 }, { "epoch": 1.82, "learning_rate": 2.6782812009922727e-05, "loss": 0.0071, "step": 702680 }, { "epoch": 1.82, "learning_rate": 2.677892379355126e-05, "loss": 0.0095, "step": 702690 }, { "epoch": 1.82, "learning_rate": 2.67750355771798e-05, "loss": 0.006, "step": 702700 }, { "epoch": 1.82, "learning_rate": 2.677114736080833e-05, "loss": 0.0117, "step": 702710 }, { "epoch": 1.82, "learning_rate": 2.6767259144436866e-05, "loss": 0.0076, "step": 702720 }, { "epoch": 1.82, "learning_rate": 2.67633709280654e-05, "loss": 0.0063, "step": 702730 }, { "epoch": 1.82, "learning_rate": 2.6759482711693936e-05, "loss": 0.0079, "step": 702740 }, { "epoch": 1.82, "learning_rate": 2.6755594495322474e-05, "loss": 0.0076, "step": 702750 }, { "epoch": 1.82, "learning_rate": 2.675170627895101e-05, "loss": 0.0053, "step": 702760 }, { "epoch": 1.82, "learning_rate": 2.6747818062579544e-05, "loss": 0.0063, "step": 702770 }, { "epoch": 1.82, "learning_rate": 2.674392984620808e-05, "loss": 0.0091, "step": 702780 }, { "epoch": 1.82, "learning_rate": 2.6740041629836617e-05, "loss": 0.0057, "step": 702790 }, { "epoch": 1.82, "learning_rate": 2.6736153413465152e-05, "loss": 0.0078, "step": 702800 }, { "epoch": 1.82, "learning_rate": 2.6732265197093687e-05, "loss": 0.0074, "step": 702810 }, { "epoch": 1.82, "learning_rate": 2.672837698072222e-05, "loss": 0.007, "step": 702820 }, { "epoch": 1.82, "learning_rate": 2.6724488764350753e-05, "loss": 0.0061, "step": 702830 }, { "epoch": 1.82, "learning_rate": 2.672060054797929e-05, "loss": 0.0106, "step": 702840 }, { "epoch": 1.82, "learning_rate": 2.6716712331607826e-05, "loss": 0.0068, "step": 702850 }, { "epoch": 1.82, "learning_rate": 2.671282411523636e-05, "loss": 0.0055, "step": 702860 }, { "epoch": 1.82, "learning_rate": 2.6708935898864896e-05, "loss": 0.0096, "step": 702870 }, { "epoch": 1.82, "learning_rate": 2.6705047682493434e-05, "loss": 0.0086, "step": 702880 }, { "epoch": 1.82, "learning_rate": 2.670115946612197e-05, "loss": 0.0102, "step": 702890 }, { "epoch": 1.82, "learning_rate": 2.6697271249750504e-05, "loss": 0.0063, "step": 702900 }, { "epoch": 1.82, "learning_rate": 2.669338303337904e-05, "loss": 0.0107, "step": 702910 }, { "epoch": 1.82, "learning_rate": 2.6689494817007577e-05, "loss": 0.0067, "step": 702920 }, { "epoch": 1.82, "learning_rate": 2.6685606600636112e-05, "loss": 0.0075, "step": 702930 }, { "epoch": 1.82, "learning_rate": 2.6681718384264647e-05, "loss": 0.0083, "step": 702940 }, { "epoch": 1.82, "learning_rate": 2.6677830167893178e-05, "loss": 0.0077, "step": 702950 }, { "epoch": 1.82, "learning_rate": 2.6673941951521713e-05, "loss": 0.0071, "step": 702960 }, { "epoch": 1.82, "learning_rate": 2.667005373515025e-05, "loss": 0.0062, "step": 702970 }, { "epoch": 1.82, "learning_rate": 2.6666165518778786e-05, "loss": 0.0063, "step": 702980 }, { "epoch": 1.82, "learning_rate": 2.666227730240732e-05, "loss": 0.0078, "step": 702990 }, { "epoch": 1.82, "learning_rate": 2.6658389086035856e-05, "loss": 0.0066, "step": 703000 }, { "epoch": 1.82, "eval_cer": 0.8816453012088664, "eval_loss": 0.004601156339049339, "eval_runtime": 107.7473, "eval_samples_per_second": 18.562, "eval_steps_per_second": 4.64, "step": 703000 }, { "epoch": 1.82, "learning_rate": 2.6654500869664394e-05, "loss": 0.0082, "step": 703010 }, { "epoch": 1.82, "learning_rate": 2.665061265329293e-05, "loss": 0.0077, "step": 703020 }, { "epoch": 1.82, "learning_rate": 2.6646724436921464e-05, "loss": 0.008, "step": 703030 }, { "epoch": 1.82, "learning_rate": 2.664283622055e-05, "loss": 0.0083, "step": 703040 }, { "epoch": 1.82, "learning_rate": 2.6638948004178537e-05, "loss": 0.0101, "step": 703050 }, { "epoch": 1.82, "learning_rate": 2.6635059787807072e-05, "loss": 0.0065, "step": 703060 }, { "epoch": 1.82, "learning_rate": 2.6631171571435607e-05, "loss": 0.0068, "step": 703070 }, { "epoch": 1.82, "learning_rate": 2.6627283355064138e-05, "loss": 0.0075, "step": 703080 }, { "epoch": 1.82, "learning_rate": 2.6623395138692673e-05, "loss": 0.0084, "step": 703090 }, { "epoch": 1.82, "learning_rate": 2.661950692232121e-05, "loss": 0.0063, "step": 703100 }, { "epoch": 1.82, "learning_rate": 2.6615618705949746e-05, "loss": 0.0091, "step": 703110 }, { "epoch": 1.82, "learning_rate": 2.661173048957828e-05, "loss": 0.0072, "step": 703120 }, { "epoch": 1.82, "learning_rate": 2.6607842273206816e-05, "loss": 0.0073, "step": 703130 }, { "epoch": 1.82, "learning_rate": 2.6603954056835354e-05, "loss": 0.0064, "step": 703140 }, { "epoch": 1.82, "learning_rate": 2.660006584046389e-05, "loss": 0.0101, "step": 703150 }, { "epoch": 1.82, "learning_rate": 2.6596177624092424e-05, "loss": 0.0067, "step": 703160 }, { "epoch": 1.82, "learning_rate": 2.659228940772096e-05, "loss": 0.0092, "step": 703170 }, { "epoch": 1.82, "learning_rate": 2.6588401191349497e-05, "loss": 0.0063, "step": 703180 }, { "epoch": 1.82, "learning_rate": 2.658451297497803e-05, "loss": 0.0059, "step": 703190 }, { "epoch": 1.82, "learning_rate": 2.6580624758606563e-05, "loss": 0.0077, "step": 703200 }, { "epoch": 1.82, "learning_rate": 2.6576736542235098e-05, "loss": 0.0071, "step": 703210 }, { "epoch": 1.82, "learning_rate": 2.6572848325863633e-05, "loss": 0.0064, "step": 703220 }, { "epoch": 1.82, "learning_rate": 2.656896010949217e-05, "loss": 0.0148, "step": 703230 }, { "epoch": 1.82, "learning_rate": 2.6565071893120706e-05, "loss": 0.0053, "step": 703240 }, { "epoch": 1.82, "learning_rate": 2.656118367674924e-05, "loss": 0.0079, "step": 703250 }, { "epoch": 1.82, "learning_rate": 2.6557295460377776e-05, "loss": 0.0067, "step": 703260 }, { "epoch": 1.82, "learning_rate": 2.6553407244006314e-05, "loss": 0.0081, "step": 703270 }, { "epoch": 1.82, "learning_rate": 2.654951902763485e-05, "loss": 0.0077, "step": 703280 }, { "epoch": 1.82, "learning_rate": 2.6545630811263384e-05, "loss": 0.0079, "step": 703290 }, { "epoch": 1.82, "learning_rate": 2.654174259489192e-05, "loss": 0.0075, "step": 703300 }, { "epoch": 1.82, "learning_rate": 2.6537854378520457e-05, "loss": 0.0079, "step": 703310 }, { "epoch": 1.82, "learning_rate": 2.653396616214899e-05, "loss": 0.0068, "step": 703320 }, { "epoch": 1.82, "learning_rate": 2.6530077945777523e-05, "loss": 0.0072, "step": 703330 }, { "epoch": 1.82, "learning_rate": 2.6526189729406058e-05, "loss": 0.008, "step": 703340 }, { "epoch": 1.82, "learning_rate": 2.6522301513034593e-05, "loss": 0.0092, "step": 703350 }, { "epoch": 1.82, "learning_rate": 2.651841329666313e-05, "loss": 0.0069, "step": 703360 }, { "epoch": 1.82, "learning_rate": 2.6514525080291666e-05, "loss": 0.0085, "step": 703370 }, { "epoch": 1.82, "learning_rate": 2.65106368639202e-05, "loss": 0.0084, "step": 703380 }, { "epoch": 1.82, "learning_rate": 2.6506748647548736e-05, "loss": 0.0089, "step": 703390 }, { "epoch": 1.82, "learning_rate": 2.6502860431177274e-05, "loss": 0.0094, "step": 703400 }, { "epoch": 1.82, "learning_rate": 2.649897221480581e-05, "loss": 0.0061, "step": 703410 }, { "epoch": 1.82, "learning_rate": 2.6495083998434344e-05, "loss": 0.0079, "step": 703420 }, { "epoch": 1.82, "learning_rate": 2.649119578206288e-05, "loss": 0.0079, "step": 703430 }, { "epoch": 1.82, "learning_rate": 2.6487307565691417e-05, "loss": 0.0071, "step": 703440 }, { "epoch": 1.82, "learning_rate": 2.6483419349319948e-05, "loss": 0.0068, "step": 703450 }, { "epoch": 1.82, "learning_rate": 2.6479531132948483e-05, "loss": 0.0068, "step": 703460 }, { "epoch": 1.82, "learning_rate": 2.6475642916577018e-05, "loss": 0.0077, "step": 703470 }, { "epoch": 1.82, "learning_rate": 2.6471754700205553e-05, "loss": 0.0083, "step": 703480 }, { "epoch": 1.82, "learning_rate": 2.646786648383409e-05, "loss": 0.0055, "step": 703490 }, { "epoch": 1.82, "learning_rate": 2.6463978267462626e-05, "loss": 0.007, "step": 703500 }, { "epoch": 1.82, "learning_rate": 2.646009005109116e-05, "loss": 0.0085, "step": 703510 }, { "epoch": 1.82, "learning_rate": 2.6456201834719696e-05, "loss": 0.0075, "step": 703520 }, { "epoch": 1.82, "learning_rate": 2.6452313618348234e-05, "loss": 0.0072, "step": 703530 }, { "epoch": 1.82, "learning_rate": 2.644842540197677e-05, "loss": 0.0101, "step": 703540 }, { "epoch": 1.82, "learning_rate": 2.6444537185605304e-05, "loss": 0.0153, "step": 703550 }, { "epoch": 1.82, "learning_rate": 2.644064896923384e-05, "loss": 0.007, "step": 703560 }, { "epoch": 1.82, "learning_rate": 2.643676075286237e-05, "loss": 0.0046, "step": 703570 }, { "epoch": 1.82, "learning_rate": 2.6432872536490908e-05, "loss": 0.0101, "step": 703580 }, { "epoch": 1.82, "learning_rate": 2.6428984320119443e-05, "loss": 0.0068, "step": 703590 }, { "epoch": 1.82, "learning_rate": 2.6425096103747978e-05, "loss": 0.0083, "step": 703600 }, { "epoch": 1.82, "learning_rate": 2.6421207887376513e-05, "loss": 0.007, "step": 703610 }, { "epoch": 1.82, "learning_rate": 2.641731967100505e-05, "loss": 0.0067, "step": 703620 }, { "epoch": 1.82, "learning_rate": 2.6413431454633586e-05, "loss": 0.0067, "step": 703630 }, { "epoch": 1.82, "learning_rate": 2.640954323826212e-05, "loss": 0.0073, "step": 703640 }, { "epoch": 1.82, "learning_rate": 2.6405655021890656e-05, "loss": 0.0078, "step": 703650 }, { "epoch": 1.82, "learning_rate": 2.6401766805519194e-05, "loss": 0.0093, "step": 703660 }, { "epoch": 1.82, "learning_rate": 2.639787858914773e-05, "loss": 0.0087, "step": 703670 }, { "epoch": 1.82, "learning_rate": 2.6393990372776264e-05, "loss": 0.0084, "step": 703680 }, { "epoch": 1.82, "learning_rate": 2.63901021564048e-05, "loss": 0.0075, "step": 703690 }, { "epoch": 1.82, "learning_rate": 2.638621394003333e-05, "loss": 0.0054, "step": 703700 }, { "epoch": 1.82, "learning_rate": 2.6382325723661868e-05, "loss": 0.0077, "step": 703710 }, { "epoch": 1.82, "learning_rate": 2.6378437507290403e-05, "loss": 0.0077, "step": 703720 }, { "epoch": 1.82, "learning_rate": 2.6374549290918938e-05, "loss": 0.0162, "step": 703730 }, { "epoch": 1.82, "learning_rate": 2.6370661074547473e-05, "loss": 0.0084, "step": 703740 }, { "epoch": 1.82, "learning_rate": 2.6366772858176008e-05, "loss": 0.0068, "step": 703750 }, { "epoch": 1.82, "learning_rate": 2.6362884641804546e-05, "loss": 0.0079, "step": 703760 }, { "epoch": 1.82, "learning_rate": 2.635899642543308e-05, "loss": 0.0061, "step": 703770 }, { "epoch": 1.82, "learning_rate": 2.6355108209061616e-05, "loss": 0.0071, "step": 703780 }, { "epoch": 1.82, "learning_rate": 2.635121999269015e-05, "loss": 0.0093, "step": 703790 }, { "epoch": 1.82, "learning_rate": 2.634733177631869e-05, "loss": 0.0181, "step": 703800 }, { "epoch": 1.82, "learning_rate": 2.6343443559947224e-05, "loss": 0.0092, "step": 703810 }, { "epoch": 1.82, "learning_rate": 2.6339555343575755e-05, "loss": 0.0085, "step": 703820 }, { "epoch": 1.82, "learning_rate": 2.633566712720429e-05, "loss": 0.0082, "step": 703830 }, { "epoch": 1.82, "learning_rate": 2.6331778910832825e-05, "loss": 0.0089, "step": 703840 }, { "epoch": 1.82, "learning_rate": 2.6327890694461363e-05, "loss": 0.0094, "step": 703850 }, { "epoch": 1.82, "learning_rate": 2.6324002478089898e-05, "loss": 0.0078, "step": 703860 }, { "epoch": 1.82, "learning_rate": 2.6320114261718433e-05, "loss": 0.0082, "step": 703870 }, { "epoch": 1.82, "learning_rate": 2.6316226045346968e-05, "loss": 0.0077, "step": 703880 }, { "epoch": 1.82, "learning_rate": 2.6312337828975506e-05, "loss": 0.0083, "step": 703890 }, { "epoch": 1.82, "learning_rate": 2.630844961260404e-05, "loss": 0.0074, "step": 703900 }, { "epoch": 1.82, "learning_rate": 2.6304561396232576e-05, "loss": 0.0098, "step": 703910 }, { "epoch": 1.82, "learning_rate": 2.630067317986111e-05, "loss": 0.0111, "step": 703920 }, { "epoch": 1.82, "learning_rate": 2.629678496348965e-05, "loss": 0.0056, "step": 703930 }, { "epoch": 1.82, "learning_rate": 2.6292896747118184e-05, "loss": 0.0086, "step": 703940 }, { "epoch": 1.82, "learning_rate": 2.6289008530746715e-05, "loss": 0.0082, "step": 703950 }, { "epoch": 1.82, "learning_rate": 2.628512031437525e-05, "loss": 0.0079, "step": 703960 }, { "epoch": 1.82, "learning_rate": 2.6281232098003785e-05, "loss": 0.0062, "step": 703970 }, { "epoch": 1.82, "learning_rate": 2.6277343881632323e-05, "loss": 0.005, "step": 703980 }, { "epoch": 1.82, "learning_rate": 2.6273455665260858e-05, "loss": 0.0065, "step": 703990 }, { "epoch": 1.82, "learning_rate": 2.6269567448889393e-05, "loss": 0.0061, "step": 704000 }, { "epoch": 1.82, "eval_cer": 0.8816634964890108, "eval_loss": 0.004665213171392679, "eval_runtime": 107.9314, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.633, "step": 704000 }, { "epoch": 1.82, "learning_rate": 2.6265679232517928e-05, "loss": 0.0105, "step": 704010 }, { "epoch": 1.82, "learning_rate": 2.6261791016146466e-05, "loss": 0.0067, "step": 704020 }, { "epoch": 1.82, "learning_rate": 2.6257902799775e-05, "loss": 0.0064, "step": 704030 }, { "epoch": 1.82, "learning_rate": 2.6254014583403536e-05, "loss": 0.0073, "step": 704040 }, { "epoch": 1.82, "learning_rate": 2.625012636703207e-05, "loss": 0.0094, "step": 704050 }, { "epoch": 1.83, "learning_rate": 2.624623815066061e-05, "loss": 0.0094, "step": 704060 }, { "epoch": 1.83, "learning_rate": 2.624234993428914e-05, "loss": 0.0053, "step": 704070 }, { "epoch": 1.83, "learning_rate": 2.6238461717917675e-05, "loss": 0.0084, "step": 704080 }, { "epoch": 1.83, "learning_rate": 2.623457350154621e-05, "loss": 0.0057, "step": 704090 }, { "epoch": 1.83, "learning_rate": 2.6230685285174745e-05, "loss": 0.0052, "step": 704100 }, { "epoch": 1.83, "learning_rate": 2.6226797068803283e-05, "loss": 0.0058, "step": 704110 }, { "epoch": 1.83, "learning_rate": 2.6222908852431818e-05, "loss": 0.0076, "step": 704120 }, { "epoch": 1.83, "learning_rate": 2.6219020636060353e-05, "loss": 0.0076, "step": 704130 }, { "epoch": 1.83, "learning_rate": 2.6215132419688888e-05, "loss": 0.0082, "step": 704140 }, { "epoch": 1.83, "learning_rate": 2.6211244203317426e-05, "loss": 0.0063, "step": 704150 }, { "epoch": 1.83, "learning_rate": 2.620735598694596e-05, "loss": 0.0069, "step": 704160 }, { "epoch": 1.83, "learning_rate": 2.6203467770574496e-05, "loss": 0.0073, "step": 704170 }, { "epoch": 1.83, "learning_rate": 2.619957955420303e-05, "loss": 0.0084, "step": 704180 }, { "epoch": 1.83, "learning_rate": 2.6195691337831562e-05, "loss": 0.0102, "step": 704190 }, { "epoch": 1.83, "learning_rate": 2.61918031214601e-05, "loss": 0.0069, "step": 704200 }, { "epoch": 1.83, "learning_rate": 2.6187914905088635e-05, "loss": 0.006, "step": 704210 }, { "epoch": 1.83, "learning_rate": 2.618402668871717e-05, "loss": 0.0079, "step": 704220 }, { "epoch": 1.83, "learning_rate": 2.6180138472345705e-05, "loss": 0.0128, "step": 704230 }, { "epoch": 1.83, "learning_rate": 2.6176250255974243e-05, "loss": 0.0053, "step": 704240 }, { "epoch": 1.83, "learning_rate": 2.6172362039602778e-05, "loss": 0.0073, "step": 704250 }, { "epoch": 1.83, "learning_rate": 2.6168473823231313e-05, "loss": 0.009, "step": 704260 }, { "epoch": 1.83, "learning_rate": 2.6164585606859848e-05, "loss": 0.0071, "step": 704270 }, { "epoch": 1.83, "learning_rate": 2.6160697390488386e-05, "loss": 0.0083, "step": 704280 }, { "epoch": 1.83, "learning_rate": 2.615680917411692e-05, "loss": 0.007, "step": 704290 }, { "epoch": 1.83, "learning_rate": 2.6152920957745456e-05, "loss": 0.0053, "step": 704300 }, { "epoch": 1.83, "learning_rate": 2.614903274137399e-05, "loss": 0.0043, "step": 704310 }, { "epoch": 1.83, "learning_rate": 2.6145144525002522e-05, "loss": 0.007, "step": 704320 }, { "epoch": 1.83, "learning_rate": 2.614125630863106e-05, "loss": 0.007, "step": 704330 }, { "epoch": 1.83, "learning_rate": 2.6137368092259595e-05, "loss": 0.011, "step": 704340 }, { "epoch": 1.83, "learning_rate": 2.613347987588813e-05, "loss": 0.0069, "step": 704350 }, { "epoch": 1.83, "learning_rate": 2.6129591659516665e-05, "loss": 0.0073, "step": 704360 }, { "epoch": 1.83, "learning_rate": 2.6125703443145203e-05, "loss": 0.0127, "step": 704370 }, { "epoch": 1.83, "learning_rate": 2.6121815226773738e-05, "loss": 0.0056, "step": 704380 }, { "epoch": 1.83, "learning_rate": 2.6117927010402273e-05, "loss": 0.0036, "step": 704390 }, { "epoch": 1.83, "learning_rate": 2.6114038794030808e-05, "loss": 0.009, "step": 704400 }, { "epoch": 1.83, "learning_rate": 2.6110150577659346e-05, "loss": 0.0071, "step": 704410 }, { "epoch": 1.83, "learning_rate": 2.610626236128788e-05, "loss": 0.0058, "step": 704420 }, { "epoch": 1.83, "learning_rate": 2.6102374144916416e-05, "loss": 0.0066, "step": 704430 }, { "epoch": 1.83, "learning_rate": 2.6098485928544947e-05, "loss": 0.0071, "step": 704440 }, { "epoch": 1.83, "learning_rate": 2.6094597712173482e-05, "loss": 0.0077, "step": 704450 }, { "epoch": 1.83, "learning_rate": 2.609070949580202e-05, "loss": 0.0089, "step": 704460 }, { "epoch": 1.83, "learning_rate": 2.6086821279430555e-05, "loss": 0.0062, "step": 704470 }, { "epoch": 1.83, "learning_rate": 2.608293306305909e-05, "loss": 0.007, "step": 704480 }, { "epoch": 1.83, "learning_rate": 2.6079044846687625e-05, "loss": 0.0059, "step": 704490 }, { "epoch": 1.83, "learning_rate": 2.6075156630316163e-05, "loss": 0.0079, "step": 704500 }, { "epoch": 1.83, "learning_rate": 2.6071268413944698e-05, "loss": 0.0073, "step": 704510 }, { "epoch": 1.83, "learning_rate": 2.6067380197573233e-05, "loss": 0.005, "step": 704520 }, { "epoch": 1.83, "learning_rate": 2.6063491981201768e-05, "loss": 0.0081, "step": 704530 }, { "epoch": 1.83, "learning_rate": 2.6059603764830306e-05, "loss": 0.0105, "step": 704540 }, { "epoch": 1.83, "learning_rate": 2.605571554845884e-05, "loss": 0.0066, "step": 704550 }, { "epoch": 1.83, "learning_rate": 2.6051827332087375e-05, "loss": 0.0082, "step": 704560 }, { "epoch": 1.83, "learning_rate": 2.6047939115715907e-05, "loss": 0.0079, "step": 704570 }, { "epoch": 1.83, "learning_rate": 2.6044050899344442e-05, "loss": 0.0075, "step": 704580 }, { "epoch": 1.83, "learning_rate": 2.604016268297298e-05, "loss": 0.0075, "step": 704590 }, { "epoch": 1.83, "learning_rate": 2.6036274466601515e-05, "loss": 0.0089, "step": 704600 }, { "epoch": 1.83, "learning_rate": 2.603238625023005e-05, "loss": 0.0078, "step": 704610 }, { "epoch": 1.83, "learning_rate": 2.6028498033858585e-05, "loss": 0.0067, "step": 704620 }, { "epoch": 1.83, "learning_rate": 2.6024609817487123e-05, "loss": 0.0067, "step": 704630 }, { "epoch": 1.83, "learning_rate": 2.6020721601115658e-05, "loss": 0.0059, "step": 704640 }, { "epoch": 1.83, "learning_rate": 2.6016833384744193e-05, "loss": 0.0083, "step": 704650 }, { "epoch": 1.83, "learning_rate": 2.6012945168372727e-05, "loss": 0.0057, "step": 704660 }, { "epoch": 1.83, "learning_rate": 2.6009056952001266e-05, "loss": 0.006, "step": 704670 }, { "epoch": 1.83, "learning_rate": 2.60051687356298e-05, "loss": 0.0076, "step": 704680 }, { "epoch": 1.83, "learning_rate": 2.6001280519258332e-05, "loss": 0.0078, "step": 704690 }, { "epoch": 1.83, "learning_rate": 2.5997392302886867e-05, "loss": 0.0068, "step": 704700 }, { "epoch": 1.83, "learning_rate": 2.5993504086515402e-05, "loss": 0.0068, "step": 704710 }, { "epoch": 1.83, "learning_rate": 2.598961587014394e-05, "loss": 0.0107, "step": 704720 }, { "epoch": 1.83, "learning_rate": 2.5985727653772475e-05, "loss": 0.0097, "step": 704730 }, { "epoch": 1.83, "learning_rate": 2.598183943740101e-05, "loss": 0.0083, "step": 704740 }, { "epoch": 1.83, "learning_rate": 2.5977951221029545e-05, "loss": 0.0068, "step": 704750 }, { "epoch": 1.83, "learning_rate": 2.5974063004658083e-05, "loss": 0.008, "step": 704760 }, { "epoch": 1.83, "learning_rate": 2.5970174788286618e-05, "loss": 0.0064, "step": 704770 }, { "epoch": 1.83, "learning_rate": 2.5966286571915153e-05, "loss": 0.0071, "step": 704780 }, { "epoch": 1.83, "learning_rate": 2.5962398355543687e-05, "loss": 0.0056, "step": 704790 }, { "epoch": 1.83, "learning_rate": 2.5958510139172226e-05, "loss": 0.0065, "step": 704800 }, { "epoch": 1.83, "learning_rate": 2.5954621922800757e-05, "loss": 0.0065, "step": 704810 }, { "epoch": 1.83, "learning_rate": 2.5950733706429292e-05, "loss": 0.0066, "step": 704820 }, { "epoch": 1.83, "learning_rate": 2.5946845490057827e-05, "loss": 0.0076, "step": 704830 }, { "epoch": 1.83, "learning_rate": 2.5942957273686362e-05, "loss": 0.0089, "step": 704840 }, { "epoch": 1.83, "learning_rate": 2.59390690573149e-05, "loss": 0.0067, "step": 704850 }, { "epoch": 1.83, "learning_rate": 2.5935180840943435e-05, "loss": 0.0099, "step": 704860 }, { "epoch": 1.83, "learning_rate": 2.593129262457197e-05, "loss": 0.0056, "step": 704870 }, { "epoch": 1.83, "learning_rate": 2.5927404408200505e-05, "loss": 0.0071, "step": 704880 }, { "epoch": 1.83, "learning_rate": 2.5923516191829043e-05, "loss": 0.0089, "step": 704890 }, { "epoch": 1.83, "learning_rate": 2.5919627975457578e-05, "loss": 0.0076, "step": 704900 }, { "epoch": 1.83, "learning_rate": 2.5915739759086113e-05, "loss": 0.0045, "step": 704910 }, { "epoch": 1.83, "learning_rate": 2.5911851542714647e-05, "loss": 0.0085, "step": 704920 }, { "epoch": 1.83, "learning_rate": 2.5907963326343186e-05, "loss": 0.0081, "step": 704930 }, { "epoch": 1.83, "learning_rate": 2.5904075109971717e-05, "loss": 0.0074, "step": 704940 }, { "epoch": 1.83, "learning_rate": 2.5900186893600252e-05, "loss": 0.0112, "step": 704950 }, { "epoch": 1.83, "learning_rate": 2.5896298677228787e-05, "loss": 0.0088, "step": 704960 }, { "epoch": 1.83, "learning_rate": 2.5892410460857322e-05, "loss": 0.0066, "step": 704970 }, { "epoch": 1.83, "learning_rate": 2.588852224448586e-05, "loss": 0.0101, "step": 704980 }, { "epoch": 1.83, "learning_rate": 2.5884634028114395e-05, "loss": 0.0083, "step": 704990 }, { "epoch": 1.83, "learning_rate": 2.588074581174293e-05, "loss": 0.0078, "step": 705000 }, { "epoch": 1.83, "eval_cer": 0.8816634964890108, "eval_loss": 0.004623005166649818, "eval_runtime": 107.8175, "eval_samples_per_second": 18.55, "eval_steps_per_second": 4.637, "step": 705000 }, { "epoch": 1.83, "learning_rate": 2.5876857595371465e-05, "loss": 0.0086, "step": 705010 }, { "epoch": 1.83, "learning_rate": 2.5872969379000003e-05, "loss": 0.0053, "step": 705020 }, { "epoch": 1.83, "learning_rate": 2.5869081162628538e-05, "loss": 0.0074, "step": 705030 }, { "epoch": 1.83, "learning_rate": 2.5865192946257073e-05, "loss": 0.0071, "step": 705040 }, { "epoch": 1.83, "learning_rate": 2.5861304729885607e-05, "loss": 0.0063, "step": 705050 }, { "epoch": 1.83, "learning_rate": 2.585741651351414e-05, "loss": 0.0061, "step": 705060 }, { "epoch": 1.83, "learning_rate": 2.5853528297142677e-05, "loss": 0.0063, "step": 705070 }, { "epoch": 1.83, "learning_rate": 2.5849640080771212e-05, "loss": 0.0063, "step": 705080 }, { "epoch": 1.83, "learning_rate": 2.5845751864399747e-05, "loss": 0.0056, "step": 705090 }, { "epoch": 1.83, "learning_rate": 2.5841863648028282e-05, "loss": 0.0084, "step": 705100 }, { "epoch": 1.83, "learning_rate": 2.5837975431656817e-05, "loss": 0.0064, "step": 705110 }, { "epoch": 1.83, "learning_rate": 2.5834087215285355e-05, "loss": 0.0062, "step": 705120 }, { "epoch": 1.83, "learning_rate": 2.583019899891389e-05, "loss": 0.0063, "step": 705130 }, { "epoch": 1.83, "learning_rate": 2.5826310782542425e-05, "loss": 0.0079, "step": 705140 }, { "epoch": 1.83, "learning_rate": 2.582242256617096e-05, "loss": 0.0074, "step": 705150 }, { "epoch": 1.83, "learning_rate": 2.5818534349799498e-05, "loss": 0.0058, "step": 705160 }, { "epoch": 1.83, "learning_rate": 2.5814646133428033e-05, "loss": 0.0088, "step": 705170 }, { "epoch": 1.83, "learning_rate": 2.5810757917056567e-05, "loss": 0.006, "step": 705180 }, { "epoch": 1.83, "learning_rate": 2.58068697006851e-05, "loss": 0.0077, "step": 705190 }, { "epoch": 1.83, "learning_rate": 2.5802981484313634e-05, "loss": 0.0075, "step": 705200 }, { "epoch": 1.83, "learning_rate": 2.5799093267942172e-05, "loss": 0.0088, "step": 705210 }, { "epoch": 1.83, "learning_rate": 2.5795205051570707e-05, "loss": 0.0087, "step": 705220 }, { "epoch": 1.83, "learning_rate": 2.579131683519924e-05, "loss": 0.0076, "step": 705230 }, { "epoch": 1.83, "learning_rate": 2.5787428618827777e-05, "loss": 0.0064, "step": 705240 }, { "epoch": 1.83, "learning_rate": 2.5783540402456315e-05, "loss": 0.0088, "step": 705250 }, { "epoch": 1.83, "learning_rate": 2.577965218608485e-05, "loss": 0.0071, "step": 705260 }, { "epoch": 1.83, "learning_rate": 2.5775763969713385e-05, "loss": 0.0083, "step": 705270 }, { "epoch": 1.83, "learning_rate": 2.577187575334192e-05, "loss": 0.0077, "step": 705280 }, { "epoch": 1.83, "learning_rate": 2.5767987536970458e-05, "loss": 0.0082, "step": 705290 }, { "epoch": 1.83, "learning_rate": 2.5764099320598992e-05, "loss": 0.0094, "step": 705300 }, { "epoch": 1.83, "learning_rate": 2.5760211104227524e-05, "loss": 0.0051, "step": 705310 }, { "epoch": 1.83, "learning_rate": 2.575632288785606e-05, "loss": 0.0101, "step": 705320 }, { "epoch": 1.83, "learning_rate": 2.5752434671484594e-05, "loss": 0.0073, "step": 705330 }, { "epoch": 1.83, "learning_rate": 2.5748546455113132e-05, "loss": 0.0053, "step": 705340 }, { "epoch": 1.83, "learning_rate": 2.5744658238741667e-05, "loss": 0.0092, "step": 705350 }, { "epoch": 1.83, "learning_rate": 2.57407700223702e-05, "loss": 0.0078, "step": 705360 }, { "epoch": 1.83, "learning_rate": 2.5736881805998737e-05, "loss": 0.0063, "step": 705370 }, { "epoch": 1.83, "learning_rate": 2.5732993589627275e-05, "loss": 0.0091, "step": 705380 }, { "epoch": 1.83, "learning_rate": 2.572910537325581e-05, "loss": 0.0062, "step": 705390 }, { "epoch": 1.83, "learning_rate": 2.5725217156884345e-05, "loss": 0.0097, "step": 705400 }, { "epoch": 1.83, "learning_rate": 2.572132894051288e-05, "loss": 0.0082, "step": 705410 }, { "epoch": 1.83, "learning_rate": 2.5717440724141418e-05, "loss": 0.0059, "step": 705420 }, { "epoch": 1.83, "learning_rate": 2.571355250776995e-05, "loss": 0.0064, "step": 705430 }, { "epoch": 1.83, "learning_rate": 2.5709664291398484e-05, "loss": 0.0071, "step": 705440 }, { "epoch": 1.83, "learning_rate": 2.570577607502702e-05, "loss": 0.007, "step": 705450 }, { "epoch": 1.83, "learning_rate": 2.5701887858655554e-05, "loss": 0.006, "step": 705460 }, { "epoch": 1.83, "learning_rate": 2.5697999642284092e-05, "loss": 0.0088, "step": 705470 }, { "epoch": 1.83, "learning_rate": 2.5694111425912627e-05, "loss": 0.008, "step": 705480 }, { "epoch": 1.83, "learning_rate": 2.569022320954116e-05, "loss": 0.0074, "step": 705490 }, { "epoch": 1.83, "learning_rate": 2.5686334993169697e-05, "loss": 0.0084, "step": 705500 }, { "epoch": 1.83, "learning_rate": 2.5682446776798235e-05, "loss": 0.0059, "step": 705510 }, { "epoch": 1.83, "learning_rate": 2.567855856042677e-05, "loss": 0.0075, "step": 705520 }, { "epoch": 1.83, "learning_rate": 2.5674670344055304e-05, "loss": 0.0105, "step": 705530 }, { "epoch": 1.83, "learning_rate": 2.567078212768384e-05, "loss": 0.006, "step": 705540 }, { "epoch": 1.83, "learning_rate": 2.5666893911312378e-05, "loss": 0.0091, "step": 705550 }, { "epoch": 1.83, "learning_rate": 2.566300569494091e-05, "loss": 0.0057, "step": 705560 }, { "epoch": 1.83, "learning_rate": 2.5659117478569444e-05, "loss": 0.0097, "step": 705570 }, { "epoch": 1.83, "learning_rate": 2.565522926219798e-05, "loss": 0.0053, "step": 705580 }, { "epoch": 1.83, "learning_rate": 2.5651341045826514e-05, "loss": 0.0067, "step": 705590 }, { "epoch": 1.83, "learning_rate": 2.5647452829455052e-05, "loss": 0.0058, "step": 705600 }, { "epoch": 1.83, "learning_rate": 2.5643564613083587e-05, "loss": 0.0061, "step": 705610 }, { "epoch": 1.83, "learning_rate": 2.563967639671212e-05, "loss": 0.0055, "step": 705620 }, { "epoch": 1.83, "learning_rate": 2.5635788180340656e-05, "loss": 0.0074, "step": 705630 }, { "epoch": 1.83, "learning_rate": 2.5631899963969195e-05, "loss": 0.0071, "step": 705640 }, { "epoch": 1.83, "learning_rate": 2.562801174759773e-05, "loss": 0.0071, "step": 705650 }, { "epoch": 1.83, "learning_rate": 2.5624123531226264e-05, "loss": 0.0073, "step": 705660 }, { "epoch": 1.83, "learning_rate": 2.56202353148548e-05, "loss": 0.0058, "step": 705670 }, { "epoch": 1.83, "learning_rate": 2.561634709848333e-05, "loss": 0.0102, "step": 705680 }, { "epoch": 1.83, "learning_rate": 2.561245888211187e-05, "loss": 0.0088, "step": 705690 }, { "epoch": 1.83, "learning_rate": 2.5608570665740404e-05, "loss": 0.006, "step": 705700 }, { "epoch": 1.83, "learning_rate": 2.560468244936894e-05, "loss": 0.0096, "step": 705710 }, { "epoch": 1.83, "learning_rate": 2.5600794232997474e-05, "loss": 0.0073, "step": 705720 }, { "epoch": 1.83, "learning_rate": 2.5596906016626012e-05, "loss": 0.0066, "step": 705730 }, { "epoch": 1.83, "learning_rate": 2.5593017800254547e-05, "loss": 0.009, "step": 705740 }, { "epoch": 1.83, "learning_rate": 2.558912958388308e-05, "loss": 0.0096, "step": 705750 }, { "epoch": 1.83, "learning_rate": 2.5585241367511616e-05, "loss": 0.0072, "step": 705760 }, { "epoch": 1.83, "learning_rate": 2.5581353151140155e-05, "loss": 0.0093, "step": 705770 }, { "epoch": 1.83, "learning_rate": 2.557746493476869e-05, "loss": 0.0074, "step": 705780 }, { "epoch": 1.83, "learning_rate": 2.5573576718397224e-05, "loss": 0.0066, "step": 705790 }, { "epoch": 1.83, "learning_rate": 2.556968850202576e-05, "loss": 0.0069, "step": 705800 }, { "epoch": 1.83, "learning_rate": 2.556580028565429e-05, "loss": 0.0078, "step": 705810 }, { "epoch": 1.83, "learning_rate": 2.556191206928283e-05, "loss": 0.0066, "step": 705820 }, { "epoch": 1.83, "learning_rate": 2.5558023852911364e-05, "loss": 0.0083, "step": 705830 }, { "epoch": 1.83, "learning_rate": 2.55541356365399e-05, "loss": 0.007, "step": 705840 }, { "epoch": 1.83, "learning_rate": 2.5550247420168434e-05, "loss": 0.0074, "step": 705850 }, { "epoch": 1.83, "learning_rate": 2.5546359203796972e-05, "loss": 0.0075, "step": 705860 }, { "epoch": 1.83, "learning_rate": 2.5542470987425507e-05, "loss": 0.005, "step": 705870 }, { "epoch": 1.83, "learning_rate": 2.553858277105404e-05, "loss": 0.0063, "step": 705880 }, { "epoch": 1.83, "learning_rate": 2.5534694554682576e-05, "loss": 0.0053, "step": 705890 }, { "epoch": 1.83, "learning_rate": 2.5530806338311115e-05, "loss": 0.0082, "step": 705900 }, { "epoch": 1.83, "learning_rate": 2.552691812193965e-05, "loss": 0.0057, "step": 705910 }, { "epoch": 1.83, "learning_rate": 2.5523029905568184e-05, "loss": 0.007, "step": 705920 }, { "epoch": 1.83, "learning_rate": 2.5519141689196716e-05, "loss": 0.0086, "step": 705930 }, { "epoch": 1.83, "learning_rate": 2.551525347282525e-05, "loss": 0.0081, "step": 705940 }, { "epoch": 1.83, "learning_rate": 2.551136525645379e-05, "loss": 0.012, "step": 705950 }, { "epoch": 1.83, "learning_rate": 2.5507477040082324e-05, "loss": 0.0086, "step": 705960 }, { "epoch": 1.83, "learning_rate": 2.550358882371086e-05, "loss": 0.0089, "step": 705970 }, { "epoch": 1.83, "learning_rate": 2.5499700607339394e-05, "loss": 0.0104, "step": 705980 }, { "epoch": 1.83, "learning_rate": 2.5495812390967932e-05, "loss": 0.0088, "step": 705990 }, { "epoch": 1.83, "learning_rate": 2.5491924174596467e-05, "loss": 0.0094, "step": 706000 }, { "epoch": 1.83, "eval_cer": 0.8816592975782083, "eval_loss": 0.004630614072084427, "eval_runtime": 107.9819, "eval_samples_per_second": 18.522, "eval_steps_per_second": 4.63, "step": 706000 }, { "epoch": 1.83, "learning_rate": 2.5488035958225e-05, "loss": 0.0078, "step": 706010 }, { "epoch": 1.83, "learning_rate": 2.5484147741853536e-05, "loss": 0.0082, "step": 706020 }, { "epoch": 1.83, "learning_rate": 2.5480259525482075e-05, "loss": 0.0075, "step": 706030 }, { "epoch": 1.83, "learning_rate": 2.547637130911061e-05, "loss": 0.006, "step": 706040 }, { "epoch": 1.83, "learning_rate": 2.547248309273914e-05, "loss": 0.0078, "step": 706050 }, { "epoch": 1.83, "learning_rate": 2.5468594876367676e-05, "loss": 0.0101, "step": 706060 }, { "epoch": 1.83, "learning_rate": 2.546470665999621e-05, "loss": 0.0076, "step": 706070 }, { "epoch": 1.83, "learning_rate": 2.546081844362475e-05, "loss": 0.0095, "step": 706080 }, { "epoch": 1.83, "learning_rate": 2.5456930227253284e-05, "loss": 0.0055, "step": 706090 }, { "epoch": 1.83, "learning_rate": 2.545304201088182e-05, "loss": 0.0073, "step": 706100 }, { "epoch": 1.83, "learning_rate": 2.5449153794510354e-05, "loss": 0.006, "step": 706110 }, { "epoch": 1.83, "learning_rate": 2.5445265578138892e-05, "loss": 0.0063, "step": 706120 }, { "epoch": 1.83, "learning_rate": 2.5441377361767427e-05, "loss": 0.0091, "step": 706130 }, { "epoch": 1.83, "learning_rate": 2.543748914539596e-05, "loss": 0.0068, "step": 706140 }, { "epoch": 1.83, "learning_rate": 2.5433600929024496e-05, "loss": 0.0082, "step": 706150 }, { "epoch": 1.83, "learning_rate": 2.5429712712653035e-05, "loss": 0.0066, "step": 706160 }, { "epoch": 1.83, "learning_rate": 2.542582449628157e-05, "loss": 0.007, "step": 706170 }, { "epoch": 1.83, "learning_rate": 2.54219362799101e-05, "loss": 0.0069, "step": 706180 }, { "epoch": 1.83, "learning_rate": 2.5418048063538636e-05, "loss": 0.0087, "step": 706190 }, { "epoch": 1.83, "learning_rate": 2.541415984716717e-05, "loss": 0.0085, "step": 706200 }, { "epoch": 1.83, "learning_rate": 2.541027163079571e-05, "loss": 0.0073, "step": 706210 }, { "epoch": 1.83, "learning_rate": 2.5406383414424244e-05, "loss": 0.0069, "step": 706220 }, { "epoch": 1.83, "learning_rate": 2.540249519805278e-05, "loss": 0.0088, "step": 706230 }, { "epoch": 1.83, "learning_rate": 2.5398606981681314e-05, "loss": 0.0073, "step": 706240 }, { "epoch": 1.83, "learning_rate": 2.5394718765309852e-05, "loss": 0.006, "step": 706250 }, { "epoch": 1.83, "learning_rate": 2.5390830548938387e-05, "loss": 0.0069, "step": 706260 }, { "epoch": 1.83, "learning_rate": 2.538694233256692e-05, "loss": 0.0067, "step": 706270 }, { "epoch": 1.83, "learning_rate": 2.5383054116195456e-05, "loss": 0.0074, "step": 706280 }, { "epoch": 1.83, "learning_rate": 2.5379165899823995e-05, "loss": 0.0076, "step": 706290 }, { "epoch": 1.83, "learning_rate": 2.5375277683452526e-05, "loss": 0.0079, "step": 706300 }, { "epoch": 1.83, "learning_rate": 2.537138946708106e-05, "loss": 0.008, "step": 706310 }, { "epoch": 1.83, "learning_rate": 2.5367501250709596e-05, "loss": 0.0071, "step": 706320 }, { "epoch": 1.83, "learning_rate": 2.536361303433813e-05, "loss": 0.0084, "step": 706330 }, { "epoch": 1.83, "learning_rate": 2.535972481796667e-05, "loss": 0.0076, "step": 706340 }, { "epoch": 1.83, "learning_rate": 2.5355836601595204e-05, "loss": 0.0049, "step": 706350 }, { "epoch": 1.83, "learning_rate": 2.535194838522374e-05, "loss": 0.0073, "step": 706360 }, { "epoch": 1.83, "learning_rate": 2.5348060168852274e-05, "loss": 0.0074, "step": 706370 }, { "epoch": 1.83, "learning_rate": 2.5344171952480812e-05, "loss": 0.0084, "step": 706380 }, { "epoch": 1.83, "learning_rate": 2.5340283736109347e-05, "loss": 0.0091, "step": 706390 }, { "epoch": 1.83, "learning_rate": 2.533639551973788e-05, "loss": 0.0057, "step": 706400 }, { "epoch": 1.83, "learning_rate": 2.5332507303366416e-05, "loss": 0.0063, "step": 706410 }, { "epoch": 1.83, "learning_rate": 2.5328619086994955e-05, "loss": 0.0077, "step": 706420 }, { "epoch": 1.83, "learning_rate": 2.5324730870623486e-05, "loss": 0.0062, "step": 706430 }, { "epoch": 1.83, "learning_rate": 2.532084265425202e-05, "loss": 0.0081, "step": 706440 }, { "epoch": 1.83, "learning_rate": 2.5316954437880556e-05, "loss": 0.0064, "step": 706450 }, { "epoch": 1.83, "learning_rate": 2.531306622150909e-05, "loss": 0.0084, "step": 706460 }, { "epoch": 1.83, "learning_rate": 2.530917800513763e-05, "loss": 0.0096, "step": 706470 }, { "epoch": 1.83, "learning_rate": 2.5305289788766164e-05, "loss": 0.0103, "step": 706480 }, { "epoch": 1.83, "learning_rate": 2.53014015723947e-05, "loss": 0.0051, "step": 706490 }, { "epoch": 1.83, "learning_rate": 2.5297513356023233e-05, "loss": 0.0078, "step": 706500 }, { "epoch": 1.83, "learning_rate": 2.529362513965177e-05, "loss": 0.0063, "step": 706510 }, { "epoch": 1.83, "learning_rate": 2.5289736923280307e-05, "loss": 0.0104, "step": 706520 }, { "epoch": 1.83, "learning_rate": 2.528584870690884e-05, "loss": 0.0066, "step": 706530 }, { "epoch": 1.83, "learning_rate": 2.5281960490537376e-05, "loss": 0.0063, "step": 706540 }, { "epoch": 1.83, "learning_rate": 2.5278072274165908e-05, "loss": 0.0101, "step": 706550 }, { "epoch": 1.83, "learning_rate": 2.5274184057794443e-05, "loss": 0.0101, "step": 706560 }, { "epoch": 1.83, "learning_rate": 2.527029584142298e-05, "loss": 0.0059, "step": 706570 }, { "epoch": 1.83, "learning_rate": 2.5266407625051516e-05, "loss": 0.0083, "step": 706580 }, { "epoch": 1.83, "learning_rate": 2.526251940868005e-05, "loss": 0.0076, "step": 706590 }, { "epoch": 1.83, "learning_rate": 2.5258631192308585e-05, "loss": 0.0076, "step": 706600 }, { "epoch": 1.83, "learning_rate": 2.5254742975937124e-05, "loss": 0.0079, "step": 706610 }, { "epoch": 1.83, "learning_rate": 2.525085475956566e-05, "loss": 0.0111, "step": 706620 }, { "epoch": 1.83, "learning_rate": 2.5246966543194193e-05, "loss": 0.007, "step": 706630 }, { "epoch": 1.83, "learning_rate": 2.524307832682273e-05, "loss": 0.0052, "step": 706640 }, { "epoch": 1.83, "learning_rate": 2.5239190110451267e-05, "loss": 0.0087, "step": 706650 }, { "epoch": 1.83, "learning_rate": 2.52353018940798e-05, "loss": 0.0065, "step": 706660 }, { "epoch": 1.83, "learning_rate": 2.5231413677708333e-05, "loss": 0.0095, "step": 706670 }, { "epoch": 1.83, "learning_rate": 2.5227525461336868e-05, "loss": 0.0052, "step": 706680 }, { "epoch": 1.83, "learning_rate": 2.5223637244965403e-05, "loss": 0.0087, "step": 706690 }, { "epoch": 1.83, "learning_rate": 2.521974902859394e-05, "loss": 0.0066, "step": 706700 }, { "epoch": 1.83, "learning_rate": 2.5215860812222476e-05, "loss": 0.0076, "step": 706710 }, { "epoch": 1.83, "learning_rate": 2.521197259585101e-05, "loss": 0.0085, "step": 706720 }, { "epoch": 1.83, "learning_rate": 2.5208084379479545e-05, "loss": 0.0071, "step": 706730 }, { "epoch": 1.83, "learning_rate": 2.5204196163108084e-05, "loss": 0.0081, "step": 706740 }, { "epoch": 1.83, "learning_rate": 2.520030794673662e-05, "loss": 0.0093, "step": 706750 }, { "epoch": 1.83, "learning_rate": 2.5196419730365153e-05, "loss": 0.0071, "step": 706760 }, { "epoch": 1.83, "learning_rate": 2.5192531513993688e-05, "loss": 0.0058, "step": 706770 }, { "epoch": 1.83, "learning_rate": 2.5188643297622227e-05, "loss": 0.0072, "step": 706780 }, { "epoch": 1.83, "learning_rate": 2.518475508125076e-05, "loss": 0.0081, "step": 706790 }, { "epoch": 1.83, "learning_rate": 2.5180866864879293e-05, "loss": 0.008, "step": 706800 }, { "epoch": 1.83, "learning_rate": 2.5176978648507828e-05, "loss": 0.0082, "step": 706810 }, { "epoch": 1.83, "learning_rate": 2.5173090432136363e-05, "loss": 0.0092, "step": 706820 }, { "epoch": 1.83, "learning_rate": 2.51692022157649e-05, "loss": 0.0094, "step": 706830 }, { "epoch": 1.83, "learning_rate": 2.5165313999393436e-05, "loss": 0.0109, "step": 706840 }, { "epoch": 1.83, "learning_rate": 2.516142578302197e-05, "loss": 0.0073, "step": 706850 }, { "epoch": 1.83, "learning_rate": 2.5157537566650505e-05, "loss": 0.0076, "step": 706860 }, { "epoch": 1.83, "learning_rate": 2.5153649350279044e-05, "loss": 0.0074, "step": 706870 }, { "epoch": 1.83, "learning_rate": 2.514976113390758e-05, "loss": 0.0077, "step": 706880 }, { "epoch": 1.83, "learning_rate": 2.5145872917536113e-05, "loss": 0.0092, "step": 706890 }, { "epoch": 1.83, "learning_rate": 2.5141984701164648e-05, "loss": 0.0078, "step": 706900 }, { "epoch": 1.83, "learning_rate": 2.5138096484793187e-05, "loss": 0.0076, "step": 706910 }, { "epoch": 1.83, "learning_rate": 2.5134208268421718e-05, "loss": 0.0058, "step": 706920 }, { "epoch": 1.83, "learning_rate": 2.5130320052050253e-05, "loss": 0.0102, "step": 706930 }, { "epoch": 1.83, "learning_rate": 2.5126431835678788e-05, "loss": 0.0076, "step": 706940 }, { "epoch": 1.83, "learning_rate": 2.5122543619307323e-05, "loss": 0.0066, "step": 706950 }, { "epoch": 1.83, "learning_rate": 2.511865540293586e-05, "loss": 0.0075, "step": 706960 }, { "epoch": 1.83, "learning_rate": 2.5114767186564396e-05, "loss": 0.0076, "step": 706970 }, { "epoch": 1.83, "learning_rate": 2.511087897019293e-05, "loss": 0.0057, "step": 706980 }, { "epoch": 1.83, "learning_rate": 2.5106990753821465e-05, "loss": 0.0085, "step": 706990 }, { "epoch": 1.83, "learning_rate": 2.5103102537450004e-05, "loss": 0.0058, "step": 707000 }, { "epoch": 1.83, "eval_cer": 0.8816550986674057, "eval_loss": 0.004591579083353281, "eval_runtime": 107.8494, "eval_samples_per_second": 18.544, "eval_steps_per_second": 4.636, "step": 707000 }, { "epoch": 1.83, "learning_rate": 2.509921432107854e-05, "loss": 0.0054, "step": 707010 }, { "epoch": 1.83, "learning_rate": 2.5095326104707073e-05, "loss": 0.0088, "step": 707020 }, { "epoch": 1.83, "learning_rate": 2.5091437888335608e-05, "loss": 0.0108, "step": 707030 }, { "epoch": 1.83, "learning_rate": 2.5087549671964146e-05, "loss": 0.0101, "step": 707040 }, { "epoch": 1.83, "learning_rate": 2.5083661455592678e-05, "loss": 0.0072, "step": 707050 }, { "epoch": 1.83, "learning_rate": 2.5079773239221213e-05, "loss": 0.0097, "step": 707060 }, { "epoch": 1.83, "learning_rate": 2.5075885022849748e-05, "loss": 0.0118, "step": 707070 }, { "epoch": 1.83, "learning_rate": 2.5071996806478283e-05, "loss": 0.0074, "step": 707080 }, { "epoch": 1.83, "learning_rate": 2.506810859010682e-05, "loss": 0.0073, "step": 707090 }, { "epoch": 1.83, "learning_rate": 2.5064220373735356e-05, "loss": 0.0073, "step": 707100 }, { "epoch": 1.83, "learning_rate": 2.506033215736389e-05, "loss": 0.0096, "step": 707110 }, { "epoch": 1.83, "learning_rate": 2.5056443940992425e-05, "loss": 0.0066, "step": 707120 }, { "epoch": 1.83, "learning_rate": 2.5052555724620964e-05, "loss": 0.0086, "step": 707130 }, { "epoch": 1.83, "learning_rate": 2.50486675082495e-05, "loss": 0.0085, "step": 707140 }, { "epoch": 1.83, "learning_rate": 2.5044779291878033e-05, "loss": 0.0048, "step": 707150 }, { "epoch": 1.83, "learning_rate": 2.5040891075506568e-05, "loss": 0.0074, "step": 707160 }, { "epoch": 1.83, "learning_rate": 2.50370028591351e-05, "loss": 0.0083, "step": 707170 }, { "epoch": 1.83, "learning_rate": 2.5033114642763638e-05, "loss": 0.0091, "step": 707180 }, { "epoch": 1.83, "learning_rate": 2.5029226426392173e-05, "loss": 0.0065, "step": 707190 }, { "epoch": 1.83, "learning_rate": 2.5025338210020708e-05, "loss": 0.0062, "step": 707200 }, { "epoch": 1.83, "learning_rate": 2.5021449993649243e-05, "loss": 0.0062, "step": 707210 }, { "epoch": 1.83, "learning_rate": 2.501756177727778e-05, "loss": 0.0069, "step": 707220 }, { "epoch": 1.83, "learning_rate": 2.5013673560906316e-05, "loss": 0.0064, "step": 707230 }, { "epoch": 1.83, "learning_rate": 2.500978534453485e-05, "loss": 0.0069, "step": 707240 }, { "epoch": 1.83, "learning_rate": 2.5005897128163385e-05, "loss": 0.0065, "step": 707250 }, { "epoch": 1.83, "learning_rate": 2.5002008911791924e-05, "loss": 0.0062, "step": 707260 }, { "epoch": 1.83, "learning_rate": 2.499812069542046e-05, "loss": 0.0078, "step": 707270 }, { "epoch": 1.83, "learning_rate": 2.4994232479048993e-05, "loss": 0.0056, "step": 707280 }, { "epoch": 1.83, "learning_rate": 2.4990344262677525e-05, "loss": 0.0058, "step": 707290 }, { "epoch": 1.83, "learning_rate": 2.498645604630606e-05, "loss": 0.0158, "step": 707300 }, { "epoch": 1.83, "learning_rate": 2.4982567829934598e-05, "loss": 0.0076, "step": 707310 }, { "epoch": 1.83, "learning_rate": 2.4978679613563133e-05, "loss": 0.0054, "step": 707320 }, { "epoch": 1.83, "learning_rate": 2.4974791397191668e-05, "loss": 0.0083, "step": 707330 }, { "epoch": 1.83, "learning_rate": 2.4970903180820203e-05, "loss": 0.0066, "step": 707340 }, { "epoch": 1.83, "learning_rate": 2.496701496444874e-05, "loss": 0.0097, "step": 707350 }, { "epoch": 1.83, "learning_rate": 2.4963126748077276e-05, "loss": 0.006, "step": 707360 }, { "epoch": 1.83, "learning_rate": 2.495923853170581e-05, "loss": 0.0061, "step": 707370 }, { "epoch": 1.83, "learning_rate": 2.4955350315334345e-05, "loss": 0.0075, "step": 707380 }, { "epoch": 1.83, "learning_rate": 2.4951462098962884e-05, "loss": 0.0065, "step": 707390 }, { "epoch": 1.83, "learning_rate": 2.494757388259142e-05, "loss": 0.0064, "step": 707400 }, { "epoch": 1.83, "learning_rate": 2.4943685666219953e-05, "loss": 0.0103, "step": 707410 }, { "epoch": 1.83, "learning_rate": 2.4939797449848485e-05, "loss": 0.0057, "step": 707420 }, { "epoch": 1.83, "learning_rate": 2.493590923347702e-05, "loss": 0.0086, "step": 707430 }, { "epoch": 1.83, "learning_rate": 2.4932021017105558e-05, "loss": 0.0107, "step": 707440 }, { "epoch": 1.83, "learning_rate": 2.4928132800734093e-05, "loss": 0.0054, "step": 707450 }, { "epoch": 1.83, "learning_rate": 2.4924244584362628e-05, "loss": 0.0059, "step": 707460 }, { "epoch": 1.83, "learning_rate": 2.4920356367991162e-05, "loss": 0.0076, "step": 707470 }, { "epoch": 1.83, "learning_rate": 2.49164681516197e-05, "loss": 0.0096, "step": 707480 }, { "epoch": 1.83, "learning_rate": 2.4912579935248236e-05, "loss": 0.0093, "step": 707490 }, { "epoch": 1.83, "learning_rate": 2.490869171887677e-05, "loss": 0.0073, "step": 707500 }, { "epoch": 1.83, "learning_rate": 2.4904803502505305e-05, "loss": 0.0077, "step": 707510 }, { "epoch": 1.83, "learning_rate": 2.4900915286133844e-05, "loss": 0.0082, "step": 707520 }, { "epoch": 1.83, "learning_rate": 2.489702706976238e-05, "loss": 0.0093, "step": 707530 }, { "epoch": 1.83, "learning_rate": 2.489313885339091e-05, "loss": 0.0063, "step": 707540 }, { "epoch": 1.83, "learning_rate": 2.4889250637019445e-05, "loss": 0.009, "step": 707550 }, { "epoch": 1.83, "learning_rate": 2.488536242064798e-05, "loss": 0.0057, "step": 707560 }, { "epoch": 1.83, "learning_rate": 2.4881474204276518e-05, "loss": 0.0083, "step": 707570 }, { "epoch": 1.83, "learning_rate": 2.4877585987905053e-05, "loss": 0.0084, "step": 707580 }, { "epoch": 1.83, "learning_rate": 2.4873697771533588e-05, "loss": 0.008, "step": 707590 }, { "epoch": 1.83, "learning_rate": 2.4869809555162122e-05, "loss": 0.0077, "step": 707600 }, { "epoch": 1.83, "learning_rate": 2.486592133879066e-05, "loss": 0.0101, "step": 707610 }, { "epoch": 1.83, "learning_rate": 2.4862033122419196e-05, "loss": 0.0066, "step": 707620 }, { "epoch": 1.83, "learning_rate": 2.485814490604773e-05, "loss": 0.0079, "step": 707630 }, { "epoch": 1.83, "learning_rate": 2.4854256689676265e-05, "loss": 0.0065, "step": 707640 }, { "epoch": 1.83, "learning_rate": 2.4850368473304804e-05, "loss": 0.0079, "step": 707650 }, { "epoch": 1.83, "learning_rate": 2.484648025693334e-05, "loss": 0.0055, "step": 707660 }, { "epoch": 1.83, "learning_rate": 2.484259204056187e-05, "loss": 0.0064, "step": 707670 }, { "epoch": 1.83, "learning_rate": 2.4838703824190405e-05, "loss": 0.0049, "step": 707680 }, { "epoch": 1.83, "learning_rate": 2.483481560781894e-05, "loss": 0.0079, "step": 707690 }, { "epoch": 1.83, "learning_rate": 2.4830927391447478e-05, "loss": 0.0067, "step": 707700 }, { "epoch": 1.83, "learning_rate": 2.4827039175076013e-05, "loss": 0.0103, "step": 707710 }, { "epoch": 1.83, "learning_rate": 2.4823150958704548e-05, "loss": 0.008, "step": 707720 }, { "epoch": 1.83, "learning_rate": 2.4819262742333082e-05, "loss": 0.0057, "step": 707730 }, { "epoch": 1.83, "learning_rate": 2.481537452596162e-05, "loss": 0.0069, "step": 707740 }, { "epoch": 1.83, "learning_rate": 2.4811486309590156e-05, "loss": 0.0075, "step": 707750 }, { "epoch": 1.83, "learning_rate": 2.480759809321869e-05, "loss": 0.0068, "step": 707760 }, { "epoch": 1.83, "learning_rate": 2.4803709876847225e-05, "loss": 0.0086, "step": 707770 }, { "epoch": 1.83, "learning_rate": 2.4799821660475764e-05, "loss": 0.0068, "step": 707780 }, { "epoch": 1.83, "learning_rate": 2.4795933444104295e-05, "loss": 0.0076, "step": 707790 }, { "epoch": 1.83, "learning_rate": 2.479204522773283e-05, "loss": 0.0045, "step": 707800 }, { "epoch": 1.83, "learning_rate": 2.4788157011361365e-05, "loss": 0.0075, "step": 707810 }, { "epoch": 1.83, "learning_rate": 2.47842687949899e-05, "loss": 0.0133, "step": 707820 }, { "epoch": 1.83, "learning_rate": 2.4780380578618438e-05, "loss": 0.006, "step": 707830 }, { "epoch": 1.83, "learning_rate": 2.4776492362246973e-05, "loss": 0.0073, "step": 707840 }, { "epoch": 1.83, "learning_rate": 2.4772604145875508e-05, "loss": 0.0065, "step": 707850 }, { "epoch": 1.83, "learning_rate": 2.4768715929504042e-05, "loss": 0.0088, "step": 707860 }, { "epoch": 1.83, "learning_rate": 2.476482771313258e-05, "loss": 0.0052, "step": 707870 }, { "epoch": 1.83, "learning_rate": 2.4760939496761116e-05, "loss": 0.0073, "step": 707880 }, { "epoch": 1.83, "learning_rate": 2.475705128038965e-05, "loss": 0.0097, "step": 707890 }, { "epoch": 1.83, "learning_rate": 2.4753163064018185e-05, "loss": 0.0073, "step": 707900 }, { "epoch": 1.84, "learning_rate": 2.474927484764672e-05, "loss": 0.0059, "step": 707910 }, { "epoch": 1.84, "learning_rate": 2.4745386631275255e-05, "loss": 0.0068, "step": 707920 }, { "epoch": 1.84, "learning_rate": 2.474149841490379e-05, "loss": 0.0071, "step": 707930 }, { "epoch": 1.84, "learning_rate": 2.4737610198532325e-05, "loss": 0.0078, "step": 707940 }, { "epoch": 1.84, "learning_rate": 2.473372198216086e-05, "loss": 0.0076, "step": 707950 }, { "epoch": 1.84, "learning_rate": 2.4729833765789394e-05, "loss": 0.0059, "step": 707960 }, { "epoch": 1.84, "learning_rate": 2.4725945549417933e-05, "loss": 0.0078, "step": 707970 }, { "epoch": 1.84, "learning_rate": 2.4722057333046468e-05, "loss": 0.0057, "step": 707980 }, { "epoch": 1.84, "learning_rate": 2.4718169116675002e-05, "loss": 0.0065, "step": 707990 }, { "epoch": 1.84, "learning_rate": 2.4714280900303537e-05, "loss": 0.006, "step": 708000 }, { "epoch": 1.84, "eval_cer": 0.8816481004827348, "eval_loss": 0.004648663103580475, "eval_runtime": 107.9525, "eval_samples_per_second": 18.527, "eval_steps_per_second": 4.632, "step": 708000 }, { "epoch": 1.84, "learning_rate": 2.4710392683932075e-05, "loss": 0.0102, "step": 708010 }, { "epoch": 1.84, "learning_rate": 2.470650446756061e-05, "loss": 0.0075, "step": 708020 }, { "epoch": 1.84, "learning_rate": 2.4702616251189145e-05, "loss": 0.0065, "step": 708030 }, { "epoch": 1.84, "learning_rate": 2.4698728034817677e-05, "loss": 0.0081, "step": 708040 }, { "epoch": 1.84, "learning_rate": 2.469483981844621e-05, "loss": 0.0119, "step": 708050 }, { "epoch": 1.84, "learning_rate": 2.469095160207475e-05, "loss": 0.0081, "step": 708060 }, { "epoch": 1.84, "learning_rate": 2.4687063385703285e-05, "loss": 0.0094, "step": 708070 }, { "epoch": 1.84, "learning_rate": 2.468317516933182e-05, "loss": 0.0059, "step": 708080 }, { "epoch": 1.84, "learning_rate": 2.4679286952960354e-05, "loss": 0.0077, "step": 708090 }, { "epoch": 1.84, "learning_rate": 2.4675398736588893e-05, "loss": 0.0076, "step": 708100 }, { "epoch": 1.84, "learning_rate": 2.4671510520217427e-05, "loss": 0.0071, "step": 708110 }, { "epoch": 1.84, "learning_rate": 2.4667622303845962e-05, "loss": 0.0079, "step": 708120 }, { "epoch": 1.84, "learning_rate": 2.4663734087474497e-05, "loss": 0.0087, "step": 708130 }, { "epoch": 1.84, "learning_rate": 2.4659845871103035e-05, "loss": 0.0071, "step": 708140 }, { "epoch": 1.84, "learning_rate": 2.465595765473157e-05, "loss": 0.0067, "step": 708150 }, { "epoch": 1.84, "learning_rate": 2.4652069438360102e-05, "loss": 0.0078, "step": 708160 }, { "epoch": 1.84, "learning_rate": 2.4648181221988637e-05, "loss": 0.006, "step": 708170 }, { "epoch": 1.84, "learning_rate": 2.464429300561717e-05, "loss": 0.0093, "step": 708180 }, { "epoch": 1.84, "learning_rate": 2.464040478924571e-05, "loss": 0.0072, "step": 708190 }, { "epoch": 1.84, "learning_rate": 2.4636516572874245e-05, "loss": 0.0109, "step": 708200 }, { "epoch": 1.84, "learning_rate": 2.463262835650278e-05, "loss": 0.0057, "step": 708210 }, { "epoch": 1.84, "learning_rate": 2.4628740140131314e-05, "loss": 0.0069, "step": 708220 }, { "epoch": 1.84, "learning_rate": 2.4624851923759853e-05, "loss": 0.0073, "step": 708230 }, { "epoch": 1.84, "learning_rate": 2.4620963707388387e-05, "loss": 0.0113, "step": 708240 }, { "epoch": 1.84, "learning_rate": 2.4617075491016922e-05, "loss": 0.008, "step": 708250 }, { "epoch": 1.84, "learning_rate": 2.4613187274645457e-05, "loss": 0.0081, "step": 708260 }, { "epoch": 1.84, "learning_rate": 2.4609299058273995e-05, "loss": 0.0063, "step": 708270 }, { "epoch": 1.84, "learning_rate": 2.460541084190253e-05, "loss": 0.0056, "step": 708280 }, { "epoch": 1.84, "learning_rate": 2.4601522625531062e-05, "loss": 0.0091, "step": 708290 }, { "epoch": 1.84, "learning_rate": 2.4597634409159597e-05, "loss": 0.0099, "step": 708300 }, { "epoch": 1.84, "learning_rate": 2.459374619278813e-05, "loss": 0.0071, "step": 708310 }, { "epoch": 1.84, "learning_rate": 2.458985797641667e-05, "loss": 0.0067, "step": 708320 }, { "epoch": 1.84, "learning_rate": 2.4585969760045205e-05, "loss": 0.0076, "step": 708330 }, { "epoch": 1.84, "learning_rate": 2.458208154367374e-05, "loss": 0.0096, "step": 708340 }, { "epoch": 1.84, "learning_rate": 2.4578193327302274e-05, "loss": 0.0058, "step": 708350 }, { "epoch": 1.84, "learning_rate": 2.4574305110930813e-05, "loss": 0.0073, "step": 708360 }, { "epoch": 1.84, "learning_rate": 2.4570416894559347e-05, "loss": 0.0124, "step": 708370 }, { "epoch": 1.84, "learning_rate": 2.4566528678187882e-05, "loss": 0.0061, "step": 708380 }, { "epoch": 1.84, "learning_rate": 2.4562640461816417e-05, "loss": 0.0099, "step": 708390 }, { "epoch": 1.84, "learning_rate": 2.4558752245444955e-05, "loss": 0.007, "step": 708400 }, { "epoch": 1.84, "learning_rate": 2.4554864029073487e-05, "loss": 0.0063, "step": 708410 }, { "epoch": 1.84, "learning_rate": 2.4550975812702022e-05, "loss": 0.0082, "step": 708420 }, { "epoch": 1.84, "learning_rate": 2.4547087596330557e-05, "loss": 0.0063, "step": 708430 }, { "epoch": 1.84, "learning_rate": 2.454319937995909e-05, "loss": 0.0062, "step": 708440 }, { "epoch": 1.84, "learning_rate": 2.453931116358763e-05, "loss": 0.0077, "step": 708450 }, { "epoch": 1.84, "learning_rate": 2.4535422947216165e-05, "loss": 0.0056, "step": 708460 }, { "epoch": 1.84, "learning_rate": 2.45315347308447e-05, "loss": 0.0093, "step": 708470 }, { "epoch": 1.84, "learning_rate": 2.4527646514473234e-05, "loss": 0.0095, "step": 708480 }, { "epoch": 1.84, "learning_rate": 2.4523758298101773e-05, "loss": 0.0092, "step": 708490 }, { "epoch": 1.84, "learning_rate": 2.4519870081730307e-05, "loss": 0.0082, "step": 708500 }, { "epoch": 1.84, "learning_rate": 2.4515981865358842e-05, "loss": 0.0111, "step": 708510 }, { "epoch": 1.84, "learning_rate": 2.4512093648987377e-05, "loss": 0.0052, "step": 708520 }, { "epoch": 1.84, "learning_rate": 2.4508205432615915e-05, "loss": 0.0065, "step": 708530 }, { "epoch": 1.84, "learning_rate": 2.4504317216244447e-05, "loss": 0.008, "step": 708540 }, { "epoch": 1.84, "learning_rate": 2.4500428999872982e-05, "loss": 0.0049, "step": 708550 }, { "epoch": 1.84, "learning_rate": 2.4496540783501517e-05, "loss": 0.0051, "step": 708560 }, { "epoch": 1.84, "learning_rate": 2.449265256713005e-05, "loss": 0.0074, "step": 708570 }, { "epoch": 1.84, "learning_rate": 2.448876435075859e-05, "loss": 0.008, "step": 708580 }, { "epoch": 1.84, "learning_rate": 2.4484876134387125e-05, "loss": 0.0095, "step": 708590 }, { "epoch": 1.84, "learning_rate": 2.448098791801566e-05, "loss": 0.0069, "step": 708600 }, { "epoch": 1.84, "learning_rate": 2.4477099701644194e-05, "loss": 0.0065, "step": 708610 }, { "epoch": 1.84, "learning_rate": 2.4473211485272733e-05, "loss": 0.0065, "step": 708620 }, { "epoch": 1.84, "learning_rate": 2.4469323268901267e-05, "loss": 0.0088, "step": 708630 }, { "epoch": 1.84, "learning_rate": 2.4465435052529802e-05, "loss": 0.009, "step": 708640 }, { "epoch": 1.84, "learning_rate": 2.4461546836158337e-05, "loss": 0.0111, "step": 708650 }, { "epoch": 1.84, "learning_rate": 2.445765861978687e-05, "loss": 0.0119, "step": 708660 }, { "epoch": 1.84, "learning_rate": 2.4453770403415407e-05, "loss": 0.0057, "step": 708670 }, { "epoch": 1.84, "learning_rate": 2.4449882187043942e-05, "loss": 0.0055, "step": 708680 }, { "epoch": 1.84, "learning_rate": 2.4445993970672477e-05, "loss": 0.007, "step": 708690 }, { "epoch": 1.84, "learning_rate": 2.444210575430101e-05, "loss": 0.007, "step": 708700 }, { "epoch": 1.84, "learning_rate": 2.443821753792955e-05, "loss": 0.0094, "step": 708710 }, { "epoch": 1.84, "learning_rate": 2.4434329321558085e-05, "loss": 0.0077, "step": 708720 }, { "epoch": 1.84, "learning_rate": 2.443044110518662e-05, "loss": 0.0096, "step": 708730 }, { "epoch": 1.84, "learning_rate": 2.4426552888815154e-05, "loss": 0.0103, "step": 708740 }, { "epoch": 1.84, "learning_rate": 2.4422664672443693e-05, "loss": 0.0072, "step": 708750 }, { "epoch": 1.84, "learning_rate": 2.4418776456072227e-05, "loss": 0.0092, "step": 708760 }, { "epoch": 1.84, "learning_rate": 2.4414888239700762e-05, "loss": 0.0064, "step": 708770 }, { "epoch": 1.84, "learning_rate": 2.4411000023329294e-05, "loss": 0.0094, "step": 708780 }, { "epoch": 1.84, "learning_rate": 2.440711180695783e-05, "loss": 0.0073, "step": 708790 }, { "epoch": 1.84, "learning_rate": 2.4403223590586367e-05, "loss": 0.0075, "step": 708800 }, { "epoch": 1.84, "learning_rate": 2.43993353742149e-05, "loss": 0.0098, "step": 708810 }, { "epoch": 1.84, "learning_rate": 2.4395447157843437e-05, "loss": 0.0064, "step": 708820 }, { "epoch": 1.84, "learning_rate": 2.439155894147197e-05, "loss": 0.0078, "step": 708830 }, { "epoch": 1.84, "learning_rate": 2.438767072510051e-05, "loss": 0.0078, "step": 708840 }, { "epoch": 1.84, "learning_rate": 2.4383782508729045e-05, "loss": 0.0089, "step": 708850 }, { "epoch": 1.84, "learning_rate": 2.437989429235758e-05, "loss": 0.0085, "step": 708860 }, { "epoch": 1.84, "learning_rate": 2.4376006075986114e-05, "loss": 0.0067, "step": 708870 }, { "epoch": 1.84, "learning_rate": 2.4372117859614652e-05, "loss": 0.0072, "step": 708880 }, { "epoch": 1.84, "learning_rate": 2.4368229643243187e-05, "loss": 0.0078, "step": 708890 }, { "epoch": 1.84, "learning_rate": 2.4364341426871722e-05, "loss": 0.0068, "step": 708900 }, { "epoch": 1.84, "learning_rate": 2.4360453210500254e-05, "loss": 0.0056, "step": 708910 }, { "epoch": 1.84, "learning_rate": 2.435656499412879e-05, "loss": 0.0065, "step": 708920 }, { "epoch": 1.84, "learning_rate": 2.4352676777757327e-05, "loss": 0.0072, "step": 708930 }, { "epoch": 1.84, "learning_rate": 2.434878856138586e-05, "loss": 0.0078, "step": 708940 }, { "epoch": 1.84, "learning_rate": 2.4344900345014397e-05, "loss": 0.0071, "step": 708950 }, { "epoch": 1.84, "learning_rate": 2.434101212864293e-05, "loss": 0.0084, "step": 708960 }, { "epoch": 1.84, "learning_rate": 2.433712391227147e-05, "loss": 0.0058, "step": 708970 }, { "epoch": 1.84, "learning_rate": 2.4333235695900004e-05, "loss": 0.0086, "step": 708980 }, { "epoch": 1.84, "learning_rate": 2.432934747952854e-05, "loss": 0.0066, "step": 708990 }, { "epoch": 1.84, "learning_rate": 2.4325459263157074e-05, "loss": 0.007, "step": 709000 }, { "epoch": 1.84, "eval_cer": 0.8816355037503272, "eval_loss": 0.004716834053397179, "eval_runtime": 107.9456, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 709000 }, { "epoch": 1.84, "learning_rate": 2.4321571046785612e-05, "loss": 0.0075, "step": 709010 }, { "epoch": 1.84, "learning_rate": 2.4317682830414147e-05, "loss": 0.0085, "step": 709020 }, { "epoch": 1.84, "learning_rate": 2.431379461404268e-05, "loss": 0.0058, "step": 709030 }, { "epoch": 1.84, "learning_rate": 2.4309906397671214e-05, "loss": 0.0119, "step": 709040 }, { "epoch": 1.84, "learning_rate": 2.430601818129975e-05, "loss": 0.0096, "step": 709050 }, { "epoch": 1.84, "learning_rate": 2.4302129964928287e-05, "loss": 0.0083, "step": 709060 }, { "epoch": 1.84, "learning_rate": 2.429824174855682e-05, "loss": 0.0077, "step": 709070 }, { "epoch": 1.84, "learning_rate": 2.4294353532185356e-05, "loss": 0.0098, "step": 709080 }, { "epoch": 1.84, "learning_rate": 2.429046531581389e-05, "loss": 0.0116, "step": 709090 }, { "epoch": 1.84, "learning_rate": 2.428657709944243e-05, "loss": 0.0071, "step": 709100 }, { "epoch": 1.84, "learning_rate": 2.4282688883070964e-05, "loss": 0.0062, "step": 709110 }, { "epoch": 1.84, "learning_rate": 2.42788006666995e-05, "loss": 0.0084, "step": 709120 }, { "epoch": 1.84, "learning_rate": 2.4274912450328034e-05, "loss": 0.0078, "step": 709130 }, { "epoch": 1.84, "learning_rate": 2.4271024233956572e-05, "loss": 0.0075, "step": 709140 }, { "epoch": 1.84, "learning_rate": 2.4267136017585107e-05, "loss": 0.0065, "step": 709150 }, { "epoch": 1.84, "learning_rate": 2.426324780121364e-05, "loss": 0.0105, "step": 709160 }, { "epoch": 1.84, "learning_rate": 2.4259359584842174e-05, "loss": 0.0083, "step": 709170 }, { "epoch": 1.84, "learning_rate": 2.425547136847071e-05, "loss": 0.007, "step": 709180 }, { "epoch": 1.84, "learning_rate": 2.4251583152099247e-05, "loss": 0.0081, "step": 709190 }, { "epoch": 1.84, "learning_rate": 2.424769493572778e-05, "loss": 0.0057, "step": 709200 }, { "epoch": 1.84, "learning_rate": 2.4243806719356316e-05, "loss": 0.0078, "step": 709210 }, { "epoch": 1.84, "learning_rate": 2.423991850298485e-05, "loss": 0.0061, "step": 709220 }, { "epoch": 1.84, "learning_rate": 2.423603028661339e-05, "loss": 0.0062, "step": 709230 }, { "epoch": 1.84, "learning_rate": 2.4232142070241924e-05, "loss": 0.008, "step": 709240 }, { "epoch": 1.84, "learning_rate": 2.422825385387046e-05, "loss": 0.007, "step": 709250 }, { "epoch": 1.84, "learning_rate": 2.4224365637498994e-05, "loss": 0.0084, "step": 709260 }, { "epoch": 1.84, "learning_rate": 2.422047742112753e-05, "loss": 0.0075, "step": 709270 }, { "epoch": 1.84, "learning_rate": 2.4216589204756064e-05, "loss": 0.0111, "step": 709280 }, { "epoch": 1.84, "learning_rate": 2.42127009883846e-05, "loss": 0.0083, "step": 709290 }, { "epoch": 1.84, "learning_rate": 2.4208812772013134e-05, "loss": 0.0053, "step": 709300 }, { "epoch": 1.84, "learning_rate": 2.420492455564167e-05, "loss": 0.0089, "step": 709310 }, { "epoch": 1.84, "learning_rate": 2.4201036339270203e-05, "loss": 0.0064, "step": 709320 }, { "epoch": 1.84, "learning_rate": 2.419714812289874e-05, "loss": 0.0081, "step": 709330 }, { "epoch": 1.84, "learning_rate": 2.4193259906527276e-05, "loss": 0.0068, "step": 709340 }, { "epoch": 1.84, "learning_rate": 2.418937169015581e-05, "loss": 0.0061, "step": 709350 }, { "epoch": 1.84, "learning_rate": 2.4185483473784346e-05, "loss": 0.0063, "step": 709360 }, { "epoch": 1.84, "learning_rate": 2.4181595257412884e-05, "loss": 0.0066, "step": 709370 }, { "epoch": 1.84, "learning_rate": 2.417770704104142e-05, "loss": 0.0091, "step": 709380 }, { "epoch": 1.84, "learning_rate": 2.4173818824669954e-05, "loss": 0.0079, "step": 709390 }, { "epoch": 1.84, "learning_rate": 2.4169930608298486e-05, "loss": 0.0071, "step": 709400 }, { "epoch": 1.84, "learning_rate": 2.416604239192702e-05, "loss": 0.0087, "step": 709410 }, { "epoch": 1.84, "learning_rate": 2.416215417555556e-05, "loss": 0.0083, "step": 709420 }, { "epoch": 1.84, "learning_rate": 2.4158265959184094e-05, "loss": 0.0085, "step": 709430 }, { "epoch": 1.84, "learning_rate": 2.415437774281263e-05, "loss": 0.0086, "step": 709440 }, { "epoch": 1.84, "learning_rate": 2.4150489526441163e-05, "loss": 0.0059, "step": 709450 }, { "epoch": 1.84, "learning_rate": 2.41466013100697e-05, "loss": 0.0135, "step": 709460 }, { "epoch": 1.84, "learning_rate": 2.4142713093698236e-05, "loss": 0.0074, "step": 709470 }, { "epoch": 1.84, "learning_rate": 2.413882487732677e-05, "loss": 0.0068, "step": 709480 }, { "epoch": 1.84, "learning_rate": 2.4134936660955306e-05, "loss": 0.0177, "step": 709490 }, { "epoch": 1.84, "learning_rate": 2.4131048444583844e-05, "loss": 0.01, "step": 709500 }, { "epoch": 1.84, "learning_rate": 2.412716022821238e-05, "loss": 0.0073, "step": 709510 }, { "epoch": 1.84, "learning_rate": 2.4123272011840914e-05, "loss": 0.0058, "step": 709520 }, { "epoch": 1.84, "learning_rate": 2.4119383795469446e-05, "loss": 0.0094, "step": 709530 }, { "epoch": 1.84, "learning_rate": 2.411549557909798e-05, "loss": 0.0106, "step": 709540 }, { "epoch": 1.84, "learning_rate": 2.411160736272652e-05, "loss": 0.0088, "step": 709550 }, { "epoch": 1.84, "learning_rate": 2.4107719146355054e-05, "loss": 0.0109, "step": 709560 }, { "epoch": 1.84, "learning_rate": 2.410383092998359e-05, "loss": 0.0064, "step": 709570 }, { "epoch": 1.84, "learning_rate": 2.4099942713612123e-05, "loss": 0.0083, "step": 709580 }, { "epoch": 1.84, "learning_rate": 2.409605449724066e-05, "loss": 0.0057, "step": 709590 }, { "epoch": 1.84, "learning_rate": 2.4092166280869196e-05, "loss": 0.0067, "step": 709600 }, { "epoch": 1.84, "learning_rate": 2.408827806449773e-05, "loss": 0.0076, "step": 709610 }, { "epoch": 1.84, "learning_rate": 2.4084389848126266e-05, "loss": 0.0094, "step": 709620 }, { "epoch": 1.84, "learning_rate": 2.4080501631754804e-05, "loss": 0.0067, "step": 709630 }, { "epoch": 1.84, "learning_rate": 2.407661341538334e-05, "loss": 0.0084, "step": 709640 }, { "epoch": 1.84, "learning_rate": 2.407272519901187e-05, "loss": 0.0074, "step": 709650 }, { "epoch": 1.84, "learning_rate": 2.4068836982640406e-05, "loss": 0.0091, "step": 709660 }, { "epoch": 1.84, "learning_rate": 2.406494876626894e-05, "loss": 0.0071, "step": 709670 }, { "epoch": 1.84, "learning_rate": 2.406106054989748e-05, "loss": 0.0067, "step": 709680 }, { "epoch": 1.84, "learning_rate": 2.4057172333526014e-05, "loss": 0.0069, "step": 709690 }, { "epoch": 1.84, "learning_rate": 2.405328411715455e-05, "loss": 0.0085, "step": 709700 }, { "epoch": 1.84, "learning_rate": 2.4049395900783083e-05, "loss": 0.0108, "step": 709710 }, { "epoch": 1.84, "learning_rate": 2.404550768441162e-05, "loss": 0.0081, "step": 709720 }, { "epoch": 1.84, "learning_rate": 2.4041619468040156e-05, "loss": 0.0078, "step": 709730 }, { "epoch": 1.84, "learning_rate": 2.403773125166869e-05, "loss": 0.013, "step": 709740 }, { "epoch": 1.84, "learning_rate": 2.4033843035297226e-05, "loss": 0.0067, "step": 709750 }, { "epoch": 1.84, "learning_rate": 2.4029954818925764e-05, "loss": 0.0063, "step": 709760 }, { "epoch": 1.84, "learning_rate": 2.40260666025543e-05, "loss": 0.0076, "step": 709770 }, { "epoch": 1.84, "learning_rate": 2.402217838618283e-05, "loss": 0.006, "step": 709780 }, { "epoch": 1.84, "learning_rate": 2.4018290169811366e-05, "loss": 0.0088, "step": 709790 }, { "epoch": 1.84, "learning_rate": 2.40144019534399e-05, "loss": 0.0086, "step": 709800 }, { "epoch": 1.84, "learning_rate": 2.401051373706844e-05, "loss": 0.0086, "step": 709810 }, { "epoch": 1.84, "learning_rate": 2.4006625520696974e-05, "loss": 0.0069, "step": 709820 }, { "epoch": 1.84, "learning_rate": 2.400273730432551e-05, "loss": 0.0082, "step": 709830 }, { "epoch": 1.84, "learning_rate": 2.3998849087954043e-05, "loss": 0.0087, "step": 709840 }, { "epoch": 1.84, "learning_rate": 2.399496087158258e-05, "loss": 0.0088, "step": 709850 }, { "epoch": 1.84, "learning_rate": 2.3991072655211116e-05, "loss": 0.0074, "step": 709860 }, { "epoch": 1.84, "learning_rate": 2.398718443883965e-05, "loss": 0.0068, "step": 709870 }, { "epoch": 1.84, "learning_rate": 2.3983296222468186e-05, "loss": 0.006, "step": 709880 }, { "epoch": 1.84, "learning_rate": 2.3979408006096724e-05, "loss": 0.007, "step": 709890 }, { "epoch": 1.84, "learning_rate": 2.3975519789725256e-05, "loss": 0.0072, "step": 709900 }, { "epoch": 1.84, "learning_rate": 2.397163157335379e-05, "loss": 0.0057, "step": 709910 }, { "epoch": 1.84, "learning_rate": 2.3967743356982326e-05, "loss": 0.0066, "step": 709920 }, { "epoch": 1.84, "learning_rate": 2.396385514061086e-05, "loss": 0.0062, "step": 709930 }, { "epoch": 1.84, "learning_rate": 2.39599669242394e-05, "loss": 0.007, "step": 709940 }, { "epoch": 1.84, "learning_rate": 2.3956078707867933e-05, "loss": 0.0076, "step": 709950 }, { "epoch": 1.84, "learning_rate": 2.395219049149647e-05, "loss": 0.0063, "step": 709960 }, { "epoch": 1.84, "learning_rate": 2.3948302275125003e-05, "loss": 0.0084, "step": 709970 }, { "epoch": 1.84, "learning_rate": 2.394441405875354e-05, "loss": 0.0074, "step": 709980 }, { "epoch": 1.84, "learning_rate": 2.3940525842382076e-05, "loss": 0.0089, "step": 709990 }, { "epoch": 1.84, "learning_rate": 2.393663762601061e-05, "loss": 0.0087, "step": 710000 }, { "epoch": 1.84, "eval_cer": 0.881642501934998, "eval_loss": 0.00460857292637229, "eval_runtime": 107.9419, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 710000 }, { "epoch": 1.84, "learning_rate": 2.3932749409639146e-05, "loss": 0.0064, "step": 710010 }, { "epoch": 1.84, "learning_rate": 2.3928861193267678e-05, "loss": 0.0111, "step": 710020 }, { "epoch": 1.84, "learning_rate": 2.3924972976896216e-05, "loss": 0.0067, "step": 710030 }, { "epoch": 1.84, "learning_rate": 2.392108476052475e-05, "loss": 0.0085, "step": 710040 }, { "epoch": 1.84, "learning_rate": 2.3917196544153285e-05, "loss": 0.0082, "step": 710050 }, { "epoch": 1.84, "learning_rate": 2.391330832778182e-05, "loss": 0.0061, "step": 710060 }, { "epoch": 1.84, "learning_rate": 2.390942011141036e-05, "loss": 0.007, "step": 710070 }, { "epoch": 1.84, "learning_rate": 2.3905531895038893e-05, "loss": 0.007, "step": 710080 }, { "epoch": 1.84, "learning_rate": 2.390164367866743e-05, "loss": 0.0073, "step": 710090 }, { "epoch": 1.84, "learning_rate": 2.3897755462295963e-05, "loss": 0.0081, "step": 710100 }, { "epoch": 1.84, "learning_rate": 2.38938672459245e-05, "loss": 0.0066, "step": 710110 }, { "epoch": 1.84, "learning_rate": 2.3889979029553036e-05, "loss": 0.0078, "step": 710120 }, { "epoch": 1.84, "learning_rate": 2.388609081318157e-05, "loss": 0.0064, "step": 710130 }, { "epoch": 1.84, "learning_rate": 2.3882202596810106e-05, "loss": 0.0078, "step": 710140 }, { "epoch": 1.84, "learning_rate": 2.3878314380438638e-05, "loss": 0.0076, "step": 710150 }, { "epoch": 1.84, "learning_rate": 2.3874426164067176e-05, "loss": 0.005, "step": 710160 }, { "epoch": 1.84, "learning_rate": 2.387053794769571e-05, "loss": 0.0058, "step": 710170 }, { "epoch": 1.84, "learning_rate": 2.3866649731324245e-05, "loss": 0.0066, "step": 710180 }, { "epoch": 1.84, "learning_rate": 2.386276151495278e-05, "loss": 0.0049, "step": 710190 }, { "epoch": 1.84, "learning_rate": 2.385887329858132e-05, "loss": 0.0086, "step": 710200 }, { "epoch": 1.84, "learning_rate": 2.3854985082209853e-05, "loss": 0.0073, "step": 710210 }, { "epoch": 1.84, "learning_rate": 2.385109686583839e-05, "loss": 0.008, "step": 710220 }, { "epoch": 1.84, "learning_rate": 2.3847208649466923e-05, "loss": 0.0061, "step": 710230 }, { "epoch": 1.84, "learning_rate": 2.384332043309546e-05, "loss": 0.0091, "step": 710240 }, { "epoch": 1.84, "learning_rate": 2.3839432216723996e-05, "loss": 0.0073, "step": 710250 }, { "epoch": 1.84, "learning_rate": 2.383554400035253e-05, "loss": 0.0054, "step": 710260 }, { "epoch": 1.84, "learning_rate": 2.3831655783981063e-05, "loss": 0.0056, "step": 710270 }, { "epoch": 1.84, "learning_rate": 2.3827767567609597e-05, "loss": 0.0074, "step": 710280 }, { "epoch": 1.84, "learning_rate": 2.3823879351238136e-05, "loss": 0.0077, "step": 710290 }, { "epoch": 1.84, "learning_rate": 2.381999113486667e-05, "loss": 0.0061, "step": 710300 }, { "epoch": 1.84, "learning_rate": 2.3816102918495205e-05, "loss": 0.007, "step": 710310 }, { "epoch": 1.84, "learning_rate": 2.381221470212374e-05, "loss": 0.0081, "step": 710320 }, { "epoch": 1.84, "learning_rate": 2.380832648575228e-05, "loss": 0.0065, "step": 710330 }, { "epoch": 1.84, "learning_rate": 2.3804438269380813e-05, "loss": 0.0069, "step": 710340 }, { "epoch": 1.84, "learning_rate": 2.3800550053009348e-05, "loss": 0.0089, "step": 710350 }, { "epoch": 1.84, "learning_rate": 2.3796661836637883e-05, "loss": 0.008, "step": 710360 }, { "epoch": 1.84, "learning_rate": 2.379277362026642e-05, "loss": 0.0069, "step": 710370 }, { "epoch": 1.84, "learning_rate": 2.3788885403894956e-05, "loss": 0.0078, "step": 710380 }, { "epoch": 1.84, "learning_rate": 2.378499718752349e-05, "loss": 0.0065, "step": 710390 }, { "epoch": 1.84, "learning_rate": 2.3781108971152023e-05, "loss": 0.0113, "step": 710400 }, { "epoch": 1.84, "learning_rate": 2.3777220754780557e-05, "loss": 0.0057, "step": 710410 }, { "epoch": 1.84, "learning_rate": 2.3773332538409096e-05, "loss": 0.0095, "step": 710420 }, { "epoch": 1.84, "learning_rate": 2.376944432203763e-05, "loss": 0.0105, "step": 710430 }, { "epoch": 1.84, "learning_rate": 2.3765556105666165e-05, "loss": 0.0067, "step": 710440 }, { "epoch": 1.84, "learning_rate": 2.37616678892947e-05, "loss": 0.0073, "step": 710450 }, { "epoch": 1.84, "learning_rate": 2.375777967292324e-05, "loss": 0.0067, "step": 710460 }, { "epoch": 1.84, "learning_rate": 2.3753891456551773e-05, "loss": 0.0091, "step": 710470 }, { "epoch": 1.84, "learning_rate": 2.3750003240180308e-05, "loss": 0.0107, "step": 710480 }, { "epoch": 1.84, "learning_rate": 2.3746115023808843e-05, "loss": 0.0103, "step": 710490 }, { "epoch": 1.84, "learning_rate": 2.374222680743738e-05, "loss": 0.0092, "step": 710500 }, { "epoch": 1.84, "learning_rate": 2.3738338591065916e-05, "loss": 0.0086, "step": 710510 }, { "epoch": 1.84, "learning_rate": 2.3734450374694448e-05, "loss": 0.0076, "step": 710520 }, { "epoch": 1.84, "learning_rate": 2.3730562158322983e-05, "loss": 0.0058, "step": 710530 }, { "epoch": 1.84, "learning_rate": 2.3726673941951517e-05, "loss": 0.008, "step": 710540 }, { "epoch": 1.84, "learning_rate": 2.3722785725580056e-05, "loss": 0.0084, "step": 710550 }, { "epoch": 1.84, "learning_rate": 2.371889750920859e-05, "loss": 0.0057, "step": 710560 }, { "epoch": 1.84, "learning_rate": 2.3715009292837125e-05, "loss": 0.0051, "step": 710570 }, { "epoch": 1.84, "learning_rate": 2.371112107646566e-05, "loss": 0.0079, "step": 710580 }, { "epoch": 1.84, "learning_rate": 2.37072328600942e-05, "loss": 0.0044, "step": 710590 }, { "epoch": 1.84, "learning_rate": 2.3703344643722733e-05, "loss": 0.0083, "step": 710600 }, { "epoch": 1.84, "learning_rate": 2.3699456427351268e-05, "loss": 0.0058, "step": 710610 }, { "epoch": 1.84, "learning_rate": 2.3695568210979803e-05, "loss": 0.0077, "step": 710620 }, { "epoch": 1.84, "learning_rate": 2.369167999460834e-05, "loss": 0.0087, "step": 710630 }, { "epoch": 1.84, "learning_rate": 2.3687791778236873e-05, "loss": 0.0056, "step": 710640 }, { "epoch": 1.84, "learning_rate": 2.3683903561865408e-05, "loss": 0.006, "step": 710650 }, { "epoch": 1.84, "learning_rate": 2.3680015345493943e-05, "loss": 0.0076, "step": 710660 }, { "epoch": 1.84, "learning_rate": 2.3676127129122477e-05, "loss": 0.0069, "step": 710670 }, { "epoch": 1.84, "learning_rate": 2.3672238912751016e-05, "loss": 0.0094, "step": 710680 }, { "epoch": 1.84, "learning_rate": 2.366835069637955e-05, "loss": 0.0087, "step": 710690 }, { "epoch": 1.84, "learning_rate": 2.3664462480008085e-05, "loss": 0.0077, "step": 710700 }, { "epoch": 1.84, "learning_rate": 2.366057426363662e-05, "loss": 0.0076, "step": 710710 }, { "epoch": 1.84, "learning_rate": 2.3656686047265155e-05, "loss": 0.0104, "step": 710720 }, { "epoch": 1.84, "learning_rate": 2.3652797830893693e-05, "loss": 0.0104, "step": 710730 }, { "epoch": 1.84, "learning_rate": 2.3648909614522228e-05, "loss": 0.0076, "step": 710740 }, { "epoch": 1.84, "learning_rate": 2.3645021398150763e-05, "loss": 0.0078, "step": 710750 }, { "epoch": 1.84, "learning_rate": 2.3641133181779298e-05, "loss": 0.0089, "step": 710760 }, { "epoch": 1.84, "learning_rate": 2.363724496540783e-05, "loss": 0.009, "step": 710770 }, { "epoch": 1.84, "learning_rate": 2.3633356749036368e-05, "loss": 0.0112, "step": 710780 }, { "epoch": 1.84, "learning_rate": 2.3629468532664903e-05, "loss": 0.0074, "step": 710790 }, { "epoch": 1.84, "learning_rate": 2.3625580316293437e-05, "loss": 0.0048, "step": 710800 }, { "epoch": 1.84, "learning_rate": 2.3621692099921972e-05, "loss": 0.0061, "step": 710810 }, { "epoch": 1.84, "learning_rate": 2.361780388355051e-05, "loss": 0.0081, "step": 710820 }, { "epoch": 1.84, "learning_rate": 2.3613915667179045e-05, "loss": 0.0094, "step": 710830 }, { "epoch": 1.84, "learning_rate": 2.361002745080758e-05, "loss": 0.009, "step": 710840 }, { "epoch": 1.84, "learning_rate": 2.3606139234436115e-05, "loss": 0.0064, "step": 710850 }, { "epoch": 1.84, "learning_rate": 2.3602251018064653e-05, "loss": 0.0091, "step": 710860 }, { "epoch": 1.84, "learning_rate": 2.3598362801693188e-05, "loss": 0.0089, "step": 710870 }, { "epoch": 1.84, "learning_rate": 2.3594474585321723e-05, "loss": 0.0061, "step": 710880 }, { "epoch": 1.84, "learning_rate": 2.3590586368950255e-05, "loss": 0.0071, "step": 710890 }, { "epoch": 1.84, "learning_rate": 2.358669815257879e-05, "loss": 0.0083, "step": 710900 }, { "epoch": 1.84, "learning_rate": 2.3582809936207328e-05, "loss": 0.0081, "step": 710910 }, { "epoch": 1.84, "learning_rate": 2.3578921719835862e-05, "loss": 0.0064, "step": 710920 }, { "epoch": 1.84, "learning_rate": 2.3575033503464397e-05, "loss": 0.0078, "step": 710930 }, { "epoch": 1.84, "learning_rate": 2.3571145287092932e-05, "loss": 0.0094, "step": 710940 }, { "epoch": 1.84, "learning_rate": 2.356725707072147e-05, "loss": 0.0088, "step": 710950 }, { "epoch": 1.84, "learning_rate": 2.3563368854350005e-05, "loss": 0.0055, "step": 710960 }, { "epoch": 1.84, "learning_rate": 2.355948063797854e-05, "loss": 0.0094, "step": 710970 }, { "epoch": 1.84, "learning_rate": 2.3555592421607075e-05, "loss": 0.0063, "step": 710980 }, { "epoch": 1.84, "learning_rate": 2.3551704205235613e-05, "loss": 0.0046, "step": 710990 }, { "epoch": 1.84, "learning_rate": 2.3547815988864148e-05, "loss": 0.0083, "step": 711000 }, { "epoch": 1.84, "eval_cer": 0.8816634964890108, "eval_loss": 0.004514896310865879, "eval_runtime": 107.7072, "eval_samples_per_second": 18.569, "eval_steps_per_second": 4.642, "step": 711000 }, { "epoch": 1.84, "learning_rate": 2.3543927772492683e-05, "loss": 0.0106, "step": 711010 }, { "epoch": 1.84, "learning_rate": 2.3540039556121214e-05, "loss": 0.007, "step": 711020 }, { "epoch": 1.84, "learning_rate": 2.353615133974975e-05, "loss": 0.0063, "step": 711030 }, { "epoch": 1.84, "learning_rate": 2.3532263123378288e-05, "loss": 0.0073, "step": 711040 }, { "epoch": 1.84, "learning_rate": 2.3528374907006822e-05, "loss": 0.0051, "step": 711050 }, { "epoch": 1.84, "learning_rate": 2.3524486690635357e-05, "loss": 0.0124, "step": 711060 }, { "epoch": 1.84, "learning_rate": 2.3520598474263892e-05, "loss": 0.0062, "step": 711070 }, { "epoch": 1.84, "learning_rate": 2.351671025789243e-05, "loss": 0.0071, "step": 711080 }, { "epoch": 1.84, "learning_rate": 2.3512822041520965e-05, "loss": 0.0062, "step": 711090 }, { "epoch": 1.84, "learning_rate": 2.35089338251495e-05, "loss": 0.0079, "step": 711100 }, { "epoch": 1.84, "learning_rate": 2.3505045608778035e-05, "loss": 0.0075, "step": 711110 }, { "epoch": 1.84, "learning_rate": 2.3501157392406573e-05, "loss": 0.0089, "step": 711120 }, { "epoch": 1.84, "learning_rate": 2.3497269176035108e-05, "loss": 0.0077, "step": 711130 }, { "epoch": 1.84, "learning_rate": 2.349338095966364e-05, "loss": 0.0072, "step": 711140 }, { "epoch": 1.84, "learning_rate": 2.3489492743292174e-05, "loss": 0.008, "step": 711150 }, { "epoch": 1.84, "learning_rate": 2.348560452692071e-05, "loss": 0.008, "step": 711160 }, { "epoch": 1.84, "learning_rate": 2.3481716310549248e-05, "loss": 0.0057, "step": 711170 }, { "epoch": 1.84, "learning_rate": 2.3477828094177782e-05, "loss": 0.0075, "step": 711180 }, { "epoch": 1.84, "learning_rate": 2.3473939877806317e-05, "loss": 0.0069, "step": 711190 }, { "epoch": 1.84, "learning_rate": 2.3470051661434852e-05, "loss": 0.0062, "step": 711200 }, { "epoch": 1.84, "learning_rate": 2.346616344506339e-05, "loss": 0.0068, "step": 711210 }, { "epoch": 1.84, "learning_rate": 2.3462275228691925e-05, "loss": 0.0109, "step": 711220 }, { "epoch": 1.84, "learning_rate": 2.345838701232046e-05, "loss": 0.0063, "step": 711230 }, { "epoch": 1.84, "learning_rate": 2.3454498795948995e-05, "loss": 0.0072, "step": 711240 }, { "epoch": 1.84, "learning_rate": 2.3450610579577533e-05, "loss": 0.0087, "step": 711250 }, { "epoch": 1.84, "learning_rate": 2.3446722363206065e-05, "loss": 0.0054, "step": 711260 }, { "epoch": 1.84, "learning_rate": 2.34428341468346e-05, "loss": 0.0053, "step": 711270 }, { "epoch": 1.84, "learning_rate": 2.3438945930463134e-05, "loss": 0.0098, "step": 711280 }, { "epoch": 1.84, "learning_rate": 2.343505771409167e-05, "loss": 0.0077, "step": 711290 }, { "epoch": 1.84, "learning_rate": 2.3431169497720208e-05, "loss": 0.0077, "step": 711300 }, { "epoch": 1.84, "learning_rate": 2.3427281281348742e-05, "loss": 0.0072, "step": 711310 }, { "epoch": 1.84, "learning_rate": 2.3423393064977277e-05, "loss": 0.0089, "step": 711320 }, { "epoch": 1.84, "learning_rate": 2.3419504848605812e-05, "loss": 0.0065, "step": 711330 }, { "epoch": 1.84, "learning_rate": 2.341561663223435e-05, "loss": 0.0084, "step": 711340 }, { "epoch": 1.84, "learning_rate": 2.3411728415862885e-05, "loss": 0.007, "step": 711350 }, { "epoch": 1.84, "learning_rate": 2.340784019949142e-05, "loss": 0.0073, "step": 711360 }, { "epoch": 1.84, "learning_rate": 2.3403951983119955e-05, "loss": 0.0099, "step": 711370 }, { "epoch": 1.84, "learning_rate": 2.3400063766748493e-05, "loss": 0.006, "step": 711380 }, { "epoch": 1.84, "learning_rate": 2.3396175550377025e-05, "loss": 0.0089, "step": 711390 }, { "epoch": 1.84, "learning_rate": 2.339228733400556e-05, "loss": 0.0106, "step": 711400 }, { "epoch": 1.84, "learning_rate": 2.3388399117634094e-05, "loss": 0.0085, "step": 711410 }, { "epoch": 1.84, "learning_rate": 2.338451090126263e-05, "loss": 0.0114, "step": 711420 }, { "epoch": 1.84, "learning_rate": 2.3380622684891168e-05, "loss": 0.0072, "step": 711430 }, { "epoch": 1.84, "learning_rate": 2.3376734468519702e-05, "loss": 0.0061, "step": 711440 }, { "epoch": 1.84, "learning_rate": 2.3372846252148237e-05, "loss": 0.0078, "step": 711450 }, { "epoch": 1.84, "learning_rate": 2.3368958035776772e-05, "loss": 0.0059, "step": 711460 }, { "epoch": 1.84, "learning_rate": 2.336506981940531e-05, "loss": 0.009, "step": 711470 }, { "epoch": 1.84, "learning_rate": 2.3361181603033845e-05, "loss": 0.0084, "step": 711480 }, { "epoch": 1.84, "learning_rate": 2.335729338666238e-05, "loss": 0.0074, "step": 711490 }, { "epoch": 1.84, "learning_rate": 2.3353405170290915e-05, "loss": 0.0086, "step": 711500 }, { "epoch": 1.84, "learning_rate": 2.3349516953919446e-05, "loss": 0.0058, "step": 711510 }, { "epoch": 1.84, "learning_rate": 2.3345628737547985e-05, "loss": 0.0075, "step": 711520 }, { "epoch": 1.84, "learning_rate": 2.334174052117652e-05, "loss": 0.0063, "step": 711530 }, { "epoch": 1.84, "learning_rate": 2.3337852304805054e-05, "loss": 0.0091, "step": 711540 }, { "epoch": 1.84, "learning_rate": 2.333396408843359e-05, "loss": 0.0065, "step": 711550 }, { "epoch": 1.84, "learning_rate": 2.3330075872062128e-05, "loss": 0.0064, "step": 711560 }, { "epoch": 1.84, "learning_rate": 2.3326187655690662e-05, "loss": 0.0078, "step": 711570 }, { "epoch": 1.84, "learning_rate": 2.3322299439319197e-05, "loss": 0.0093, "step": 711580 }, { "epoch": 1.84, "learning_rate": 2.3318411222947732e-05, "loss": 0.01, "step": 711590 }, { "epoch": 1.84, "learning_rate": 2.331452300657627e-05, "loss": 0.0069, "step": 711600 }, { "epoch": 1.84, "learning_rate": 2.3310634790204805e-05, "loss": 0.0084, "step": 711610 }, { "epoch": 1.84, "learning_rate": 2.330674657383334e-05, "loss": 0.009, "step": 711620 }, { "epoch": 1.84, "learning_rate": 2.3302858357461875e-05, "loss": 0.0067, "step": 711630 }, { "epoch": 1.84, "learning_rate": 2.3298970141090406e-05, "loss": 0.0067, "step": 711640 }, { "epoch": 1.84, "learning_rate": 2.3295081924718945e-05, "loss": 0.0098, "step": 711650 }, { "epoch": 1.84, "learning_rate": 2.329119370834748e-05, "loss": 0.0078, "step": 711660 }, { "epoch": 1.84, "learning_rate": 2.3287305491976014e-05, "loss": 0.0082, "step": 711670 }, { "epoch": 1.84, "learning_rate": 2.328341727560455e-05, "loss": 0.0065, "step": 711680 }, { "epoch": 1.84, "learning_rate": 2.3279529059233087e-05, "loss": 0.0084, "step": 711690 }, { "epoch": 1.84, "learning_rate": 2.3275640842861622e-05, "loss": 0.0069, "step": 711700 }, { "epoch": 1.84, "learning_rate": 2.3271752626490157e-05, "loss": 0.0068, "step": 711710 }, { "epoch": 1.84, "learning_rate": 2.3267864410118692e-05, "loss": 0.0072, "step": 711720 }, { "epoch": 1.84, "learning_rate": 2.326397619374723e-05, "loss": 0.0068, "step": 711730 }, { "epoch": 1.84, "learning_rate": 2.3260087977375765e-05, "loss": 0.0085, "step": 711740 }, { "epoch": 1.84, "learning_rate": 2.32561997610043e-05, "loss": 0.0075, "step": 711750 }, { "epoch": 1.84, "learning_rate": 2.325231154463283e-05, "loss": 0.0055, "step": 711760 }, { "epoch": 1.85, "learning_rate": 2.3248423328261366e-05, "loss": 0.0093, "step": 711770 }, { "epoch": 1.85, "learning_rate": 2.3244535111889905e-05, "loss": 0.007, "step": 711780 }, { "epoch": 1.85, "learning_rate": 2.324064689551844e-05, "loss": 0.0075, "step": 711790 }, { "epoch": 1.85, "learning_rate": 2.3236758679146974e-05, "loss": 0.0103, "step": 711800 }, { "epoch": 1.85, "learning_rate": 2.323287046277551e-05, "loss": 0.0084, "step": 711810 }, { "epoch": 1.85, "learning_rate": 2.3228982246404047e-05, "loss": 0.0088, "step": 711820 }, { "epoch": 1.85, "learning_rate": 2.3225094030032582e-05, "loss": 0.007, "step": 711830 }, { "epoch": 1.85, "learning_rate": 2.3221205813661117e-05, "loss": 0.0077, "step": 711840 }, { "epoch": 1.85, "learning_rate": 2.3217317597289652e-05, "loss": 0.0083, "step": 711850 }, { "epoch": 1.85, "learning_rate": 2.321342938091819e-05, "loss": 0.0093, "step": 711860 }, { "epoch": 1.85, "learning_rate": 2.3209541164546725e-05, "loss": 0.0056, "step": 711870 }, { "epoch": 1.85, "learning_rate": 2.3205652948175257e-05, "loss": 0.0079, "step": 711880 }, { "epoch": 1.85, "learning_rate": 2.320176473180379e-05, "loss": 0.0066, "step": 711890 }, { "epoch": 1.85, "learning_rate": 2.3197876515432326e-05, "loss": 0.0077, "step": 711900 }, { "epoch": 1.85, "learning_rate": 2.3193988299060865e-05, "loss": 0.0074, "step": 711910 }, { "epoch": 1.85, "learning_rate": 2.31901000826894e-05, "loss": 0.0085, "step": 711920 }, { "epoch": 1.85, "learning_rate": 2.3186211866317934e-05, "loss": 0.0105, "step": 711930 }, { "epoch": 1.85, "learning_rate": 2.318232364994647e-05, "loss": 0.0075, "step": 711940 }, { "epoch": 1.85, "learning_rate": 2.3178435433575007e-05, "loss": 0.0054, "step": 711950 }, { "epoch": 1.85, "learning_rate": 2.3174547217203542e-05, "loss": 0.0112, "step": 711960 }, { "epoch": 1.85, "learning_rate": 2.3170659000832077e-05, "loss": 0.0094, "step": 711970 }, { "epoch": 1.85, "learning_rate": 2.3166770784460612e-05, "loss": 0.0096, "step": 711980 }, { "epoch": 1.85, "learning_rate": 2.316288256808915e-05, "loss": 0.0063, "step": 711990 }, { "epoch": 1.85, "learning_rate": 2.3158994351717685e-05, "loss": 0.0065, "step": 712000 }, { "epoch": 1.85, "eval_cer": 0.8816439015719323, "eval_loss": 0.004501926247030497, "eval_runtime": 107.8113, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 712000 }, { "epoch": 1.85, "learning_rate": 2.3155106135346217e-05, "loss": 0.0066, "step": 712010 }, { "epoch": 1.85, "learning_rate": 2.315121791897475e-05, "loss": 0.0074, "step": 712020 }, { "epoch": 1.85, "learning_rate": 2.3147329702603286e-05, "loss": 0.0054, "step": 712030 }, { "epoch": 1.85, "learning_rate": 2.3143441486231825e-05, "loss": 0.0085, "step": 712040 }, { "epoch": 1.85, "learning_rate": 2.313955326986036e-05, "loss": 0.0077, "step": 712050 }, { "epoch": 1.85, "learning_rate": 2.3135665053488894e-05, "loss": 0.0052, "step": 712060 }, { "epoch": 1.85, "learning_rate": 2.313177683711743e-05, "loss": 0.0068, "step": 712070 }, { "epoch": 1.85, "learning_rate": 2.3127888620745964e-05, "loss": 0.007, "step": 712080 }, { "epoch": 1.85, "learning_rate": 2.3124000404374502e-05, "loss": 0.0073, "step": 712090 }, { "epoch": 1.85, "learning_rate": 2.3120112188003037e-05, "loss": 0.0075, "step": 712100 }, { "epoch": 1.85, "learning_rate": 2.3116223971631572e-05, "loss": 0.0062, "step": 712110 }, { "epoch": 1.85, "learning_rate": 2.3112335755260107e-05, "loss": 0.0097, "step": 712120 }, { "epoch": 1.85, "learning_rate": 2.3108447538888642e-05, "loss": 0.0069, "step": 712130 }, { "epoch": 1.85, "learning_rate": 2.3104559322517177e-05, "loss": 0.0049, "step": 712140 }, { "epoch": 1.85, "learning_rate": 2.310067110614571e-05, "loss": 0.0068, "step": 712150 }, { "epoch": 1.85, "learning_rate": 2.3096782889774246e-05, "loss": 0.0075, "step": 712160 }, { "epoch": 1.85, "learning_rate": 2.309289467340278e-05, "loss": 0.0068, "step": 712170 }, { "epoch": 1.85, "learning_rate": 2.308900645703132e-05, "loss": 0.0082, "step": 712180 }, { "epoch": 1.85, "learning_rate": 2.3085118240659854e-05, "loss": 0.0074, "step": 712190 }, { "epoch": 1.85, "learning_rate": 2.308123002428839e-05, "loss": 0.0065, "step": 712200 }, { "epoch": 1.85, "learning_rate": 2.3077341807916924e-05, "loss": 0.0098, "step": 712210 }, { "epoch": 1.85, "learning_rate": 2.3073453591545462e-05, "loss": 0.0066, "step": 712220 }, { "epoch": 1.85, "learning_rate": 2.3069565375173997e-05, "loss": 0.0086, "step": 712230 }, { "epoch": 1.85, "learning_rate": 2.3065677158802532e-05, "loss": 0.0075, "step": 712240 }, { "epoch": 1.85, "learning_rate": 2.3061788942431067e-05, "loss": 0.0061, "step": 712250 }, { "epoch": 1.85, "learning_rate": 2.30579007260596e-05, "loss": 0.0062, "step": 712260 }, { "epoch": 1.85, "learning_rate": 2.3054012509688137e-05, "loss": 0.0081, "step": 712270 }, { "epoch": 1.85, "learning_rate": 2.305012429331667e-05, "loss": 0.0065, "step": 712280 }, { "epoch": 1.85, "learning_rate": 2.3046236076945206e-05, "loss": 0.0081, "step": 712290 }, { "epoch": 1.85, "learning_rate": 2.304234786057374e-05, "loss": 0.0064, "step": 712300 }, { "epoch": 1.85, "learning_rate": 2.303845964420228e-05, "loss": 0.0062, "step": 712310 }, { "epoch": 1.85, "learning_rate": 2.3034571427830814e-05, "loss": 0.0066, "step": 712320 }, { "epoch": 1.85, "learning_rate": 2.303068321145935e-05, "loss": 0.0082, "step": 712330 }, { "epoch": 1.85, "learning_rate": 2.3026794995087884e-05, "loss": 0.0079, "step": 712340 }, { "epoch": 1.85, "learning_rate": 2.3022906778716422e-05, "loss": 0.0086, "step": 712350 }, { "epoch": 1.85, "learning_rate": 2.3019018562344957e-05, "loss": 0.0064, "step": 712360 }, { "epoch": 1.85, "learning_rate": 2.3015130345973492e-05, "loss": 0.0085, "step": 712370 }, { "epoch": 1.85, "learning_rate": 2.3011242129602023e-05, "loss": 0.0068, "step": 712380 }, { "epoch": 1.85, "learning_rate": 2.3007353913230558e-05, "loss": 0.0094, "step": 712390 }, { "epoch": 1.85, "learning_rate": 2.3003465696859097e-05, "loss": 0.0062, "step": 712400 }, { "epoch": 1.85, "learning_rate": 2.299957748048763e-05, "loss": 0.0088, "step": 712410 }, { "epoch": 1.85, "learning_rate": 2.2995689264116166e-05, "loss": 0.0076, "step": 712420 }, { "epoch": 1.85, "learning_rate": 2.29918010477447e-05, "loss": 0.0099, "step": 712430 }, { "epoch": 1.85, "learning_rate": 2.298791283137324e-05, "loss": 0.0071, "step": 712440 }, { "epoch": 1.85, "learning_rate": 2.2984024615001774e-05, "loss": 0.0077, "step": 712450 }, { "epoch": 1.85, "learning_rate": 2.298013639863031e-05, "loss": 0.0083, "step": 712460 }, { "epoch": 1.85, "learning_rate": 2.2976248182258844e-05, "loss": 0.0067, "step": 712470 }, { "epoch": 1.85, "learning_rate": 2.2972359965887382e-05, "loss": 0.0055, "step": 712480 }, { "epoch": 1.85, "learning_rate": 2.2968471749515917e-05, "loss": 0.0059, "step": 712490 }, { "epoch": 1.85, "learning_rate": 2.2964583533144452e-05, "loss": 0.0064, "step": 712500 }, { "epoch": 1.85, "learning_rate": 2.2960695316772983e-05, "loss": 0.0056, "step": 712510 }, { "epoch": 1.85, "learning_rate": 2.2956807100401518e-05, "loss": 0.0099, "step": 712520 }, { "epoch": 1.85, "learning_rate": 2.2952918884030057e-05, "loss": 0.0069, "step": 712530 }, { "epoch": 1.85, "learning_rate": 2.294903066765859e-05, "loss": 0.007, "step": 712540 }, { "epoch": 1.85, "learning_rate": 2.2945142451287126e-05, "loss": 0.0069, "step": 712550 }, { "epoch": 1.85, "learning_rate": 2.294125423491566e-05, "loss": 0.0071, "step": 712560 }, { "epoch": 1.85, "learning_rate": 2.29373660185442e-05, "loss": 0.008, "step": 712570 }, { "epoch": 1.85, "learning_rate": 2.2933477802172734e-05, "loss": 0.0102, "step": 712580 }, { "epoch": 1.85, "learning_rate": 2.292958958580127e-05, "loss": 0.0068, "step": 712590 }, { "epoch": 1.85, "learning_rate": 2.2925701369429804e-05, "loss": 0.0062, "step": 712600 }, { "epoch": 1.85, "learning_rate": 2.2921813153058342e-05, "loss": 0.0099, "step": 712610 }, { "epoch": 1.85, "learning_rate": 2.2917924936686877e-05, "loss": 0.0088, "step": 712620 }, { "epoch": 1.85, "learning_rate": 2.291403672031541e-05, "loss": 0.0064, "step": 712630 }, { "epoch": 1.85, "learning_rate": 2.2910148503943943e-05, "loss": 0.0084, "step": 712640 }, { "epoch": 1.85, "learning_rate": 2.2906260287572478e-05, "loss": 0.0066, "step": 712650 }, { "epoch": 1.85, "learning_rate": 2.2902372071201016e-05, "loss": 0.012, "step": 712660 }, { "epoch": 1.85, "learning_rate": 2.289848385482955e-05, "loss": 0.0051, "step": 712670 }, { "epoch": 1.85, "learning_rate": 2.2894595638458086e-05, "loss": 0.0064, "step": 712680 }, { "epoch": 1.85, "learning_rate": 2.289070742208662e-05, "loss": 0.0072, "step": 712690 }, { "epoch": 1.85, "learning_rate": 2.288681920571516e-05, "loss": 0.0094, "step": 712700 }, { "epoch": 1.85, "learning_rate": 2.2882930989343694e-05, "loss": 0.0092, "step": 712710 }, { "epoch": 1.85, "learning_rate": 2.287904277297223e-05, "loss": 0.0056, "step": 712720 }, { "epoch": 1.85, "learning_rate": 2.2875154556600764e-05, "loss": 0.007, "step": 712730 }, { "epoch": 1.85, "learning_rate": 2.2871266340229302e-05, "loss": 0.0063, "step": 712740 }, { "epoch": 1.85, "learning_rate": 2.2867378123857834e-05, "loss": 0.0095, "step": 712750 }, { "epoch": 1.85, "learning_rate": 2.286348990748637e-05, "loss": 0.007, "step": 712760 }, { "epoch": 1.85, "learning_rate": 2.2859601691114903e-05, "loss": 0.006, "step": 712770 }, { "epoch": 1.85, "learning_rate": 2.2855713474743438e-05, "loss": 0.0094, "step": 712780 }, { "epoch": 1.85, "learning_rate": 2.2851825258371976e-05, "loss": 0.0077, "step": 712790 }, { "epoch": 1.85, "learning_rate": 2.284793704200051e-05, "loss": 0.008, "step": 712800 }, { "epoch": 1.85, "learning_rate": 2.2844048825629046e-05, "loss": 0.007, "step": 712810 }, { "epoch": 1.85, "learning_rate": 2.284016060925758e-05, "loss": 0.0083, "step": 712820 }, { "epoch": 1.85, "learning_rate": 2.283627239288612e-05, "loss": 0.0071, "step": 712830 }, { "epoch": 1.85, "learning_rate": 2.2832384176514654e-05, "loss": 0.0065, "step": 712840 }, { "epoch": 1.85, "learning_rate": 2.282849596014319e-05, "loss": 0.0065, "step": 712850 }, { "epoch": 1.85, "learning_rate": 2.2824607743771724e-05, "loss": 0.0092, "step": 712860 }, { "epoch": 1.85, "learning_rate": 2.2820719527400262e-05, "loss": 0.0108, "step": 712870 }, { "epoch": 1.85, "learning_rate": 2.2816831311028794e-05, "loss": 0.0075, "step": 712880 }, { "epoch": 1.85, "learning_rate": 2.281294309465733e-05, "loss": 0.0069, "step": 712890 }, { "epoch": 1.85, "learning_rate": 2.2809054878285863e-05, "loss": 0.0076, "step": 712900 }, { "epoch": 1.85, "learning_rate": 2.2805166661914398e-05, "loss": 0.0076, "step": 712910 }, { "epoch": 1.85, "learning_rate": 2.2801278445542936e-05, "loss": 0.0063, "step": 712920 }, { "epoch": 1.85, "learning_rate": 2.279739022917147e-05, "loss": 0.0087, "step": 712930 }, { "epoch": 1.85, "learning_rate": 2.2793502012800006e-05, "loss": 0.0053, "step": 712940 }, { "epoch": 1.85, "learning_rate": 2.278961379642854e-05, "loss": 0.0094, "step": 712950 }, { "epoch": 1.85, "learning_rate": 2.278572558005708e-05, "loss": 0.0082, "step": 712960 }, { "epoch": 1.85, "learning_rate": 2.2781837363685614e-05, "loss": 0.0058, "step": 712970 }, { "epoch": 1.85, "learning_rate": 2.277794914731415e-05, "loss": 0.0068, "step": 712980 }, { "epoch": 1.85, "learning_rate": 2.2774060930942684e-05, "loss": 0.0116, "step": 712990 }, { "epoch": 1.85, "learning_rate": 2.2770172714571215e-05, "loss": 0.0081, "step": 713000 }, { "epoch": 1.85, "eval_cer": 0.8816690950367475, "eval_loss": 0.004550943151116371, "eval_runtime": 107.8933, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 713000 }, { "epoch": 1.85, "learning_rate": 2.2766284498199754e-05, "loss": 0.0067, "step": 713010 }, { "epoch": 1.85, "learning_rate": 2.276239628182829e-05, "loss": 0.0072, "step": 713020 }, { "epoch": 1.85, "learning_rate": 2.2758508065456823e-05, "loss": 0.0065, "step": 713030 }, { "epoch": 1.85, "learning_rate": 2.2754619849085358e-05, "loss": 0.0049, "step": 713040 }, { "epoch": 1.85, "learning_rate": 2.2750731632713896e-05, "loss": 0.0079, "step": 713050 }, { "epoch": 1.85, "learning_rate": 2.274684341634243e-05, "loss": 0.007, "step": 713060 }, { "epoch": 1.85, "learning_rate": 2.2742955199970966e-05, "loss": 0.0062, "step": 713070 }, { "epoch": 1.85, "learning_rate": 2.27390669835995e-05, "loss": 0.0088, "step": 713080 }, { "epoch": 1.85, "learning_rate": 2.273517876722804e-05, "loss": 0.0064, "step": 713090 }, { "epoch": 1.85, "learning_rate": 2.2731290550856574e-05, "loss": 0.0067, "step": 713100 }, { "epoch": 1.85, "learning_rate": 2.272740233448511e-05, "loss": 0.0091, "step": 713110 }, { "epoch": 1.85, "learning_rate": 2.2723514118113644e-05, "loss": 0.0069, "step": 713120 }, { "epoch": 1.85, "learning_rate": 2.2719625901742175e-05, "loss": 0.0093, "step": 713130 }, { "epoch": 1.85, "learning_rate": 2.2715737685370714e-05, "loss": 0.0083, "step": 713140 }, { "epoch": 1.85, "learning_rate": 2.271184946899925e-05, "loss": 0.0104, "step": 713150 }, { "epoch": 1.85, "learning_rate": 2.2707961252627783e-05, "loss": 0.0066, "step": 713160 }, { "epoch": 1.85, "learning_rate": 2.2704073036256318e-05, "loss": 0.0068, "step": 713170 }, { "epoch": 1.85, "learning_rate": 2.2700184819884856e-05, "loss": 0.0077, "step": 713180 }, { "epoch": 1.85, "learning_rate": 2.269629660351339e-05, "loss": 0.0117, "step": 713190 }, { "epoch": 1.85, "learning_rate": 2.2692408387141926e-05, "loss": 0.0079, "step": 713200 }, { "epoch": 1.85, "learning_rate": 2.268852017077046e-05, "loss": 0.0091, "step": 713210 }, { "epoch": 1.85, "learning_rate": 2.2684631954399e-05, "loss": 0.0074, "step": 713220 }, { "epoch": 1.85, "learning_rate": 2.2680743738027534e-05, "loss": 0.0065, "step": 713230 }, { "epoch": 1.85, "learning_rate": 2.267685552165607e-05, "loss": 0.0069, "step": 713240 }, { "epoch": 1.85, "learning_rate": 2.26729673052846e-05, "loss": 0.0077, "step": 713250 }, { "epoch": 1.85, "learning_rate": 2.2669079088913135e-05, "loss": 0.0081, "step": 713260 }, { "epoch": 1.85, "learning_rate": 2.2665190872541674e-05, "loss": 0.0088, "step": 713270 }, { "epoch": 1.85, "learning_rate": 2.266130265617021e-05, "loss": 0.0115, "step": 713280 }, { "epoch": 1.85, "learning_rate": 2.2657414439798743e-05, "loss": 0.0078, "step": 713290 }, { "epoch": 1.85, "learning_rate": 2.2653526223427278e-05, "loss": 0.0058, "step": 713300 }, { "epoch": 1.85, "learning_rate": 2.2649638007055816e-05, "loss": 0.009, "step": 713310 }, { "epoch": 1.85, "learning_rate": 2.264574979068435e-05, "loss": 0.0063, "step": 713320 }, { "epoch": 1.85, "learning_rate": 2.2641861574312886e-05, "loss": 0.0082, "step": 713330 }, { "epoch": 1.85, "learning_rate": 2.263797335794142e-05, "loss": 0.0075, "step": 713340 }, { "epoch": 1.85, "learning_rate": 2.263408514156996e-05, "loss": 0.0077, "step": 713350 }, { "epoch": 1.85, "learning_rate": 2.2630196925198494e-05, "loss": 0.0064, "step": 713360 }, { "epoch": 1.85, "learning_rate": 2.2626308708827026e-05, "loss": 0.0074, "step": 713370 }, { "epoch": 1.85, "learning_rate": 2.262242049245556e-05, "loss": 0.0114, "step": 713380 }, { "epoch": 1.85, "learning_rate": 2.2618532276084095e-05, "loss": 0.0079, "step": 713390 }, { "epoch": 1.85, "learning_rate": 2.2614644059712634e-05, "loss": 0.0074, "step": 713400 }, { "epoch": 1.85, "learning_rate": 2.261075584334117e-05, "loss": 0.01, "step": 713410 }, { "epoch": 1.85, "learning_rate": 2.2606867626969703e-05, "loss": 0.0088, "step": 713420 }, { "epoch": 1.85, "learning_rate": 2.2602979410598238e-05, "loss": 0.0062, "step": 713430 }, { "epoch": 1.85, "learning_rate": 2.2599091194226776e-05, "loss": 0.0062, "step": 713440 }, { "epoch": 1.85, "learning_rate": 2.259520297785531e-05, "loss": 0.008, "step": 713450 }, { "epoch": 1.85, "learning_rate": 2.2591314761483846e-05, "loss": 0.0087, "step": 713460 }, { "epoch": 1.85, "learning_rate": 2.258742654511238e-05, "loss": 0.0062, "step": 713470 }, { "epoch": 1.85, "learning_rate": 2.2583538328740916e-05, "loss": 0.0069, "step": 713480 }, { "epoch": 1.85, "learning_rate": 2.2579650112369454e-05, "loss": 0.0105, "step": 713490 }, { "epoch": 1.85, "learning_rate": 2.2575761895997986e-05, "loss": 0.0087, "step": 713500 }, { "epoch": 1.85, "learning_rate": 2.257187367962652e-05, "loss": 0.0059, "step": 713510 }, { "epoch": 1.85, "learning_rate": 2.2567985463255055e-05, "loss": 0.0066, "step": 713520 }, { "epoch": 1.85, "learning_rate": 2.256409724688359e-05, "loss": 0.01, "step": 713530 }, { "epoch": 1.85, "learning_rate": 2.256020903051213e-05, "loss": 0.0055, "step": 713540 }, { "epoch": 1.85, "learning_rate": 2.2556320814140663e-05, "loss": 0.0063, "step": 713550 }, { "epoch": 1.85, "learning_rate": 2.2552432597769198e-05, "loss": 0.0063, "step": 713560 }, { "epoch": 1.85, "learning_rate": 2.2548544381397733e-05, "loss": 0.0083, "step": 713570 }, { "epoch": 1.85, "learning_rate": 2.254465616502627e-05, "loss": 0.0059, "step": 713580 }, { "epoch": 1.85, "learning_rate": 2.2540767948654806e-05, "loss": 0.0059, "step": 713590 }, { "epoch": 1.85, "learning_rate": 2.253687973228334e-05, "loss": 0.0069, "step": 713600 }, { "epoch": 1.85, "learning_rate": 2.2532991515911876e-05, "loss": 0.0067, "step": 713610 }, { "epoch": 1.85, "learning_rate": 2.2529103299540407e-05, "loss": 0.0068, "step": 713620 }, { "epoch": 1.85, "learning_rate": 2.2525215083168945e-05, "loss": 0.0087, "step": 713630 }, { "epoch": 1.85, "learning_rate": 2.252132686679748e-05, "loss": 0.0083, "step": 713640 }, { "epoch": 1.85, "learning_rate": 2.2517438650426015e-05, "loss": 0.0058, "step": 713650 }, { "epoch": 1.85, "learning_rate": 2.251355043405455e-05, "loss": 0.0085, "step": 713660 }, { "epoch": 1.85, "learning_rate": 2.250966221768309e-05, "loss": 0.0056, "step": 713670 }, { "epoch": 1.85, "learning_rate": 2.2505774001311623e-05, "loss": 0.0071, "step": 713680 }, { "epoch": 1.85, "learning_rate": 2.2501885784940158e-05, "loss": 0.0083, "step": 713690 }, { "epoch": 1.85, "learning_rate": 2.2497997568568693e-05, "loss": 0.008, "step": 713700 }, { "epoch": 1.85, "learning_rate": 2.249410935219723e-05, "loss": 0.0078, "step": 713710 }, { "epoch": 1.85, "learning_rate": 2.2490221135825766e-05, "loss": 0.0051, "step": 713720 }, { "epoch": 1.85, "learning_rate": 2.24863329194543e-05, "loss": 0.0056, "step": 713730 }, { "epoch": 1.85, "learning_rate": 2.2482444703082836e-05, "loss": 0.0052, "step": 713740 }, { "epoch": 1.85, "learning_rate": 2.2478556486711367e-05, "loss": 0.0061, "step": 713750 }, { "epoch": 1.85, "learning_rate": 2.2474668270339905e-05, "loss": 0.0059, "step": 713760 }, { "epoch": 1.85, "learning_rate": 2.247078005396844e-05, "loss": 0.0052, "step": 713770 }, { "epoch": 1.85, "learning_rate": 2.2466891837596975e-05, "loss": 0.0078, "step": 713780 }, { "epoch": 1.85, "learning_rate": 2.246300362122551e-05, "loss": 0.0081, "step": 713790 }, { "epoch": 1.85, "learning_rate": 2.2459115404854048e-05, "loss": 0.0107, "step": 713800 }, { "epoch": 1.85, "learning_rate": 2.2455227188482583e-05, "loss": 0.0088, "step": 713810 }, { "epoch": 1.85, "learning_rate": 2.2451338972111118e-05, "loss": 0.0066, "step": 713820 }, { "epoch": 1.85, "learning_rate": 2.2447450755739653e-05, "loss": 0.0062, "step": 713830 }, { "epoch": 1.85, "learning_rate": 2.244356253936819e-05, "loss": 0.0088, "step": 713840 }, { "epoch": 1.85, "learning_rate": 2.2439674322996726e-05, "loss": 0.006, "step": 713850 }, { "epoch": 1.85, "learning_rate": 2.243578610662526e-05, "loss": 0.0067, "step": 713860 }, { "epoch": 1.85, "learning_rate": 2.2431897890253792e-05, "loss": 0.0098, "step": 713870 }, { "epoch": 1.85, "learning_rate": 2.2428009673882327e-05, "loss": 0.007, "step": 713880 }, { "epoch": 1.85, "learning_rate": 2.2424121457510865e-05, "loss": 0.0065, "step": 713890 }, { "epoch": 1.85, "learning_rate": 2.24202332411394e-05, "loss": 0.0074, "step": 713900 }, { "epoch": 1.85, "learning_rate": 2.2416345024767935e-05, "loss": 0.0085, "step": 713910 }, { "epoch": 1.85, "learning_rate": 2.241245680839647e-05, "loss": 0.0073, "step": 713920 }, { "epoch": 1.85, "learning_rate": 2.2408568592025008e-05, "loss": 0.0065, "step": 713930 }, { "epoch": 1.85, "learning_rate": 2.2404680375653543e-05, "loss": 0.005, "step": 713940 }, { "epoch": 1.85, "learning_rate": 2.2400792159282078e-05, "loss": 0.0058, "step": 713950 }, { "epoch": 1.85, "learning_rate": 2.2396903942910613e-05, "loss": 0.0087, "step": 713960 }, { "epoch": 1.85, "learning_rate": 2.239301572653915e-05, "loss": 0.0071, "step": 713970 }, { "epoch": 1.85, "learning_rate": 2.2389127510167686e-05, "loss": 0.0058, "step": 713980 }, { "epoch": 1.85, "learning_rate": 2.2385239293796217e-05, "loss": 0.0098, "step": 713990 }, { "epoch": 1.85, "learning_rate": 2.2381351077424752e-05, "loss": 0.006, "step": 714000 }, { "epoch": 1.85, "eval_cer": 0.8816746935844841, "eval_loss": 0.004546701442450285, "eval_runtime": 107.8645, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 714000 }, { "epoch": 1.85, "learning_rate": 2.2377462861053287e-05, "loss": 0.0107, "step": 714010 }, { "epoch": 1.85, "learning_rate": 2.2373574644681825e-05, "loss": 0.0077, "step": 714020 }, { "epoch": 1.85, "learning_rate": 2.236968642831036e-05, "loss": 0.0079, "step": 714030 }, { "epoch": 1.85, "learning_rate": 2.2365798211938895e-05, "loss": 0.007, "step": 714040 }, { "epoch": 1.85, "learning_rate": 2.236190999556743e-05, "loss": 0.007, "step": 714050 }, { "epoch": 1.85, "learning_rate": 2.2358021779195968e-05, "loss": 0.007, "step": 714060 }, { "epoch": 1.85, "learning_rate": 2.2354133562824503e-05, "loss": 0.0069, "step": 714070 }, { "epoch": 1.85, "learning_rate": 2.2350245346453038e-05, "loss": 0.0082, "step": 714080 }, { "epoch": 1.85, "learning_rate": 2.2346357130081573e-05, "loss": 0.0081, "step": 714090 }, { "epoch": 1.85, "learning_rate": 2.234246891371011e-05, "loss": 0.0072, "step": 714100 }, { "epoch": 1.85, "learning_rate": 2.2338580697338646e-05, "loss": 0.007, "step": 714110 }, { "epoch": 1.85, "learning_rate": 2.2334692480967177e-05, "loss": 0.0086, "step": 714120 }, { "epoch": 1.85, "learning_rate": 2.2330804264595712e-05, "loss": 0.0059, "step": 714130 }, { "epoch": 1.85, "learning_rate": 2.2326916048224247e-05, "loss": 0.0069, "step": 714140 }, { "epoch": 1.85, "learning_rate": 2.2323027831852785e-05, "loss": 0.0092, "step": 714150 }, { "epoch": 1.85, "learning_rate": 2.231913961548132e-05, "loss": 0.0078, "step": 714160 }, { "epoch": 1.85, "learning_rate": 2.2315251399109855e-05, "loss": 0.0061, "step": 714170 }, { "epoch": 1.85, "learning_rate": 2.231136318273839e-05, "loss": 0.0059, "step": 714180 }, { "epoch": 1.85, "learning_rate": 2.2307474966366928e-05, "loss": 0.0078, "step": 714190 }, { "epoch": 1.85, "learning_rate": 2.2303586749995463e-05, "loss": 0.0077, "step": 714200 }, { "epoch": 1.85, "learning_rate": 2.2299698533623998e-05, "loss": 0.0066, "step": 714210 }, { "epoch": 1.85, "learning_rate": 2.2295810317252533e-05, "loss": 0.0088, "step": 714220 }, { "epoch": 1.85, "learning_rate": 2.229192210088107e-05, "loss": 0.0066, "step": 714230 }, { "epoch": 1.85, "learning_rate": 2.2288033884509603e-05, "loss": 0.0089, "step": 714240 }, { "epoch": 1.85, "learning_rate": 2.2284145668138137e-05, "loss": 0.0079, "step": 714250 }, { "epoch": 1.85, "learning_rate": 2.2280257451766672e-05, "loss": 0.0091, "step": 714260 }, { "epoch": 1.85, "learning_rate": 2.2276369235395207e-05, "loss": 0.0086, "step": 714270 }, { "epoch": 1.85, "learning_rate": 2.2272481019023745e-05, "loss": 0.0086, "step": 714280 }, { "epoch": 1.85, "learning_rate": 2.226859280265228e-05, "loss": 0.0061, "step": 714290 }, { "epoch": 1.85, "learning_rate": 2.2264704586280815e-05, "loss": 0.0082, "step": 714300 }, { "epoch": 1.85, "learning_rate": 2.226081636990935e-05, "loss": 0.009, "step": 714310 }, { "epoch": 1.85, "learning_rate": 2.2256928153537888e-05, "loss": 0.0139, "step": 714320 }, { "epoch": 1.85, "learning_rate": 2.2253039937166423e-05, "loss": 0.0069, "step": 714330 }, { "epoch": 1.85, "learning_rate": 2.2249151720794958e-05, "loss": 0.0057, "step": 714340 }, { "epoch": 1.85, "learning_rate": 2.2245263504423493e-05, "loss": 0.0068, "step": 714350 }, { "epoch": 1.85, "learning_rate": 2.224137528805203e-05, "loss": 0.0067, "step": 714360 }, { "epoch": 1.85, "learning_rate": 2.2237487071680563e-05, "loss": 0.0086, "step": 714370 }, { "epoch": 1.85, "learning_rate": 2.2233598855309097e-05, "loss": 0.0072, "step": 714380 }, { "epoch": 1.85, "learning_rate": 2.2229710638937632e-05, "loss": 0.0049, "step": 714390 }, { "epoch": 1.85, "learning_rate": 2.2225822422566167e-05, "loss": 0.0088, "step": 714400 }, { "epoch": 1.85, "learning_rate": 2.2221934206194705e-05, "loss": 0.0063, "step": 714410 }, { "epoch": 1.85, "learning_rate": 2.221804598982324e-05, "loss": 0.0073, "step": 714420 }, { "epoch": 1.85, "learning_rate": 2.2214157773451775e-05, "loss": 0.0086, "step": 714430 }, { "epoch": 1.85, "learning_rate": 2.221026955708031e-05, "loss": 0.0061, "step": 714440 }, { "epoch": 1.85, "learning_rate": 2.2206381340708848e-05, "loss": 0.0098, "step": 714450 }, { "epoch": 1.85, "learning_rate": 2.2202493124337383e-05, "loss": 0.0093, "step": 714460 }, { "epoch": 1.85, "learning_rate": 2.2198604907965918e-05, "loss": 0.0076, "step": 714470 }, { "epoch": 1.85, "learning_rate": 2.2194716691594453e-05, "loss": 0.0087, "step": 714480 }, { "epoch": 1.85, "learning_rate": 2.2190828475222984e-05, "loss": 0.0074, "step": 714490 }, { "epoch": 1.85, "learning_rate": 2.2186940258851522e-05, "loss": 0.0054, "step": 714500 }, { "epoch": 1.85, "learning_rate": 2.2183052042480057e-05, "loss": 0.006, "step": 714510 }, { "epoch": 1.85, "learning_rate": 2.2179163826108592e-05, "loss": 0.0064, "step": 714520 }, { "epoch": 1.85, "learning_rate": 2.2175275609737127e-05, "loss": 0.0067, "step": 714530 }, { "epoch": 1.85, "learning_rate": 2.2171387393365665e-05, "loss": 0.009, "step": 714540 }, { "epoch": 1.85, "learning_rate": 2.21674991769942e-05, "loss": 0.0053, "step": 714550 }, { "epoch": 1.85, "learning_rate": 2.2163610960622735e-05, "loss": 0.0096, "step": 714560 }, { "epoch": 1.85, "learning_rate": 2.215972274425127e-05, "loss": 0.0078, "step": 714570 }, { "epoch": 1.85, "learning_rate": 2.2155834527879808e-05, "loss": 0.0045, "step": 714580 }, { "epoch": 1.85, "learning_rate": 2.2151946311508343e-05, "loss": 0.0065, "step": 714590 }, { "epoch": 1.85, "learning_rate": 2.2148058095136878e-05, "loss": 0.0075, "step": 714600 }, { "epoch": 1.85, "learning_rate": 2.214416987876541e-05, "loss": 0.0068, "step": 714610 }, { "epoch": 1.85, "learning_rate": 2.2140281662393944e-05, "loss": 0.0073, "step": 714620 }, { "epoch": 1.85, "learning_rate": 2.2136393446022482e-05, "loss": 0.0086, "step": 714630 }, { "epoch": 1.85, "learning_rate": 2.2132505229651017e-05, "loss": 0.0077, "step": 714640 }, { "epoch": 1.85, "learning_rate": 2.2128617013279552e-05, "loss": 0.0075, "step": 714650 }, { "epoch": 1.85, "learning_rate": 2.2124728796908087e-05, "loss": 0.007, "step": 714660 }, { "epoch": 1.85, "learning_rate": 2.2120840580536625e-05, "loss": 0.0074, "step": 714670 }, { "epoch": 1.85, "learning_rate": 2.211695236416516e-05, "loss": 0.0065, "step": 714680 }, { "epoch": 1.85, "learning_rate": 2.2113064147793695e-05, "loss": 0.0078, "step": 714690 }, { "epoch": 1.85, "learning_rate": 2.210917593142223e-05, "loss": 0.0064, "step": 714700 }, { "epoch": 1.85, "learning_rate": 2.2105287715050768e-05, "loss": 0.0069, "step": 714710 }, { "epoch": 1.85, "learning_rate": 2.2101399498679303e-05, "loss": 0.0069, "step": 714720 }, { "epoch": 1.85, "learning_rate": 2.2097511282307838e-05, "loss": 0.0078, "step": 714730 }, { "epoch": 1.85, "learning_rate": 2.209362306593637e-05, "loss": 0.0072, "step": 714740 }, { "epoch": 1.85, "learning_rate": 2.2089734849564904e-05, "loss": 0.0059, "step": 714750 }, { "epoch": 1.85, "learning_rate": 2.2085846633193442e-05, "loss": 0.0115, "step": 714760 }, { "epoch": 1.85, "learning_rate": 2.2081958416821977e-05, "loss": 0.0086, "step": 714770 }, { "epoch": 1.85, "learning_rate": 2.2078070200450512e-05, "loss": 0.0062, "step": 714780 }, { "epoch": 1.85, "learning_rate": 2.2074181984079047e-05, "loss": 0.0063, "step": 714790 }, { "epoch": 1.85, "learning_rate": 2.2070293767707585e-05, "loss": 0.0053, "step": 714800 }, { "epoch": 1.85, "learning_rate": 2.206640555133612e-05, "loss": 0.0071, "step": 714810 }, { "epoch": 1.85, "learning_rate": 2.2062517334964655e-05, "loss": 0.0075, "step": 714820 }, { "epoch": 1.85, "learning_rate": 2.205862911859319e-05, "loss": 0.0083, "step": 714830 }, { "epoch": 1.85, "learning_rate": 2.2054740902221725e-05, "loss": 0.013, "step": 714840 }, { "epoch": 1.85, "learning_rate": 2.2050852685850263e-05, "loss": 0.0063, "step": 714850 }, { "epoch": 1.85, "learning_rate": 2.2046964469478794e-05, "loss": 0.0061, "step": 714860 }, { "epoch": 1.85, "learning_rate": 2.204307625310733e-05, "loss": 0.0063, "step": 714870 }, { "epoch": 1.85, "learning_rate": 2.2039188036735864e-05, "loss": 0.0076, "step": 714880 }, { "epoch": 1.85, "learning_rate": 2.2035299820364402e-05, "loss": 0.0087, "step": 714890 }, { "epoch": 1.85, "learning_rate": 2.2031411603992937e-05, "loss": 0.0078, "step": 714900 }, { "epoch": 1.85, "learning_rate": 2.2027523387621472e-05, "loss": 0.0096, "step": 714910 }, { "epoch": 1.85, "learning_rate": 2.2023635171250007e-05, "loss": 0.0077, "step": 714920 }, { "epoch": 1.85, "learning_rate": 2.2019746954878542e-05, "loss": 0.0069, "step": 714930 }, { "epoch": 1.85, "learning_rate": 2.201585873850708e-05, "loss": 0.0113, "step": 714940 }, { "epoch": 1.85, "learning_rate": 2.2011970522135615e-05, "loss": 0.0115, "step": 714950 }, { "epoch": 1.85, "learning_rate": 2.200808230576415e-05, "loss": 0.0065, "step": 714960 }, { "epoch": 1.85, "learning_rate": 2.2004194089392685e-05, "loss": 0.008, "step": 714970 }, { "epoch": 1.85, "learning_rate": 2.2000305873021223e-05, "loss": 0.0064, "step": 714980 }, { "epoch": 1.85, "learning_rate": 2.1996417656649754e-05, "loss": 0.0075, "step": 714990 }, { "epoch": 1.85, "learning_rate": 2.199252944027829e-05, "loss": 0.0061, "step": 715000 }, { "epoch": 1.85, "eval_cer": 0.8816662957628791, "eval_loss": 0.004574858583509922, "eval_runtime": 107.8934, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 715000 }, { "epoch": 1.85, "learning_rate": 2.1988641223906824e-05, "loss": 0.0066, "step": 715010 }, { "epoch": 1.85, "learning_rate": 2.198475300753536e-05, "loss": 0.0071, "step": 715020 }, { "epoch": 1.85, "learning_rate": 2.1980864791163897e-05, "loss": 0.0066, "step": 715030 }, { "epoch": 1.85, "learning_rate": 2.1976976574792432e-05, "loss": 0.0067, "step": 715040 }, { "epoch": 1.85, "learning_rate": 2.1973088358420967e-05, "loss": 0.0071, "step": 715050 }, { "epoch": 1.85, "learning_rate": 2.1969200142049502e-05, "loss": 0.0076, "step": 715060 }, { "epoch": 1.85, "learning_rate": 2.196531192567804e-05, "loss": 0.0059, "step": 715070 }, { "epoch": 1.85, "learning_rate": 2.1961423709306575e-05, "loss": 0.0093, "step": 715080 }, { "epoch": 1.85, "learning_rate": 2.195753549293511e-05, "loss": 0.0061, "step": 715090 }, { "epoch": 1.85, "learning_rate": 2.1953647276563645e-05, "loss": 0.0088, "step": 715100 }, { "epoch": 1.85, "learning_rate": 2.1949759060192176e-05, "loss": 0.0071, "step": 715110 }, { "epoch": 1.85, "learning_rate": 2.1945870843820714e-05, "loss": 0.0056, "step": 715120 }, { "epoch": 1.85, "learning_rate": 2.194198262744925e-05, "loss": 0.0069, "step": 715130 }, { "epoch": 1.85, "learning_rate": 2.1938094411077784e-05, "loss": 0.0071, "step": 715140 }, { "epoch": 1.85, "learning_rate": 2.193420619470632e-05, "loss": 0.007, "step": 715150 }, { "epoch": 1.85, "learning_rate": 2.1930317978334857e-05, "loss": 0.0086, "step": 715160 }, { "epoch": 1.85, "learning_rate": 2.1926429761963392e-05, "loss": 0.0089, "step": 715170 }, { "epoch": 1.85, "learning_rate": 2.1922541545591927e-05, "loss": 0.0073, "step": 715180 }, { "epoch": 1.85, "learning_rate": 2.1918653329220462e-05, "loss": 0.007, "step": 715190 }, { "epoch": 1.85, "learning_rate": 2.1914765112849e-05, "loss": 0.0086, "step": 715200 }, { "epoch": 1.85, "learning_rate": 2.1910876896477535e-05, "loss": 0.0067, "step": 715210 }, { "epoch": 1.85, "learning_rate": 2.190698868010607e-05, "loss": 0.0054, "step": 715220 }, { "epoch": 1.85, "learning_rate": 2.19031004637346e-05, "loss": 0.007, "step": 715230 }, { "epoch": 1.85, "learning_rate": 2.1899212247363136e-05, "loss": 0.0066, "step": 715240 }, { "epoch": 1.85, "learning_rate": 2.1895324030991674e-05, "loss": 0.0054, "step": 715250 }, { "epoch": 1.85, "learning_rate": 2.189143581462021e-05, "loss": 0.0091, "step": 715260 }, { "epoch": 1.85, "learning_rate": 2.1887547598248744e-05, "loss": 0.0094, "step": 715270 }, { "epoch": 1.85, "learning_rate": 2.188365938187728e-05, "loss": 0.007, "step": 715280 }, { "epoch": 1.85, "learning_rate": 2.1879771165505817e-05, "loss": 0.0077, "step": 715290 }, { "epoch": 1.85, "learning_rate": 2.1875882949134352e-05, "loss": 0.007, "step": 715300 }, { "epoch": 1.85, "learning_rate": 2.1871994732762887e-05, "loss": 0.0054, "step": 715310 }, { "epoch": 1.85, "learning_rate": 2.1868106516391422e-05, "loss": 0.0058, "step": 715320 }, { "epoch": 1.85, "learning_rate": 2.186421830001996e-05, "loss": 0.0105, "step": 715330 }, { "epoch": 1.85, "learning_rate": 2.1860330083648495e-05, "loss": 0.0086, "step": 715340 }, { "epoch": 1.85, "learning_rate": 2.185644186727703e-05, "loss": 0.0072, "step": 715350 }, { "epoch": 1.85, "learning_rate": 2.185255365090556e-05, "loss": 0.008, "step": 715360 }, { "epoch": 1.85, "learning_rate": 2.1848665434534096e-05, "loss": 0.009, "step": 715370 }, { "epoch": 1.85, "learning_rate": 2.1844777218162634e-05, "loss": 0.0073, "step": 715380 }, { "epoch": 1.85, "learning_rate": 2.184088900179117e-05, "loss": 0.0082, "step": 715390 }, { "epoch": 1.85, "learning_rate": 2.1837000785419704e-05, "loss": 0.0084, "step": 715400 }, { "epoch": 1.85, "learning_rate": 2.183311256904824e-05, "loss": 0.0135, "step": 715410 }, { "epoch": 1.85, "learning_rate": 2.1829224352676777e-05, "loss": 0.0067, "step": 715420 }, { "epoch": 1.85, "learning_rate": 2.1825336136305312e-05, "loss": 0.0074, "step": 715430 }, { "epoch": 1.85, "learning_rate": 2.1821447919933847e-05, "loss": 0.0062, "step": 715440 }, { "epoch": 1.85, "learning_rate": 2.1817559703562382e-05, "loss": 0.0051, "step": 715450 }, { "epoch": 1.85, "learning_rate": 2.181367148719092e-05, "loss": 0.0052, "step": 715460 }, { "epoch": 1.85, "learning_rate": 2.1809783270819455e-05, "loss": 0.0078, "step": 715470 }, { "epoch": 1.85, "learning_rate": 2.1805895054447986e-05, "loss": 0.0071, "step": 715480 }, { "epoch": 1.85, "learning_rate": 2.180200683807652e-05, "loss": 0.0073, "step": 715490 }, { "epoch": 1.85, "learning_rate": 2.1798118621705056e-05, "loss": 0.0132, "step": 715500 }, { "epoch": 1.85, "learning_rate": 2.1794230405333594e-05, "loss": 0.0094, "step": 715510 }, { "epoch": 1.85, "learning_rate": 2.179034218896213e-05, "loss": 0.0094, "step": 715520 }, { "epoch": 1.85, "learning_rate": 2.1786453972590664e-05, "loss": 0.0087, "step": 715530 }, { "epoch": 1.85, "learning_rate": 2.17825657562192e-05, "loss": 0.0071, "step": 715540 }, { "epoch": 1.85, "learning_rate": 2.1778677539847737e-05, "loss": 0.0092, "step": 715550 }, { "epoch": 1.85, "learning_rate": 2.1774789323476272e-05, "loss": 0.0109, "step": 715560 }, { "epoch": 1.85, "learning_rate": 2.1770901107104807e-05, "loss": 0.006, "step": 715570 }, { "epoch": 1.85, "learning_rate": 2.1767012890733342e-05, "loss": 0.0067, "step": 715580 }, { "epoch": 1.85, "learning_rate": 2.176312467436188e-05, "loss": 0.0065, "step": 715590 }, { "epoch": 1.85, "learning_rate": 2.1759236457990415e-05, "loss": 0.0056, "step": 715600 }, { "epoch": 1.85, "learning_rate": 2.1755348241618946e-05, "loss": 0.0093, "step": 715610 }, { "epoch": 1.85, "learning_rate": 2.175146002524748e-05, "loss": 0.0085, "step": 715620 }, { "epoch": 1.86, "learning_rate": 2.1747571808876016e-05, "loss": 0.0069, "step": 715630 }, { "epoch": 1.86, "learning_rate": 2.1743683592504554e-05, "loss": 0.0077, "step": 715640 }, { "epoch": 1.86, "learning_rate": 2.173979537613309e-05, "loss": 0.0076, "step": 715650 }, { "epoch": 1.86, "learning_rate": 2.1735907159761624e-05, "loss": 0.0076, "step": 715660 }, { "epoch": 1.86, "learning_rate": 2.173201894339016e-05, "loss": 0.0069, "step": 715670 }, { "epoch": 1.86, "learning_rate": 2.1728130727018697e-05, "loss": 0.0075, "step": 715680 }, { "epoch": 1.86, "learning_rate": 2.1724242510647232e-05, "loss": 0.0063, "step": 715690 }, { "epoch": 1.86, "learning_rate": 2.1720354294275767e-05, "loss": 0.0053, "step": 715700 }, { "epoch": 1.86, "learning_rate": 2.1716466077904302e-05, "loss": 0.0084, "step": 715710 }, { "epoch": 1.86, "learning_rate": 2.171257786153284e-05, "loss": 0.0084, "step": 715720 }, { "epoch": 1.86, "learning_rate": 2.170868964516137e-05, "loss": 0.0085, "step": 715730 }, { "epoch": 1.86, "learning_rate": 2.1704801428789906e-05, "loss": 0.0062, "step": 715740 }, { "epoch": 1.86, "learning_rate": 2.170091321241844e-05, "loss": 0.007, "step": 715750 }, { "epoch": 1.86, "learning_rate": 2.1697024996046976e-05, "loss": 0.0079, "step": 715760 }, { "epoch": 1.86, "learning_rate": 2.1693136779675514e-05, "loss": 0.0071, "step": 715770 }, { "epoch": 1.86, "learning_rate": 2.168924856330405e-05, "loss": 0.0099, "step": 715780 }, { "epoch": 1.86, "learning_rate": 2.1685360346932584e-05, "loss": 0.0082, "step": 715790 }, { "epoch": 1.86, "learning_rate": 2.168147213056112e-05, "loss": 0.0092, "step": 715800 }, { "epoch": 1.86, "learning_rate": 2.1677583914189657e-05, "loss": 0.0067, "step": 715810 }, { "epoch": 1.86, "learning_rate": 2.1673695697818192e-05, "loss": 0.0054, "step": 715820 }, { "epoch": 1.86, "learning_rate": 2.1669807481446727e-05, "loss": 0.0069, "step": 715830 }, { "epoch": 1.86, "learning_rate": 2.166591926507526e-05, "loss": 0.0086, "step": 715840 }, { "epoch": 1.86, "learning_rate": 2.1662031048703793e-05, "loss": 0.0064, "step": 715850 }, { "epoch": 1.86, "learning_rate": 2.165814283233233e-05, "loss": 0.0075, "step": 715860 }, { "epoch": 1.86, "learning_rate": 2.1654254615960866e-05, "loss": 0.006, "step": 715870 }, { "epoch": 1.86, "learning_rate": 2.16503663995894e-05, "loss": 0.0072, "step": 715880 }, { "epoch": 1.86, "learning_rate": 2.1646478183217936e-05, "loss": 0.0084, "step": 715890 }, { "epoch": 1.86, "learning_rate": 2.1642589966846474e-05, "loss": 0.0055, "step": 715900 }, { "epoch": 1.86, "learning_rate": 2.163870175047501e-05, "loss": 0.0096, "step": 715910 }, { "epoch": 1.86, "learning_rate": 2.1634813534103544e-05, "loss": 0.0064, "step": 715920 }, { "epoch": 1.86, "learning_rate": 2.163092531773208e-05, "loss": 0.0083, "step": 715930 }, { "epoch": 1.86, "learning_rate": 2.1627037101360617e-05, "loss": 0.0077, "step": 715940 }, { "epoch": 1.86, "learning_rate": 2.1623148884989152e-05, "loss": 0.0083, "step": 715950 }, { "epoch": 1.86, "learning_rate": 2.1619260668617687e-05, "loss": 0.0076, "step": 715960 }, { "epoch": 1.86, "learning_rate": 2.161537245224622e-05, "loss": 0.0076, "step": 715970 }, { "epoch": 1.86, "learning_rate": 2.1611484235874753e-05, "loss": 0.008, "step": 715980 }, { "epoch": 1.86, "learning_rate": 2.160759601950329e-05, "loss": 0.0062, "step": 715990 }, { "epoch": 1.86, "learning_rate": 2.1603707803131826e-05, "loss": 0.0059, "step": 716000 }, { "epoch": 1.86, "eval_cer": 0.8816774928583525, "eval_loss": 0.004547602031379938, "eval_runtime": 107.8685, "eval_samples_per_second": 18.541, "eval_steps_per_second": 4.635, "step": 716000 }, { "epoch": 1.86, "learning_rate": 2.159981958676036e-05, "loss": 0.0093, "step": 716010 }, { "epoch": 1.86, "learning_rate": 2.1595931370388896e-05, "loss": 0.0072, "step": 716020 }, { "epoch": 1.86, "learning_rate": 2.1592043154017434e-05, "loss": 0.0079, "step": 716030 }, { "epoch": 1.86, "learning_rate": 2.158815493764597e-05, "loss": 0.0082, "step": 716040 }, { "epoch": 1.86, "learning_rate": 2.1584266721274504e-05, "loss": 0.005, "step": 716050 }, { "epoch": 1.86, "learning_rate": 2.158037850490304e-05, "loss": 0.0095, "step": 716060 }, { "epoch": 1.86, "learning_rate": 2.1576490288531577e-05, "loss": 0.0095, "step": 716070 }, { "epoch": 1.86, "learning_rate": 2.1572602072160112e-05, "loss": 0.0059, "step": 716080 }, { "epoch": 1.86, "learning_rate": 2.1568713855788647e-05, "loss": 0.0072, "step": 716090 }, { "epoch": 1.86, "learning_rate": 2.1564825639417178e-05, "loss": 0.005, "step": 716100 }, { "epoch": 1.86, "learning_rate": 2.1560937423045713e-05, "loss": 0.0065, "step": 716110 }, { "epoch": 1.86, "learning_rate": 2.155704920667425e-05, "loss": 0.0053, "step": 716120 }, { "epoch": 1.86, "learning_rate": 2.1553160990302786e-05, "loss": 0.0053, "step": 716130 }, { "epoch": 1.86, "learning_rate": 2.154927277393132e-05, "loss": 0.0058, "step": 716140 }, { "epoch": 1.86, "learning_rate": 2.1545384557559856e-05, "loss": 0.0073, "step": 716150 }, { "epoch": 1.86, "learning_rate": 2.1541496341188394e-05, "loss": 0.0083, "step": 716160 }, { "epoch": 1.86, "learning_rate": 2.153760812481693e-05, "loss": 0.0083, "step": 716170 }, { "epoch": 1.86, "learning_rate": 2.1533719908445464e-05, "loss": 0.0073, "step": 716180 }, { "epoch": 1.86, "learning_rate": 2.1529831692074e-05, "loss": 0.0075, "step": 716190 }, { "epoch": 1.86, "learning_rate": 2.1525943475702537e-05, "loss": 0.0075, "step": 716200 }, { "epoch": 1.86, "learning_rate": 2.1522055259331072e-05, "loss": 0.0093, "step": 716210 }, { "epoch": 1.86, "learning_rate": 2.1518167042959607e-05, "loss": 0.0082, "step": 716220 }, { "epoch": 1.86, "learning_rate": 2.1514278826588138e-05, "loss": 0.0062, "step": 716230 }, { "epoch": 1.86, "learning_rate": 2.1510390610216673e-05, "loss": 0.0059, "step": 716240 }, { "epoch": 1.86, "learning_rate": 2.150650239384521e-05, "loss": 0.0095, "step": 716250 }, { "epoch": 1.86, "learning_rate": 2.1502614177473746e-05, "loss": 0.007, "step": 716260 }, { "epoch": 1.86, "learning_rate": 2.149872596110228e-05, "loss": 0.0065, "step": 716270 }, { "epoch": 1.86, "learning_rate": 2.1494837744730816e-05, "loss": 0.0062, "step": 716280 }, { "epoch": 1.86, "learning_rate": 2.149094952835935e-05, "loss": 0.0064, "step": 716290 }, { "epoch": 1.86, "learning_rate": 2.148706131198789e-05, "loss": 0.0066, "step": 716300 }, { "epoch": 1.86, "learning_rate": 2.1483173095616424e-05, "loss": 0.0063, "step": 716310 }, { "epoch": 1.86, "learning_rate": 2.147928487924496e-05, "loss": 0.008, "step": 716320 }, { "epoch": 1.86, "learning_rate": 2.1475396662873494e-05, "loss": 0.0073, "step": 716330 }, { "epoch": 1.86, "learning_rate": 2.1471508446502032e-05, "loss": 0.0069, "step": 716340 }, { "epoch": 1.86, "learning_rate": 2.1467620230130563e-05, "loss": 0.0059, "step": 716350 }, { "epoch": 1.86, "learning_rate": 2.1463732013759098e-05, "loss": 0.0044, "step": 716360 }, { "epoch": 1.86, "learning_rate": 2.1459843797387633e-05, "loss": 0.0086, "step": 716370 }, { "epoch": 1.86, "learning_rate": 2.1455955581016168e-05, "loss": 0.0067, "step": 716380 }, { "epoch": 1.86, "learning_rate": 2.1452067364644706e-05, "loss": 0.0074, "step": 716390 }, { "epoch": 1.86, "learning_rate": 2.144817914827324e-05, "loss": 0.0066, "step": 716400 }, { "epoch": 1.86, "learning_rate": 2.1444290931901776e-05, "loss": 0.0087, "step": 716410 }, { "epoch": 1.86, "learning_rate": 2.144040271553031e-05, "loss": 0.0046, "step": 716420 }, { "epoch": 1.86, "learning_rate": 2.143651449915885e-05, "loss": 0.0071, "step": 716430 }, { "epoch": 1.86, "learning_rate": 2.1432626282787384e-05, "loss": 0.0101, "step": 716440 }, { "epoch": 1.86, "learning_rate": 2.142873806641592e-05, "loss": 0.0059, "step": 716450 }, { "epoch": 1.86, "learning_rate": 2.1424849850044454e-05, "loss": 0.0072, "step": 716460 }, { "epoch": 1.86, "learning_rate": 2.1420961633672985e-05, "loss": 0.0045, "step": 716470 }, { "epoch": 1.86, "learning_rate": 2.1417073417301523e-05, "loss": 0.0082, "step": 716480 }, { "epoch": 1.86, "learning_rate": 2.1413185200930058e-05, "loss": 0.0056, "step": 716490 }, { "epoch": 1.86, "learning_rate": 2.1409296984558593e-05, "loss": 0.0055, "step": 716500 }, { "epoch": 1.86, "learning_rate": 2.1405408768187128e-05, "loss": 0.0072, "step": 716510 }, { "epoch": 1.86, "learning_rate": 2.1401520551815666e-05, "loss": 0.0068, "step": 716520 }, { "epoch": 1.86, "learning_rate": 2.13976323354442e-05, "loss": 0.0067, "step": 716530 }, { "epoch": 1.86, "learning_rate": 2.1393744119072736e-05, "loss": 0.0091, "step": 716540 }, { "epoch": 1.86, "learning_rate": 2.138985590270127e-05, "loss": 0.0067, "step": 716550 }, { "epoch": 1.86, "learning_rate": 2.138596768632981e-05, "loss": 0.0083, "step": 716560 }, { "epoch": 1.86, "learning_rate": 2.1382079469958344e-05, "loss": 0.0073, "step": 716570 }, { "epoch": 1.86, "learning_rate": 2.137819125358688e-05, "loss": 0.0056, "step": 716580 }, { "epoch": 1.86, "learning_rate": 2.1374303037215414e-05, "loss": 0.0067, "step": 716590 }, { "epoch": 1.86, "learning_rate": 2.1370414820843945e-05, "loss": 0.0097, "step": 716600 }, { "epoch": 1.86, "learning_rate": 2.1366526604472483e-05, "loss": 0.0067, "step": 716610 }, { "epoch": 1.86, "learning_rate": 2.1362638388101018e-05, "loss": 0.0078, "step": 716620 }, { "epoch": 1.86, "learning_rate": 2.1358750171729553e-05, "loss": 0.0072, "step": 716630 }, { "epoch": 1.86, "learning_rate": 2.1354861955358088e-05, "loss": 0.0061, "step": 716640 }, { "epoch": 1.86, "learning_rate": 2.1350973738986626e-05, "loss": 0.0081, "step": 716650 }, { "epoch": 1.86, "learning_rate": 2.134708552261516e-05, "loss": 0.0059, "step": 716660 }, { "epoch": 1.86, "learning_rate": 2.1343197306243696e-05, "loss": 0.0069, "step": 716670 }, { "epoch": 1.86, "learning_rate": 2.133930908987223e-05, "loss": 0.0067, "step": 716680 }, { "epoch": 1.86, "learning_rate": 2.133542087350077e-05, "loss": 0.0067, "step": 716690 }, { "epoch": 1.86, "learning_rate": 2.1331532657129304e-05, "loss": 0.0065, "step": 716700 }, { "epoch": 1.86, "learning_rate": 2.132764444075784e-05, "loss": 0.0071, "step": 716710 }, { "epoch": 1.86, "learning_rate": 2.132375622438637e-05, "loss": 0.0074, "step": 716720 }, { "epoch": 1.86, "learning_rate": 2.1319868008014905e-05, "loss": 0.0068, "step": 716730 }, { "epoch": 1.86, "learning_rate": 2.1315979791643443e-05, "loss": 0.009, "step": 716740 }, { "epoch": 1.86, "learning_rate": 2.1312091575271978e-05, "loss": 0.007, "step": 716750 }, { "epoch": 1.86, "learning_rate": 2.1308203358900513e-05, "loss": 0.0083, "step": 716760 }, { "epoch": 1.86, "learning_rate": 2.1304315142529048e-05, "loss": 0.0071, "step": 716770 }, { "epoch": 1.86, "learning_rate": 2.1300426926157586e-05, "loss": 0.0073, "step": 716780 }, { "epoch": 1.86, "learning_rate": 2.129653870978612e-05, "loss": 0.0077, "step": 716790 }, { "epoch": 1.86, "learning_rate": 2.1292650493414656e-05, "loss": 0.0074, "step": 716800 }, { "epoch": 1.86, "learning_rate": 2.128876227704319e-05, "loss": 0.0062, "step": 716810 }, { "epoch": 1.86, "learning_rate": 2.128487406067173e-05, "loss": 0.0094, "step": 716820 }, { "epoch": 1.86, "learning_rate": 2.1280985844300264e-05, "loss": 0.0078, "step": 716830 }, { "epoch": 1.86, "learning_rate": 2.12770976279288e-05, "loss": 0.0065, "step": 716840 }, { "epoch": 1.86, "learning_rate": 2.127320941155733e-05, "loss": 0.0078, "step": 716850 }, { "epoch": 1.86, "learning_rate": 2.1269321195185865e-05, "loss": 0.0084, "step": 716860 }, { "epoch": 1.86, "learning_rate": 2.1265432978814403e-05, "loss": 0.0066, "step": 716870 }, { "epoch": 1.86, "learning_rate": 2.1261544762442938e-05, "loss": 0.0077, "step": 716880 }, { "epoch": 1.86, "learning_rate": 2.1257656546071473e-05, "loss": 0.0087, "step": 716890 }, { "epoch": 1.86, "learning_rate": 2.1253768329700008e-05, "loss": 0.008, "step": 716900 }, { "epoch": 1.86, "learning_rate": 2.1249880113328546e-05, "loss": 0.0083, "step": 716910 }, { "epoch": 1.86, "learning_rate": 2.124599189695708e-05, "loss": 0.0076, "step": 716920 }, { "epoch": 1.86, "learning_rate": 2.1242103680585616e-05, "loss": 0.0055, "step": 716930 }, { "epoch": 1.86, "learning_rate": 2.123821546421415e-05, "loss": 0.0093, "step": 716940 }, { "epoch": 1.86, "learning_rate": 2.123432724784269e-05, "loss": 0.0062, "step": 716950 }, { "epoch": 1.86, "learning_rate": 2.1230439031471224e-05, "loss": 0.007, "step": 716960 }, { "epoch": 1.86, "learning_rate": 2.1226550815099755e-05, "loss": 0.0083, "step": 716970 }, { "epoch": 1.86, "learning_rate": 2.122266259872829e-05, "loss": 0.0063, "step": 716980 }, { "epoch": 1.86, "learning_rate": 2.1218774382356825e-05, "loss": 0.0107, "step": 716990 }, { "epoch": 1.86, "learning_rate": 2.1214886165985363e-05, "loss": 0.0063, "step": 717000 }, { "epoch": 1.86, "eval_cer": 0.8816844910430235, "eval_loss": 0.0045911758206784725, "eval_runtime": 107.8933, "eval_samples_per_second": 18.537, "eval_steps_per_second": 4.634, "step": 717000 }, { "epoch": 1.86, "learning_rate": 2.1210997949613898e-05, "loss": 0.0072, "step": 717010 }, { "epoch": 1.86, "learning_rate": 2.1207109733242433e-05, "loss": 0.0069, "step": 717020 }, { "epoch": 1.86, "learning_rate": 2.1203221516870968e-05, "loss": 0.0062, "step": 717030 }, { "epoch": 1.86, "learning_rate": 2.1199333300499506e-05, "loss": 0.0072, "step": 717040 }, { "epoch": 1.86, "learning_rate": 2.119544508412804e-05, "loss": 0.0079, "step": 717050 }, { "epoch": 1.86, "learning_rate": 2.1191556867756576e-05, "loss": 0.006, "step": 717060 }, { "epoch": 1.86, "learning_rate": 2.118766865138511e-05, "loss": 0.0085, "step": 717070 }, { "epoch": 1.86, "learning_rate": 2.118378043501365e-05, "loss": 0.0063, "step": 717080 }, { "epoch": 1.86, "learning_rate": 2.1179892218642184e-05, "loss": 0.0073, "step": 717090 }, { "epoch": 1.86, "learning_rate": 2.1176004002270715e-05, "loss": 0.0074, "step": 717100 }, { "epoch": 1.86, "learning_rate": 2.117211578589925e-05, "loss": 0.0064, "step": 717110 }, { "epoch": 1.86, "learning_rate": 2.1168227569527785e-05, "loss": 0.0049, "step": 717120 }, { "epoch": 1.86, "learning_rate": 2.1164339353156323e-05, "loss": 0.006, "step": 717130 }, { "epoch": 1.86, "learning_rate": 2.1160451136784858e-05, "loss": 0.0067, "step": 717140 }, { "epoch": 1.86, "learning_rate": 2.1156562920413393e-05, "loss": 0.0051, "step": 717150 }, { "epoch": 1.86, "learning_rate": 2.1152674704041928e-05, "loss": 0.0064, "step": 717160 }, { "epoch": 1.86, "learning_rate": 2.1148786487670466e-05, "loss": 0.0078, "step": 717170 }, { "epoch": 1.86, "learning_rate": 2.1144898271299e-05, "loss": 0.006, "step": 717180 }, { "epoch": 1.86, "learning_rate": 2.1141010054927536e-05, "loss": 0.007, "step": 717190 }, { "epoch": 1.86, "learning_rate": 2.113712183855607e-05, "loss": 0.0071, "step": 717200 }, { "epoch": 1.86, "learning_rate": 2.113323362218461e-05, "loss": 0.0066, "step": 717210 }, { "epoch": 1.86, "learning_rate": 2.112934540581314e-05, "loss": 0.0057, "step": 717220 }, { "epoch": 1.86, "learning_rate": 2.1125457189441675e-05, "loss": 0.0046, "step": 717230 }, { "epoch": 1.86, "learning_rate": 2.112156897307021e-05, "loss": 0.0059, "step": 717240 }, { "epoch": 1.86, "learning_rate": 2.1117680756698745e-05, "loss": 0.0093, "step": 717250 }, { "epoch": 1.86, "learning_rate": 2.1113792540327283e-05, "loss": 0.0078, "step": 717260 }, { "epoch": 1.86, "learning_rate": 2.1109904323955818e-05, "loss": 0.0058, "step": 717270 }, { "epoch": 1.86, "learning_rate": 2.1106016107584353e-05, "loss": 0.0089, "step": 717280 }, { "epoch": 1.86, "learning_rate": 2.1102127891212888e-05, "loss": 0.0092, "step": 717290 }, { "epoch": 1.86, "learning_rate": 2.1098239674841426e-05, "loss": 0.0048, "step": 717300 }, { "epoch": 1.86, "learning_rate": 2.109435145846996e-05, "loss": 0.0064, "step": 717310 }, { "epoch": 1.86, "learning_rate": 2.1090463242098496e-05, "loss": 0.0064, "step": 717320 }, { "epoch": 1.86, "learning_rate": 2.108657502572703e-05, "loss": 0.0071, "step": 717330 }, { "epoch": 1.86, "learning_rate": 2.1082686809355562e-05, "loss": 0.0109, "step": 717340 }, { "epoch": 1.86, "learning_rate": 2.10787985929841e-05, "loss": 0.0079, "step": 717350 }, { "epoch": 1.86, "learning_rate": 2.1074910376612635e-05, "loss": 0.0079, "step": 717360 }, { "epoch": 1.86, "learning_rate": 2.107102216024117e-05, "loss": 0.0059, "step": 717370 }, { "epoch": 1.86, "learning_rate": 2.1067133943869705e-05, "loss": 0.0071, "step": 717380 }, { "epoch": 1.86, "learning_rate": 2.1063245727498243e-05, "loss": 0.0067, "step": 717390 }, { "epoch": 1.86, "learning_rate": 2.1059357511126778e-05, "loss": 0.0062, "step": 717400 }, { "epoch": 1.86, "learning_rate": 2.1055469294755313e-05, "loss": 0.0056, "step": 717410 }, { "epoch": 1.86, "learning_rate": 2.1051581078383848e-05, "loss": 0.0099, "step": 717420 }, { "epoch": 1.86, "learning_rate": 2.1047692862012386e-05, "loss": 0.0064, "step": 717430 }, { "epoch": 1.86, "learning_rate": 2.104380464564092e-05, "loss": 0.0097, "step": 717440 }, { "epoch": 1.86, "learning_rate": 2.1039916429269456e-05, "loss": 0.0058, "step": 717450 }, { "epoch": 1.86, "learning_rate": 2.103602821289799e-05, "loss": 0.007, "step": 717460 }, { "epoch": 1.86, "learning_rate": 2.1032139996526522e-05, "loss": 0.0067, "step": 717470 }, { "epoch": 1.86, "learning_rate": 2.102825178015506e-05, "loss": 0.0071, "step": 717480 }, { "epoch": 1.86, "learning_rate": 2.1024363563783595e-05, "loss": 0.008, "step": 717490 }, { "epoch": 1.86, "learning_rate": 2.102047534741213e-05, "loss": 0.0069, "step": 717500 }, { "epoch": 1.86, "learning_rate": 2.1016587131040665e-05, "loss": 0.0106, "step": 717510 }, { "epoch": 1.86, "learning_rate": 2.1012698914669203e-05, "loss": 0.005, "step": 717520 }, { "epoch": 1.86, "learning_rate": 2.1008810698297738e-05, "loss": 0.0058, "step": 717530 }, { "epoch": 1.86, "learning_rate": 2.1004922481926273e-05, "loss": 0.0074, "step": 717540 }, { "epoch": 1.86, "learning_rate": 2.1001034265554808e-05, "loss": 0.0069, "step": 717550 }, { "epoch": 1.86, "learning_rate": 2.0997146049183346e-05, "loss": 0.0057, "step": 717560 }, { "epoch": 1.86, "learning_rate": 2.099325783281188e-05, "loss": 0.008, "step": 717570 }, { "epoch": 1.86, "learning_rate": 2.0989369616440416e-05, "loss": 0.0057, "step": 717580 }, { "epoch": 1.86, "learning_rate": 2.0985481400068947e-05, "loss": 0.0063, "step": 717590 }, { "epoch": 1.86, "learning_rate": 2.0981593183697482e-05, "loss": 0.0073, "step": 717600 }, { "epoch": 1.86, "learning_rate": 2.097770496732602e-05, "loss": 0.0073, "step": 717610 }, { "epoch": 1.86, "learning_rate": 2.0973816750954555e-05, "loss": 0.006, "step": 717620 }, { "epoch": 1.86, "learning_rate": 2.096992853458309e-05, "loss": 0.0072, "step": 717630 }, { "epoch": 1.86, "learning_rate": 2.0966040318211625e-05, "loss": 0.0074, "step": 717640 }, { "epoch": 1.86, "learning_rate": 2.0962152101840163e-05, "loss": 0.0085, "step": 717650 }, { "epoch": 1.86, "learning_rate": 2.0958263885468698e-05, "loss": 0.0101, "step": 717660 }, { "epoch": 1.86, "learning_rate": 2.0954375669097233e-05, "loss": 0.007, "step": 717670 }, { "epoch": 1.86, "learning_rate": 2.0950487452725768e-05, "loss": 0.0092, "step": 717680 }, { "epoch": 1.86, "learning_rate": 2.0946599236354303e-05, "loss": 0.0108, "step": 717690 }, { "epoch": 1.86, "learning_rate": 2.094271101998284e-05, "loss": 0.0076, "step": 717700 }, { "epoch": 1.86, "learning_rate": 2.0938822803611376e-05, "loss": 0.0079, "step": 717710 }, { "epoch": 1.86, "learning_rate": 2.0934934587239907e-05, "loss": 0.0097, "step": 717720 }, { "epoch": 1.86, "learning_rate": 2.0931046370868442e-05, "loss": 0.0057, "step": 717730 }, { "epoch": 1.86, "learning_rate": 2.0927158154496977e-05, "loss": 0.0058, "step": 717740 }, { "epoch": 1.86, "learning_rate": 2.0923269938125515e-05, "loss": 0.0072, "step": 717750 }, { "epoch": 1.86, "learning_rate": 2.091938172175405e-05, "loss": 0.0069, "step": 717760 }, { "epoch": 1.86, "learning_rate": 2.0915493505382585e-05, "loss": 0.0074, "step": 717770 }, { "epoch": 1.86, "learning_rate": 2.091160528901112e-05, "loss": 0.006, "step": 717780 }, { "epoch": 1.86, "learning_rate": 2.0907717072639658e-05, "loss": 0.0073, "step": 717790 }, { "epoch": 1.86, "learning_rate": 2.0903828856268193e-05, "loss": 0.0054, "step": 717800 }, { "epoch": 1.86, "learning_rate": 2.0899940639896728e-05, "loss": 0.0063, "step": 717810 }, { "epoch": 1.86, "learning_rate": 2.0896052423525263e-05, "loss": 0.0086, "step": 717820 }, { "epoch": 1.86, "learning_rate": 2.08921642071538e-05, "loss": 0.007, "step": 717830 }, { "epoch": 1.86, "learning_rate": 2.0888275990782332e-05, "loss": 0.0084, "step": 717840 }, { "epoch": 1.86, "learning_rate": 2.0884387774410867e-05, "loss": 0.0078, "step": 717850 }, { "epoch": 1.86, "learning_rate": 2.0880499558039402e-05, "loss": 0.0087, "step": 717860 }, { "epoch": 1.86, "learning_rate": 2.0876611341667937e-05, "loss": 0.0081, "step": 717870 }, { "epoch": 1.86, "learning_rate": 2.0872723125296475e-05, "loss": 0.0101, "step": 717880 }, { "epoch": 1.86, "learning_rate": 2.086883490892501e-05, "loss": 0.0062, "step": 717890 }, { "epoch": 1.86, "learning_rate": 2.0864946692553545e-05, "loss": 0.007, "step": 717900 }, { "epoch": 1.86, "learning_rate": 2.086105847618208e-05, "loss": 0.0082, "step": 717910 }, { "epoch": 1.86, "learning_rate": 2.0857170259810618e-05, "loss": 0.0112, "step": 717920 }, { "epoch": 1.86, "learning_rate": 2.0853282043439153e-05, "loss": 0.0083, "step": 717930 }, { "epoch": 1.86, "learning_rate": 2.0849393827067688e-05, "loss": 0.0082, "step": 717940 }, { "epoch": 1.86, "learning_rate": 2.0845505610696223e-05, "loss": 0.0065, "step": 717950 }, { "epoch": 1.86, "learning_rate": 2.0841617394324754e-05, "loss": 0.0056, "step": 717960 }, { "epoch": 1.86, "learning_rate": 2.0837729177953292e-05, "loss": 0.0065, "step": 717970 }, { "epoch": 1.86, "learning_rate": 2.0833840961581827e-05, "loss": 0.0091, "step": 717980 }, { "epoch": 1.86, "learning_rate": 2.0829952745210362e-05, "loss": 0.0111, "step": 717990 }, { "epoch": 1.86, "learning_rate": 2.0826064528838897e-05, "loss": 0.0059, "step": 718000 }, { "epoch": 1.86, "eval_cer": 0.8816536990304715, "eval_loss": 0.004619268234819174, "eval_runtime": 107.8627, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.636, "step": 718000 }, { "epoch": 1.86, "learning_rate": 2.0822176312467435e-05, "loss": 0.0051, "step": 718010 }, { "epoch": 1.86, "learning_rate": 2.081828809609597e-05, "loss": 0.0088, "step": 718020 }, { "epoch": 1.86, "learning_rate": 2.0814399879724505e-05, "loss": 0.0103, "step": 718030 }, { "epoch": 1.86, "learning_rate": 2.081051166335304e-05, "loss": 0.0098, "step": 718040 }, { "epoch": 1.86, "learning_rate": 2.0806623446981578e-05, "loss": 0.0098, "step": 718050 }, { "epoch": 1.86, "learning_rate": 2.0802735230610113e-05, "loss": 0.0066, "step": 718060 }, { "epoch": 1.86, "learning_rate": 2.0798847014238648e-05, "loss": 0.0089, "step": 718070 }, { "epoch": 1.86, "learning_rate": 2.0794958797867182e-05, "loss": 0.0056, "step": 718080 }, { "epoch": 1.86, "learning_rate": 2.0791070581495714e-05, "loss": 0.0061, "step": 718090 }, { "epoch": 1.86, "learning_rate": 2.0787182365124252e-05, "loss": 0.0085, "step": 718100 }, { "epoch": 1.86, "learning_rate": 2.0783294148752787e-05, "loss": 0.0066, "step": 718110 }, { "epoch": 1.86, "learning_rate": 2.0779405932381322e-05, "loss": 0.0062, "step": 718120 }, { "epoch": 1.86, "learning_rate": 2.0775517716009857e-05, "loss": 0.0082, "step": 718130 }, { "epoch": 1.86, "learning_rate": 2.0771629499638395e-05, "loss": 0.0075, "step": 718140 }, { "epoch": 1.86, "learning_rate": 2.076774128326693e-05, "loss": 0.0071, "step": 718150 }, { "epoch": 1.86, "learning_rate": 2.0763853066895465e-05, "loss": 0.0114, "step": 718160 }, { "epoch": 1.86, "learning_rate": 2.0759964850524e-05, "loss": 0.0088, "step": 718170 }, { "epoch": 1.86, "learning_rate": 2.0756076634152538e-05, "loss": 0.0075, "step": 718180 }, { "epoch": 1.86, "learning_rate": 2.0752188417781073e-05, "loss": 0.0061, "step": 718190 }, { "epoch": 1.86, "learning_rate": 2.0748300201409608e-05, "loss": 0.008, "step": 718200 }, { "epoch": 1.86, "learning_rate": 2.074441198503814e-05, "loss": 0.0079, "step": 718210 }, { "epoch": 1.86, "learning_rate": 2.0740523768666674e-05, "loss": 0.0065, "step": 718220 }, { "epoch": 1.86, "learning_rate": 2.0736635552295212e-05, "loss": 0.0076, "step": 718230 }, { "epoch": 1.86, "learning_rate": 2.0732747335923747e-05, "loss": 0.007, "step": 718240 }, { "epoch": 1.86, "learning_rate": 2.0728859119552282e-05, "loss": 0.0074, "step": 718250 }, { "epoch": 1.86, "learning_rate": 2.0724970903180817e-05, "loss": 0.009, "step": 718260 }, { "epoch": 1.86, "learning_rate": 2.0721082686809355e-05, "loss": 0.007, "step": 718270 }, { "epoch": 1.86, "learning_rate": 2.071719447043789e-05, "loss": 0.0082, "step": 718280 }, { "epoch": 1.86, "learning_rate": 2.0713306254066425e-05, "loss": 0.0071, "step": 718290 }, { "epoch": 1.86, "learning_rate": 2.070941803769496e-05, "loss": 0.0053, "step": 718300 }, { "epoch": 1.86, "learning_rate": 2.0705529821323498e-05, "loss": 0.0064, "step": 718310 }, { "epoch": 1.86, "learning_rate": 2.0701641604952033e-05, "loss": 0.006, "step": 718320 }, { "epoch": 1.86, "learning_rate": 2.0697753388580568e-05, "loss": 0.0076, "step": 718330 }, { "epoch": 1.86, "learning_rate": 2.06938651722091e-05, "loss": 0.0085, "step": 718340 }, { "epoch": 1.86, "learning_rate": 2.0689976955837634e-05, "loss": 0.011, "step": 718350 }, { "epoch": 1.86, "learning_rate": 2.0686088739466172e-05, "loss": 0.0079, "step": 718360 }, { "epoch": 1.86, "learning_rate": 2.0682200523094707e-05, "loss": 0.0076, "step": 718370 }, { "epoch": 1.86, "learning_rate": 2.0678312306723242e-05, "loss": 0.0066, "step": 718380 }, { "epoch": 1.86, "learning_rate": 2.0674424090351777e-05, "loss": 0.0111, "step": 718390 }, { "epoch": 1.86, "learning_rate": 2.0670535873980315e-05, "loss": 0.0065, "step": 718400 }, { "epoch": 1.86, "learning_rate": 2.066664765760885e-05, "loss": 0.0098, "step": 718410 }, { "epoch": 1.86, "learning_rate": 2.0662759441237385e-05, "loss": 0.0095, "step": 718420 }, { "epoch": 1.86, "learning_rate": 2.065887122486592e-05, "loss": 0.0054, "step": 718430 }, { "epoch": 1.86, "learning_rate": 2.0654983008494458e-05, "loss": 0.0083, "step": 718440 }, { "epoch": 1.86, "learning_rate": 2.0651094792122993e-05, "loss": 0.0069, "step": 718450 }, { "epoch": 1.86, "learning_rate": 2.0647206575751524e-05, "loss": 0.0087, "step": 718460 }, { "epoch": 1.86, "learning_rate": 2.064331835938006e-05, "loss": 0.0081, "step": 718470 }, { "epoch": 1.86, "learning_rate": 2.0639430143008594e-05, "loss": 0.0055, "step": 718480 }, { "epoch": 1.86, "learning_rate": 2.0635541926637132e-05, "loss": 0.0094, "step": 718490 }, { "epoch": 1.86, "learning_rate": 2.0631653710265667e-05, "loss": 0.0062, "step": 718500 }, { "epoch": 1.86, "learning_rate": 2.0627765493894202e-05, "loss": 0.0091, "step": 718510 }, { "epoch": 1.86, "learning_rate": 2.0623877277522737e-05, "loss": 0.0067, "step": 718520 }, { "epoch": 1.86, "learning_rate": 2.0619989061151275e-05, "loss": 0.0096, "step": 718530 }, { "epoch": 1.86, "learning_rate": 2.061610084477981e-05, "loss": 0.0067, "step": 718540 }, { "epoch": 1.86, "learning_rate": 2.0612212628408345e-05, "loss": 0.0061, "step": 718550 }, { "epoch": 1.86, "learning_rate": 2.060832441203688e-05, "loss": 0.0072, "step": 718560 }, { "epoch": 1.86, "learning_rate": 2.0604436195665418e-05, "loss": 0.0083, "step": 718570 }, { "epoch": 1.86, "learning_rate": 2.060054797929395e-05, "loss": 0.0093, "step": 718580 }, { "epoch": 1.86, "learning_rate": 2.0596659762922484e-05, "loss": 0.006, "step": 718590 }, { "epoch": 1.86, "learning_rate": 2.059277154655102e-05, "loss": 0.0073, "step": 718600 }, { "epoch": 1.86, "learning_rate": 2.0588883330179554e-05, "loss": 0.0081, "step": 718610 }, { "epoch": 1.86, "learning_rate": 2.0584995113808092e-05, "loss": 0.0099, "step": 718620 }, { "epoch": 1.86, "learning_rate": 2.0581106897436627e-05, "loss": 0.0057, "step": 718630 }, { "epoch": 1.86, "learning_rate": 2.0577218681065162e-05, "loss": 0.0062, "step": 718640 }, { "epoch": 1.86, "learning_rate": 2.0573330464693697e-05, "loss": 0.0065, "step": 718650 }, { "epoch": 1.86, "learning_rate": 2.0569442248322235e-05, "loss": 0.0101, "step": 718660 }, { "epoch": 1.86, "learning_rate": 2.056555403195077e-05, "loss": 0.0117, "step": 718670 }, { "epoch": 1.86, "learning_rate": 2.0561665815579305e-05, "loss": 0.0071, "step": 718680 }, { "epoch": 1.86, "learning_rate": 2.055777759920784e-05, "loss": 0.0059, "step": 718690 }, { "epoch": 1.86, "learning_rate": 2.0553889382836378e-05, "loss": 0.0087, "step": 718700 }, { "epoch": 1.86, "learning_rate": 2.055000116646491e-05, "loss": 0.0068, "step": 718710 }, { "epoch": 1.86, "learning_rate": 2.0546112950093444e-05, "loss": 0.0053, "step": 718720 }, { "epoch": 1.86, "learning_rate": 2.054222473372198e-05, "loss": 0.0059, "step": 718730 }, { "epoch": 1.86, "learning_rate": 2.0538336517350514e-05, "loss": 0.007, "step": 718740 }, { "epoch": 1.86, "learning_rate": 2.0534448300979052e-05, "loss": 0.0065, "step": 718750 }, { "epoch": 1.86, "learning_rate": 2.0530560084607587e-05, "loss": 0.0083, "step": 718760 }, { "epoch": 1.86, "learning_rate": 2.0526671868236122e-05, "loss": 0.0073, "step": 718770 }, { "epoch": 1.86, "learning_rate": 2.0522783651864657e-05, "loss": 0.0077, "step": 718780 }, { "epoch": 1.86, "learning_rate": 2.0518895435493195e-05, "loss": 0.0065, "step": 718790 }, { "epoch": 1.86, "learning_rate": 2.051500721912173e-05, "loss": 0.0079, "step": 718800 }, { "epoch": 1.86, "learning_rate": 2.0511119002750265e-05, "loss": 0.0058, "step": 718810 }, { "epoch": 1.86, "learning_rate": 2.05072307863788e-05, "loss": 0.0063, "step": 718820 }, { "epoch": 1.86, "learning_rate": 2.050334257000733e-05, "loss": 0.0065, "step": 718830 }, { "epoch": 1.86, "learning_rate": 2.049945435363587e-05, "loss": 0.0094, "step": 718840 }, { "epoch": 1.86, "learning_rate": 2.0495566137264404e-05, "loss": 0.0084, "step": 718850 }, { "epoch": 1.86, "learning_rate": 2.049167792089294e-05, "loss": 0.0048, "step": 718860 }, { "epoch": 1.86, "learning_rate": 2.0487789704521474e-05, "loss": 0.0095, "step": 718870 }, { "epoch": 1.86, "learning_rate": 2.0483901488150012e-05, "loss": 0.0041, "step": 718880 }, { "epoch": 1.86, "learning_rate": 2.0480013271778547e-05, "loss": 0.0089, "step": 718890 }, { "epoch": 1.86, "learning_rate": 2.0476125055407082e-05, "loss": 0.0054, "step": 718900 }, { "epoch": 1.86, "learning_rate": 2.0472236839035617e-05, "loss": 0.0106, "step": 718910 }, { "epoch": 1.86, "learning_rate": 2.0468348622664155e-05, "loss": 0.0066, "step": 718920 }, { "epoch": 1.86, "learning_rate": 2.046446040629269e-05, "loss": 0.0074, "step": 718930 }, { "epoch": 1.86, "learning_rate": 2.0460572189921225e-05, "loss": 0.0052, "step": 718940 }, { "epoch": 1.86, "learning_rate": 2.045668397354976e-05, "loss": 0.0102, "step": 718950 }, { "epoch": 1.86, "learning_rate": 2.045279575717829e-05, "loss": 0.0089, "step": 718960 }, { "epoch": 1.86, "learning_rate": 2.044890754080683e-05, "loss": 0.0106, "step": 718970 }, { "epoch": 1.86, "learning_rate": 2.0445019324435364e-05, "loss": 0.0105, "step": 718980 }, { "epoch": 1.86, "learning_rate": 2.04411311080639e-05, "loss": 0.005, "step": 718990 }, { "epoch": 1.86, "learning_rate": 2.0437242891692434e-05, "loss": 0.0064, "step": 719000 }, { "epoch": 1.86, "eval_cer": 0.8816816917691551, "eval_loss": 0.004639680031687021, "eval_runtime": 107.9354, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.632, "step": 719000 }, { "epoch": 1.86, "learning_rate": 2.0433354675320972e-05, "loss": 0.0082, "step": 719010 }, { "epoch": 1.86, "learning_rate": 2.0429466458949507e-05, "loss": 0.0072, "step": 719020 }, { "epoch": 1.86, "learning_rate": 2.0425578242578042e-05, "loss": 0.0074, "step": 719030 }, { "epoch": 1.86, "learning_rate": 2.0421690026206577e-05, "loss": 0.0079, "step": 719040 }, { "epoch": 1.86, "learning_rate": 2.041780180983511e-05, "loss": 0.0097, "step": 719050 }, { "epoch": 1.86, "learning_rate": 2.041391359346365e-05, "loss": 0.0061, "step": 719060 }, { "epoch": 1.86, "learning_rate": 2.0410025377092185e-05, "loss": 0.0081, "step": 719070 }, { "epoch": 1.86, "learning_rate": 2.0406137160720716e-05, "loss": 0.0053, "step": 719080 }, { "epoch": 1.86, "learning_rate": 2.040224894434925e-05, "loss": 0.0064, "step": 719090 }, { "epoch": 1.86, "learning_rate": 2.0398360727977786e-05, "loss": 0.0054, "step": 719100 }, { "epoch": 1.86, "learning_rate": 2.0394472511606324e-05, "loss": 0.0064, "step": 719110 }, { "epoch": 1.86, "learning_rate": 2.039058429523486e-05, "loss": 0.0085, "step": 719120 }, { "epoch": 1.86, "learning_rate": 2.0386696078863394e-05, "loss": 0.0065, "step": 719130 }, { "epoch": 1.86, "learning_rate": 2.038280786249193e-05, "loss": 0.0088, "step": 719140 }, { "epoch": 1.86, "learning_rate": 2.0378919646120467e-05, "loss": 0.0072, "step": 719150 }, { "epoch": 1.86, "learning_rate": 2.0375031429749002e-05, "loss": 0.0102, "step": 719160 }, { "epoch": 1.86, "learning_rate": 2.0371143213377537e-05, "loss": 0.0078, "step": 719170 }, { "epoch": 1.86, "learning_rate": 2.036725499700607e-05, "loss": 0.0067, "step": 719180 }, { "epoch": 1.86, "learning_rate": 2.036336678063461e-05, "loss": 0.0082, "step": 719190 }, { "epoch": 1.86, "learning_rate": 2.035947856426314e-05, "loss": 0.0064, "step": 719200 }, { "epoch": 1.86, "learning_rate": 2.0355590347891676e-05, "loss": 0.0081, "step": 719210 }, { "epoch": 1.86, "learning_rate": 2.035170213152021e-05, "loss": 0.0051, "step": 719220 }, { "epoch": 1.86, "learning_rate": 2.0347813915148746e-05, "loss": 0.0073, "step": 719230 }, { "epoch": 1.86, "learning_rate": 2.0343925698777284e-05, "loss": 0.0054, "step": 719240 }, { "epoch": 1.86, "learning_rate": 2.034003748240582e-05, "loss": 0.0083, "step": 719250 }, { "epoch": 1.86, "learning_rate": 2.0336149266034354e-05, "loss": 0.0082, "step": 719260 }, { "epoch": 1.86, "learning_rate": 2.033226104966289e-05, "loss": 0.0072, "step": 719270 }, { "epoch": 1.86, "learning_rate": 2.0328372833291427e-05, "loss": 0.0074, "step": 719280 }, { "epoch": 1.86, "learning_rate": 2.0324484616919962e-05, "loss": 0.0044, "step": 719290 }, { "epoch": 1.86, "learning_rate": 2.0320596400548497e-05, "loss": 0.0086, "step": 719300 }, { "epoch": 1.86, "learning_rate": 2.031670818417703e-05, "loss": 0.0092, "step": 719310 }, { "epoch": 1.86, "learning_rate": 2.031281996780557e-05, "loss": 0.0109, "step": 719320 }, { "epoch": 1.86, "learning_rate": 2.03089317514341e-05, "loss": 0.0071, "step": 719330 }, { "epoch": 1.86, "learning_rate": 2.0305043535062636e-05, "loss": 0.0076, "step": 719340 }, { "epoch": 1.86, "learning_rate": 2.030115531869117e-05, "loss": 0.0078, "step": 719350 }, { "epoch": 1.86, "learning_rate": 2.0297267102319706e-05, "loss": 0.0081, "step": 719360 }, { "epoch": 1.86, "learning_rate": 2.0293378885948244e-05, "loss": 0.0087, "step": 719370 }, { "epoch": 1.86, "learning_rate": 2.028949066957678e-05, "loss": 0.0076, "step": 719380 }, { "epoch": 1.86, "learning_rate": 2.0285602453205314e-05, "loss": 0.0101, "step": 719390 }, { "epoch": 1.86, "learning_rate": 2.028171423683385e-05, "loss": 0.0074, "step": 719400 }, { "epoch": 1.86, "learning_rate": 2.0277826020462387e-05, "loss": 0.0082, "step": 719410 }, { "epoch": 1.86, "learning_rate": 2.027393780409092e-05, "loss": 0.0074, "step": 719420 }, { "epoch": 1.86, "learning_rate": 2.0270049587719457e-05, "loss": 0.0077, "step": 719430 }, { "epoch": 1.86, "learning_rate": 2.026616137134799e-05, "loss": 0.0128, "step": 719440 }, { "epoch": 1.86, "learning_rate": 2.0262273154976523e-05, "loss": 0.007, "step": 719450 }, { "epoch": 1.86, "learning_rate": 2.025838493860506e-05, "loss": 0.0095, "step": 719460 }, { "epoch": 1.86, "learning_rate": 2.0254496722233596e-05, "loss": 0.0055, "step": 719470 }, { "epoch": 1.86, "learning_rate": 2.025060850586213e-05, "loss": 0.0106, "step": 719480 }, { "epoch": 1.87, "learning_rate": 2.0246720289490666e-05, "loss": 0.0099, "step": 719490 }, { "epoch": 1.87, "learning_rate": 2.0242832073119204e-05, "loss": 0.0081, "step": 719500 }, { "epoch": 1.87, "learning_rate": 2.023894385674774e-05, "loss": 0.0066, "step": 719510 }, { "epoch": 1.87, "learning_rate": 2.0235055640376274e-05, "loss": 0.0065, "step": 719520 }, { "epoch": 1.87, "learning_rate": 2.023116742400481e-05, "loss": 0.0084, "step": 719530 }, { "epoch": 1.87, "learning_rate": 2.0227279207633347e-05, "loss": 0.0058, "step": 719540 }, { "epoch": 1.87, "learning_rate": 2.022339099126188e-05, "loss": 0.0082, "step": 719550 }, { "epoch": 1.87, "learning_rate": 2.0219502774890417e-05, "loss": 0.0075, "step": 719560 }, { "epoch": 1.87, "learning_rate": 2.021561455851895e-05, "loss": 0.0071, "step": 719570 }, { "epoch": 1.87, "learning_rate": 2.0211726342147483e-05, "loss": 0.0052, "step": 719580 }, { "epoch": 1.87, "learning_rate": 2.020783812577602e-05, "loss": 0.0109, "step": 719590 }, { "epoch": 1.87, "learning_rate": 2.0203949909404556e-05, "loss": 0.0092, "step": 719600 }, { "epoch": 1.87, "learning_rate": 2.020006169303309e-05, "loss": 0.0067, "step": 719610 }, { "epoch": 1.87, "learning_rate": 2.0196173476661626e-05, "loss": 0.0096, "step": 719620 }, { "epoch": 1.87, "learning_rate": 2.0192285260290164e-05, "loss": 0.0094, "step": 719630 }, { "epoch": 1.87, "learning_rate": 2.01883970439187e-05, "loss": 0.0071, "step": 719640 }, { "epoch": 1.87, "learning_rate": 2.0184508827547234e-05, "loss": 0.0107, "step": 719650 }, { "epoch": 1.87, "learning_rate": 2.018062061117577e-05, "loss": 0.0072, "step": 719660 }, { "epoch": 1.87, "learning_rate": 2.0176732394804307e-05, "loss": 0.0073, "step": 719670 }, { "epoch": 1.87, "learning_rate": 2.017284417843284e-05, "loss": 0.0098, "step": 719680 }, { "epoch": 1.87, "learning_rate": 2.0168955962061376e-05, "loss": 0.0074, "step": 719690 }, { "epoch": 1.87, "learning_rate": 2.0165067745689908e-05, "loss": 0.0073, "step": 719700 }, { "epoch": 1.87, "learning_rate": 2.0161179529318443e-05, "loss": 0.0052, "step": 719710 }, { "epoch": 1.87, "learning_rate": 2.015729131294698e-05, "loss": 0.0071, "step": 719720 }, { "epoch": 1.87, "learning_rate": 2.0153403096575516e-05, "loss": 0.0095, "step": 719730 }, { "epoch": 1.87, "learning_rate": 2.014951488020405e-05, "loss": 0.0068, "step": 719740 }, { "epoch": 1.87, "learning_rate": 2.0145626663832586e-05, "loss": 0.005, "step": 719750 }, { "epoch": 1.87, "learning_rate": 2.0141738447461124e-05, "loss": 0.0058, "step": 719760 }, { "epoch": 1.87, "learning_rate": 2.013785023108966e-05, "loss": 0.0069, "step": 719770 }, { "epoch": 1.87, "learning_rate": 2.0133962014718194e-05, "loss": 0.0053, "step": 719780 }, { "epoch": 1.87, "learning_rate": 2.013007379834673e-05, "loss": 0.012, "step": 719790 }, { "epoch": 1.87, "learning_rate": 2.0126185581975267e-05, "loss": 0.0067, "step": 719800 }, { "epoch": 1.87, "learning_rate": 2.01222973656038e-05, "loss": 0.0084, "step": 719810 }, { "epoch": 1.87, "learning_rate": 2.0118409149232333e-05, "loss": 0.0079, "step": 719820 }, { "epoch": 1.87, "learning_rate": 2.0114520932860868e-05, "loss": 0.0071, "step": 719830 }, { "epoch": 1.87, "learning_rate": 2.0110632716489403e-05, "loss": 0.0078, "step": 719840 }, { "epoch": 1.87, "learning_rate": 2.010674450011794e-05, "loss": 0.01, "step": 719850 }, { "epoch": 1.87, "learning_rate": 2.0102856283746476e-05, "loss": 0.0052, "step": 719860 }, { "epoch": 1.87, "learning_rate": 2.009896806737501e-05, "loss": 0.0065, "step": 719870 }, { "epoch": 1.87, "learning_rate": 2.0095079851003546e-05, "loss": 0.0071, "step": 719880 }, { "epoch": 1.87, "learning_rate": 2.0091191634632084e-05, "loss": 0.0101, "step": 719890 }, { "epoch": 1.87, "learning_rate": 2.008730341826062e-05, "loss": 0.0063, "step": 719900 }, { "epoch": 1.87, "learning_rate": 2.0083415201889154e-05, "loss": 0.009, "step": 719910 }, { "epoch": 1.87, "learning_rate": 2.007952698551769e-05, "loss": 0.0077, "step": 719920 }, { "epoch": 1.87, "learning_rate": 2.0075638769146227e-05, "loss": 0.0072, "step": 719930 }, { "epoch": 1.87, "learning_rate": 2.007175055277476e-05, "loss": 0.0083, "step": 719940 }, { "epoch": 1.87, "learning_rate": 2.0067862336403293e-05, "loss": 0.0061, "step": 719950 }, { "epoch": 1.87, "learning_rate": 2.0063974120031828e-05, "loss": 0.008, "step": 719960 }, { "epoch": 1.87, "learning_rate": 2.0060085903660363e-05, "loss": 0.008, "step": 719970 }, { "epoch": 1.87, "learning_rate": 2.00561976872889e-05, "loss": 0.0061, "step": 719980 }, { "epoch": 1.87, "learning_rate": 2.0052309470917436e-05, "loss": 0.0077, "step": 719990 }, { "epoch": 1.87, "learning_rate": 2.004842125454597e-05, "loss": 0.0043, "step": 720000 }, { "epoch": 1.87, "eval_cer": 0.8816858906799576, "eval_loss": 0.004609877709299326, "eval_runtime": 107.6819, "eval_samples_per_second": 18.573, "eval_steps_per_second": 4.643, "step": 720000 }, { "epoch": 1.87, "learning_rate": 2.0044533038174506e-05, "loss": 0.0063, "step": 720010 }, { "epoch": 1.87, "learning_rate": 2.0040644821803044e-05, "loss": 0.008, "step": 720020 }, { "epoch": 1.87, "learning_rate": 2.003675660543158e-05, "loss": 0.0078, "step": 720030 }, { "epoch": 1.87, "learning_rate": 2.0032868389060114e-05, "loss": 0.0081, "step": 720040 }, { "epoch": 1.87, "learning_rate": 2.002898017268865e-05, "loss": 0.01, "step": 720050 }, { "epoch": 1.87, "learning_rate": 2.0025091956317187e-05, "loss": 0.0063, "step": 720060 }, { "epoch": 1.87, "learning_rate": 2.0021203739945718e-05, "loss": 0.006, "step": 720070 }, { "epoch": 1.87, "learning_rate": 2.0017315523574253e-05, "loss": 0.0062, "step": 720080 }, { "epoch": 1.87, "learning_rate": 2.0013427307202788e-05, "loss": 0.0067, "step": 720090 }, { "epoch": 1.87, "learning_rate": 2.0009539090831323e-05, "loss": 0.0106, "step": 720100 }, { "epoch": 1.87, "learning_rate": 2.000565087445986e-05, "loss": 0.0111, "step": 720110 }, { "epoch": 1.87, "learning_rate": 2.0001762658088396e-05, "loss": 0.0089, "step": 720120 }, { "epoch": 1.87, "learning_rate": 1.999787444171693e-05, "loss": 0.0069, "step": 720130 }, { "epoch": 1.87, "learning_rate": 1.9993986225345466e-05, "loss": 0.0092, "step": 720140 }, { "epoch": 1.87, "learning_rate": 1.9990098008974004e-05, "loss": 0.0071, "step": 720150 }, { "epoch": 1.87, "learning_rate": 1.998620979260254e-05, "loss": 0.0106, "step": 720160 }, { "epoch": 1.87, "learning_rate": 1.9982321576231074e-05, "loss": 0.0101, "step": 720170 }, { "epoch": 1.87, "learning_rate": 1.997843335985961e-05, "loss": 0.0053, "step": 720180 }, { "epoch": 1.87, "learning_rate": 1.9974545143488147e-05, "loss": 0.0063, "step": 720190 }, { "epoch": 1.87, "learning_rate": 1.9970656927116678e-05, "loss": 0.0065, "step": 720200 }, { "epoch": 1.87, "learning_rate": 1.9966768710745213e-05, "loss": 0.0062, "step": 720210 }, { "epoch": 1.87, "learning_rate": 1.9962880494373748e-05, "loss": 0.0091, "step": 720220 }, { "epoch": 1.87, "learning_rate": 1.9958992278002283e-05, "loss": 0.0071, "step": 720230 }, { "epoch": 1.87, "learning_rate": 1.995510406163082e-05, "loss": 0.0087, "step": 720240 }, { "epoch": 1.87, "learning_rate": 1.9951215845259356e-05, "loss": 0.0065, "step": 720250 }, { "epoch": 1.87, "learning_rate": 1.994732762888789e-05, "loss": 0.0101, "step": 720260 }, { "epoch": 1.87, "learning_rate": 1.9943439412516426e-05, "loss": 0.0073, "step": 720270 }, { "epoch": 1.87, "learning_rate": 1.9939551196144964e-05, "loss": 0.006, "step": 720280 }, { "epoch": 1.87, "learning_rate": 1.99356629797735e-05, "loss": 0.005, "step": 720290 }, { "epoch": 1.87, "learning_rate": 1.9931774763402034e-05, "loss": 0.0062, "step": 720300 }, { "epoch": 1.87, "learning_rate": 1.992788654703057e-05, "loss": 0.0067, "step": 720310 }, { "epoch": 1.87, "learning_rate": 1.99239983306591e-05, "loss": 0.0087, "step": 720320 }, { "epoch": 1.87, "learning_rate": 1.9920110114287638e-05, "loss": 0.0078, "step": 720330 }, { "epoch": 1.87, "learning_rate": 1.9916221897916173e-05, "loss": 0.0062, "step": 720340 }, { "epoch": 1.87, "learning_rate": 1.9912333681544708e-05, "loss": 0.0055, "step": 720350 }, { "epoch": 1.87, "learning_rate": 1.9908445465173243e-05, "loss": 0.0079, "step": 720360 }, { "epoch": 1.87, "learning_rate": 1.990455724880178e-05, "loss": 0.0062, "step": 720370 }, { "epoch": 1.87, "learning_rate": 1.9900669032430316e-05, "loss": 0.0064, "step": 720380 }, { "epoch": 1.87, "learning_rate": 1.989678081605885e-05, "loss": 0.0099, "step": 720390 }, { "epoch": 1.87, "learning_rate": 1.9892892599687386e-05, "loss": 0.0068, "step": 720400 }, { "epoch": 1.87, "learning_rate": 1.9889004383315924e-05, "loss": 0.0097, "step": 720410 }, { "epoch": 1.87, "learning_rate": 1.988511616694446e-05, "loss": 0.0069, "step": 720420 }, { "epoch": 1.87, "learning_rate": 1.9881227950572994e-05, "loss": 0.0113, "step": 720430 }, { "epoch": 1.87, "learning_rate": 1.9877339734201525e-05, "loss": 0.0058, "step": 720440 }, { "epoch": 1.87, "learning_rate": 1.987345151783006e-05, "loss": 0.007, "step": 720450 }, { "epoch": 1.87, "learning_rate": 1.9869563301458598e-05, "loss": 0.0076, "step": 720460 }, { "epoch": 1.87, "learning_rate": 1.9865675085087133e-05, "loss": 0.0065, "step": 720470 }, { "epoch": 1.87, "learning_rate": 1.9861786868715668e-05, "loss": 0.0079, "step": 720480 }, { "epoch": 1.87, "learning_rate": 1.9857898652344203e-05, "loss": 0.007, "step": 720490 }, { "epoch": 1.87, "learning_rate": 1.9854010435972738e-05, "loss": 0.0132, "step": 720500 }, { "epoch": 1.87, "learning_rate": 1.9850122219601276e-05, "loss": 0.0084, "step": 720510 }, { "epoch": 1.87, "learning_rate": 1.984623400322981e-05, "loss": 0.0061, "step": 720520 }, { "epoch": 1.87, "learning_rate": 1.9842345786858346e-05, "loss": 0.0078, "step": 720530 }, { "epoch": 1.87, "learning_rate": 1.983845757048688e-05, "loss": 0.0065, "step": 720540 }, { "epoch": 1.87, "learning_rate": 1.983456935411542e-05, "loss": 0.0058, "step": 720550 }, { "epoch": 1.87, "learning_rate": 1.9830681137743953e-05, "loss": 0.007, "step": 720560 }, { "epoch": 1.87, "learning_rate": 1.9826792921372485e-05, "loss": 0.0096, "step": 720570 }, { "epoch": 1.87, "learning_rate": 1.982290470500102e-05, "loss": 0.0049, "step": 720580 }, { "epoch": 1.87, "learning_rate": 1.9819016488629555e-05, "loss": 0.0069, "step": 720590 }, { "epoch": 1.87, "learning_rate": 1.9815128272258093e-05, "loss": 0.0075, "step": 720600 }, { "epoch": 1.87, "learning_rate": 1.9811240055886628e-05, "loss": 0.0076, "step": 720610 }, { "epoch": 1.87, "learning_rate": 1.9807351839515163e-05, "loss": 0.0076, "step": 720620 }, { "epoch": 1.87, "learning_rate": 1.9803463623143698e-05, "loss": 0.0059, "step": 720630 }, { "epoch": 1.87, "learning_rate": 1.9799575406772236e-05, "loss": 0.0074, "step": 720640 }, { "epoch": 1.87, "learning_rate": 1.979568719040077e-05, "loss": 0.0086, "step": 720650 }, { "epoch": 1.87, "learning_rate": 1.9791798974029305e-05, "loss": 0.0068, "step": 720660 }, { "epoch": 1.87, "learning_rate": 1.978791075765784e-05, "loss": 0.0072, "step": 720670 }, { "epoch": 1.87, "learning_rate": 1.978402254128638e-05, "loss": 0.0072, "step": 720680 }, { "epoch": 1.87, "learning_rate": 1.978013432491491e-05, "loss": 0.0064, "step": 720690 }, { "epoch": 1.87, "learning_rate": 1.9776246108543445e-05, "loss": 0.0074, "step": 720700 }, { "epoch": 1.87, "learning_rate": 1.977235789217198e-05, "loss": 0.008, "step": 720710 }, { "epoch": 1.87, "learning_rate": 1.9768469675800515e-05, "loss": 0.0083, "step": 720720 }, { "epoch": 1.87, "learning_rate": 1.9764581459429053e-05, "loss": 0.0079, "step": 720730 }, { "epoch": 1.87, "learning_rate": 1.9760693243057588e-05, "loss": 0.0115, "step": 720740 }, { "epoch": 1.87, "learning_rate": 1.9756805026686123e-05, "loss": 0.0095, "step": 720750 }, { "epoch": 1.87, "learning_rate": 1.9752916810314657e-05, "loss": 0.0072, "step": 720760 }, { "epoch": 1.87, "learning_rate": 1.9749028593943196e-05, "loss": 0.0081, "step": 720770 }, { "epoch": 1.87, "learning_rate": 1.974514037757173e-05, "loss": 0.0057, "step": 720780 }, { "epoch": 1.87, "learning_rate": 1.9741252161200265e-05, "loss": 0.0076, "step": 720790 }, { "epoch": 1.87, "learning_rate": 1.97373639448288e-05, "loss": 0.0056, "step": 720800 }, { "epoch": 1.87, "learning_rate": 1.973347572845734e-05, "loss": 0.0057, "step": 720810 }, { "epoch": 1.87, "learning_rate": 1.972958751208587e-05, "loss": 0.0061, "step": 720820 }, { "epoch": 1.87, "learning_rate": 1.9725699295714405e-05, "loss": 0.0051, "step": 720830 }, { "epoch": 1.87, "learning_rate": 1.972181107934294e-05, "loss": 0.007, "step": 720840 }, { "epoch": 1.87, "learning_rate": 1.9717922862971475e-05, "loss": 0.0054, "step": 720850 }, { "epoch": 1.87, "learning_rate": 1.9714034646600013e-05, "loss": 0.0074, "step": 720860 }, { "epoch": 1.87, "learning_rate": 1.9710146430228548e-05, "loss": 0.0084, "step": 720870 }, { "epoch": 1.87, "learning_rate": 1.9706258213857083e-05, "loss": 0.0086, "step": 720880 }, { "epoch": 1.87, "learning_rate": 1.9702369997485617e-05, "loss": 0.0077, "step": 720890 }, { "epoch": 1.87, "learning_rate": 1.9698481781114156e-05, "loss": 0.0076, "step": 720900 }, { "epoch": 1.87, "learning_rate": 1.969459356474269e-05, "loss": 0.0074, "step": 720910 }, { "epoch": 1.87, "learning_rate": 1.9690705348371225e-05, "loss": 0.0072, "step": 720920 }, { "epoch": 1.87, "learning_rate": 1.968681713199976e-05, "loss": 0.0068, "step": 720930 }, { "epoch": 1.87, "learning_rate": 1.9682928915628292e-05, "loss": 0.0075, "step": 720940 }, { "epoch": 1.87, "learning_rate": 1.967904069925683e-05, "loss": 0.0086, "step": 720950 }, { "epoch": 1.87, "learning_rate": 1.9675152482885365e-05, "loss": 0.0089, "step": 720960 }, { "epoch": 1.87, "learning_rate": 1.96712642665139e-05, "loss": 0.0059, "step": 720970 }, { "epoch": 1.87, "learning_rate": 1.9667376050142435e-05, "loss": 0.007, "step": 720980 }, { "epoch": 1.87, "learning_rate": 1.9663487833770973e-05, "loss": 0.0065, "step": 720990 }, { "epoch": 1.87, "learning_rate": 1.9659599617399508e-05, "loss": 0.0056, "step": 721000 }, { "epoch": 1.87, "eval_cer": 0.881688689953826, "eval_loss": 0.004578019957989454, "eval_runtime": 107.5931, "eval_samples_per_second": 18.589, "eval_steps_per_second": 4.647, "step": 721000 }, { "epoch": 1.87, "learning_rate": 1.9655711401028043e-05, "loss": 0.008, "step": 721010 }, { "epoch": 1.87, "learning_rate": 1.9651823184656577e-05, "loss": 0.0082, "step": 721020 }, { "epoch": 1.87, "learning_rate": 1.9647934968285116e-05, "loss": 0.0098, "step": 721030 }, { "epoch": 1.87, "learning_rate": 1.964404675191365e-05, "loss": 0.0103, "step": 721040 }, { "epoch": 1.87, "learning_rate": 1.9640158535542185e-05, "loss": 0.0064, "step": 721050 }, { "epoch": 1.87, "learning_rate": 1.9636270319170717e-05, "loss": 0.0061, "step": 721060 }, { "epoch": 1.87, "learning_rate": 1.9632382102799252e-05, "loss": 0.0079, "step": 721070 }, { "epoch": 1.87, "learning_rate": 1.962849388642779e-05, "loss": 0.0061, "step": 721080 }, { "epoch": 1.87, "learning_rate": 1.9624605670056325e-05, "loss": 0.0079, "step": 721090 }, { "epoch": 1.87, "learning_rate": 1.962071745368486e-05, "loss": 0.0054, "step": 721100 }, { "epoch": 1.87, "learning_rate": 1.9616829237313395e-05, "loss": 0.0077, "step": 721110 }, { "epoch": 1.87, "learning_rate": 1.9612941020941933e-05, "loss": 0.007, "step": 721120 }, { "epoch": 1.87, "learning_rate": 1.9609052804570468e-05, "loss": 0.0075, "step": 721130 }, { "epoch": 1.87, "learning_rate": 1.9605164588199003e-05, "loss": 0.008, "step": 721140 }, { "epoch": 1.87, "learning_rate": 1.9601276371827537e-05, "loss": 0.0082, "step": 721150 }, { "epoch": 1.87, "learning_rate": 1.9597388155456076e-05, "loss": 0.0077, "step": 721160 }, { "epoch": 1.87, "learning_rate": 1.959349993908461e-05, "loss": 0.0062, "step": 721170 }, { "epoch": 1.87, "learning_rate": 1.9589611722713145e-05, "loss": 0.0073, "step": 721180 }, { "epoch": 1.87, "learning_rate": 1.9585723506341677e-05, "loss": 0.0067, "step": 721190 }, { "epoch": 1.87, "learning_rate": 1.9581835289970212e-05, "loss": 0.0074, "step": 721200 }, { "epoch": 1.87, "learning_rate": 1.957794707359875e-05, "loss": 0.0053, "step": 721210 }, { "epoch": 1.87, "learning_rate": 1.9574058857227285e-05, "loss": 0.006, "step": 721220 }, { "epoch": 1.87, "learning_rate": 1.957017064085582e-05, "loss": 0.0089, "step": 721230 }, { "epoch": 1.87, "learning_rate": 1.9566282424484355e-05, "loss": 0.0084, "step": 721240 }, { "epoch": 1.87, "learning_rate": 1.9562394208112893e-05, "loss": 0.0109, "step": 721250 }, { "epoch": 1.87, "learning_rate": 1.9558505991741428e-05, "loss": 0.0072, "step": 721260 }, { "epoch": 1.87, "learning_rate": 1.9554617775369963e-05, "loss": 0.0075, "step": 721270 }, { "epoch": 1.87, "learning_rate": 1.9550729558998497e-05, "loss": 0.0076, "step": 721280 }, { "epoch": 1.87, "learning_rate": 1.9546841342627036e-05, "loss": 0.0065, "step": 721290 }, { "epoch": 1.87, "learning_rate": 1.954295312625557e-05, "loss": 0.0057, "step": 721300 }, { "epoch": 1.87, "learning_rate": 1.9539064909884102e-05, "loss": 0.008, "step": 721310 }, { "epoch": 1.87, "learning_rate": 1.9535176693512637e-05, "loss": 0.0058, "step": 721320 }, { "epoch": 1.87, "learning_rate": 1.9531288477141172e-05, "loss": 0.0063, "step": 721330 }, { "epoch": 1.87, "learning_rate": 1.952740026076971e-05, "loss": 0.0097, "step": 721340 }, { "epoch": 1.87, "learning_rate": 1.9523512044398245e-05, "loss": 0.0123, "step": 721350 }, { "epoch": 1.87, "learning_rate": 1.951962382802678e-05, "loss": 0.0094, "step": 721360 }, { "epoch": 1.87, "learning_rate": 1.9515735611655315e-05, "loss": 0.0084, "step": 721370 }, { "epoch": 1.87, "learning_rate": 1.9511847395283853e-05, "loss": 0.0064, "step": 721380 }, { "epoch": 1.87, "learning_rate": 1.9507959178912388e-05, "loss": 0.0068, "step": 721390 }, { "epoch": 1.87, "learning_rate": 1.9504070962540923e-05, "loss": 0.0065, "step": 721400 }, { "epoch": 1.87, "learning_rate": 1.9500182746169457e-05, "loss": 0.0065, "step": 721410 }, { "epoch": 1.87, "learning_rate": 1.9496294529797996e-05, "loss": 0.0087, "step": 721420 }, { "epoch": 1.87, "learning_rate": 1.949240631342653e-05, "loss": 0.0069, "step": 721430 }, { "epoch": 1.87, "learning_rate": 1.9488518097055062e-05, "loss": 0.0072, "step": 721440 }, { "epoch": 1.87, "learning_rate": 1.9484629880683597e-05, "loss": 0.0056, "step": 721450 }, { "epoch": 1.87, "learning_rate": 1.948074166431213e-05, "loss": 0.0092, "step": 721460 }, { "epoch": 1.87, "learning_rate": 1.947685344794067e-05, "loss": 0.0068, "step": 721470 }, { "epoch": 1.87, "learning_rate": 1.9472965231569205e-05, "loss": 0.0068, "step": 721480 }, { "epoch": 1.87, "learning_rate": 1.946907701519774e-05, "loss": 0.008, "step": 721490 }, { "epoch": 1.87, "learning_rate": 1.9465188798826275e-05, "loss": 0.009, "step": 721500 }, { "epoch": 1.87, "learning_rate": 1.9461300582454813e-05, "loss": 0.0083, "step": 721510 }, { "epoch": 1.87, "learning_rate": 1.9457412366083348e-05, "loss": 0.0053, "step": 721520 }, { "epoch": 1.87, "learning_rate": 1.9453524149711882e-05, "loss": 0.0075, "step": 721530 }, { "epoch": 1.87, "learning_rate": 1.9449635933340417e-05, "loss": 0.0081, "step": 721540 }, { "epoch": 1.87, "learning_rate": 1.9445747716968956e-05, "loss": 0.0057, "step": 721550 }, { "epoch": 1.87, "learning_rate": 1.9441859500597487e-05, "loss": 0.0081, "step": 721560 }, { "epoch": 1.87, "learning_rate": 1.9437971284226022e-05, "loss": 0.0086, "step": 721570 }, { "epoch": 1.87, "learning_rate": 1.9434083067854557e-05, "loss": 0.0064, "step": 721580 }, { "epoch": 1.87, "learning_rate": 1.943019485148309e-05, "loss": 0.0072, "step": 721590 }, { "epoch": 1.87, "learning_rate": 1.942630663511163e-05, "loss": 0.0061, "step": 721600 }, { "epoch": 1.87, "learning_rate": 1.9422418418740165e-05, "loss": 0.0078, "step": 721610 }, { "epoch": 1.87, "learning_rate": 1.94185302023687e-05, "loss": 0.0074, "step": 721620 }, { "epoch": 1.87, "learning_rate": 1.9414641985997234e-05, "loss": 0.0125, "step": 721630 }, { "epoch": 1.87, "learning_rate": 1.9410753769625773e-05, "loss": 0.0065, "step": 721640 }, { "epoch": 1.87, "learning_rate": 1.9406865553254308e-05, "loss": 0.0084, "step": 721650 }, { "epoch": 1.87, "learning_rate": 1.9402977336882842e-05, "loss": 0.0064, "step": 721660 }, { "epoch": 1.87, "learning_rate": 1.9399089120511377e-05, "loss": 0.0052, "step": 721670 }, { "epoch": 1.87, "learning_rate": 1.9395200904139916e-05, "loss": 0.0062, "step": 721680 }, { "epoch": 1.87, "learning_rate": 1.9391312687768447e-05, "loss": 0.0094, "step": 721690 }, { "epoch": 1.87, "learning_rate": 1.9387424471396982e-05, "loss": 0.0079, "step": 721700 }, { "epoch": 1.87, "learning_rate": 1.9383536255025517e-05, "loss": 0.0107, "step": 721710 }, { "epoch": 1.87, "learning_rate": 1.937964803865405e-05, "loss": 0.0045, "step": 721720 }, { "epoch": 1.87, "learning_rate": 1.937575982228259e-05, "loss": 0.0081, "step": 721730 }, { "epoch": 1.87, "learning_rate": 1.9371871605911125e-05, "loss": 0.007, "step": 721740 }, { "epoch": 1.87, "learning_rate": 1.936798338953966e-05, "loss": 0.0085, "step": 721750 }, { "epoch": 1.87, "learning_rate": 1.9364095173168194e-05, "loss": 0.0079, "step": 721760 }, { "epoch": 1.87, "learning_rate": 1.9360206956796733e-05, "loss": 0.0099, "step": 721770 }, { "epoch": 1.87, "learning_rate": 1.9356318740425268e-05, "loss": 0.0076, "step": 721780 }, { "epoch": 1.87, "learning_rate": 1.9352430524053802e-05, "loss": 0.0052, "step": 721790 }, { "epoch": 1.87, "learning_rate": 1.9348542307682337e-05, "loss": 0.0065, "step": 721800 }, { "epoch": 1.87, "learning_rate": 1.934465409131087e-05, "loss": 0.0089, "step": 721810 }, { "epoch": 1.87, "learning_rate": 1.9340765874939407e-05, "loss": 0.0068, "step": 721820 }, { "epoch": 1.87, "learning_rate": 1.9336877658567942e-05, "loss": 0.0086, "step": 721830 }, { "epoch": 1.87, "learning_rate": 1.9332989442196477e-05, "loss": 0.0073, "step": 721840 }, { "epoch": 1.87, "learning_rate": 1.932910122582501e-05, "loss": 0.0108, "step": 721850 }, { "epoch": 1.87, "learning_rate": 1.932521300945355e-05, "loss": 0.0064, "step": 721860 }, { "epoch": 1.87, "learning_rate": 1.9321324793082085e-05, "loss": 0.0092, "step": 721870 }, { "epoch": 1.87, "learning_rate": 1.931743657671062e-05, "loss": 0.0088, "step": 721880 }, { "epoch": 1.87, "learning_rate": 1.9313548360339154e-05, "loss": 0.0062, "step": 721890 }, { "epoch": 1.87, "learning_rate": 1.930966014396769e-05, "loss": 0.0069, "step": 721900 }, { "epoch": 1.87, "learning_rate": 1.9305771927596228e-05, "loss": 0.0088, "step": 721910 }, { "epoch": 1.87, "learning_rate": 1.9301883711224762e-05, "loss": 0.0066, "step": 721920 }, { "epoch": 1.87, "learning_rate": 1.9297995494853294e-05, "loss": 0.0076, "step": 721930 }, { "epoch": 1.87, "learning_rate": 1.929410727848183e-05, "loss": 0.0081, "step": 721940 }, { "epoch": 1.87, "learning_rate": 1.9290219062110364e-05, "loss": 0.0074, "step": 721950 }, { "epoch": 1.87, "learning_rate": 1.9286330845738902e-05, "loss": 0.0081, "step": 721960 }, { "epoch": 1.87, "learning_rate": 1.9282442629367437e-05, "loss": 0.0066, "step": 721970 }, { "epoch": 1.87, "learning_rate": 1.927855441299597e-05, "loss": 0.0085, "step": 721980 }, { "epoch": 1.87, "learning_rate": 1.9274666196624506e-05, "loss": 0.0044, "step": 721990 }, { "epoch": 1.87, "learning_rate": 1.9270777980253045e-05, "loss": 0.0066, "step": 722000 }, { "epoch": 1.87, "eval_cer": 0.8816718943106159, "eval_loss": 0.004583498928695917, "eval_runtime": 107.8568, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 722000 }, { "epoch": 1.87, "learning_rate": 1.926688976388158e-05, "loss": 0.0056, "step": 722010 }, { "epoch": 1.87, "learning_rate": 1.9263001547510114e-05, "loss": 0.0065, "step": 722020 }, { "epoch": 1.87, "learning_rate": 1.925911333113865e-05, "loss": 0.0063, "step": 722030 }, { "epoch": 1.87, "learning_rate": 1.9255225114767188e-05, "loss": 0.0082, "step": 722040 }, { "epoch": 1.87, "learning_rate": 1.9251336898395722e-05, "loss": 0.0068, "step": 722050 }, { "epoch": 1.87, "learning_rate": 1.9247448682024254e-05, "loss": 0.0073, "step": 722060 }, { "epoch": 1.87, "learning_rate": 1.924356046565279e-05, "loss": 0.007, "step": 722070 }, { "epoch": 1.87, "learning_rate": 1.9239672249281324e-05, "loss": 0.0084, "step": 722080 }, { "epoch": 1.87, "learning_rate": 1.9235784032909862e-05, "loss": 0.011, "step": 722090 }, { "epoch": 1.87, "learning_rate": 1.9231895816538397e-05, "loss": 0.0075, "step": 722100 }, { "epoch": 1.87, "learning_rate": 1.922800760016693e-05, "loss": 0.006, "step": 722110 }, { "epoch": 1.87, "learning_rate": 1.9224119383795466e-05, "loss": 0.0069, "step": 722120 }, { "epoch": 1.87, "learning_rate": 1.9220231167424005e-05, "loss": 0.0086, "step": 722130 }, { "epoch": 1.87, "learning_rate": 1.921634295105254e-05, "loss": 0.0074, "step": 722140 }, { "epoch": 1.87, "learning_rate": 1.9212454734681074e-05, "loss": 0.0049, "step": 722150 }, { "epoch": 1.87, "learning_rate": 1.920856651830961e-05, "loss": 0.0076, "step": 722160 }, { "epoch": 1.87, "learning_rate": 1.9204678301938148e-05, "loss": 0.0085, "step": 722170 }, { "epoch": 1.87, "learning_rate": 1.920079008556668e-05, "loss": 0.0065, "step": 722180 }, { "epoch": 1.87, "learning_rate": 1.9196901869195214e-05, "loss": 0.0074, "step": 722190 }, { "epoch": 1.87, "learning_rate": 1.919301365282375e-05, "loss": 0.0093, "step": 722200 }, { "epoch": 1.87, "learning_rate": 1.9189125436452284e-05, "loss": 0.008, "step": 722210 }, { "epoch": 1.87, "learning_rate": 1.9185237220080822e-05, "loss": 0.007, "step": 722220 }, { "epoch": 1.87, "learning_rate": 1.9181349003709357e-05, "loss": 0.0076, "step": 722230 }, { "epoch": 1.87, "learning_rate": 1.917746078733789e-05, "loss": 0.0067, "step": 722240 }, { "epoch": 1.87, "learning_rate": 1.9173572570966426e-05, "loss": 0.0058, "step": 722250 }, { "epoch": 1.87, "learning_rate": 1.9169684354594965e-05, "loss": 0.0084, "step": 722260 }, { "epoch": 1.87, "learning_rate": 1.91657961382235e-05, "loss": 0.0093, "step": 722270 }, { "epoch": 1.87, "learning_rate": 1.9161907921852034e-05, "loss": 0.0072, "step": 722280 }, { "epoch": 1.87, "learning_rate": 1.915801970548057e-05, "loss": 0.0069, "step": 722290 }, { "epoch": 1.87, "learning_rate": 1.9154131489109107e-05, "loss": 0.0075, "step": 722300 }, { "epoch": 1.87, "learning_rate": 1.915024327273764e-05, "loss": 0.0093, "step": 722310 }, { "epoch": 1.87, "learning_rate": 1.9146355056366174e-05, "loss": 0.0051, "step": 722320 }, { "epoch": 1.87, "learning_rate": 1.914246683999471e-05, "loss": 0.0067, "step": 722330 }, { "epoch": 1.87, "learning_rate": 1.9138578623623244e-05, "loss": 0.0078, "step": 722340 }, { "epoch": 1.87, "learning_rate": 1.9134690407251782e-05, "loss": 0.0061, "step": 722350 }, { "epoch": 1.87, "learning_rate": 1.9130802190880317e-05, "loss": 0.008, "step": 722360 }, { "epoch": 1.87, "learning_rate": 1.912691397450885e-05, "loss": 0.0064, "step": 722370 }, { "epoch": 1.87, "learning_rate": 1.9123025758137386e-05, "loss": 0.0082, "step": 722380 }, { "epoch": 1.87, "learning_rate": 1.9119137541765925e-05, "loss": 0.0089, "step": 722390 }, { "epoch": 1.87, "learning_rate": 1.911524932539446e-05, "loss": 0.0068, "step": 722400 }, { "epoch": 1.87, "learning_rate": 1.9111361109022994e-05, "loss": 0.0082, "step": 722410 }, { "epoch": 1.87, "learning_rate": 1.910747289265153e-05, "loss": 0.0084, "step": 722420 }, { "epoch": 1.87, "learning_rate": 1.910358467628006e-05, "loss": 0.0099, "step": 722430 }, { "epoch": 1.87, "learning_rate": 1.90996964599086e-05, "loss": 0.0087, "step": 722440 }, { "epoch": 1.87, "learning_rate": 1.9095808243537134e-05, "loss": 0.006, "step": 722450 }, { "epoch": 1.87, "learning_rate": 1.909192002716567e-05, "loss": 0.0063, "step": 722460 }, { "epoch": 1.87, "learning_rate": 1.9088031810794204e-05, "loss": 0.0062, "step": 722470 }, { "epoch": 1.87, "learning_rate": 1.9084143594422742e-05, "loss": 0.0066, "step": 722480 }, { "epoch": 1.87, "learning_rate": 1.9080255378051277e-05, "loss": 0.0062, "step": 722490 }, { "epoch": 1.87, "learning_rate": 1.907636716167981e-05, "loss": 0.0075, "step": 722500 }, { "epoch": 1.87, "learning_rate": 1.9072478945308346e-05, "loss": 0.0066, "step": 722510 }, { "epoch": 1.87, "learning_rate": 1.9068590728936885e-05, "loss": 0.0086, "step": 722520 }, { "epoch": 1.87, "learning_rate": 1.906470251256542e-05, "loss": 0.007, "step": 722530 }, { "epoch": 1.87, "learning_rate": 1.9060814296193954e-05, "loss": 0.0102, "step": 722540 }, { "epoch": 1.87, "learning_rate": 1.9056926079822486e-05, "loss": 0.0079, "step": 722550 }, { "epoch": 1.87, "learning_rate": 1.905303786345102e-05, "loss": 0.0076, "step": 722560 }, { "epoch": 1.87, "learning_rate": 1.904914964707956e-05, "loss": 0.0059, "step": 722570 }, { "epoch": 1.87, "learning_rate": 1.9045261430708094e-05, "loss": 0.0072, "step": 722580 }, { "epoch": 1.87, "learning_rate": 1.904137321433663e-05, "loss": 0.006, "step": 722590 }, { "epoch": 1.87, "learning_rate": 1.9037484997965163e-05, "loss": 0.0072, "step": 722600 }, { "epoch": 1.87, "learning_rate": 1.9033596781593702e-05, "loss": 0.0062, "step": 722610 }, { "epoch": 1.87, "learning_rate": 1.9029708565222237e-05, "loss": 0.007, "step": 722620 }, { "epoch": 1.87, "learning_rate": 1.902582034885077e-05, "loss": 0.007, "step": 722630 }, { "epoch": 1.87, "learning_rate": 1.9021932132479306e-05, "loss": 0.0066, "step": 722640 }, { "epoch": 1.87, "learning_rate": 1.9018043916107845e-05, "loss": 0.0059, "step": 722650 }, { "epoch": 1.87, "learning_rate": 1.901415569973638e-05, "loss": 0.0087, "step": 722660 }, { "epoch": 1.87, "learning_rate": 1.9010267483364914e-05, "loss": 0.007, "step": 722670 }, { "epoch": 1.87, "learning_rate": 1.9006379266993446e-05, "loss": 0.0065, "step": 722680 }, { "epoch": 1.87, "learning_rate": 1.900249105062198e-05, "loss": 0.0091, "step": 722690 }, { "epoch": 1.87, "learning_rate": 1.899860283425052e-05, "loss": 0.0067, "step": 722700 }, { "epoch": 1.87, "learning_rate": 1.8994714617879054e-05, "loss": 0.0069, "step": 722710 }, { "epoch": 1.87, "learning_rate": 1.899082640150759e-05, "loss": 0.0098, "step": 722720 }, { "epoch": 1.87, "learning_rate": 1.8986938185136123e-05, "loss": 0.0102, "step": 722730 }, { "epoch": 1.87, "learning_rate": 1.8983049968764662e-05, "loss": 0.0068, "step": 722740 }, { "epoch": 1.87, "learning_rate": 1.8979161752393197e-05, "loss": 0.0072, "step": 722750 }, { "epoch": 1.87, "learning_rate": 1.897527353602173e-05, "loss": 0.0088, "step": 722760 }, { "epoch": 1.87, "learning_rate": 1.8971385319650266e-05, "loss": 0.0095, "step": 722770 }, { "epoch": 1.87, "learning_rate": 1.8967497103278805e-05, "loss": 0.0063, "step": 722780 }, { "epoch": 1.87, "learning_rate": 1.896360888690734e-05, "loss": 0.0069, "step": 722790 }, { "epoch": 1.87, "learning_rate": 1.895972067053587e-05, "loss": 0.0083, "step": 722800 }, { "epoch": 1.87, "learning_rate": 1.8955832454164406e-05, "loss": 0.006, "step": 722810 }, { "epoch": 1.87, "learning_rate": 1.895194423779294e-05, "loss": 0.0075, "step": 722820 }, { "epoch": 1.87, "learning_rate": 1.894805602142148e-05, "loss": 0.0062, "step": 722830 }, { "epoch": 1.87, "learning_rate": 1.8944167805050014e-05, "loss": 0.0077, "step": 722840 }, { "epoch": 1.87, "learning_rate": 1.894027958867855e-05, "loss": 0.0073, "step": 722850 }, { "epoch": 1.87, "learning_rate": 1.8936391372307083e-05, "loss": 0.007, "step": 722860 }, { "epoch": 1.87, "learning_rate": 1.8932503155935622e-05, "loss": 0.0101, "step": 722870 }, { "epoch": 1.87, "learning_rate": 1.8928614939564157e-05, "loss": 0.0071, "step": 722880 }, { "epoch": 1.87, "learning_rate": 1.892472672319269e-05, "loss": 0.0068, "step": 722890 }, { "epoch": 1.87, "learning_rate": 1.8920838506821226e-05, "loss": 0.0054, "step": 722900 }, { "epoch": 1.87, "learning_rate": 1.8916950290449765e-05, "loss": 0.0116, "step": 722910 }, { "epoch": 1.87, "learning_rate": 1.89130620740783e-05, "loss": 0.008, "step": 722920 }, { "epoch": 1.87, "learning_rate": 1.890917385770683e-05, "loss": 0.0055, "step": 722930 }, { "epoch": 1.87, "learning_rate": 1.8905285641335366e-05, "loss": 0.0056, "step": 722940 }, { "epoch": 1.87, "learning_rate": 1.89013974249639e-05, "loss": 0.0086, "step": 722950 }, { "epoch": 1.87, "learning_rate": 1.889750920859244e-05, "loss": 0.0089, "step": 722960 }, { "epoch": 1.87, "learning_rate": 1.8893620992220974e-05, "loss": 0.0129, "step": 722970 }, { "epoch": 1.87, "learning_rate": 1.888973277584951e-05, "loss": 0.0079, "step": 722980 }, { "epoch": 1.87, "learning_rate": 1.8885844559478043e-05, "loss": 0.0055, "step": 722990 }, { "epoch": 1.87, "learning_rate": 1.888195634310658e-05, "loss": 0.0082, "step": 723000 }, { "epoch": 1.87, "eval_cer": 0.8816648961259449, "eval_loss": 0.004544729832559824, "eval_runtime": 107.9044, "eval_samples_per_second": 18.535, "eval_steps_per_second": 4.634, "step": 723000 }, { "epoch": 1.87, "learning_rate": 1.8878068126735117e-05, "loss": 0.0091, "step": 723010 }, { "epoch": 1.87, "learning_rate": 1.887417991036365e-05, "loss": 0.0069, "step": 723020 }, { "epoch": 1.87, "learning_rate": 1.8870291693992186e-05, "loss": 0.0084, "step": 723030 }, { "epoch": 1.87, "learning_rate": 1.8866403477620725e-05, "loss": 0.0118, "step": 723040 }, { "epoch": 1.87, "learning_rate": 1.8862515261249256e-05, "loss": 0.0062, "step": 723050 }, { "epoch": 1.87, "learning_rate": 1.885862704487779e-05, "loss": 0.0066, "step": 723060 }, { "epoch": 1.87, "learning_rate": 1.8854738828506326e-05, "loss": 0.0081, "step": 723070 }, { "epoch": 1.87, "learning_rate": 1.885085061213486e-05, "loss": 0.0088, "step": 723080 }, { "epoch": 1.87, "learning_rate": 1.88469623957634e-05, "loss": 0.0066, "step": 723090 }, { "epoch": 1.87, "learning_rate": 1.8843074179391934e-05, "loss": 0.0077, "step": 723100 }, { "epoch": 1.87, "learning_rate": 1.883918596302047e-05, "loss": 0.0083, "step": 723110 }, { "epoch": 1.87, "learning_rate": 1.8835297746649003e-05, "loss": 0.0075, "step": 723120 }, { "epoch": 1.87, "learning_rate": 1.883140953027754e-05, "loss": 0.0065, "step": 723130 }, { "epoch": 1.87, "learning_rate": 1.8827521313906077e-05, "loss": 0.0061, "step": 723140 }, { "epoch": 1.87, "learning_rate": 1.882363309753461e-05, "loss": 0.0034, "step": 723150 }, { "epoch": 1.87, "learning_rate": 1.8819744881163146e-05, "loss": 0.0075, "step": 723160 }, { "epoch": 1.87, "learning_rate": 1.8815856664791678e-05, "loss": 0.0064, "step": 723170 }, { "epoch": 1.87, "learning_rate": 1.8811968448420216e-05, "loss": 0.0092, "step": 723180 }, { "epoch": 1.87, "learning_rate": 1.880808023204875e-05, "loss": 0.0078, "step": 723190 }, { "epoch": 1.87, "learning_rate": 1.8804192015677286e-05, "loss": 0.0085, "step": 723200 }, { "epoch": 1.87, "learning_rate": 1.880030379930582e-05, "loss": 0.0069, "step": 723210 }, { "epoch": 1.87, "learning_rate": 1.879641558293436e-05, "loss": 0.0057, "step": 723220 }, { "epoch": 1.87, "learning_rate": 1.8792527366562894e-05, "loss": 0.0057, "step": 723230 }, { "epoch": 1.87, "learning_rate": 1.878863915019143e-05, "loss": 0.0094, "step": 723240 }, { "epoch": 1.87, "learning_rate": 1.8784750933819963e-05, "loss": 0.0078, "step": 723250 }, { "epoch": 1.87, "learning_rate": 1.8780862717448498e-05, "loss": 0.0085, "step": 723260 }, { "epoch": 1.87, "learning_rate": 1.8776974501077036e-05, "loss": 0.0088, "step": 723270 }, { "epoch": 1.87, "learning_rate": 1.877308628470557e-05, "loss": 0.0079, "step": 723280 }, { "epoch": 1.87, "learning_rate": 1.8769198068334106e-05, "loss": 0.0087, "step": 723290 }, { "epoch": 1.87, "learning_rate": 1.8765309851962638e-05, "loss": 0.0056, "step": 723300 }, { "epoch": 1.87, "learning_rate": 1.8761421635591173e-05, "loss": 0.0055, "step": 723310 }, { "epoch": 1.87, "learning_rate": 1.875753341921971e-05, "loss": 0.0076, "step": 723320 }, { "epoch": 1.87, "learning_rate": 1.8753645202848246e-05, "loss": 0.0075, "step": 723330 }, { "epoch": 1.88, "learning_rate": 1.874975698647678e-05, "loss": 0.008, "step": 723340 }, { "epoch": 1.88, "learning_rate": 1.8745868770105315e-05, "loss": 0.0061, "step": 723350 }, { "epoch": 1.88, "learning_rate": 1.8741980553733854e-05, "loss": 0.006, "step": 723360 }, { "epoch": 1.88, "learning_rate": 1.873809233736239e-05, "loss": 0.0083, "step": 723370 }, { "epoch": 1.88, "learning_rate": 1.8734204120990923e-05, "loss": 0.0054, "step": 723380 }, { "epoch": 1.88, "learning_rate": 1.8730315904619458e-05, "loss": 0.0079, "step": 723390 }, { "epoch": 1.88, "learning_rate": 1.8726427688247993e-05, "loss": 0.0066, "step": 723400 }, { "epoch": 1.88, "learning_rate": 1.8722539471876528e-05, "loss": 0.0077, "step": 723410 }, { "epoch": 1.88, "learning_rate": 1.8718651255505066e-05, "loss": 0.0053, "step": 723420 }, { "epoch": 1.88, "learning_rate": 1.87147630391336e-05, "loss": 0.0103, "step": 723430 }, { "epoch": 1.88, "learning_rate": 1.8710874822762136e-05, "loss": 0.0069, "step": 723440 }, { "epoch": 1.88, "learning_rate": 1.870698660639067e-05, "loss": 0.01, "step": 723450 }, { "epoch": 1.88, "learning_rate": 1.8703098390019206e-05, "loss": 0.0119, "step": 723460 }, { "epoch": 1.88, "learning_rate": 1.869921017364774e-05, "loss": 0.0089, "step": 723470 }, { "epoch": 1.88, "learning_rate": 1.8695321957276275e-05, "loss": 0.0104, "step": 723480 }, { "epoch": 1.88, "learning_rate": 1.8691433740904814e-05, "loss": 0.0078, "step": 723490 }, { "epoch": 1.88, "learning_rate": 1.868754552453335e-05, "loss": 0.0058, "step": 723500 }, { "epoch": 1.88, "learning_rate": 1.8683657308161883e-05, "loss": 0.0089, "step": 723510 }, { "epoch": 1.88, "learning_rate": 1.8679769091790418e-05, "loss": 0.0064, "step": 723520 }, { "epoch": 1.88, "learning_rate": 1.8675880875418953e-05, "loss": 0.0056, "step": 723530 }, { "epoch": 1.88, "learning_rate": 1.8671992659047488e-05, "loss": 0.0072, "step": 723540 }, { "epoch": 1.88, "learning_rate": 1.8668104442676026e-05, "loss": 0.0069, "step": 723550 }, { "epoch": 1.88, "learning_rate": 1.866421622630456e-05, "loss": 0.0069, "step": 723560 }, { "epoch": 1.88, "learning_rate": 1.8660328009933096e-05, "loss": 0.006, "step": 723570 }, { "epoch": 1.88, "learning_rate": 1.865643979356163e-05, "loss": 0.0053, "step": 723580 }, { "epoch": 1.88, "learning_rate": 1.8652551577190166e-05, "loss": 0.006, "step": 723590 }, { "epoch": 1.88, "learning_rate": 1.86486633608187e-05, "loss": 0.0079, "step": 723600 }, { "epoch": 1.88, "learning_rate": 1.8644775144447235e-05, "loss": 0.0095, "step": 723610 }, { "epoch": 1.88, "learning_rate": 1.8640886928075774e-05, "loss": 0.0068, "step": 723620 }, { "epoch": 1.88, "learning_rate": 1.863699871170431e-05, "loss": 0.0067, "step": 723630 }, { "epoch": 1.88, "learning_rate": 1.8633110495332843e-05, "loss": 0.0067, "step": 723640 }, { "epoch": 1.88, "learning_rate": 1.8629222278961378e-05, "loss": 0.0066, "step": 723650 }, { "epoch": 1.88, "learning_rate": 1.8625334062589913e-05, "loss": 0.0168, "step": 723660 }, { "epoch": 1.88, "learning_rate": 1.8621445846218448e-05, "loss": 0.0073, "step": 723670 }, { "epoch": 1.88, "learning_rate": 1.8617557629846986e-05, "loss": 0.0076, "step": 723680 }, { "epoch": 1.88, "learning_rate": 1.861366941347552e-05, "loss": 0.0069, "step": 723690 }, { "epoch": 1.88, "learning_rate": 1.8609781197104052e-05, "loss": 0.005, "step": 723700 }, { "epoch": 1.88, "learning_rate": 1.860589298073259e-05, "loss": 0.0065, "step": 723710 }, { "epoch": 1.88, "learning_rate": 1.8602004764361126e-05, "loss": 0.0051, "step": 723720 }, { "epoch": 1.88, "learning_rate": 1.859811654798966e-05, "loss": 0.007, "step": 723730 }, { "epoch": 1.88, "learning_rate": 1.8594228331618195e-05, "loss": 0.0065, "step": 723740 }, { "epoch": 1.88, "learning_rate": 1.8590340115246734e-05, "loss": 0.007, "step": 723750 }, { "epoch": 1.88, "learning_rate": 1.8586451898875265e-05, "loss": 0.0047, "step": 723760 }, { "epoch": 1.88, "learning_rate": 1.8582563682503803e-05, "loss": 0.0064, "step": 723770 }, { "epoch": 1.88, "learning_rate": 1.8578675466132338e-05, "loss": 0.0078, "step": 723780 }, { "epoch": 1.88, "learning_rate": 1.8574787249760873e-05, "loss": 0.0104, "step": 723790 }, { "epoch": 1.88, "learning_rate": 1.8570899033389408e-05, "loss": 0.0066, "step": 723800 }, { "epoch": 1.88, "learning_rate": 1.8567010817017946e-05, "loss": 0.0051, "step": 723810 }, { "epoch": 1.88, "learning_rate": 1.856312260064648e-05, "loss": 0.007, "step": 723820 }, { "epoch": 1.88, "learning_rate": 1.8559234384275012e-05, "loss": 0.0099, "step": 723830 }, { "epoch": 1.88, "learning_rate": 1.855534616790355e-05, "loss": 0.0055, "step": 723840 }, { "epoch": 1.88, "learning_rate": 1.8551457951532086e-05, "loss": 0.0081, "step": 723850 }, { "epoch": 1.88, "learning_rate": 1.854756973516062e-05, "loss": 0.0108, "step": 723860 }, { "epoch": 1.88, "learning_rate": 1.8543681518789155e-05, "loss": 0.0115, "step": 723870 }, { "epoch": 1.88, "learning_rate": 1.8539793302417694e-05, "loss": 0.0119, "step": 723880 }, { "epoch": 1.88, "learning_rate": 1.8535905086046225e-05, "loss": 0.0069, "step": 723890 }, { "epoch": 1.88, "learning_rate": 1.8532016869674763e-05, "loss": 0.0084, "step": 723900 }, { "epoch": 1.88, "learning_rate": 1.8528128653303298e-05, "loss": 0.0069, "step": 723910 }, { "epoch": 1.88, "learning_rate": 1.8524240436931833e-05, "loss": 0.0083, "step": 723920 }, { "epoch": 1.88, "learning_rate": 1.8520352220560368e-05, "loss": 0.0069, "step": 723930 }, { "epoch": 1.88, "learning_rate": 1.8516464004188903e-05, "loss": 0.0071, "step": 723940 }, { "epoch": 1.88, "learning_rate": 1.8512575787817438e-05, "loss": 0.0079, "step": 723950 }, { "epoch": 1.88, "learning_rate": 1.8508687571445972e-05, "loss": 0.0088, "step": 723960 }, { "epoch": 1.88, "learning_rate": 1.850479935507451e-05, "loss": 0.0076, "step": 723970 }, { "epoch": 1.88, "learning_rate": 1.8500911138703046e-05, "loss": 0.0057, "step": 723980 }, { "epoch": 1.88, "learning_rate": 1.849702292233158e-05, "loss": 0.007, "step": 723990 }, { "epoch": 1.88, "learning_rate": 1.8493134705960115e-05, "loss": 0.0073, "step": 724000 }, { "epoch": 1.88, "eval_cer": 0.8816704946736816, "eval_loss": 0.004569494165480137, "eval_runtime": 107.7253, "eval_samples_per_second": 18.566, "eval_steps_per_second": 4.641, "step": 724000 }, { "epoch": 1.88, "learning_rate": 1.848924648958865e-05, "loss": 0.007, "step": 724010 }, { "epoch": 1.88, "learning_rate": 1.8485358273217185e-05, "loss": 0.0067, "step": 724020 }, { "epoch": 1.88, "learning_rate": 1.848147005684572e-05, "loss": 0.0092, "step": 724030 }, { "epoch": 1.88, "learning_rate": 1.8477581840474258e-05, "loss": 0.0058, "step": 724040 }, { "epoch": 1.88, "learning_rate": 1.8473693624102793e-05, "loss": 0.0074, "step": 724050 }, { "epoch": 1.88, "learning_rate": 1.8469805407731328e-05, "loss": 0.0109, "step": 724060 }, { "epoch": 1.88, "learning_rate": 1.8465917191359863e-05, "loss": 0.0093, "step": 724070 }, { "epoch": 1.88, "learning_rate": 1.8462028974988398e-05, "loss": 0.0084, "step": 724080 }, { "epoch": 1.88, "learning_rate": 1.8458140758616932e-05, "loss": 0.0075, "step": 724090 }, { "epoch": 1.88, "learning_rate": 1.845425254224547e-05, "loss": 0.0072, "step": 724100 }, { "epoch": 1.88, "learning_rate": 1.8450364325874006e-05, "loss": 0.0071, "step": 724110 }, { "epoch": 1.88, "learning_rate": 1.844647610950254e-05, "loss": 0.0049, "step": 724120 }, { "epoch": 1.88, "learning_rate": 1.8442587893131075e-05, "loss": 0.008, "step": 724130 }, { "epoch": 1.88, "learning_rate": 1.843869967675961e-05, "loss": 0.0065, "step": 724140 }, { "epoch": 1.88, "learning_rate": 1.8434811460388145e-05, "loss": 0.0062, "step": 724150 }, { "epoch": 1.88, "learning_rate": 1.843092324401668e-05, "loss": 0.0105, "step": 724160 }, { "epoch": 1.88, "learning_rate": 1.8427035027645218e-05, "loss": 0.0072, "step": 724170 }, { "epoch": 1.88, "learning_rate": 1.8423146811273753e-05, "loss": 0.0037, "step": 724180 }, { "epoch": 1.88, "learning_rate": 1.8419258594902288e-05, "loss": 0.0051, "step": 724190 }, { "epoch": 1.88, "learning_rate": 1.8415370378530823e-05, "loss": 0.0089, "step": 724200 }, { "epoch": 1.88, "learning_rate": 1.8411482162159358e-05, "loss": 0.0081, "step": 724210 }, { "epoch": 1.88, "learning_rate": 1.8407593945787892e-05, "loss": 0.0126, "step": 724220 }, { "epoch": 1.88, "learning_rate": 1.840370572941643e-05, "loss": 0.0079, "step": 724230 }, { "epoch": 1.88, "learning_rate": 1.8399817513044965e-05, "loss": 0.0068, "step": 724240 }, { "epoch": 1.88, "learning_rate": 1.83959292966735e-05, "loss": 0.0069, "step": 724250 }, { "epoch": 1.88, "learning_rate": 1.8392041080302035e-05, "loss": 0.0096, "step": 724260 }, { "epoch": 1.88, "learning_rate": 1.838815286393057e-05, "loss": 0.0075, "step": 724270 }, { "epoch": 1.88, "learning_rate": 1.8384264647559105e-05, "loss": 0.0079, "step": 724280 }, { "epoch": 1.88, "learning_rate": 1.838037643118764e-05, "loss": 0.0088, "step": 724290 }, { "epoch": 1.88, "learning_rate": 1.8376488214816178e-05, "loss": 0.0071, "step": 724300 }, { "epoch": 1.88, "learning_rate": 1.8372599998444713e-05, "loss": 0.0069, "step": 724310 }, { "epoch": 1.88, "learning_rate": 1.8368711782073248e-05, "loss": 0.0062, "step": 724320 }, { "epoch": 1.88, "learning_rate": 1.8364823565701783e-05, "loss": 0.0067, "step": 724330 }, { "epoch": 1.88, "learning_rate": 1.8360935349330317e-05, "loss": 0.007, "step": 724340 }, { "epoch": 1.88, "learning_rate": 1.8357047132958852e-05, "loss": 0.007, "step": 724350 }, { "epoch": 1.88, "learning_rate": 1.835315891658739e-05, "loss": 0.0071, "step": 724360 }, { "epoch": 1.88, "learning_rate": 1.8349270700215925e-05, "loss": 0.006, "step": 724370 }, { "epoch": 1.88, "learning_rate": 1.8345382483844457e-05, "loss": 0.0086, "step": 724380 }, { "epoch": 1.88, "learning_rate": 1.8341494267472995e-05, "loss": 0.0077, "step": 724390 }, { "epoch": 1.88, "learning_rate": 1.833760605110153e-05, "loss": 0.0089, "step": 724400 }, { "epoch": 1.88, "learning_rate": 1.8333717834730065e-05, "loss": 0.0069, "step": 724410 }, { "epoch": 1.88, "learning_rate": 1.83298296183586e-05, "loss": 0.0085, "step": 724420 }, { "epoch": 1.88, "learning_rate": 1.8325941401987138e-05, "loss": 0.0065, "step": 724430 }, { "epoch": 1.88, "learning_rate": 1.8322053185615673e-05, "loss": 0.0063, "step": 724440 }, { "epoch": 1.88, "learning_rate": 1.8318164969244208e-05, "loss": 0.0073, "step": 724450 }, { "epoch": 1.88, "learning_rate": 1.8314276752872743e-05, "loss": 0.0118, "step": 724460 }, { "epoch": 1.88, "learning_rate": 1.8310388536501277e-05, "loss": 0.0128, "step": 724470 }, { "epoch": 1.88, "learning_rate": 1.8306500320129812e-05, "loss": 0.0069, "step": 724480 }, { "epoch": 1.88, "learning_rate": 1.830261210375835e-05, "loss": 0.0061, "step": 724490 }, { "epoch": 1.88, "learning_rate": 1.8298723887386885e-05, "loss": 0.0092, "step": 724500 }, { "epoch": 1.88, "learning_rate": 1.8294835671015417e-05, "loss": 0.008, "step": 724510 }, { "epoch": 1.88, "learning_rate": 1.8290947454643955e-05, "loss": 0.0075, "step": 724520 }, { "epoch": 1.88, "learning_rate": 1.828705923827249e-05, "loss": 0.0062, "step": 724530 }, { "epoch": 1.88, "learning_rate": 1.8283171021901025e-05, "loss": 0.0063, "step": 724540 }, { "epoch": 1.88, "learning_rate": 1.827928280552956e-05, "loss": 0.0064, "step": 724550 }, { "epoch": 1.88, "learning_rate": 1.8275394589158098e-05, "loss": 0.0072, "step": 724560 }, { "epoch": 1.88, "learning_rate": 1.827150637278663e-05, "loss": 0.0075, "step": 724570 }, { "epoch": 1.88, "learning_rate": 1.8267618156415168e-05, "loss": 0.008, "step": 724580 }, { "epoch": 1.88, "learning_rate": 1.8263729940043703e-05, "loss": 0.0088, "step": 724590 }, { "epoch": 1.88, "learning_rate": 1.8259841723672237e-05, "loss": 0.0104, "step": 724600 }, { "epoch": 1.88, "learning_rate": 1.8255953507300772e-05, "loss": 0.0072, "step": 724610 }, { "epoch": 1.88, "learning_rate": 1.825206529092931e-05, "loss": 0.0082, "step": 724620 }, { "epoch": 1.88, "learning_rate": 1.8248177074557842e-05, "loss": 0.0078, "step": 724630 }, { "epoch": 1.88, "learning_rate": 1.8244288858186377e-05, "loss": 0.0077, "step": 724640 }, { "epoch": 1.88, "learning_rate": 1.8240400641814915e-05, "loss": 0.0069, "step": 724650 }, { "epoch": 1.88, "learning_rate": 1.823651242544345e-05, "loss": 0.0075, "step": 724660 }, { "epoch": 1.88, "learning_rate": 1.8232624209071985e-05, "loss": 0.0064, "step": 724670 }, { "epoch": 1.88, "learning_rate": 1.822873599270052e-05, "loss": 0.0078, "step": 724680 }, { "epoch": 1.88, "learning_rate": 1.8224847776329055e-05, "loss": 0.01, "step": 724690 }, { "epoch": 1.88, "learning_rate": 1.822095955995759e-05, "loss": 0.0075, "step": 724700 }, { "epoch": 1.88, "learning_rate": 1.8217071343586124e-05, "loss": 0.0075, "step": 724710 }, { "epoch": 1.88, "learning_rate": 1.8213183127214663e-05, "loss": 0.0074, "step": 724720 }, { "epoch": 1.88, "learning_rate": 1.8209294910843197e-05, "loss": 0.0134, "step": 724730 }, { "epoch": 1.88, "learning_rate": 1.8205406694471732e-05, "loss": 0.0058, "step": 724740 }, { "epoch": 1.88, "learning_rate": 1.8201518478100267e-05, "loss": 0.007, "step": 724750 }, { "epoch": 1.88, "learning_rate": 1.8197630261728802e-05, "loss": 0.0065, "step": 724760 }, { "epoch": 1.88, "learning_rate": 1.8193742045357337e-05, "loss": 0.0097, "step": 724770 }, { "epoch": 1.88, "learning_rate": 1.8189853828985875e-05, "loss": 0.0056, "step": 724780 }, { "epoch": 1.88, "learning_rate": 1.818596561261441e-05, "loss": 0.0084, "step": 724790 }, { "epoch": 1.88, "learning_rate": 1.8182077396242945e-05, "loss": 0.0067, "step": 724800 }, { "epoch": 1.88, "learning_rate": 1.817818917987148e-05, "loss": 0.0069, "step": 724810 }, { "epoch": 1.88, "learning_rate": 1.8174300963500015e-05, "loss": 0.0081, "step": 724820 }, { "epoch": 1.88, "learning_rate": 1.817041274712855e-05, "loss": 0.0063, "step": 724830 }, { "epoch": 1.88, "learning_rate": 1.8166524530757084e-05, "loss": 0.0077, "step": 724840 }, { "epoch": 1.88, "learning_rate": 1.8162636314385623e-05, "loss": 0.0084, "step": 724850 }, { "epoch": 1.88, "learning_rate": 1.8158748098014157e-05, "loss": 0.0089, "step": 724860 }, { "epoch": 1.88, "learning_rate": 1.8154859881642692e-05, "loss": 0.0062, "step": 724870 }, { "epoch": 1.88, "learning_rate": 1.8150971665271227e-05, "loss": 0.0079, "step": 724880 }, { "epoch": 1.88, "learning_rate": 1.8147083448899762e-05, "loss": 0.0068, "step": 724890 }, { "epoch": 1.88, "learning_rate": 1.8143195232528297e-05, "loss": 0.007, "step": 724900 }, { "epoch": 1.88, "learning_rate": 1.8139307016156835e-05, "loss": 0.0078, "step": 724910 }, { "epoch": 1.88, "learning_rate": 1.813541879978537e-05, "loss": 0.0071, "step": 724920 }, { "epoch": 1.88, "learning_rate": 1.8131530583413905e-05, "loss": 0.007, "step": 724930 }, { "epoch": 1.88, "learning_rate": 1.812764236704244e-05, "loss": 0.0096, "step": 724940 }, { "epoch": 1.88, "learning_rate": 1.8123754150670975e-05, "loss": 0.0084, "step": 724950 }, { "epoch": 1.88, "learning_rate": 1.811986593429951e-05, "loss": 0.0083, "step": 724960 }, { "epoch": 1.88, "learning_rate": 1.8115977717928044e-05, "loss": 0.0058, "step": 724970 }, { "epoch": 1.88, "learning_rate": 1.8112089501556583e-05, "loss": 0.0062, "step": 724980 }, { "epoch": 1.88, "learning_rate": 1.8108201285185117e-05, "loss": 0.0095, "step": 724990 }, { "epoch": 1.88, "learning_rate": 1.8104313068813652e-05, "loss": 0.0082, "step": 725000 }, { "epoch": 1.88, "eval_cer": 0.8816662957628791, "eval_loss": 0.004590142983943224, "eval_runtime": 107.8781, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 725000 }, { "epoch": 1.88, "learning_rate": 1.8100424852442187e-05, "loss": 0.0062, "step": 725010 }, { "epoch": 1.88, "learning_rate": 1.8096536636070722e-05, "loss": 0.0078, "step": 725020 }, { "epoch": 1.88, "learning_rate": 1.8092648419699257e-05, "loss": 0.0069, "step": 725030 }, { "epoch": 1.88, "learning_rate": 1.8088760203327795e-05, "loss": 0.0066, "step": 725040 }, { "epoch": 1.88, "learning_rate": 1.808487198695633e-05, "loss": 0.0073, "step": 725050 }, { "epoch": 1.88, "learning_rate": 1.8080983770584865e-05, "loss": 0.0071, "step": 725060 }, { "epoch": 1.88, "learning_rate": 1.80770955542134e-05, "loss": 0.0111, "step": 725070 }, { "epoch": 1.88, "learning_rate": 1.8073207337841935e-05, "loss": 0.0088, "step": 725080 }, { "epoch": 1.88, "learning_rate": 1.806931912147047e-05, "loss": 0.0079, "step": 725090 }, { "epoch": 1.88, "learning_rate": 1.8065430905099004e-05, "loss": 0.006, "step": 725100 }, { "epoch": 1.88, "learning_rate": 1.8061542688727542e-05, "loss": 0.0063, "step": 725110 }, { "epoch": 1.88, "learning_rate": 1.8057654472356077e-05, "loss": 0.0051, "step": 725120 }, { "epoch": 1.88, "learning_rate": 1.8053766255984612e-05, "loss": 0.0089, "step": 725130 }, { "epoch": 1.88, "learning_rate": 1.8049878039613147e-05, "loss": 0.0057, "step": 725140 }, { "epoch": 1.88, "learning_rate": 1.8045989823241682e-05, "loss": 0.006, "step": 725150 }, { "epoch": 1.88, "learning_rate": 1.8042101606870217e-05, "loss": 0.0078, "step": 725160 }, { "epoch": 1.88, "learning_rate": 1.8038213390498755e-05, "loss": 0.0065, "step": 725170 }, { "epoch": 1.88, "learning_rate": 1.803432517412729e-05, "loss": 0.0076, "step": 725180 }, { "epoch": 1.88, "learning_rate": 1.803043695775582e-05, "loss": 0.0076, "step": 725190 }, { "epoch": 1.88, "learning_rate": 1.802654874138436e-05, "loss": 0.0079, "step": 725200 }, { "epoch": 1.88, "learning_rate": 1.8022660525012894e-05, "loss": 0.0123, "step": 725210 }, { "epoch": 1.88, "learning_rate": 1.801877230864143e-05, "loss": 0.0068, "step": 725220 }, { "epoch": 1.88, "learning_rate": 1.8014884092269964e-05, "loss": 0.0081, "step": 725230 }, { "epoch": 1.88, "learning_rate": 1.8010995875898502e-05, "loss": 0.0054, "step": 725240 }, { "epoch": 1.88, "learning_rate": 1.8007107659527034e-05, "loss": 0.005, "step": 725250 }, { "epoch": 1.88, "learning_rate": 1.8003219443155572e-05, "loss": 0.0079, "step": 725260 }, { "epoch": 1.88, "learning_rate": 1.7999331226784107e-05, "loss": 0.0069, "step": 725270 }, { "epoch": 1.88, "learning_rate": 1.7995443010412642e-05, "loss": 0.005, "step": 725280 }, { "epoch": 1.88, "learning_rate": 1.7991554794041177e-05, "loss": 0.0119, "step": 725290 }, { "epoch": 1.88, "learning_rate": 1.7987666577669715e-05, "loss": 0.0086, "step": 725300 }, { "epoch": 1.88, "learning_rate": 1.7983778361298246e-05, "loss": 0.0122, "step": 725310 }, { "epoch": 1.88, "learning_rate": 1.797989014492678e-05, "loss": 0.0044, "step": 725320 }, { "epoch": 1.88, "learning_rate": 1.797600192855532e-05, "loss": 0.0084, "step": 725330 }, { "epoch": 1.88, "learning_rate": 1.7972113712183854e-05, "loss": 0.0115, "step": 725340 }, { "epoch": 1.88, "learning_rate": 1.796822549581239e-05, "loss": 0.0088, "step": 725350 }, { "epoch": 1.88, "learning_rate": 1.7964337279440924e-05, "loss": 0.0076, "step": 725360 }, { "epoch": 1.88, "learning_rate": 1.7960449063069462e-05, "loss": 0.0051, "step": 725370 }, { "epoch": 1.88, "learning_rate": 1.7956560846697994e-05, "loss": 0.0071, "step": 725380 }, { "epoch": 1.88, "learning_rate": 1.795267263032653e-05, "loss": 0.0072, "step": 725390 }, { "epoch": 1.88, "learning_rate": 1.7948784413955067e-05, "loss": 0.0072, "step": 725400 }, { "epoch": 1.88, "learning_rate": 1.7944896197583602e-05, "loss": 0.0076, "step": 725410 }, { "epoch": 1.88, "learning_rate": 1.7941007981212137e-05, "loss": 0.0071, "step": 725420 }, { "epoch": 1.88, "learning_rate": 1.793711976484067e-05, "loss": 0.0096, "step": 725430 }, { "epoch": 1.88, "learning_rate": 1.7933231548469206e-05, "loss": 0.0066, "step": 725440 }, { "epoch": 1.88, "learning_rate": 1.792934333209774e-05, "loss": 0.006, "step": 725450 }, { "epoch": 1.88, "learning_rate": 1.792545511572628e-05, "loss": 0.007, "step": 725460 }, { "epoch": 1.88, "learning_rate": 1.7921566899354814e-05, "loss": 0.0071, "step": 725470 }, { "epoch": 1.88, "learning_rate": 1.791767868298335e-05, "loss": 0.0074, "step": 725480 }, { "epoch": 1.88, "learning_rate": 1.7913790466611884e-05, "loss": 0.0069, "step": 725490 }, { "epoch": 1.88, "learning_rate": 1.790990225024042e-05, "loss": 0.0051, "step": 725500 }, { "epoch": 1.88, "learning_rate": 1.7906014033868954e-05, "loss": 0.0066, "step": 725510 }, { "epoch": 1.88, "learning_rate": 1.790212581749749e-05, "loss": 0.0086, "step": 725520 }, { "epoch": 1.88, "learning_rate": 1.7898237601126027e-05, "loss": 0.006, "step": 725530 }, { "epoch": 1.88, "learning_rate": 1.7894349384754562e-05, "loss": 0.0101, "step": 725540 }, { "epoch": 1.88, "learning_rate": 1.7890461168383097e-05, "loss": 0.0082, "step": 725550 }, { "epoch": 1.88, "learning_rate": 1.788657295201163e-05, "loss": 0.0069, "step": 725560 }, { "epoch": 1.88, "learning_rate": 1.7882684735640166e-05, "loss": 0.0066, "step": 725570 }, { "epoch": 1.88, "learning_rate": 1.78787965192687e-05, "loss": 0.0065, "step": 725580 }, { "epoch": 1.88, "learning_rate": 1.787490830289724e-05, "loss": 0.0078, "step": 725590 }, { "epoch": 1.88, "learning_rate": 1.7871020086525774e-05, "loss": 0.0057, "step": 725600 }, { "epoch": 1.88, "learning_rate": 1.786713187015431e-05, "loss": 0.0062, "step": 725610 }, { "epoch": 1.88, "learning_rate": 1.7863243653782844e-05, "loss": 0.0064, "step": 725620 }, { "epoch": 1.88, "learning_rate": 1.785935543741138e-05, "loss": 0.0081, "step": 725630 }, { "epoch": 1.88, "learning_rate": 1.7855467221039914e-05, "loss": 0.0079, "step": 725640 }, { "epoch": 1.88, "learning_rate": 1.785157900466845e-05, "loss": 0.0105, "step": 725650 }, { "epoch": 1.88, "learning_rate": 1.7847690788296987e-05, "loss": 0.0049, "step": 725660 }, { "epoch": 1.88, "learning_rate": 1.7843802571925522e-05, "loss": 0.0085, "step": 725670 }, { "epoch": 1.88, "learning_rate": 1.7839914355554057e-05, "loss": 0.0062, "step": 725680 }, { "epoch": 1.88, "learning_rate": 1.783602613918259e-05, "loss": 0.0075, "step": 725690 }, { "epoch": 1.88, "learning_rate": 1.7832137922811126e-05, "loss": 0.0077, "step": 725700 }, { "epoch": 1.88, "learning_rate": 1.782824970643966e-05, "loss": 0.0046, "step": 725710 }, { "epoch": 1.88, "learning_rate": 1.78243614900682e-05, "loss": 0.0054, "step": 725720 }, { "epoch": 1.88, "learning_rate": 1.7820473273696734e-05, "loss": 0.005, "step": 725730 }, { "epoch": 1.88, "learning_rate": 1.781658505732527e-05, "loss": 0.0094, "step": 725740 }, { "epoch": 1.88, "learning_rate": 1.7812696840953804e-05, "loss": 0.0137, "step": 725750 }, { "epoch": 1.88, "learning_rate": 1.780880862458234e-05, "loss": 0.0082, "step": 725760 }, { "epoch": 1.88, "learning_rate": 1.7804920408210874e-05, "loss": 0.0055, "step": 725770 }, { "epoch": 1.88, "learning_rate": 1.780103219183941e-05, "loss": 0.0065, "step": 725780 }, { "epoch": 1.88, "learning_rate": 1.7797143975467947e-05, "loss": 0.0045, "step": 725790 }, { "epoch": 1.88, "learning_rate": 1.7793255759096482e-05, "loss": 0.0093, "step": 725800 }, { "epoch": 1.88, "learning_rate": 1.7789367542725017e-05, "loss": 0.0061, "step": 725810 }, { "epoch": 1.88, "learning_rate": 1.778547932635355e-05, "loss": 0.006, "step": 725820 }, { "epoch": 1.88, "learning_rate": 1.7781591109982086e-05, "loss": 0.0072, "step": 725830 }, { "epoch": 1.88, "learning_rate": 1.777770289361062e-05, "loss": 0.0073, "step": 725840 }, { "epoch": 1.88, "learning_rate": 1.777381467723916e-05, "loss": 0.0083, "step": 725850 }, { "epoch": 1.88, "learning_rate": 1.7769926460867694e-05, "loss": 0.0078, "step": 725860 }, { "epoch": 1.88, "learning_rate": 1.7766038244496226e-05, "loss": 0.0118, "step": 725870 }, { "epoch": 1.88, "learning_rate": 1.7762150028124764e-05, "loss": 0.0052, "step": 725880 }, { "epoch": 1.88, "learning_rate": 1.77582618117533e-05, "loss": 0.0064, "step": 725890 }, { "epoch": 1.88, "learning_rate": 1.7754373595381834e-05, "loss": 0.0066, "step": 725900 }, { "epoch": 1.88, "learning_rate": 1.775048537901037e-05, "loss": 0.01, "step": 725910 }, { "epoch": 1.88, "learning_rate": 1.7746597162638907e-05, "loss": 0.0086, "step": 725920 }, { "epoch": 1.88, "learning_rate": 1.774270894626744e-05, "loss": 0.009, "step": 725930 }, { "epoch": 1.88, "learning_rate": 1.7738820729895977e-05, "loss": 0.0088, "step": 725940 }, { "epoch": 1.88, "learning_rate": 1.773493251352451e-05, "loss": 0.0071, "step": 725950 }, { "epoch": 1.88, "learning_rate": 1.7731044297153046e-05, "loss": 0.01, "step": 725960 }, { "epoch": 1.88, "learning_rate": 1.772715608078158e-05, "loss": 0.0065, "step": 725970 }, { "epoch": 1.88, "learning_rate": 1.772326786441012e-05, "loss": 0.0077, "step": 725980 }, { "epoch": 1.88, "learning_rate": 1.7719379648038654e-05, "loss": 0.0061, "step": 725990 }, { "epoch": 1.88, "learning_rate": 1.7715491431667186e-05, "loss": 0.0098, "step": 726000 }, { "epoch": 1.88, "eval_cer": 0.88167329394755, "eval_loss": 0.004557341802865267, "eval_runtime": 107.9128, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 726000 }, { "epoch": 1.88, "learning_rate": 1.7711603215295724e-05, "loss": 0.0057, "step": 726010 }, { "epoch": 1.88, "learning_rate": 1.770771499892426e-05, "loss": 0.011, "step": 726020 }, { "epoch": 1.88, "learning_rate": 1.7703826782552794e-05, "loss": 0.0065, "step": 726030 }, { "epoch": 1.88, "learning_rate": 1.769993856618133e-05, "loss": 0.0106, "step": 726040 }, { "epoch": 1.88, "learning_rate": 1.7696050349809867e-05, "loss": 0.0054, "step": 726050 }, { "epoch": 1.88, "learning_rate": 1.76921621334384e-05, "loss": 0.0062, "step": 726060 }, { "epoch": 1.88, "learning_rate": 1.7688273917066933e-05, "loss": 0.0056, "step": 726070 }, { "epoch": 1.88, "learning_rate": 1.768438570069547e-05, "loss": 0.0085, "step": 726080 }, { "epoch": 1.88, "learning_rate": 1.7680497484324006e-05, "loss": 0.0054, "step": 726090 }, { "epoch": 1.88, "learning_rate": 1.767660926795254e-05, "loss": 0.0102, "step": 726100 }, { "epoch": 1.88, "learning_rate": 1.7672721051581076e-05, "loss": 0.0058, "step": 726110 }, { "epoch": 1.88, "learning_rate": 1.766883283520961e-05, "loss": 0.007, "step": 726120 }, { "epoch": 1.88, "learning_rate": 1.7664944618838146e-05, "loss": 0.0077, "step": 726130 }, { "epoch": 1.88, "learning_rate": 1.7661056402466684e-05, "loss": 0.0091, "step": 726140 }, { "epoch": 1.88, "learning_rate": 1.765716818609522e-05, "loss": 0.0083, "step": 726150 }, { "epoch": 1.88, "learning_rate": 1.7653279969723754e-05, "loss": 0.0086, "step": 726160 }, { "epoch": 1.88, "learning_rate": 1.764939175335229e-05, "loss": 0.0084, "step": 726170 }, { "epoch": 1.88, "learning_rate": 1.7645503536980823e-05, "loss": 0.0097, "step": 726180 }, { "epoch": 1.88, "learning_rate": 1.764161532060936e-05, "loss": 0.009, "step": 726190 }, { "epoch": 1.88, "learning_rate": 1.7637727104237893e-05, "loss": 0.0081, "step": 726200 }, { "epoch": 1.88, "learning_rate": 1.763383888786643e-05, "loss": 0.008, "step": 726210 }, { "epoch": 1.88, "learning_rate": 1.7629950671494966e-05, "loss": 0.0088, "step": 726220 }, { "epoch": 1.88, "learning_rate": 1.76260624551235e-05, "loss": 0.0072, "step": 726230 }, { "epoch": 1.88, "learning_rate": 1.7622174238752036e-05, "loss": 0.0059, "step": 726240 }, { "epoch": 1.88, "learning_rate": 1.761828602238057e-05, "loss": 0.0067, "step": 726250 }, { "epoch": 1.88, "learning_rate": 1.7614397806009106e-05, "loss": 0.01, "step": 726260 }, { "epoch": 1.88, "learning_rate": 1.7610509589637644e-05, "loss": 0.0082, "step": 726270 }, { "epoch": 1.88, "learning_rate": 1.760662137326618e-05, "loss": 0.0064, "step": 726280 }, { "epoch": 1.88, "learning_rate": 1.7602733156894714e-05, "loss": 0.0063, "step": 726290 }, { "epoch": 1.88, "learning_rate": 1.759884494052325e-05, "loss": 0.0063, "step": 726300 }, { "epoch": 1.88, "learning_rate": 1.7594956724151783e-05, "loss": 0.008, "step": 726310 }, { "epoch": 1.88, "learning_rate": 1.759106850778032e-05, "loss": 0.0094, "step": 726320 }, { "epoch": 1.88, "learning_rate": 1.7587180291408853e-05, "loss": 0.0063, "step": 726330 }, { "epoch": 1.88, "learning_rate": 1.758329207503739e-05, "loss": 0.0089, "step": 726340 }, { "epoch": 1.88, "learning_rate": 1.7579403858665926e-05, "loss": 0.0059, "step": 726350 }, { "epoch": 1.88, "learning_rate": 1.757551564229446e-05, "loss": 0.0064, "step": 726360 }, { "epoch": 1.88, "learning_rate": 1.7571627425922996e-05, "loss": 0.0058, "step": 726370 }, { "epoch": 1.88, "learning_rate": 1.756773920955153e-05, "loss": 0.0086, "step": 726380 }, { "epoch": 1.88, "learning_rate": 1.7563850993180066e-05, "loss": 0.0104, "step": 726390 }, { "epoch": 1.88, "learning_rate": 1.7559962776808604e-05, "loss": 0.0089, "step": 726400 }, { "epoch": 1.88, "learning_rate": 1.755607456043714e-05, "loss": 0.0082, "step": 726410 }, { "epoch": 1.88, "learning_rate": 1.7552186344065674e-05, "loss": 0.0051, "step": 726420 }, { "epoch": 1.88, "learning_rate": 1.754829812769421e-05, "loss": 0.0067, "step": 726430 }, { "epoch": 1.88, "learning_rate": 1.7544409911322743e-05, "loss": 0.0062, "step": 726440 }, { "epoch": 1.88, "learning_rate": 1.7540521694951278e-05, "loss": 0.0114, "step": 726450 }, { "epoch": 1.88, "learning_rate": 1.7536633478579813e-05, "loss": 0.0067, "step": 726460 }, { "epoch": 1.88, "learning_rate": 1.753274526220835e-05, "loss": 0.0085, "step": 726470 }, { "epoch": 1.88, "learning_rate": 1.7528857045836886e-05, "loss": 0.0072, "step": 726480 }, { "epoch": 1.88, "learning_rate": 1.752496882946542e-05, "loss": 0.0084, "step": 726490 }, { "epoch": 1.88, "learning_rate": 1.7521080613093956e-05, "loss": 0.0067, "step": 726500 }, { "epoch": 1.88, "learning_rate": 1.751719239672249e-05, "loss": 0.0081, "step": 726510 }, { "epoch": 1.88, "learning_rate": 1.7513304180351026e-05, "loss": 0.0057, "step": 726520 }, { "epoch": 1.88, "learning_rate": 1.7509415963979564e-05, "loss": 0.0068, "step": 726530 }, { "epoch": 1.88, "learning_rate": 1.75055277476081e-05, "loss": 0.0049, "step": 726540 }, { "epoch": 1.88, "learning_rate": 1.750163953123663e-05, "loss": 0.0096, "step": 726550 }, { "epoch": 1.88, "learning_rate": 1.749775131486517e-05, "loss": 0.0076, "step": 726560 }, { "epoch": 1.88, "learning_rate": 1.7493863098493703e-05, "loss": 0.0082, "step": 726570 }, { "epoch": 1.88, "learning_rate": 1.7489974882122238e-05, "loss": 0.0071, "step": 726580 }, { "epoch": 1.88, "learning_rate": 1.7486086665750773e-05, "loss": 0.0086, "step": 726590 }, { "epoch": 1.88, "learning_rate": 1.748219844937931e-05, "loss": 0.0074, "step": 726600 }, { "epoch": 1.88, "learning_rate": 1.7478310233007846e-05, "loss": 0.0069, "step": 726610 }, { "epoch": 1.88, "learning_rate": 1.747442201663638e-05, "loss": 0.0083, "step": 726620 }, { "epoch": 1.88, "learning_rate": 1.7470533800264916e-05, "loss": 0.0076, "step": 726630 }, { "epoch": 1.88, "learning_rate": 1.746664558389345e-05, "loss": 0.0055, "step": 726640 }, { "epoch": 1.88, "learning_rate": 1.7462757367521986e-05, "loss": 0.008, "step": 726650 }, { "epoch": 1.88, "learning_rate": 1.7458869151150524e-05, "loss": 0.0053, "step": 726660 }, { "epoch": 1.88, "learning_rate": 1.745498093477906e-05, "loss": 0.0107, "step": 726670 }, { "epoch": 1.88, "learning_rate": 1.745109271840759e-05, "loss": 0.0056, "step": 726680 }, { "epoch": 1.88, "learning_rate": 1.744720450203613e-05, "loss": 0.007, "step": 726690 }, { "epoch": 1.88, "learning_rate": 1.7443316285664663e-05, "loss": 0.0062, "step": 726700 }, { "epoch": 1.88, "learning_rate": 1.7439428069293198e-05, "loss": 0.0052, "step": 726710 }, { "epoch": 1.88, "learning_rate": 1.7435539852921733e-05, "loss": 0.0074, "step": 726720 }, { "epoch": 1.88, "learning_rate": 1.743165163655027e-05, "loss": 0.0065, "step": 726730 }, { "epoch": 1.88, "learning_rate": 1.7427763420178803e-05, "loss": 0.006, "step": 726740 }, { "epoch": 1.88, "learning_rate": 1.742387520380734e-05, "loss": 0.0089, "step": 726750 }, { "epoch": 1.88, "learning_rate": 1.7419986987435876e-05, "loss": 0.0055, "step": 726760 }, { "epoch": 1.88, "learning_rate": 1.741609877106441e-05, "loss": 0.0078, "step": 726770 }, { "epoch": 1.88, "learning_rate": 1.7412210554692946e-05, "loss": 0.0062, "step": 726780 }, { "epoch": 1.88, "learning_rate": 1.740832233832148e-05, "loss": 0.008, "step": 726790 }, { "epoch": 1.88, "learning_rate": 1.7404434121950015e-05, "loss": 0.0073, "step": 726800 }, { "epoch": 1.88, "learning_rate": 1.740054590557855e-05, "loss": 0.0076, "step": 726810 }, { "epoch": 1.88, "learning_rate": 1.739665768920709e-05, "loss": 0.0088, "step": 726820 }, { "epoch": 1.88, "learning_rate": 1.7392769472835623e-05, "loss": 0.0053, "step": 726830 }, { "epoch": 1.88, "learning_rate": 1.7388881256464158e-05, "loss": 0.0078, "step": 726840 }, { "epoch": 1.88, "learning_rate": 1.7384993040092693e-05, "loss": 0.0074, "step": 726850 }, { "epoch": 1.88, "learning_rate": 1.7381104823721228e-05, "loss": 0.0063, "step": 726860 }, { "epoch": 1.88, "learning_rate": 1.7377216607349763e-05, "loss": 0.0074, "step": 726870 }, { "epoch": 1.88, "learning_rate": 1.7373328390978298e-05, "loss": 0.0076, "step": 726880 }, { "epoch": 1.88, "learning_rate": 1.7369440174606836e-05, "loss": 0.0072, "step": 726890 }, { "epoch": 1.88, "learning_rate": 1.736555195823537e-05, "loss": 0.0072, "step": 726900 }, { "epoch": 1.88, "learning_rate": 1.7361663741863906e-05, "loss": 0.0067, "step": 726910 }, { "epoch": 1.88, "learning_rate": 1.735777552549244e-05, "loss": 0.0064, "step": 726920 }, { "epoch": 1.88, "learning_rate": 1.7353887309120975e-05, "loss": 0.0055, "step": 726930 }, { "epoch": 1.88, "learning_rate": 1.734999909274951e-05, "loss": 0.0074, "step": 726940 }, { "epoch": 1.88, "learning_rate": 1.734611087637805e-05, "loss": 0.006, "step": 726950 }, { "epoch": 1.88, "learning_rate": 1.7342222660006583e-05, "loss": 0.0094, "step": 726960 }, { "epoch": 1.88, "learning_rate": 1.7338334443635118e-05, "loss": 0.0047, "step": 726970 }, { "epoch": 1.88, "learning_rate": 1.7334446227263653e-05, "loss": 0.0091, "step": 726980 }, { "epoch": 1.88, "learning_rate": 1.7330558010892188e-05, "loss": 0.0086, "step": 726990 }, { "epoch": 1.88, "learning_rate": 1.7326669794520723e-05, "loss": 0.0083, "step": 727000 }, { "epoch": 1.88, "eval_cer": 0.8816690950367475, "eval_loss": 0.004555822350084782, "eval_runtime": 107.8877, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.634, "step": 727000 }, { "epoch": 1.88, "learning_rate": 1.7322781578149258e-05, "loss": 0.007, "step": 727010 }, { "epoch": 1.88, "learning_rate": 1.7318893361777796e-05, "loss": 0.0041, "step": 727020 }, { "epoch": 1.88, "learning_rate": 1.731500514540633e-05, "loss": 0.0105, "step": 727030 }, { "epoch": 1.88, "learning_rate": 1.7311116929034866e-05, "loss": 0.0072, "step": 727040 }, { "epoch": 1.88, "learning_rate": 1.73072287126634e-05, "loss": 0.008, "step": 727050 }, { "epoch": 1.88, "learning_rate": 1.7303340496291935e-05, "loss": 0.0062, "step": 727060 }, { "epoch": 1.88, "learning_rate": 1.729945227992047e-05, "loss": 0.0072, "step": 727070 }, { "epoch": 1.88, "learning_rate": 1.729556406354901e-05, "loss": 0.0107, "step": 727080 }, { "epoch": 1.88, "learning_rate": 1.7291675847177543e-05, "loss": 0.0055, "step": 727090 }, { "epoch": 1.88, "learning_rate": 1.7287787630806078e-05, "loss": 0.0059, "step": 727100 }, { "epoch": 1.88, "learning_rate": 1.7283899414434613e-05, "loss": 0.0108, "step": 727110 }, { "epoch": 1.88, "learning_rate": 1.7280011198063148e-05, "loss": 0.0078, "step": 727120 }, { "epoch": 1.88, "learning_rate": 1.7276122981691683e-05, "loss": 0.0081, "step": 727130 }, { "epoch": 1.88, "learning_rate": 1.7272234765320218e-05, "loss": 0.0069, "step": 727140 }, { "epoch": 1.88, "learning_rate": 1.7268346548948756e-05, "loss": 0.0057, "step": 727150 }, { "epoch": 1.88, "learning_rate": 1.726445833257729e-05, "loss": 0.0058, "step": 727160 }, { "epoch": 1.88, "learning_rate": 1.7260570116205826e-05, "loss": 0.0056, "step": 727170 }, { "epoch": 1.88, "learning_rate": 1.725668189983436e-05, "loss": 0.0073, "step": 727180 }, { "epoch": 1.88, "learning_rate": 1.7252793683462895e-05, "loss": 0.0047, "step": 727190 }, { "epoch": 1.89, "learning_rate": 1.724890546709143e-05, "loss": 0.005, "step": 727200 }, { "epoch": 1.89, "learning_rate": 1.724501725071997e-05, "loss": 0.0082, "step": 727210 }, { "epoch": 1.89, "learning_rate": 1.7241129034348503e-05, "loss": 0.0098, "step": 727220 }, { "epoch": 1.89, "learning_rate": 1.7237240817977038e-05, "loss": 0.0093, "step": 727230 }, { "epoch": 1.89, "learning_rate": 1.7233352601605573e-05, "loss": 0.0064, "step": 727240 }, { "epoch": 1.89, "learning_rate": 1.7229464385234108e-05, "loss": 0.0095, "step": 727250 }, { "epoch": 1.89, "learning_rate": 1.7225576168862643e-05, "loss": 0.0071, "step": 727260 }, { "epoch": 1.89, "learning_rate": 1.7221687952491178e-05, "loss": 0.0056, "step": 727270 }, { "epoch": 1.89, "learning_rate": 1.7217799736119716e-05, "loss": 0.0059, "step": 727280 }, { "epoch": 1.89, "learning_rate": 1.721391151974825e-05, "loss": 0.0063, "step": 727290 }, { "epoch": 1.89, "learning_rate": 1.7210023303376786e-05, "loss": 0.0077, "step": 727300 }, { "epoch": 1.89, "learning_rate": 1.720613508700532e-05, "loss": 0.006, "step": 727310 }, { "epoch": 1.89, "learning_rate": 1.7202246870633855e-05, "loss": 0.0096, "step": 727320 }, { "epoch": 1.89, "learning_rate": 1.719835865426239e-05, "loss": 0.0082, "step": 727330 }, { "epoch": 1.89, "learning_rate": 1.719447043789093e-05, "loss": 0.0109, "step": 727340 }, { "epoch": 1.89, "learning_rate": 1.7190582221519463e-05, "loss": 0.0096, "step": 727350 }, { "epoch": 1.89, "learning_rate": 1.7186694005147995e-05, "loss": 0.0062, "step": 727360 }, { "epoch": 1.89, "learning_rate": 1.7182805788776533e-05, "loss": 0.0041, "step": 727370 }, { "epoch": 1.89, "learning_rate": 1.7178917572405068e-05, "loss": 0.0059, "step": 727380 }, { "epoch": 1.89, "learning_rate": 1.7175029356033603e-05, "loss": 0.007, "step": 727390 }, { "epoch": 1.89, "learning_rate": 1.7171141139662138e-05, "loss": 0.0071, "step": 727400 }, { "epoch": 1.89, "learning_rate": 1.7167252923290676e-05, "loss": 0.0063, "step": 727410 }, { "epoch": 1.89, "learning_rate": 1.7163364706919207e-05, "loss": 0.0079, "step": 727420 }, { "epoch": 1.89, "learning_rate": 1.7159476490547746e-05, "loss": 0.0081, "step": 727430 }, { "epoch": 1.89, "learning_rate": 1.715558827417628e-05, "loss": 0.0065, "step": 727440 }, { "epoch": 1.89, "learning_rate": 1.7151700057804815e-05, "loss": 0.0104, "step": 727450 }, { "epoch": 1.89, "learning_rate": 1.714781184143335e-05, "loss": 0.0077, "step": 727460 }, { "epoch": 1.89, "learning_rate": 1.7143923625061885e-05, "loss": 0.0042, "step": 727470 }, { "epoch": 1.89, "learning_rate": 1.714003540869042e-05, "loss": 0.0077, "step": 727480 }, { "epoch": 1.89, "learning_rate": 1.7136147192318955e-05, "loss": 0.0073, "step": 727490 }, { "epoch": 1.89, "learning_rate": 1.7132258975947493e-05, "loss": 0.0041, "step": 727500 }, { "epoch": 1.89, "learning_rate": 1.7128370759576028e-05, "loss": 0.0084, "step": 727510 }, { "epoch": 1.89, "learning_rate": 1.7124482543204563e-05, "loss": 0.0103, "step": 727520 }, { "epoch": 1.89, "learning_rate": 1.7120594326833098e-05, "loss": 0.0091, "step": 727530 }, { "epoch": 1.89, "learning_rate": 1.7116706110461636e-05, "loss": 0.0108, "step": 727540 }, { "epoch": 1.89, "learning_rate": 1.7112817894090167e-05, "loss": 0.0061, "step": 727550 }, { "epoch": 1.89, "learning_rate": 1.7108929677718702e-05, "loss": 0.008, "step": 727560 }, { "epoch": 1.89, "learning_rate": 1.710504146134724e-05, "loss": 0.007, "step": 727570 }, { "epoch": 1.89, "learning_rate": 1.7101153244975775e-05, "loss": 0.0071, "step": 727580 }, { "epoch": 1.89, "learning_rate": 1.709726502860431e-05, "loss": 0.0074, "step": 727590 }, { "epoch": 1.89, "learning_rate": 1.7093376812232845e-05, "loss": 0.0061, "step": 727600 }, { "epoch": 1.89, "learning_rate": 1.708948859586138e-05, "loss": 0.0074, "step": 727610 }, { "epoch": 1.89, "learning_rate": 1.7085600379489915e-05, "loss": 0.0071, "step": 727620 }, { "epoch": 1.89, "learning_rate": 1.7081712163118453e-05, "loss": 0.0078, "step": 727630 }, { "epoch": 1.89, "learning_rate": 1.7077823946746988e-05, "loss": 0.0062, "step": 727640 }, { "epoch": 1.89, "learning_rate": 1.7073935730375523e-05, "loss": 0.0076, "step": 727650 }, { "epoch": 1.89, "learning_rate": 1.7070047514004058e-05, "loss": 0.007, "step": 727660 }, { "epoch": 1.89, "learning_rate": 1.7066159297632592e-05, "loss": 0.007, "step": 727670 }, { "epoch": 1.89, "learning_rate": 1.7062271081261127e-05, "loss": 0.0071, "step": 727680 }, { "epoch": 1.89, "learning_rate": 1.7058382864889662e-05, "loss": 0.0057, "step": 727690 }, { "epoch": 1.89, "learning_rate": 1.70544946485182e-05, "loss": 0.0079, "step": 727700 }, { "epoch": 1.89, "learning_rate": 1.7050606432146735e-05, "loss": 0.0065, "step": 727710 }, { "epoch": 1.89, "learning_rate": 1.704671821577527e-05, "loss": 0.0071, "step": 727720 }, { "epoch": 1.89, "learning_rate": 1.7042829999403805e-05, "loss": 0.0063, "step": 727730 }, { "epoch": 1.89, "learning_rate": 1.703894178303234e-05, "loss": 0.0086, "step": 727740 }, { "epoch": 1.89, "learning_rate": 1.7035053566660875e-05, "loss": 0.0093, "step": 727750 }, { "epoch": 1.89, "learning_rate": 1.7031165350289413e-05, "loss": 0.0055, "step": 727760 }, { "epoch": 1.89, "learning_rate": 1.7027277133917948e-05, "loss": 0.0069, "step": 727770 }, { "epoch": 1.89, "learning_rate": 1.7023388917546483e-05, "loss": 0.0073, "step": 727780 }, { "epoch": 1.89, "learning_rate": 1.7019500701175018e-05, "loss": 0.0088, "step": 727790 }, { "epoch": 1.89, "learning_rate": 1.7015612484803552e-05, "loss": 0.0063, "step": 727800 }, { "epoch": 1.89, "learning_rate": 1.7011724268432087e-05, "loss": 0.0086, "step": 727810 }, { "epoch": 1.89, "learning_rate": 1.7007836052060622e-05, "loss": 0.0066, "step": 727820 }, { "epoch": 1.89, "learning_rate": 1.700394783568916e-05, "loss": 0.0051, "step": 727830 }, { "epoch": 1.89, "learning_rate": 1.7000059619317695e-05, "loss": 0.0079, "step": 727840 }, { "epoch": 1.89, "learning_rate": 1.699617140294623e-05, "loss": 0.0089, "step": 727850 }, { "epoch": 1.89, "learning_rate": 1.6992283186574765e-05, "loss": 0.0081, "step": 727860 }, { "epoch": 1.89, "learning_rate": 1.69883949702033e-05, "loss": 0.0107, "step": 727870 }, { "epoch": 1.89, "learning_rate": 1.6984506753831835e-05, "loss": 0.0073, "step": 727880 }, { "epoch": 1.89, "learning_rate": 1.6980618537460373e-05, "loss": 0.0066, "step": 727890 }, { "epoch": 1.89, "learning_rate": 1.6976730321088908e-05, "loss": 0.0061, "step": 727900 }, { "epoch": 1.89, "learning_rate": 1.6972842104717443e-05, "loss": 0.0067, "step": 727910 }, { "epoch": 1.89, "learning_rate": 1.6968953888345977e-05, "loss": 0.0096, "step": 727920 }, { "epoch": 1.89, "learning_rate": 1.6965065671974512e-05, "loss": 0.0065, "step": 727930 }, { "epoch": 1.89, "learning_rate": 1.6961177455603047e-05, "loss": 0.0053, "step": 727940 }, { "epoch": 1.89, "learning_rate": 1.6957289239231582e-05, "loss": 0.0078, "step": 727950 }, { "epoch": 1.89, "learning_rate": 1.695340102286012e-05, "loss": 0.0081, "step": 727960 }, { "epoch": 1.89, "learning_rate": 1.6949512806488655e-05, "loss": 0.0069, "step": 727970 }, { "epoch": 1.89, "learning_rate": 1.694562459011719e-05, "loss": 0.0066, "step": 727980 }, { "epoch": 1.89, "learning_rate": 1.6941736373745725e-05, "loss": 0.006, "step": 727990 }, { "epoch": 1.89, "learning_rate": 1.693784815737426e-05, "loss": 0.0083, "step": 728000 }, { "epoch": 1.89, "eval_cer": 0.8816536990304715, "eval_loss": 0.004557101055979729, "eval_runtime": 107.9878, "eval_samples_per_second": 18.521, "eval_steps_per_second": 4.63, "step": 728000 }, { "epoch": 1.89, "learning_rate": 1.6933959941002795e-05, "loss": 0.0058, "step": 728010 }, { "epoch": 1.89, "learning_rate": 1.6930071724631333e-05, "loss": 0.0069, "step": 728020 }, { "epoch": 1.89, "learning_rate": 1.6926183508259868e-05, "loss": 0.0079, "step": 728030 }, { "epoch": 1.89, "learning_rate": 1.69222952918884e-05, "loss": 0.0083, "step": 728040 }, { "epoch": 1.89, "learning_rate": 1.6918407075516937e-05, "loss": 0.0102, "step": 728050 }, { "epoch": 1.89, "learning_rate": 1.6914518859145472e-05, "loss": 0.0055, "step": 728060 }, { "epoch": 1.89, "learning_rate": 1.6910630642774007e-05, "loss": 0.0071, "step": 728070 }, { "epoch": 1.89, "learning_rate": 1.6906742426402542e-05, "loss": 0.0076, "step": 728080 }, { "epoch": 1.89, "learning_rate": 1.690285421003108e-05, "loss": 0.0068, "step": 728090 }, { "epoch": 1.89, "learning_rate": 1.6898965993659612e-05, "loss": 0.0075, "step": 728100 }, { "epoch": 1.89, "learning_rate": 1.689507777728815e-05, "loss": 0.0055, "step": 728110 }, { "epoch": 1.89, "learning_rate": 1.6891189560916685e-05, "loss": 0.0073, "step": 728120 }, { "epoch": 1.89, "learning_rate": 1.688730134454522e-05, "loss": 0.0073, "step": 728130 }, { "epoch": 1.89, "learning_rate": 1.6883413128173755e-05, "loss": 0.0094, "step": 728140 }, { "epoch": 1.89, "learning_rate": 1.687952491180229e-05, "loss": 0.0075, "step": 728150 }, { "epoch": 1.89, "learning_rate": 1.6875636695430828e-05, "loss": 0.0066, "step": 728160 }, { "epoch": 1.89, "learning_rate": 1.687174847905936e-05, "loss": 0.0063, "step": 728170 }, { "epoch": 1.89, "learning_rate": 1.6867860262687897e-05, "loss": 0.0088, "step": 728180 }, { "epoch": 1.89, "learning_rate": 1.6863972046316432e-05, "loss": 0.0058, "step": 728190 }, { "epoch": 1.89, "learning_rate": 1.6860083829944967e-05, "loss": 0.0059, "step": 728200 }, { "epoch": 1.89, "learning_rate": 1.6856195613573502e-05, "loss": 0.0054, "step": 728210 }, { "epoch": 1.89, "learning_rate": 1.685230739720204e-05, "loss": 0.0107, "step": 728220 }, { "epoch": 1.89, "learning_rate": 1.6848419180830572e-05, "loss": 0.0136, "step": 728230 }, { "epoch": 1.89, "learning_rate": 1.6844530964459107e-05, "loss": 0.0065, "step": 728240 }, { "epoch": 1.89, "learning_rate": 1.6840642748087645e-05, "loss": 0.0075, "step": 728250 }, { "epoch": 1.89, "learning_rate": 1.683675453171618e-05, "loss": 0.0086, "step": 728260 }, { "epoch": 1.89, "learning_rate": 1.6832866315344715e-05, "loss": 0.0101, "step": 728270 }, { "epoch": 1.89, "learning_rate": 1.682897809897325e-05, "loss": 0.0084, "step": 728280 }, { "epoch": 1.89, "learning_rate": 1.6825089882601784e-05, "loss": 0.0087, "step": 728290 }, { "epoch": 1.89, "learning_rate": 1.682120166623032e-05, "loss": 0.0107, "step": 728300 }, { "epoch": 1.89, "learning_rate": 1.6817313449858857e-05, "loss": 0.0084, "step": 728310 }, { "epoch": 1.89, "learning_rate": 1.6813425233487392e-05, "loss": 0.0069, "step": 728320 }, { "epoch": 1.89, "learning_rate": 1.6809537017115927e-05, "loss": 0.0064, "step": 728330 }, { "epoch": 1.89, "learning_rate": 1.6805648800744462e-05, "loss": 0.0061, "step": 728340 }, { "epoch": 1.89, "learning_rate": 1.6801760584372997e-05, "loss": 0.0085, "step": 728350 }, { "epoch": 1.89, "learning_rate": 1.6797872368001532e-05, "loss": 0.0073, "step": 728360 }, { "epoch": 1.89, "learning_rate": 1.6793984151630067e-05, "loss": 0.0078, "step": 728370 }, { "epoch": 1.89, "learning_rate": 1.6790095935258605e-05, "loss": 0.0054, "step": 728380 }, { "epoch": 1.89, "learning_rate": 1.678620771888714e-05, "loss": 0.0073, "step": 728390 }, { "epoch": 1.89, "learning_rate": 1.6782319502515675e-05, "loss": 0.0084, "step": 728400 }, { "epoch": 1.89, "learning_rate": 1.677843128614421e-05, "loss": 0.0088, "step": 728410 }, { "epoch": 1.89, "learning_rate": 1.6774543069772744e-05, "loss": 0.0067, "step": 728420 }, { "epoch": 1.89, "learning_rate": 1.677065485340128e-05, "loss": 0.0058, "step": 728430 }, { "epoch": 1.89, "learning_rate": 1.6766766637029817e-05, "loss": 0.0078, "step": 728440 }, { "epoch": 1.89, "learning_rate": 1.6762878420658352e-05, "loss": 0.0058, "step": 728450 }, { "epoch": 1.89, "learning_rate": 1.6758990204286887e-05, "loss": 0.0057, "step": 728460 }, { "epoch": 1.89, "learning_rate": 1.6755101987915422e-05, "loss": 0.0073, "step": 728470 }, { "epoch": 1.89, "learning_rate": 1.6751213771543957e-05, "loss": 0.0074, "step": 728480 }, { "epoch": 1.89, "learning_rate": 1.674732555517249e-05, "loss": 0.0115, "step": 728490 }, { "epoch": 1.89, "learning_rate": 1.6743437338801027e-05, "loss": 0.006, "step": 728500 }, { "epoch": 1.89, "learning_rate": 1.6739549122429565e-05, "loss": 0.0069, "step": 728510 }, { "epoch": 1.89, "learning_rate": 1.67356609060581e-05, "loss": 0.005, "step": 728520 }, { "epoch": 1.89, "learning_rate": 1.6731772689686635e-05, "loss": 0.0088, "step": 728530 }, { "epoch": 1.89, "learning_rate": 1.672788447331517e-05, "loss": 0.0068, "step": 728540 }, { "epoch": 1.89, "learning_rate": 1.6723996256943704e-05, "loss": 0.0081, "step": 728550 }, { "epoch": 1.89, "learning_rate": 1.672010804057224e-05, "loss": 0.0069, "step": 728560 }, { "epoch": 1.89, "learning_rate": 1.6716219824200777e-05, "loss": 0.0083, "step": 728570 }, { "epoch": 1.89, "learning_rate": 1.6712331607829312e-05, "loss": 0.0071, "step": 728580 }, { "epoch": 1.89, "learning_rate": 1.6708443391457847e-05, "loss": 0.0071, "step": 728590 }, { "epoch": 1.89, "learning_rate": 1.6704555175086382e-05, "loss": 0.0065, "step": 728600 }, { "epoch": 1.89, "learning_rate": 1.6700666958714917e-05, "loss": 0.008, "step": 728610 }, { "epoch": 1.89, "learning_rate": 1.669677874234345e-05, "loss": 0.009, "step": 728620 }, { "epoch": 1.89, "learning_rate": 1.6692890525971987e-05, "loss": 0.008, "step": 728630 }, { "epoch": 1.89, "learning_rate": 1.6689002309600525e-05, "loss": 0.0105, "step": 728640 }, { "epoch": 1.89, "learning_rate": 1.668511409322906e-05, "loss": 0.0064, "step": 728650 }, { "epoch": 1.89, "learning_rate": 1.6681225876857595e-05, "loss": 0.0099, "step": 728660 }, { "epoch": 1.89, "learning_rate": 1.667733766048613e-05, "loss": 0.0074, "step": 728670 }, { "epoch": 1.89, "learning_rate": 1.6673449444114664e-05, "loss": 0.0072, "step": 728680 }, { "epoch": 1.89, "learning_rate": 1.66695612277432e-05, "loss": 0.0055, "step": 728690 }, { "epoch": 1.89, "learning_rate": 1.6665673011371737e-05, "loss": 0.0066, "step": 728700 }, { "epoch": 1.89, "learning_rate": 1.6661784795000272e-05, "loss": 0.0078, "step": 728710 }, { "epoch": 1.89, "learning_rate": 1.6657896578628807e-05, "loss": 0.0065, "step": 728720 }, { "epoch": 1.89, "learning_rate": 1.6654008362257342e-05, "loss": 0.01, "step": 728730 }, { "epoch": 1.89, "learning_rate": 1.6650120145885877e-05, "loss": 0.0058, "step": 728740 }, { "epoch": 1.89, "learning_rate": 1.664623192951441e-05, "loss": 0.0084, "step": 728750 }, { "epoch": 1.89, "learning_rate": 1.6642343713142947e-05, "loss": 0.008, "step": 728760 }, { "epoch": 1.89, "learning_rate": 1.6638455496771485e-05, "loss": 0.0085, "step": 728770 }, { "epoch": 1.89, "learning_rate": 1.663456728040002e-05, "loss": 0.0067, "step": 728780 }, { "epoch": 1.89, "learning_rate": 1.6630679064028554e-05, "loss": 0.0088, "step": 728790 }, { "epoch": 1.89, "learning_rate": 1.662679084765709e-05, "loss": 0.0094, "step": 728800 }, { "epoch": 1.89, "learning_rate": 1.6622902631285624e-05, "loss": 0.0094, "step": 728810 }, { "epoch": 1.89, "learning_rate": 1.661901441491416e-05, "loss": 0.0064, "step": 728820 }, { "epoch": 1.89, "learning_rate": 1.6615126198542694e-05, "loss": 0.0077, "step": 728830 }, { "epoch": 1.89, "learning_rate": 1.6611237982171232e-05, "loss": 0.0065, "step": 728840 }, { "epoch": 1.89, "learning_rate": 1.6607349765799764e-05, "loss": 0.0074, "step": 728850 }, { "epoch": 1.89, "learning_rate": 1.6603461549428302e-05, "loss": 0.0049, "step": 728860 }, { "epoch": 1.89, "learning_rate": 1.6599573333056837e-05, "loss": 0.0076, "step": 728870 }, { "epoch": 1.89, "learning_rate": 1.659568511668537e-05, "loss": 0.0063, "step": 728880 }, { "epoch": 1.89, "learning_rate": 1.6591796900313906e-05, "loss": 0.0081, "step": 728890 }, { "epoch": 1.89, "learning_rate": 1.6587908683942445e-05, "loss": 0.0065, "step": 728900 }, { "epoch": 1.89, "learning_rate": 1.6584020467570976e-05, "loss": 0.0072, "step": 728910 }, { "epoch": 1.89, "learning_rate": 1.658013225119951e-05, "loss": 0.0069, "step": 728920 }, { "epoch": 1.89, "learning_rate": 1.657624403482805e-05, "loss": 0.0103, "step": 728930 }, { "epoch": 1.89, "learning_rate": 1.6572355818456584e-05, "loss": 0.0053, "step": 728940 }, { "epoch": 1.89, "learning_rate": 1.656846760208512e-05, "loss": 0.0051, "step": 728950 }, { "epoch": 1.89, "learning_rate": 1.6564579385713654e-05, "loss": 0.0075, "step": 728960 }, { "epoch": 1.89, "learning_rate": 1.656069116934219e-05, "loss": 0.0063, "step": 728970 }, { "epoch": 1.89, "learning_rate": 1.6556802952970724e-05, "loss": 0.007, "step": 728980 }, { "epoch": 1.89, "learning_rate": 1.6552914736599262e-05, "loss": 0.0079, "step": 728990 }, { "epoch": 1.89, "learning_rate": 1.6549026520227797e-05, "loss": 0.0087, "step": 729000 }, { "epoch": 1.89, "eval_cer": 0.8816676953998133, "eval_loss": 0.004516036249697208, "eval_runtime": 107.8591, "eval_samples_per_second": 18.543, "eval_steps_per_second": 4.636, "step": 729000 }, { "epoch": 1.89, "learning_rate": 1.654513830385633e-05, "loss": 0.0087, "step": 729010 }, { "epoch": 1.89, "learning_rate": 1.6541250087484866e-05, "loss": 0.0127, "step": 729020 }, { "epoch": 1.89, "learning_rate": 1.6537361871113405e-05, "loss": 0.0065, "step": 729030 }, { "epoch": 1.89, "learning_rate": 1.6533473654741936e-05, "loss": 0.0053, "step": 729040 }, { "epoch": 1.89, "learning_rate": 1.652958543837047e-05, "loss": 0.0085, "step": 729050 }, { "epoch": 1.89, "learning_rate": 1.652569722199901e-05, "loss": 0.0072, "step": 729060 }, { "epoch": 1.89, "learning_rate": 1.6521809005627544e-05, "loss": 0.006, "step": 729070 }, { "epoch": 1.89, "learning_rate": 1.651792078925608e-05, "loss": 0.0103, "step": 729080 }, { "epoch": 1.89, "learning_rate": 1.6514032572884614e-05, "loss": 0.007, "step": 729090 }, { "epoch": 1.89, "learning_rate": 1.651014435651315e-05, "loss": 0.0071, "step": 729100 }, { "epoch": 1.89, "learning_rate": 1.6506256140141684e-05, "loss": 0.0066, "step": 729110 }, { "epoch": 1.89, "learning_rate": 1.6502367923770222e-05, "loss": 0.0058, "step": 729120 }, { "epoch": 1.89, "learning_rate": 1.6498479707398757e-05, "loss": 0.0085, "step": 729130 }, { "epoch": 1.89, "learning_rate": 1.649459149102729e-05, "loss": 0.0061, "step": 729140 }, { "epoch": 1.89, "learning_rate": 1.6490703274655826e-05, "loss": 0.0081, "step": 729150 }, { "epoch": 1.89, "learning_rate": 1.648681505828436e-05, "loss": 0.0067, "step": 729160 }, { "epoch": 1.89, "learning_rate": 1.6482926841912896e-05, "loss": 0.0069, "step": 729170 }, { "epoch": 1.89, "learning_rate": 1.647903862554143e-05, "loss": 0.0062, "step": 729180 }, { "epoch": 1.89, "learning_rate": 1.647515040916997e-05, "loss": 0.0061, "step": 729190 }, { "epoch": 1.89, "learning_rate": 1.6471262192798504e-05, "loss": 0.0051, "step": 729200 }, { "epoch": 1.89, "learning_rate": 1.646737397642704e-05, "loss": 0.0065, "step": 729210 }, { "epoch": 1.89, "learning_rate": 1.6463485760055574e-05, "loss": 0.0095, "step": 729220 }, { "epoch": 1.89, "learning_rate": 1.645959754368411e-05, "loss": 0.0055, "step": 729230 }, { "epoch": 1.89, "learning_rate": 1.6455709327312644e-05, "loss": 0.0065, "step": 729240 }, { "epoch": 1.89, "learning_rate": 1.6451821110941182e-05, "loss": 0.0057, "step": 729250 }, { "epoch": 1.89, "learning_rate": 1.6447932894569717e-05, "loss": 0.0054, "step": 729260 }, { "epoch": 1.89, "learning_rate": 1.644404467819825e-05, "loss": 0.0068, "step": 729270 }, { "epoch": 1.89, "learning_rate": 1.6440156461826786e-05, "loss": 0.0056, "step": 729280 }, { "epoch": 1.89, "learning_rate": 1.643626824545532e-05, "loss": 0.0068, "step": 729290 }, { "epoch": 1.89, "learning_rate": 1.6432380029083856e-05, "loss": 0.0059, "step": 729300 }, { "epoch": 1.89, "learning_rate": 1.642849181271239e-05, "loss": 0.0063, "step": 729310 }, { "epoch": 1.89, "learning_rate": 1.642460359634093e-05, "loss": 0.008, "step": 729320 }, { "epoch": 1.89, "learning_rate": 1.6420715379969464e-05, "loss": 0.0062, "step": 729330 }, { "epoch": 1.89, "learning_rate": 1.6416827163598e-05, "loss": 0.0063, "step": 729340 }, { "epoch": 1.89, "learning_rate": 1.6412938947226534e-05, "loss": 0.0065, "step": 729350 }, { "epoch": 1.89, "learning_rate": 1.640905073085507e-05, "loss": 0.0089, "step": 729360 }, { "epoch": 1.89, "learning_rate": 1.6405162514483604e-05, "loss": 0.0058, "step": 729370 }, { "epoch": 1.89, "learning_rate": 1.6401274298112142e-05, "loss": 0.0073, "step": 729380 }, { "epoch": 1.89, "learning_rate": 1.6397386081740677e-05, "loss": 0.0059, "step": 729390 }, { "epoch": 1.89, "learning_rate": 1.639349786536921e-05, "loss": 0.0071, "step": 729400 }, { "epoch": 1.89, "learning_rate": 1.6389609648997746e-05, "loss": 0.0071, "step": 729410 }, { "epoch": 1.89, "learning_rate": 1.638572143262628e-05, "loss": 0.0094, "step": 729420 }, { "epoch": 1.89, "learning_rate": 1.6381833216254816e-05, "loss": 0.0056, "step": 729430 }, { "epoch": 1.89, "learning_rate": 1.637794499988335e-05, "loss": 0.0096, "step": 729440 }, { "epoch": 1.89, "learning_rate": 1.637405678351189e-05, "loss": 0.0076, "step": 729450 }, { "epoch": 1.89, "learning_rate": 1.6370168567140424e-05, "loss": 0.0085, "step": 729460 }, { "epoch": 1.89, "learning_rate": 1.636628035076896e-05, "loss": 0.009, "step": 729470 }, { "epoch": 1.89, "learning_rate": 1.6362392134397494e-05, "loss": 0.0093, "step": 729480 }, { "epoch": 1.89, "learning_rate": 1.635850391802603e-05, "loss": 0.0085, "step": 729490 }, { "epoch": 1.89, "learning_rate": 1.6354615701654564e-05, "loss": 0.005, "step": 729500 }, { "epoch": 1.89, "learning_rate": 1.6350727485283102e-05, "loss": 0.0083, "step": 729510 }, { "epoch": 1.89, "learning_rate": 1.6346839268911637e-05, "loss": 0.0056, "step": 729520 }, { "epoch": 1.89, "learning_rate": 1.6342951052540168e-05, "loss": 0.0063, "step": 729530 }, { "epoch": 1.89, "learning_rate": 1.6339062836168706e-05, "loss": 0.0046, "step": 729540 }, { "epoch": 1.89, "learning_rate": 1.633517461979724e-05, "loss": 0.0069, "step": 729550 }, { "epoch": 1.89, "learning_rate": 1.6331286403425776e-05, "loss": 0.0049, "step": 729560 }, { "epoch": 1.89, "learning_rate": 1.632739818705431e-05, "loss": 0.0051, "step": 729570 }, { "epoch": 1.89, "learning_rate": 1.632350997068285e-05, "loss": 0.0093, "step": 729580 }, { "epoch": 1.89, "learning_rate": 1.631962175431138e-05, "loss": 0.0099, "step": 729590 }, { "epoch": 1.89, "learning_rate": 1.6315733537939916e-05, "loss": 0.0072, "step": 729600 }, { "epoch": 1.89, "learning_rate": 1.6311845321568454e-05, "loss": 0.0069, "step": 729610 }, { "epoch": 1.89, "learning_rate": 1.630795710519699e-05, "loss": 0.0071, "step": 729620 }, { "epoch": 1.89, "learning_rate": 1.6304068888825524e-05, "loss": 0.0084, "step": 729630 }, { "epoch": 1.89, "learning_rate": 1.630018067245406e-05, "loss": 0.0073, "step": 729640 }, { "epoch": 1.89, "learning_rate": 1.6296292456082597e-05, "loss": 0.0086, "step": 729650 }, { "epoch": 1.89, "learning_rate": 1.6292404239711128e-05, "loss": 0.0087, "step": 729660 }, { "epoch": 1.89, "learning_rate": 1.6288516023339666e-05, "loss": 0.0056, "step": 729670 }, { "epoch": 1.89, "learning_rate": 1.62846278069682e-05, "loss": 0.0053, "step": 729680 }, { "epoch": 1.89, "learning_rate": 1.6280739590596736e-05, "loss": 0.0059, "step": 729690 }, { "epoch": 1.89, "learning_rate": 1.627685137422527e-05, "loss": 0.0096, "step": 729700 }, { "epoch": 1.89, "learning_rate": 1.627296315785381e-05, "loss": 0.007, "step": 729710 }, { "epoch": 1.89, "learning_rate": 1.626907494148234e-05, "loss": 0.006, "step": 729720 }, { "epoch": 1.89, "learning_rate": 1.6265186725110876e-05, "loss": 0.0059, "step": 729730 }, { "epoch": 1.89, "learning_rate": 1.6261298508739414e-05, "loss": 0.0088, "step": 729740 }, { "epoch": 1.89, "learning_rate": 1.625741029236795e-05, "loss": 0.007, "step": 729750 }, { "epoch": 1.89, "learning_rate": 1.6253522075996483e-05, "loss": 0.0056, "step": 729760 }, { "epoch": 1.89, "learning_rate": 1.624963385962502e-05, "loss": 0.0059, "step": 729770 }, { "epoch": 1.89, "learning_rate": 1.6245745643253553e-05, "loss": 0.0088, "step": 729780 }, { "epoch": 1.89, "learning_rate": 1.6241857426882088e-05, "loss": 0.0085, "step": 729790 }, { "epoch": 1.89, "learning_rate": 1.6237969210510626e-05, "loss": 0.007, "step": 729800 }, { "epoch": 1.89, "learning_rate": 1.623408099413916e-05, "loss": 0.007, "step": 729810 }, { "epoch": 1.89, "learning_rate": 1.6230192777767696e-05, "loss": 0.0056, "step": 729820 }, { "epoch": 1.89, "learning_rate": 1.622630456139623e-05, "loss": 0.0051, "step": 729830 }, { "epoch": 1.89, "learning_rate": 1.6222416345024766e-05, "loss": 0.0063, "step": 729840 }, { "epoch": 1.89, "learning_rate": 1.62185281286533e-05, "loss": 0.0079, "step": 729850 }, { "epoch": 1.89, "learning_rate": 1.6214639912281835e-05, "loss": 0.0042, "step": 729860 }, { "epoch": 1.89, "learning_rate": 1.6210751695910374e-05, "loss": 0.0086, "step": 729870 }, { "epoch": 1.89, "learning_rate": 1.620686347953891e-05, "loss": 0.0064, "step": 729880 }, { "epoch": 1.89, "learning_rate": 1.6202975263167443e-05, "loss": 0.0064, "step": 729890 }, { "epoch": 1.89, "learning_rate": 1.619908704679598e-05, "loss": 0.0069, "step": 729900 }, { "epoch": 1.89, "learning_rate": 1.6195198830424513e-05, "loss": 0.0069, "step": 729910 }, { "epoch": 1.89, "learning_rate": 1.6191310614053048e-05, "loss": 0.0101, "step": 729920 }, { "epoch": 1.89, "learning_rate": 1.6187422397681586e-05, "loss": 0.0064, "step": 729930 }, { "epoch": 1.89, "learning_rate": 1.618353418131012e-05, "loss": 0.0081, "step": 729940 }, { "epoch": 1.89, "learning_rate": 1.6179645964938656e-05, "loss": 0.0049, "step": 729950 }, { "epoch": 1.89, "learning_rate": 1.617575774856719e-05, "loss": 0.0078, "step": 729960 }, { "epoch": 1.89, "learning_rate": 1.6171869532195726e-05, "loss": 0.006, "step": 729970 }, { "epoch": 1.89, "learning_rate": 1.616798131582426e-05, "loss": 0.0079, "step": 729980 }, { "epoch": 1.89, "learning_rate": 1.6164093099452795e-05, "loss": 0.0062, "step": 729990 }, { "epoch": 1.89, "learning_rate": 1.6160204883081334e-05, "loss": 0.0071, "step": 730000 }, { "epoch": 1.89, "eval_cer": 0.8816620968520765, "eval_loss": 0.004505546763539314, "eval_runtime": 107.7228, "eval_samples_per_second": 18.566, "eval_steps_per_second": 4.642, "step": 730000 }, { "epoch": 1.89, "learning_rate": 1.615631666670987e-05, "loss": 0.0076, "step": 730010 }, { "epoch": 1.89, "learning_rate": 1.6152428450338403e-05, "loss": 0.0074, "step": 730020 }, { "epoch": 1.89, "learning_rate": 1.6148540233966938e-05, "loss": 0.0059, "step": 730030 }, { "epoch": 1.89, "learning_rate": 1.6144652017595473e-05, "loss": 0.0079, "step": 730040 }, { "epoch": 1.89, "learning_rate": 1.6140763801224008e-05, "loss": 0.0085, "step": 730050 }, { "epoch": 1.89, "learning_rate": 1.6136875584852546e-05, "loss": 0.0053, "step": 730060 }, { "epoch": 1.89, "learning_rate": 1.613298736848108e-05, "loss": 0.0067, "step": 730070 }, { "epoch": 1.89, "learning_rate": 1.6129099152109616e-05, "loss": 0.0056, "step": 730080 }, { "epoch": 1.89, "learning_rate": 1.612521093573815e-05, "loss": 0.0126, "step": 730090 }, { "epoch": 1.89, "learning_rate": 1.6121322719366686e-05, "loss": 0.012, "step": 730100 }, { "epoch": 1.89, "learning_rate": 1.611743450299522e-05, "loss": 0.0072, "step": 730110 }, { "epoch": 1.89, "learning_rate": 1.6113546286623755e-05, "loss": 0.0077, "step": 730120 }, { "epoch": 1.89, "learning_rate": 1.6109658070252294e-05, "loss": 0.0107, "step": 730130 }, { "epoch": 1.89, "learning_rate": 1.610576985388083e-05, "loss": 0.0053, "step": 730140 }, { "epoch": 1.89, "learning_rate": 1.6101881637509363e-05, "loss": 0.0057, "step": 730150 }, { "epoch": 1.89, "learning_rate": 1.6097993421137898e-05, "loss": 0.0056, "step": 730160 }, { "epoch": 1.89, "learning_rate": 1.6094105204766433e-05, "loss": 0.0052, "step": 730170 }, { "epoch": 1.89, "learning_rate": 1.6090216988394968e-05, "loss": 0.0084, "step": 730180 }, { "epoch": 1.89, "learning_rate": 1.6086328772023506e-05, "loss": 0.0092, "step": 730190 }, { "epoch": 1.89, "learning_rate": 1.608244055565204e-05, "loss": 0.0043, "step": 730200 }, { "epoch": 1.89, "learning_rate": 1.6078552339280573e-05, "loss": 0.0071, "step": 730210 }, { "epoch": 1.89, "learning_rate": 1.607466412290911e-05, "loss": 0.004, "step": 730220 }, { "epoch": 1.89, "learning_rate": 1.6070775906537646e-05, "loss": 0.0071, "step": 730230 }, { "epoch": 1.89, "learning_rate": 1.606688769016618e-05, "loss": 0.0082, "step": 730240 }, { "epoch": 1.89, "learning_rate": 1.6062999473794715e-05, "loss": 0.0073, "step": 730250 }, { "epoch": 1.89, "learning_rate": 1.6059111257423254e-05, "loss": 0.0078, "step": 730260 }, { "epoch": 1.89, "learning_rate": 1.605522304105179e-05, "loss": 0.0077, "step": 730270 }, { "epoch": 1.89, "learning_rate": 1.605133482468032e-05, "loss": 0.0048, "step": 730280 }, { "epoch": 1.89, "learning_rate": 1.6047446608308858e-05, "loss": 0.0101, "step": 730290 }, { "epoch": 1.89, "learning_rate": 1.6043558391937393e-05, "loss": 0.0084, "step": 730300 }, { "epoch": 1.89, "learning_rate": 1.6039670175565928e-05, "loss": 0.0093, "step": 730310 }, { "epoch": 1.89, "learning_rate": 1.6035781959194463e-05, "loss": 0.0078, "step": 730320 }, { "epoch": 1.89, "learning_rate": 1.6031893742823e-05, "loss": 0.0072, "step": 730330 }, { "epoch": 1.89, "learning_rate": 1.6028005526451533e-05, "loss": 0.0065, "step": 730340 }, { "epoch": 1.89, "learning_rate": 1.602411731008007e-05, "loss": 0.0072, "step": 730350 }, { "epoch": 1.89, "learning_rate": 1.6020229093708606e-05, "loss": 0.0075, "step": 730360 }, { "epoch": 1.89, "learning_rate": 1.601634087733714e-05, "loss": 0.0085, "step": 730370 }, { "epoch": 1.89, "learning_rate": 1.6012452660965675e-05, "loss": 0.0062, "step": 730380 }, { "epoch": 1.89, "learning_rate": 1.6008564444594214e-05, "loss": 0.0063, "step": 730390 }, { "epoch": 1.89, "learning_rate": 1.6004676228222745e-05, "loss": 0.0069, "step": 730400 }, { "epoch": 1.89, "learning_rate": 1.600078801185128e-05, "loss": 0.0045, "step": 730410 }, { "epoch": 1.89, "learning_rate": 1.5996899795479818e-05, "loss": 0.0055, "step": 730420 }, { "epoch": 1.89, "learning_rate": 1.5993011579108353e-05, "loss": 0.0074, "step": 730430 }, { "epoch": 1.89, "learning_rate": 1.5989123362736888e-05, "loss": 0.0074, "step": 730440 }, { "epoch": 1.89, "learning_rate": 1.5985235146365423e-05, "loss": 0.0054, "step": 730450 }, { "epoch": 1.89, "learning_rate": 1.5981346929993958e-05, "loss": 0.0073, "step": 730460 }, { "epoch": 1.89, "learning_rate": 1.5977458713622493e-05, "loss": 0.0057, "step": 730470 }, { "epoch": 1.89, "learning_rate": 1.597357049725103e-05, "loss": 0.007, "step": 730480 }, { "epoch": 1.89, "learning_rate": 1.5969682280879566e-05, "loss": 0.0073, "step": 730490 }, { "epoch": 1.89, "learning_rate": 1.59657940645081e-05, "loss": 0.0072, "step": 730500 }, { "epoch": 1.89, "learning_rate": 1.5961905848136635e-05, "loss": 0.0057, "step": 730510 }, { "epoch": 1.89, "learning_rate": 1.595801763176517e-05, "loss": 0.0074, "step": 730520 }, { "epoch": 1.89, "learning_rate": 1.5954129415393705e-05, "loss": 0.0075, "step": 730530 }, { "epoch": 1.89, "learning_rate": 1.595024119902224e-05, "loss": 0.0058, "step": 730540 }, { "epoch": 1.89, "learning_rate": 1.5946352982650778e-05, "loss": 0.006, "step": 730550 }, { "epoch": 1.89, "learning_rate": 1.5942464766279313e-05, "loss": 0.0075, "step": 730560 }, { "epoch": 1.89, "learning_rate": 1.5938576549907848e-05, "loss": 0.0075, "step": 730570 }, { "epoch": 1.89, "learning_rate": 1.5934688333536383e-05, "loss": 0.0082, "step": 730580 }, { "epoch": 1.89, "learning_rate": 1.5930800117164918e-05, "loss": 0.0074, "step": 730590 }, { "epoch": 1.89, "learning_rate": 1.5926911900793453e-05, "loss": 0.0061, "step": 730600 }, { "epoch": 1.89, "learning_rate": 1.592302368442199e-05, "loss": 0.0058, "step": 730610 }, { "epoch": 1.89, "learning_rate": 1.5919135468050526e-05, "loss": 0.0083, "step": 730620 }, { "epoch": 1.89, "learning_rate": 1.591524725167906e-05, "loss": 0.0066, "step": 730630 }, { "epoch": 1.89, "learning_rate": 1.5911359035307595e-05, "loss": 0.0063, "step": 730640 }, { "epoch": 1.89, "learning_rate": 1.590747081893613e-05, "loss": 0.0063, "step": 730650 }, { "epoch": 1.89, "learning_rate": 1.5903582602564665e-05, "loss": 0.0062, "step": 730660 }, { "epoch": 1.89, "learning_rate": 1.58996943861932e-05, "loss": 0.0073, "step": 730670 }, { "epoch": 1.89, "learning_rate": 1.5895806169821738e-05, "loss": 0.007, "step": 730680 }, { "epoch": 1.89, "learning_rate": 1.5891917953450273e-05, "loss": 0.0066, "step": 730690 }, { "epoch": 1.89, "learning_rate": 1.5888029737078808e-05, "loss": 0.0062, "step": 730700 }, { "epoch": 1.89, "learning_rate": 1.5884141520707343e-05, "loss": 0.0088, "step": 730710 }, { "epoch": 1.89, "learning_rate": 1.5880253304335878e-05, "loss": 0.0072, "step": 730720 }, { "epoch": 1.89, "learning_rate": 1.5876365087964412e-05, "loss": 0.0079, "step": 730730 }, { "epoch": 1.89, "learning_rate": 1.587247687159295e-05, "loss": 0.0074, "step": 730740 }, { "epoch": 1.89, "learning_rate": 1.5868588655221486e-05, "loss": 0.0056, "step": 730750 }, { "epoch": 1.89, "learning_rate": 1.586470043885002e-05, "loss": 0.0075, "step": 730760 }, { "epoch": 1.89, "learning_rate": 1.5860812222478555e-05, "loss": 0.0064, "step": 730770 }, { "epoch": 1.89, "learning_rate": 1.585692400610709e-05, "loss": 0.0055, "step": 730780 }, { "epoch": 1.89, "learning_rate": 1.5853035789735625e-05, "loss": 0.0078, "step": 730790 }, { "epoch": 1.89, "learning_rate": 1.584914757336416e-05, "loss": 0.0148, "step": 730800 }, { "epoch": 1.89, "learning_rate": 1.5845259356992698e-05, "loss": 0.0072, "step": 730810 }, { "epoch": 1.89, "learning_rate": 1.5841371140621233e-05, "loss": 0.0059, "step": 730820 }, { "epoch": 1.89, "learning_rate": 1.5837482924249768e-05, "loss": 0.0087, "step": 730830 }, { "epoch": 1.89, "learning_rate": 1.5833594707878303e-05, "loss": 0.0084, "step": 730840 }, { "epoch": 1.89, "learning_rate": 1.5829706491506838e-05, "loss": 0.0056, "step": 730850 }, { "epoch": 1.89, "learning_rate": 1.5825818275135372e-05, "loss": 0.0058, "step": 730860 }, { "epoch": 1.89, "learning_rate": 1.582193005876391e-05, "loss": 0.0071, "step": 730870 }, { "epoch": 1.89, "learning_rate": 1.5818041842392446e-05, "loss": 0.0066, "step": 730880 }, { "epoch": 1.89, "learning_rate": 1.581415362602098e-05, "loss": 0.009, "step": 730890 }, { "epoch": 1.89, "learning_rate": 1.5810265409649515e-05, "loss": 0.0059, "step": 730900 }, { "epoch": 1.89, "learning_rate": 1.580637719327805e-05, "loss": 0.0059, "step": 730910 }, { "epoch": 1.89, "learning_rate": 1.5802488976906585e-05, "loss": 0.0052, "step": 730920 }, { "epoch": 1.89, "learning_rate": 1.579860076053512e-05, "loss": 0.007, "step": 730930 }, { "epoch": 1.89, "learning_rate": 1.5794712544163658e-05, "loss": 0.0068, "step": 730940 }, { "epoch": 1.89, "learning_rate": 1.5790824327792193e-05, "loss": 0.0094, "step": 730950 }, { "epoch": 1.89, "learning_rate": 1.5786936111420724e-05, "loss": 0.0046, "step": 730960 }, { "epoch": 1.89, "learning_rate": 1.5783047895049263e-05, "loss": 0.0052, "step": 730970 }, { "epoch": 1.89, "learning_rate": 1.5779159678677798e-05, "loss": 0.0081, "step": 730980 }, { "epoch": 1.89, "learning_rate": 1.5775271462306332e-05, "loss": 0.0067, "step": 730990 }, { "epoch": 1.89, "learning_rate": 1.5771383245934867e-05, "loss": 0.0073, "step": 731000 }, { "epoch": 1.89, "eval_cer": 0.881657897941274, "eval_loss": 0.004491262603551149, "eval_runtime": 107.9137, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 731000 }, { "epoch": 1.89, "learning_rate": 1.5767495029563406e-05, "loss": 0.0076, "step": 731010 }, { "epoch": 1.89, "learning_rate": 1.5763606813191937e-05, "loss": 0.0068, "step": 731020 }, { "epoch": 1.89, "learning_rate": 1.5759718596820475e-05, "loss": 0.0068, "step": 731030 }, { "epoch": 1.89, "learning_rate": 1.575583038044901e-05, "loss": 0.009, "step": 731040 }, { "epoch": 1.89, "learning_rate": 1.5751942164077545e-05, "loss": 0.0069, "step": 731050 }, { "epoch": 1.9, "learning_rate": 1.574805394770608e-05, "loss": 0.0065, "step": 731060 }, { "epoch": 1.9, "learning_rate": 1.5744165731334618e-05, "loss": 0.0066, "step": 731070 }, { "epoch": 1.9, "learning_rate": 1.574027751496315e-05, "loss": 0.0066, "step": 731080 }, { "epoch": 1.9, "learning_rate": 1.5736389298591684e-05, "loss": 0.0088, "step": 731090 }, { "epoch": 1.9, "learning_rate": 1.5732501082220223e-05, "loss": 0.0086, "step": 731100 }, { "epoch": 1.9, "learning_rate": 1.5728612865848758e-05, "loss": 0.0051, "step": 731110 }, { "epoch": 1.9, "learning_rate": 1.5724724649477292e-05, "loss": 0.0085, "step": 731120 }, { "epoch": 1.9, "learning_rate": 1.5720836433105827e-05, "loss": 0.0053, "step": 731130 }, { "epoch": 1.9, "learning_rate": 1.5716948216734362e-05, "loss": 0.0075, "step": 731140 }, { "epoch": 1.9, "learning_rate": 1.5713060000362897e-05, "loss": 0.0057, "step": 731150 }, { "epoch": 1.9, "learning_rate": 1.5709171783991435e-05, "loss": 0.0064, "step": 731160 }, { "epoch": 1.9, "learning_rate": 1.570528356761997e-05, "loss": 0.0067, "step": 731170 }, { "epoch": 1.9, "learning_rate": 1.5701395351248505e-05, "loss": 0.0086, "step": 731180 }, { "epoch": 1.9, "learning_rate": 1.569750713487704e-05, "loss": 0.0056, "step": 731190 }, { "epoch": 1.9, "learning_rate": 1.5693618918505578e-05, "loss": 0.0078, "step": 731200 }, { "epoch": 1.9, "learning_rate": 1.568973070213411e-05, "loss": 0.0073, "step": 731210 }, { "epoch": 1.9, "learning_rate": 1.5685842485762644e-05, "loss": 0.0094, "step": 731220 }, { "epoch": 1.9, "learning_rate": 1.5681954269391183e-05, "loss": 0.0057, "step": 731230 }, { "epoch": 1.9, "learning_rate": 1.5678066053019718e-05, "loss": 0.0083, "step": 731240 }, { "epoch": 1.9, "learning_rate": 1.5674177836648252e-05, "loss": 0.0088, "step": 731250 }, { "epoch": 1.9, "learning_rate": 1.5670289620276787e-05, "loss": 0.0068, "step": 731260 }, { "epoch": 1.9, "learning_rate": 1.5666401403905322e-05, "loss": 0.0089, "step": 731270 }, { "epoch": 1.9, "learning_rate": 1.5662513187533857e-05, "loss": 0.0094, "step": 731280 }, { "epoch": 1.9, "learning_rate": 1.5658624971162395e-05, "loss": 0.0074, "step": 731290 }, { "epoch": 1.9, "learning_rate": 1.565473675479093e-05, "loss": 0.0065, "step": 731300 }, { "epoch": 1.9, "learning_rate": 1.5650848538419465e-05, "loss": 0.0073, "step": 731310 }, { "epoch": 1.9, "learning_rate": 1.5646960322048e-05, "loss": 0.0103, "step": 731320 }, { "epoch": 1.9, "learning_rate": 1.5643072105676535e-05, "loss": 0.0082, "step": 731330 }, { "epoch": 1.9, "learning_rate": 1.563918388930507e-05, "loss": 0.0057, "step": 731340 }, { "epoch": 1.9, "learning_rate": 1.5635295672933604e-05, "loss": 0.0048, "step": 731350 }, { "epoch": 1.9, "learning_rate": 1.5631407456562143e-05, "loss": 0.0056, "step": 731360 }, { "epoch": 1.9, "learning_rate": 1.5627519240190677e-05, "loss": 0.009, "step": 731370 }, { "epoch": 1.9, "learning_rate": 1.5623631023819212e-05, "loss": 0.0059, "step": 731380 }, { "epoch": 1.9, "learning_rate": 1.5619742807447747e-05, "loss": 0.0079, "step": 731390 }, { "epoch": 1.9, "learning_rate": 1.5615854591076282e-05, "loss": 0.0071, "step": 731400 }, { "epoch": 1.9, "learning_rate": 1.5611966374704817e-05, "loss": 0.007, "step": 731410 }, { "epoch": 1.9, "learning_rate": 1.5608078158333355e-05, "loss": 0.0073, "step": 731420 }, { "epoch": 1.9, "learning_rate": 1.560418994196189e-05, "loss": 0.0099, "step": 731430 }, { "epoch": 1.9, "learning_rate": 1.5600301725590425e-05, "loss": 0.0057, "step": 731440 }, { "epoch": 1.9, "learning_rate": 1.559641350921896e-05, "loss": 0.0137, "step": 731450 }, { "epoch": 1.9, "learning_rate": 1.5592525292847495e-05, "loss": 0.0091, "step": 731460 }, { "epoch": 1.9, "learning_rate": 1.558863707647603e-05, "loss": 0.0055, "step": 731470 }, { "epoch": 1.9, "learning_rate": 1.5584748860104564e-05, "loss": 0.0054, "step": 731480 }, { "epoch": 1.9, "learning_rate": 1.5580860643733103e-05, "loss": 0.0089, "step": 731490 }, { "epoch": 1.9, "learning_rate": 1.5576972427361637e-05, "loss": 0.004, "step": 731500 }, { "epoch": 1.9, "learning_rate": 1.5573084210990172e-05, "loss": 0.007, "step": 731510 }, { "epoch": 1.9, "learning_rate": 1.5569195994618707e-05, "loss": 0.0095, "step": 731520 }, { "epoch": 1.9, "learning_rate": 1.5565307778247242e-05, "loss": 0.0058, "step": 731530 }, { "epoch": 1.9, "learning_rate": 1.5561419561875777e-05, "loss": 0.0042, "step": 731540 }, { "epoch": 1.9, "learning_rate": 1.5557531345504315e-05, "loss": 0.0097, "step": 731550 }, { "epoch": 1.9, "learning_rate": 1.555364312913285e-05, "loss": 0.0083, "step": 731560 }, { "epoch": 1.9, "learning_rate": 1.5549754912761385e-05, "loss": 0.0076, "step": 731570 }, { "epoch": 1.9, "learning_rate": 1.554586669638992e-05, "loss": 0.0075, "step": 731580 }, { "epoch": 1.9, "learning_rate": 1.5541978480018455e-05, "loss": 0.0072, "step": 731590 }, { "epoch": 1.9, "learning_rate": 1.553809026364699e-05, "loss": 0.0095, "step": 731600 }, { "epoch": 1.9, "learning_rate": 1.5534202047275524e-05, "loss": 0.0109, "step": 731610 }, { "epoch": 1.9, "learning_rate": 1.5530313830904063e-05, "loss": 0.006, "step": 731620 }, { "epoch": 1.9, "learning_rate": 1.5526425614532597e-05, "loss": 0.0052, "step": 731630 }, { "epoch": 1.9, "learning_rate": 1.5522537398161132e-05, "loss": 0.0094, "step": 731640 }, { "epoch": 1.9, "learning_rate": 1.5518649181789667e-05, "loss": 0.0069, "step": 731650 }, { "epoch": 1.9, "learning_rate": 1.5514760965418202e-05, "loss": 0.0077, "step": 731660 }, { "epoch": 1.9, "learning_rate": 1.5510872749046737e-05, "loss": 0.0081, "step": 731670 }, { "epoch": 1.9, "learning_rate": 1.5506984532675272e-05, "loss": 0.0073, "step": 731680 }, { "epoch": 1.9, "learning_rate": 1.550309631630381e-05, "loss": 0.0073, "step": 731690 }, { "epoch": 1.9, "learning_rate": 1.549920809993234e-05, "loss": 0.0087, "step": 731700 }, { "epoch": 1.9, "learning_rate": 1.549531988356088e-05, "loss": 0.008, "step": 731710 }, { "epoch": 1.9, "learning_rate": 1.5491431667189415e-05, "loss": 0.0091, "step": 731720 }, { "epoch": 1.9, "learning_rate": 1.548754345081795e-05, "loss": 0.0068, "step": 731730 }, { "epoch": 1.9, "learning_rate": 1.5483655234446484e-05, "loss": 0.0072, "step": 731740 }, { "epoch": 1.9, "learning_rate": 1.5479767018075023e-05, "loss": 0.0072, "step": 731750 }, { "epoch": 1.9, "learning_rate": 1.5475878801703554e-05, "loss": 0.0087, "step": 731760 }, { "epoch": 1.9, "learning_rate": 1.547199058533209e-05, "loss": 0.0058, "step": 731770 }, { "epoch": 1.9, "learning_rate": 1.5468102368960627e-05, "loss": 0.0061, "step": 731780 }, { "epoch": 1.9, "learning_rate": 1.5464214152589162e-05, "loss": 0.0055, "step": 731790 }, { "epoch": 1.9, "learning_rate": 1.5460325936217697e-05, "loss": 0.0068, "step": 731800 }, { "epoch": 1.9, "learning_rate": 1.5456437719846232e-05, "loss": 0.0063, "step": 731810 }, { "epoch": 1.9, "learning_rate": 1.545254950347477e-05, "loss": 0.0067, "step": 731820 }, { "epoch": 1.9, "learning_rate": 1.54486612871033e-05, "loss": 0.007, "step": 731830 }, { "epoch": 1.9, "learning_rate": 1.544477307073184e-05, "loss": 0.0059, "step": 731840 }, { "epoch": 1.9, "learning_rate": 1.5440884854360375e-05, "loss": 0.0072, "step": 731850 }, { "epoch": 1.9, "learning_rate": 1.543699663798891e-05, "loss": 0.0057, "step": 731860 }, { "epoch": 1.9, "learning_rate": 1.5433108421617444e-05, "loss": 0.0076, "step": 731870 }, { "epoch": 1.9, "learning_rate": 1.5429220205245983e-05, "loss": 0.0064, "step": 731880 }, { "epoch": 1.9, "learning_rate": 1.5425331988874514e-05, "loss": 0.0063, "step": 731890 }, { "epoch": 1.9, "learning_rate": 1.542144377250305e-05, "loss": 0.0079, "step": 731900 }, { "epoch": 1.9, "learning_rate": 1.5417555556131587e-05, "loss": 0.0066, "step": 731910 }, { "epoch": 1.9, "learning_rate": 1.5413667339760122e-05, "loss": 0.0085, "step": 731920 }, { "epoch": 1.9, "learning_rate": 1.5409779123388657e-05, "loss": 0.0058, "step": 731930 }, { "epoch": 1.9, "learning_rate": 1.5405890907017192e-05, "loss": 0.0058, "step": 731940 }, { "epoch": 1.9, "learning_rate": 1.5402002690645727e-05, "loss": 0.0051, "step": 731950 }, { "epoch": 1.9, "learning_rate": 1.539811447427426e-05, "loss": 0.0067, "step": 731960 }, { "epoch": 1.9, "learning_rate": 1.53942262579028e-05, "loss": 0.0066, "step": 731970 }, { "epoch": 1.9, "learning_rate": 1.5390338041531335e-05, "loss": 0.0062, "step": 731980 }, { "epoch": 1.9, "learning_rate": 1.538644982515987e-05, "loss": 0.007, "step": 731990 }, { "epoch": 1.9, "learning_rate": 1.5382561608788404e-05, "loss": 0.0063, "step": 732000 }, { "epoch": 1.9, "eval_cer": 0.8816676953998133, "eval_loss": 0.004524824675172567, "eval_runtime": 107.8657, "eval_samples_per_second": 18.542, "eval_steps_per_second": 4.635, "step": 732000 }, { "epoch": 1.9, "learning_rate": 1.537867339241694e-05, "loss": 0.0089, "step": 732010 }, { "epoch": 1.9, "learning_rate": 1.5374785176045474e-05, "loss": 0.0103, "step": 732020 }, { "epoch": 1.9, "learning_rate": 1.537089695967401e-05, "loss": 0.0067, "step": 732030 }, { "epoch": 1.9, "learning_rate": 1.5367008743302547e-05, "loss": 0.0067, "step": 732040 }, { "epoch": 1.9, "learning_rate": 1.5363120526931082e-05, "loss": 0.008, "step": 732050 }, { "epoch": 1.9, "learning_rate": 1.5359232310559617e-05, "loss": 0.007, "step": 732060 }, { "epoch": 1.9, "learning_rate": 1.535534409418815e-05, "loss": 0.0062, "step": 732070 }, { "epoch": 1.9, "learning_rate": 1.5351455877816687e-05, "loss": 0.0062, "step": 732080 }, { "epoch": 1.9, "learning_rate": 1.534756766144522e-05, "loss": 0.0079, "step": 732090 }, { "epoch": 1.9, "learning_rate": 1.534367944507376e-05, "loss": 0.006, "step": 732100 }, { "epoch": 1.9, "learning_rate": 1.5339791228702295e-05, "loss": 0.0075, "step": 732110 }, { "epoch": 1.9, "learning_rate": 1.533590301233083e-05, "loss": 0.0065, "step": 732120 }, { "epoch": 1.9, "learning_rate": 1.5332014795959364e-05, "loss": 0.0069, "step": 732130 }, { "epoch": 1.9, "learning_rate": 1.53281265795879e-05, "loss": 0.0068, "step": 732140 }, { "epoch": 1.9, "learning_rate": 1.5324238363216434e-05, "loss": 0.0065, "step": 732150 }, { "epoch": 1.9, "learning_rate": 1.532035014684497e-05, "loss": 0.0061, "step": 732160 }, { "epoch": 1.9, "learning_rate": 1.5316461930473507e-05, "loss": 0.0066, "step": 732170 }, { "epoch": 1.9, "learning_rate": 1.5312573714102042e-05, "loss": 0.0075, "step": 732180 }, { "epoch": 1.9, "learning_rate": 1.5308685497730577e-05, "loss": 0.0085, "step": 732190 }, { "epoch": 1.9, "learning_rate": 1.530479728135911e-05, "loss": 0.0076, "step": 732200 }, { "epoch": 1.9, "learning_rate": 1.5300909064987647e-05, "loss": 0.0073, "step": 732210 }, { "epoch": 1.9, "learning_rate": 1.529702084861618e-05, "loss": 0.006, "step": 732220 }, { "epoch": 1.9, "learning_rate": 1.529313263224472e-05, "loss": 0.0056, "step": 732230 }, { "epoch": 1.9, "learning_rate": 1.5289244415873254e-05, "loss": 0.0087, "step": 732240 }, { "epoch": 1.9, "learning_rate": 1.528535619950179e-05, "loss": 0.0055, "step": 732250 }, { "epoch": 1.9, "learning_rate": 1.5281467983130324e-05, "loss": 0.0071, "step": 732260 }, { "epoch": 1.9, "learning_rate": 1.527757976675886e-05, "loss": 0.0067, "step": 732270 }, { "epoch": 1.9, "learning_rate": 1.5273691550387394e-05, "loss": 0.0136, "step": 732280 }, { "epoch": 1.9, "learning_rate": 1.526980333401593e-05, "loss": 0.0077, "step": 732290 }, { "epoch": 1.9, "learning_rate": 1.5265915117644467e-05, "loss": 0.007, "step": 732300 }, { "epoch": 1.9, "learning_rate": 1.5262026901273002e-05, "loss": 0.0066, "step": 732310 }, { "epoch": 1.9, "learning_rate": 1.5258138684901535e-05, "loss": 0.0072, "step": 732320 }, { "epoch": 1.9, "learning_rate": 1.5254250468530072e-05, "loss": 0.0059, "step": 732330 }, { "epoch": 1.9, "learning_rate": 1.5250362252158606e-05, "loss": 0.0086, "step": 732340 }, { "epoch": 1.9, "learning_rate": 1.5246474035787141e-05, "loss": 0.0089, "step": 732350 }, { "epoch": 1.9, "learning_rate": 1.5242585819415678e-05, "loss": 0.005, "step": 732360 }, { "epoch": 1.9, "learning_rate": 1.5238697603044213e-05, "loss": 0.0065, "step": 732370 }, { "epoch": 1.9, "learning_rate": 1.5234809386672748e-05, "loss": 0.0092, "step": 732380 }, { "epoch": 1.9, "learning_rate": 1.5230921170301282e-05, "loss": 0.0084, "step": 732390 }, { "epoch": 1.9, "learning_rate": 1.5227032953929819e-05, "loss": 0.0053, "step": 732400 }, { "epoch": 1.9, "learning_rate": 1.5223144737558354e-05, "loss": 0.0085, "step": 732410 }, { "epoch": 1.9, "learning_rate": 1.521925652118689e-05, "loss": 0.0091, "step": 732420 }, { "epoch": 1.9, "learning_rate": 1.5215368304815425e-05, "loss": 0.0059, "step": 732430 }, { "epoch": 1.9, "learning_rate": 1.5211480088443962e-05, "loss": 0.0049, "step": 732440 }, { "epoch": 1.9, "learning_rate": 1.5207591872072495e-05, "loss": 0.0072, "step": 732450 }, { "epoch": 1.9, "learning_rate": 1.520370365570103e-05, "loss": 0.0058, "step": 732460 }, { "epoch": 1.9, "learning_rate": 1.5199815439329566e-05, "loss": 0.0081, "step": 732470 }, { "epoch": 1.9, "learning_rate": 1.5195927222958101e-05, "loss": 0.007, "step": 732480 }, { "epoch": 1.9, "learning_rate": 1.5192039006586638e-05, "loss": 0.0056, "step": 732490 }, { "epoch": 1.9, "learning_rate": 1.5188150790215173e-05, "loss": 0.0084, "step": 732500 }, { "epoch": 1.9, "learning_rate": 1.5184262573843708e-05, "loss": 0.0076, "step": 732510 }, { "epoch": 1.9, "learning_rate": 1.5180374357472242e-05, "loss": 0.0074, "step": 732520 }, { "epoch": 1.9, "learning_rate": 1.5176486141100779e-05, "loss": 0.0055, "step": 732530 }, { "epoch": 1.9, "learning_rate": 1.5172597924729314e-05, "loss": 0.0086, "step": 732540 }, { "epoch": 1.9, "learning_rate": 1.516870970835785e-05, "loss": 0.0108, "step": 732550 }, { "epoch": 1.9, "learning_rate": 1.5164821491986385e-05, "loss": 0.0058, "step": 732560 }, { "epoch": 1.9, "learning_rate": 1.5160933275614918e-05, "loss": 0.0081, "step": 732570 }, { "epoch": 1.9, "learning_rate": 1.5157045059243455e-05, "loss": 0.0072, "step": 732580 }, { "epoch": 1.9, "learning_rate": 1.515315684287199e-05, "loss": 0.0078, "step": 732590 }, { "epoch": 1.9, "learning_rate": 1.5149268626500526e-05, "loss": 0.0053, "step": 732600 }, { "epoch": 1.9, "learning_rate": 1.5145380410129061e-05, "loss": 0.0084, "step": 732610 }, { "epoch": 1.9, "learning_rate": 1.5141492193757598e-05, "loss": 0.0063, "step": 732620 }, { "epoch": 1.9, "learning_rate": 1.5137603977386131e-05, "loss": 0.0078, "step": 732630 }, { "epoch": 1.9, "learning_rate": 1.5133715761014668e-05, "loss": 0.0084, "step": 732640 }, { "epoch": 1.9, "learning_rate": 1.5129827544643202e-05, "loss": 0.0082, "step": 732650 }, { "epoch": 1.9, "learning_rate": 1.5125939328271739e-05, "loss": 0.0082, "step": 732660 }, { "epoch": 1.9, "learning_rate": 1.5122051111900274e-05, "loss": 0.0041, "step": 732670 }, { "epoch": 1.9, "learning_rate": 1.511816289552881e-05, "loss": 0.0088, "step": 732680 }, { "epoch": 1.9, "learning_rate": 1.5114274679157344e-05, "loss": 0.0086, "step": 732690 }, { "epoch": 1.9, "learning_rate": 1.5110386462785878e-05, "loss": 0.007, "step": 732700 }, { "epoch": 1.9, "learning_rate": 1.5106498246414415e-05, "loss": 0.006, "step": 732710 }, { "epoch": 1.9, "learning_rate": 1.510261003004295e-05, "loss": 0.0053, "step": 732720 }, { "epoch": 1.9, "learning_rate": 1.5098721813671486e-05, "loss": 0.0063, "step": 732730 }, { "epoch": 1.9, "learning_rate": 1.5094833597300021e-05, "loss": 0.0058, "step": 732740 }, { "epoch": 1.9, "learning_rate": 1.5090945380928558e-05, "loss": 0.0075, "step": 732750 }, { "epoch": 1.9, "learning_rate": 1.5087057164557091e-05, "loss": 0.011, "step": 732760 }, { "epoch": 1.9, "learning_rate": 1.5083168948185628e-05, "loss": 0.012, "step": 732770 }, { "epoch": 1.9, "learning_rate": 1.5079280731814162e-05, "loss": 0.0062, "step": 732780 }, { "epoch": 1.9, "learning_rate": 1.5075392515442699e-05, "loss": 0.0081, "step": 732790 }, { "epoch": 1.9, "learning_rate": 1.5071504299071234e-05, "loss": 0.0065, "step": 732800 }, { "epoch": 1.9, "learning_rate": 1.506761608269977e-05, "loss": 0.0059, "step": 732810 }, { "epoch": 1.9, "learning_rate": 1.5063727866328304e-05, "loss": 0.0073, "step": 732820 }, { "epoch": 1.9, "learning_rate": 1.5059839649956838e-05, "loss": 0.0072, "step": 732830 }, { "epoch": 1.9, "learning_rate": 1.5055951433585375e-05, "loss": 0.0085, "step": 732840 }, { "epoch": 1.9, "learning_rate": 1.505206321721391e-05, "loss": 0.0072, "step": 732850 }, { "epoch": 1.9, "learning_rate": 1.5048175000842446e-05, "loss": 0.0054, "step": 732860 }, { "epoch": 1.9, "learning_rate": 1.5044286784470981e-05, "loss": 0.0091, "step": 732870 }, { "epoch": 1.9, "learning_rate": 1.5040398568099516e-05, "loss": 0.0072, "step": 732880 }, { "epoch": 1.9, "learning_rate": 1.5036510351728051e-05, "loss": 0.0059, "step": 732890 }, { "epoch": 1.9, "learning_rate": 1.5032622135356588e-05, "loss": 0.0121, "step": 732900 }, { "epoch": 1.9, "learning_rate": 1.5028733918985122e-05, "loss": 0.0054, "step": 732910 }, { "epoch": 1.9, "learning_rate": 1.5024845702613659e-05, "loss": 0.0083, "step": 732920 }, { "epoch": 1.9, "learning_rate": 1.5020957486242194e-05, "loss": 0.0089, "step": 732930 }, { "epoch": 1.9, "learning_rate": 1.5017069269870727e-05, "loss": 0.0062, "step": 732940 }, { "epoch": 1.9, "learning_rate": 1.5013181053499264e-05, "loss": 0.0082, "step": 732950 }, { "epoch": 1.9, "learning_rate": 1.5009292837127798e-05, "loss": 0.0057, "step": 732960 }, { "epoch": 1.9, "learning_rate": 1.5005404620756335e-05, "loss": 0.0055, "step": 732970 }, { "epoch": 1.9, "learning_rate": 1.500151640438487e-05, "loss": 0.0091, "step": 732980 }, { "epoch": 1.9, "learning_rate": 1.4997628188013406e-05, "loss": 0.006, "step": 732990 }, { "epoch": 1.9, "learning_rate": 1.4993739971641941e-05, "loss": 0.0092, "step": 733000 }, { "epoch": 1.9, "eval_cer": 0.8816718943106159, "eval_loss": 0.004549098201096058, "eval_runtime": 107.784, "eval_samples_per_second": 18.556, "eval_steps_per_second": 4.639, "step": 733000 }, { "epoch": 1.9, "learning_rate": 1.4989851755270476e-05, "loss": 0.0063, "step": 733010 }, { "epoch": 1.9, "learning_rate": 1.4985963538899011e-05, "loss": 0.0087, "step": 733020 }, { "epoch": 1.9, "learning_rate": 1.4982075322527546e-05, "loss": 0.0084, "step": 733030 }, { "epoch": 1.9, "learning_rate": 1.4978187106156082e-05, "loss": 0.0079, "step": 733040 }, { "epoch": 1.9, "learning_rate": 1.4974298889784617e-05, "loss": 0.0069, "step": 733050 }, { "epoch": 1.9, "learning_rate": 1.4970410673413154e-05, "loss": 0.0075, "step": 733060 }, { "epoch": 1.9, "learning_rate": 1.4966522457041687e-05, "loss": 0.0075, "step": 733070 }, { "epoch": 1.9, "learning_rate": 1.4962634240670224e-05, "loss": 0.0069, "step": 733080 }, { "epoch": 1.9, "learning_rate": 1.4958746024298758e-05, "loss": 0.009, "step": 733090 }, { "epoch": 1.9, "learning_rate": 1.4954857807927295e-05, "loss": 0.0064, "step": 733100 }, { "epoch": 1.9, "learning_rate": 1.495096959155583e-05, "loss": 0.0059, "step": 733110 }, { "epoch": 1.9, "learning_rate": 1.4947081375184366e-05, "loss": 0.0071, "step": 733120 }, { "epoch": 1.9, "learning_rate": 1.49431931588129e-05, "loss": 0.0078, "step": 733130 }, { "epoch": 1.9, "learning_rate": 1.4939304942441434e-05, "loss": 0.0067, "step": 733140 }, { "epoch": 1.9, "learning_rate": 1.4935416726069971e-05, "loss": 0.0064, "step": 733150 }, { "epoch": 1.9, "learning_rate": 1.4931528509698506e-05, "loss": 0.0056, "step": 733160 }, { "epoch": 1.9, "learning_rate": 1.4927640293327042e-05, "loss": 0.006, "step": 733170 }, { "epoch": 1.9, "learning_rate": 1.4923752076955577e-05, "loss": 0.0056, "step": 733180 }, { "epoch": 1.9, "learning_rate": 1.4919863860584112e-05, "loss": 0.0061, "step": 733190 }, { "epoch": 1.9, "learning_rate": 1.4915975644212647e-05, "loss": 0.0056, "step": 733200 }, { "epoch": 1.9, "learning_rate": 1.4912087427841183e-05, "loss": 0.0064, "step": 733210 }, { "epoch": 1.9, "learning_rate": 1.4908199211469718e-05, "loss": 0.0081, "step": 733220 }, { "epoch": 1.9, "learning_rate": 1.4904310995098255e-05, "loss": 0.0062, "step": 733230 }, { "epoch": 1.9, "learning_rate": 1.490042277872679e-05, "loss": 0.0064, "step": 733240 }, { "epoch": 1.9, "learning_rate": 1.4896534562355323e-05, "loss": 0.0078, "step": 733250 }, { "epoch": 1.9, "learning_rate": 1.489264634598386e-05, "loss": 0.0048, "step": 733260 }, { "epoch": 1.9, "learning_rate": 1.4888758129612394e-05, "loss": 0.009, "step": 733270 }, { "epoch": 1.9, "learning_rate": 1.4884869913240931e-05, "loss": 0.0081, "step": 733280 }, { "epoch": 1.9, "learning_rate": 1.4880981696869466e-05, "loss": 0.008, "step": 733290 }, { "epoch": 1.9, "learning_rate": 1.4877093480498002e-05, "loss": 0.0079, "step": 733300 }, { "epoch": 1.9, "learning_rate": 1.4873205264126537e-05, "loss": 0.0072, "step": 733310 }, { "epoch": 1.9, "learning_rate": 1.4869317047755072e-05, "loss": 0.008, "step": 733320 }, { "epoch": 1.9, "learning_rate": 1.4865428831383607e-05, "loss": 0.005, "step": 733330 }, { "epoch": 1.9, "learning_rate": 1.4861540615012143e-05, "loss": 0.0076, "step": 733340 }, { "epoch": 1.9, "learning_rate": 1.4857652398640678e-05, "loss": 0.0107, "step": 733350 }, { "epoch": 1.9, "learning_rate": 1.4853764182269215e-05, "loss": 0.0055, "step": 733360 }, { "epoch": 1.9, "learning_rate": 1.484987596589775e-05, "loss": 0.0072, "step": 733370 }, { "epoch": 1.9, "learning_rate": 1.4845987749526283e-05, "loss": 0.0065, "step": 733380 }, { "epoch": 1.9, "learning_rate": 1.484209953315482e-05, "loss": 0.0066, "step": 733390 }, { "epoch": 1.9, "learning_rate": 1.4838211316783354e-05, "loss": 0.0066, "step": 733400 }, { "epoch": 1.9, "learning_rate": 1.4834323100411891e-05, "loss": 0.0067, "step": 733410 }, { "epoch": 1.9, "learning_rate": 1.4830434884040426e-05, "loss": 0.0062, "step": 733420 }, { "epoch": 1.9, "learning_rate": 1.4826546667668962e-05, "loss": 0.0054, "step": 733430 }, { "epoch": 1.9, "learning_rate": 1.4822658451297495e-05, "loss": 0.0079, "step": 733440 }, { "epoch": 1.9, "learning_rate": 1.4818770234926032e-05, "loss": 0.009, "step": 733450 }, { "epoch": 1.9, "learning_rate": 1.4814882018554567e-05, "loss": 0.0062, "step": 733460 }, { "epoch": 1.9, "learning_rate": 1.4810993802183103e-05, "loss": 0.0059, "step": 733470 }, { "epoch": 1.9, "learning_rate": 1.4807105585811638e-05, "loss": 0.0064, "step": 733480 }, { "epoch": 1.9, "learning_rate": 1.4803217369440175e-05, "loss": 0.0076, "step": 733490 }, { "epoch": 1.9, "learning_rate": 1.4799329153068708e-05, "loss": 0.0063, "step": 733500 }, { "epoch": 1.9, "learning_rate": 1.4795440936697243e-05, "loss": 0.0083, "step": 733510 }, { "epoch": 1.9, "learning_rate": 1.479155272032578e-05, "loss": 0.0061, "step": 733520 }, { "epoch": 1.9, "learning_rate": 1.4787664503954314e-05, "loss": 0.0064, "step": 733530 }, { "epoch": 1.9, "learning_rate": 1.4783776287582851e-05, "loss": 0.0041, "step": 733540 }, { "epoch": 1.9, "learning_rate": 1.4779888071211386e-05, "loss": 0.0048, "step": 733550 }, { "epoch": 1.9, "learning_rate": 1.477599985483992e-05, "loss": 0.0073, "step": 733560 }, { "epoch": 1.9, "learning_rate": 1.4772111638468455e-05, "loss": 0.009, "step": 733570 }, { "epoch": 1.9, "learning_rate": 1.4768223422096992e-05, "loss": 0.0073, "step": 733580 }, { "epoch": 1.9, "learning_rate": 1.4764335205725527e-05, "loss": 0.0067, "step": 733590 }, { "epoch": 1.9, "learning_rate": 1.4760446989354063e-05, "loss": 0.0043, "step": 733600 }, { "epoch": 1.9, "learning_rate": 1.4756558772982598e-05, "loss": 0.0084, "step": 733610 }, { "epoch": 1.9, "learning_rate": 1.4752670556611135e-05, "loss": 0.006, "step": 733620 }, { "epoch": 1.9, "learning_rate": 1.4748782340239668e-05, "loss": 0.0051, "step": 733630 }, { "epoch": 1.9, "learning_rate": 1.4744894123868203e-05, "loss": 0.0078, "step": 733640 }, { "epoch": 1.9, "learning_rate": 1.474100590749674e-05, "loss": 0.0072, "step": 733650 }, { "epoch": 1.9, "learning_rate": 1.4737117691125274e-05, "loss": 0.0077, "step": 733660 }, { "epoch": 1.9, "learning_rate": 1.473322947475381e-05, "loss": 0.0075, "step": 733670 }, { "epoch": 1.9, "learning_rate": 1.4729341258382346e-05, "loss": 0.0077, "step": 733680 }, { "epoch": 1.9, "learning_rate": 1.472545304201088e-05, "loss": 0.0087, "step": 733690 }, { "epoch": 1.9, "learning_rate": 1.4721564825639415e-05, "loss": 0.0064, "step": 733700 }, { "epoch": 1.9, "learning_rate": 1.4717676609267952e-05, "loss": 0.0049, "step": 733710 }, { "epoch": 1.9, "learning_rate": 1.4713788392896487e-05, "loss": 0.0087, "step": 733720 }, { "epoch": 1.9, "learning_rate": 1.4709900176525022e-05, "loss": 0.0072, "step": 733730 }, { "epoch": 1.9, "learning_rate": 1.4706011960153558e-05, "loss": 0.0085, "step": 733740 }, { "epoch": 1.9, "learning_rate": 1.4702123743782091e-05, "loss": 0.008, "step": 733750 }, { "epoch": 1.9, "learning_rate": 1.4698235527410628e-05, "loss": 0.0062, "step": 733760 }, { "epoch": 1.9, "learning_rate": 1.4694347311039163e-05, "loss": 0.0082, "step": 733770 }, { "epoch": 1.9, "learning_rate": 1.46904590946677e-05, "loss": 0.0077, "step": 733780 }, { "epoch": 1.9, "learning_rate": 1.4686570878296234e-05, "loss": 0.0087, "step": 733790 }, { "epoch": 1.9, "learning_rate": 1.468268266192477e-05, "loss": 0.0059, "step": 733800 }, { "epoch": 1.9, "learning_rate": 1.4678794445553304e-05, "loss": 0.0053, "step": 733810 }, { "epoch": 1.9, "learning_rate": 1.4674906229181839e-05, "loss": 0.0079, "step": 733820 }, { "epoch": 1.9, "learning_rate": 1.4671018012810375e-05, "loss": 0.0088, "step": 733830 }, { "epoch": 1.9, "learning_rate": 1.466712979643891e-05, "loss": 0.0059, "step": 733840 }, { "epoch": 1.9, "learning_rate": 1.4663241580067447e-05, "loss": 0.0077, "step": 733850 }, { "epoch": 1.9, "learning_rate": 1.4659353363695982e-05, "loss": 0.0097, "step": 733860 }, { "epoch": 1.9, "learning_rate": 1.4655465147324517e-05, "loss": 0.0075, "step": 733870 }, { "epoch": 1.9, "learning_rate": 1.4651576930953051e-05, "loss": 0.0091, "step": 733880 }, { "epoch": 1.9, "learning_rate": 1.4647688714581588e-05, "loss": 0.0077, "step": 733890 }, { "epoch": 1.9, "learning_rate": 1.4643800498210123e-05, "loss": 0.007, "step": 733900 }, { "epoch": 1.9, "learning_rate": 1.463991228183866e-05, "loss": 0.007, "step": 733910 }, { "epoch": 1.9, "learning_rate": 1.4636024065467194e-05, "loss": 0.0069, "step": 733920 }, { "epoch": 1.9, "learning_rate": 1.463213584909573e-05, "loss": 0.0063, "step": 733930 }, { "epoch": 1.9, "learning_rate": 1.4628247632724264e-05, "loss": 0.0057, "step": 733940 }, { "epoch": 1.9, "learning_rate": 1.4624359416352799e-05, "loss": 0.0158, "step": 733950 }, { "epoch": 1.9, "learning_rate": 1.4620471199981335e-05, "loss": 0.0068, "step": 733960 }, { "epoch": 1.9, "learning_rate": 1.461658298360987e-05, "loss": 0.0057, "step": 733970 }, { "epoch": 1.9, "learning_rate": 1.4612694767238407e-05, "loss": 0.0065, "step": 733980 }, { "epoch": 1.9, "learning_rate": 1.4608806550866942e-05, "loss": 0.0094, "step": 733990 }, { "epoch": 1.9, "learning_rate": 1.4604918334495477e-05, "loss": 0.0072, "step": 734000 }, { "epoch": 1.9, "eval_cer": 0.8816606972151424, "eval_loss": 0.0044957599602639675, "eval_runtime": 107.9535, "eval_samples_per_second": 18.526, "eval_steps_per_second": 4.632, "step": 734000 }, { "epoch": 1.9, "learning_rate": 1.4601030118124011e-05, "loss": 0.0064, "step": 734010 }, { "epoch": 1.9, "learning_rate": 1.4597141901752548e-05, "loss": 0.011, "step": 734020 }, { "epoch": 1.9, "learning_rate": 1.4593253685381083e-05, "loss": 0.0067, "step": 734030 }, { "epoch": 1.9, "learning_rate": 1.458936546900962e-05, "loss": 0.0082, "step": 734040 }, { "epoch": 1.9, "learning_rate": 1.4585477252638154e-05, "loss": 0.0079, "step": 734050 }, { "epoch": 1.9, "learning_rate": 1.4581589036266687e-05, "loss": 0.0081, "step": 734060 }, { "epoch": 1.9, "learning_rate": 1.4577700819895224e-05, "loss": 0.008, "step": 734070 }, { "epoch": 1.9, "learning_rate": 1.4573812603523759e-05, "loss": 0.0085, "step": 734080 }, { "epoch": 1.9, "learning_rate": 1.4569924387152295e-05, "loss": 0.0061, "step": 734090 }, { "epoch": 1.9, "learning_rate": 1.456603617078083e-05, "loss": 0.0077, "step": 734100 }, { "epoch": 1.9, "learning_rate": 1.4562147954409367e-05, "loss": 0.0075, "step": 734110 }, { "epoch": 1.9, "learning_rate": 1.45582597380379e-05, "loss": 0.0085, "step": 734120 }, { "epoch": 1.9, "learning_rate": 1.4554371521666436e-05, "loss": 0.0079, "step": 734130 }, { "epoch": 1.9, "learning_rate": 1.4550483305294971e-05, "loss": 0.0058, "step": 734140 }, { "epoch": 1.9, "learning_rate": 1.4546595088923508e-05, "loss": 0.008, "step": 734150 }, { "epoch": 1.9, "learning_rate": 1.4542706872552043e-05, "loss": 0.0063, "step": 734160 }, { "epoch": 1.9, "learning_rate": 1.453881865618058e-05, "loss": 0.0067, "step": 734170 }, { "epoch": 1.9, "learning_rate": 1.4534930439809112e-05, "loss": 0.0059, "step": 734180 }, { "epoch": 1.9, "learning_rate": 1.4531042223437647e-05, "loss": 0.0106, "step": 734190 }, { "epoch": 1.9, "learning_rate": 1.4527154007066184e-05, "loss": 0.0087, "step": 734200 }, { "epoch": 1.9, "learning_rate": 1.4523265790694719e-05, "loss": 0.0065, "step": 734210 }, { "epoch": 1.9, "learning_rate": 1.4519377574323255e-05, "loss": 0.0059, "step": 734220 }, { "epoch": 1.9, "learning_rate": 1.451548935795179e-05, "loss": 0.0062, "step": 734230 }, { "epoch": 1.9, "learning_rate": 1.4511601141580327e-05, "loss": 0.0065, "step": 734240 }, { "epoch": 1.9, "learning_rate": 1.450771292520886e-05, "loss": 0.0072, "step": 734250 }, { "epoch": 1.9, "learning_rate": 1.4503824708837396e-05, "loss": 0.0096, "step": 734260 }, { "epoch": 1.9, "learning_rate": 1.4499936492465931e-05, "loss": 0.007, "step": 734270 }, { "epoch": 1.9, "learning_rate": 1.4496048276094468e-05, "loss": 0.0061, "step": 734280 }, { "epoch": 1.9, "learning_rate": 1.4492160059723003e-05, "loss": 0.0086, "step": 734290 }, { "epoch": 1.9, "learning_rate": 1.448827184335154e-05, "loss": 0.006, "step": 734300 }, { "epoch": 1.9, "learning_rate": 1.4484383626980072e-05, "loss": 0.0107, "step": 734310 }, { "epoch": 1.9, "learning_rate": 1.4480495410608607e-05, "loss": 0.0055, "step": 734320 }, { "epoch": 1.9, "learning_rate": 1.4476607194237144e-05, "loss": 0.0068, "step": 734330 }, { "epoch": 1.9, "learning_rate": 1.4472718977865679e-05, "loss": 0.0066, "step": 734340 }, { "epoch": 1.9, "learning_rate": 1.4468830761494215e-05, "loss": 0.0069, "step": 734350 }, { "epoch": 1.9, "learning_rate": 1.446494254512275e-05, "loss": 0.0067, "step": 734360 }, { "epoch": 1.9, "learning_rate": 1.4461054328751285e-05, "loss": 0.0126, "step": 734370 }, { "epoch": 1.9, "learning_rate": 1.445716611237982e-05, "loss": 0.0074, "step": 734380 }, { "epoch": 1.9, "learning_rate": 1.4453277896008356e-05, "loss": 0.0075, "step": 734390 }, { "epoch": 1.9, "learning_rate": 1.4449389679636891e-05, "loss": 0.007, "step": 734400 }, { "epoch": 1.9, "learning_rate": 1.4445501463265426e-05, "loss": 0.0055, "step": 734410 }, { "epoch": 1.9, "learning_rate": 1.4441613246893963e-05, "loss": 0.0096, "step": 734420 }, { "epoch": 1.9, "learning_rate": 1.4437725030522496e-05, "loss": 0.0091, "step": 734430 }, { "epoch": 1.9, "learning_rate": 1.4433836814151032e-05, "loss": 0.0063, "step": 734440 }, { "epoch": 1.9, "learning_rate": 1.4429948597779567e-05, "loss": 0.006, "step": 734450 }, { "epoch": 1.9, "learning_rate": 1.4426060381408104e-05, "loss": 0.0084, "step": 734460 }, { "epoch": 1.9, "learning_rate": 1.4422172165036639e-05, "loss": 0.0052, "step": 734470 }, { "epoch": 1.9, "learning_rate": 1.4418283948665175e-05, "loss": 0.01, "step": 734480 }, { "epoch": 1.9, "learning_rate": 1.4414395732293708e-05, "loss": 0.0162, "step": 734490 }, { "epoch": 1.9, "learning_rate": 1.4410507515922243e-05, "loss": 0.0057, "step": 734500 }, { "epoch": 1.9, "learning_rate": 1.440661929955078e-05, "loss": 0.0071, "step": 734510 }, { "epoch": 1.9, "learning_rate": 1.4402731083179315e-05, "loss": 0.0094, "step": 734520 }, { "epoch": 1.9, "learning_rate": 1.4398842866807851e-05, "loss": 0.0087, "step": 734530 }, { "epoch": 1.9, "learning_rate": 1.4394954650436386e-05, "loss": 0.0087, "step": 734540 }, { "epoch": 1.9, "learning_rate": 1.4391066434064923e-05, "loss": 0.007, "step": 734550 }, { "epoch": 1.9, "learning_rate": 1.4387178217693456e-05, "loss": 0.0084, "step": 734560 }, { "epoch": 1.9, "learning_rate": 1.4383290001321992e-05, "loss": 0.0068, "step": 734570 }, { "epoch": 1.9, "learning_rate": 1.4379401784950527e-05, "loss": 0.0067, "step": 734580 }, { "epoch": 1.9, "learning_rate": 1.4375513568579064e-05, "loss": 0.0063, "step": 734590 }, { "epoch": 1.9, "learning_rate": 1.4371625352207599e-05, "loss": 0.0053, "step": 734600 }, { "epoch": 1.9, "learning_rate": 1.4367737135836135e-05, "loss": 0.0069, "step": 734610 }, { "epoch": 1.9, "learning_rate": 1.4363848919464668e-05, "loss": 0.0053, "step": 734620 }, { "epoch": 1.9, "learning_rate": 1.4359960703093203e-05, "loss": 0.0066, "step": 734630 }, { "epoch": 1.9, "learning_rate": 1.435607248672174e-05, "loss": 0.0083, "step": 734640 }, { "epoch": 1.9, "learning_rate": 1.4352184270350275e-05, "loss": 0.0078, "step": 734650 }, { "epoch": 1.9, "learning_rate": 1.4348296053978811e-05, "loss": 0.0056, "step": 734660 }, { "epoch": 1.9, "learning_rate": 1.4344407837607346e-05, "loss": 0.0077, "step": 734670 }, { "epoch": 1.9, "learning_rate": 1.4340519621235881e-05, "loss": 0.0093, "step": 734680 }, { "epoch": 1.9, "learning_rate": 1.4336631404864416e-05, "loss": 0.0099, "step": 734690 }, { "epoch": 1.9, "learning_rate": 1.4332743188492952e-05, "loss": 0.0058, "step": 734700 }, { "epoch": 1.9, "learning_rate": 1.4328854972121487e-05, "loss": 0.0062, "step": 734710 }, { "epoch": 1.9, "learning_rate": 1.4324966755750024e-05, "loss": 0.0066, "step": 734720 }, { "epoch": 1.9, "learning_rate": 1.4321078539378559e-05, "loss": 0.0077, "step": 734730 }, { "epoch": 1.9, "learning_rate": 1.4317190323007092e-05, "loss": 0.006, "step": 734740 }, { "epoch": 1.9, "learning_rate": 1.4313302106635628e-05, "loss": 0.006, "step": 734750 }, { "epoch": 1.9, "learning_rate": 1.4309413890264163e-05, "loss": 0.0066, "step": 734760 }, { "epoch": 1.9, "learning_rate": 1.43055256738927e-05, "loss": 0.0075, "step": 734770 }, { "epoch": 1.9, "learning_rate": 1.4301637457521235e-05, "loss": 0.0059, "step": 734780 }, { "epoch": 1.9, "learning_rate": 1.4297749241149771e-05, "loss": 0.009, "step": 734790 }, { "epoch": 1.9, "learning_rate": 1.4293861024778304e-05, "loss": 0.009, "step": 734800 }, { "epoch": 1.9, "learning_rate": 1.4289972808406841e-05, "loss": 0.0056, "step": 734810 }, { "epoch": 1.9, "learning_rate": 1.4286084592035376e-05, "loss": 0.0069, "step": 734820 }, { "epoch": 1.9, "learning_rate": 1.4282196375663912e-05, "loss": 0.0039, "step": 734830 }, { "epoch": 1.9, "learning_rate": 1.4278308159292447e-05, "loss": 0.0046, "step": 734840 }, { "epoch": 1.9, "learning_rate": 1.4274419942920984e-05, "loss": 0.0062, "step": 734850 }, { "epoch": 1.9, "learning_rate": 1.4270531726549519e-05, "loss": 0.0077, "step": 734860 }, { "epoch": 1.9, "learning_rate": 1.4266643510178052e-05, "loss": 0.0079, "step": 734870 }, { "epoch": 1.9, "learning_rate": 1.4262755293806588e-05, "loss": 0.0074, "step": 734880 }, { "epoch": 1.9, "learning_rate": 1.4258867077435123e-05, "loss": 0.0075, "step": 734890 }, { "epoch": 1.9, "learning_rate": 1.425497886106366e-05, "loss": 0.0082, "step": 734900 }, { "epoch": 1.9, "learning_rate": 1.4251090644692195e-05, "loss": 0.0048, "step": 734910 }, { "epoch": 1.91, "learning_rate": 1.4247202428320731e-05, "loss": 0.0075, "step": 734920 }, { "epoch": 1.91, "learning_rate": 1.4243314211949264e-05, "loss": 0.0066, "step": 734930 }, { "epoch": 1.91, "learning_rate": 1.4239425995577801e-05, "loss": 0.0073, "step": 734940 }, { "epoch": 1.91, "learning_rate": 1.4235537779206336e-05, "loss": 0.0059, "step": 734950 }, { "epoch": 1.91, "learning_rate": 1.4231649562834872e-05, "loss": 0.0079, "step": 734960 }, { "epoch": 1.91, "learning_rate": 1.4227761346463407e-05, "loss": 0.0077, "step": 734970 }, { "epoch": 1.91, "learning_rate": 1.4223873130091944e-05, "loss": 0.0063, "step": 734980 }, { "epoch": 1.91, "learning_rate": 1.4219984913720477e-05, "loss": 0.0045, "step": 734990 }, { "epoch": 1.91, "learning_rate": 1.4216096697349012e-05, "loss": 0.0104, "step": 735000 }, { "epoch": 1.91, "eval_cer": 0.8816676953998133, "eval_loss": 0.004462803713977337, "eval_runtime": 108.0687, "eval_samples_per_second": 18.507, "eval_steps_per_second": 4.627, "step": 735000 }, { "epoch": 1.91, "learning_rate": 1.4212208480977548e-05, "loss": 0.0057, "step": 735010 }, { "epoch": 1.91, "learning_rate": 1.4208320264606083e-05, "loss": 0.0098, "step": 735020 }, { "epoch": 1.91, "learning_rate": 1.420443204823462e-05, "loss": 0.006, "step": 735030 }, { "epoch": 1.91, "learning_rate": 1.4200543831863155e-05, "loss": 0.01, "step": 735040 }, { "epoch": 1.91, "learning_rate": 1.419665561549169e-05, "loss": 0.0084, "step": 735050 }, { "epoch": 1.91, "learning_rate": 1.4192767399120224e-05, "loss": 0.0058, "step": 735060 }, { "epoch": 1.91, "learning_rate": 1.4188879182748761e-05, "loss": 0.0079, "step": 735070 }, { "epoch": 1.91, "learning_rate": 1.4184990966377296e-05, "loss": 0.0076, "step": 735080 }, { "epoch": 1.91, "learning_rate": 1.4181102750005832e-05, "loss": 0.007, "step": 735090 }, { "epoch": 1.91, "learning_rate": 1.4177214533634367e-05, "loss": 0.0091, "step": 735100 }, { "epoch": 1.91, "learning_rate": 1.41733263172629e-05, "loss": 0.0063, "step": 735110 }, { "epoch": 1.91, "learning_rate": 1.4169438100891437e-05, "loss": 0.0082, "step": 735120 }, { "epoch": 1.91, "learning_rate": 1.4165549884519972e-05, "loss": 0.0058, "step": 735130 }, { "epoch": 1.91, "learning_rate": 1.4161661668148508e-05, "loss": 0.0067, "step": 735140 }, { "epoch": 1.91, "learning_rate": 1.4157773451777043e-05, "loss": 0.0089, "step": 735150 }, { "epoch": 1.91, "learning_rate": 1.415388523540558e-05, "loss": 0.0073, "step": 735160 }, { "epoch": 1.91, "learning_rate": 1.4149997019034115e-05, "loss": 0.0066, "step": 735170 }, { "epoch": 1.91, "learning_rate": 1.4146108802662648e-05, "loss": 0.0079, "step": 735180 }, { "epoch": 1.91, "learning_rate": 1.4142220586291184e-05, "loss": 0.0063, "step": 735190 }, { "epoch": 1.91, "learning_rate": 1.413833236991972e-05, "loss": 0.0076, "step": 735200 }, { "epoch": 1.91, "learning_rate": 1.4134444153548256e-05, "loss": 0.0055, "step": 735210 }, { "epoch": 1.91, "learning_rate": 1.413055593717679e-05, "loss": 0.0058, "step": 735220 }, { "epoch": 1.91, "learning_rate": 1.4126667720805327e-05, "loss": 0.0077, "step": 735230 }, { "epoch": 1.91, "learning_rate": 1.412277950443386e-05, "loss": 0.0094, "step": 735240 }, { "epoch": 1.91, "learning_rate": 1.4118891288062397e-05, "loss": 0.0045, "step": 735250 }, { "epoch": 1.91, "learning_rate": 1.4115003071690932e-05, "loss": 0.0069, "step": 735260 }, { "epoch": 1.91, "learning_rate": 1.4111114855319468e-05, "loss": 0.0086, "step": 735270 }, { "epoch": 1.91, "learning_rate": 1.4107226638948003e-05, "loss": 0.008, "step": 735280 }, { "epoch": 1.91, "learning_rate": 1.410333842257654e-05, "loss": 0.0089, "step": 735290 }, { "epoch": 1.91, "learning_rate": 1.4099450206205073e-05, "loss": 0.0066, "step": 735300 }, { "epoch": 1.91, "learning_rate": 1.4095561989833608e-05, "loss": 0.0059, "step": 735310 }, { "epoch": 1.91, "learning_rate": 1.4091673773462144e-05, "loss": 0.0078, "step": 735320 }, { "epoch": 1.91, "learning_rate": 1.408778555709068e-05, "loss": 0.0084, "step": 735330 }, { "epoch": 1.91, "learning_rate": 1.4083897340719216e-05, "loss": 0.0094, "step": 735340 }, { "epoch": 1.91, "learning_rate": 1.408000912434775e-05, "loss": 0.006, "step": 735350 }, { "epoch": 1.91, "learning_rate": 1.4076120907976285e-05, "loss": 0.0072, "step": 735360 }, { "epoch": 1.91, "learning_rate": 1.407223269160482e-05, "loss": 0.0077, "step": 735370 }, { "epoch": 1.91, "learning_rate": 1.4068344475233357e-05, "loss": 0.0093, "step": 735380 }, { "epoch": 1.91, "learning_rate": 1.4064456258861892e-05, "loss": 0.005, "step": 735390 }, { "epoch": 1.91, "learning_rate": 1.4060568042490428e-05, "loss": 0.0069, "step": 735400 }, { "epoch": 1.91, "learning_rate": 1.4056679826118963e-05, "loss": 0.0058, "step": 735410 }, { "epoch": 1.91, "learning_rate": 1.4052791609747496e-05, "loss": 0.0079, "step": 735420 }, { "epoch": 1.91, "learning_rate": 1.4048903393376033e-05, "loss": 0.0056, "step": 735430 }, { "epoch": 1.91, "learning_rate": 1.4045015177004568e-05, "loss": 0.0067, "step": 735440 }, { "epoch": 1.91, "learning_rate": 1.4041126960633104e-05, "loss": 0.0073, "step": 735450 }, { "epoch": 1.91, "learning_rate": 1.4037238744261639e-05, "loss": 0.0093, "step": 735460 }, { "epoch": 1.91, "learning_rate": 1.4033350527890176e-05, "loss": 0.0091, "step": 735470 }, { "epoch": 1.91, "learning_rate": 1.402946231151871e-05, "loss": 0.0055, "step": 735480 }, { "epoch": 1.91, "learning_rate": 1.4025574095147245e-05, "loss": 0.0046, "step": 735490 }, { "epoch": 1.91, "learning_rate": 1.402168587877578e-05, "loss": 0.0085, "step": 735500 }, { "epoch": 1.91, "learning_rate": 1.4017797662404317e-05, "loss": 0.0075, "step": 735510 }, { "epoch": 1.91, "learning_rate": 1.4013909446032852e-05, "loss": 0.0083, "step": 735520 }, { "epoch": 1.91, "learning_rate": 1.4010021229661388e-05, "loss": 0.0065, "step": 735530 }, { "epoch": 1.91, "learning_rate": 1.4006133013289923e-05, "loss": 0.0059, "step": 735540 }, { "epoch": 1.91, "learning_rate": 1.4002244796918456e-05, "loss": 0.0066, "step": 735550 }, { "epoch": 1.91, "learning_rate": 1.3998356580546993e-05, "loss": 0.0066, "step": 735560 }, { "epoch": 1.91, "learning_rate": 1.3994468364175528e-05, "loss": 0.0056, "step": 735570 }, { "epoch": 1.91, "learning_rate": 1.3990580147804064e-05, "loss": 0.0062, "step": 735580 }, { "epoch": 1.91, "learning_rate": 1.3986691931432599e-05, "loss": 0.0113, "step": 735590 }, { "epoch": 1.91, "learning_rate": 1.3982803715061136e-05, "loss": 0.0092, "step": 735600 }, { "epoch": 1.91, "learning_rate": 1.3978915498689669e-05, "loss": 0.0063, "step": 735610 }, { "epoch": 1.91, "learning_rate": 1.3975027282318205e-05, "loss": 0.0065, "step": 735620 }, { "epoch": 1.91, "learning_rate": 1.397113906594674e-05, "loss": 0.008, "step": 735630 }, { "epoch": 1.91, "learning_rate": 1.3967250849575277e-05, "loss": 0.0087, "step": 735640 }, { "epoch": 1.91, "learning_rate": 1.3963362633203812e-05, "loss": 0.0071, "step": 735650 }, { "epoch": 1.91, "learning_rate": 1.3959474416832348e-05, "loss": 0.0068, "step": 735660 }, { "epoch": 1.91, "learning_rate": 1.3955586200460881e-05, "loss": 0.0071, "step": 735670 }, { "epoch": 1.91, "learning_rate": 1.3951697984089416e-05, "loss": 0.0073, "step": 735680 }, { "epoch": 1.91, "learning_rate": 1.3947809767717953e-05, "loss": 0.0059, "step": 735690 }, { "epoch": 1.91, "learning_rate": 1.3943921551346488e-05, "loss": 0.0086, "step": 735700 }, { "epoch": 1.91, "learning_rate": 1.3940033334975024e-05, "loss": 0.0077, "step": 735710 }, { "epoch": 1.91, "learning_rate": 1.3936145118603559e-05, "loss": 0.0081, "step": 735720 }, { "epoch": 1.91, "learning_rate": 1.3932256902232094e-05, "loss": 0.0079, "step": 735730 }, { "epoch": 1.91, "learning_rate": 1.3928368685860629e-05, "loss": 0.0097, "step": 735740 }, { "epoch": 1.91, "learning_rate": 1.3924480469489165e-05, "loss": 0.0058, "step": 735750 }, { "epoch": 1.91, "learning_rate": 1.39205922531177e-05, "loss": 0.0081, "step": 735760 }, { "epoch": 1.91, "learning_rate": 1.3916704036746237e-05, "loss": 0.0067, "step": 735770 }, { "epoch": 1.91, "learning_rate": 1.3912815820374772e-05, "loss": 0.0068, "step": 735780 }, { "epoch": 1.91, "learning_rate": 1.3908927604003307e-05, "loss": 0.0078, "step": 735790 }, { "epoch": 1.91, "learning_rate": 1.3905039387631841e-05, "loss": 0.0057, "step": 735800 }, { "epoch": 1.91, "learning_rate": 1.3901151171260376e-05, "loss": 0.0063, "step": 735810 }, { "epoch": 1.91, "learning_rate": 1.3897262954888913e-05, "loss": 0.0072, "step": 735820 }, { "epoch": 1.91, "learning_rate": 1.3893374738517448e-05, "loss": 0.0063, "step": 735830 }, { "epoch": 1.91, "learning_rate": 1.3889486522145984e-05, "loss": 0.0088, "step": 735840 }, { "epoch": 1.91, "learning_rate": 1.3885598305774519e-05, "loss": 0.0097, "step": 735850 }, { "epoch": 1.91, "learning_rate": 1.3881710089403052e-05, "loss": 0.0079, "step": 735860 }, { "epoch": 1.91, "learning_rate": 1.3877821873031589e-05, "loss": 0.0065, "step": 735870 }, { "epoch": 1.91, "learning_rate": 1.3873933656660124e-05, "loss": 0.0093, "step": 735880 }, { "epoch": 1.91, "learning_rate": 1.387004544028866e-05, "loss": 0.0073, "step": 735890 }, { "epoch": 1.91, "learning_rate": 1.3866157223917195e-05, "loss": 0.0091, "step": 735900 }, { "epoch": 1.91, "learning_rate": 1.3862269007545732e-05, "loss": 0.0066, "step": 735910 }, { "epoch": 1.91, "learning_rate": 1.3858380791174265e-05, "loss": 0.0048, "step": 735920 }, { "epoch": 1.91, "learning_rate": 1.3854492574802801e-05, "loss": 0.0065, "step": 735930 }, { "epoch": 1.91, "learning_rate": 1.3850604358431336e-05, "loss": 0.0068, "step": 735940 }, { "epoch": 1.91, "learning_rate": 1.3846716142059873e-05, "loss": 0.0091, "step": 735950 }, { "epoch": 1.91, "learning_rate": 1.3842827925688408e-05, "loss": 0.0064, "step": 735960 }, { "epoch": 1.91, "learning_rate": 1.3838939709316944e-05, "loss": 0.0064, "step": 735970 }, { "epoch": 1.91, "learning_rate": 1.3835051492945477e-05, "loss": 0.0082, "step": 735980 }, { "epoch": 1.91, "learning_rate": 1.3831163276574012e-05, "loss": 0.0101, "step": 735990 }, { "epoch": 1.91, "learning_rate": 1.3827275060202549e-05, "loss": 0.0074, "step": 736000 }, { "epoch": 1.91, "eval_cer": 0.8816550986674057, "eval_loss": 0.004494575317949057, "eval_runtime": 107.9239, "eval_samples_per_second": 18.532, "eval_steps_per_second": 4.633, "step": 736000 }, { "epoch": 1.91, "learning_rate": 1.3823386843831084e-05, "loss": 0.0083, "step": 736010 }, { "epoch": 1.91, "learning_rate": 1.381949862745962e-05, "loss": 0.0069, "step": 736020 }, { "epoch": 1.91, "learning_rate": 1.3815610411088155e-05, "loss": 0.0076, "step": 736030 }, { "epoch": 1.91, "learning_rate": 1.381172219471669e-05, "loss": 0.008, "step": 736040 }, { "epoch": 1.91, "learning_rate": 1.3807833978345225e-05, "loss": 0.0088, "step": 736050 }, { "epoch": 1.91, "learning_rate": 1.3803945761973761e-05, "loss": 0.0073, "step": 736060 }, { "epoch": 1.91, "learning_rate": 1.3800057545602296e-05, "loss": 0.0077, "step": 736070 }, { "epoch": 1.91, "learning_rate": 1.3796169329230833e-05, "loss": 0.0084, "step": 736080 }, { "epoch": 1.91, "learning_rate": 1.3792281112859368e-05, "loss": 0.0082, "step": 736090 }, { "epoch": 1.91, "learning_rate": 1.3788392896487904e-05, "loss": 0.0047, "step": 736100 }, { "epoch": 1.91, "learning_rate": 1.3784504680116437e-05, "loss": 0.0073, "step": 736110 }, { "epoch": 1.91, "learning_rate": 1.3780616463744972e-05, "loss": 0.0079, "step": 736120 }, { "epoch": 1.91, "learning_rate": 1.3776728247373509e-05, "loss": 0.0066, "step": 736130 }, { "epoch": 1.91, "learning_rate": 1.3772840031002044e-05, "loss": 0.0067, "step": 736140 }, { "epoch": 1.91, "learning_rate": 1.376895181463058e-05, "loss": 0.0061, "step": 736150 }, { "epoch": 1.91, "learning_rate": 1.3765063598259115e-05, "loss": 0.0055, "step": 736160 }, { "epoch": 1.91, "learning_rate": 1.376117538188765e-05, "loss": 0.0085, "step": 736170 }, { "epoch": 1.91, "learning_rate": 1.3757287165516185e-05, "loss": 0.0096, "step": 736180 }, { "epoch": 1.91, "learning_rate": 1.3753398949144721e-05, "loss": 0.0099, "step": 736190 }, { "epoch": 1.91, "learning_rate": 1.3749510732773256e-05, "loss": 0.0087, "step": 736200 }, { "epoch": 1.91, "learning_rate": 1.3745622516401793e-05, "loss": 0.0071, "step": 736210 }, { "epoch": 1.91, "learning_rate": 1.3741734300030328e-05, "loss": 0.0087, "step": 736220 }, { "epoch": 1.91, "learning_rate": 1.373784608365886e-05, "loss": 0.0081, "step": 736230 }, { "epoch": 1.91, "learning_rate": 1.3733957867287397e-05, "loss": 0.0075, "step": 736240 }, { "epoch": 1.91, "learning_rate": 1.3730069650915932e-05, "loss": 0.0071, "step": 736250 }, { "epoch": 1.91, "learning_rate": 1.3726181434544469e-05, "loss": 0.0068, "step": 736260 }, { "epoch": 1.91, "learning_rate": 1.3722293218173004e-05, "loss": 0.0076, "step": 736270 }, { "epoch": 1.91, "learning_rate": 1.371840500180154e-05, "loss": 0.0067, "step": 736280 }, { "epoch": 1.91, "learning_rate": 1.3714516785430073e-05, "loss": 0.007, "step": 736290 }, { "epoch": 1.91, "learning_rate": 1.371062856905861e-05, "loss": 0.0063, "step": 736300 }, { "epoch": 1.91, "learning_rate": 1.3706740352687145e-05, "loss": 0.0052, "step": 736310 }, { "epoch": 1.91, "learning_rate": 1.3702852136315681e-05, "loss": 0.0056, "step": 736320 }, { "epoch": 1.91, "learning_rate": 1.3698963919944216e-05, "loss": 0.0052, "step": 736330 }, { "epoch": 1.91, "learning_rate": 1.3695075703572753e-05, "loss": 0.0068, "step": 736340 }, { "epoch": 1.91, "learning_rate": 1.3691187487201286e-05, "loss": 0.0057, "step": 736350 }, { "epoch": 1.91, "learning_rate": 1.368729927082982e-05, "loss": 0.0061, "step": 736360 }, { "epoch": 1.91, "learning_rate": 1.3683411054458357e-05, "loss": 0.0073, "step": 736370 }, { "epoch": 1.91, "learning_rate": 1.3679522838086892e-05, "loss": 0.0052, "step": 736380 }, { "epoch": 1.91, "learning_rate": 1.3675634621715429e-05, "loss": 0.0054, "step": 736390 }, { "epoch": 1.91, "learning_rate": 1.3671746405343964e-05, "loss": 0.008, "step": 736400 }, { "epoch": 1.91, "learning_rate": 1.36678581889725e-05, "loss": 0.0049, "step": 736410 }, { "epoch": 1.91, "learning_rate": 1.3663969972601033e-05, "loss": 0.0086, "step": 736420 }, { "epoch": 1.91, "learning_rate": 1.366008175622957e-05, "loss": 0.0064, "step": 736430 }, { "epoch": 1.91, "learning_rate": 1.3656193539858105e-05, "loss": 0.0063, "step": 736440 }, { "epoch": 1.91, "learning_rate": 1.3652305323486641e-05, "loss": 0.0074, "step": 736450 }, { "epoch": 1.91, "learning_rate": 1.3648417107115176e-05, "loss": 0.0085, "step": 736460 }, { "epoch": 1.91, "learning_rate": 1.3644528890743713e-05, "loss": 0.0088, "step": 736470 }, { "epoch": 1.91, "learning_rate": 1.3640640674372246e-05, "loss": 0.0065, "step": 736480 }, { "epoch": 1.91, "learning_rate": 1.363675245800078e-05, "loss": 0.0082, "step": 736490 }, { "epoch": 1.91, "learning_rate": 1.3632864241629317e-05, "loss": 0.006, "step": 736500 }, { "epoch": 1.91, "learning_rate": 1.3628976025257852e-05, "loss": 0.009, "step": 736510 }, { "epoch": 1.91, "learning_rate": 1.3625087808886389e-05, "loss": 0.0078, "step": 736520 }, { "epoch": 1.91, "learning_rate": 1.3621199592514924e-05, "loss": 0.0068, "step": 736530 }, { "epoch": 1.91, "learning_rate": 1.3617311376143458e-05, "loss": 0.0082, "step": 736540 }, { "epoch": 1.91, "learning_rate": 1.3613423159771993e-05, "loss": 0.0061, "step": 736550 }, { "epoch": 1.91, "learning_rate": 1.3609534943400528e-05, "loss": 0.0043, "step": 736560 }, { "epoch": 1.91, "learning_rate": 1.3605646727029065e-05, "loss": 0.0066, "step": 736570 }, { "epoch": 1.91, "learning_rate": 1.36017585106576e-05, "loss": 0.0056, "step": 736580 }, { "epoch": 1.91, "learning_rate": 1.3597870294286136e-05, "loss": 0.0084, "step": 736590 }, { "epoch": 1.91, "learning_rate": 1.359398207791467e-05, "loss": 0.0083, "step": 736600 }, { "epoch": 1.91, "learning_rate": 1.3590093861543206e-05, "loss": 0.0071, "step": 736610 }, { "epoch": 1.91, "learning_rate": 1.358620564517174e-05, "loss": 0.0071, "step": 736620 }, { "epoch": 1.91, "learning_rate": 1.3582317428800277e-05, "loss": 0.0054, "step": 736630 }, { "epoch": 1.91, "learning_rate": 1.3578429212428812e-05, "loss": 0.0057, "step": 736640 }, { "epoch": 1.91, "learning_rate": 1.3574540996057349e-05, "loss": 0.0081, "step": 736650 }, { "epoch": 1.91, "learning_rate": 1.3570652779685882e-05, "loss": 0.0077, "step": 736660 }, { "epoch": 1.91, "learning_rate": 1.3566764563314417e-05, "loss": 0.0057, "step": 736670 }, { "epoch": 1.91, "learning_rate": 1.3562876346942953e-05, "loss": 0.0069, "step": 736680 }, { "epoch": 1.91, "learning_rate": 1.3558988130571488e-05, "loss": 0.0074, "step": 736690 }, { "epoch": 1.91, "learning_rate": 1.3555099914200025e-05, "loss": 0.0077, "step": 736700 }, { "epoch": 1.91, "learning_rate": 1.355121169782856e-05, "loss": 0.006, "step": 736710 }, { "epoch": 1.91, "learning_rate": 1.3547323481457096e-05, "loss": 0.0055, "step": 736720 }, { "epoch": 1.91, "learning_rate": 1.354343526508563e-05, "loss": 0.0055, "step": 736730 }, { "epoch": 1.91, "learning_rate": 1.3539547048714166e-05, "loss": 0.0067, "step": 736740 }, { "epoch": 1.91, "learning_rate": 1.35356588323427e-05, "loss": 0.0107, "step": 736750 }, { "epoch": 1.91, "learning_rate": 1.3531770615971237e-05, "loss": 0.0068, "step": 736760 }, { "epoch": 1.91, "learning_rate": 1.3527882399599772e-05, "loss": 0.007, "step": 736770 }, { "epoch": 1.91, "learning_rate": 1.3523994183228309e-05, "loss": 0.0066, "step": 736780 }, { "epoch": 1.91, "learning_rate": 1.3520105966856842e-05, "loss": 0.0059, "step": 736790 }, { "epoch": 1.91, "learning_rate": 1.3516217750485377e-05, "loss": 0.0089, "step": 736800 }, { "epoch": 1.91, "learning_rate": 1.3512329534113913e-05, "loss": 0.0072, "step": 736810 }, { "epoch": 1.91, "learning_rate": 1.3508441317742448e-05, "loss": 0.0082, "step": 736820 }, { "epoch": 1.91, "learning_rate": 1.3504553101370985e-05, "loss": 0.0113, "step": 736830 }, { "epoch": 1.91, "learning_rate": 1.350066488499952e-05, "loss": 0.0083, "step": 736840 }, { "epoch": 1.91, "learning_rate": 1.3496776668628054e-05, "loss": 0.0068, "step": 736850 }, { "epoch": 1.91, "learning_rate": 1.349288845225659e-05, "loss": 0.0045, "step": 736860 }, { "epoch": 1.91, "learning_rate": 1.3489000235885126e-05, "loss": 0.0065, "step": 736870 }, { "epoch": 1.91, "learning_rate": 1.348511201951366e-05, "loss": 0.0058, "step": 736880 }, { "epoch": 1.91, "learning_rate": 1.3481223803142197e-05, "loss": 0.0064, "step": 736890 }, { "epoch": 1.91, "learning_rate": 1.3477335586770732e-05, "loss": 0.0083, "step": 736900 }, { "epoch": 1.91, "learning_rate": 1.3473447370399265e-05, "loss": 0.0071, "step": 736910 }, { "epoch": 1.91, "learning_rate": 1.3469559154027802e-05, "loss": 0.0073, "step": 736920 }, { "epoch": 1.91, "learning_rate": 1.3465670937656337e-05, "loss": 0.0075, "step": 736930 }, { "epoch": 1.91, "learning_rate": 1.3461782721284873e-05, "loss": 0.0111, "step": 736940 }, { "epoch": 1.91, "learning_rate": 1.3457894504913408e-05, "loss": 0.0068, "step": 736950 }, { "epoch": 1.91, "learning_rate": 1.3454006288541945e-05, "loss": 0.0067, "step": 736960 }, { "epoch": 1.91, "learning_rate": 1.3450118072170478e-05, "loss": 0.0078, "step": 736970 }, { "epoch": 1.91, "learning_rate": 1.3446229855799014e-05, "loss": 0.005, "step": 736980 }, { "epoch": 1.91, "learning_rate": 1.344234163942755e-05, "loss": 0.0102, "step": 736990 }, { "epoch": 1.91, "learning_rate": 1.3438453423056086e-05, "loss": 0.0076, "step": 737000 }, { "epoch": 1.91, "eval_cer": 0.8816620968520765, "eval_loss": 0.004480063449591398, "eval_runtime": 107.9366, "eval_samples_per_second": 18.529, "eval_steps_per_second": 4.632, "step": 737000 }, { "epoch": 1.91, "learning_rate": 1.343456520668462e-05, "loss": 0.0063, "step": 737010 }, { "epoch": 1.91, "learning_rate": 1.3430676990313157e-05, "loss": 0.0056, "step": 737020 }, { "epoch": 1.91, "learning_rate": 1.3426788773941692e-05, "loss": 0.0078, "step": 737030 }, { "epoch": 1.91, "learning_rate": 1.3422900557570225e-05, "loss": 0.0046, "step": 737040 }, { "epoch": 1.91, "learning_rate": 1.3419012341198762e-05, "loss": 0.0082, "step": 737050 }, { "epoch": 1.91, "learning_rate": 1.3415124124827297e-05, "loss": 0.0084, "step": 737060 }, { "epoch": 1.91, "learning_rate": 1.3411235908455833e-05, "loss": 0.0127, "step": 737070 }, { "epoch": 1.91, "learning_rate": 1.3407347692084368e-05, "loss": 0.0067, "step": 737080 }, { "epoch": 1.91, "learning_rate": 1.3403459475712905e-05, "loss": 0.0075, "step": 737090 }, { "epoch": 1.91, "learning_rate": 1.3399571259341438e-05, "loss": 0.0092, "step": 737100 }, { "epoch": 1.91, "learning_rate": 1.3395683042969974e-05, "loss": 0.006, "step": 737110 }, { "epoch": 1.91, "learning_rate": 1.339179482659851e-05, "loss": 0.006, "step": 737120 }, { "epoch": 1.91, "learning_rate": 1.3387906610227046e-05, "loss": 0.0054, "step": 737130 }, { "epoch": 1.91, "learning_rate": 1.338401839385558e-05, "loss": 0.0083, "step": 737140 }, { "epoch": 1.91, "learning_rate": 1.3380130177484117e-05, "loss": 0.0059, "step": 737150 }, { "epoch": 1.91, "learning_rate": 1.337624196111265e-05, "loss": 0.0052, "step": 737160 }, { "epoch": 1.91, "learning_rate": 1.3372353744741185e-05, "loss": 0.0074, "step": 737170 }, { "epoch": 1.91, "learning_rate": 1.3368465528369722e-05, "loss": 0.0053, "step": 737180 }, { "epoch": 1.91, "learning_rate": 1.3364577311998257e-05, "loss": 0.007, "step": 737190 }, { "epoch": 1.91, "learning_rate": 1.3360689095626793e-05, "loss": 0.0084, "step": 737200 }, { "epoch": 1.91, "learning_rate": 1.3356800879255328e-05, "loss": 0.006, "step": 737210 }, { "epoch": 1.91, "learning_rate": 1.3352912662883863e-05, "loss": 0.0068, "step": 737220 }, { "epoch": 1.91, "learning_rate": 1.3349024446512398e-05, "loss": 0.0093, "step": 737230 }, { "epoch": 1.91, "learning_rate": 1.3345136230140933e-05, "loss": 0.0071, "step": 737240 }, { "epoch": 1.91, "learning_rate": 1.3341248013769469e-05, "loss": 0.005, "step": 737250 }, { "epoch": 1.91, "learning_rate": 1.3337359797398004e-05, "loss": 0.0072, "step": 737260 }, { "epoch": 1.91, "learning_rate": 1.333347158102654e-05, "loss": 0.0073, "step": 737270 }, { "epoch": 1.91, "learning_rate": 1.3329583364655074e-05, "loss": 0.0067, "step": 737280 }, { "epoch": 1.91, "learning_rate": 1.332569514828361e-05, "loss": 0.0071, "step": 737290 }, { "epoch": 1.91, "learning_rate": 1.3321806931912145e-05, "loss": 0.0107, "step": 737300 }, { "epoch": 1.91, "learning_rate": 1.3317918715540682e-05, "loss": 0.0114, "step": 737310 }, { "epoch": 1.91, "learning_rate": 1.3314030499169217e-05, "loss": 0.0082, "step": 737320 }, { "epoch": 1.91, "learning_rate": 1.3310142282797753e-05, "loss": 0.0057, "step": 737330 }, { "epoch": 1.91, "learning_rate": 1.3306254066426288e-05, "loss": 0.0092, "step": 737340 }, { "epoch": 1.91, "learning_rate": 1.3302365850054821e-05, "loss": 0.0069, "step": 737350 }, { "epoch": 1.91, "learning_rate": 1.3298477633683358e-05, "loss": 0.0077, "step": 737360 }, { "epoch": 1.91, "learning_rate": 1.3294589417311893e-05, "loss": 0.0063, "step": 737370 }, { "epoch": 1.91, "learning_rate": 1.3290701200940429e-05, "loss": 0.01, "step": 737380 }, { "epoch": 1.91, "learning_rate": 1.3286812984568964e-05, "loss": 0.0055, "step": 737390 }, { "epoch": 1.91, "learning_rate": 1.32829247681975e-05, "loss": 0.0063, "step": 737400 }, { "epoch": 1.91, "learning_rate": 1.3279036551826034e-05, "loss": 0.0075, "step": 737410 }, { "epoch": 1.91, "learning_rate": 1.327514833545457e-05, "loss": 0.0065, "step": 737420 }, { "epoch": 1.91, "learning_rate": 1.3271260119083105e-05, "loss": 0.0075, "step": 737430 }, { "epoch": 1.91, "learning_rate": 1.3267371902711642e-05, "loss": 0.0087, "step": 737440 }, { "epoch": 1.91, "learning_rate": 1.3263483686340177e-05, "loss": 0.0061, "step": 737450 }, { "epoch": 1.91, "learning_rate": 1.3259595469968713e-05, "loss": 0.0088, "step": 737460 }, { "epoch": 1.91, "learning_rate": 1.3255707253597246e-05, "loss": 0.0071, "step": 737470 }, { "epoch": 1.91, "learning_rate": 1.3251819037225781e-05, "loss": 0.0057, "step": 737480 }, { "epoch": 1.91, "learning_rate": 1.3247930820854318e-05, "loss": 0.006, "step": 737490 }, { "epoch": 1.91, "learning_rate": 1.3244042604482853e-05, "loss": 0.0072, "step": 737500 }, { "epoch": 1.91, "learning_rate": 1.3240154388111389e-05, "loss": 0.0053, "step": 737510 }, { "epoch": 1.91, "learning_rate": 1.3236266171739924e-05, "loss": 0.0059, "step": 737520 }, { "epoch": 1.91, "learning_rate": 1.3232377955368459e-05, "loss": 0.0061, "step": 737530 }, { "epoch": 1.91, "learning_rate": 1.3228489738996994e-05, "loss": 0.009, "step": 737540 }, { "epoch": 1.91, "learning_rate": 1.322460152262553e-05, "loss": 0.007, "step": 737550 }, { "epoch": 1.91, "learning_rate": 1.3220713306254065e-05, "loss": 0.0073, "step": 737560 }, { "epoch": 1.91, "learning_rate": 1.3216825089882602e-05, "loss": 0.007, "step": 737570 }, { "epoch": 1.91, "learning_rate": 1.3212936873511137e-05, "loss": 0.0082, "step": 737580 }, { "epoch": 1.91, "learning_rate": 1.320904865713967e-05, "loss": 0.0076, "step": 737590 }, { "epoch": 1.91, "learning_rate": 1.3205160440768206e-05, "loss": 0.0072, "step": 737600 }, { "epoch": 1.91, "learning_rate": 1.3201272224396741e-05, "loss": 0.0071, "step": 737610 }, { "epoch": 1.91, "learning_rate": 1.3197384008025278e-05, "loss": 0.0073, "step": 737620 }, { "epoch": 1.91, "learning_rate": 1.3193495791653813e-05, "loss": 0.011, "step": 737630 }, { "epoch": 1.91, "learning_rate": 1.3189607575282349e-05, "loss": 0.0057, "step": 737640 }, { "epoch": 1.91, "learning_rate": 1.3185719358910884e-05, "loss": 0.0059, "step": 737650 }, { "epoch": 1.91, "learning_rate": 1.3181831142539419e-05, "loss": 0.0077, "step": 737660 }, { "epoch": 1.91, "learning_rate": 1.3177942926167954e-05, "loss": 0.0092, "step": 737670 }, { "epoch": 1.91, "learning_rate": 1.317405470979649e-05, "loss": 0.0062, "step": 737680 }, { "epoch": 1.91, "learning_rate": 1.3170166493425025e-05, "loss": 0.0077, "step": 737690 }, { "epoch": 1.91, "learning_rate": 1.3166278277053562e-05, "loss": 0.0072, "step": 737700 }, { "epoch": 1.91, "learning_rate": 1.3162390060682096e-05, "loss": 0.008, "step": 737710 }, { "epoch": 1.91, "learning_rate": 1.315850184431063e-05, "loss": 0.0049, "step": 737720 }, { "epoch": 1.91, "learning_rate": 1.3154613627939166e-05, "loss": 0.0049, "step": 737730 }, { "epoch": 1.91, "learning_rate": 1.3150725411567701e-05, "loss": 0.0078, "step": 737740 }, { "epoch": 1.91, "learning_rate": 1.3146837195196238e-05, "loss": 0.006, "step": 737750 }, { "epoch": 1.91, "learning_rate": 1.3142948978824772e-05, "loss": 0.0063, "step": 737760 }, { "epoch": 1.91, "learning_rate": 1.3139060762453309e-05, "loss": 0.0099, "step": 737770 }, { "epoch": 1.91, "learning_rate": 1.3135172546081842e-05, "loss": 0.0078, "step": 737780 }, { "epoch": 1.91, "learning_rate": 1.3131284329710379e-05, "loss": 0.0097, "step": 737790 }, { "epoch": 1.91, "learning_rate": 1.3127396113338914e-05, "loss": 0.0058, "step": 737800 }, { "epoch": 1.91, "learning_rate": 1.312350789696745e-05, "loss": 0.0079, "step": 737810 }, { "epoch": 1.91, "learning_rate": 1.3119619680595985e-05, "loss": 0.0089, "step": 737820 }, { "epoch": 1.91, "learning_rate": 1.3115731464224522e-05, "loss": 0.009, "step": 737830 }, { "epoch": 1.91, "learning_rate": 1.3111843247853055e-05, "loss": 0.0056, "step": 737840 }, { "epoch": 1.91, "learning_rate": 1.310795503148159e-05, "loss": 0.0078, "step": 737850 }, { "epoch": 1.91, "learning_rate": 1.3104066815110126e-05, "loss": 0.0048, "step": 737860 }, { "epoch": 1.91, "learning_rate": 1.3100178598738661e-05, "loss": 0.008, "step": 737870 }, { "epoch": 1.91, "learning_rate": 1.3096290382367198e-05, "loss": 0.007, "step": 737880 }, { "epoch": 1.91, "learning_rate": 1.3092402165995732e-05, "loss": 0.0065, "step": 737890 }, { "epoch": 1.91, "learning_rate": 1.3088513949624269e-05, "loss": 0.006, "step": 737900 }, { "epoch": 1.91, "learning_rate": 1.3084625733252802e-05, "loss": 0.0093, "step": 737910 }, { "epoch": 1.91, "learning_rate": 1.3080737516881339e-05, "loss": 0.0065, "step": 737920 }, { "epoch": 1.91, "learning_rate": 1.3076849300509874e-05, "loss": 0.0101, "step": 737930 }, { "epoch": 1.91, "learning_rate": 1.3072961084138408e-05, "loss": 0.0096, "step": 737940 }, { "epoch": 1.91, "learning_rate": 1.3069072867766945e-05, "loss": 0.0059, "step": 737950 }, { "epoch": 1.91, "learning_rate": 1.306518465139548e-05, "loss": 0.0077, "step": 737960 }, { "epoch": 1.91, "learning_rate": 1.3061296435024015e-05, "loss": 0.0067, "step": 737970 }, { "epoch": 1.91, "learning_rate": 1.305740821865255e-05, "loss": 0.0067, "step": 737980 }, { "epoch": 1.91, "learning_rate": 1.3053520002281086e-05, "loss": 0.0058, "step": 737990 }, { "epoch": 1.91, "learning_rate": 1.3049631785909621e-05, "loss": 0.0075, "step": 738000 }, { "epoch": 1.91, "eval_cer": 0.8816536990304715, "eval_loss": 0.004501659423112869, "eval_runtime": 107.8766, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 738000 }, { "epoch": 1.91, "learning_rate": 1.3045743569538158e-05, "loss": 0.0072, "step": 738010 }, { "epoch": 1.91, "learning_rate": 1.3041855353166692e-05, "loss": 0.0074, "step": 738020 }, { "epoch": 1.91, "learning_rate": 1.3037967136795226e-05, "loss": 0.0069, "step": 738030 }, { "epoch": 1.91, "learning_rate": 1.3034078920423762e-05, "loss": 0.0073, "step": 738040 }, { "epoch": 1.91, "learning_rate": 1.3030190704052297e-05, "loss": 0.0061, "step": 738050 }, { "epoch": 1.91, "learning_rate": 1.3026302487680834e-05, "loss": 0.0071, "step": 738060 }, { "epoch": 1.91, "learning_rate": 1.3022414271309368e-05, "loss": 0.0055, "step": 738070 }, { "epoch": 1.91, "learning_rate": 1.3018526054937905e-05, "loss": 0.0069, "step": 738080 }, { "epoch": 1.91, "learning_rate": 1.3014637838566438e-05, "loss": 0.0072, "step": 738090 }, { "epoch": 1.91, "learning_rate": 1.3010749622194975e-05, "loss": 0.0099, "step": 738100 }, { "epoch": 1.91, "learning_rate": 1.300686140582351e-05, "loss": 0.0075, "step": 738110 }, { "epoch": 1.91, "learning_rate": 1.3002973189452046e-05, "loss": 0.0074, "step": 738120 }, { "epoch": 1.91, "learning_rate": 1.2999084973080581e-05, "loss": 0.0085, "step": 738130 }, { "epoch": 1.91, "learning_rate": 1.2995196756709118e-05, "loss": 0.0059, "step": 738140 }, { "epoch": 1.91, "learning_rate": 1.299130854033765e-05, "loss": 0.0063, "step": 738150 }, { "epoch": 1.91, "learning_rate": 1.2987420323966186e-05, "loss": 0.0128, "step": 738160 }, { "epoch": 1.91, "learning_rate": 1.2983532107594722e-05, "loss": 0.0059, "step": 738170 }, { "epoch": 1.91, "learning_rate": 1.2979643891223257e-05, "loss": 0.0061, "step": 738180 }, { "epoch": 1.91, "learning_rate": 1.2975755674851794e-05, "loss": 0.0072, "step": 738190 }, { "epoch": 1.91, "learning_rate": 1.2971867458480328e-05, "loss": 0.0053, "step": 738200 }, { "epoch": 1.91, "learning_rate": 1.2967979242108865e-05, "loss": 0.0078, "step": 738210 }, { "epoch": 1.91, "learning_rate": 1.2964091025737398e-05, "loss": 0.0099, "step": 738220 }, { "epoch": 1.91, "learning_rate": 1.2960202809365935e-05, "loss": 0.0063, "step": 738230 }, { "epoch": 1.91, "learning_rate": 1.295631459299447e-05, "loss": 0.0069, "step": 738240 }, { "epoch": 1.91, "learning_rate": 1.2952426376623006e-05, "loss": 0.006, "step": 738250 }, { "epoch": 1.91, "learning_rate": 1.2948538160251541e-05, "loss": 0.0075, "step": 738260 }, { "epoch": 1.91, "learning_rate": 1.2944649943880078e-05, "loss": 0.0069, "step": 738270 }, { "epoch": 1.91, "learning_rate": 1.294076172750861e-05, "loss": 0.0087, "step": 738280 }, { "epoch": 1.91, "learning_rate": 1.2936873511137146e-05, "loss": 0.0071, "step": 738290 }, { "epoch": 1.91, "learning_rate": 1.2932985294765682e-05, "loss": 0.006, "step": 738300 }, { "epoch": 1.91, "learning_rate": 1.2929097078394217e-05, "loss": 0.0054, "step": 738310 }, { "epoch": 1.91, "learning_rate": 1.2925208862022754e-05, "loss": 0.0049, "step": 738320 }, { "epoch": 1.91, "learning_rate": 1.2921320645651288e-05, "loss": 0.0061, "step": 738330 }, { "epoch": 1.91, "learning_rate": 1.2917432429279823e-05, "loss": 0.0082, "step": 738340 }, { "epoch": 1.91, "learning_rate": 1.2913544212908358e-05, "loss": 0.0102, "step": 738350 }, { "epoch": 1.91, "learning_rate": 1.2909655996536895e-05, "loss": 0.0066, "step": 738360 }, { "epoch": 1.91, "learning_rate": 1.290576778016543e-05, "loss": 0.008, "step": 738370 }, { "epoch": 1.91, "learning_rate": 1.2901879563793966e-05, "loss": 0.0073, "step": 738380 }, { "epoch": 1.91, "learning_rate": 1.2897991347422501e-05, "loss": 0.0069, "step": 738390 }, { "epoch": 1.91, "learning_rate": 1.2894103131051034e-05, "loss": 0.0087, "step": 738400 }, { "epoch": 1.91, "learning_rate": 1.289021491467957e-05, "loss": 0.0067, "step": 738410 }, { "epoch": 1.91, "learning_rate": 1.2886326698308106e-05, "loss": 0.0068, "step": 738420 }, { "epoch": 1.91, "learning_rate": 1.2882438481936642e-05, "loss": 0.0064, "step": 738430 }, { "epoch": 1.91, "learning_rate": 1.2878550265565177e-05, "loss": 0.007, "step": 738440 }, { "epoch": 1.91, "learning_rate": 1.2874662049193714e-05, "loss": 0.0056, "step": 738450 }, { "epoch": 1.91, "learning_rate": 1.2870773832822247e-05, "loss": 0.0058, "step": 738460 }, { "epoch": 1.91, "learning_rate": 1.2866885616450783e-05, "loss": 0.0071, "step": 738470 }, { "epoch": 1.91, "learning_rate": 1.2862997400079318e-05, "loss": 0.0071, "step": 738480 }, { "epoch": 1.91, "learning_rate": 1.2859109183707855e-05, "loss": 0.0065, "step": 738490 }, { "epoch": 1.91, "learning_rate": 1.285522096733639e-05, "loss": 0.0057, "step": 738500 }, { "epoch": 1.91, "learning_rate": 1.2851332750964926e-05, "loss": 0.0093, "step": 738510 }, { "epoch": 1.91, "learning_rate": 1.2847444534593461e-05, "loss": 0.0053, "step": 738520 }, { "epoch": 1.91, "learning_rate": 1.2843556318221994e-05, "loss": 0.0089, "step": 738530 }, { "epoch": 1.91, "learning_rate": 1.283966810185053e-05, "loss": 0.0077, "step": 738540 }, { "epoch": 1.91, "learning_rate": 1.2835779885479066e-05, "loss": 0.0054, "step": 738550 }, { "epoch": 1.91, "learning_rate": 1.2831891669107602e-05, "loss": 0.0085, "step": 738560 }, { "epoch": 1.91, "learning_rate": 1.2828003452736137e-05, "loss": 0.0073, "step": 738570 }, { "epoch": 1.91, "learning_rate": 1.2824115236364673e-05, "loss": 0.0065, "step": 738580 }, { "epoch": 1.91, "learning_rate": 1.2820227019993207e-05, "loss": 0.0071, "step": 738590 }, { "epoch": 1.91, "learning_rate": 1.2816338803621743e-05, "loss": 0.0087, "step": 738600 }, { "epoch": 1.91, "learning_rate": 1.2812450587250278e-05, "loss": 0.0076, "step": 738610 }, { "epoch": 1.91, "learning_rate": 1.2808562370878813e-05, "loss": 0.0051, "step": 738620 }, { "epoch": 1.91, "learning_rate": 1.280467415450735e-05, "loss": 0.0083, "step": 738630 }, { "epoch": 1.91, "learning_rate": 1.2800785938135884e-05, "loss": 0.0061, "step": 738640 }, { "epoch": 1.91, "learning_rate": 1.279689772176442e-05, "loss": 0.0079, "step": 738650 }, { "epoch": 1.91, "learning_rate": 1.2793009505392954e-05, "loss": 0.0062, "step": 738660 }, { "epoch": 1.91, "learning_rate": 1.278912128902149e-05, "loss": 0.0057, "step": 738670 }, { "epoch": 1.91, "learning_rate": 1.2785233072650025e-05, "loss": 0.0054, "step": 738680 }, { "epoch": 1.91, "learning_rate": 1.2781344856278562e-05, "loss": 0.0074, "step": 738690 }, { "epoch": 1.91, "learning_rate": 1.2777456639907097e-05, "loss": 0.0067, "step": 738700 }, { "epoch": 1.91, "learning_rate": 1.277356842353563e-05, "loss": 0.0082, "step": 738710 }, { "epoch": 1.91, "learning_rate": 1.2769680207164167e-05, "loss": 0.0049, "step": 738720 }, { "epoch": 1.91, "learning_rate": 1.2765791990792701e-05, "loss": 0.0065, "step": 738730 }, { "epoch": 1.91, "learning_rate": 1.2761903774421238e-05, "loss": 0.0078, "step": 738740 }, { "epoch": 1.91, "learning_rate": 1.2758015558049773e-05, "loss": 0.0077, "step": 738750 }, { "epoch": 1.91, "learning_rate": 1.275412734167831e-05, "loss": 0.0096, "step": 738760 }, { "epoch": 1.91, "learning_rate": 1.2750239125306843e-05, "loss": 0.0069, "step": 738770 }, { "epoch": 1.92, "learning_rate": 1.274635090893538e-05, "loss": 0.0056, "step": 738780 }, { "epoch": 1.92, "learning_rate": 1.2742462692563914e-05, "loss": 0.0055, "step": 738790 }, { "epoch": 1.92, "learning_rate": 1.273857447619245e-05, "loss": 0.007, "step": 738800 }, { "epoch": 1.92, "learning_rate": 1.2734686259820985e-05, "loss": 0.0078, "step": 738810 }, { "epoch": 1.92, "learning_rate": 1.2730798043449522e-05, "loss": 0.007, "step": 738820 }, { "epoch": 1.92, "learning_rate": 1.2726909827078057e-05, "loss": 0.0064, "step": 738830 }, { "epoch": 1.92, "learning_rate": 1.272302161070659e-05, "loss": 0.0085, "step": 738840 }, { "epoch": 1.92, "learning_rate": 1.2719133394335127e-05, "loss": 0.0091, "step": 738850 }, { "epoch": 1.92, "learning_rate": 1.2715245177963661e-05, "loss": 0.0074, "step": 738860 }, { "epoch": 1.92, "learning_rate": 1.2711356961592198e-05, "loss": 0.0058, "step": 738870 }, { "epoch": 1.92, "learning_rate": 1.2707468745220733e-05, "loss": 0.0099, "step": 738880 }, { "epoch": 1.92, "learning_rate": 1.270358052884927e-05, "loss": 0.0079, "step": 738890 }, { "epoch": 1.92, "learning_rate": 1.2699692312477803e-05, "loss": 0.0053, "step": 738900 }, { "epoch": 1.92, "learning_rate": 1.269580409610634e-05, "loss": 0.0061, "step": 738910 }, { "epoch": 1.92, "learning_rate": 1.2691915879734874e-05, "loss": 0.006, "step": 738920 }, { "epoch": 1.92, "learning_rate": 1.268802766336341e-05, "loss": 0.01, "step": 738930 }, { "epoch": 1.92, "learning_rate": 1.2684139446991945e-05, "loss": 0.0073, "step": 738940 }, { "epoch": 1.92, "learning_rate": 1.2680251230620482e-05, "loss": 0.0067, "step": 738950 }, { "epoch": 1.92, "learning_rate": 1.2676363014249015e-05, "loss": 0.0082, "step": 738960 }, { "epoch": 1.92, "learning_rate": 1.267247479787755e-05, "loss": 0.0073, "step": 738970 }, { "epoch": 1.92, "learning_rate": 1.2668586581506087e-05, "loss": 0.0074, "step": 738980 }, { "epoch": 1.92, "learning_rate": 1.2664698365134621e-05, "loss": 0.0083, "step": 738990 }, { "epoch": 1.92, "learning_rate": 1.2660810148763158e-05, "loss": 0.0075, "step": 739000 }, { "epoch": 1.92, "eval_cer": 0.8816592975782083, "eval_loss": 0.004513974767178297, "eval_runtime": 107.8813, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 739000 }, { "epoch": 1.92, "learning_rate": 1.2656921932391693e-05, "loss": 0.008, "step": 739010 }, { "epoch": 1.92, "learning_rate": 1.2653033716020228e-05, "loss": 0.0059, "step": 739020 }, { "epoch": 1.92, "learning_rate": 1.2649145499648763e-05, "loss": 0.0075, "step": 739030 }, { "epoch": 1.92, "learning_rate": 1.2645257283277299e-05, "loss": 0.0052, "step": 739040 }, { "epoch": 1.92, "learning_rate": 1.2641369066905834e-05, "loss": 0.0087, "step": 739050 }, { "epoch": 1.92, "learning_rate": 1.263748085053437e-05, "loss": 0.0091, "step": 739060 }, { "epoch": 1.92, "learning_rate": 1.2633592634162905e-05, "loss": 0.0053, "step": 739070 }, { "epoch": 1.92, "learning_rate": 1.2629704417791439e-05, "loss": 0.0049, "step": 739080 }, { "epoch": 1.92, "learning_rate": 1.2625816201419975e-05, "loss": 0.0069, "step": 739090 }, { "epoch": 1.92, "learning_rate": 1.262192798504851e-05, "loss": 0.0079, "step": 739100 }, { "epoch": 1.92, "learning_rate": 1.2618039768677047e-05, "loss": 0.0062, "step": 739110 }, { "epoch": 1.92, "learning_rate": 1.2614151552305581e-05, "loss": 0.0082, "step": 739120 }, { "epoch": 1.92, "learning_rate": 1.2610263335934118e-05, "loss": 0.0058, "step": 739130 }, { "epoch": 1.92, "learning_rate": 1.2606375119562653e-05, "loss": 0.0079, "step": 739140 }, { "epoch": 1.92, "learning_rate": 1.2602486903191188e-05, "loss": 0.0055, "step": 739150 }, { "epoch": 1.92, "learning_rate": 1.2598598686819723e-05, "loss": 0.006, "step": 739160 }, { "epoch": 1.92, "learning_rate": 1.2594710470448259e-05, "loss": 0.0099, "step": 739170 }, { "epoch": 1.92, "learning_rate": 1.2590822254076794e-05, "loss": 0.0083, "step": 739180 }, { "epoch": 1.92, "learning_rate": 1.258693403770533e-05, "loss": 0.0075, "step": 739190 }, { "epoch": 1.92, "learning_rate": 1.2583045821333865e-05, "loss": 0.0064, "step": 739200 }, { "epoch": 1.92, "learning_rate": 1.2579157604962399e-05, "loss": 0.0089, "step": 739210 }, { "epoch": 1.92, "learning_rate": 1.2575269388590935e-05, "loss": 0.0062, "step": 739220 }, { "epoch": 1.92, "learning_rate": 1.257138117221947e-05, "loss": 0.0052, "step": 739230 }, { "epoch": 1.92, "learning_rate": 1.2567492955848007e-05, "loss": 0.0096, "step": 739240 }, { "epoch": 1.92, "learning_rate": 1.2563604739476541e-05, "loss": 0.0081, "step": 739250 }, { "epoch": 1.92, "learning_rate": 1.2559716523105078e-05, "loss": 0.0088, "step": 739260 }, { "epoch": 1.92, "learning_rate": 1.2555828306733611e-05, "loss": 0.0083, "step": 739270 }, { "epoch": 1.92, "learning_rate": 1.2551940090362148e-05, "loss": 0.0074, "step": 739280 }, { "epoch": 1.92, "learning_rate": 1.2548051873990683e-05, "loss": 0.0074, "step": 739290 }, { "epoch": 1.92, "learning_rate": 1.2544163657619219e-05, "loss": 0.0107, "step": 739300 }, { "epoch": 1.92, "learning_rate": 1.2540275441247754e-05, "loss": 0.0081, "step": 739310 }, { "epoch": 1.92, "learning_rate": 1.2536387224876289e-05, "loss": 0.0073, "step": 739320 }, { "epoch": 1.92, "learning_rate": 1.2532499008504824e-05, "loss": 0.0079, "step": 739330 }, { "epoch": 1.92, "learning_rate": 1.2528610792133359e-05, "loss": 0.0108, "step": 739340 }, { "epoch": 1.92, "learning_rate": 1.2524722575761895e-05, "loss": 0.0079, "step": 739350 }, { "epoch": 1.92, "learning_rate": 1.252083435939043e-05, "loss": 0.0085, "step": 739360 }, { "epoch": 1.92, "learning_rate": 1.2516946143018967e-05, "loss": 0.0121, "step": 739370 }, { "epoch": 1.92, "learning_rate": 1.2513057926647501e-05, "loss": 0.0069, "step": 739380 }, { "epoch": 1.92, "learning_rate": 1.2509169710276035e-05, "loss": 0.007, "step": 739390 }, { "epoch": 1.92, "learning_rate": 1.2505281493904571e-05, "loss": 0.0068, "step": 739400 }, { "epoch": 1.92, "learning_rate": 1.2501393277533106e-05, "loss": 0.0079, "step": 739410 }, { "epoch": 1.92, "learning_rate": 1.2497505061161643e-05, "loss": 0.007, "step": 739420 }, { "epoch": 1.92, "learning_rate": 1.2493616844790177e-05, "loss": 0.0063, "step": 739430 }, { "epoch": 1.92, "learning_rate": 1.2489728628418714e-05, "loss": 0.0088, "step": 739440 }, { "epoch": 1.92, "learning_rate": 1.2485840412047249e-05, "loss": 0.0066, "step": 739450 }, { "epoch": 1.92, "learning_rate": 1.2481952195675784e-05, "loss": 0.0056, "step": 739460 }, { "epoch": 1.92, "learning_rate": 1.2478063979304319e-05, "loss": 0.006, "step": 739470 }, { "epoch": 1.92, "learning_rate": 1.2474175762932855e-05, "loss": 0.011, "step": 739480 }, { "epoch": 1.92, "learning_rate": 1.247028754656139e-05, "loss": 0.0113, "step": 739490 }, { "epoch": 1.92, "learning_rate": 1.2466399330189926e-05, "loss": 0.0085, "step": 739500 }, { "epoch": 1.92, "learning_rate": 1.2462511113818461e-05, "loss": 0.0062, "step": 739510 }, { "epoch": 1.92, "learning_rate": 1.2458622897446995e-05, "loss": 0.0049, "step": 739520 }, { "epoch": 1.92, "learning_rate": 1.2454734681075531e-05, "loss": 0.0071, "step": 739530 }, { "epoch": 1.92, "learning_rate": 1.2450846464704066e-05, "loss": 0.0066, "step": 739540 }, { "epoch": 1.92, "learning_rate": 1.2446958248332602e-05, "loss": 0.0071, "step": 739550 }, { "epoch": 1.92, "learning_rate": 1.2443070031961137e-05, "loss": 0.008, "step": 739560 }, { "epoch": 1.92, "learning_rate": 1.2439181815589674e-05, "loss": 0.0071, "step": 739570 }, { "epoch": 1.92, "learning_rate": 1.2435293599218207e-05, "loss": 0.0055, "step": 739580 }, { "epoch": 1.92, "learning_rate": 1.2431405382846744e-05, "loss": 0.007, "step": 739590 }, { "epoch": 1.92, "learning_rate": 1.2427517166475278e-05, "loss": 0.0085, "step": 739600 }, { "epoch": 1.92, "learning_rate": 1.2423628950103815e-05, "loss": 0.0078, "step": 739610 }, { "epoch": 1.92, "learning_rate": 1.241974073373235e-05, "loss": 0.0047, "step": 739620 }, { "epoch": 1.92, "learning_rate": 1.2415852517360886e-05, "loss": 0.0058, "step": 739630 }, { "epoch": 1.92, "learning_rate": 1.241196430098942e-05, "loss": 0.0073, "step": 739640 }, { "epoch": 1.92, "learning_rate": 1.2408076084617954e-05, "loss": 0.007, "step": 739650 }, { "epoch": 1.92, "learning_rate": 1.2404187868246491e-05, "loss": 0.0069, "step": 739660 }, { "epoch": 1.92, "learning_rate": 1.2400299651875026e-05, "loss": 0.0086, "step": 739670 }, { "epoch": 1.92, "learning_rate": 1.2396411435503562e-05, "loss": 0.0068, "step": 739680 }, { "epoch": 1.92, "learning_rate": 1.2392523219132097e-05, "loss": 0.0073, "step": 739690 }, { "epoch": 1.92, "learning_rate": 1.2388635002760632e-05, "loss": 0.0073, "step": 739700 }, { "epoch": 1.92, "learning_rate": 1.2384746786389167e-05, "loss": 0.0102, "step": 739710 }, { "epoch": 1.92, "learning_rate": 1.2380858570017704e-05, "loss": 0.0097, "step": 739720 }, { "epoch": 1.92, "learning_rate": 1.2376970353646238e-05, "loss": 0.0059, "step": 739730 }, { "epoch": 1.92, "learning_rate": 1.2373082137274775e-05, "loss": 0.0087, "step": 739740 }, { "epoch": 1.92, "learning_rate": 1.236919392090331e-05, "loss": 0.0047, "step": 739750 }, { "epoch": 1.92, "learning_rate": 1.2365305704531846e-05, "loss": 0.008, "step": 739760 }, { "epoch": 1.92, "learning_rate": 1.236141748816038e-05, "loss": 0.0064, "step": 739770 }, { "epoch": 1.92, "learning_rate": 1.2357529271788914e-05, "loss": 0.0076, "step": 739780 }, { "epoch": 1.92, "learning_rate": 1.2353641055417451e-05, "loss": 0.0084, "step": 739790 }, { "epoch": 1.92, "learning_rate": 1.2349752839045986e-05, "loss": 0.0101, "step": 739800 }, { "epoch": 1.92, "learning_rate": 1.2345864622674522e-05, "loss": 0.0068, "step": 739810 }, { "epoch": 1.92, "learning_rate": 1.2341976406303057e-05, "loss": 0.0079, "step": 739820 }, { "epoch": 1.92, "learning_rate": 1.2338088189931592e-05, "loss": 0.0061, "step": 739830 }, { "epoch": 1.92, "learning_rate": 1.2334199973560127e-05, "loss": 0.0098, "step": 739840 }, { "epoch": 1.92, "learning_rate": 1.2330311757188664e-05, "loss": 0.0068, "step": 739850 }, { "epoch": 1.92, "learning_rate": 1.2326423540817198e-05, "loss": 0.0077, "step": 739860 }, { "epoch": 1.92, "learning_rate": 1.2322535324445735e-05, "loss": 0.0094, "step": 739870 }, { "epoch": 1.92, "learning_rate": 1.231864710807427e-05, "loss": 0.0088, "step": 739880 }, { "epoch": 1.92, "learning_rate": 1.2314758891702803e-05, "loss": 0.0078, "step": 739890 }, { "epoch": 1.92, "learning_rate": 1.231087067533134e-05, "loss": 0.0069, "step": 739900 }, { "epoch": 1.92, "learning_rate": 1.2306982458959874e-05, "loss": 0.0081, "step": 739910 }, { "epoch": 1.92, "learning_rate": 1.2303094242588411e-05, "loss": 0.0067, "step": 739920 }, { "epoch": 1.92, "learning_rate": 1.2299206026216946e-05, "loss": 0.012, "step": 739930 }, { "epoch": 1.92, "learning_rate": 1.2295317809845482e-05, "loss": 0.0073, "step": 739940 }, { "epoch": 1.92, "learning_rate": 1.2291429593474016e-05, "loss": 0.008, "step": 739950 }, { "epoch": 1.92, "learning_rate": 1.2287541377102552e-05, "loss": 0.01, "step": 739960 }, { "epoch": 1.92, "learning_rate": 1.2283653160731087e-05, "loss": 0.0063, "step": 739970 }, { "epoch": 1.92, "learning_rate": 1.2279764944359624e-05, "loss": 0.0076, "step": 739980 }, { "epoch": 1.92, "learning_rate": 1.2275876727988158e-05, "loss": 0.0093, "step": 739990 }, { "epoch": 1.92, "learning_rate": 1.2271988511616693e-05, "loss": 0.0065, "step": 740000 }, { "epoch": 1.92, "eval_cer": 0.8816606972151424, "eval_loss": 0.004454230424016714, "eval_runtime": 108.0552, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 740000 }, { "epoch": 1.92, "learning_rate": 1.2268100295245228e-05, "loss": 0.0118, "step": 740010 }, { "epoch": 1.92, "learning_rate": 1.2264212078873763e-05, "loss": 0.0093, "step": 740020 }, { "epoch": 1.92, "learning_rate": 1.22603238625023e-05, "loss": 0.0056, "step": 740030 }, { "epoch": 1.92, "learning_rate": 1.2256435646130834e-05, "loss": 0.0078, "step": 740040 }, { "epoch": 1.92, "learning_rate": 1.2252547429759371e-05, "loss": 0.0089, "step": 740050 }, { "epoch": 1.92, "learning_rate": 1.2248659213387906e-05, "loss": 0.0092, "step": 740060 }, { "epoch": 1.92, "learning_rate": 1.2244770997016442e-05, "loss": 0.0068, "step": 740070 }, { "epoch": 1.92, "learning_rate": 1.2240882780644976e-05, "loss": 0.0081, "step": 740080 }, { "epoch": 1.92, "learning_rate": 1.223699456427351e-05, "loss": 0.0106, "step": 740090 }, { "epoch": 1.92, "learning_rate": 1.2233106347902047e-05, "loss": 0.0077, "step": 740100 }, { "epoch": 1.92, "learning_rate": 1.2229218131530582e-05, "loss": 0.0112, "step": 740110 }, { "epoch": 1.92, "learning_rate": 1.2225329915159118e-05, "loss": 0.007, "step": 740120 }, { "epoch": 1.92, "learning_rate": 1.2221441698787653e-05, "loss": 0.0076, "step": 740130 }, { "epoch": 1.92, "learning_rate": 1.2217553482416188e-05, "loss": 0.0073, "step": 740140 }, { "epoch": 1.92, "learning_rate": 1.2213665266044723e-05, "loss": 0.0074, "step": 740150 }, { "epoch": 1.92, "learning_rate": 1.220977704967326e-05, "loss": 0.0052, "step": 740160 }, { "epoch": 1.92, "learning_rate": 1.2205888833301794e-05, "loss": 0.0072, "step": 740170 }, { "epoch": 1.92, "learning_rate": 1.2202000616930331e-05, "loss": 0.0088, "step": 740180 }, { "epoch": 1.92, "learning_rate": 1.2198112400558866e-05, "loss": 0.0068, "step": 740190 }, { "epoch": 1.92, "learning_rate": 1.2194224184187399e-05, "loss": 0.0069, "step": 740200 }, { "epoch": 1.92, "learning_rate": 1.2190335967815936e-05, "loss": 0.006, "step": 740210 }, { "epoch": 1.92, "learning_rate": 1.218644775144447e-05, "loss": 0.0067, "step": 740220 }, { "epoch": 1.92, "learning_rate": 1.2182559535073007e-05, "loss": 0.0068, "step": 740230 }, { "epoch": 1.92, "learning_rate": 1.2178671318701542e-05, "loss": 0.008, "step": 740240 }, { "epoch": 1.92, "learning_rate": 1.2174783102330078e-05, "loss": 0.0063, "step": 740250 }, { "epoch": 1.92, "learning_rate": 1.2170894885958612e-05, "loss": 0.0078, "step": 740260 }, { "epoch": 1.92, "learning_rate": 1.2167006669587148e-05, "loss": 0.0077, "step": 740270 }, { "epoch": 1.92, "learning_rate": 1.2163118453215683e-05, "loss": 0.0078, "step": 740280 }, { "epoch": 1.92, "learning_rate": 1.215923023684422e-05, "loss": 0.0066, "step": 740290 }, { "epoch": 1.92, "learning_rate": 1.2155342020472754e-05, "loss": 0.0071, "step": 740300 }, { "epoch": 1.92, "learning_rate": 1.2151453804101291e-05, "loss": 0.008, "step": 740310 }, { "epoch": 1.92, "learning_rate": 1.2147565587729824e-05, "loss": 0.0083, "step": 740320 }, { "epoch": 1.92, "learning_rate": 1.2143677371358359e-05, "loss": 0.0092, "step": 740330 }, { "epoch": 1.92, "learning_rate": 1.2139789154986896e-05, "loss": 0.008, "step": 740340 }, { "epoch": 1.92, "learning_rate": 1.213590093861543e-05, "loss": 0.0072, "step": 740350 }, { "epoch": 1.92, "learning_rate": 1.2132012722243967e-05, "loss": 0.005, "step": 740360 }, { "epoch": 1.92, "learning_rate": 1.2128124505872502e-05, "loss": 0.0059, "step": 740370 }, { "epoch": 1.92, "learning_rate": 1.2124236289501038e-05, "loss": 0.0063, "step": 740380 }, { "epoch": 1.92, "learning_rate": 1.2120348073129572e-05, "loss": 0.0077, "step": 740390 }, { "epoch": 1.92, "learning_rate": 1.2116459856758108e-05, "loss": 0.0077, "step": 740400 }, { "epoch": 1.92, "learning_rate": 1.2112571640386643e-05, "loss": 0.0051, "step": 740410 }, { "epoch": 1.92, "learning_rate": 1.210868342401518e-05, "loss": 0.0058, "step": 740420 }, { "epoch": 1.92, "learning_rate": 1.2104795207643714e-05, "loss": 0.0063, "step": 740430 }, { "epoch": 1.92, "learning_rate": 1.2100906991272251e-05, "loss": 0.0075, "step": 740440 }, { "epoch": 1.92, "learning_rate": 1.2097018774900784e-05, "loss": 0.0098, "step": 740450 }, { "epoch": 1.92, "learning_rate": 1.2093130558529319e-05, "loss": 0.0068, "step": 740460 }, { "epoch": 1.92, "learning_rate": 1.2089242342157855e-05, "loss": 0.0055, "step": 740470 }, { "epoch": 1.92, "learning_rate": 1.208535412578639e-05, "loss": 0.0092, "step": 740480 }, { "epoch": 1.92, "learning_rate": 1.2081465909414927e-05, "loss": 0.0082, "step": 740490 }, { "epoch": 1.92, "learning_rate": 1.2077577693043462e-05, "loss": 0.0085, "step": 740500 }, { "epoch": 1.92, "learning_rate": 1.2073689476671997e-05, "loss": 0.0056, "step": 740510 }, { "epoch": 1.92, "learning_rate": 1.2069801260300531e-05, "loss": 0.0086, "step": 740520 }, { "epoch": 1.92, "learning_rate": 1.2065913043929068e-05, "loss": 0.0088, "step": 740530 }, { "epoch": 1.92, "learning_rate": 1.2062024827557603e-05, "loss": 0.0076, "step": 740540 }, { "epoch": 1.92, "learning_rate": 1.205813661118614e-05, "loss": 0.0061, "step": 740550 }, { "epoch": 1.92, "learning_rate": 1.2054248394814674e-05, "loss": 0.0089, "step": 740560 }, { "epoch": 1.92, "learning_rate": 1.2050360178443207e-05, "loss": 0.0076, "step": 740570 }, { "epoch": 1.92, "learning_rate": 1.2046471962071744e-05, "loss": 0.013, "step": 740580 }, { "epoch": 1.92, "learning_rate": 1.2042583745700279e-05, "loss": 0.0074, "step": 740590 }, { "epoch": 1.92, "learning_rate": 1.2038695529328815e-05, "loss": 0.0069, "step": 740600 }, { "epoch": 1.92, "learning_rate": 1.203480731295735e-05, "loss": 0.0068, "step": 740610 }, { "epoch": 1.92, "learning_rate": 1.2030919096585887e-05, "loss": 0.0061, "step": 740620 }, { "epoch": 1.92, "learning_rate": 1.202703088021442e-05, "loss": 0.0101, "step": 740630 }, { "epoch": 1.92, "learning_rate": 1.2023142663842957e-05, "loss": 0.0053, "step": 740640 }, { "epoch": 1.92, "learning_rate": 1.2019254447471491e-05, "loss": 0.0066, "step": 740650 }, { "epoch": 1.92, "learning_rate": 1.2015366231100028e-05, "loss": 0.0073, "step": 740660 }, { "epoch": 1.92, "learning_rate": 1.2011478014728563e-05, "loss": 0.0058, "step": 740670 }, { "epoch": 1.92, "learning_rate": 1.20075897983571e-05, "loss": 0.0059, "step": 740680 }, { "epoch": 1.92, "learning_rate": 1.2003701581985634e-05, "loss": 0.0069, "step": 740690 }, { "epoch": 1.92, "learning_rate": 1.1999813365614167e-05, "loss": 0.0063, "step": 740700 }, { "epoch": 1.92, "learning_rate": 1.1995925149242704e-05, "loss": 0.005, "step": 740710 }, { "epoch": 1.92, "learning_rate": 1.1992036932871239e-05, "loss": 0.0074, "step": 740720 }, { "epoch": 1.92, "learning_rate": 1.1988148716499775e-05, "loss": 0.0068, "step": 740730 }, { "epoch": 1.92, "learning_rate": 1.198426050012831e-05, "loss": 0.0087, "step": 740740 }, { "epoch": 1.92, "learning_rate": 1.1980372283756847e-05, "loss": 0.0063, "step": 740750 }, { "epoch": 1.92, "learning_rate": 1.197648406738538e-05, "loss": 0.0073, "step": 740760 }, { "epoch": 1.92, "learning_rate": 1.1972595851013915e-05, "loss": 0.0105, "step": 740770 }, { "epoch": 1.92, "learning_rate": 1.1968707634642451e-05, "loss": 0.0087, "step": 740780 }, { "epoch": 1.92, "learning_rate": 1.1964819418270986e-05, "loss": 0.0072, "step": 740790 }, { "epoch": 1.92, "learning_rate": 1.1960931201899523e-05, "loss": 0.01, "step": 740800 }, { "epoch": 1.92, "learning_rate": 1.1957042985528058e-05, "loss": 0.0085, "step": 740810 }, { "epoch": 1.92, "learning_rate": 1.1953154769156593e-05, "loss": 0.0053, "step": 740820 }, { "epoch": 1.92, "learning_rate": 1.1949266552785127e-05, "loss": 0.0069, "step": 740830 }, { "epoch": 1.92, "learning_rate": 1.1945378336413664e-05, "loss": 0.0061, "step": 740840 }, { "epoch": 1.92, "learning_rate": 1.1941490120042199e-05, "loss": 0.0074, "step": 740850 }, { "epoch": 1.92, "learning_rate": 1.1937601903670735e-05, "loss": 0.0062, "step": 740860 }, { "epoch": 1.92, "learning_rate": 1.193371368729927e-05, "loss": 0.0061, "step": 740870 }, { "epoch": 1.92, "learning_rate": 1.1929825470927803e-05, "loss": 0.0075, "step": 740880 }, { "epoch": 1.92, "learning_rate": 1.192593725455634e-05, "loss": 0.0088, "step": 740890 }, { "epoch": 1.92, "learning_rate": 1.1922049038184875e-05, "loss": 0.0061, "step": 740900 }, { "epoch": 1.92, "learning_rate": 1.1918160821813411e-05, "loss": 0.0086, "step": 740910 }, { "epoch": 1.92, "learning_rate": 1.1914272605441946e-05, "loss": 0.0062, "step": 740920 }, { "epoch": 1.92, "learning_rate": 1.1910384389070483e-05, "loss": 0.0061, "step": 740930 }, { "epoch": 1.92, "learning_rate": 1.1906496172699016e-05, "loss": 0.0049, "step": 740940 }, { "epoch": 1.92, "learning_rate": 1.1902607956327553e-05, "loss": 0.0074, "step": 740950 }, { "epoch": 1.92, "learning_rate": 1.1898719739956087e-05, "loss": 0.0051, "step": 740960 }, { "epoch": 1.92, "learning_rate": 1.1894831523584624e-05, "loss": 0.0079, "step": 740970 }, { "epoch": 1.92, "learning_rate": 1.1890943307213159e-05, "loss": 0.0064, "step": 740980 }, { "epoch": 1.92, "learning_rate": 1.1887055090841695e-05, "loss": 0.0059, "step": 740990 }, { "epoch": 1.92, "learning_rate": 1.188316687447023e-05, "loss": 0.007, "step": 741000 }, { "epoch": 1.92, "eval_cer": 0.8816774928583525, "eval_loss": 0.004421970807015896, "eval_runtime": 108.0147, "eval_samples_per_second": 18.516, "eval_steps_per_second": 4.629, "step": 741000 }, { "epoch": 1.92, "learning_rate": 1.1879278658098763e-05, "loss": 0.0069, "step": 741010 }, { "epoch": 1.92, "learning_rate": 1.18753904417273e-05, "loss": 0.0086, "step": 741020 }, { "epoch": 1.92, "learning_rate": 1.1871502225355835e-05, "loss": 0.0042, "step": 741030 }, { "epoch": 1.92, "learning_rate": 1.1867614008984371e-05, "loss": 0.0071, "step": 741040 }, { "epoch": 1.92, "learning_rate": 1.1863725792612906e-05, "loss": 0.0065, "step": 741050 }, { "epoch": 1.92, "learning_rate": 1.1859837576241443e-05, "loss": 0.0078, "step": 741060 }, { "epoch": 1.92, "learning_rate": 1.1855949359869976e-05, "loss": 0.0062, "step": 741070 }, { "epoch": 1.92, "learning_rate": 1.1852061143498513e-05, "loss": 0.0057, "step": 741080 }, { "epoch": 1.92, "learning_rate": 1.1848172927127047e-05, "loss": 0.0049, "step": 741090 }, { "epoch": 1.92, "learning_rate": 1.1844284710755584e-05, "loss": 0.0052, "step": 741100 }, { "epoch": 1.92, "learning_rate": 1.1840396494384119e-05, "loss": 0.0056, "step": 741110 }, { "epoch": 1.92, "learning_rate": 1.1836508278012655e-05, "loss": 0.0058, "step": 741120 }, { "epoch": 1.92, "learning_rate": 1.1832620061641189e-05, "loss": 0.0068, "step": 741130 }, { "epoch": 1.92, "learning_rate": 1.1828731845269723e-05, "loss": 0.0067, "step": 741140 }, { "epoch": 1.92, "learning_rate": 1.182484362889826e-05, "loss": 0.0053, "step": 741150 }, { "epoch": 1.92, "learning_rate": 1.1820955412526795e-05, "loss": 0.0089, "step": 741160 }, { "epoch": 1.92, "learning_rate": 1.1817067196155331e-05, "loss": 0.0063, "step": 741170 }, { "epoch": 1.92, "learning_rate": 1.1813178979783866e-05, "loss": 0.0057, "step": 741180 }, { "epoch": 1.92, "learning_rate": 1.1809290763412401e-05, "loss": 0.0075, "step": 741190 }, { "epoch": 1.92, "learning_rate": 1.1805402547040936e-05, "loss": 0.0084, "step": 741200 }, { "epoch": 1.92, "learning_rate": 1.1801514330669472e-05, "loss": 0.0072, "step": 741210 }, { "epoch": 1.92, "learning_rate": 1.1797626114298007e-05, "loss": 0.0084, "step": 741220 }, { "epoch": 1.92, "learning_rate": 1.1793737897926544e-05, "loss": 0.0059, "step": 741230 }, { "epoch": 1.92, "learning_rate": 1.1789849681555079e-05, "loss": 0.0087, "step": 741240 }, { "epoch": 1.92, "learning_rate": 1.1785961465183612e-05, "loss": 0.0078, "step": 741250 }, { "epoch": 1.92, "learning_rate": 1.1782073248812149e-05, "loss": 0.006, "step": 741260 }, { "epoch": 1.92, "learning_rate": 1.1778185032440683e-05, "loss": 0.0056, "step": 741270 }, { "epoch": 1.92, "learning_rate": 1.177429681606922e-05, "loss": 0.0052, "step": 741280 }, { "epoch": 1.92, "learning_rate": 1.1770408599697755e-05, "loss": 0.0064, "step": 741290 }, { "epoch": 1.92, "learning_rate": 1.1766520383326291e-05, "loss": 0.0051, "step": 741300 }, { "epoch": 1.92, "learning_rate": 1.1762632166954826e-05, "loss": 0.0078, "step": 741310 }, { "epoch": 1.92, "learning_rate": 1.1758743950583361e-05, "loss": 0.0066, "step": 741320 }, { "epoch": 1.92, "learning_rate": 1.1754855734211896e-05, "loss": 0.01, "step": 741330 }, { "epoch": 1.92, "learning_rate": 1.1750967517840432e-05, "loss": 0.0062, "step": 741340 }, { "epoch": 1.92, "learning_rate": 1.1747079301468967e-05, "loss": 0.0049, "step": 741350 }, { "epoch": 1.92, "learning_rate": 1.1743191085097504e-05, "loss": 0.0069, "step": 741360 }, { "epoch": 1.92, "learning_rate": 1.1739302868726039e-05, "loss": 0.0097, "step": 741370 }, { "epoch": 1.92, "learning_rate": 1.1735414652354572e-05, "loss": 0.0052, "step": 741380 }, { "epoch": 1.92, "learning_rate": 1.1731526435983108e-05, "loss": 0.007, "step": 741390 }, { "epoch": 1.92, "learning_rate": 1.1727638219611643e-05, "loss": 0.0074, "step": 741400 }, { "epoch": 1.92, "learning_rate": 1.172375000324018e-05, "loss": 0.0082, "step": 741410 }, { "epoch": 1.92, "learning_rate": 1.1719861786868715e-05, "loss": 0.01, "step": 741420 }, { "epoch": 1.92, "learning_rate": 1.1715973570497251e-05, "loss": 0.0086, "step": 741430 }, { "epoch": 1.92, "learning_rate": 1.1712085354125784e-05, "loss": 0.0069, "step": 741440 }, { "epoch": 1.92, "learning_rate": 1.170819713775432e-05, "loss": 0.0065, "step": 741450 }, { "epoch": 1.92, "learning_rate": 1.1704308921382856e-05, "loss": 0.0063, "step": 741460 }, { "epoch": 1.92, "learning_rate": 1.170042070501139e-05, "loss": 0.0073, "step": 741470 }, { "epoch": 1.92, "learning_rate": 1.1696532488639927e-05, "loss": 0.0053, "step": 741480 }, { "epoch": 1.92, "learning_rate": 1.1692644272268462e-05, "loss": 0.0069, "step": 741490 }, { "epoch": 1.92, "learning_rate": 1.1688756055896997e-05, "loss": 0.0078, "step": 741500 }, { "epoch": 1.92, "learning_rate": 1.1684867839525532e-05, "loss": 0.0076, "step": 741510 }, { "epoch": 1.92, "learning_rate": 1.1680979623154068e-05, "loss": 0.0101, "step": 741520 }, { "epoch": 1.92, "learning_rate": 1.1677091406782603e-05, "loss": 0.0057, "step": 741530 }, { "epoch": 1.92, "learning_rate": 1.167320319041114e-05, "loss": 0.0083, "step": 741540 }, { "epoch": 1.92, "learning_rate": 1.1669314974039675e-05, "loss": 0.0063, "step": 741550 }, { "epoch": 1.92, "learning_rate": 1.1665426757668208e-05, "loss": 0.0051, "step": 741560 }, { "epoch": 1.92, "learning_rate": 1.1661538541296744e-05, "loss": 0.0079, "step": 741570 }, { "epoch": 1.92, "learning_rate": 1.165765032492528e-05, "loss": 0.0138, "step": 741580 }, { "epoch": 1.92, "learning_rate": 1.1653762108553816e-05, "loss": 0.0063, "step": 741590 }, { "epoch": 1.92, "learning_rate": 1.164987389218235e-05, "loss": 0.0049, "step": 741600 }, { "epoch": 1.92, "learning_rate": 1.1645985675810887e-05, "loss": 0.0048, "step": 741610 }, { "epoch": 1.92, "learning_rate": 1.1642097459439422e-05, "loss": 0.0092, "step": 741620 }, { "epoch": 1.92, "learning_rate": 1.1638209243067957e-05, "loss": 0.0066, "step": 741630 }, { "epoch": 1.92, "learning_rate": 1.1634321026696492e-05, "loss": 0.0073, "step": 741640 }, { "epoch": 1.92, "learning_rate": 1.1630432810325028e-05, "loss": 0.0055, "step": 741650 }, { "epoch": 1.92, "learning_rate": 1.1626544593953563e-05, "loss": 0.0076, "step": 741660 }, { "epoch": 1.92, "learning_rate": 1.16226563775821e-05, "loss": 0.0057, "step": 741670 }, { "epoch": 1.92, "learning_rate": 1.1618768161210635e-05, "loss": 0.0068, "step": 741680 }, { "epoch": 1.92, "learning_rate": 1.1614879944839168e-05, "loss": 0.0083, "step": 741690 }, { "epoch": 1.92, "learning_rate": 1.1610991728467704e-05, "loss": 0.0063, "step": 741700 }, { "epoch": 1.92, "learning_rate": 1.160710351209624e-05, "loss": 0.0109, "step": 741710 }, { "epoch": 1.92, "learning_rate": 1.1603215295724776e-05, "loss": 0.0086, "step": 741720 }, { "epoch": 1.92, "learning_rate": 1.159932707935331e-05, "loss": 0.0051, "step": 741730 }, { "epoch": 1.92, "learning_rate": 1.1595438862981847e-05, "loss": 0.0041, "step": 741740 }, { "epoch": 1.92, "learning_rate": 1.159155064661038e-05, "loss": 0.0065, "step": 741750 }, { "epoch": 1.92, "learning_rate": 1.1587662430238917e-05, "loss": 0.0049, "step": 741760 }, { "epoch": 1.92, "learning_rate": 1.1583774213867452e-05, "loss": 0.0073, "step": 741770 }, { "epoch": 1.92, "learning_rate": 1.1579885997495988e-05, "loss": 0.0064, "step": 741780 }, { "epoch": 1.92, "learning_rate": 1.1575997781124523e-05, "loss": 0.0072, "step": 741790 }, { "epoch": 1.92, "learning_rate": 1.157210956475306e-05, "loss": 0.0088, "step": 741800 }, { "epoch": 1.92, "learning_rate": 1.1568221348381593e-05, "loss": 0.0071, "step": 741810 }, { "epoch": 1.92, "learning_rate": 1.1564333132010128e-05, "loss": 0.0069, "step": 741820 }, { "epoch": 1.92, "learning_rate": 1.1560444915638664e-05, "loss": 0.007, "step": 741830 }, { "epoch": 1.92, "learning_rate": 1.15565566992672e-05, "loss": 0.007, "step": 741840 }, { "epoch": 1.92, "learning_rate": 1.1552668482895736e-05, "loss": 0.0081, "step": 741850 }, { "epoch": 1.92, "learning_rate": 1.154878026652427e-05, "loss": 0.0096, "step": 741860 }, { "epoch": 1.92, "learning_rate": 1.1544892050152806e-05, "loss": 0.0087, "step": 741870 }, { "epoch": 1.92, "learning_rate": 1.154100383378134e-05, "loss": 0.0069, "step": 741880 }, { "epoch": 1.92, "learning_rate": 1.1537115617409877e-05, "loss": 0.0054, "step": 741890 }, { "epoch": 1.92, "learning_rate": 1.1533227401038412e-05, "loss": 0.0071, "step": 741900 }, { "epoch": 1.92, "learning_rate": 1.1529339184666948e-05, "loss": 0.0058, "step": 741910 }, { "epoch": 1.92, "learning_rate": 1.1525450968295483e-05, "loss": 0.0069, "step": 741920 }, { "epoch": 1.92, "learning_rate": 1.152156275192402e-05, "loss": 0.0066, "step": 741930 }, { "epoch": 1.92, "learning_rate": 1.1517674535552553e-05, "loss": 0.0053, "step": 741940 }, { "epoch": 1.92, "learning_rate": 1.1513786319181088e-05, "loss": 0.0086, "step": 741950 }, { "epoch": 1.92, "learning_rate": 1.1509898102809624e-05, "loss": 0.0102, "step": 741960 }, { "epoch": 1.92, "learning_rate": 1.150600988643816e-05, "loss": 0.0057, "step": 741970 }, { "epoch": 1.92, "learning_rate": 1.1502121670066696e-05, "loss": 0.0072, "step": 741980 }, { "epoch": 1.92, "learning_rate": 1.149823345369523e-05, "loss": 0.008, "step": 741990 }, { "epoch": 1.92, "learning_rate": 1.1494345237323766e-05, "loss": 0.0085, "step": 742000 }, { "epoch": 1.92, "eval_cer": 0.8816676953998133, "eval_loss": 0.004464298021048307, "eval_runtime": 107.8257, "eval_samples_per_second": 18.548, "eval_steps_per_second": 4.637, "step": 742000 }, { "epoch": 1.92, "learning_rate": 1.14904570209523e-05, "loss": 0.0036, "step": 742010 }, { "epoch": 1.92, "learning_rate": 1.1486568804580837e-05, "loss": 0.0067, "step": 742020 }, { "epoch": 1.92, "learning_rate": 1.1482680588209372e-05, "loss": 0.0072, "step": 742030 }, { "epoch": 1.92, "learning_rate": 1.1478792371837908e-05, "loss": 0.0057, "step": 742040 }, { "epoch": 1.92, "learning_rate": 1.1474904155466443e-05, "loss": 0.0089, "step": 742050 }, { "epoch": 1.92, "learning_rate": 1.1471015939094976e-05, "loss": 0.0065, "step": 742060 }, { "epoch": 1.92, "learning_rate": 1.1467127722723513e-05, "loss": 0.0066, "step": 742070 }, { "epoch": 1.92, "learning_rate": 1.1463239506352048e-05, "loss": 0.0072, "step": 742080 }, { "epoch": 1.92, "learning_rate": 1.1459351289980584e-05, "loss": 0.0094, "step": 742090 }, { "epoch": 1.92, "learning_rate": 1.145546307360912e-05, "loss": 0.0061, "step": 742100 }, { "epoch": 1.92, "learning_rate": 1.1451574857237656e-05, "loss": 0.0069, "step": 742110 }, { "epoch": 1.92, "learning_rate": 1.1447686640866189e-05, "loss": 0.0057, "step": 742120 }, { "epoch": 1.92, "learning_rate": 1.1443798424494724e-05, "loss": 0.0067, "step": 742130 }, { "epoch": 1.92, "learning_rate": 1.143991020812326e-05, "loss": 0.0063, "step": 742140 }, { "epoch": 1.92, "learning_rate": 1.1436021991751795e-05, "loss": 0.0079, "step": 742150 }, { "epoch": 1.92, "learning_rate": 1.1432133775380332e-05, "loss": 0.0063, "step": 742160 }, { "epoch": 1.92, "learning_rate": 1.1428245559008867e-05, "loss": 0.0062, "step": 742170 }, { "epoch": 1.92, "learning_rate": 1.1424357342637401e-05, "loss": 0.0073, "step": 742180 }, { "epoch": 1.92, "learning_rate": 1.1420469126265936e-05, "loss": 0.0075, "step": 742190 }, { "epoch": 1.92, "learning_rate": 1.1416580909894473e-05, "loss": 0.0056, "step": 742200 }, { "epoch": 1.92, "learning_rate": 1.1412692693523008e-05, "loss": 0.0095, "step": 742210 }, { "epoch": 1.92, "learning_rate": 1.1408804477151544e-05, "loss": 0.0079, "step": 742220 }, { "epoch": 1.92, "learning_rate": 1.140491626078008e-05, "loss": 0.0041, "step": 742230 }, { "epoch": 1.92, "learning_rate": 1.1401028044408616e-05, "loss": 0.008, "step": 742240 }, { "epoch": 1.92, "learning_rate": 1.1397139828037149e-05, "loss": 0.0063, "step": 742250 }, { "epoch": 1.92, "learning_rate": 1.1393251611665684e-05, "loss": 0.0097, "step": 742260 }, { "epoch": 1.92, "learning_rate": 1.138936339529422e-05, "loss": 0.0087, "step": 742270 }, { "epoch": 1.92, "learning_rate": 1.1385475178922755e-05, "loss": 0.0097, "step": 742280 }, { "epoch": 1.92, "learning_rate": 1.1381586962551292e-05, "loss": 0.0069, "step": 742290 }, { "epoch": 1.92, "learning_rate": 1.1377698746179827e-05, "loss": 0.0051, "step": 742300 }, { "epoch": 1.92, "learning_rate": 1.1373810529808361e-05, "loss": 0.0085, "step": 742310 }, { "epoch": 1.92, "learning_rate": 1.1369922313436896e-05, "loss": 0.0088, "step": 742320 }, { "epoch": 1.92, "learning_rate": 1.1366034097065433e-05, "loss": 0.0054, "step": 742330 }, { "epoch": 1.92, "learning_rate": 1.1362145880693968e-05, "loss": 0.0074, "step": 742340 }, { "epoch": 1.92, "learning_rate": 1.1358257664322504e-05, "loss": 0.0081, "step": 742350 }, { "epoch": 1.92, "learning_rate": 1.135436944795104e-05, "loss": 0.0059, "step": 742360 }, { "epoch": 1.92, "learning_rate": 1.1350481231579572e-05, "loss": 0.0072, "step": 742370 }, { "epoch": 1.92, "learning_rate": 1.1346593015208109e-05, "loss": 0.0085, "step": 742380 }, { "epoch": 1.92, "learning_rate": 1.1342704798836644e-05, "loss": 0.0073, "step": 742390 }, { "epoch": 1.92, "learning_rate": 1.133881658246518e-05, "loss": 0.0072, "step": 742400 }, { "epoch": 1.92, "learning_rate": 1.1334928366093715e-05, "loss": 0.0067, "step": 742410 }, { "epoch": 1.92, "learning_rate": 1.1331040149722252e-05, "loss": 0.0071, "step": 742420 }, { "epoch": 1.92, "learning_rate": 1.1327151933350785e-05, "loss": 0.0071, "step": 742430 }, { "epoch": 1.92, "learning_rate": 1.1323263716979321e-05, "loss": 0.0062, "step": 742440 }, { "epoch": 1.92, "learning_rate": 1.1319375500607856e-05, "loss": 0.0047, "step": 742450 }, { "epoch": 1.92, "learning_rate": 1.1315487284236393e-05, "loss": 0.0052, "step": 742460 }, { "epoch": 1.92, "learning_rate": 1.1311599067864928e-05, "loss": 0.0077, "step": 742470 }, { "epoch": 1.92, "learning_rate": 1.1307710851493464e-05, "loss": 0.0077, "step": 742480 }, { "epoch": 1.92, "learning_rate": 1.1303822635121999e-05, "loss": 0.0061, "step": 742490 }, { "epoch": 1.92, "learning_rate": 1.1299934418750532e-05, "loss": 0.006, "step": 742500 }, { "epoch": 1.92, "learning_rate": 1.1296046202379069e-05, "loss": 0.0052, "step": 742510 }, { "epoch": 1.92, "learning_rate": 1.1292157986007604e-05, "loss": 0.0063, "step": 742520 }, { "epoch": 1.92, "learning_rate": 1.128826976963614e-05, "loss": 0.0074, "step": 742530 }, { "epoch": 1.92, "learning_rate": 1.1284381553264675e-05, "loss": 0.0086, "step": 742540 }, { "epoch": 1.92, "learning_rate": 1.1280493336893212e-05, "loss": 0.0094, "step": 742550 }, { "epoch": 1.92, "learning_rate": 1.1276605120521745e-05, "loss": 0.0112, "step": 742560 }, { "epoch": 1.92, "learning_rate": 1.1272716904150281e-05, "loss": 0.0074, "step": 742570 }, { "epoch": 1.92, "learning_rate": 1.1268828687778816e-05, "loss": 0.0069, "step": 742580 }, { "epoch": 1.92, "learning_rate": 1.1264940471407353e-05, "loss": 0.0083, "step": 742590 }, { "epoch": 1.92, "learning_rate": 1.1261052255035888e-05, "loss": 0.0063, "step": 742600 }, { "epoch": 1.92, "learning_rate": 1.1257164038664424e-05, "loss": 0.0072, "step": 742610 }, { "epoch": 1.92, "learning_rate": 1.1253275822292957e-05, "loss": 0.0053, "step": 742620 }, { "epoch": 1.93, "learning_rate": 1.1249387605921492e-05, "loss": 0.0058, "step": 742630 }, { "epoch": 1.93, "learning_rate": 1.1245499389550029e-05, "loss": 0.006, "step": 742640 }, { "epoch": 1.93, "learning_rate": 1.1241611173178564e-05, "loss": 0.0077, "step": 742650 }, { "epoch": 1.93, "learning_rate": 1.12377229568071e-05, "loss": 0.0066, "step": 742660 }, { "epoch": 1.93, "learning_rate": 1.1233834740435635e-05, "loss": 0.0076, "step": 742670 }, { "epoch": 1.93, "learning_rate": 1.122994652406417e-05, "loss": 0.0075, "step": 742680 }, { "epoch": 1.93, "learning_rate": 1.1226058307692705e-05, "loss": 0.007, "step": 742690 }, { "epoch": 1.93, "learning_rate": 1.1222170091321241e-05, "loss": 0.0062, "step": 742700 }, { "epoch": 1.93, "learning_rate": 1.1218281874949776e-05, "loss": 0.006, "step": 742710 }, { "epoch": 1.93, "learning_rate": 1.1214393658578313e-05, "loss": 0.0084, "step": 742720 }, { "epoch": 1.93, "learning_rate": 1.1210505442206848e-05, "loss": 0.0071, "step": 742730 }, { "epoch": 1.93, "learning_rate": 1.1206617225835381e-05, "loss": 0.007, "step": 742740 }, { "epoch": 1.93, "learning_rate": 1.1202729009463917e-05, "loss": 0.0075, "step": 742750 }, { "epoch": 1.93, "learning_rate": 1.1198840793092452e-05, "loss": 0.0089, "step": 742760 }, { "epoch": 1.93, "learning_rate": 1.1194952576720989e-05, "loss": 0.0078, "step": 742770 }, { "epoch": 1.93, "learning_rate": 1.1191064360349524e-05, "loss": 0.0059, "step": 742780 }, { "epoch": 1.93, "learning_rate": 1.118717614397806e-05, "loss": 0.0069, "step": 742790 }, { "epoch": 1.93, "learning_rate": 1.1183287927606595e-05, "loss": 0.0084, "step": 742800 }, { "epoch": 1.93, "learning_rate": 1.117939971123513e-05, "loss": 0.0047, "step": 742810 }, { "epoch": 1.93, "learning_rate": 1.1175511494863665e-05, "loss": 0.0078, "step": 742820 }, { "epoch": 1.93, "learning_rate": 1.11716232784922e-05, "loss": 0.0057, "step": 742830 }, { "epoch": 1.93, "learning_rate": 1.1167735062120736e-05, "loss": 0.0093, "step": 742840 }, { "epoch": 1.93, "learning_rate": 1.1163846845749271e-05, "loss": 0.0044, "step": 742850 }, { "epoch": 1.93, "learning_rate": 1.1159958629377808e-05, "loss": 0.0078, "step": 742860 }, { "epoch": 1.93, "learning_rate": 1.115607041300634e-05, "loss": 0.0064, "step": 742870 }, { "epoch": 1.93, "learning_rate": 1.1152182196634877e-05, "loss": 0.0072, "step": 742880 }, { "epoch": 1.93, "learning_rate": 1.1148293980263412e-05, "loss": 0.0059, "step": 742890 }, { "epoch": 1.93, "learning_rate": 1.1144405763891949e-05, "loss": 0.0078, "step": 742900 }, { "epoch": 1.93, "learning_rate": 1.1140517547520484e-05, "loss": 0.0085, "step": 742910 }, { "epoch": 1.93, "learning_rate": 1.113662933114902e-05, "loss": 0.0068, "step": 742920 }, { "epoch": 1.93, "learning_rate": 1.1132741114777553e-05, "loss": 0.0048, "step": 742930 }, { "epoch": 1.93, "learning_rate": 1.1128852898406088e-05, "loss": 0.0079, "step": 742940 }, { "epoch": 1.93, "learning_rate": 1.1124964682034625e-05, "loss": 0.0074, "step": 742950 }, { "epoch": 1.93, "learning_rate": 1.112107646566316e-05, "loss": 0.0072, "step": 742960 }, { "epoch": 1.93, "learning_rate": 1.1117188249291696e-05, "loss": 0.0067, "step": 742970 }, { "epoch": 1.93, "learning_rate": 1.1113300032920231e-05, "loss": 0.0064, "step": 742980 }, { "epoch": 1.93, "learning_rate": 1.1109411816548766e-05, "loss": 0.0061, "step": 742990 }, { "epoch": 1.93, "learning_rate": 1.11055236001773e-05, "loss": 0.0076, "step": 743000 }, { "epoch": 1.93, "eval_cer": 0.8816606972151424, "eval_loss": 0.004454338923096657, "eval_runtime": 107.8248, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 743000 }, { "epoch": 1.93, "learning_rate": 1.1101635383805837e-05, "loss": 0.0086, "step": 743010 }, { "epoch": 1.93, "learning_rate": 1.1097747167434372e-05, "loss": 0.005, "step": 743020 }, { "epoch": 1.93, "learning_rate": 1.1093858951062909e-05, "loss": 0.0075, "step": 743030 }, { "epoch": 1.93, "learning_rate": 1.1089970734691444e-05, "loss": 0.0053, "step": 743040 }, { "epoch": 1.93, "learning_rate": 1.1086082518319977e-05, "loss": 0.0062, "step": 743050 }, { "epoch": 1.93, "learning_rate": 1.1082194301948513e-05, "loss": 0.0068, "step": 743060 }, { "epoch": 1.93, "learning_rate": 1.1078306085577048e-05, "loss": 0.0076, "step": 743070 }, { "epoch": 1.93, "learning_rate": 1.1074417869205585e-05, "loss": 0.008, "step": 743080 }, { "epoch": 1.93, "learning_rate": 1.107052965283412e-05, "loss": 0.0071, "step": 743090 }, { "epoch": 1.93, "learning_rate": 1.1066641436462656e-05, "loss": 0.0063, "step": 743100 }, { "epoch": 1.93, "learning_rate": 1.1062753220091191e-05, "loss": 0.0072, "step": 743110 }, { "epoch": 1.93, "learning_rate": 1.1058865003719726e-05, "loss": 0.0119, "step": 743120 }, { "epoch": 1.93, "learning_rate": 1.105497678734826e-05, "loss": 0.0075, "step": 743130 }, { "epoch": 1.93, "learning_rate": 1.1051088570976797e-05, "loss": 0.0077, "step": 743140 }, { "epoch": 1.93, "learning_rate": 1.1047200354605332e-05, "loss": 0.0123, "step": 743150 }, { "epoch": 1.93, "learning_rate": 1.1043312138233869e-05, "loss": 0.0074, "step": 743160 }, { "epoch": 1.93, "learning_rate": 1.1039423921862404e-05, "loss": 0.0073, "step": 743170 }, { "epoch": 1.93, "learning_rate": 1.1035535705490937e-05, "loss": 0.0061, "step": 743180 }, { "epoch": 1.93, "learning_rate": 1.1031647489119473e-05, "loss": 0.0068, "step": 743190 }, { "epoch": 1.93, "learning_rate": 1.1027759272748008e-05, "loss": 0.0086, "step": 743200 }, { "epoch": 1.93, "learning_rate": 1.1023871056376545e-05, "loss": 0.0057, "step": 743210 }, { "epoch": 1.93, "learning_rate": 1.101998284000508e-05, "loss": 0.0056, "step": 743220 }, { "epoch": 1.93, "learning_rate": 1.1016094623633616e-05, "loss": 0.0061, "step": 743230 }, { "epoch": 1.93, "learning_rate": 1.101220640726215e-05, "loss": 0.0053, "step": 743240 }, { "epoch": 1.93, "learning_rate": 1.1008318190890686e-05, "loss": 0.0081, "step": 743250 }, { "epoch": 1.93, "learning_rate": 1.100442997451922e-05, "loss": 0.0086, "step": 743260 }, { "epoch": 1.93, "learning_rate": 1.1000541758147757e-05, "loss": 0.0057, "step": 743270 }, { "epoch": 1.93, "learning_rate": 1.0996653541776292e-05, "loss": 0.0081, "step": 743280 }, { "epoch": 1.93, "learning_rate": 1.0992765325404829e-05, "loss": 0.0086, "step": 743290 }, { "epoch": 1.93, "learning_rate": 1.0988877109033362e-05, "loss": 0.0091, "step": 743300 }, { "epoch": 1.93, "learning_rate": 1.0984988892661897e-05, "loss": 0.0065, "step": 743310 }, { "epoch": 1.93, "learning_rate": 1.0981100676290433e-05, "loss": 0.0083, "step": 743320 }, { "epoch": 1.93, "learning_rate": 1.0977212459918968e-05, "loss": 0.0141, "step": 743330 }, { "epoch": 1.93, "learning_rate": 1.0973324243547505e-05, "loss": 0.0064, "step": 743340 }, { "epoch": 1.93, "learning_rate": 1.096943602717604e-05, "loss": 0.0073, "step": 743350 }, { "epoch": 1.93, "learning_rate": 1.0965547810804574e-05, "loss": 0.0061, "step": 743360 }, { "epoch": 1.93, "learning_rate": 1.096165959443311e-05, "loss": 0.006, "step": 743370 }, { "epoch": 1.93, "learning_rate": 1.0957771378061646e-05, "loss": 0.0057, "step": 743380 }, { "epoch": 1.93, "learning_rate": 1.095388316169018e-05, "loss": 0.0056, "step": 743390 }, { "epoch": 1.93, "learning_rate": 1.0949994945318717e-05, "loss": 0.0069, "step": 743400 }, { "epoch": 1.93, "learning_rate": 1.0946106728947252e-05, "loss": 0.0079, "step": 743410 }, { "epoch": 1.93, "learning_rate": 1.0942218512575789e-05, "loss": 0.0071, "step": 743420 }, { "epoch": 1.93, "learning_rate": 1.0938330296204322e-05, "loss": 0.0052, "step": 743430 }, { "epoch": 1.93, "learning_rate": 1.0934442079832857e-05, "loss": 0.0066, "step": 743440 }, { "epoch": 1.93, "learning_rate": 1.0930553863461393e-05, "loss": 0.0071, "step": 743450 }, { "epoch": 1.93, "learning_rate": 1.0926665647089928e-05, "loss": 0.0059, "step": 743460 }, { "epoch": 1.93, "learning_rate": 1.0922777430718465e-05, "loss": 0.0069, "step": 743470 }, { "epoch": 1.93, "learning_rate": 1.0918889214347e-05, "loss": 0.0066, "step": 743480 }, { "epoch": 1.93, "learning_rate": 1.0915000997975534e-05, "loss": 0.0069, "step": 743490 }, { "epoch": 1.93, "learning_rate": 1.091111278160407e-05, "loss": 0.009, "step": 743500 }, { "epoch": 1.93, "learning_rate": 1.0907224565232604e-05, "loss": 0.0092, "step": 743510 }, { "epoch": 1.93, "learning_rate": 1.090333634886114e-05, "loss": 0.0033, "step": 743520 }, { "epoch": 1.93, "learning_rate": 1.0899448132489676e-05, "loss": 0.0076, "step": 743530 }, { "epoch": 1.93, "learning_rate": 1.0895559916118212e-05, "loss": 0.006, "step": 743540 }, { "epoch": 1.93, "learning_rate": 1.0891671699746745e-05, "loss": 0.006, "step": 743550 }, { "epoch": 1.93, "learning_rate": 1.0887783483375282e-05, "loss": 0.006, "step": 743560 }, { "epoch": 1.93, "learning_rate": 1.0883895267003817e-05, "loss": 0.0115, "step": 743570 }, { "epoch": 1.93, "learning_rate": 1.0880007050632353e-05, "loss": 0.0071, "step": 743580 }, { "epoch": 1.93, "learning_rate": 1.0876118834260888e-05, "loss": 0.0052, "step": 743590 }, { "epoch": 1.93, "learning_rate": 1.0872230617889425e-05, "loss": 0.0066, "step": 743600 }, { "epoch": 1.93, "learning_rate": 1.0868342401517958e-05, "loss": 0.0059, "step": 743610 }, { "epoch": 1.93, "learning_rate": 1.0864454185146493e-05, "loss": 0.0067, "step": 743620 }, { "epoch": 1.93, "learning_rate": 1.086056596877503e-05, "loss": 0.0059, "step": 743630 }, { "epoch": 1.93, "learning_rate": 1.0856677752403564e-05, "loss": 0.0083, "step": 743640 }, { "epoch": 1.93, "learning_rate": 1.08527895360321e-05, "loss": 0.0063, "step": 743650 }, { "epoch": 1.93, "learning_rate": 1.0848901319660636e-05, "loss": 0.0086, "step": 743660 }, { "epoch": 1.93, "learning_rate": 1.084501310328917e-05, "loss": 0.0075, "step": 743670 }, { "epoch": 1.93, "learning_rate": 1.0841124886917705e-05, "loss": 0.0066, "step": 743680 }, { "epoch": 1.93, "learning_rate": 1.0837236670546242e-05, "loss": 0.0057, "step": 743690 }, { "epoch": 1.93, "learning_rate": 1.0833348454174777e-05, "loss": 0.007, "step": 743700 }, { "epoch": 1.93, "learning_rate": 1.0829460237803313e-05, "loss": 0.0064, "step": 743710 }, { "epoch": 1.93, "learning_rate": 1.0825572021431848e-05, "loss": 0.0055, "step": 743720 }, { "epoch": 1.93, "learning_rate": 1.0821683805060385e-05, "loss": 0.0053, "step": 743730 }, { "epoch": 1.93, "learning_rate": 1.0817795588688918e-05, "loss": 0.0061, "step": 743740 }, { "epoch": 1.93, "learning_rate": 1.0813907372317453e-05, "loss": 0.0078, "step": 743750 }, { "epoch": 1.93, "learning_rate": 1.081001915594599e-05, "loss": 0.0076, "step": 743760 }, { "epoch": 1.93, "learning_rate": 1.0806130939574524e-05, "loss": 0.0081, "step": 743770 }, { "epoch": 1.93, "learning_rate": 1.080224272320306e-05, "loss": 0.01, "step": 743780 }, { "epoch": 1.93, "learning_rate": 1.0798354506831596e-05, "loss": 0.0073, "step": 743790 }, { "epoch": 1.93, "learning_rate": 1.079446629046013e-05, "loss": 0.0062, "step": 743800 }, { "epoch": 1.93, "learning_rate": 1.0790578074088665e-05, "loss": 0.006, "step": 743810 }, { "epoch": 1.93, "learning_rate": 1.0786689857717202e-05, "loss": 0.006, "step": 743820 }, { "epoch": 1.93, "learning_rate": 1.0782801641345737e-05, "loss": 0.0072, "step": 743830 }, { "epoch": 1.93, "learning_rate": 1.0778913424974273e-05, "loss": 0.0078, "step": 743840 }, { "epoch": 1.93, "learning_rate": 1.0775025208602808e-05, "loss": 0.0063, "step": 743850 }, { "epoch": 1.93, "learning_rate": 1.0771136992231341e-05, "loss": 0.0084, "step": 743860 }, { "epoch": 1.93, "learning_rate": 1.0767248775859878e-05, "loss": 0.007, "step": 743870 }, { "epoch": 1.93, "learning_rate": 1.0763360559488413e-05, "loss": 0.0089, "step": 743880 }, { "epoch": 1.93, "learning_rate": 1.075947234311695e-05, "loss": 0.0052, "step": 743890 }, { "epoch": 1.93, "learning_rate": 1.0755584126745484e-05, "loss": 0.0068, "step": 743900 }, { "epoch": 1.93, "learning_rate": 1.075169591037402e-05, "loss": 0.0054, "step": 743910 }, { "epoch": 1.93, "learning_rate": 1.0747807694002554e-05, "loss": 0.0049, "step": 743920 }, { "epoch": 1.93, "learning_rate": 1.074391947763109e-05, "loss": 0.0051, "step": 743930 }, { "epoch": 1.93, "learning_rate": 1.0740031261259625e-05, "loss": 0.0078, "step": 743940 }, { "epoch": 1.93, "learning_rate": 1.0736143044888162e-05, "loss": 0.0085, "step": 743950 }, { "epoch": 1.93, "learning_rate": 1.0732254828516697e-05, "loss": 0.0064, "step": 743960 }, { "epoch": 1.93, "learning_rate": 1.0728366612145233e-05, "loss": 0.0071, "step": 743970 }, { "epoch": 1.93, "learning_rate": 1.0724478395773766e-05, "loss": 0.0062, "step": 743980 }, { "epoch": 1.93, "learning_rate": 1.0720590179402301e-05, "loss": 0.0072, "step": 743990 }, { "epoch": 1.93, "learning_rate": 1.0716701963030838e-05, "loss": 0.0062, "step": 744000 }, { "epoch": 1.93, "eval_cer": 0.8816704946736816, "eval_loss": 0.0045136138796806335, "eval_runtime": 107.8856, "eval_samples_per_second": 18.538, "eval_steps_per_second": 4.635, "step": 744000 }, { "epoch": 1.93, "learning_rate": 1.0712813746659373e-05, "loss": 0.0057, "step": 744010 }, { "epoch": 1.93, "learning_rate": 1.070892553028791e-05, "loss": 0.0105, "step": 744020 }, { "epoch": 1.93, "learning_rate": 1.0705037313916444e-05, "loss": 0.0097, "step": 744030 }, { "epoch": 1.93, "learning_rate": 1.070114909754498e-05, "loss": 0.0081, "step": 744040 }, { "epoch": 1.93, "learning_rate": 1.0697260881173514e-05, "loss": 0.0055, "step": 744050 }, { "epoch": 1.93, "learning_rate": 1.069337266480205e-05, "loss": 0.01, "step": 744060 }, { "epoch": 1.93, "learning_rate": 1.0689484448430585e-05, "loss": 0.0062, "step": 744070 }, { "epoch": 1.93, "learning_rate": 1.0685596232059122e-05, "loss": 0.0064, "step": 744080 }, { "epoch": 1.93, "learning_rate": 1.0681708015687657e-05, "loss": 0.0051, "step": 744090 }, { "epoch": 1.93, "learning_rate": 1.0677819799316193e-05, "loss": 0.0069, "step": 744100 }, { "epoch": 1.93, "learning_rate": 1.0673931582944726e-05, "loss": 0.0062, "step": 744110 }, { "epoch": 1.93, "learning_rate": 1.0670043366573261e-05, "loss": 0.0046, "step": 744120 }, { "epoch": 1.93, "learning_rate": 1.0666155150201798e-05, "loss": 0.0063, "step": 744130 }, { "epoch": 1.93, "learning_rate": 1.0662266933830333e-05, "loss": 0.0068, "step": 744140 }, { "epoch": 1.93, "learning_rate": 1.065837871745887e-05, "loss": 0.0072, "step": 744150 }, { "epoch": 1.93, "learning_rate": 1.0654490501087404e-05, "loss": 0.0083, "step": 744160 }, { "epoch": 1.93, "learning_rate": 1.0650602284715939e-05, "loss": 0.0061, "step": 744170 }, { "epoch": 1.93, "learning_rate": 1.0646714068344474e-05, "loss": 0.0062, "step": 744180 }, { "epoch": 1.93, "learning_rate": 1.064282585197301e-05, "loss": 0.0078, "step": 744190 }, { "epoch": 1.93, "learning_rate": 1.0638937635601545e-05, "loss": 0.0075, "step": 744200 }, { "epoch": 1.93, "learning_rate": 1.063504941923008e-05, "loss": 0.007, "step": 744210 }, { "epoch": 1.93, "learning_rate": 1.0631161202858617e-05, "loss": 0.0091, "step": 744220 }, { "epoch": 1.93, "learning_rate": 1.062727298648715e-05, "loss": 0.0072, "step": 744230 }, { "epoch": 1.93, "learning_rate": 1.0623384770115686e-05, "loss": 0.0113, "step": 744240 }, { "epoch": 1.93, "learning_rate": 1.0619496553744221e-05, "loss": 0.0072, "step": 744250 }, { "epoch": 1.93, "learning_rate": 1.0615608337372758e-05, "loss": 0.006, "step": 744260 }, { "epoch": 1.93, "learning_rate": 1.0611720121001293e-05, "loss": 0.0076, "step": 744270 }, { "epoch": 1.93, "learning_rate": 1.0607831904629829e-05, "loss": 0.0052, "step": 744280 }, { "epoch": 1.93, "learning_rate": 1.0603943688258362e-05, "loss": 0.0083, "step": 744290 }, { "epoch": 1.93, "learning_rate": 1.0600055471886897e-05, "loss": 0.0078, "step": 744300 }, { "epoch": 1.93, "learning_rate": 1.0596167255515434e-05, "loss": 0.0063, "step": 744310 }, { "epoch": 1.93, "learning_rate": 1.0592279039143969e-05, "loss": 0.0095, "step": 744320 }, { "epoch": 1.93, "learning_rate": 1.0588390822772505e-05, "loss": 0.0071, "step": 744330 }, { "epoch": 1.93, "learning_rate": 1.058450260640104e-05, "loss": 0.0068, "step": 744340 }, { "epoch": 1.93, "learning_rate": 1.0580614390029577e-05, "loss": 0.004, "step": 744350 }, { "epoch": 1.93, "learning_rate": 1.057672617365811e-05, "loss": 0.0055, "step": 744360 }, { "epoch": 1.93, "learning_rate": 1.0572837957286646e-05, "loss": 0.0052, "step": 744370 }, { "epoch": 1.93, "learning_rate": 1.0568949740915181e-05, "loss": 0.0054, "step": 744380 }, { "epoch": 1.93, "learning_rate": 1.0565061524543718e-05, "loss": 0.0094, "step": 744390 }, { "epoch": 1.93, "learning_rate": 1.0561173308172253e-05, "loss": 0.0095, "step": 744400 }, { "epoch": 1.93, "learning_rate": 1.0557285091800789e-05, "loss": 0.0084, "step": 744410 }, { "epoch": 1.93, "learning_rate": 1.0553396875429322e-05, "loss": 0.0078, "step": 744420 }, { "epoch": 1.93, "learning_rate": 1.0549508659057857e-05, "loss": 0.0059, "step": 744430 }, { "epoch": 1.93, "learning_rate": 1.0545620442686394e-05, "loss": 0.0076, "step": 744440 }, { "epoch": 1.93, "learning_rate": 1.0541732226314929e-05, "loss": 0.0073, "step": 744450 }, { "epoch": 1.93, "learning_rate": 1.0537844009943465e-05, "loss": 0.0054, "step": 744460 }, { "epoch": 1.93, "learning_rate": 1.0533955793572e-05, "loss": 0.0072, "step": 744470 }, { "epoch": 1.93, "learning_rate": 1.0530067577200535e-05, "loss": 0.0095, "step": 744480 }, { "epoch": 1.93, "learning_rate": 1.052617936082907e-05, "loss": 0.008, "step": 744490 }, { "epoch": 1.93, "learning_rate": 1.0522291144457606e-05, "loss": 0.0078, "step": 744500 }, { "epoch": 1.93, "learning_rate": 1.0518402928086141e-05, "loss": 0.0045, "step": 744510 }, { "epoch": 1.93, "learning_rate": 1.0514514711714678e-05, "loss": 0.0075, "step": 744520 }, { "epoch": 1.93, "learning_rate": 1.0510626495343213e-05, "loss": 0.0075, "step": 744530 }, { "epoch": 1.93, "learning_rate": 1.0506738278971746e-05, "loss": 0.0098, "step": 744540 }, { "epoch": 1.93, "learning_rate": 1.0502850062600282e-05, "loss": 0.0074, "step": 744550 }, { "epoch": 1.93, "learning_rate": 1.0498961846228817e-05, "loss": 0.0074, "step": 744560 }, { "epoch": 1.93, "learning_rate": 1.0495073629857354e-05, "loss": 0.0099, "step": 744570 }, { "epoch": 1.93, "learning_rate": 1.0491185413485889e-05, "loss": 0.009, "step": 744580 }, { "epoch": 1.93, "learning_rate": 1.0487297197114425e-05, "loss": 0.0054, "step": 744590 }, { "epoch": 1.93, "learning_rate": 1.0483408980742958e-05, "loss": 0.0064, "step": 744600 }, { "epoch": 1.93, "learning_rate": 1.0479520764371495e-05, "loss": 0.0095, "step": 744610 }, { "epoch": 1.93, "learning_rate": 1.047563254800003e-05, "loss": 0.0074, "step": 744620 }, { "epoch": 1.93, "learning_rate": 1.0471744331628566e-05, "loss": 0.0065, "step": 744630 }, { "epoch": 1.93, "learning_rate": 1.0467856115257101e-05, "loss": 0.0072, "step": 744640 }, { "epoch": 1.93, "learning_rate": 1.0463967898885638e-05, "loss": 0.0072, "step": 744650 }, { "epoch": 1.93, "learning_rate": 1.0460079682514173e-05, "loss": 0.0075, "step": 744660 }, { "epoch": 1.93, "learning_rate": 1.0456191466142706e-05, "loss": 0.0075, "step": 744670 }, { "epoch": 1.93, "learning_rate": 1.0452303249771242e-05, "loss": 0.0066, "step": 744680 }, { "epoch": 1.93, "learning_rate": 1.0448415033399777e-05, "loss": 0.0063, "step": 744690 }, { "epoch": 1.93, "learning_rate": 1.0444526817028314e-05, "loss": 0.0058, "step": 744700 }, { "epoch": 1.93, "learning_rate": 1.0440638600656849e-05, "loss": 0.0066, "step": 744710 }, { "epoch": 1.93, "learning_rate": 1.0436750384285385e-05, "loss": 0.009, "step": 744720 }, { "epoch": 1.93, "learning_rate": 1.0432862167913918e-05, "loss": 0.0064, "step": 744730 }, { "epoch": 1.93, "learning_rate": 1.0428973951542455e-05, "loss": 0.0067, "step": 744740 }, { "epoch": 1.93, "learning_rate": 1.042508573517099e-05, "loss": 0.0058, "step": 744750 }, { "epoch": 1.93, "learning_rate": 1.0421197518799526e-05, "loss": 0.0054, "step": 744760 }, { "epoch": 1.93, "learning_rate": 1.0417309302428061e-05, "loss": 0.0059, "step": 744770 }, { "epoch": 1.93, "learning_rate": 1.0413421086056598e-05, "loss": 0.0053, "step": 744780 }, { "epoch": 1.93, "learning_rate": 1.040953286968513e-05, "loss": 0.0068, "step": 744790 }, { "epoch": 1.93, "learning_rate": 1.0405644653313666e-05, "loss": 0.0064, "step": 744800 }, { "epoch": 1.93, "learning_rate": 1.0401756436942202e-05, "loss": 0.0066, "step": 744810 }, { "epoch": 1.93, "learning_rate": 1.0397868220570737e-05, "loss": 0.0051, "step": 744820 }, { "epoch": 1.93, "learning_rate": 1.0393980004199274e-05, "loss": 0.0066, "step": 744830 }, { "epoch": 1.93, "learning_rate": 1.0390091787827808e-05, "loss": 0.0068, "step": 744840 }, { "epoch": 1.93, "learning_rate": 1.0386203571456343e-05, "loss": 0.0059, "step": 744850 }, { "epoch": 1.93, "learning_rate": 1.0382315355084878e-05, "loss": 0.0071, "step": 744860 }, { "epoch": 1.93, "learning_rate": 1.0378427138713415e-05, "loss": 0.0071, "step": 744870 }, { "epoch": 1.93, "learning_rate": 1.037453892234195e-05, "loss": 0.0061, "step": 744880 }, { "epoch": 1.93, "learning_rate": 1.0370650705970484e-05, "loss": 0.0059, "step": 744890 }, { "epoch": 1.93, "learning_rate": 1.0366762489599021e-05, "loss": 0.0071, "step": 744900 }, { "epoch": 1.93, "learning_rate": 1.0362874273227554e-05, "loss": 0.0079, "step": 744910 }, { "epoch": 1.93, "learning_rate": 1.035898605685609e-05, "loss": 0.0069, "step": 744920 }, { "epoch": 1.93, "learning_rate": 1.0355097840484626e-05, "loss": 0.0056, "step": 744930 }, { "epoch": 1.93, "learning_rate": 1.0351209624113162e-05, "loss": 0.0048, "step": 744940 }, { "epoch": 1.93, "learning_rate": 1.0347321407741697e-05, "loss": 0.0074, "step": 744950 }, { "epoch": 1.93, "learning_rate": 1.0343433191370234e-05, "loss": 0.0054, "step": 744960 }, { "epoch": 1.93, "learning_rate": 1.0339544974998768e-05, "loss": 0.0064, "step": 744970 }, { "epoch": 1.93, "learning_rate": 1.0335656758627302e-05, "loss": 0.0092, "step": 744980 }, { "epoch": 1.93, "learning_rate": 1.0331768542255838e-05, "loss": 0.0072, "step": 744990 }, { "epoch": 1.93, "learning_rate": 1.0327880325884373e-05, "loss": 0.0089, "step": 745000 }, { "epoch": 1.93, "eval_cer": 0.8816620968520765, "eval_loss": 0.0044491966255009174, "eval_runtime": 107.8288, "eval_samples_per_second": 18.548, "eval_steps_per_second": 4.637, "step": 745000 }, { "epoch": 1.93, "learning_rate": 1.032399210951291e-05, "loss": 0.0082, "step": 745010 }, { "epoch": 1.93, "learning_rate": 1.0320103893141444e-05, "loss": 0.0073, "step": 745020 }, { "epoch": 1.93, "learning_rate": 1.0316215676769981e-05, "loss": 0.0064, "step": 745030 }, { "epoch": 1.93, "learning_rate": 1.0312327460398514e-05, "loss": 0.0047, "step": 745040 }, { "epoch": 1.93, "learning_rate": 1.030843924402705e-05, "loss": 0.0069, "step": 745050 }, { "epoch": 1.93, "learning_rate": 1.0304551027655586e-05, "loss": 0.007, "step": 745060 }, { "epoch": 1.93, "learning_rate": 1.0300662811284122e-05, "loss": 0.0083, "step": 745070 }, { "epoch": 1.93, "learning_rate": 1.0296774594912657e-05, "loss": 0.0086, "step": 745080 }, { "epoch": 1.93, "learning_rate": 1.0292886378541194e-05, "loss": 0.007, "step": 745090 }, { "epoch": 1.93, "learning_rate": 1.0288998162169727e-05, "loss": 0.0079, "step": 745100 }, { "epoch": 1.93, "learning_rate": 1.0285109945798262e-05, "loss": 0.0069, "step": 745110 }, { "epoch": 1.93, "learning_rate": 1.0281221729426798e-05, "loss": 0.0062, "step": 745120 }, { "epoch": 1.93, "learning_rate": 1.0277333513055333e-05, "loss": 0.0048, "step": 745130 }, { "epoch": 1.93, "learning_rate": 1.027344529668387e-05, "loss": 0.006, "step": 745140 }, { "epoch": 1.93, "learning_rate": 1.0269557080312404e-05, "loss": 0.0075, "step": 745150 }, { "epoch": 1.93, "learning_rate": 1.026566886394094e-05, "loss": 0.0087, "step": 745160 }, { "epoch": 1.93, "learning_rate": 1.0261780647569474e-05, "loss": 0.0104, "step": 745170 }, { "epoch": 1.93, "learning_rate": 1.025789243119801e-05, "loss": 0.007, "step": 745180 }, { "epoch": 1.93, "learning_rate": 1.0254004214826546e-05, "loss": 0.0054, "step": 745190 }, { "epoch": 1.93, "learning_rate": 1.0250115998455082e-05, "loss": 0.0078, "step": 745200 }, { "epoch": 1.93, "learning_rate": 1.0246227782083617e-05, "loss": 0.0059, "step": 745210 }, { "epoch": 1.93, "learning_rate": 1.024233956571215e-05, "loss": 0.0088, "step": 745220 }, { "epoch": 1.93, "learning_rate": 1.0238451349340687e-05, "loss": 0.008, "step": 745230 }, { "epoch": 1.93, "learning_rate": 1.0234563132969222e-05, "loss": 0.0075, "step": 745240 }, { "epoch": 1.93, "learning_rate": 1.0230674916597758e-05, "loss": 0.0077, "step": 745250 }, { "epoch": 1.93, "learning_rate": 1.0226786700226293e-05, "loss": 0.0063, "step": 745260 }, { "epoch": 1.93, "learning_rate": 1.022289848385483e-05, "loss": 0.0122, "step": 745270 }, { "epoch": 1.93, "learning_rate": 1.0219010267483364e-05, "loss": 0.0063, "step": 745280 }, { "epoch": 1.93, "learning_rate": 1.02151220511119e-05, "loss": 0.0076, "step": 745290 }, { "epoch": 1.93, "learning_rate": 1.0211233834740434e-05, "loss": 0.0049, "step": 745300 }, { "epoch": 1.93, "learning_rate": 1.020734561836897e-05, "loss": 0.0075, "step": 745310 }, { "epoch": 1.93, "learning_rate": 1.0203457401997506e-05, "loss": 0.0056, "step": 745320 }, { "epoch": 1.93, "learning_rate": 1.0199569185626042e-05, "loss": 0.008, "step": 745330 }, { "epoch": 1.93, "learning_rate": 1.0195680969254577e-05, "loss": 0.0074, "step": 745340 }, { "epoch": 1.93, "learning_rate": 1.019179275288311e-05, "loss": 0.0076, "step": 745350 }, { "epoch": 1.93, "learning_rate": 1.0187904536511647e-05, "loss": 0.005, "step": 745360 }, { "epoch": 1.93, "learning_rate": 1.0184016320140182e-05, "loss": 0.0087, "step": 745370 }, { "epoch": 1.93, "learning_rate": 1.0180128103768718e-05, "loss": 0.0068, "step": 745380 }, { "epoch": 1.93, "learning_rate": 1.0176239887397253e-05, "loss": 0.0081, "step": 745390 }, { "epoch": 1.93, "learning_rate": 1.017235167102579e-05, "loss": 0.007, "step": 745400 }, { "epoch": 1.93, "learning_rate": 1.0168463454654323e-05, "loss": 0.0064, "step": 745410 }, { "epoch": 1.93, "learning_rate": 1.016457523828286e-05, "loss": 0.0076, "step": 745420 }, { "epoch": 1.93, "learning_rate": 1.0160687021911394e-05, "loss": 0.0112, "step": 745430 }, { "epoch": 1.93, "learning_rate": 1.015679880553993e-05, "loss": 0.0083, "step": 745440 }, { "epoch": 1.93, "learning_rate": 1.0152910589168466e-05, "loss": 0.0088, "step": 745450 }, { "epoch": 1.93, "learning_rate": 1.0149022372797002e-05, "loss": 0.0073, "step": 745460 }, { "epoch": 1.93, "learning_rate": 1.0145134156425535e-05, "loss": 0.005, "step": 745470 }, { "epoch": 1.93, "learning_rate": 1.014124594005407e-05, "loss": 0.007, "step": 745480 }, { "epoch": 1.93, "learning_rate": 1.0137357723682607e-05, "loss": 0.0051, "step": 745490 }, { "epoch": 1.93, "learning_rate": 1.0133469507311142e-05, "loss": 0.0094, "step": 745500 }, { "epoch": 1.93, "learning_rate": 1.0129581290939678e-05, "loss": 0.008, "step": 745510 }, { "epoch": 1.93, "learning_rate": 1.0125693074568213e-05, "loss": 0.0062, "step": 745520 }, { "epoch": 1.93, "learning_rate": 1.0121804858196748e-05, "loss": 0.0059, "step": 745530 }, { "epoch": 1.93, "learning_rate": 1.0117916641825283e-05, "loss": 0.0078, "step": 745540 }, { "epoch": 1.93, "learning_rate": 1.011402842545382e-05, "loss": 0.0057, "step": 745550 }, { "epoch": 1.93, "learning_rate": 1.0110140209082354e-05, "loss": 0.0053, "step": 745560 }, { "epoch": 1.93, "learning_rate": 1.010625199271089e-05, "loss": 0.0051, "step": 745570 }, { "epoch": 1.93, "learning_rate": 1.0102363776339426e-05, "loss": 0.008, "step": 745580 }, { "epoch": 1.93, "learning_rate": 1.009847555996796e-05, "loss": 0.0074, "step": 745590 }, { "epoch": 1.93, "learning_rate": 1.0094587343596495e-05, "loss": 0.0079, "step": 745600 }, { "epoch": 1.93, "learning_rate": 1.009069912722503e-05, "loss": 0.0078, "step": 745610 }, { "epoch": 1.93, "learning_rate": 1.0086810910853567e-05, "loss": 0.006, "step": 745620 }, { "epoch": 1.93, "learning_rate": 1.0082922694482102e-05, "loss": 0.0073, "step": 745630 }, { "epoch": 1.93, "learning_rate": 1.0079034478110638e-05, "loss": 0.0059, "step": 745640 }, { "epoch": 1.93, "learning_rate": 1.0075146261739173e-05, "loss": 0.0099, "step": 745650 }, { "epoch": 1.93, "learning_rate": 1.0071258045367706e-05, "loss": 0.0047, "step": 745660 }, { "epoch": 1.93, "learning_rate": 1.0067369828996243e-05, "loss": 0.0059, "step": 745670 }, { "epoch": 1.93, "learning_rate": 1.0063481612624778e-05, "loss": 0.0077, "step": 745680 }, { "epoch": 1.93, "learning_rate": 1.0059593396253314e-05, "loss": 0.0068, "step": 745690 }, { "epoch": 1.93, "learning_rate": 1.0055705179881849e-05, "loss": 0.0078, "step": 745700 }, { "epoch": 1.93, "learning_rate": 1.0051816963510385e-05, "loss": 0.0076, "step": 745710 }, { "epoch": 1.93, "learning_rate": 1.0047928747138919e-05, "loss": 0.0067, "step": 745720 }, { "epoch": 1.93, "learning_rate": 1.0044040530767455e-05, "loss": 0.0072, "step": 745730 }, { "epoch": 1.93, "learning_rate": 1.004015231439599e-05, "loss": 0.006, "step": 745740 }, { "epoch": 1.93, "learning_rate": 1.0036264098024527e-05, "loss": 0.0058, "step": 745750 }, { "epoch": 1.93, "learning_rate": 1.0032375881653061e-05, "loss": 0.0047, "step": 745760 }, { "epoch": 1.93, "learning_rate": 1.0028487665281598e-05, "loss": 0.0062, "step": 745770 }, { "epoch": 1.93, "learning_rate": 1.0024599448910131e-05, "loss": 0.0119, "step": 745780 }, { "epoch": 1.93, "learning_rate": 1.0020711232538666e-05, "loss": 0.0061, "step": 745790 }, { "epoch": 1.93, "learning_rate": 1.0016823016167203e-05, "loss": 0.009, "step": 745800 }, { "epoch": 1.93, "learning_rate": 1.0012934799795737e-05, "loss": 0.004, "step": 745810 }, { "epoch": 1.93, "learning_rate": 1.0009046583424274e-05, "loss": 0.0068, "step": 745820 }, { "epoch": 1.93, "learning_rate": 1.0005158367052809e-05, "loss": 0.0066, "step": 745830 }, { "epoch": 1.93, "learning_rate": 1.0001270150681344e-05, "loss": 0.0059, "step": 745840 }, { "epoch": 1.93, "learning_rate": 9.997381934309879e-06, "loss": 0.0071, "step": 745850 }, { "epoch": 1.93, "learning_rate": 9.993493717938415e-06, "loss": 0.0057, "step": 745860 }, { "epoch": 1.93, "learning_rate": 9.98960550156695e-06, "loss": 0.0103, "step": 745870 }, { "epoch": 1.93, "learning_rate": 9.985717285195487e-06, "loss": 0.0073, "step": 745880 }, { "epoch": 1.93, "learning_rate": 9.981829068824021e-06, "loss": 0.0093, "step": 745890 }, { "epoch": 1.93, "learning_rate": 9.977940852452558e-06, "loss": 0.007, "step": 745900 }, { "epoch": 1.93, "learning_rate": 9.974052636081091e-06, "loss": 0.009, "step": 745910 }, { "epoch": 1.93, "learning_rate": 9.970164419709626e-06, "loss": 0.008, "step": 745920 }, { "epoch": 1.93, "learning_rate": 9.966276203338163e-06, "loss": 0.0082, "step": 745930 }, { "epoch": 1.93, "learning_rate": 9.962387986966697e-06, "loss": 0.0066, "step": 745940 }, { "epoch": 1.93, "learning_rate": 9.958499770595234e-06, "loss": 0.0061, "step": 745950 }, { "epoch": 1.93, "learning_rate": 9.954611554223769e-06, "loss": 0.0054, "step": 745960 }, { "epoch": 1.93, "learning_rate": 9.950723337852304e-06, "loss": 0.0055, "step": 745970 }, { "epoch": 1.93, "learning_rate": 9.946835121480839e-06, "loss": 0.0091, "step": 745980 }, { "epoch": 1.93, "learning_rate": 9.942946905109375e-06, "loss": 0.0091, "step": 745990 }, { "epoch": 1.93, "learning_rate": 9.93905868873791e-06, "loss": 0.0067, "step": 746000 }, { "epoch": 1.93, "eval_cer": 0.8816802921322209, "eval_loss": 0.004460540134459734, "eval_runtime": 107.8774, "eval_samples_per_second": 18.54, "eval_steps_per_second": 4.635, "step": 746000 }, { "epoch": 1.93, "learning_rate": 9.935170472366447e-06, "loss": 0.006, "step": 746010 }, { "epoch": 1.93, "learning_rate": 9.931282255994981e-06, "loss": 0.0063, "step": 746020 }, { "epoch": 1.93, "learning_rate": 9.927394039623515e-06, "loss": 0.0051, "step": 746030 }, { "epoch": 1.93, "learning_rate": 9.923505823252051e-06, "loss": 0.0071, "step": 746040 }, { "epoch": 1.93, "learning_rate": 9.919617606880586e-06, "loss": 0.0056, "step": 746050 }, { "epoch": 1.93, "learning_rate": 9.915729390509123e-06, "loss": 0.0052, "step": 746060 }, { "epoch": 1.93, "learning_rate": 9.911841174137657e-06, "loss": 0.0068, "step": 746070 }, { "epoch": 1.93, "learning_rate": 9.907952957766194e-06, "loss": 0.0074, "step": 746080 }, { "epoch": 1.93, "learning_rate": 9.904064741394727e-06, "loss": 0.0048, "step": 746090 }, { "epoch": 1.93, "learning_rate": 9.900176525023264e-06, "loss": 0.0074, "step": 746100 }, { "epoch": 1.93, "learning_rate": 9.896288308651799e-06, "loss": 0.0055, "step": 746110 }, { "epoch": 1.93, "learning_rate": 9.892400092280335e-06, "loss": 0.0046, "step": 746120 }, { "epoch": 1.93, "learning_rate": 9.88851187590887e-06, "loss": 0.0057, "step": 746130 }, { "epoch": 1.93, "learning_rate": 9.884623659537407e-06, "loss": 0.0089, "step": 746140 }, { "epoch": 1.93, "learning_rate": 9.88073544316594e-06, "loss": 0.0096, "step": 746150 }, { "epoch": 1.93, "learning_rate": 9.876847226794475e-06, "loss": 0.008, "step": 746160 }, { "epoch": 1.93, "learning_rate": 9.872959010423011e-06, "loss": 0.0114, "step": 746170 }, { "epoch": 1.93, "learning_rate": 9.869070794051546e-06, "loss": 0.0065, "step": 746180 }, { "epoch": 1.93, "learning_rate": 9.865182577680083e-06, "loss": 0.0072, "step": 746190 }, { "epoch": 1.93, "learning_rate": 9.861294361308617e-06, "loss": 0.0087, "step": 746200 }, { "epoch": 1.93, "learning_rate": 9.857406144937154e-06, "loss": 0.0061, "step": 746210 }, { "epoch": 1.93, "learning_rate": 9.853517928565687e-06, "loss": 0.0055, "step": 746220 }, { "epoch": 1.93, "learning_rate": 9.849629712194224e-06, "loss": 0.0096, "step": 746230 }, { "epoch": 1.93, "learning_rate": 9.845741495822759e-06, "loss": 0.0054, "step": 746240 }, { "epoch": 1.93, "learning_rate": 9.841853279451295e-06, "loss": 0.01, "step": 746250 }, { "epoch": 1.93, "learning_rate": 9.83796506307983e-06, "loss": 0.0056, "step": 746260 }, { "epoch": 1.93, "learning_rate": 9.834076846708365e-06, "loss": 0.007, "step": 746270 }, { "epoch": 1.93, "learning_rate": 9.8301886303369e-06, "loss": 0.0062, "step": 746280 }, { "epoch": 1.93, "learning_rate": 9.826300413965435e-06, "loss": 0.0081, "step": 746290 }, { "epoch": 1.93, "learning_rate": 9.822412197593971e-06, "loss": 0.0092, "step": 746300 }, { "epoch": 1.93, "learning_rate": 9.818523981222506e-06, "loss": 0.0095, "step": 746310 }, { "epoch": 1.93, "learning_rate": 9.814635764851043e-06, "loss": 0.0099, "step": 746320 }, { "epoch": 1.93, "learning_rate": 9.810747548479577e-06, "loss": 0.0058, "step": 746330 }, { "epoch": 1.93, "learning_rate": 9.80685933210811e-06, "loss": 0.0079, "step": 746340 }, { "epoch": 1.93, "learning_rate": 9.802971115736647e-06, "loss": 0.007, "step": 746350 }, { "epoch": 1.93, "learning_rate": 9.799082899365182e-06, "loss": 0.0077, "step": 746360 }, { "epoch": 1.93, "learning_rate": 9.795194682993719e-06, "loss": 0.005, "step": 746370 }, { "epoch": 1.93, "learning_rate": 9.791306466622253e-06, "loss": 0.0102, "step": 746380 }, { "epoch": 1.93, "learning_rate": 9.78741825025079e-06, "loss": 0.0061, "step": 746390 }, { "epoch": 1.93, "learning_rate": 9.783530033879323e-06, "loss": 0.0107, "step": 746400 }, { "epoch": 1.93, "learning_rate": 9.77964181750786e-06, "loss": 0.0076, "step": 746410 }, { "epoch": 1.93, "learning_rate": 9.775753601136395e-06, "loss": 0.0102, "step": 746420 }, { "epoch": 1.93, "learning_rate": 9.771865384764931e-06, "loss": 0.0104, "step": 746430 }, { "epoch": 1.93, "learning_rate": 9.767977168393466e-06, "loss": 0.0066, "step": 746440 }, { "epoch": 1.93, "learning_rate": 9.764088952022003e-06, "loss": 0.0085, "step": 746450 }, { "epoch": 1.93, "learning_rate": 9.760200735650536e-06, "loss": 0.0047, "step": 746460 }, { "epoch": 1.93, "learning_rate": 9.75631251927907e-06, "loss": 0.0065, "step": 746470 }, { "epoch": 1.93, "learning_rate": 9.752424302907607e-06, "loss": 0.0066, "step": 746480 }, { "epoch": 1.94, "learning_rate": 9.748536086536142e-06, "loss": 0.0062, "step": 746490 }, { "epoch": 1.94, "learning_rate": 9.744647870164679e-06, "loss": 0.0074, "step": 746500 }, { "epoch": 1.94, "learning_rate": 9.740759653793213e-06, "loss": 0.006, "step": 746510 }, { "epoch": 1.94, "learning_rate": 9.73687143742175e-06, "loss": 0.0057, "step": 746520 }, { "epoch": 1.94, "learning_rate": 9.732983221050283e-06, "loss": 0.0065, "step": 746530 }, { "epoch": 1.94, "learning_rate": 9.72909500467882e-06, "loss": 0.0067, "step": 746540 }, { "epoch": 1.94, "learning_rate": 9.725206788307355e-06, "loss": 0.0089, "step": 746550 }, { "epoch": 1.94, "learning_rate": 9.721318571935891e-06, "loss": 0.0064, "step": 746560 }, { "epoch": 1.94, "learning_rate": 9.717430355564426e-06, "loss": 0.0072, "step": 746570 }, { "epoch": 1.94, "learning_rate": 9.713542139192962e-06, "loss": 0.0059, "step": 746580 }, { "epoch": 1.94, "learning_rate": 9.709653922821496e-06, "loss": 0.0106, "step": 746590 }, { "epoch": 1.94, "learning_rate": 9.70576570645003e-06, "loss": 0.0064, "step": 746600 }, { "epoch": 1.94, "learning_rate": 9.701877490078567e-06, "loss": 0.0067, "step": 746610 }, { "epoch": 1.94, "learning_rate": 9.697989273707102e-06, "loss": 0.008, "step": 746620 }, { "epoch": 1.94, "learning_rate": 9.694101057335638e-06, "loss": 0.0114, "step": 746630 }, { "epoch": 1.94, "learning_rate": 9.690212840964173e-06, "loss": 0.0054, "step": 746640 }, { "epoch": 1.94, "learning_rate": 9.686324624592708e-06, "loss": 0.0073, "step": 746650 }, { "epoch": 1.94, "learning_rate": 9.682436408221243e-06, "loss": 0.006, "step": 746660 }, { "epoch": 1.94, "learning_rate": 9.67854819184978e-06, "loss": 0.0062, "step": 746670 }, { "epoch": 1.94, "learning_rate": 9.674659975478314e-06, "loss": 0.0076, "step": 746680 }, { "epoch": 1.94, "learning_rate": 9.670771759106851e-06, "loss": 0.0073, "step": 746690 }, { "epoch": 1.94, "learning_rate": 9.666883542735386e-06, "loss": 0.0089, "step": 746700 }, { "epoch": 1.94, "learning_rate": 9.662995326363919e-06, "loss": 0.0086, "step": 746710 }, { "epoch": 1.94, "learning_rate": 9.659107109992456e-06, "loss": 0.0053, "step": 746720 }, { "epoch": 1.94, "learning_rate": 9.65521889362099e-06, "loss": 0.0053, "step": 746730 }, { "epoch": 1.94, "learning_rate": 9.651330677249527e-06, "loss": 0.0104, "step": 746740 }, { "epoch": 1.94, "learning_rate": 9.647442460878062e-06, "loss": 0.0067, "step": 746750 }, { "epoch": 1.94, "learning_rate": 9.643554244506598e-06, "loss": 0.0074, "step": 746760 }, { "epoch": 1.94, "learning_rate": 9.639666028135132e-06, "loss": 0.0064, "step": 746770 }, { "epoch": 1.94, "learning_rate": 9.635777811763668e-06, "loss": 0.0061, "step": 746780 }, { "epoch": 1.94, "learning_rate": 9.631889595392203e-06, "loss": 0.0065, "step": 746790 }, { "epoch": 1.94, "learning_rate": 9.62800137902074e-06, "loss": 0.0067, "step": 746800 }, { "epoch": 1.94, "learning_rate": 9.624113162649274e-06, "loss": 0.0063, "step": 746810 }, { "epoch": 1.94, "learning_rate": 9.620224946277811e-06, "loss": 0.0052, "step": 746820 }, { "epoch": 1.94, "learning_rate": 9.616336729906346e-06, "loss": 0.0071, "step": 746830 }, { "epoch": 1.94, "learning_rate": 9.612448513534879e-06, "loss": 0.0083, "step": 746840 }, { "epoch": 1.94, "learning_rate": 9.608560297163416e-06, "loss": 0.0076, "step": 746850 }, { "epoch": 1.94, "learning_rate": 9.60467208079195e-06, "loss": 0.0047, "step": 746860 }, { "epoch": 1.94, "learning_rate": 9.600783864420487e-06, "loss": 0.0092, "step": 746870 }, { "epoch": 1.94, "learning_rate": 9.596895648049022e-06, "loss": 0.0069, "step": 746880 }, { "epoch": 1.94, "learning_rate": 9.593007431677558e-06, "loss": 0.0087, "step": 746890 }, { "epoch": 1.94, "learning_rate": 9.589119215306092e-06, "loss": 0.0089, "step": 746900 }, { "epoch": 1.94, "learning_rate": 9.585230998934628e-06, "loss": 0.0075, "step": 746910 }, { "epoch": 1.94, "learning_rate": 9.581342782563163e-06, "loss": 0.0062, "step": 746920 }, { "epoch": 1.94, "learning_rate": 9.5774545661917e-06, "loss": 0.0079, "step": 746930 }, { "epoch": 1.94, "learning_rate": 9.573566349820234e-06, "loss": 0.0065, "step": 746940 }, { "epoch": 1.94, "learning_rate": 9.569678133448771e-06, "loss": 0.0088, "step": 746950 }, { "epoch": 1.94, "learning_rate": 9.565789917077304e-06, "loss": 0.0065, "step": 746960 }, { "epoch": 1.94, "learning_rate": 9.561901700705839e-06, "loss": 0.007, "step": 746970 }, { "epoch": 1.94, "learning_rate": 9.558013484334376e-06, "loss": 0.0051, "step": 746980 }, { "epoch": 1.94, "learning_rate": 9.55412526796291e-06, "loss": 0.009, "step": 746990 }, { "epoch": 1.94, "learning_rate": 9.550237051591447e-06, "loss": 0.0055, "step": 747000 }, { "epoch": 1.94, "eval_cer": 0.8816760932214184, "eval_loss": 0.0044586677104234695, "eval_runtime": 107.824, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 747000 }, { "epoch": 1.94, "learning_rate": 9.546348835219982e-06, "loss": 0.0108, "step": 747010 }, { "epoch": 1.94, "learning_rate": 9.542460618848515e-06, "loss": 0.0068, "step": 747020 }, { "epoch": 1.94, "learning_rate": 9.538572402477052e-06, "loss": 0.0128, "step": 747030 }, { "epoch": 1.94, "learning_rate": 9.534684186105586e-06, "loss": 0.0101, "step": 747040 }, { "epoch": 1.94, "learning_rate": 9.530795969734123e-06, "loss": 0.008, "step": 747050 }, { "epoch": 1.94, "learning_rate": 9.526907753362658e-06, "loss": 0.0068, "step": 747060 }, { "epoch": 1.94, "learning_rate": 9.523019536991194e-06, "loss": 0.007, "step": 747070 }, { "epoch": 1.94, "learning_rate": 9.51913132061973e-06, "loss": 0.0146, "step": 747080 }, { "epoch": 1.94, "learning_rate": 9.515243104248264e-06, "loss": 0.0066, "step": 747090 }, { "epoch": 1.94, "learning_rate": 9.511354887876799e-06, "loss": 0.0061, "step": 747100 }, { "epoch": 1.94, "learning_rate": 9.507466671505336e-06, "loss": 0.0091, "step": 747110 }, { "epoch": 1.94, "learning_rate": 9.50357845513387e-06, "loss": 0.0046, "step": 747120 }, { "epoch": 1.94, "learning_rate": 9.499690238762407e-06, "loss": 0.007, "step": 747130 }, { "epoch": 1.94, "learning_rate": 9.495802022390942e-06, "loss": 0.0059, "step": 747140 }, { "epoch": 1.94, "learning_rate": 9.491913806019475e-06, "loss": 0.0059, "step": 747150 }, { "epoch": 1.94, "learning_rate": 9.488025589648012e-06, "loss": 0.0054, "step": 747160 }, { "epoch": 1.94, "learning_rate": 9.484137373276546e-06, "loss": 0.0053, "step": 747170 }, { "epoch": 1.94, "learning_rate": 9.480249156905083e-06, "loss": 0.0058, "step": 747180 }, { "epoch": 1.94, "learning_rate": 9.476360940533618e-06, "loss": 0.0071, "step": 747190 }, { "epoch": 1.94, "learning_rate": 9.472472724162154e-06, "loss": 0.0065, "step": 747200 }, { "epoch": 1.94, "learning_rate": 9.468584507790688e-06, "loss": 0.0065, "step": 747210 }, { "epoch": 1.94, "learning_rate": 9.464696291419224e-06, "loss": 0.0073, "step": 747220 }, { "epoch": 1.94, "learning_rate": 9.460808075047759e-06, "loss": 0.0105, "step": 747230 }, { "epoch": 1.94, "learning_rate": 9.456919858676296e-06, "loss": 0.008, "step": 747240 }, { "epoch": 1.94, "learning_rate": 9.45303164230483e-06, "loss": 0.0051, "step": 747250 }, { "epoch": 1.94, "learning_rate": 9.449143425933367e-06, "loss": 0.0078, "step": 747260 }, { "epoch": 1.94, "learning_rate": 9.4452552095619e-06, "loss": 0.0077, "step": 747270 }, { "epoch": 1.94, "learning_rate": 9.441366993190435e-06, "loss": 0.0086, "step": 747280 }, { "epoch": 1.94, "learning_rate": 9.437478776818972e-06, "loss": 0.0076, "step": 747290 }, { "epoch": 1.94, "learning_rate": 9.433590560447506e-06, "loss": 0.0059, "step": 747300 }, { "epoch": 1.94, "learning_rate": 9.429702344076043e-06, "loss": 0.0054, "step": 747310 }, { "epoch": 1.94, "learning_rate": 9.425814127704578e-06, "loss": 0.0067, "step": 747320 }, { "epoch": 1.94, "learning_rate": 9.421925911333113e-06, "loss": 0.0072, "step": 747330 }, { "epoch": 1.94, "learning_rate": 9.418037694961648e-06, "loss": 0.0082, "step": 747340 }, { "epoch": 1.94, "learning_rate": 9.414149478590184e-06, "loss": 0.0079, "step": 747350 }, { "epoch": 1.94, "learning_rate": 9.410261262218719e-06, "loss": 0.0066, "step": 747360 }, { "epoch": 1.94, "learning_rate": 9.406373045847256e-06, "loss": 0.0068, "step": 747370 }, { "epoch": 1.94, "learning_rate": 9.40248482947579e-06, "loss": 0.0066, "step": 747380 }, { "epoch": 1.94, "learning_rate": 9.398596613104327e-06, "loss": 0.0045, "step": 747390 }, { "epoch": 1.94, "learning_rate": 9.39470839673286e-06, "loss": 0.0063, "step": 747400 }, { "epoch": 1.94, "learning_rate": 9.390820180361395e-06, "loss": 0.0082, "step": 747410 }, { "epoch": 1.94, "learning_rate": 9.386931963989932e-06, "loss": 0.0056, "step": 747420 }, { "epoch": 1.94, "learning_rate": 9.383043747618466e-06, "loss": 0.0075, "step": 747430 }, { "epoch": 1.94, "learning_rate": 9.379155531247003e-06, "loss": 0.0075, "step": 747440 }, { "epoch": 1.94, "learning_rate": 9.375267314875538e-06, "loss": 0.0065, "step": 747450 }, { "epoch": 1.94, "learning_rate": 9.371379098504073e-06, "loss": 0.006, "step": 747460 }, { "epoch": 1.94, "learning_rate": 9.367490882132608e-06, "loss": 0.0081, "step": 747470 }, { "epoch": 1.94, "learning_rate": 9.363602665761144e-06, "loss": 0.0068, "step": 747480 }, { "epoch": 1.94, "learning_rate": 9.359714449389679e-06, "loss": 0.0058, "step": 747490 }, { "epoch": 1.94, "learning_rate": 9.355826233018214e-06, "loss": 0.008, "step": 747500 }, { "epoch": 1.94, "learning_rate": 9.351938016646749e-06, "loss": 0.007, "step": 747510 }, { "epoch": 1.94, "learning_rate": 9.348049800275285e-06, "loss": 0.0068, "step": 747520 }, { "epoch": 1.94, "learning_rate": 9.34416158390382e-06, "loss": 0.0048, "step": 747530 }, { "epoch": 1.94, "learning_rate": 9.340273367532355e-06, "loss": 0.0053, "step": 747540 }, { "epoch": 1.94, "learning_rate": 9.336385151160891e-06, "loss": 0.0078, "step": 747550 }, { "epoch": 1.94, "learning_rate": 9.332496934789426e-06, "loss": 0.0071, "step": 747560 }, { "epoch": 1.94, "learning_rate": 9.328608718417961e-06, "loss": 0.0092, "step": 747570 }, { "epoch": 1.94, "learning_rate": 9.324720502046498e-06, "loss": 0.0071, "step": 747580 }, { "epoch": 1.94, "learning_rate": 9.320832285675033e-06, "loss": 0.0065, "step": 747590 }, { "epoch": 1.94, "learning_rate": 9.316944069303567e-06, "loss": 0.0076, "step": 747600 }, { "epoch": 1.94, "learning_rate": 9.313055852932104e-06, "loss": 0.006, "step": 747610 }, { "epoch": 1.94, "learning_rate": 9.309167636560639e-06, "loss": 0.0062, "step": 747620 }, { "epoch": 1.94, "learning_rate": 9.305279420189174e-06, "loss": 0.0039, "step": 747630 }, { "epoch": 1.94, "learning_rate": 9.301391203817709e-06, "loss": 0.0067, "step": 747640 }, { "epoch": 1.94, "learning_rate": 9.297502987446245e-06, "loss": 0.0082, "step": 747650 }, { "epoch": 1.94, "learning_rate": 9.29361477107478e-06, "loss": 0.0105, "step": 747660 }, { "epoch": 1.94, "learning_rate": 9.289726554703315e-06, "loss": 0.0062, "step": 747670 }, { "epoch": 1.94, "learning_rate": 9.285838338331851e-06, "loss": 0.0078, "step": 747680 }, { "epoch": 1.94, "learning_rate": 9.281950121960386e-06, "loss": 0.0082, "step": 747690 }, { "epoch": 1.94, "learning_rate": 9.278061905588921e-06, "loss": 0.0072, "step": 747700 }, { "epoch": 1.94, "learning_rate": 9.274173689217458e-06, "loss": 0.0099, "step": 747710 }, { "epoch": 1.94, "learning_rate": 9.270285472845991e-06, "loss": 0.0069, "step": 747720 }, { "epoch": 1.94, "learning_rate": 9.266397256474527e-06, "loss": 0.0076, "step": 747730 }, { "epoch": 1.94, "learning_rate": 9.262509040103062e-06, "loss": 0.0063, "step": 747740 }, { "epoch": 1.94, "learning_rate": 9.258620823731597e-06, "loss": 0.0063, "step": 747750 }, { "epoch": 1.94, "learning_rate": 9.254732607360134e-06, "loss": 0.0053, "step": 747760 }, { "epoch": 1.94, "learning_rate": 9.250844390988669e-06, "loss": 0.0099, "step": 747770 }, { "epoch": 1.94, "learning_rate": 9.246956174617203e-06, "loss": 0.0063, "step": 747780 }, { "epoch": 1.94, "learning_rate": 9.24306795824574e-06, "loss": 0.0085, "step": 747790 }, { "epoch": 1.94, "learning_rate": 9.239179741874275e-06, "loss": 0.0064, "step": 747800 }, { "epoch": 1.94, "learning_rate": 9.23529152550281e-06, "loss": 0.0062, "step": 747810 }, { "epoch": 1.94, "learning_rate": 9.231403309131346e-06, "loss": 0.0076, "step": 747820 }, { "epoch": 1.94, "learning_rate": 9.227515092759881e-06, "loss": 0.0047, "step": 747830 }, { "epoch": 1.94, "learning_rate": 9.223626876388416e-06, "loss": 0.0065, "step": 747840 }, { "epoch": 1.94, "learning_rate": 9.219738660016951e-06, "loss": 0.005, "step": 747850 }, { "epoch": 1.94, "learning_rate": 9.215850443645487e-06, "loss": 0.011, "step": 747860 }, { "epoch": 1.94, "learning_rate": 9.211962227274022e-06, "loss": 0.0052, "step": 747870 }, { "epoch": 1.94, "learning_rate": 9.208074010902557e-06, "loss": 0.0053, "step": 747880 }, { "epoch": 1.94, "learning_rate": 9.204185794531094e-06, "loss": 0.0046, "step": 747890 }, { "epoch": 1.94, "learning_rate": 9.200297578159629e-06, "loss": 0.0074, "step": 747900 }, { "epoch": 1.94, "learning_rate": 9.196409361788163e-06, "loss": 0.0063, "step": 747910 }, { "epoch": 1.94, "learning_rate": 9.1925211454167e-06, "loss": 0.0044, "step": 747920 }, { "epoch": 1.94, "learning_rate": 9.188632929045235e-06, "loss": 0.0067, "step": 747930 }, { "epoch": 1.94, "learning_rate": 9.18474471267377e-06, "loss": 0.0081, "step": 747940 }, { "epoch": 1.94, "learning_rate": 9.180856496302306e-06, "loss": 0.0049, "step": 747950 }, { "epoch": 1.94, "learning_rate": 9.176968279930841e-06, "loss": 0.0068, "step": 747960 }, { "epoch": 1.94, "learning_rate": 9.173080063559376e-06, "loss": 0.0049, "step": 747970 }, { "epoch": 1.94, "learning_rate": 9.169191847187911e-06, "loss": 0.0061, "step": 747980 }, { "epoch": 1.94, "learning_rate": 9.165303630816447e-06, "loss": 0.0086, "step": 747990 }, { "epoch": 1.94, "learning_rate": 9.161415414444982e-06, "loss": 0.0062, "step": 748000 }, { "epoch": 1.94, "eval_cer": 0.8816774928583525, "eval_loss": 0.004467161372303963, "eval_runtime": 107.7694, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.64, "step": 748000 }, { "epoch": 1.94, "learning_rate": 9.157527198073517e-06, "loss": 0.0074, "step": 748010 }, { "epoch": 1.94, "learning_rate": 9.153638981702054e-06, "loss": 0.0083, "step": 748020 }, { "epoch": 1.94, "learning_rate": 9.149750765330589e-06, "loss": 0.0077, "step": 748030 }, { "epoch": 1.94, "learning_rate": 9.145862548959123e-06, "loss": 0.0063, "step": 748040 }, { "epoch": 1.94, "learning_rate": 9.14197433258766e-06, "loss": 0.0051, "step": 748050 }, { "epoch": 1.94, "learning_rate": 9.138086116216193e-06, "loss": 0.0089, "step": 748060 }, { "epoch": 1.94, "learning_rate": 9.13419789984473e-06, "loss": 0.0056, "step": 748070 }, { "epoch": 1.94, "learning_rate": 9.130309683473265e-06, "loss": 0.0133, "step": 748080 }, { "epoch": 1.94, "learning_rate": 9.1264214671018e-06, "loss": 0.0096, "step": 748090 }, { "epoch": 1.94, "learning_rate": 9.122533250730336e-06, "loss": 0.0062, "step": 748100 }, { "epoch": 1.94, "learning_rate": 9.11864503435887e-06, "loss": 0.0067, "step": 748110 }, { "epoch": 1.94, "learning_rate": 9.114756817987406e-06, "loss": 0.0072, "step": 748120 }, { "epoch": 1.94, "learning_rate": 9.110868601615942e-06, "loss": 0.006, "step": 748130 }, { "epoch": 1.94, "learning_rate": 9.106980385244477e-06, "loss": 0.0083, "step": 748140 }, { "epoch": 1.94, "learning_rate": 9.103092168873014e-06, "loss": 0.0062, "step": 748150 }, { "epoch": 1.94, "learning_rate": 9.099203952501549e-06, "loss": 0.0074, "step": 748160 }, { "epoch": 1.94, "learning_rate": 9.095315736130083e-06, "loss": 0.0069, "step": 748170 }, { "epoch": 1.94, "learning_rate": 9.09142751975862e-06, "loss": 0.0073, "step": 748180 }, { "epoch": 1.94, "learning_rate": 9.087539303387153e-06, "loss": 0.0079, "step": 748190 }, { "epoch": 1.94, "learning_rate": 9.08365108701569e-06, "loss": 0.0063, "step": 748200 }, { "epoch": 1.94, "learning_rate": 9.079762870644225e-06, "loss": 0.006, "step": 748210 }, { "epoch": 1.94, "learning_rate": 9.07587465427276e-06, "loss": 0.0073, "step": 748220 }, { "epoch": 1.94, "learning_rate": 9.071986437901296e-06, "loss": 0.0069, "step": 748230 }, { "epoch": 1.94, "learning_rate": 9.06809822152983e-06, "loss": 0.0063, "step": 748240 }, { "epoch": 1.94, "learning_rate": 9.064210005158366e-06, "loss": 0.0061, "step": 748250 }, { "epoch": 1.94, "learning_rate": 9.060321788786902e-06, "loss": 0.0069, "step": 748260 }, { "epoch": 1.94, "learning_rate": 9.056433572415437e-06, "loss": 0.0059, "step": 748270 }, { "epoch": 1.94, "learning_rate": 9.052545356043972e-06, "loss": 0.0079, "step": 748280 }, { "epoch": 1.94, "learning_rate": 9.048657139672509e-06, "loss": 0.0058, "step": 748290 }, { "epoch": 1.94, "learning_rate": 9.044768923301043e-06, "loss": 0.0076, "step": 748300 }, { "epoch": 1.94, "learning_rate": 9.040880706929578e-06, "loss": 0.0066, "step": 748310 }, { "epoch": 1.94, "learning_rate": 9.036992490558113e-06, "loss": 0.008, "step": 748320 }, { "epoch": 1.94, "learning_rate": 9.03310427418665e-06, "loss": 0.0044, "step": 748330 }, { "epoch": 1.94, "learning_rate": 9.029216057815185e-06, "loss": 0.0102, "step": 748340 }, { "epoch": 1.94, "learning_rate": 9.02532784144372e-06, "loss": 0.0048, "step": 748350 }, { "epoch": 1.94, "learning_rate": 9.021439625072256e-06, "loss": 0.0076, "step": 748360 }, { "epoch": 1.94, "learning_rate": 9.01755140870079e-06, "loss": 0.0052, "step": 748370 }, { "epoch": 1.94, "learning_rate": 9.013663192329326e-06, "loss": 0.0068, "step": 748380 }, { "epoch": 1.94, "learning_rate": 9.009774975957862e-06, "loss": 0.007, "step": 748390 }, { "epoch": 1.94, "learning_rate": 9.005886759586395e-06, "loss": 0.0057, "step": 748400 }, { "epoch": 1.94, "learning_rate": 9.001998543214932e-06, "loss": 0.0074, "step": 748410 }, { "epoch": 1.94, "learning_rate": 8.998110326843467e-06, "loss": 0.0065, "step": 748420 }, { "epoch": 1.94, "learning_rate": 8.994222110472002e-06, "loss": 0.0091, "step": 748430 }, { "epoch": 1.94, "learning_rate": 8.990333894100538e-06, "loss": 0.0061, "step": 748440 }, { "epoch": 1.94, "learning_rate": 8.986445677729073e-06, "loss": 0.0083, "step": 748450 }, { "epoch": 1.94, "learning_rate": 8.98255746135761e-06, "loss": 0.0075, "step": 748460 }, { "epoch": 1.94, "learning_rate": 8.978669244986144e-06, "loss": 0.0069, "step": 748470 }, { "epoch": 1.94, "learning_rate": 8.97478102861468e-06, "loss": 0.0064, "step": 748480 }, { "epoch": 1.94, "learning_rate": 8.970892812243216e-06, "loss": 0.0076, "step": 748490 }, { "epoch": 1.94, "learning_rate": 8.96700459587175e-06, "loss": 0.0084, "step": 748500 }, { "epoch": 1.94, "learning_rate": 8.963116379500286e-06, "loss": 0.0062, "step": 748510 }, { "epoch": 1.94, "learning_rate": 8.959228163128822e-06, "loss": 0.0062, "step": 748520 }, { "epoch": 1.94, "learning_rate": 8.955339946757355e-06, "loss": 0.0069, "step": 748530 }, { "epoch": 1.94, "learning_rate": 8.951451730385892e-06, "loss": 0.0058, "step": 748540 }, { "epoch": 1.94, "learning_rate": 8.947563514014427e-06, "loss": 0.0068, "step": 748550 }, { "epoch": 1.94, "learning_rate": 8.943675297642962e-06, "loss": 0.0093, "step": 748560 }, { "epoch": 1.94, "learning_rate": 8.939787081271498e-06, "loss": 0.0062, "step": 748570 }, { "epoch": 1.94, "learning_rate": 8.935898864900033e-06, "loss": 0.0065, "step": 748580 }, { "epoch": 1.94, "learning_rate": 8.932010648528568e-06, "loss": 0.0087, "step": 748590 }, { "epoch": 1.94, "learning_rate": 8.928122432157104e-06, "loss": 0.0079, "step": 748600 }, { "epoch": 1.94, "learning_rate": 8.92423421578564e-06, "loss": 0.0072, "step": 748610 }, { "epoch": 1.94, "learning_rate": 8.920345999414174e-06, "loss": 0.0091, "step": 748620 }, { "epoch": 1.94, "learning_rate": 8.91645778304271e-06, "loss": 0.0088, "step": 748630 }, { "epoch": 1.94, "learning_rate": 8.912569566671246e-06, "loss": 0.0056, "step": 748640 }, { "epoch": 1.94, "learning_rate": 8.90868135029978e-06, "loss": 0.0054, "step": 748650 }, { "epoch": 1.94, "learning_rate": 8.904793133928315e-06, "loss": 0.0062, "step": 748660 }, { "epoch": 1.94, "learning_rate": 8.900904917556852e-06, "loss": 0.0075, "step": 748670 }, { "epoch": 1.94, "learning_rate": 8.897016701185387e-06, "loss": 0.0071, "step": 748680 }, { "epoch": 1.94, "learning_rate": 8.893128484813922e-06, "loss": 0.0081, "step": 748690 }, { "epoch": 1.94, "learning_rate": 8.889240268442458e-06, "loss": 0.0088, "step": 748700 }, { "epoch": 1.94, "learning_rate": 8.885352052070993e-06, "loss": 0.0073, "step": 748710 }, { "epoch": 1.94, "learning_rate": 8.881463835699528e-06, "loss": 0.0089, "step": 748720 }, { "epoch": 1.94, "learning_rate": 8.877575619328064e-06, "loss": 0.0084, "step": 748730 }, { "epoch": 1.94, "learning_rate": 8.8736874029566e-06, "loss": 0.0053, "step": 748740 }, { "epoch": 1.94, "learning_rate": 8.869799186585134e-06, "loss": 0.0068, "step": 748750 }, { "epoch": 1.94, "learning_rate": 8.865910970213669e-06, "loss": 0.0071, "step": 748760 }, { "epoch": 1.94, "learning_rate": 8.862022753842206e-06, "loss": 0.0078, "step": 748770 }, { "epoch": 1.94, "learning_rate": 8.85813453747074e-06, "loss": 0.0114, "step": 748780 }, { "epoch": 1.94, "learning_rate": 8.854246321099275e-06, "loss": 0.0071, "step": 748790 }, { "epoch": 1.94, "learning_rate": 8.850358104727812e-06, "loss": 0.0073, "step": 748800 }, { "epoch": 1.94, "learning_rate": 8.846469888356347e-06, "loss": 0.0063, "step": 748810 }, { "epoch": 1.94, "learning_rate": 8.842581671984882e-06, "loss": 0.0117, "step": 748820 }, { "epoch": 1.94, "learning_rate": 8.838693455613418e-06, "loss": 0.0097, "step": 748830 }, { "epoch": 1.94, "learning_rate": 8.834805239241953e-06, "loss": 0.0059, "step": 748840 }, { "epoch": 1.94, "learning_rate": 8.830917022870488e-06, "loss": 0.0079, "step": 748850 }, { "epoch": 1.94, "learning_rate": 8.827028806499024e-06, "loss": 0.007, "step": 748860 }, { "epoch": 1.94, "learning_rate": 8.823140590127558e-06, "loss": 0.0074, "step": 748870 }, { "epoch": 1.94, "learning_rate": 8.819252373756094e-06, "loss": 0.0048, "step": 748880 }, { "epoch": 1.94, "learning_rate": 8.815364157384629e-06, "loss": 0.0062, "step": 748890 }, { "epoch": 1.94, "learning_rate": 8.811475941013164e-06, "loss": 0.0084, "step": 748900 }, { "epoch": 1.94, "learning_rate": 8.8075877246417e-06, "loss": 0.0091, "step": 748910 }, { "epoch": 1.94, "learning_rate": 8.803699508270235e-06, "loss": 0.0093, "step": 748920 }, { "epoch": 1.94, "learning_rate": 8.79981129189877e-06, "loss": 0.004, "step": 748930 }, { "epoch": 1.94, "learning_rate": 8.795923075527307e-06, "loss": 0.0066, "step": 748940 }, { "epoch": 1.94, "learning_rate": 8.792034859155842e-06, "loss": 0.0067, "step": 748950 }, { "epoch": 1.94, "learning_rate": 8.788146642784376e-06, "loss": 0.0038, "step": 748960 }, { "epoch": 1.94, "learning_rate": 8.784258426412913e-06, "loss": 0.0068, "step": 748970 }, { "epoch": 1.94, "learning_rate": 8.780370210041448e-06, "loss": 0.006, "step": 748980 }, { "epoch": 1.94, "learning_rate": 8.776481993669983e-06, "loss": 0.0062, "step": 748990 }, { "epoch": 1.94, "learning_rate": 8.772593777298518e-06, "loss": 0.0066, "step": 749000 }, { "epoch": 1.94, "eval_cer": 0.8816662957628791, "eval_loss": 0.004472545813769102, "eval_runtime": 108.118, "eval_samples_per_second": 18.498, "eval_steps_per_second": 4.625, "step": 749000 }, { "epoch": 1.94, "learning_rate": 8.768705560927054e-06, "loss": 0.0079, "step": 749010 }, { "epoch": 1.94, "learning_rate": 8.764817344555589e-06, "loss": 0.0056, "step": 749020 }, { "epoch": 1.94, "learning_rate": 8.760929128184124e-06, "loss": 0.0103, "step": 749030 }, { "epoch": 1.94, "learning_rate": 8.75704091181266e-06, "loss": 0.0065, "step": 749040 }, { "epoch": 1.94, "learning_rate": 8.753152695441195e-06, "loss": 0.0095, "step": 749050 }, { "epoch": 1.94, "learning_rate": 8.74926447906973e-06, "loss": 0.0077, "step": 749060 }, { "epoch": 1.94, "learning_rate": 8.745376262698267e-06, "loss": 0.0071, "step": 749070 }, { "epoch": 1.94, "learning_rate": 8.741488046326802e-06, "loss": 0.0076, "step": 749080 }, { "epoch": 1.94, "learning_rate": 8.737599829955336e-06, "loss": 0.0089, "step": 749090 }, { "epoch": 1.94, "learning_rate": 8.733711613583871e-06, "loss": 0.0065, "step": 749100 }, { "epoch": 1.94, "learning_rate": 8.729823397212408e-06, "loss": 0.0055, "step": 749110 }, { "epoch": 1.94, "learning_rate": 8.725935180840943e-06, "loss": 0.0091, "step": 749120 }, { "epoch": 1.94, "learning_rate": 8.722046964469478e-06, "loss": 0.0064, "step": 749130 }, { "epoch": 1.94, "learning_rate": 8.718158748098014e-06, "loss": 0.008, "step": 749140 }, { "epoch": 1.94, "learning_rate": 8.714270531726549e-06, "loss": 0.0054, "step": 749150 }, { "epoch": 1.94, "learning_rate": 8.710382315355084e-06, "loss": 0.0071, "step": 749160 }, { "epoch": 1.94, "learning_rate": 8.70649409898362e-06, "loss": 0.0071, "step": 749170 }, { "epoch": 1.94, "learning_rate": 8.702605882612155e-06, "loss": 0.0056, "step": 749180 }, { "epoch": 1.94, "learning_rate": 8.69871766624069e-06, "loss": 0.0076, "step": 749190 }, { "epoch": 1.94, "learning_rate": 8.694829449869227e-06, "loss": 0.0049, "step": 749200 }, { "epoch": 1.94, "learning_rate": 8.69094123349776e-06, "loss": 0.0062, "step": 749210 }, { "epoch": 1.94, "learning_rate": 8.687053017126296e-06, "loss": 0.0063, "step": 749220 }, { "epoch": 1.94, "learning_rate": 8.683164800754831e-06, "loss": 0.0064, "step": 749230 }, { "epoch": 1.94, "learning_rate": 8.679276584383366e-06, "loss": 0.0078, "step": 749240 }, { "epoch": 1.94, "learning_rate": 8.675388368011903e-06, "loss": 0.0077, "step": 749250 }, { "epoch": 1.94, "learning_rate": 8.671500151640438e-06, "loss": 0.0072, "step": 749260 }, { "epoch": 1.94, "learning_rate": 8.667611935268972e-06, "loss": 0.0076, "step": 749270 }, { "epoch": 1.94, "learning_rate": 8.663723718897509e-06, "loss": 0.0064, "step": 749280 }, { "epoch": 1.94, "learning_rate": 8.659835502526044e-06, "loss": 0.0098, "step": 749290 }, { "epoch": 1.94, "learning_rate": 8.655947286154579e-06, "loss": 0.0104, "step": 749300 }, { "epoch": 1.94, "learning_rate": 8.652059069783115e-06, "loss": 0.005, "step": 749310 }, { "epoch": 1.94, "learning_rate": 8.64817085341165e-06, "loss": 0.0073, "step": 749320 }, { "epoch": 1.94, "learning_rate": 8.644282637040185e-06, "loss": 0.0063, "step": 749330 }, { "epoch": 1.94, "learning_rate": 8.64039442066872e-06, "loss": 0.0062, "step": 749340 }, { "epoch": 1.94, "learning_rate": 8.636506204297256e-06, "loss": 0.0054, "step": 749350 }, { "epoch": 1.94, "learning_rate": 8.632617987925791e-06, "loss": 0.0069, "step": 749360 }, { "epoch": 1.94, "learning_rate": 8.628729771554326e-06, "loss": 0.0061, "step": 749370 }, { "epoch": 1.94, "learning_rate": 8.624841555182863e-06, "loss": 0.0086, "step": 749380 }, { "epoch": 1.94, "learning_rate": 8.620953338811397e-06, "loss": 0.0078, "step": 749390 }, { "epoch": 1.94, "learning_rate": 8.617065122439932e-06, "loss": 0.007, "step": 749400 }, { "epoch": 1.94, "learning_rate": 8.613176906068469e-06, "loss": 0.0051, "step": 749410 }, { "epoch": 1.94, "learning_rate": 8.609288689697004e-06, "loss": 0.0066, "step": 749420 }, { "epoch": 1.94, "learning_rate": 8.605400473325539e-06, "loss": 0.0074, "step": 749430 }, { "epoch": 1.94, "learning_rate": 8.601512256954073e-06, "loss": 0.0056, "step": 749440 }, { "epoch": 1.94, "learning_rate": 8.59762404058261e-06, "loss": 0.0095, "step": 749450 }, { "epoch": 1.94, "learning_rate": 8.593735824211145e-06, "loss": 0.0089, "step": 749460 }, { "epoch": 1.94, "learning_rate": 8.58984760783968e-06, "loss": 0.0085, "step": 749470 }, { "epoch": 1.94, "learning_rate": 8.585959391468216e-06, "loss": 0.0063, "step": 749480 }, { "epoch": 1.94, "learning_rate": 8.582071175096751e-06, "loss": 0.0052, "step": 749490 }, { "epoch": 1.94, "learning_rate": 8.578182958725286e-06, "loss": 0.0068, "step": 749500 }, { "epoch": 1.94, "learning_rate": 8.574294742353823e-06, "loss": 0.0083, "step": 749510 }, { "epoch": 1.94, "learning_rate": 8.570406525982357e-06, "loss": 0.0086, "step": 749520 }, { "epoch": 1.94, "learning_rate": 8.566518309610892e-06, "loss": 0.0074, "step": 749530 }, { "epoch": 1.94, "learning_rate": 8.562630093239429e-06, "loss": 0.008, "step": 749540 }, { "epoch": 1.94, "learning_rate": 8.558741876867962e-06, "loss": 0.0077, "step": 749550 }, { "epoch": 1.94, "learning_rate": 8.554853660496499e-06, "loss": 0.0064, "step": 749560 }, { "epoch": 1.94, "learning_rate": 8.550965444125033e-06, "loss": 0.0071, "step": 749570 }, { "epoch": 1.94, "learning_rate": 8.547077227753568e-06, "loss": 0.0044, "step": 749580 }, { "epoch": 1.94, "learning_rate": 8.543189011382105e-06, "loss": 0.0077, "step": 749590 }, { "epoch": 1.94, "learning_rate": 8.53930079501064e-06, "loss": 0.0092, "step": 749600 }, { "epoch": 1.94, "learning_rate": 8.535412578639175e-06, "loss": 0.0094, "step": 749610 }, { "epoch": 1.94, "learning_rate": 8.531524362267711e-06, "loss": 0.0076, "step": 749620 }, { "epoch": 1.94, "learning_rate": 8.527636145896246e-06, "loss": 0.0088, "step": 749630 }, { "epoch": 1.94, "learning_rate": 8.523747929524781e-06, "loss": 0.0064, "step": 749640 }, { "epoch": 1.94, "learning_rate": 8.519859713153317e-06, "loss": 0.0067, "step": 749650 }, { "epoch": 1.94, "learning_rate": 8.515971496781852e-06, "loss": 0.0078, "step": 749660 }, { "epoch": 1.94, "learning_rate": 8.512083280410387e-06, "loss": 0.0054, "step": 749670 }, { "epoch": 1.94, "learning_rate": 8.508195064038922e-06, "loss": 0.0073, "step": 749680 }, { "epoch": 1.94, "learning_rate": 8.504306847667459e-06, "loss": 0.0077, "step": 749690 }, { "epoch": 1.94, "learning_rate": 8.500418631295993e-06, "loss": 0.0057, "step": 749700 }, { "epoch": 1.94, "learning_rate": 8.496530414924528e-06, "loss": 0.0045, "step": 749710 }, { "epoch": 1.94, "learning_rate": 8.492642198553065e-06, "loss": 0.0072, "step": 749720 }, { "epoch": 1.94, "learning_rate": 8.4887539821816e-06, "loss": 0.0059, "step": 749730 }, { "epoch": 1.94, "learning_rate": 8.484865765810135e-06, "loss": 0.0089, "step": 749740 }, { "epoch": 1.94, "learning_rate": 8.480977549438671e-06, "loss": 0.0087, "step": 749750 }, { "epoch": 1.94, "learning_rate": 8.477089333067206e-06, "loss": 0.0061, "step": 749760 }, { "epoch": 1.94, "learning_rate": 8.473201116695741e-06, "loss": 0.0059, "step": 749770 }, { "epoch": 1.94, "learning_rate": 8.469312900324276e-06, "loss": 0.0075, "step": 749780 }, { "epoch": 1.94, "learning_rate": 8.465424683952812e-06, "loss": 0.0069, "step": 749790 }, { "epoch": 1.94, "learning_rate": 8.461536467581347e-06, "loss": 0.0057, "step": 749800 }, { "epoch": 1.94, "learning_rate": 8.457648251209882e-06, "loss": 0.0059, "step": 749810 }, { "epoch": 1.94, "learning_rate": 8.453760034838419e-06, "loss": 0.0053, "step": 749820 }, { "epoch": 1.94, "learning_rate": 8.449871818466953e-06, "loss": 0.0057, "step": 749830 }, { "epoch": 1.94, "learning_rate": 8.445983602095488e-06, "loss": 0.005, "step": 749840 }, { "epoch": 1.94, "learning_rate": 8.442095385724025e-06, "loss": 0.0065, "step": 749850 }, { "epoch": 1.94, "learning_rate": 8.43820716935256e-06, "loss": 0.0057, "step": 749860 }, { "epoch": 1.94, "learning_rate": 8.434318952981095e-06, "loss": 0.0059, "step": 749870 }, { "epoch": 1.94, "learning_rate": 8.430430736609631e-06, "loss": 0.0058, "step": 749880 }, { "epoch": 1.94, "learning_rate": 8.426542520238164e-06, "loss": 0.0104, "step": 749890 }, { "epoch": 1.94, "learning_rate": 8.4226543038667e-06, "loss": 0.0083, "step": 749900 }, { "epoch": 1.94, "learning_rate": 8.418766087495236e-06, "loss": 0.0072, "step": 749910 }, { "epoch": 1.94, "learning_rate": 8.41487787112377e-06, "loss": 0.0095, "step": 749920 }, { "epoch": 1.94, "learning_rate": 8.410989654752307e-06, "loss": 0.0084, "step": 749930 }, { "epoch": 1.94, "learning_rate": 8.407101438380842e-06, "loss": 0.0065, "step": 749940 }, { "epoch": 1.94, "learning_rate": 8.403213222009377e-06, "loss": 0.0071, "step": 749950 }, { "epoch": 1.94, "learning_rate": 8.399325005637913e-06, "loss": 0.0101, "step": 749960 }, { "epoch": 1.94, "learning_rate": 8.395436789266448e-06, "loss": 0.0067, "step": 749970 }, { "epoch": 1.94, "learning_rate": 8.391548572894983e-06, "loss": 0.0079, "step": 749980 }, { "epoch": 1.94, "learning_rate": 8.38766035652352e-06, "loss": 0.0076, "step": 749990 }, { "epoch": 1.94, "learning_rate": 8.383772140152055e-06, "loss": 0.007, "step": 750000 }, { "epoch": 1.94, "eval_cer": 0.8816662957628791, "eval_loss": 0.00447363406419754, "eval_runtime": 107.9666, "eval_samples_per_second": 18.524, "eval_steps_per_second": 4.631, "step": 750000 }, { "epoch": 1.94, "learning_rate": 8.379883923780591e-06, "loss": 0.0101, "step": 750010 }, { "epoch": 1.94, "learning_rate": 8.375995707409124e-06, "loss": 0.0045, "step": 750020 }, { "epoch": 1.94, "learning_rate": 8.37210749103766e-06, "loss": 0.0071, "step": 750030 }, { "epoch": 1.94, "learning_rate": 8.368219274666196e-06, "loss": 0.0054, "step": 750040 }, { "epoch": 1.94, "learning_rate": 8.36433105829473e-06, "loss": 0.0067, "step": 750050 }, { "epoch": 1.94, "learning_rate": 8.360442841923267e-06, "loss": 0.0062, "step": 750060 }, { "epoch": 1.94, "learning_rate": 8.356554625551802e-06, "loss": 0.006, "step": 750070 }, { "epoch": 1.94, "learning_rate": 8.352666409180337e-06, "loss": 0.0057, "step": 750080 }, { "epoch": 1.94, "learning_rate": 8.348778192808873e-06, "loss": 0.0066, "step": 750090 }, { "epoch": 1.94, "learning_rate": 8.344889976437408e-06, "loss": 0.0099, "step": 750100 }, { "epoch": 1.94, "learning_rate": 8.341001760065943e-06, "loss": 0.005, "step": 750110 }, { "epoch": 1.94, "learning_rate": 8.33711354369448e-06, "loss": 0.0069, "step": 750120 }, { "epoch": 1.94, "learning_rate": 8.333225327323015e-06, "loss": 0.0092, "step": 750130 }, { "epoch": 1.94, "learning_rate": 8.32933711095155e-06, "loss": 0.0087, "step": 750140 }, { "epoch": 1.94, "learning_rate": 8.325448894580084e-06, "loss": 0.0059, "step": 750150 }, { "epoch": 1.94, "learning_rate": 8.32156067820862e-06, "loss": 0.0065, "step": 750160 }, { "epoch": 1.94, "learning_rate": 8.317672461837156e-06, "loss": 0.0065, "step": 750170 }, { "epoch": 1.94, "learning_rate": 8.31378424546569e-06, "loss": 0.0081, "step": 750180 }, { "epoch": 1.94, "learning_rate": 8.309896029094227e-06, "loss": 0.0071, "step": 750190 }, { "epoch": 1.94, "learning_rate": 8.306007812722762e-06, "loss": 0.0085, "step": 750200 }, { "epoch": 1.94, "learning_rate": 8.302119596351297e-06, "loss": 0.0067, "step": 750210 }, { "epoch": 1.94, "learning_rate": 8.298231379979833e-06, "loss": 0.0057, "step": 750220 }, { "epoch": 1.94, "learning_rate": 8.294343163608367e-06, "loss": 0.0052, "step": 750230 }, { "epoch": 1.94, "learning_rate": 8.290454947236903e-06, "loss": 0.0074, "step": 750240 }, { "epoch": 1.94, "learning_rate": 8.286566730865438e-06, "loss": 0.0071, "step": 750250 }, { "epoch": 1.94, "learning_rate": 8.282678514493973e-06, "loss": 0.0091, "step": 750260 }, { "epoch": 1.94, "learning_rate": 8.27879029812251e-06, "loss": 0.0066, "step": 750270 }, { "epoch": 1.94, "learning_rate": 8.274902081751044e-06, "loss": 0.0066, "step": 750280 }, { "epoch": 1.94, "learning_rate": 8.271013865379579e-06, "loss": 0.0085, "step": 750290 }, { "epoch": 1.94, "learning_rate": 8.267125649008116e-06, "loss": 0.007, "step": 750300 }, { "epoch": 1.94, "learning_rate": 8.26323743263665e-06, "loss": 0.008, "step": 750310 }, { "epoch": 1.94, "learning_rate": 8.259349216265187e-06, "loss": 0.0059, "step": 750320 }, { "epoch": 1.94, "learning_rate": 8.255460999893722e-06, "loss": 0.0058, "step": 750330 }, { "epoch": 1.94, "learning_rate": 8.251572783522257e-06, "loss": 0.0072, "step": 750340 }, { "epoch": 1.95, "learning_rate": 8.247684567150793e-06, "loss": 0.009, "step": 750350 }, { "epoch": 1.95, "learning_rate": 8.243796350779326e-06, "loss": 0.0054, "step": 750360 }, { "epoch": 1.95, "learning_rate": 8.239908134407863e-06, "loss": 0.0061, "step": 750370 }, { "epoch": 1.95, "learning_rate": 8.236019918036398e-06, "loss": 0.0069, "step": 750380 }, { "epoch": 1.95, "learning_rate": 8.232131701664933e-06, "loss": 0.0075, "step": 750390 }, { "epoch": 1.95, "learning_rate": 8.22824348529347e-06, "loss": 0.0056, "step": 750400 }, { "epoch": 1.95, "learning_rate": 8.224355268922004e-06, "loss": 0.0049, "step": 750410 }, { "epoch": 1.95, "learning_rate": 8.220467052550539e-06, "loss": 0.0056, "step": 750420 }, { "epoch": 1.95, "learning_rate": 8.216578836179076e-06, "loss": 0.0091, "step": 750430 }, { "epoch": 1.95, "learning_rate": 8.21269061980761e-06, "loss": 0.0056, "step": 750440 }, { "epoch": 1.95, "learning_rate": 8.208802403436145e-06, "loss": 0.0121, "step": 750450 }, { "epoch": 1.95, "learning_rate": 8.204914187064682e-06, "loss": 0.0071, "step": 750460 }, { "epoch": 1.95, "learning_rate": 8.201025970693217e-06, "loss": 0.0073, "step": 750470 }, { "epoch": 1.95, "learning_rate": 8.197137754321752e-06, "loss": 0.0076, "step": 750480 }, { "epoch": 1.95, "learning_rate": 8.193249537950286e-06, "loss": 0.0071, "step": 750490 }, { "epoch": 1.95, "learning_rate": 8.189361321578823e-06, "loss": 0.0062, "step": 750500 }, { "epoch": 1.95, "learning_rate": 8.185473105207358e-06, "loss": 0.0089, "step": 750510 }, { "epoch": 1.95, "learning_rate": 8.181584888835893e-06, "loss": 0.0072, "step": 750520 }, { "epoch": 1.95, "learning_rate": 8.17769667246443e-06, "loss": 0.0072, "step": 750530 }, { "epoch": 1.95, "learning_rate": 8.173808456092964e-06, "loss": 0.009, "step": 750540 }, { "epoch": 1.95, "learning_rate": 8.169920239721499e-06, "loss": 0.0049, "step": 750550 }, { "epoch": 1.95, "learning_rate": 8.166032023350036e-06, "loss": 0.0058, "step": 750560 }, { "epoch": 1.95, "learning_rate": 8.162143806978569e-06, "loss": 0.006, "step": 750570 }, { "epoch": 1.95, "learning_rate": 8.158255590607105e-06, "loss": 0.0075, "step": 750580 }, { "epoch": 1.95, "learning_rate": 8.15436737423564e-06, "loss": 0.0083, "step": 750590 }, { "epoch": 1.95, "learning_rate": 8.150479157864177e-06, "loss": 0.008, "step": 750600 }, { "epoch": 1.95, "learning_rate": 8.146590941492712e-06, "loss": 0.0047, "step": 750610 }, { "epoch": 1.95, "learning_rate": 8.142702725121246e-06, "loss": 0.0054, "step": 750620 }, { "epoch": 1.95, "learning_rate": 8.138814508749783e-06, "loss": 0.0067, "step": 750630 }, { "epoch": 1.95, "learning_rate": 8.134926292378318e-06, "loss": 0.0077, "step": 750640 }, { "epoch": 1.95, "learning_rate": 8.131038076006853e-06, "loss": 0.0075, "step": 750650 }, { "epoch": 1.95, "learning_rate": 8.12714985963539e-06, "loss": 0.0057, "step": 750660 }, { "epoch": 1.95, "learning_rate": 8.123261643263924e-06, "loss": 0.0069, "step": 750670 }, { "epoch": 1.95, "learning_rate": 8.119373426892459e-06, "loss": 0.0083, "step": 750680 }, { "epoch": 1.95, "learning_rate": 8.115485210520996e-06, "loss": 0.0082, "step": 750690 }, { "epoch": 1.95, "learning_rate": 8.111596994149529e-06, "loss": 0.0072, "step": 750700 }, { "epoch": 1.95, "learning_rate": 8.107708777778065e-06, "loss": 0.0071, "step": 750710 }, { "epoch": 1.95, "learning_rate": 8.1038205614066e-06, "loss": 0.0082, "step": 750720 }, { "epoch": 1.95, "learning_rate": 8.099932345035135e-06, "loss": 0.0093, "step": 750730 }, { "epoch": 1.95, "learning_rate": 8.096044128663672e-06, "loss": 0.0076, "step": 750740 }, { "epoch": 1.95, "learning_rate": 8.092155912292206e-06, "loss": 0.0077, "step": 750750 }, { "epoch": 1.95, "learning_rate": 8.088267695920741e-06, "loss": 0.0053, "step": 750760 }, { "epoch": 1.95, "learning_rate": 8.084379479549278e-06, "loss": 0.0063, "step": 750770 }, { "epoch": 1.95, "learning_rate": 8.080491263177813e-06, "loss": 0.0092, "step": 750780 }, { "epoch": 1.95, "learning_rate": 8.076603046806348e-06, "loss": 0.0062, "step": 750790 }, { "epoch": 1.95, "learning_rate": 8.072714830434884e-06, "loss": 0.0076, "step": 750800 }, { "epoch": 1.95, "learning_rate": 8.068826614063419e-06, "loss": 0.0076, "step": 750810 }, { "epoch": 1.95, "learning_rate": 8.064938397691954e-06, "loss": 0.0114, "step": 750820 }, { "epoch": 1.95, "learning_rate": 8.061050181320489e-06, "loss": 0.0104, "step": 750830 }, { "epoch": 1.95, "learning_rate": 8.057161964949025e-06, "loss": 0.0061, "step": 750840 }, { "epoch": 1.95, "learning_rate": 8.05327374857756e-06, "loss": 0.0049, "step": 750850 }, { "epoch": 1.95, "learning_rate": 8.049385532206095e-06, "loss": 0.0059, "step": 750860 }, { "epoch": 1.95, "learning_rate": 8.045497315834632e-06, "loss": 0.0078, "step": 750870 }, { "epoch": 1.95, "learning_rate": 8.041609099463166e-06, "loss": 0.006, "step": 750880 }, { "epoch": 1.95, "learning_rate": 8.037720883091701e-06, "loss": 0.0062, "step": 750890 }, { "epoch": 1.95, "learning_rate": 8.033832666720238e-06, "loss": 0.0068, "step": 750900 }, { "epoch": 1.95, "learning_rate": 8.029944450348773e-06, "loss": 0.0063, "step": 750910 }, { "epoch": 1.95, "learning_rate": 8.026056233977308e-06, "loss": 0.0066, "step": 750920 }, { "epoch": 1.95, "learning_rate": 8.022168017605842e-06, "loss": 0.0058, "step": 750930 }, { "epoch": 1.95, "learning_rate": 8.018279801234379e-06, "loss": 0.0069, "step": 750940 }, { "epoch": 1.95, "learning_rate": 8.014391584862914e-06, "loss": 0.0078, "step": 750950 }, { "epoch": 1.95, "learning_rate": 8.010503368491449e-06, "loss": 0.0071, "step": 750960 }, { "epoch": 1.95, "learning_rate": 8.006615152119985e-06, "loss": 0.0068, "step": 750970 }, { "epoch": 1.95, "learning_rate": 8.00272693574852e-06, "loss": 0.0084, "step": 750980 }, { "epoch": 1.95, "learning_rate": 7.998838719377055e-06, "loss": 0.0057, "step": 750990 }, { "epoch": 1.95, "learning_rate": 7.994950503005592e-06, "loss": 0.0091, "step": 751000 }, { "epoch": 1.95, "eval_cer": 0.8816690950367475, "eval_loss": 0.004483851604163647, "eval_runtime": 107.9182, "eval_samples_per_second": 18.533, "eval_steps_per_second": 4.633, "step": 751000 }, { "epoch": 1.95, "learning_rate": 7.991062286634126e-06, "loss": 0.0082, "step": 751010 }, { "epoch": 1.95, "learning_rate": 7.987174070262661e-06, "loss": 0.0057, "step": 751020 }, { "epoch": 1.95, "learning_rate": 7.983285853891198e-06, "loss": 0.0054, "step": 751030 }, { "epoch": 1.95, "learning_rate": 7.979397637519731e-06, "loss": 0.0099, "step": 751040 }, { "epoch": 1.95, "learning_rate": 7.975509421148268e-06, "loss": 0.0041, "step": 751050 }, { "epoch": 1.95, "learning_rate": 7.971621204776802e-06, "loss": 0.0077, "step": 751060 }, { "epoch": 1.95, "learning_rate": 7.967732988405337e-06, "loss": 0.0064, "step": 751070 }, { "epoch": 1.95, "learning_rate": 7.963844772033874e-06, "loss": 0.0066, "step": 751080 }, { "epoch": 1.95, "learning_rate": 7.959956555662409e-06, "loss": 0.0059, "step": 751090 }, { "epoch": 1.95, "learning_rate": 7.956068339290944e-06, "loss": 0.0077, "step": 751100 }, { "epoch": 1.95, "learning_rate": 7.95218012291948e-06, "loss": 0.0078, "step": 751110 }, { "epoch": 1.95, "learning_rate": 7.948291906548015e-06, "loss": 0.0058, "step": 751120 }, { "epoch": 1.95, "learning_rate": 7.94440369017655e-06, "loss": 0.0048, "step": 751130 }, { "epoch": 1.95, "learning_rate": 7.940515473805086e-06, "loss": 0.0074, "step": 751140 }, { "epoch": 1.95, "learning_rate": 7.936627257433621e-06, "loss": 0.0047, "step": 751150 }, { "epoch": 1.95, "learning_rate": 7.932739041062156e-06, "loss": 0.0095, "step": 751160 }, { "epoch": 1.95, "learning_rate": 7.928850824690691e-06, "loss": 0.0078, "step": 751170 }, { "epoch": 1.95, "learning_rate": 7.924962608319227e-06, "loss": 0.0065, "step": 751180 }, { "epoch": 1.95, "learning_rate": 7.921074391947762e-06, "loss": 0.0088, "step": 751190 }, { "epoch": 1.95, "learning_rate": 7.917186175576297e-06, "loss": 0.006, "step": 751200 }, { "epoch": 1.95, "learning_rate": 7.913297959204834e-06, "loss": 0.006, "step": 751210 }, { "epoch": 1.95, "learning_rate": 7.909409742833369e-06, "loss": 0.0078, "step": 751220 }, { "epoch": 1.95, "learning_rate": 7.905521526461903e-06, "loss": 0.0071, "step": 751230 }, { "epoch": 1.95, "learning_rate": 7.90163331009044e-06, "loss": 0.0059, "step": 751240 }, { "epoch": 1.95, "learning_rate": 7.897745093718975e-06, "loss": 0.0067, "step": 751250 }, { "epoch": 1.95, "learning_rate": 7.89385687734751e-06, "loss": 0.0064, "step": 751260 }, { "epoch": 1.95, "learning_rate": 7.889968660976045e-06, "loss": 0.0071, "step": 751270 }, { "epoch": 1.95, "learning_rate": 7.886080444604581e-06, "loss": 0.006, "step": 751280 }, { "epoch": 1.95, "learning_rate": 7.882192228233116e-06, "loss": 0.0067, "step": 751290 }, { "epoch": 1.95, "learning_rate": 7.878304011861651e-06, "loss": 0.0077, "step": 751300 }, { "epoch": 1.95, "learning_rate": 7.874415795490187e-06, "loss": 0.007, "step": 751310 }, { "epoch": 1.95, "learning_rate": 7.870527579118722e-06, "loss": 0.0088, "step": 751320 }, { "epoch": 1.95, "learning_rate": 7.866639362747257e-06, "loss": 0.0083, "step": 751330 }, { "epoch": 1.95, "learning_rate": 7.862751146375794e-06, "loss": 0.0055, "step": 751340 }, { "epoch": 1.95, "learning_rate": 7.858862930004329e-06, "loss": 0.0079, "step": 751350 }, { "epoch": 1.95, "learning_rate": 7.854974713632863e-06, "loss": 0.0066, "step": 751360 }, { "epoch": 1.95, "learning_rate": 7.8510864972614e-06, "loss": 0.0071, "step": 751370 }, { "epoch": 1.95, "learning_rate": 7.847198280889933e-06, "loss": 0.0124, "step": 751380 }, { "epoch": 1.95, "learning_rate": 7.84331006451847e-06, "loss": 0.0073, "step": 751390 }, { "epoch": 1.95, "learning_rate": 7.839421848147005e-06, "loss": 0.0071, "step": 751400 }, { "epoch": 1.95, "learning_rate": 7.83553363177554e-06, "loss": 0.0093, "step": 751410 }, { "epoch": 1.95, "learning_rate": 7.831645415404076e-06, "loss": 0.0068, "step": 751420 }, { "epoch": 1.95, "learning_rate": 7.827757199032611e-06, "loss": 0.007, "step": 751430 }, { "epoch": 1.95, "learning_rate": 7.823868982661146e-06, "loss": 0.0072, "step": 751440 }, { "epoch": 1.95, "learning_rate": 7.819980766289682e-06, "loss": 0.0055, "step": 751450 }, { "epoch": 1.95, "learning_rate": 7.816092549918217e-06, "loss": 0.0087, "step": 751460 }, { "epoch": 1.95, "learning_rate": 7.812204333546752e-06, "loss": 0.0057, "step": 751470 }, { "epoch": 1.95, "learning_rate": 7.808316117175289e-06, "loss": 0.0078, "step": 751480 }, { "epoch": 1.95, "learning_rate": 7.804427900803823e-06, "loss": 0.0055, "step": 751490 }, { "epoch": 1.95, "learning_rate": 7.800539684432358e-06, "loss": 0.0077, "step": 751500 }, { "epoch": 1.95, "learning_rate": 7.796651468060893e-06, "loss": 0.0121, "step": 751510 }, { "epoch": 1.95, "learning_rate": 7.79276325168943e-06, "loss": 0.0061, "step": 751520 }, { "epoch": 1.95, "learning_rate": 7.788875035317965e-06, "loss": 0.0086, "step": 751530 }, { "epoch": 1.95, "learning_rate": 7.7849868189465e-06, "loss": 0.008, "step": 751540 }, { "epoch": 1.95, "learning_rate": 7.781098602575036e-06, "loss": 0.0073, "step": 751550 }, { "epoch": 1.95, "learning_rate": 7.777210386203571e-06, "loss": 0.0067, "step": 751560 }, { "epoch": 1.95, "learning_rate": 7.773322169832106e-06, "loss": 0.0076, "step": 751570 }, { "epoch": 1.95, "learning_rate": 7.769433953460642e-06, "loss": 0.0076, "step": 751580 }, { "epoch": 1.95, "learning_rate": 7.765545737089177e-06, "loss": 0.0062, "step": 751590 }, { "epoch": 1.95, "learning_rate": 7.761657520717712e-06, "loss": 0.0078, "step": 751600 }, { "epoch": 1.95, "learning_rate": 7.757769304346247e-06, "loss": 0.0063, "step": 751610 }, { "epoch": 1.95, "learning_rate": 7.753881087974783e-06, "loss": 0.0061, "step": 751620 }, { "epoch": 1.95, "learning_rate": 7.749992871603318e-06, "loss": 0.007, "step": 751630 }, { "epoch": 1.95, "learning_rate": 7.746104655231853e-06, "loss": 0.0074, "step": 751640 }, { "epoch": 1.95, "learning_rate": 7.74221643886039e-06, "loss": 0.0062, "step": 751650 }, { "epoch": 1.95, "learning_rate": 7.738328222488925e-06, "loss": 0.0123, "step": 751660 }, { "epoch": 1.95, "learning_rate": 7.73444000611746e-06, "loss": 0.0071, "step": 751670 }, { "epoch": 1.95, "learning_rate": 7.730551789745996e-06, "loss": 0.0063, "step": 751680 }, { "epoch": 1.95, "learning_rate": 7.72666357337453e-06, "loss": 0.0074, "step": 751690 }, { "epoch": 1.95, "learning_rate": 7.722775357003066e-06, "loss": 0.0094, "step": 751700 }, { "epoch": 1.95, "learning_rate": 7.718887140631602e-06, "loss": 0.0078, "step": 751710 }, { "epoch": 1.95, "learning_rate": 7.714998924260135e-06, "loss": 0.0077, "step": 751720 }, { "epoch": 1.95, "learning_rate": 7.711110707888672e-06, "loss": 0.0061, "step": 751730 }, { "epoch": 1.95, "learning_rate": 7.707222491517207e-06, "loss": 0.0068, "step": 751740 }, { "epoch": 1.95, "learning_rate": 7.703334275145742e-06, "loss": 0.0064, "step": 751750 }, { "epoch": 1.95, "learning_rate": 7.699446058774278e-06, "loss": 0.0054, "step": 751760 }, { "epoch": 1.95, "learning_rate": 7.695557842402813e-06, "loss": 0.0053, "step": 751770 }, { "epoch": 1.95, "learning_rate": 7.691669626031348e-06, "loss": 0.012, "step": 751780 }, { "epoch": 1.95, "learning_rate": 7.687781409659885e-06, "loss": 0.0049, "step": 751790 }, { "epoch": 1.95, "learning_rate": 7.68389319328842e-06, "loss": 0.0082, "step": 751800 }, { "epoch": 1.95, "learning_rate": 7.680004976916954e-06, "loss": 0.0084, "step": 751810 }, { "epoch": 1.95, "learning_rate": 7.67611676054549e-06, "loss": 0.0054, "step": 751820 }, { "epoch": 1.95, "learning_rate": 7.672228544174026e-06, "loss": 0.0056, "step": 751830 }, { "epoch": 1.95, "learning_rate": 7.668340327802562e-06, "loss": 0.0105, "step": 751840 }, { "epoch": 1.95, "learning_rate": 7.664452111431095e-06, "loss": 0.0066, "step": 751850 }, { "epoch": 1.95, "learning_rate": 7.660563895059632e-06, "loss": 0.0074, "step": 751860 }, { "epoch": 1.95, "learning_rate": 7.656675678688167e-06, "loss": 0.0058, "step": 751870 }, { "epoch": 1.95, "learning_rate": 7.652787462316702e-06, "loss": 0.0076, "step": 751880 }, { "epoch": 1.95, "learning_rate": 7.648899245945238e-06, "loss": 0.0083, "step": 751890 }, { "epoch": 1.95, "learning_rate": 7.645011029573773e-06, "loss": 0.0064, "step": 751900 }, { "epoch": 1.95, "learning_rate": 7.641122813202308e-06, "loss": 0.0054, "step": 751910 }, { "epoch": 1.95, "learning_rate": 7.637234596830844e-06, "loss": 0.0085, "step": 751920 }, { "epoch": 1.95, "learning_rate": 7.63334638045938e-06, "loss": 0.007, "step": 751930 }, { "epoch": 1.95, "learning_rate": 7.629458164087914e-06, "loss": 0.0044, "step": 751940 }, { "epoch": 1.95, "learning_rate": 7.62556994771645e-06, "loss": 0.0089, "step": 751950 }, { "epoch": 1.95, "learning_rate": 7.621681731344986e-06, "loss": 0.0061, "step": 751960 }, { "epoch": 1.95, "learning_rate": 7.6177935149735205e-06, "loss": 0.0072, "step": 751970 }, { "epoch": 1.95, "learning_rate": 7.613905298602056e-06, "loss": 0.0086, "step": 751980 }, { "epoch": 1.95, "learning_rate": 7.610017082230592e-06, "loss": 0.007, "step": 751990 }, { "epoch": 1.95, "learning_rate": 7.606128865859126e-06, "loss": 0.0071, "step": 752000 }, { "epoch": 1.95, "eval_cer": 0.8816676953998133, "eval_loss": 0.004463730845600367, "eval_runtime": 107.8824, "eval_samples_per_second": 18.539, "eval_steps_per_second": 4.635, "step": 752000 }, { "epoch": 1.95, "learning_rate": 7.602240649487662e-06, "loss": 0.0076, "step": 752010 }, { "epoch": 1.95, "learning_rate": 7.598352433116197e-06, "loss": 0.007, "step": 752020 }, { "epoch": 1.95, "learning_rate": 7.594464216744732e-06, "loss": 0.0065, "step": 752030 }, { "epoch": 1.95, "learning_rate": 7.590576000373268e-06, "loss": 0.0075, "step": 752040 }, { "epoch": 1.95, "learning_rate": 7.586687784001804e-06, "loss": 0.0036, "step": 752050 }, { "epoch": 1.95, "learning_rate": 7.5827995676303385e-06, "loss": 0.0057, "step": 752060 }, { "epoch": 1.95, "learning_rate": 7.578911351258874e-06, "loss": 0.0108, "step": 752070 }, { "epoch": 1.95, "learning_rate": 7.57502313488741e-06, "loss": 0.0082, "step": 752080 }, { "epoch": 1.95, "learning_rate": 7.571134918515945e-06, "loss": 0.0058, "step": 752090 }, { "epoch": 1.95, "learning_rate": 7.5672467021444805e-06, "loss": 0.0071, "step": 752100 }, { "epoch": 1.95, "learning_rate": 7.563358485773016e-06, "loss": 0.0056, "step": 752110 }, { "epoch": 1.95, "learning_rate": 7.55947026940155e-06, "loss": 0.0068, "step": 752120 }, { "epoch": 1.95, "learning_rate": 7.555582053030086e-06, "loss": 0.0071, "step": 752130 }, { "epoch": 1.95, "learning_rate": 7.551693836658622e-06, "loss": 0.0054, "step": 752140 }, { "epoch": 1.95, "learning_rate": 7.547805620287157e-06, "loss": 0.006, "step": 752150 }, { "epoch": 1.95, "learning_rate": 7.543917403915692e-06, "loss": 0.0061, "step": 752160 }, { "epoch": 1.95, "learning_rate": 7.540029187544228e-06, "loss": 0.0076, "step": 752170 }, { "epoch": 1.95, "learning_rate": 7.536140971172764e-06, "loss": 0.0083, "step": 752180 }, { "epoch": 1.95, "learning_rate": 7.5322527548012985e-06, "loss": 0.0053, "step": 752190 }, { "epoch": 1.95, "learning_rate": 7.528364538429834e-06, "loss": 0.0074, "step": 752200 }, { "epoch": 1.95, "learning_rate": 7.52447632205837e-06, "loss": 0.0083, "step": 752210 }, { "epoch": 1.95, "learning_rate": 7.520588105686905e-06, "loss": 0.0063, "step": 752220 }, { "epoch": 1.95, "learning_rate": 7.51669988931544e-06, "loss": 0.0061, "step": 752230 }, { "epoch": 1.95, "learning_rate": 7.512811672943975e-06, "loss": 0.0112, "step": 752240 }, { "epoch": 1.95, "learning_rate": 7.50892345657251e-06, "loss": 0.0058, "step": 752250 }, { "epoch": 1.95, "learning_rate": 7.505035240201046e-06, "loss": 0.0068, "step": 752260 }, { "epoch": 1.95, "learning_rate": 7.501147023829582e-06, "loss": 0.0068, "step": 752270 }, { "epoch": 1.95, "learning_rate": 7.4972588074581165e-06, "loss": 0.0081, "step": 752280 }, { "epoch": 1.95, "learning_rate": 7.493370591086652e-06, "loss": 0.0069, "step": 752290 }, { "epoch": 1.95, "learning_rate": 7.489482374715188e-06, "loss": 0.0091, "step": 752300 }, { "epoch": 1.95, "learning_rate": 7.485594158343723e-06, "loss": 0.0076, "step": 752310 }, { "epoch": 1.95, "learning_rate": 7.4817059419722584e-06, "loss": 0.0065, "step": 752320 }, { "epoch": 1.95, "learning_rate": 7.477817725600794e-06, "loss": 0.0088, "step": 752330 }, { "epoch": 1.95, "learning_rate": 7.473929509229328e-06, "loss": 0.0083, "step": 752340 }, { "epoch": 1.95, "learning_rate": 7.470041292857864e-06, "loss": 0.0074, "step": 752350 }, { "epoch": 1.95, "learning_rate": 7.4661530764864e-06, "loss": 0.007, "step": 752360 }, { "epoch": 1.95, "learning_rate": 7.4622648601149344e-06, "loss": 0.0072, "step": 752370 }, { "epoch": 1.95, "learning_rate": 7.45837664374347e-06, "loss": 0.0074, "step": 752380 }, { "epoch": 1.95, "learning_rate": 7.454488427372006e-06, "loss": 0.0055, "step": 752390 }, { "epoch": 1.95, "learning_rate": 7.450600211000541e-06, "loss": 0.0073, "step": 752400 }, { "epoch": 1.95, "learning_rate": 7.4467119946290764e-06, "loss": 0.0064, "step": 752410 }, { "epoch": 1.95, "learning_rate": 7.442823778257612e-06, "loss": 0.0071, "step": 752420 }, { "epoch": 1.95, "learning_rate": 7.438935561886147e-06, "loss": 0.0068, "step": 752430 }, { "epoch": 1.95, "learning_rate": 7.435047345514683e-06, "loss": 0.0061, "step": 752440 }, { "epoch": 1.95, "learning_rate": 7.431159129143218e-06, "loss": 0.0091, "step": 752450 }, { "epoch": 1.95, "learning_rate": 7.427270912771754e-06, "loss": 0.006, "step": 752460 }, { "epoch": 1.95, "learning_rate": 7.423382696400288e-06, "loss": 0.008, "step": 752470 }, { "epoch": 1.95, "learning_rate": 7.419494480028824e-06, "loss": 0.0091, "step": 752480 }, { "epoch": 1.95, "learning_rate": 7.4156062636573596e-06, "loss": 0.0075, "step": 752490 }, { "epoch": 1.95, "learning_rate": 7.411718047285894e-06, "loss": 0.0053, "step": 752500 }, { "epoch": 1.95, "learning_rate": 7.40782983091443e-06, "loss": 0.0066, "step": 752510 }, { "epoch": 1.95, "learning_rate": 7.403941614542966e-06, "loss": 0.0074, "step": 752520 }, { "epoch": 1.95, "learning_rate": 7.400053398171501e-06, "loss": 0.0073, "step": 752530 }, { "epoch": 1.95, "learning_rate": 7.396165181800036e-06, "loss": 0.0053, "step": 752540 }, { "epoch": 1.95, "learning_rate": 7.392276965428572e-06, "loss": 0.0087, "step": 752550 }, { "epoch": 1.95, "learning_rate": 7.388388749057107e-06, "loss": 0.0062, "step": 752560 }, { "epoch": 1.95, "learning_rate": 7.384500532685643e-06, "loss": 0.006, "step": 752570 }, { "epoch": 1.95, "learning_rate": 7.3806123163141775e-06, "loss": 0.0069, "step": 752580 }, { "epoch": 1.95, "learning_rate": 7.376724099942712e-06, "loss": 0.0051, "step": 752590 }, { "epoch": 1.95, "learning_rate": 7.372835883571248e-06, "loss": 0.007, "step": 752600 }, { "epoch": 1.95, "learning_rate": 7.368947667199784e-06, "loss": 0.0063, "step": 752610 }, { "epoch": 1.95, "learning_rate": 7.365059450828319e-06, "loss": 0.007, "step": 752620 }, { "epoch": 1.95, "learning_rate": 7.361171234456854e-06, "loss": 0.0049, "step": 752630 }, { "epoch": 1.95, "learning_rate": 7.35728301808539e-06, "loss": 0.0054, "step": 752640 }, { "epoch": 1.95, "learning_rate": 7.353394801713925e-06, "loss": 0.0075, "step": 752650 }, { "epoch": 1.95, "learning_rate": 7.349506585342461e-06, "loss": 0.0053, "step": 752660 }, { "epoch": 1.95, "learning_rate": 7.345618368970996e-06, "loss": 0.0074, "step": 752670 }, { "epoch": 1.95, "learning_rate": 7.34173015259953e-06, "loss": 0.0073, "step": 752680 }, { "epoch": 1.95, "learning_rate": 7.337841936228066e-06, "loss": 0.0097, "step": 752690 }, { "epoch": 1.95, "learning_rate": 7.333953719856602e-06, "loss": 0.006, "step": 752700 }, { "epoch": 1.95, "learning_rate": 7.330065503485137e-06, "loss": 0.0059, "step": 752710 }, { "epoch": 1.95, "learning_rate": 7.326177287113672e-06, "loss": 0.0075, "step": 752720 }, { "epoch": 1.95, "learning_rate": 7.322289070742208e-06, "loss": 0.0093, "step": 752730 }, { "epoch": 1.95, "learning_rate": 7.318400854370744e-06, "loss": 0.0073, "step": 752740 }, { "epoch": 1.95, "learning_rate": 7.314512637999279e-06, "loss": 0.0083, "step": 752750 }, { "epoch": 1.95, "learning_rate": 7.310624421627814e-06, "loss": 0.0089, "step": 752760 }, { "epoch": 1.95, "learning_rate": 7.30673620525635e-06, "loss": 0.0065, "step": 752770 }, { "epoch": 1.95, "learning_rate": 7.302847988884885e-06, "loss": 0.0063, "step": 752780 }, { "epoch": 1.95, "learning_rate": 7.298959772513421e-06, "loss": 0.0061, "step": 752790 }, { "epoch": 1.95, "learning_rate": 7.295071556141956e-06, "loss": 0.0093, "step": 752800 }, { "epoch": 1.95, "learning_rate": 7.29118333977049e-06, "loss": 0.0069, "step": 752810 }, { "epoch": 1.95, "learning_rate": 7.287295123399026e-06, "loss": 0.0093, "step": 752820 }, { "epoch": 1.95, "learning_rate": 7.283406907027562e-06, "loss": 0.0071, "step": 752830 }, { "epoch": 1.95, "learning_rate": 7.279518690656097e-06, "loss": 0.0049, "step": 752840 }, { "epoch": 1.95, "learning_rate": 7.275630474284632e-06, "loss": 0.0062, "step": 752850 }, { "epoch": 1.95, "learning_rate": 7.271742257913168e-06, "loss": 0.0067, "step": 752860 }, { "epoch": 1.95, "learning_rate": 7.267854041541703e-06, "loss": 0.009, "step": 752870 }, { "epoch": 1.95, "learning_rate": 7.263965825170239e-06, "loss": 0.006, "step": 752880 }, { "epoch": 1.95, "learning_rate": 7.260077608798774e-06, "loss": 0.0069, "step": 752890 }, { "epoch": 1.95, "learning_rate": 7.256189392427309e-06, "loss": 0.0075, "step": 752900 }, { "epoch": 1.95, "learning_rate": 7.252301176055845e-06, "loss": 0.0065, "step": 752910 }, { "epoch": 1.95, "learning_rate": 7.24841295968438e-06, "loss": 0.0055, "step": 752920 }, { "epoch": 1.95, "learning_rate": 7.244524743312915e-06, "loss": 0.0046, "step": 752930 }, { "epoch": 1.95, "learning_rate": 7.24063652694145e-06, "loss": 0.0054, "step": 752940 }, { "epoch": 1.95, "learning_rate": 7.236748310569986e-06, "loss": 0.0076, "step": 752950 }, { "epoch": 1.95, "learning_rate": 7.232860094198521e-06, "loss": 0.0065, "step": 752960 }, { "epoch": 1.95, "learning_rate": 7.228971877827057e-06, "loss": 0.0071, "step": 752970 }, { "epoch": 1.95, "learning_rate": 7.225083661455592e-06, "loss": 0.0084, "step": 752980 }, { "epoch": 1.95, "learning_rate": 7.221195445084127e-06, "loss": 0.0088, "step": 752990 }, { "epoch": 1.95, "learning_rate": 7.217307228712663e-06, "loss": 0.0054, "step": 753000 }, { "epoch": 1.95, "eval_cer": 0.8816774928583525, "eval_loss": 0.004489977844059467, "eval_runtime": 107.9347, "eval_samples_per_second": 18.53, "eval_steps_per_second": 4.632, "step": 753000 }, { "epoch": 1.95, "learning_rate": 7.213419012341199e-06, "loss": 0.0053, "step": 753010 }, { "epoch": 1.95, "learning_rate": 7.209530795969733e-06, "loss": 0.0079, "step": 753020 }, { "epoch": 1.95, "learning_rate": 7.205642579598268e-06, "loss": 0.0054, "step": 753030 }, { "epoch": 1.95, "learning_rate": 7.201754363226804e-06, "loss": 0.0088, "step": 753040 }, { "epoch": 1.95, "learning_rate": 7.19786614685534e-06, "loss": 0.0062, "step": 753050 }, { "epoch": 1.95, "learning_rate": 7.193977930483875e-06, "loss": 0.0068, "step": 753060 }, { "epoch": 1.95, "learning_rate": 7.19008971411241e-06, "loss": 0.0074, "step": 753070 }, { "epoch": 1.95, "learning_rate": 7.186201497740946e-06, "loss": 0.0065, "step": 753080 }, { "epoch": 1.95, "learning_rate": 7.182313281369481e-06, "loss": 0.0079, "step": 753090 }, { "epoch": 1.95, "learning_rate": 7.178425064998017e-06, "loss": 0.0045, "step": 753100 }, { "epoch": 1.95, "learning_rate": 7.174536848626552e-06, "loss": 0.0067, "step": 753110 }, { "epoch": 1.95, "learning_rate": 7.170648632255087e-06, "loss": 0.0067, "step": 753120 }, { "epoch": 1.95, "learning_rate": 7.166760415883623e-06, "loss": 0.0082, "step": 753130 }, { "epoch": 1.95, "learning_rate": 7.162872199512159e-06, "loss": 0.0066, "step": 753140 }, { "epoch": 1.95, "learning_rate": 7.158983983140693e-06, "loss": 0.0075, "step": 753150 }, { "epoch": 1.95, "learning_rate": 7.155095766769228e-06, "loss": 0.008, "step": 753160 }, { "epoch": 1.95, "learning_rate": 7.151207550397764e-06, "loss": 0.0071, "step": 753170 }, { "epoch": 1.95, "learning_rate": 7.147319334026299e-06, "loss": 0.0064, "step": 753180 }, { "epoch": 1.95, "learning_rate": 7.143431117654835e-06, "loss": 0.0085, "step": 753190 }, { "epoch": 1.95, "learning_rate": 7.13954290128337e-06, "loss": 0.0074, "step": 753200 }, { "epoch": 1.95, "learning_rate": 7.135654684911905e-06, "loss": 0.0051, "step": 753210 }, { "epoch": 1.95, "learning_rate": 7.131766468540441e-06, "loss": 0.0054, "step": 753220 }, { "epoch": 1.95, "learning_rate": 7.127878252168977e-06, "loss": 0.0082, "step": 753230 }, { "epoch": 1.95, "learning_rate": 7.1239900357975114e-06, "loss": 0.0055, "step": 753240 }, { "epoch": 1.95, "learning_rate": 7.120101819426047e-06, "loss": 0.0068, "step": 753250 }, { "epoch": 1.95, "learning_rate": 7.116213603054583e-06, "loss": 0.0116, "step": 753260 }, { "epoch": 1.95, "learning_rate": 7.112325386683117e-06, "loss": 0.0062, "step": 753270 }, { "epoch": 1.95, "learning_rate": 7.108437170311653e-06, "loss": 0.0052, "step": 753280 }, { "epoch": 1.95, "learning_rate": 7.104548953940188e-06, "loss": 0.0076, "step": 753290 }, { "epoch": 1.95, "learning_rate": 7.100660737568723e-06, "loss": 0.0051, "step": 753300 }, { "epoch": 1.95, "learning_rate": 7.096772521197259e-06, "loss": 0.0055, "step": 753310 }, { "epoch": 1.95, "learning_rate": 7.0928843048257946e-06, "loss": 0.0086, "step": 753320 }, { "epoch": 1.95, "learning_rate": 7.0889960884543294e-06, "loss": 0.0091, "step": 753330 }, { "epoch": 1.95, "learning_rate": 7.085107872082865e-06, "loss": 0.0059, "step": 753340 }, { "epoch": 1.95, "learning_rate": 7.081219655711401e-06, "loss": 0.0067, "step": 753350 }, { "epoch": 1.95, "learning_rate": 7.0773314393399366e-06, "loss": 0.0081, "step": 753360 }, { "epoch": 1.95, "learning_rate": 7.0734432229684706e-06, "loss": 0.0058, "step": 753370 }, { "epoch": 1.95, "learning_rate": 7.069555006597006e-06, "loss": 0.0053, "step": 753380 }, { "epoch": 1.95, "learning_rate": 7.065666790225542e-06, "loss": 0.0068, "step": 753390 }, { "epoch": 1.95, "learning_rate": 7.061778573854077e-06, "loss": 0.0078, "step": 753400 }, { "epoch": 1.95, "learning_rate": 7.0578903574826126e-06, "loss": 0.009, "step": 753410 }, { "epoch": 1.95, "learning_rate": 7.054002141111148e-06, "loss": 0.0085, "step": 753420 }, { "epoch": 1.95, "learning_rate": 7.050113924739683e-06, "loss": 0.0064, "step": 753430 }, { "epoch": 1.95, "learning_rate": 7.046225708368219e-06, "loss": 0.0067, "step": 753440 }, { "epoch": 1.95, "learning_rate": 7.0423374919967545e-06, "loss": 0.006, "step": 753450 }, { "epoch": 1.95, "learning_rate": 7.038449275625289e-06, "loss": 0.0066, "step": 753460 }, { "epoch": 1.95, "learning_rate": 7.034561059253825e-06, "loss": 0.0063, "step": 753470 }, { "epoch": 1.95, "learning_rate": 7.030672842882361e-06, "loss": 0.0054, "step": 753480 }, { "epoch": 1.95, "learning_rate": 7.026784626510895e-06, "loss": 0.0055, "step": 753490 }, { "epoch": 1.95, "learning_rate": 7.0228964101394305e-06, "loss": 0.0068, "step": 753500 }, { "epoch": 1.95, "learning_rate": 7.019008193767966e-06, "loss": 0.0063, "step": 753510 }, { "epoch": 1.95, "learning_rate": 7.015119977396501e-06, "loss": 0.0049, "step": 753520 }, { "epoch": 1.95, "learning_rate": 7.011231761025037e-06, "loss": 0.0075, "step": 753530 }, { "epoch": 1.95, "learning_rate": 7.0073435446535725e-06, "loss": 0.0059, "step": 753540 }, { "epoch": 1.95, "learning_rate": 7.003455328282107e-06, "loss": 0.0059, "step": 753550 }, { "epoch": 1.95, "learning_rate": 6.999567111910643e-06, "loss": 0.0094, "step": 753560 }, { "epoch": 1.95, "learning_rate": 6.995678895539179e-06, "loss": 0.0075, "step": 753570 }, { "epoch": 1.95, "learning_rate": 6.991790679167714e-06, "loss": 0.0078, "step": 753580 }, { "epoch": 1.95, "learning_rate": 6.987902462796249e-06, "loss": 0.0086, "step": 753590 }, { "epoch": 1.95, "learning_rate": 6.984014246424785e-06, "loss": 0.0092, "step": 753600 }, { "epoch": 1.95, "learning_rate": 6.980126030053319e-06, "loss": 0.0094, "step": 753610 }, { "epoch": 1.95, "learning_rate": 6.976237813681855e-06, "loss": 0.0061, "step": 753620 }, { "epoch": 1.95, "learning_rate": 6.9723495973103905e-06, "loss": 0.008, "step": 753630 }, { "epoch": 1.95, "learning_rate": 6.968461380938925e-06, "loss": 0.0059, "step": 753640 }, { "epoch": 1.95, "learning_rate": 6.964573164567461e-06, "loss": 0.0061, "step": 753650 }, { "epoch": 1.95, "learning_rate": 6.960684948195997e-06, "loss": 0.0074, "step": 753660 }, { "epoch": 1.95, "learning_rate": 6.9567967318245325e-06, "loss": 0.0068, "step": 753670 }, { "epoch": 1.95, "learning_rate": 6.952908515453067e-06, "loss": 0.0068, "step": 753680 }, { "epoch": 1.95, "learning_rate": 6.949020299081603e-06, "loss": 0.0072, "step": 753690 }, { "epoch": 1.95, "learning_rate": 6.945132082710139e-06, "loss": 0.0061, "step": 753700 }, { "epoch": 1.95, "learning_rate": 6.941243866338673e-06, "loss": 0.0071, "step": 753710 }, { "epoch": 1.95, "learning_rate": 6.9373556499672085e-06, "loss": 0.0067, "step": 753720 }, { "epoch": 1.95, "learning_rate": 6.933467433595744e-06, "loss": 0.0085, "step": 753730 }, { "epoch": 1.95, "learning_rate": 6.929579217224279e-06, "loss": 0.0068, "step": 753740 }, { "epoch": 1.95, "learning_rate": 6.925691000852815e-06, "loss": 0.0054, "step": 753750 }, { "epoch": 1.95, "learning_rate": 6.9218027844813505e-06, "loss": 0.0065, "step": 753760 }, { "epoch": 1.95, "learning_rate": 6.917914568109885e-06, "loss": 0.006, "step": 753770 }, { "epoch": 1.95, "learning_rate": 6.914026351738421e-06, "loss": 0.0056, "step": 753780 }, { "epoch": 1.95, "learning_rate": 6.910138135366957e-06, "loss": 0.0067, "step": 753790 }, { "epoch": 1.95, "learning_rate": 6.906249918995492e-06, "loss": 0.0051, "step": 753800 }, { "epoch": 1.95, "learning_rate": 6.902361702624027e-06, "loss": 0.0085, "step": 753810 }, { "epoch": 1.95, "learning_rate": 6.898473486252563e-06, "loss": 0.007, "step": 753820 }, { "epoch": 1.95, "learning_rate": 6.894585269881097e-06, "loss": 0.0057, "step": 753830 }, { "epoch": 1.95, "learning_rate": 6.890697053509633e-06, "loss": 0.0077, "step": 753840 }, { "epoch": 1.95, "learning_rate": 6.8868088371381685e-06, "loss": 0.0075, "step": 753850 }, { "epoch": 1.95, "learning_rate": 6.882920620766703e-06, "loss": 0.0072, "step": 753860 }, { "epoch": 1.95, "learning_rate": 6.879032404395239e-06, "loss": 0.0074, "step": 753870 }, { "epoch": 1.95, "learning_rate": 6.875144188023775e-06, "loss": 0.008, "step": 753880 }, { "epoch": 1.95, "learning_rate": 6.87125597165231e-06, "loss": 0.0053, "step": 753890 }, { "epoch": 1.95, "learning_rate": 6.867367755280845e-06, "loss": 0.0098, "step": 753900 }, { "epoch": 1.95, "learning_rate": 6.863479538909381e-06, "loss": 0.005, "step": 753910 }, { "epoch": 1.95, "learning_rate": 6.859591322537916e-06, "loss": 0.0065, "step": 753920 }, { "epoch": 1.95, "learning_rate": 6.855703106166452e-06, "loss": 0.0057, "step": 753930 }, { "epoch": 1.95, "learning_rate": 6.851814889794987e-06, "loss": 0.0073, "step": 753940 }, { "epoch": 1.95, "learning_rate": 6.847926673423521e-06, "loss": 0.0064, "step": 753950 }, { "epoch": 1.95, "learning_rate": 6.844038457052057e-06, "loss": 0.0063, "step": 753960 }, { "epoch": 1.95, "learning_rate": 6.840150240680593e-06, "loss": 0.0076, "step": 753970 }, { "epoch": 1.95, "learning_rate": 6.8362620243091285e-06, "loss": 0.0071, "step": 753980 }, { "epoch": 1.95, "learning_rate": 6.832373807937663e-06, "loss": 0.0063, "step": 753990 }, { "epoch": 1.95, "learning_rate": 6.828485591566199e-06, "loss": 0.006, "step": 754000 }, { "epoch": 1.95, "eval_cer": 0.8816760932214184, "eval_loss": 0.004459910560399294, "eval_runtime": 107.9724, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 754000 }, { "epoch": 1.95, "learning_rate": 6.824597375194735e-06, "loss": 0.0062, "step": 754010 }, { "epoch": 1.95, "learning_rate": 6.82070915882327e-06, "loss": 0.0076, "step": 754020 }, { "epoch": 1.95, "learning_rate": 6.816820942451805e-06, "loss": 0.0079, "step": 754030 }, { "epoch": 1.95, "learning_rate": 6.812932726080341e-06, "loss": 0.008, "step": 754040 }, { "epoch": 1.95, "learning_rate": 6.809044509708875e-06, "loss": 0.008, "step": 754050 }, { "epoch": 1.95, "learning_rate": 6.805156293337411e-06, "loss": 0.0057, "step": 754060 }, { "epoch": 1.95, "learning_rate": 6.8012680769659464e-06, "loss": 0.008, "step": 754070 }, { "epoch": 1.95, "learning_rate": 6.797379860594481e-06, "loss": 0.0081, "step": 754080 }, { "epoch": 1.95, "learning_rate": 6.793491644223017e-06, "loss": 0.0065, "step": 754090 }, { "epoch": 1.95, "learning_rate": 6.789603427851553e-06, "loss": 0.0068, "step": 754100 }, { "epoch": 1.95, "learning_rate": 6.785715211480088e-06, "loss": 0.0056, "step": 754110 }, { "epoch": 1.95, "learning_rate": 6.781826995108623e-06, "loss": 0.0077, "step": 754120 }, { "epoch": 1.95, "learning_rate": 6.777938778737159e-06, "loss": 0.0097, "step": 754130 }, { "epoch": 1.95, "learning_rate": 6.774050562365694e-06, "loss": 0.0074, "step": 754140 }, { "epoch": 1.95, "learning_rate": 6.77016234599423e-06, "loss": 0.009, "step": 754150 }, { "epoch": 1.95, "learning_rate": 6.766274129622765e-06, "loss": 0.0075, "step": 754160 }, { "epoch": 1.95, "learning_rate": 6.762385913251299e-06, "loss": 0.0057, "step": 754170 }, { "epoch": 1.95, "learning_rate": 6.758497696879835e-06, "loss": 0.0061, "step": 754180 }, { "epoch": 1.95, "learning_rate": 6.754609480508371e-06, "loss": 0.0056, "step": 754190 }, { "epoch": 1.95, "learning_rate": 6.750721264136906e-06, "loss": 0.0059, "step": 754200 }, { "epoch": 1.96, "learning_rate": 6.746833047765441e-06, "loss": 0.0063, "step": 754210 }, { "epoch": 1.96, "learning_rate": 6.742944831393977e-06, "loss": 0.0093, "step": 754220 }, { "epoch": 1.96, "learning_rate": 6.739056615022512e-06, "loss": 0.0056, "step": 754230 }, { "epoch": 1.96, "learning_rate": 6.7351683986510476e-06, "loss": 0.0058, "step": 754240 }, { "epoch": 1.96, "learning_rate": 6.731280182279583e-06, "loss": 0.0087, "step": 754250 }, { "epoch": 1.96, "learning_rate": 6.727391965908118e-06, "loss": 0.0067, "step": 754260 }, { "epoch": 1.96, "learning_rate": 6.723503749536654e-06, "loss": 0.0076, "step": 754270 }, { "epoch": 1.96, "learning_rate": 6.7196155331651896e-06, "loss": 0.0066, "step": 754280 }, { "epoch": 1.96, "learning_rate": 6.715727316793725e-06, "loss": 0.0061, "step": 754290 }, { "epoch": 1.96, "learning_rate": 6.711839100422259e-06, "loss": 0.0092, "step": 754300 }, { "epoch": 1.96, "learning_rate": 6.707950884050795e-06, "loss": 0.0063, "step": 754310 }, { "epoch": 1.96, "learning_rate": 6.704062667679331e-06, "loss": 0.0086, "step": 754320 }, { "epoch": 1.96, "learning_rate": 6.7001744513078656e-06, "loss": 0.0081, "step": 754330 }, { "epoch": 1.96, "learning_rate": 6.696286234936401e-06, "loss": 0.0074, "step": 754340 }, { "epoch": 1.96, "learning_rate": 6.692398018564937e-06, "loss": 0.0065, "step": 754350 }, { "epoch": 1.96, "learning_rate": 6.688509802193472e-06, "loss": 0.0055, "step": 754360 }, { "epoch": 1.96, "learning_rate": 6.6846215858220075e-06, "loss": 0.0072, "step": 754370 }, { "epoch": 1.96, "learning_rate": 6.680733369450543e-06, "loss": 0.0068, "step": 754380 }, { "epoch": 1.96, "learning_rate": 6.676845153079077e-06, "loss": 0.0072, "step": 754390 }, { "epoch": 1.96, "learning_rate": 6.672956936707613e-06, "loss": 0.0098, "step": 754400 }, { "epoch": 1.96, "learning_rate": 6.669068720336149e-06, "loss": 0.0069, "step": 754410 }, { "epoch": 1.96, "learning_rate": 6.6651805039646835e-06, "loss": 0.0061, "step": 754420 }, { "epoch": 1.96, "learning_rate": 6.661292287593219e-06, "loss": 0.0081, "step": 754430 }, { "epoch": 1.96, "learning_rate": 6.657404071221755e-06, "loss": 0.0079, "step": 754440 }, { "epoch": 1.96, "learning_rate": 6.65351585485029e-06, "loss": 0.0085, "step": 754450 }, { "epoch": 1.96, "learning_rate": 6.6496276384788255e-06, "loss": 0.0065, "step": 754460 }, { "epoch": 1.96, "learning_rate": 6.645739422107361e-06, "loss": 0.0051, "step": 754470 }, { "epoch": 1.96, "learning_rate": 6.641851205735896e-06, "loss": 0.0057, "step": 754480 }, { "epoch": 1.96, "learning_rate": 6.637962989364432e-06, "loss": 0.0053, "step": 754490 }, { "epoch": 1.96, "learning_rate": 6.6340747729929675e-06, "loss": 0.0075, "step": 754500 }, { "epoch": 1.96, "learning_rate": 6.6301865566215015e-06, "loss": 0.0077, "step": 754510 }, { "epoch": 1.96, "learning_rate": 6.626298340250037e-06, "loss": 0.0082, "step": 754520 }, { "epoch": 1.96, "learning_rate": 6.622410123878573e-06, "loss": 0.0085, "step": 754530 }, { "epoch": 1.96, "learning_rate": 6.618521907507108e-06, "loss": 0.007, "step": 754540 }, { "epoch": 1.96, "learning_rate": 6.6146336911356435e-06, "loss": 0.004, "step": 754550 }, { "epoch": 1.96, "learning_rate": 6.610745474764179e-06, "loss": 0.0095, "step": 754560 }, { "epoch": 1.96, "learning_rate": 6.606857258392714e-06, "loss": 0.006, "step": 754570 }, { "epoch": 1.96, "learning_rate": 6.60296904202125e-06, "loss": 0.0074, "step": 754580 }, { "epoch": 1.96, "learning_rate": 6.5990808256497855e-06, "loss": 0.0064, "step": 754590 }, { "epoch": 1.96, "learning_rate": 6.595192609278321e-06, "loss": 0.0059, "step": 754600 }, { "epoch": 1.96, "learning_rate": 6.591304392906856e-06, "loss": 0.0063, "step": 754610 }, { "epoch": 1.96, "learning_rate": 6.587416176535392e-06, "loss": 0.0054, "step": 754620 }, { "epoch": 1.96, "learning_rate": 6.5835279601639275e-06, "loss": 0.0044, "step": 754630 }, { "epoch": 1.96, "learning_rate": 6.5796397437924615e-06, "loss": 0.0057, "step": 754640 }, { "epoch": 1.96, "learning_rate": 6.575751527420997e-06, "loss": 0.0082, "step": 754650 }, { "epoch": 1.96, "learning_rate": 6.571863311049533e-06, "loss": 0.0094, "step": 754660 }, { "epoch": 1.96, "learning_rate": 6.567975094678068e-06, "loss": 0.0101, "step": 754670 }, { "epoch": 1.96, "learning_rate": 6.5640868783066035e-06, "loss": 0.0061, "step": 754680 }, { "epoch": 1.96, "learning_rate": 6.560198661935139e-06, "loss": 0.0056, "step": 754690 }, { "epoch": 1.96, "learning_rate": 6.556310445563674e-06, "loss": 0.0065, "step": 754700 }, { "epoch": 1.96, "learning_rate": 6.55242222919221e-06, "loss": 0.0092, "step": 754710 }, { "epoch": 1.96, "learning_rate": 6.5485340128207455e-06, "loss": 0.0079, "step": 754720 }, { "epoch": 1.96, "learning_rate": 6.5446457964492795e-06, "loss": 0.0071, "step": 754730 }, { "epoch": 1.96, "learning_rate": 6.540757580077815e-06, "loss": 0.0047, "step": 754740 }, { "epoch": 1.96, "learning_rate": 6.536869363706351e-06, "loss": 0.0087, "step": 754750 }, { "epoch": 1.96, "learning_rate": 6.532981147334886e-06, "loss": 0.0066, "step": 754760 }, { "epoch": 1.96, "learning_rate": 6.5290929309634215e-06, "loss": 0.0067, "step": 754770 }, { "epoch": 1.96, "learning_rate": 6.525204714591957e-06, "loss": 0.0104, "step": 754780 }, { "epoch": 1.96, "learning_rate": 6.521316498220492e-06, "loss": 0.0079, "step": 754790 }, { "epoch": 1.96, "learning_rate": 6.517428281849028e-06, "loss": 0.0071, "step": 754800 }, { "epoch": 1.96, "learning_rate": 6.5135400654775635e-06, "loss": 0.0085, "step": 754810 }, { "epoch": 1.96, "learning_rate": 6.509651849106098e-06, "loss": 0.0083, "step": 754820 }, { "epoch": 1.96, "learning_rate": 6.505763632734634e-06, "loss": 0.0062, "step": 754830 }, { "epoch": 1.96, "learning_rate": 6.50187541636317e-06, "loss": 0.0058, "step": 754840 }, { "epoch": 1.96, "learning_rate": 6.497987199991704e-06, "loss": 0.0095, "step": 754850 }, { "epoch": 1.96, "learning_rate": 6.4940989836202395e-06, "loss": 0.0058, "step": 754860 }, { "epoch": 1.96, "learning_rate": 6.490210767248775e-06, "loss": 0.0082, "step": 754870 }, { "epoch": 1.96, "learning_rate": 6.48632255087731e-06, "loss": 0.0056, "step": 754880 }, { "epoch": 1.96, "learning_rate": 6.482434334505846e-06, "loss": 0.0094, "step": 754890 }, { "epoch": 1.96, "learning_rate": 6.4785461181343815e-06, "loss": 0.0099, "step": 754900 }, { "epoch": 1.96, "learning_rate": 6.474657901762917e-06, "loss": 0.0051, "step": 754910 }, { "epoch": 1.96, "learning_rate": 6.470769685391452e-06, "loss": 0.0076, "step": 754920 }, { "epoch": 1.96, "learning_rate": 6.466881469019988e-06, "loss": 0.0081, "step": 754930 }, { "epoch": 1.96, "learning_rate": 6.4629932526485234e-06, "loss": 0.0094, "step": 754940 }, { "epoch": 1.96, "learning_rate": 6.459105036277058e-06, "loss": 0.0071, "step": 754950 }, { "epoch": 1.96, "learning_rate": 6.455216819905594e-06, "loss": 0.0077, "step": 754960 }, { "epoch": 1.96, "learning_rate": 6.45132860353413e-06, "loss": 0.0062, "step": 754970 }, { "epoch": 1.96, "learning_rate": 6.447440387162664e-06, "loss": 0.0063, "step": 754980 }, { "epoch": 1.96, "learning_rate": 6.4435521707911994e-06, "loss": 0.0062, "step": 754990 }, { "epoch": 1.96, "learning_rate": 6.439663954419735e-06, "loss": 0.0078, "step": 755000 }, { "epoch": 1.96, "eval_cer": 0.8816844910430235, "eval_loss": 0.004422630183398724, "eval_runtime": 107.997, "eval_samples_per_second": 18.519, "eval_steps_per_second": 4.63, "step": 755000 }, { "epoch": 1.96, "learning_rate": 6.43577573804827e-06, "loss": 0.0054, "step": 755010 }, { "epoch": 1.96, "learning_rate": 6.431887521676806e-06, "loss": 0.0058, "step": 755020 }, { "epoch": 1.96, "learning_rate": 6.4279993053053414e-06, "loss": 0.0085, "step": 755030 }, { "epoch": 1.96, "learning_rate": 6.424111088933876e-06, "loss": 0.0067, "step": 755040 }, { "epoch": 1.96, "learning_rate": 6.420222872562412e-06, "loss": 0.0135, "step": 755050 }, { "epoch": 1.96, "learning_rate": 6.416334656190948e-06, "loss": 0.0077, "step": 755060 }, { "epoch": 1.96, "learning_rate": 6.412446439819482e-06, "loss": 0.0065, "step": 755070 }, { "epoch": 1.96, "learning_rate": 6.4085582234480174e-06, "loss": 0.0071, "step": 755080 }, { "epoch": 1.96, "learning_rate": 6.404670007076553e-06, "loss": 0.0072, "step": 755090 }, { "epoch": 1.96, "learning_rate": 6.400781790705088e-06, "loss": 0.0056, "step": 755100 }, { "epoch": 1.96, "learning_rate": 6.396893574333624e-06, "loss": 0.0062, "step": 755110 }, { "epoch": 1.96, "learning_rate": 6.3930053579621594e-06, "loss": 0.0085, "step": 755120 }, { "epoch": 1.96, "learning_rate": 6.389117141590694e-06, "loss": 0.0079, "step": 755130 }, { "epoch": 1.96, "learning_rate": 6.38522892521923e-06, "loss": 0.0084, "step": 755140 }, { "epoch": 1.96, "learning_rate": 6.381340708847766e-06, "loss": 0.0051, "step": 755150 }, { "epoch": 1.96, "learning_rate": 6.3774524924763006e-06, "loss": 0.0068, "step": 755160 }, { "epoch": 1.96, "learning_rate": 6.373564276104836e-06, "loss": 0.007, "step": 755170 }, { "epoch": 1.96, "learning_rate": 6.369676059733372e-06, "loss": 0.0063, "step": 755180 }, { "epoch": 1.96, "learning_rate": 6.365787843361908e-06, "loss": 0.0078, "step": 755190 }, { "epoch": 1.96, "learning_rate": 6.361899626990442e-06, "loss": 0.008, "step": 755200 }, { "epoch": 1.96, "learning_rate": 6.358011410618977e-06, "loss": 0.0065, "step": 755210 }, { "epoch": 1.96, "learning_rate": 6.354123194247513e-06, "loss": 0.0084, "step": 755220 }, { "epoch": 1.96, "learning_rate": 6.350234977876048e-06, "loss": 0.0087, "step": 755230 }, { "epoch": 1.96, "learning_rate": 6.346346761504584e-06, "loss": 0.0092, "step": 755240 }, { "epoch": 1.96, "learning_rate": 6.342458545133119e-06, "loss": 0.0067, "step": 755250 }, { "epoch": 1.96, "learning_rate": 6.338570328761654e-06, "loss": 0.0062, "step": 755260 }, { "epoch": 1.96, "learning_rate": 6.33468211239019e-06, "loss": 0.0083, "step": 755270 }, { "epoch": 1.96, "learning_rate": 6.330793896018726e-06, "loss": 0.0062, "step": 755280 }, { "epoch": 1.96, "learning_rate": 6.3269056796472605e-06, "loss": 0.0059, "step": 755290 }, { "epoch": 1.96, "learning_rate": 6.323017463275796e-06, "loss": 0.0059, "step": 755300 }, { "epoch": 1.96, "learning_rate": 6.319129246904332e-06, "loss": 0.0055, "step": 755310 }, { "epoch": 1.96, "learning_rate": 6.315241030532866e-06, "loss": 0.0063, "step": 755320 }, { "epoch": 1.96, "learning_rate": 6.311352814161402e-06, "loss": 0.0054, "step": 755330 }, { "epoch": 1.96, "learning_rate": 6.307464597789937e-06, "loss": 0.006, "step": 755340 }, { "epoch": 1.96, "learning_rate": 6.303576381418472e-06, "loss": 0.0057, "step": 755350 }, { "epoch": 1.96, "learning_rate": 6.299688165047008e-06, "loss": 0.0105, "step": 755360 }, { "epoch": 1.96, "learning_rate": 6.295799948675544e-06, "loss": 0.0091, "step": 755370 }, { "epoch": 1.96, "learning_rate": 6.2919117323040785e-06, "loss": 0.0088, "step": 755380 }, { "epoch": 1.96, "learning_rate": 6.288023515932614e-06, "loss": 0.0072, "step": 755390 }, { "epoch": 1.96, "learning_rate": 6.28413529956115e-06, "loss": 0.0071, "step": 755400 }, { "epoch": 1.96, "learning_rate": 6.280247083189684e-06, "loss": 0.0065, "step": 755410 }, { "epoch": 1.96, "learning_rate": 6.27635886681822e-06, "loss": 0.0075, "step": 755420 }, { "epoch": 1.96, "learning_rate": 6.272470650446755e-06, "loss": 0.0036, "step": 755430 }, { "epoch": 1.96, "learning_rate": 6.26858243407529e-06, "loss": 0.0061, "step": 755440 }, { "epoch": 1.96, "learning_rate": 6.264694217703826e-06, "loss": 0.005, "step": 755450 }, { "epoch": 1.96, "learning_rate": 6.260806001332362e-06, "loss": 0.008, "step": 755460 }, { "epoch": 1.96, "learning_rate": 6.2569177849608965e-06, "loss": 0.0066, "step": 755470 }, { "epoch": 1.96, "learning_rate": 6.253029568589432e-06, "loss": 0.0064, "step": 755480 }, { "epoch": 1.96, "learning_rate": 6.249141352217968e-06, "loss": 0.0064, "step": 755490 }, { "epoch": 1.96, "learning_rate": 6.245253135846504e-06, "loss": 0.0071, "step": 755500 }, { "epoch": 1.96, "learning_rate": 6.2413649194750385e-06, "loss": 0.0072, "step": 755510 }, { "epoch": 1.96, "learning_rate": 6.237476703103574e-06, "loss": 0.0065, "step": 755520 }, { "epoch": 1.96, "learning_rate": 6.23358848673211e-06, "loss": 0.0065, "step": 755530 }, { "epoch": 1.96, "learning_rate": 6.229700270360644e-06, "loss": 0.0054, "step": 755540 }, { "epoch": 1.96, "learning_rate": 6.22581205398918e-06, "loss": 0.0073, "step": 755550 }, { "epoch": 1.96, "learning_rate": 6.221923837617715e-06, "loss": 0.0056, "step": 755560 }, { "epoch": 1.96, "learning_rate": 6.21803562124625e-06, "loss": 0.0082, "step": 755570 }, { "epoch": 1.96, "learning_rate": 6.214147404874786e-06, "loss": 0.0073, "step": 755580 }, { "epoch": 1.96, "learning_rate": 6.210259188503322e-06, "loss": 0.0059, "step": 755590 }, { "epoch": 1.96, "learning_rate": 6.2063709721318565e-06, "loss": 0.0064, "step": 755600 }, { "epoch": 1.96, "learning_rate": 6.202482755760392e-06, "loss": 0.0072, "step": 755610 }, { "epoch": 1.96, "learning_rate": 6.198594539388928e-06, "loss": 0.0047, "step": 755620 }, { "epoch": 1.96, "learning_rate": 6.194706323017463e-06, "loss": 0.008, "step": 755630 }, { "epoch": 1.96, "learning_rate": 6.1908181066459985e-06, "loss": 0.0072, "step": 755640 }, { "epoch": 1.96, "learning_rate": 6.186929890274534e-06, "loss": 0.0095, "step": 755650 }, { "epoch": 1.96, "learning_rate": 6.183041673903068e-06, "loss": 0.0085, "step": 755660 }, { "epoch": 1.96, "learning_rate": 6.179153457531604e-06, "loss": 0.0068, "step": 755670 }, { "epoch": 1.96, "learning_rate": 6.17526524116014e-06, "loss": 0.0082, "step": 755680 }, { "epoch": 1.96, "learning_rate": 6.1713770247886745e-06, "loss": 0.0069, "step": 755690 }, { "epoch": 1.96, "learning_rate": 6.16748880841721e-06, "loss": 0.0056, "step": 755700 }, { "epoch": 1.96, "learning_rate": 6.163600592045746e-06, "loss": 0.007, "step": 755710 }, { "epoch": 1.96, "learning_rate": 6.159712375674281e-06, "loss": 0.0061, "step": 755720 }, { "epoch": 1.96, "learning_rate": 6.1558241593028165e-06, "loss": 0.0056, "step": 755730 }, { "epoch": 1.96, "learning_rate": 6.151935942931352e-06, "loss": 0.0082, "step": 755740 }, { "epoch": 1.96, "learning_rate": 6.148047726559886e-06, "loss": 0.0097, "step": 755750 }, { "epoch": 1.96, "learning_rate": 6.144159510188422e-06, "loss": 0.0053, "step": 755760 }, { "epoch": 1.96, "learning_rate": 6.140271293816958e-06, "loss": 0.0062, "step": 755770 }, { "epoch": 1.96, "learning_rate": 6.1363830774454925e-06, "loss": 0.0054, "step": 755780 }, { "epoch": 1.96, "learning_rate": 6.132494861074028e-06, "loss": 0.0079, "step": 755790 }, { "epoch": 1.96, "learning_rate": 6.128606644702564e-06, "loss": 0.0065, "step": 755800 }, { "epoch": 1.96, "learning_rate": 6.1247184283311e-06, "loss": 0.0078, "step": 755810 }, { "epoch": 1.96, "learning_rate": 6.1208302119596345e-06, "loss": 0.0064, "step": 755820 }, { "epoch": 1.96, "learning_rate": 6.11694199558817e-06, "loss": 0.009, "step": 755830 }, { "epoch": 1.96, "learning_rate": 6.113053779216706e-06, "loss": 0.005, "step": 755840 }, { "epoch": 1.96, "learning_rate": 6.109165562845241e-06, "loss": 0.009, "step": 755850 }, { "epoch": 1.96, "learning_rate": 6.1052773464737764e-06, "loss": 0.0091, "step": 755860 }, { "epoch": 1.96, "learning_rate": 6.101389130102312e-06, "loss": 0.006, "step": 755870 }, { "epoch": 1.96, "learning_rate": 6.097500913730846e-06, "loss": 0.0078, "step": 755880 }, { "epoch": 1.96, "learning_rate": 6.093612697359382e-06, "loss": 0.0071, "step": 755890 }, { "epoch": 1.96, "learning_rate": 6.089724480987918e-06, "loss": 0.0097, "step": 755900 }, { "epoch": 1.96, "learning_rate": 6.0858362646164524e-06, "loss": 0.0069, "step": 755910 }, { "epoch": 1.96, "learning_rate": 6.081948048244988e-06, "loss": 0.0061, "step": 755920 }, { "epoch": 1.96, "learning_rate": 6.078059831873524e-06, "loss": 0.0092, "step": 755930 }, { "epoch": 1.96, "learning_rate": 6.074171615502059e-06, "loss": 0.0051, "step": 755940 }, { "epoch": 1.96, "learning_rate": 6.0702833991305944e-06, "loss": 0.0051, "step": 755950 }, { "epoch": 1.96, "learning_rate": 6.06639518275913e-06, "loss": 0.0075, "step": 755960 }, { "epoch": 1.96, "learning_rate": 6.062506966387665e-06, "loss": 0.0075, "step": 755970 }, { "epoch": 1.96, "learning_rate": 6.058618750016201e-06, "loss": 0.0083, "step": 755980 }, { "epoch": 1.96, "learning_rate": 6.054730533644736e-06, "loss": 0.0068, "step": 755990 }, { "epoch": 1.96, "learning_rate": 6.0508423172732704e-06, "loss": 0.0069, "step": 756000 }, { "epoch": 1.96, "eval_cer": 0.8816816917691551, "eval_loss": 0.0044304681941866875, "eval_runtime": 107.8956, "eval_samples_per_second": 18.536, "eval_steps_per_second": 4.634, "step": 756000 }, { "epoch": 1.96, "learning_rate": 6.046954100901806e-06, "loss": 0.0073, "step": 756010 }, { "epoch": 1.96, "learning_rate": 6.043065884530342e-06, "loss": 0.0079, "step": 756020 }, { "epoch": 1.96, "learning_rate": 6.039177668158877e-06, "loss": 0.0056, "step": 756030 }, { "epoch": 1.96, "learning_rate": 6.035289451787412e-06, "loss": 0.0072, "step": 756040 }, { "epoch": 1.96, "learning_rate": 6.031401235415948e-06, "loss": 0.0086, "step": 756050 }, { "epoch": 1.96, "learning_rate": 6.027513019044483e-06, "loss": 0.0083, "step": 756060 }, { "epoch": 1.96, "learning_rate": 6.023624802673019e-06, "loss": 0.0082, "step": 756070 }, { "epoch": 1.96, "learning_rate": 6.019736586301554e-06, "loss": 0.0087, "step": 756080 }, { "epoch": 1.96, "learning_rate": 6.0158483699300884e-06, "loss": 0.005, "step": 756090 }, { "epoch": 1.96, "learning_rate": 6.011960153558624e-06, "loss": 0.0061, "step": 756100 }, { "epoch": 1.96, "learning_rate": 6.00807193718716e-06, "loss": 0.0051, "step": 756110 }, { "epoch": 1.96, "learning_rate": 6.0041837208156956e-06, "loss": 0.0056, "step": 756120 }, { "epoch": 1.96, "learning_rate": 6.00029550444423e-06, "loss": 0.0057, "step": 756130 }, { "epoch": 1.96, "learning_rate": 5.996407288072766e-06, "loss": 0.0071, "step": 756140 }, { "epoch": 1.96, "learning_rate": 5.992519071701302e-06, "loss": 0.0122, "step": 756150 }, { "epoch": 1.96, "learning_rate": 5.988630855329837e-06, "loss": 0.0069, "step": 756160 }, { "epoch": 1.96, "learning_rate": 5.984742638958372e-06, "loss": 0.0075, "step": 756170 }, { "epoch": 1.96, "learning_rate": 5.980854422586908e-06, "loss": 0.0071, "step": 756180 }, { "epoch": 1.96, "learning_rate": 5.976966206215443e-06, "loss": 0.0062, "step": 756190 }, { "epoch": 1.96, "learning_rate": 5.973077989843979e-06, "loss": 0.0057, "step": 756200 }, { "epoch": 1.96, "learning_rate": 5.969189773472514e-06, "loss": 0.0093, "step": 756210 }, { "epoch": 1.96, "learning_rate": 5.965301557101048e-06, "loss": 0.0072, "step": 756220 }, { "epoch": 1.96, "learning_rate": 5.961413340729584e-06, "loss": 0.0097, "step": 756230 }, { "epoch": 1.96, "learning_rate": 5.95752512435812e-06, "loss": 0.0069, "step": 756240 }, { "epoch": 1.96, "learning_rate": 5.953636907986655e-06, "loss": 0.0054, "step": 756250 }, { "epoch": 1.96, "learning_rate": 5.94974869161519e-06, "loss": 0.0041, "step": 756260 }, { "epoch": 1.96, "learning_rate": 5.945860475243726e-06, "loss": 0.0062, "step": 756270 }, { "epoch": 1.96, "learning_rate": 5.941972258872261e-06, "loss": 0.0067, "step": 756280 }, { "epoch": 1.96, "learning_rate": 5.938084042500797e-06, "loss": 0.008, "step": 756290 }, { "epoch": 1.96, "learning_rate": 5.934195826129332e-06, "loss": 0.0056, "step": 756300 }, { "epoch": 1.96, "learning_rate": 5.930307609757867e-06, "loss": 0.0058, "step": 756310 }, { "epoch": 1.96, "learning_rate": 5.926419393386403e-06, "loss": 0.0099, "step": 756320 }, { "epoch": 1.96, "learning_rate": 5.922531177014939e-06, "loss": 0.006, "step": 756330 }, { "epoch": 1.96, "learning_rate": 5.918642960643473e-06, "loss": 0.0071, "step": 756340 }, { "epoch": 1.96, "learning_rate": 5.914754744272008e-06, "loss": 0.0066, "step": 756350 }, { "epoch": 1.96, "learning_rate": 5.910866527900544e-06, "loss": 0.0059, "step": 756360 }, { "epoch": 1.96, "learning_rate": 5.906978311529079e-06, "loss": 0.0077, "step": 756370 }, { "epoch": 1.96, "learning_rate": 5.903090095157615e-06, "loss": 0.007, "step": 756380 }, { "epoch": 1.96, "learning_rate": 5.89920187878615e-06, "loss": 0.0081, "step": 756390 }, { "epoch": 1.96, "learning_rate": 5.895313662414685e-06, "loss": 0.0077, "step": 756400 }, { "epoch": 1.96, "learning_rate": 5.891425446043221e-06, "loss": 0.0068, "step": 756410 }, { "epoch": 1.96, "learning_rate": 5.887537229671757e-06, "loss": 0.0069, "step": 756420 }, { "epoch": 1.96, "learning_rate": 5.883649013300292e-06, "loss": 0.007, "step": 756430 }, { "epoch": 1.96, "learning_rate": 5.879760796928826e-06, "loss": 0.0067, "step": 756440 }, { "epoch": 1.96, "learning_rate": 5.875872580557362e-06, "loss": 0.005, "step": 756450 }, { "epoch": 1.96, "learning_rate": 5.871984364185898e-06, "loss": 0.0052, "step": 756460 }, { "epoch": 1.96, "learning_rate": 5.868096147814433e-06, "loss": 0.0071, "step": 756470 }, { "epoch": 1.96, "learning_rate": 5.864207931442968e-06, "loss": 0.0078, "step": 756480 }, { "epoch": 1.96, "learning_rate": 5.860319715071504e-06, "loss": 0.0078, "step": 756490 }, { "epoch": 1.96, "learning_rate": 5.856431498700039e-06, "loss": 0.0068, "step": 756500 }, { "epoch": 1.96, "learning_rate": 5.852543282328575e-06, "loss": 0.0056, "step": 756510 }, { "epoch": 1.96, "learning_rate": 5.84865506595711e-06, "loss": 0.005, "step": 756520 }, { "epoch": 1.96, "learning_rate": 5.844766849585645e-06, "loss": 0.0088, "step": 756530 }, { "epoch": 1.96, "learning_rate": 5.840878633214181e-06, "loss": 0.006, "step": 756540 }, { "epoch": 1.96, "learning_rate": 5.836990416842717e-06, "loss": 0.0081, "step": 756550 }, { "epoch": 1.96, "learning_rate": 5.833102200471251e-06, "loss": 0.0099, "step": 756560 }, { "epoch": 1.96, "learning_rate": 5.829213984099786e-06, "loss": 0.0084, "step": 756570 }, { "epoch": 1.96, "learning_rate": 5.825325767728322e-06, "loss": 0.0057, "step": 756580 }, { "epoch": 1.96, "learning_rate": 5.821437551356857e-06, "loss": 0.0056, "step": 756590 }, { "epoch": 1.96, "learning_rate": 5.817549334985393e-06, "loss": 0.008, "step": 756600 }, { "epoch": 1.96, "learning_rate": 5.813661118613928e-06, "loss": 0.0078, "step": 756610 }, { "epoch": 1.96, "learning_rate": 5.809772902242463e-06, "loss": 0.008, "step": 756620 }, { "epoch": 1.96, "learning_rate": 5.805884685870999e-06, "loss": 0.0071, "step": 756630 }, { "epoch": 1.96, "learning_rate": 5.801996469499535e-06, "loss": 0.0104, "step": 756640 }, { "epoch": 1.96, "learning_rate": 5.7981082531280695e-06, "loss": 0.0068, "step": 756650 }, { "epoch": 1.96, "learning_rate": 5.794220036756605e-06, "loss": 0.0051, "step": 756660 }, { "epoch": 1.96, "learning_rate": 5.790331820385141e-06, "loss": 0.0064, "step": 756670 }, { "epoch": 1.96, "learning_rate": 5.786443604013675e-06, "loss": 0.0067, "step": 756680 }, { "epoch": 1.96, "learning_rate": 5.782555387642211e-06, "loss": 0.0071, "step": 756690 }, { "epoch": 1.96, "learning_rate": 5.778667171270746e-06, "loss": 0.0057, "step": 756700 }, { "epoch": 1.96, "learning_rate": 5.774778954899281e-06, "loss": 0.009, "step": 756710 }, { "epoch": 1.96, "learning_rate": 5.770890738527817e-06, "loss": 0.0113, "step": 756720 }, { "epoch": 1.96, "learning_rate": 5.767002522156353e-06, "loss": 0.0093, "step": 756730 }, { "epoch": 1.96, "learning_rate": 5.763114305784888e-06, "loss": 0.0065, "step": 756740 }, { "epoch": 1.96, "learning_rate": 5.759226089413423e-06, "loss": 0.0061, "step": 756750 }, { "epoch": 1.96, "learning_rate": 5.755337873041959e-06, "loss": 0.0059, "step": 756760 }, { "epoch": 1.96, "learning_rate": 5.751449656670495e-06, "loss": 0.0078, "step": 756770 }, { "epoch": 1.96, "learning_rate": 5.747561440299029e-06, "loss": 0.0052, "step": 756780 }, { "epoch": 1.96, "learning_rate": 5.743673223927564e-06, "loss": 0.007, "step": 756790 }, { "epoch": 1.96, "learning_rate": 5.7397850075561e-06, "loss": 0.0074, "step": 756800 }, { "epoch": 1.96, "learning_rate": 5.735896791184635e-06, "loss": 0.0094, "step": 756810 }, { "epoch": 1.96, "learning_rate": 5.732008574813171e-06, "loss": 0.0057, "step": 756820 }, { "epoch": 1.96, "learning_rate": 5.728120358441706e-06, "loss": 0.0088, "step": 756830 }, { "epoch": 1.96, "learning_rate": 5.724232142070241e-06, "loss": 0.007, "step": 756840 }, { "epoch": 1.96, "learning_rate": 5.720343925698777e-06, "loss": 0.0072, "step": 756850 }, { "epoch": 1.96, "learning_rate": 5.7164557093273126e-06, "loss": 0.0055, "step": 756860 }, { "epoch": 1.96, "learning_rate": 5.7125674929558474e-06, "loss": 0.0086, "step": 756870 }, { "epoch": 1.96, "learning_rate": 5.708679276584383e-06, "loss": 0.0069, "step": 756880 }, { "epoch": 1.96, "learning_rate": 5.704791060212919e-06, "loss": 0.0079, "step": 756890 }, { "epoch": 1.96, "learning_rate": 5.700902843841453e-06, "loss": 0.0082, "step": 756900 }, { "epoch": 1.96, "learning_rate": 5.6970146274699886e-06, "loss": 0.0063, "step": 756910 }, { "epoch": 1.96, "learning_rate": 5.693126411098524e-06, "loss": 0.007, "step": 756920 }, { "epoch": 1.96, "learning_rate": 5.689238194727059e-06, "loss": 0.0069, "step": 756930 }, { "epoch": 1.96, "learning_rate": 5.685349978355595e-06, "loss": 0.0062, "step": 756940 }, { "epoch": 1.96, "learning_rate": 5.6814617619841306e-06, "loss": 0.0052, "step": 756950 }, { "epoch": 1.96, "learning_rate": 5.677573545612665e-06, "loss": 0.0073, "step": 756960 }, { "epoch": 1.96, "learning_rate": 5.673685329241201e-06, "loss": 0.0082, "step": 756970 }, { "epoch": 1.96, "learning_rate": 5.669797112869737e-06, "loss": 0.0057, "step": 756980 }, { "epoch": 1.96, "learning_rate": 5.665908896498272e-06, "loss": 0.0066, "step": 756990 }, { "epoch": 1.96, "learning_rate": 5.662020680126807e-06, "loss": 0.0082, "step": 757000 }, { "epoch": 1.96, "eval_cer": 0.8816760932214184, "eval_loss": 0.004407000262290239, "eval_runtime": 107.9473, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 757000 }, { "epoch": 1.96, "learning_rate": 5.658132463755343e-06, "loss": 0.0073, "step": 757010 }, { "epoch": 1.96, "learning_rate": 5.654244247383877e-06, "loss": 0.0082, "step": 757020 }, { "epoch": 1.96, "learning_rate": 5.650356031012413e-06, "loss": 0.0049, "step": 757030 }, { "epoch": 1.96, "learning_rate": 5.6464678146409485e-06, "loss": 0.007, "step": 757040 }, { "epoch": 1.96, "learning_rate": 5.642579598269484e-06, "loss": 0.0073, "step": 757050 }, { "epoch": 1.96, "learning_rate": 5.638691381898019e-06, "loss": 0.0067, "step": 757060 }, { "epoch": 1.96, "learning_rate": 5.634803165526555e-06, "loss": 0.0075, "step": 757070 }, { "epoch": 1.96, "learning_rate": 5.6309149491550905e-06, "loss": 0.0078, "step": 757080 }, { "epoch": 1.96, "learning_rate": 5.627026732783625e-06, "loss": 0.0083, "step": 757090 }, { "epoch": 1.96, "learning_rate": 5.623138516412161e-06, "loss": 0.0063, "step": 757100 }, { "epoch": 1.96, "learning_rate": 5.619250300040697e-06, "loss": 0.0083, "step": 757110 }, { "epoch": 1.96, "learning_rate": 5.615362083669231e-06, "loss": 0.0077, "step": 757120 }, { "epoch": 1.96, "learning_rate": 5.6114738672977665e-06, "loss": 0.0086, "step": 757130 }, { "epoch": 1.96, "learning_rate": 5.607585650926302e-06, "loss": 0.0058, "step": 757140 }, { "epoch": 1.96, "learning_rate": 5.603697434554837e-06, "loss": 0.0081, "step": 757150 }, { "epoch": 1.96, "learning_rate": 5.599809218183373e-06, "loss": 0.0107, "step": 757160 }, { "epoch": 1.96, "learning_rate": 5.5959210018119085e-06, "loss": 0.0085, "step": 757170 }, { "epoch": 1.96, "learning_rate": 5.592032785440443e-06, "loss": 0.0056, "step": 757180 }, { "epoch": 1.96, "learning_rate": 5.588144569068979e-06, "loss": 0.0084, "step": 757190 }, { "epoch": 1.96, "learning_rate": 5.584256352697515e-06, "loss": 0.0063, "step": 757200 }, { "epoch": 1.96, "learning_rate": 5.58036813632605e-06, "loss": 0.008, "step": 757210 }, { "epoch": 1.96, "learning_rate": 5.576479919954585e-06, "loss": 0.0051, "step": 757220 }, { "epoch": 1.96, "learning_rate": 5.572591703583121e-06, "loss": 0.0059, "step": 757230 }, { "epoch": 1.96, "learning_rate": 5.568703487211655e-06, "loss": 0.0052, "step": 757240 }, { "epoch": 1.96, "learning_rate": 5.564815270840191e-06, "loss": 0.0106, "step": 757250 }, { "epoch": 1.96, "learning_rate": 5.5609270544687265e-06, "loss": 0.0087, "step": 757260 }, { "epoch": 1.96, "learning_rate": 5.557038838097261e-06, "loss": 0.006, "step": 757270 }, { "epoch": 1.96, "learning_rate": 5.553150621725797e-06, "loss": 0.0062, "step": 757280 }, { "epoch": 1.96, "learning_rate": 5.549262405354333e-06, "loss": 0.0055, "step": 757290 }, { "epoch": 1.96, "learning_rate": 5.545374188982868e-06, "loss": 0.0075, "step": 757300 }, { "epoch": 1.96, "learning_rate": 5.541485972611403e-06, "loss": 0.0055, "step": 757310 }, { "epoch": 1.96, "learning_rate": 5.537597756239939e-06, "loss": 0.0119, "step": 757320 }, { "epoch": 1.96, "learning_rate": 5.533709539868474e-06, "loss": 0.0042, "step": 757330 }, { "epoch": 1.96, "learning_rate": 5.52982132349701e-06, "loss": 0.0053, "step": 757340 }, { "epoch": 1.96, "learning_rate": 5.525933107125545e-06, "loss": 0.0065, "step": 757350 }, { "epoch": 1.96, "learning_rate": 5.522044890754081e-06, "loss": 0.0092, "step": 757360 }, { "epoch": 1.96, "learning_rate": 5.518156674382615e-06, "loss": 0.0082, "step": 757370 }, { "epoch": 1.96, "learning_rate": 5.514268458011151e-06, "loss": 0.0089, "step": 757380 }, { "epoch": 1.96, "learning_rate": 5.5103802416396865e-06, "loss": 0.0066, "step": 757390 }, { "epoch": 1.96, "learning_rate": 5.506492025268221e-06, "loss": 0.0072, "step": 757400 }, { "epoch": 1.96, "learning_rate": 5.502603808896757e-06, "loss": 0.011, "step": 757410 }, { "epoch": 1.96, "learning_rate": 5.498715592525293e-06, "loss": 0.0061, "step": 757420 }, { "epoch": 1.96, "learning_rate": 5.494827376153828e-06, "loss": 0.0093, "step": 757430 }, { "epoch": 1.96, "learning_rate": 5.490939159782363e-06, "loss": 0.008, "step": 757440 }, { "epoch": 1.96, "learning_rate": 5.487050943410899e-06, "loss": 0.0062, "step": 757450 }, { "epoch": 1.96, "learning_rate": 5.483162727039434e-06, "loss": 0.0064, "step": 757460 }, { "epoch": 1.96, "learning_rate": 5.479274510667969e-06, "loss": 0.0061, "step": 757470 }, { "epoch": 1.96, "learning_rate": 5.4753862942965045e-06, "loss": 0.0057, "step": 757480 }, { "epoch": 1.96, "learning_rate": 5.471498077925039e-06, "loss": 0.0066, "step": 757490 }, { "epoch": 1.96, "learning_rate": 5.467609861553575e-06, "loss": 0.0073, "step": 757500 }, { "epoch": 1.96, "learning_rate": 5.463721645182111e-06, "loss": 0.0083, "step": 757510 }, { "epoch": 1.96, "learning_rate": 5.459833428810646e-06, "loss": 0.0101, "step": 757520 }, { "epoch": 1.96, "learning_rate": 5.455945212439181e-06, "loss": 0.0071, "step": 757530 }, { "epoch": 1.96, "learning_rate": 5.452056996067717e-06, "loss": 0.0057, "step": 757540 }, { "epoch": 1.96, "learning_rate": 5.448168779696252e-06, "loss": 0.0063, "step": 757550 }, { "epoch": 1.96, "learning_rate": 5.444280563324788e-06, "loss": 0.0066, "step": 757560 }, { "epoch": 1.96, "learning_rate": 5.440392346953323e-06, "loss": 0.0088, "step": 757570 }, { "epoch": 1.96, "learning_rate": 5.436504130581857e-06, "loss": 0.0082, "step": 757580 }, { "epoch": 1.96, "learning_rate": 5.432615914210393e-06, "loss": 0.0072, "step": 757590 }, { "epoch": 1.96, "learning_rate": 5.428727697838929e-06, "loss": 0.0094, "step": 757600 }, { "epoch": 1.96, "learning_rate": 5.424839481467464e-06, "loss": 0.0094, "step": 757610 }, { "epoch": 1.96, "learning_rate": 5.420951265095999e-06, "loss": 0.0076, "step": 757620 }, { "epoch": 1.96, "learning_rate": 5.417063048724535e-06, "loss": 0.0073, "step": 757630 }, { "epoch": 1.96, "learning_rate": 5.413174832353071e-06, "loss": 0.0058, "step": 757640 }, { "epoch": 1.96, "learning_rate": 5.409286615981606e-06, "loss": 0.007, "step": 757650 }, { "epoch": 1.96, "learning_rate": 5.405398399610141e-06, "loss": 0.0109, "step": 757660 }, { "epoch": 1.96, "learning_rate": 5.401510183238677e-06, "loss": 0.0061, "step": 757670 }, { "epoch": 1.96, "learning_rate": 5.397621966867212e-06, "loss": 0.0084, "step": 757680 }, { "epoch": 1.96, "learning_rate": 5.393733750495748e-06, "loss": 0.0082, "step": 757690 }, { "epoch": 1.96, "learning_rate": 5.389845534124283e-06, "loss": 0.0064, "step": 757700 }, { "epoch": 1.96, "learning_rate": 5.385957317752817e-06, "loss": 0.0054, "step": 757710 }, { "epoch": 1.96, "learning_rate": 5.382069101381353e-06, "loss": 0.007, "step": 757720 }, { "epoch": 1.96, "learning_rate": 5.378180885009889e-06, "loss": 0.0065, "step": 757730 }, { "epoch": 1.96, "learning_rate": 5.374292668638424e-06, "loss": 0.0087, "step": 757740 }, { "epoch": 1.96, "learning_rate": 5.370404452266959e-06, "loss": 0.0079, "step": 757750 }, { "epoch": 1.96, "learning_rate": 5.366516235895495e-06, "loss": 0.005, "step": 757760 }, { "epoch": 1.96, "learning_rate": 5.36262801952403e-06, "loss": 0.0088, "step": 757770 }, { "epoch": 1.96, "learning_rate": 5.3587398031525656e-06, "loss": 0.0075, "step": 757780 }, { "epoch": 1.96, "learning_rate": 5.354851586781101e-06, "loss": 0.0065, "step": 757790 }, { "epoch": 1.96, "learning_rate": 5.350963370409636e-06, "loss": 0.0072, "step": 757800 }, { "epoch": 1.96, "learning_rate": 5.347075154038171e-06, "loss": 0.0059, "step": 757810 }, { "epoch": 1.96, "learning_rate": 5.343186937666707e-06, "loss": 0.0106, "step": 757820 }, { "epoch": 1.96, "learning_rate": 5.3392987212952416e-06, "loss": 0.0072, "step": 757830 }, { "epoch": 1.96, "learning_rate": 5.335410504923777e-06, "loss": 0.0091, "step": 757840 }, { "epoch": 1.96, "learning_rate": 5.331522288552313e-06, "loss": 0.0061, "step": 757850 }, { "epoch": 1.96, "learning_rate": 5.327634072180848e-06, "loss": 0.0056, "step": 757860 }, { "epoch": 1.96, "learning_rate": 5.3237458558093836e-06, "loss": 0.0077, "step": 757870 }, { "epoch": 1.96, "learning_rate": 5.319857639437919e-06, "loss": 0.0092, "step": 757880 }, { "epoch": 1.96, "learning_rate": 5.315969423066454e-06, "loss": 0.0091, "step": 757890 }, { "epoch": 1.96, "learning_rate": 5.31208120669499e-06, "loss": 0.0079, "step": 757900 }, { "epoch": 1.96, "learning_rate": 5.3081929903235255e-06, "loss": 0.0068, "step": 757910 }, { "epoch": 1.96, "learning_rate": 5.3043047739520596e-06, "loss": 0.0062, "step": 757920 }, { "epoch": 1.96, "learning_rate": 5.300416557580595e-06, "loss": 0.0064, "step": 757930 }, { "epoch": 1.96, "learning_rate": 5.296528341209131e-06, "loss": 0.0074, "step": 757940 }, { "epoch": 1.96, "learning_rate": 5.292640124837667e-06, "loss": 0.0073, "step": 757950 }, { "epoch": 1.96, "learning_rate": 5.2887519084662015e-06, "loss": 0.0065, "step": 757960 }, { "epoch": 1.96, "learning_rate": 5.284863692094737e-06, "loss": 0.0074, "step": 757970 }, { "epoch": 1.96, "learning_rate": 5.280975475723273e-06, "loss": 0.0113, "step": 757980 }, { "epoch": 1.96, "learning_rate": 5.277087259351808e-06, "loss": 0.0063, "step": 757990 }, { "epoch": 1.96, "learning_rate": 5.2731990429803435e-06, "loss": 0.0063, "step": 758000 }, { "epoch": 1.96, "eval_cer": 0.8816634964890108, "eval_loss": 0.0044049047864973545, "eval_runtime": 108.0473, "eval_samples_per_second": 18.51, "eval_steps_per_second": 4.628, "step": 758000 }, { "epoch": 1.96, "learning_rate": 5.269310826608879e-06, "loss": 0.0068, "step": 758010 }, { "epoch": 1.96, "learning_rate": 5.265422610237414e-06, "loss": 0.0066, "step": 758020 }, { "epoch": 1.96, "learning_rate": 5.26153439386595e-06, "loss": 0.0089, "step": 758030 }, { "epoch": 1.96, "learning_rate": 5.2576461774944855e-06, "loss": 0.0094, "step": 758040 }, { "epoch": 1.96, "learning_rate": 5.2537579611230195e-06, "loss": 0.0059, "step": 758050 }, { "epoch": 1.96, "learning_rate": 5.249869744751555e-06, "loss": 0.0058, "step": 758060 }, { "epoch": 1.97, "learning_rate": 5.245981528380091e-06, "loss": 0.006, "step": 758070 }, { "epoch": 1.97, "learning_rate": 5.242093312008626e-06, "loss": 0.0056, "step": 758080 }, { "epoch": 1.97, "learning_rate": 5.2382050956371615e-06, "loss": 0.0065, "step": 758090 }, { "epoch": 1.97, "learning_rate": 5.234316879265697e-06, "loss": 0.0087, "step": 758100 }, { "epoch": 1.97, "learning_rate": 5.230428662894232e-06, "loss": 0.0062, "step": 758110 }, { "epoch": 1.97, "learning_rate": 5.226540446522768e-06, "loss": 0.008, "step": 758120 }, { "epoch": 1.97, "learning_rate": 5.2226522301513035e-06, "loss": 0.0065, "step": 758130 }, { "epoch": 1.97, "learning_rate": 5.218764013779838e-06, "loss": 0.0073, "step": 758140 }, { "epoch": 1.97, "learning_rate": 5.214875797408374e-06, "loss": 0.0073, "step": 758150 }, { "epoch": 1.97, "learning_rate": 5.210987581036909e-06, "loss": 0.006, "step": 758160 }, { "epoch": 1.97, "learning_rate": 5.207099364665444e-06, "loss": 0.0082, "step": 758170 }, { "epoch": 1.97, "learning_rate": 5.2032111482939795e-06, "loss": 0.0063, "step": 758180 }, { "epoch": 1.97, "learning_rate": 5.199322931922515e-06, "loss": 0.0067, "step": 758190 }, { "epoch": 1.97, "learning_rate": 5.19543471555105e-06, "loss": 0.0056, "step": 758200 }, { "epoch": 1.97, "learning_rate": 5.191546499179586e-06, "loss": 0.0051, "step": 758210 }, { "epoch": 1.97, "learning_rate": 5.1876582828081215e-06, "loss": 0.0064, "step": 758220 }, { "epoch": 1.97, "learning_rate": 5.183770066436656e-06, "loss": 0.0061, "step": 758230 }, { "epoch": 1.97, "learning_rate": 5.179881850065192e-06, "loss": 0.0074, "step": 758240 }, { "epoch": 1.97, "learning_rate": 5.175993633693728e-06, "loss": 0.0074, "step": 758250 }, { "epoch": 1.97, "learning_rate": 5.1721054173222635e-06, "loss": 0.0079, "step": 758260 }, { "epoch": 1.97, "learning_rate": 5.1682172009507975e-06, "loss": 0.0046, "step": 758270 }, { "epoch": 1.97, "learning_rate": 5.164328984579333e-06, "loss": 0.0044, "step": 758280 }, { "epoch": 1.97, "learning_rate": 5.160440768207869e-06, "loss": 0.0081, "step": 758290 }, { "epoch": 1.97, "learning_rate": 5.156552551836404e-06, "loss": 0.0069, "step": 758300 }, { "epoch": 1.97, "learning_rate": 5.1526643354649395e-06, "loss": 0.0086, "step": 758310 }, { "epoch": 1.97, "learning_rate": 5.148776119093475e-06, "loss": 0.0059, "step": 758320 }, { "epoch": 1.97, "learning_rate": 5.14488790272201e-06, "loss": 0.0056, "step": 758330 }, { "epoch": 1.97, "learning_rate": 5.140999686350546e-06, "loss": 0.0068, "step": 758340 }, { "epoch": 1.97, "learning_rate": 5.1371114699790815e-06, "loss": 0.0063, "step": 758350 }, { "epoch": 1.97, "learning_rate": 5.133223253607616e-06, "loss": 0.0057, "step": 758360 }, { "epoch": 1.97, "learning_rate": 5.129335037236152e-06, "loss": 0.0061, "step": 758370 }, { "epoch": 1.97, "learning_rate": 5.125446820864688e-06, "loss": 0.0062, "step": 758380 }, { "epoch": 1.97, "learning_rate": 5.121558604493222e-06, "loss": 0.0075, "step": 758390 }, { "epoch": 1.97, "learning_rate": 5.1176703881217575e-06, "loss": 0.0074, "step": 758400 }, { "epoch": 1.97, "learning_rate": 5.113782171750293e-06, "loss": 0.0088, "step": 758410 }, { "epoch": 1.97, "learning_rate": 5.109893955378828e-06, "loss": 0.0074, "step": 758420 }, { "epoch": 1.97, "learning_rate": 5.106005739007364e-06, "loss": 0.0086, "step": 758430 }, { "epoch": 1.97, "learning_rate": 5.1021175226358995e-06, "loss": 0.0055, "step": 758440 }, { "epoch": 1.97, "learning_rate": 5.098229306264434e-06, "loss": 0.0069, "step": 758450 }, { "epoch": 1.97, "learning_rate": 5.09434108989297e-06, "loss": 0.0062, "step": 758460 }, { "epoch": 1.97, "learning_rate": 5.090452873521506e-06, "loss": 0.0052, "step": 758470 }, { "epoch": 1.97, "learning_rate": 5.086564657150041e-06, "loss": 0.0079, "step": 758480 }, { "epoch": 1.97, "learning_rate": 5.082676440778576e-06, "loss": 0.0077, "step": 758490 }, { "epoch": 1.97, "learning_rate": 5.078788224407112e-06, "loss": 0.0075, "step": 758500 }, { "epoch": 1.97, "learning_rate": 5.074900008035646e-06, "loss": 0.0082, "step": 758510 }, { "epoch": 1.97, "learning_rate": 5.071011791664182e-06, "loss": 0.006, "step": 758520 }, { "epoch": 1.97, "learning_rate": 5.0671235752927175e-06, "loss": 0.0063, "step": 758530 }, { "epoch": 1.97, "learning_rate": 5.063235358921252e-06, "loss": 0.0085, "step": 758540 }, { "epoch": 1.97, "learning_rate": 5.059347142549788e-06, "loss": 0.0067, "step": 758550 }, { "epoch": 1.97, "learning_rate": 5.055458926178324e-06, "loss": 0.006, "step": 758560 }, { "epoch": 1.97, "learning_rate": 5.0515707098068594e-06, "loss": 0.007, "step": 758570 }, { "epoch": 1.97, "learning_rate": 5.047682493435394e-06, "loss": 0.0077, "step": 758580 }, { "epoch": 1.97, "learning_rate": 5.04379427706393e-06, "loss": 0.008, "step": 758590 }, { "epoch": 1.97, "learning_rate": 5.039906060692466e-06, "loss": 0.0069, "step": 758600 }, { "epoch": 1.97, "learning_rate": 5.036017844321e-06, "loss": 0.0067, "step": 758610 }, { "epoch": 1.97, "learning_rate": 5.0321296279495354e-06, "loss": 0.0059, "step": 758620 }, { "epoch": 1.97, "learning_rate": 5.028241411578071e-06, "loss": 0.0077, "step": 758630 }, { "epoch": 1.97, "learning_rate": 5.024353195206606e-06, "loss": 0.0074, "step": 758640 }, { "epoch": 1.97, "learning_rate": 5.020464978835142e-06, "loss": 0.0052, "step": 758650 }, { "epoch": 1.97, "learning_rate": 5.0165767624636774e-06, "loss": 0.0051, "step": 758660 }, { "epoch": 1.97, "learning_rate": 5.012688546092212e-06, "loss": 0.0068, "step": 758670 }, { "epoch": 1.97, "learning_rate": 5.008800329720748e-06, "loss": 0.0076, "step": 758680 }, { "epoch": 1.97, "learning_rate": 5.004912113349284e-06, "loss": 0.0089, "step": 758690 }, { "epoch": 1.97, "learning_rate": 5.0010238969778186e-06, "loss": 0.0058, "step": 758700 }, { "epoch": 1.97, "learning_rate": 4.997135680606354e-06, "loss": 0.0062, "step": 758710 }, { "epoch": 1.97, "learning_rate": 4.99324746423489e-06, "loss": 0.0078, "step": 758720 }, { "epoch": 1.97, "learning_rate": 4.989359247863424e-06, "loss": 0.0072, "step": 758730 }, { "epoch": 1.97, "learning_rate": 4.98547103149196e-06, "loss": 0.0088, "step": 758740 }, { "epoch": 1.97, "learning_rate": 4.981582815120495e-06, "loss": 0.0086, "step": 758750 }, { "epoch": 1.97, "learning_rate": 4.97769459874903e-06, "loss": 0.0079, "step": 758760 }, { "epoch": 1.97, "learning_rate": 4.973806382377566e-06, "loss": 0.0061, "step": 758770 }, { "epoch": 1.97, "learning_rate": 4.969918166006102e-06, "loss": 0.008, "step": 758780 }, { "epoch": 1.97, "learning_rate": 4.9660299496346366e-06, "loss": 0.0076, "step": 758790 }, { "epoch": 1.97, "learning_rate": 4.962141733263172e-06, "loss": 0.0087, "step": 758800 }, { "epoch": 1.97, "learning_rate": 4.958253516891708e-06, "loss": 0.0089, "step": 758810 }, { "epoch": 1.97, "learning_rate": 4.954365300520243e-06, "loss": 0.0084, "step": 758820 }, { "epoch": 1.97, "learning_rate": 4.9504770841487785e-06, "loss": 0.0065, "step": 758830 }, { "epoch": 1.97, "learning_rate": 4.946588867777314e-06, "loss": 0.0055, "step": 758840 }, { "epoch": 1.97, "learning_rate": 4.942700651405848e-06, "loss": 0.0101, "step": 758850 }, { "epoch": 1.97, "learning_rate": 4.938812435034384e-06, "loss": 0.0071, "step": 758860 }, { "epoch": 1.97, "learning_rate": 4.93492421866292e-06, "loss": 0.0067, "step": 758870 }, { "epoch": 1.97, "learning_rate": 4.931036002291455e-06, "loss": 0.0114, "step": 758880 }, { "epoch": 1.97, "learning_rate": 4.92714778591999e-06, "loss": 0.0053, "step": 758890 }, { "epoch": 1.97, "learning_rate": 4.923259569548526e-06, "loss": 0.0067, "step": 758900 }, { "epoch": 1.97, "learning_rate": 4.919371353177062e-06, "loss": 0.0064, "step": 758910 }, { "epoch": 1.97, "learning_rate": 4.9154831368055965e-06, "loss": 0.0051, "step": 758920 }, { "epoch": 1.97, "learning_rate": 4.911594920434132e-06, "loss": 0.0074, "step": 758930 }, { "epoch": 1.97, "learning_rate": 4.907706704062668e-06, "loss": 0.0098, "step": 758940 }, { "epoch": 1.97, "learning_rate": 4.903818487691202e-06, "loss": 0.0072, "step": 758950 }, { "epoch": 1.97, "learning_rate": 4.899930271319738e-06, "loss": 0.0062, "step": 758960 }, { "epoch": 1.97, "learning_rate": 4.896042054948273e-06, "loss": 0.0084, "step": 758970 }, { "epoch": 1.97, "learning_rate": 4.892153838576808e-06, "loss": 0.0072, "step": 758980 }, { "epoch": 1.97, "learning_rate": 4.888265622205344e-06, "loss": 0.0092, "step": 758990 }, { "epoch": 1.97, "learning_rate": 4.88437740583388e-06, "loss": 0.0065, "step": 759000 }, { "epoch": 1.97, "eval_cer": 0.8816746935844841, "eval_loss": 0.004368713591247797, "eval_runtime": 107.9594, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 759000 }, { "epoch": 1.97, "learning_rate": 4.8804891894624145e-06, "loss": 0.0074, "step": 759010 }, { "epoch": 1.97, "learning_rate": 4.87660097309095e-06, "loss": 0.0064, "step": 759020 }, { "epoch": 1.97, "learning_rate": 4.872712756719486e-06, "loss": 0.0095, "step": 759030 }, { "epoch": 1.97, "learning_rate": 4.868824540348021e-06, "loss": 0.0046, "step": 759040 }, { "epoch": 1.97, "learning_rate": 4.8649363239765565e-06, "loss": 0.0068, "step": 759050 }, { "epoch": 1.97, "learning_rate": 4.861048107605092e-06, "loss": 0.0081, "step": 759060 }, { "epoch": 1.97, "learning_rate": 4.857159891233626e-06, "loss": 0.008, "step": 759070 }, { "epoch": 1.97, "learning_rate": 4.853271674862162e-06, "loss": 0.0072, "step": 759080 }, { "epoch": 1.97, "learning_rate": 4.849383458490698e-06, "loss": 0.0083, "step": 759090 }, { "epoch": 1.97, "learning_rate": 4.8454952421192325e-06, "loss": 0.0075, "step": 759100 }, { "epoch": 1.97, "learning_rate": 4.841607025747768e-06, "loss": 0.0042, "step": 759110 }, { "epoch": 1.97, "learning_rate": 4.837718809376304e-06, "loss": 0.006, "step": 759120 }, { "epoch": 1.97, "learning_rate": 4.833830593004839e-06, "loss": 0.0077, "step": 759130 }, { "epoch": 1.97, "learning_rate": 4.8299423766333745e-06, "loss": 0.0095, "step": 759140 }, { "epoch": 1.97, "learning_rate": 4.82605416026191e-06, "loss": 0.006, "step": 759150 }, { "epoch": 1.97, "learning_rate": 4.822165943890445e-06, "loss": 0.0076, "step": 759160 }, { "epoch": 1.97, "learning_rate": 4.818277727518981e-06, "loss": 0.0067, "step": 759170 }, { "epoch": 1.97, "learning_rate": 4.8143895111475165e-06, "loss": 0.0076, "step": 759180 }, { "epoch": 1.97, "learning_rate": 4.810501294776052e-06, "loss": 0.0099, "step": 759190 }, { "epoch": 1.97, "learning_rate": 4.806613078404586e-06, "loss": 0.0055, "step": 759200 }, { "epoch": 1.97, "learning_rate": 4.802724862033122e-06, "loss": 0.0085, "step": 759210 }, { "epoch": 1.97, "learning_rate": 4.798836645661658e-06, "loss": 0.0052, "step": 759220 }, { "epoch": 1.97, "learning_rate": 4.7949484292901925e-06, "loss": 0.0072, "step": 759230 }, { "epoch": 1.97, "learning_rate": 4.791060212918728e-06, "loss": 0.0056, "step": 759240 }, { "epoch": 1.97, "learning_rate": 4.787171996547264e-06, "loss": 0.0085, "step": 759250 }, { "epoch": 1.97, "learning_rate": 4.783283780175799e-06, "loss": 0.01, "step": 759260 }, { "epoch": 1.97, "learning_rate": 4.7793955638043345e-06, "loss": 0.007, "step": 759270 }, { "epoch": 1.97, "learning_rate": 4.77550734743287e-06, "loss": 0.0067, "step": 759280 }, { "epoch": 1.97, "learning_rate": 4.771619131061404e-06, "loss": 0.0068, "step": 759290 }, { "epoch": 1.97, "learning_rate": 4.76773091468994e-06, "loss": 0.0106, "step": 759300 }, { "epoch": 1.97, "learning_rate": 4.763842698318476e-06, "loss": 0.0076, "step": 759310 }, { "epoch": 1.97, "learning_rate": 4.7599544819470105e-06, "loss": 0.0093, "step": 759320 }, { "epoch": 1.97, "learning_rate": 4.756066265575546e-06, "loss": 0.0076, "step": 759330 }, { "epoch": 1.97, "learning_rate": 4.752178049204082e-06, "loss": 0.0068, "step": 759340 }, { "epoch": 1.97, "learning_rate": 4.748289832832617e-06, "loss": 0.0069, "step": 759350 }, { "epoch": 1.97, "learning_rate": 4.7444016164611525e-06, "loss": 0.0083, "step": 759360 }, { "epoch": 1.97, "learning_rate": 4.740513400089688e-06, "loss": 0.0101, "step": 759370 }, { "epoch": 1.97, "learning_rate": 4.736625183718223e-06, "loss": 0.0079, "step": 759380 }, { "epoch": 1.97, "learning_rate": 4.732736967346759e-06, "loss": 0.0143, "step": 759390 }, { "epoch": 1.97, "learning_rate": 4.7288487509752944e-06, "loss": 0.0065, "step": 759400 }, { "epoch": 1.97, "learning_rate": 4.7249605346038285e-06, "loss": 0.0069, "step": 759410 }, { "epoch": 1.97, "learning_rate": 4.721072318232364e-06, "loss": 0.0064, "step": 759420 }, { "epoch": 1.97, "learning_rate": 4.7171841018609e-06, "loss": 0.0062, "step": 759430 }, { "epoch": 1.97, "learning_rate": 4.713295885489435e-06, "loss": 0.0095, "step": 759440 }, { "epoch": 1.97, "learning_rate": 4.7094076691179705e-06, "loss": 0.0076, "step": 759450 }, { "epoch": 1.97, "learning_rate": 4.705519452746506e-06, "loss": 0.0053, "step": 759460 }, { "epoch": 1.97, "learning_rate": 4.701631236375041e-06, "loss": 0.0074, "step": 759470 }, { "epoch": 1.97, "learning_rate": 4.697743020003577e-06, "loss": 0.0074, "step": 759480 }, { "epoch": 1.97, "learning_rate": 4.6938548036321124e-06, "loss": 0.0089, "step": 759490 }, { "epoch": 1.97, "learning_rate": 4.689966587260648e-06, "loss": 0.0068, "step": 759500 }, { "epoch": 1.97, "learning_rate": 4.686078370889183e-06, "loss": 0.0069, "step": 759510 }, { "epoch": 1.97, "learning_rate": 4.682190154517719e-06, "loss": 0.0058, "step": 759520 }, { "epoch": 1.97, "learning_rate": 4.678301938146254e-06, "loss": 0.0066, "step": 759530 }, { "epoch": 1.97, "learning_rate": 4.6744137217747884e-06, "loss": 0.0053, "step": 759540 }, { "epoch": 1.97, "learning_rate": 4.670525505403324e-06, "loss": 0.0061, "step": 759550 }, { "epoch": 1.97, "learning_rate": 4.66663728903186e-06, "loss": 0.0055, "step": 759560 }, { "epoch": 1.97, "learning_rate": 4.6627490726603956e-06, "loss": 0.007, "step": 759570 }, { "epoch": 1.97, "learning_rate": 4.6588608562889304e-06, "loss": 0.0058, "step": 759580 }, { "epoch": 1.97, "learning_rate": 4.654972639917465e-06, "loss": 0.0053, "step": 759590 }, { "epoch": 1.97, "learning_rate": 4.651084423546001e-06, "loss": 0.0071, "step": 759600 }, { "epoch": 1.97, "learning_rate": 4.647196207174537e-06, "loss": 0.0046, "step": 759610 }, { "epoch": 1.97, "learning_rate": 4.6433079908030716e-06, "loss": 0.0068, "step": 759620 }, { "epoch": 1.97, "learning_rate": 4.639419774431607e-06, "loss": 0.0066, "step": 759630 }, { "epoch": 1.97, "learning_rate": 4.635531558060142e-06, "loss": 0.0062, "step": 759640 }, { "epoch": 1.97, "learning_rate": 4.631643341688678e-06, "loss": 0.0085, "step": 759650 }, { "epoch": 1.97, "learning_rate": 4.6277551253172136e-06, "loss": 0.0051, "step": 759660 }, { "epoch": 1.97, "learning_rate": 4.623866908945748e-06, "loss": 0.0059, "step": 759670 }, { "epoch": 1.97, "learning_rate": 4.619978692574284e-06, "loss": 0.0091, "step": 759680 }, { "epoch": 1.97, "learning_rate": 4.61609047620282e-06, "loss": 0.0077, "step": 759690 }, { "epoch": 1.97, "learning_rate": 4.612202259831355e-06, "loss": 0.0079, "step": 759700 }, { "epoch": 1.97, "learning_rate": 4.60831404345989e-06, "loss": 0.0078, "step": 759710 }, { "epoch": 1.97, "learning_rate": 4.604425827088425e-06, "loss": 0.0066, "step": 759720 }, { "epoch": 1.97, "learning_rate": 4.600537610716961e-06, "loss": 0.0068, "step": 759730 }, { "epoch": 1.97, "learning_rate": 4.596649394345497e-06, "loss": 0.0043, "step": 759740 }, { "epoch": 1.97, "learning_rate": 4.5927611779740315e-06, "loss": 0.008, "step": 759750 }, { "epoch": 1.97, "learning_rate": 4.588872961602566e-06, "loss": 0.0065, "step": 759760 }, { "epoch": 1.97, "learning_rate": 4.584984745231102e-06, "loss": 0.0066, "step": 759770 }, { "epoch": 1.97, "learning_rate": 4.581096528859638e-06, "loss": 0.0078, "step": 759780 }, { "epoch": 1.97, "learning_rate": 4.577208312488173e-06, "loss": 0.0055, "step": 759790 }, { "epoch": 1.97, "learning_rate": 4.573320096116708e-06, "loss": 0.0071, "step": 759800 }, { "epoch": 1.97, "learning_rate": 4.569431879745243e-06, "loss": 0.0058, "step": 759810 }, { "epoch": 1.97, "learning_rate": 4.565543663373779e-06, "loss": 0.007, "step": 759820 }, { "epoch": 1.97, "learning_rate": 4.561655447002315e-06, "loss": 0.0082, "step": 759830 }, { "epoch": 1.97, "learning_rate": 4.5577672306308495e-06, "loss": 0.0066, "step": 759840 }, { "epoch": 1.97, "learning_rate": 4.553879014259385e-06, "loss": 0.0066, "step": 759850 }, { "epoch": 1.97, "learning_rate": 4.549990797887921e-06, "loss": 0.0059, "step": 759860 }, { "epoch": 1.97, "learning_rate": 4.546102581516456e-06, "loss": 0.0072, "step": 759870 }, { "epoch": 1.97, "learning_rate": 4.5422143651449915e-06, "loss": 0.01, "step": 759880 }, { "epoch": 1.97, "learning_rate": 4.538326148773526e-06, "loss": 0.0045, "step": 759890 }, { "epoch": 1.97, "learning_rate": 4.534437932402062e-06, "loss": 0.0061, "step": 759900 }, { "epoch": 1.97, "learning_rate": 4.530549716030598e-06, "loss": 0.0072, "step": 759910 }, { "epoch": 1.97, "learning_rate": 4.526661499659133e-06, "loss": 0.0042, "step": 759920 }, { "epoch": 1.97, "learning_rate": 4.5227732832876675e-06, "loss": 0.0065, "step": 759930 }, { "epoch": 1.97, "learning_rate": 4.518885066916203e-06, "loss": 0.0089, "step": 759940 }, { "epoch": 1.97, "learning_rate": 4.514996850544739e-06, "loss": 0.0049, "step": 759950 }, { "epoch": 1.97, "learning_rate": 4.511108634173274e-06, "loss": 0.0058, "step": 759960 }, { "epoch": 1.97, "learning_rate": 4.5072204178018095e-06, "loss": 0.0104, "step": 759970 }, { "epoch": 1.97, "learning_rate": 4.503332201430344e-06, "loss": 0.0064, "step": 759980 }, { "epoch": 1.97, "learning_rate": 4.49944398505888e-06, "loss": 0.0079, "step": 759990 }, { "epoch": 1.97, "learning_rate": 4.495555768687416e-06, "loss": 0.0055, "step": 760000 }, { "epoch": 1.97, "eval_cer": 0.8816788924952867, "eval_loss": 0.004402776248753071, "eval_runtime": 107.9755, "eval_samples_per_second": 18.523, "eval_steps_per_second": 4.631, "step": 760000 }, { "epoch": 1.97, "learning_rate": 4.491667552315951e-06, "loss": 0.0056, "step": 760010 }, { "epoch": 1.97, "learning_rate": 4.487779335944486e-06, "loss": 0.0072, "step": 760020 }, { "epoch": 1.97, "learning_rate": 4.483891119573022e-06, "loss": 0.0071, "step": 760030 }, { "epoch": 1.97, "learning_rate": 4.480002903201557e-06, "loss": 0.0063, "step": 760040 }, { "epoch": 1.97, "learning_rate": 4.476114686830093e-06, "loss": 0.0047, "step": 760050 }, { "epoch": 1.97, "learning_rate": 4.4722264704586275e-06, "loss": 0.0066, "step": 760060 }, { "epoch": 1.97, "learning_rate": 4.468338254087163e-06, "loss": 0.0083, "step": 760070 }, { "epoch": 1.97, "learning_rate": 4.464450037715699e-06, "loss": 0.0065, "step": 760080 }, { "epoch": 1.97, "learning_rate": 4.460561821344234e-06, "loss": 0.0081, "step": 760090 }, { "epoch": 1.97, "learning_rate": 4.456673604972769e-06, "loss": 0.0069, "step": 760100 }, { "epoch": 1.97, "learning_rate": 4.452785388601304e-06, "loss": 0.0115, "step": 760110 }, { "epoch": 1.97, "learning_rate": 4.44889717222984e-06, "loss": 0.0062, "step": 760120 }, { "epoch": 1.97, "learning_rate": 4.445008955858375e-06, "loss": 0.0057, "step": 760130 }, { "epoch": 1.97, "learning_rate": 4.441120739486911e-06, "loss": 0.0074, "step": 760140 }, { "epoch": 1.97, "learning_rate": 4.4372325231154455e-06, "loss": 0.0086, "step": 760150 }, { "epoch": 1.97, "learning_rate": 4.433344306743981e-06, "loss": 0.0059, "step": 760160 }, { "epoch": 1.97, "learning_rate": 4.429456090372517e-06, "loss": 0.0048, "step": 760170 }, { "epoch": 1.97, "learning_rate": 4.425567874001052e-06, "loss": 0.0053, "step": 760180 }, { "epoch": 1.97, "learning_rate": 4.4216796576295875e-06, "loss": 0.0086, "step": 760190 }, { "epoch": 1.97, "learning_rate": 4.417791441258123e-06, "loss": 0.0085, "step": 760200 }, { "epoch": 1.97, "learning_rate": 4.413903224886658e-06, "loss": 0.0091, "step": 760210 }, { "epoch": 1.97, "learning_rate": 4.410015008515194e-06, "loss": 0.0053, "step": 760220 }, { "epoch": 1.97, "learning_rate": 4.406126792143729e-06, "loss": 0.0057, "step": 760230 }, { "epoch": 1.97, "learning_rate": 4.402238575772264e-06, "loss": 0.0046, "step": 760240 }, { "epoch": 1.97, "learning_rate": 4.3983503594008e-06, "loss": 0.0061, "step": 760250 }, { "epoch": 1.97, "learning_rate": 4.394462143029335e-06, "loss": 0.0064, "step": 760260 }, { "epoch": 1.97, "learning_rate": 4.39057392665787e-06, "loss": 0.0071, "step": 760270 }, { "epoch": 1.97, "learning_rate": 4.3866857102864055e-06, "loss": 0.0061, "step": 760280 }, { "epoch": 1.97, "learning_rate": 4.382797493914941e-06, "loss": 0.0079, "step": 760290 }, { "epoch": 1.97, "learning_rate": 4.378909277543476e-06, "loss": 0.0074, "step": 760300 }, { "epoch": 1.97, "learning_rate": 4.375021061172012e-06, "loss": 0.0063, "step": 760310 }, { "epoch": 1.97, "learning_rate": 4.371132844800547e-06, "loss": 0.0076, "step": 760320 }, { "epoch": 1.97, "learning_rate": 4.367244628429082e-06, "loss": 0.0061, "step": 760330 }, { "epoch": 1.97, "learning_rate": 4.363356412057618e-06, "loss": 0.0077, "step": 760340 }, { "epoch": 1.97, "learning_rate": 4.359468195686153e-06, "loss": 0.0075, "step": 760350 }, { "epoch": 1.97, "learning_rate": 4.355579979314689e-06, "loss": 0.0078, "step": 760360 }, { "epoch": 1.97, "learning_rate": 4.351691762943224e-06, "loss": 0.0053, "step": 760370 }, { "epoch": 1.97, "learning_rate": 4.347803546571759e-06, "loss": 0.0081, "step": 760380 }, { "epoch": 1.97, "learning_rate": 4.343915330200295e-06, "loss": 0.0055, "step": 760390 }, { "epoch": 1.97, "learning_rate": 4.34002711382883e-06, "loss": 0.0055, "step": 760400 }, { "epoch": 1.97, "learning_rate": 4.3361388974573654e-06, "loss": 0.0082, "step": 760410 }, { "epoch": 1.97, "learning_rate": 4.332250681085901e-06, "loss": 0.008, "step": 760420 }, { "epoch": 1.97, "learning_rate": 4.328362464714436e-06, "loss": 0.0079, "step": 760430 }, { "epoch": 1.97, "learning_rate": 4.324474248342971e-06, "loss": 0.0087, "step": 760440 }, { "epoch": 1.97, "learning_rate": 4.320586031971507e-06, "loss": 0.0063, "step": 760450 }, { "epoch": 1.97, "learning_rate": 4.316697815600042e-06, "loss": 0.0091, "step": 760460 }, { "epoch": 1.97, "learning_rate": 4.312809599228578e-06, "loss": 0.0065, "step": 760470 }, { "epoch": 1.97, "learning_rate": 4.308921382857113e-06, "loss": 0.006, "step": 760480 }, { "epoch": 1.97, "learning_rate": 4.305033166485648e-06, "loss": 0.0099, "step": 760490 }, { "epoch": 1.97, "learning_rate": 4.3011449501141834e-06, "loss": 0.0086, "step": 760500 }, { "epoch": 1.97, "learning_rate": 4.297256733742719e-06, "loss": 0.0059, "step": 760510 }, { "epoch": 1.97, "learning_rate": 4.293368517371254e-06, "loss": 0.0072, "step": 760520 }, { "epoch": 1.97, "learning_rate": 4.28948030099979e-06, "loss": 0.0074, "step": 760530 }, { "epoch": 1.97, "learning_rate": 4.285592084628325e-06, "loss": 0.0055, "step": 760540 }, { "epoch": 1.97, "learning_rate": 4.28170386825686e-06, "loss": 0.0077, "step": 760550 }, { "epoch": 1.97, "learning_rate": 4.277815651885396e-06, "loss": 0.0118, "step": 760560 }, { "epoch": 1.97, "learning_rate": 4.273927435513931e-06, "loss": 0.0073, "step": 760570 }, { "epoch": 1.97, "learning_rate": 4.2700392191424666e-06, "loss": 0.0078, "step": 760580 }, { "epoch": 1.97, "learning_rate": 4.266151002771002e-06, "loss": 0.0058, "step": 760590 }, { "epoch": 1.97, "learning_rate": 4.262262786399537e-06, "loss": 0.0049, "step": 760600 }, { "epoch": 1.97, "learning_rate": 4.258374570028072e-06, "loss": 0.0085, "step": 760610 }, { "epoch": 1.97, "learning_rate": 4.254486353656608e-06, "loss": 0.0064, "step": 760620 }, { "epoch": 1.97, "learning_rate": 4.250598137285143e-06, "loss": 0.0068, "step": 760630 }, { "epoch": 1.97, "learning_rate": 4.246709920913679e-06, "loss": 0.0053, "step": 760640 }, { "epoch": 1.97, "learning_rate": 4.242821704542214e-06, "loss": 0.0036, "step": 760650 }, { "epoch": 1.97, "learning_rate": 4.238933488170749e-06, "loss": 0.0078, "step": 760660 }, { "epoch": 1.97, "learning_rate": 4.2350452717992845e-06, "loss": 0.0068, "step": 760670 }, { "epoch": 1.97, "learning_rate": 4.23115705542782e-06, "loss": 0.008, "step": 760680 }, { "epoch": 1.97, "learning_rate": 4.227268839056355e-06, "loss": 0.0061, "step": 760690 }, { "epoch": 1.97, "learning_rate": 4.223380622684891e-06, "loss": 0.0056, "step": 760700 }, { "epoch": 1.97, "learning_rate": 4.2194924063134265e-06, "loss": 0.0059, "step": 760710 }, { "epoch": 1.97, "learning_rate": 4.215604189941961e-06, "loss": 0.006, "step": 760720 }, { "epoch": 1.97, "learning_rate": 4.211715973570497e-06, "loss": 0.0068, "step": 760730 }, { "epoch": 1.97, "learning_rate": 4.207827757199032e-06, "loss": 0.0079, "step": 760740 }, { "epoch": 1.97, "learning_rate": 4.203939540827568e-06, "loss": 0.0064, "step": 760750 }, { "epoch": 1.97, "learning_rate": 4.200051324456103e-06, "loss": 0.0073, "step": 760760 }, { "epoch": 1.97, "learning_rate": 4.196163108084638e-06, "loss": 0.0062, "step": 760770 }, { "epoch": 1.97, "learning_rate": 4.192274891713174e-06, "loss": 0.0079, "step": 760780 }, { "epoch": 1.97, "learning_rate": 4.188386675341709e-06, "loss": 0.0062, "step": 760790 }, { "epoch": 1.97, "learning_rate": 4.1844984589702445e-06, "loss": 0.01, "step": 760800 }, { "epoch": 1.97, "learning_rate": 4.18061024259878e-06, "loss": 0.0064, "step": 760810 }, { "epoch": 1.97, "learning_rate": 4.176722026227315e-06, "loss": 0.0077, "step": 760820 }, { "epoch": 1.97, "learning_rate": 4.17283380985585e-06, "loss": 0.0067, "step": 760830 }, { "epoch": 1.97, "learning_rate": 4.168945593484386e-06, "loss": 0.0063, "step": 760840 }, { "epoch": 1.97, "learning_rate": 4.165057377112921e-06, "loss": 0.007, "step": 760850 }, { "epoch": 1.97, "learning_rate": 4.161169160741456e-06, "loss": 0.0056, "step": 760860 }, { "epoch": 1.97, "learning_rate": 4.157280944369992e-06, "loss": 0.0065, "step": 760870 }, { "epoch": 1.97, "learning_rate": 4.153392727998528e-06, "loss": 0.0077, "step": 760880 }, { "epoch": 1.97, "learning_rate": 4.1495045116270625e-06, "loss": 0.0074, "step": 760890 }, { "epoch": 1.97, "learning_rate": 4.145616295255598e-06, "loss": 0.0092, "step": 760900 }, { "epoch": 1.97, "learning_rate": 4.141728078884133e-06, "loss": 0.006, "step": 760910 }, { "epoch": 1.97, "learning_rate": 4.137839862512669e-06, "loss": 0.0105, "step": 760920 }, { "epoch": 1.97, "learning_rate": 4.1339516461412045e-06, "loss": 0.0071, "step": 760930 }, { "epoch": 1.97, "learning_rate": 4.130063429769739e-06, "loss": 0.0095, "step": 760940 }, { "epoch": 1.97, "learning_rate": 4.126175213398275e-06, "loss": 0.0067, "step": 760950 }, { "epoch": 1.97, "learning_rate": 4.12228699702681e-06, "loss": 0.0065, "step": 760960 }, { "epoch": 1.97, "learning_rate": 4.118398780655346e-06, "loss": 0.0068, "step": 760970 }, { "epoch": 1.97, "learning_rate": 4.114510564283881e-06, "loss": 0.0065, "step": 760980 }, { "epoch": 1.97, "learning_rate": 4.110622347912416e-06, "loss": 0.0054, "step": 760990 }, { "epoch": 1.97, "learning_rate": 4.106734131540951e-06, "loss": 0.0046, "step": 761000 }, { "epoch": 1.97, "eval_cer": 0.8816956881384969, "eval_loss": 0.00441008573397994, "eval_runtime": 107.8116, "eval_samples_per_second": 18.551, "eval_steps_per_second": 4.638, "step": 761000 }, { "epoch": 1.97, "learning_rate": 4.102845915169487e-06, "loss": 0.0075, "step": 761010 }, { "epoch": 1.97, "learning_rate": 4.0989576987980225e-06, "loss": 0.0078, "step": 761020 }, { "epoch": 1.97, "learning_rate": 4.095069482426557e-06, "loss": 0.0074, "step": 761030 }, { "epoch": 1.97, "learning_rate": 4.091181266055093e-06, "loss": 0.0066, "step": 761040 }, { "epoch": 1.97, "learning_rate": 4.087293049683629e-06, "loss": 0.0059, "step": 761050 }, { "epoch": 1.97, "learning_rate": 4.083404833312164e-06, "loss": 0.0075, "step": 761060 }, { "epoch": 1.97, "learning_rate": 4.079516616940699e-06, "loss": 0.0061, "step": 761070 }, { "epoch": 1.97, "learning_rate": 4.075628400569234e-06, "loss": 0.0063, "step": 761080 }, { "epoch": 1.97, "learning_rate": 4.07174018419777e-06, "loss": 0.0079, "step": 761090 }, { "epoch": 1.97, "learning_rate": 4.067851967826306e-06, "loss": 0.0071, "step": 761100 }, { "epoch": 1.97, "learning_rate": 4.0639637514548405e-06, "loss": 0.009, "step": 761110 }, { "epoch": 1.97, "learning_rate": 4.060075535083376e-06, "loss": 0.0115, "step": 761120 }, { "epoch": 1.97, "learning_rate": 4.056187318711911e-06, "loss": 0.0052, "step": 761130 }, { "epoch": 1.97, "learning_rate": 4.052299102340447e-06, "loss": 0.011, "step": 761140 }, { "epoch": 1.97, "learning_rate": 4.0484108859689825e-06, "loss": 0.0063, "step": 761150 }, { "epoch": 1.97, "learning_rate": 4.044522669597517e-06, "loss": 0.0059, "step": 761160 }, { "epoch": 1.97, "learning_rate": 4.040634453226052e-06, "loss": 0.0056, "step": 761170 }, { "epoch": 1.97, "learning_rate": 4.036746236854588e-06, "loss": 0.0081, "step": 761180 }, { "epoch": 1.97, "learning_rate": 4.032858020483124e-06, "loss": 0.0075, "step": 761190 }, { "epoch": 1.97, "learning_rate": 4.0289698041116585e-06, "loss": 0.0093, "step": 761200 }, { "epoch": 1.97, "learning_rate": 4.025081587740194e-06, "loss": 0.006, "step": 761210 }, { "epoch": 1.97, "learning_rate": 4.02119337136873e-06, "loss": 0.0054, "step": 761220 }, { "epoch": 1.97, "learning_rate": 4.017305154997265e-06, "loss": 0.0072, "step": 761230 }, { "epoch": 1.97, "learning_rate": 4.0134169386258004e-06, "loss": 0.011, "step": 761240 }, { "epoch": 1.97, "learning_rate": 4.009528722254335e-06, "loss": 0.0068, "step": 761250 }, { "epoch": 1.97, "learning_rate": 4.005640505882871e-06, "loss": 0.01, "step": 761260 }, { "epoch": 1.97, "learning_rate": 4.001752289511407e-06, "loss": 0.005, "step": 761270 }, { "epoch": 1.97, "learning_rate": 3.997864073139942e-06, "loss": 0.0065, "step": 761280 }, { "epoch": 1.97, "learning_rate": 3.993975856768477e-06, "loss": 0.0098, "step": 761290 }, { "epoch": 1.97, "learning_rate": 3.990087640397012e-06, "loss": 0.0085, "step": 761300 }, { "epoch": 1.97, "learning_rate": 3.986199424025548e-06, "loss": 0.0055, "step": 761310 }, { "epoch": 1.97, "learning_rate": 3.9823112076540836e-06, "loss": 0.0063, "step": 761320 }, { "epoch": 1.97, "learning_rate": 3.9784229912826184e-06, "loss": 0.0062, "step": 761330 }, { "epoch": 1.97, "learning_rate": 3.974534774911153e-06, "loss": 0.0047, "step": 761340 }, { "epoch": 1.97, "learning_rate": 3.970646558539689e-06, "loss": 0.0066, "step": 761350 }, { "epoch": 1.97, "learning_rate": 3.966758342168225e-06, "loss": 0.0054, "step": 761360 }, { "epoch": 1.97, "learning_rate": 3.9628701257967596e-06, "loss": 0.0069, "step": 761370 }, { "epoch": 1.97, "learning_rate": 3.958981909425295e-06, "loss": 0.0069, "step": 761380 }, { "epoch": 1.97, "learning_rate": 3.955093693053831e-06, "loss": 0.0054, "step": 761390 }, { "epoch": 1.97, "learning_rate": 3.951205476682367e-06, "loss": 0.0069, "step": 761400 }, { "epoch": 1.97, "learning_rate": 3.9473172603109016e-06, "loss": 0.0116, "step": 761410 }, { "epoch": 1.97, "learning_rate": 3.9434290439394364e-06, "loss": 0.006, "step": 761420 }, { "epoch": 1.97, "learning_rate": 3.939540827567972e-06, "loss": 0.0091, "step": 761430 }, { "epoch": 1.97, "learning_rate": 3.935652611196508e-06, "loss": 0.0058, "step": 761440 }, { "epoch": 1.97, "learning_rate": 3.931764394825043e-06, "loss": 0.0077, "step": 761450 }, { "epoch": 1.97, "learning_rate": 3.927876178453578e-06, "loss": 0.0079, "step": 761460 }, { "epoch": 1.97, "learning_rate": 3.923987962082113e-06, "loss": 0.0063, "step": 761470 }, { "epoch": 1.97, "learning_rate": 3.920099745710649e-06, "loss": 0.0067, "step": 761480 }, { "epoch": 1.97, "learning_rate": 3.916211529339185e-06, "loss": 0.0067, "step": 761490 }, { "epoch": 1.97, "learning_rate": 3.9123233129677196e-06, "loss": 0.0095, "step": 761500 }, { "epoch": 1.97, "learning_rate": 3.908435096596254e-06, "loss": 0.005, "step": 761510 }, { "epoch": 1.97, "learning_rate": 3.90454688022479e-06, "loss": 0.0074, "step": 761520 }, { "epoch": 1.97, "learning_rate": 3.900658663853326e-06, "loss": 0.0085, "step": 761530 }, { "epoch": 1.97, "learning_rate": 3.8967704474818615e-06, "loss": 0.0063, "step": 761540 }, { "epoch": 1.97, "learning_rate": 3.892882231110396e-06, "loss": 0.007, "step": 761550 }, { "epoch": 1.97, "learning_rate": 3.888994014738932e-06, "loss": 0.0057, "step": 761560 }, { "epoch": 1.97, "learning_rate": 3.885105798367468e-06, "loss": 0.0059, "step": 761570 }, { "epoch": 1.97, "learning_rate": 3.881217581996003e-06, "loss": 0.0057, "step": 761580 }, { "epoch": 1.97, "learning_rate": 3.8773293656245375e-06, "loss": 0.0055, "step": 761590 }, { "epoch": 1.97, "learning_rate": 3.873441149253073e-06, "loss": 0.0084, "step": 761600 }, { "epoch": 1.97, "learning_rate": 3.869552932881609e-06, "loss": 0.0059, "step": 761610 }, { "epoch": 1.97, "learning_rate": 3.865664716510144e-06, "loss": 0.0055, "step": 761620 }, { "epoch": 1.97, "learning_rate": 3.8617765001386795e-06, "loss": 0.0068, "step": 761630 }, { "epoch": 1.97, "learning_rate": 3.857888283767214e-06, "loss": 0.0062, "step": 761640 }, { "epoch": 1.97, "learning_rate": 3.85400006739575e-06, "loss": 0.01, "step": 761650 }, { "epoch": 1.97, "learning_rate": 3.850111851024286e-06, "loss": 0.0055, "step": 761660 }, { "epoch": 1.97, "learning_rate": 3.846223634652821e-06, "loss": 0.0044, "step": 761670 }, { "epoch": 1.97, "learning_rate": 3.8423354182813555e-06, "loss": 0.0066, "step": 761680 }, { "epoch": 1.97, "learning_rate": 3.838447201909891e-06, "loss": 0.0078, "step": 761690 }, { "epoch": 1.97, "learning_rate": 3.834558985538427e-06, "loss": 0.0065, "step": 761700 }, { "epoch": 1.97, "learning_rate": 3.830670769166963e-06, "loss": 0.0076, "step": 761710 }, { "epoch": 1.97, "learning_rate": 3.8267825527954975e-06, "loss": 0.0074, "step": 761720 }, { "epoch": 1.97, "learning_rate": 3.822894336424033e-06, "loss": 0.0045, "step": 761730 }, { "epoch": 1.97, "learning_rate": 3.819006120052569e-06, "loss": 0.0069, "step": 761740 }, { "epoch": 1.97, "learning_rate": 3.815117903681104e-06, "loss": 0.0057, "step": 761750 }, { "epoch": 1.97, "learning_rate": 3.811229687309639e-06, "loss": 0.0064, "step": 761760 }, { "epoch": 1.97, "learning_rate": 3.8073414709381748e-06, "loss": 0.0063, "step": 761770 }, { "epoch": 1.97, "learning_rate": 3.8034532545667096e-06, "loss": 0.0057, "step": 761780 }, { "epoch": 1.97, "learning_rate": 3.799565038195245e-06, "loss": 0.0059, "step": 761790 }, { "epoch": 1.97, "learning_rate": 3.7956768218237806e-06, "loss": 0.0088, "step": 761800 }, { "epoch": 1.97, "learning_rate": 3.791788605452316e-06, "loss": 0.0072, "step": 761810 }, { "epoch": 1.97, "learning_rate": 3.7879003890808512e-06, "loss": 0.0067, "step": 761820 }, { "epoch": 1.97, "learning_rate": 3.7840121727093865e-06, "loss": 0.0125, "step": 761830 }, { "epoch": 1.97, "learning_rate": 3.7801239563379218e-06, "loss": 0.007, "step": 761840 }, { "epoch": 1.97, "learning_rate": 3.7762357399664575e-06, "loss": 0.0059, "step": 761850 }, { "epoch": 1.97, "learning_rate": 3.7723475235949928e-06, "loss": 0.0071, "step": 761860 }, { "epoch": 1.97, "learning_rate": 3.768459307223528e-06, "loss": 0.0055, "step": 761870 }, { "epoch": 1.97, "learning_rate": 3.7645710908520638e-06, "loss": 0.0042, "step": 761880 }, { "epoch": 1.97, "learning_rate": 3.7606828744805986e-06, "loss": 0.0078, "step": 761890 }, { "epoch": 1.97, "learning_rate": 3.756794658109134e-06, "loss": 0.0064, "step": 761900 }, { "epoch": 1.97, "learning_rate": 3.7529064417376696e-06, "loss": 0.0085, "step": 761910 }, { "epoch": 1.98, "learning_rate": 3.749018225366205e-06, "loss": 0.0084, "step": 761920 }, { "epoch": 1.98, "learning_rate": 3.74513000899474e-06, "loss": 0.0058, "step": 761930 }, { "epoch": 1.98, "learning_rate": 3.741241792623276e-06, "loss": 0.0058, "step": 761940 }, { "epoch": 1.98, "learning_rate": 3.7373535762518108e-06, "loss": 0.006, "step": 761950 }, { "epoch": 1.98, "learning_rate": 3.733465359880346e-06, "loss": 0.0076, "step": 761960 }, { "epoch": 1.98, "learning_rate": 3.7295771435088818e-06, "loss": 0.007, "step": 761970 }, { "epoch": 1.98, "learning_rate": 3.725688927137417e-06, "loss": 0.0066, "step": 761980 }, { "epoch": 1.98, "learning_rate": 3.7218007107659523e-06, "loss": 0.008, "step": 761990 }, { "epoch": 1.98, "learning_rate": 3.7179124943944876e-06, "loss": 0.01, "step": 762000 }, { "epoch": 1.98, "eval_cer": 0.8816900895907601, "eval_loss": 0.0043979547917842865, "eval_runtime": 107.9627, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 762000 }, { "epoch": 1.98, "learning_rate": 3.714024278023023e-06, "loss": 0.0057, "step": 762010 }, { "epoch": 1.98, "learning_rate": 3.7101360616515586e-06, "loss": 0.0092, "step": 762020 }, { "epoch": 1.98, "learning_rate": 3.706247845280094e-06, "loss": 0.0064, "step": 762030 }, { "epoch": 1.98, "learning_rate": 3.702359628908629e-06, "loss": 0.0096, "step": 762040 }, { "epoch": 1.98, "learning_rate": 3.698471412537165e-06, "loss": 0.0087, "step": 762050 }, { "epoch": 1.98, "learning_rate": 3.6945831961656997e-06, "loss": 0.0046, "step": 762060 }, { "epoch": 1.98, "learning_rate": 3.690694979794235e-06, "loss": 0.0067, "step": 762070 }, { "epoch": 1.98, "learning_rate": 3.6868067634227707e-06, "loss": 0.0079, "step": 762080 }, { "epoch": 1.98, "learning_rate": 3.682918547051306e-06, "loss": 0.0066, "step": 762090 }, { "epoch": 1.98, "learning_rate": 3.6790303306798413e-06, "loss": 0.0087, "step": 762100 }, { "epoch": 1.98, "learning_rate": 3.675142114308377e-06, "loss": 0.007, "step": 762110 }, { "epoch": 1.98, "learning_rate": 3.671253897936912e-06, "loss": 0.0078, "step": 762120 }, { "epoch": 1.98, "learning_rate": 3.667365681565447e-06, "loss": 0.0063, "step": 762130 }, { "epoch": 1.98, "learning_rate": 3.663477465193983e-06, "loss": 0.007, "step": 762140 }, { "epoch": 1.98, "learning_rate": 3.659589248822518e-06, "loss": 0.0078, "step": 762150 }, { "epoch": 1.98, "learning_rate": 3.655701032451054e-06, "loss": 0.0058, "step": 762160 }, { "epoch": 1.98, "learning_rate": 3.651812816079589e-06, "loss": 0.0054, "step": 762170 }, { "epoch": 1.98, "learning_rate": 3.647924599708124e-06, "loss": 0.0074, "step": 762180 }, { "epoch": 1.98, "learning_rate": 3.6440363833366597e-06, "loss": 0.0069, "step": 762190 }, { "epoch": 1.98, "learning_rate": 3.640148166965195e-06, "loss": 0.0076, "step": 762200 }, { "epoch": 1.98, "learning_rate": 3.6362599505937303e-06, "loss": 0.0082, "step": 762210 }, { "epoch": 1.98, "learning_rate": 3.632371734222266e-06, "loss": 0.0077, "step": 762220 }, { "epoch": 1.98, "learning_rate": 3.628483517850801e-06, "loss": 0.0072, "step": 762230 }, { "epoch": 1.98, "learning_rate": 3.624595301479336e-06, "loss": 0.0078, "step": 762240 }, { "epoch": 1.98, "learning_rate": 3.620707085107872e-06, "loss": 0.0048, "step": 762250 }, { "epoch": 1.98, "learning_rate": 3.616818868736407e-06, "loss": 0.0089, "step": 762260 }, { "epoch": 1.98, "learning_rate": 3.6129306523649424e-06, "loss": 0.0066, "step": 762270 }, { "epoch": 1.98, "learning_rate": 3.609042435993478e-06, "loss": 0.0075, "step": 762280 }, { "epoch": 1.98, "learning_rate": 3.605154219622013e-06, "loss": 0.0112, "step": 762290 }, { "epoch": 1.98, "learning_rate": 3.6012660032505483e-06, "loss": 0.0059, "step": 762300 }, { "epoch": 1.98, "learning_rate": 3.597377786879084e-06, "loss": 0.0049, "step": 762310 }, { "epoch": 1.98, "learning_rate": 3.5934895705076193e-06, "loss": 0.0069, "step": 762320 }, { "epoch": 1.98, "learning_rate": 3.589601354136155e-06, "loss": 0.0059, "step": 762330 }, { "epoch": 1.98, "learning_rate": 3.5857131377646903e-06, "loss": 0.0082, "step": 762340 }, { "epoch": 1.98, "learning_rate": 3.581824921393225e-06, "loss": 0.0074, "step": 762350 }, { "epoch": 1.98, "learning_rate": 3.577936705021761e-06, "loss": 0.0058, "step": 762360 }, { "epoch": 1.98, "learning_rate": 3.574048488650296e-06, "loss": 0.0075, "step": 762370 }, { "epoch": 1.98, "learning_rate": 3.5701602722788314e-06, "loss": 0.0077, "step": 762380 }, { "epoch": 1.98, "learning_rate": 3.566272055907367e-06, "loss": 0.0062, "step": 762390 }, { "epoch": 1.98, "learning_rate": 3.562383839535902e-06, "loss": 0.0097, "step": 762400 }, { "epoch": 1.98, "learning_rate": 3.5584956231644373e-06, "loss": 0.0073, "step": 762410 }, { "epoch": 1.98, "learning_rate": 3.554607406792973e-06, "loss": 0.0063, "step": 762420 }, { "epoch": 1.98, "learning_rate": 3.5507191904215083e-06, "loss": 0.0074, "step": 762430 }, { "epoch": 1.98, "learning_rate": 3.5468309740500435e-06, "loss": 0.0059, "step": 762440 }, { "epoch": 1.98, "learning_rate": 3.5429427576785793e-06, "loss": 0.0068, "step": 762450 }, { "epoch": 1.98, "learning_rate": 3.539054541307114e-06, "loss": 0.0063, "step": 762460 }, { "epoch": 1.98, "learning_rate": 3.53516632493565e-06, "loss": 0.005, "step": 762470 }, { "epoch": 1.98, "learning_rate": 3.531278108564185e-06, "loss": 0.0075, "step": 762480 }, { "epoch": 1.98, "learning_rate": 3.5273898921927204e-06, "loss": 0.0071, "step": 762490 }, { "epoch": 1.98, "learning_rate": 3.523501675821256e-06, "loss": 0.005, "step": 762500 }, { "epoch": 1.98, "learning_rate": 3.5196134594497914e-06, "loss": 0.0096, "step": 762510 }, { "epoch": 1.98, "learning_rate": 3.5157252430783262e-06, "loss": 0.0068, "step": 762520 }, { "epoch": 1.98, "learning_rate": 3.511837026706862e-06, "loss": 0.0079, "step": 762530 }, { "epoch": 1.98, "learning_rate": 3.5079488103353972e-06, "loss": 0.0051, "step": 762540 }, { "epoch": 1.98, "learning_rate": 3.5040605939639325e-06, "loss": 0.008, "step": 762550 }, { "epoch": 1.98, "learning_rate": 3.5001723775924682e-06, "loss": 0.0054, "step": 762560 }, { "epoch": 1.98, "learning_rate": 3.496284161221003e-06, "loss": 0.0068, "step": 762570 }, { "epoch": 1.98, "learning_rate": 3.4923959448495384e-06, "loss": 0.008, "step": 762580 }, { "epoch": 1.98, "learning_rate": 3.488507728478074e-06, "loss": 0.0062, "step": 762590 }, { "epoch": 1.98, "learning_rate": 3.4846195121066094e-06, "loss": 0.0053, "step": 762600 }, { "epoch": 1.98, "learning_rate": 3.480731295735145e-06, "loss": 0.008, "step": 762610 }, { "epoch": 1.98, "learning_rate": 3.4768430793636804e-06, "loss": 0.0079, "step": 762620 }, { "epoch": 1.98, "learning_rate": 3.4729548629922152e-06, "loss": 0.0057, "step": 762630 }, { "epoch": 1.98, "learning_rate": 3.469066646620751e-06, "loss": 0.0046, "step": 762640 }, { "epoch": 1.98, "learning_rate": 3.4651784302492862e-06, "loss": 0.0058, "step": 762650 }, { "epoch": 1.98, "learning_rate": 3.4612902138778215e-06, "loss": 0.0073, "step": 762660 }, { "epoch": 1.98, "learning_rate": 3.4574019975063572e-06, "loss": 0.0072, "step": 762670 }, { "epoch": 1.98, "learning_rate": 3.4535137811348925e-06, "loss": 0.008, "step": 762680 }, { "epoch": 1.98, "learning_rate": 3.4496255647634274e-06, "loss": 0.0041, "step": 762690 }, { "epoch": 1.98, "learning_rate": 3.445737348391963e-06, "loss": 0.0048, "step": 762700 }, { "epoch": 1.98, "learning_rate": 3.4418491320204984e-06, "loss": 0.0102, "step": 762710 }, { "epoch": 1.98, "learning_rate": 3.4379609156490336e-06, "loss": 0.0055, "step": 762720 }, { "epoch": 1.98, "learning_rate": 3.4340726992775694e-06, "loss": 0.0051, "step": 762730 }, { "epoch": 1.98, "learning_rate": 3.430184482906104e-06, "loss": 0.0092, "step": 762740 }, { "epoch": 1.98, "learning_rate": 3.4262962665346395e-06, "loss": 0.0061, "step": 762750 }, { "epoch": 1.98, "learning_rate": 3.422408050163175e-06, "loss": 0.006, "step": 762760 }, { "epoch": 1.98, "learning_rate": 3.4185198337917105e-06, "loss": 0.0073, "step": 762770 }, { "epoch": 1.98, "learning_rate": 3.414631617420246e-06, "loss": 0.007, "step": 762780 }, { "epoch": 1.98, "learning_rate": 3.4107434010487815e-06, "loss": 0.0069, "step": 762790 }, { "epoch": 1.98, "learning_rate": 3.4068551846773163e-06, "loss": 0.0074, "step": 762800 }, { "epoch": 1.98, "learning_rate": 3.402966968305852e-06, "loss": 0.01, "step": 762810 }, { "epoch": 1.98, "learning_rate": 3.3990787519343873e-06, "loss": 0.008, "step": 762820 }, { "epoch": 1.98, "learning_rate": 3.3951905355629226e-06, "loss": 0.0096, "step": 762830 }, { "epoch": 1.98, "learning_rate": 3.3913023191914583e-06, "loss": 0.0081, "step": 762840 }, { "epoch": 1.98, "learning_rate": 3.3874141028199936e-06, "loss": 0.007, "step": 762850 }, { "epoch": 1.98, "learning_rate": 3.3835258864485285e-06, "loss": 0.0067, "step": 762860 }, { "epoch": 1.98, "learning_rate": 3.379637670077064e-06, "loss": 0.0062, "step": 762870 }, { "epoch": 1.98, "learning_rate": 3.3757494537055995e-06, "loss": 0.0077, "step": 762880 }, { "epoch": 1.98, "learning_rate": 3.3718612373341348e-06, "loss": 0.0054, "step": 762890 }, { "epoch": 1.98, "learning_rate": 3.3679730209626705e-06, "loss": 0.0083, "step": 762900 }, { "epoch": 1.98, "learning_rate": 3.3640848045912053e-06, "loss": 0.0072, "step": 762910 }, { "epoch": 1.98, "learning_rate": 3.360196588219741e-06, "loss": 0.0085, "step": 762920 }, { "epoch": 1.98, "learning_rate": 3.3563083718482763e-06, "loss": 0.0065, "step": 762930 }, { "epoch": 1.98, "learning_rate": 3.3524201554768116e-06, "loss": 0.0064, "step": 762940 }, { "epoch": 1.98, "learning_rate": 3.3485319391053473e-06, "loss": 0.0077, "step": 762950 }, { "epoch": 1.98, "learning_rate": 3.3446437227338826e-06, "loss": 0.0078, "step": 762960 }, { "epoch": 1.98, "learning_rate": 3.3407555063624175e-06, "loss": 0.0073, "step": 762970 }, { "epoch": 1.98, "learning_rate": 3.336867289990953e-06, "loss": 0.0072, "step": 762980 }, { "epoch": 1.98, "learning_rate": 3.3329790736194885e-06, "loss": 0.0071, "step": 762990 }, { "epoch": 1.98, "learning_rate": 3.3290908572480237e-06, "loss": 0.0095, "step": 763000 }, { "epoch": 1.98, "eval_cer": 0.8816942885015627, "eval_loss": 0.004390762187540531, "eval_runtime": 107.772, "eval_samples_per_second": 18.558, "eval_steps_per_second": 4.639, "step": 763000 }, { "epoch": 1.98, "learning_rate": 3.3252026408765594e-06, "loss": 0.0091, "step": 763010 }, { "epoch": 1.98, "learning_rate": 3.3213144245050947e-06, "loss": 0.0068, "step": 763020 }, { "epoch": 1.98, "learning_rate": 3.3174262081336296e-06, "loss": 0.0058, "step": 763030 }, { "epoch": 1.98, "learning_rate": 3.3135379917621653e-06, "loss": 0.0066, "step": 763040 }, { "epoch": 1.98, "learning_rate": 3.3096497753907006e-06, "loss": 0.0067, "step": 763050 }, { "epoch": 1.98, "learning_rate": 3.305761559019236e-06, "loss": 0.0065, "step": 763060 }, { "epoch": 1.98, "learning_rate": 3.3018733426477716e-06, "loss": 0.0092, "step": 763070 }, { "epoch": 1.98, "learning_rate": 3.2979851262763064e-06, "loss": 0.0046, "step": 763080 }, { "epoch": 1.98, "learning_rate": 3.294096909904842e-06, "loss": 0.0053, "step": 763090 }, { "epoch": 1.98, "learning_rate": 3.2902086935333774e-06, "loss": 0.0056, "step": 763100 }, { "epoch": 1.98, "learning_rate": 3.2863204771619127e-06, "loss": 0.0059, "step": 763110 }, { "epoch": 1.98, "learning_rate": 3.2824322607904484e-06, "loss": 0.0062, "step": 763120 }, { "epoch": 1.98, "learning_rate": 3.2785440444189837e-06, "loss": 0.0068, "step": 763130 }, { "epoch": 1.98, "learning_rate": 3.2746558280475186e-06, "loss": 0.0091, "step": 763140 }, { "epoch": 1.98, "learning_rate": 3.2707676116760543e-06, "loss": 0.006, "step": 763150 }, { "epoch": 1.98, "learning_rate": 3.2668793953045896e-06, "loss": 0.0085, "step": 763160 }, { "epoch": 1.98, "learning_rate": 3.262991178933125e-06, "loss": 0.0065, "step": 763170 }, { "epoch": 1.98, "learning_rate": 3.2591029625616606e-06, "loss": 0.0052, "step": 763180 }, { "epoch": 1.98, "learning_rate": 3.255214746190196e-06, "loss": 0.0084, "step": 763190 }, { "epoch": 1.98, "learning_rate": 3.2513265298187307e-06, "loss": 0.004, "step": 763200 }, { "epoch": 1.98, "learning_rate": 3.2474383134472664e-06, "loss": 0.0055, "step": 763210 }, { "epoch": 1.98, "learning_rate": 3.2435500970758017e-06, "loss": 0.0065, "step": 763220 }, { "epoch": 1.98, "learning_rate": 3.2396618807043374e-06, "loss": 0.0096, "step": 763230 }, { "epoch": 1.98, "learning_rate": 3.2357736643328727e-06, "loss": 0.0058, "step": 763240 }, { "epoch": 1.98, "learning_rate": 3.2318854479614076e-06, "loss": 0.0089, "step": 763250 }, { "epoch": 1.98, "learning_rate": 3.2279972315899433e-06, "loss": 0.0059, "step": 763260 }, { "epoch": 1.98, "learning_rate": 3.2241090152184786e-06, "loss": 0.0061, "step": 763270 }, { "epoch": 1.98, "learning_rate": 3.220220798847014e-06, "loss": 0.0076, "step": 763280 }, { "epoch": 1.98, "learning_rate": 3.2163325824755495e-06, "loss": 0.007, "step": 763290 }, { "epoch": 1.98, "learning_rate": 3.212444366104085e-06, "loss": 0.0061, "step": 763300 }, { "epoch": 1.98, "learning_rate": 3.2085561497326197e-06, "loss": 0.0067, "step": 763310 }, { "epoch": 1.98, "learning_rate": 3.2046679333611554e-06, "loss": 0.0072, "step": 763320 }, { "epoch": 1.98, "learning_rate": 3.2007797169896907e-06, "loss": 0.0066, "step": 763330 }, { "epoch": 1.98, "learning_rate": 3.196891500618226e-06, "loss": 0.0099, "step": 763340 }, { "epoch": 1.98, "learning_rate": 3.1930032842467617e-06, "loss": 0.0083, "step": 763350 }, { "epoch": 1.98, "learning_rate": 3.189115067875297e-06, "loss": 0.0079, "step": 763360 }, { "epoch": 1.98, "learning_rate": 3.185226851503832e-06, "loss": 0.0062, "step": 763370 }, { "epoch": 1.98, "learning_rate": 3.1813386351323675e-06, "loss": 0.0076, "step": 763380 }, { "epoch": 1.98, "learning_rate": 3.177450418760903e-06, "loss": 0.0087, "step": 763390 }, { "epoch": 1.98, "learning_rate": 3.1735622023894385e-06, "loss": 0.0054, "step": 763400 }, { "epoch": 1.98, "learning_rate": 3.169673986017974e-06, "loss": 0.0063, "step": 763410 }, { "epoch": 1.98, "learning_rate": 3.1657857696465087e-06, "loss": 0.0062, "step": 763420 }, { "epoch": 1.98, "learning_rate": 3.1618975532750444e-06, "loss": 0.007, "step": 763430 }, { "epoch": 1.98, "learning_rate": 3.1580093369035797e-06, "loss": 0.0061, "step": 763440 }, { "epoch": 1.98, "learning_rate": 3.154121120532115e-06, "loss": 0.0082, "step": 763450 }, { "epoch": 1.98, "learning_rate": 3.1502329041606507e-06, "loss": 0.0074, "step": 763460 }, { "epoch": 1.98, "learning_rate": 3.146344687789186e-06, "loss": 0.0064, "step": 763470 }, { "epoch": 1.98, "learning_rate": 3.142456471417721e-06, "loss": 0.0067, "step": 763480 }, { "epoch": 1.98, "learning_rate": 3.1385682550462565e-06, "loss": 0.0069, "step": 763490 }, { "epoch": 1.98, "learning_rate": 3.134680038674792e-06, "loss": 0.0068, "step": 763500 }, { "epoch": 1.98, "learning_rate": 3.130791822303327e-06, "loss": 0.005, "step": 763510 }, { "epoch": 1.98, "learning_rate": 3.126903605931863e-06, "loss": 0.0058, "step": 763520 }, { "epoch": 1.98, "learning_rate": 3.123015389560398e-06, "loss": 0.0076, "step": 763530 }, { "epoch": 1.98, "learning_rate": 3.119127173188934e-06, "loss": 0.0078, "step": 763540 }, { "epoch": 1.98, "learning_rate": 3.1152389568174687e-06, "loss": 0.0057, "step": 763550 }, { "epoch": 1.98, "learning_rate": 3.111350740446004e-06, "loss": 0.0057, "step": 763560 }, { "epoch": 1.98, "learning_rate": 3.1074625240745396e-06, "loss": 0.0065, "step": 763570 }, { "epoch": 1.98, "learning_rate": 3.103574307703075e-06, "loss": 0.0076, "step": 763580 }, { "epoch": 1.98, "learning_rate": 3.09968609133161e-06, "loss": 0.0064, "step": 763590 }, { "epoch": 1.98, "learning_rate": 3.0957978749601455e-06, "loss": 0.0104, "step": 763600 }, { "epoch": 1.98, "learning_rate": 3.0919096585886808e-06, "loss": 0.008, "step": 763610 }, { "epoch": 1.98, "learning_rate": 3.088021442217216e-06, "loss": 0.0061, "step": 763620 }, { "epoch": 1.98, "learning_rate": 3.0841332258457518e-06, "loss": 0.0067, "step": 763630 }, { "epoch": 1.98, "learning_rate": 3.080245009474287e-06, "loss": 0.0094, "step": 763640 }, { "epoch": 1.98, "learning_rate": 3.076356793102822e-06, "loss": 0.0056, "step": 763650 }, { "epoch": 1.98, "learning_rate": 3.0724685767313576e-06, "loss": 0.0056, "step": 763660 }, { "epoch": 1.98, "learning_rate": 3.068580360359893e-06, "loss": 0.0084, "step": 763670 }, { "epoch": 1.98, "learning_rate": 3.064692143988428e-06, "loss": 0.0061, "step": 763680 }, { "epoch": 1.98, "learning_rate": 3.060803927616964e-06, "loss": 0.0061, "step": 763690 }, { "epoch": 1.98, "learning_rate": 3.056915711245499e-06, "loss": 0.0103, "step": 763700 }, { "epoch": 1.98, "learning_rate": 3.053027494874035e-06, "loss": 0.0086, "step": 763710 }, { "epoch": 1.98, "learning_rate": 3.0491392785025698e-06, "loss": 0.0077, "step": 763720 }, { "epoch": 1.98, "learning_rate": 3.045251062131105e-06, "loss": 0.0073, "step": 763730 }, { "epoch": 1.98, "learning_rate": 3.0413628457596408e-06, "loss": 0.0071, "step": 763740 }, { "epoch": 1.98, "learning_rate": 3.037474629388176e-06, "loss": 0.005, "step": 763750 }, { "epoch": 1.98, "learning_rate": 3.033586413016711e-06, "loss": 0.0059, "step": 763760 }, { "epoch": 1.98, "learning_rate": 3.0296981966452466e-06, "loss": 0.0097, "step": 763770 }, { "epoch": 1.98, "learning_rate": 3.025809980273782e-06, "loss": 0.0075, "step": 763780 }, { "epoch": 1.98, "learning_rate": 3.021921763902317e-06, "loss": 0.0061, "step": 763790 }, { "epoch": 1.98, "learning_rate": 3.018033547530853e-06, "loss": 0.0068, "step": 763800 }, { "epoch": 1.98, "learning_rate": 3.014145331159388e-06, "loss": 0.0088, "step": 763810 }, { "epoch": 1.98, "learning_rate": 3.010257114787923e-06, "loss": 0.006, "step": 763820 }, { "epoch": 1.98, "learning_rate": 3.0063688984164587e-06, "loss": 0.007, "step": 763830 }, { "epoch": 1.98, "learning_rate": 3.002480682044994e-06, "loss": 0.0075, "step": 763840 }, { "epoch": 1.98, "learning_rate": 2.9985924656735297e-06, "loss": 0.0083, "step": 763850 }, { "epoch": 1.98, "learning_rate": 2.994704249302065e-06, "loss": 0.0071, "step": 763860 }, { "epoch": 1.98, "learning_rate": 2.9908160329306003e-06, "loss": 0.0075, "step": 763870 }, { "epoch": 1.98, "learning_rate": 2.986927816559136e-06, "loss": 0.0095, "step": 763880 }, { "epoch": 1.98, "learning_rate": 2.983039600187671e-06, "loss": 0.0059, "step": 763890 }, { "epoch": 1.98, "learning_rate": 2.979151383816206e-06, "loss": 0.0063, "step": 763900 }, { "epoch": 1.98, "learning_rate": 2.975263167444742e-06, "loss": 0.0055, "step": 763910 }, { "epoch": 1.98, "learning_rate": 2.971374951073277e-06, "loss": 0.0073, "step": 763920 }, { "epoch": 1.98, "learning_rate": 2.967486734701812e-06, "loss": 0.0089, "step": 763930 }, { "epoch": 1.98, "learning_rate": 2.9635985183303477e-06, "loss": 0.0083, "step": 763940 }, { "epoch": 1.98, "learning_rate": 2.959710301958883e-06, "loss": 0.0069, "step": 763950 }, { "epoch": 1.98, "learning_rate": 2.9558220855874183e-06, "loss": 0.0103, "step": 763960 }, { "epoch": 1.98, "learning_rate": 2.951933869215954e-06, "loss": 0.0056, "step": 763970 }, { "epoch": 1.98, "learning_rate": 2.9480456528444893e-06, "loss": 0.0071, "step": 763980 }, { "epoch": 1.98, "learning_rate": 2.944157436473025e-06, "loss": 0.0088, "step": 763990 }, { "epoch": 1.98, "learning_rate": 2.94026922010156e-06, "loss": 0.0063, "step": 764000 }, { "epoch": 1.98, "eval_cer": 0.8816872903168917, "eval_loss": 0.004406400490552187, "eval_runtime": 107.9975, "eval_samples_per_second": 18.519, "eval_steps_per_second": 4.63, "step": 764000 }, { "epoch": 1.98, "learning_rate": 2.936381003730095e-06, "loss": 0.0069, "step": 764010 }, { "epoch": 1.98, "learning_rate": 2.932492787358631e-06, "loss": 0.0057, "step": 764020 }, { "epoch": 1.98, "learning_rate": 2.928604570987166e-06, "loss": 0.0065, "step": 764030 }, { "epoch": 1.98, "learning_rate": 2.9247163546157014e-06, "loss": 0.0085, "step": 764040 }, { "epoch": 1.98, "learning_rate": 2.920828138244237e-06, "loss": 0.0103, "step": 764050 }, { "epoch": 1.98, "learning_rate": 2.916939921872772e-06, "loss": 0.0075, "step": 764060 }, { "epoch": 1.98, "learning_rate": 2.9130517055013073e-06, "loss": 0.0057, "step": 764070 }, { "epoch": 1.98, "learning_rate": 2.909163489129843e-06, "loss": 0.007, "step": 764080 }, { "epoch": 1.98, "learning_rate": 2.9052752727583783e-06, "loss": 0.0073, "step": 764090 }, { "epoch": 1.98, "learning_rate": 2.901387056386913e-06, "loss": 0.0086, "step": 764100 }, { "epoch": 1.98, "learning_rate": 2.897498840015449e-06, "loss": 0.0061, "step": 764110 }, { "epoch": 1.98, "learning_rate": 2.893610623643984e-06, "loss": 0.0067, "step": 764120 }, { "epoch": 1.98, "learning_rate": 2.8897224072725194e-06, "loss": 0.006, "step": 764130 }, { "epoch": 1.98, "learning_rate": 2.885834190901055e-06, "loss": 0.0052, "step": 764140 }, { "epoch": 1.98, "learning_rate": 2.8819459745295904e-06, "loss": 0.0059, "step": 764150 }, { "epoch": 1.98, "learning_rate": 2.878057758158126e-06, "loss": 0.0073, "step": 764160 }, { "epoch": 1.98, "learning_rate": 2.874169541786661e-06, "loss": 0.0058, "step": 764170 }, { "epoch": 1.98, "learning_rate": 2.8702813254151963e-06, "loss": 0.0105, "step": 764180 }, { "epoch": 1.98, "learning_rate": 2.866393109043732e-06, "loss": 0.0102, "step": 764190 }, { "epoch": 1.98, "learning_rate": 2.8625048926722673e-06, "loss": 0.0059, "step": 764200 }, { "epoch": 1.98, "learning_rate": 2.8586166763008025e-06, "loss": 0.0056, "step": 764210 }, { "epoch": 1.98, "learning_rate": 2.8547284599293383e-06, "loss": 0.0068, "step": 764220 }, { "epoch": 1.98, "learning_rate": 2.850840243557873e-06, "loss": 0.0069, "step": 764230 }, { "epoch": 1.98, "learning_rate": 2.8469520271864084e-06, "loss": 0.007, "step": 764240 }, { "epoch": 1.98, "learning_rate": 2.843063810814944e-06, "loss": 0.0046, "step": 764250 }, { "epoch": 1.98, "learning_rate": 2.8391755944434794e-06, "loss": 0.0074, "step": 764260 }, { "epoch": 1.98, "learning_rate": 2.8352873780720147e-06, "loss": 0.0083, "step": 764270 }, { "epoch": 1.98, "learning_rate": 2.83139916170055e-06, "loss": 0.005, "step": 764280 }, { "epoch": 1.98, "learning_rate": 2.8275109453290852e-06, "loss": 0.0076, "step": 764290 }, { "epoch": 1.98, "learning_rate": 2.823622728957621e-06, "loss": 0.0094, "step": 764300 }, { "epoch": 1.98, "learning_rate": 2.8197345125861562e-06, "loss": 0.0069, "step": 764310 }, { "epoch": 1.98, "learning_rate": 2.8158462962146915e-06, "loss": 0.0083, "step": 764320 }, { "epoch": 1.98, "learning_rate": 2.8119580798432272e-06, "loss": 0.0085, "step": 764330 }, { "epoch": 1.98, "learning_rate": 2.808069863471762e-06, "loss": 0.0088, "step": 764340 }, { "epoch": 1.98, "learning_rate": 2.8041816471002974e-06, "loss": 0.0116, "step": 764350 }, { "epoch": 1.98, "learning_rate": 2.800293430728833e-06, "loss": 0.0079, "step": 764360 }, { "epoch": 1.98, "learning_rate": 2.7964052143573684e-06, "loss": 0.0082, "step": 764370 }, { "epoch": 1.98, "learning_rate": 2.7925169979859037e-06, "loss": 0.01, "step": 764380 }, { "epoch": 1.98, "learning_rate": 2.7886287816144394e-06, "loss": 0.0063, "step": 764390 }, { "epoch": 1.98, "learning_rate": 2.7847405652429742e-06, "loss": 0.0062, "step": 764400 }, { "epoch": 1.98, "learning_rate": 2.7808523488715095e-06, "loss": 0.0064, "step": 764410 }, { "epoch": 1.98, "learning_rate": 2.7769641325000452e-06, "loss": 0.0075, "step": 764420 }, { "epoch": 1.98, "learning_rate": 2.7730759161285805e-06, "loss": 0.0055, "step": 764430 }, { "epoch": 1.98, "learning_rate": 2.769187699757116e-06, "loss": 0.0072, "step": 764440 }, { "epoch": 1.98, "learning_rate": 2.765299483385651e-06, "loss": 0.005, "step": 764450 }, { "epoch": 1.98, "learning_rate": 2.7614112670141864e-06, "loss": 0.0052, "step": 764460 }, { "epoch": 1.98, "learning_rate": 2.757523050642722e-06, "loss": 0.0063, "step": 764470 }, { "epoch": 1.98, "learning_rate": 2.7536348342712574e-06, "loss": 0.0067, "step": 764480 }, { "epoch": 1.98, "learning_rate": 2.7497466178997926e-06, "loss": 0.0061, "step": 764490 }, { "epoch": 1.98, "learning_rate": 2.7458584015283284e-06, "loss": 0.007, "step": 764500 }, { "epoch": 1.98, "learning_rate": 2.7419701851568632e-06, "loss": 0.0058, "step": 764510 }, { "epoch": 1.98, "learning_rate": 2.7380819687853985e-06, "loss": 0.0055, "step": 764520 }, { "epoch": 1.98, "learning_rate": 2.734193752413934e-06, "loss": 0.0053, "step": 764530 }, { "epoch": 1.98, "learning_rate": 2.7303055360424695e-06, "loss": 0.0057, "step": 764540 }, { "epoch": 1.98, "learning_rate": 2.7264173196710048e-06, "loss": 0.0071, "step": 764550 }, { "epoch": 1.98, "learning_rate": 2.7225291032995405e-06, "loss": 0.0063, "step": 764560 }, { "epoch": 1.98, "learning_rate": 2.7186408869280753e-06, "loss": 0.0059, "step": 764570 }, { "epoch": 1.98, "learning_rate": 2.7147526705566106e-06, "loss": 0.0076, "step": 764580 }, { "epoch": 1.98, "learning_rate": 2.7108644541851463e-06, "loss": 0.0093, "step": 764590 }, { "epoch": 1.98, "learning_rate": 2.7069762378136816e-06, "loss": 0.008, "step": 764600 }, { "epoch": 1.98, "learning_rate": 2.7030880214422173e-06, "loss": 0.0086, "step": 764610 }, { "epoch": 1.98, "learning_rate": 2.699199805070752e-06, "loss": 0.0082, "step": 764620 }, { "epoch": 1.98, "learning_rate": 2.6953115886992875e-06, "loss": 0.0063, "step": 764630 }, { "epoch": 1.98, "learning_rate": 2.691423372327823e-06, "loss": 0.0065, "step": 764640 }, { "epoch": 1.98, "learning_rate": 2.6875351559563585e-06, "loss": 0.0074, "step": 764650 }, { "epoch": 1.98, "learning_rate": 2.6836469395848938e-06, "loss": 0.0072, "step": 764660 }, { "epoch": 1.98, "learning_rate": 2.6797587232134295e-06, "loss": 0.0076, "step": 764670 }, { "epoch": 1.98, "learning_rate": 2.6758705068419643e-06, "loss": 0.0078, "step": 764680 }, { "epoch": 1.98, "learning_rate": 2.6719822904704996e-06, "loss": 0.0071, "step": 764690 }, { "epoch": 1.98, "learning_rate": 2.6680940740990353e-06, "loss": 0.0053, "step": 764700 }, { "epoch": 1.98, "learning_rate": 2.6642058577275706e-06, "loss": 0.0065, "step": 764710 }, { "epoch": 1.98, "learning_rate": 2.660317641356106e-06, "loss": 0.0065, "step": 764720 }, { "epoch": 1.98, "learning_rate": 2.6564294249846416e-06, "loss": 0.0092, "step": 764730 }, { "epoch": 1.98, "learning_rate": 2.6525412086131765e-06, "loss": 0.0083, "step": 764740 }, { "epoch": 1.98, "learning_rate": 2.6486529922417117e-06, "loss": 0.0073, "step": 764750 }, { "epoch": 1.98, "learning_rate": 2.6447647758702475e-06, "loss": 0.0071, "step": 764760 }, { "epoch": 1.98, "learning_rate": 2.6408765594987827e-06, "loss": 0.0053, "step": 764770 }, { "epoch": 1.98, "learning_rate": 2.6369883431273185e-06, "loss": 0.008, "step": 764780 }, { "epoch": 1.98, "learning_rate": 2.6331001267558533e-06, "loss": 0.0083, "step": 764790 }, { "epoch": 1.98, "learning_rate": 2.6292119103843886e-06, "loss": 0.0087, "step": 764800 }, { "epoch": 1.98, "learning_rate": 2.6253236940129243e-06, "loss": 0.0092, "step": 764810 }, { "epoch": 1.98, "learning_rate": 2.6214354776414596e-06, "loss": 0.0061, "step": 764820 }, { "epoch": 1.98, "learning_rate": 2.617547261269995e-06, "loss": 0.0058, "step": 764830 }, { "epoch": 1.98, "learning_rate": 2.6136590448985306e-06, "loss": 0.0068, "step": 764840 }, { "epoch": 1.98, "learning_rate": 2.6097708285270654e-06, "loss": 0.0062, "step": 764850 }, { "epoch": 1.98, "learning_rate": 2.6058826121556007e-06, "loss": 0.0091, "step": 764860 }, { "epoch": 1.98, "learning_rate": 2.6019943957841364e-06, "loss": 0.0067, "step": 764870 }, { "epoch": 1.98, "learning_rate": 2.5981061794126717e-06, "loss": 0.0066, "step": 764880 }, { "epoch": 1.98, "learning_rate": 2.594217963041207e-06, "loss": 0.0064, "step": 764890 }, { "epoch": 1.98, "learning_rate": 2.5903297466697427e-06, "loss": 0.0077, "step": 764900 }, { "epoch": 1.98, "learning_rate": 2.5864415302982776e-06, "loss": 0.0064, "step": 764910 }, { "epoch": 1.98, "learning_rate": 2.5825533139268133e-06, "loss": 0.0066, "step": 764920 }, { "epoch": 1.98, "learning_rate": 2.5786650975553486e-06, "loss": 0.0065, "step": 764930 }, { "epoch": 1.98, "learning_rate": 2.574776881183884e-06, "loss": 0.0069, "step": 764940 }, { "epoch": 1.98, "learning_rate": 2.5708886648124196e-06, "loss": 0.0076, "step": 764950 }, { "epoch": 1.98, "learning_rate": 2.567000448440955e-06, "loss": 0.0067, "step": 764960 }, { "epoch": 1.98, "learning_rate": 2.5631122320694897e-06, "loss": 0.0054, "step": 764970 }, { "epoch": 1.98, "learning_rate": 2.5592240156980254e-06, "loss": 0.0072, "step": 764980 }, { "epoch": 1.98, "learning_rate": 2.5553357993265607e-06, "loss": 0.0092, "step": 764990 }, { "epoch": 1.98, "learning_rate": 2.551447582955096e-06, "loss": 0.0062, "step": 765000 }, { "epoch": 1.98, "eval_cer": 0.8816942885015627, "eval_loss": 0.004388539120554924, "eval_runtime": 107.9641, "eval_samples_per_second": 18.525, "eval_steps_per_second": 4.631, "step": 765000 }, { "epoch": 1.98, "learning_rate": 2.5475593665836317e-06, "loss": 0.0057, "step": 765010 }, { "epoch": 1.98, "learning_rate": 2.5436711502121666e-06, "loss": 0.0068, "step": 765020 }, { "epoch": 1.98, "learning_rate": 2.539782933840702e-06, "loss": 0.0075, "step": 765030 }, { "epoch": 1.98, "learning_rate": 2.5358947174692376e-06, "loss": 0.0046, "step": 765040 }, { "epoch": 1.98, "learning_rate": 2.532006501097773e-06, "loss": 0.0071, "step": 765050 }, { "epoch": 1.98, "learning_rate": 2.5281182847263085e-06, "loss": 0.0069, "step": 765060 }, { "epoch": 1.98, "learning_rate": 2.524230068354844e-06, "loss": 0.0082, "step": 765070 }, { "epoch": 1.98, "learning_rate": 2.5203418519833787e-06, "loss": 0.0069, "step": 765080 }, { "epoch": 1.98, "learning_rate": 2.5164536356119144e-06, "loss": 0.0084, "step": 765090 }, { "epoch": 1.98, "learning_rate": 2.5125654192404497e-06, "loss": 0.0054, "step": 765100 }, { "epoch": 1.98, "learning_rate": 2.508677202868985e-06, "loss": 0.0072, "step": 765110 }, { "epoch": 1.98, "learning_rate": 2.5047889864975207e-06, "loss": 0.0042, "step": 765120 }, { "epoch": 1.98, "learning_rate": 2.500900770126056e-06, "loss": 0.0046, "step": 765130 }, { "epoch": 1.98, "learning_rate": 2.497012553754591e-06, "loss": 0.0061, "step": 765140 }, { "epoch": 1.98, "learning_rate": 2.4931243373831265e-06, "loss": 0.0075, "step": 765150 }, { "epoch": 1.98, "learning_rate": 2.489236121011662e-06, "loss": 0.0079, "step": 765160 }, { "epoch": 1.98, "learning_rate": 2.485347904640197e-06, "loss": 0.0075, "step": 765170 }, { "epoch": 1.98, "learning_rate": 2.481459688268733e-06, "loss": 0.0082, "step": 765180 }, { "epoch": 1.98, "learning_rate": 2.4775714718972677e-06, "loss": 0.0061, "step": 765190 }, { "epoch": 1.98, "learning_rate": 2.473683255525803e-06, "loss": 0.0096, "step": 765200 }, { "epoch": 1.98, "learning_rate": 2.4697950391543387e-06, "loss": 0.0078, "step": 765210 }, { "epoch": 1.98, "learning_rate": 2.465906822782874e-06, "loss": 0.0061, "step": 765220 }, { "epoch": 1.98, "learning_rate": 2.4620186064114097e-06, "loss": 0.0062, "step": 765230 }, { "epoch": 1.98, "learning_rate": 2.458130390039945e-06, "loss": 0.0063, "step": 765240 }, { "epoch": 1.98, "learning_rate": 2.45424217366848e-06, "loss": 0.0059, "step": 765250 }, { "epoch": 1.98, "learning_rate": 2.4503539572970155e-06, "loss": 0.0073, "step": 765260 }, { "epoch": 1.98, "learning_rate": 2.446465740925551e-06, "loss": 0.0064, "step": 765270 }, { "epoch": 1.98, "learning_rate": 2.442577524554086e-06, "loss": 0.0076, "step": 765280 }, { "epoch": 1.98, "learning_rate": 2.438689308182622e-06, "loss": 0.0068, "step": 765290 }, { "epoch": 1.98, "learning_rate": 2.434801091811157e-06, "loss": 0.0077, "step": 765300 }, { "epoch": 1.98, "learning_rate": 2.430912875439692e-06, "loss": 0.0062, "step": 765310 }, { "epoch": 1.98, "learning_rate": 2.4270246590682277e-06, "loss": 0.0066, "step": 765320 }, { "epoch": 1.98, "learning_rate": 2.423136442696763e-06, "loss": 0.006, "step": 765330 }, { "epoch": 1.98, "learning_rate": 2.4192482263252982e-06, "loss": 0.0095, "step": 765340 }, { "epoch": 1.98, "learning_rate": 2.415360009953834e-06, "loss": 0.0088, "step": 765350 }, { "epoch": 1.98, "learning_rate": 2.411471793582369e-06, "loss": 0.0073, "step": 765360 }, { "epoch": 1.98, "learning_rate": 2.4075835772109045e-06, "loss": 0.0084, "step": 765370 }, { "epoch": 1.98, "learning_rate": 2.4036953608394398e-06, "loss": 0.0087, "step": 765380 }, { "epoch": 1.98, "learning_rate": 2.399807144467975e-06, "loss": 0.0079, "step": 765390 }, { "epoch": 1.98, "learning_rate": 2.3959189280965108e-06, "loss": 0.0058, "step": 765400 }, { "epoch": 1.98, "learning_rate": 2.392030711725046e-06, "loss": 0.0059, "step": 765410 }, { "epoch": 1.98, "learning_rate": 2.388142495353581e-06, "loss": 0.0061, "step": 765420 }, { "epoch": 1.98, "learning_rate": 2.3842542789821166e-06, "loss": 0.0079, "step": 765430 }, { "epoch": 1.98, "learning_rate": 2.380366062610652e-06, "loss": 0.0051, "step": 765440 }, { "epoch": 1.98, "learning_rate": 2.376477846239187e-06, "loss": 0.0071, "step": 765450 }, { "epoch": 1.98, "learning_rate": 2.372589629867723e-06, "loss": 0.0047, "step": 765460 }, { "epoch": 1.98, "learning_rate": 2.368701413496258e-06, "loss": 0.0037, "step": 765470 }, { "epoch": 1.98, "learning_rate": 2.364813197124793e-06, "loss": 0.0073, "step": 765480 }, { "epoch": 1.98, "learning_rate": 2.3609249807533288e-06, "loss": 0.006, "step": 765490 }, { "epoch": 1.98, "learning_rate": 2.357036764381864e-06, "loss": 0.006, "step": 765500 }, { "epoch": 1.98, "learning_rate": 2.3531485480103993e-06, "loss": 0.007, "step": 765510 }, { "epoch": 1.98, "learning_rate": 2.349260331638935e-06, "loss": 0.0068, "step": 765520 }, { "epoch": 1.98, "learning_rate": 2.34537211526747e-06, "loss": 0.0077, "step": 765530 }, { "epoch": 1.98, "learning_rate": 2.3414838988960056e-06, "loss": 0.0057, "step": 765540 }, { "epoch": 1.98, "learning_rate": 2.337595682524541e-06, "loss": 0.0068, "step": 765550 }, { "epoch": 1.98, "learning_rate": 2.3337074661530766e-06, "loss": 0.0099, "step": 765560 }, { "epoch": 1.98, "learning_rate": 2.3298192497816115e-06, "loss": 0.0061, "step": 765570 }, { "epoch": 1.98, "learning_rate": 2.325931033410147e-06, "loss": 0.0101, "step": 765580 }, { "epoch": 1.98, "learning_rate": 2.3220428170386825e-06, "loss": 0.0069, "step": 765590 }, { "epoch": 1.98, "learning_rate": 2.3181546006672178e-06, "loss": 0.0064, "step": 765600 }, { "epoch": 1.98, "learning_rate": 2.314266384295753e-06, "loss": 0.006, "step": 765610 }, { "epoch": 1.98, "learning_rate": 2.3103781679242883e-06, "loss": 0.0066, "step": 765620 }, { "epoch": 1.98, "learning_rate": 2.3064899515528236e-06, "loss": 0.0045, "step": 765630 }, { "epoch": 1.98, "learning_rate": 2.3026017351813593e-06, "loss": 0.0069, "step": 765640 }, { "epoch": 1.98, "learning_rate": 2.2987135188098946e-06, "loss": 0.0058, "step": 765650 }, { "epoch": 1.98, "learning_rate": 2.29482530243843e-06, "loss": 0.0062, "step": 765660 }, { "epoch": 1.98, "learning_rate": 2.290937086066965e-06, "loss": 0.0074, "step": 765670 }, { "epoch": 1.98, "learning_rate": 2.2870488696955005e-06, "loss": 0.0066, "step": 765680 }, { "epoch": 1.98, "learning_rate": 2.283160653324036e-06, "loss": 0.0069, "step": 765690 }, { "epoch": 1.98, "learning_rate": 2.279272436952571e-06, "loss": 0.0076, "step": 765700 }, { "epoch": 1.98, "learning_rate": 2.2753842205811067e-06, "loss": 0.0067, "step": 765710 }, { "epoch": 1.98, "learning_rate": 2.271496004209642e-06, "loss": 0.0073, "step": 765720 }, { "epoch": 1.98, "learning_rate": 2.2676077878381777e-06, "loss": 0.0066, "step": 765730 }, { "epoch": 1.98, "learning_rate": 2.2637195714667126e-06, "loss": 0.0078, "step": 765740 }, { "epoch": 1.98, "learning_rate": 2.2598313550952483e-06, "loss": 0.0074, "step": 765750 }, { "epoch": 1.98, "learning_rate": 2.2559431387237836e-06, "loss": 0.0093, "step": 765760 }, { "epoch": 1.98, "learning_rate": 2.252054922352319e-06, "loss": 0.0051, "step": 765770 }, { "epoch": 1.99, "learning_rate": 2.248166705980854e-06, "loss": 0.006, "step": 765780 }, { "epoch": 1.99, "learning_rate": 2.2442784896093894e-06, "loss": 0.006, "step": 765790 }, { "epoch": 1.99, "learning_rate": 2.240390273237925e-06, "loss": 0.0049, "step": 765800 }, { "epoch": 1.99, "learning_rate": 2.2365020568664604e-06, "loss": 0.0064, "step": 765810 }, { "epoch": 1.99, "learning_rate": 2.2326138404949957e-06, "loss": 0.0069, "step": 765820 }, { "epoch": 1.99, "learning_rate": 2.228725624123531e-06, "loss": 0.0058, "step": 765830 }, { "epoch": 1.99, "learning_rate": 2.2248374077520663e-06, "loss": 0.0057, "step": 765840 }, { "epoch": 1.99, "learning_rate": 2.2209491913806016e-06, "loss": 0.0049, "step": 765850 }, { "epoch": 1.99, "learning_rate": 2.2170609750091373e-06, "loss": 0.0131, "step": 765860 }, { "epoch": 1.99, "learning_rate": 2.2131727586376726e-06, "loss": 0.0057, "step": 765870 }, { "epoch": 1.99, "learning_rate": 2.209284542266208e-06, "loss": 0.0082, "step": 765880 }, { "epoch": 1.99, "learning_rate": 2.205396325894743e-06, "loss": 0.005, "step": 765890 }, { "epoch": 1.99, "learning_rate": 2.201508109523279e-06, "loss": 0.007, "step": 765900 }, { "epoch": 1.99, "learning_rate": 2.1976198931518137e-06, "loss": 0.0071, "step": 765910 }, { "epoch": 1.99, "learning_rate": 2.1937316767803494e-06, "loss": 0.0054, "step": 765920 }, { "epoch": 1.99, "learning_rate": 2.1898434604088847e-06, "loss": 0.0069, "step": 765930 }, { "epoch": 1.99, "learning_rate": 2.18595524403742e-06, "loss": 0.0082, "step": 765940 }, { "epoch": 1.99, "learning_rate": 2.1820670276659553e-06, "loss": 0.0068, "step": 765950 }, { "epoch": 1.99, "learning_rate": 2.1781788112944906e-06, "loss": 0.0094, "step": 765960 }, { "epoch": 1.99, "learning_rate": 2.1742905949230263e-06, "loss": 0.008, "step": 765970 }, { "epoch": 1.99, "learning_rate": 2.1704023785515615e-06, "loss": 0.0065, "step": 765980 }, { "epoch": 1.99, "learning_rate": 2.166514162180097e-06, "loss": 0.0065, "step": 765990 }, { "epoch": 1.99, "learning_rate": 2.162625945808632e-06, "loss": 0.008, "step": 766000 }, { "epoch": 1.99, "eval_cer": 0.8816956881384969, "eval_loss": 0.004399578087031841, "eval_runtime": 107.8197, "eval_samples_per_second": 18.549, "eval_steps_per_second": 4.637, "step": 766000 }, { "epoch": 1.99, "learning_rate": 2.1587377294371674e-06, "loss": 0.0067, "step": 766010 }, { "epoch": 1.99, "learning_rate": 2.1548495130657027e-06, "loss": 0.0061, "step": 766020 }, { "epoch": 1.99, "learning_rate": 2.1509612966942384e-06, "loss": 0.0066, "step": 766030 }, { "epoch": 1.99, "learning_rate": 2.1470730803227737e-06, "loss": 0.0051, "step": 766040 }, { "epoch": 1.99, "learning_rate": 2.143184863951309e-06, "loss": 0.0076, "step": 766050 }, { "epoch": 1.99, "learning_rate": 2.1392966475798443e-06, "loss": 0.007, "step": 766060 }, { "epoch": 1.99, "learning_rate": 2.13540843120838e-06, "loss": 0.0073, "step": 766070 }, { "epoch": 1.99, "learning_rate": 2.131520214836915e-06, "loss": 0.0064, "step": 766080 }, { "epoch": 1.99, "learning_rate": 2.1276319984654505e-06, "loss": 0.0075, "step": 766090 }, { "epoch": 1.99, "learning_rate": 2.123743782093986e-06, "loss": 0.0097, "step": 766100 }, { "epoch": 1.99, "learning_rate": 2.119855565722521e-06, "loss": 0.0078, "step": 766110 }, { "epoch": 1.99, "learning_rate": 2.1159673493510564e-06, "loss": 0.0056, "step": 766120 }, { "epoch": 1.99, "learning_rate": 2.1120791329795917e-06, "loss": 0.0054, "step": 766130 }, { "epoch": 1.99, "learning_rate": 2.1081909166081274e-06, "loss": 0.0077, "step": 766140 }, { "epoch": 1.99, "learning_rate": 2.1043027002366627e-06, "loss": 0.0063, "step": 766150 }, { "epoch": 1.99, "learning_rate": 2.100414483865198e-06, "loss": 0.0062, "step": 766160 }, { "epoch": 1.99, "learning_rate": 2.0965262674937332e-06, "loss": 0.005, "step": 766170 }, { "epoch": 1.99, "learning_rate": 2.092638051122269e-06, "loss": 0.0086, "step": 766180 }, { "epoch": 1.99, "learning_rate": 2.088749834750804e-06, "loss": 0.005, "step": 766190 }, { "epoch": 1.99, "learning_rate": 2.0848616183793395e-06, "loss": 0.0067, "step": 766200 }, { "epoch": 1.99, "learning_rate": 2.080973402007875e-06, "loss": 0.0068, "step": 766210 }, { "epoch": 1.99, "learning_rate": 2.07708518563641e-06, "loss": 0.0093, "step": 766220 }, { "epoch": 1.99, "learning_rate": 2.0731969692649454e-06, "loss": 0.0059, "step": 766230 }, { "epoch": 1.99, "learning_rate": 2.069308752893481e-06, "loss": 0.0068, "step": 766240 }, { "epoch": 1.99, "learning_rate": 2.0654205365220164e-06, "loss": 0.0082, "step": 766250 }, { "epoch": 1.99, "learning_rate": 2.0615323201505516e-06, "loss": 0.0067, "step": 766260 }, { "epoch": 1.99, "learning_rate": 2.057644103779087e-06, "loss": 0.0062, "step": 766270 }, { "epoch": 1.99, "learning_rate": 2.0537558874076222e-06, "loss": 0.0065, "step": 766280 }, { "epoch": 1.99, "learning_rate": 2.0498676710361575e-06, "loss": 0.0061, "step": 766290 }, { "epoch": 1.99, "learning_rate": 2.0459794546646928e-06, "loss": 0.0057, "step": 766300 }, { "epoch": 1.99, "learning_rate": 2.0420912382932285e-06, "loss": 0.0076, "step": 766310 }, { "epoch": 1.99, "learning_rate": 2.0382030219217638e-06, "loss": 0.0069, "step": 766320 }, { "epoch": 1.99, "learning_rate": 2.034314805550299e-06, "loss": 0.0083, "step": 766330 }, { "epoch": 1.99, "learning_rate": 2.0304265891788343e-06, "loss": 0.0077, "step": 766340 }, { "epoch": 1.99, "learning_rate": 2.02653837280737e-06, "loss": 0.0085, "step": 766350 }, { "epoch": 1.99, "learning_rate": 2.022650156435905e-06, "loss": 0.0069, "step": 766360 }, { "epoch": 1.99, "learning_rate": 2.0187619400644406e-06, "loss": 0.0055, "step": 766370 }, { "epoch": 1.99, "learning_rate": 2.014873723692976e-06, "loss": 0.0055, "step": 766380 }, { "epoch": 1.99, "learning_rate": 2.010985507321511e-06, "loss": 0.0085, "step": 766390 }, { "epoch": 1.99, "learning_rate": 2.0070972909500465e-06, "loss": 0.0049, "step": 766400 }, { "epoch": 1.99, "learning_rate": 2.003209074578582e-06, "loss": 0.0058, "step": 766410 }, { "epoch": 1.99, "learning_rate": 1.9993208582071175e-06, "loss": 0.006, "step": 766420 }, { "epoch": 1.99, "learning_rate": 1.9954326418356528e-06, "loss": 0.0074, "step": 766430 }, { "epoch": 1.99, "learning_rate": 1.991544425464188e-06, "loss": 0.0065, "step": 766440 }, { "epoch": 1.99, "learning_rate": 1.9876562090927233e-06, "loss": 0.0084, "step": 766450 }, { "epoch": 1.99, "learning_rate": 1.9837679927212586e-06, "loss": 0.0062, "step": 766460 }, { "epoch": 1.99, "learning_rate": 1.979879776349794e-06, "loss": 0.0052, "step": 766470 }, { "epoch": 1.99, "learning_rate": 1.9759915599783296e-06, "loss": 0.0071, "step": 766480 }, { "epoch": 1.99, "learning_rate": 1.972103343606865e-06, "loss": 0.0063, "step": 766490 }, { "epoch": 1.99, "learning_rate": 1.9682151272354e-06, "loss": 0.008, "step": 766500 }, { "epoch": 1.99, "learning_rate": 1.9643269108639355e-06, "loss": 0.006, "step": 766510 }, { "epoch": 1.99, "learning_rate": 1.960438694492471e-06, "loss": 0.0066, "step": 766520 }, { "epoch": 1.99, "learning_rate": 1.956550478121006e-06, "loss": 0.0061, "step": 766530 }, { "epoch": 1.99, "learning_rate": 1.9526622617495417e-06, "loss": 0.0063, "step": 766540 }, { "epoch": 1.99, "learning_rate": 1.948774045378077e-06, "loss": 0.0088, "step": 766550 }, { "epoch": 1.99, "learning_rate": 1.9448858290066123e-06, "loss": 0.0067, "step": 766560 }, { "epoch": 1.99, "learning_rate": 1.9409976126351476e-06, "loss": 0.0076, "step": 766570 }, { "epoch": 1.99, "learning_rate": 1.9371093962636833e-06, "loss": 0.0059, "step": 766580 }, { "epoch": 1.99, "learning_rate": 1.9332211798922186e-06, "loss": 0.0078, "step": 766590 }, { "epoch": 1.99, "learning_rate": 1.929332963520754e-06, "loss": 0.005, "step": 766600 }, { "epoch": 1.99, "learning_rate": 1.925444747149289e-06, "loss": 0.0056, "step": 766610 }, { "epoch": 1.99, "learning_rate": 1.9215565307778244e-06, "loss": 0.0076, "step": 766620 }, { "epoch": 1.99, "learning_rate": 1.91766831440636e-06, "loss": 0.0056, "step": 766630 }, { "epoch": 1.99, "learning_rate": 1.913780098034895e-06, "loss": 0.0104, "step": 766640 }, { "epoch": 1.99, "learning_rate": 1.9098918816634307e-06, "loss": 0.0103, "step": 766650 }, { "epoch": 1.99, "learning_rate": 1.906003665291966e-06, "loss": 0.0056, "step": 766660 }, { "epoch": 1.99, "learning_rate": 1.9021154489205013e-06, "loss": 0.0054, "step": 766670 }, { "epoch": 1.99, "learning_rate": 1.8982272325490368e-06, "loss": 0.0056, "step": 766680 }, { "epoch": 1.99, "learning_rate": 1.894339016177572e-06, "loss": 0.0091, "step": 766690 }, { "epoch": 1.99, "learning_rate": 1.8904507998061074e-06, "loss": 0.0056, "step": 766700 }, { "epoch": 1.99, "learning_rate": 1.8865625834346429e-06, "loss": 0.0064, "step": 766710 }, { "epoch": 1.99, "learning_rate": 1.8826743670631781e-06, "loss": 0.0068, "step": 766720 }, { "epoch": 1.99, "learning_rate": 1.8787861506917136e-06, "loss": 0.0056, "step": 766730 }, { "epoch": 1.99, "learning_rate": 1.8748979343202487e-06, "loss": 0.0068, "step": 766740 }, { "epoch": 1.99, "learning_rate": 1.8710097179487842e-06, "loss": 0.0045, "step": 766750 }, { "epoch": 1.99, "learning_rate": 1.8671215015773197e-06, "loss": 0.0067, "step": 766760 }, { "epoch": 1.99, "learning_rate": 1.8632332852058548e-06, "loss": 0.0047, "step": 766770 }, { "epoch": 1.99, "learning_rate": 1.8593450688343903e-06, "loss": 0.0087, "step": 766780 }, { "epoch": 1.99, "learning_rate": 1.8554568524629258e-06, "loss": 0.0072, "step": 766790 }, { "epoch": 1.99, "learning_rate": 1.851568636091461e-06, "loss": 0.0057, "step": 766800 }, { "epoch": 1.99, "learning_rate": 1.8476804197199963e-06, "loss": 0.0083, "step": 766810 }, { "epoch": 1.99, "learning_rate": 1.8437922033485318e-06, "loss": 0.0076, "step": 766820 }, { "epoch": 1.99, "learning_rate": 1.8399039869770671e-06, "loss": 0.0063, "step": 766830 }, { "epoch": 1.99, "learning_rate": 1.8360157706056024e-06, "loss": 0.0067, "step": 766840 }, { "epoch": 1.99, "learning_rate": 1.832127554234138e-06, "loss": 0.005, "step": 766850 }, { "epoch": 1.99, "learning_rate": 1.8282393378626732e-06, "loss": 0.0063, "step": 766860 }, { "epoch": 1.99, "learning_rate": 1.8243511214912087e-06, "loss": 0.0086, "step": 766870 }, { "epoch": 1.99, "learning_rate": 1.820462905119744e-06, "loss": 0.0081, "step": 766880 }, { "epoch": 1.99, "learning_rate": 1.8165746887482793e-06, "loss": 0.0063, "step": 766890 }, { "epoch": 1.99, "learning_rate": 1.8126864723768148e-06, "loss": 0.0071, "step": 766900 }, { "epoch": 1.99, "learning_rate": 1.8087982560053498e-06, "loss": 0.0069, "step": 766910 }, { "epoch": 1.99, "learning_rate": 1.8049100396338853e-06, "loss": 0.0066, "step": 766920 }, { "epoch": 1.99, "learning_rate": 1.8010218232624208e-06, "loss": 0.0085, "step": 766930 }, { "epoch": 1.99, "learning_rate": 1.7971336068909563e-06, "loss": 0.0077, "step": 766940 }, { "epoch": 1.99, "learning_rate": 1.7932453905194914e-06, "loss": 0.0066, "step": 766950 }, { "epoch": 1.99, "learning_rate": 1.7893571741480269e-06, "loss": 0.0077, "step": 766960 }, { "epoch": 1.99, "learning_rate": 1.7854689577765622e-06, "loss": 0.0063, "step": 766970 }, { "epoch": 1.99, "learning_rate": 1.7815807414050975e-06, "loss": 0.0054, "step": 766980 }, { "epoch": 1.99, "learning_rate": 1.777692525033633e-06, "loss": 0.0073, "step": 766990 }, { "epoch": 1.99, "learning_rate": 1.7738043086621682e-06, "loss": 0.0079, "step": 767000 }, { "epoch": 1.99, "eval_cer": 0.8816928888646285, "eval_loss": 0.004389285109937191, "eval_runtime": 108.0952, "eval_samples_per_second": 18.502, "eval_steps_per_second": 4.626, "step": 767000 }, { "epoch": 1.99, "learning_rate": 1.7699160922907037e-06, "loss": 0.0067, "step": 767010 }, { "epoch": 1.99, "learning_rate": 1.766027875919239e-06, "loss": 0.0054, "step": 767020 }, { "epoch": 1.99, "learning_rate": 1.7621396595477743e-06, "loss": 0.0094, "step": 767030 }, { "epoch": 1.99, "learning_rate": 1.7582514431763098e-06, "loss": 0.0083, "step": 767040 }, { "epoch": 1.99, "learning_rate": 1.754363226804845e-06, "loss": 0.0087, "step": 767050 }, { "epoch": 1.99, "learning_rate": 1.7504750104333804e-06, "loss": 0.0076, "step": 767060 }, { "epoch": 1.99, "learning_rate": 1.7465867940619159e-06, "loss": 0.0056, "step": 767070 }, { "epoch": 1.99, "learning_rate": 1.742698577690451e-06, "loss": 0.0055, "step": 767080 }, { "epoch": 1.99, "learning_rate": 1.7388103613189864e-06, "loss": 0.0115, "step": 767090 }, { "epoch": 1.99, "learning_rate": 1.734922144947522e-06, "loss": 0.0086, "step": 767100 }, { "epoch": 1.99, "learning_rate": 1.7310339285760574e-06, "loss": 0.0076, "step": 767110 }, { "epoch": 1.99, "learning_rate": 1.7271457122045925e-06, "loss": 0.009, "step": 767120 }, { "epoch": 1.99, "learning_rate": 1.723257495833128e-06, "loss": 0.0059, "step": 767130 }, { "epoch": 1.99, "learning_rate": 1.7193692794616635e-06, "loss": 0.0054, "step": 767140 }, { "epoch": 1.99, "learning_rate": 1.7154810630901986e-06, "loss": 0.0058, "step": 767150 }, { "epoch": 1.99, "learning_rate": 1.711592846718734e-06, "loss": 0.0079, "step": 767160 }, { "epoch": 1.99, "learning_rate": 1.7077046303472694e-06, "loss": 0.008, "step": 767170 }, { "epoch": 1.99, "learning_rate": 1.7038164139758049e-06, "loss": 0.0061, "step": 767180 }, { "epoch": 1.99, "learning_rate": 1.6999281976043401e-06, "loss": 0.0079, "step": 767190 }, { "epoch": 1.99, "learning_rate": 1.6960399812328754e-06, "loss": 0.0055, "step": 767200 }, { "epoch": 1.99, "learning_rate": 1.692151764861411e-06, "loss": 0.0063, "step": 767210 }, { "epoch": 1.99, "learning_rate": 1.6882635484899462e-06, "loss": 0.0087, "step": 767220 }, { "epoch": 1.99, "learning_rate": 1.6843753321184815e-06, "loss": 0.0081, "step": 767230 }, { "epoch": 1.99, "learning_rate": 1.680487115747017e-06, "loss": 0.0061, "step": 767240 }, { "epoch": 1.99, "learning_rate": 1.6765988993755525e-06, "loss": 0.0063, "step": 767250 }, { "epoch": 1.99, "learning_rate": 1.6727106830040876e-06, "loss": 0.0067, "step": 767260 }, { "epoch": 1.99, "learning_rate": 1.668822466632623e-06, "loss": 0.0054, "step": 767270 }, { "epoch": 1.99, "learning_rate": 1.6649342502611586e-06, "loss": 0.0054, "step": 767280 }, { "epoch": 1.99, "learning_rate": 1.6610460338896936e-06, "loss": 0.0073, "step": 767290 }, { "epoch": 1.99, "learning_rate": 1.6571578175182291e-06, "loss": 0.0101, "step": 767300 }, { "epoch": 1.99, "learning_rate": 1.6532696011467646e-06, "loss": 0.0135, "step": 767310 }, { "epoch": 1.99, "learning_rate": 1.6493813847753e-06, "loss": 0.0066, "step": 767320 }, { "epoch": 1.99, "learning_rate": 1.6454931684038352e-06, "loss": 0.0067, "step": 767330 }, { "epoch": 1.99, "learning_rate": 1.6416049520323705e-06, "loss": 0.0068, "step": 767340 }, { "epoch": 1.99, "learning_rate": 1.637716735660906e-06, "loss": 0.0096, "step": 767350 }, { "epoch": 1.99, "learning_rate": 1.6338285192894413e-06, "loss": 0.0089, "step": 767360 }, { "epoch": 1.99, "learning_rate": 1.6299403029179765e-06, "loss": 0.0068, "step": 767370 }, { "epoch": 1.99, "learning_rate": 1.626052086546512e-06, "loss": 0.0059, "step": 767380 }, { "epoch": 1.99, "learning_rate": 1.6221638701750473e-06, "loss": 0.0068, "step": 767390 }, { "epoch": 1.99, "learning_rate": 1.6182756538035826e-06, "loss": 0.0104, "step": 767400 }, { "epoch": 1.99, "learning_rate": 1.614387437432118e-06, "loss": 0.0051, "step": 767410 }, { "epoch": 1.99, "learning_rate": 1.6104992210606536e-06, "loss": 0.0072, "step": 767420 }, { "epoch": 1.99, "learning_rate": 1.6066110046891887e-06, "loss": 0.0053, "step": 767430 }, { "epoch": 1.99, "learning_rate": 1.6027227883177242e-06, "loss": 0.0081, "step": 767440 }, { "epoch": 1.99, "learning_rate": 1.5988345719462597e-06, "loss": 0.0076, "step": 767450 }, { "epoch": 1.99, "learning_rate": 1.5949463555747947e-06, "loss": 0.0067, "step": 767460 }, { "epoch": 1.99, "learning_rate": 1.5910581392033302e-06, "loss": 0.007, "step": 767470 }, { "epoch": 1.99, "learning_rate": 1.5871699228318657e-06, "loss": 0.0058, "step": 767480 }, { "epoch": 1.99, "learning_rate": 1.583281706460401e-06, "loss": 0.0056, "step": 767490 }, { "epoch": 1.99, "learning_rate": 1.5793934900889363e-06, "loss": 0.008, "step": 767500 }, { "epoch": 1.99, "learning_rate": 1.5755052737174716e-06, "loss": 0.004, "step": 767510 }, { "epoch": 1.99, "learning_rate": 1.571617057346007e-06, "loss": 0.0064, "step": 767520 }, { "epoch": 1.99, "learning_rate": 1.5677288409745424e-06, "loss": 0.0077, "step": 767530 }, { "epoch": 1.99, "learning_rate": 1.5638406246030777e-06, "loss": 0.0089, "step": 767540 }, { "epoch": 1.99, "learning_rate": 1.5599524082316132e-06, "loss": 0.0054, "step": 767550 }, { "epoch": 1.99, "learning_rate": 1.5560641918601487e-06, "loss": 0.0087, "step": 767560 }, { "epoch": 1.99, "learning_rate": 1.5521759754886837e-06, "loss": 0.0078, "step": 767570 }, { "epoch": 1.99, "learning_rate": 1.5482877591172192e-06, "loss": 0.0069, "step": 767580 }, { "epoch": 1.99, "learning_rate": 1.5443995427457547e-06, "loss": 0.009, "step": 767590 }, { "epoch": 1.99, "learning_rate": 1.5405113263742898e-06, "loss": 0.0078, "step": 767600 }, { "epoch": 1.99, "learning_rate": 1.5366231100028253e-06, "loss": 0.0062, "step": 767610 }, { "epoch": 1.99, "learning_rate": 1.5327348936313608e-06, "loss": 0.0079, "step": 767620 }, { "epoch": 1.99, "learning_rate": 1.528846677259896e-06, "loss": 0.0071, "step": 767630 }, { "epoch": 1.99, "learning_rate": 1.5249584608884314e-06, "loss": 0.0097, "step": 767640 }, { "epoch": 1.99, "learning_rate": 1.5210702445169669e-06, "loss": 0.0069, "step": 767650 }, { "epoch": 1.99, "learning_rate": 1.5171820281455021e-06, "loss": 0.0055, "step": 767660 }, { "epoch": 1.99, "learning_rate": 1.5132938117740374e-06, "loss": 0.0062, "step": 767670 }, { "epoch": 1.99, "learning_rate": 1.5094055954025727e-06, "loss": 0.008, "step": 767680 }, { "epoch": 1.99, "learning_rate": 1.5055173790311082e-06, "loss": 0.0056, "step": 767690 }, { "epoch": 1.99, "learning_rate": 1.5016291626596437e-06, "loss": 0.0068, "step": 767700 }, { "epoch": 1.99, "learning_rate": 1.4977409462881788e-06, "loss": 0.006, "step": 767710 }, { "epoch": 1.99, "learning_rate": 1.4938527299167143e-06, "loss": 0.0065, "step": 767720 }, { "epoch": 1.99, "learning_rate": 1.4899645135452498e-06, "loss": 0.0057, "step": 767730 }, { "epoch": 1.99, "learning_rate": 1.4860762971737848e-06, "loss": 0.0061, "step": 767740 }, { "epoch": 1.99, "learning_rate": 1.4821880808023203e-06, "loss": 0.0069, "step": 767750 }, { "epoch": 1.99, "learning_rate": 1.4782998644308558e-06, "loss": 0.0066, "step": 767760 }, { "epoch": 1.99, "learning_rate": 1.474411648059391e-06, "loss": 0.0056, "step": 767770 }, { "epoch": 1.99, "learning_rate": 1.4705234316879264e-06, "loss": 0.0066, "step": 767780 }, { "epoch": 1.99, "learning_rate": 1.466635215316462e-06, "loss": 0.0089, "step": 767790 }, { "epoch": 1.99, "learning_rate": 1.4627469989449972e-06, "loss": 0.0083, "step": 767800 }, { "epoch": 1.99, "learning_rate": 1.4588587825735325e-06, "loss": 0.0071, "step": 767810 }, { "epoch": 1.99, "learning_rate": 1.454970566202068e-06, "loss": 0.0078, "step": 767820 }, { "epoch": 1.99, "learning_rate": 1.4510823498306033e-06, "loss": 0.0042, "step": 767830 }, { "epoch": 1.99, "learning_rate": 1.4471941334591385e-06, "loss": 0.0089, "step": 767840 }, { "epoch": 1.99, "learning_rate": 1.4433059170876738e-06, "loss": 0.0074, "step": 767850 }, { "epoch": 1.99, "learning_rate": 1.4394177007162093e-06, "loss": 0.0073, "step": 767860 }, { "epoch": 1.99, "learning_rate": 1.4355294843447448e-06, "loss": 0.005, "step": 767870 }, { "epoch": 1.99, "learning_rate": 1.4316412679732799e-06, "loss": 0.0067, "step": 767880 }, { "epoch": 1.99, "learning_rate": 1.4277530516018154e-06, "loss": 0.0061, "step": 767890 }, { "epoch": 1.99, "learning_rate": 1.4238648352303509e-06, "loss": 0.0053, "step": 767900 }, { "epoch": 1.99, "learning_rate": 1.419976618858886e-06, "loss": 0.0061, "step": 767910 }, { "epoch": 1.99, "learning_rate": 1.4160884024874215e-06, "loss": 0.0087, "step": 767920 }, { "epoch": 1.99, "learning_rate": 1.412200186115957e-06, "loss": 0.0084, "step": 767930 }, { "epoch": 1.99, "learning_rate": 1.4083119697444922e-06, "loss": 0.0075, "step": 767940 }, { "epoch": 1.99, "learning_rate": 1.4044237533730275e-06, "loss": 0.0082, "step": 767950 }, { "epoch": 1.99, "learning_rate": 1.400535537001563e-06, "loss": 0.0071, "step": 767960 }, { "epoch": 1.99, "learning_rate": 1.3966473206300983e-06, "loss": 0.0074, "step": 767970 }, { "epoch": 1.99, "learning_rate": 1.3927591042586336e-06, "loss": 0.0049, "step": 767980 }, { "epoch": 1.99, "learning_rate": 1.388870887887169e-06, "loss": 0.0047, "step": 767990 }, { "epoch": 1.99, "learning_rate": 1.3849826715157044e-06, "loss": 0.0059, "step": 768000 }, { "epoch": 1.99, "eval_cer": 0.8816788924952867, "eval_loss": 0.004371436312794685, "eval_runtime": 108.0539, "eval_samples_per_second": 18.509, "eval_steps_per_second": 4.627, "step": 768000 }, { "epoch": 1.99, "learning_rate": 1.3810944551442399e-06, "loss": 0.0103, "step": 768010 }, { "epoch": 1.99, "learning_rate": 1.3772062387727752e-06, "loss": 0.0067, "step": 768020 }, { "epoch": 1.99, "learning_rate": 1.3733180224013104e-06, "loss": 0.0046, "step": 768030 }, { "epoch": 1.99, "learning_rate": 1.369429806029846e-06, "loss": 0.0063, "step": 768040 }, { "epoch": 1.99, "learning_rate": 1.365541589658381e-06, "loss": 0.0059, "step": 768050 }, { "epoch": 1.99, "learning_rate": 1.3616533732869165e-06, "loss": 0.0071, "step": 768060 }, { "epoch": 1.99, "learning_rate": 1.357765156915452e-06, "loss": 0.009, "step": 768070 }, { "epoch": 1.99, "learning_rate": 1.353876940543987e-06, "loss": 0.0067, "step": 768080 }, { "epoch": 1.99, "learning_rate": 1.3499887241725226e-06, "loss": 0.0095, "step": 768090 }, { "epoch": 1.99, "learning_rate": 1.346100507801058e-06, "loss": 0.0063, "step": 768100 }, { "epoch": 1.99, "learning_rate": 1.3422122914295934e-06, "loss": 0.0059, "step": 768110 }, { "epoch": 1.99, "learning_rate": 1.3383240750581286e-06, "loss": 0.0066, "step": 768120 }, { "epoch": 1.99, "learning_rate": 1.3344358586866641e-06, "loss": 0.0058, "step": 768130 }, { "epoch": 1.99, "learning_rate": 1.3305476423151994e-06, "loss": 0.007, "step": 768140 }, { "epoch": 1.99, "learning_rate": 1.3266594259437347e-06, "loss": 0.0082, "step": 768150 }, { "epoch": 1.99, "learning_rate": 1.3227712095722702e-06, "loss": 0.0073, "step": 768160 }, { "epoch": 1.99, "learning_rate": 1.3188829932008055e-06, "loss": 0.0051, "step": 768170 }, { "epoch": 1.99, "learning_rate": 1.314994776829341e-06, "loss": 0.0073, "step": 768180 }, { "epoch": 1.99, "learning_rate": 1.3111065604578763e-06, "loss": 0.0056, "step": 768190 }, { "epoch": 1.99, "learning_rate": 1.3072183440864116e-06, "loss": 0.0055, "step": 768200 }, { "epoch": 1.99, "learning_rate": 1.303330127714947e-06, "loss": 0.0057, "step": 768210 }, { "epoch": 1.99, "learning_rate": 1.2994419113434821e-06, "loss": 0.0057, "step": 768220 }, { "epoch": 1.99, "learning_rate": 1.2955536949720176e-06, "loss": 0.007, "step": 768230 }, { "epoch": 1.99, "learning_rate": 1.2916654786005531e-06, "loss": 0.0073, "step": 768240 }, { "epoch": 1.99, "learning_rate": 1.2877772622290886e-06, "loss": 0.0064, "step": 768250 }, { "epoch": 1.99, "learning_rate": 1.2838890458576237e-06, "loss": 0.0083, "step": 768260 }, { "epoch": 1.99, "learning_rate": 1.2800008294861592e-06, "loss": 0.0114, "step": 768270 }, { "epoch": 1.99, "learning_rate": 1.2761126131146945e-06, "loss": 0.0065, "step": 768280 }, { "epoch": 1.99, "learning_rate": 1.2722243967432298e-06, "loss": 0.0052, "step": 768290 }, { "epoch": 1.99, "learning_rate": 1.2683361803717652e-06, "loss": 0.0054, "step": 768300 }, { "epoch": 1.99, "learning_rate": 1.2644479640003005e-06, "loss": 0.0062, "step": 768310 }, { "epoch": 1.99, "learning_rate": 1.260559747628836e-06, "loss": 0.0066, "step": 768320 }, { "epoch": 1.99, "learning_rate": 1.2566715312573713e-06, "loss": 0.0058, "step": 768330 }, { "epoch": 1.99, "learning_rate": 1.2527833148859066e-06, "loss": 0.0062, "step": 768340 }, { "epoch": 1.99, "learning_rate": 1.248895098514442e-06, "loss": 0.0073, "step": 768350 }, { "epoch": 1.99, "learning_rate": 1.2450068821429774e-06, "loss": 0.0082, "step": 768360 }, { "epoch": 1.99, "learning_rate": 1.2411186657715127e-06, "loss": 0.0067, "step": 768370 }, { "epoch": 1.99, "learning_rate": 1.2372304494000482e-06, "loss": 0.0061, "step": 768380 }, { "epoch": 1.99, "learning_rate": 1.2333422330285837e-06, "loss": 0.0068, "step": 768390 }, { "epoch": 1.99, "learning_rate": 1.2294540166571187e-06, "loss": 0.0085, "step": 768400 }, { "epoch": 1.99, "learning_rate": 1.2255658002856542e-06, "loss": 0.0064, "step": 768410 }, { "epoch": 1.99, "learning_rate": 1.2216775839141897e-06, "loss": 0.0085, "step": 768420 }, { "epoch": 1.99, "learning_rate": 1.2177893675427248e-06, "loss": 0.0079, "step": 768430 }, { "epoch": 1.99, "learning_rate": 1.2139011511712603e-06, "loss": 0.0053, "step": 768440 }, { "epoch": 1.99, "learning_rate": 1.2100129347997958e-06, "loss": 0.0076, "step": 768450 }, { "epoch": 1.99, "learning_rate": 1.2061247184283309e-06, "loss": 0.0091, "step": 768460 }, { "epoch": 1.99, "learning_rate": 1.2022365020568664e-06, "loss": 0.0092, "step": 768470 }, { "epoch": 1.99, "learning_rate": 1.1983482856854017e-06, "loss": 0.0064, "step": 768480 }, { "epoch": 1.99, "learning_rate": 1.1944600693139371e-06, "loss": 0.0083, "step": 768490 }, { "epoch": 1.99, "learning_rate": 1.1905718529424724e-06, "loss": 0.0058, "step": 768500 }, { "epoch": 1.99, "learning_rate": 1.1866836365710077e-06, "loss": 0.0066, "step": 768510 }, { "epoch": 1.99, "learning_rate": 1.1827954201995432e-06, "loss": 0.0044, "step": 768520 }, { "epoch": 1.99, "learning_rate": 1.1789072038280785e-06, "loss": 0.0101, "step": 768530 }, { "epoch": 1.99, "learning_rate": 1.1750189874566138e-06, "loss": 0.0076, "step": 768540 }, { "epoch": 1.99, "learning_rate": 1.1711307710851493e-06, "loss": 0.0125, "step": 768550 }, { "epoch": 1.99, "learning_rate": 1.1672425547136846e-06, "loss": 0.0063, "step": 768560 }, { "epoch": 1.99, "learning_rate": 1.16335433834222e-06, "loss": 0.0081, "step": 768570 }, { "epoch": 1.99, "learning_rate": 1.1594661219707553e-06, "loss": 0.0074, "step": 768580 }, { "epoch": 1.99, "learning_rate": 1.1555779055992906e-06, "loss": 0.0064, "step": 768590 }, { "epoch": 1.99, "learning_rate": 1.1516896892278261e-06, "loss": 0.0077, "step": 768600 }, { "epoch": 1.99, "learning_rate": 1.1478014728563614e-06, "loss": 0.0085, "step": 768610 }, { "epoch": 1.99, "learning_rate": 1.143913256484897e-06, "loss": 0.0071, "step": 768620 }, { "epoch": 1.99, "learning_rate": 1.1400250401134322e-06, "loss": 0.0087, "step": 768630 }, { "epoch": 1.99, "learning_rate": 1.1361368237419675e-06, "loss": 0.0081, "step": 768640 }, { "epoch": 1.99, "learning_rate": 1.1322486073705028e-06, "loss": 0.0066, "step": 768650 }, { "epoch": 1.99, "learning_rate": 1.1283603909990383e-06, "loss": 0.0066, "step": 768660 }, { "epoch": 1.99, "learning_rate": 1.1244721746275735e-06, "loss": 0.0069, "step": 768670 }, { "epoch": 1.99, "learning_rate": 1.1205839582561088e-06, "loss": 0.0063, "step": 768680 }, { "epoch": 1.99, "learning_rate": 1.1166957418846443e-06, "loss": 0.009, "step": 768690 }, { "epoch": 1.99, "learning_rate": 1.1128075255131796e-06, "loss": 0.0077, "step": 768700 }, { "epoch": 1.99, "learning_rate": 1.108919309141715e-06, "loss": 0.0063, "step": 768710 }, { "epoch": 1.99, "learning_rate": 1.1050310927702504e-06, "loss": 0.0044, "step": 768720 }, { "epoch": 1.99, "learning_rate": 1.1011428763987857e-06, "loss": 0.0092, "step": 768730 }, { "epoch": 1.99, "learning_rate": 1.0972546600273212e-06, "loss": 0.0062, "step": 768740 }, { "epoch": 1.99, "learning_rate": 1.0933664436558565e-06, "loss": 0.007, "step": 768750 }, { "epoch": 1.99, "learning_rate": 1.089478227284392e-06, "loss": 0.0064, "step": 768760 }, { "epoch": 1.99, "learning_rate": 1.0855900109129272e-06, "loss": 0.0099, "step": 768770 }, { "epoch": 1.99, "learning_rate": 1.0817017945414625e-06, "loss": 0.0072, "step": 768780 }, { "epoch": 1.99, "learning_rate": 1.077813578169998e-06, "loss": 0.0101, "step": 768790 }, { "epoch": 1.99, "learning_rate": 1.0739253617985333e-06, "loss": 0.0067, "step": 768800 }, { "epoch": 1.99, "learning_rate": 1.0700371454270686e-06, "loss": 0.0087, "step": 768810 }, { "epoch": 1.99, "learning_rate": 1.0661489290556039e-06, "loss": 0.0091, "step": 768820 }, { "epoch": 1.99, "learning_rate": 1.0622607126841394e-06, "loss": 0.0061, "step": 768830 }, { "epoch": 1.99, "learning_rate": 1.0583724963126747e-06, "loss": 0.007, "step": 768840 }, { "epoch": 1.99, "learning_rate": 1.05448427994121e-06, "loss": 0.0066, "step": 768850 }, { "epoch": 1.99, "learning_rate": 1.0505960635697454e-06, "loss": 0.0095, "step": 768860 }, { "epoch": 1.99, "learning_rate": 1.0467078471982807e-06, "loss": 0.0066, "step": 768870 }, { "epoch": 1.99, "learning_rate": 1.0428196308268162e-06, "loss": 0.0057, "step": 768880 }, { "epoch": 1.99, "learning_rate": 1.0389314144553515e-06, "loss": 0.0059, "step": 768890 }, { "epoch": 1.99, "learning_rate": 1.0350431980838868e-06, "loss": 0.0066, "step": 768900 }, { "epoch": 1.99, "learning_rate": 1.0311549817124223e-06, "loss": 0.0079, "step": 768910 }, { "epoch": 1.99, "learning_rate": 1.0272667653409576e-06, "loss": 0.0088, "step": 768920 }, { "epoch": 1.99, "learning_rate": 1.023378548969493e-06, "loss": 0.0074, "step": 768930 }, { "epoch": 1.99, "learning_rate": 1.0194903325980284e-06, "loss": 0.0076, "step": 768940 }, { "epoch": 1.99, "learning_rate": 1.0156021162265636e-06, "loss": 0.0057, "step": 768950 }, { "epoch": 1.99, "learning_rate": 1.0117138998550991e-06, "loss": 0.0072, "step": 768960 }, { "epoch": 1.99, "learning_rate": 1.0078256834836344e-06, "loss": 0.0064, "step": 768970 }, { "epoch": 1.99, "learning_rate": 1.0039374671121697e-06, "loss": 0.0075, "step": 768980 }, { "epoch": 1.99, "learning_rate": 1.000049250740705e-06, "loss": 0.0074, "step": 768990 }, { "epoch": 1.99, "learning_rate": 9.961610343692405e-07, "loss": 0.0086, "step": 769000 }, { "epoch": 1.99, "eval_cer": 0.8816788924952867, "eval_loss": 0.0043708933517336845, "eval_runtime": 107.9473, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 769000 }, { "epoch": 1.99, "learning_rate": 9.922728179977758e-07, "loss": 0.0062, "step": 769010 }, { "epoch": 1.99, "learning_rate": 9.883846016263113e-07, "loss": 0.0065, "step": 769020 }, { "epoch": 1.99, "learning_rate": 9.844963852548466e-07, "loss": 0.0067, "step": 769030 }, { "epoch": 1.99, "learning_rate": 9.806081688833818e-07, "loss": 0.0072, "step": 769040 }, { "epoch": 1.99, "learning_rate": 9.767199525119173e-07, "loss": 0.0084, "step": 769050 }, { "epoch": 1.99, "learning_rate": 9.728317361404526e-07, "loss": 0.0086, "step": 769060 }, { "epoch": 1.99, "learning_rate": 9.689435197689881e-07, "loss": 0.0098, "step": 769070 }, { "epoch": 1.99, "learning_rate": 9.650553033975234e-07, "loss": 0.0072, "step": 769080 }, { "epoch": 1.99, "learning_rate": 9.611670870260587e-07, "loss": 0.0071, "step": 769090 }, { "epoch": 1.99, "learning_rate": 9.572788706545942e-07, "loss": 0.0058, "step": 769100 }, { "epoch": 1.99, "learning_rate": 9.533906542831295e-07, "loss": 0.0097, "step": 769110 }, { "epoch": 1.99, "learning_rate": 9.495024379116649e-07, "loss": 0.0098, "step": 769120 }, { "epoch": 1.99, "learning_rate": 9.456142215402002e-07, "loss": 0.0126, "step": 769130 }, { "epoch": 1.99, "learning_rate": 9.417260051687356e-07, "loss": 0.0062, "step": 769140 }, { "epoch": 1.99, "learning_rate": 9.378377887972709e-07, "loss": 0.0059, "step": 769150 }, { "epoch": 1.99, "learning_rate": 9.339495724258062e-07, "loss": 0.0071, "step": 769160 }, { "epoch": 1.99, "learning_rate": 9.300613560543416e-07, "loss": 0.0067, "step": 769170 }, { "epoch": 1.99, "learning_rate": 9.26173139682877e-07, "loss": 0.0065, "step": 769180 }, { "epoch": 1.99, "learning_rate": 9.222849233114124e-07, "loss": 0.0079, "step": 769190 }, { "epoch": 1.99, "learning_rate": 9.183967069399477e-07, "loss": 0.0054, "step": 769200 }, { "epoch": 1.99, "learning_rate": 9.145084905684832e-07, "loss": 0.0067, "step": 769210 }, { "epoch": 1.99, "learning_rate": 9.106202741970185e-07, "loss": 0.0074, "step": 769220 }, { "epoch": 1.99, "learning_rate": 9.067320578255537e-07, "loss": 0.0075, "step": 769230 }, { "epoch": 1.99, "learning_rate": 9.028438414540891e-07, "loss": 0.009, "step": 769240 }, { "epoch": 1.99, "learning_rate": 8.989556250826245e-07, "loss": 0.0071, "step": 769250 }, { "epoch": 1.99, "learning_rate": 8.950674087111599e-07, "loss": 0.0064, "step": 769260 }, { "epoch": 1.99, "learning_rate": 8.911791923396952e-07, "loss": 0.0052, "step": 769270 }, { "epoch": 1.99, "learning_rate": 8.872909759682306e-07, "loss": 0.0081, "step": 769280 }, { "epoch": 1.99, "learning_rate": 8.83402759596766e-07, "loss": 0.0066, "step": 769290 }, { "epoch": 1.99, "learning_rate": 8.795145432253013e-07, "loss": 0.0044, "step": 769300 }, { "epoch": 1.99, "learning_rate": 8.756263268538368e-07, "loss": 0.0074, "step": 769310 }, { "epoch": 1.99, "learning_rate": 8.71738110482372e-07, "loss": 0.0085, "step": 769320 }, { "epoch": 1.99, "learning_rate": 8.678498941109074e-07, "loss": 0.0075, "step": 769330 }, { "epoch": 1.99, "learning_rate": 8.639616777394427e-07, "loss": 0.0068, "step": 769340 }, { "epoch": 1.99, "learning_rate": 8.600734613679781e-07, "loss": 0.005, "step": 769350 }, { "epoch": 1.99, "learning_rate": 8.561852449965135e-07, "loss": 0.0087, "step": 769360 }, { "epoch": 1.99, "learning_rate": 8.522970286250488e-07, "loss": 0.0068, "step": 769370 }, { "epoch": 1.99, "learning_rate": 8.484088122535843e-07, "loss": 0.0048, "step": 769380 }, { "epoch": 1.99, "learning_rate": 8.445205958821196e-07, "loss": 0.0076, "step": 769390 }, { "epoch": 1.99, "learning_rate": 8.406323795106549e-07, "loss": 0.0074, "step": 769400 }, { "epoch": 1.99, "learning_rate": 8.367441631391904e-07, "loss": 0.0069, "step": 769410 }, { "epoch": 1.99, "learning_rate": 8.328559467677256e-07, "loss": 0.0085, "step": 769420 }, { "epoch": 1.99, "learning_rate": 8.28967730396261e-07, "loss": 0.006, "step": 769430 }, { "epoch": 1.99, "learning_rate": 8.250795140247963e-07, "loss": 0.0068, "step": 769440 }, { "epoch": 1.99, "learning_rate": 8.211912976533318e-07, "loss": 0.0064, "step": 769450 }, { "epoch": 1.99, "learning_rate": 8.173030812818671e-07, "loss": 0.005, "step": 769460 }, { "epoch": 1.99, "learning_rate": 8.134148649104024e-07, "loss": 0.0055, "step": 769470 }, { "epoch": 1.99, "learning_rate": 8.095266485389379e-07, "loss": 0.0079, "step": 769480 }, { "epoch": 1.99, "learning_rate": 8.056384321674732e-07, "loss": 0.0073, "step": 769490 }, { "epoch": 1.99, "learning_rate": 8.017502157960086e-07, "loss": 0.0055, "step": 769500 }, { "epoch": 1.99, "learning_rate": 7.978619994245438e-07, "loss": 0.0067, "step": 769510 }, { "epoch": 1.99, "learning_rate": 7.939737830530793e-07, "loss": 0.0098, "step": 769520 }, { "epoch": 1.99, "learning_rate": 7.900855666816146e-07, "loss": 0.0102, "step": 769530 }, { "epoch": 1.99, "learning_rate": 7.861973503101499e-07, "loss": 0.0067, "step": 769540 }, { "epoch": 1.99, "learning_rate": 7.823091339386854e-07, "loss": 0.0049, "step": 769550 }, { "epoch": 1.99, "learning_rate": 7.784209175672207e-07, "loss": 0.007, "step": 769560 }, { "epoch": 1.99, "learning_rate": 7.745327011957561e-07, "loss": 0.0056, "step": 769570 }, { "epoch": 1.99, "learning_rate": 7.706444848242915e-07, "loss": 0.0058, "step": 769580 }, { "epoch": 1.99, "learning_rate": 7.667562684528268e-07, "loss": 0.0077, "step": 769590 }, { "epoch": 1.99, "learning_rate": 7.628680520813621e-07, "loss": 0.0066, "step": 769600 }, { "epoch": 1.99, "learning_rate": 7.589798357098974e-07, "loss": 0.0092, "step": 769610 }, { "epoch": 1.99, "learning_rate": 7.550916193384329e-07, "loss": 0.0065, "step": 769620 }, { "epoch": 1.99, "learning_rate": 7.512034029669682e-07, "loss": 0.0068, "step": 769630 }, { "epoch": 2.0, "learning_rate": 7.473151865955036e-07, "loss": 0.008, "step": 769640 }, { "epoch": 2.0, "learning_rate": 7.43426970224039e-07, "loss": 0.0067, "step": 769650 }, { "epoch": 2.0, "learning_rate": 7.395387538525743e-07, "loss": 0.0068, "step": 769660 }, { "epoch": 2.0, "learning_rate": 7.356505374811097e-07, "loss": 0.0044, "step": 769670 }, { "epoch": 2.0, "learning_rate": 7.31762321109645e-07, "loss": 0.0061, "step": 769680 }, { "epoch": 2.0, "learning_rate": 7.278741047381805e-07, "loss": 0.0066, "step": 769690 }, { "epoch": 2.0, "learning_rate": 7.239858883667157e-07, "loss": 0.0058, "step": 769700 }, { "epoch": 2.0, "learning_rate": 7.200976719952512e-07, "loss": 0.0074, "step": 769710 }, { "epoch": 2.0, "learning_rate": 7.162094556237865e-07, "loss": 0.006, "step": 769720 }, { "epoch": 2.0, "learning_rate": 7.123212392523218e-07, "loss": 0.0064, "step": 769730 }, { "epoch": 2.0, "learning_rate": 7.084330228808572e-07, "loss": 0.0092, "step": 769740 }, { "epoch": 2.0, "learning_rate": 7.045448065093926e-07, "loss": 0.0077, "step": 769750 }, { "epoch": 2.0, "learning_rate": 7.00656590137928e-07, "loss": 0.0064, "step": 769760 }, { "epoch": 2.0, "learning_rate": 6.967683737664633e-07, "loss": 0.0066, "step": 769770 }, { "epoch": 2.0, "learning_rate": 6.928801573949986e-07, "loss": 0.0072, "step": 769780 }, { "epoch": 2.0, "learning_rate": 6.88991941023534e-07, "loss": 0.0073, "step": 769790 }, { "epoch": 2.0, "learning_rate": 6.851037246520693e-07, "loss": 0.0083, "step": 769800 }, { "epoch": 2.0, "learning_rate": 6.812155082806047e-07, "loss": 0.007, "step": 769810 }, { "epoch": 2.0, "learning_rate": 6.773272919091401e-07, "loss": 0.0075, "step": 769820 }, { "epoch": 2.0, "learning_rate": 6.734390755376755e-07, "loss": 0.0079, "step": 769830 }, { "epoch": 2.0, "learning_rate": 6.695508591662108e-07, "loss": 0.0095, "step": 769840 }, { "epoch": 2.0, "learning_rate": 6.656626427947462e-07, "loss": 0.0066, "step": 769850 }, { "epoch": 2.0, "learning_rate": 6.617744264232816e-07, "loss": 0.0075, "step": 769860 }, { "epoch": 2.0, "learning_rate": 6.578862100518169e-07, "loss": 0.0068, "step": 769870 }, { "epoch": 2.0, "learning_rate": 6.539979936803524e-07, "loss": 0.0087, "step": 769880 }, { "epoch": 2.0, "learning_rate": 6.501097773088876e-07, "loss": 0.0056, "step": 769890 }, { "epoch": 2.0, "learning_rate": 6.46221560937423e-07, "loss": 0.0067, "step": 769900 }, { "epoch": 2.0, "learning_rate": 6.423333445659583e-07, "loss": 0.0055, "step": 769910 }, { "epoch": 2.0, "learning_rate": 6.384451281944937e-07, "loss": 0.0064, "step": 769920 }, { "epoch": 2.0, "learning_rate": 6.345569118230291e-07, "loss": 0.0068, "step": 769930 }, { "epoch": 2.0, "learning_rate": 6.306686954515644e-07, "loss": 0.0055, "step": 769940 }, { "epoch": 2.0, "learning_rate": 6.267804790800999e-07, "loss": 0.0082, "step": 769950 }, { "epoch": 2.0, "learning_rate": 6.228922627086352e-07, "loss": 0.0077, "step": 769960 }, { "epoch": 2.0, "learning_rate": 6.190040463371704e-07, "loss": 0.0055, "step": 769970 }, { "epoch": 2.0, "learning_rate": 6.151158299657059e-07, "loss": 0.0089, "step": 769980 }, { "epoch": 2.0, "learning_rate": 6.112276135942412e-07, "loss": 0.0051, "step": 769990 }, { "epoch": 2.0, "learning_rate": 6.073393972227766e-07, "loss": 0.0051, "step": 770000 }, { "epoch": 2.0, "eval_cer": 0.8816788924952867, "eval_loss": 0.00436586607247591, "eval_runtime": 108.0178, "eval_samples_per_second": 18.515, "eval_steps_per_second": 4.629, "step": 770000 }, { "epoch": 2.0, "learning_rate": 6.034511808513119e-07, "loss": 0.0065, "step": 770010 }, { "epoch": 2.0, "learning_rate": 5.995629644798474e-07, "loss": 0.0052, "step": 770020 }, { "epoch": 2.0, "learning_rate": 5.956747481083827e-07, "loss": 0.008, "step": 770030 }, { "epoch": 2.0, "learning_rate": 5.91786531736918e-07, "loss": 0.0058, "step": 770040 }, { "epoch": 2.0, "learning_rate": 5.878983153654535e-07, "loss": 0.0072, "step": 770050 }, { "epoch": 2.0, "learning_rate": 5.840100989939888e-07, "loss": 0.0079, "step": 770060 }, { "epoch": 2.0, "learning_rate": 5.801218826225241e-07, "loss": 0.0043, "step": 770070 }, { "epoch": 2.0, "learning_rate": 5.762336662510594e-07, "loss": 0.0069, "step": 770080 }, { "epoch": 2.0, "learning_rate": 5.723454498795948e-07, "loss": 0.0128, "step": 770090 }, { "epoch": 2.0, "learning_rate": 5.684572335081302e-07, "loss": 0.0064, "step": 770100 }, { "epoch": 2.0, "learning_rate": 5.645690171366656e-07, "loss": 0.0059, "step": 770110 }, { "epoch": 2.0, "learning_rate": 5.60680800765201e-07, "loss": 0.0053, "step": 770120 }, { "epoch": 2.0, "learning_rate": 5.567925843937363e-07, "loss": 0.0107, "step": 770130 }, { "epoch": 2.0, "learning_rate": 5.529043680222717e-07, "loss": 0.0075, "step": 770140 }, { "epoch": 2.0, "learning_rate": 5.490161516508071e-07, "loss": 0.0054, "step": 770150 }, { "epoch": 2.0, "learning_rate": 5.451279352793423e-07, "loss": 0.0061, "step": 770160 }, { "epoch": 2.0, "learning_rate": 5.412397189078777e-07, "loss": 0.0061, "step": 770170 }, { "epoch": 2.0, "learning_rate": 5.373515025364131e-07, "loss": 0.0068, "step": 770180 }, { "epoch": 2.0, "learning_rate": 5.334632861649484e-07, "loss": 0.0064, "step": 770190 }, { "epoch": 2.0, "learning_rate": 5.295750697934838e-07, "loss": 0.0049, "step": 770200 }, { "epoch": 2.0, "learning_rate": 5.256868534220192e-07, "loss": 0.0084, "step": 770210 }, { "epoch": 2.0, "learning_rate": 5.217986370505546e-07, "loss": 0.0049, "step": 770220 }, { "epoch": 2.0, "learning_rate": 5.179104206790899e-07, "loss": 0.0052, "step": 770230 }, { "epoch": 2.0, "learning_rate": 5.140222043076253e-07, "loss": 0.006, "step": 770240 }, { "epoch": 2.0, "learning_rate": 5.101339879361605e-07, "loss": 0.0058, "step": 770250 }, { "epoch": 2.0, "learning_rate": 5.062457715646959e-07, "loss": 0.0064, "step": 770260 }, { "epoch": 2.0, "learning_rate": 5.023575551932313e-07, "loss": 0.0116, "step": 770270 }, { "epoch": 2.0, "learning_rate": 4.984693388217667e-07, "loss": 0.0056, "step": 770280 }, { "epoch": 2.0, "learning_rate": 4.945811224503021e-07, "loss": 0.0058, "step": 770290 }, { "epoch": 2.0, "learning_rate": 4.906929060788375e-07, "loss": 0.0069, "step": 770300 }, { "epoch": 2.0, "learning_rate": 4.868046897073728e-07, "loss": 0.0073, "step": 770310 }, { "epoch": 2.0, "learning_rate": 4.829164733359082e-07, "loss": 0.0056, "step": 770320 }, { "epoch": 2.0, "learning_rate": 4.790282569644435e-07, "loss": 0.0067, "step": 770330 }, { "epoch": 2.0, "learning_rate": 4.7514004059297885e-07, "loss": 0.0064, "step": 770340 }, { "epoch": 2.0, "learning_rate": 4.7125182422151424e-07, "loss": 0.0051, "step": 770350 }, { "epoch": 2.0, "learning_rate": 4.6736360785004963e-07, "loss": 0.0059, "step": 770360 }, { "epoch": 2.0, "learning_rate": 4.6347539147858497e-07, "loss": 0.0066, "step": 770370 }, { "epoch": 2.0, "learning_rate": 4.595871751071203e-07, "loss": 0.0063, "step": 770380 }, { "epoch": 2.0, "learning_rate": 4.5569895873565565e-07, "loss": 0.0088, "step": 770390 }, { "epoch": 2.0, "learning_rate": 4.5181074236419104e-07, "loss": 0.0102, "step": 770400 }, { "epoch": 2.0, "learning_rate": 4.4792252599272643e-07, "loss": 0.0071, "step": 770410 }, { "epoch": 2.0, "learning_rate": 4.4403430962126177e-07, "loss": 0.0058, "step": 770420 }, { "epoch": 2.0, "learning_rate": 4.4014609324979716e-07, "loss": 0.0068, "step": 770430 }, { "epoch": 2.0, "learning_rate": 4.3625787687833244e-07, "loss": 0.0063, "step": 770440 }, { "epoch": 2.0, "learning_rate": 4.3236966050686783e-07, "loss": 0.0061, "step": 770450 }, { "epoch": 2.0, "learning_rate": 4.284814441354032e-07, "loss": 0.0107, "step": 770460 }, { "epoch": 2.0, "learning_rate": 4.2459322776393856e-07, "loss": 0.0053, "step": 770470 }, { "epoch": 2.0, "learning_rate": 4.2070501139247395e-07, "loss": 0.0092, "step": 770480 }, { "epoch": 2.0, "learning_rate": 4.168167950210093e-07, "loss": 0.0077, "step": 770490 }, { "epoch": 2.0, "learning_rate": 4.1292857864954463e-07, "loss": 0.0075, "step": 770500 }, { "epoch": 2.0, "learning_rate": 4.0904036227807997e-07, "loss": 0.0115, "step": 770510 }, { "epoch": 2.0, "learning_rate": 4.0515214590661536e-07, "loss": 0.0079, "step": 770520 }, { "epoch": 2.0, "learning_rate": 4.0126392953515075e-07, "loss": 0.007, "step": 770530 }, { "epoch": 2.0, "learning_rate": 3.973757131636861e-07, "loss": 0.0064, "step": 770540 }, { "epoch": 2.0, "learning_rate": 3.934874967922215e-07, "loss": 0.0063, "step": 770550 }, { "epoch": 2.0, "learning_rate": 3.8959928042075687e-07, "loss": 0.007, "step": 770560 }, { "epoch": 2.0, "learning_rate": 3.8571106404929216e-07, "loss": 0.01, "step": 770570 }, { "epoch": 2.0, "learning_rate": 3.8182284767782755e-07, "loss": 0.0093, "step": 770580 }, { "epoch": 2.0, "learning_rate": 3.779346313063629e-07, "loss": 0.0092, "step": 770590 }, { "epoch": 2.0, "learning_rate": 3.740464149348983e-07, "loss": 0.0078, "step": 770600 }, { "epoch": 2.0, "learning_rate": 3.7015819856343367e-07, "loss": 0.0053, "step": 770610 }, { "epoch": 2.0, "learning_rate": 3.66269982191969e-07, "loss": 0.0061, "step": 770620 }, { "epoch": 2.0, "learning_rate": 3.6238176582050434e-07, "loss": 0.0084, "step": 770630 }, { "epoch": 2.0, "learning_rate": 3.584935494490397e-07, "loss": 0.0091, "step": 770640 }, { "epoch": 2.0, "learning_rate": 3.5460533307757507e-07, "loss": 0.0083, "step": 770650 }, { "epoch": 2.0, "learning_rate": 3.507171167061104e-07, "loss": 0.0064, "step": 770660 }, { "epoch": 2.0, "learning_rate": 3.468289003346458e-07, "loss": 0.0055, "step": 770670 }, { "epoch": 2.0, "learning_rate": 3.429406839631812e-07, "loss": 0.0087, "step": 770680 }, { "epoch": 2.0, "learning_rate": 3.390524675917165e-07, "loss": 0.0072, "step": 770690 }, { "epoch": 2.0, "learning_rate": 3.3516425122025187e-07, "loss": 0.0071, "step": 770700 }, { "epoch": 2.0, "learning_rate": 3.312760348487872e-07, "loss": 0.0065, "step": 770710 }, { "epoch": 2.0, "learning_rate": 3.273878184773226e-07, "loss": 0.0083, "step": 770720 }, { "epoch": 2.0, "learning_rate": 3.23499602105858e-07, "loss": 0.0073, "step": 770730 }, { "epoch": 2.0, "learning_rate": 3.196113857343933e-07, "loss": 0.0065, "step": 770740 }, { "epoch": 2.0, "learning_rate": 3.157231693629287e-07, "loss": 0.0089, "step": 770750 }, { "epoch": 2.0, "learning_rate": 3.11834952991464e-07, "loss": 0.0087, "step": 770760 }, { "epoch": 2.0, "learning_rate": 3.079467366199994e-07, "loss": 0.0083, "step": 770770 }, { "epoch": 2.0, "learning_rate": 3.040585202485348e-07, "loss": 0.0059, "step": 770780 }, { "epoch": 2.0, "learning_rate": 3.001703038770701e-07, "loss": 0.0055, "step": 770790 }, { "epoch": 2.0, "learning_rate": 2.962820875056055e-07, "loss": 0.0077, "step": 770800 }, { "epoch": 2.0, "learning_rate": 2.9239387113414085e-07, "loss": 0.0056, "step": 770810 }, { "epoch": 2.0, "learning_rate": 2.8850565476267624e-07, "loss": 0.0086, "step": 770820 }, { "epoch": 2.0, "learning_rate": 2.846174383912116e-07, "loss": 0.0038, "step": 770830 }, { "epoch": 2.0, "learning_rate": 2.807292220197469e-07, "loss": 0.0069, "step": 770840 }, { "epoch": 2.0, "learning_rate": 2.768410056482823e-07, "loss": 0.0064, "step": 770850 }, { "epoch": 2.0, "learning_rate": 2.7295278927681764e-07, "loss": 0.0126, "step": 770860 }, { "epoch": 2.0, "learning_rate": 2.69064572905353e-07, "loss": 0.0084, "step": 770870 }, { "epoch": 2.0, "learning_rate": 2.6517635653388837e-07, "loss": 0.0053, "step": 770880 }, { "epoch": 2.0, "learning_rate": 2.6128814016242376e-07, "loss": 0.0068, "step": 770890 }, { "epoch": 2.0, "learning_rate": 2.573999237909591e-07, "loss": 0.0053, "step": 770900 }, { "epoch": 2.0, "learning_rate": 2.5351170741949444e-07, "loss": 0.0073, "step": 770910 }, { "epoch": 2.0, "learning_rate": 2.4962349104802983e-07, "loss": 0.0065, "step": 770920 }, { "epoch": 2.0, "learning_rate": 2.4573527467656517e-07, "loss": 0.0073, "step": 770930 }, { "epoch": 2.0, "learning_rate": 2.4184705830510056e-07, "loss": 0.0066, "step": 770940 }, { "epoch": 2.0, "learning_rate": 2.3795884193363592e-07, "loss": 0.0074, "step": 770950 }, { "epoch": 2.0, "learning_rate": 2.3407062556217126e-07, "loss": 0.0095, "step": 770960 }, { "epoch": 2.0, "learning_rate": 2.3018240919070663e-07, "loss": 0.006, "step": 770970 }, { "epoch": 2.0, "learning_rate": 2.26294192819242e-07, "loss": 0.0079, "step": 770980 }, { "epoch": 2.0, "learning_rate": 2.2240597644777733e-07, "loss": 0.0069, "step": 770990 }, { "epoch": 2.0, "learning_rate": 2.185177600763127e-07, "loss": 0.0071, "step": 771000 }, { "epoch": 2.0, "eval_cer": 0.8816788924952867, "eval_loss": 0.004364285618066788, "eval_runtime": 107.9463, "eval_samples_per_second": 18.528, "eval_steps_per_second": 4.632, "step": 771000 }, { "epoch": 2.0, "learning_rate": 2.1462954370484808e-07, "loss": 0.0041, "step": 771010 }, { "epoch": 2.0, "learning_rate": 2.1074132733338342e-07, "loss": 0.0091, "step": 771020 }, { "epoch": 2.0, "learning_rate": 2.068531109619188e-07, "loss": 0.0075, "step": 771030 }, { "epoch": 2.0, "learning_rate": 2.0296489459045415e-07, "loss": 0.0069, "step": 771040 }, { "epoch": 2.0, "learning_rate": 1.990766782189895e-07, "loss": 0.0062, "step": 771050 }, { "epoch": 2.0, "learning_rate": 1.9518846184752488e-07, "loss": 0.0067, "step": 771060 }, { "epoch": 2.0, "learning_rate": 1.9130024547606024e-07, "loss": 0.0062, "step": 771070 }, { "epoch": 2.0, "learning_rate": 1.874120291045956e-07, "loss": 0.01, "step": 771080 }, { "epoch": 2.0, "learning_rate": 1.8352381273313095e-07, "loss": 0.007, "step": 771090 }, { "epoch": 2.0, "learning_rate": 1.796355963616663e-07, "loss": 0.0065, "step": 771100 }, { "epoch": 2.0, "learning_rate": 1.757473799902017e-07, "loss": 0.0065, "step": 771110 }, { "epoch": 2.0, "learning_rate": 1.7185916361873704e-07, "loss": 0.0053, "step": 771120 }, { "epoch": 2.0, "learning_rate": 1.679709472472724e-07, "loss": 0.0059, "step": 771130 }, { "epoch": 2.0, "learning_rate": 1.6408273087580777e-07, "loss": 0.0062, "step": 771140 }, { "epoch": 2.0, "learning_rate": 1.601945145043431e-07, "loss": 0.0066, "step": 771150 }, { "epoch": 2.0, "learning_rate": 1.563062981328785e-07, "loss": 0.0076, "step": 771160 }, { "epoch": 2.0, "learning_rate": 1.5241808176141386e-07, "loss": 0.0112, "step": 771170 }, { "epoch": 2.0, "learning_rate": 1.485298653899492e-07, "loss": 0.0067, "step": 771180 }, { "epoch": 2.0, "learning_rate": 1.4464164901848456e-07, "loss": 0.0063, "step": 771190 }, { "epoch": 2.0, "learning_rate": 1.4075343264701993e-07, "loss": 0.0078, "step": 771200 }, { "epoch": 2.0, "learning_rate": 1.368652162755553e-07, "loss": 0.0077, "step": 771210 }, { "epoch": 2.0, "learning_rate": 1.3297699990409066e-07, "loss": 0.0093, "step": 771220 }, { "epoch": 2.0, "learning_rate": 1.2908878353262602e-07, "loss": 0.0099, "step": 771230 }, { "epoch": 2.0, "learning_rate": 1.252005671611614e-07, "loss": 0.0067, "step": 771240 }, { "epoch": 2.0, "learning_rate": 1.2131235078969672e-07, "loss": 0.0088, "step": 771250 }, { "epoch": 2.0, "learning_rate": 1.174241344182321e-07, "loss": 0.0064, "step": 771260 }, { "epoch": 2.0, "learning_rate": 1.1353591804676745e-07, "loss": 0.0065, "step": 771270 }, { "epoch": 2.0, "learning_rate": 1.0964770167530282e-07, "loss": 0.0083, "step": 771280 }, { "epoch": 2.0, "learning_rate": 1.0575948530383818e-07, "loss": 0.006, "step": 771290 }, { "epoch": 2.0, "learning_rate": 1.0187126893237353e-07, "loss": 0.0068, "step": 771300 }, { "epoch": 2.0, "learning_rate": 9.79830525609089e-08, "loss": 0.0067, "step": 771310 }, { "epoch": 2.0, "learning_rate": 9.409483618944426e-08, "loss": 0.006, "step": 771320 }, { "epoch": 2.0, "learning_rate": 9.020661981797961e-08, "loss": 0.0059, "step": 771330 }, { "epoch": 2.0, "learning_rate": 8.631840344651499e-08, "loss": 0.0068, "step": 771340 }, { "epoch": 2.0, "learning_rate": 8.243018707505034e-08, "loss": 0.0079, "step": 771350 }, { "epoch": 2.0, "learning_rate": 7.854197070358571e-08, "loss": 0.0049, "step": 771360 }, { "epoch": 2.0, "learning_rate": 7.465375433212107e-08, "loss": 0.0048, "step": 771370 }, { "epoch": 2.0, "learning_rate": 7.076553796065642e-08, "loss": 0.0066, "step": 771380 }, { "epoch": 2.0, "learning_rate": 6.687732158919179e-08, "loss": 0.0075, "step": 771390 }, { "epoch": 2.0, "learning_rate": 6.298910521772715e-08, "loss": 0.0064, "step": 771400 }, { "epoch": 2.0, "learning_rate": 5.910088884626251e-08, "loss": 0.0066, "step": 771410 }, { "epoch": 2.0, "learning_rate": 5.5212672474797874e-08, "loss": 0.0103, "step": 771420 }, { "epoch": 2.0, "learning_rate": 5.132445610333324e-08, "loss": 0.0052, "step": 771430 }, { "epoch": 2.0, "learning_rate": 4.743623973186859e-08, "loss": 0.0088, "step": 771440 }, { "epoch": 2.0, "learning_rate": 4.3548023360403954e-08, "loss": 0.0068, "step": 771450 }, { "epoch": 2.0, "learning_rate": 3.965980698893932e-08, "loss": 0.0046, "step": 771460 }, { "epoch": 2.0, "learning_rate": 3.5771590617474676e-08, "loss": 0.0062, "step": 771470 }, { "epoch": 2.0, "learning_rate": 3.1883374246010034e-08, "loss": 0.011, "step": 771480 }, { "epoch": 2.0, "learning_rate": 2.7995157874545402e-08, "loss": 0.0047, "step": 771490 }, { "epoch": 2.0, "learning_rate": 2.410694150308076e-08, "loss": 0.0062, "step": 771500 }, { "epoch": 2.0, "learning_rate": 2.0218725131616124e-08, "loss": 0.005, "step": 771510 }, { "epoch": 2.0, "learning_rate": 1.6330508760151485e-08, "loss": 0.0062, "step": 771520 }, { "epoch": 2.0, "learning_rate": 1.2442292388686843e-08, "loss": 0.0069, "step": 771530 }, { "epoch": 2.0, "learning_rate": 8.554076017222206e-09, "loss": 0.0052, "step": 771540 }, { "epoch": 2.0, "learning_rate": 4.665859645757567e-09, "loss": 0.0056, "step": 771550 }, { "epoch": 2.0, "learning_rate": 7.776432742929277e-10, "loss": 0.0065, "step": 771560 }, { "epoch": 2.0, "step": 771562, "total_flos": 2.7387918028032307e+18, "train_loss": 0.015195539450556274, "train_runtime": 661141.8667, "train_samples_per_second": 37.344, "train_steps_per_second": 1.167 } ], "max_steps": 771562, "num_train_epochs": 2, "total_flos": 2.7387918028032307e+18, "trial_name": null, "trial_params": null }